diff --git a/all_results.json b/all_results.json index d417069f16c233f3c46d6a8ce956827c58d83629..7472efabd169314a5f1ea8c5e879af6f91ecd6a0 100644 --- a/all_results.json +++ b/all_results.json @@ -1,8 +1,8 @@ { "epoch": 2.0, - "train_loss": 0.013614018808192265, - "train_runtime": 415192.129, - "train_samples": 6342779, - "train_samples_per_second": 30.553, - "train_steps_per_second": 0.955 + "train_loss": 0.015195539450556274, + "train_runtime": 661141.8667, + "train_samples": 12344999, + "train_samples_per_second": 37.344, + "train_steps_per_second": 1.167 } \ No newline at end of file diff --git a/pytorch_model.bin b/pytorch_model.bin index cb2a97963ba95d317243fa7bc9485ff977581b85..90daa47ec5cc323236c40ddbf881fdeb95371def 100644 --- a/pytorch_model.bin +++ b/pytorch_model.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:6ed26ed7830bddb2e53106a9f1e2d9eac7db42270845f34d6f3315c387c147b5 +oid sha256:5b82fac2d1e46ee1cd545a142942ec2977a5a94a204440d5baab0a9049617b45 size 557971229 diff --git a/train_results.json b/train_results.json index d417069f16c233f3c46d6a8ce956827c58d83629..7472efabd169314a5f1ea8c5e879af6f91ecd6a0 100644 --- a/train_results.json +++ b/train_results.json @@ -1,8 +1,8 @@ { "epoch": 2.0, - "train_loss": 0.013614018808192265, - "train_runtime": 415192.129, - "train_samples": 6342779, - "train_samples_per_second": 30.553, - "train_steps_per_second": 0.955 + "train_loss": 0.015195539450556274, + "train_runtime": 661141.8667, + "train_samples": 12344999, + "train_samples_per_second": 37.344, + "train_steps_per_second": 1.167 } \ No newline at end of file diff --git a/trainer_state.json b/trainer_state.json index 4625ccb9b4b27dfb586ee9d649b812a83b4c1a67..ed4e9b38b75341809e334a2a5c5da6b2b2f945a4 100644 --- a/trainer_state.json +++ b/trainer_state.json @@ -1,241441 +1,469900 @@ { - "best_metric": 0.9143955354015062, - "best_model_checkpoint": "./models/bart-base-spelling-nl-3m-3-2nd/checkpoint-390000", - "epoch": 1.999991171063792, - "global_step": 396422, + "best_metric": 0.8816327044764588, + "best_model_checkpoint": "./models/bart-base-spelling-nl-9m-3/checkpoint-696000", + "epoch": 1.999998703928716, + "global_step": 771562, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.0, - "learning_rate": 0.00029999243230698596, - "loss": 0.7347, + "learning_rate": 0.0002999961117836285, + "loss": 0.9868, "step": 10 }, { "epoch": 0.0, - "learning_rate": 0.00029998486461397194, - "loss": 0.2215, + "learning_rate": 0.000299992223567257, + "loss": 0.289, "step": 20 }, { "epoch": 0.0, - "learning_rate": 0.0002999772969209579, - "loss": 0.1811, + "learning_rate": 0.00029998833535088557, + "loss": 0.1965, "step": 30 }, { "epoch": 0.0, - "learning_rate": 0.00029996972922794395, - "loss": 0.1745, + "learning_rate": 0.00029998444713451414, + "loss": 0.1664, "step": 40 }, { "epoch": 0.0, - "learning_rate": 0.00029996216153492994, - "loss": 0.1605, + "learning_rate": 0.00029998055891814265, + "loss": 0.1631, "step": 50 }, { "epoch": 0.0, - "learning_rate": 0.0002999545938419159, - "loss": 0.1534, + "learning_rate": 0.00029997667070177117, + "loss": 0.1647, "step": 60 }, { "epoch": 0.0, - "learning_rate": 0.0002999470261489019, - "loss": 0.1525, + "learning_rate": 0.00029997278248539974, + "loss": 0.1531, "step": 70 }, { "epoch": 0.0, - "learning_rate": 0.0002999394584558879, - "loss": 0.1273, + "learning_rate": 0.00029996889426902825, + "loss": 0.1556, "step": 80 }, { "epoch": 0.0, - "learning_rate": 0.00029993189076287386, - "loss": 0.144, + "learning_rate": 0.00029996500605265677, + "loss": 0.1376, "step": 90 }, { "epoch": 0.0, - "learning_rate": 0.0002999243230698599, - "loss": 0.172, + "learning_rate": 0.00029996111783628534, + "loss": 0.1429, "step": 100 }, { "epoch": 0.0, - "learning_rate": 0.0002999167553768459, - "loss": 0.1288, + "learning_rate": 0.00029995722961991385, + "loss": 0.1162, "step": 110 }, { "epoch": 0.0, - "learning_rate": 0.00029990918768383186, - "loss": 0.1398, + "learning_rate": 0.0002999533414035424, + "loss": 0.1291, "step": 120 }, { "epoch": 0.0, - "learning_rate": 0.00029990161999081784, - "loss": 0.164, + "learning_rate": 0.00029994945318717093, + "loss": 0.13, "step": 130 }, { "epoch": 0.0, - "learning_rate": 0.0002998940522978038, - "loss": 0.1436, + "learning_rate": 0.00029994556497079945, + "loss": 0.1487, "step": 140 }, { "epoch": 0.0, - "learning_rate": 0.0002998864846047898, - "loss": 0.1263, + "learning_rate": 0.000299941676754428, + "loss": 0.1119, "step": 150 }, { "epoch": 0.0, - "learning_rate": 0.00029987891691177584, - "loss": 0.1235, + "learning_rate": 0.00029993778853805653, + "loss": 0.1375, "step": 160 }, { "epoch": 0.0, - "learning_rate": 0.0002998713492187618, - "loss": 0.1192, + "learning_rate": 0.00029993390032168505, + "loss": 0.1118, "step": 170 }, { "epoch": 0.0, - "learning_rate": 0.0002998637815257478, - "loss": 0.1067, + "learning_rate": 0.0002999300121053136, + "loss": 0.1084, "step": 180 }, { "epoch": 0.0, - "learning_rate": 0.0002998562138327338, - "loss": 0.1085, + "learning_rate": 0.0002999261238889422, + "loss": 0.1184, "step": 190 }, { "epoch": 0.0, - "learning_rate": 0.00029984864613971977, - "loss": 0.1203, + "learning_rate": 0.0002999222356725707, + "loss": 0.1323, "step": 200 }, { "epoch": 0.0, - "learning_rate": 0.00029984107844670575, - "loss": 0.1025, + "learning_rate": 0.0002999183474561992, + "loss": 0.1202, "step": 210 }, { "epoch": 0.0, - "learning_rate": 0.00029983351075369173, - "loss": 0.1044, + "learning_rate": 0.00029991445923982773, + "loss": 0.1063, "step": 220 }, { "epoch": 0.0, - "learning_rate": 0.00029982594306067776, - "loss": 0.0965, + "learning_rate": 0.0002999105710234563, + "loss": 0.1167, "step": 230 }, { "epoch": 0.0, - "learning_rate": 0.00029981837536766375, - "loss": 0.1083, + "learning_rate": 0.0002999066828070848, + "loss": 0.1002, "step": 240 }, { "epoch": 0.0, - "learning_rate": 0.0002998108076746497, - "loss": 0.106, + "learning_rate": 0.0002999027945907134, + "loss": 0.104, "step": 250 }, { "epoch": 0.0, - "learning_rate": 0.0002998032399816357, - "loss": 0.1017, + "learning_rate": 0.0002998989063743419, + "loss": 0.1216, "step": 260 }, { "epoch": 0.0, - "learning_rate": 0.0002997956722886217, - "loss": 0.1216, + "learning_rate": 0.0002998950181579704, + "loss": 0.117, "step": 270 }, { "epoch": 0.0, - "learning_rate": 0.00029978810459560767, - "loss": 0.1059, + "learning_rate": 0.000299891129941599, + "loss": 0.1064, "step": 280 }, { "epoch": 0.0, - "learning_rate": 0.0002997805369025937, - "loss": 0.0953, + "learning_rate": 0.0002998872417252275, + "loss": 0.1148, "step": 290 }, { "epoch": 0.0, - "learning_rate": 0.0002997729692095797, - "loss": 0.0948, + "learning_rate": 0.000299883353508856, + "loss": 0.0943, "step": 300 }, { "epoch": 0.0, - "learning_rate": 0.00029976540151656567, - "loss": 0.1041, + "learning_rate": 0.0002998794652924846, + "loss": 0.1039, "step": 310 }, { "epoch": 0.0, - "learning_rate": 0.00029975783382355165, - "loss": 0.0998, + "learning_rate": 0.0002998755770761131, + "loss": 0.1171, "step": 320 }, { "epoch": 0.0, - "learning_rate": 0.00029975026613053763, - "loss": 0.0976, + "learning_rate": 0.00029987168885974166, + "loss": 0.1102, "step": 330 }, { "epoch": 0.0, - "learning_rate": 0.0002997426984375236, - "loss": 0.1064, + "learning_rate": 0.00029986780064337017, + "loss": 0.1102, "step": 340 }, { "epoch": 0.0, - "learning_rate": 0.0002997351307445096, - "loss": 0.1054, + "learning_rate": 0.0002998639124269987, + "loss": 0.1167, "step": 350 }, { "epoch": 0.0, - "learning_rate": 0.00029972756305149563, - "loss": 0.084, + "learning_rate": 0.00029986002421062726, + "loss": 0.1074, "step": 360 }, { "epoch": 0.0, - "learning_rate": 0.0002997199953584816, - "loss": 0.0937, + "learning_rate": 0.00029985613599425577, + "loss": 0.1107, "step": 370 }, { "epoch": 0.0, - "learning_rate": 0.0002997124276654676, - "loss": 0.1096, + "learning_rate": 0.00029985224777788434, + "loss": 0.1021, "step": 380 }, { "epoch": 0.0, - "learning_rate": 0.0002997048599724536, - "loss": 0.1014, + "learning_rate": 0.00029984835956151285, + "loss": 0.1011, "step": 390 }, { "epoch": 0.0, - "learning_rate": 0.00029969729227943956, - "loss": 0.0946, + "learning_rate": 0.0002998444713451414, + "loss": 0.1051, "step": 400 }, { "epoch": 0.0, - "learning_rate": 0.00029968972458642554, - "loss": 0.0951, + "learning_rate": 0.00029984058312876994, + "loss": 0.0837, "step": 410 }, { "epoch": 0.0, - "learning_rate": 0.0002996821568934116, - "loss": 0.0892, + "learning_rate": 0.00029983669491239845, + "loss": 0.0925, "step": 420 }, { "epoch": 0.0, - "learning_rate": 0.00029967458920039756, - "loss": 0.0945, + "learning_rate": 0.00029983280669602697, + "loss": 0.1086, "step": 430 }, { "epoch": 0.0, - "learning_rate": 0.00029966702150738354, - "loss": 0.0932, + "learning_rate": 0.00029982891847965553, + "loss": 0.0881, "step": 440 }, { "epoch": 0.0, - "learning_rate": 0.0002996594538143695, - "loss": 0.0833, + "learning_rate": 0.00029982503026328405, + "loss": 0.0898, "step": 450 }, { "epoch": 0.0, - "learning_rate": 0.0002996518861213555, - "loss": 0.0837, + "learning_rate": 0.0002998211420469126, + "loss": 0.1033, "step": 460 }, { "epoch": 0.0, - "learning_rate": 0.0002996443184283415, - "loss": 0.085, + "learning_rate": 0.00029981725383054113, + "loss": 0.1079, "step": 470 }, { "epoch": 0.0, - "learning_rate": 0.0002996367507353275, - "loss": 0.086, + "learning_rate": 0.0002998133656141697, + "loss": 0.0976, "step": 480 }, { "epoch": 0.0, - "learning_rate": 0.0002996291830423135, - "loss": 0.079, + "learning_rate": 0.0002998094773977982, + "loss": 0.1109, "step": 490 }, { "epoch": 0.0, - "learning_rate": 0.0002996216153492995, - "loss": 0.0793, + "learning_rate": 0.00029980558918142673, + "loss": 0.1082, "step": 500 }, { "epoch": 0.0, - "learning_rate": 0.00029961404765628546, - "loss": 0.0857, + "learning_rate": 0.00029980170096505524, + "loss": 0.1971, "step": 510 }, { "epoch": 0.0, - "learning_rate": 0.00029960647996327144, - "loss": 0.0824, + "learning_rate": 0.0002997978127486838, + "loss": 0.1078, "step": 520 }, { "epoch": 0.0, - "learning_rate": 0.0002995989122702574, - "loss": 0.0853, + "learning_rate": 0.0002997939245323124, + "loss": 0.0928, "step": 530 }, { "epoch": 0.0, - "learning_rate": 0.0002995913445772434, - "loss": 0.0837, + "learning_rate": 0.0002997900363159409, + "loss": 0.1055, "step": 540 }, { "epoch": 0.0, - "learning_rate": 0.00029958377688422944, - "loss": 0.0743, + "learning_rate": 0.0002997861480995694, + "loss": 0.1023, "step": 550 }, { "epoch": 0.0, - "learning_rate": 0.0002995762091912154, - "loss": 0.0792, + "learning_rate": 0.0002997822598831979, + "loss": 0.0934, "step": 560 }, { "epoch": 0.0, - "learning_rate": 0.0002995686414982014, - "loss": 0.0767, + "learning_rate": 0.0002997783716668265, + "loss": 0.1039, "step": 570 }, { "epoch": 0.0, - "learning_rate": 0.0002995610738051874, - "loss": 0.0813, + "learning_rate": 0.000299774483450455, + "loss": 0.087, "step": 580 }, { "epoch": 0.0, - "learning_rate": 0.00029955350611217337, - "loss": 0.0869, + "learning_rate": 0.0002997705952340836, + "loss": 0.0906, "step": 590 }, { "epoch": 0.0, - "learning_rate": 0.00029954593841915935, - "loss": 0.0795, + "learning_rate": 0.0002997667070177121, + "loss": 0.0846, "step": 600 }, { "epoch": 0.0, - "learning_rate": 0.0002995383707261454, - "loss": 0.0784, + "learning_rate": 0.00029976281880134066, + "loss": 0.0917, "step": 610 }, { "epoch": 0.0, - "learning_rate": 0.00029953080303313137, - "loss": 0.0813, + "learning_rate": 0.0002997589305849692, + "loss": 0.1092, "step": 620 }, { "epoch": 0.0, - "learning_rate": 0.0002995232353401173, - "loss": 0.0906, + "learning_rate": 0.0002997550423685977, + "loss": 0.1039, "step": 630 }, { "epoch": 0.0, - "learning_rate": 0.0002995156676471033, - "loss": 0.0762, + "learning_rate": 0.0002997511541522262, + "loss": 0.1769, "step": 640 }, { "epoch": 0.0, - "learning_rate": 0.0002995080999540893, - "loss": 0.0874, + "learning_rate": 0.0002997472659358548, + "loss": 0.1353, "step": 650 }, { "epoch": 0.0, - "learning_rate": 0.0002995005322610753, - "loss": 0.0744, + "learning_rate": 0.0002997433777194833, + "loss": 0.0978, "step": 660 }, { "epoch": 0.0, - "learning_rate": 0.00029949296456806127, - "loss": 0.0719, + "learning_rate": 0.00029973948950311186, + "loss": 0.1023, "step": 670 }, { "epoch": 0.0, - "learning_rate": 0.00029948539687504725, - "loss": 0.0757, + "learning_rate": 0.00029973560128674037, + "loss": 0.0935, "step": 680 }, { "epoch": 0.0, - "learning_rate": 0.00029947782918203324, - "loss": 0.0752, + "learning_rate": 0.00029973171307036894, + "loss": 0.1242, "step": 690 }, { "epoch": 0.0, - "learning_rate": 0.0002994702614890192, - "loss": 0.0854, + "learning_rate": 0.00029972782485399745, + "loss": 0.0939, "step": 700 }, { "epoch": 0.0, - "learning_rate": 0.00029946269379600525, - "loss": 0.0878, + "learning_rate": 0.00029972393663762597, + "loss": 0.095, "step": 710 }, { "epoch": 0.0, - "learning_rate": 0.00029945512610299123, - "loss": 0.0747, + "learning_rate": 0.0002997200484212545, + "loss": 0.095, "step": 720 }, { "epoch": 0.0, - "learning_rate": 0.0002994475584099772, - "loss": 0.0783, + "learning_rate": 0.00029971616020488305, + "loss": 0.0844, "step": 730 }, { "epoch": 0.0, - "learning_rate": 0.0002994399907169632, - "loss": 0.0841, + "learning_rate": 0.0002997122719885116, + "loss": 0.1014, "step": 740 }, { "epoch": 0.0, - "learning_rate": 0.0002994324230239492, - "loss": 0.0798, + "learning_rate": 0.00029970838377214014, + "loss": 0.0894, "step": 750 }, { "epoch": 0.0, - "learning_rate": 0.00029942485533093516, - "loss": 0.0835, + "learning_rate": 0.00029970449555576865, + "loss": 0.0934, "step": 760 }, { "epoch": 0.0, - "learning_rate": 0.00029941728763792114, - "loss": 0.0709, + "learning_rate": 0.00029970060733939716, + "loss": 0.1144, "step": 770 }, { "epoch": 0.0, - "learning_rate": 0.0002994097199449072, - "loss": 0.0715, + "learning_rate": 0.00029969671912302573, + "loss": 0.0885, "step": 780 }, { "epoch": 0.0, - "learning_rate": 0.00029940215225189316, - "loss": 0.0859, + "learning_rate": 0.00029969283090665425, + "loss": 0.0893, "step": 790 }, { "epoch": 0.0, - "learning_rate": 0.00029939458455887914, - "loss": 0.0811, + "learning_rate": 0.0002996889426902828, + "loss": 0.0883, "step": 800 }, { "epoch": 0.0, - "learning_rate": 0.0002993870168658651, - "loss": 0.0768, + "learning_rate": 0.00029968505447391133, + "loss": 0.083, "step": 810 }, { "epoch": 0.0, - "learning_rate": 0.0002993794491728511, - "loss": 0.0736, + "learning_rate": 0.0002996811662575399, + "loss": 0.0868, "step": 820 }, { "epoch": 0.0, - "learning_rate": 0.0002993718814798371, - "loss": 0.0673, + "learning_rate": 0.0002996772780411684, + "loss": 0.0977, "step": 830 }, { "epoch": 0.0, - "learning_rate": 0.0002993643137868231, - "loss": 0.0703, + "learning_rate": 0.00029967338982479693, + "loss": 0.0841, "step": 840 }, { "epoch": 0.0, - "learning_rate": 0.0002993567460938091, - "loss": 0.0774, + "learning_rate": 0.00029966950160842544, + "loss": 0.0846, "step": 850 }, { "epoch": 0.0, - "learning_rate": 0.0002993491784007951, - "loss": 0.0795, + "learning_rate": 0.000299665613392054, + "loss": 0.0754, "step": 860 }, { "epoch": 0.0, - "learning_rate": 0.00029934161070778106, - "loss": 0.0833, + "learning_rate": 0.0002996617251756826, + "loss": 0.0802, "step": 870 }, { "epoch": 0.0, - "learning_rate": 0.00029933404301476705, - "loss": 0.077, + "learning_rate": 0.0002996578369593111, + "loss": 0.0986, "step": 880 }, { "epoch": 0.0, - "learning_rate": 0.000299326475321753, - "loss": 0.0724, + "learning_rate": 0.0002996539487429396, + "loss": 0.0845, "step": 890 }, { "epoch": 0.0, - "learning_rate": 0.000299318907628739, - "loss": 0.0766, + "learning_rate": 0.0002996500605265682, + "loss": 0.0767, "step": 900 }, { "epoch": 0.0, - "learning_rate": 0.00029931133993572504, - "loss": 0.0849, + "learning_rate": 0.0002996461723101967, + "loss": 0.0787, "step": 910 }, { "epoch": 0.0, - "learning_rate": 0.000299303772242711, - "loss": 0.0761, + "learning_rate": 0.0002996422840938252, + "loss": 0.0861, "step": 920 }, { "epoch": 0.0, - "learning_rate": 0.000299296204549697, - "loss": 0.0725, + "learning_rate": 0.0002996383958774538, + "loss": 0.086, "step": 930 }, { "epoch": 0.0, - "learning_rate": 0.000299288636856683, - "loss": 0.0778, + "learning_rate": 0.0002996345076610823, + "loss": 0.0706, "step": 940 }, { "epoch": 0.0, - "learning_rate": 0.00029928106916366897, - "loss": 0.0758, + "learning_rate": 0.00029963061944471086, + "loss": 0.0881, "step": 950 }, { "epoch": 0.0, - "learning_rate": 0.00029927350147065495, - "loss": 0.0794, + "learning_rate": 0.0002996267312283394, + "loss": 0.0731, "step": 960 }, { "epoch": 0.0, - "learning_rate": 0.000299265933777641, - "loss": 0.0707, + "learning_rate": 0.0002996228430119679, + "loss": 0.0821, "step": 970 }, { "epoch": 0.0, - "learning_rate": 0.00029925836608462697, + "learning_rate": 0.00029961895479559646, "loss": 0.0737, "step": 980 }, { "epoch": 0.0, - "learning_rate": 0.00029925079839161295, - "loss": 0.0756, + "learning_rate": 0.00029961506657922497, + "loss": 0.0892, "step": 990 }, { - "epoch": 0.01, - "learning_rate": 0.00029924323069859893, - "loss": 0.0794, + "epoch": 0.0, + "learning_rate": 0.0002996111783628535, + "loss": 0.0694, "step": 1000 }, { - "epoch": 0.01, - "eval_cer": 0.914636193640606, - "eval_loss": 0.057572510093450546, - "eval_runtime": 117.4563, - "eval_samples_per_second": 17.028, - "eval_steps_per_second": 4.257, + "epoch": 0.0, + "eval_cer": 0.8818566463859275, + "eval_loss": 0.06612774729728699, + "eval_runtime": 107.9329, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, "step": 1000 }, { - "epoch": 0.01, - "learning_rate": 0.0002992356630055849, - "loss": 0.0786, + "epoch": 0.0, + "learning_rate": 0.00029960729014648206, + "loss": 0.0788, "step": 1010 }, { - "epoch": 0.01, - "learning_rate": 0.0002992280953125709, - "loss": 0.0757, + "epoch": 0.0, + "learning_rate": 0.00029960340193011057, + "loss": 0.0885, "step": 1020 }, { - "epoch": 0.01, - "learning_rate": 0.00029922052761955693, - "loss": 0.079, + "epoch": 0.0, + "learning_rate": 0.00029959951371373914, + "loss": 0.094, "step": 1030 }, { - "epoch": 0.01, - "learning_rate": 0.0002992129599265429, - "loss": 0.0718, + "epoch": 0.0, + "learning_rate": 0.00029959562549736765, + "loss": 0.0913, "step": 1040 }, { - "epoch": 0.01, - "learning_rate": 0.0002992053922335289, - "loss": 0.083, + "epoch": 0.0, + "learning_rate": 0.00029959173728099617, + "loss": 0.0892, "step": 1050 }, { - "epoch": 0.01, - "learning_rate": 0.0002991978245405149, - "loss": 0.0785, + "epoch": 0.0, + "learning_rate": 0.0002995878490646247, + "loss": 0.078, "step": 1060 }, { - "epoch": 0.01, - "learning_rate": 0.00029919025684750086, - "loss": 0.0776, + "epoch": 0.0, + "learning_rate": 0.00029958396084825325, + "loss": 0.0822, "step": 1070 }, { - "epoch": 0.01, - "learning_rate": 0.00029918268915448684, - "loss": 0.0747, + "epoch": 0.0, + "learning_rate": 0.0002995800726318818, + "loss": 0.0802, "step": 1080 }, { - "epoch": 0.01, - "learning_rate": 0.0002991751214614728, - "loss": 0.082, + "epoch": 0.0, + "learning_rate": 0.00029957618441551033, + "loss": 0.0878, "step": 1090 }, { - "epoch": 0.01, - "learning_rate": 0.00029916755376845885, - "loss": 0.073, + "epoch": 0.0, + "learning_rate": 0.00029957229619913885, + "loss": 0.0858, "step": 1100 }, { - "epoch": 0.01, - "learning_rate": 0.00029915998607544484, - "loss": 0.0719, + "epoch": 0.0, + "learning_rate": 0.0002995684079827674, + "loss": 0.0799, "step": 1110 }, { - "epoch": 0.01, - "learning_rate": 0.0002991524183824308, - "loss": 0.0861, + "epoch": 0.0, + "learning_rate": 0.00029956451976639593, + "loss": 0.0817, "step": 1120 }, { - "epoch": 0.01, - "learning_rate": 0.0002991448506894168, - "loss": 0.0647, + "epoch": 0.0, + "learning_rate": 0.00029956063155002445, + "loss": 0.0783, "step": 1130 }, { - "epoch": 0.01, - "learning_rate": 0.0002991372829964028, - "loss": 0.0666, + "epoch": 0.0, + "learning_rate": 0.000299556743333653, + "loss": 0.0846, "step": 1140 }, { - "epoch": 0.01, - "learning_rate": 0.00029912971530338876, - "loss": 0.0736, + "epoch": 0.0, + "learning_rate": 0.00029955285511728153, + "loss": 0.0719, "step": 1150 }, { - "epoch": 0.01, - "learning_rate": 0.0002991221476103748, - "loss": 0.0638, + "epoch": 0.0, + "learning_rate": 0.0002995489669009101, + "loss": 0.0744, "step": 1160 }, { - "epoch": 0.01, - "learning_rate": 0.0002991145799173608, - "loss": 0.0711, + "epoch": 0.0, + "learning_rate": 0.0002995450786845386, + "loss": 0.0723, "step": 1170 }, { - "epoch": 0.01, - "learning_rate": 0.00029910701222434676, - "loss": 0.0683, + "epoch": 0.0, + "learning_rate": 0.00029954119046816713, + "loss": 0.0738, "step": 1180 }, { - "epoch": 0.01, - "learning_rate": 0.00029909944453133274, - "loss": 0.0695, + "epoch": 0.0, + "learning_rate": 0.0002995373022517957, + "loss": 0.0719, "step": 1190 }, { - "epoch": 0.01, - "learning_rate": 0.0002990918768383187, - "loss": 0.0733, + "epoch": 0.0, + "learning_rate": 0.0002995334140354242, + "loss": 0.0693, "step": 1200 }, { - "epoch": 0.01, - "learning_rate": 0.0002990843091453047, - "loss": 0.0736, + "epoch": 0.0, + "learning_rate": 0.0002995295258190527, + "loss": 0.0873, "step": 1210 }, { - "epoch": 0.01, - "learning_rate": 0.00029907674145229074, - "loss": 0.0725, + "epoch": 0.0, + "learning_rate": 0.0002995256376026813, + "loss": 0.0718, "step": 1220 }, { - "epoch": 0.01, - "learning_rate": 0.0002990691737592767, - "loss": 0.0629, + "epoch": 0.0, + "learning_rate": 0.00029952174938630986, + "loss": 0.0786, "step": 1230 }, { - "epoch": 0.01, - "learning_rate": 0.0002990616060662627, - "loss": 0.061, + "epoch": 0.0, + "learning_rate": 0.0002995178611699384, + "loss": 0.0907, "step": 1240 }, { - "epoch": 0.01, - "learning_rate": 0.0002990540383732487, - "loss": 0.059, + "epoch": 0.0, + "learning_rate": 0.0002995139729535669, + "loss": 0.0682, "step": 1250 }, { - "epoch": 0.01, - "learning_rate": 0.00029904647068023467, - "loss": 0.0654, + "epoch": 0.0, + "learning_rate": 0.0002995100847371954, + "loss": 0.0745, "step": 1260 }, { - "epoch": 0.01, - "learning_rate": 0.00029903890298722065, - "loss": 0.0563, + "epoch": 0.0, + "learning_rate": 0.000299506196520824, + "loss": 0.076, "step": 1270 }, { - "epoch": 0.01, - "learning_rate": 0.00029903133529420663, - "loss": 0.0666, + "epoch": 0.0, + "learning_rate": 0.0002995023083044525, + "loss": 0.0741, "step": 1280 }, { - "epoch": 0.01, - "learning_rate": 0.00029902376760119266, - "loss": 0.0655, + "epoch": 0.0, + "learning_rate": 0.00029949842008808106, + "loss": 0.0667, "step": 1290 }, { - "epoch": 0.01, - "learning_rate": 0.00029901619990817865, - "loss": 0.0569, + "epoch": 0.0, + "learning_rate": 0.0002994945318717096, + "loss": 0.0749, "step": 1300 }, { - "epoch": 0.01, - "learning_rate": 0.0002990086322151646, - "loss": 0.0673, + "epoch": 0.0, + "learning_rate": 0.0002994906436553381, + "loss": 0.0662, "step": 1310 }, { - "epoch": 0.01, - "learning_rate": 0.0002990010645221506, - "loss": 0.0653, + "epoch": 0.0, + "learning_rate": 0.00029948675543896666, + "loss": 0.0797, "step": 1320 }, { - "epoch": 0.01, - "learning_rate": 0.0002989934968291366, - "loss": 0.0668, + "epoch": 0.0, + "learning_rate": 0.00029948286722259517, + "loss": 0.0678, "step": 1330 }, { - "epoch": 0.01, - "learning_rate": 0.00029898592913612257, + "epoch": 0.0, + "learning_rate": 0.0002994789790062237, "loss": 0.0727, "step": 1340 }, { - "epoch": 0.01, - "learning_rate": 0.0002989783614431086, - "loss": 0.0714, + "epoch": 0.0, + "learning_rate": 0.00029947509078985225, + "loss": 0.0707, "step": 1350 }, { - "epoch": 0.01, - "learning_rate": 0.0002989707937500946, - "loss": 0.0657, + "epoch": 0.0, + "learning_rate": 0.00029947120257348077, + "loss": 0.0772, "step": 1360 }, { - "epoch": 0.01, - "learning_rate": 0.00029896322605708057, - "loss": 0.0631, + "epoch": 0.0, + "learning_rate": 0.00029946731435710934, + "loss": 0.0816, "step": 1370 }, { - "epoch": 0.01, - "learning_rate": 0.00029895565836406655, - "loss": 0.0658, + "epoch": 0.0, + "learning_rate": 0.00029946342614073785, + "loss": 0.0686, "step": 1380 }, { - "epoch": 0.01, - "learning_rate": 0.00029894809067105253, - "loss": 0.0652, + "epoch": 0.0, + "learning_rate": 0.00029945953792436637, + "loss": 0.0735, "step": 1390 }, { - "epoch": 0.01, - "learning_rate": 0.0002989405229780385, - "loss": 0.0743, + "epoch": 0.0, + "learning_rate": 0.00029945564970799494, + "loss": 0.0699, "step": 1400 }, { - "epoch": 0.01, - "learning_rate": 0.0002989329552850245, - "loss": 0.0639, + "epoch": 0.0, + "learning_rate": 0.00029945176149162345, + "loss": 0.0721, "step": 1410 }, { - "epoch": 0.01, - "learning_rate": 0.00029892538759201053, - "loss": 0.0642, + "epoch": 0.0, + "learning_rate": 0.000299447873275252, + "loss": 0.0639, "step": 1420 }, { - "epoch": 0.01, - "learning_rate": 0.0002989178198989965, - "loss": 0.0706, + "epoch": 0.0, + "learning_rate": 0.00029944398505888053, + "loss": 0.0736, "step": 1430 }, { - "epoch": 0.01, - "learning_rate": 0.0002989102522059825, - "loss": 0.0656, + "epoch": 0.0, + "learning_rate": 0.0002994400968425091, + "loss": 0.0691, "step": 1440 }, { - "epoch": 0.01, - "learning_rate": 0.0002989026845129685, - "loss": 0.0714, + "epoch": 0.0, + "learning_rate": 0.0002994362086261376, + "loss": 0.0772, "step": 1450 }, { - "epoch": 0.01, - "learning_rate": 0.00029889511681995446, - "loss": 0.0703, + "epoch": 0.0, + "learning_rate": 0.00029943232040976613, + "loss": 0.078, "step": 1460 }, { - "epoch": 0.01, - "learning_rate": 0.00029888754912694044, - "loss": 0.0675, + "epoch": 0.0, + "learning_rate": 0.00029942843219339465, + "loss": 0.0773, "step": 1470 }, { - "epoch": 0.01, - "learning_rate": 0.0002988799814339265, - "loss": 0.0703, + "epoch": 0.0, + "learning_rate": 0.0002994245439770232, + "loss": 0.0689, "step": 1480 }, { - "epoch": 0.01, - "learning_rate": 0.00029887241374091246, - "loss": 0.0671, + "epoch": 0.0, + "learning_rate": 0.00029942065576065173, + "loss": 0.076, "step": 1490 }, { - "epoch": 0.01, - "learning_rate": 0.00029886484604789844, - "loss": 0.0668, + "epoch": 0.0, + "learning_rate": 0.0002994167675442803, + "loss": 0.0729, "step": 1500 }, { - "epoch": 0.01, - "learning_rate": 0.0002988572783548844, - "loss": 0.0688, + "epoch": 0.0, + "learning_rate": 0.0002994128793279088, + "loss": 0.072, "step": 1510 }, { - "epoch": 0.01, - "learning_rate": 0.0002988497106618704, - "loss": 0.065, + "epoch": 0.0, + "learning_rate": 0.0002994089911115373, + "loss": 0.0747, "step": 1520 }, { - "epoch": 0.01, - "learning_rate": 0.0002988421429688564, - "loss": 0.0656, + "epoch": 0.0, + "learning_rate": 0.0002994051028951659, + "loss": 0.0733, "step": 1530 }, { - "epoch": 0.01, - "learning_rate": 0.0002988345752758424, - "loss": 0.0695, + "epoch": 0.0, + "learning_rate": 0.0002994012146787944, + "loss": 0.0746, "step": 1540 }, { - "epoch": 0.01, - "learning_rate": 0.0002988270075828284, - "loss": 0.0732, + "epoch": 0.0, + "learning_rate": 0.0002993973264624229, + "loss": 0.076, "step": 1550 }, { - "epoch": 0.01, - "learning_rate": 0.0002988194398898144, - "loss": 0.0693, + "epoch": 0.0, + "learning_rate": 0.0002993934382460515, + "loss": 0.0692, "step": 1560 }, { - "epoch": 0.01, - "learning_rate": 0.00029881187219680036, - "loss": 0.0653, + "epoch": 0.0, + "learning_rate": 0.00029938955002968006, + "loss": 0.0668, "step": 1570 }, { - "epoch": 0.01, - "learning_rate": 0.00029880430450378634, - "loss": 0.0652, + "epoch": 0.0, + "learning_rate": 0.0002993856618133086, + "loss": 0.0786, "step": 1580 }, { - "epoch": 0.01, - "learning_rate": 0.0002987967368107723, - "loss": 0.0775, + "epoch": 0.0, + "learning_rate": 0.0002993817735969371, + "loss": 0.0709, "step": 1590 }, { - "epoch": 0.01, - "learning_rate": 0.0002987891691177583, - "loss": 0.069, + "epoch": 0.0, + "learning_rate": 0.0002993778853805656, + "loss": 0.0715, "step": 1600 }, { - "epoch": 0.01, - "learning_rate": 0.00029878160142474434, - "loss": 0.0666, + "epoch": 0.0, + "learning_rate": 0.0002993739971641942, + "loss": 0.081, "step": 1610 }, { - "epoch": 0.01, - "learning_rate": 0.0002987740337317303, - "loss": 0.0642, + "epoch": 0.0, + "learning_rate": 0.0002993701089478227, + "loss": 0.1191, "step": 1620 }, { - "epoch": 0.01, - "learning_rate": 0.0002987664660387163, - "loss": 0.0659, + "epoch": 0.0, + "learning_rate": 0.00029936622073145126, + "loss": 0.1162, "step": 1630 }, { - "epoch": 0.01, - "learning_rate": 0.0002987588983457023, - "loss": 0.0657, + "epoch": 0.0, + "learning_rate": 0.00029936233251507977, + "loss": 0.07, "step": 1640 }, { - "epoch": 0.01, - "learning_rate": 0.00029875133065268827, - "loss": 0.0655, + "epoch": 0.0, + "learning_rate": 0.00029935844429870834, + "loss": 0.0789, "step": 1650 }, { - "epoch": 0.01, - "learning_rate": 0.00029874376295967425, - "loss": 0.0605, + "epoch": 0.0, + "learning_rate": 0.00029935455608233686, + "loss": 0.0745, "step": 1660 }, { - "epoch": 0.01, - "learning_rate": 0.0002987361952666603, - "loss": 0.0676, + "epoch": 0.0, + "learning_rate": 0.00029935066786596537, + "loss": 0.0832, "step": 1670 }, { - "epoch": 0.01, - "learning_rate": 0.00029872862757364627, - "loss": 0.0536, + "epoch": 0.0, + "learning_rate": 0.0002993467796495939, + "loss": 0.0877, "step": 1680 }, { - "epoch": 0.01, - "learning_rate": 0.00029872105988063225, - "loss": 0.059, + "epoch": 0.0, + "learning_rate": 0.00029934289143322245, + "loss": 0.0762, "step": 1690 }, { - "epoch": 0.01, - "learning_rate": 0.00029871349218761823, - "loss": 0.059, + "epoch": 0.0, + "learning_rate": 0.00029933900321685097, + "loss": 0.0694, "step": 1700 }, { - "epoch": 0.01, - "learning_rate": 0.0002987059244946042, - "loss": 0.0586, + "epoch": 0.0, + "learning_rate": 0.00029933511500047954, + "loss": 0.0824, "step": 1710 }, { - "epoch": 0.01, - "learning_rate": 0.0002986983568015902, - "loss": 0.0583, + "epoch": 0.0, + "learning_rate": 0.00029933122678410805, + "loss": 0.0831, "step": 1720 }, { - "epoch": 0.01, - "learning_rate": 0.0002986907891085762, - "loss": 0.0589, + "epoch": 0.0, + "learning_rate": 0.0002993273385677366, + "loss": 0.0773, "step": 1730 }, { - "epoch": 0.01, - "learning_rate": 0.0002986832214155622, - "loss": 0.0582, + "epoch": 0.0, + "learning_rate": 0.00029932345035136513, + "loss": 0.0658, "step": 1740 }, { - "epoch": 0.01, - "learning_rate": 0.0002986756537225482, - "loss": 0.0708, + "epoch": 0.0, + "learning_rate": 0.00029931956213499365, + "loss": 0.0758, "step": 1750 }, { - "epoch": 0.01, - "learning_rate": 0.00029866808602953417, - "loss": 0.0637, + "epoch": 0.0, + "learning_rate": 0.00029931567391862216, + "loss": 0.0781, "step": 1760 }, { - "epoch": 0.01, - "learning_rate": 0.00029866051833652015, - "loss": 0.0645, + "epoch": 0.0, + "learning_rate": 0.00029931178570225073, + "loss": 0.0683, "step": 1770 }, { - "epoch": 0.01, - "learning_rate": 0.00029865295064350613, - "loss": 0.0582, + "epoch": 0.0, + "learning_rate": 0.0002993078974858793, + "loss": 0.075, "step": 1780 }, { - "epoch": 0.01, - "learning_rate": 0.0002986453829504921, - "loss": 0.058, + "epoch": 0.0, + "learning_rate": 0.0002993040092695078, + "loss": 0.0753, "step": 1790 }, { - "epoch": 0.01, - "learning_rate": 0.00029863781525747815, - "loss": 0.0606, + "epoch": 0.0, + "learning_rate": 0.00029930012105313633, + "loss": 0.0709, "step": 1800 }, { - "epoch": 0.01, - "learning_rate": 0.00029863024756446413, - "loss": 0.0569, + "epoch": 0.0, + "learning_rate": 0.00029929623283676484, + "loss": 0.0658, "step": 1810 }, { - "epoch": 0.01, - "learning_rate": 0.0002986226798714501, - "loss": 0.0622, + "epoch": 0.0, + "learning_rate": 0.0002992923446203934, + "loss": 0.0714, "step": 1820 }, { - "epoch": 0.01, - "learning_rate": 0.0002986151121784361, - "loss": 0.0669, + "epoch": 0.0, + "learning_rate": 0.00029928845640402193, + "loss": 0.0787, "step": 1830 }, { - "epoch": 0.01, - "learning_rate": 0.0002986075444854221, - "loss": 0.0735, + "epoch": 0.0, + "learning_rate": 0.0002992845681876505, + "loss": 0.078, "step": 1840 }, { - "epoch": 0.01, - "learning_rate": 0.00029859997679240806, - "loss": 0.0759, + "epoch": 0.0, + "learning_rate": 0.000299280679971279, + "loss": 0.0707, "step": 1850 }, { - "epoch": 0.01, - "learning_rate": 0.0002985924090993941, - "loss": 0.0636, + "epoch": 0.0, + "learning_rate": 0.0002992767917549076, + "loss": 0.0677, "step": 1860 }, { - "epoch": 0.01, - "learning_rate": 0.0002985848414063801, - "loss": 0.0633, + "epoch": 0.0, + "learning_rate": 0.0002992729035385361, + "loss": 0.0664, "step": 1870 }, { - "epoch": 0.01, - "learning_rate": 0.00029857727371336606, - "loss": 0.064, + "epoch": 0.0, + "learning_rate": 0.0002992690153221646, + "loss": 0.0704, "step": 1880 }, { - "epoch": 0.01, - "learning_rate": 0.000298569706020352, - "loss": 0.0751, + "epoch": 0.0, + "learning_rate": 0.0002992651271057931, + "loss": 0.0717, "step": 1890 }, { - "epoch": 0.01, - "learning_rate": 0.000298562138327338, - "loss": 0.0611, + "epoch": 0.0, + "learning_rate": 0.0002992612388894217, + "loss": 0.0689, "step": 1900 }, { - "epoch": 0.01, - "learning_rate": 0.000298554570634324, - "loss": 0.0672, + "epoch": 0.0, + "learning_rate": 0.0002992573506730502, + "loss": 0.0565, "step": 1910 }, { - "epoch": 0.01, - "learning_rate": 0.00029854700294131, - "loss": 0.0659, + "epoch": 0.0, + "learning_rate": 0.0002992534624566788, + "loss": 0.1213, "step": 1920 }, { "epoch": 0.01, - "learning_rate": 0.00029853943524829596, - "loss": 0.0645, + "learning_rate": 0.0002992495742403073, + "loss": 0.089, "step": 1930 }, { "epoch": 0.01, - "learning_rate": 0.00029853186755528195, - "loss": 0.0679, + "learning_rate": 0.00029924568602393586, + "loss": 0.0781, "step": 1940 }, { "epoch": 0.01, - "learning_rate": 0.0002985242998622679, - "loss": 0.0619, + "learning_rate": 0.0002992417978075644, + "loss": 0.0892, "step": 1950 }, { "epoch": 0.01, - "learning_rate": 0.00029851673216925396, - "loss": 0.0564, + "learning_rate": 0.0002992379095911929, + "loss": 0.0952, "step": 1960 }, { "epoch": 0.01, - "learning_rate": 0.00029850916447623994, - "loss": 0.053, + "learning_rate": 0.00029923402137482146, + "loss": 0.1112, "step": 1970 }, { "epoch": 0.01, - "learning_rate": 0.0002985015967832259, - "loss": 0.0625, + "learning_rate": 0.00029923013315844997, + "loss": 0.0685, "step": 1980 }, { "epoch": 0.01, - "learning_rate": 0.0002984940290902119, - "loss": 0.063, + "learning_rate": 0.00029922624494207854, + "loss": 0.0803, "step": 1990 }, { "epoch": 0.01, - "learning_rate": 0.0002984864613971979, - "loss": 0.0629, + "learning_rate": 0.00029922235672570705, + "loss": 0.0688, "step": 2000 }, { "epoch": 0.01, - "eval_cer": 0.9145119829365546, - "eval_loss": 0.04564144089818001, - "eval_runtime": 117.4132, - "eval_samples_per_second": 17.034, - "eval_steps_per_second": 4.258, + "eval_cer": 0.8818524474751249, + "eval_loss": 0.05534271523356438, + "eval_runtime": 107.227, + "eval_samples_per_second": 18.652, + "eval_steps_per_second": 4.663, "step": 2000 }, { "epoch": 0.01, - "learning_rate": 0.00029847889370418387, - "loss": 0.052, + "learning_rate": 0.00029921846850933557, + "loss": 0.0748, "step": 2010 }, { "epoch": 0.01, - "learning_rate": 0.00029847132601116985, - "loss": 0.0563, + "learning_rate": 0.0002992145802929641, + "loss": 0.0765, "step": 2020 }, { "epoch": 0.01, - "learning_rate": 0.0002984637583181559, - "loss": 0.0644, + "learning_rate": 0.00029921069207659265, + "loss": 0.0679, "step": 2030 }, { "epoch": 0.01, - "learning_rate": 0.00029845619062514187, - "loss": 0.0555, + "learning_rate": 0.00029920680386022117, + "loss": 0.0698, "step": 2040 }, { "epoch": 0.01, - "learning_rate": 0.00029844862293212785, - "loss": 0.0578, + "learning_rate": 0.00029920291564384974, + "loss": 0.0723, "step": 2050 }, { "epoch": 0.01, - "learning_rate": 0.00029844105523911383, - "loss": 0.0626, + "learning_rate": 0.00029919902742747825, + "loss": 0.0768, "step": 2060 }, { "epoch": 0.01, - "learning_rate": 0.0002984334875460998, - "loss": 0.0582, + "learning_rate": 0.0002991951392111068, + "loss": 0.0664, "step": 2070 }, { "epoch": 0.01, - "learning_rate": 0.0002984259198530858, - "loss": 0.0599, + "learning_rate": 0.00029919125099473533, + "loss": 0.0647, "step": 2080 }, { "epoch": 0.01, - "learning_rate": 0.00029841835216007183, - "loss": 0.0776, + "learning_rate": 0.00029918736277836385, + "loss": 0.0678, "step": 2090 }, { "epoch": 0.01, - "learning_rate": 0.0002984107844670578, - "loss": 0.0647, + "learning_rate": 0.00029918347456199236, + "loss": 0.0812, "step": 2100 }, { "epoch": 0.01, - "learning_rate": 0.0002984032167740438, - "loss": 0.0603, + "learning_rate": 0.00029917958634562093, + "loss": 0.0666, "step": 2110 }, { "epoch": 0.01, - "learning_rate": 0.0002983956490810298, - "loss": 0.0652, + "learning_rate": 0.0002991756981292495, + "loss": 0.0857, "step": 2120 }, { "epoch": 0.01, - "learning_rate": 0.00029838808138801576, - "loss": 0.0623, + "learning_rate": 0.000299171809912878, + "loss": 0.0785, "step": 2130 }, { "epoch": 0.01, - "learning_rate": 0.00029838051369500174, - "loss": 0.0579, + "learning_rate": 0.00029916792169650653, + "loss": 0.0821, "step": 2140 }, { "epoch": 0.01, - "learning_rate": 0.0002983729460019877, - "loss": 0.0577, + "learning_rate": 0.0002991640334801351, + "loss": 0.0761, "step": 2150 }, { "epoch": 0.01, - "learning_rate": 0.00029836537830897375, - "loss": 0.0613, + "learning_rate": 0.0002991601452637636, + "loss": 0.0778, "step": 2160 }, { "epoch": 0.01, - "learning_rate": 0.00029835781061595974, - "loss": 0.0641, + "learning_rate": 0.0002991562570473921, + "loss": 0.0631, "step": 2170 }, { "epoch": 0.01, - "learning_rate": 0.0002983502429229457, - "loss": 0.0597, + "learning_rate": 0.0002991523688310207, + "loss": 0.069, "step": 2180 }, { "epoch": 0.01, - "learning_rate": 0.0002983426752299317, - "loss": 0.0632, + "learning_rate": 0.0002991484806146492, + "loss": 0.0718, "step": 2190 }, { "epoch": 0.01, - "learning_rate": 0.0002983351075369177, - "loss": 0.0626, + "learning_rate": 0.0002991445923982778, + "loss": 0.0633, "step": 2200 }, { "epoch": 0.01, - "learning_rate": 0.00029832753984390366, - "loss": 0.0596, + "learning_rate": 0.0002991407041819063, + "loss": 0.0653, "step": 2210 }, { "epoch": 0.01, - "learning_rate": 0.0002983199721508897, - "loss": 0.0594, + "learning_rate": 0.0002991368159655348, + "loss": 0.0659, "step": 2220 }, { "epoch": 0.01, - "learning_rate": 0.0002983124044578757, - "loss": 0.0628, + "learning_rate": 0.0002991329277491634, + "loss": 0.0608, "step": 2230 }, { "epoch": 0.01, - "learning_rate": 0.00029830483676486166, - "loss": 0.0622, + "learning_rate": 0.0002991290395327919, + "loss": 0.0725, "step": 2240 }, { "epoch": 0.01, - "learning_rate": 0.00029829726907184764, - "loss": 0.07, + "learning_rate": 0.0002991251513164204, + "loss": 0.0751, "step": 2250 }, { "epoch": 0.01, - "learning_rate": 0.0002982897013788336, - "loss": 0.0618, + "learning_rate": 0.000299121263100049, + "loss": 0.0726, "step": 2260 }, { "epoch": 0.01, - "learning_rate": 0.0002982821336858196, - "loss": 0.0629, + "learning_rate": 0.0002991173748836775, + "loss": 0.0653, "step": 2270 }, { "epoch": 0.01, - "learning_rate": 0.00029827456599280564, - "loss": 0.0638, + "learning_rate": 0.00029911348666730606, + "loss": 0.0627, "step": 2280 }, { "epoch": 0.01, - "learning_rate": 0.0002982669982997916, - "loss": 0.0545, + "learning_rate": 0.00029910959845093457, + "loss": 0.0625, "step": 2290 }, { "epoch": 0.01, - "learning_rate": 0.0002982594306067776, - "loss": 0.0578, + "learning_rate": 0.0002991057102345631, + "loss": 0.0615, "step": 2300 }, { "epoch": 0.01, - "learning_rate": 0.0002982518629137636, - "loss": 0.0553, + "learning_rate": 0.0002991018220181916, + "loss": 0.0675, "step": 2310 }, { "epoch": 0.01, - "learning_rate": 0.00029824429522074957, - "loss": 0.0535, + "learning_rate": 0.00029909793380182017, + "loss": 0.0709, "step": 2320 }, { "epoch": 0.01, - "learning_rate": 0.00029823672752773555, - "loss": 0.0537, + "learning_rate": 0.00029909404558544874, + "loss": 0.0631, "step": 2330 }, { "epoch": 0.01, - "learning_rate": 0.00029822915983472153, - "loss": 0.05, + "learning_rate": 0.00029909015736907725, + "loss": 0.0617, "step": 2340 }, { "epoch": 0.01, - "learning_rate": 0.00029822159214170756, - "loss": 0.0571, + "learning_rate": 0.00029908626915270577, + "loss": 0.0762, "step": 2350 }, { "epoch": 0.01, - "learning_rate": 0.00029821402444869355, - "loss": 0.0539, + "learning_rate": 0.00029908238093633434, + "loss": 0.0659, "step": 2360 }, { "epoch": 0.01, - "learning_rate": 0.00029820645675567953, - "loss": 0.0569, + "learning_rate": 0.00029907849271996285, + "loss": 0.0766, "step": 2370 }, { "epoch": 0.01, - "learning_rate": 0.0002981988890626655, - "loss": 0.0556, + "learning_rate": 0.00029907460450359137, + "loss": 0.0633, "step": 2380 }, { "epoch": 0.01, - "learning_rate": 0.0002981913213696515, - "loss": 0.0565, + "learning_rate": 0.00029907071628721993, + "loss": 0.0548, "step": 2390 }, { "epoch": 0.01, - "learning_rate": 0.00029818375367663747, - "loss": 0.0538, + "learning_rate": 0.00029906682807084845, + "loss": 0.0632, "step": 2400 }, { "epoch": 0.01, - "learning_rate": 0.0002981761859836235, - "loss": 0.0501, + "learning_rate": 0.000299062939854477, + "loss": 0.0565, "step": 2410 }, { "epoch": 0.01, - "learning_rate": 0.0002981686182906095, - "loss": 0.0545, + "learning_rate": 0.00029905905163810553, + "loss": 0.0635, "step": 2420 }, { "epoch": 0.01, - "learning_rate": 0.00029816105059759547, - "loss": 0.0578, + "learning_rate": 0.00029905516342173405, + "loss": 0.066, "step": 2430 }, { "epoch": 0.01, - "learning_rate": 0.00029815348290458145, - "loss": 0.052, + "learning_rate": 0.0002990512752053626, + "loss": 0.064, "step": 2440 }, { "epoch": 0.01, - "learning_rate": 0.00029814591521156743, - "loss": 0.0606, + "learning_rate": 0.00029904738698899113, + "loss": 0.0639, "step": 2450 }, { "epoch": 0.01, - "learning_rate": 0.0002981383475185534, + "learning_rate": 0.0002990434987726197, "loss": 0.0619, "step": 2460 }, { "epoch": 0.01, - "learning_rate": 0.00029813077982553945, - "loss": 0.0514, + "learning_rate": 0.0002990396105562482, + "loss": 0.068, "step": 2470 }, { "epoch": 0.01, - "learning_rate": 0.00029812321213252543, - "loss": 0.0585, + "learning_rate": 0.0002990357223398768, + "loss": 0.0636, "step": 2480 }, { "epoch": 0.01, - "learning_rate": 0.0002981156444395114, - "loss": 0.0566, + "learning_rate": 0.0002990318341235053, + "loss": 0.0596, "step": 2490 }, { "epoch": 0.01, - "learning_rate": 0.0002981080767464974, - "loss": 0.05, + "learning_rate": 0.0002990279459071338, + "loss": 0.0689, "step": 2500 }, { "epoch": 0.01, - "learning_rate": 0.0002981005090534834, - "loss": 0.0573, + "learning_rate": 0.0002990240576907623, + "loss": 0.0664, "step": 2510 }, { "epoch": 0.01, - "learning_rate": 0.00029809294136046936, - "loss": 0.0556, + "learning_rate": 0.0002990201694743909, + "loss": 0.0642, "step": 2520 }, { "epoch": 0.01, - "learning_rate": 0.00029808537366745534, - "loss": 0.0588, + "learning_rate": 0.0002990162812580194, + "loss": 0.0769, "step": 2530 }, { "epoch": 0.01, - "learning_rate": 0.0002980778059744414, - "loss": 0.0521, + "learning_rate": 0.000299012393041648, + "loss": 0.0666, "step": 2540 }, { "epoch": 0.01, - "learning_rate": 0.00029807023828142736, - "loss": 0.0625, + "learning_rate": 0.0002990085048252765, + "loss": 0.0638, "step": 2550 }, { "epoch": 0.01, - "learning_rate": 0.00029806267058841334, - "loss": 0.077, + "learning_rate": 0.000299004616608905, + "loss": 0.0627, "step": 2560 }, { "epoch": 0.01, - "learning_rate": 0.0002980551028953993, - "loss": 0.0558, + "learning_rate": 0.0002990007283925336, + "loss": 0.0687, "step": 2570 }, { "epoch": 0.01, - "learning_rate": 0.0002980475352023853, - "loss": 0.0603, + "learning_rate": 0.0002989968401761621, + "loss": 0.0614, "step": 2580 }, { "epoch": 0.01, - "learning_rate": 0.0002980399675093713, - "loss": 0.0523, + "learning_rate": 0.0002989929519597906, + "loss": 0.0713, "step": 2590 }, { "epoch": 0.01, - "learning_rate": 0.0002980323998163573, - "loss": 0.0529, + "learning_rate": 0.0002989890637434192, + "loss": 0.0697, "step": 2600 }, { "epoch": 0.01, - "learning_rate": 0.0002980248321233433, - "loss": 0.0549, + "learning_rate": 0.00029898517552704774, + "loss": 0.067, "step": 2610 }, { "epoch": 0.01, - "learning_rate": 0.0002980172644303293, - "loss": 0.0527, + "learning_rate": 0.00029898128731067626, + "loss": 0.0678, "step": 2620 }, { "epoch": 0.01, - "learning_rate": 0.00029800969673731526, - "loss": 0.0494, + "learning_rate": 0.00029897739909430477, + "loss": 0.0588, "step": 2630 }, { "epoch": 0.01, - "learning_rate": 0.00029800212904430124, - "loss": 0.0557, + "learning_rate": 0.0002989735108779333, + "loss": 0.0673, "step": 2640 }, { "epoch": 0.01, - "learning_rate": 0.0002979945613512872, - "loss": 0.056, + "learning_rate": 0.00029896962266156185, + "loss": 0.0685, "step": 2650 }, { "epoch": 0.01, - "learning_rate": 0.0002979869936582732, - "loss": 0.0545, + "learning_rate": 0.00029896573444519037, + "loss": 0.0745, "step": 2660 }, { "epoch": 0.01, - "learning_rate": 0.00029797942596525924, - "loss": 0.0517, + "learning_rate": 0.00029896184622881894, + "loss": 0.0798, "step": 2670 }, { "epoch": 0.01, - "learning_rate": 0.0002979718582722452, - "loss": 0.052, + "learning_rate": 0.00029895795801244745, + "loss": 0.0744, "step": 2680 }, { "epoch": 0.01, - "learning_rate": 0.0002979642905792312, - "loss": 0.0551, + "learning_rate": 0.000298954069796076, + "loss": 0.0809, "step": 2690 }, { "epoch": 0.01, - "learning_rate": 0.0002979567228862172, - "loss": 0.0493, + "learning_rate": 0.00029895018157970454, + "loss": 0.0668, "step": 2700 }, { "epoch": 0.01, - "learning_rate": 0.00029794915519320317, - "loss": 0.0518, + "learning_rate": 0.00029894629336333305, + "loss": 0.0775, "step": 2710 }, { "epoch": 0.01, - "learning_rate": 0.00029794158750018915, - "loss": 0.0528, + "learning_rate": 0.00029894240514696156, + "loss": 0.0732, "step": 2720 }, { "epoch": 0.01, - "learning_rate": 0.0002979340198071752, - "loss": 0.0472, + "learning_rate": 0.00029893851693059013, + "loss": 0.0708, "step": 2730 }, { "epoch": 0.01, - "learning_rate": 0.00029792645211416117, - "loss": 0.0541, + "learning_rate": 0.00029893462871421865, + "loss": 0.0628, "step": 2740 }, { "epoch": 0.01, - "learning_rate": 0.00029791888442114715, - "loss": 0.0504, + "learning_rate": 0.0002989307404978472, + "loss": 0.0631, "step": 2750 }, { "epoch": 0.01, - "learning_rate": 0.00029791131672813313, - "loss": 0.0628, + "learning_rate": 0.00029892685228147573, + "loss": 0.095, "step": 2760 }, { "epoch": 0.01, - "learning_rate": 0.0002979037490351191, - "loss": 0.0572, + "learning_rate": 0.00029892296406510425, + "loss": 0.0681, "step": 2770 }, { "epoch": 0.01, - "learning_rate": 0.0002978961813421051, - "loss": 0.0541, + "learning_rate": 0.0002989190758487328, + "loss": 0.0627, "step": 2780 }, { "epoch": 0.01, - "learning_rate": 0.00029788861364909113, - "loss": 0.0556, + "learning_rate": 0.00029891518763236133, + "loss": 0.0694, "step": 2790 }, { "epoch": 0.01, - "learning_rate": 0.0002978810459560771, - "loss": 0.0557, + "learning_rate": 0.00029891129941598984, + "loss": 0.0673, "step": 2800 }, { "epoch": 0.01, - "learning_rate": 0.0002978734782630631, - "loss": 0.0725, + "learning_rate": 0.0002989074111996184, + "loss": 0.0654, "step": 2810 }, { "epoch": 0.01, - "learning_rate": 0.00029786591057004907, - "loss": 0.0681, + "learning_rate": 0.000298903522983247, + "loss": 0.0688, "step": 2820 }, { "epoch": 0.01, - "learning_rate": 0.00029785834287703505, - "loss": 0.0572, + "learning_rate": 0.0002988996347668755, + "loss": 0.0673, "step": 2830 }, { "epoch": 0.01, - "learning_rate": 0.00029785077518402103, - "loss": 0.0536, + "learning_rate": 0.000298895746550504, + "loss": 0.0678, "step": 2840 }, { "epoch": 0.01, - "learning_rate": 0.000297843207491007, - "loss": 0.0545, + "learning_rate": 0.0002988918583341325, + "loss": 0.0686, "step": 2850 }, { "epoch": 0.01, - "learning_rate": 0.00029783563979799305, - "loss": 0.0573, + "learning_rate": 0.0002988879701177611, + "loss": 0.0708, "step": 2860 }, { "epoch": 0.01, - "learning_rate": 0.00029782807210497903, - "loss": 0.0519, + "learning_rate": 0.0002988840819013896, + "loss": 0.0866, "step": 2870 }, { "epoch": 0.01, - "learning_rate": 0.000297820504411965, - "loss": 0.0539, + "learning_rate": 0.0002988801936850182, + "loss": 0.0746, "step": 2880 }, { "epoch": 0.01, - "learning_rate": 0.000297812936718951, - "loss": 0.0611, + "learning_rate": 0.0002988763054686467, + "loss": 0.0657, "step": 2890 }, { "epoch": 0.01, - "learning_rate": 0.000297805369025937, - "loss": 0.0533, + "learning_rate": 0.00029887241725227526, + "loss": 0.0715, "step": 2900 }, { "epoch": 0.01, - "learning_rate": 0.00029779780133292296, - "loss": 0.0537, + "learning_rate": 0.0002988685290359038, + "loss": 0.0641, "step": 2910 }, { "epoch": 0.01, - "learning_rate": 0.000297790233639909, - "loss": 0.0529, + "learning_rate": 0.0002988646408195323, + "loss": 0.07, "step": 2920 }, { "epoch": 0.01, - "learning_rate": 0.000297782665946895, - "loss": 0.0539, + "learning_rate": 0.0002988607526031608, + "loss": 0.0689, "step": 2930 }, { "epoch": 0.01, - "learning_rate": 0.00029777509825388096, - "loss": 0.0511, + "learning_rate": 0.00029885686438678937, + "loss": 0.0578, "step": 2940 }, { "epoch": 0.01, - "learning_rate": 0.00029776753056086694, - "loss": 0.0568, + "learning_rate": 0.0002988529761704179, + "loss": 0.0586, "step": 2950 }, { "epoch": 0.01, - "learning_rate": 0.0002977599628678529, - "loss": 0.0534, + "learning_rate": 0.00029884908795404646, + "loss": 0.0629, "step": 2960 }, { "epoch": 0.01, - "learning_rate": 0.0002977523951748389, - "loss": 0.0514, + "learning_rate": 0.00029884519973767497, + "loss": 0.0664, "step": 2970 }, { - "epoch": 0.02, - "learning_rate": 0.00029774482748182494, - "loss": 0.059, + "epoch": 0.01, + "learning_rate": 0.0002988413115213035, + "loss": 0.0581, "step": 2980 }, { - "epoch": 0.02, - "learning_rate": 0.0002977372597888109, - "loss": 0.06, + "epoch": 0.01, + "learning_rate": 0.00029883742330493205, + "loss": 0.1604, "step": 2990 }, { - "epoch": 0.02, - "learning_rate": 0.0002977296920957969, - "loss": 0.071, + "epoch": 0.01, + "learning_rate": 0.00029883353508856057, + "loss": 0.1397, "step": 3000 }, { - "epoch": 0.02, - "eval_cer": 0.9145605027428246, - "eval_loss": 0.04296322166919708, - "eval_runtime": 117.3539, - "eval_samples_per_second": 17.042, - "eval_steps_per_second": 4.261, + "epoch": 0.01, + "eval_cer": 0.8836117911013883, + "eval_loss": 0.06463418900966644, + "eval_runtime": 107.8405, + "eval_samples_per_second": 18.546, + "eval_steps_per_second": 4.636, "step": 3000 }, { - "epoch": 0.02, - "learning_rate": 0.0002977221244027829, - "loss": 0.0634, + "epoch": 0.01, + "learning_rate": 0.00029882964687218914, + "loss": 0.0778, "step": 3010 }, { - "epoch": 0.02, - "learning_rate": 0.00029771455670976886, - "loss": 0.055, + "epoch": 0.01, + "learning_rate": 0.00029882575865581765, + "loss": 0.0669, "step": 3020 }, { - "epoch": 0.02, - "learning_rate": 0.00029770698901675484, - "loss": 0.0572, + "epoch": 0.01, + "learning_rate": 0.0002988218704394462, + "loss": 0.0723, "step": 3030 }, { - "epoch": 0.02, - "learning_rate": 0.0002976994213237408, - "loss": 0.0522, + "epoch": 0.01, + "learning_rate": 0.00029881798222307473, + "loss": 0.0695, "step": 3040 }, { - "epoch": 0.02, - "learning_rate": 0.00029769185363072686, - "loss": 0.0582, + "epoch": 0.01, + "learning_rate": 0.00029881409400670325, + "loss": 0.0611, "step": 3050 }, { - "epoch": 0.02, - "learning_rate": 0.00029768428593771284, - "loss": 0.0513, + "epoch": 0.01, + "learning_rate": 0.00029881020579033176, + "loss": 0.0761, "step": 3060 }, { - "epoch": 0.02, - "learning_rate": 0.0002976767182446988, - "loss": 0.0565, + "epoch": 0.01, + "learning_rate": 0.00029880631757396033, + "loss": 0.0636, "step": 3070 }, { - "epoch": 0.02, - "learning_rate": 0.0002976691505516848, - "loss": 0.0509, + "epoch": 0.01, + "learning_rate": 0.00029880242935758885, + "loss": 0.0658, "step": 3080 }, { - "epoch": 0.02, - "learning_rate": 0.0002976615828586708, - "loss": 0.0587, + "epoch": 0.01, + "learning_rate": 0.0002987985411412174, + "loss": 0.0685, "step": 3090 }, { - "epoch": 0.02, - "learning_rate": 0.00029765401516565677, - "loss": 0.0504, + "epoch": 0.01, + "learning_rate": 0.00029879465292484593, + "loss": 0.081, "step": 3100 }, { - "epoch": 0.02, - "learning_rate": 0.0002976464474726428, - "loss": 0.053, + "epoch": 0.01, + "learning_rate": 0.0002987907647084745, + "loss": 0.0649, "step": 3110 }, { - "epoch": 0.02, - "learning_rate": 0.0002976388797796288, - "loss": 0.0575, + "epoch": 0.01, + "learning_rate": 0.000298786876492103, + "loss": 0.0634, "step": 3120 }, { - "epoch": 0.02, - "learning_rate": 0.00029763131208661477, - "loss": 0.069, + "epoch": 0.01, + "learning_rate": 0.00029878298827573153, + "loss": 0.0747, "step": 3130 }, { - "epoch": 0.02, - "learning_rate": 0.00029762374439360075, - "loss": 0.0556, + "epoch": 0.01, + "learning_rate": 0.00029877910005936004, + "loss": 0.0699, "step": 3140 }, { - "epoch": 0.02, - "learning_rate": 0.00029761617670058673, - "loss": 0.0563, + "epoch": 0.01, + "learning_rate": 0.0002987752118429886, + "loss": 0.0661, "step": 3150 }, { - "epoch": 0.02, - "learning_rate": 0.0002976086090075727, - "loss": 0.0533, + "epoch": 0.01, + "learning_rate": 0.0002987713236266172, + "loss": 0.0721, "step": 3160 }, { - "epoch": 0.02, - "learning_rate": 0.0002976010413145587, - "loss": 0.0604, + "epoch": 0.01, + "learning_rate": 0.0002987674354102457, + "loss": 0.0964, "step": 3170 }, { - "epoch": 0.02, - "learning_rate": 0.0002975934736215447, - "loss": 0.0548, + "epoch": 0.01, + "learning_rate": 0.0002987635471938742, + "loss": 0.0708, "step": 3180 }, { - "epoch": 0.02, - "learning_rate": 0.00029758590592853066, - "loss": 0.0575, + "epoch": 0.01, + "learning_rate": 0.0002987596589775028, + "loss": 0.0742, "step": 3190 }, { - "epoch": 0.02, - "learning_rate": 0.00029757833823551664, - "loss": 0.0544, + "epoch": 0.01, + "learning_rate": 0.0002987557707611313, + "loss": 0.0671, "step": 3200 }, { - "epoch": 0.02, - "learning_rate": 0.0002975707705425026, - "loss": 0.0557, + "epoch": 0.01, + "learning_rate": 0.0002987518825447598, + "loss": 0.066, "step": 3210 }, { - "epoch": 0.02, - "learning_rate": 0.00029756320284948865, - "loss": 0.0545, + "epoch": 0.01, + "learning_rate": 0.0002987479943283884, + "loss": 0.0803, "step": 3220 }, { - "epoch": 0.02, - "learning_rate": 0.00029755563515647464, - "loss": 0.0549, + "epoch": 0.01, + "learning_rate": 0.0002987441061120169, + "loss": 0.0708, "step": 3230 }, { - "epoch": 0.02, - "learning_rate": 0.0002975480674634606, - "loss": 0.0504, + "epoch": 0.01, + "learning_rate": 0.00029874021789564546, + "loss": 0.052, "step": 3240 }, { - "epoch": 0.02, - "learning_rate": 0.0002975404997704466, - "loss": 0.0501, + "epoch": 0.01, + "learning_rate": 0.000298736329679274, + "loss": 0.0742, "step": 3250 }, { - "epoch": 0.02, - "learning_rate": 0.0002975329320774326, - "loss": 0.0545, + "epoch": 0.01, + "learning_rate": 0.0002987324414629025, + "loss": 0.0673, "step": 3260 }, { - "epoch": 0.02, - "learning_rate": 0.00029752536438441856, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.000298728553246531, + "loss": 0.0646, "step": 3270 }, { - "epoch": 0.02, - "learning_rate": 0.0002975177966914046, - "loss": 0.0476, + "epoch": 0.01, + "learning_rate": 0.00029872466503015957, + "loss": 0.0643, "step": 3280 }, { - "epoch": 0.02, - "learning_rate": 0.0002975102289983906, - "loss": 0.0596, + "epoch": 0.01, + "learning_rate": 0.0002987207768137881, + "loss": 0.0731, "step": 3290 }, { - "epoch": 0.02, - "learning_rate": 0.00029750266130537656, - "loss": 0.06, + "epoch": 0.01, + "learning_rate": 0.00029871688859741665, + "loss": 0.0835, "step": 3300 }, { - "epoch": 0.02, - "learning_rate": 0.00029749509361236254, - "loss": 0.0556, + "epoch": 0.01, + "learning_rate": 0.00029871300038104517, + "loss": 0.0708, "step": 3310 }, { - "epoch": 0.02, - "learning_rate": 0.0002974875259193485, - "loss": 0.0532, + "epoch": 0.01, + "learning_rate": 0.00029870911216467374, + "loss": 0.0607, "step": 3320 }, { - "epoch": 0.02, - "learning_rate": 0.0002974799582263345, - "loss": 0.0508, + "epoch": 0.01, + "learning_rate": 0.00029870522394830225, + "loss": 0.0564, "step": 3330 }, { - "epoch": 0.02, - "learning_rate": 0.00029747239053332054, - "loss": 0.0553, + "epoch": 0.01, + "learning_rate": 0.00029870133573193077, + "loss": 0.0643, "step": 3340 }, { - "epoch": 0.02, - "learning_rate": 0.0002974648228403065, - "loss": 0.0571, + "epoch": 0.01, + "learning_rate": 0.0002986974475155593, + "loss": 0.0694, "step": 3350 }, { - "epoch": 0.02, - "learning_rate": 0.0002974572551472925, - "loss": 0.0518, + "epoch": 0.01, + "learning_rate": 0.00029869355929918785, + "loss": 0.0565, "step": 3360 }, { - "epoch": 0.02, - "learning_rate": 0.0002974496874542785, - "loss": 0.0596, + "epoch": 0.01, + "learning_rate": 0.0002986896710828164, + "loss": 0.0655, "step": 3370 }, { - "epoch": 0.02, - "learning_rate": 0.00029744211976126447, - "loss": 0.0473, + "epoch": 0.01, + "learning_rate": 0.00029868578286644493, + "loss": 0.0634, "step": 3380 }, { - "epoch": 0.02, - "learning_rate": 0.00029743455206825045, - "loss": 0.0541, + "epoch": 0.01, + "learning_rate": 0.00029868189465007345, + "loss": 0.0642, "step": 3390 }, { - "epoch": 0.02, - "learning_rate": 0.00029742698437523643, - "loss": 0.0475, + "epoch": 0.01, + "learning_rate": 0.000298678006433702, + "loss": 0.0587, "step": 3400 }, { - "epoch": 0.02, - "learning_rate": 0.00029741941668222246, - "loss": 0.0535, + "epoch": 0.01, + "learning_rate": 0.00029867411821733053, + "loss": 0.0557, "step": 3410 }, { - "epoch": 0.02, - "learning_rate": 0.00029741184898920845, - "loss": 0.0912, + "epoch": 0.01, + "learning_rate": 0.00029867023000095905, + "loss": 0.0587, "step": 3420 }, { - "epoch": 0.02, - "learning_rate": 0.00029740428129619443, - "loss": 0.0654, + "epoch": 0.01, + "learning_rate": 0.0002986663417845876, + "loss": 0.0583, "step": 3430 }, { - "epoch": 0.02, - "learning_rate": 0.0002973967136031804, - "loss": 0.1074, + "epoch": 0.01, + "learning_rate": 0.00029866245356821613, + "loss": 0.0552, "step": 3440 }, { - "epoch": 0.02, - "learning_rate": 0.0002973891459101664, - "loss": 0.0576, + "epoch": 0.01, + "learning_rate": 0.0002986585653518447, + "loss": 0.063, "step": 3450 }, { - "epoch": 0.02, - "learning_rate": 0.00029738157821715237, - "loss": 0.0517, + "epoch": 0.01, + "learning_rate": 0.0002986546771354732, + "loss": 0.0531, "step": 3460 }, { - "epoch": 0.02, - "learning_rate": 0.0002973740105241384, - "loss": 0.0604, + "epoch": 0.01, + "learning_rate": 0.0002986507889191017, + "loss": 0.0575, "step": 3470 }, { - "epoch": 0.02, - "learning_rate": 0.0002973664428311244, - "loss": 0.0488, + "epoch": 0.01, + "learning_rate": 0.00029864690070273024, + "loss": 0.0635, "step": 3480 }, { - "epoch": 0.02, - "learning_rate": 0.00029735887513811037, - "loss": 0.0484, + "epoch": 0.01, + "learning_rate": 0.0002986430124863588, + "loss": 0.0619, "step": 3490 }, { - "epoch": 0.02, - "learning_rate": 0.00029735130744509635, - "loss": 0.0547, + "epoch": 0.01, + "learning_rate": 0.0002986391242699873, + "loss": 0.0759, "step": 3500 }, { - "epoch": 0.02, - "learning_rate": 0.00029734373975208233, - "loss": 0.0545, + "epoch": 0.01, + "learning_rate": 0.0002986352360536159, + "loss": 0.0633, "step": 3510 }, { - "epoch": 0.02, - "learning_rate": 0.0002973361720590683, - "loss": 0.0482, + "epoch": 0.01, + "learning_rate": 0.0002986313478372444, + "loss": 0.0698, "step": 3520 }, { - "epoch": 0.02, - "learning_rate": 0.00029732860436605435, - "loss": 0.0554, + "epoch": 0.01, + "learning_rate": 0.000298627459620873, + "loss": 0.0604, "step": 3530 }, { - "epoch": 0.02, - "learning_rate": 0.00029732103667304033, - "loss": 0.0561, + "epoch": 0.01, + "learning_rate": 0.0002986235714045015, + "loss": 0.0583, "step": 3540 }, { - "epoch": 0.02, - "learning_rate": 0.0002973134689800263, - "loss": 0.0556, + "epoch": 0.01, + "learning_rate": 0.00029861968318813, + "loss": 0.0602, "step": 3550 }, { - "epoch": 0.02, - "learning_rate": 0.0002973059012870123, - "loss": 0.0797, + "epoch": 0.01, + "learning_rate": 0.0002986157949717586, + "loss": 0.0535, "step": 3560 }, { - "epoch": 0.02, - "learning_rate": 0.0002972983335939983, - "loss": 0.0609, + "epoch": 0.01, + "learning_rate": 0.0002986119067553871, + "loss": 0.0602, "step": 3570 }, { - "epoch": 0.02, - "learning_rate": 0.00029729076590098426, - "loss": 0.1602, + "epoch": 0.01, + "learning_rate": 0.00029860801853901566, + "loss": 0.0705, "step": 3580 }, { - "epoch": 0.02, - "learning_rate": 0.00029728319820797024, - "loss": 0.0635, + "epoch": 0.01, + "learning_rate": 0.00029860413032264417, + "loss": 0.063, "step": 3590 }, { - "epoch": 0.02, - "learning_rate": 0.0002972756305149563, - "loss": 0.0597, + "epoch": 0.01, + "learning_rate": 0.0002986002421062727, + "loss": 0.0599, "step": 3600 }, { - "epoch": 0.02, - "learning_rate": 0.00029726806282194226, - "loss": 0.0554, + "epoch": 0.01, + "learning_rate": 0.00029859635388990126, + "loss": 0.0827, "step": 3610 }, { - "epoch": 0.02, - "learning_rate": 0.00029726049512892824, - "loss": 0.0558, + "epoch": 0.01, + "learning_rate": 0.00029859246567352977, + "loss": 0.0624, "step": 3620 }, { - "epoch": 0.02, - "learning_rate": 0.0002972529274359142, - "loss": 0.0559, + "epoch": 0.01, + "learning_rate": 0.0002985885774571583, + "loss": 0.0782, "step": 3630 }, { - "epoch": 0.02, - "learning_rate": 0.0002972453597429002, - "loss": 0.0551, + "epoch": 0.01, + "learning_rate": 0.00029858468924078685, + "loss": 0.0619, "step": 3640 }, { - "epoch": 0.02, - "learning_rate": 0.0002972377920498862, - "loss": 0.0566, + "epoch": 0.01, + "learning_rate": 0.0002985808010244154, + "loss": 0.0616, "step": 3650 }, { - "epoch": 0.02, - "learning_rate": 0.0002972302243568722, - "loss": 0.0545, + "epoch": 0.01, + "learning_rate": 0.00029857691280804394, + "loss": 0.0596, "step": 3660 }, { - "epoch": 0.02, - "learning_rate": 0.0002972226566638582, - "loss": 0.0498, + "epoch": 0.01, + "learning_rate": 0.00029857302459167245, + "loss": 0.0691, "step": 3670 }, { - "epoch": 0.02, - "learning_rate": 0.0002972150889708442, - "loss": 0.052, + "epoch": 0.01, + "learning_rate": 0.00029856913637530097, + "loss": 0.0569, "step": 3680 }, { - "epoch": 0.02, - "learning_rate": 0.00029720752127783016, - "loss": 0.0546, + "epoch": 0.01, + "learning_rate": 0.00029856524815892953, + "loss": 0.0574, "step": 3690 }, { - "epoch": 0.02, - "learning_rate": 0.00029719995358481614, - "loss": 0.0547, + "epoch": 0.01, + "learning_rate": 0.00029856135994255805, + "loss": 0.0601, "step": 3700 }, { - "epoch": 0.02, - "learning_rate": 0.0002971923858918021, - "loss": 0.0474, + "epoch": 0.01, + "learning_rate": 0.0002985574717261866, + "loss": 0.0571, "step": 3710 }, { - "epoch": 0.02, - "learning_rate": 0.0002971848181987881, - "loss": 0.0519, + "epoch": 0.01, + "learning_rate": 0.00029855358350981513, + "loss": 0.0541, "step": 3720 }, { - "epoch": 0.02, - "learning_rate": 0.00029717725050577414, - "loss": 0.0477, + "epoch": 0.01, + "learning_rate": 0.00029854969529344365, + "loss": 0.0568, "step": 3730 }, { - "epoch": 0.02, - "learning_rate": 0.0002971696828127601, - "loss": 0.0469, + "epoch": 0.01, + "learning_rate": 0.0002985458070770722, + "loss": 0.0597, "step": 3740 }, { - "epoch": 0.02, - "learning_rate": 0.0002971621151197461, - "loss": 0.0513, + "epoch": 0.01, + "learning_rate": 0.00029854191886070073, + "loss": 0.0655, "step": 3750 }, { - "epoch": 0.02, - "learning_rate": 0.0002971545474267321, - "loss": 0.0462, + "epoch": 0.01, + "learning_rate": 0.00029853803064432924, + "loss": 0.0588, "step": 3760 }, { - "epoch": 0.02, - "learning_rate": 0.00029714697973371807, - "loss": 0.0553, + "epoch": 0.01, + "learning_rate": 0.0002985341424279578, + "loss": 0.0641, "step": 3770 }, { - "epoch": 0.02, - "learning_rate": 0.00029713941204070405, - "loss": 0.0615, + "epoch": 0.01, + "learning_rate": 0.00029853025421158633, + "loss": 0.068, "step": 3780 }, { - "epoch": 0.02, - "learning_rate": 0.0002971318443476901, - "loss": 0.0498, + "epoch": 0.01, + "learning_rate": 0.0002985263659952149, + "loss": 0.0597, "step": 3790 }, { - "epoch": 0.02, - "learning_rate": 0.00029712427665467607, - "loss": 0.0577, + "epoch": 0.01, + "learning_rate": 0.0002985224777788434, + "loss": 0.0619, "step": 3800 }, { - "epoch": 0.02, - "learning_rate": 0.00029711670896166205, - "loss": 0.0521, + "epoch": 0.01, + "learning_rate": 0.0002985185895624719, + "loss": 0.0554, "step": 3810 }, { - "epoch": 0.02, - "learning_rate": 0.00029710914126864803, - "loss": 0.0528, + "epoch": 0.01, + "learning_rate": 0.0002985147013461005, + "loss": 0.052, "step": 3820 }, { - "epoch": 0.02, - "learning_rate": 0.000297101573575634, - "loss": 0.0476, + "epoch": 0.01, + "learning_rate": 0.000298510813129729, + "loss": 0.0584, "step": 3830 }, { - "epoch": 0.02, - "learning_rate": 0.00029709400588262, - "loss": 0.0474, + "epoch": 0.01, + "learning_rate": 0.0002985069249133575, + "loss": 0.056, "step": 3840 }, { - "epoch": 0.02, - "learning_rate": 0.00029708643818960603, - "loss": 0.0548, + "epoch": 0.01, + "learning_rate": 0.0002985030366969861, + "loss": 0.0499, "step": 3850 }, { - "epoch": 0.02, - "learning_rate": 0.000297078870496592, - "loss": 0.0538, + "epoch": 0.01, + "learning_rate": 0.00029849914848061466, + "loss": 0.0667, "step": 3860 }, { - "epoch": 0.02, - "learning_rate": 0.000297071302803578, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.0002984952602642432, + "loss": 0.053, "step": 3870 }, { - "epoch": 0.02, - "learning_rate": 0.00029706373511056397, - "loss": 0.052, + "epoch": 0.01, + "learning_rate": 0.0002984913720478717, + "loss": 0.0802, "step": 3880 }, { - "epoch": 0.02, - "learning_rate": 0.00029705616741754995, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.0002984874838315002, + "loss": 0.0703, "step": 3890 }, { - "epoch": 0.02, - "learning_rate": 0.00029704859972453593, - "loss": 0.0462, + "epoch": 0.01, + "learning_rate": 0.0002984835956151288, + "loss": 0.0608, "step": 3900 }, { - "epoch": 0.02, - "learning_rate": 0.0002970410320315219, - "loss": 0.0425, + "epoch": 0.01, + "learning_rate": 0.0002984797073987573, + "loss": 0.0551, "step": 3910 }, { - "epoch": 0.02, - "learning_rate": 0.00029703346433850795, - "loss": 0.0561, + "epoch": 0.01, + "learning_rate": 0.00029847581918238586, + "loss": 0.0563, "step": 3920 }, { - "epoch": 0.02, - "learning_rate": 0.00029702589664549393, - "loss": 0.0472, + "epoch": 0.01, + "learning_rate": 0.00029847193096601437, + "loss": 0.0546, "step": 3930 }, { - "epoch": 0.02, - "learning_rate": 0.0002970183289524799, - "loss": 0.0526, + "epoch": 0.01, + "learning_rate": 0.00029846804274964294, + "loss": 0.0533, "step": 3940 }, { - "epoch": 0.02, - "learning_rate": 0.0002970107612594659, - "loss": 0.047, + "epoch": 0.01, + "learning_rate": 0.00029846415453327145, + "loss": 0.0598, "step": 3950 }, { - "epoch": 0.02, - "learning_rate": 0.0002970031935664519, - "loss": 0.051, + "epoch": 0.01, + "learning_rate": 0.00029846026631689997, + "loss": 0.0662, "step": 3960 }, { - "epoch": 0.02, - "learning_rate": 0.00029699562587343786, - "loss": 0.0456, + "epoch": 0.01, + "learning_rate": 0.0002984563781005285, + "loss": 0.0501, "step": 3970 }, { - "epoch": 0.02, - "learning_rate": 0.0002969880581804239, - "loss": 0.0425, + "epoch": 0.01, + "learning_rate": 0.00029845248988415705, + "loss": 0.0574, "step": 3980 }, { - "epoch": 0.02, - "learning_rate": 0.0002969804904874099, - "loss": 0.0543, + "epoch": 0.01, + "learning_rate": 0.00029844860166778557, + "loss": 0.058, "step": 3990 }, { - "epoch": 0.02, - "learning_rate": 0.00029697292279439586, - "loss": 0.0542, + "epoch": 0.01, + "learning_rate": 0.00029844471345141414, + "loss": 0.0488, "step": 4000 }, { - "epoch": 0.02, - "eval_cer": 0.9145430356125674, - "eval_loss": 0.038954902440309525, - "eval_runtime": 117.4435, - "eval_samples_per_second": 17.029, - "eval_steps_per_second": 4.257, + "epoch": 0.01, + "eval_cer": 0.8818566463859275, + "eval_loss": 0.04614216089248657, + "eval_runtime": 108.2516, + "eval_samples_per_second": 18.475, + "eval_steps_per_second": 4.619, "step": 4000 }, { - "epoch": 0.02, - "learning_rate": 0.00029696535510138184, - "loss": 0.0502, + "epoch": 0.01, + "learning_rate": 0.00029844082523504265, + "loss": 0.0674, "step": 4010 }, { - "epoch": 0.02, - "learning_rate": 0.0002969577874083678, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.00029843693701867116, + "loss": 0.0578, "step": 4020 }, { - "epoch": 0.02, - "learning_rate": 0.0002969502197153538, - "loss": 0.0519, + "epoch": 0.01, + "learning_rate": 0.00029843304880229973, + "loss": 0.0618, "step": 4030 }, { - "epoch": 0.02, - "learning_rate": 0.00029694265202233984, - "loss": 0.0464, + "epoch": 0.01, + "learning_rate": 0.00029842916058592825, + "loss": 0.0501, "step": 4040 }, { - "epoch": 0.02, - "learning_rate": 0.0002969350843293258, - "loss": 0.0494, + "epoch": 0.01, + "learning_rate": 0.0002984252723695568, + "loss": 0.0549, "step": 4050 }, { - "epoch": 0.02, - "learning_rate": 0.0002969275166363118, - "loss": 0.0455, + "epoch": 0.01, + "learning_rate": 0.00029842138415318533, + "loss": 0.0528, "step": 4060 }, { - "epoch": 0.02, - "learning_rate": 0.0002969199489432978, - "loss": 0.0543, + "epoch": 0.01, + "learning_rate": 0.0002984174959368139, + "loss": 0.0546, "step": 4070 }, { - "epoch": 0.02, - "learning_rate": 0.00029691238125028376, - "loss": 0.0464, + "epoch": 0.01, + "learning_rate": 0.0002984136077204424, + "loss": 0.062, "step": 4080 }, { - "epoch": 0.02, - "learning_rate": 0.00029690481355726974, - "loss": 0.0518, + "epoch": 0.01, + "learning_rate": 0.00029840971950407093, + "loss": 0.0536, "step": 4090 }, { - "epoch": 0.02, - "learning_rate": 0.0002968972458642557, - "loss": 0.0526, + "epoch": 0.01, + "learning_rate": 0.00029840583128769944, + "loss": 0.0546, "step": 4100 }, { - "epoch": 0.02, - "learning_rate": 0.00029688967817124176, - "loss": 0.0541, + "epoch": 0.01, + "learning_rate": 0.000298401943071328, + "loss": 0.0492, "step": 4110 }, { - "epoch": 0.02, - "learning_rate": 0.00029688211047822774, - "loss": 0.0511, + "epoch": 0.01, + "learning_rate": 0.0002983980548549565, + "loss": 0.0491, "step": 4120 }, { - "epoch": 0.02, - "learning_rate": 0.0002968745427852137, - "loss": 0.0495, + "epoch": 0.01, + "learning_rate": 0.0002983941666385851, + "loss": 0.0528, "step": 4130 }, { - "epoch": 0.02, - "learning_rate": 0.0002968669750921997, - "loss": 0.0424, + "epoch": 0.01, + "learning_rate": 0.0002983902784222136, + "loss": 0.059, "step": 4140 }, { - "epoch": 0.02, - "learning_rate": 0.0002968594073991857, - "loss": 0.0516, + "epoch": 0.01, + "learning_rate": 0.0002983863902058422, + "loss": 0.0551, "step": 4150 }, { - "epoch": 0.02, - "learning_rate": 0.00029685183970617167, - "loss": 0.0454, + "epoch": 0.01, + "learning_rate": 0.0002983825019894707, + "loss": 0.0738, "step": 4160 }, { - "epoch": 0.02, - "learning_rate": 0.0002968442720131577, - "loss": 0.0522, + "epoch": 0.01, + "learning_rate": 0.0002983786137730992, + "loss": 0.0697, "step": 4170 }, { - "epoch": 0.02, - "learning_rate": 0.0002968367043201437, - "loss": 0.0516, + "epoch": 0.01, + "learning_rate": 0.0002983747255567277, + "loss": 0.0554, "step": 4180 }, { - "epoch": 0.02, - "learning_rate": 0.00029682913662712967, - "loss": 0.0462, + "epoch": 0.01, + "learning_rate": 0.0002983708373403563, + "loss": 0.0623, "step": 4190 }, { - "epoch": 0.02, - "learning_rate": 0.00029682156893411565, - "loss": 0.0546, + "epoch": 0.01, + "learning_rate": 0.00029836694912398486, + "loss": 0.0579, "step": 4200 }, { - "epoch": 0.02, - "learning_rate": 0.00029681400124110163, - "loss": 0.0444, + "epoch": 0.01, + "learning_rate": 0.0002983630609076134, + "loss": 0.0583, "step": 4210 }, { - "epoch": 0.02, - "learning_rate": 0.0002968064335480876, - "loss": 0.0504, + "epoch": 0.01, + "learning_rate": 0.0002983591726912419, + "loss": 0.058, "step": 4220 }, { - "epoch": 0.02, - "learning_rate": 0.0002967988658550736, - "loss": 0.0566, + "epoch": 0.01, + "learning_rate": 0.0002983552844748704, + "loss": 0.0461, "step": 4230 }, { - "epoch": 0.02, - "learning_rate": 0.00029679129816205963, - "loss": 0.0473, + "epoch": 0.01, + "learning_rate": 0.00029835139625849897, + "loss": 0.0552, "step": 4240 }, { - "epoch": 0.02, - "learning_rate": 0.0002967837304690456, - "loss": 0.048, + "epoch": 0.01, + "learning_rate": 0.0002983475080421275, + "loss": 0.0575, "step": 4250 }, { - "epoch": 0.02, - "learning_rate": 0.0002967761627760316, - "loss": 0.049, + "epoch": 0.01, + "learning_rate": 0.00029834361982575606, + "loss": 0.0514, "step": 4260 }, { - "epoch": 0.02, - "learning_rate": 0.0002967685950830176, - "loss": 0.0518, + "epoch": 0.01, + "learning_rate": 0.00029833973160938457, + "loss": 0.0558, "step": 4270 }, { - "epoch": 0.02, - "learning_rate": 0.00029676102739000355, - "loss": 0.0496, + "epoch": 0.01, + "learning_rate": 0.00029833584339301314, + "loss": 0.0576, "step": 4280 }, { - "epoch": 0.02, - "learning_rate": 0.00029675345969698954, - "loss": 0.0528, + "epoch": 0.01, + "learning_rate": 0.00029833195517664165, + "loss": 0.0573, "step": 4290 }, { - "epoch": 0.02, - "learning_rate": 0.00029674589200397557, - "loss": 0.0442, + "epoch": 0.01, + "learning_rate": 0.00029832806696027017, + "loss": 0.0564, "step": 4300 }, { - "epoch": 0.02, - "learning_rate": 0.00029673832431096155, - "loss": 0.0463, + "epoch": 0.01, + "learning_rate": 0.0002983241787438987, + "loss": 0.0581, "step": 4310 }, { - "epoch": 0.02, - "learning_rate": 0.00029673075661794753, - "loss": 0.0494, + "epoch": 0.01, + "learning_rate": 0.00029832029052752725, + "loss": 0.0578, "step": 4320 }, { - "epoch": 0.02, - "learning_rate": 0.0002967231889249335, - "loss": 0.0448, + "epoch": 0.01, + "learning_rate": 0.00029831640231115577, + "loss": 0.0556, "step": 4330 }, { - "epoch": 0.02, - "learning_rate": 0.0002967156212319195, - "loss": 0.0654, + "epoch": 0.01, + "learning_rate": 0.00029831251409478433, + "loss": 0.0532, "step": 4340 }, { - "epoch": 0.02, - "learning_rate": 0.0002967080535389055, - "loss": 0.0627, + "epoch": 0.01, + "learning_rate": 0.00029830862587841285, + "loss": 0.0515, "step": 4350 }, { - "epoch": 0.02, - "learning_rate": 0.0002967004858458915, - "loss": 0.0456, + "epoch": 0.01, + "learning_rate": 0.0002983047376620414, + "loss": 0.0657, "step": 4360 }, { - "epoch": 0.02, - "learning_rate": 0.0002966929181528775, - "loss": 0.0504, + "epoch": 0.01, + "learning_rate": 0.00029830084944566993, + "loss": 0.0505, "step": 4370 }, { - "epoch": 0.02, - "learning_rate": 0.0002966853504598635, - "loss": 0.046, + "epoch": 0.01, + "learning_rate": 0.00029829696122929845, + "loss": 0.0577, "step": 4380 }, { - "epoch": 0.02, - "learning_rate": 0.00029667778276684946, - "loss": 0.046, + "epoch": 0.01, + "learning_rate": 0.00029829307301292696, + "loss": 0.0532, "step": 4390 }, { - "epoch": 0.02, - "learning_rate": 0.00029667021507383544, - "loss": 0.0498, + "epoch": 0.01, + "learning_rate": 0.00029828918479655553, + "loss": 0.0619, "step": 4400 }, { - "epoch": 0.02, - "learning_rate": 0.0002966626473808214, - "loss": 0.0465, + "epoch": 0.01, + "learning_rate": 0.0002982852965801841, + "loss": 0.0569, "step": 4410 }, { - "epoch": 0.02, - "learning_rate": 0.0002966550796878074, - "loss": 0.0443, + "epoch": 0.01, + "learning_rate": 0.0002982814083638126, + "loss": 0.0599, "step": 4420 }, { - "epoch": 0.02, - "learning_rate": 0.0002966475119947934, - "loss": 0.0482, + "epoch": 0.01, + "learning_rate": 0.00029827752014744113, + "loss": 0.0542, "step": 4430 }, { - "epoch": 0.02, - "learning_rate": 0.00029663994430177937, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.0002982736319310697, + "loss": 0.0615, "step": 4440 }, { - "epoch": 0.02, - "learning_rate": 0.00029663237660876535, - "loss": 0.0473, + "epoch": 0.01, + "learning_rate": 0.0002982697437146982, + "loss": 0.057, "step": 4450 }, { - "epoch": 0.02, - "learning_rate": 0.00029662480891575133, - "loss": 0.0463, + "epoch": 0.01, + "learning_rate": 0.0002982658554983267, + "loss": 0.0589, "step": 4460 }, { - "epoch": 0.02, - "learning_rate": 0.00029661724122273736, - "loss": 0.0426, + "epoch": 0.01, + "learning_rate": 0.0002982619672819553, + "loss": 0.0551, "step": 4470 }, { - "epoch": 0.02, - "learning_rate": 0.00029660967352972335, - "loss": 0.045, + "epoch": 0.01, + "learning_rate": 0.0002982580790655838, + "loss": 0.061, "step": 4480 }, { - "epoch": 0.02, - "learning_rate": 0.00029660210583670933, - "loss": 0.0493, + "epoch": 0.01, + "learning_rate": 0.0002982541908492124, + "loss": 0.052, "step": 4490 }, { - "epoch": 0.02, - "learning_rate": 0.0002965945381436953, - "loss": 0.0462, + "epoch": 0.01, + "learning_rate": 0.0002982503026328409, + "loss": 0.0536, "step": 4500 }, { - "epoch": 0.02, - "learning_rate": 0.0002965869704506813, - "loss": 0.047, + "epoch": 0.01, + "learning_rate": 0.0002982464144164694, + "loss": 0.0537, "step": 4510 }, { - "epoch": 0.02, - "learning_rate": 0.00029657940275766727, - "loss": 0.048, + "epoch": 0.01, + "learning_rate": 0.0002982425262000979, + "loss": 0.0709, "step": 4520 }, { - "epoch": 0.02, - "learning_rate": 0.0002965718350646533, - "loss": 0.0553, + "epoch": 0.01, + "learning_rate": 0.0002982386379837265, + "loss": 0.0524, "step": 4530 }, { - "epoch": 0.02, - "learning_rate": 0.0002965642673716393, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.000298234749767355, + "loss": 0.0562, "step": 4540 }, { - "epoch": 0.02, - "learning_rate": 0.00029655669967862527, - "loss": 0.0472, + "epoch": 0.01, + "learning_rate": 0.00029823086155098357, + "loss": 0.061, "step": 4550 }, { - "epoch": 0.02, - "learning_rate": 0.00029654913198561125, - "loss": 0.0441, + "epoch": 0.01, + "learning_rate": 0.0002982269733346121, + "loss": 0.0584, "step": 4560 }, { - "epoch": 0.02, - "learning_rate": 0.00029654156429259723, - "loss": 0.0496, + "epoch": 0.01, + "learning_rate": 0.00029822308511824066, + "loss": 0.0648, "step": 4570 }, { - "epoch": 0.02, - "learning_rate": 0.0002965339965995832, - "loss": 0.0417, + "epoch": 0.01, + "learning_rate": 0.00029821919690186917, + "loss": 0.0624, "step": 4580 }, { - "epoch": 0.02, - "learning_rate": 0.00029652642890656925, - "loss": 0.0459, + "epoch": 0.01, + "learning_rate": 0.0002982153086854977, + "loss": 0.0833, "step": 4590 }, { - "epoch": 0.02, - "learning_rate": 0.00029651886121355523, - "loss": 0.0412, + "epoch": 0.01, + "learning_rate": 0.00029821142046912625, + "loss": 0.0506, "step": 4600 }, { - "epoch": 0.02, - "learning_rate": 0.0002965112935205412, - "loss": 0.0461, + "epoch": 0.01, + "learning_rate": 0.00029820753225275477, + "loss": 0.0602, "step": 4610 }, { - "epoch": 0.02, - "learning_rate": 0.0002965037258275272, - "loss": 0.0502, + "epoch": 0.01, + "learning_rate": 0.00029820364403638334, + "loss": 0.0497, "step": 4620 }, { - "epoch": 0.02, - "learning_rate": 0.0002964961581345132, - "loss": 0.0614, + "epoch": 0.01, + "learning_rate": 0.00029819975582001185, + "loss": 0.0742, "step": 4630 }, { - "epoch": 0.02, - "learning_rate": 0.00029648859044149916, - "loss": 0.0506, + "epoch": 0.01, + "learning_rate": 0.00029819586760364037, + "loss": 0.0569, "step": 4640 }, { - "epoch": 0.02, - "learning_rate": 0.00029648102274848514, - "loss": 0.0487, + "epoch": 0.01, + "learning_rate": 0.00029819197938726894, + "loss": 0.0489, "step": 4650 }, { - "epoch": 0.02, - "learning_rate": 0.0002964734550554712, - "loss": 0.0505, + "epoch": 0.01, + "learning_rate": 0.00029818809117089745, + "loss": 0.0821, "step": 4660 }, { - "epoch": 0.02, - "learning_rate": 0.00029646588736245716, - "loss": 0.0527, + "epoch": 0.01, + "learning_rate": 0.00029818420295452596, + "loss": 0.0609, "step": 4670 }, { - "epoch": 0.02, - "learning_rate": 0.00029645831966944314, - "loss": 0.0573, + "epoch": 0.01, + "learning_rate": 0.00029818031473815453, + "loss": 0.0532, "step": 4680 }, { - "epoch": 0.02, - "learning_rate": 0.0002964507519764291, - "loss": 0.0635, + "epoch": 0.01, + "learning_rate": 0.00029817642652178305, + "loss": 0.0577, "step": 4690 }, { - "epoch": 0.02, - "learning_rate": 0.0002964431842834151, - "loss": 0.0447, + "epoch": 0.01, + "learning_rate": 0.0002981725383054116, + "loss": 0.0579, "step": 4700 }, { - "epoch": 0.02, - "learning_rate": 0.0002964356165904011, - "loss": 0.0517, + "epoch": 0.01, + "learning_rate": 0.00029816865008904013, + "loss": 0.0674, "step": 4710 }, { - "epoch": 0.02, - "learning_rate": 0.0002964280488973871, - "loss": 0.0665, + "epoch": 0.01, + "learning_rate": 0.00029816476187266865, + "loss": 0.0576, "step": 4720 }, { - "epoch": 0.02, - "learning_rate": 0.0002964204812043731, - "loss": 0.0506, + "epoch": 0.01, + "learning_rate": 0.00029816087365629716, + "loss": 0.0607, "step": 4730 }, { - "epoch": 0.02, - "learning_rate": 0.0002964129135113591, - "loss": 0.0562, + "epoch": 0.01, + "learning_rate": 0.00029815698543992573, + "loss": 0.0517, "step": 4740 }, { - "epoch": 0.02, - "learning_rate": 0.00029640534581834506, - "loss": 0.052, + "epoch": 0.01, + "learning_rate": 0.0002981530972235543, + "loss": 0.0606, "step": 4750 }, { - "epoch": 0.02, - "learning_rate": 0.00029639777812533104, - "loss": 0.0505, + "epoch": 0.01, + "learning_rate": 0.0002981492090071828, + "loss": 0.0658, "step": 4760 }, { - "epoch": 0.02, - "learning_rate": 0.000296390210432317, - "loss": 0.0509, + "epoch": 0.01, + "learning_rate": 0.0002981453207908113, + "loss": 0.0594, "step": 4770 }, { - "epoch": 0.02, - "learning_rate": 0.000296382642739303, - "loss": 0.046, + "epoch": 0.01, + "learning_rate": 0.0002981414325744399, + "loss": 0.0844, "step": 4780 }, { - "epoch": 0.02, - "learning_rate": 0.00029637507504628904, - "loss": 0.0936, + "epoch": 0.01, + "learning_rate": 0.0002981375443580684, + "loss": 0.0531, "step": 4790 }, { - "epoch": 0.02, - "learning_rate": 0.000296367507353275, - "loss": 0.0593, + "epoch": 0.01, + "learning_rate": 0.0002981336561416969, + "loss": 0.0609, "step": 4800 }, { - "epoch": 0.02, - "learning_rate": 0.000296359939660261, - "loss": 0.0514, + "epoch": 0.01, + "learning_rate": 0.0002981297679253255, + "loss": 0.0573, "step": 4810 }, { - "epoch": 0.02, - "learning_rate": 0.000296352371967247, - "loss": 0.0491, + "epoch": 0.01, + "learning_rate": 0.000298125879708954, + "loss": 0.0534, "step": 4820 }, { - "epoch": 0.02, - "learning_rate": 0.00029634480427423297, - "loss": 0.0521, + "epoch": 0.01, + "learning_rate": 0.0002981219914925826, + "loss": 0.0508, "step": 4830 }, { - "epoch": 0.02, - "learning_rate": 0.00029633723658121895, - "loss": 0.0521, + "epoch": 0.01, + "learning_rate": 0.0002981181032762111, + "loss": 0.0756, "step": 4840 }, { - "epoch": 0.02, - "learning_rate": 0.000296329668888205, - "loss": 0.0527, + "epoch": 0.01, + "learning_rate": 0.0002981142150598396, + "loss": 0.0727, "step": 4850 }, { - "epoch": 0.02, - "learning_rate": 0.00029632210119519097, - "loss": 0.0649, + "epoch": 0.01, + "learning_rate": 0.0002981103268434682, + "loss": 0.0594, "step": 4860 }, { - "epoch": 0.02, - "learning_rate": 0.00029631453350217695, - "loss": 0.0527, + "epoch": 0.01, + "learning_rate": 0.0002981064386270967, + "loss": 0.0571, "step": 4870 }, { - "epoch": 0.02, - "learning_rate": 0.00029630696580916293, - "loss": 0.0539, + "epoch": 0.01, + "learning_rate": 0.0002981025504107252, + "loss": 0.0594, "step": 4880 }, { - "epoch": 0.02, - "learning_rate": 0.0002962993981161489, - "loss": 0.0478, + "epoch": 0.01, + "learning_rate": 0.00029809866219435377, + "loss": 0.0587, "step": 4890 }, { - "epoch": 0.02, - "learning_rate": 0.0002962918304231349, - "loss": 0.0465, + "epoch": 0.01, + "learning_rate": 0.00029809477397798234, + "loss": 0.0628, "step": 4900 }, { - "epoch": 0.02, - "learning_rate": 0.00029628426273012093, - "loss": 0.0743, + "epoch": 0.01, + "learning_rate": 0.00029809088576161085, + "loss": 0.0529, "step": 4910 }, { - "epoch": 0.02, - "learning_rate": 0.0002962766950371069, - "loss": 0.073, + "epoch": 0.01, + "learning_rate": 0.00029808699754523937, + "loss": 0.0587, "step": 4920 }, { - "epoch": 0.02, - "learning_rate": 0.0002962691273440929, - "loss": 0.0692, + "epoch": 0.01, + "learning_rate": 0.0002980831093288679, + "loss": 0.0587, "step": 4930 }, { - "epoch": 0.02, - "learning_rate": 0.00029626155965107887, - "loss": 0.044, + "epoch": 0.01, + "learning_rate": 0.00029807922111249645, + "loss": 0.0533, "step": 4940 }, { - "epoch": 0.02, - "learning_rate": 0.00029625399195806485, - "loss": 0.0441, + "epoch": 0.01, + "learning_rate": 0.00029807533289612497, + "loss": 0.061, "step": 4950 }, { - "epoch": 0.03, - "learning_rate": 0.00029624642426505083, - "loss": 0.0501, + "epoch": 0.01, + "learning_rate": 0.00029807144467975354, + "loss": 0.057, "step": 4960 }, { - "epoch": 0.03, - "learning_rate": 0.0002962388565720368, - "loss": 0.0458, + "epoch": 0.01, + "learning_rate": 0.00029806755646338205, + "loss": 0.0561, "step": 4970 }, { - "epoch": 0.03, - "learning_rate": 0.00029623128887902285, - "loss": 0.0422, + "epoch": 0.01, + "learning_rate": 0.00029806366824701057, + "loss": 0.0564, "step": 4980 }, { - "epoch": 0.03, - "learning_rate": 0.00029622372118600883, - "loss": 0.0495, + "epoch": 0.01, + "learning_rate": 0.00029805978003063913, + "loss": 0.0618, "step": 4990 }, { - "epoch": 0.03, - "learning_rate": 0.0002962161534929948, - "loss": 0.0464, + "epoch": 0.01, + "learning_rate": 0.00029805589181426765, + "loss": 0.0533, "step": 5000 }, { - "epoch": 0.03, - "eval_cer": 0.9145071309559275, - "eval_loss": 0.03470829501748085, - "eval_runtime": 117.4598, - "eval_samples_per_second": 17.027, - "eval_steps_per_second": 4.257, + "epoch": 0.01, + "eval_cer": 0.8818384511057832, + "eval_loss": 0.04352134093642235, + "eval_runtime": 107.4217, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.655, "step": 5000 }, { - "epoch": 0.03, - "learning_rate": 0.0002962085857999808, - "loss": 0.0427, + "epoch": 0.01, + "learning_rate": 0.00029805200359789616, + "loss": 0.0524, "step": 5010 }, { - "epoch": 0.03, - "learning_rate": 0.0002962010181069668, - "loss": 0.0465, + "epoch": 0.01, + "learning_rate": 0.00029804811538152473, + "loss": 0.0565, "step": 5020 }, { - "epoch": 0.03, - "learning_rate": 0.00029619345041395276, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.00029804422716515325, + "loss": 0.0635, "step": 5030 }, { - "epoch": 0.03, - "learning_rate": 0.0002961858827209388, - "loss": 0.0415, + "epoch": 0.01, + "learning_rate": 0.0002980403389487818, + "loss": 0.0633, "step": 5040 }, { - "epoch": 0.03, - "learning_rate": 0.0002961783150279248, - "loss": 0.0476, + "epoch": 0.01, + "learning_rate": 0.00029803645073241033, + "loss": 0.0577, "step": 5050 }, { - "epoch": 0.03, - "learning_rate": 0.00029617074733491076, - "loss": 0.0447, + "epoch": 0.01, + "learning_rate": 0.00029803256251603884, + "loss": 0.051, "step": 5060 }, { - "epoch": 0.03, - "learning_rate": 0.00029616317964189674, - "loss": 0.0512, + "epoch": 0.01, + "learning_rate": 0.0002980286742996674, + "loss": 0.064, "step": 5070 }, { - "epoch": 0.03, - "learning_rate": 0.0002961556119488827, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.00029802478608329593, + "loss": 0.0575, "step": 5080 }, { - "epoch": 0.03, - "learning_rate": 0.0002961480442558687, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.00029802089786692444, + "loss": 0.0524, "step": 5090 }, { - "epoch": 0.03, - "learning_rate": 0.00029614047656285474, - "loss": 0.0493, + "epoch": 0.01, + "learning_rate": 0.000298017009650553, + "loss": 0.0593, "step": 5100 }, { - "epoch": 0.03, - "learning_rate": 0.0002961329088698407, - "loss": 0.0504, + "epoch": 0.01, + "learning_rate": 0.0002980131214341816, + "loss": 0.0563, "step": 5110 }, { - "epoch": 0.03, - "learning_rate": 0.0002961253411768267, - "loss": 0.0528, + "epoch": 0.01, + "learning_rate": 0.0002980092332178101, + "loss": 0.062, "step": 5120 }, { - "epoch": 0.03, - "learning_rate": 0.0002961177734838127, - "loss": 0.046, + "epoch": 0.01, + "learning_rate": 0.0002980053450014386, + "loss": 0.0695, "step": 5130 }, { - "epoch": 0.03, - "learning_rate": 0.00029611020579079866, - "loss": 0.0519, + "epoch": 0.01, + "learning_rate": 0.0002980014567850671, + "loss": 0.0664, "step": 5140 }, { - "epoch": 0.03, - "learning_rate": 0.00029610263809778465, - "loss": 0.0498, + "epoch": 0.01, + "learning_rate": 0.0002979975685686957, + "loss": 0.0559, "step": 5150 }, { - "epoch": 0.03, - "learning_rate": 0.0002960950704047706, - "loss": 0.0432, + "epoch": 0.01, + "learning_rate": 0.0002979936803523242, + "loss": 0.0502, "step": 5160 }, { - "epoch": 0.03, - "learning_rate": 0.00029608750271175666, - "loss": 0.0501, + "epoch": 0.01, + "learning_rate": 0.0002979897921359528, + "loss": 0.0537, "step": 5170 }, { - "epoch": 0.03, - "learning_rate": 0.00029607993501874264, - "loss": 0.0449, + "epoch": 0.01, + "learning_rate": 0.0002979859039195813, + "loss": 0.0484, "step": 5180 }, { - "epoch": 0.03, - "learning_rate": 0.0002960723673257286, - "loss": 0.0499, + "epoch": 0.01, + "learning_rate": 0.00029798201570320986, + "loss": 0.0484, "step": 5190 }, { - "epoch": 0.03, - "learning_rate": 0.0002960647996327146, - "loss": 0.0484, + "epoch": 0.01, + "learning_rate": 0.00029797812748683837, + "loss": 0.0562, "step": 5200 }, { - "epoch": 0.03, - "learning_rate": 0.0002960572319397006, - "loss": 0.0483, + "epoch": 0.01, + "learning_rate": 0.0002979742392704669, + "loss": 0.0541, "step": 5210 }, { - "epoch": 0.03, - "learning_rate": 0.00029604966424668657, - "loss": 0.0518, + "epoch": 0.01, + "learning_rate": 0.0002979703510540954, + "loss": 0.0673, "step": 5220 }, { - "epoch": 0.03, - "learning_rate": 0.0002960420965536726, - "loss": 0.0527, + "epoch": 0.01, + "learning_rate": 0.00029796646283772397, + "loss": 0.0536, "step": 5230 }, { - "epoch": 0.03, - "learning_rate": 0.0002960345288606586, - "loss": 0.0436, + "epoch": 0.01, + "learning_rate": 0.00029796257462135254, + "loss": 0.0556, "step": 5240 }, { - "epoch": 0.03, - "learning_rate": 0.00029602696116764457, - "loss": 0.0591, + "epoch": 0.01, + "learning_rate": 0.00029795868640498105, + "loss": 0.0469, "step": 5250 }, { - "epoch": 0.03, - "learning_rate": 0.00029601939347463055, - "loss": 0.0473, + "epoch": 0.01, + "learning_rate": 0.00029795479818860957, + "loss": 0.0601, "step": 5260 }, { - "epoch": 0.03, - "learning_rate": 0.00029601182578161653, - "loss": 0.0429, + "epoch": 0.01, + "learning_rate": 0.0002979509099722381, + "loss": 0.0537, "step": 5270 }, { - "epoch": 0.03, - "learning_rate": 0.0002960042580886025, - "loss": 0.0483, + "epoch": 0.01, + "learning_rate": 0.00029794702175586665, + "loss": 0.0569, "step": 5280 }, { - "epoch": 0.03, - "learning_rate": 0.0002959966903955885, - "loss": 0.0446, + "epoch": 0.01, + "learning_rate": 0.00029794313353949517, + "loss": 0.0462, "step": 5290 }, { - "epoch": 0.03, - "learning_rate": 0.00029598912270257453, - "loss": 0.0484, + "epoch": 0.01, + "learning_rate": 0.00029793924532312373, + "loss": 0.0461, "step": 5300 }, { - "epoch": 0.03, - "learning_rate": 0.0002959815550095605, - "loss": 0.0453, + "epoch": 0.01, + "learning_rate": 0.00029793535710675225, + "loss": 0.0489, "step": 5310 }, { - "epoch": 0.03, - "learning_rate": 0.0002959739873165465, - "loss": 0.0419, + "epoch": 0.01, + "learning_rate": 0.0002979314688903808, + "loss": 0.0535, "step": 5320 }, { - "epoch": 0.03, - "learning_rate": 0.0002959664196235325, - "loss": 0.0449, + "epoch": 0.01, + "learning_rate": 0.00029792758067400933, + "loss": 0.0546, "step": 5330 }, { - "epoch": 0.03, - "learning_rate": 0.00029595885193051846, - "loss": 0.0401, + "epoch": 0.01, + "learning_rate": 0.00029792369245763785, + "loss": 0.058, "step": 5340 }, { - "epoch": 0.03, - "learning_rate": 0.00029595128423750444, - "loss": 0.0498, + "epoch": 0.01, + "learning_rate": 0.00029791980424126636, + "loss": 0.0555, "step": 5350 }, { - "epoch": 0.03, - "learning_rate": 0.00029594371654449047, - "loss": 0.0448, + "epoch": 0.01, + "learning_rate": 0.00029791591602489493, + "loss": 0.0479, "step": 5360 }, { - "epoch": 0.03, - "learning_rate": 0.00029593614885147645, - "loss": 0.0476, + "epoch": 0.01, + "learning_rate": 0.00029791202780852345, + "loss": 0.0584, "step": 5370 }, { - "epoch": 0.03, - "learning_rate": 0.00029592858115846244, - "loss": 0.0491, + "epoch": 0.01, + "learning_rate": 0.000297908139592152, + "loss": 0.0514, "step": 5380 }, { - "epoch": 0.03, - "learning_rate": 0.0002959210134654484, - "loss": 0.0471, + "epoch": 0.01, + "learning_rate": 0.00029790425137578053, + "loss": 0.0491, "step": 5390 }, { - "epoch": 0.03, - "learning_rate": 0.0002959134457724344, - "loss": 0.0448, + "epoch": 0.01, + "learning_rate": 0.0002979003631594091, + "loss": 0.0511, "step": 5400 }, { - "epoch": 0.03, - "learning_rate": 0.0002959058780794204, - "loss": 0.0648, + "epoch": 0.01, + "learning_rate": 0.0002978964749430376, + "loss": 0.0489, "step": 5410 }, { - "epoch": 0.03, - "learning_rate": 0.0002958983103864064, - "loss": 0.0482, + "epoch": 0.01, + "learning_rate": 0.0002978925867266661, + "loss": 0.0532, "step": 5420 }, { - "epoch": 0.03, - "learning_rate": 0.0002958907426933924, + "epoch": 0.01, + "learning_rate": 0.00029788869851029464, "loss": 0.0484, "step": 5430 }, { - "epoch": 0.03, - "learning_rate": 0.0002958831750003784, - "loss": 0.0545, + "epoch": 0.01, + "learning_rate": 0.0002978848102939232, + "loss": 0.0599, "step": 5440 }, { - "epoch": 0.03, - "learning_rate": 0.00029587560730736436, - "loss": 0.0501, + "epoch": 0.01, + "learning_rate": 0.0002978809220775518, + "loss": 0.0483, "step": 5450 }, { - "epoch": 0.03, - "learning_rate": 0.00029586803961435034, - "loss": 0.0431, + "epoch": 0.01, + "learning_rate": 0.0002978770338611803, + "loss": 0.0587, "step": 5460 }, { - "epoch": 0.03, - "learning_rate": 0.0002958604719213363, - "loss": 0.0424, + "epoch": 0.01, + "learning_rate": 0.0002978731456448088, + "loss": 0.0512, "step": 5470 }, { - "epoch": 0.03, - "learning_rate": 0.0002958529042283223, - "loss": 0.0434, + "epoch": 0.01, + "learning_rate": 0.0002978692574284373, + "loss": 0.0508, "step": 5480 }, { - "epoch": 0.03, - "learning_rate": 0.00029584533653530834, - "loss": 0.0432, + "epoch": 0.01, + "learning_rate": 0.0002978653692120659, + "loss": 0.0508, "step": 5490 }, { - "epoch": 0.03, - "learning_rate": 0.0002958377688422943, - "loss": 0.0436, + "epoch": 0.01, + "learning_rate": 0.0002978614809956944, + "loss": 0.0495, "step": 5500 }, { - "epoch": 0.03, - "learning_rate": 0.0002958302011492803, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.000297857592779323, + "loss": 0.0501, "step": 5510 }, { - "epoch": 0.03, - "learning_rate": 0.0002958226334562663, - "loss": 0.0478, + "epoch": 0.01, + "learning_rate": 0.0002978537045629515, + "loss": 0.057, "step": 5520 }, { - "epoch": 0.03, - "learning_rate": 0.00029581506576325227, - "loss": 0.0438, + "epoch": 0.01, + "learning_rate": 0.00029784981634658006, + "loss": 0.0646, "step": 5530 }, { - "epoch": 0.03, - "learning_rate": 0.00029580749807023825, - "loss": 0.0386, + "epoch": 0.01, + "learning_rate": 0.00029784592813020857, + "loss": 0.0549, "step": 5540 }, { - "epoch": 0.03, - "learning_rate": 0.0002957999303772243, - "loss": 0.0411, + "epoch": 0.01, + "learning_rate": 0.0002978420399138371, + "loss": 0.0562, "step": 5550 }, { - "epoch": 0.03, - "learning_rate": 0.00029579236268421026, - "loss": 0.0462, + "epoch": 0.01, + "learning_rate": 0.0002978381516974656, + "loss": 0.0589, "step": 5560 }, { - "epoch": 0.03, - "learning_rate": 0.00029578479499119625, - "loss": 0.0436, + "epoch": 0.01, + "learning_rate": 0.00029783426348109417, + "loss": 0.0552, "step": 5570 }, { - "epoch": 0.03, - "learning_rate": 0.0002957772272981822, - "loss": 0.0457, + "epoch": 0.01, + "learning_rate": 0.0002978303752647227, + "loss": 0.0616, "step": 5580 }, { - "epoch": 0.03, - "learning_rate": 0.0002957696596051682, - "loss": 0.0425, + "epoch": 0.01, + "learning_rate": 0.00029782648704835125, + "loss": 0.0601, "step": 5590 }, { - "epoch": 0.03, - "learning_rate": 0.0002957620919121542, - "loss": 0.0486, + "epoch": 0.01, + "learning_rate": 0.00029782259883197977, + "loss": 0.0528, "step": 5600 }, { - "epoch": 0.03, - "learning_rate": 0.0002957545242191402, - "loss": 0.0496, + "epoch": 0.01, + "learning_rate": 0.00029781871061560834, + "loss": 0.0515, "step": 5610 }, { - "epoch": 0.03, - "learning_rate": 0.0002957469565261262, - "loss": 0.0534, + "epoch": 0.01, + "learning_rate": 0.00029781482239923685, + "loss": 0.0585, "step": 5620 }, { - "epoch": 0.03, - "learning_rate": 0.0002957393888331122, - "loss": 0.0385, + "epoch": 0.01, + "learning_rate": 0.00029781093418286537, + "loss": 0.0572, "step": 5630 }, { - "epoch": 0.03, - "learning_rate": 0.00029573182114009817, - "loss": 0.0467, + "epoch": 0.01, + "learning_rate": 0.00029780704596649393, + "loss": 0.0533, "step": 5640 }, { - "epoch": 0.03, - "learning_rate": 0.00029572425344708415, - "loss": 0.0478, + "epoch": 0.01, + "learning_rate": 0.00029780315775012245, + "loss": 0.06, "step": 5650 }, { - "epoch": 0.03, - "learning_rate": 0.00029571668575407013, - "loss": 0.0406, + "epoch": 0.01, + "learning_rate": 0.000297799269533751, + "loss": 0.0529, "step": 5660 }, { - "epoch": 0.03, - "learning_rate": 0.0002957091180610561, - "loss": 0.0493, + "epoch": 0.01, + "learning_rate": 0.00029779538131737953, + "loss": 0.0557, "step": 5670 }, { - "epoch": 0.03, - "learning_rate": 0.0002957015503680421, - "loss": 0.0448, + "epoch": 0.01, + "learning_rate": 0.00029779149310100805, + "loss": 0.0457, "step": 5680 }, { - "epoch": 0.03, - "learning_rate": 0.0002956939826750281, - "loss": 0.0465, + "epoch": 0.01, + "learning_rate": 0.0002977876048846366, + "loss": 0.0462, "step": 5690 }, { - "epoch": 0.03, - "learning_rate": 0.00029568641498201406, - "loss": 0.0485, + "epoch": 0.01, + "learning_rate": 0.00029778371666826513, + "loss": 0.052, "step": 5700 }, { - "epoch": 0.03, - "learning_rate": 0.00029567884728900004, - "loss": 0.044, + "epoch": 0.01, + "learning_rate": 0.00029777982845189364, + "loss": 0.0478, "step": 5710 }, { - "epoch": 0.03, - "learning_rate": 0.0002956712795959861, - "loss": 0.0454, + "epoch": 0.01, + "learning_rate": 0.0002977759402355222, + "loss": 0.0501, "step": 5720 }, { - "epoch": 0.03, - "learning_rate": 0.00029566371190297206, - "loss": 0.0488, + "epoch": 0.01, + "learning_rate": 0.00029777205201915073, + "loss": 0.0539, "step": 5730 }, { - "epoch": 0.03, - "learning_rate": 0.00029565614420995804, - "loss": 0.042, + "epoch": 0.01, + "learning_rate": 0.0002977681638027793, + "loss": 0.0455, "step": 5740 }, { - "epoch": 0.03, - "learning_rate": 0.000295648576516944, - "loss": 0.046, + "epoch": 0.01, + "learning_rate": 0.0002977642755864078, + "loss": 0.0542, "step": 5750 }, { - "epoch": 0.03, - "learning_rate": 0.00029564100882393, - "loss": 0.0447, + "epoch": 0.01, + "learning_rate": 0.0002977603873700363, + "loss": 0.0425, "step": 5760 }, { - "epoch": 0.03, - "learning_rate": 0.000295633441130916, - "loss": 0.043, + "epoch": 0.01, + "learning_rate": 0.00029775649915366484, + "loss": 0.0524, "step": 5770 }, { - "epoch": 0.03, - "learning_rate": 0.000295625873437902, - "loss": 0.0484, + "epoch": 0.01, + "learning_rate": 0.0002977526109372934, + "loss": 0.0516, "step": 5780 }, { - "epoch": 0.03, - "learning_rate": 0.000295618305744888, - "loss": 0.0468, + "epoch": 0.02, + "learning_rate": 0.000297748722720922, + "loss": 0.0505, "step": 5790 }, { - "epoch": 0.03, - "learning_rate": 0.000295610738051874, - "loss": 0.0498, + "epoch": 0.02, + "learning_rate": 0.0002977448345045505, + "loss": 0.0497, "step": 5800 }, { - "epoch": 0.03, - "learning_rate": 0.00029560317035885996, - "loss": 0.0474, + "epoch": 0.02, + "learning_rate": 0.000297740946288179, + "loss": 0.0536, "step": 5810 }, { - "epoch": 0.03, - "learning_rate": 0.00029559560266584594, - "loss": 0.045, + "epoch": 0.02, + "learning_rate": 0.0002977370580718076, + "loss": 0.0507, "step": 5820 }, { - "epoch": 0.03, - "learning_rate": 0.0002955880349728319, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.0002977331698554361, + "loss": 0.0486, "step": 5830 }, { - "epoch": 0.03, - "learning_rate": 0.00029558046727981796, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.0002977292816390646, + "loss": 0.0567, "step": 5840 }, { - "epoch": 0.03, - "learning_rate": 0.00029557289958680394, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.00029772539342269317, + "loss": 0.0507, "step": 5850 }, { - "epoch": 0.03, - "learning_rate": 0.0002955653318937899, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.0002977215052063217, + "loss": 0.0582, "step": 5860 }, { - "epoch": 0.03, - "learning_rate": 0.0002955577642007759, - "loss": 0.0409, + "epoch": 0.02, + "learning_rate": 0.00029771761698995026, + "loss": 0.0482, "step": 5870 }, { - "epoch": 0.03, - "learning_rate": 0.0002955501965077619, - "loss": 0.0462, + "epoch": 0.02, + "learning_rate": 0.00029771372877357877, + "loss": 0.0467, "step": 5880 }, { - "epoch": 0.03, - "learning_rate": 0.00029554262881474787, - "loss": 0.0426, + "epoch": 0.02, + "learning_rate": 0.0002977098405572073, + "loss": 0.0607, "step": 5890 }, { - "epoch": 0.03, - "learning_rate": 0.00029553506112173385, - "loss": 0.0413, + "epoch": 0.02, + "learning_rate": 0.00029770595234083585, + "loss": 0.051, "step": 5900 }, { - "epoch": 0.03, - "learning_rate": 0.0002955274934287199, - "loss": 0.0397, + "epoch": 0.02, + "learning_rate": 0.00029770206412446437, + "loss": 0.0532, "step": 5910 }, { - "epoch": 0.03, - "learning_rate": 0.00029551992573570587, - "loss": 0.0427, + "epoch": 0.02, + "learning_rate": 0.0002976981759080929, + "loss": 0.0531, "step": 5920 }, { - "epoch": 0.03, - "learning_rate": 0.00029551235804269185, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.00029769428769172145, + "loss": 0.0524, "step": 5930 }, { - "epoch": 0.03, - "learning_rate": 0.00029550479034967783, - "loss": 0.0402, + "epoch": 0.02, + "learning_rate": 0.00029769039947535, + "loss": 0.0608, "step": 5940 }, { - "epoch": 0.03, - "learning_rate": 0.0002954972226566638, - "loss": 0.0468, + "epoch": 0.02, + "learning_rate": 0.00029768651125897853, + "loss": 0.0459, "step": 5950 }, { - "epoch": 0.03, - "learning_rate": 0.0002954896549636498, - "loss": 0.0353, + "epoch": 0.02, + "learning_rate": 0.00029768262304260705, + "loss": 0.0515, "step": 5960 }, { - "epoch": 0.03, - "learning_rate": 0.00029548208727063583, - "loss": 0.0466, + "epoch": 0.02, + "learning_rate": 0.00029767873482623556, + "loss": 0.0522, "step": 5970 }, { - "epoch": 0.03, - "learning_rate": 0.0002954745195776218, - "loss": 0.0469, + "epoch": 0.02, + "learning_rate": 0.0002976748466098641, + "loss": 0.0501, "step": 5980 }, { - "epoch": 0.03, - "learning_rate": 0.0002954669518846078, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.00029767095839349265, + "loss": 0.0513, "step": 5990 }, { - "epoch": 0.03, - "learning_rate": 0.00029545938419159377, - "loss": 0.0402, + "epoch": 0.02, + "learning_rate": 0.0002976670701771212, + "loss": 0.0551, "step": 6000 }, { - "epoch": 0.03, - "eval_cer": 0.9144964565985481, - "eval_loss": 0.03346065431833267, - "eval_runtime": 117.4862, - "eval_samples_per_second": 17.023, - "eval_steps_per_second": 4.256, + "epoch": 0.02, + "eval_cer": 0.8817866645392185, + "eval_loss": 0.03934020921587944, + "eval_runtime": 107.5774, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, "step": 6000 }, { - "epoch": 0.03, - "learning_rate": 0.00029545181649857975, - "loss": 0.0513, + "epoch": 0.02, + "learning_rate": 0.00029766318196074973, + "loss": 0.048, "step": 6010 }, { - "epoch": 0.03, - "learning_rate": 0.00029544424880556574, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.00029765929374437824, + "loss": 0.0518, "step": 6020 }, { - "epoch": 0.03, - "learning_rate": 0.0002954366811125517, - "loss": 0.0466, + "epoch": 0.02, + "learning_rate": 0.0002976554055280068, + "loss": 0.0474, "step": 6030 }, { - "epoch": 0.03, - "learning_rate": 0.00029542911341953775, - "loss": 0.0424, + "epoch": 0.02, + "learning_rate": 0.00029765151731163533, + "loss": 0.0529, "step": 6040 }, { - "epoch": 0.03, - "learning_rate": 0.00029542154572652373, - "loss": 0.0389, + "epoch": 0.02, + "learning_rate": 0.00029764762909526384, + "loss": 0.0457, "step": 6050 }, { - "epoch": 0.03, - "learning_rate": 0.0002954139780335097, - "loss": 0.0377, + "epoch": 0.02, + "learning_rate": 0.0002976437408788924, + "loss": 0.0507, "step": 6060 }, { - "epoch": 0.03, - "learning_rate": 0.0002954064103404957, - "loss": 0.0425, + "epoch": 0.02, + "learning_rate": 0.0002976398526625209, + "loss": 0.0534, "step": 6070 }, { - "epoch": 0.03, - "learning_rate": 0.0002953988426474817, - "loss": 0.0406, + "epoch": 0.02, + "learning_rate": 0.0002976359644461495, + "loss": 0.045, "step": 6080 }, { - "epoch": 0.03, - "learning_rate": 0.00029539127495446766, - "loss": 0.0465, + "epoch": 0.02, + "learning_rate": 0.000297632076229778, + "loss": 0.0526, "step": 6090 }, { - "epoch": 0.03, - "learning_rate": 0.0002953837072614537, - "loss": 0.0463, + "epoch": 0.02, + "learning_rate": 0.0002976281880134065, + "loss": 0.0477, "step": 6100 }, { - "epoch": 0.03, - "learning_rate": 0.0002953761395684397, - "loss": 0.0954, + "epoch": 0.02, + "learning_rate": 0.0002976242997970351, + "loss": 0.0453, "step": 6110 }, { - "epoch": 0.03, - "learning_rate": 0.00029536857187542566, - "loss": 0.068, + "epoch": 0.02, + "learning_rate": 0.0002976204115806636, + "loss": 0.0464, "step": 6120 }, { - "epoch": 0.03, - "learning_rate": 0.00029536100418241164, - "loss": 0.0656, + "epoch": 0.02, + "learning_rate": 0.0002976165233642921, + "loss": 0.0503, "step": 6130 }, { - "epoch": 0.03, - "learning_rate": 0.0002953534364893976, - "loss": 0.066, + "epoch": 0.02, + "learning_rate": 0.0002976126351479207, + "loss": 0.0492, "step": 6140 }, { - "epoch": 0.03, - "learning_rate": 0.0002953458687963836, - "loss": 0.0541, + "epoch": 0.02, + "learning_rate": 0.00029760874693154926, + "loss": 0.0502, "step": 6150 }, { - "epoch": 0.03, - "learning_rate": 0.00029533830110336964, - "loss": 0.0574, + "epoch": 0.02, + "learning_rate": 0.0002976048587151778, + "loss": 0.0499, "step": 6160 }, { - "epoch": 0.03, - "learning_rate": 0.0002953307334103556, - "loss": 0.0532, + "epoch": 0.02, + "learning_rate": 0.0002976009704988063, + "loss": 0.0488, "step": 6170 }, { - "epoch": 0.03, - "learning_rate": 0.0002953231657173416, - "loss": 0.0622, + "epoch": 0.02, + "learning_rate": 0.0002975970822824348, + "loss": 0.054, "step": 6180 }, { - "epoch": 0.03, - "learning_rate": 0.0002953155980243276, - "loss": 0.0538, + "epoch": 0.02, + "learning_rate": 0.00029759319406606337, + "loss": 0.049, "step": 6190 }, { - "epoch": 0.03, - "learning_rate": 0.00029530803033131356, - "loss": 0.0555, + "epoch": 0.02, + "learning_rate": 0.0002975893058496919, + "loss": 0.0618, "step": 6200 }, { - "epoch": 0.03, - "learning_rate": 0.00029530046263829955, - "loss": 0.0598, + "epoch": 0.02, + "learning_rate": 0.00029758541763332045, + "loss": 0.0551, "step": 6210 }, { - "epoch": 0.03, - "learning_rate": 0.0002952928949452855, - "loss": 0.046, + "epoch": 0.02, + "learning_rate": 0.00029758152941694897, + "loss": 0.0483, "step": 6220 }, { - "epoch": 0.03, - "learning_rate": 0.00029528532725227156, - "loss": 0.0497, + "epoch": 0.02, + "learning_rate": 0.0002975776412005775, + "loss": 0.0539, "step": 6230 }, { - "epoch": 0.03, - "learning_rate": 0.00029527775955925754, - "loss": 0.0507, + "epoch": 0.02, + "learning_rate": 0.00029757375298420605, + "loss": 0.0552, "step": 6240 }, { - "epoch": 0.03, - "learning_rate": 0.0002952701918662435, - "loss": 0.0494, + "epoch": 0.02, + "learning_rate": 0.00029756986476783457, + "loss": 0.0541, "step": 6250 }, { - "epoch": 0.03, - "learning_rate": 0.0002952626241732295, - "loss": 0.0491, + "epoch": 0.02, + "learning_rate": 0.0002975659765514631, + "loss": 0.0586, "step": 6260 }, { - "epoch": 0.03, - "learning_rate": 0.0002952550564802155, - "loss": 0.0548, + "epoch": 0.02, + "learning_rate": 0.00029756208833509165, + "loss": 0.0479, "step": 6270 }, { - "epoch": 0.03, - "learning_rate": 0.00029524748878720147, - "loss": 0.0527, + "epoch": 0.02, + "learning_rate": 0.00029755820011872016, + "loss": 0.0533, "step": 6280 }, { - "epoch": 0.03, - "learning_rate": 0.0002952399210941875, - "loss": 0.0517, + "epoch": 0.02, + "learning_rate": 0.00029755431190234873, + "loss": 0.0465, "step": 6290 }, { - "epoch": 0.03, - "learning_rate": 0.0002952323534011735, - "loss": 0.0451, + "epoch": 0.02, + "learning_rate": 0.00029755042368597725, + "loss": 0.0617, "step": 6300 }, { - "epoch": 0.03, - "learning_rate": 0.00029522478570815947, - "loss": 0.0527, + "epoch": 0.02, + "learning_rate": 0.00029754653546960576, + "loss": 0.0568, "step": 6310 }, { - "epoch": 0.03, - "learning_rate": 0.00029521721801514545, - "loss": 0.0539, + "epoch": 0.02, + "learning_rate": 0.00029754264725323433, + "loss": 0.0489, "step": 6320 }, { - "epoch": 0.03, - "learning_rate": 0.00029520965032213143, - "loss": 0.0477, + "epoch": 0.02, + "learning_rate": 0.00029753875903686285, + "loss": 0.0491, "step": 6330 }, { - "epoch": 0.03, - "learning_rate": 0.0002952020826291174, - "loss": 0.0627, + "epoch": 0.02, + "learning_rate": 0.0002975348708204914, + "loss": 0.0505, "step": 6340 }, { - "epoch": 0.03, - "learning_rate": 0.00029519451493610345, - "loss": 0.0474, + "epoch": 0.02, + "learning_rate": 0.00029753098260411993, + "loss": 0.0514, "step": 6350 }, { - "epoch": 0.03, - "learning_rate": 0.00029518694724308943, - "loss": 0.0467, + "epoch": 0.02, + "learning_rate": 0.0002975270943877485, + "loss": 0.0591, "step": 6360 }, { - "epoch": 0.03, - "learning_rate": 0.0002951793795500754, - "loss": 0.0516, + "epoch": 0.02, + "learning_rate": 0.000297523206171377, + "loss": 0.0578, "step": 6370 }, { - "epoch": 0.03, - "learning_rate": 0.0002951718118570614, - "loss": 0.0443, + "epoch": 0.02, + "learning_rate": 0.0002975193179550055, + "loss": 0.0488, "step": 6380 }, { - "epoch": 0.03, - "learning_rate": 0.0002951642441640474, - "loss": 0.048, + "epoch": 0.02, + "learning_rate": 0.00029751542973863404, + "loss": 0.0521, "step": 6390 }, { - "epoch": 0.03, - "learning_rate": 0.00029515667647103336, - "loss": 0.0481, + "epoch": 0.02, + "learning_rate": 0.0002975115415222626, + "loss": 0.0472, "step": 6400 }, { - "epoch": 0.03, - "learning_rate": 0.00029514910877801934, - "loss": 0.0468, + "epoch": 0.02, + "learning_rate": 0.0002975076533058911, + "loss": 0.0489, "step": 6410 }, { - "epoch": 0.03, - "learning_rate": 0.00029514154108500537, - "loss": 0.0453, + "epoch": 0.02, + "learning_rate": 0.0002975037650895197, + "loss": 0.0457, "step": 6420 }, { - "epoch": 0.03, - "learning_rate": 0.00029513397339199135, - "loss": 0.0819, + "epoch": 0.02, + "learning_rate": 0.0002974998768731482, + "loss": 0.0528, "step": 6430 }, { - "epoch": 0.03, - "learning_rate": 0.00029512640569897734, - "loss": 0.0532, + "epoch": 0.02, + "learning_rate": 0.0002974959886567768, + "loss": 0.0464, "step": 6440 }, { - "epoch": 0.03, - "learning_rate": 0.0002951188380059633, - "loss": 0.0467, + "epoch": 0.02, + "learning_rate": 0.0002974921004404053, + "loss": 0.0517, "step": 6450 }, { - "epoch": 0.03, - "learning_rate": 0.0002951112703129493, - "loss": 0.048, + "epoch": 0.02, + "learning_rate": 0.0002974882122240338, + "loss": 0.0525, "step": 6460 }, { - "epoch": 0.03, - "learning_rate": 0.0002951037026199353, - "loss": 0.0522, + "epoch": 0.02, + "learning_rate": 0.0002974843240076623, + "loss": 0.0567, "step": 6470 }, { - "epoch": 0.03, - "learning_rate": 0.0002950961349269213, - "loss": 0.0526, + "epoch": 0.02, + "learning_rate": 0.0002974804357912909, + "loss": 0.0525, "step": 6480 }, { - "epoch": 0.03, - "learning_rate": 0.0002950885672339073, - "loss": 0.0431, + "epoch": 0.02, + "learning_rate": 0.00029747654757491946, + "loss": 0.0526, "step": 6490 }, { - "epoch": 0.03, - "learning_rate": 0.0002950809995408933, - "loss": 0.0413, + "epoch": 0.02, + "learning_rate": 0.00029747265935854797, + "loss": 0.0477, "step": 6500 }, { - "epoch": 0.03, - "learning_rate": 0.00029507343184787926, - "loss": 0.0447, + "epoch": 0.02, + "learning_rate": 0.0002974687711421765, + "loss": 0.0448, "step": 6510 }, { - "epoch": 0.03, - "learning_rate": 0.00029506586415486524, - "loss": 0.0429, + "epoch": 0.02, + "learning_rate": 0.000297464882925805, + "loss": 0.0526, "step": 6520 }, { - "epoch": 0.03, - "learning_rate": 0.0002950582964618512, - "loss": 0.0491, + "epoch": 0.02, + "learning_rate": 0.00029746099470943357, + "loss": 0.0513, "step": 6530 }, { - "epoch": 0.03, - "learning_rate": 0.0002950507287688372, - "loss": 0.0441, + "epoch": 0.02, + "learning_rate": 0.0002974571064930621, + "loss": 0.0535, "step": 6540 }, { - "epoch": 0.03, - "learning_rate": 0.00029504316107582324, - "loss": 0.047, + "epoch": 0.02, + "learning_rate": 0.00029745321827669065, + "loss": 0.0449, "step": 6550 }, { - "epoch": 0.03, - "learning_rate": 0.0002950355933828092, - "loss": 0.0478, + "epoch": 0.02, + "learning_rate": 0.00029744933006031917, + "loss": 0.0575, "step": 6560 }, { - "epoch": 0.03, - "learning_rate": 0.0002950280256897952, - "loss": 0.0459, + "epoch": 0.02, + "learning_rate": 0.00029744544184394774, + "loss": 0.0505, "step": 6570 }, { - "epoch": 0.03, - "learning_rate": 0.0002950204579967812, - "loss": 0.0422, + "epoch": 0.02, + "learning_rate": 0.00029744155362757625, + "loss": 0.0517, "step": 6580 }, { - "epoch": 0.03, - "learning_rate": 0.00029501289030376717, - "loss": 0.044, + "epoch": 0.02, + "learning_rate": 0.00029743766541120477, + "loss": 0.0496, "step": 6590 }, { - "epoch": 0.03, - "learning_rate": 0.00029500532261075315, - "loss": 0.0382, + "epoch": 0.02, + "learning_rate": 0.0002974337771948333, + "loss": 0.0481, "step": 6600 }, { - "epoch": 0.03, - "learning_rate": 0.0002949977549177392, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.00029742988897846185, + "loss": 0.0545, "step": 6610 }, { - "epoch": 0.03, - "learning_rate": 0.00029499018722472516, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.00029742600076209036, + "loss": 0.0474, "step": 6620 }, { - "epoch": 0.03, - "learning_rate": 0.00029498261953171115, - "loss": 0.0367, + "epoch": 0.02, + "learning_rate": 0.00029742211254571893, + "loss": 0.0515, "step": 6630 }, { - "epoch": 0.03, - "learning_rate": 0.0002949750518386971, - "loss": 0.0394, + "epoch": 0.02, + "learning_rate": 0.00029741822432934745, + "loss": 0.058, "step": 6640 }, { - "epoch": 0.03, - "learning_rate": 0.0002949674841456831, - "loss": 0.0373, + "epoch": 0.02, + "learning_rate": 0.000297414336112976, + "loss": 0.0532, "step": 6650 }, { - "epoch": 0.03, - "learning_rate": 0.0002949599164526691, - "loss": 0.0447, + "epoch": 0.02, + "learning_rate": 0.00029741044789660453, + "loss": 0.0517, "step": 6660 }, { - "epoch": 0.03, - "learning_rate": 0.0002949523487596551, - "loss": 0.0398, + "epoch": 0.02, + "learning_rate": 0.00029740655968023304, + "loss": 0.0553, "step": 6670 }, { - "epoch": 0.03, - "learning_rate": 0.0002949447810666411, - "loss": 0.0366, + "epoch": 0.02, + "learning_rate": 0.00029740267146386156, + "loss": 0.0438, "step": 6680 }, { - "epoch": 0.03, - "learning_rate": 0.0002949372133736271, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.00029739878324749013, + "loss": 0.0509, "step": 6690 }, { - "epoch": 0.03, - "learning_rate": 0.00029492964568061307, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.0002973948950311187, + "loss": 0.0506, "step": 6700 }, { - "epoch": 0.03, - "learning_rate": 0.00029492207798759905, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.0002973910068147472, + "loss": 0.0608, "step": 6710 }, { - "epoch": 0.03, - "learning_rate": 0.00029491451029458503, - "loss": 0.0417, + "epoch": 0.02, + "learning_rate": 0.0002973871185983757, + "loss": 0.0479, "step": 6720 }, { - "epoch": 0.03, - "learning_rate": 0.000294906942601571, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.00029738323038200424, + "loss": 0.0522, "step": 6730 }, { - "epoch": 0.03, - "learning_rate": 0.00029489937490855705, - "loss": 0.0392, + "epoch": 0.02, + "learning_rate": 0.0002973793421656328, + "loss": 0.0501, "step": 6740 }, { - "epoch": 0.03, - "learning_rate": 0.00029489180721554303, - "loss": 0.0403, + "epoch": 0.02, + "learning_rate": 0.0002973754539492613, + "loss": 0.064, "step": 6750 }, { - "epoch": 0.03, - "learning_rate": 0.000294884239522529, - "loss": 0.0409, + "epoch": 0.02, + "learning_rate": 0.0002973715657328899, + "loss": 0.0531, "step": 6760 }, { - "epoch": 0.03, - "learning_rate": 0.000294876671829515, - "loss": 0.0413, + "epoch": 0.02, + "learning_rate": 0.0002973676775165184, + "loss": 0.0522, "step": 6770 }, { - "epoch": 0.03, - "learning_rate": 0.000294869104136501, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.000297363789300147, + "loss": 0.0621, "step": 6780 }, { - "epoch": 0.03, - "learning_rate": 0.00029486153644348696, - "loss": 0.0415, + "epoch": 0.02, + "learning_rate": 0.0002973599010837755, + "loss": 0.0464, "step": 6790 }, { - "epoch": 0.03, - "learning_rate": 0.000294853968750473, - "loss": 0.0381, + "epoch": 0.02, + "learning_rate": 0.000297356012867404, + "loss": 0.0558, "step": 6800 }, { - "epoch": 0.03, - "learning_rate": 0.000294846401057459, - "loss": 0.042, + "epoch": 0.02, + "learning_rate": 0.0002973521246510325, + "loss": 0.0464, "step": 6810 }, { - "epoch": 0.03, - "learning_rate": 0.00029483883336444496, - "loss": 0.0454, + "epoch": 0.02, + "learning_rate": 0.0002973482364346611, + "loss": 0.0525, "step": 6820 }, { - "epoch": 0.03, - "learning_rate": 0.00029483126567143094, - "loss": 0.0434, + "epoch": 0.02, + "learning_rate": 0.00029734434821828966, + "loss": 0.0488, "step": 6830 }, { - "epoch": 0.03, - "learning_rate": 0.0002948236979784169, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.00029734046000191817, + "loss": 0.0482, "step": 6840 }, { - "epoch": 0.03, - "learning_rate": 0.0002948161302854029, - "loss": 0.0494, + "epoch": 0.02, + "learning_rate": 0.0002973365717855467, + "loss": 0.0524, "step": 6850 }, { - "epoch": 0.03, - "learning_rate": 0.00029480856259238894, - "loss": 0.0552, + "epoch": 0.02, + "learning_rate": 0.00029733268356917525, + "loss": 0.0438, "step": 6860 }, { - "epoch": 0.03, - "learning_rate": 0.0002948009948993749, - "loss": 0.0457, + "epoch": 0.02, + "learning_rate": 0.00029732879535280377, + "loss": 0.0497, "step": 6870 }, { - "epoch": 0.03, - "learning_rate": 0.0002947934272063609, - "loss": 0.0391, + "epoch": 0.02, + "learning_rate": 0.0002973249071364323, + "loss": 0.0531, "step": 6880 }, { - "epoch": 0.03, - "learning_rate": 0.0002947858595133469, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.00029732101892006085, + "loss": 0.0478, "step": 6890 }, { - "epoch": 0.03, - "learning_rate": 0.00029477829182033286, - "loss": 0.0453, + "epoch": 0.02, + "learning_rate": 0.00029731713070368937, + "loss": 0.047, "step": 6900 }, { - "epoch": 0.03, - "learning_rate": 0.00029477072412731884, - "loss": 0.045, + "epoch": 0.02, + "learning_rate": 0.00029731324248731794, + "loss": 0.0419, "step": 6910 }, { - "epoch": 0.03, - "learning_rate": 0.0002947631564343048, - "loss": 0.0388, + "epoch": 0.02, + "learning_rate": 0.00029730935427094645, + "loss": 0.0493, "step": 6920 }, { - "epoch": 0.03, - "learning_rate": 0.0002947555887412908, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.00029730546605457496, + "loss": 0.0551, "step": 6930 }, { - "epoch": 0.04, - "learning_rate": 0.0002947480210482768, - "loss": 0.0415, + "epoch": 0.02, + "learning_rate": 0.00029730157783820353, + "loss": 0.0529, "step": 6940 }, { - "epoch": 0.04, - "learning_rate": 0.00029474045335526277, - "loss": 0.0424, + "epoch": 0.02, + "learning_rate": 0.00029729768962183205, + "loss": 0.0515, "step": 6950 }, { - "epoch": 0.04, - "learning_rate": 0.00029473288566224875, - "loss": 0.0373, + "epoch": 0.02, + "learning_rate": 0.00029729380140546056, + "loss": 0.0476, "step": 6960 }, { - "epoch": 0.04, - "learning_rate": 0.0002947253179692348, - "loss": 0.0375, + "epoch": 0.02, + "learning_rate": 0.00029728991318908913, + "loss": 0.053, "step": 6970 }, { - "epoch": 0.04, - "learning_rate": 0.00029471775027622077, - "loss": 0.0396, + "epoch": 0.02, + "learning_rate": 0.00029728602497271765, + "loss": 0.0479, "step": 6980 }, { - "epoch": 0.04, - "learning_rate": 0.00029471018258320675, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.0002972821367563462, + "loss": 0.0552, "step": 6990 }, { - "epoch": 0.04, - "learning_rate": 0.00029470261489019273, - "loss": 0.0927, + "epoch": 0.02, + "learning_rate": 0.00029727824853997473, + "loss": 0.0485, "step": 7000 }, { - "epoch": 0.04, - "eval_cer": 0.9144498775845288, - "eval_loss": 0.03059179149568081, - "eval_runtime": 117.5676, - "eval_samples_per_second": 17.011, - "eval_steps_per_second": 4.253, + "epoch": 0.02, + "eval_cer": 0.8817964619977577, + "eval_loss": 0.03943474590778351, + "eval_runtime": 107.6801, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, "step": 7000 }, { - "epoch": 0.04, - "learning_rate": 0.0002946950471971787, - "loss": 0.0505, + "epoch": 0.02, + "learning_rate": 0.00029727436032360324, + "loss": 0.0459, "step": 7010 }, { - "epoch": 0.04, - "learning_rate": 0.0002946874795041647, - "loss": 0.0615, + "epoch": 0.02, + "learning_rate": 0.00029727047210723176, + "loss": 0.0515, "step": 7020 }, { - "epoch": 0.04, - "learning_rate": 0.00029467991181115073, - "loss": 0.0509, + "epoch": 0.02, + "learning_rate": 0.0002972665838908603, + "loss": 0.0483, "step": 7030 }, { - "epoch": 0.04, - "learning_rate": 0.0002946723441181367, - "loss": 0.0462, + "epoch": 0.02, + "learning_rate": 0.0002972626956744889, + "loss": 0.0517, "step": 7040 }, { - "epoch": 0.04, - "learning_rate": 0.0002946647764251227, - "loss": 0.0421, + "epoch": 0.02, + "learning_rate": 0.0002972588074581174, + "loss": 0.0473, "step": 7050 }, { - "epoch": 0.04, - "learning_rate": 0.00029465720873210867, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.0002972549192417459, + "loss": 0.0432, "step": 7060 }, { - "epoch": 0.04, - "learning_rate": 0.00029464964103909465, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.0002972510310253745, + "loss": 0.0509, "step": 7070 }, { - "epoch": 0.04, - "learning_rate": 0.00029464207334608064, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.000297247142809003, + "loss": 0.0476, "step": 7080 }, { - "epoch": 0.04, - "learning_rate": 0.0002946345056530666, - "loss": 0.0425, + "epoch": 0.02, + "learning_rate": 0.0002972432545926315, + "loss": 0.0602, "step": 7090 }, { - "epoch": 0.04, - "learning_rate": 0.00029462693796005265, - "loss": 0.0442, + "epoch": 0.02, + "learning_rate": 0.0002972393663762601, + "loss": 0.0582, "step": 7100 }, { - "epoch": 0.04, - "learning_rate": 0.00029461937026703863, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.0002972354781598886, + "loss": 0.0507, "step": 7110 }, { - "epoch": 0.04, - "learning_rate": 0.0002946118025740246, - "loss": 0.0409, + "epoch": 0.02, + "learning_rate": 0.0002972315899435172, + "loss": 0.048, "step": 7120 }, { - "epoch": 0.04, - "learning_rate": 0.0002946042348810106, - "loss": 0.0415, + "epoch": 0.02, + "learning_rate": 0.0002972277017271457, + "loss": 0.0506, "step": 7130 }, { - "epoch": 0.04, - "learning_rate": 0.0002945966671879966, - "loss": 0.0379, + "epoch": 0.02, + "learning_rate": 0.0002972238135107742, + "loss": 0.0479, "step": 7140 }, { - "epoch": 0.04, - "learning_rate": 0.00029458909949498256, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.00029721992529440277, + "loss": 0.0522, "step": 7150 }, { - "epoch": 0.04, - "learning_rate": 0.0002945815318019686, - "loss": 0.0488, + "epoch": 0.02, + "learning_rate": 0.0002972160370780313, + "loss": 0.0499, "step": 7160 }, { - "epoch": 0.04, - "learning_rate": 0.0002945739641089546, - "loss": 0.0399, + "epoch": 0.02, + "learning_rate": 0.0002972121488616598, + "loss": 0.0548, "step": 7170 }, { - "epoch": 0.04, - "learning_rate": 0.00029456639641594056, - "loss": 0.0477, + "epoch": 0.02, + "learning_rate": 0.00029720826064528837, + "loss": 0.0573, "step": 7180 }, { - "epoch": 0.04, - "learning_rate": 0.00029455882872292654, - "loss": 0.0425, + "epoch": 0.02, + "learning_rate": 0.00029720437242891694, + "loss": 0.0517, "step": 7190 }, { - "epoch": 0.04, - "learning_rate": 0.0002945512610299125, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.00029720048421254545, + "loss": 0.0446, "step": 7200 }, { - "epoch": 0.04, - "learning_rate": 0.0002945436933368985, - "loss": 0.0417, + "epoch": 0.02, + "learning_rate": 0.00029719659599617397, + "loss": 0.0455, "step": 7210 }, { - "epoch": 0.04, - "learning_rate": 0.00029453612564388454, - "loss": 0.0403, + "epoch": 0.02, + "learning_rate": 0.0002971927077798025, + "loss": 0.0519, "step": 7220 }, { - "epoch": 0.04, - "learning_rate": 0.0002945285579508705, - "loss": 0.0378, + "epoch": 0.02, + "learning_rate": 0.00029718881956343105, + "loss": 0.0572, "step": 7230 }, { - "epoch": 0.04, - "learning_rate": 0.0002945209902578565, - "loss": 0.045, + "epoch": 0.02, + "learning_rate": 0.00029718493134705957, + "loss": 0.057, "step": 7240 }, { - "epoch": 0.04, - "learning_rate": 0.0002945134225648425, - "loss": 0.0385, + "epoch": 0.02, + "learning_rate": 0.00029718104313068813, + "loss": 0.0536, "step": 7250 }, { - "epoch": 0.04, - "learning_rate": 0.00029450585487182846, - "loss": 0.0402, + "epoch": 0.02, + "learning_rate": 0.00029717715491431665, + "loss": 0.0533, "step": 7260 }, { - "epoch": 0.04, - "learning_rate": 0.00029449828717881445, - "loss": 0.0473, + "epoch": 0.02, + "learning_rate": 0.00029717326669794516, + "loss": 0.0466, "step": 7270 }, { - "epoch": 0.04, - "learning_rate": 0.0002944907194858004, - "loss": 0.0433, + "epoch": 0.02, + "learning_rate": 0.00029716937848157373, + "loss": 0.0638, "step": 7280 }, { - "epoch": 0.04, - "learning_rate": 0.00029448315179278646, - "loss": 0.0402, + "epoch": 0.02, + "learning_rate": 0.00029716549026520225, + "loss": 0.0516, "step": 7290 }, { - "epoch": 0.04, - "learning_rate": 0.00029447558409977244, - "loss": 0.04, + "epoch": 0.02, + "learning_rate": 0.00029716160204883076, + "loss": 0.0661, "step": 7300 }, { - "epoch": 0.04, - "learning_rate": 0.0002944680164067584, - "loss": 0.0422, + "epoch": 0.02, + "learning_rate": 0.00029715771383245933, + "loss": 0.0678, "step": 7310 }, { - "epoch": 0.04, - "learning_rate": 0.0002944604487137444, - "loss": 0.043, + "epoch": 0.02, + "learning_rate": 0.00029715382561608784, + "loss": 0.055, "step": 7320 }, { - "epoch": 0.04, - "learning_rate": 0.0002944528810207304, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.0002971499373997164, + "loss": 0.0438, "step": 7330 }, { - "epoch": 0.04, - "learning_rate": 0.00029444531332771637, - "loss": 0.0394, + "epoch": 0.02, + "learning_rate": 0.00029714604918334493, + "loss": 0.0444, "step": 7340 }, { - "epoch": 0.04, - "learning_rate": 0.0002944377456347024, - "loss": 0.0409, + "epoch": 0.02, + "learning_rate": 0.00029714216096697344, + "loss": 0.0494, "step": 7350 }, { - "epoch": 0.04, - "learning_rate": 0.0002944301779416884, - "loss": 0.038, + "epoch": 0.02, + "learning_rate": 0.000297138272750602, + "loss": 0.0529, "step": 7360 }, { - "epoch": 0.04, - "learning_rate": 0.00029442261024867437, - "loss": 0.0363, + "epoch": 0.02, + "learning_rate": 0.0002971343845342305, + "loss": 0.0513, "step": 7370 }, { - "epoch": 0.04, - "learning_rate": 0.00029441504255566035, - "loss": 0.0443, + "epoch": 0.02, + "learning_rate": 0.0002971304963178591, + "loss": 0.0498, "step": 7380 }, { - "epoch": 0.04, - "learning_rate": 0.00029440747486264633, - "loss": 0.0407, + "epoch": 0.02, + "learning_rate": 0.0002971266081014876, + "loss": 0.0457, "step": 7390 }, { - "epoch": 0.04, - "learning_rate": 0.0002943999071696323, - "loss": 0.0506, + "epoch": 0.02, + "learning_rate": 0.0002971227198851162, + "loss": 0.0534, "step": 7400 }, { - "epoch": 0.04, - "learning_rate": 0.00029439233947661835, - "loss": 0.0434, + "epoch": 0.02, + "learning_rate": 0.0002971188316687447, + "loss": 0.0453, "step": 7410 }, { - "epoch": 0.04, - "learning_rate": 0.00029438477178360433, - "loss": 0.0501, + "epoch": 0.02, + "learning_rate": 0.0002971149434523732, + "loss": 0.0476, "step": 7420 }, { - "epoch": 0.04, - "learning_rate": 0.0002943772040905903, - "loss": 0.05, + "epoch": 0.02, + "learning_rate": 0.0002971110552360017, + "loss": 0.0494, "step": 7430 }, { - "epoch": 0.04, - "learning_rate": 0.0002943696363975763, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.0002971071670196303, + "loss": 0.0476, "step": 7440 }, { - "epoch": 0.04, - "learning_rate": 0.0002943620687045623, - "loss": 0.0354, + "epoch": 0.02, + "learning_rate": 0.0002971032788032588, + "loss": 0.0459, "step": 7450 }, { - "epoch": 0.04, - "learning_rate": 0.00029435450101154826, - "loss": 0.0387, + "epoch": 0.02, + "learning_rate": 0.0002970993905868874, + "loss": 0.0488, "step": 7460 }, { - "epoch": 0.04, - "learning_rate": 0.00029434693331853424, - "loss": 0.0454, + "epoch": 0.02, + "learning_rate": 0.0002970955023705159, + "loss": 0.0501, "step": 7470 }, { - "epoch": 0.04, - "learning_rate": 0.00029433936562552027, - "loss": 0.0397, + "epoch": 0.02, + "learning_rate": 0.0002970916141541444, + "loss": 0.0526, "step": 7480 }, { - "epoch": 0.04, - "learning_rate": 0.00029433179793250625, - "loss": 0.0448, + "epoch": 0.02, + "learning_rate": 0.00029708772593777297, + "loss": 0.0468, "step": 7490 }, { - "epoch": 0.04, - "learning_rate": 0.00029432423023949224, - "loss": 0.0408, + "epoch": 0.02, + "learning_rate": 0.0002970838377214015, + "loss": 0.0505, "step": 7500 }, { - "epoch": 0.04, - "learning_rate": 0.0002943166625464782, - "loss": 0.046, + "epoch": 0.02, + "learning_rate": 0.00029707994950503, + "loss": 0.0486, "step": 7510 }, { - "epoch": 0.04, - "learning_rate": 0.0002943090948534642, - "loss": 0.0449, + "epoch": 0.02, + "learning_rate": 0.00029707606128865857, + "loss": 0.0435, "step": 7520 }, { - "epoch": 0.04, - "learning_rate": 0.0002943015271604502, - "loss": 0.0428, + "epoch": 0.02, + "learning_rate": 0.00029707217307228714, + "loss": 0.0515, "step": 7530 }, { - "epoch": 0.04, - "learning_rate": 0.0002942939594674362, - "loss": 0.04, + "epoch": 0.02, + "learning_rate": 0.00029706828485591565, + "loss": 0.0514, "step": 7540 }, { - "epoch": 0.04, - "learning_rate": 0.0002942863917744222, - "loss": 0.0422, + "epoch": 0.02, + "learning_rate": 0.00029706439663954417, + "loss": 0.0541, "step": 7550 }, { - "epoch": 0.04, - "learning_rate": 0.0002942788240814082, - "loss": 0.0374, + "epoch": 0.02, + "learning_rate": 0.0002970605084231727, + "loss": 0.0557, "step": 7560 }, { - "epoch": 0.04, - "learning_rate": 0.00029427125638839416, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.00029705662020680125, + "loss": 0.0506, "step": 7570 }, { - "epoch": 0.04, - "learning_rate": 0.00029426368869538014, - "loss": 0.0425, + "epoch": 0.02, + "learning_rate": 0.00029705273199042976, + "loss": 0.0463, "step": 7580 }, { - "epoch": 0.04, - "learning_rate": 0.0002942561210023661, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.00029704884377405833, + "loss": 0.0448, "step": 7590 }, { - "epoch": 0.04, - "learning_rate": 0.0002942485533093521, - "loss": 0.0396, + "epoch": 0.02, + "learning_rate": 0.00029704495555768685, + "loss": 0.0422, "step": 7600 }, { - "epoch": 0.04, - "learning_rate": 0.00029424098561633814, - "loss": 0.0368, + "epoch": 0.02, + "learning_rate": 0.0002970410673413154, + "loss": 0.0496, "step": 7610 }, { - "epoch": 0.04, - "learning_rate": 0.0002942334179233241, - "loss": 0.0451, + "epoch": 0.02, + "learning_rate": 0.00029703717912494393, + "loss": 0.0584, "step": 7620 }, { - "epoch": 0.04, - "learning_rate": 0.0002942258502303101, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.00029703329090857245, + "loss": 0.0454, "step": 7630 }, { - "epoch": 0.04, - "learning_rate": 0.0002942182825372961, - "loss": 0.0516, + "epoch": 0.02, + "learning_rate": 0.00029702940269220096, + "loss": 0.0481, "step": 7640 }, { - "epoch": 0.04, - "learning_rate": 0.00029421071484428207, - "loss": 0.0346, + "epoch": 0.02, + "learning_rate": 0.00029702551447582953, + "loss": 0.0491, "step": 7650 }, { - "epoch": 0.04, - "learning_rate": 0.00029420314715126805, - "loss": 0.0381, + "epoch": 0.02, + "learning_rate": 0.00029702162625945804, + "loss": 0.0431, "step": 7660 }, { - "epoch": 0.04, - "learning_rate": 0.0002941955794582541, - "loss": 0.0469, + "epoch": 0.02, + "learning_rate": 0.0002970177380430866, + "loss": 0.0459, "step": 7670 }, { - "epoch": 0.04, - "learning_rate": 0.00029418801176524006, - "loss": 0.0404, + "epoch": 0.02, + "learning_rate": 0.0002970138498267151, + "loss": 0.0475, "step": 7680 }, { - "epoch": 0.04, - "learning_rate": 0.00029418044407222605, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.0002970099616103437, + "loss": 0.0542, "step": 7690 }, { - "epoch": 0.04, - "learning_rate": 0.000294172876379212, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.0002970060733939722, + "loss": 0.049, "step": 7700 }, { - "epoch": 0.04, - "learning_rate": 0.000294165308686198, - "loss": 0.0486, + "epoch": 0.02, + "learning_rate": 0.0002970021851776007, + "loss": 0.0586, "step": 7710 }, { - "epoch": 0.04, - "learning_rate": 0.000294157740993184, - "loss": 0.0429, + "epoch": 0.02, + "learning_rate": 0.00029699829696122924, + "loss": 0.0454, "step": 7720 }, { - "epoch": 0.04, - "learning_rate": 0.00029415017330017, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.0002969944087448578, + "loss": 0.0528, "step": 7730 }, { - "epoch": 0.04, - "learning_rate": 0.000294142605607156, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.0002969905205284864, + "loss": 0.0555, "step": 7740 }, { - "epoch": 0.04, - "learning_rate": 0.000294135037914142, - "loss": 0.0376, + "epoch": 0.02, + "learning_rate": 0.0002969866323121149, + "loss": 0.0495, "step": 7750 }, { - "epoch": 0.04, - "learning_rate": 0.00029412747022112797, - "loss": 0.0449, + "epoch": 0.02, + "learning_rate": 0.0002969827440957434, + "loss": 0.0483, "step": 7760 }, { - "epoch": 0.04, - "learning_rate": 0.00029411990252811395, - "loss": 0.0464, + "epoch": 0.02, + "learning_rate": 0.0002969788558793719, + "loss": 0.0564, "step": 7770 }, { - "epoch": 0.04, - "learning_rate": 0.00029411233483509993, - "loss": 0.0354, + "epoch": 0.02, + "learning_rate": 0.0002969749676630005, + "loss": 0.063, "step": 7780 }, { - "epoch": 0.04, - "learning_rate": 0.0002941047671420859, - "loss": 0.0362, + "epoch": 0.02, + "learning_rate": 0.000296971079446629, + "loss": 0.0394, "step": 7790 }, { - "epoch": 0.04, - "learning_rate": 0.00029409719944907195, - "loss": 0.0384, + "epoch": 0.02, + "learning_rate": 0.00029696719123025757, + "loss": 0.052, "step": 7800 }, { - "epoch": 0.04, - "learning_rate": 0.00029408963175605793, - "loss": 0.036, + "epoch": 0.02, + "learning_rate": 0.0002969633030138861, + "loss": 0.0551, "step": 7810 }, { - "epoch": 0.04, - "learning_rate": 0.0002940820640630439, - "loss": 0.0413, + "epoch": 0.02, + "learning_rate": 0.00029695941479751466, + "loss": 0.0548, "step": 7820 }, { - "epoch": 0.04, - "learning_rate": 0.0002940744963700299, - "loss": 0.0345, + "epoch": 0.02, + "learning_rate": 0.00029695552658114317, + "loss": 0.0699, "step": 7830 }, { - "epoch": 0.04, - "learning_rate": 0.0002940669286770159, - "loss": 0.0379, + "epoch": 0.02, + "learning_rate": 0.0002969516383647717, + "loss": 0.0532, "step": 7840 }, { - "epoch": 0.04, - "learning_rate": 0.00029405936098400186, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.0002969477501484002, + "loss": 0.0589, "step": 7850 }, { - "epoch": 0.04, - "learning_rate": 0.0002940517932909879, - "loss": 0.0433, + "epoch": 0.02, + "learning_rate": 0.00029694386193202877, + "loss": 0.0516, "step": 7860 }, { - "epoch": 0.04, - "learning_rate": 0.0002940442255979739, - "loss": 0.0404, + "epoch": 0.02, + "learning_rate": 0.0002969399737156573, + "loss": 0.0523, "step": 7870 }, { - "epoch": 0.04, - "learning_rate": 0.00029403665790495986, - "loss": 0.0398, + "epoch": 0.02, + "learning_rate": 0.00029693608549928585, + "loss": 0.0847, "step": 7880 }, { - "epoch": 0.04, - "learning_rate": 0.00029402909021194584, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.00029693219728291437, + "loss": 0.0531, "step": 7890 }, { - "epoch": 0.04, - "learning_rate": 0.0002940215225189318, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.00029692830906654293, + "loss": 0.0509, "step": 7900 }, { - "epoch": 0.04, - "learning_rate": 0.0002940139548259178, - "loss": 0.0459, + "epoch": 0.02, + "learning_rate": 0.00029692442085017145, + "loss": 0.0537, "step": 7910 }, { - "epoch": 0.04, - "learning_rate": 0.00029400638713290384, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.00029692053263379996, + "loss": 0.0503, "step": 7920 }, { - "epoch": 0.04, - "learning_rate": 0.0002939988194398898, - "loss": 0.0392, + "epoch": 0.02, + "learning_rate": 0.00029691664441742853, + "loss": 0.0544, "step": 7930 }, { - "epoch": 0.04, - "learning_rate": 0.0002939912517468758, - "loss": 0.0387, + "epoch": 0.02, + "learning_rate": 0.00029691275620105705, + "loss": 0.0538, "step": 7940 }, { - "epoch": 0.04, - "learning_rate": 0.0002939836840538618, - "loss": 0.0401, + "epoch": 0.02, + "learning_rate": 0.0002969088679846856, + "loss": 0.0554, "step": 7950 }, { - "epoch": 0.04, - "learning_rate": 0.00029397611636084776, - "loss": 0.0488, + "epoch": 0.02, + "learning_rate": 0.00029690497976831413, + "loss": 0.0524, "step": 7960 }, { - "epoch": 0.04, - "learning_rate": 0.00029396854866783374, - "loss": 0.0453, + "epoch": 0.02, + "learning_rate": 0.00029690109155194264, + "loss": 0.0577, "step": 7970 }, { - "epoch": 0.04, - "learning_rate": 0.0002939609809748197, - "loss": 0.0404, + "epoch": 0.02, + "learning_rate": 0.00029689720333557116, + "loss": 0.0501, "step": 7980 }, { - "epoch": 0.04, - "learning_rate": 0.00029395341328180576, - "loss": 0.0408, + "epoch": 0.02, + "learning_rate": 0.00029689331511919973, + "loss": 0.0482, "step": 7990 }, { - "epoch": 0.04, - "learning_rate": 0.00029394584558879174, - "loss": 0.0365, + "epoch": 0.02, + "learning_rate": 0.00029688942690282824, + "loss": 0.0516, "step": 8000 }, { - "epoch": 0.04, - "eval_cer": 0.9145313908590625, - "eval_loss": 0.03206906095147133, - "eval_runtime": 117.4386, - "eval_samples_per_second": 17.03, - "eval_steps_per_second": 4.258, + "epoch": 0.02, + "eval_cer": 0.8818510478381908, + "eval_loss": 0.038032468408346176, + "eval_runtime": 107.8792, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, "step": 8000 }, { - "epoch": 0.04, - "learning_rate": 0.0002939382778957777, - "loss": 0.0413, + "epoch": 0.02, + "learning_rate": 0.0002968855386864568, + "loss": 0.0487, "step": 8010 }, { - "epoch": 0.04, - "learning_rate": 0.0002939307102027637, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.0002968816504700853, + "loss": 0.0506, "step": 8020 }, { - "epoch": 0.04, - "learning_rate": 0.0002939231425097497, - "loss": 0.0403, + "epoch": 0.02, + "learning_rate": 0.0002968777622537139, + "loss": 0.0475, "step": 8030 }, { - "epoch": 0.04, - "learning_rate": 0.00029391557481673567, - "loss": 0.0382, + "epoch": 0.02, + "learning_rate": 0.0002968738740373424, + "loss": 0.0567, "step": 8040 }, { - "epoch": 0.04, - "learning_rate": 0.0002939080071237217, - "loss": 0.0399, + "epoch": 0.02, + "learning_rate": 0.0002968699858209709, + "loss": 0.0503, "step": 8050 }, { - "epoch": 0.04, - "learning_rate": 0.0002939004394307077, - "loss": 0.0431, + "epoch": 0.02, + "learning_rate": 0.00029686609760459944, + "loss": 0.0664, "step": 8060 }, { - "epoch": 0.04, - "learning_rate": 0.00029389287173769367, - "loss": 0.0478, + "epoch": 0.02, + "learning_rate": 0.000296862209388228, + "loss": 0.0512, "step": 8070 }, { - "epoch": 0.04, - "learning_rate": 0.00029388530404467965, - "loss": 0.0366, + "epoch": 0.02, + "learning_rate": 0.0002968583211718566, + "loss": 0.0509, "step": 8080 }, { - "epoch": 0.04, - "learning_rate": 0.00029387773635166563, - "loss": 0.037, + "epoch": 0.02, + "learning_rate": 0.0002968544329554851, + "loss": 0.0533, "step": 8090 }, { - "epoch": 0.04, - "learning_rate": 0.0002938701686586516, - "loss": 0.0357, + "epoch": 0.02, + "learning_rate": 0.0002968505447391136, + "loss": 0.0498, "step": 8100 }, { - "epoch": 0.04, - "learning_rate": 0.0002938626009656376, - "loss": 0.0408, + "epoch": 0.02, + "learning_rate": 0.0002968466565227422, + "loss": 0.0567, "step": 8110 }, { - "epoch": 0.04, - "learning_rate": 0.0002938550332726236, - "loss": 0.0392, + "epoch": 0.02, + "learning_rate": 0.0002968427683063707, + "loss": 0.0604, "step": 8120 }, { - "epoch": 0.04, - "learning_rate": 0.0002938474655796096, - "loss": 0.0465, + "epoch": 0.02, + "learning_rate": 0.0002968388800899992, + "loss": 0.0575, "step": 8130 }, { - "epoch": 0.04, - "learning_rate": 0.0002938398978865956, - "loss": 0.0369, + "epoch": 0.02, + "learning_rate": 0.00029683499187362777, + "loss": 0.0522, "step": 8140 }, { - "epoch": 0.04, - "learning_rate": 0.00029383233019358157, - "loss": 0.0439, + "epoch": 0.02, + "learning_rate": 0.0002968311036572563, + "loss": 0.0544, "step": 8150 }, { - "epoch": 0.04, - "learning_rate": 0.00029382476250056755, - "loss": 0.0455, + "epoch": 0.02, + "learning_rate": 0.00029682721544088485, + "loss": 0.0475, "step": 8160 }, { - "epoch": 0.04, - "learning_rate": 0.00029381719480755353, - "loss": 0.0379, + "epoch": 0.02, + "learning_rate": 0.00029682332722451337, + "loss": 0.0504, "step": 8170 }, { - "epoch": 0.04, - "learning_rate": 0.0002938096271145395, - "loss": 0.0352, + "epoch": 0.02, + "learning_rate": 0.0002968194390081419, + "loss": 0.0551, "step": 8180 }, { - "epoch": 0.04, - "learning_rate": 0.0002938020594215255, - "loss": 0.0366, + "epoch": 0.02, + "learning_rate": 0.0002968155507917704, + "loss": 0.0451, "step": 8190 }, { - "epoch": 0.04, - "learning_rate": 0.0002937944917285115, - "loss": 0.04, + "epoch": 0.02, + "learning_rate": 0.00029681166257539897, + "loss": 0.0529, "step": 8200 }, { - "epoch": 0.04, - "learning_rate": 0.00029378692403549746, - "loss": 0.0367, + "epoch": 0.02, + "learning_rate": 0.0002968077743590275, + "loss": 0.0546, "step": 8210 }, { - "epoch": 0.04, - "learning_rate": 0.0002937793563424835, - "loss": 0.0417, + "epoch": 0.02, + "learning_rate": 0.00029680388614265605, + "loss": 0.0438, "step": 8220 }, { - "epoch": 0.04, - "learning_rate": 0.0002937717886494695, - "loss": 0.0412, + "epoch": 0.02, + "learning_rate": 0.00029679999792628456, + "loss": 0.047, "step": 8230 }, { - "epoch": 0.04, - "learning_rate": 0.00029376422095645546, - "loss": 0.0383, + "epoch": 0.02, + "learning_rate": 0.00029679610970991313, + "loss": 0.0709, "step": 8240 }, { - "epoch": 0.04, - "learning_rate": 0.00029375665326344144, - "loss": 0.0383, + "epoch": 0.02, + "learning_rate": 0.00029679222149354165, + "loss": 0.0536, "step": 8250 }, { - "epoch": 0.04, - "learning_rate": 0.0002937490855704274, - "loss": 0.0386, + "epoch": 0.02, + "learning_rate": 0.00029678833327717016, + "loss": 0.0497, "step": 8260 }, { - "epoch": 0.04, - "learning_rate": 0.0002937415178774134, - "loss": 0.041, + "epoch": 0.02, + "learning_rate": 0.0002967844450607987, + "loss": 0.0468, "step": 8270 }, { - "epoch": 0.04, - "learning_rate": 0.00029373395018439944, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.00029678055684442725, + "loss": 0.0445, "step": 8280 }, { - "epoch": 0.04, - "learning_rate": 0.0002937263824913854, - "loss": 0.0399, + "epoch": 0.02, + "learning_rate": 0.0002967766686280558, + "loss": 0.042, "step": 8290 }, { - "epoch": 0.04, - "learning_rate": 0.0002937188147983714, - "loss": 0.0458, + "epoch": 0.02, + "learning_rate": 0.00029677278041168433, + "loss": 0.0506, "step": 8300 }, { - "epoch": 0.04, - "learning_rate": 0.0002937112471053574, - "loss": 0.036, + "epoch": 0.02, + "learning_rate": 0.00029676889219531284, + "loss": 0.0503, "step": 8310 }, { - "epoch": 0.04, - "learning_rate": 0.00029370367941234336, - "loss": 0.0409, + "epoch": 0.02, + "learning_rate": 0.0002967650039789414, + "loss": 0.0518, "step": 8320 }, { - "epoch": 0.04, - "learning_rate": 0.00029369611171932935, - "loss": 0.0406, + "epoch": 0.02, + "learning_rate": 0.0002967611157625699, + "loss": 0.0551, "step": 8330 }, { - "epoch": 0.04, - "learning_rate": 0.00029368854402631533, - "loss": 0.0401, + "epoch": 0.02, + "learning_rate": 0.00029675722754619844, + "loss": 0.0548, "step": 8340 }, { - "epoch": 0.04, - "learning_rate": 0.00029368097633330136, - "loss": 0.0408, + "epoch": 0.02, + "learning_rate": 0.000296753339329827, + "loss": 0.0528, "step": 8350 }, { - "epoch": 0.04, - "learning_rate": 0.00029367340864028734, - "loss": 0.035, + "epoch": 0.02, + "learning_rate": 0.0002967494511134555, + "loss": 0.0499, "step": 8360 }, { - "epoch": 0.04, - "learning_rate": 0.0002936658409472733, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.0002967455628970841, + "loss": 0.0523, "step": 8370 }, { - "epoch": 0.04, - "learning_rate": 0.0002936582732542593, - "loss": 0.0472, + "epoch": 0.02, + "learning_rate": 0.0002967416746807126, + "loss": 0.0498, "step": 8380 }, { - "epoch": 0.04, - "learning_rate": 0.0002936507055612453, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.0002967377864643411, + "loss": 0.0476, "step": 8390 }, { - "epoch": 0.04, - "learning_rate": 0.00029364313786823127, - "loss": 0.0366, + "epoch": 0.02, + "learning_rate": 0.0002967338982479697, + "loss": 0.0445, "step": 8400 }, { - "epoch": 0.04, - "learning_rate": 0.0002936355701752173, - "loss": 0.0368, + "epoch": 0.02, + "learning_rate": 0.0002967300100315982, + "loss": 0.0526, "step": 8410 }, { - "epoch": 0.04, - "learning_rate": 0.0002936280024822033, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.0002967261218152267, + "loss": 0.0556, "step": 8420 }, { - "epoch": 0.04, - "learning_rate": 0.00029362043478918927, - "loss": 0.0373, + "epoch": 0.02, + "learning_rate": 0.0002967222335988553, + "loss": 0.0443, "step": 8430 }, { - "epoch": 0.04, - "learning_rate": 0.00029361286709617525, - "loss": 0.0376, + "epoch": 0.02, + "learning_rate": 0.0002967183453824838, + "loss": 0.0537, "step": 8440 }, { - "epoch": 0.04, - "learning_rate": 0.00029360529940316123, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.00029671445716611237, + "loss": 0.0509, "step": 8450 }, { - "epoch": 0.04, - "learning_rate": 0.0002935977317101472, - "loss": 0.0445, + "epoch": 0.02, + "learning_rate": 0.0002967105689497409, + "loss": 0.0518, "step": 8460 }, { - "epoch": 0.04, - "learning_rate": 0.00029359016401713325, - "loss": 0.1198, + "epoch": 0.02, + "learning_rate": 0.0002967066807333694, + "loss": 0.0426, "step": 8470 }, { - "epoch": 0.04, - "learning_rate": 0.00029358259632411923, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.00029670279251699797, + "loss": 0.0493, "step": 8480 }, { - "epoch": 0.04, - "learning_rate": 0.0002935750286311052, - "loss": 0.0414, + "epoch": 0.02, + "learning_rate": 0.0002966989043006265, + "loss": 0.0565, "step": 8490 }, { - "epoch": 0.04, - "learning_rate": 0.0002935674609380912, - "loss": 0.0396, + "epoch": 0.02, + "learning_rate": 0.00029669501608425505, + "loss": 0.0531, "step": 8500 }, { - "epoch": 0.04, - "learning_rate": 0.0002935598932450772, - "loss": 0.0366, + "epoch": 0.02, + "learning_rate": 0.00029669112786788357, + "loss": 0.0528, "step": 8510 }, { - "epoch": 0.04, - "learning_rate": 0.00029355232555206316, - "loss": 0.0383, + "epoch": 0.02, + "learning_rate": 0.0002966872396515121, + "loss": 0.0464, "step": 8520 }, { - "epoch": 0.04, - "learning_rate": 0.00029354475785904914, - "loss": 0.0715, + "epoch": 0.02, + "learning_rate": 0.00029668335143514065, + "loss": 0.0517, "step": 8530 }, { - "epoch": 0.04, - "learning_rate": 0.0002935371901660352, - "loss": 0.067, + "epoch": 0.02, + "learning_rate": 0.00029667946321876917, + "loss": 0.0459, "step": 8540 }, { - "epoch": 0.04, - "learning_rate": 0.00029352962247302115, - "loss": 0.0371, + "epoch": 0.02, + "learning_rate": 0.0002966755750023977, + "loss": 0.0415, "step": 8550 }, { - "epoch": 0.04, - "learning_rate": 0.00029352205478000714, - "loss": 0.0326, + "epoch": 0.02, + "learning_rate": 0.00029667168678602625, + "loss": 0.0446, "step": 8560 }, { - "epoch": 0.04, - "learning_rate": 0.0002935144870869931, - "loss": 0.0439, + "epoch": 0.02, + "learning_rate": 0.0002966677985696548, + "loss": 0.0402, "step": 8570 }, { - "epoch": 0.04, - "learning_rate": 0.0002935069193939791, - "loss": 0.0387, + "epoch": 0.02, + "learning_rate": 0.00029666391035328333, + "loss": 0.0673, "step": 8580 }, { - "epoch": 0.04, - "learning_rate": 0.0002934993517009651, - "loss": 0.0407, + "epoch": 0.02, + "learning_rate": 0.00029666002213691185, + "loss": 0.0413, "step": 8590 }, { - "epoch": 0.04, - "learning_rate": 0.0002934917840079511, - "loss": 0.0378, + "epoch": 0.02, + "learning_rate": 0.00029665613392054036, + "loss": 0.0442, "step": 8600 }, { - "epoch": 0.04, - "learning_rate": 0.0002934842163149371, - "loss": 0.0389, + "epoch": 0.02, + "learning_rate": 0.00029665224570416893, + "loss": 0.0502, "step": 8610 }, { - "epoch": 0.04, - "learning_rate": 0.0002934766486219231, - "loss": 0.0462, + "epoch": 0.02, + "learning_rate": 0.00029664835748779744, + "loss": 0.0484, "step": 8620 }, { - "epoch": 0.04, - "learning_rate": 0.00029346908092890906, - "loss": 0.0362, + "epoch": 0.02, + "learning_rate": 0.000296644469271426, + "loss": 0.0518, "step": 8630 }, { - "epoch": 0.04, - "learning_rate": 0.00029346151323589504, - "loss": 0.0355, + "epoch": 0.02, + "learning_rate": 0.00029664058105505453, + "loss": 0.0545, "step": 8640 }, { - "epoch": 0.04, - "learning_rate": 0.000293453945542881, - "loss": 0.0501, + "epoch": 0.02, + "learning_rate": 0.0002966366928386831, + "loss": 0.0462, "step": 8650 }, { - "epoch": 0.04, - "learning_rate": 0.000293446377849867, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.0002966328046223116, + "loss": 0.0551, "step": 8660 }, { - "epoch": 0.04, - "learning_rate": 0.00029343881015685304, - "loss": 0.047, + "epoch": 0.02, + "learning_rate": 0.0002966289164059401, + "loss": 0.0452, "step": 8670 }, { - "epoch": 0.04, - "learning_rate": 0.000293431242463839, - "loss": 0.0424, + "epoch": 0.02, + "learning_rate": 0.00029662502818956864, + "loss": 0.0477, "step": 8680 }, { - "epoch": 0.04, - "learning_rate": 0.000293423674770825, - "loss": 0.0412, + "epoch": 0.02, + "learning_rate": 0.0002966211399731972, + "loss": 0.0475, "step": 8690 }, { - "epoch": 0.04, - "learning_rate": 0.000293416107077811, - "loss": 0.0422, + "epoch": 0.02, + "learning_rate": 0.0002966172517568257, + "loss": 0.047, "step": 8700 }, { - "epoch": 0.04, - "learning_rate": 0.00029340853938479697, - "loss": 0.0416, + "epoch": 0.02, + "learning_rate": 0.0002966133635404543, + "loss": 0.046, "step": 8710 }, { - "epoch": 0.04, - "learning_rate": 0.00029340097169178295, - "loss": 0.0439, + "epoch": 0.02, + "learning_rate": 0.0002966094753240828, + "loss": 0.0473, "step": 8720 }, { - "epoch": 0.04, - "learning_rate": 0.000293393403998769, - "loss": 0.0432, + "epoch": 0.02, + "learning_rate": 0.0002966055871077113, + "loss": 0.0446, "step": 8730 }, { - "epoch": 0.04, - "learning_rate": 0.00029338583630575496, - "loss": 0.049, + "epoch": 0.02, + "learning_rate": 0.0002966016988913399, + "loss": 0.0524, "step": 8740 }, { - "epoch": 0.04, - "learning_rate": 0.00029337826861274095, - "loss": 0.0852, + "epoch": 0.02, + "learning_rate": 0.0002965978106749684, + "loss": 0.0517, "step": 8750 }, { - "epoch": 0.04, - "learning_rate": 0.00029337070091972693, - "loss": 0.0452, + "epoch": 0.02, + "learning_rate": 0.0002965939224585969, + "loss": 0.049, "step": 8760 }, { - "epoch": 0.04, - "learning_rate": 0.0002933631332267129, - "loss": 0.0722, + "epoch": 0.02, + "learning_rate": 0.0002965900342422255, + "loss": 0.0457, "step": 8770 }, { - "epoch": 0.04, - "learning_rate": 0.0002933555655336989, - "loss": 0.0839, + "epoch": 0.02, + "learning_rate": 0.00029658614602585406, + "loss": 0.0469, "step": 8780 }, { - "epoch": 0.04, - "learning_rate": 0.0002933479978406849, - "loss": 0.0442, + "epoch": 0.02, + "learning_rate": 0.00029658225780948257, + "loss": 0.0419, "step": 8790 }, { - "epoch": 0.04, - "learning_rate": 0.0002933404301476709, - "loss": 0.044, + "epoch": 0.02, + "learning_rate": 0.0002965783695931111, + "loss": 0.064, "step": 8800 }, { - "epoch": 0.04, - "learning_rate": 0.0002933328624546569, - "loss": 0.041, + "epoch": 0.02, + "learning_rate": 0.0002965744813767396, + "loss": 0.0499, "step": 8810 }, { - "epoch": 0.04, - "learning_rate": 0.00029332529476164287, - "loss": 0.0471, + "epoch": 0.02, + "learning_rate": 0.00029657059316036817, + "loss": 0.0464, "step": 8820 }, { - "epoch": 0.04, - "learning_rate": 0.00029331772706862885, - "loss": 0.037, + "epoch": 0.02, + "learning_rate": 0.0002965667049439967, + "loss": 0.0468, "step": 8830 }, { - "epoch": 0.04, - "learning_rate": 0.00029331015937561483, - "loss": 0.0418, + "epoch": 0.02, + "learning_rate": 0.00029656281672762525, + "loss": 0.0513, "step": 8840 }, { - "epoch": 0.04, - "learning_rate": 0.0002933025916826008, - "loss": 0.0411, + "epoch": 0.02, + "learning_rate": 0.00029655892851125377, + "loss": 0.0491, "step": 8850 }, { - "epoch": 0.04, - "learning_rate": 0.00029329502398958685, - "loss": 0.0448, + "epoch": 0.02, + "learning_rate": 0.00029655504029488234, + "loss": 0.0457, "step": 8860 }, { - "epoch": 0.04, - "learning_rate": 0.00029328745629657283, - "loss": 0.0363, + "epoch": 0.02, + "learning_rate": 0.00029655115207851085, + "loss": 0.0529, "step": 8870 }, { - "epoch": 0.04, - "learning_rate": 0.0002932798886035588, - "loss": 0.0438, + "epoch": 0.02, + "learning_rate": 0.00029654726386213936, + "loss": 0.0471, "step": 8880 }, { - "epoch": 0.04, - "learning_rate": 0.0002932723209105448, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.0002965433756457679, + "loss": 0.0504, "step": 8890 }, { - "epoch": 0.04, - "learning_rate": 0.0002932647532175308, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.00029653948742939645, + "loss": 0.0428, "step": 8900 }, { - "epoch": 0.04, - "learning_rate": 0.00029325718552451676, - "loss": 0.0412, + "epoch": 0.02, + "learning_rate": 0.00029653559921302496, + "loss": 0.0444, "step": 8910 }, { - "epoch": 0.05, - "learning_rate": 0.0002932496178315028, - "loss": 0.0338, + "epoch": 0.02, + "learning_rate": 0.00029653171099665353, + "loss": 0.0504, "step": 8920 }, { - "epoch": 0.05, - "learning_rate": 0.0002932420501384888, - "loss": 0.0347, + "epoch": 0.02, + "learning_rate": 0.00029652782278028205, + "loss": 0.0523, "step": 8930 }, { - "epoch": 0.05, - "learning_rate": 0.00029323448244547476, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.00029652393456391056, + "loss": 0.0561, "step": 8940 }, { - "epoch": 0.05, - "learning_rate": 0.00029322691475246074, - "loss": 0.0343, + "epoch": 0.02, + "learning_rate": 0.00029652004634753913, + "loss": 0.0561, "step": 8950 }, { - "epoch": 0.05, - "learning_rate": 0.0002932193470594467, - "loss": 0.0437, + "epoch": 0.02, + "learning_rate": 0.00029651615813116764, + "loss": 0.0484, "step": 8960 }, { - "epoch": 0.05, - "learning_rate": 0.0002932117793664327, - "loss": 0.04, + "epoch": 0.02, + "learning_rate": 0.0002965122699147962, + "loss": 0.0507, "step": 8970 }, { - "epoch": 0.05, - "learning_rate": 0.00029320421167341874, - "loss": 0.0405, + "epoch": 0.02, + "learning_rate": 0.0002965083816984247, + "loss": 0.0458, "step": 8980 }, { - "epoch": 0.05, - "learning_rate": 0.0002931966439804047, - "loss": 0.0338, + "epoch": 0.02, + "learning_rate": 0.0002965044934820533, + "loss": 0.0392, "step": 8990 }, { - "epoch": 0.05, - "learning_rate": 0.0002931890762873907, - "loss": 0.043, + "epoch": 0.02, + "learning_rate": 0.0002965006052656818, + "loss": 0.0534, "step": 9000 }, { - "epoch": 0.05, - "eval_cer": 0.9145352724435641, - "eval_loss": 0.03075648657977581, - "eval_runtime": 117.5474, - "eval_samples_per_second": 17.014, - "eval_steps_per_second": 4.254, + "epoch": 0.02, + "eval_cer": 0.881751673615864, + "eval_loss": 0.0344533696770668, + "eval_runtime": 107.61, + "eval_samples_per_second": 18.586, + "eval_steps_per_second": 4.646, "step": 9000 }, { - "epoch": 0.05, - "learning_rate": 0.0002931815085943767, - "loss": 0.0435, + "epoch": 0.02, + "learning_rate": 0.0002964967170493103, + "loss": 0.0483, "step": 9010 }, { - "epoch": 0.05, - "learning_rate": 0.00029317394090136266, - "loss": 0.0368, + "epoch": 0.02, + "learning_rate": 0.00029649282883293884, + "loss": 0.048, "step": 9020 }, { - "epoch": 0.05, - "learning_rate": 0.00029316637320834864, - "loss": 0.0428, + "epoch": 0.02, + "learning_rate": 0.0002964889406165674, + "loss": 0.0403, "step": 9030 }, { - "epoch": 0.05, - "learning_rate": 0.0002931588055153346, - "loss": 0.0391, + "epoch": 0.02, + "learning_rate": 0.0002964850524001959, + "loss": 0.0477, "step": 9040 }, { - "epoch": 0.05, - "learning_rate": 0.00029315123782232066, - "loss": 0.0364, + "epoch": 0.02, + "learning_rate": 0.0002964811641838245, + "loss": 0.043, "step": 9050 }, { - "epoch": 0.05, - "learning_rate": 0.00029314367012930664, - "loss": 0.0351, + "epoch": 0.02, + "learning_rate": 0.000296477275967453, + "loss": 0.039, "step": 9060 }, { - "epoch": 0.05, - "learning_rate": 0.0002931361024362926, - "loss": 0.0363, + "epoch": 0.02, + "learning_rate": 0.0002964733877510816, + "loss": 0.0478, "step": 9070 }, { - "epoch": 0.05, - "learning_rate": 0.0002931285347432786, - "loss": 0.0389, + "epoch": 0.02, + "learning_rate": 0.0002964694995347101, + "loss": 0.0464, "step": 9080 }, { - "epoch": 0.05, - "learning_rate": 0.0002931209670502646, - "loss": 0.0447, + "epoch": 0.02, + "learning_rate": 0.0002964656113183386, + "loss": 0.0468, "step": 9090 }, { - "epoch": 0.05, - "learning_rate": 0.00029311339935725057, - "loss": 0.0385, + "epoch": 0.02, + "learning_rate": 0.0002964617231019671, + "loss": 0.0419, "step": 9100 }, { - "epoch": 0.05, - "learning_rate": 0.0002931058316642366, - "loss": 0.0429, + "epoch": 0.02, + "learning_rate": 0.0002964578348855957, + "loss": 0.0466, "step": 9110 }, { - "epoch": 0.05, - "learning_rate": 0.0002930982639712226, - "loss": 0.0399, + "epoch": 0.02, + "learning_rate": 0.00029645394666922426, + "loss": 0.046, "step": 9120 }, { - "epoch": 0.05, - "learning_rate": 0.00029309069627820857, - "loss": 0.0383, + "epoch": 0.02, + "learning_rate": 0.00029645005845285277, + "loss": 0.0473, "step": 9130 }, { - "epoch": 0.05, - "learning_rate": 0.00029308312858519455, - "loss": 0.0303, + "epoch": 0.02, + "learning_rate": 0.0002964461702364813, + "loss": 0.0506, "step": 9140 }, { - "epoch": 0.05, - "learning_rate": 0.00029307556089218053, - "loss": 0.042, + "epoch": 0.02, + "learning_rate": 0.00029644228202010985, + "loss": 0.0387, "step": 9150 }, { - "epoch": 0.05, - "learning_rate": 0.0002930679931991665, - "loss": 0.0415, + "epoch": 0.02, + "learning_rate": 0.00029643839380373837, + "loss": 0.0425, "step": 9160 }, { - "epoch": 0.05, - "learning_rate": 0.0002930604255061525, - "loss": 0.038, + "epoch": 0.02, + "learning_rate": 0.0002964345055873669, + "loss": 0.0444, "step": 9170 }, { - "epoch": 0.05, - "learning_rate": 0.00029305285781313853, - "loss": 0.0375, + "epoch": 0.02, + "learning_rate": 0.00029643061737099545, + "loss": 0.0444, "step": 9180 }, { - "epoch": 0.05, - "learning_rate": 0.0002930452901201245, - "loss": 0.0364, + "epoch": 0.02, + "learning_rate": 0.00029642672915462397, + "loss": 0.0434, "step": 9190 }, { - "epoch": 0.05, - "learning_rate": 0.0002930377224271105, - "loss": 0.0377, + "epoch": 0.02, + "learning_rate": 0.00029642284093825253, + "loss": 0.0576, "step": 9200 }, { - "epoch": 0.05, - "learning_rate": 0.00029303015473409647, - "loss": 0.0382, + "epoch": 0.02, + "learning_rate": 0.00029641895272188105, + "loss": 0.0476, "step": 9210 }, { - "epoch": 0.05, - "learning_rate": 0.00029302258704108245, - "loss": 0.0425, + "epoch": 0.02, + "learning_rate": 0.00029641506450550956, + "loss": 0.0518, "step": 9220 }, { - "epoch": 0.05, - "learning_rate": 0.00029301501934806843, - "loss": 0.0377, + "epoch": 0.02, + "learning_rate": 0.0002964111762891381, + "loss": 0.0487, "step": 9230 }, { - "epoch": 0.05, - "learning_rate": 0.00029300745165505447, - "loss": 0.0442, + "epoch": 0.02, + "learning_rate": 0.00029640728807276665, + "loss": 0.0588, "step": 9240 }, { - "epoch": 0.05, - "learning_rate": 0.00029299988396204045, - "loss": 0.0396, + "epoch": 0.02, + "learning_rate": 0.00029640339985639516, + "loss": 0.0524, "step": 9250 }, { - "epoch": 0.05, - "learning_rate": 0.00029299231626902643, - "loss": 0.0383, + "epoch": 0.02, + "learning_rate": 0.00029639951164002373, + "loss": 0.0535, "step": 9260 }, { - "epoch": 0.05, - "learning_rate": 0.0002929847485760124, - "loss": 0.0436, + "epoch": 0.02, + "learning_rate": 0.00029639562342365224, + "loss": 0.05, "step": 9270 }, { - "epoch": 0.05, - "learning_rate": 0.0002929771808829984, - "loss": 0.0385, + "epoch": 0.02, + "learning_rate": 0.0002963917352072808, + "loss": 0.0423, "step": 9280 }, { - "epoch": 0.05, - "learning_rate": 0.0002929696131899844, - "loss": 0.0407, + "epoch": 0.02, + "learning_rate": 0.00029638784699090933, + "loss": 0.0382, "step": 9290 }, { - "epoch": 0.05, - "learning_rate": 0.0002929620454969704, - "loss": 0.0399, + "epoch": 0.02, + "learning_rate": 0.00029638395877453784, + "loss": 0.0467, "step": 9300 }, { - "epoch": 0.05, - "learning_rate": 0.0002929544778039564, - "loss": 0.0396, + "epoch": 0.02, + "learning_rate": 0.00029638007055816636, + "loss": 0.0402, "step": 9310 }, { - "epoch": 0.05, - "learning_rate": 0.0002929469101109424, - "loss": 0.0334, + "epoch": 0.02, + "learning_rate": 0.0002963761823417949, + "loss": 0.0425, "step": 9320 }, { - "epoch": 0.05, - "learning_rate": 0.00029293934241792836, - "loss": 0.0379, + "epoch": 0.02, + "learning_rate": 0.0002963722941254235, + "loss": 0.0439, "step": 9330 }, { - "epoch": 0.05, - "learning_rate": 0.00029293177472491434, - "loss": 0.034, + "epoch": 0.02, + "learning_rate": 0.000296368405909052, + "loss": 0.0444, "step": 9340 }, { - "epoch": 0.05, - "learning_rate": 0.0002929242070319003, - "loss": 0.0384, + "epoch": 0.02, + "learning_rate": 0.0002963645176926805, + "loss": 0.046, "step": 9350 }, { - "epoch": 0.05, - "learning_rate": 0.0002929166393388863, - "loss": 0.0372, + "epoch": 0.02, + "learning_rate": 0.0002963606294763091, + "loss": 0.0374, "step": 9360 }, { - "epoch": 0.05, - "learning_rate": 0.00029290907164587234, - "loss": 0.0371, + "epoch": 0.02, + "learning_rate": 0.0002963567412599376, + "loss": 0.0395, "step": 9370 }, { - "epoch": 0.05, - "learning_rate": 0.0002929015039528583, - "loss": 0.0378, + "epoch": 0.02, + "learning_rate": 0.0002963528530435661, + "loss": 0.0458, "step": 9380 }, { - "epoch": 0.05, - "learning_rate": 0.0002928939362598443, - "loss": 0.0362, + "epoch": 0.02, + "learning_rate": 0.0002963489648271947, + "loss": 0.0361, "step": 9390 }, { - "epoch": 0.05, - "learning_rate": 0.0002928863685668303, - "loss": 0.0385, + "epoch": 0.02, + "learning_rate": 0.0002963450766108232, + "loss": 0.0402, "step": 9400 }, { - "epoch": 0.05, - "learning_rate": 0.00029287880087381626, - "loss": 0.0355, + "epoch": 0.02, + "learning_rate": 0.0002963411883944518, + "loss": 0.044, "step": 9410 }, { - "epoch": 0.05, - "learning_rate": 0.00029287123318080224, - "loss": 0.0418, + "epoch": 0.02, + "learning_rate": 0.0002963373001780803, + "loss": 0.0361, "step": 9420 }, { - "epoch": 0.05, - "learning_rate": 0.0002928636654877882, - "loss": 0.0369, + "epoch": 0.02, + "learning_rate": 0.0002963334119617088, + "loss": 0.0427, "step": 9430 }, { - "epoch": 0.05, - "learning_rate": 0.0002928560977947742, - "loss": 0.0423, + "epoch": 0.02, + "learning_rate": 0.0002963295237453373, + "loss": 0.048, "step": 9440 }, { - "epoch": 0.05, - "learning_rate": 0.0002928485301017602, - "loss": 0.0349, + "epoch": 0.02, + "learning_rate": 0.0002963256355289659, + "loss": 0.0448, "step": 9450 }, { - "epoch": 0.05, - "learning_rate": 0.00029284096240874617, - "loss": 0.0379, + "epoch": 0.02, + "learning_rate": 0.0002963217473125944, + "loss": 0.0466, "step": 9460 }, { - "epoch": 0.05, - "learning_rate": 0.0002928333947157322, - "loss": 0.0444, + "epoch": 0.02, + "learning_rate": 0.00029631785909622297, + "loss": 0.0373, "step": 9470 }, { - "epoch": 0.05, - "learning_rate": 0.0002928258270227182, - "loss": 0.0357, + "epoch": 0.02, + "learning_rate": 0.0002963139708798515, + "loss": 0.0478, "step": 9480 }, { - "epoch": 0.05, - "learning_rate": 0.00029281825932970417, - "loss": 0.0495, + "epoch": 0.02, + "learning_rate": 0.00029631008266348005, + "loss": 0.0394, "step": 9490 }, { - "epoch": 0.05, - "learning_rate": 0.00029281069163669015, - "loss": 0.0384, + "epoch": 0.02, + "learning_rate": 0.00029630619444710857, + "loss": 0.0433, "step": 9500 }, { - "epoch": 0.05, - "learning_rate": 0.00029280312394367613, - "loss": 0.0448, + "epoch": 0.02, + "learning_rate": 0.0002963023062307371, + "loss": 0.0424, "step": 9510 }, { - "epoch": 0.05, - "learning_rate": 0.0002927955562506621, - "loss": 0.0382, + "epoch": 0.02, + "learning_rate": 0.00029629841801436565, + "loss": 0.0388, "step": 9520 }, { - "epoch": 0.05, - "learning_rate": 0.00029278798855764815, - "loss": 0.0397, + "epoch": 0.02, + "learning_rate": 0.00029629452979799416, + "loss": 0.0337, "step": 9530 }, { - "epoch": 0.05, - "learning_rate": 0.00029278042086463413, - "loss": 0.0354, + "epoch": 0.02, + "learning_rate": 0.00029629064158162273, + "loss": 0.0448, "step": 9540 }, { - "epoch": 0.05, - "learning_rate": 0.0002927728531716201, - "loss": 0.042, + "epoch": 0.02, + "learning_rate": 0.00029628675336525125, + "loss": 0.0458, "step": 9550 }, { - "epoch": 0.05, - "learning_rate": 0.0002927652854786061, - "loss": 0.0458, + "epoch": 0.02, + "learning_rate": 0.00029628286514887976, + "loss": 0.0496, "step": 9560 }, { - "epoch": 0.05, - "learning_rate": 0.0002927577177855921, - "loss": 0.0349, + "epoch": 0.02, + "learning_rate": 0.00029627897693250833, + "loss": 0.0531, "step": 9570 }, { - "epoch": 0.05, - "learning_rate": 0.00029275015009257806, - "loss": 0.0386, + "epoch": 0.02, + "learning_rate": 0.00029627508871613685, + "loss": 0.0426, "step": 9580 }, { - "epoch": 0.05, - "learning_rate": 0.00029274258239956404, - "loss": 0.0407, + "epoch": 0.02, + "learning_rate": 0.00029627120049976536, + "loss": 0.0413, "step": 9590 }, { - "epoch": 0.05, - "learning_rate": 0.0002927350147065501, - "loss": 0.0397, + "epoch": 0.02, + "learning_rate": 0.00029626731228339393, + "loss": 0.0413, "step": 9600 }, { - "epoch": 0.05, - "learning_rate": 0.00029272744701353605, - "loss": 0.0394, + "epoch": 0.02, + "learning_rate": 0.00029626342406702244, + "loss": 0.0465, "step": 9610 }, { - "epoch": 0.05, - "learning_rate": 0.00029271987932052204, - "loss": 0.043, + "epoch": 0.02, + "learning_rate": 0.000296259535850651, + "loss": 0.0445, "step": 9620 }, { - "epoch": 0.05, - "learning_rate": 0.000292712311627508, - "loss": 0.0395, + "epoch": 0.02, + "learning_rate": 0.0002962556476342795, + "loss": 0.049, "step": 9630 }, { - "epoch": 0.05, - "learning_rate": 0.000292704743934494, - "loss": 0.0401, + "epoch": 0.02, + "learning_rate": 0.00029625175941790804, + "loss": 0.0439, "step": 9640 }, { - "epoch": 0.05, - "learning_rate": 0.00029269717624148, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.0002962478712015366, + "loss": 0.0474, "step": 9650 }, { - "epoch": 0.05, - "learning_rate": 0.000292689608548466, - "loss": 0.0458, + "epoch": 0.03, + "learning_rate": 0.0002962439829851651, + "loss": 0.0584, "step": 9660 }, { - "epoch": 0.05, - "learning_rate": 0.000292682040855452, - "loss": 0.0492, + "epoch": 0.03, + "learning_rate": 0.0002962400947687937, + "loss": 0.0565, "step": 9670 }, { - "epoch": 0.05, - "learning_rate": 0.000292674473162438, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.0002962362065524222, + "loss": 0.0364, "step": 9680 }, { - "epoch": 0.05, - "learning_rate": 0.00029266690546942396, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.0002962323183360507, + "loss": 0.045, "step": 9690 }, { - "epoch": 0.05, - "learning_rate": 0.00029265933777640994, - "loss": 0.0515, + "epoch": 0.03, + "learning_rate": 0.0002962284301196793, + "loss": 0.0438, "step": 9700 }, { - "epoch": 0.05, - "learning_rate": 0.0002926517700833959, - "loss": 0.0445, + "epoch": 0.03, + "learning_rate": 0.0002962245419033078, + "loss": 0.0434, "step": 9710 }, { - "epoch": 0.05, - "learning_rate": 0.00029264420239038196, - "loss": 0.0406, + "epoch": 0.03, + "learning_rate": 0.0002962206536869363, + "loss": 0.0518, "step": 9720 }, { - "epoch": 0.05, - "learning_rate": 0.00029263663469736794, - "loss": 0.0414, + "epoch": 0.03, + "learning_rate": 0.0002962167654705649, + "loss": 0.055, "step": 9730 }, { - "epoch": 0.05, - "learning_rate": 0.0002926290670043539, - "loss": 0.0355, + "epoch": 0.03, + "learning_rate": 0.0002962128772541934, + "loss": 0.0492, "step": 9740 }, { - "epoch": 0.05, - "learning_rate": 0.0002926214993113399, - "loss": 0.0383, + "epoch": 0.03, + "learning_rate": 0.00029620898903782197, + "loss": 0.0436, "step": 9750 }, { - "epoch": 0.05, - "learning_rate": 0.0002926139316183259, - "loss": 0.0398, + "epoch": 0.03, + "learning_rate": 0.0002962051008214505, + "loss": 0.0577, "step": 9760 }, { - "epoch": 0.05, - "learning_rate": 0.00029260636392531187, - "loss": 0.0456, + "epoch": 0.03, + "learning_rate": 0.000296201212605079, + "loss": 0.0458, "step": 9770 }, { - "epoch": 0.05, - "learning_rate": 0.00029259879623229785, - "loss": 0.0414, + "epoch": 0.03, + "learning_rate": 0.00029619732438870757, + "loss": 0.1094, "step": 9780 }, { - "epoch": 0.05, - "learning_rate": 0.0002925912285392839, - "loss": 0.0428, + "epoch": 0.03, + "learning_rate": 0.0002961934361723361, + "loss": 0.0492, "step": 9790 }, { - "epoch": 0.05, - "learning_rate": 0.00029258366084626986, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.0002961895479559646, + "loss": 0.0467, "step": 9800 }, { - "epoch": 0.05, - "learning_rate": 0.00029257609315325585, - "loss": 0.0365, + "epoch": 0.03, + "learning_rate": 0.00029618565973959317, + "loss": 0.0528, "step": 9810 }, { - "epoch": 0.05, - "learning_rate": 0.00029256852546024183, - "loss": 0.0341, + "epoch": 0.03, + "learning_rate": 0.00029618177152322174, + "loss": 0.0452, "step": 9820 }, { - "epoch": 0.05, - "learning_rate": 0.0002925609577672278, - "loss": 0.0397, + "epoch": 0.03, + "learning_rate": 0.00029617788330685025, + "loss": 0.0534, "step": 9830 }, { - "epoch": 0.05, - "learning_rate": 0.0002925533900742138, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.00029617399509047877, + "loss": 0.0445, "step": 9840 }, { - "epoch": 0.05, - "learning_rate": 0.0002925458223811998, - "loss": 0.0411, + "epoch": 0.03, + "learning_rate": 0.0002961701068741073, + "loss": 0.0444, "step": 9850 }, { - "epoch": 0.05, - "learning_rate": 0.0002925382546881858, - "loss": 0.039, + "epoch": 0.03, + "learning_rate": 0.00029616621865773585, + "loss": 0.0468, "step": 9860 }, { - "epoch": 0.05, - "learning_rate": 0.0002925306869951718, - "loss": 0.0385, + "epoch": 0.03, + "learning_rate": 0.00029616233044136436, + "loss": 0.0556, "step": 9870 }, { - "epoch": 0.05, - "learning_rate": 0.00029252311930215777, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.00029615844222499293, + "loss": 0.0481, "step": 9880 }, { - "epoch": 0.05, - "learning_rate": 0.00029251555160914375, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.00029615455400862145, + "loss": 0.0404, "step": 9890 }, { - "epoch": 0.05, - "learning_rate": 0.00029250798391612973, - "loss": 0.0343, + "epoch": 0.03, + "learning_rate": 0.00029615066579225, + "loss": 0.0458, "step": 9900 }, { - "epoch": 0.05, - "learning_rate": 0.0002925004162231157, - "loss": 0.0382, + "epoch": 0.03, + "learning_rate": 0.00029614677757587853, + "loss": 0.0492, "step": 9910 }, { - "epoch": 0.05, - "learning_rate": 0.00029249284853010175, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.00029614288935950704, + "loss": 0.0374, "step": 9920 }, { - "epoch": 0.05, - "learning_rate": 0.00029248528083708773, - "loss": 0.0409, + "epoch": 0.03, + "learning_rate": 0.00029613900114313556, + "loss": 0.044, "step": 9930 }, { - "epoch": 0.05, - "learning_rate": 0.0002924777131440737, - "loss": 0.0425, + "epoch": 0.03, + "learning_rate": 0.00029613511292676413, + "loss": 0.0472, "step": 9940 }, { - "epoch": 0.05, - "learning_rate": 0.0002924701454510597, - "loss": 0.0364, + "epoch": 0.03, + "learning_rate": 0.00029613122471039264, + "loss": 0.0439, "step": 9950 }, { - "epoch": 0.05, - "learning_rate": 0.0002924625777580457, - "loss": 0.0376, + "epoch": 0.03, + "learning_rate": 0.0002961273364940212, + "loss": 0.0491, "step": 9960 }, { - "epoch": 0.05, - "learning_rate": 0.00029245501006503166, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.0002961234482776497, + "loss": 0.0458, "step": 9970 }, { - "epoch": 0.05, - "learning_rate": 0.0002924474423720177, - "loss": 0.0385, + "epoch": 0.03, + "learning_rate": 0.00029611956006127824, + "loss": 0.0467, "step": 9980 }, { - "epoch": 0.05, - "learning_rate": 0.0002924398746790037, - "loss": 0.0304, + "epoch": 0.03, + "learning_rate": 0.0002961156718449068, + "loss": 0.0472, "step": 9990 }, { - "epoch": 0.05, - "learning_rate": 0.00029243230698598966, - "loss": 0.0413, + "epoch": 0.03, + "learning_rate": 0.0002961117836285353, + "loss": 0.0457, "step": 10000 }, { - "epoch": 0.05, - "eval_cer": 0.9145003381830497, - "eval_loss": 0.02770831808447838, - "eval_runtime": 117.615, - "eval_samples_per_second": 17.005, - "eval_steps_per_second": 4.251, + "epoch": 0.03, + "eval_cer": 0.8818412503796516, + "eval_loss": 0.03403039649128914, + "eval_runtime": 107.5829, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.648, "step": 10000 }, { - "epoch": 0.05, - "learning_rate": 0.00029242473929297564, - "loss": 0.0328, + "epoch": 0.03, + "learning_rate": 0.00029610789541216384, + "loss": 0.0435, "step": 10010 }, { - "epoch": 0.05, - "learning_rate": 0.0002924171715999616, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.0002961040071957924, + "loss": 0.0492, "step": 10020 }, { - "epoch": 0.05, - "learning_rate": 0.0002924096039069476, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.000296100118979421, + "loss": 0.0422, "step": 10030 }, { - "epoch": 0.05, - "learning_rate": 0.00029240203621393364, - "loss": 0.0341, + "epoch": 0.03, + "learning_rate": 0.0002960962307630495, + "loss": 0.0445, "step": 10040 }, { - "epoch": 0.05, - "learning_rate": 0.0002923944685209196, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.000296092342546678, + "loss": 0.0527, "step": 10050 }, { - "epoch": 0.05, - "learning_rate": 0.0002923869008279056, - "loss": 0.046, + "epoch": 0.03, + "learning_rate": 0.0002960884543303065, + "loss": 0.0493, "step": 10060 }, { - "epoch": 0.05, - "learning_rate": 0.0002923793331348916, - "loss": 0.0378, + "epoch": 0.03, + "learning_rate": 0.0002960845661139351, + "loss": 0.0456, "step": 10070 }, { - "epoch": 0.05, - "learning_rate": 0.00029237176544187756, - "loss": 0.039, + "epoch": 0.03, + "learning_rate": 0.0002960806778975636, + "loss": 0.0446, "step": 10080 }, { - "epoch": 0.05, - "learning_rate": 0.00029236419774886354, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.00029607678968119217, + "loss": 0.0457, "step": 10090 }, { - "epoch": 0.05, - "learning_rate": 0.0002923566300558495, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.0002960729014648207, + "loss": 0.0473, "step": 10100 }, { - "epoch": 0.05, - "learning_rate": 0.00029234906236283556, - "loss": 0.039, + "epoch": 0.03, + "learning_rate": 0.00029606901324844925, + "loss": 0.0488, "step": 10110 }, { - "epoch": 0.05, - "learning_rate": 0.00029234149466982154, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.00029606512503207777, + "loss": 0.0425, "step": 10120 }, { - "epoch": 0.05, - "learning_rate": 0.0002923339269768075, - "loss": 0.0336, + "epoch": 0.03, + "learning_rate": 0.0002960612368157063, + "loss": 0.0434, "step": 10130 }, { - "epoch": 0.05, - "learning_rate": 0.0002923263592837935, - "loss": 0.0427, + "epoch": 0.03, + "learning_rate": 0.0002960573485993348, + "loss": 0.0509, "step": 10140 }, { - "epoch": 0.05, - "learning_rate": 0.0002923187915907795, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.00029605346038296337, + "loss": 0.0386, "step": 10150 }, { - "epoch": 0.05, - "learning_rate": 0.00029231122389776547, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.00029604957216659194, + "loss": 0.0485, "step": 10160 }, { - "epoch": 0.05, - "learning_rate": 0.0002923036562047515, - "loss": 0.0341, + "epoch": 0.03, + "learning_rate": 0.00029604568395022045, + "loss": 0.0456, "step": 10170 }, { - "epoch": 0.05, - "learning_rate": 0.0002922960885117375, - "loss": 0.0412, + "epoch": 0.03, + "learning_rate": 0.00029604179573384896, + "loss": 0.0443, "step": 10180 }, { - "epoch": 0.05, - "learning_rate": 0.00029228852081872347, - "loss": 0.0317, + "epoch": 0.03, + "learning_rate": 0.0002960379075174775, + "loss": 0.044, "step": 10190 }, { - "epoch": 0.05, - "learning_rate": 0.00029228095312570945, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.00029603401930110605, + "loss": 0.0485, "step": 10200 }, { - "epoch": 0.05, - "learning_rate": 0.00029227338543269543, - "loss": 0.0357, + "epoch": 0.03, + "learning_rate": 0.00029603013108473456, + "loss": 0.0542, "step": 10210 }, { - "epoch": 0.05, - "learning_rate": 0.0002922658177396814, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.00029602624286836313, + "loss": 0.05, "step": 10220 }, { - "epoch": 0.05, - "learning_rate": 0.00029225825004666745, - "loss": 0.0419, + "epoch": 0.03, + "learning_rate": 0.00029602235465199165, + "loss": 0.0417, "step": 10230 }, { - "epoch": 0.05, - "learning_rate": 0.00029225068235365343, - "loss": 0.0327, + "epoch": 0.03, + "learning_rate": 0.0002960184664356202, + "loss": 0.0518, "step": 10240 }, { - "epoch": 0.05, - "learning_rate": 0.0002922431146606394, - "loss": 0.0337, + "epoch": 0.03, + "learning_rate": 0.00029601457821924873, + "loss": 0.0441, "step": 10250 }, { - "epoch": 0.05, - "learning_rate": 0.0002922355469676254, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.00029601069000287724, + "loss": 0.0403, "step": 10260 }, { - "epoch": 0.05, - "learning_rate": 0.00029222797927461137, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.00029600680178650576, + "loss": 0.0421, "step": 10270 }, { - "epoch": 0.05, - "learning_rate": 0.00029222041158159735, - "loss": 0.035, + "epoch": 0.03, + "learning_rate": 0.0002960029135701343, + "loss": 0.0424, "step": 10280 }, { - "epoch": 0.05, - "learning_rate": 0.00029221284388858333, - "loss": 0.0343, + "epoch": 0.03, + "learning_rate": 0.00029599902535376284, + "loss": 0.0642, "step": 10290 }, { - "epoch": 0.05, - "learning_rate": 0.00029220527619556937, - "loss": 0.0481, + "epoch": 0.03, + "learning_rate": 0.0002959951371373914, + "loss": 0.0554, "step": 10300 }, { - "epoch": 0.05, - "learning_rate": 0.00029219770850255535, - "loss": 0.0382, + "epoch": 0.03, + "learning_rate": 0.0002959912489210199, + "loss": 0.0489, "step": 10310 }, { - "epoch": 0.05, - "learning_rate": 0.00029219014080954133, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.0002959873607046485, + "loss": 0.0455, "step": 10320 }, { - "epoch": 0.05, - "learning_rate": 0.0002921825731165273, - "loss": 0.0422, + "epoch": 0.03, + "learning_rate": 0.000295983472488277, + "loss": 0.0445, "step": 10330 }, { - "epoch": 0.05, - "learning_rate": 0.0002921750054235133, - "loss": 0.0343, + "epoch": 0.03, + "learning_rate": 0.0002959795842719055, + "loss": 0.0461, "step": 10340 }, { - "epoch": 0.05, - "learning_rate": 0.0002921674377304993, + "epoch": 0.03, + "learning_rate": 0.00029597569605553404, "loss": 0.046, "step": 10350 }, { - "epoch": 0.05, - "learning_rate": 0.0002921598700374853, - "loss": 0.0407, + "epoch": 0.03, + "learning_rate": 0.0002959718078391626, + "loss": 0.0435, "step": 10360 }, { - "epoch": 0.05, - "learning_rate": 0.0002921523023444713, - "loss": 0.0364, + "epoch": 0.03, + "learning_rate": 0.0002959679196227912, + "loss": 0.0499, "step": 10370 }, { - "epoch": 0.05, - "learning_rate": 0.0002921447346514573, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.0002959640314064197, + "loss": 0.0392, "step": 10380 }, { - "epoch": 0.05, - "learning_rate": 0.00029213716695844326, - "loss": 0.0338, + "epoch": 0.03, + "learning_rate": 0.0002959601431900482, + "loss": 0.0497, "step": 10390 }, { - "epoch": 0.05, - "learning_rate": 0.00029212959926542924, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.00029595625497367677, + "loss": 0.0461, "step": 10400 }, { - "epoch": 0.05, - "learning_rate": 0.0002921220315724152, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.0002959523667573053, + "loss": 0.0398, "step": 10410 }, { - "epoch": 0.05, - "learning_rate": 0.0002921144638794012, - "loss": 0.0357, + "epoch": 0.03, + "learning_rate": 0.0002959484785409338, + "loss": 0.0432, "step": 10420 }, { - "epoch": 0.05, - "learning_rate": 0.00029210689618638724, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.00029594459032456237, + "loss": 0.045, "step": 10430 }, { - "epoch": 0.05, - "learning_rate": 0.0002920993284933732, - "loss": 0.0356, + "epoch": 0.03, + "learning_rate": 0.0002959407021081909, + "loss": 0.0415, "step": 10440 }, { - "epoch": 0.05, - "learning_rate": 0.0002920917608003592, - "loss": 0.0394, + "epoch": 0.03, + "learning_rate": 0.00029593681389181945, + "loss": 0.044, "step": 10450 }, { - "epoch": 0.05, - "learning_rate": 0.0002920841931073452, - "loss": 0.0376, + "epoch": 0.03, + "learning_rate": 0.00029593292567544797, + "loss": 0.0503, "step": 10460 }, { - "epoch": 0.05, - "learning_rate": 0.00029207662541433116, - "loss": 0.0374, + "epoch": 0.03, + "learning_rate": 0.0002959290374590765, + "loss": 0.0544, "step": 10470 }, { - "epoch": 0.05, - "learning_rate": 0.00029206905772131714, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.000295925149242705, + "loss": 0.0492, "step": 10480 }, { - "epoch": 0.05, - "learning_rate": 0.0002920614900283032, - "loss": 0.0313, + "epoch": 0.03, + "learning_rate": 0.00029592126102633357, + "loss": 0.0691, "step": 10490 }, { - "epoch": 0.05, - "learning_rate": 0.00029205392233528916, - "loss": 0.0328, + "epoch": 0.03, + "learning_rate": 0.0002959173728099621, + "loss": 0.0529, "step": 10500 }, { - "epoch": 0.05, - "learning_rate": 0.00029204635464227514, - "loss": 0.0339, + "epoch": 0.03, + "learning_rate": 0.00029591348459359065, + "loss": 0.0467, "step": 10510 }, { - "epoch": 0.05, - "learning_rate": 0.0002920387869492611, - "loss": 0.03, + "epoch": 0.03, + "learning_rate": 0.00029590959637721916, + "loss": 0.0417, "step": 10520 }, { - "epoch": 0.05, - "learning_rate": 0.0002920312192562471, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.00029590570816084773, + "loss": 0.0425, "step": 10530 }, { - "epoch": 0.05, - "learning_rate": 0.0002920236515632331, - "loss": 0.035, + "epoch": 0.03, + "learning_rate": 0.00029590181994447625, + "loss": 0.0381, "step": 10540 }, { - "epoch": 0.05, - "learning_rate": 0.0002920160838702191, - "loss": 0.0311, + "epoch": 0.03, + "learning_rate": 0.00029589793172810476, + "loss": 0.0384, "step": 10550 }, { - "epoch": 0.05, - "learning_rate": 0.0002920085161772051, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.00029589404351173333, + "loss": 0.044, "step": 10560 }, { - "epoch": 0.05, - "learning_rate": 0.0002920009484841911, - "loss": 0.0373, + "epoch": 0.03, + "learning_rate": 0.00029589015529536184, + "loss": 0.0468, "step": 10570 }, { - "epoch": 0.05, - "learning_rate": 0.00029199338079117707, - "loss": 0.0408, + "epoch": 0.03, + "learning_rate": 0.0002958862670789904, + "loss": 0.0444, "step": 10580 }, { - "epoch": 0.05, - "learning_rate": 0.00029198581309816305, - "loss": 0.0406, + "epoch": 0.03, + "learning_rate": 0.00029588237886261893, + "loss": 0.0466, "step": 10590 }, { - "epoch": 0.05, - "learning_rate": 0.00029197824540514903, - "loss": 0.039, + "epoch": 0.03, + "learning_rate": 0.00029587849064624744, + "loss": 0.0451, "step": 10600 }, { - "epoch": 0.05, - "learning_rate": 0.000291970677712135, - "loss": 0.0318, + "epoch": 0.03, + "learning_rate": 0.000295874602429876, + "loss": 0.0418, "step": 10610 }, { - "epoch": 0.05, - "learning_rate": 0.00029196311001912105, - "loss": 0.0357, + "epoch": 0.03, + "learning_rate": 0.0002958707142135045, + "loss": 0.0418, "step": 10620 }, { - "epoch": 0.05, - "learning_rate": 0.00029195554232610703, - "loss": 0.0354, + "epoch": 0.03, + "learning_rate": 0.00029586682599713304, + "loss": 0.0424, "step": 10630 }, { - "epoch": 0.05, - "learning_rate": 0.000291947974633093, - "loss": 0.0331, + "epoch": 0.03, + "learning_rate": 0.0002958629377807616, + "loss": 0.0436, "step": 10640 }, { - "epoch": 0.05, - "learning_rate": 0.000291940406940079, - "loss": 0.0322, + "epoch": 0.03, + "learning_rate": 0.0002958590495643901, + "loss": 0.0419, "step": 10650 }, { - "epoch": 0.05, - "learning_rate": 0.000291932839247065, - "loss": 0.0391, + "epoch": 0.03, + "learning_rate": 0.0002958551613480187, + "loss": 0.0452, "step": 10660 }, { - "epoch": 0.05, - "learning_rate": 0.00029192527155405095, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.0002958512731316472, + "loss": 0.0489, "step": 10670 }, { - "epoch": 0.05, - "learning_rate": 0.000291917703861037, - "loss": 0.0335, + "epoch": 0.03, + "learning_rate": 0.0002958473849152757, + "loss": 0.0448, "step": 10680 }, { - "epoch": 0.05, - "learning_rate": 0.0002919101361680229, - "loss": 0.0336, + "epoch": 0.03, + "learning_rate": 0.00029584349669890424, + "loss": 0.0521, "step": 10690 }, { - "epoch": 0.05, - "learning_rate": 0.0002919025684750089, - "loss": 0.0392, + "epoch": 0.03, + "learning_rate": 0.0002958396084825328, + "loss": 0.0412, "step": 10700 }, { - "epoch": 0.05, - "learning_rate": 0.0002918950007819949, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.00029583572026616137, + "loss": 0.0454, "step": 10710 }, { - "epoch": 0.05, - "learning_rate": 0.0002918874330889809, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.0002958318320497899, + "loss": 0.0402, "step": 10720 }, { - "epoch": 0.05, - "learning_rate": 0.0002918798653959669, - "loss": 0.037, + "epoch": 0.03, + "learning_rate": 0.0002958279438334184, + "loss": 0.0442, "step": 10730 }, { - "epoch": 0.05, - "learning_rate": 0.0002918722977029529, - "loss": 0.042, + "epoch": 0.03, + "learning_rate": 0.00029582405561704697, + "loss": 0.0503, "step": 10740 }, { - "epoch": 0.05, - "learning_rate": 0.00029186473000993886, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.0002958201674006755, + "loss": 0.0504, "step": 10750 }, { - "epoch": 0.05, - "learning_rate": 0.00029185716231692484, - "loss": 0.0392, + "epoch": 0.03, + "learning_rate": 0.000295816279184304, + "loss": 0.0433, "step": 10760 }, { - "epoch": 0.05, - "learning_rate": 0.0002918495946239108, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.00029581239096793257, + "loss": 0.0408, "step": 10770 }, { - "epoch": 0.05, - "learning_rate": 0.00029184202693089686, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.0002958085027515611, + "loss": 0.0396, "step": 10780 }, { - "epoch": 0.05, - "learning_rate": 0.00029183445923788284, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.00029580461453518965, + "loss": 0.0405, "step": 10790 }, { - "epoch": 0.05, - "learning_rate": 0.0002918268915448688, - "loss": 0.0321, + "epoch": 0.03, + "learning_rate": 0.00029580072631881817, + "loss": 0.0524, "step": 10800 }, { - "epoch": 0.05, - "learning_rate": 0.0002918193238518548, - "loss": 0.0346, + "epoch": 0.03, + "learning_rate": 0.0002957968381024467, + "loss": 0.0415, "step": 10810 }, { - "epoch": 0.05, - "learning_rate": 0.0002918117561588408, - "loss": 0.0375, + "epoch": 0.03, + "learning_rate": 0.00029579294988607525, + "loss": 0.0455, "step": 10820 }, { - "epoch": 0.05, - "learning_rate": 0.00029180418846582677, - "loss": 0.0344, + "epoch": 0.03, + "learning_rate": 0.00029578906166970376, + "loss": 0.0509, "step": 10830 }, { - "epoch": 0.05, - "learning_rate": 0.00029179662077281275, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.0002957851734533323, + "loss": 0.0473, "step": 10840 }, { - "epoch": 0.05, - "learning_rate": 0.0002917890530797988, - "loss": 0.0319, + "epoch": 0.03, + "learning_rate": 0.00029578128523696085, + "loss": 0.0423, "step": 10850 }, { - "epoch": 0.05, - "learning_rate": 0.00029178148538678476, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.0002957773970205894, + "loss": 0.0435, "step": 10860 }, { - "epoch": 0.05, - "learning_rate": 0.00029177391769377075, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.00029577350880421793, + "loss": 0.0502, "step": 10870 }, { - "epoch": 0.05, - "learning_rate": 0.00029176635000075673, - "loss": 0.0368, + "epoch": 0.03, + "learning_rate": 0.00029576962058784645, + "loss": 0.0432, "step": 10880 }, { - "epoch": 0.05, - "learning_rate": 0.0002917587823077427, - "loss": 0.0322, + "epoch": 0.03, + "learning_rate": 0.00029576573237147496, + "loss": 0.0449, "step": 10890 }, { - "epoch": 0.05, - "learning_rate": 0.0002917512146147287, - "loss": 0.0395, + "epoch": 0.03, + "learning_rate": 0.00029576184415510353, + "loss": 0.0394, "step": 10900 }, { - "epoch": 0.06, - "learning_rate": 0.0002917436469217147, - "loss": 0.0388, + "epoch": 0.03, + "learning_rate": 0.00029575795593873204, + "loss": 0.048, "step": 10910 }, { - "epoch": 0.06, - "learning_rate": 0.0002917360792287007, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.0002957540677223606, + "loss": 0.0475, "step": 10920 }, { - "epoch": 0.06, - "learning_rate": 0.0002917285115356867, - "loss": 0.0386, + "epoch": 0.03, + "learning_rate": 0.0002957501795059891, + "loss": 0.0491, "step": 10930 }, { - "epoch": 0.06, - "learning_rate": 0.00029172094384267267, - "loss": 0.0409, + "epoch": 0.03, + "learning_rate": 0.00029574629128961764, + "loss": 0.0499, "step": 10940 }, { - "epoch": 0.06, - "learning_rate": 0.00029171337614965865, - "loss": 0.0367, + "epoch": 0.03, + "learning_rate": 0.0002957424030732462, + "loss": 0.0462, "step": 10950 }, { - "epoch": 0.06, - "learning_rate": 0.00029170580845664463, - "loss": 0.0355, + "epoch": 0.03, + "learning_rate": 0.0002957385148568747, + "loss": 0.0449, "step": 10960 }, { - "epoch": 0.06, - "learning_rate": 0.0002916982407636306, - "loss": 0.0337, + "epoch": 0.03, + "learning_rate": 0.00029573462664050324, + "loss": 0.0464, "step": 10970 }, { - "epoch": 0.06, - "learning_rate": 0.00029169067307061665, - "loss": 0.0409, + "epoch": 0.03, + "learning_rate": 0.0002957307384241318, + "loss": 0.046, "step": 10980 }, { - "epoch": 0.06, - "learning_rate": 0.00029168310537760263, - "loss": 0.0377, + "epoch": 0.03, + "learning_rate": 0.0002957268502077603, + "loss": 0.0445, "step": 10990 }, { - "epoch": 0.06, - "learning_rate": 0.0002916755376845886, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.0002957229619913889, + "loss": 0.0443, "step": 11000 }, { - "epoch": 0.06, - "eval_cer": 0.9145003381830497, - "eval_loss": 0.027273865416646004, - "eval_runtime": 117.4476, - "eval_samples_per_second": 17.029, - "eval_steps_per_second": 4.257, + "epoch": 0.03, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.03759730979800224, + "eval_runtime": 108.4369, + "eval_samples_per_second": 18.444, + "eval_steps_per_second": 4.611, "step": 11000 }, { - "epoch": 0.06, - "learning_rate": 0.0002916679699915746, - "loss": 0.032, + "epoch": 0.03, + "learning_rate": 0.0002957190737750174, + "loss": 0.0462, "step": 11010 }, { - "epoch": 0.06, - "learning_rate": 0.0002916604022985606, - "loss": 0.0327, + "epoch": 0.03, + "learning_rate": 0.0002957151855586459, + "loss": 0.0469, "step": 11020 }, { - "epoch": 0.06, - "learning_rate": 0.00029165283460554656, - "loss": 0.0479, + "epoch": 0.03, + "learning_rate": 0.0002957112973422745, + "loss": 0.0517, "step": 11030 }, { - "epoch": 0.06, - "learning_rate": 0.0002916452669125326, - "loss": 0.0659, + "epoch": 0.03, + "learning_rate": 0.000295707409125903, + "loss": 0.0469, "step": 11040 }, { - "epoch": 0.06, - "learning_rate": 0.0002916376992195186, - "loss": 0.044, + "epoch": 0.03, + "learning_rate": 0.0002957035209095315, + "loss": 0.0513, "step": 11050 }, { - "epoch": 0.06, - "learning_rate": 0.00029163013152650456, - "loss": 0.0389, + "epoch": 0.03, + "learning_rate": 0.0002956996326931601, + "loss": 0.0538, "step": 11060 }, { - "epoch": 0.06, - "learning_rate": 0.00029162256383349054, - "loss": 0.0395, + "epoch": 0.03, + "learning_rate": 0.00029569574447678865, + "loss": 0.0448, "step": 11070 }, { - "epoch": 0.06, - "learning_rate": 0.0002916149961404765, - "loss": 0.0589, + "epoch": 0.03, + "learning_rate": 0.00029569185626041717, + "loss": 0.0473, "step": 11080 }, { - "epoch": 0.06, - "learning_rate": 0.0002916074284474625, - "loss": 0.0441, + "epoch": 0.03, + "learning_rate": 0.0002956879680440457, + "loss": 0.0456, "step": 11090 }, { - "epoch": 0.06, - "learning_rate": 0.00029159986075444854, - "loss": 0.0429, + "epoch": 0.03, + "learning_rate": 0.0002956840798276742, + "loss": 0.0501, "step": 11100 }, { - "epoch": 0.06, - "learning_rate": 0.0002915922930614345, - "loss": 0.0401, + "epoch": 0.03, + "learning_rate": 0.00029568019161130277, + "loss": 0.0632, "step": 11110 }, { - "epoch": 0.06, - "learning_rate": 0.0002915847253684205, - "loss": 0.0403, + "epoch": 0.03, + "learning_rate": 0.0002956763033949313, + "loss": 0.0435, "step": 11120 }, { - "epoch": 0.06, - "learning_rate": 0.0002915771576754065, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.00029567241517855985, + "loss": 0.0449, "step": 11130 }, { - "epoch": 0.06, - "learning_rate": 0.00029156958998239246, - "loss": 0.0355, + "epoch": 0.03, + "learning_rate": 0.00029566852696218837, + "loss": 0.0415, "step": 11140 }, { - "epoch": 0.06, - "learning_rate": 0.00029156202228937844, - "loss": 0.0404, + "epoch": 0.03, + "learning_rate": 0.00029566463874581693, + "loss": 0.0527, "step": 11150 }, { - "epoch": 0.06, - "learning_rate": 0.0002915544545963644, - "loss": 0.0396, + "epoch": 0.03, + "learning_rate": 0.00029566075052944545, + "loss": 0.0509, "step": 11160 }, { - "epoch": 0.06, - "learning_rate": 0.00029154688690335046, - "loss": 0.0428, + "epoch": 0.03, + "learning_rate": 0.00029565686231307396, + "loss": 0.0489, "step": 11170 }, { - "epoch": 0.06, - "learning_rate": 0.00029153931921033644, - "loss": 0.0404, + "epoch": 0.03, + "learning_rate": 0.0002956529740967025, + "loss": 0.0446, "step": 11180 }, { - "epoch": 0.06, - "learning_rate": 0.0002915317515173224, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.00029564908588033105, + "loss": 0.0554, "step": 11190 }, { - "epoch": 0.06, - "learning_rate": 0.0002915241838243084, - "loss": 0.0383, + "epoch": 0.03, + "learning_rate": 0.00029564519766395956, + "loss": 0.0504, "step": 11200 }, { - "epoch": 0.06, - "learning_rate": 0.0002915166161312944, - "loss": 0.0385, + "epoch": 0.03, + "learning_rate": 0.00029564130944758813, + "loss": 0.0527, "step": 11210 }, { - "epoch": 0.06, - "learning_rate": 0.00029150904843828037, - "loss": 0.0371, + "epoch": 0.03, + "learning_rate": 0.00029563742123121664, + "loss": 0.0553, "step": 11220 }, { - "epoch": 0.06, - "learning_rate": 0.0002915014807452664, - "loss": 0.0374, + "epoch": 0.03, + "learning_rate": 0.00029563353301484516, + "loss": 0.0456, "step": 11230 }, { - "epoch": 0.06, - "learning_rate": 0.0002914939130522524, - "loss": 0.0389, + "epoch": 0.03, + "learning_rate": 0.00029562964479847373, + "loss": 0.051, "step": 11240 }, { - "epoch": 0.06, - "learning_rate": 0.00029148634535923837, - "loss": 0.0397, + "epoch": 0.03, + "learning_rate": 0.00029562575658210224, + "loss": 0.0476, "step": 11250 }, { - "epoch": 0.06, - "learning_rate": 0.00029147877766622435, - "loss": 0.0373, + "epoch": 0.03, + "learning_rate": 0.0002956218683657308, + "loss": 0.0429, "step": 11260 }, { - "epoch": 0.06, - "learning_rate": 0.00029147120997321033, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.0002956179801493593, + "loss": 0.044, "step": 11270 }, { - "epoch": 0.06, - "learning_rate": 0.0002914636422801963, - "loss": 0.0383, + "epoch": 0.03, + "learning_rate": 0.0002956140919329879, + "loss": 0.0444, "step": 11280 }, { - "epoch": 0.06, - "learning_rate": 0.00029145607458718235, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.0002956102037166164, + "loss": 0.039, "step": 11290 }, { - "epoch": 0.06, - "learning_rate": 0.00029144850689416833, - "loss": 0.0377, + "epoch": 0.03, + "learning_rate": 0.0002956063155002449, + "loss": 0.0483, "step": 11300 }, { - "epoch": 0.06, - "learning_rate": 0.0002914409392011543, - "loss": 0.0394, + "epoch": 0.03, + "learning_rate": 0.00029560242728387344, + "loss": 0.0433, "step": 11310 }, { - "epoch": 0.06, - "learning_rate": 0.0002914333715081403, - "loss": 0.0408, + "epoch": 0.03, + "learning_rate": 0.000295598539067502, + "loss": 0.044, "step": 11320 }, { - "epoch": 0.06, - "learning_rate": 0.00029142580381512627, - "loss": 0.0381, + "epoch": 0.03, + "learning_rate": 0.0002955946508511305, + "loss": 0.0446, "step": 11330 }, { - "epoch": 0.06, - "learning_rate": 0.00029141823612211225, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.0002955907626347591, + "loss": 0.0466, "step": 11340 }, { - "epoch": 0.06, - "learning_rate": 0.00029141066842909824, - "loss": 0.0319, + "epoch": 0.03, + "learning_rate": 0.0002955868744183876, + "loss": 0.0429, "step": 11350 }, { - "epoch": 0.06, - "learning_rate": 0.00029140310073608427, - "loss": 0.0309, + "epoch": 0.03, + "learning_rate": 0.00029558298620201617, + "loss": 0.0442, "step": 11360 }, { - "epoch": 0.06, - "learning_rate": 0.00029139553304307025, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.0002955790979856447, + "loss": 0.0403, "step": 11370 }, { - "epoch": 0.06, - "learning_rate": 0.00029138796535005623, - "loss": 0.0346, + "epoch": 0.03, + "learning_rate": 0.0002955752097692732, + "loss": 0.0422, "step": 11380 }, { - "epoch": 0.06, - "learning_rate": 0.0002913803976570422, - "loss": 0.0753, + "epoch": 0.03, + "learning_rate": 0.0002955713215529017, + "loss": 0.0347, "step": 11390 }, { - "epoch": 0.06, - "learning_rate": 0.0002913728299640282, - "loss": 0.037, + "epoch": 0.03, + "learning_rate": 0.0002955674333365303, + "loss": 0.042, "step": 11400 }, { - "epoch": 0.06, - "learning_rate": 0.0002913652622710142, - "loss": 0.0302, + "epoch": 0.03, + "learning_rate": 0.00029556354512015885, + "loss": 0.0464, "step": 11410 }, { - "epoch": 0.06, - "learning_rate": 0.0002913576945780002, - "loss": 0.0365, + "epoch": 0.03, + "learning_rate": 0.00029555965690378737, + "loss": 0.0463, "step": 11420 }, { - "epoch": 0.06, - "learning_rate": 0.0002913501268849862, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.0002955557686874159, + "loss": 0.0424, "step": 11430 }, { - "epoch": 0.06, - "learning_rate": 0.0002913425591919722, - "loss": 0.0354, + "epoch": 0.03, + "learning_rate": 0.0002955518804710444, + "loss": 0.0439, "step": 11440 }, { - "epoch": 0.06, - "learning_rate": 0.00029133499149895816, - "loss": 0.0371, + "epoch": 0.03, + "learning_rate": 0.00029554799225467297, + "loss": 0.051, "step": 11450 }, { - "epoch": 0.06, - "learning_rate": 0.00029132742380594414, - "loss": 0.0396, + "epoch": 0.03, + "learning_rate": 0.0002955441040383015, + "loss": 0.0438, "step": 11460 }, { - "epoch": 0.06, - "learning_rate": 0.0002913198561129301, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.00029554021582193005, + "loss": 0.0456, "step": 11470 }, { - "epoch": 0.06, - "learning_rate": 0.0002913122884199161, - "loss": 0.0356, + "epoch": 0.03, + "learning_rate": 0.00029553632760555856, + "loss": 0.0438, "step": 11480 }, { - "epoch": 0.06, - "learning_rate": 0.00029130472072690214, - "loss": 0.0317, + "epoch": 0.03, + "learning_rate": 0.00029553243938918713, + "loss": 0.0413, "step": 11490 }, { - "epoch": 0.06, - "learning_rate": 0.0002912971530338881, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.00029552855117281565, + "loss": 0.0466, "step": 11500 }, { - "epoch": 0.06, - "learning_rate": 0.0002912895853408741, - "loss": 0.0338, + "epoch": 0.03, + "learning_rate": 0.00029552466295644416, + "loss": 0.0451, "step": 11510 }, { - "epoch": 0.06, - "learning_rate": 0.0002912820176478601, - "loss": 0.0393, + "epoch": 0.03, + "learning_rate": 0.0002955207747400727, + "loss": 0.0427, "step": 11520 }, { - "epoch": 0.06, - "learning_rate": 0.00029127444995484606, - "loss": 0.0316, + "epoch": 0.03, + "learning_rate": 0.00029551688652370125, + "loss": 0.0446, "step": 11530 }, { - "epoch": 0.06, - "learning_rate": 0.00029126688226183205, - "loss": 0.04, + "epoch": 0.03, + "learning_rate": 0.00029551299830732976, + "loss": 0.0362, "step": 11540 }, { - "epoch": 0.06, - "learning_rate": 0.0002912593145688181, - "loss": 0.0313, + "epoch": 0.03, + "learning_rate": 0.00029550911009095833, + "loss": 0.0376, "step": 11550 }, { - "epoch": 0.06, - "learning_rate": 0.00029125174687580406, - "loss": 0.0319, + "epoch": 0.03, + "learning_rate": 0.00029550522187458684, + "loss": 0.0351, "step": 11560 }, { - "epoch": 0.06, - "learning_rate": 0.00029124417918279004, - "loss": 0.0326, + "epoch": 0.03, + "learning_rate": 0.0002955013336582154, + "loss": 0.0348, "step": 11570 }, { - "epoch": 0.06, - "learning_rate": 0.000291236611489776, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.0002954974454418439, + "loss": 0.0353, "step": 11580 }, { - "epoch": 0.06, - "learning_rate": 0.000291229043796762, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.00029549355722547244, + "loss": 0.0361, "step": 11590 }, { - "epoch": 0.06, - "learning_rate": 0.000291221476103748, - "loss": 0.0331, + "epoch": 0.03, + "learning_rate": 0.00029548966900910096, + "loss": 0.0448, "step": 11600 }, { - "epoch": 0.06, - "learning_rate": 0.000291213908410734, - "loss": 0.033, + "epoch": 0.03, + "learning_rate": 0.0002954857807927295, + "loss": 0.0392, "step": 11610 }, { - "epoch": 0.06, - "learning_rate": 0.00029120634071772, - "loss": 0.0379, + "epoch": 0.03, + "learning_rate": 0.0002954818925763581, + "loss": 0.0391, "step": 11620 }, { - "epoch": 0.06, - "learning_rate": 0.000291198773024706, - "loss": 0.037, + "epoch": 0.03, + "learning_rate": 0.0002954780043599866, + "loss": 0.0462, "step": 11630 }, { - "epoch": 0.06, - "learning_rate": 0.00029119120533169197, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.0002954741161436151, + "loss": 0.0445, "step": 11640 }, { - "epoch": 0.06, - "learning_rate": 0.00029118363763867795, - "loss": 0.0337, + "epoch": 0.03, + "learning_rate": 0.0002954702279272437, + "loss": 0.0468, "step": 11650 }, { - "epoch": 0.06, - "learning_rate": 0.00029117606994566393, - "loss": 0.034, + "epoch": 0.03, + "learning_rate": 0.0002954663397108722, + "loss": 0.046, "step": 11660 }, { - "epoch": 0.06, - "learning_rate": 0.0002911685022526499, - "loss": 0.0362, + "epoch": 0.03, + "learning_rate": 0.0002954624514945007, + "loss": 0.0475, "step": 11670 }, { - "epoch": 0.06, - "learning_rate": 0.00029116093455963595, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.0002954585632781293, + "loss": 0.0418, "step": 11680 }, { - "epoch": 0.06, - "learning_rate": 0.00029115336686662193, - "loss": 0.0393, + "epoch": 0.03, + "learning_rate": 0.0002954546750617578, + "loss": 0.0418, "step": 11690 }, { - "epoch": 0.06, - "learning_rate": 0.0002911457991736079, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.00029545078684538637, + "loss": 0.0466, "step": 11700 }, { - "epoch": 0.06, - "learning_rate": 0.0002911382314805939, - "loss": 0.0364, + "epoch": 0.03, + "learning_rate": 0.0002954468986290149, + "loss": 0.0441, "step": 11710 }, { - "epoch": 0.06, - "learning_rate": 0.0002911306637875799, - "loss": 0.0375, + "epoch": 0.03, + "learning_rate": 0.0002954430104126434, + "loss": 0.0455, "step": 11720 }, { - "epoch": 0.06, - "learning_rate": 0.00029112309609456586, - "loss": 0.0362, + "epoch": 0.03, + "learning_rate": 0.0002954391221962719, + "loss": 0.0395, "step": 11730 }, { - "epoch": 0.06, - "learning_rate": 0.0002911155284015519, - "loss": 0.0365, + "epoch": 0.03, + "learning_rate": 0.0002954352339799005, + "loss": 0.0817, "step": 11740 }, { - "epoch": 0.06, - "learning_rate": 0.00029110796070853787, - "loss": 0.0312, + "epoch": 0.03, + "learning_rate": 0.00029543134576352905, + "loss": 0.0446, "step": 11750 }, { - "epoch": 0.06, - "learning_rate": 0.00029110039301552385, - "loss": 0.0329, + "epoch": 0.03, + "learning_rate": 0.00029542745754715757, + "loss": 0.0474, "step": 11760 }, { - "epoch": 0.06, - "learning_rate": 0.00029109282532250984, - "loss": 0.0376, + "epoch": 0.03, + "learning_rate": 0.0002954235693307861, + "loss": 0.0458, "step": 11770 }, { - "epoch": 0.06, - "learning_rate": 0.0002910852576294958, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.00029541968111441465, + "loss": 0.0439, "step": 11780 }, { - "epoch": 0.06, - "learning_rate": 0.0002910776899364818, - "loss": 0.0418, + "epoch": 0.03, + "learning_rate": 0.00029541579289804316, + "loss": 0.0462, "step": 11790 }, { - "epoch": 0.06, - "learning_rate": 0.00029107012224346783, - "loss": 0.0339, + "epoch": 0.03, + "learning_rate": 0.0002954119046816717, + "loss": 0.0359, "step": 11800 }, { - "epoch": 0.06, - "learning_rate": 0.0002910625545504538, - "loss": 0.0385, + "epoch": 0.03, + "learning_rate": 0.00029540801646530025, + "loss": 0.0424, "step": 11810 }, { - "epoch": 0.06, - "learning_rate": 0.0002910549868574398, - "loss": 0.0373, + "epoch": 0.03, + "learning_rate": 0.00029540412824892876, + "loss": 0.0409, "step": 11820 }, { - "epoch": 0.06, - "learning_rate": 0.0002910474191644258, - "loss": 0.0311, + "epoch": 0.03, + "learning_rate": 0.00029540024003255733, + "loss": 0.051, "step": 11830 }, { - "epoch": 0.06, - "learning_rate": 0.00029103985147141176, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.00029539635181618585, + "loss": 0.0454, "step": 11840 }, { - "epoch": 0.06, - "learning_rate": 0.00029103228377839774, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.00029539246359981436, + "loss": 0.0431, "step": 11850 }, { - "epoch": 0.06, - "learning_rate": 0.0002910247160853837, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.00029538857538344293, + "loss": 0.0403, "step": 11860 }, { - "epoch": 0.06, - "learning_rate": 0.00029101714839236976, - "loss": 0.0389, + "epoch": 0.03, + "learning_rate": 0.00029538468716707144, + "loss": 0.0391, "step": 11870 }, { - "epoch": 0.06, - "learning_rate": 0.00029100958069935574, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.00029538079895069996, + "loss": 0.0435, "step": 11880 }, { - "epoch": 0.06, - "learning_rate": 0.0002910020130063417, - "loss": 0.0369, + "epoch": 0.03, + "learning_rate": 0.00029537691073432853, + "loss": 0.0423, "step": 11890 }, { - "epoch": 0.06, - "learning_rate": 0.0002909944453133277, - "loss": 0.0368, + "epoch": 0.03, + "learning_rate": 0.0002953730225179571, + "loss": 0.0342, "step": 11900 }, { - "epoch": 0.06, - "learning_rate": 0.0002909868776203137, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.0002953691343015856, + "loss": 0.0467, "step": 11910 }, { - "epoch": 0.06, - "learning_rate": 0.00029097930992729967, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.0002953652460852141, + "loss": 0.0425, "step": 11920 }, { - "epoch": 0.06, - "learning_rate": 0.0002909717422342857, - "loss": 0.0364, + "epoch": 0.03, + "learning_rate": 0.00029536135786884264, + "loss": 0.0409, "step": 11930 }, { - "epoch": 0.06, - "learning_rate": 0.0002909641745412717, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.00029535746965247115, + "loss": 0.037, "step": 11940 }, { - "epoch": 0.06, - "learning_rate": 0.0002909566068482576, - "loss": 0.0367, + "epoch": 0.03, + "learning_rate": 0.0002953535814360997, + "loss": 0.0475, "step": 11950 }, { - "epoch": 0.06, - "learning_rate": 0.0002909490391552436, - "loss": 0.0375, + "epoch": 0.03, + "learning_rate": 0.0002953496932197283, + "loss": 0.0373, "step": 11960 }, { - "epoch": 0.06, - "learning_rate": 0.0002909414714622296, - "loss": 0.0364, + "epoch": 0.03, + "learning_rate": 0.0002953458050033568, + "loss": 0.0442, "step": 11970 }, { - "epoch": 0.06, - "learning_rate": 0.0002909339037692156, - "loss": 0.0374, + "epoch": 0.03, + "learning_rate": 0.0002953419167869853, + "loss": 0.0467, "step": 11980 }, { - "epoch": 0.06, - "learning_rate": 0.0002909263360762016, - "loss": 0.0334, + "epoch": 0.03, + "learning_rate": 0.0002953380285706139, + "loss": 0.0423, "step": 11990 }, { - "epoch": 0.06, - "learning_rate": 0.00029091876838318757, - "loss": 0.0286, + "epoch": 0.03, + "learning_rate": 0.0002953341403542424, + "loss": 0.0465, "step": 12000 }, { - "epoch": 0.06, - "eval_cer": 0.9145042197675514, - "eval_loss": 0.026305437088012695, - "eval_runtime": 117.4972, - "eval_samples_per_second": 17.022, - "eval_steps_per_second": 4.255, + "epoch": 0.03, + "eval_cer": 0.8818370514688489, + "eval_loss": 0.03303086385130882, + "eval_runtime": 107.7286, + "eval_samples_per_second": 18.565, + "eval_steps_per_second": 4.641, "step": 12000 }, { - "epoch": 0.06, - "learning_rate": 0.00029091120069017355, - "loss": 0.0336, + "epoch": 0.03, + "learning_rate": 0.0002953302521378709, + "loss": 0.0466, "step": 12010 }, { - "epoch": 0.06, - "learning_rate": 0.00029090363299715953, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.0002953263639214995, + "loss": 0.0404, "step": 12020 }, { - "epoch": 0.06, - "learning_rate": 0.00029089606530414557, - "loss": 0.0361, + "epoch": 0.03, + "learning_rate": 0.000295322475705128, + "loss": 0.0449, "step": 12030 }, { - "epoch": 0.06, - "learning_rate": 0.00029088849761113155, - "loss": 0.0325, + "epoch": 0.03, + "learning_rate": 0.00029531858748875657, + "loss": 0.0454, "step": 12040 }, { - "epoch": 0.06, - "learning_rate": 0.00029088092991811753, - "loss": 0.0327, + "epoch": 0.03, + "learning_rate": 0.0002953146992723851, + "loss": 0.0506, "step": 12050 }, { - "epoch": 0.06, - "learning_rate": 0.0002908733622251035, - "loss": 0.0293, + "epoch": 0.03, + "learning_rate": 0.0002953108110560136, + "loss": 0.0417, "step": 12060 }, { - "epoch": 0.06, - "learning_rate": 0.0002908657945320895, - "loss": 0.033, + "epoch": 0.03, + "learning_rate": 0.00029530692283964217, + "loss": 0.0382, "step": 12070 }, { - "epoch": 0.06, - "learning_rate": 0.0002908582268390755, + "epoch": 0.03, + "learning_rate": 0.0002953030346232707, "loss": 0.0414, "step": 12080 }, { - "epoch": 0.06, - "learning_rate": 0.00029085065914606146, - "loss": 0.0345, + "epoch": 0.03, + "learning_rate": 0.0002952991464068992, + "loss": 0.0429, "step": 12090 }, { - "epoch": 0.06, - "learning_rate": 0.0002908430914530475, - "loss": 0.0344, + "epoch": 0.03, + "learning_rate": 0.00029529525819052777, + "loss": 0.039, "step": 12100 }, { - "epoch": 0.06, - "learning_rate": 0.0002908355237600335, - "loss": 0.0329, + "epoch": 0.03, + "learning_rate": 0.00029529136997415633, + "loss": 0.0418, "step": 12110 }, { - "epoch": 0.06, - "learning_rate": 0.00029082795606701946, - "loss": 0.0307, + "epoch": 0.03, + "learning_rate": 0.00029528748175778485, + "loss": 0.0458, "step": 12120 }, { - "epoch": 0.06, - "learning_rate": 0.00029082038837400544, - "loss": 0.0321, + "epoch": 0.03, + "learning_rate": 0.00029528359354141336, + "loss": 0.0449, "step": 12130 }, { - "epoch": 0.06, - "learning_rate": 0.0002908128206809914, - "loss": 0.0359, + "epoch": 0.03, + "learning_rate": 0.0002952797053250419, + "loss": 0.0387, "step": 12140 }, { - "epoch": 0.06, - "learning_rate": 0.0002908052529879774, - "loss": 0.0324, + "epoch": 0.03, + "learning_rate": 0.00029527581710867045, + "loss": 0.0439, "step": 12150 }, { - "epoch": 0.06, - "learning_rate": 0.00029079768529496344, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.00029527192889229896, + "loss": 0.0375, "step": 12160 }, { - "epoch": 0.06, - "learning_rate": 0.0002907901176019494, - "loss": 0.0323, + "epoch": 0.03, + "learning_rate": 0.00029526804067592753, + "loss": 0.0394, "step": 12170 }, { - "epoch": 0.06, - "learning_rate": 0.0002907825499089354, - "loss": 0.0378, + "epoch": 0.03, + "learning_rate": 0.00029526415245955604, + "loss": 0.0427, "step": 12180 }, { - "epoch": 0.06, - "learning_rate": 0.0002907749822159214, - "loss": 0.0332, + "epoch": 0.03, + "learning_rate": 0.00029526026424318456, + "loss": 0.0395, "step": 12190 }, { - "epoch": 0.06, - "learning_rate": 0.00029076741452290736, - "loss": 0.0339, + "epoch": 0.03, + "learning_rate": 0.00029525637602681313, + "loss": 0.0553, "step": 12200 }, { - "epoch": 0.06, - "learning_rate": 0.00029075984682989334, - "loss": 0.0361, + "epoch": 0.03, + "learning_rate": 0.00029525248781044164, + "loss": 0.0489, "step": 12210 }, { - "epoch": 0.06, - "learning_rate": 0.0002907522791368793, - "loss": 0.0336, + "epoch": 0.03, + "learning_rate": 0.00029524859959407016, + "loss": 0.0444, "step": 12220 }, { - "epoch": 0.06, - "learning_rate": 0.00029074471144386536, - "loss": 0.0313, + "epoch": 0.03, + "learning_rate": 0.0002952447113776987, + "loss": 0.0469, "step": 12230 }, { - "epoch": 0.06, - "learning_rate": 0.00029073714375085134, - "loss": 0.0326, + "epoch": 0.03, + "learning_rate": 0.00029524082316132724, + "loss": 0.0504, "step": 12240 }, { - "epoch": 0.06, - "learning_rate": 0.0002907295760578373, - "loss": 0.0321, + "epoch": 0.03, + "learning_rate": 0.0002952369349449558, + "loss": 0.0476, "step": 12250 }, { - "epoch": 0.06, - "learning_rate": 0.0002907220083648233, - "loss": 0.0311, + "epoch": 0.03, + "learning_rate": 0.0002952330467285843, + "loss": 0.0459, "step": 12260 }, { - "epoch": 0.06, - "learning_rate": 0.0002907144406718093, - "loss": 0.0396, + "epoch": 0.03, + "learning_rate": 0.00029522915851221284, + "loss": 0.0454, "step": 12270 }, { - "epoch": 0.06, - "learning_rate": 0.00029070687297879527, - "loss": 0.0312, + "epoch": 0.03, + "learning_rate": 0.0002952252702958414, + "loss": 0.05, "step": 12280 }, { - "epoch": 0.06, - "learning_rate": 0.0002906993052857813, - "loss": 0.0345, + "epoch": 0.03, + "learning_rate": 0.0002952213820794699, + "loss": 0.0419, "step": 12290 }, { - "epoch": 0.06, - "learning_rate": 0.0002906917375927673, - "loss": 0.0336, + "epoch": 0.03, + "learning_rate": 0.0002952174938630985, + "loss": 0.0439, "step": 12300 }, { - "epoch": 0.06, - "learning_rate": 0.00029068416989975327, - "loss": 0.0433, + "epoch": 0.03, + "learning_rate": 0.000295213605646727, + "loss": 0.0415, "step": 12310 }, { - "epoch": 0.06, - "learning_rate": 0.00029067660220673925, - "loss": 0.0356, + "epoch": 0.03, + "learning_rate": 0.0002952097174303556, + "loss": 0.0414, "step": 12320 }, { - "epoch": 0.06, - "learning_rate": 0.00029066903451372523, - "loss": 0.0329, + "epoch": 0.03, + "learning_rate": 0.0002952058292139841, + "loss": 0.0408, "step": 12330 }, { - "epoch": 0.06, - "learning_rate": 0.0002906614668207112, - "loss": 0.0341, + "epoch": 0.03, + "learning_rate": 0.0002952019409976126, + "loss": 0.0384, "step": 12340 }, { - "epoch": 0.06, - "learning_rate": 0.00029065389912769725, - "loss": 0.033, + "epoch": 0.03, + "learning_rate": 0.0002951980527812411, + "loss": 0.0408, "step": 12350 }, { - "epoch": 0.06, - "learning_rate": 0.00029064633143468323, - "loss": 0.0393, + "epoch": 0.03, + "learning_rate": 0.0002951941645648697, + "loss": 0.0429, "step": 12360 }, { - "epoch": 0.06, - "learning_rate": 0.0002906387637416692, - "loss": 0.0398, + "epoch": 0.03, + "learning_rate": 0.0002951902763484982, + "loss": 0.0458, "step": 12370 }, { - "epoch": 0.06, - "learning_rate": 0.0002906311960486552, - "loss": 0.0456, + "epoch": 0.03, + "learning_rate": 0.00029518638813212677, + "loss": 0.0452, "step": 12380 }, { - "epoch": 0.06, - "learning_rate": 0.00029062362835564117, - "loss": 0.0452, + "epoch": 0.03, + "learning_rate": 0.0002951824999157553, + "loss": 0.0491, "step": 12390 }, { - "epoch": 0.06, - "learning_rate": 0.00029061606066262715, - "loss": 0.0408, + "epoch": 0.03, + "learning_rate": 0.00029517861169938385, + "loss": 0.0449, "step": 12400 }, { - "epoch": 0.06, - "learning_rate": 0.00029060849296961314, - "loss": 0.0333, + "epoch": 0.03, + "learning_rate": 0.00029517472348301237, + "loss": 0.0523, "step": 12410 }, { - "epoch": 0.06, - "learning_rate": 0.00029060092527659917, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.0002951708352666409, + "loss": 0.0483, "step": 12420 }, { - "epoch": 0.06, - "learning_rate": 0.00029059335758358515, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.0002951669470502694, + "loss": 0.0446, "step": 12430 }, { - "epoch": 0.06, - "learning_rate": 0.00029058578989057113, - "loss": 0.0361, + "epoch": 0.03, + "learning_rate": 0.00029516305883389796, + "loss": 0.0367, "step": 12440 }, { - "epoch": 0.06, - "learning_rate": 0.0002905782221975571, - "loss": 0.0384, + "epoch": 0.03, + "learning_rate": 0.00029515917061752653, + "loss": 0.0387, "step": 12450 }, { - "epoch": 0.06, - "learning_rate": 0.0002905706545045431, - "loss": 0.0354, + "epoch": 0.03, + "learning_rate": 0.00029515528240115505, + "loss": 0.0399, "step": 12460 }, { - "epoch": 0.06, - "learning_rate": 0.0002905630868115291, - "loss": 0.0404, + "epoch": 0.03, + "learning_rate": 0.00029515139418478356, + "loss": 0.0317, "step": 12470 }, { - "epoch": 0.06, - "learning_rate": 0.0002905555191185151, - "loss": 0.0301, + "epoch": 0.03, + "learning_rate": 0.0002951475059684121, + "loss": 0.0417, "step": 12480 }, { - "epoch": 0.06, - "learning_rate": 0.0002905479514255011, - "loss": 0.0325, + "epoch": 0.03, + "learning_rate": 0.00029514361775204065, + "loss": 0.0403, "step": 12490 }, { - "epoch": 0.06, - "learning_rate": 0.0002905403837324871, - "loss": 0.0303, + "epoch": 0.03, + "learning_rate": 0.00029513972953566916, + "loss": 0.0449, "step": 12500 }, { - "epoch": 0.06, - "learning_rate": 0.00029053281603947306, - "loss": 0.0342, + "epoch": 0.03, + "learning_rate": 0.00029513584131929773, + "loss": 0.0367, "step": 12510 }, { - "epoch": 0.06, - "learning_rate": 0.00029052524834645904, - "loss": 0.0303, + "epoch": 0.03, + "learning_rate": 0.00029513195310292624, + "loss": 0.041, "step": 12520 }, { - "epoch": 0.06, - "learning_rate": 0.000290517680653445, - "loss": 0.0327, + "epoch": 0.03, + "learning_rate": 0.0002951280648865548, + "loss": 0.0453, "step": 12530 }, { - "epoch": 0.06, - "learning_rate": 0.000290510112960431, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.0002951241766701833, + "loss": 0.0404, "step": 12540 }, { - "epoch": 0.06, - "learning_rate": 0.00029050254526741704, - "loss": 0.0303, + "epoch": 0.03, + "learning_rate": 0.00029512028845381184, + "loss": 0.043, "step": 12550 }, { - "epoch": 0.06, - "learning_rate": 0.000290494977574403, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.00029511640023744036, + "loss": 0.0469, "step": 12560 }, { - "epoch": 0.06, - "learning_rate": 0.000290487409881389, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.0002951125120210689, + "loss": 0.0389, "step": 12570 }, { - "epoch": 0.06, - "learning_rate": 0.000290479842188375, - "loss": 0.035, + "epoch": 0.03, + "learning_rate": 0.00029510862380469744, + "loss": 0.0423, "step": 12580 }, { - "epoch": 0.06, - "learning_rate": 0.00029047227449536096, - "loss": 0.0285, + "epoch": 0.03, + "learning_rate": 0.000295104735588326, + "loss": 0.0414, "step": 12590 }, { - "epoch": 0.06, - "learning_rate": 0.00029046470680234695, - "loss": 0.032, + "epoch": 0.03, + "learning_rate": 0.0002951008473719545, + "loss": 0.0354, "step": 12600 }, { - "epoch": 0.06, - "learning_rate": 0.000290457139109333, - "loss": 0.0345, + "epoch": 0.03, + "learning_rate": 0.0002950969591555831, + "loss": 0.0559, "step": 12610 }, { - "epoch": 0.06, - "learning_rate": 0.00029044957141631896, - "loss": 0.0381, + "epoch": 0.03, + "learning_rate": 0.0002950930709392116, + "loss": 0.0433, "step": 12620 }, { - "epoch": 0.06, - "learning_rate": 0.00029044200372330494, - "loss": 0.04, + "epoch": 0.03, + "learning_rate": 0.0002950891827228401, + "loss": 0.0452, "step": 12630 }, { - "epoch": 0.06, - "learning_rate": 0.0002904344360302909, - "loss": 0.0362, + "epoch": 0.03, + "learning_rate": 0.00029508529450646863, + "loss": 0.041, "step": 12640 }, { - "epoch": 0.06, - "learning_rate": 0.0002904268683372769, - "loss": 0.032, + "epoch": 0.03, + "learning_rate": 0.0002950814062900972, + "loss": 0.0385, "step": 12650 }, { - "epoch": 0.06, - "learning_rate": 0.0002904193006442629, - "loss": 0.0366, + "epoch": 0.03, + "learning_rate": 0.00029507751807372577, + "loss": 0.0467, "step": 12660 }, { - "epoch": 0.06, - "learning_rate": 0.0002904117329512489, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.0002950736298573543, + "loss": 0.0454, "step": 12670 }, { - "epoch": 0.06, - "learning_rate": 0.0002904041652582349, - "loss": 0.0369, + "epoch": 0.03, + "learning_rate": 0.0002950697416409828, + "loss": 0.0451, "step": 12680 }, { - "epoch": 0.06, - "learning_rate": 0.0002903965975652209, - "loss": 0.0337, + "epoch": 0.03, + "learning_rate": 0.0002950658534246113, + "loss": 0.0438, "step": 12690 }, { - "epoch": 0.06, - "learning_rate": 0.00029038902987220687, - "loss": 0.0308, + "epoch": 0.03, + "learning_rate": 0.0002950619652082399, + "loss": 0.04, "step": 12700 }, { - "epoch": 0.06, - "learning_rate": 0.00029038146217919285, - "loss": 0.0523, + "epoch": 0.03, + "learning_rate": 0.0002950580769918684, + "loss": 0.0424, "step": 12710 }, { - "epoch": 0.06, - "learning_rate": 0.00029037389448617883, - "loss": 0.0437, + "epoch": 0.03, + "learning_rate": 0.00029505418877549697, + "loss": 0.0344, "step": 12720 }, { - "epoch": 0.06, - "learning_rate": 0.0002903663267931648, - "loss": 0.0365, + "epoch": 0.03, + "learning_rate": 0.0002950503005591255, + "loss": 0.0397, "step": 12730 }, { - "epoch": 0.06, - "learning_rate": 0.00029035875910015085, - "loss": 0.0349, + "epoch": 0.03, + "learning_rate": 0.00029504641234275405, + "loss": 0.0547, "step": 12740 }, { - "epoch": 0.06, - "learning_rate": 0.00029035119140713683, - "loss": 0.0321, + "epoch": 0.03, + "learning_rate": 0.00029504252412638257, + "loss": 0.0465, "step": 12750 }, { - "epoch": 0.06, - "learning_rate": 0.0002903436237141228, - "loss": 0.0318, + "epoch": 0.03, + "learning_rate": 0.0002950386359100111, + "loss": 0.0445, "step": 12760 }, { - "epoch": 0.06, - "learning_rate": 0.0002903360560211088, - "loss": 0.0335, + "epoch": 0.03, + "learning_rate": 0.0002950347476936396, + "loss": 0.0349, "step": 12770 }, { - "epoch": 0.06, - "learning_rate": 0.0002903284883280948, - "loss": 0.0305, + "epoch": 0.03, + "learning_rate": 0.00029503085947726816, + "loss": 0.0463, "step": 12780 }, { - "epoch": 0.06, - "learning_rate": 0.00029032092063508076, - "loss": 0.0381, + "epoch": 0.03, + "learning_rate": 0.0002950269712608967, + "loss": 0.0474, "step": 12790 }, { - "epoch": 0.06, - "learning_rate": 0.0002903133529420668, - "loss": 0.0327, + "epoch": 0.03, + "learning_rate": 0.00029502308304452525, + "loss": 0.0468, "step": 12800 }, { - "epoch": 0.06, - "learning_rate": 0.00029030578524905277, - "loss": 0.0432, + "epoch": 0.03, + "learning_rate": 0.00029501919482815376, + "loss": 0.0438, "step": 12810 }, { - "epoch": 0.06, - "learning_rate": 0.00029029821755603875, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.00029501530661178233, + "loss": 0.0379, "step": 12820 }, { - "epoch": 0.06, - "learning_rate": 0.00029029064986302474, - "loss": 0.0574, + "epoch": 0.03, + "learning_rate": 0.00029501141839541084, + "loss": 0.0392, "step": 12830 }, { - "epoch": 0.06, - "learning_rate": 0.0002902830821700107, - "loss": 0.045, + "epoch": 0.03, + "learning_rate": 0.00029500753017903936, + "loss": 0.0373, "step": 12840 }, { - "epoch": 0.06, - "learning_rate": 0.0002902755144769967, - "loss": 0.0303, + "epoch": 0.03, + "learning_rate": 0.00029500364196266793, + "loss": 0.0379, "step": 12850 }, { - "epoch": 0.06, - "learning_rate": 0.00029026794678398273, - "loss": 0.0365, + "epoch": 0.03, + "learning_rate": 0.00029499975374629644, + "loss": 0.0399, "step": 12860 }, { - "epoch": 0.06, - "learning_rate": 0.0002902603790909687, - "loss": 0.0443, + "epoch": 0.03, + "learning_rate": 0.000294995865529925, + "loss": 0.0697, "step": 12870 }, { - "epoch": 0.06, - "learning_rate": 0.0002902528113979547, - "loss": 0.0384, + "epoch": 0.03, + "learning_rate": 0.0002949919773135535, + "loss": 0.044, "step": 12880 }, { - "epoch": 0.07, - "learning_rate": 0.0002902452437049407, - "loss": 0.035, + "epoch": 0.03, + "learning_rate": 0.00029498808909718204, + "loss": 0.0547, "step": 12890 }, { - "epoch": 0.07, - "learning_rate": 0.00029023767601192666, - "loss": 0.0431, + "epoch": 0.03, + "learning_rate": 0.0002949842008808106, + "loss": 0.0418, "step": 12900 }, { - "epoch": 0.07, - "learning_rate": 0.00029023010831891264, - "loss": 0.0393, + "epoch": 0.03, + "learning_rate": 0.0002949803126644391, + "loss": 0.0382, "step": 12910 }, { - "epoch": 0.07, - "learning_rate": 0.0002902225406258986, - "loss": 0.0324, + "epoch": 0.03, + "learning_rate": 0.00029497642444806764, + "loss": 0.0419, "step": 12920 }, { - "epoch": 0.07, - "learning_rate": 0.00029021497293288466, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.0002949725362316962, + "loss": 0.0372, "step": 12930 }, { - "epoch": 0.07, - "learning_rate": 0.00029020740523987064, - "loss": 0.0457, + "epoch": 0.03, + "learning_rate": 0.0002949686480153247, + "loss": 0.0394, "step": 12940 }, { - "epoch": 0.07, - "learning_rate": 0.0002901998375468566, - "loss": 0.0338, + "epoch": 0.03, + "learning_rate": 0.0002949647597989533, + "loss": 0.0428, "step": 12950 }, { - "epoch": 0.07, - "learning_rate": 0.0002901922698538426, - "loss": 0.0305, + "epoch": 0.03, + "learning_rate": 0.0002949608715825818, + "loss": 0.0479, "step": 12960 }, { - "epoch": 0.07, - "learning_rate": 0.0002901847021608286, - "loss": 0.0322, + "epoch": 0.03, + "learning_rate": 0.0002949569833662103, + "loss": 0.0435, "step": 12970 }, { - "epoch": 0.07, - "learning_rate": 0.00029017713446781457, - "loss": 0.0351, + "epoch": 0.03, + "learning_rate": 0.00029495309514983883, + "loss": 0.0362, "step": 12980 }, { - "epoch": 0.07, - "learning_rate": 0.0002901695667748006, - "loss": 0.0309, + "epoch": 0.03, + "learning_rate": 0.0002949492069334674, + "loss": 0.0365, "step": 12990 }, { - "epoch": 0.07, - "learning_rate": 0.0002901619990817866, - "loss": 0.0373, + "epoch": 0.03, + "learning_rate": 0.00029494531871709597, + "loss": 0.0465, "step": 13000 }, { - "epoch": 0.07, - "eval_cer": 0.9145245980861848, - "eval_loss": 0.026163555681705475, - "eval_runtime": 116.7644, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.03, + "eval_cer": 0.8818286536472439, + "eval_loss": 0.03343910351395607, + "eval_runtime": 107.7406, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, "step": 13000 }, { - "epoch": 0.07, - "learning_rate": 0.00029015443138877256, - "loss": 0.0371, + "epoch": 0.03, + "learning_rate": 0.0002949414305007245, + "loss": 0.041, "step": 13010 }, { - "epoch": 0.07, - "learning_rate": 0.00029014686369575855, - "loss": 0.0344, + "epoch": 0.03, + "learning_rate": 0.000294937542284353, + "loss": 0.0397, "step": 13020 }, { - "epoch": 0.07, - "learning_rate": 0.0002901392960027445, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.00029493365406798157, + "loss": 0.0431, "step": 13030 }, { - "epoch": 0.07, - "learning_rate": 0.0002901317283097305, - "loss": 0.0361, + "epoch": 0.03, + "learning_rate": 0.0002949297658516101, + "loss": 0.0354, "step": 13040 }, { - "epoch": 0.07, - "learning_rate": 0.0002901241606167165, - "loss": 0.0444, + "epoch": 0.03, + "learning_rate": 0.0002949258776352386, + "loss": 0.0428, "step": 13050 }, { - "epoch": 0.07, - "learning_rate": 0.0002901165929237025, - "loss": 0.0307, + "epoch": 0.03, + "learning_rate": 0.00029492198941886717, + "loss": 0.0375, "step": 13060 }, { - "epoch": 0.07, - "learning_rate": 0.0002901090252306885, - "loss": 0.034, + "epoch": 0.03, + "learning_rate": 0.0002949181012024957, + "loss": 0.0462, "step": 13070 }, { - "epoch": 0.07, - "learning_rate": 0.0002901014575376745, - "loss": 0.0451, + "epoch": 0.03, + "learning_rate": 0.00029491421298612425, + "loss": 0.0419, "step": 13080 }, { - "epoch": 0.07, - "learning_rate": 0.00029009388984466047, - "loss": 0.0379, + "epoch": 0.03, + "learning_rate": 0.00029491032476975276, + "loss": 0.045, "step": 13090 }, { - "epoch": 0.07, - "learning_rate": 0.00029008632215164645, - "loss": 0.0347, + "epoch": 0.03, + "learning_rate": 0.0002949064365533813, + "loss": 0.0463, "step": 13100 }, { - "epoch": 0.07, - "learning_rate": 0.00029007875445863243, - "loss": 0.0288, + "epoch": 0.03, + "learning_rate": 0.00029490254833700985, + "loss": 0.0383, "step": 13110 }, { - "epoch": 0.07, - "learning_rate": 0.00029007118676561847, - "loss": 0.038, + "epoch": 0.03, + "learning_rate": 0.00029489866012063836, + "loss": 0.0374, "step": 13120 }, { - "epoch": 0.07, - "learning_rate": 0.00029006361907260445, - "loss": 0.032, + "epoch": 0.03, + "learning_rate": 0.0002948947719042669, + "loss": 0.0405, "step": 13130 }, { - "epoch": 0.07, - "learning_rate": 0.00029005605137959043, - "loss": 0.0372, + "epoch": 0.03, + "learning_rate": 0.00029489088368789545, + "loss": 0.0439, "step": 13140 }, { - "epoch": 0.07, - "learning_rate": 0.0002900484836865764, - "loss": 0.0325, + "epoch": 0.03, + "learning_rate": 0.00029488699547152396, + "loss": 0.0428, "step": 13150 }, { - "epoch": 0.07, - "learning_rate": 0.0002900409159935624, - "loss": 0.0342, + "epoch": 0.03, + "learning_rate": 0.00029488310725515253, + "loss": 0.0398, "step": 13160 }, { - "epoch": 0.07, - "learning_rate": 0.0002900333483005484, - "loss": 0.0377, + "epoch": 0.03, + "learning_rate": 0.00029487921903878104, + "loss": 0.0404, "step": 13170 }, { - "epoch": 0.07, - "learning_rate": 0.0002900257806075344, - "loss": 0.0408, + "epoch": 0.03, + "learning_rate": 0.00029487533082240956, + "loss": 0.0507, "step": 13180 }, { - "epoch": 0.07, - "learning_rate": 0.0002900182129145204, - "loss": 0.0353, + "epoch": 0.03, + "learning_rate": 0.00029487144260603807, + "loss": 0.0511, "step": 13190 }, { - "epoch": 0.07, - "learning_rate": 0.0002900106452215063, - "loss": 0.0307, + "epoch": 0.03, + "learning_rate": 0.00029486755438966664, + "loss": 0.0424, "step": 13200 }, { - "epoch": 0.07, - "learning_rate": 0.0002900030775284923, - "loss": 0.0331, + "epoch": 0.03, + "learning_rate": 0.0002948636661732952, + "loss": 0.0466, "step": 13210 }, { - "epoch": 0.07, - "learning_rate": 0.00028999550983547834, - "loss": 0.0322, + "epoch": 0.03, + "learning_rate": 0.0002948597779569237, + "loss": 0.0463, "step": 13220 }, { - "epoch": 0.07, - "learning_rate": 0.0002899879421424643, - "loss": 0.0342, + "epoch": 0.03, + "learning_rate": 0.00029485588974055224, + "loss": 0.0382, "step": 13230 }, { - "epoch": 0.07, - "learning_rate": 0.0002899803744494503, - "loss": 0.0312, + "epoch": 0.03, + "learning_rate": 0.0002948520015241808, + "loss": 0.0396, "step": 13240 }, { - "epoch": 0.07, - "learning_rate": 0.0002899728067564363, - "loss": 0.0645, + "epoch": 0.03, + "learning_rate": 0.0002948481133078093, + "loss": 0.0512, "step": 13250 }, { - "epoch": 0.07, - "learning_rate": 0.00028996523906342226, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.00029484422509143784, + "loss": 0.0542, "step": 13260 }, { - "epoch": 0.07, - "learning_rate": 0.00028995767137040824, - "loss": 0.0671, + "epoch": 0.03, + "learning_rate": 0.0002948403368750664, + "loss": 0.0456, "step": 13270 }, { - "epoch": 0.07, - "learning_rate": 0.0002899501036773942, - "loss": 0.0338, + "epoch": 0.03, + "learning_rate": 0.0002948364486586949, + "loss": 0.0424, "step": 13280 }, { - "epoch": 0.07, - "learning_rate": 0.00028994253598438026, - "loss": 0.0341, + "epoch": 0.03, + "learning_rate": 0.0002948325604423235, + "loss": 0.0411, "step": 13290 }, { - "epoch": 0.07, - "learning_rate": 0.00028993496829136624, - "loss": 0.036, + "epoch": 0.03, + "learning_rate": 0.000294828672225952, + "loss": 0.0407, "step": 13300 }, { - "epoch": 0.07, - "learning_rate": 0.0002899274005983522, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.0002948247840095805, + "loss": 0.042, "step": 13310 }, { - "epoch": 0.07, - "learning_rate": 0.0002899198329053382, - "loss": 0.0352, + "epoch": 0.03, + "learning_rate": 0.0002948208957932091, + "loss": 0.0369, "step": 13320 }, { - "epoch": 0.07, - "learning_rate": 0.0002899122652123242, - "loss": 0.0402, + "epoch": 0.03, + "learning_rate": 0.0002948170075768376, + "loss": 0.0436, "step": 13330 }, { - "epoch": 0.07, - "learning_rate": 0.00028990469751931017, - "loss": 0.0315, + "epoch": 0.03, + "learning_rate": 0.00029481311936046617, + "loss": 0.0388, "step": 13340 }, { - "epoch": 0.07, - "learning_rate": 0.0002898971298262962, - "loss": 0.0331, + "epoch": 0.03, + "learning_rate": 0.0002948092311440947, + "loss": 0.0383, "step": 13350 }, { - "epoch": 0.07, - "learning_rate": 0.0002898895621332822, - "loss": 0.0371, + "epoch": 0.03, + "learning_rate": 0.00029480534292772325, + "loss": 0.0464, "step": 13360 }, { - "epoch": 0.07, - "learning_rate": 0.00028988199444026817, - "loss": 0.0314, + "epoch": 0.03, + "learning_rate": 0.00029480145471135177, + "loss": 0.0378, "step": 13370 }, { - "epoch": 0.07, - "learning_rate": 0.00028987442674725415, - "loss": 0.0473, + "epoch": 0.03, + "learning_rate": 0.0002947975664949803, + "loss": 0.0458, "step": 13380 }, { - "epoch": 0.07, - "learning_rate": 0.00028986685905424013, - "loss": 0.0328, + "epoch": 0.03, + "learning_rate": 0.0002947936782786088, + "loss": 0.0372, "step": 13390 }, { - "epoch": 0.07, - "learning_rate": 0.0002898592913612261, - "loss": 0.0332, + "epoch": 0.03, + "learning_rate": 0.00029478979006223737, + "loss": 0.0482, "step": 13400 }, { - "epoch": 0.07, - "learning_rate": 0.00028985172366821215, - "loss": 0.0323, + "epoch": 0.03, + "learning_rate": 0.0002947859018458659, + "loss": 0.0541, "step": 13410 }, { - "epoch": 0.07, - "learning_rate": 0.00028984415597519813, - "loss": 0.0412, + "epoch": 0.03, + "learning_rate": 0.00029478201362949445, + "loss": 0.0455, "step": 13420 }, { - "epoch": 0.07, - "learning_rate": 0.0002898365882821841, - "loss": 0.037, + "epoch": 0.03, + "learning_rate": 0.00029477812541312296, + "loss": 0.0451, "step": 13430 }, { - "epoch": 0.07, - "learning_rate": 0.0002898290205891701, - "loss": 0.0363, + "epoch": 0.03, + "learning_rate": 0.0002947742371967515, + "loss": 0.0438, "step": 13440 }, { - "epoch": 0.07, - "learning_rate": 0.00028982145289615607, - "loss": 0.0358, + "epoch": 0.03, + "learning_rate": 0.00029477034898038005, + "loss": 0.043, "step": 13450 }, { - "epoch": 0.07, - "learning_rate": 0.00028981388520314205, - "loss": 0.026, + "epoch": 0.03, + "learning_rate": 0.00029476646076400856, + "loss": 0.0399, "step": 13460 }, { - "epoch": 0.07, - "learning_rate": 0.00028980631751012804, - "loss": 0.04, + "epoch": 0.03, + "learning_rate": 0.0002947625725476371, + "loss": 0.0447, "step": 13470 }, { - "epoch": 0.07, - "learning_rate": 0.00028979874981711407, - "loss": 0.0377, + "epoch": 0.03, + "learning_rate": 0.00029475868433126564, + "loss": 0.0419, "step": 13480 }, { - "epoch": 0.07, - "learning_rate": 0.00028979118212410005, - "loss": 0.0385, + "epoch": 0.03, + "learning_rate": 0.0002947547961148942, + "loss": 0.0441, "step": 13490 }, { - "epoch": 0.07, - "learning_rate": 0.00028978361443108603, - "loss": 0.0294, + "epoch": 0.03, + "learning_rate": 0.00029475090789852273, + "loss": 0.0536, "step": 13500 }, { - "epoch": 0.07, - "learning_rate": 0.000289776046738072, - "loss": 0.0346, + "epoch": 0.04, + "learning_rate": 0.00029474701968215124, + "loss": 0.0491, "step": 13510 }, { - "epoch": 0.07, - "learning_rate": 0.000289768479045058, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.00029474313146577976, + "loss": 0.0452, "step": 13520 }, { - "epoch": 0.07, - "learning_rate": 0.000289760911352044, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002947392432494083, + "loss": 0.0517, "step": 13530 }, { - "epoch": 0.07, - "learning_rate": 0.00028975334365903, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.00029473535503303684, + "loss": 0.0495, "step": 13540 }, { - "epoch": 0.07, - "learning_rate": 0.000289745775966016, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.0002947314668166654, + "loss": 0.046, "step": 13550 }, { - "epoch": 0.07, - "learning_rate": 0.000289738208273002, - "loss": 0.0329, + "epoch": 0.04, + "learning_rate": 0.0002947275786002939, + "loss": 0.0433, "step": 13560 }, { - "epoch": 0.07, - "learning_rate": 0.00028973064057998796, - "loss": 0.0385, + "epoch": 0.04, + "learning_rate": 0.0002947236903839225, + "loss": 0.0379, "step": 13570 }, { - "epoch": 0.07, - "learning_rate": 0.00028972307288697394, - "loss": 0.0433, + "epoch": 0.04, + "learning_rate": 0.000294719802167551, + "loss": 0.0471, "step": 13580 }, { - "epoch": 0.07, - "learning_rate": 0.0002897155051939599, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002947159139511795, + "loss": 0.0474, "step": 13590 }, { - "epoch": 0.07, - "learning_rate": 0.00028970793750094596, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.00029471202573480804, + "loss": 0.0483, "step": 13600 }, { - "epoch": 0.07, - "learning_rate": 0.00028970036980793194, - "loss": 0.0551, + "epoch": 0.04, + "learning_rate": 0.0002947081375184366, + "loss": 0.0387, "step": 13610 }, { - "epoch": 0.07, - "learning_rate": 0.0002896928021149179, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.0002947042493020651, + "loss": 0.0467, "step": 13620 }, { - "epoch": 0.07, - "learning_rate": 0.0002896852344219039, - "loss": 0.0574, + "epoch": 0.04, + "learning_rate": 0.0002947003610856937, + "loss": 0.0396, "step": 13630 }, { - "epoch": 0.07, - "learning_rate": 0.0002896776667288899, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.0002946964728693222, + "loss": 0.0433, "step": 13640 }, { - "epoch": 0.07, - "learning_rate": 0.00028967009903587586, - "loss": 0.0646, + "epoch": 0.04, + "learning_rate": 0.0002946925846529507, + "loss": 0.0434, "step": 13650 }, { - "epoch": 0.07, - "learning_rate": 0.00028966253134286185, - "loss": 0.0507, + "epoch": 0.04, + "learning_rate": 0.0002946886964365793, + "loss": 0.0452, "step": 13660 }, { - "epoch": 0.07, - "learning_rate": 0.0002896549636498479, - "loss": 0.0312, + "epoch": 0.04, + "learning_rate": 0.0002946848082202078, + "loss": 0.0363, "step": 13670 }, { - "epoch": 0.07, - "learning_rate": 0.00028964739595683386, - "loss": 0.0364, + "epoch": 0.04, + "learning_rate": 0.0002946809200038363, + "loss": 0.0527, "step": 13680 }, { - "epoch": 0.07, - "learning_rate": 0.00028963982826381984, - "loss": 0.0587, + "epoch": 0.04, + "learning_rate": 0.0002946770317874649, + "loss": 0.0581, "step": 13690 }, { - "epoch": 0.07, - "learning_rate": 0.0002896322605708058, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029467314357109345, + "loss": 0.0486, "step": 13700 }, { - "epoch": 0.07, - "learning_rate": 0.0002896246928777918, - "loss": 0.04, + "epoch": 0.04, + "learning_rate": 0.00029466925535472197, + "loss": 0.0425, "step": 13710 }, { - "epoch": 0.07, - "learning_rate": 0.0002896171251847778, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.0002946653671383505, + "loss": 0.0411, "step": 13720 }, { - "epoch": 0.07, - "learning_rate": 0.0002896095574917638, - "loss": 0.0464, + "epoch": 0.04, + "learning_rate": 0.000294661478921979, + "loss": 0.0418, "step": 13730 }, { - "epoch": 0.07, - "learning_rate": 0.0002896019897987498, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.00029465759070560756, + "loss": 0.037, "step": 13740 }, { - "epoch": 0.07, - "learning_rate": 0.0002895944221057358, - "loss": 0.0395, + "epoch": 0.04, + "learning_rate": 0.0002946537024892361, + "loss": 0.0554, "step": 13750 }, { - "epoch": 0.07, - "learning_rate": 0.00028958685441272177, - "loss": 0.0346, + "epoch": 0.04, + "learning_rate": 0.00029464981427286465, + "loss": 0.0383, "step": 13760 }, { - "epoch": 0.07, - "learning_rate": 0.00028957928671970775, - "loss": 0.0306, + "epoch": 0.04, + "learning_rate": 0.00029464592605649316, + "loss": 0.0416, "step": 13770 }, { - "epoch": 0.07, - "learning_rate": 0.00028957171902669373, - "loss": 0.0604, + "epoch": 0.04, + "learning_rate": 0.00029464203784012173, + "loss": 0.0443, "step": 13780 }, { - "epoch": 0.07, - "learning_rate": 0.0002895641513336797, - "loss": 0.0405, + "epoch": 0.04, + "learning_rate": 0.00029463814962375025, + "loss": 0.0395, "step": 13790 }, { - "epoch": 0.07, - "learning_rate": 0.00028955658364066575, - "loss": 0.0467, + "epoch": 0.04, + "learning_rate": 0.00029463426140737876, + "loss": 0.0361, "step": 13800 }, { - "epoch": 0.07, - "learning_rate": 0.00028954901594765173, - "loss": 0.0378, + "epoch": 0.04, + "learning_rate": 0.0002946303731910073, + "loss": 0.0396, "step": 13810 }, { - "epoch": 0.07, - "learning_rate": 0.0002895414482546377, - "loss": 0.0559, + "epoch": 0.04, + "learning_rate": 0.00029462648497463584, + "loss": 0.0374, "step": 13820 }, { - "epoch": 0.07, - "learning_rate": 0.0002895338805616237, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029462259675826436, + "loss": 0.0421, "step": 13830 }, { - "epoch": 0.07, - "learning_rate": 0.0002895263128686097, - "loss": 0.0332, + "epoch": 0.04, + "learning_rate": 0.0002946187085418929, + "loss": 0.0422, "step": 13840 }, { - "epoch": 0.07, - "learning_rate": 0.00028951874517559566, - "loss": 0.0363, + "epoch": 0.04, + "learning_rate": 0.00029461482032552144, + "loss": 0.0475, "step": 13850 }, { - "epoch": 0.07, - "learning_rate": 0.0002895111774825817, - "loss": 0.0429, + "epoch": 0.04, + "learning_rate": 0.00029461093210915, + "loss": 0.0392, "step": 13860 }, { - "epoch": 0.07, - "learning_rate": 0.00028950360978956767, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.0002946070438927785, + "loss": 0.0419, "step": 13870 }, { - "epoch": 0.07, - "learning_rate": 0.00028949604209655365, - "loss": 0.0326, + "epoch": 0.04, + "learning_rate": 0.00029460315567640704, + "loss": 0.0433, "step": 13880 }, { - "epoch": 0.07, - "learning_rate": 0.00028948847440353964, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.0002945992674600356, + "loss": 0.0396, "step": 13890 }, { - "epoch": 0.07, - "learning_rate": 0.0002894809067105256, - "loss": 0.0299, + "epoch": 0.04, + "learning_rate": 0.0002945953792436641, + "loss": 0.0427, "step": 13900 }, { - "epoch": 0.07, - "learning_rate": 0.0002894733390175116, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.0002945914910272927, + "loss": 0.0418, "step": 13910 }, { - "epoch": 0.07, - "learning_rate": 0.00028946577132449763, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.0002945876028109212, + "loss": 0.0386, "step": 13920 }, { - "epoch": 0.07, - "learning_rate": 0.0002894582036314836, - "loss": 0.0404, + "epoch": 0.04, + "learning_rate": 0.0002945837145945497, + "loss": 0.0391, "step": 13930 }, { - "epoch": 0.07, - "learning_rate": 0.0002894506359384696, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.00029457982637817823, + "loss": 0.0392, "step": 13940 }, { - "epoch": 0.07, - "learning_rate": 0.0002894430682454556, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.0002945759381618068, + "loss": 0.0451, "step": 13950 }, { - "epoch": 0.07, - "learning_rate": 0.00028943550055244156, - "loss": 0.031, + "epoch": 0.04, + "learning_rate": 0.0002945720499454353, + "loss": 0.0427, "step": 13960 }, { - "epoch": 0.07, - "learning_rate": 0.00028942793285942754, - "loss": 0.0277, + "epoch": 0.04, + "learning_rate": 0.0002945681617290639, + "loss": 0.0389, "step": 13970 }, { - "epoch": 0.07, - "learning_rate": 0.0002894203651664135, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.0002945642735126924, + "loss": 0.0625, "step": 13980 }, { - "epoch": 0.07, - "learning_rate": 0.00028941279747339956, - "loss": 0.0318, + "epoch": 0.04, + "learning_rate": 0.00029456038529632097, + "loss": 0.0465, "step": 13990 }, { - "epoch": 0.07, - "learning_rate": 0.00028940522978038554, + "epoch": 0.04, + "learning_rate": 0.0002945564970799495, "loss": 0.0418, "step": 14000 }, { - "epoch": 0.07, - "eval_cer": 0.9144731670915385, - "eval_loss": 0.02422579564154148, - "eval_runtime": 116.5786, - "eval_samples_per_second": 17.156, - "eval_steps_per_second": 4.289, + "epoch": 0.04, + "eval_cer": 0.8818748416660718, + "eval_loss": 0.031777381896972656, + "eval_runtime": 107.6404, + "eval_samples_per_second": 18.58, + "eval_steps_per_second": 4.645, "step": 14000 }, { - "epoch": 0.07, - "learning_rate": 0.0002893976620873715, - "loss": 0.0302, + "epoch": 0.04, + "learning_rate": 0.000294552608863578, + "loss": 0.0604, "step": 14010 }, { - "epoch": 0.07, - "learning_rate": 0.0002893900943943575, - "loss": 0.0365, + "epoch": 0.04, + "learning_rate": 0.0002945487206472065, + "loss": 0.0609, "step": 14020 }, { - "epoch": 0.07, - "learning_rate": 0.0002893825267013435, - "loss": 0.0346, + "epoch": 0.04, + "learning_rate": 0.0002945448324308351, + "loss": 0.051, "step": 14030 }, { - "epoch": 0.07, - "learning_rate": 0.00028937495900832947, - "loss": 0.0365, + "epoch": 0.04, + "learning_rate": 0.00029454094421446365, + "loss": 0.0499, "step": 14040 }, { - "epoch": 0.07, - "learning_rate": 0.0002893673913153155, - "loss": 0.0297, + "epoch": 0.04, + "learning_rate": 0.00029453705599809217, + "loss": 0.0426, "step": 14050 }, { - "epoch": 0.07, - "learning_rate": 0.0002893598236223015, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.0002945331677817207, + "loss": 0.0394, "step": 14060 }, { - "epoch": 0.07, - "learning_rate": 0.00028935225592928746, - "loss": 0.0343, + "epoch": 0.04, + "learning_rate": 0.00029452927956534925, + "loss": 0.0356, "step": 14070 }, { - "epoch": 0.07, - "learning_rate": 0.00028934468823627345, - "loss": 0.0285, + "epoch": 0.04, + "learning_rate": 0.00029452539134897776, + "loss": 0.0419, "step": 14080 }, { - "epoch": 0.07, - "learning_rate": 0.00028933712054325943, - "loss": 0.0311, + "epoch": 0.04, + "learning_rate": 0.0002945215031326063, + "loss": 0.0481, "step": 14090 }, { - "epoch": 0.07, - "learning_rate": 0.0002893295528502454, - "loss": 0.0287, + "epoch": 0.04, + "learning_rate": 0.00029451761491623485, + "loss": 0.0422, "step": 14100 }, { - "epoch": 0.07, - "learning_rate": 0.00028932198515723144, - "loss": 0.034, + "epoch": 0.04, + "learning_rate": 0.00029451372669986336, + "loss": 0.0484, "step": 14110 }, { - "epoch": 0.07, - "learning_rate": 0.0002893144174642174, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.00029450983848349193, + "loss": 0.048, "step": 14120 }, { - "epoch": 0.07, - "learning_rate": 0.0002893068497712034, - "loss": 0.0444, + "epoch": 0.04, + "learning_rate": 0.00029450595026712044, + "loss": 0.048, "step": 14130 }, { - "epoch": 0.07, - "learning_rate": 0.0002892992820781894, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.00029450206205074896, + "loss": 0.0434, "step": 14140 }, { - "epoch": 0.07, - "learning_rate": 0.00028929171438517537, - "loss": 0.0286, + "epoch": 0.04, + "learning_rate": 0.0002944981738343775, + "loss": 0.048, "step": 14150 }, { - "epoch": 0.07, - "learning_rate": 0.00028928414669216135, - "loss": 0.0295, + "epoch": 0.04, + "learning_rate": 0.00029449428561800604, + "loss": 0.0381, "step": 14160 }, { - "epoch": 0.07, - "learning_rate": 0.00028927657899914733, - "loss": 0.0294, + "epoch": 0.04, + "learning_rate": 0.00029449039740163456, + "loss": 0.049, "step": 14170 }, { - "epoch": 0.07, - "learning_rate": 0.00028926901130613337, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002944865091852631, + "loss": 0.0402, "step": 14180 }, { - "epoch": 0.07, - "learning_rate": 0.00028926144361311935, - "loss": 0.035, + "epoch": 0.04, + "learning_rate": 0.00029448262096889164, + "loss": 0.0459, "step": 14190 }, { - "epoch": 0.07, - "learning_rate": 0.00028925387592010533, - "loss": 0.0372, + "epoch": 0.04, + "learning_rate": 0.0002944787327525202, + "loss": 0.0411, "step": 14200 }, { - "epoch": 0.07, - "learning_rate": 0.0002892463082270913, - "loss": 0.036, + "epoch": 0.04, + "learning_rate": 0.0002944748445361487, + "loss": 0.0427, "step": 14210 }, { - "epoch": 0.07, - "learning_rate": 0.0002892387405340773, - "loss": 0.0359, + "epoch": 0.04, + "learning_rate": 0.00029447095631977724, + "loss": 0.0468, "step": 14220 }, { - "epoch": 0.07, - "learning_rate": 0.0002892311728410633, - "loss": 0.0477, + "epoch": 0.04, + "learning_rate": 0.00029446706810340575, + "loss": 0.0364, "step": 14230 }, { - "epoch": 0.07, - "learning_rate": 0.0002892236051480493, - "loss": 0.0356, + "epoch": 0.04, + "learning_rate": 0.0002944631798870343, + "loss": 0.0475, "step": 14240 }, { - "epoch": 0.07, - "learning_rate": 0.0002892160374550353, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002944592916706629, + "loss": 0.0434, "step": 14250 }, { - "epoch": 0.07, - "learning_rate": 0.0002892084697620213, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.0002944554034542914, + "loss": 0.0376, "step": 14260 }, { - "epoch": 0.07, - "learning_rate": 0.00028920090206900726, - "loss": 0.0356, + "epoch": 0.04, + "learning_rate": 0.0002944515152379199, + "loss": 0.0427, "step": 14270 }, { - "epoch": 0.07, - "learning_rate": 0.00028919333437599324, - "loss": 0.0336, + "epoch": 0.04, + "learning_rate": 0.0002944476270215485, + "loss": 0.0383, "step": 14280 }, { - "epoch": 0.07, - "learning_rate": 0.0002891857666829792, - "loss": 0.053, + "epoch": 0.04, + "learning_rate": 0.000294443738805177, + "loss": 0.0546, "step": 14290 }, { - "epoch": 0.07, - "learning_rate": 0.0002891781989899652, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002944398505888055, + "loss": 0.0434, "step": 14300 }, { - "epoch": 0.07, - "learning_rate": 0.00028917063129695124, - "loss": 0.0358, + "epoch": 0.04, + "learning_rate": 0.0002944359623724341, + "loss": 0.042, "step": 14310 }, { - "epoch": 0.07, - "learning_rate": 0.0002891630636039372, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.0002944320741560626, + "loss": 0.0387, "step": 14320 }, { - "epoch": 0.07, - "learning_rate": 0.0002891554959109232, - "loss": 0.0473, + "epoch": 0.04, + "learning_rate": 0.00029442818593969117, + "loss": 0.0431, "step": 14330 }, { - "epoch": 0.07, - "learning_rate": 0.0002891479282179092, - "loss": 0.0392, + "epoch": 0.04, + "learning_rate": 0.0002944242977233197, + "loss": 0.0669, "step": 14340 }, { - "epoch": 0.07, - "learning_rate": 0.00028914036052489516, - "loss": 0.0394, + "epoch": 0.04, + "learning_rate": 0.0002944204095069482, + "loss": 0.0388, "step": 14350 }, { - "epoch": 0.07, - "learning_rate": 0.00028913279283188114, - "loss": 0.0356, + "epoch": 0.04, + "learning_rate": 0.00029441652129057677, + "loss": 0.0402, "step": 14360 }, { - "epoch": 0.07, - "learning_rate": 0.0002891252251388672, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.0002944126330742053, + "loss": 0.0415, "step": 14370 }, { - "epoch": 0.07, - "learning_rate": 0.00028911765744585316, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.0002944087448578338, + "loss": 0.038, "step": 14380 }, { - "epoch": 0.07, - "learning_rate": 0.00028911008975283914, - "loss": 0.0364, + "epoch": 0.04, + "learning_rate": 0.00029440485664146236, + "loss": 0.0456, "step": 14390 }, { - "epoch": 0.07, - "learning_rate": 0.0002891025220598251, - "loss": 0.0495, + "epoch": 0.04, + "learning_rate": 0.0002944009684250909, + "loss": 0.0446, "step": 14400 }, { - "epoch": 0.07, - "learning_rate": 0.0002890949543668111, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.00029439708020871945, + "loss": 0.0364, "step": 14410 }, { - "epoch": 0.07, - "learning_rate": 0.0002890873866737971, - "loss": 0.0472, + "epoch": 0.04, + "learning_rate": 0.00029439319199234796, + "loss": 0.0492, "step": 14420 }, { - "epoch": 0.07, - "learning_rate": 0.0002890798189807831, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002943893037759765, + "loss": 0.0389, "step": 14430 }, { - "epoch": 0.07, - "learning_rate": 0.0002890722512877691, - "loss": 0.0442, + "epoch": 0.04, + "learning_rate": 0.00029438541555960505, + "loss": 0.0368, "step": 14440 }, { - "epoch": 0.07, - "learning_rate": 0.0002890646835947551, - "loss": 0.0373, + "epoch": 0.04, + "learning_rate": 0.00029438152734323356, + "loss": 0.0439, "step": 14450 }, { - "epoch": 0.07, - "learning_rate": 0.000289057115901741, - "loss": 0.0391, + "epoch": 0.04, + "learning_rate": 0.00029437763912686213, + "loss": 0.0417, "step": 14460 }, { - "epoch": 0.07, - "learning_rate": 0.00028904954820872705, - "loss": 0.0436, + "epoch": 0.04, + "learning_rate": 0.00029437375091049064, + "loss": 0.0384, "step": 14470 }, { - "epoch": 0.07, - "learning_rate": 0.00028904198051571303, - "loss": 0.037, + "epoch": 0.04, + "learning_rate": 0.00029436986269411916, + "loss": 0.0442, "step": 14480 }, { - "epoch": 0.07, - "learning_rate": 0.000289034412822699, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.0002943659744777477, + "loss": 0.0466, "step": 14490 }, { - "epoch": 0.07, - "learning_rate": 0.000289026845129685, - "loss": 0.0468, + "epoch": 0.04, + "learning_rate": 0.00029436208626137624, + "loss": 0.0407, "step": 14500 }, { - "epoch": 0.07, - "learning_rate": 0.000289019277436671, - "loss": 0.0449, + "epoch": 0.04, + "learning_rate": 0.00029435819804500476, + "loss": 0.0419, "step": 14510 }, { - "epoch": 0.07, - "learning_rate": 0.00028901170974365695, - "loss": 0.035, + "epoch": 0.04, + "learning_rate": 0.0002943543098286333, + "loss": 0.0443, "step": 14520 }, { - "epoch": 0.07, - "learning_rate": 0.00028900414205064294, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.0002943504216122619, + "loss": 0.0698, "step": 14530 }, { - "epoch": 0.07, - "learning_rate": 0.00028899657435762897, - "loss": 0.0312, + "epoch": 0.04, + "learning_rate": 0.0002943465333958904, + "loss": 0.043, "step": 14540 }, { - "epoch": 0.07, - "learning_rate": 0.00028898900666461495, - "loss": 0.038, + "epoch": 0.04, + "learning_rate": 0.0002943426451795189, + "loss": 0.0491, "step": 14550 }, { - "epoch": 0.07, - "learning_rate": 0.00028898143897160093, - "loss": 0.0329, + "epoch": 0.04, + "learning_rate": 0.00029433875696314744, + "loss": 0.0379, "step": 14560 }, { - "epoch": 0.07, - "learning_rate": 0.0002889738712785869, - "loss": 0.0311, + "epoch": 0.04, + "learning_rate": 0.000294334868746776, + "loss": 0.0411, "step": 14570 }, { - "epoch": 0.07, - "learning_rate": 0.0002889663035855729, - "loss": 0.0367, + "epoch": 0.04, + "learning_rate": 0.0002943309805304045, + "loss": 0.0388, "step": 14580 }, { - "epoch": 0.07, - "learning_rate": 0.0002889587358925589, - "loss": 0.0503, + "epoch": 0.04, + "learning_rate": 0.0002943270923140331, + "loss": 0.0518, "step": 14590 }, { - "epoch": 0.07, - "learning_rate": 0.0002889511681995449, - "loss": 0.0425, + "epoch": 0.04, + "learning_rate": 0.0002943232040976616, + "loss": 0.0646, "step": 14600 }, { - "epoch": 0.07, - "learning_rate": 0.0002889436005065309, - "loss": 0.0403, + "epoch": 0.04, + "learning_rate": 0.00029431931588129017, + "loss": 0.0381, "step": 14610 }, { - "epoch": 0.07, - "learning_rate": 0.0002889360328135169, - "loss": 0.0389, + "epoch": 0.04, + "learning_rate": 0.0002943154276649187, + "loss": 0.039, "step": 14620 }, { - "epoch": 0.07, - "learning_rate": 0.00028892846512050286, - "loss": 0.0358, + "epoch": 0.04, + "learning_rate": 0.0002943115394485472, + "loss": 0.038, "step": 14630 }, { - "epoch": 0.07, - "learning_rate": 0.00028892089742748884, - "loss": 0.0336, + "epoch": 0.04, + "learning_rate": 0.0002943076512321757, + "loss": 0.0462, "step": 14640 }, { - "epoch": 0.07, - "learning_rate": 0.0002889133297344748, - "loss": 0.0622, + "epoch": 0.04, + "learning_rate": 0.0002943037630158043, + "loss": 0.042, "step": 14650 }, { - "epoch": 0.07, - "learning_rate": 0.00028890576204146086, - "loss": 0.0343, + "epoch": 0.04, + "learning_rate": 0.0002942998747994328, + "loss": 0.0402, "step": 14660 }, { - "epoch": 0.07, - "learning_rate": 0.00028889819434844684, - "loss": 0.0374, + "epoch": 0.04, + "learning_rate": 0.00029429598658306137, + "loss": 0.0367, "step": 14670 }, { - "epoch": 0.07, - "learning_rate": 0.0002888906266554328, - "loss": 0.0478, + "epoch": 0.04, + "learning_rate": 0.0002942920983666899, + "loss": 0.0437, "step": 14680 }, { - "epoch": 0.07, - "learning_rate": 0.0002888830589624188, - "loss": 0.0415, + "epoch": 0.04, + "learning_rate": 0.0002942882101503184, + "loss": 0.0369, "step": 14690 }, { - "epoch": 0.07, - "learning_rate": 0.0002888754912694048, - "loss": 0.0346, + "epoch": 0.04, + "learning_rate": 0.00029428432193394697, + "loss": 0.0406, "step": 14700 }, { - "epoch": 0.07, - "learning_rate": 0.00028886792357639076, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.0002942804337175755, + "loss": 0.0371, "step": 14710 }, { - "epoch": 0.07, - "learning_rate": 0.00028886035588337675, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.000294276545501204, + "loss": 0.0411, "step": 14720 }, { - "epoch": 0.07, - "learning_rate": 0.0002888527881903628, - "loss": 0.0433, + "epoch": 0.04, + "learning_rate": 0.00029427265728483256, + "loss": 0.0397, "step": 14730 }, { - "epoch": 0.07, - "learning_rate": 0.00028884522049734876, - "loss": 0.03, + "epoch": 0.04, + "learning_rate": 0.00029426876906846113, + "loss": 0.043, "step": 14740 }, { - "epoch": 0.07, - "learning_rate": 0.00028883765280433474, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.00029426488085208965, + "loss": 0.0391, "step": 14750 }, { - "epoch": 0.07, - "learning_rate": 0.0002888300851113207, + "epoch": 0.04, + "learning_rate": 0.00029426099263571816, "loss": 0.0369, "step": 14760 }, { - "epoch": 0.07, - "learning_rate": 0.0002888225174183067, - "loss": 0.0439, - "step": 14770 + "epoch": 0.04, + "learning_rate": 0.0002942571044193467, + "loss": 0.0438, + "step": 14770 }, { - "epoch": 0.07, - "learning_rate": 0.0002888149497252927, - "loss": 0.0368, + "epoch": 0.04, + "learning_rate": 0.00029425321620297524, + "loss": 0.05, "step": 14780 }, { - "epoch": 0.07, - "learning_rate": 0.0002888073820322787, - "loss": 0.0311, + "epoch": 0.04, + "learning_rate": 0.00029424932798660376, + "loss": 0.0418, "step": 14790 }, { - "epoch": 0.07, - "learning_rate": 0.0002887998143392647, - "loss": 0.0356, + "epoch": 0.04, + "learning_rate": 0.00029424543977023233, + "loss": 0.0398, "step": 14800 }, { - "epoch": 0.07, - "learning_rate": 0.0002887922466462507, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029424155155386084, + "loss": 0.0422, "step": 14810 }, { - "epoch": 0.07, - "learning_rate": 0.00028878467895323667, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.0002942376633374894, + "loss": 0.039, "step": 14820 }, { - "epoch": 0.07, - "learning_rate": 0.00028877711126022265, - "loss": 0.037, + "epoch": 0.04, + "learning_rate": 0.0002942337751211179, + "loss": 0.0404, "step": 14830 }, { - "epoch": 0.07, - "learning_rate": 0.00028876954356720863, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.00029422988690474644, + "loss": 0.0349, "step": 14840 }, { - "epoch": 0.07, - "learning_rate": 0.0002887619758741946, - "loss": 0.0329, + "epoch": 0.04, + "learning_rate": 0.00029422599868837495, + "loss": 0.0414, "step": 14850 }, { - "epoch": 0.07, - "learning_rate": 0.00028875440818118065, - "loss": 0.0359, + "epoch": 0.04, + "learning_rate": 0.0002942221104720035, + "loss": 0.0419, "step": 14860 }, { - "epoch": 0.08, - "learning_rate": 0.00028874684048816663, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.00029421822225563204, + "loss": 0.0429, "step": 14870 }, { - "epoch": 0.08, - "learning_rate": 0.0002887392727951526, - "loss": 0.0534, + "epoch": 0.04, + "learning_rate": 0.0002942143340392606, + "loss": 0.0405, "step": 14880 }, { - "epoch": 0.08, - "learning_rate": 0.0002887317051021386, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.0002942104458228891, + "loss": 0.0481, "step": 14890 }, { - "epoch": 0.08, - "learning_rate": 0.0002887241374091246, - "loss": 0.0433, + "epoch": 0.04, + "learning_rate": 0.00029420655760651764, + "loss": 0.0373, "step": 14900 }, { - "epoch": 0.08, - "learning_rate": 0.00028871656971611056, - "loss": 0.0429, + "epoch": 0.04, + "learning_rate": 0.0002942026693901462, + "loss": 0.0443, "step": 14910 }, { - "epoch": 0.08, - "learning_rate": 0.0002887090020230966, - "loss": 0.0369, + "epoch": 0.04, + "learning_rate": 0.0002941987811737747, + "loss": 0.0433, "step": 14920 }, { - "epoch": 0.08, - "learning_rate": 0.0002887014343300826, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.0002941948929574033, + "loss": 0.0481, "step": 14930 }, { - "epoch": 0.08, - "learning_rate": 0.00028869386663706855, - "loss": 0.0352, + "epoch": 0.04, + "learning_rate": 0.0002941910047410318, + "loss": 0.0463, "step": 14940 }, { - "epoch": 0.08, - "learning_rate": 0.00028868629894405454, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029418711652466037, + "loss": 0.0501, "step": 14950 }, { - "epoch": 0.08, - "learning_rate": 0.0002886787312510405, - "loss": 0.0314, + "epoch": 0.04, + "learning_rate": 0.0002941832283082889, + "loss": 0.0442, "step": 14960 }, { - "epoch": 0.08, - "learning_rate": 0.0002886711635580265, - "loss": 0.0342, + "epoch": 0.04, + "learning_rate": 0.0002941793400919174, + "loss": 0.0422, "step": 14970 }, { - "epoch": 0.08, - "learning_rate": 0.00028866359586501253, - "loss": 0.0588, + "epoch": 0.04, + "learning_rate": 0.0002941754518755459, + "loss": 0.0515, "step": 14980 }, { - "epoch": 0.08, - "learning_rate": 0.0002886560281719985, - "loss": 0.0336, + "epoch": 0.04, + "learning_rate": 0.0002941715636591745, + "loss": 0.0412, "step": 14990 }, { - "epoch": 0.08, - "learning_rate": 0.0002886484604789845, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.000294167675442803, + "loss": 0.0378, "step": 15000 }, { - "epoch": 0.08, - "eval_cer": 0.9145216868978086, - "eval_loss": 0.025017283856868744, - "eval_runtime": 116.429, - "eval_samples_per_second": 17.178, - "eval_steps_per_second": 4.294, + "epoch": 0.04, + "eval_cer": 0.8818076590932312, + "eval_loss": 0.03137202188372612, + "eval_runtime": 107.683, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, "step": 15000 }, { - "epoch": 0.08, - "learning_rate": 0.0002886408927859705, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.00029416378722643157, + "loss": 0.0459, "step": 15010 }, { - "epoch": 0.08, - "learning_rate": 0.00028863332509295646, - "loss": 0.0274, + "epoch": 0.04, + "learning_rate": 0.0002941598990100601, + "loss": 0.0344, "step": 15020 }, { - "epoch": 0.08, - "learning_rate": 0.00028862575739994244, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.00029415601079368865, + "loss": 0.0418, "step": 15030 }, { - "epoch": 0.08, - "learning_rate": 0.0002886181897069284, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029415212257731716, + "loss": 0.0395, "step": 15040 }, { - "epoch": 0.08, - "learning_rate": 0.00028861062201391446, - "loss": 0.0358, + "epoch": 0.04, + "learning_rate": 0.0002941482343609457, + "loss": 0.0395, "step": 15050 }, { - "epoch": 0.08, - "learning_rate": 0.00028860305432090044, - "loss": 0.0312, + "epoch": 0.04, + "learning_rate": 0.0002941443461445742, + "loss": 0.0445, "step": 15060 }, { - "epoch": 0.08, - "learning_rate": 0.0002885954866278864, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.00029414045792820276, + "loss": 0.0463, "step": 15070 }, { - "epoch": 0.08, - "learning_rate": 0.0002885879189348724, - "loss": 0.0374, + "epoch": 0.04, + "learning_rate": 0.00029413656971183133, + "loss": 0.0415, "step": 15080 }, { - "epoch": 0.08, - "learning_rate": 0.0002885803512418584, - "loss": 0.0311, + "epoch": 0.04, + "learning_rate": 0.00029413268149545985, + "loss": 0.044, "step": 15090 }, { - "epoch": 0.08, - "learning_rate": 0.00028857278354884437, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.00029412879327908836, + "loss": 0.0357, "step": 15100 }, { - "epoch": 0.08, - "learning_rate": 0.0002885652158558304, - "loss": 0.0314, + "epoch": 0.04, + "learning_rate": 0.00029412490506271693, + "loss": 0.0415, "step": 15110 }, { - "epoch": 0.08, - "learning_rate": 0.0002885576481628164, - "loss": 0.0334, + "epoch": 0.04, + "learning_rate": 0.00029412101684634544, + "loss": 0.0421, "step": 15120 }, { - "epoch": 0.08, - "learning_rate": 0.00028855008046980236, - "loss": 0.0437, + "epoch": 0.04, + "learning_rate": 0.00029411712862997396, + "loss": 0.0426, "step": 15130 }, { - "epoch": 0.08, - "learning_rate": 0.00028854251277678835, - "loss": 0.0346, + "epoch": 0.04, + "learning_rate": 0.0002941132404136025, + "loss": 0.0444, "step": 15140 }, { - "epoch": 0.08, - "learning_rate": 0.00028853494508377433, - "loss": 0.0357, + "epoch": 0.04, + "learning_rate": 0.00029410935219723104, + "loss": 0.0384, "step": 15150 }, { - "epoch": 0.08, - "learning_rate": 0.0002885273773907603, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.0002941054639808596, + "loss": 0.0538, "step": 15160 }, { - "epoch": 0.08, - "learning_rate": 0.00028851980969774634, - "loss": 0.0358, + "epoch": 0.04, + "learning_rate": 0.0002941015757644881, + "loss": 0.0441, "step": 15170 }, { - "epoch": 0.08, - "learning_rate": 0.0002885122420047323, - "loss": 0.0401, + "epoch": 0.04, + "learning_rate": 0.00029409768754811664, + "loss": 0.0439, "step": 15180 }, { - "epoch": 0.08, - "learning_rate": 0.0002885046743117183, - "loss": 0.0337, + "epoch": 0.04, + "learning_rate": 0.00029409379933174515, + "loss": 0.0468, "step": 15190 }, { - "epoch": 0.08, - "learning_rate": 0.0002884971066187043, - "loss": 0.0365, + "epoch": 0.04, + "learning_rate": 0.0002940899111153737, + "loss": 0.0479, "step": 15200 }, { - "epoch": 0.08, - "learning_rate": 0.00028848953892569027, - "loss": 0.0399, + "epoch": 0.04, + "learning_rate": 0.00029408602289900224, + "loss": 0.0427, "step": 15210 }, { - "epoch": 0.08, - "learning_rate": 0.00028848197123267625, - "loss": 0.0353, + "epoch": 0.04, + "learning_rate": 0.0002940821346826308, + "loss": 0.0373, "step": 15220 }, { - "epoch": 0.08, - "learning_rate": 0.00028847440353966223, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002940782464662593, + "loss": 0.0442, "step": 15230 }, { - "epoch": 0.08, - "learning_rate": 0.00028846683584664827, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.0002940743582498879, + "loss": 0.0475, "step": 15240 }, { - "epoch": 0.08, - "learning_rate": 0.00028845926815363425, - "loss": 0.0326, + "epoch": 0.04, + "learning_rate": 0.0002940704700335164, + "loss": 0.0501, "step": 15250 }, { - "epoch": 0.08, - "learning_rate": 0.00028845170046062023, - "loss": 0.0296, + "epoch": 0.04, + "learning_rate": 0.0002940665818171449, + "loss": 0.0431, "step": 15260 }, { - "epoch": 0.08, - "learning_rate": 0.0002884441327676062, - "loss": 0.033, + "epoch": 0.04, + "learning_rate": 0.00029406269360077343, + "loss": 0.0407, "step": 15270 }, { - "epoch": 0.08, - "learning_rate": 0.0002884365650745922, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.000294058805384402, + "loss": 0.0506, "step": 15280 }, { - "epoch": 0.08, - "learning_rate": 0.0002884289973815782, - "loss": 0.0502, + "epoch": 0.04, + "learning_rate": 0.00029405491716803057, + "loss": 0.0416, "step": 15290 }, { - "epoch": 0.08, - "learning_rate": 0.0002884214296885642, - "loss": 0.0442, + "epoch": 0.04, + "learning_rate": 0.0002940510289516591, + "loss": 0.0431, "step": 15300 }, { - "epoch": 0.08, - "learning_rate": 0.0002884138619955502, - "loss": 0.0323, + "epoch": 0.04, + "learning_rate": 0.0002940471407352876, + "loss": 0.0457, "step": 15310 }, { - "epoch": 0.08, - "learning_rate": 0.0002884062943025362, - "loss": 0.0361, + "epoch": 0.04, + "learning_rate": 0.00029404325251891617, + "loss": 0.0432, "step": 15320 }, { - "epoch": 0.08, - "learning_rate": 0.00028839872660952216, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.0002940393643025447, + "loss": 0.0412, "step": 15330 }, { - "epoch": 0.08, - "learning_rate": 0.00028839115891650814, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002940354760861732, + "loss": 0.0355, "step": 15340 }, { - "epoch": 0.08, - "learning_rate": 0.0002883835912234941, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.00029403158786980177, + "loss": 0.0439, "step": 15350 }, { - "epoch": 0.08, - "learning_rate": 0.0002883760235304801, - "loss": 0.0329, + "epoch": 0.04, + "learning_rate": 0.0002940276996534303, + "loss": 0.0419, "step": 15360 }, { - "epoch": 0.08, - "learning_rate": 0.00028836845583746614, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029402381143705885, + "loss": 0.0392, "step": 15370 }, { - "epoch": 0.08, - "learning_rate": 0.0002883608881444521, - "loss": 0.038, + "epoch": 0.04, + "learning_rate": 0.00029401992322068736, + "loss": 0.0348, "step": 15380 }, { - "epoch": 0.08, - "learning_rate": 0.0002883533204514381, - "loss": 0.0385, + "epoch": 0.04, + "learning_rate": 0.0002940160350043159, + "loss": 0.0445, "step": 15390 }, { - "epoch": 0.08, - "learning_rate": 0.0002883457527584241, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.0002940121467879444, + "loss": 0.0373, "step": 15400 }, { - "epoch": 0.08, - "learning_rate": 0.00028833818506541006, - "loss": 0.0344, + "epoch": 0.04, + "learning_rate": 0.00029400825857157296, + "loss": 0.0367, "step": 15410 }, { - "epoch": 0.08, - "learning_rate": 0.00028833061737239604, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002940043703552015, + "loss": 0.0375, "step": 15420 }, { - "epoch": 0.08, - "learning_rate": 0.0002883230496793821, - "loss": 0.0305, + "epoch": 0.04, + "learning_rate": 0.00029400048213883004, + "loss": 0.0389, "step": 15430 }, { - "epoch": 0.08, - "learning_rate": 0.00028831548198636806, - "loss": 0.0391, + "epoch": 0.04, + "learning_rate": 0.00029399659392245856, + "loss": 0.036, "step": 15440 }, { - "epoch": 0.08, - "learning_rate": 0.00028830791429335404, - "loss": 0.0369, + "epoch": 0.04, + "learning_rate": 0.00029399270570608713, + "loss": 0.0451, "step": 15450 }, { - "epoch": 0.08, - "learning_rate": 0.00028830034660034, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.00029398881748971564, + "loss": 0.0406, "step": 15460 }, { - "epoch": 0.08, - "learning_rate": 0.000288292778907326, - "loss": 0.0283, + "epoch": 0.04, + "learning_rate": 0.00029398492927334416, + "loss": 0.055, "step": 15470 }, { - "epoch": 0.08, - "learning_rate": 0.000288285211214312, - "loss": 0.0287, + "epoch": 0.04, + "learning_rate": 0.0002939810410569727, + "loss": 0.0409, "step": 15480 }, { - "epoch": 0.08, - "learning_rate": 0.000288277643521298, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.00029397715284060124, + "loss": 0.0401, "step": 15490 }, { - "epoch": 0.08, - "learning_rate": 0.000288270075828284, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.0002939732646242298, + "loss": 0.0379, "step": 15500 }, { - "epoch": 0.08, - "learning_rate": 0.00028826250813527, - "loss": 0.0343, + "epoch": 0.04, + "learning_rate": 0.0002939693764078583, + "loss": 0.0387, "step": 15510 }, { - "epoch": 0.08, - "learning_rate": 0.00028825494044225597, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.00029396548819148684, + "loss": 0.0393, "step": 15520 }, { - "epoch": 0.08, - "learning_rate": 0.00028824737274924195, - "loss": 0.0358, + "epoch": 0.04, + "learning_rate": 0.0002939615999751154, + "loss": 0.0347, "step": 15530 }, { - "epoch": 0.08, - "learning_rate": 0.00028823980505622793, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.0002939577117587439, + "loss": 0.0438, "step": 15540 }, { - "epoch": 0.08, - "learning_rate": 0.0002882322373632139, - "loss": 0.0307, + "epoch": 0.04, + "learning_rate": 0.00029395382354237244, + "loss": 0.0399, "step": 15550 }, { - "epoch": 0.08, - "learning_rate": 0.00028822466967019995, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.000293949935326001, + "loss": 0.0379, "step": 15560 }, { - "epoch": 0.08, - "learning_rate": 0.00028821710197718593, - "loss": 0.0351, + "epoch": 0.04, + "learning_rate": 0.0002939460471096295, + "loss": 0.0491, "step": 15570 }, { - "epoch": 0.08, - "learning_rate": 0.0002882095342841719, - "loss": 0.036, + "epoch": 0.04, + "learning_rate": 0.0002939421588932581, + "loss": 0.0469, "step": 15580 }, { - "epoch": 0.08, - "learning_rate": 0.0002882019665911579, - "loss": 0.0309, + "epoch": 0.04, + "learning_rate": 0.0002939382706768866, + "loss": 0.0389, "step": 15590 }, { - "epoch": 0.08, - "learning_rate": 0.00028819439889814387, - "loss": 0.0341, + "epoch": 0.04, + "learning_rate": 0.0002939343824605151, + "loss": 0.0356, "step": 15600 }, { - "epoch": 0.08, - "learning_rate": 0.00028818683120512985, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002939304942441437, + "loss": 0.0429, "step": 15610 }, { - "epoch": 0.08, - "learning_rate": 0.0002881792635121159, - "loss": 0.0377, + "epoch": 0.04, + "learning_rate": 0.0002939266060277722, + "loss": 0.0406, "step": 15620 }, { - "epoch": 0.08, - "learning_rate": 0.00028817169581910187, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.00029392271781140077, + "loss": 0.0413, "step": 15630 }, { - "epoch": 0.08, - "learning_rate": 0.00028816412812608785, - "loss": 0.0298, + "epoch": 0.04, + "learning_rate": 0.0002939188295950293, + "loss": 0.0406, "step": 15640 }, { - "epoch": 0.08, - "learning_rate": 0.00028815656043307383, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002939149413786578, + "loss": 0.0394, "step": 15650 }, { - "epoch": 0.08, - "learning_rate": 0.0002881489927400598, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.00029391105316228637, + "loss": 0.0466, "step": 15660 }, { - "epoch": 0.08, - "learning_rate": 0.0002881414250470458, - "loss": 0.0334, + "epoch": 0.04, + "learning_rate": 0.0002939071649459149, + "loss": 0.0357, "step": 15670 }, { - "epoch": 0.08, - "learning_rate": 0.00028813385735403183, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002939032767295434, + "loss": 0.0417, "step": 15680 }, { - "epoch": 0.08, - "learning_rate": 0.0002881262896610178, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.00029389938851317196, + "loss": 0.0405, "step": 15690 }, { - "epoch": 0.08, - "learning_rate": 0.0002881187219680038, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.0002938955002968005, + "loss": 0.0324, "step": 15700 }, { - "epoch": 0.08, - "learning_rate": 0.0002881111542749898, - "loss": 0.0326, + "epoch": 0.04, + "learning_rate": 0.00029389161208042905, + "loss": 0.0376, "step": 15710 }, { - "epoch": 0.08, - "learning_rate": 0.00028810358658197576, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.00029388772386405756, + "loss": 0.0348, "step": 15720 }, { - "epoch": 0.08, - "learning_rate": 0.00028809601888896174, - "loss": 0.0351, + "epoch": 0.04, + "learning_rate": 0.0002938838356476861, + "loss": 0.0417, "step": 15730 }, { - "epoch": 0.08, - "learning_rate": 0.0002880884511959477, - "loss": 0.0318, + "epoch": 0.04, + "learning_rate": 0.00029387994743131465, + "loss": 0.042, "step": 15740 }, { - "epoch": 0.08, - "learning_rate": 0.0002880808835029337, - "loss": 0.0348, + "epoch": 0.04, + "learning_rate": 0.00029387605921494316, + "loss": 0.037, "step": 15750 }, { - "epoch": 0.08, - "learning_rate": 0.0002880733158099197, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002938721709985717, + "loss": 0.0845, "step": 15760 }, { - "epoch": 0.08, - "learning_rate": 0.00028806574811690566, - "loss": 0.0285, + "epoch": 0.04, + "learning_rate": 0.00029386828278220024, + "loss": 0.0469, "step": 15770 }, { - "epoch": 0.08, - "learning_rate": 0.00028805818042389165, - "loss": 0.0318, + "epoch": 0.04, + "learning_rate": 0.0002938643945658288, + "loss": 0.048, "step": 15780 }, { - "epoch": 0.08, - "learning_rate": 0.0002880506127308777, - "loss": 0.0326, + "epoch": 0.04, + "learning_rate": 0.0002938605063494573, + "loss": 0.0423, "step": 15790 }, { - "epoch": 0.08, - "learning_rate": 0.00028804304503786366, - "loss": 0.0285, + "epoch": 0.04, + "learning_rate": 0.00029385661813308584, + "loss": 0.0448, "step": 15800 }, { - "epoch": 0.08, - "learning_rate": 0.00028803547734484964, - "loss": 0.034, + "epoch": 0.04, + "learning_rate": 0.00029385272991671436, + "loss": 0.0631, "step": 15810 }, { - "epoch": 0.08, - "learning_rate": 0.0002880279096518356, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.0002938488417003429, + "loss": 0.0448, "step": 15820 }, { - "epoch": 0.08, - "learning_rate": 0.0002880203419588216, - "loss": 0.0292, + "epoch": 0.04, + "learning_rate": 0.00029384495348397144, + "loss": 0.039, "step": 15830 }, { - "epoch": 0.08, - "learning_rate": 0.0002880127742658076, - "loss": 0.0298, + "epoch": 0.04, + "learning_rate": 0.0002938410652676, + "loss": 0.0412, "step": 15840 }, { - "epoch": 0.08, - "learning_rate": 0.0002880052065727936, - "loss": 0.0283, + "epoch": 0.04, + "learning_rate": 0.0002938371770512285, + "loss": 0.0431, "step": 15850 }, { - "epoch": 0.08, - "learning_rate": 0.0002879976388797796, - "loss": 0.0338, + "epoch": 0.04, + "learning_rate": 0.0002938332888348571, + "loss": 0.0392, "step": 15860 }, { - "epoch": 0.08, - "learning_rate": 0.0002879900711867656, - "loss": 0.0364, + "epoch": 0.04, + "learning_rate": 0.0002938294006184856, + "loss": 0.0384, "step": 15870 }, { - "epoch": 0.08, - "learning_rate": 0.00028798250349375157, - "loss": 0.028, + "epoch": 0.04, + "learning_rate": 0.0002938255124021141, + "loss": 0.0443, "step": 15880 }, { - "epoch": 0.08, - "learning_rate": 0.00028797493580073755, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029382162418574263, + "loss": 0.0388, "step": 15890 }, { - "epoch": 0.08, - "learning_rate": 0.00028796736810772353, - "loss": 0.0321, + "epoch": 0.04, + "learning_rate": 0.0002938177359693712, + "loss": 0.0378, "step": 15900 }, { - "epoch": 0.08, - "learning_rate": 0.00028795980041470957, - "loss": 0.0291, + "epoch": 0.04, + "learning_rate": 0.0002938138477529997, + "loss": 0.039, "step": 15910 }, { - "epoch": 0.08, - "learning_rate": 0.00028795223272169555, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.0002938099595366283, + "loss": 0.0373, "step": 15920 }, { - "epoch": 0.08, - "learning_rate": 0.00028794466502868153, - "loss": 0.0289, + "epoch": 0.04, + "learning_rate": 0.0002938060713202568, + "loss": 0.0344, "step": 15930 }, { - "epoch": 0.08, - "learning_rate": 0.0002879370973356675, - "loss": 0.0352, + "epoch": 0.04, + "learning_rate": 0.0002938021831038853, + "loss": 0.04, "step": 15940 }, { - "epoch": 0.08, - "learning_rate": 0.0002879295296426535, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.0002937982948875139, + "loss": 0.0326, "step": 15950 }, { - "epoch": 0.08, - "learning_rate": 0.0002879219619496395, - "loss": 0.0366, + "epoch": 0.04, + "learning_rate": 0.0002937944066711424, + "loss": 0.0343, "step": 15960 }, { - "epoch": 0.08, - "learning_rate": 0.00028791439425662546, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002937905184547709, + "loss": 0.043, "step": 15970 }, { - "epoch": 0.08, - "learning_rate": 0.0002879068265636115, - "loss": 0.0363, + "epoch": 0.04, + "learning_rate": 0.0002937866302383995, + "loss": 0.0414, "step": 15980 }, { - "epoch": 0.08, - "learning_rate": 0.0002878992588705975, - "loss": 0.0299, + "epoch": 0.04, + "learning_rate": 0.00029378274202202805, + "loss": 0.0403, "step": 15990 }, { - "epoch": 0.08, - "learning_rate": 0.00028789169117758345, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029377885380565657, + "loss": 0.0366, "step": 16000 }, { - "epoch": 0.08, - "eval_cer": 0.9144945158062973, - "eval_loss": 0.02421427145600319, - "eval_runtime": 116.6835, - "eval_samples_per_second": 17.14, - "eval_steps_per_second": 4.285, + "epoch": 0.04, + "eval_cer": 0.88186084529673, + "eval_loss": 0.03012273460626602, + "eval_runtime": 107.9461, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, "step": 16000 }, { - "epoch": 0.08, - "learning_rate": 0.00028788412348456944, - "loss": 0.0314, + "epoch": 0.04, + "learning_rate": 0.0002937749655892851, + "loss": 0.0375, "step": 16010 }, { - "epoch": 0.08, - "learning_rate": 0.0002878765557915554, - "loss": 0.0338, + "epoch": 0.04, + "learning_rate": 0.0002937710773729136, + "loss": 0.0422, "step": 16020 }, { - "epoch": 0.08, - "learning_rate": 0.0002878689880985414, - "loss": 0.0299, + "epoch": 0.04, + "learning_rate": 0.00029376718915654216, + "loss": 0.0427, "step": 16030 }, { - "epoch": 0.08, - "learning_rate": 0.00028786142040552743, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.0002937633009401707, + "loss": 0.0419, "step": 16040 }, { - "epoch": 0.08, - "learning_rate": 0.0002878538527125134, - "loss": 0.0309, + "epoch": 0.04, + "learning_rate": 0.00029375941272379925, + "loss": 0.0427, "step": 16050 }, { - "epoch": 0.08, - "learning_rate": 0.0002878462850194994, - "loss": 0.0302, + "epoch": 0.04, + "learning_rate": 0.00029375552450742776, + "loss": 0.0404, "step": 16060 }, { - "epoch": 0.08, - "learning_rate": 0.0002878387173264854, - "loss": 0.0344, + "epoch": 0.04, + "learning_rate": 0.00029375163629105633, + "loss": 0.0365, "step": 16070 }, { - "epoch": 0.08, - "learning_rate": 0.00028783114963347136, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.00029374774807468484, + "loss": 0.0372, "step": 16080 }, { - "epoch": 0.08, - "learning_rate": 0.00028782358194045734, - "loss": 0.034, + "epoch": 0.04, + "learning_rate": 0.00029374385985831336, + "loss": 0.0384, "step": 16090 }, { - "epoch": 0.08, - "learning_rate": 0.0002878160142474433, - "loss": 0.0352, + "epoch": 0.04, + "learning_rate": 0.0002937399716419419, + "loss": 0.0423, "step": 16100 }, { - "epoch": 0.08, - "learning_rate": 0.00028780844655442936, - "loss": 0.0281, + "epoch": 0.04, + "learning_rate": 0.00029373608342557044, + "loss": 0.0354, "step": 16110 }, { - "epoch": 0.08, - "learning_rate": 0.00028780087886141534, - "loss": 0.0263, + "epoch": 0.04, + "learning_rate": 0.000293732195209199, + "loss": 0.0394, "step": 16120 }, { - "epoch": 0.08, - "learning_rate": 0.0002877933111684013, - "loss": 0.0265, + "epoch": 0.04, + "learning_rate": 0.0002937283069928275, + "loss": 0.0427, "step": 16130 }, { - "epoch": 0.08, - "learning_rate": 0.0002877857434753873, - "loss": 0.0284, + "epoch": 0.04, + "learning_rate": 0.00029372441877645604, + "loss": 0.0432, "step": 16140 }, { - "epoch": 0.08, - "learning_rate": 0.0002877781757823733, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.00029372053056008455, + "loss": 0.0402, "step": 16150 }, { - "epoch": 0.08, - "learning_rate": 0.00028777060808935927, - "loss": 0.0283, + "epoch": 0.04, + "learning_rate": 0.0002937166423437131, + "loss": 0.0474, "step": 16160 }, { - "epoch": 0.08, - "learning_rate": 0.0002877630403963453, - "loss": 0.033, + "epoch": 0.04, + "learning_rate": 0.00029371275412734164, + "loss": 0.0369, "step": 16170 }, { - "epoch": 0.08, - "learning_rate": 0.0002877554727033313, - "loss": 0.0318, + "epoch": 0.04, + "learning_rate": 0.0002937088659109702, + "loss": 0.0425, "step": 16180 }, { - "epoch": 0.08, - "learning_rate": 0.00028774790501031726, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.0002937049776945987, + "loss": 0.0391, "step": 16190 }, { - "epoch": 0.08, - "learning_rate": 0.00028774033731730325, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.0002937010894782273, + "loss": 0.0389, "step": 16200 }, { - "epoch": 0.08, - "learning_rate": 0.00028773276962428923, - "loss": 0.0288, + "epoch": 0.04, + "learning_rate": 0.0002936972012618558, + "loss": 0.0424, "step": 16210 }, { - "epoch": 0.08, - "learning_rate": 0.0002877252019312752, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.0002936933130454843, + "loss": 0.0423, "step": 16220 }, { - "epoch": 0.08, - "learning_rate": 0.00028771763423826124, - "loss": 0.03, + "epoch": 0.04, + "learning_rate": 0.00029368942482911283, + "loss": 0.0427, "step": 16230 }, { - "epoch": 0.08, - "learning_rate": 0.0002877100665452472, - "loss": 0.0282, + "epoch": 0.04, + "learning_rate": 0.0002936855366127414, + "loss": 0.0383, "step": 16240 }, { - "epoch": 0.08, - "learning_rate": 0.0002877024988522332, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002936816483963699, + "loss": 0.0419, "step": 16250 }, { - "epoch": 0.08, - "learning_rate": 0.0002876949311592192, - "loss": 0.0297, + "epoch": 0.04, + "learning_rate": 0.0002936777601799985, + "loss": 0.0345, "step": 16260 }, { - "epoch": 0.08, - "learning_rate": 0.00028768736346620517, - "loss": 0.0416, + "epoch": 0.04, + "learning_rate": 0.000293673871963627, + "loss": 0.037, "step": 16270 }, { - "epoch": 0.08, - "learning_rate": 0.00028767979577319115, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029366998374725557, + "loss": 0.0443, "step": 16280 }, { - "epoch": 0.08, - "learning_rate": 0.00028767222808017713, - "loss": 0.028, + "epoch": 0.04, + "learning_rate": 0.0002936660955308841, + "loss": 0.0373, "step": 16290 }, { - "epoch": 0.08, - "learning_rate": 0.00028766466038716317, - "loss": 0.0305, + "epoch": 0.04, + "learning_rate": 0.0002936622073145126, + "loss": 0.036, "step": 16300 }, { - "epoch": 0.08, - "learning_rate": 0.00028765709269414915, - "loss": 0.0321, + "epoch": 0.04, + "learning_rate": 0.0002936583190981411, + "loss": 0.0403, "step": 16310 }, { - "epoch": 0.08, - "learning_rate": 0.00028764952500113513, - "loss": 0.0368, + "epoch": 0.04, + "learning_rate": 0.0002936544308817697, + "loss": 0.0389, "step": 16320 }, { - "epoch": 0.08, - "learning_rate": 0.0002876419573081211, - "loss": 0.0294, + "epoch": 0.04, + "learning_rate": 0.00029365054266539825, + "loss": 0.0413, "step": 16330 }, { - "epoch": 0.08, - "learning_rate": 0.0002876343896151071, - "loss": 0.028, + "epoch": 0.04, + "learning_rate": 0.00029364665444902676, + "loss": 0.0449, "step": 16340 }, { - "epoch": 0.08, - "learning_rate": 0.0002876268219220931, - "loss": 0.031, + "epoch": 0.04, + "learning_rate": 0.0002936427662326553, + "loss": 0.041, "step": 16350 }, { - "epoch": 0.08, - "learning_rate": 0.0002876192542290791, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029363887801628385, + "loss": 0.0353, "step": 16360 }, { - "epoch": 0.08, - "learning_rate": 0.0002876116865360651, - "loss": 0.0365, + "epoch": 0.04, + "learning_rate": 0.00029363498979991236, + "loss": 0.0339, "step": 16370 }, { - "epoch": 0.08, - "learning_rate": 0.0002876041188430511, - "loss": 0.0327, + "epoch": 0.04, + "learning_rate": 0.0002936311015835409, + "loss": 0.0417, "step": 16380 }, { - "epoch": 0.08, - "learning_rate": 0.00028759655115003706, - "loss": 0.0309, + "epoch": 0.04, + "learning_rate": 0.00029362721336716945, + "loss": 0.0395, "step": 16390 }, { - "epoch": 0.08, - "learning_rate": 0.00028758898345702304, - "loss": 0.0306, + "epoch": 0.04, + "learning_rate": 0.00029362332515079796, + "loss": 0.0394, "step": 16400 }, { - "epoch": 0.08, - "learning_rate": 0.000287581415764009, - "loss": 0.0296, + "epoch": 0.04, + "learning_rate": 0.00029361943693442653, + "loss": 0.0387, "step": 16410 }, { - "epoch": 0.08, - "learning_rate": 0.000287573848070995, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.00029361554871805504, + "loss": 0.0351, "step": 16420 }, { - "epoch": 0.08, - "learning_rate": 0.00028756628037798104, - "loss": 0.0331, + "epoch": 0.04, + "learning_rate": 0.00029361166050168356, + "loss": 0.0321, "step": 16430 }, { - "epoch": 0.08, - "learning_rate": 0.000287558712684967, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.00029360777228531207, + "loss": 0.0375, "step": 16440 }, { - "epoch": 0.08, - "learning_rate": 0.000287551144991953, - "loss": 0.0395, + "epoch": 0.04, + "learning_rate": 0.00029360388406894064, + "loss": 0.0426, "step": 16450 }, { - "epoch": 0.08, - "learning_rate": 0.000287543577298939, - "loss": 0.0339, + "epoch": 0.04, + "learning_rate": 0.00029359999585256916, + "loss": 0.039, "step": 16460 }, { - "epoch": 0.08, - "learning_rate": 0.00028753600960592496, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.0002935961076361977, + "loss": 0.0398, "step": 16470 }, { - "epoch": 0.08, - "learning_rate": 0.00028752844191291094, - "loss": 0.0343, + "epoch": 0.04, + "learning_rate": 0.00029359221941982624, + "loss": 0.043, "step": 16480 }, { - "epoch": 0.08, - "learning_rate": 0.000287520874219897, - "loss": 0.0391, + "epoch": 0.04, + "learning_rate": 0.0002935883312034548, + "loss": 0.0445, "step": 16490 }, { - "epoch": 0.08, - "learning_rate": 0.00028751330652688296, - "loss": 0.0339, + "epoch": 0.04, + "learning_rate": 0.0002935844429870833, + "loss": 0.0398, "step": 16500 }, { - "epoch": 0.08, - "learning_rate": 0.00028750573883386894, - "loss": 0.0301, + "epoch": 0.04, + "learning_rate": 0.00029358055477071184, + "loss": 0.038, "step": 16510 }, { - "epoch": 0.08, - "learning_rate": 0.0002874981711408549, - "loss": 0.0293, + "epoch": 0.04, + "learning_rate": 0.0002935766665543404, + "loss": 0.0439, "step": 16520 }, { - "epoch": 0.08, - "learning_rate": 0.0002874906034478409, - "loss": 0.03, + "epoch": 0.04, + "learning_rate": 0.0002935727783379689, + "loss": 0.0376, "step": 16530 }, { - "epoch": 0.08, - "learning_rate": 0.0002874830357548269, - "loss": 0.0332, + "epoch": 0.04, + "learning_rate": 0.0002935688901215975, + "loss": 0.03, "step": 16540 }, { - "epoch": 0.08, - "learning_rate": 0.0002874754680618129, - "loss": 0.033, + "epoch": 0.04, + "learning_rate": 0.000293565001905226, + "loss": 0.0415, "step": 16550 }, { - "epoch": 0.08, - "learning_rate": 0.0002874679003687989, - "loss": 0.0313, + "epoch": 0.04, + "learning_rate": 0.0002935611136888545, + "loss": 0.0394, "step": 16560 }, { - "epoch": 0.08, - "learning_rate": 0.0002874603326757849, - "loss": 0.0316, + "epoch": 0.04, + "learning_rate": 0.0002935572254724831, + "loss": 0.0356, "step": 16570 }, { - "epoch": 0.08, - "learning_rate": 0.00028745276498277087, - "loss": 0.0291, + "epoch": 0.04, + "learning_rate": 0.0002935533372561116, + "loss": 0.0372, "step": 16580 }, { - "epoch": 0.08, - "learning_rate": 0.00028744519728975685, - "loss": 0.0332, + "epoch": 0.04, + "learning_rate": 0.0002935494490397401, + "loss": 0.0391, "step": 16590 }, { - "epoch": 0.08, - "learning_rate": 0.00028743762959674283, - "loss": 0.03, + "epoch": 0.04, + "learning_rate": 0.0002935455608233687, + "loss": 0.0421, "step": 16600 }, { - "epoch": 0.08, - "learning_rate": 0.0002874300619037288, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002935416726069972, + "loss": 0.0335, "step": 16610 }, { - "epoch": 0.08, - "learning_rate": 0.00028742249421071485, - "loss": 0.0341, + "epoch": 0.04, + "learning_rate": 0.00029353778439062577, + "loss": 0.039, "step": 16620 }, { - "epoch": 0.08, - "learning_rate": 0.00028741492651770083, - "loss": 0.0323, + "epoch": 0.04, + "learning_rate": 0.0002935338961742543, + "loss": 0.0397, "step": 16630 }, { - "epoch": 0.08, - "learning_rate": 0.0002874073588246868, - "loss": 0.0294, + "epoch": 0.04, + "learning_rate": 0.0002935300079578828, + "loss": 0.0398, "step": 16640 }, { - "epoch": 0.08, - "learning_rate": 0.0002873997911316728, - "loss": 0.0272, + "epoch": 0.04, + "learning_rate": 0.0002935261197415113, + "loss": 0.0357, "step": 16650 }, { - "epoch": 0.08, - "learning_rate": 0.00028739222343865877, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.0002935222315251399, + "loss": 0.0375, "step": 16660 }, { - "epoch": 0.08, - "learning_rate": 0.00028738465574564475, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029351834330876845, + "loss": 0.0341, "step": 16670 }, { - "epoch": 0.08, - "learning_rate": 0.0002873770880526308, - "loss": 0.0294, + "epoch": 0.04, + "learning_rate": 0.00029351445509239696, + "loss": 0.0374, "step": 16680 }, { - "epoch": 0.08, - "learning_rate": 0.00028736952035961677, - "loss": 0.0301, + "epoch": 0.04, + "learning_rate": 0.0002935105668760255, + "loss": 0.0364, "step": 16690 }, { - "epoch": 0.08, - "learning_rate": 0.00028736195266660275, - "loss": 0.0301, + "epoch": 0.04, + "learning_rate": 0.00029350667865965405, + "loss": 0.0414, "step": 16700 }, { - "epoch": 0.08, - "learning_rate": 0.00028735438497358873, - "loss": 0.0299, + "epoch": 0.04, + "learning_rate": 0.00029350279044328256, + "loss": 0.0346, "step": 16710 }, { - "epoch": 0.08, - "learning_rate": 0.0002873468172805747, - "loss": 0.0355, + "epoch": 0.04, + "learning_rate": 0.0002934989022269111, + "loss": 0.038, "step": 16720 }, { - "epoch": 0.08, - "learning_rate": 0.0002873392495875607, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.00029349501401053964, + "loss": 0.0385, "step": 16730 }, { - "epoch": 0.08, - "learning_rate": 0.00028733168189454673, - "loss": 0.0323, + "epoch": 0.04, + "learning_rate": 0.00029349112579416816, + "loss": 0.0394, "step": 16740 }, { - "epoch": 0.08, - "learning_rate": 0.0002873241142015327, - "loss": 0.0399, + "epoch": 0.04, + "learning_rate": 0.00029348723757779673, + "loss": 0.042, "step": 16750 }, { - "epoch": 0.08, - "learning_rate": 0.0002873165465085187, - "loss": 0.034, + "epoch": 0.04, + "learning_rate": 0.00029348334936142524, + "loss": 0.0362, "step": 16760 }, { - "epoch": 0.08, - "learning_rate": 0.0002873089788155047, - "loss": 0.036, + "epoch": 0.04, + "learning_rate": 0.00029347946114505376, + "loss": 0.0386, "step": 16770 }, { - "epoch": 0.08, - "learning_rate": 0.00028730141112249066, - "loss": 0.0351, + "epoch": 0.04, + "learning_rate": 0.0002934755729286823, + "loss": 0.0346, "step": 16780 }, { - "epoch": 0.08, - "learning_rate": 0.00028729384342947664, - "loss": 0.033, + "epoch": 0.04, + "learning_rate": 0.00029347168471231084, + "loss": 0.0407, "step": 16790 }, { - "epoch": 0.08, - "learning_rate": 0.0002872862757364626, - "loss": 0.0324, + "epoch": 0.04, + "learning_rate": 0.00029346779649593935, + "loss": 0.042, "step": 16800 }, { - "epoch": 0.08, - "learning_rate": 0.00028727870804344866, - "loss": 0.0323, + "epoch": 0.04, + "learning_rate": 0.0002934639082795679, + "loss": 0.0405, "step": 16810 }, { - "epoch": 0.08, - "learning_rate": 0.00028727114035043464, - "loss": 0.0301, + "epoch": 0.04, + "learning_rate": 0.0002934600200631965, + "loss": 0.037, "step": 16820 }, { - "epoch": 0.08, - "learning_rate": 0.0002872635726574206, - "loss": 0.0378, + "epoch": 0.04, + "learning_rate": 0.000293456131846825, + "loss": 0.0323, "step": 16830 }, { - "epoch": 0.08, - "learning_rate": 0.0002872560049644066, - "loss": 0.0318, + "epoch": 0.04, + "learning_rate": 0.0002934522436304535, + "loss": 0.0396, "step": 16840 }, { - "epoch": 0.09, - "learning_rate": 0.0002872484372713926, - "loss": 0.0299, + "epoch": 0.04, + "learning_rate": 0.00029344835541408204, + "loss": 0.043, "step": 16850 }, { - "epoch": 0.09, - "learning_rate": 0.00028724086957837856, - "loss": 0.0302, + "epoch": 0.04, + "learning_rate": 0.0002934444671977106, + "loss": 0.0394, "step": 16860 }, { - "epoch": 0.09, - "learning_rate": 0.0002872333018853646, - "loss": 0.0349, + "epoch": 0.04, + "learning_rate": 0.0002934405789813391, + "loss": 0.0429, "step": 16870 }, { - "epoch": 0.09, - "learning_rate": 0.0002872257341923506, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002934366907649677, + "loss": 0.0388, "step": 16880 }, { - "epoch": 0.09, - "learning_rate": 0.00028721816649933656, - "loss": 0.0354, + "epoch": 0.04, + "learning_rate": 0.0002934328025485962, + "loss": 0.0435, "step": 16890 }, { - "epoch": 0.09, - "learning_rate": 0.00028721059880632254, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.0002934289143322247, + "loss": 0.0428, "step": 16900 }, { - "epoch": 0.09, - "learning_rate": 0.0002872030311133085, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.0002934250261158533, + "loss": 0.0457, "step": 16910 }, { - "epoch": 0.09, - "learning_rate": 0.0002871954634202945, - "loss": 0.0345, + "epoch": 0.04, + "learning_rate": 0.0002934211378994818, + "loss": 0.0409, "step": 16920 }, { - "epoch": 0.09, - "learning_rate": 0.0002871878957272805, - "loss": 0.0307, + "epoch": 0.04, + "learning_rate": 0.0002934172496831103, + "loss": 0.0415, "step": 16930 }, { - "epoch": 0.09, - "learning_rate": 0.0002871803280342665, - "loss": 0.032, + "epoch": 0.04, + "learning_rate": 0.0002934133614667389, + "loss": 0.0393, "step": 16940 }, { - "epoch": 0.09, - "learning_rate": 0.0002871727603412525, - "loss": 0.0293, + "epoch": 0.04, + "learning_rate": 0.0002934094732503674, + "loss": 0.0429, "step": 16950 }, { - "epoch": 0.09, - "learning_rate": 0.0002871651926482385, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029340558503399597, + "loss": 0.0338, "step": 16960 }, { - "epoch": 0.09, - "learning_rate": 0.00028715762495522447, - "loss": 0.0278, + "epoch": 0.04, + "learning_rate": 0.0002934016968176245, + "loss": 0.048, "step": 16970 }, { - "epoch": 0.09, - "learning_rate": 0.00028715005726221045, - "loss": 0.0296, + "epoch": 0.04, + "learning_rate": 0.000293397808601253, + "loss": 0.0363, "step": 16980 }, { - "epoch": 0.09, - "learning_rate": 0.00028714248956919643, - "loss": 0.0333, + "epoch": 0.04, + "learning_rate": 0.00029339392038488156, + "loss": 0.0343, "step": 16990 }, { - "epoch": 0.09, - "learning_rate": 0.0002871349218761824, - "loss": 0.0302, + "epoch": 0.04, + "learning_rate": 0.0002933900321685101, + "loss": 0.0352, "step": 17000 }, { - "epoch": 0.09, - "eval_cer": 0.9145527395738214, - "eval_loss": 0.023293539881706238, - "eval_runtime": 117.3978, - "eval_samples_per_second": 17.036, - "eval_steps_per_second": 4.259, + "epoch": 0.04, + "eval_cer": 0.8818314529211123, + "eval_loss": 0.028564387932419777, + "eval_runtime": 107.5392, + "eval_samples_per_second": 18.598, + "eval_steps_per_second": 4.649, "step": 17000 }, { - "epoch": 0.09, - "learning_rate": 0.0002871273541831684, - "loss": 0.0279, + "epoch": 0.04, + "learning_rate": 0.0002933861439521386, + "loss": 0.0351, "step": 17010 }, { - "epoch": 0.09, - "learning_rate": 0.0002871197864901544, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029338225573576716, + "loss": 0.045, "step": 17020 }, { - "epoch": 0.09, - "learning_rate": 0.00028711221879714036, - "loss": 0.0283, + "epoch": 0.04, + "learning_rate": 0.00029337836751939573, + "loss": 0.0414, "step": 17030 }, { - "epoch": 0.09, - "learning_rate": 0.0002871046511041264, - "loss": 0.0282, + "epoch": 0.04, + "learning_rate": 0.00029337447930302425, + "loss": 0.0377, "step": 17040 }, { - "epoch": 0.09, - "learning_rate": 0.0002870970834111124, - "loss": 0.0307, + "epoch": 0.04, + "learning_rate": 0.00029337059108665276, + "loss": 0.0351, "step": 17050 }, { - "epoch": 0.09, - "learning_rate": 0.00028708951571809836, - "loss": 0.0334, + "epoch": 0.04, + "learning_rate": 0.0002933667028702813, + "loss": 0.0405, "step": 17060 }, { - "epoch": 0.09, - "learning_rate": 0.00028708194802508434, - "loss": 0.0319, + "epoch": 0.04, + "learning_rate": 0.00029336281465390984, + "loss": 0.0365, "step": 17070 }, { - "epoch": 0.09, - "learning_rate": 0.0002870743803320703, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029335892643753836, + "loss": 0.0401, "step": 17080 }, { - "epoch": 0.09, - "learning_rate": 0.0002870668126390563, - "loss": 0.027, + "epoch": 0.04, + "learning_rate": 0.0002933550382211669, + "loss": 0.0421, "step": 17090 }, { - "epoch": 0.09, - "learning_rate": 0.00028705924494604234, - "loss": 0.0343, + "epoch": 0.04, + "learning_rate": 0.00029335115000479544, + "loss": 0.0378, "step": 17100 }, { - "epoch": 0.09, - "learning_rate": 0.0002870516772530283, - "loss": 0.0314, + "epoch": 0.04, + "learning_rate": 0.000293347261788424, + "loss": 0.0412, "step": 17110 }, { - "epoch": 0.09, - "learning_rate": 0.0002870441095600143, - "loss": 0.0286, + "epoch": 0.04, + "learning_rate": 0.0002933433735720525, + "loss": 0.0424, "step": 17120 }, { - "epoch": 0.09, - "learning_rate": 0.0002870365418670003, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.00029333948535568104, + "loss": 0.0388, "step": 17130 }, { - "epoch": 0.09, - "learning_rate": 0.00028702897417398626, - "loss": 0.0329, + "epoch": 0.04, + "learning_rate": 0.00029333559713930955, + "loss": 0.0443, "step": 17140 }, { - "epoch": 0.09, - "learning_rate": 0.00028702140648097224, - "loss": 0.0308, + "epoch": 0.04, + "learning_rate": 0.0002933317089229381, + "loss": 0.0342, "step": 17150 }, { - "epoch": 0.09, - "learning_rate": 0.0002870138387879582, - "loss": 0.0304, + "epoch": 0.04, + "learning_rate": 0.00029332782070656664, + "loss": 0.0447, "step": 17160 }, { - "epoch": 0.09, - "learning_rate": 0.00028700627109494426, - "loss": 0.0315, + "epoch": 0.04, + "learning_rate": 0.0002933239324901952, + "loss": 0.0342, "step": 17170 }, { - "epoch": 0.09, - "learning_rate": 0.00028699870340193024, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.0002933200442738237, + "loss": 0.0426, "step": 17180 }, { - "epoch": 0.09, - "learning_rate": 0.0002869911357089162, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.00029331615605745223, + "loss": 0.0443, "step": 17190 }, { - "epoch": 0.09, - "learning_rate": 0.0002869835680159022, - "loss": 0.0369, + "epoch": 0.04, + "learning_rate": 0.0002933122678410808, + "loss": 0.0332, "step": 17200 }, { - "epoch": 0.09, - "learning_rate": 0.0002869760003228882, - "loss": 0.0303, + "epoch": 0.04, + "learning_rate": 0.0002933083796247093, + "loss": 0.0393, "step": 17210 }, { - "epoch": 0.09, - "learning_rate": 0.00028696843262987417, - "loss": 0.0252, + "epoch": 0.04, + "learning_rate": 0.0002933044914083379, + "loss": 0.0423, "step": 17220 }, { - "epoch": 0.09, - "learning_rate": 0.0002869608649368602, - "loss": 0.0312, + "epoch": 0.04, + "learning_rate": 0.0002933006031919664, + "loss": 0.0331, "step": 17230 }, { - "epoch": 0.09, - "learning_rate": 0.0002869532972438462, - "loss": 0.0317, + "epoch": 0.04, + "learning_rate": 0.00029329671497559497, + "loss": 0.0416, "step": 17240 }, { - "epoch": 0.09, - "learning_rate": 0.00028694572955083217, - "loss": 0.0286, + "epoch": 0.04, + "learning_rate": 0.0002932928267592235, + "loss": 0.0355, "step": 17250 }, { - "epoch": 0.09, - "learning_rate": 0.00028693816185781815, - "loss": 0.0246, + "epoch": 0.04, + "learning_rate": 0.000293288938542852, + "loss": 0.0351, "step": 17260 }, { - "epoch": 0.09, - "learning_rate": 0.00028693059416480413, - "loss": 0.0347, + "epoch": 0.04, + "learning_rate": 0.0002932850503264805, + "loss": 0.045, "step": 17270 }, { - "epoch": 0.09, - "learning_rate": 0.0002869230264717901, - "loss": 0.0277, + "epoch": 0.04, + "learning_rate": 0.0002932811621101091, + "loss": 0.0364, "step": 17280 }, { - "epoch": 0.09, - "learning_rate": 0.00028691545877877615, - "loss": 0.0274, + "epoch": 0.04, + "learning_rate": 0.0002932772738937376, + "loss": 0.0329, "step": 17290 }, { - "epoch": 0.09, - "learning_rate": 0.0002869078910857621, - "loss": 0.0322, + "epoch": 0.04, + "learning_rate": 0.00029327338567736617, + "loss": 0.0359, "step": 17300 }, { - "epoch": 0.09, - "learning_rate": 0.0002869003233927481, - "loss": 0.0295, + "epoch": 0.04, + "learning_rate": 0.0002932694974609947, + "loss": 0.0427, "step": 17310 }, { - "epoch": 0.09, - "learning_rate": 0.0002868927556997341, - "loss": 0.0297, + "epoch": 0.04, + "learning_rate": 0.00029326560924462325, + "loss": 0.0444, "step": 17320 }, { - "epoch": 0.09, - "learning_rate": 0.00028688518800672007, - "loss": 0.0277, + "epoch": 0.04, + "learning_rate": 0.00029326172102825176, + "loss": 0.0363, "step": 17330 }, { - "epoch": 0.09, - "learning_rate": 0.00028687762031370605, - "loss": 0.0328, + "epoch": 0.04, + "learning_rate": 0.0002932578328118803, + "loss": 0.0453, "step": 17340 }, { - "epoch": 0.09, - "learning_rate": 0.00028687005262069203, - "loss": 0.0314, + "epoch": 0.04, + "learning_rate": 0.0002932539445955088, + "loss": 0.0377, "step": 17350 }, { - "epoch": 0.09, - "learning_rate": 0.00028686248492767807, - "loss": 0.0325, + "epoch": 0.04, + "learning_rate": 0.00029325005637913736, + "loss": 0.0508, "step": 17360 }, { - "epoch": 0.09, - "learning_rate": 0.00028685491723466405, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.00029324616816276593, + "loss": 0.0391, "step": 17370 }, { - "epoch": 0.09, - "learning_rate": 0.00028684734954165003, - "loss": 0.0308, + "epoch": 0.05, + "learning_rate": 0.00029324227994639444, + "loss": 0.043, "step": 17380 }, { - "epoch": 0.09, - "learning_rate": 0.000286839781848636, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.00029323839173002296, + "loss": 0.0637, "step": 17390 }, { - "epoch": 0.09, - "learning_rate": 0.000286832214155622, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.0002932345035136515, + "loss": 0.1008, "step": 17400 }, { - "epoch": 0.09, - "learning_rate": 0.000286824646462608, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.00029323061529728004, + "loss": 0.0745, "step": 17410 }, { - "epoch": 0.09, - "learning_rate": 0.000286817078769594, - "loss": 0.0334, + "epoch": 0.05, + "learning_rate": 0.00029322672708090856, + "loss": 0.054, "step": 17420 }, { - "epoch": 0.09, - "learning_rate": 0.00028680951107658, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.0002932228388645371, + "loss": 0.0342, "step": 17430 }, { - "epoch": 0.09, - "learning_rate": 0.000286801943383566, - "loss": 0.0283, + "epoch": 0.05, + "learning_rate": 0.00029321895064816564, + "loss": 0.038, "step": 17440 }, { - "epoch": 0.09, - "learning_rate": 0.00028679437569055196, - "loss": 0.032, + "epoch": 0.05, + "learning_rate": 0.0002932150624317942, + "loss": 0.0426, "step": 17450 }, { - "epoch": 0.09, - "learning_rate": 0.00028678680799753794, - "loss": 0.0244, + "epoch": 0.05, + "learning_rate": 0.0002932111742154227, + "loss": 0.0394, "step": 17460 }, { - "epoch": 0.09, - "learning_rate": 0.0002867792403045239, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029320728599905124, + "loss": 0.0476, "step": 17470 }, { - "epoch": 0.09, - "learning_rate": 0.00028677167261150996, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.00029320339778267975, + "loss": 0.0438, "step": 17480 }, { - "epoch": 0.09, - "learning_rate": 0.00028676410491849594, - "loss": 0.034, + "epoch": 0.05, + "learning_rate": 0.0002931995095663083, + "loss": 0.04, "step": 17490 }, { - "epoch": 0.09, - "learning_rate": 0.0002867565372254819, - "loss": 0.0267, + "epoch": 0.05, + "learning_rate": 0.00029319562134993684, + "loss": 0.046, "step": 17500 }, { - "epoch": 0.09, - "learning_rate": 0.0002867489695324679, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.0002931917331335654, + "loss": 0.045, "step": 17510 }, { - "epoch": 0.09, - "learning_rate": 0.0002867414018394539, - "loss": 0.0289, + "epoch": 0.05, + "learning_rate": 0.0002931878449171939, + "loss": 0.0622, "step": 17520 }, { - "epoch": 0.09, - "learning_rate": 0.00028673383414643986, - "loss": 0.0278, + "epoch": 0.05, + "learning_rate": 0.0002931839567008225, + "loss": 0.0487, "step": 17530 }, { - "epoch": 0.09, - "learning_rate": 0.00028672626645342584, - "loss": 0.035, + "epoch": 0.05, + "learning_rate": 0.000293180068484451, + "loss": 0.0501, "step": 17540 }, { - "epoch": 0.09, - "learning_rate": 0.0002867186987604119, - "loss": 0.0308, + "epoch": 0.05, + "learning_rate": 0.0002931761802680795, + "loss": 0.0463, "step": 17550 }, { - "epoch": 0.09, - "learning_rate": 0.00028671113106739786, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.00029317229205170803, + "loss": 0.0434, "step": 17560 }, { - "epoch": 0.09, - "learning_rate": 0.00028670356337438384, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.0002931684038353366, + "loss": 0.0388, "step": 17570 }, { - "epoch": 0.09, - "learning_rate": 0.0002866959956813698, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.00029316451561896517, + "loss": 0.0394, "step": 17580 }, { - "epoch": 0.09, - "learning_rate": 0.0002866884279883558, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.0002931606274025937, + "loss": 0.047, "step": 17590 }, { - "epoch": 0.09, - "learning_rate": 0.0002866808602953418, - "loss": 0.0384, + "epoch": 0.05, + "learning_rate": 0.0002931567391862222, + "loss": 0.0409, "step": 17600 }, { - "epoch": 0.09, - "learning_rate": 0.0002866732926023278, - "loss": 0.0315, + "epoch": 0.05, + "learning_rate": 0.00029315285096985077, + "loss": 0.0423, "step": 17610 }, { - "epoch": 0.09, - "learning_rate": 0.0002866657249093138, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002931489627534793, + "loss": 0.0436, "step": 17620 }, { - "epoch": 0.09, - "learning_rate": 0.0002866581572162998, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002931450745371078, + "loss": 0.0505, "step": 17630 }, { - "epoch": 0.09, - "learning_rate": 0.00028665058952328577, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.00029314118632073636, + "loss": 0.0406, "step": 17640 }, { - "epoch": 0.09, - "learning_rate": 0.00028664302183027175, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.0002931372981043649, + "loss": 0.0467, "step": 17650 }, { - "epoch": 0.09, - "learning_rate": 0.00028663545413725773, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029313340988799345, + "loss": 0.0471, "step": 17660 }, { - "epoch": 0.09, - "learning_rate": 0.0002866278864442437, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.00029312952167162196, + "loss": 0.0431, "step": 17670 }, { - "epoch": 0.09, - "learning_rate": 0.00028662031875122975, - "loss": 0.0325, + "epoch": 0.05, + "learning_rate": 0.0002931256334552505, + "loss": 0.0411, "step": 17680 }, { - "epoch": 0.09, - "learning_rate": 0.00028661275105821573, - "loss": 0.0299, + "epoch": 0.05, + "learning_rate": 0.000293121745238879, + "loss": 0.0391, "step": 17690 }, { - "epoch": 0.09, - "learning_rate": 0.0002866051833652017, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.00029311785702250756, + "loss": 0.0407, "step": 17700 }, { - "epoch": 0.09, - "learning_rate": 0.0002865976156721877, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.00029311396880613613, + "loss": 0.0371, "step": 17710 }, { - "epoch": 0.09, - "learning_rate": 0.00028659004797917367, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029311008058976464, + "loss": 0.0345, "step": 17720 }, { - "epoch": 0.09, - "learning_rate": 0.00028658248028615965, - "loss": 0.0352, + "epoch": 0.05, + "learning_rate": 0.00029310619237339316, + "loss": 0.0467, "step": 17730 }, { - "epoch": 0.09, - "learning_rate": 0.0002865749125931457, - "loss": 0.0326, + "epoch": 0.05, + "learning_rate": 0.0002931023041570217, + "loss": 0.0382, "step": 17740 }, { - "epoch": 0.09, - "learning_rate": 0.00028656734490013167, - "loss": 0.0296, + "epoch": 0.05, + "learning_rate": 0.00029309841594065024, + "loss": 0.04, "step": 17750 }, { - "epoch": 0.09, - "learning_rate": 0.00028655977720711765, - "loss": 0.0295, + "epoch": 0.05, + "learning_rate": 0.00029309452772427876, + "loss": 0.0461, "step": 17760 }, { - "epoch": 0.09, - "learning_rate": 0.00028655220951410363, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002930906395079073, + "loss": 0.0412, "step": 17770 }, { - "epoch": 0.09, - "learning_rate": 0.0002865446418210896, - "loss": 0.0272, + "epoch": 0.05, + "learning_rate": 0.00029308675129153584, + "loss": 0.0387, "step": 17780 }, { - "epoch": 0.09, - "learning_rate": 0.0002865370741280756, - "loss": 0.0346, + "epoch": 0.05, + "learning_rate": 0.0002930828630751644, + "loss": 0.0421, "step": 17790 }, { - "epoch": 0.09, - "learning_rate": 0.00028652950643506163, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.0002930789748587929, + "loss": 0.0376, "step": 17800 }, { - "epoch": 0.09, - "learning_rate": 0.0002865219387420476, - "loss": 0.0374, + "epoch": 0.05, + "learning_rate": 0.00029307508664242144, + "loss": 0.0397, "step": 17810 }, { - "epoch": 0.09, - "learning_rate": 0.0002865143710490336, - "loss": 0.0299, + "epoch": 0.05, + "learning_rate": 0.00029307119842605, + "loss": 0.0395, "step": 17820 }, { - "epoch": 0.09, - "learning_rate": 0.0002865068033560196, - "loss": 0.0341, + "epoch": 0.05, + "learning_rate": 0.0002930673102096785, + "loss": 0.0456, "step": 17830 }, { - "epoch": 0.09, - "learning_rate": 0.00028649923566300556, - "loss": 0.0345, + "epoch": 0.05, + "learning_rate": 0.00029306342199330703, + "loss": 0.0295, "step": 17840 }, { - "epoch": 0.09, - "learning_rate": 0.00028649166796999154, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.0002930595337769356, + "loss": 0.0348, "step": 17850 }, { - "epoch": 0.09, - "learning_rate": 0.0002864841002769775, - "loss": 0.0388, + "epoch": 0.05, + "learning_rate": 0.00029305564556056417, + "loss": 0.0363, "step": 17860 }, { - "epoch": 0.09, - "learning_rate": 0.00028647653258396356, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.0002930517573441927, + "loss": 0.0358, "step": 17870 }, { - "epoch": 0.09, - "learning_rate": 0.00028646896489094954, - "loss": 0.0301, + "epoch": 0.05, + "learning_rate": 0.0002930478691278212, + "loss": 0.0374, "step": 17880 }, { - "epoch": 0.09, - "learning_rate": 0.0002864613971979355, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.0002930439809114497, + "loss": 0.0346, "step": 17890 }, { - "epoch": 0.09, - "learning_rate": 0.0002864538295049215, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.00029304009269507823, + "loss": 0.0352, "step": 17900 }, { - "epoch": 0.09, - "learning_rate": 0.0002864462618119075, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.0002930362044787068, + "loss": 0.0429, "step": 17910 }, { - "epoch": 0.09, - "learning_rate": 0.00028643869411889346, - "loss": 0.035, + "epoch": 0.05, + "learning_rate": 0.00029303231626233537, + "loss": 0.0409, "step": 17920 }, { - "epoch": 0.09, - "learning_rate": 0.0002864311264258795, - "loss": 0.033, + "epoch": 0.05, + "learning_rate": 0.0002930284280459639, + "loss": 0.0371, "step": 17930 }, { - "epoch": 0.09, - "learning_rate": 0.0002864235587328655, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.0002930245398295924, + "loss": 0.036, "step": 17940 }, { - "epoch": 0.09, - "learning_rate": 0.00028641599103985146, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029302065161322096, + "loss": 0.0396, "step": 17950 }, { - "epoch": 0.09, - "learning_rate": 0.00028640842334683744, - "loss": 0.0367, + "epoch": 0.05, + "learning_rate": 0.0002930167633968495, + "loss": 0.0401, "step": 17960 }, { - "epoch": 0.09, - "learning_rate": 0.0002864008556538234, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.000293012875180478, + "loss": 0.0313, "step": 17970 }, { - "epoch": 0.09, - "learning_rate": 0.0002863932879608094, - "loss": 0.032, + "epoch": 0.05, + "learning_rate": 0.00029300898696410656, + "loss": 0.0472, "step": 17980 }, { - "epoch": 0.09, - "learning_rate": 0.00028638572026779544, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.0002930050987477351, + "loss": 0.0331, "step": 17990 }, { - "epoch": 0.09, - "learning_rate": 0.0002863781525747814, - "loss": 0.03, + "epoch": 0.05, + "learning_rate": 0.00029300121053136365, + "loss": 0.0385, "step": 18000 }, { - "epoch": 0.09, - "eval_cer": 0.9144838414489178, - "eval_loss": 0.022705839946866035, - "eval_runtime": 117.5421, - "eval_samples_per_second": 17.015, - "eval_steps_per_second": 4.254, + "epoch": 0.05, + "eval_cer": 0.8818174565517705, + "eval_loss": 0.02818988636136055, + "eval_runtime": 107.7914, + "eval_samples_per_second": 18.554, + "eval_steps_per_second": 4.639, "step": 18000 }, { - "epoch": 0.09, - "learning_rate": 0.0002863705848817674, - "loss": 0.0372, + "epoch": 0.05, + "learning_rate": 0.00029299732231499216, + "loss": 0.0375, "step": 18010 }, { - "epoch": 0.09, - "learning_rate": 0.0002863630171887534, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.0002929934340986207, + "loss": 0.0344, "step": 18020 }, { - "epoch": 0.09, - "learning_rate": 0.00028635544949573937, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029298954588224924, + "loss": 0.0401, "step": 18030 }, { - "epoch": 0.09, - "learning_rate": 0.00028634788180272535, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.00029298565766587776, + "loss": 0.0356, "step": 18040 }, { - "epoch": 0.09, - "learning_rate": 0.00028634031410971133, - "loss": 0.0281, + "epoch": 0.05, + "learning_rate": 0.00029298176944950627, + "loss": 0.04, "step": 18050 }, { - "epoch": 0.09, - "learning_rate": 0.00028633274641669737, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.00029297788123313484, + "loss": 0.0391, "step": 18060 }, { - "epoch": 0.09, - "learning_rate": 0.00028632517872368335, - "loss": 0.0322, + "epoch": 0.05, + "learning_rate": 0.0002929739930167634, + "loss": 0.0347, "step": 18070 }, { - "epoch": 0.09, - "learning_rate": 0.00028631761103066933, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.0002929701048003919, + "loss": 0.0388, "step": 18080 }, { - "epoch": 0.09, - "learning_rate": 0.0002863100433376553, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.00029296621658402044, + "loss": 0.0354, "step": 18090 }, { - "epoch": 0.09, - "learning_rate": 0.0002863024756446413, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.00029296232836764895, + "loss": 0.0368, "step": 18100 }, { - "epoch": 0.09, - "learning_rate": 0.0002862949079516273, - "loss": 0.0275, + "epoch": 0.05, + "learning_rate": 0.0002929584401512775, + "loss": 0.0324, "step": 18110 }, { - "epoch": 0.09, - "learning_rate": 0.0002862873402586133, - "loss": 0.0325, + "epoch": 0.05, + "learning_rate": 0.00029295455193490604, + "loss": 0.0333, "step": 18120 }, { - "epoch": 0.09, - "learning_rate": 0.0002862797725655993, - "loss": 0.0323, + "epoch": 0.05, + "learning_rate": 0.0002929506637185346, + "loss": 0.0403, "step": 18130 }, { - "epoch": 0.09, - "learning_rate": 0.00028627220487258527, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.0002929467755021631, + "loss": 0.0367, "step": 18140 }, { - "epoch": 0.09, - "learning_rate": 0.00028626463717957125, - "loss": 0.0337, + "epoch": 0.05, + "learning_rate": 0.00029294288728579164, + "loss": 0.0446, "step": 18150 }, { - "epoch": 0.09, - "learning_rate": 0.00028625706948655724, - "loss": 0.0313, + "epoch": 0.05, + "learning_rate": 0.0002929389990694202, + "loss": 0.0285, "step": 18160 }, { - "epoch": 0.09, - "learning_rate": 0.0002862495017935432, - "loss": 0.039, + "epoch": 0.05, + "learning_rate": 0.0002929351108530487, + "loss": 0.0341, "step": 18170 }, { - "epoch": 0.09, - "learning_rate": 0.0002862419341005292, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.00029293122263667723, + "loss": 0.0437, "step": 18180 }, { - "epoch": 0.09, - "learning_rate": 0.00028623436640751523, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.0002929273344203058, + "loss": 0.0379, "step": 18190 }, { - "epoch": 0.09, - "learning_rate": 0.0002862267987145012, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.0002929234462039343, + "loss": 0.0394, "step": 18200 }, { - "epoch": 0.09, - "learning_rate": 0.0002862192310214872, - "loss": 0.0327, + "epoch": 0.05, + "learning_rate": 0.0002929195579875629, + "loss": 0.0371, "step": 18210 }, { - "epoch": 0.09, - "learning_rate": 0.0002862116633284732, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.0002929156697711914, + "loss": 0.0337, "step": 18220 }, { - "epoch": 0.09, - "learning_rate": 0.00028620409563545916, - "loss": 0.025, + "epoch": 0.05, + "learning_rate": 0.0002929117815548199, + "loss": 0.0402, "step": 18230 }, { - "epoch": 0.09, - "learning_rate": 0.00028619652794244514, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.0002929078933384485, + "loss": 0.0381, "step": 18240 }, { - "epoch": 0.09, - "learning_rate": 0.0002861889602494311, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.000292904005122077, + "loss": 0.0343, "step": 18250 }, { - "epoch": 0.09, - "learning_rate": 0.0002861813925564171, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029290011690570557, + "loss": 0.0386, "step": 18260 }, { - "epoch": 0.09, - "learning_rate": 0.0002861738248634031, - "loss": 0.0253, + "epoch": 0.05, + "learning_rate": 0.0002928962286893341, + "loss": 0.0356, "step": 18270 }, { - "epoch": 0.09, - "learning_rate": 0.00028616625717038907, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.00029289234047296265, + "loss": 0.0362, "step": 18280 }, { - "epoch": 0.09, - "learning_rate": 0.0002861586894773751, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.00029288845225659116, + "loss": 0.0328, "step": 18290 }, { - "epoch": 0.09, - "learning_rate": 0.0002861511217843611, - "loss": 0.0257, + "epoch": 0.05, + "learning_rate": 0.0002928845640402197, + "loss": 0.0363, "step": 18300 }, { - "epoch": 0.09, - "learning_rate": 0.00028614355409134707, - "loss": 0.0315, + "epoch": 0.05, + "learning_rate": 0.0002928806758238482, + "loss": 0.0394, "step": 18310 }, { - "epoch": 0.09, - "learning_rate": 0.00028613598639833305, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.00029287678760747676, + "loss": 0.0322, "step": 18320 }, { - "epoch": 0.09, - "learning_rate": 0.00028612841870531903, - "loss": 0.0262, + "epoch": 0.05, + "learning_rate": 0.0002928728993911053, + "loss": 0.0389, "step": 18330 }, { - "epoch": 0.09, - "learning_rate": 0.000286120851012305, - "loss": 0.0273, + "epoch": 0.05, + "learning_rate": 0.00029286901117473384, + "loss": 0.0394, "step": 18340 }, { - "epoch": 0.09, - "learning_rate": 0.00028611328331929105, - "loss": 0.0336, + "epoch": 0.05, + "learning_rate": 0.00029286512295836236, + "loss": 0.0323, "step": 18350 }, { - "epoch": 0.09, - "learning_rate": 0.000286105715626277, - "loss": 0.0279, + "epoch": 0.05, + "learning_rate": 0.0002928612347419909, + "loss": 0.0445, "step": 18360 }, { - "epoch": 0.09, - "learning_rate": 0.000286098147933263, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.00029285734652561944, + "loss": 0.0385, "step": 18370 }, { - "epoch": 0.09, - "learning_rate": 0.000286090580240249, - "loss": 0.036, + "epoch": 0.05, + "learning_rate": 0.00029285345830924796, + "loss": 0.0338, "step": 18380 }, { - "epoch": 0.09, - "learning_rate": 0.00028608301254723497, - "loss": 0.0276, + "epoch": 0.05, + "learning_rate": 0.00029284957009287647, + "loss": 0.0383, "step": 18390 }, { - "epoch": 0.09, - "learning_rate": 0.00028607544485422095, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.00029284568187650504, + "loss": 0.0389, "step": 18400 }, { - "epoch": 0.09, - "learning_rate": 0.00028606787716120693, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.0002928417936601336, + "loss": 0.0431, "step": 18410 }, { - "epoch": 0.09, - "learning_rate": 0.00028606030946819297, - "loss": 0.0325, + "epoch": 0.05, + "learning_rate": 0.0002928379054437621, + "loss": 0.0422, "step": 18420 }, { - "epoch": 0.09, - "learning_rate": 0.00028605274177517895, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.00029283401722739064, + "loss": 0.0336, "step": 18430 }, { - "epoch": 0.09, - "learning_rate": 0.00028604517408216493, - "loss": 0.0289, + "epoch": 0.05, + "learning_rate": 0.00029283012901101915, + "loss": 0.0368, "step": 18440 }, { - "epoch": 0.09, - "learning_rate": 0.0002860376063891509, - "loss": 0.0284, + "epoch": 0.05, + "learning_rate": 0.0002928262407946477, + "loss": 0.0344, "step": 18450 }, { - "epoch": 0.09, - "learning_rate": 0.0002860300386961369, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.00029282235257827624, + "loss": 0.0366, "step": 18460 }, { - "epoch": 0.09, - "learning_rate": 0.0002860224710031229, - "loss": 0.0249, + "epoch": 0.05, + "learning_rate": 0.0002928184643619048, + "loss": 0.0362, "step": 18470 }, { - "epoch": 0.09, - "learning_rate": 0.0002860149033101089, - "loss": 0.0263, + "epoch": 0.05, + "learning_rate": 0.0002928145761455333, + "loss": 0.0355, "step": 18480 }, { - "epoch": 0.09, - "learning_rate": 0.0002860073356170949, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.0002928106879291619, + "loss": 0.038, "step": 18490 }, { - "epoch": 0.09, - "learning_rate": 0.0002859997679240809, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.0002928067997127904, + "loss": 0.0385, "step": 18500 }, { - "epoch": 0.09, - "learning_rate": 0.00028599220023106686, - "loss": 0.0284, + "epoch": 0.05, + "learning_rate": 0.0002928029114964189, + "loss": 0.0376, "step": 18510 }, { - "epoch": 0.09, - "learning_rate": 0.00028598463253805284, - "loss": 0.0301, + "epoch": 0.05, + "learning_rate": 0.00029279902328004743, + "loss": 0.0368, "step": 18520 }, { - "epoch": 0.09, - "learning_rate": 0.0002859770648450388, - "loss": 0.0301, + "epoch": 0.05, + "learning_rate": 0.000292795135063676, + "loss": 0.0386, "step": 18530 }, { - "epoch": 0.09, - "learning_rate": 0.00028596949715202486, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.0002927912468473045, + "loss": 0.0385, "step": 18540 }, { - "epoch": 0.09, - "learning_rate": 0.00028596192945901084, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002927873586309331, + "loss": 0.0315, "step": 18550 }, { - "epoch": 0.09, - "learning_rate": 0.0002859543617659968, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.0002927834704145616, + "loss": 0.0384, "step": 18560 }, { - "epoch": 0.09, - "learning_rate": 0.0002859467940729828, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.00029277958219819017, + "loss": 0.0458, "step": 18570 }, { - "epoch": 0.09, - "learning_rate": 0.0002859392263799688, - "loss": 0.0351, + "epoch": 0.05, + "learning_rate": 0.0002927756939818187, + "loss": 0.0447, "step": 18580 }, { - "epoch": 0.09, - "learning_rate": 0.00028593165868695476, - "loss": 0.0335, + "epoch": 0.05, + "learning_rate": 0.0002927718057654472, + "loss": 0.0349, "step": 18590 }, { - "epoch": 0.09, - "learning_rate": 0.00028592409099394074, - "loss": 0.0335, + "epoch": 0.05, + "learning_rate": 0.0002927679175490757, + "loss": 0.0387, "step": 18600 }, { - "epoch": 0.09, - "learning_rate": 0.0002859165233009268, - "loss": 0.0265, + "epoch": 0.05, + "learning_rate": 0.0002927640293327043, + "loss": 0.0364, "step": 18610 }, { - "epoch": 0.09, - "learning_rate": 0.00028590895560791276, - "loss": 0.0344, + "epoch": 0.05, + "learning_rate": 0.00029276014111633285, + "loss": 0.044, "step": 18620 }, { - "epoch": 0.09, - "learning_rate": 0.00028590138791489874, - "loss": 0.0333, + "epoch": 0.05, + "learning_rate": 0.00029275625289996136, + "loss": 0.046, "step": 18630 }, { - "epoch": 0.09, - "learning_rate": 0.0002858938202218847, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.0002927523646835899, + "loss": 0.0397, "step": 18640 }, { - "epoch": 0.09, - "learning_rate": 0.0002858862525288707, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002927484764672184, + "loss": 0.0341, "step": 18650 }, { - "epoch": 0.09, - "learning_rate": 0.0002858786848358567, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029274458825084696, + "loss": 0.0383, "step": 18660 }, { - "epoch": 0.09, - "learning_rate": 0.0002858711171428427, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.0002927407000344755, + "loss": 0.0353, "step": 18670 }, { - "epoch": 0.09, - "learning_rate": 0.0002858635494498287, - "loss": 0.0381, + "epoch": 0.05, + "learning_rate": 0.00029273681181810404, + "loss": 0.0344, "step": 18680 }, { - "epoch": 0.09, - "learning_rate": 0.0002858559817568147, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029273292360173256, + "loss": 0.0338, "step": 18690 }, { - "epoch": 0.09, - "learning_rate": 0.00028584841406380067, - "loss": 0.0364, + "epoch": 0.05, + "learning_rate": 0.0002927290353853611, + "loss": 0.0347, "step": 18700 }, { - "epoch": 0.09, - "learning_rate": 0.00028584084637078665, - "loss": 0.034, + "epoch": 0.05, + "learning_rate": 0.00029272514716898964, + "loss": 0.0395, "step": 18710 }, { - "epoch": 0.09, - "learning_rate": 0.00028583327867777263, - "loss": 0.0288, + "epoch": 0.05, + "learning_rate": 0.00029272125895261816, + "loss": 0.0338, "step": 18720 }, { - "epoch": 0.09, - "learning_rate": 0.0002858257109847586, - "loss": 0.0339, + "epoch": 0.05, + "learning_rate": 0.00029271737073624667, + "loss": 0.0386, "step": 18730 }, { - "epoch": 0.09, - "learning_rate": 0.00028581814329174465, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.00029271348251987524, + "loss": 0.0397, "step": 18740 }, { - "epoch": 0.09, - "learning_rate": 0.00028581057559873063, - "loss": 0.0273, + "epoch": 0.05, + "learning_rate": 0.00029270959430350375, + "loss": 0.0413, "step": 18750 }, { - "epoch": 0.09, - "learning_rate": 0.0002858030079057166, - "loss": 0.0301, + "epoch": 0.05, + "learning_rate": 0.0002927057060871323, + "loss": 0.0482, "step": 18760 }, { - "epoch": 0.09, - "learning_rate": 0.0002857954402127026, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.00029270181787076084, + "loss": 0.0363, "step": 18770 }, { - "epoch": 0.09, - "learning_rate": 0.00028578787251968857, - "loss": 0.0278, + "epoch": 0.05, + "learning_rate": 0.0002926979296543894, + "loss": 0.0381, "step": 18780 }, { - "epoch": 0.09, - "learning_rate": 0.00028578030482667455, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.0002926940414380179, + "loss": 0.0376, "step": 18790 }, { - "epoch": 0.09, - "learning_rate": 0.0002857727371336606, - "loss": 0.0293, + "epoch": 0.05, + "learning_rate": 0.00029269015322164643, + "loss": 0.0393, "step": 18800 }, { - "epoch": 0.09, - "learning_rate": 0.00028576516944064657, - "loss": 0.029, + "epoch": 0.05, + "learning_rate": 0.000292686265005275, + "loss": 0.0324, "step": 18810 }, { - "epoch": 0.09, - "learning_rate": 0.00028575760174763255, - "loss": 0.0273, + "epoch": 0.05, + "learning_rate": 0.0002926823767889035, + "loss": 0.0359, "step": 18820 }, { - "epoch": 0.09, - "learning_rate": 0.00028575003405461853, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.0002926784885725321, + "loss": 0.046, "step": 18830 }, { - "epoch": 0.1, - "learning_rate": 0.0002857424663616045, - "loss": 0.0345, + "epoch": 0.05, + "learning_rate": 0.0002926746003561606, + "loss": 0.031, "step": 18840 }, { - "epoch": 0.1, - "learning_rate": 0.0002857348986685905, - "loss": 0.0305, + "epoch": 0.05, + "learning_rate": 0.0002926707121397891, + "loss": 0.0393, "step": 18850 }, { - "epoch": 0.1, - "learning_rate": 0.00028572733097557653, - "loss": 0.0274, + "epoch": 0.05, + "learning_rate": 0.00029266682392341763, + "loss": 0.038, "step": 18860 }, { - "epoch": 0.1, - "learning_rate": 0.0002857197632825625, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.0002926629357070462, + "loss": 0.0311, "step": 18870 }, { - "epoch": 0.1, - "learning_rate": 0.0002857121955895485, - "loss": 0.0284, + "epoch": 0.05, + "learning_rate": 0.0002926590474906747, + "loss": 0.0413, "step": 18880 }, { - "epoch": 0.1, - "learning_rate": 0.0002857046278965345, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.0002926551592743033, + "loss": 0.0423, "step": 18890 }, { - "epoch": 0.1, - "learning_rate": 0.00028569706020352046, - "loss": 0.0354, + "epoch": 0.05, + "learning_rate": 0.0002926512710579318, + "loss": 0.0406, "step": 18900 }, { - "epoch": 0.1, - "learning_rate": 0.00028568949251050644, - "loss": 0.0368, + "epoch": 0.05, + "learning_rate": 0.00029264738284156037, + "loss": 0.0479, "step": 18910 }, { - "epoch": 0.1, - "learning_rate": 0.0002856819248174924, - "loss": 0.0355, + "epoch": 0.05, + "learning_rate": 0.0002926434946251889, + "loss": 0.0387, "step": 18920 }, { - "epoch": 0.1, - "learning_rate": 0.00028567435712447846, - "loss": 0.0382, + "epoch": 0.05, + "learning_rate": 0.0002926396064088174, + "loss": 0.0344, "step": 18930 }, { - "epoch": 0.1, - "learning_rate": 0.00028566678943146444, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.0002926357181924459, + "loss": 0.04, "step": 18940 }, { - "epoch": 0.1, - "learning_rate": 0.0002856592217384504, - "loss": 0.0295, + "epoch": 0.05, + "learning_rate": 0.0002926318299760745, + "loss": 0.0335, "step": 18950 }, { - "epoch": 0.1, - "learning_rate": 0.0002856516540454364, - "loss": 0.0314, + "epoch": 0.05, + "learning_rate": 0.00029262794175970305, + "loss": 0.0378, "step": 18960 }, { - "epoch": 0.1, - "learning_rate": 0.0002856440863524224, - "loss": 0.033, + "epoch": 0.05, + "learning_rate": 0.00029262405354333156, + "loss": 0.0347, "step": 18970 }, { - "epoch": 0.1, - "learning_rate": 0.00028563651865940836, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.0002926201653269601, + "loss": 0.0339, "step": 18980 }, { - "epoch": 0.1, - "learning_rate": 0.0002856289509663944, - "loss": 0.0315, + "epoch": 0.05, + "learning_rate": 0.00029261627711058864, + "loss": 0.0417, "step": 18990 }, { - "epoch": 0.1, - "learning_rate": 0.0002856213832733804, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.00029261238889421716, + "loss": 0.0385, "step": 19000 }, { - "epoch": 0.1, - "eval_cer": 0.9144974269946735, - "eval_loss": 0.022285686805844307, - "eval_runtime": 117.4593, - "eval_samples_per_second": 17.027, - "eval_steps_per_second": 4.257, + "epoch": 0.05, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.029142551124095917, + "eval_runtime": 107.6868, + "eval_samples_per_second": 18.572, + "eval_steps_per_second": 4.643, "step": 19000 }, { - "epoch": 0.1, - "learning_rate": 0.00028561381558036636, - "loss": 0.0299, + "epoch": 0.05, + "learning_rate": 0.0002926085006778457, + "loss": 0.036, "step": 19010 }, { - "epoch": 0.1, - "learning_rate": 0.00028560624788735234, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029260461246147424, + "loss": 0.0359, "step": 19020 }, { - "epoch": 0.1, - "learning_rate": 0.0002855986801943383, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.00029260072424510276, + "loss": 0.0389, "step": 19030 }, { - "epoch": 0.1, - "learning_rate": 0.0002855911125013243, - "loss": 0.0314, + "epoch": 0.05, + "learning_rate": 0.0002925968360287313, + "loss": 0.0376, "step": 19040 }, { - "epoch": 0.1, - "learning_rate": 0.00028558354480831034, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.00029259294781235984, + "loss": 0.0375, "step": 19050 }, { - "epoch": 0.1, - "learning_rate": 0.0002855759771152963, - "loss": 0.0323, + "epoch": 0.05, + "learning_rate": 0.00029258905959598835, + "loss": 0.0498, "step": 19060 }, { - "epoch": 0.1, - "learning_rate": 0.0002855684094222823, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.0002925851713796169, + "loss": 0.0429, "step": 19070 }, { - "epoch": 0.1, - "learning_rate": 0.0002855608417292683, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.00029258128316324544, + "loss": 0.0424, "step": 19080 }, { - "epoch": 0.1, - "learning_rate": 0.00028555327403625427, - "loss": 0.0276, + "epoch": 0.05, + "learning_rate": 0.00029257739494687395, + "loss": 0.037, "step": 19090 }, { - "epoch": 0.1, - "learning_rate": 0.00028554570634324025, - "loss": 0.0284, + "epoch": 0.05, + "learning_rate": 0.0002925735067305025, + "loss": 0.0332, "step": 19100 }, { - "epoch": 0.1, - "learning_rate": 0.00028553813865022623, - "loss": 0.0268, + "epoch": 0.05, + "learning_rate": 0.00029256961851413104, + "loss": 0.0364, "step": 19110 }, { - "epoch": 0.1, - "learning_rate": 0.00028553057095721227, - "loss": 0.0259, + "epoch": 0.05, + "learning_rate": 0.0002925657302977596, + "loss": 0.0383, "step": 19120 }, { - "epoch": 0.1, - "learning_rate": 0.00028552300326419825, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002925618420813881, + "loss": 0.0387, "step": 19130 }, { - "epoch": 0.1, - "learning_rate": 0.00028551543557118423, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.00029255795386501663, + "loss": 0.0358, "step": 19140 }, { - "epoch": 0.1, - "learning_rate": 0.0002855078678781702, - "loss": 0.0296, + "epoch": 0.05, + "learning_rate": 0.00029255406564864515, + "loss": 0.0325, "step": 19150 }, { - "epoch": 0.1, - "learning_rate": 0.0002855003001851562, - "loss": 0.028, + "epoch": 0.05, + "learning_rate": 0.0002925501774322737, + "loss": 0.0372, "step": 19160 }, { - "epoch": 0.1, - "learning_rate": 0.0002854927324921422, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.0002925462892159023, + "loss": 0.0343, "step": 19170 }, { - "epoch": 0.1, - "learning_rate": 0.0002854851647991282, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.0002925424009995308, + "loss": 0.0406, "step": 19180 }, { - "epoch": 0.1, - "learning_rate": 0.0002854775971061142, - "loss": 0.0261, + "epoch": 0.05, + "learning_rate": 0.0002925385127831593, + "loss": 0.0339, "step": 19190 }, { - "epoch": 0.1, - "learning_rate": 0.00028547002941310017, - "loss": 0.03, + "epoch": 0.05, + "learning_rate": 0.0002925346245667879, + "loss": 0.0362, "step": 19200 }, { - "epoch": 0.1, - "learning_rate": 0.00028546246172008615, - "loss": 0.035, + "epoch": 0.05, + "learning_rate": 0.0002925307363504164, + "loss": 0.0328, "step": 19210 }, { - "epoch": 0.1, - "learning_rate": 0.00028545489402707214, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.0002925268481340449, + "loss": 0.0357, "step": 19220 }, { - "epoch": 0.1, - "learning_rate": 0.0002854473263340581, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.0002925229599176735, + "loss": 0.039, "step": 19230 }, { - "epoch": 0.1, - "learning_rate": 0.0002854397586410441, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.000292519071701302, + "loss": 0.034, "step": 19240 }, { - "epoch": 0.1, - "learning_rate": 0.00028543219094803013, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.00029251518348493056, + "loss": 0.038, "step": 19250 }, { - "epoch": 0.1, - "learning_rate": 0.0002854246232550161, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.0002925112952685591, + "loss": 0.0394, "step": 19260 }, { - "epoch": 0.1, - "learning_rate": 0.0002854170555620021, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.0002925074070521876, + "loss": 0.0395, "step": 19270 }, { - "epoch": 0.1, - "learning_rate": 0.0002854094878689881, - "loss": 0.0278, + "epoch": 0.05, + "learning_rate": 0.00029250351883581616, + "loss": 0.0424, "step": 19280 }, { - "epoch": 0.1, - "learning_rate": 0.00028540192017597406, - "loss": 0.0338, + "epoch": 0.05, + "learning_rate": 0.0002924996306194447, + "loss": 0.0424, "step": 19290 }, { - "epoch": 0.1, - "learning_rate": 0.00028539435248296004, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.00029249574240307325, + "loss": 0.0358, "step": 19300 }, { - "epoch": 0.1, - "learning_rate": 0.0002853867847899461, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.00029249185418670176, + "loss": 0.0376, "step": 19310 }, { - "epoch": 0.1, - "learning_rate": 0.00028537921709693206, - "loss": 0.0334, + "epoch": 0.05, + "learning_rate": 0.00029248796597033033, + "loss": 0.04, "step": 19320 }, { - "epoch": 0.1, - "learning_rate": 0.00028537164940391804, - "loss": 0.0312, + "epoch": 0.05, + "learning_rate": 0.00029248407775395884, + "loss": 0.0369, "step": 19330 }, { - "epoch": 0.1, - "learning_rate": 0.000285364081710904, - "loss": 0.03, + "epoch": 0.05, + "learning_rate": 0.00029248018953758736, + "loss": 0.0406, "step": 19340 }, { - "epoch": 0.1, - "learning_rate": 0.00028535651401789, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.00029247630132121587, + "loss": 0.0377, "step": 19350 }, { - "epoch": 0.1, - "learning_rate": 0.000285348946324876, - "loss": 0.027, + "epoch": 0.05, + "learning_rate": 0.00029247241310484444, + "loss": 0.0438, "step": 19360 }, { - "epoch": 0.1, - "learning_rate": 0.000285341378631862, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.00029246852488847296, + "loss": 0.0387, "step": 19370 }, { - "epoch": 0.1, - "learning_rate": 0.000285333810938848, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.0002924646366721015, + "loss": 0.0425, "step": 19380 }, { - "epoch": 0.1, - "learning_rate": 0.000285326243245834, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029246074845573004, + "loss": 0.0359, "step": 19390 }, { - "epoch": 0.1, - "learning_rate": 0.00028531867555281996, - "loss": 0.0293, + "epoch": 0.05, + "learning_rate": 0.00029245686023935855, + "loss": 0.041, "step": 19400 }, { - "epoch": 0.1, - "learning_rate": 0.00028531110785980595, - "loss": 0.0271, + "epoch": 0.05, + "learning_rate": 0.0002924529720229871, + "loss": 0.0454, "step": 19410 }, { - "epoch": 0.1, - "learning_rate": 0.0002853035401667919, - "loss": 0.0244, + "epoch": 0.05, + "learning_rate": 0.00029244908380661564, + "loss": 0.0362, "step": 19420 }, { - "epoch": 0.1, - "learning_rate": 0.0002852959724737779, - "loss": 0.026, + "epoch": 0.05, + "learning_rate": 0.00029244519559024415, + "loss": 0.0341, "step": 19430 }, { - "epoch": 0.1, - "learning_rate": 0.00028528840478076394, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002924413073738727, + "loss": 0.0332, "step": 19440 }, { - "epoch": 0.1, - "learning_rate": 0.0002852808370877499, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.0002924374191575013, + "loss": 0.0405, "step": 19450 }, { - "epoch": 0.1, - "learning_rate": 0.0002852732693947359, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.0002924335309411298, + "loss": 0.0355, "step": 19460 }, { - "epoch": 0.1, - "learning_rate": 0.0002852657017017219, - "loss": 0.027, + "epoch": 0.05, + "learning_rate": 0.0002924296427247583, + "loss": 0.0296, "step": 19470 }, { - "epoch": 0.1, - "learning_rate": 0.00028525813400870787, - "loss": 0.0247, + "epoch": 0.05, + "learning_rate": 0.00029242575450838683, + "loss": 0.0384, "step": 19480 }, { - "epoch": 0.1, - "learning_rate": 0.00028525056631569385, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002924218662920154, + "loss": 0.0378, "step": 19490 }, { - "epoch": 0.1, - "learning_rate": 0.00028524299862267983, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.0002924179780756439, + "loss": 0.0392, "step": 19500 }, { - "epoch": 0.1, - "learning_rate": 0.0002852354309296658, - "loss": 0.0279, + "epoch": 0.05, + "learning_rate": 0.0002924140898592725, + "loss": 0.0311, "step": 19510 }, { - "epoch": 0.1, - "learning_rate": 0.0002852278632366518, - "loss": 0.0299, + "epoch": 0.05, + "learning_rate": 0.000292410201642901, + "loss": 0.0342, "step": 19520 }, { - "epoch": 0.1, - "learning_rate": 0.0002852202955436378, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.00029240631342652957, + "loss": 0.0401, "step": 19530 }, { - "epoch": 0.1, - "learning_rate": 0.0002852127278506238, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.0002924024252101581, + "loss": 0.0394, "step": 19540 }, { - "epoch": 0.1, - "learning_rate": 0.0002852051601576098, - "loss": 0.0305, + "epoch": 0.05, + "learning_rate": 0.0002923985369937866, + "loss": 0.0366, "step": 19550 }, { - "epoch": 0.1, - "learning_rate": 0.0002851975924645958, - "loss": 0.027, + "epoch": 0.05, + "learning_rate": 0.0002923946487774151, + "loss": 0.0411, "step": 19560 }, { - "epoch": 0.1, - "learning_rate": 0.00028519002477158176, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002923907605610437, + "loss": 0.0353, "step": 19570 }, { - "epoch": 0.1, - "learning_rate": 0.00028518245707856774, - "loss": 0.028, + "epoch": 0.05, + "learning_rate": 0.0002923868723446722, + "loss": 0.0408, "step": 19580 }, { - "epoch": 0.1, - "learning_rate": 0.0002851748893855537, - "loss": 0.028, + "epoch": 0.05, + "learning_rate": 0.00029238298412830076, + "loss": 0.0447, "step": 19590 }, { - "epoch": 0.1, - "learning_rate": 0.00028516732169253976, - "loss": 0.032, + "epoch": 0.05, + "learning_rate": 0.0002923790959119293, + "loss": 0.0373, "step": 19600 }, { - "epoch": 0.1, - "learning_rate": 0.00028515975399952574, - "loss": 0.0251, + "epoch": 0.05, + "learning_rate": 0.0002923752076955578, + "loss": 0.032, "step": 19610 }, { - "epoch": 0.1, - "learning_rate": 0.0002851521863065117, - "loss": 0.0283, + "epoch": 0.05, + "learning_rate": 0.00029237131947918636, + "loss": 0.0355, "step": 19620 }, { - "epoch": 0.1, - "learning_rate": 0.0002851446186134977, - "loss": 0.0369, + "epoch": 0.05, + "learning_rate": 0.0002923674312628149, + "loss": 0.0375, "step": 19630 }, { - "epoch": 0.1, - "learning_rate": 0.0002851370509204837, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.0002923635430464434, + "loss": 0.0339, "step": 19640 }, { - "epoch": 0.1, - "learning_rate": 0.00028512948322746966, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.00029235965483007196, + "loss": 0.0431, "step": 19650 }, { - "epoch": 0.1, - "learning_rate": 0.00028512191553445564, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.00029235576661370053, + "loss": 0.0312, "step": 19660 }, { - "epoch": 0.1, - "learning_rate": 0.0002851143478414417, - "loss": 0.0365, + "epoch": 0.05, + "learning_rate": 0.00029235187839732904, + "loss": 0.0346, "step": 19670 }, { - "epoch": 0.1, - "learning_rate": 0.00028510678014842766, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.00029234799018095756, + "loss": 0.0363, "step": 19680 }, { - "epoch": 0.1, - "learning_rate": 0.00028509921245541364, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.00029234410196458607, + "loss": 0.0366, "step": 19690 }, { - "epoch": 0.1, - "learning_rate": 0.0002850916447623996, - "loss": 0.0279, + "epoch": 0.05, + "learning_rate": 0.00029234021374821464, + "loss": 0.0367, "step": 19700 }, { - "epoch": 0.1, - "learning_rate": 0.0002850840770693856, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.00029233632553184315, + "loss": 0.0355, "step": 19710 }, { - "epoch": 0.1, - "learning_rate": 0.0002850765093763716, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.0002923324373154717, + "loss": 0.0321, "step": 19720 }, { - "epoch": 0.1, - "learning_rate": 0.0002850689416833576, - "loss": 0.0246, + "epoch": 0.05, + "learning_rate": 0.00029232854909910024, + "loss": 0.0383, "step": 19730 }, { - "epoch": 0.1, - "learning_rate": 0.0002850613739903436, - "loss": 0.0289, + "epoch": 0.05, + "learning_rate": 0.0002923246608827288, + "loss": 0.0398, "step": 19740 }, { - "epoch": 0.1, - "learning_rate": 0.0002850538062973296, - "loss": 0.0257, + "epoch": 0.05, + "learning_rate": 0.0002923207726663573, + "loss": 0.0384, "step": 19750 }, { - "epoch": 0.1, - "learning_rate": 0.00028504623860431557, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.00029231688444998584, + "loss": 0.0381, "step": 19760 }, { - "epoch": 0.1, - "learning_rate": 0.00028503867091130155, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029231299623361435, + "loss": 0.0394, "step": 19770 }, { - "epoch": 0.1, - "learning_rate": 0.00028503110321828753, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.0002923091080172429, + "loss": 0.0432, "step": 19780 }, { - "epoch": 0.1, - "learning_rate": 0.00028502353552527357, - "loss": 0.0287, + "epoch": 0.05, + "learning_rate": 0.00029230521980087143, + "loss": 0.0381, "step": 19790 }, { - "epoch": 0.1, - "learning_rate": 0.00028501596783225955, - "loss": 0.0239, + "epoch": 0.05, + "learning_rate": 0.0002923013315845, + "loss": 0.038, "step": 19800 }, { - "epoch": 0.1, - "learning_rate": 0.00028500840013924553, - "loss": 0.0271, + "epoch": 0.05, + "learning_rate": 0.0002922974433681285, + "loss": 0.0418, "step": 19810 }, { - "epoch": 0.1, - "learning_rate": 0.0002850008324462315, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.0002922935551517571, + "loss": 0.032, "step": 19820 }, { - "epoch": 0.1, - "learning_rate": 0.0002849932647532175, - "loss": 0.0273, + "epoch": 0.05, + "learning_rate": 0.0002922896669353856, + "loss": 0.041, "step": 19830 }, { - "epoch": 0.1, - "learning_rate": 0.0002849856970602035, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.0002922857787190141, + "loss": 0.0354, "step": 19840 }, { - "epoch": 0.1, - "learning_rate": 0.00028497812936718945, - "loss": 0.0265, + "epoch": 0.05, + "learning_rate": 0.0002922818905026427, + "loss": 0.0404, "step": 19850 }, { - "epoch": 0.1, - "learning_rate": 0.0002849705616741755, - "loss": 0.0284, + "epoch": 0.05, + "learning_rate": 0.0002922780022862712, + "loss": 0.0393, "step": 19860 }, { - "epoch": 0.1, - "learning_rate": 0.00028496299398116147, - "loss": 0.0309, - "step": 19870 + "epoch": 0.05, + "learning_rate": 0.00029227411406989977, + "loss": 0.0415, + "step": 19870 }, { - "epoch": 0.1, - "learning_rate": 0.00028495542628814745, - "loss": 0.0278, + "epoch": 0.05, + "learning_rate": 0.0002922702258535283, + "loss": 0.0352, "step": 19880 }, { - "epoch": 0.1, - "learning_rate": 0.00028494785859513343, - "loss": 0.0259, + "epoch": 0.05, + "learning_rate": 0.0002922663376371568, + "loss": 0.0356, "step": 19890 }, { - "epoch": 0.1, - "learning_rate": 0.0002849402909021194, - "loss": 0.0321, + "epoch": 0.05, + "learning_rate": 0.0002922624494207853, + "loss": 0.0384, "step": 19900 }, { - "epoch": 0.1, - "learning_rate": 0.0002849327232091054, - "loss": 0.0266, + "epoch": 0.05, + "learning_rate": 0.0002922585612044139, + "loss": 0.0385, "step": 19910 }, { - "epoch": 0.1, - "learning_rate": 0.00028492515551609143, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.0002922546729880424, + "loss": 0.0382, "step": 19920 }, { - "epoch": 0.1, - "learning_rate": 0.0002849175878230774, - "loss": 0.0257, + "epoch": 0.05, + "learning_rate": 0.00029225078477167096, + "loss": 0.0401, "step": 19930 }, { - "epoch": 0.1, - "learning_rate": 0.0002849100201300634, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.0002922468965552995, + "loss": 0.0401, "step": 19940 }, { - "epoch": 0.1, - "learning_rate": 0.0002849024524370494, - "loss": 0.0253, + "epoch": 0.05, + "learning_rate": 0.00029224300833892805, + "loss": 0.0317, "step": 19950 }, { - "epoch": 0.1, - "learning_rate": 0.00028489488474403536, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029223912012255656, + "loss": 0.0323, "step": 19960 }, { - "epoch": 0.1, - "learning_rate": 0.00028488731705102134, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002922352319061851, + "loss": 0.0318, "step": 19970 }, { - "epoch": 0.1, - "learning_rate": 0.0002848797493580073, - "loss": 0.0314, + "epoch": 0.05, + "learning_rate": 0.0002922313436898136, + "loss": 0.0376, "step": 19980 }, { - "epoch": 0.1, - "learning_rate": 0.00028487218166499336, - "loss": 0.0295, + "epoch": 0.05, + "learning_rate": 0.00029222745547344216, + "loss": 0.0419, "step": 19990 }, { - "epoch": 0.1, - "learning_rate": 0.00028486461397197934, - "loss": 0.0302, + "epoch": 0.05, + "learning_rate": 0.0002922235672570707, + "loss": 0.0358, "step": 20000 }, { - "epoch": 0.1, - "eval_cer": 0.9145546803660722, - "eval_loss": 0.023069359362125397, - "eval_runtime": 117.5456, - "eval_samples_per_second": 17.015, - "eval_steps_per_second": 4.254, + "epoch": 0.05, + "eval_cer": 0.8818160569148363, + "eval_loss": 0.02738848887383938, + "eval_runtime": 107.5768, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, "step": 20000 }, { - "epoch": 0.1, - "learning_rate": 0.0002848570462789653, - "loss": 0.0283, + "epoch": 0.05, + "learning_rate": 0.00029221967904069924, + "loss": 0.036, "step": 20010 }, { - "epoch": 0.1, - "learning_rate": 0.0002848494785859513, - "loss": 0.0321, + "epoch": 0.05, + "learning_rate": 0.00029221579082432776, + "loss": 0.0371, "step": 20020 }, { - "epoch": 0.1, - "learning_rate": 0.0002848419108929373, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.0002922119026079563, + "loss": 0.0364, "step": 20030 }, { - "epoch": 0.1, - "learning_rate": 0.00028483434319992326, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.00029220801439158484, + "loss": 0.0379, "step": 20040 }, { - "epoch": 0.1, - "learning_rate": 0.0002848267755069093, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029220412617521335, + "loss": 0.0432, "step": 20050 }, { - "epoch": 0.1, - "learning_rate": 0.0002848192078138953, - "loss": 0.0305, + "epoch": 0.05, + "learning_rate": 0.0002922002379588419, + "loss": 0.0375, "step": 20060 }, { - "epoch": 0.1, - "learning_rate": 0.00028481164012088126, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029219634974247044, + "loss": 0.0394, "step": 20070 }, { - "epoch": 0.1, - "learning_rate": 0.00028480407242786724, - "loss": 0.0331, + "epoch": 0.05, + "learning_rate": 0.000292192461526099, + "loss": 0.0357, "step": 20080 }, { - "epoch": 0.1, - "learning_rate": 0.0002847965047348532, - "loss": 0.0245, + "epoch": 0.05, + "learning_rate": 0.0002921885733097275, + "loss": 0.035, "step": 20090 }, { - "epoch": 0.1, - "learning_rate": 0.0002847889370418392, - "loss": 0.0304, + "epoch": 0.05, + "learning_rate": 0.00029218468509335603, + "loss": 0.0332, "step": 20100 }, { - "epoch": 0.1, - "learning_rate": 0.00028478136934882524, - "loss": 0.0276, + "epoch": 0.05, + "learning_rate": 0.00029218079687698455, + "loss": 0.0375, "step": 20110 }, { - "epoch": 0.1, - "learning_rate": 0.0002847738016558112, - "loss": 0.023, + "epoch": 0.05, + "learning_rate": 0.0002921769086606131, + "loss": 0.0356, "step": 20120 }, { - "epoch": 0.1, - "learning_rate": 0.0002847662339627972, - "loss": 0.0354, + "epoch": 0.05, + "learning_rate": 0.00029217302044424163, + "loss": 0.0443, "step": 20130 }, { - "epoch": 0.1, - "learning_rate": 0.0002847586662697832, - "loss": 0.0302, + "epoch": 0.05, + "learning_rate": 0.0002921691322278702, + "loss": 0.0335, "step": 20140 }, { - "epoch": 0.1, - "learning_rate": 0.00028475109857676917, - "loss": 0.0276, + "epoch": 0.05, + "learning_rate": 0.0002921652440114987, + "loss": 0.0362, "step": 20150 }, { - "epoch": 0.1, - "learning_rate": 0.00028474353088375515, - "loss": 0.0319, + "epoch": 0.05, + "learning_rate": 0.0002921613557951273, + "loss": 0.0331, "step": 20160 }, { - "epoch": 0.1, - "learning_rate": 0.00028473596319074113, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.0002921574675787558, + "loss": 0.0386, "step": 20170 }, { - "epoch": 0.1, - "learning_rate": 0.00028472839549772717, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.0002921535793623843, + "loss": 0.0313, "step": 20180 }, { - "epoch": 0.1, - "learning_rate": 0.00028472082780471315, - "loss": 0.0325, + "epoch": 0.05, + "learning_rate": 0.00029214969114601283, + "loss": 0.0334, "step": 20190 }, { - "epoch": 0.1, - "learning_rate": 0.00028471326011169913, - "loss": 0.0266, + "epoch": 0.05, + "learning_rate": 0.0002921458029296414, + "loss": 0.0349, "step": 20200 }, { - "epoch": 0.1, - "learning_rate": 0.0002847056924186851, - "loss": 0.0299, + "epoch": 0.05, + "learning_rate": 0.00029214191471326997, + "loss": 0.0351, "step": 20210 }, { - "epoch": 0.1, - "learning_rate": 0.0002846981247256711, - "loss": 0.032, + "epoch": 0.05, + "learning_rate": 0.0002921380264968985, + "loss": 0.0357, "step": 20220 }, { - "epoch": 0.1, - "learning_rate": 0.0002846905570326571, - "loss": 0.0276, + "epoch": 0.05, + "learning_rate": 0.000292134138280527, + "loss": 0.038, "step": 20230 }, { - "epoch": 0.1, - "learning_rate": 0.0002846829893396431, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.00029213025006415556, + "loss": 0.0314, "step": 20240 }, { - "epoch": 0.1, - "learning_rate": 0.0002846754216466291, - "loss": 0.034, + "epoch": 0.05, + "learning_rate": 0.0002921263618477841, + "loss": 0.0363, "step": 20250 }, { - "epoch": 0.1, - "learning_rate": 0.0002846678539536151, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.0002921224736314126, + "loss": 0.0361, "step": 20260 }, { - "epoch": 0.1, - "learning_rate": 0.00028466028626060105, - "loss": 0.0356, + "epoch": 0.05, + "learning_rate": 0.00029211858541504116, + "loss": 0.0419, "step": 20270 }, { - "epoch": 0.1, - "learning_rate": 0.00028465271856758704, - "loss": 0.0342, + "epoch": 0.05, + "learning_rate": 0.0002921146971986697, + "loss": 0.0312, "step": 20280 }, { - "epoch": 0.1, - "learning_rate": 0.000284645150874573, - "loss": 0.0367, + "epoch": 0.05, + "learning_rate": 0.00029211080898229824, + "loss": 0.0302, "step": 20290 }, { - "epoch": 0.1, - "learning_rate": 0.000284637583181559, - "loss": 0.0308, + "epoch": 0.05, + "learning_rate": 0.00029210692076592676, + "loss": 0.0352, "step": 20300 }, { - "epoch": 0.1, - "learning_rate": 0.00028463001548854503, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.0002921030325495553, + "loss": 0.0471, "step": 20310 }, { - "epoch": 0.1, - "learning_rate": 0.000284622447795531, - "loss": 0.0264, + "epoch": 0.05, + "learning_rate": 0.00029209914433318384, + "loss": 0.037, "step": 20320 }, { - "epoch": 0.1, - "learning_rate": 0.000284614880102517, - "loss": 0.0355, + "epoch": 0.05, + "learning_rate": 0.00029209525611681236, + "loss": 0.0398, "step": 20330 }, { - "epoch": 0.1, - "learning_rate": 0.000284607312409503, - "loss": 0.0305, + "epoch": 0.05, + "learning_rate": 0.00029209136790044087, + "loss": 0.0348, "step": 20340 }, { - "epoch": 0.1, - "learning_rate": 0.00028459974471648896, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.00029208747968406944, + "loss": 0.037, "step": 20350 }, { - "epoch": 0.1, - "learning_rate": 0.00028459217702347494, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.00029208359146769795, + "loss": 0.0348, "step": 20360 }, { - "epoch": 0.1, - "learning_rate": 0.000284584609330461, - "loss": 0.0418, + "epoch": 0.05, + "learning_rate": 0.0002920797032513265, + "loss": 0.0292, "step": 20370 }, { - "epoch": 0.1, - "learning_rate": 0.00028457704163744696, - "loss": 0.0341, + "epoch": 0.05, + "learning_rate": 0.00029207581503495504, + "loss": 0.0399, "step": 20380 }, { - "epoch": 0.1, - "learning_rate": 0.00028456947394443294, - "loss": 0.0329, + "epoch": 0.05, + "learning_rate": 0.00029207192681858355, + "loss": 0.0363, "step": 20390 }, { - "epoch": 0.1, - "learning_rate": 0.0002845619062514189, - "loss": 0.0361, + "epoch": 0.05, + "learning_rate": 0.0002920680386022121, + "loss": 0.0336, "step": 20400 }, { - "epoch": 0.1, - "learning_rate": 0.0002845543385584049, - "loss": 0.0252, + "epoch": 0.05, + "learning_rate": 0.00029206415038584064, + "loss": 0.0371, "step": 20410 }, { - "epoch": 0.1, - "learning_rate": 0.0002845467708653909, - "loss": 0.0322, + "epoch": 0.05, + "learning_rate": 0.0002920602621694692, + "loss": 0.0343, "step": 20420 }, { - "epoch": 0.1, - "learning_rate": 0.0002845392031723769, - "loss": 0.0348, + "epoch": 0.05, + "learning_rate": 0.0002920563739530977, + "loss": 0.0317, "step": 20430 }, { - "epoch": 0.1, - "learning_rate": 0.0002845316354793629, - "loss": 0.0338, + "epoch": 0.05, + "learning_rate": 0.00029205248573672623, + "loss": 0.0344, "step": 20440 }, { - "epoch": 0.1, - "learning_rate": 0.0002845240677863489, - "loss": 0.0335, + "epoch": 0.05, + "learning_rate": 0.0002920485975203548, + "loss": 0.0355, "step": 20450 }, { - "epoch": 0.1, - "learning_rate": 0.00028451650009333486, - "loss": 0.0374, + "epoch": 0.05, + "learning_rate": 0.0002920447093039833, + "loss": 0.0441, "step": 20460 }, { - "epoch": 0.1, - "learning_rate": 0.00028450893240032085, - "loss": 0.0308, + "epoch": 0.05, + "learning_rate": 0.00029204082108761183, + "loss": 0.0342, "step": 20470 }, { - "epoch": 0.1, - "learning_rate": 0.00028450136470730683, - "loss": 0.0306, + "epoch": 0.05, + "learning_rate": 0.0002920369328712404, + "loss": 0.0392, "step": 20480 }, { - "epoch": 0.1, - "learning_rate": 0.0002844937970142928, - "loss": 0.0352, + "epoch": 0.05, + "learning_rate": 0.00029203304465486897, + "loss": 0.0422, "step": 20490 }, { - "epoch": 0.1, - "learning_rate": 0.00028448622932127884, - "loss": 0.0332, + "epoch": 0.05, + "learning_rate": 0.0002920291564384975, + "loss": 0.0379, "step": 20500 }, { - "epoch": 0.1, - "learning_rate": 0.0002844786616282648, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.000292025268222126, + "loss": 0.0329, "step": 20510 }, { - "epoch": 0.1, - "learning_rate": 0.0002844710939352508, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.0002920213800057545, + "loss": 0.0378, "step": 20520 }, { - "epoch": 0.1, - "learning_rate": 0.0002844635262422368, - "loss": 0.0246, + "epoch": 0.05, + "learning_rate": 0.0002920174917893831, + "loss": 0.0337, "step": 20530 }, { - "epoch": 0.1, - "learning_rate": 0.00028445595854922277, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.0002920136035730116, + "loss": 0.0358, "step": 20540 }, { - "epoch": 0.1, - "learning_rate": 0.00028444839085620875, - "loss": 0.0396, + "epoch": 0.05, + "learning_rate": 0.00029200971535664016, + "loss": 0.0352, "step": 20550 }, { - "epoch": 0.1, - "learning_rate": 0.0002844408231631948, - "loss": 0.0393, + "epoch": 0.05, + "learning_rate": 0.0002920058271402687, + "loss": 0.0337, "step": 20560 }, { - "epoch": 0.1, - "learning_rate": 0.00028443325547018077, - "loss": 0.0275, + "epoch": 0.05, + "learning_rate": 0.00029200193892389725, + "loss": 0.0341, "step": 20570 }, { - "epoch": 0.1, - "learning_rate": 0.00028442568777716675, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.00029199805070752576, + "loss": 0.0373, "step": 20580 }, { - "epoch": 0.1, - "learning_rate": 0.00028441812008415273, - "loss": 0.0321, + "epoch": 0.05, + "learning_rate": 0.0002919941624911543, + "loss": 0.0362, "step": 20590 }, { - "epoch": 0.1, - "learning_rate": 0.0002844105523911387, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002919902742747828, + "loss": 0.0505, "step": 20600 }, { - "epoch": 0.1, - "learning_rate": 0.0002844029846981247, - "loss": 0.0265, + "epoch": 0.05, + "learning_rate": 0.00029198638605841136, + "loss": 0.0406, "step": 20610 }, { - "epoch": 0.1, - "learning_rate": 0.00028439541700511073, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.0002919824978420399, + "loss": 0.0346, "step": 20620 }, { - "epoch": 0.1, - "learning_rate": 0.0002843878493120967, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.00029197860962566844, + "loss": 0.0426, "step": 20630 }, { - "epoch": 0.1, - "learning_rate": 0.0002843802816190827, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029197472140929696, + "loss": 0.0356, "step": 20640 }, { - "epoch": 0.1, - "learning_rate": 0.0002843727139260687, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.00029197083319292547, + "loss": 0.039, "step": 20650 }, { - "epoch": 0.1, - "learning_rate": 0.00028436514623305466, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.00029196694497655404, + "loss": 0.0404, "step": 20660 }, { - "epoch": 0.1, - "learning_rate": 0.00028435757854004064, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.00029196305676018256, + "loss": 0.0374, "step": 20670 }, { - "epoch": 0.1, - "learning_rate": 0.0002843500108470266, - "loss": 0.0288, + "epoch": 0.05, + "learning_rate": 0.00029195916854381107, + "loss": 0.0349, "step": 20680 }, { - "epoch": 0.1, - "learning_rate": 0.00028434244315401265, - "loss": 0.026, + "epoch": 0.05, + "learning_rate": 0.00029195528032743964, + "loss": 0.0457, "step": 20690 }, { - "epoch": 0.1, - "learning_rate": 0.00028433487546099864, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002919513921110682, + "loss": 0.0317, "step": 20700 }, { - "epoch": 0.1, - "learning_rate": 0.0002843273077679846, - "loss": 0.027, + "epoch": 0.05, + "learning_rate": 0.0002919475038946967, + "loss": 0.0341, "step": 20710 }, { - "epoch": 0.1, - "learning_rate": 0.0002843197400749706, - "loss": 0.0312, + "epoch": 0.05, + "learning_rate": 0.00029194361567832524, + "loss": 0.0348, "step": 20720 }, { - "epoch": 0.1, - "learning_rate": 0.0002843121723819566, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.00029193972746195375, + "loss": 0.0367, "step": 20730 }, { - "epoch": 0.1, - "learning_rate": 0.00028430460468894256, - "loss": 0.0281, + "epoch": 0.05, + "learning_rate": 0.0002919358392455823, + "loss": 0.0376, "step": 20740 }, { - "epoch": 0.1, - "learning_rate": 0.00028429703699592854, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.00029193195102921083, + "loss": 0.0309, "step": 20750 }, { - "epoch": 0.1, - "learning_rate": 0.0002842894693029145, - "loss": 0.0289, + "epoch": 0.05, + "learning_rate": 0.0002919280628128394, + "loss": 0.0364, "step": 20760 }, { - "epoch": 0.1, - "learning_rate": 0.0002842819016099005, - "loss": 0.0331, + "epoch": 0.05, + "learning_rate": 0.0002919241745964679, + "loss": 0.0367, "step": 20770 }, { - "epoch": 0.1, - "learning_rate": 0.0002842743339168865, - "loss": 0.0302, + "epoch": 0.05, + "learning_rate": 0.0002919202863800965, + "loss": 0.0385, "step": 20780 }, { - "epoch": 0.1, - "learning_rate": 0.0002842667662238725, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.000291916398163725, + "loss": 0.0486, "step": 20790 }, { - "epoch": 0.1, - "learning_rate": 0.0002842591985308585, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.0002919125099473535, + "loss": 0.0373, "step": 20800 }, { - "epoch": 0.1, - "learning_rate": 0.0002842516308378445, - "loss": 0.03, + "epoch": 0.05, + "learning_rate": 0.00029190862173098203, + "loss": 0.0353, "step": 20810 }, { - "epoch": 0.11, - "learning_rate": 0.00028424406314483047, - "loss": 0.0273, + "epoch": 0.05, + "learning_rate": 0.0002919047335146106, + "loss": 0.0388, "step": 20820 }, { - "epoch": 0.11, - "learning_rate": 0.00028423649545181645, - "loss": 0.0302, + "epoch": 0.05, + "learning_rate": 0.0002919008452982391, + "loss": 0.0368, "step": 20830 }, { - "epoch": 0.11, - "learning_rate": 0.00028422892775880243, - "loss": 0.0328, + "epoch": 0.05, + "learning_rate": 0.0002918969570818677, + "loss": 0.0323, "step": 20840 }, { - "epoch": 0.11, - "learning_rate": 0.00028422136006578847, - "loss": 0.0305, + "epoch": 0.05, + "learning_rate": 0.0002918930688654962, + "loss": 0.0404, "step": 20850 }, { - "epoch": 0.11, - "learning_rate": 0.00028421379237277445, - "loss": 0.0309, + "epoch": 0.05, + "learning_rate": 0.0002918891806491247, + "loss": 0.0334, "step": 20860 }, { - "epoch": 0.11, - "learning_rate": 0.00028420622467976043, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002918852924327533, + "loss": 0.0344, "step": 20870 }, { - "epoch": 0.11, - "learning_rate": 0.0002841986569867464, - "loss": 0.0318, + "epoch": 0.05, + "learning_rate": 0.0002918814042163818, + "loss": 0.0366, "step": 20880 }, { - "epoch": 0.11, - "learning_rate": 0.0002841910892937324, - "loss": 0.0358, + "epoch": 0.05, + "learning_rate": 0.00029187751600001036, + "loss": 0.0553, "step": 20890 }, { - "epoch": 0.11, - "learning_rate": 0.0002841835216007184, - "loss": 0.0282, + "epoch": 0.05, + "learning_rate": 0.0002918736277836389, + "loss": 0.0316, "step": 20900 }, { - "epoch": 0.11, - "learning_rate": 0.00028417595390770435, - "loss": 0.0285, + "epoch": 0.05, + "learning_rate": 0.00029186973956726745, + "loss": 0.0348, "step": 20910 }, { - "epoch": 0.11, - "learning_rate": 0.0002841683862146904, - "loss": 0.0371, + "epoch": 0.05, + "learning_rate": 0.00029186585135089596, + "loss": 0.0324, "step": 20920 }, { - "epoch": 0.11, - "learning_rate": 0.00028416081852167637, - "loss": 0.0311, + "epoch": 0.05, + "learning_rate": 0.0002918619631345245, + "loss": 0.0363, "step": 20930 }, { - "epoch": 0.11, - "learning_rate": 0.00028415325082866235, - "loss": 0.0481, + "epoch": 0.05, + "learning_rate": 0.000291858074918153, + "loss": 0.0365, "step": 20940 }, { - "epoch": 0.11, - "learning_rate": 0.00028414568313564833, - "loss": 0.0307, + "epoch": 0.05, + "learning_rate": 0.00029185418670178156, + "loss": 0.0352, "step": 20950 }, { - "epoch": 0.11, - "learning_rate": 0.0002841381154426343, - "loss": 0.031, + "epoch": 0.05, + "learning_rate": 0.0002918502984854101, + "loss": 0.0304, "step": 20960 }, { - "epoch": 0.11, - "learning_rate": 0.0002841305477496203, - "loss": 0.0286, + "epoch": 0.05, + "learning_rate": 0.00029184641026903864, + "loss": 0.0368, "step": 20970 }, { - "epoch": 0.11, - "learning_rate": 0.00028412298005660633, - "loss": 0.03, + "epoch": 0.05, + "learning_rate": 0.00029184252205266716, + "loss": 0.0444, "step": 20980 }, { - "epoch": 0.11, - "learning_rate": 0.0002841154123635923, - "loss": 0.0331, + "epoch": 0.05, + "learning_rate": 0.0002918386338362957, + "loss": 0.0391, "step": 20990 }, { - "epoch": 0.11, - "learning_rate": 0.0002841078446705783, - "loss": 0.0248, + "epoch": 0.05, + "learning_rate": 0.00029183474561992424, + "loss": 0.0391, "step": 21000 }, { - "epoch": 0.11, - "eval_cer": 0.9145119829365546, - "eval_loss": 0.021799687296152115, - "eval_runtime": 117.5088, - "eval_samples_per_second": 17.02, - "eval_steps_per_second": 4.255, + "epoch": 0.05, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.026714030653238297, + "eval_runtime": 107.7623, + "eval_samples_per_second": 18.559, + "eval_steps_per_second": 4.64, "step": 21000 }, { - "epoch": 0.11, - "learning_rate": 0.0002841002769775643, - "loss": 0.0341, + "epoch": 0.05, + "learning_rate": 0.00029183085740355275, + "loss": 0.0367, "step": 21010 }, { - "epoch": 0.11, - "learning_rate": 0.00028409270928455026, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.00029182696918718127, + "loss": 0.0383, "step": 21020 }, { - "epoch": 0.11, - "learning_rate": 0.00028408514159153624, - "loss": 0.0277, + "epoch": 0.05, + "learning_rate": 0.00029182308097080984, + "loss": 0.0365, "step": 21030 }, { - "epoch": 0.11, - "learning_rate": 0.0002840775738985222, - "loss": 0.0317, + "epoch": 0.05, + "learning_rate": 0.0002918191927544384, + "loss": 0.0391, "step": 21040 }, { - "epoch": 0.11, - "learning_rate": 0.00028407000620550826, - "loss": 0.0341, + "epoch": 0.05, + "learning_rate": 0.0002918153045380669, + "loss": 0.0364, "step": 21050 }, { - "epoch": 0.11, - "learning_rate": 0.00028406243851249424, - "loss": 0.0266, + "epoch": 0.05, + "learning_rate": 0.00029181141632169544, + "loss": 0.0309, "step": 21060 }, { - "epoch": 0.11, - "learning_rate": 0.0002840548708194802, - "loss": 0.0294, + "epoch": 0.05, + "learning_rate": 0.000291807528105324, + "loss": 0.0314, "step": 21070 }, { - "epoch": 0.11, - "learning_rate": 0.0002840473031264662, - "loss": 0.0324, + "epoch": 0.05, + "learning_rate": 0.0002918036398889525, + "loss": 0.032, "step": 21080 }, { - "epoch": 0.11, - "learning_rate": 0.0002840397354334522, - "loss": 0.0352, + "epoch": 0.05, + "learning_rate": 0.00029179975167258103, + "loss": 0.0389, "step": 21090 }, { - "epoch": 0.11, - "learning_rate": 0.00028403216774043816, - "loss": 0.0292, + "epoch": 0.05, + "learning_rate": 0.0002917958634562096, + "loss": 0.0424, "step": 21100 }, { - "epoch": 0.11, - "learning_rate": 0.0002840246000474242, - "loss": 0.0342, + "epoch": 0.05, + "learning_rate": 0.0002917919752398381, + "loss": 0.0404, "step": 21110 }, { - "epoch": 0.11, - "learning_rate": 0.0002840170323544102, - "loss": 0.0298, + "epoch": 0.05, + "learning_rate": 0.0002917880870234667, + "loss": 0.0486, "step": 21120 }, { - "epoch": 0.11, - "learning_rate": 0.00028400946466139616, - "loss": 0.0297, + "epoch": 0.05, + "learning_rate": 0.0002917841988070952, + "loss": 0.0334, "step": 21130 }, { - "epoch": 0.11, - "learning_rate": 0.00028400189696838214, - "loss": 0.0291, + "epoch": 0.05, + "learning_rate": 0.0002917803105907237, + "loss": 0.0399, "step": 21140 }, { - "epoch": 0.11, - "learning_rate": 0.0002839943292753681, - "loss": 0.0265, + "epoch": 0.05, + "learning_rate": 0.00029177642237435223, + "loss": 0.0322, "step": 21150 }, { - "epoch": 0.11, - "learning_rate": 0.0002839867615823541, - "loss": 0.0303, + "epoch": 0.05, + "learning_rate": 0.0002917725341579808, + "loss": 0.0335, "step": 21160 }, { - "epoch": 0.11, - "learning_rate": 0.00028397919388934014, - "loss": 0.0283, + "epoch": 0.05, + "learning_rate": 0.0002917686459416093, + "loss": 0.0325, "step": 21170 }, { - "epoch": 0.11, - "learning_rate": 0.0002839716261963261, - "loss": 0.0293, + "epoch": 0.05, + "learning_rate": 0.0002917647577252379, + "loss": 0.0328, "step": 21180 }, { - "epoch": 0.11, - "learning_rate": 0.0002839640585033121, - "loss": 0.0316, + "epoch": 0.05, + "learning_rate": 0.0002917608695088664, + "loss": 0.0362, "step": 21190 }, { - "epoch": 0.11, - "learning_rate": 0.0002839564908102981, - "loss": 0.0332, + "epoch": 0.05, + "learning_rate": 0.00029175698129249496, + "loss": 0.0343, "step": 21200 }, { - "epoch": 0.11, - "learning_rate": 0.00028394892311728407, - "loss": 0.0376, + "epoch": 0.05, + "learning_rate": 0.0002917530930761235, + "loss": 0.0327, "step": 21210 }, { - "epoch": 0.11, - "learning_rate": 0.00028394135542427005, - "loss": 0.0328, + "epoch": 0.06, + "learning_rate": 0.000291749204859752, + "loss": 0.0313, "step": 21220 }, { - "epoch": 0.11, - "learning_rate": 0.00028393378773125603, - "loss": 0.0347, + "epoch": 0.06, + "learning_rate": 0.0002917453166433805, + "loss": 0.0376, "step": 21230 }, { - "epoch": 0.11, - "learning_rate": 0.00028392622003824207, - "loss": 0.0322, + "epoch": 0.06, + "learning_rate": 0.0002917414284270091, + "loss": 0.0405, "step": 21240 }, { - "epoch": 0.11, - "learning_rate": 0.00028391865234522805, - "loss": 0.0329, + "epoch": 0.06, + "learning_rate": 0.00029173754021063765, + "loss": 0.0379, "step": 21250 }, { - "epoch": 0.11, - "learning_rate": 0.00028391108465221403, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.00029173365199426616, + "loss": 0.0343, "step": 21260 }, { - "epoch": 0.11, - "learning_rate": 0.0002839035169592, - "loss": 0.0357, + "epoch": 0.06, + "learning_rate": 0.0002917297637778947, + "loss": 0.0393, "step": 21270 }, { - "epoch": 0.11, - "learning_rate": 0.000283895949266186, - "loss": 0.0267, + "epoch": 0.06, + "learning_rate": 0.00029172587556152324, + "loss": 0.0396, "step": 21280 }, { - "epoch": 0.11, - "learning_rate": 0.000283888381573172, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.00029172198734515176, + "loss": 0.0369, "step": 21290 }, { - "epoch": 0.11, - "learning_rate": 0.000283880813880158, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029171809912878027, + "loss": 0.035, "step": 21300 }, { - "epoch": 0.11, - "learning_rate": 0.000283873246187144, - "loss": 0.0297, + "epoch": 0.06, + "learning_rate": 0.00029171421091240884, + "loss": 0.0367, "step": 21310 }, { - "epoch": 0.11, - "learning_rate": 0.00028386567849413, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.00029171032269603736, + "loss": 0.0353, "step": 21320 }, { - "epoch": 0.11, - "learning_rate": 0.00028385811080111595, - "loss": 0.0247, + "epoch": 0.06, + "learning_rate": 0.0002917064344796659, + "loss": 0.0388, "step": 21330 }, { - "epoch": 0.11, - "learning_rate": 0.00028385054310810194, - "loss": 0.0314, + "epoch": 0.06, + "learning_rate": 0.00029170254626329444, + "loss": 0.0387, "step": 21340 }, { - "epoch": 0.11, - "learning_rate": 0.0002838429754150879, - "loss": 0.0338, + "epoch": 0.06, + "learning_rate": 0.00029169865804692295, + "loss": 0.0492, "step": 21350 }, { - "epoch": 0.11, - "learning_rate": 0.00028383540772207395, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.00029169476983055147, + "loss": 0.0423, "step": 21360 }, { - "epoch": 0.11, - "learning_rate": 0.00028382784002905993, - "loss": 0.0307, + "epoch": 0.06, + "learning_rate": 0.00029169088161418004, + "loss": 0.0462, "step": 21370 }, { - "epoch": 0.11, - "learning_rate": 0.0002838202723360459, - "loss": 0.0314, + "epoch": 0.06, + "learning_rate": 0.00029168699339780855, + "loss": 0.0476, "step": 21380 }, { - "epoch": 0.11, - "learning_rate": 0.0002838127046430319, - "loss": 0.0284, + "epoch": 0.06, + "learning_rate": 0.0002916831051814371, + "loss": 0.0407, "step": 21390 }, { - "epoch": 0.11, - "learning_rate": 0.0002838051369500179, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.00029167921696506563, + "loss": 0.037, "step": 21400 }, { - "epoch": 0.11, - "learning_rate": 0.00028379756925700386, - "loss": 0.0336, + "epoch": 0.06, + "learning_rate": 0.0002916753287486942, + "loss": 0.0374, "step": 21410 }, { - "epoch": 0.11, - "learning_rate": 0.00028379000156398984, - "loss": 0.0312, + "epoch": 0.06, + "learning_rate": 0.0002916714405323227, + "loss": 0.0391, "step": 21420 }, { - "epoch": 0.11, - "learning_rate": 0.0002837824338709759, - "loss": 0.0311, + "epoch": 0.06, + "learning_rate": 0.00029166755231595123, + "loss": 0.0697, "step": 21430 }, { - "epoch": 0.11, - "learning_rate": 0.00028377486617796186, - "loss": 0.0293, + "epoch": 0.06, + "learning_rate": 0.0002916636640995798, + "loss": 0.0597, "step": 21440 }, { - "epoch": 0.11, - "learning_rate": 0.00028376729848494784, - "loss": 0.0297, + "epoch": 0.06, + "learning_rate": 0.0002916597758832083, + "loss": 0.0395, "step": 21450 }, { - "epoch": 0.11, - "learning_rate": 0.0002837597307919338, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002916558876668369, + "loss": 0.0405, "step": 21460 }, { - "epoch": 0.11, - "learning_rate": 0.0002837521630989198, - "loss": 0.0243, + "epoch": 0.06, + "learning_rate": 0.0002916519994504654, + "loss": 0.0361, "step": 21470 }, { - "epoch": 0.11, - "learning_rate": 0.0002837445954059058, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.0002916481112340939, + "loss": 0.0364, "step": 21480 }, { - "epoch": 0.11, - "learning_rate": 0.0002837370277128918, - "loss": 0.0269, + "epoch": 0.06, + "learning_rate": 0.0002916442230177225, + "loss": 0.0363, "step": 21490 }, { - "epoch": 0.11, - "learning_rate": 0.0002837294600198778, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.000291640334801351, + "loss": 0.0324, "step": 21500 }, { - "epoch": 0.11, - "learning_rate": 0.0002837218923268638, - "loss": 0.0276, + "epoch": 0.06, + "learning_rate": 0.0002916364465849795, + "loss": 0.0314, "step": 21510 }, { - "epoch": 0.11, - "learning_rate": 0.00028371432463384976, - "loss": 0.0306, + "epoch": 0.06, + "learning_rate": 0.0002916325583686081, + "loss": 0.0352, "step": 21520 }, { - "epoch": 0.11, - "learning_rate": 0.00028370675694083575, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.0002916286701522366, + "loss": 0.0442, "step": 21530 }, { - "epoch": 0.11, - "learning_rate": 0.00028369918924782173, - "loss": 0.029, + "epoch": 0.06, + "learning_rate": 0.00029162478193586516, + "loss": 0.0365, "step": 21540 }, { - "epoch": 0.11, - "learning_rate": 0.0002836916215548077, + "epoch": 0.06, + "learning_rate": 0.0002916208937194937, "loss": 0.0354, "step": 21550 }, { - "epoch": 0.11, - "learning_rate": 0.00028368405386179374, - "loss": 0.039, + "epoch": 0.06, + "learning_rate": 0.0002916170055031222, + "loss": 0.0343, "step": 21560 }, { - "epoch": 0.11, - "learning_rate": 0.0002836764861687797, - "loss": 0.0296, + "epoch": 0.06, + "learning_rate": 0.00029161311728675076, + "loss": 0.038, "step": 21570 }, { - "epoch": 0.11, - "learning_rate": 0.0002836689184757657, - "loss": 0.0278, + "epoch": 0.06, + "learning_rate": 0.0002916092290703793, + "loss": 0.0332, "step": 21580 }, { - "epoch": 0.11, - "learning_rate": 0.0002836613507827517, - "loss": 0.0293, + "epoch": 0.06, + "learning_rate": 0.00029160534085400784, + "loss": 0.0351, "step": 21590 }, { - "epoch": 0.11, - "learning_rate": 0.00028365378308973767, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.00029160145263763636, + "loss": 0.0393, "step": 21600 }, { - "epoch": 0.11, - "learning_rate": 0.00028364621539672365, - "loss": 0.0281, + "epoch": 0.06, + "learning_rate": 0.0002915975644212649, + "loss": 0.031, "step": 21610 }, { - "epoch": 0.11, - "learning_rate": 0.0002836386477037097, - "loss": 0.0231, + "epoch": 0.06, + "learning_rate": 0.00029159367620489344, + "loss": 0.0403, "step": 21620 }, { - "epoch": 0.11, - "learning_rate": 0.00028363108001069567, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.00029158978798852196, + "loss": 0.0412, "step": 21630 }, { - "epoch": 0.11, - "learning_rate": 0.00028362351231768165, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.00029158589977215047, + "loss": 0.0374, "step": 21640 }, { - "epoch": 0.11, - "learning_rate": 0.00028361594462466763, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.00029158201155577904, + "loss": 0.0392, "step": 21650 }, { - "epoch": 0.11, - "learning_rate": 0.0002836083769316536, - "loss": 0.0264, + "epoch": 0.06, + "learning_rate": 0.00029157812333940755, + "loss": 0.0391, "step": 21660 }, { - "epoch": 0.11, - "learning_rate": 0.0002836008092386396, - "loss": 0.0247, + "epoch": 0.06, + "learning_rate": 0.0002915742351230361, + "loss": 0.0342, "step": 21670 }, { - "epoch": 0.11, - "learning_rate": 0.00028359324154562563, - "loss": 0.0261, + "epoch": 0.06, + "learning_rate": 0.00029157034690666464, + "loss": 0.0519, "step": 21680 }, { - "epoch": 0.11, - "learning_rate": 0.0002835856738526116, - "loss": 0.0295, + "epoch": 0.06, + "learning_rate": 0.00029156645869029315, + "loss": 0.0392, "step": 21690 }, { - "epoch": 0.11, - "learning_rate": 0.0002835781061595976, - "loss": 0.0298, + "epoch": 0.06, + "learning_rate": 0.0002915625704739217, + "loss": 0.0368, "step": 21700 }, { - "epoch": 0.11, - "learning_rate": 0.0002835705384665836, - "loss": 0.0272, + "epoch": 0.06, + "learning_rate": 0.00029155868225755024, + "loss": 0.0525, "step": 21710 }, { - "epoch": 0.11, - "learning_rate": 0.00028356297077356956, - "loss": 0.0324, + "epoch": 0.06, + "learning_rate": 0.00029155479404117875, + "loss": 0.0381, "step": 21720 }, { - "epoch": 0.11, - "learning_rate": 0.00028355540308055554, - "loss": 0.0303, + "epoch": 0.06, + "learning_rate": 0.0002915509058248073, + "loss": 0.0399, "step": 21730 }, { - "epoch": 0.11, - "learning_rate": 0.0002835478353875415, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.0002915470176084359, + "loss": 0.0349, "step": 21740 }, { - "epoch": 0.11, - "learning_rate": 0.00028354026769452755, - "loss": 0.0307, + "epoch": 0.06, + "learning_rate": 0.0002915431293920644, + "loss": 0.0368, "step": 21750 }, { - "epoch": 0.11, - "learning_rate": 0.00028353270000151354, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.0002915392411756929, + "loss": 0.0398, "step": 21760 }, { - "epoch": 0.11, - "learning_rate": 0.0002835251323084995, - "loss": 0.0283, + "epoch": 0.06, + "learning_rate": 0.00029153535295932143, + "loss": 0.0389, "step": 21770 }, { - "epoch": 0.11, - "learning_rate": 0.0002835175646154855, - "loss": 0.0261, + "epoch": 0.06, + "learning_rate": 0.00029153146474295, + "loss": 0.051, "step": 21780 }, { - "epoch": 0.11, - "learning_rate": 0.0002835099969224715, - "loss": 0.033, + "epoch": 0.06, + "learning_rate": 0.0002915275765265785, + "loss": 0.0418, "step": 21790 }, { - "epoch": 0.11, - "learning_rate": 0.00028350242922945746, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.0002915236883102071, + "loss": 0.0367, "step": 21800 }, { - "epoch": 0.11, - "learning_rate": 0.0002834948615364435, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002915198000938356, + "loss": 0.0485, "step": 21810 }, { - "epoch": 0.11, - "learning_rate": 0.0002834872938434295, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.00029151591187746417, + "loss": 0.037, "step": 21820 }, { - "epoch": 0.11, - "learning_rate": 0.00028347972615041546, - "loss": 0.0283, + "epoch": 0.06, + "learning_rate": 0.0002915120236610927, + "loss": 0.0344, "step": 21830 }, { - "epoch": 0.11, - "learning_rate": 0.00028347215845740144, - "loss": 0.0422, + "epoch": 0.06, + "learning_rate": 0.0002915081354447212, + "loss": 0.0413, "step": 21840 }, { - "epoch": 0.11, - "learning_rate": 0.0002834645907643874, - "loss": 0.0347, + "epoch": 0.06, + "learning_rate": 0.0002915042472283497, + "loss": 0.0398, "step": 21850 }, { - "epoch": 0.11, - "learning_rate": 0.0002834570230713734, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.0002915003590119783, + "loss": 0.039, "step": 21860 }, { - "epoch": 0.11, - "learning_rate": 0.00028344945537835944, - "loss": 0.0305, + "epoch": 0.06, + "learning_rate": 0.0002914964707956068, + "loss": 0.0343, "step": 21870 }, { - "epoch": 0.11, - "learning_rate": 0.0002834418876853454, - "loss": 0.0271, + "epoch": 0.06, + "learning_rate": 0.00029149258257923536, + "loss": 0.034, "step": 21880 }, { - "epoch": 0.11, - "learning_rate": 0.0002834343199923314, - "loss": 0.0306, + "epoch": 0.06, + "learning_rate": 0.0002914886943628639, + "loss": 0.0396, "step": 21890 }, { - "epoch": 0.11, - "learning_rate": 0.0002834267522993174, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002914848061464924, + "loss": 0.0346, "step": 21900 }, { - "epoch": 0.11, - "learning_rate": 0.00028341918460630337, - "loss": 0.0346, + "epoch": 0.06, + "learning_rate": 0.00029148091793012096, + "loss": 0.0352, "step": 21910 }, { - "epoch": 0.11, - "learning_rate": 0.00028341161691328935, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002914770297137495, + "loss": 0.046, "step": 21920 }, { - "epoch": 0.11, - "learning_rate": 0.00028340404922027533, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.000291473141497378, + "loss": 0.0363, "step": 21930 }, { - "epoch": 0.11, - "learning_rate": 0.00028339648152726136, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.00029146925328100656, + "loss": 0.0429, "step": 21940 }, { - "epoch": 0.11, - "learning_rate": 0.00028338891383424735, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002914653650646351, + "loss": 0.0336, "step": 21950 }, { - "epoch": 0.11, - "learning_rate": 0.00028338134614123333, - "loss": 0.0289, + "epoch": 0.06, + "learning_rate": 0.00029146147684826364, + "loss": 0.0381, "step": 21960 }, { - "epoch": 0.11, - "learning_rate": 0.0002833737784482193, - "loss": 0.0245, + "epoch": 0.06, + "learning_rate": 0.00029145758863189216, + "loss": 0.0368, "step": 21970 }, { - "epoch": 0.11, - "learning_rate": 0.0002833662107552053, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.00029145370041552067, + "loss": 0.0387, "step": 21980 }, { - "epoch": 0.11, - "learning_rate": 0.00028335864306219127, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.00029144981219914924, + "loss": 0.0389, "step": 21990 }, { - "epoch": 0.11, - "learning_rate": 0.00028335107536917725, - "loss": 0.026, + "epoch": 0.06, + "learning_rate": 0.00029144592398277775, + "loss": 0.0383, "step": 22000 }, { - "epoch": 0.11, - "eval_cer": 0.9144663743186606, - "eval_loss": 0.021011509001255035, - "eval_runtime": 117.4912, - "eval_samples_per_second": 17.023, - "eval_steps_per_second": 4.256, + "epoch": 0.06, + "eval_cer": 0.8817894638130869, + "eval_loss": 0.02770763821899891, + "eval_runtime": 107.5949, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 22000 }, { - "epoch": 0.11, - "learning_rate": 0.00028334350767616323, - "loss": 0.0327, + "epoch": 0.06, + "learning_rate": 0.0002914420357664063, + "loss": 0.0393, "step": 22010 }, { - "epoch": 0.11, - "learning_rate": 0.0002833359399831492, - "loss": 0.0257, + "epoch": 0.06, + "learning_rate": 0.00029143814755003484, + "loss": 0.0345, "step": 22020 }, { - "epoch": 0.11, - "learning_rate": 0.0002833283722901352, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.0002914342593336634, + "loss": 0.0346, "step": 22030 }, { - "epoch": 0.11, - "learning_rate": 0.00028332080459712123, - "loss": 0.0319, + "epoch": 0.06, + "learning_rate": 0.0002914303711172919, + "loss": 0.0375, "step": 22040 }, { - "epoch": 0.11, - "learning_rate": 0.0002833132369041072, - "loss": 0.0257, + "epoch": 0.06, + "learning_rate": 0.00029142648290092043, + "loss": 0.0361, "step": 22050 }, { - "epoch": 0.11, - "learning_rate": 0.0002833056692110932, - "loss": 0.0284, + "epoch": 0.06, + "learning_rate": 0.00029142259468454895, + "loss": 0.0372, "step": 22060 }, { - "epoch": 0.11, - "learning_rate": 0.0002832981015180792, - "loss": 0.0336, + "epoch": 0.06, + "learning_rate": 0.0002914187064681775, + "loss": 0.0408, "step": 22070 }, { - "epoch": 0.11, - "learning_rate": 0.00028329053382506516, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002914148182518061, + "loss": 0.039, "step": 22080 }, { - "epoch": 0.11, - "learning_rate": 0.00028328296613205114, - "loss": 0.0259, + "epoch": 0.06, + "learning_rate": 0.0002914109300354346, + "loss": 0.0367, "step": 22090 }, { - "epoch": 0.11, - "learning_rate": 0.0002832753984390371, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002914070418190631, + "loss": 0.0401, "step": 22100 }, { - "epoch": 0.11, - "learning_rate": 0.00028326783074602316, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.00029140315360269163, + "loss": 0.0365, "step": 22110 }, { - "epoch": 0.11, - "learning_rate": 0.00028326026305300914, - "loss": 0.0306, + "epoch": 0.06, + "learning_rate": 0.0002913992653863202, + "loss": 0.0398, "step": 22120 }, { - "epoch": 0.11, - "learning_rate": 0.0002832526953599951, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.0002913953771699487, + "loss": 0.0327, "step": 22130 }, { - "epoch": 0.11, - "learning_rate": 0.0002832451276669811, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.0002913914889535773, + "loss": 0.0374, "step": 22140 }, { - "epoch": 0.11, - "learning_rate": 0.0002832375599739671, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.0002913876007372058, + "loss": 0.0284, "step": 22150 }, { - "epoch": 0.11, - "learning_rate": 0.00028322999228095306, - "loss": 0.0353, + "epoch": 0.06, + "learning_rate": 0.00029138371252083437, + "loss": 0.0356, "step": 22160 }, { - "epoch": 0.11, - "learning_rate": 0.0002832224245879391, - "loss": 0.0253, + "epoch": 0.06, + "learning_rate": 0.0002913798243044629, + "loss": 0.0363, "step": 22170 }, { - "epoch": 0.11, - "learning_rate": 0.0002832148568949251, - "loss": 0.0283, + "epoch": 0.06, + "learning_rate": 0.0002913759360880914, + "loss": 0.0389, "step": 22180 }, { - "epoch": 0.11, - "learning_rate": 0.00028320728920191106, - "loss": 0.0256, + "epoch": 0.06, + "learning_rate": 0.0002913720478717199, + "loss": 0.0423, "step": 22190 }, { - "epoch": 0.11, - "learning_rate": 0.00028319972150889704, - "loss": 0.031, + "epoch": 0.06, + "learning_rate": 0.0002913681596553485, + "loss": 0.0353, "step": 22200 }, { - "epoch": 0.11, - "learning_rate": 0.000283192153815883, - "loss": 0.0296, + "epoch": 0.06, + "learning_rate": 0.000291364271438977, + "loss": 0.0359, "step": 22210 }, { - "epoch": 0.11, - "learning_rate": 0.000283184586122869, - "loss": 0.027, + "epoch": 0.06, + "learning_rate": 0.00029136038322260556, + "loss": 0.0439, "step": 22220 }, { - "epoch": 0.11, - "learning_rate": 0.00028317701842985504, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.0002913564950062341, + "loss": 0.032, "step": 22230 }, { - "epoch": 0.11, - "learning_rate": 0.000283169450736841, - "loss": 0.0297, + "epoch": 0.06, + "learning_rate": 0.00029135260678986264, + "loss": 0.0354, "step": 22240 }, { - "epoch": 0.11, - "learning_rate": 0.000283161883043827, - "loss": 0.0266, + "epoch": 0.06, + "learning_rate": 0.00029134871857349116, + "loss": 0.0371, "step": 22250 }, { - "epoch": 0.11, - "learning_rate": 0.000283154315350813, - "loss": 0.0307, + "epoch": 0.06, + "learning_rate": 0.0002913448303571197, + "loss": 0.0398, "step": 22260 }, { - "epoch": 0.11, - "learning_rate": 0.00028314674765779897, - "loss": 0.0264, + "epoch": 0.06, + "learning_rate": 0.0002913409421407482, + "loss": 0.0393, "step": 22270 }, { - "epoch": 0.11, - "learning_rate": 0.00028313917996478495, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.00029133705392437676, + "loss": 0.032, "step": 22280 }, { - "epoch": 0.11, - "learning_rate": 0.00028313161227177093, - "loss": 0.0313, + "epoch": 0.06, + "learning_rate": 0.0002913331657080053, + "loss": 0.0398, "step": 22290 }, { - "epoch": 0.11, - "learning_rate": 0.00028312404457875697, - "loss": 0.0223, + "epoch": 0.06, + "learning_rate": 0.00029132927749163384, + "loss": 0.0361, "step": 22300 }, { - "epoch": 0.11, - "learning_rate": 0.00028311647688574295, - "loss": 0.0285, + "epoch": 0.06, + "learning_rate": 0.00029132538927526235, + "loss": 0.0414, "step": 22310 }, { - "epoch": 0.11, - "learning_rate": 0.00028310890919272893, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.0002913215010588909, + "loss": 0.0333, "step": 22320 }, { - "epoch": 0.11, - "learning_rate": 0.0002831013414997149, - "loss": 0.0389, + "epoch": 0.06, + "learning_rate": 0.00029131761284251944, + "loss": 0.0355, "step": 22330 }, { - "epoch": 0.11, - "learning_rate": 0.0002830937738067009, - "loss": 0.037, + "epoch": 0.06, + "learning_rate": 0.00029131372462614795, + "loss": 0.0386, "step": 22340 }, { - "epoch": 0.11, - "learning_rate": 0.0002830862061136869, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002913098364097765, + "loss": 0.0365, "step": 22350 }, { - "epoch": 0.11, - "learning_rate": 0.0002830786384206729, - "loss": 0.0333, + "epoch": 0.06, + "learning_rate": 0.00029130594819340504, + "loss": 0.0343, "step": 22360 }, { - "epoch": 0.11, - "learning_rate": 0.0002830710707276589, - "loss": 0.0416, + "epoch": 0.06, + "learning_rate": 0.0002913020599770336, + "loss": 0.0365, "step": 22370 }, { - "epoch": 0.11, - "learning_rate": 0.0002830635030346449, - "loss": 0.0273, + "epoch": 0.06, + "learning_rate": 0.0002912981717606621, + "loss": 0.0327, "step": 22380 }, { - "epoch": 0.11, - "learning_rate": 0.00028305593534163085, - "loss": 0.0299, + "epoch": 0.06, + "learning_rate": 0.00029129428354429063, + "loss": 0.035, "step": 22390 }, { - "epoch": 0.11, - "learning_rate": 0.00028304836764861684, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.00029129039532791915, + "loss": 0.0387, "step": 22400 }, { - "epoch": 0.11, - "learning_rate": 0.0002830407999556028, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002912865071115477, + "loss": 0.0317, "step": 22410 }, { - "epoch": 0.11, - "learning_rate": 0.00028303323226258885, - "loss": 0.0312, - "step": 22420 + "epoch": 0.06, + "learning_rate": 0.00029128261889517623, + "loss": 0.0345, + "step": 22420 }, { - "epoch": 0.11, - "learning_rate": 0.00028302566456957483, - "loss": 0.0316, + "epoch": 0.06, + "learning_rate": 0.0002912787306788048, + "loss": 0.0323, "step": 22430 }, { - "epoch": 0.11, - "learning_rate": 0.0002830180968765608, - "loss": 0.0328, + "epoch": 0.06, + "learning_rate": 0.0002912748424624333, + "loss": 0.033, "step": 22440 }, { - "epoch": 0.11, - "learning_rate": 0.0002830105291835468, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.0002912709542460619, + "loss": 0.0362, "step": 22450 }, { - "epoch": 0.11, - "learning_rate": 0.0002830029614905328, - "loss": 0.0324, + "epoch": 0.06, + "learning_rate": 0.0002912670660296904, + "loss": 0.0278, "step": 22460 }, { - "epoch": 0.11, - "learning_rate": 0.00028299539379751876, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.0002912631778133189, + "loss": 0.0346, "step": 22470 }, { - "epoch": 0.11, - "learning_rate": 0.00028298782610450474, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.0002912592895969475, + "loss": 0.0378, "step": 22480 }, { - "epoch": 0.11, - "learning_rate": 0.0002829802584114908, - "loss": 0.0316, + "epoch": 0.06, + "learning_rate": 0.000291255401380576, + "loss": 0.0334, "step": 22490 }, { - "epoch": 0.11, - "learning_rate": 0.00028297269071847676, - "loss": 0.0309, + "epoch": 0.06, + "learning_rate": 0.00029125151316420456, + "loss": 0.029, "step": 22500 }, { - "epoch": 0.11, - "learning_rate": 0.00028296512302546274, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002912476249478331, + "loss": 0.0321, "step": 22510 }, { - "epoch": 0.11, - "learning_rate": 0.0002829575553324487, - "loss": 0.0312, + "epoch": 0.06, + "learning_rate": 0.0002912437367314616, + "loss": 0.0355, "step": 22520 }, { - "epoch": 0.11, - "learning_rate": 0.0002829499876394347, - "loss": 0.0314, + "epoch": 0.06, + "learning_rate": 0.00029123984851509016, + "loss": 0.0375, "step": 22530 }, { - "epoch": 0.11, - "learning_rate": 0.0002829424199464207, - "loss": 0.035, + "epoch": 0.06, + "learning_rate": 0.0002912359602987187, + "loss": 0.0295, "step": 22540 }, { - "epoch": 0.11, - "learning_rate": 0.0002829348522534067, - "loss": 0.0283, + "epoch": 0.06, + "learning_rate": 0.0002912320720823472, + "loss": 0.032, "step": 22550 }, { - "epoch": 0.11, - "learning_rate": 0.0002829272845603927, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.00029122818386597576, + "loss": 0.0368, "step": 22560 }, { - "epoch": 0.11, - "learning_rate": 0.0002829197168673787, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002912242956496043, + "loss": 0.0315, "step": 22570 }, { - "epoch": 0.11, - "learning_rate": 0.00028291214917436466, - "loss": 0.0296, + "epoch": 0.06, + "learning_rate": 0.00029122040743323284, + "loss": 0.034, "step": 22580 }, { - "epoch": 0.11, - "learning_rate": 0.00028290458148135065, - "loss": 0.0294, + "epoch": 0.06, + "learning_rate": 0.00029121651921686136, + "loss": 0.0398, "step": 22590 }, { - "epoch": 0.11, - "learning_rate": 0.00028289701378833663, - "loss": 0.0285, + "epoch": 0.06, + "learning_rate": 0.00029121263100048987, + "loss": 0.0338, "step": 22600 }, { - "epoch": 0.11, - "learning_rate": 0.0002828894460953226, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.0002912087427841184, + "loss": 0.0363, "step": 22610 }, { - "epoch": 0.11, - "learning_rate": 0.00028288187840230864, - "loss": 0.0311, + "epoch": 0.06, + "learning_rate": 0.00029120485456774696, + "loss": 0.0246, "step": 22620 }, { - "epoch": 0.11, - "learning_rate": 0.0002828743107092946, - "loss": 0.029, + "epoch": 0.06, + "learning_rate": 0.0002912009663513755, + "loss": 0.0397, "step": 22630 }, { - "epoch": 0.11, - "learning_rate": 0.0002828667430162806, - "loss": 0.0341, + "epoch": 0.06, + "learning_rate": 0.00029119707813500404, + "loss": 0.0357, "step": 22640 }, { - "epoch": 0.11, - "learning_rate": 0.0002828591753232666, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.00029119318991863255, + "loss": 0.0426, "step": 22650 }, { - "epoch": 0.11, - "learning_rate": 0.00028285160763025257, - "loss": 0.0263, + "epoch": 0.06, + "learning_rate": 0.0002911893017022611, + "loss": 0.0436, "step": 22660 }, { - "epoch": 0.11, - "learning_rate": 0.00028284403993723855, - "loss": 0.0257, + "epoch": 0.06, + "learning_rate": 0.00029118541348588964, + "loss": 0.0381, "step": 22670 }, { - "epoch": 0.11, - "learning_rate": 0.0002828364722442246, - "loss": 0.0298, + "epoch": 0.06, + "learning_rate": 0.00029118152526951815, + "loss": 0.0376, "step": 22680 }, { - "epoch": 0.11, - "learning_rate": 0.00028282890455121057, - "loss": 0.0329, + "epoch": 0.06, + "learning_rate": 0.0002911776370531467, + "loss": 0.0375, "step": 22690 }, { - "epoch": 0.11, - "learning_rate": 0.00028282133685819655, - "loss": 0.0311, + "epoch": 0.06, + "learning_rate": 0.00029117374883677523, + "loss": 0.0345, "step": 22700 }, { - "epoch": 0.11, - "learning_rate": 0.00028281376916518253, - "loss": 0.0481, + "epoch": 0.06, + "learning_rate": 0.0002911698606204038, + "loss": 0.033, "step": 22710 }, { - "epoch": 0.11, - "learning_rate": 0.0002828062014721685, - "loss": 0.0289, + "epoch": 0.06, + "learning_rate": 0.0002911659724040323, + "loss": 0.0296, "step": 22720 }, { - "epoch": 0.11, - "learning_rate": 0.0002827986337791545, - "loss": 0.0321, + "epoch": 0.06, + "learning_rate": 0.00029116208418766083, + "loss": 0.0367, "step": 22730 }, { - "epoch": 0.11, - "learning_rate": 0.00028279106608614053, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002911581959712894, + "loss": 0.0406, "step": 22740 }, { - "epoch": 0.11, - "learning_rate": 0.0002827834983931265, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.0002911543077549179, + "loss": 0.0351, "step": 22750 }, { - "epoch": 0.11, - "learning_rate": 0.0002827759307001125, - "loss": 0.0284, + "epoch": 0.06, + "learning_rate": 0.00029115041953854643, + "loss": 0.0339, "step": 22760 }, { - "epoch": 0.11, - "learning_rate": 0.0002827683630070985, - "loss": 0.0327, + "epoch": 0.06, + "learning_rate": 0.000291146531322175, + "loss": 0.0373, "step": 22770 }, { - "epoch": 0.11, - "learning_rate": 0.00028276079531408446, - "loss": 0.0308, + "epoch": 0.06, + "learning_rate": 0.00029114264310580357, + "loss": 0.0302, "step": 22780 }, { - "epoch": 0.11, - "learning_rate": 0.00028275322762107044, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002911387548894321, + "loss": 0.0363, "step": 22790 }, { - "epoch": 0.12, - "learning_rate": 0.0002827456599280564, - "loss": 0.0265, + "epoch": 0.06, + "learning_rate": 0.0002911348666730606, + "loss": 0.0351, "step": 22800 }, { - "epoch": 0.12, - "learning_rate": 0.00028273809223504246, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002911309784566891, + "loss": 0.0439, "step": 22810 }, { - "epoch": 0.12, - "learning_rate": 0.00028273052454202844, - "loss": 0.0385, + "epoch": 0.06, + "learning_rate": 0.0002911270902403177, + "loss": 0.0315, "step": 22820 }, { - "epoch": 0.12, - "learning_rate": 0.0002827229568490144, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002911232020239462, + "loss": 0.0379, "step": 22830 }, { - "epoch": 0.12, - "learning_rate": 0.0002827153891560004, - "loss": 0.0387, + "epoch": 0.06, + "learning_rate": 0.00029111931380757476, + "loss": 0.0329, "step": 22840 }, { - "epoch": 0.12, - "learning_rate": 0.0002827078214629864, - "loss": 0.0367, + "epoch": 0.06, + "learning_rate": 0.0002911154255912033, + "loss": 0.0483, "step": 22850 }, { - "epoch": 0.12, - "learning_rate": 0.00028270025376997236, - "loss": 0.0381, + "epoch": 0.06, + "learning_rate": 0.0002911115373748318, + "loss": 0.0308, "step": 22860 }, { - "epoch": 0.12, - "learning_rate": 0.0002826926860769584, - "loss": 0.0264, + "epoch": 0.06, + "learning_rate": 0.00029110764915846036, + "loss": 0.029, "step": 22870 }, { - "epoch": 0.12, - "learning_rate": 0.0002826851183839444, - "loss": 0.0268, + "epoch": 0.06, + "learning_rate": 0.0002911037609420889, + "loss": 0.034, "step": 22880 }, { - "epoch": 0.12, - "learning_rate": 0.00028267755069093036, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002910998727257174, + "loss": 0.0383, "step": 22890 }, { - "epoch": 0.12, - "learning_rate": 0.00028266998299791634, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.00029109598450934596, + "loss": 0.0357, "step": 22900 }, { - "epoch": 0.12, - "learning_rate": 0.0002826624153049023, - "loss": 0.0295, + "epoch": 0.06, + "learning_rate": 0.0002910920962929745, + "loss": 0.0347, "step": 22910 }, { - "epoch": 0.12, - "learning_rate": 0.0002826548476118883, - "loss": 0.0362, + "epoch": 0.06, + "learning_rate": 0.00029108820807660304, + "loss": 0.0346, "step": 22920 }, { - "epoch": 0.12, - "learning_rate": 0.00028264727991887434, - "loss": 0.0312, + "epoch": 0.06, + "learning_rate": 0.00029108431986023156, + "loss": 0.0369, "step": 22930 }, { - "epoch": 0.12, - "learning_rate": 0.0002826397122258603, - "loss": 0.0301, + "epoch": 0.06, + "learning_rate": 0.00029108043164386007, + "loss": 0.0324, "step": 22940 }, { - "epoch": 0.12, - "learning_rate": 0.0002826321445328463, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.00029107654342748864, + "loss": 0.0383, "step": 22950 }, { - "epoch": 0.12, - "learning_rate": 0.0002826245768398323, - "loss": 0.0324, + "epoch": 0.06, + "learning_rate": 0.00029107265521111715, + "loss": 0.0357, "step": 22960 }, { - "epoch": 0.12, - "learning_rate": 0.00028261700914681827, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029106876699474567, + "loss": 0.0325, "step": 22970 }, { - "epoch": 0.12, - "learning_rate": 0.00028260944145380425, - "loss": 0.0282, + "epoch": 0.06, + "learning_rate": 0.00029106487877837424, + "loss": 0.0357, "step": 22980 }, { - "epoch": 0.12, - "learning_rate": 0.00028260187376079023, - "loss": 0.0255, + "epoch": 0.06, + "learning_rate": 0.0002910609905620028, + "loss": 0.0404, "step": 22990 }, { - "epoch": 0.12, - "learning_rate": 0.00028259430606777627, - "loss": 0.0325, + "epoch": 0.06, + "learning_rate": 0.0002910571023456313, + "loss": 0.0407, "step": 23000 }, { - "epoch": 0.12, - "eval_cer": 0.9145051901636767, - "eval_loss": 0.02104305848479271, - "eval_runtime": 117.2879, - "eval_samples_per_second": 17.052, - "eval_steps_per_second": 4.263, + "epoch": 0.06, + "eval_cer": 0.881821655462573, + "eval_loss": 0.026583530008792877, + "eval_runtime": 107.715, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, "step": 23000 }, { - "epoch": 0.12, - "learning_rate": 0.00028258673837476225, - "loss": 0.0284, + "epoch": 0.06, + "learning_rate": 0.00029105321412925984, + "loss": 0.0304, "step": 23010 }, { - "epoch": 0.12, - "learning_rate": 0.00028257917068174823, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.00029104932591288835, + "loss": 0.0353, "step": 23020 }, { - "epoch": 0.12, - "learning_rate": 0.0002825716029887342, - "loss": 0.0379, + "epoch": 0.06, + "learning_rate": 0.0002910454376965169, + "loss": 0.0423, "step": 23030 }, { - "epoch": 0.12, - "learning_rate": 0.0002825640352957202, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.00029104154948014543, + "loss": 0.033, "step": 23040 }, { - "epoch": 0.12, - "learning_rate": 0.00028255646760270617, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.000291037661263774, + "loss": 0.0331, "step": 23050 }, { - "epoch": 0.12, - "learning_rate": 0.0002825488999096922, - "loss": 0.0265, + "epoch": 0.06, + "learning_rate": 0.0002910337730474025, + "loss": 0.033, "step": 23060 }, { - "epoch": 0.12, - "learning_rate": 0.0002825413322166782, - "loss": 0.0265, + "epoch": 0.06, + "learning_rate": 0.0002910298848310311, + "loss": 0.0311, "step": 23070 }, { - "epoch": 0.12, - "learning_rate": 0.00028253376452366417, - "loss": 0.0236, + "epoch": 0.06, + "learning_rate": 0.0002910259966146596, + "loss": 0.0355, "step": 23080 }, { - "epoch": 0.12, - "learning_rate": 0.00028252619683065015, - "loss": 0.0313, + "epoch": 0.06, + "learning_rate": 0.0002910221083982881, + "loss": 0.0333, "step": 23090 }, { - "epoch": 0.12, - "learning_rate": 0.00028251862913763613, + "epoch": 0.06, + "learning_rate": 0.00029101822018191663, "loss": 0.0322, "step": 23100 }, { - "epoch": 0.12, - "learning_rate": 0.0002825110614446221, - "loss": 0.0246, + "epoch": 0.06, + "learning_rate": 0.0002910143319655452, + "loss": 0.0355, "step": 23110 }, { - "epoch": 0.12, - "learning_rate": 0.0002825034937516081, - "loss": 0.0267, + "epoch": 0.06, + "learning_rate": 0.0002910104437491737, + "loss": 0.0412, "step": 23120 }, { - "epoch": 0.12, - "learning_rate": 0.00028249592605859413, - "loss": 0.0279, + "epoch": 0.06, + "learning_rate": 0.0002910065555328023, + "loss": 0.0379, "step": 23130 }, { - "epoch": 0.12, - "learning_rate": 0.0002824883583655801, - "loss": 0.0299, + "epoch": 0.06, + "learning_rate": 0.0002910026673164308, + "loss": 0.0381, "step": 23140 }, { - "epoch": 0.12, - "learning_rate": 0.0002824807906725661, - "loss": 0.0319, + "epoch": 0.06, + "learning_rate": 0.0002909987791000593, + "loss": 0.0463, "step": 23150 }, { - "epoch": 0.12, - "learning_rate": 0.0002824732229795521, - "loss": 0.0298, + "epoch": 0.06, + "learning_rate": 0.0002909948908836879, + "loss": 0.0425, "step": 23160 }, { - "epoch": 0.12, - "learning_rate": 0.00028246565528653806, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.0002909910026673164, + "loss": 0.0429, "step": 23170 }, { - "epoch": 0.12, - "learning_rate": 0.00028245808759352404, - "loss": 0.0303, + "epoch": 0.06, + "learning_rate": 0.00029098711445094496, + "loss": 0.0347, "step": 23180 }, { - "epoch": 0.12, - "learning_rate": 0.0002824505199005101, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.0002909832262345735, + "loss": 0.0327, "step": 23190 }, { - "epoch": 0.12, - "learning_rate": 0.00028244295220749606, - "loss": 0.0312, + "epoch": 0.06, + "learning_rate": 0.00029097933801820205, + "loss": 0.0371, "step": 23200 }, { - "epoch": 0.12, - "learning_rate": 0.00028243538451448204, - "loss": 0.033, + "epoch": 0.06, + "learning_rate": 0.00029097544980183056, + "loss": 0.0342, "step": 23210 }, { - "epoch": 0.12, - "learning_rate": 0.000282427816821468, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.0002909715615854591, + "loss": 0.0349, "step": 23220 }, { - "epoch": 0.12, - "learning_rate": 0.000282420249128454, - "loss": 0.0307, + "epoch": 0.06, + "learning_rate": 0.0002909676733690876, + "loss": 0.0408, "step": 23230 }, { - "epoch": 0.12, - "learning_rate": 0.00028241268143544, - "loss": 0.0273, + "epoch": 0.06, + "learning_rate": 0.00029096378515271616, + "loss": 0.0324, "step": 23240 }, { - "epoch": 0.12, - "learning_rate": 0.000282405113742426, - "loss": 0.0331, + "epoch": 0.06, + "learning_rate": 0.00029095989693634467, + "loss": 0.0363, "step": 23250 }, { - "epoch": 0.12, - "learning_rate": 0.00028239754604941195, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.00029095600871997324, + "loss": 0.0351, "step": 23260 }, { - "epoch": 0.12, - "learning_rate": 0.0002823899783563979, - "loss": 0.0332, + "epoch": 0.06, + "learning_rate": 0.00029095212050360176, + "loss": 0.0372, "step": 23270 }, { - "epoch": 0.12, - "learning_rate": 0.0002823824106633839, - "loss": 0.026, + "epoch": 0.06, + "learning_rate": 0.0002909482322872303, + "loss": 0.0325, "step": 23280 }, { - "epoch": 0.12, - "learning_rate": 0.00028237484297036994, - "loss": 0.0326, + "epoch": 0.06, + "learning_rate": 0.00029094434407085884, + "loss": 0.0359, "step": 23290 }, { - "epoch": 0.12, - "learning_rate": 0.0002823672752773559, - "loss": 0.0301, + "epoch": 0.06, + "learning_rate": 0.00029094045585448735, + "loss": 0.0383, "step": 23300 }, { - "epoch": 0.12, - "learning_rate": 0.0002823597075843419, - "loss": 0.0236, + "epoch": 0.06, + "learning_rate": 0.00029093656763811587, + "loss": 0.0431, "step": 23310 }, { - "epoch": 0.12, - "learning_rate": 0.0002823521398913279, - "loss": 0.0281, + "epoch": 0.06, + "learning_rate": 0.00029093267942174444, + "loss": 0.0349, "step": 23320 }, { - "epoch": 0.12, - "learning_rate": 0.00028234457219831387, - "loss": 0.0325, + "epoch": 0.06, + "learning_rate": 0.000290928791205373, + "loss": 0.0317, "step": 23330 }, { - "epoch": 0.12, - "learning_rate": 0.00028233700450529985, - "loss": 0.0255, + "epoch": 0.06, + "learning_rate": 0.0002909249029890015, + "loss": 0.0365, "step": 23340 }, { - "epoch": 0.12, - "learning_rate": 0.00028232943681228583, - "loss": 0.0332, + "epoch": 0.06, + "learning_rate": 0.00029092101477263003, + "loss": 0.0377, "step": 23350 }, { - "epoch": 0.12, - "learning_rate": 0.00028232186911927187, - "loss": 0.0365, + "epoch": 0.06, + "learning_rate": 0.00029091712655625855, + "loss": 0.0302, "step": 23360 }, { - "epoch": 0.12, - "learning_rate": 0.00028231430142625785, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.0002909132383398871, + "loss": 0.0395, "step": 23370 }, { - "epoch": 0.12, - "learning_rate": 0.00028230673373324383, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.00029090935012351563, + "loss": 0.0347, "step": 23380 }, { - "epoch": 0.12, - "learning_rate": 0.0002822991660402298, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002909054619071442, + "loss": 0.0308, "step": 23390 }, { - "epoch": 0.12, - "learning_rate": 0.0002822915983472158, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.0002909015736907727, + "loss": 0.0377, "step": 23400 }, { - "epoch": 0.12, - "learning_rate": 0.0002822840306542018, - "loss": 0.027, + "epoch": 0.06, + "learning_rate": 0.0002908976854744013, + "loss": 0.0349, "step": 23410 }, { - "epoch": 0.12, - "learning_rate": 0.0002822764629611878, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002908937972580298, + "loss": 0.0347, "step": 23420 }, { - "epoch": 0.12, - "learning_rate": 0.0002822688952681738, - "loss": 0.0266, + "epoch": 0.06, + "learning_rate": 0.0002908899090416583, + "loss": 0.0363, "step": 23430 }, { - "epoch": 0.12, - "learning_rate": 0.0002822613275751598, - "loss": 0.0257, + "epoch": 0.06, + "learning_rate": 0.00029088602082528683, + "loss": 0.0345, "step": 23440 }, { - "epoch": 0.12, - "learning_rate": 0.00028225375988214576, - "loss": 0.0247, + "epoch": 0.06, + "learning_rate": 0.0002908821326089154, + "loss": 0.034, "step": 23450 }, { - "epoch": 0.12, - "learning_rate": 0.00028224619218913174, - "loss": 0.0295, + "epoch": 0.06, + "learning_rate": 0.0002908782443925439, + "loss": 0.0281, "step": 23460 }, { - "epoch": 0.12, - "learning_rate": 0.0002822386244961177, - "loss": 0.0279, + "epoch": 0.06, + "learning_rate": 0.0002908743561761725, + "loss": 0.0398, "step": 23470 }, { - "epoch": 0.12, - "learning_rate": 0.00028223105680310375, - "loss": 0.0316, + "epoch": 0.06, + "learning_rate": 0.000290870467959801, + "loss": 0.0387, "step": 23480 }, { - "epoch": 0.12, - "learning_rate": 0.00028222348911008974, - "loss": 0.0258, + "epoch": 0.06, + "learning_rate": 0.00029086657974342956, + "loss": 0.037, "step": 23490 }, { - "epoch": 0.12, - "learning_rate": 0.0002822159214170757, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.0002908626915270581, + "loss": 0.0396, "step": 23500 }, { - "epoch": 0.12, - "learning_rate": 0.0002822083537240617, - "loss": 0.033, + "epoch": 0.06, + "learning_rate": 0.0002908588033106866, + "loss": 0.0428, "step": 23510 }, { - "epoch": 0.12, - "learning_rate": 0.0002822007860310477, - "loss": 0.0299, + "epoch": 0.06, + "learning_rate": 0.0002908549150943151, + "loss": 0.0331, "step": 23520 }, { - "epoch": 0.12, - "learning_rate": 0.00028219321833803366, - "loss": 0.0252, + "epoch": 0.06, + "learning_rate": 0.0002908510268779437, + "loss": 0.0489, "step": 23530 }, { - "epoch": 0.12, - "learning_rate": 0.00028218565064501964, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.00029084713866157224, + "loss": 0.0399, "step": 23540 }, { - "epoch": 0.12, - "learning_rate": 0.0002821780829520057, - "loss": 0.1276, + "epoch": 0.06, + "learning_rate": 0.00029084325044520076, + "loss": 0.0437, "step": 23550 }, { - "epoch": 0.12, - "learning_rate": 0.00028217051525899166, - "loss": 0.0328, + "epoch": 0.06, + "learning_rate": 0.0002908393622288293, + "loss": 0.0319, "step": 23560 }, { - "epoch": 0.12, - "learning_rate": 0.00028216294756597764, - "loss": 0.0346, + "epoch": 0.06, + "learning_rate": 0.00029083547401245784, + "loss": 0.0296, "step": 23570 }, { - "epoch": 0.12, - "learning_rate": 0.0002821553798729636, - "loss": 0.0323, + "epoch": 0.06, + "learning_rate": 0.00029083158579608636, + "loss": 0.0296, "step": 23580 }, { - "epoch": 0.12, - "learning_rate": 0.0002821478121799496, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.00029082769757971487, + "loss": 0.0374, "step": 23590 }, { - "epoch": 0.12, - "learning_rate": 0.0002821402444869356, - "loss": 0.0294, + "epoch": 0.06, + "learning_rate": 0.00029082380936334344, + "loss": 0.035, "step": 23600 }, { - "epoch": 0.12, - "learning_rate": 0.0002821326767939216, - "loss": 0.0275, + "epoch": 0.06, + "learning_rate": 0.00029081992114697195, + "loss": 0.032, "step": 23610 }, { - "epoch": 0.12, - "learning_rate": 0.0002821251091009076, - "loss": 0.0323, + "epoch": 0.06, + "learning_rate": 0.0002908160329306005, + "loss": 0.0313, "step": 23620 }, { - "epoch": 0.12, - "learning_rate": 0.0002821175414078936, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.00029081214471422904, + "loss": 0.0316, "step": 23630 }, { - "epoch": 0.12, - "learning_rate": 0.00028210997371487957, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.00029080825649785755, + "loss": 0.0382, "step": 23640 }, { - "epoch": 0.12, - "learning_rate": 0.00028210240602186555, - "loss": 0.0379, + "epoch": 0.06, + "learning_rate": 0.00029080436828148607, + "loss": 0.0368, "step": 23650 }, { - "epoch": 0.12, - "learning_rate": 0.00028209483832885153, - "loss": 0.0279, + "epoch": 0.06, + "learning_rate": 0.00029080048006511464, + "loss": 0.0321, "step": 23660 }, { - "epoch": 0.12, - "learning_rate": 0.00028208727063583756, - "loss": 0.0226, + "epoch": 0.06, + "learning_rate": 0.00029079659184874315, + "loss": 0.0324, "step": 23670 }, { - "epoch": 0.12, - "learning_rate": 0.00028207970294282355, - "loss": 0.0285, + "epoch": 0.06, + "learning_rate": 0.0002907927036323717, + "loss": 0.037, "step": 23680 }, { - "epoch": 0.12, - "learning_rate": 0.0002820721352498095, - "loss": 0.0275, + "epoch": 0.06, + "learning_rate": 0.00029078881541600023, + "loss": 0.0368, "step": 23690 }, { - "epoch": 0.12, - "learning_rate": 0.0002820645675567955, - "loss": 0.0252, + "epoch": 0.06, + "learning_rate": 0.0002907849271996288, + "loss": 0.0371, "step": 23700 }, { - "epoch": 0.12, - "learning_rate": 0.0002820569998637815, - "loss": 0.0279, + "epoch": 0.06, + "learning_rate": 0.0002907810389832573, + "loss": 0.0313, "step": 23710 }, { - "epoch": 0.12, - "learning_rate": 0.00028204943217076747, - "loss": 0.0306, + "epoch": 0.06, + "learning_rate": 0.00029077715076688583, + "loss": 0.0296, "step": 23720 }, { - "epoch": 0.12, - "learning_rate": 0.00028204186447775345, - "loss": 0.0272, + "epoch": 0.06, + "learning_rate": 0.0002907732625505144, + "loss": 0.0345, "step": 23730 }, { - "epoch": 0.12, - "learning_rate": 0.0002820342967847395, - "loss": 0.0456, + "epoch": 0.06, + "learning_rate": 0.0002907693743341429, + "loss": 0.0359, "step": 23740 }, { - "epoch": 0.12, - "learning_rate": 0.00028202672909172547, - "loss": 0.0343, + "epoch": 0.06, + "learning_rate": 0.0002907654861177715, + "loss": 0.0309, "step": 23750 }, { - "epoch": 0.12, - "learning_rate": 0.00028201916139871145, - "loss": 0.0281, + "epoch": 0.06, + "learning_rate": 0.0002907615979014, + "loss": 0.0358, "step": 23760 }, { - "epoch": 0.12, - "learning_rate": 0.00028201159370569743, - "loss": 0.0254, + "epoch": 0.06, + "learning_rate": 0.0002907577096850285, + "loss": 0.0363, "step": 23770 }, { - "epoch": 0.12, - "learning_rate": 0.0002820040260126834, - "loss": 0.0322, + "epoch": 0.06, + "learning_rate": 0.0002907538214686571, + "loss": 0.0312, "step": 23780 }, { - "epoch": 0.12, - "learning_rate": 0.0002819964583196694, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.0002907499332522856, + "loss": 0.0277, "step": 23790 }, { - "epoch": 0.12, - "learning_rate": 0.00028198889062665543, - "loss": 0.0271, + "epoch": 0.06, + "learning_rate": 0.0002907460450359141, + "loss": 0.0371, "step": 23800 }, { - "epoch": 0.12, - "learning_rate": 0.0002819813229336414, - "loss": 0.029, + "epoch": 0.06, + "learning_rate": 0.0002907421568195427, + "loss": 0.0309, "step": 23810 }, { - "epoch": 0.12, - "learning_rate": 0.0002819737552406274, - "loss": 0.0246, + "epoch": 0.06, + "learning_rate": 0.0002907382686031712, + "loss": 0.0385, "step": 23820 }, { - "epoch": 0.12, - "learning_rate": 0.0002819661875476134, - "loss": 0.0308, + "epoch": 0.06, + "learning_rate": 0.00029073438038679976, + "loss": 0.0413, "step": 23830 }, { - "epoch": 0.12, - "learning_rate": 0.00028195861985459936, - "loss": 0.027, + "epoch": 0.06, + "learning_rate": 0.0002907304921704283, + "loss": 0.0332, "step": 23840 }, { - "epoch": 0.12, - "learning_rate": 0.00028195105216158534, - "loss": 0.0289, + "epoch": 0.06, + "learning_rate": 0.0002907266039540568, + "loss": 0.0336, "step": 23850 }, { - "epoch": 0.12, - "learning_rate": 0.0002819434844685713, - "loss": 0.0263, + "epoch": 0.06, + "learning_rate": 0.0002907227157376853, + "loss": 0.0318, "step": 23860 }, { - "epoch": 0.12, - "learning_rate": 0.00028193591677555736, - "loss": 0.0278, + "epoch": 0.06, + "learning_rate": 0.0002907188275213139, + "loss": 0.0324, "step": 23870 }, { - "epoch": 0.12, - "learning_rate": 0.00028192834908254334, - "loss": 0.0247, + "epoch": 0.06, + "learning_rate": 0.00029071493930494244, + "loss": 0.0369, "step": 23880 }, { - "epoch": 0.12, - "learning_rate": 0.0002819207813895293, - "loss": 0.03, + "epoch": 0.06, + "learning_rate": 0.00029071105108857096, + "loss": 0.0363, "step": 23890 }, { - "epoch": 0.12, - "learning_rate": 0.0002819132136965153, - "loss": 0.031, + "epoch": 0.06, + "learning_rate": 0.00029070716287219947, + "loss": 0.0382, "step": 23900 }, { - "epoch": 0.12, - "learning_rate": 0.0002819056460035013, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.00029070327465582804, + "loss": 0.0334, "step": 23910 }, { - "epoch": 0.12, - "learning_rate": 0.00028189807831048726, - "loss": 0.0339, + "epoch": 0.06, + "learning_rate": 0.00029069938643945656, + "loss": 0.0373, "step": 23920 }, { - "epoch": 0.12, - "learning_rate": 0.0002818905106174733, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.00029069549822308507, + "loss": 0.0374, "step": 23930 }, { - "epoch": 0.12, - "learning_rate": 0.0002818829429244593, - "loss": 0.0301, + "epoch": 0.06, + "learning_rate": 0.00029069161000671364, + "loss": 0.0345, "step": 23940 }, { - "epoch": 0.12, - "learning_rate": 0.00028187537523144526, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.00029068772179034215, + "loss": 0.0337, "step": 23950 }, { - "epoch": 0.12, - "learning_rate": 0.00028186780753843124, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002906838335739707, + "loss": 0.0361, "step": 23960 }, { - "epoch": 0.12, - "learning_rate": 0.0002818602398454172, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.00029067994535759924, + "loss": 0.0373, "step": 23970 }, { - "epoch": 0.12, - "learning_rate": 0.0002818526721524032, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.00029067605714122775, + "loss": 0.032, "step": 23980 }, { - "epoch": 0.12, - "learning_rate": 0.00028184510445938924, - "loss": 0.0227, + "epoch": 0.06, + "learning_rate": 0.0002906721689248563, + "loss": 0.0345, "step": 23990 }, { - "epoch": 0.12, - "learning_rate": 0.0002818375367663752, - "loss": 0.0285, + "epoch": 0.06, + "learning_rate": 0.00029066828070848483, + "loss": 0.0354, "step": 24000 }, { - "epoch": 0.12, - "eval_cer": 0.9144692855070369, - "eval_loss": 0.02072213776409626, - "eval_runtime": 117.2385, - "eval_samples_per_second": 17.059, - "eval_steps_per_second": 4.265, + "epoch": 0.06, + "eval_cer": 0.8818426500165857, + "eval_loss": 0.02564888820052147, + "eval_runtime": 107.6719, + "eval_samples_per_second": 18.575, + "eval_steps_per_second": 4.644, "step": 24000 }, { - "epoch": 0.12, - "learning_rate": 0.0002818299690733612, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.00029066439249211335, + "loss": 0.0351, "step": 24010 }, { - "epoch": 0.12, - "learning_rate": 0.0002818224013803472, - "loss": 0.0316, + "epoch": 0.06, + "learning_rate": 0.0002906605042757419, + "loss": 0.0405, "step": 24020 }, { - "epoch": 0.12, - "learning_rate": 0.00028181483368733317, - "loss": 0.0248, + "epoch": 0.06, + "learning_rate": 0.0002906566160593705, + "loss": 0.0434, "step": 24030 }, { - "epoch": 0.12, - "learning_rate": 0.00028180726599431915, - "loss": 0.0284, + "epoch": 0.06, + "learning_rate": 0.000290652727842999, + "loss": 0.041, "step": 24040 }, { - "epoch": 0.12, - "learning_rate": 0.00028179969830130513, - "loss": 0.0252, + "epoch": 0.06, + "learning_rate": 0.0002906488396266275, + "loss": 0.0341, "step": 24050 }, { - "epoch": 0.12, - "learning_rate": 0.00028179213060829117, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.00029064495141025603, + "loss": 0.0342, "step": 24060 }, { - "epoch": 0.12, - "learning_rate": 0.00028178456291527715, - "loss": 0.0269, + "epoch": 0.06, + "learning_rate": 0.0002906410631938846, + "loss": 0.0389, "step": 24070 }, { - "epoch": 0.12, - "learning_rate": 0.00028177699522226313, - "loss": 0.0237, + "epoch": 0.06, + "learning_rate": 0.0002906371749775131, + "loss": 0.0329, "step": 24080 }, { - "epoch": 0.12, - "learning_rate": 0.0002817694275292491, - "loss": 0.0218, + "epoch": 0.06, + "learning_rate": 0.0002906332867611417, + "loss": 0.034, "step": 24090 }, { - "epoch": 0.12, - "learning_rate": 0.0002817618598362351, - "loss": 0.0265, + "epoch": 0.06, + "learning_rate": 0.0002906293985447702, + "loss": 0.0433, "step": 24100 }, { - "epoch": 0.12, - "learning_rate": 0.00028175429214322107, - "loss": 0.0265, + "epoch": 0.06, + "learning_rate": 0.0002906255103283987, + "loss": 0.0386, "step": 24110 }, { - "epoch": 0.12, - "learning_rate": 0.0002817467244502071, - "loss": 0.0246, + "epoch": 0.06, + "learning_rate": 0.0002906216221120273, + "loss": 0.0353, "step": 24120 }, { - "epoch": 0.12, - "learning_rate": 0.0002817391567571931, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002906177338956558, + "loss": 0.0318, "step": 24130 }, { - "epoch": 0.12, - "learning_rate": 0.00028173158906417907, - "loss": 0.0256, + "epoch": 0.06, + "learning_rate": 0.0002906138456792843, + "loss": 0.0364, "step": 24140 }, { - "epoch": 0.12, - "learning_rate": 0.00028172402137116505, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.0002906099574629129, + "loss": 0.0332, "step": 24150 }, { - "epoch": 0.12, - "learning_rate": 0.00028171645367815103, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.0002906060692465414, + "loss": 0.0358, "step": 24160 }, { - "epoch": 0.12, - "learning_rate": 0.000281708885985137, - "loss": 0.0364, + "epoch": 0.06, + "learning_rate": 0.00029060218103016996, + "loss": 0.0386, "step": 24170 }, { - "epoch": 0.12, - "learning_rate": 0.000281701318292123, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.0002905982928137985, + "loss": 0.0343, "step": 24180 }, { - "epoch": 0.12, - "learning_rate": 0.00028169375059910903, - "loss": 0.0318, + "epoch": 0.06, + "learning_rate": 0.000290594404597427, + "loss": 0.0343, "step": 24190 }, { - "epoch": 0.12, - "learning_rate": 0.000281686182906095, - "loss": 0.027, + "epoch": 0.06, + "learning_rate": 0.00029059051638105556, + "loss": 0.0414, "step": 24200 }, { - "epoch": 0.12, - "learning_rate": 0.000281678615213081, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.00029058662816468407, + "loss": 0.0352, "step": 24210 }, { - "epoch": 0.12, - "learning_rate": 0.000281671047520067, - "loss": 0.0317, + "epoch": 0.06, + "learning_rate": 0.00029058273994831264, + "loss": 0.0368, "step": 24220 }, { - "epoch": 0.12, - "learning_rate": 0.00028166347982705296, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.00029057885173194116, + "loss": 0.0334, "step": 24230 }, { - "epoch": 0.12, - "learning_rate": 0.00028165591213403894, - "loss": 0.0272, + "epoch": 0.06, + "learning_rate": 0.0002905749635155697, + "loss": 0.0373, "step": 24240 }, { - "epoch": 0.12, - "learning_rate": 0.000281648344441025, - "loss": 0.0273, + "epoch": 0.06, + "learning_rate": 0.00029057107529919824, + "loss": 0.0297, "step": 24250 }, { - "epoch": 0.12, - "learning_rate": 0.00028164077674801096, - "loss": 0.0303, + "epoch": 0.06, + "learning_rate": 0.00029056718708282675, + "loss": 0.039, "step": 24260 }, { - "epoch": 0.12, - "learning_rate": 0.00028163320905499694, - "loss": 0.0329, + "epoch": 0.06, + "learning_rate": 0.00029056329886645527, + "loss": 0.0354, "step": 24270 }, { - "epoch": 0.12, - "learning_rate": 0.0002816256413619829, - "loss": 0.0332, + "epoch": 0.06, + "learning_rate": 0.00029055941065008384, + "loss": 0.0384, "step": 24280 }, { - "epoch": 0.12, - "learning_rate": 0.0002816180736689689, - "loss": 0.0362, + "epoch": 0.06, + "learning_rate": 0.00029055552243371235, + "loss": 0.0384, "step": 24290 }, { - "epoch": 0.12, - "learning_rate": 0.0002816105059759549, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002905516342173409, + "loss": 0.0395, "step": 24300 }, { - "epoch": 0.12, - "learning_rate": 0.0002816029382829409, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.00029054774600096943, + "loss": 0.0397, "step": 24310 }, { - "epoch": 0.12, - "learning_rate": 0.0002815953705899269, - "loss": 0.0327, + "epoch": 0.06, + "learning_rate": 0.00029054385778459795, + "loss": 0.0343, "step": 24320 }, { - "epoch": 0.12, - "learning_rate": 0.0002815878028969129, - "loss": 0.0282, + "epoch": 0.06, + "learning_rate": 0.0002905399695682265, + "loss": 0.0393, "step": 24330 }, { - "epoch": 0.12, - "learning_rate": 0.00028158023520389886, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.00029053608135185503, + "loss": 0.039, "step": 24340 }, { - "epoch": 0.12, - "learning_rate": 0.00028157266751088484, - "loss": 0.0349, + "epoch": 0.06, + "learning_rate": 0.00029053219313548355, + "loss": 0.0343, "step": 24350 }, { - "epoch": 0.12, - "learning_rate": 0.0002815650998178708, - "loss": 0.0319, + "epoch": 0.06, + "learning_rate": 0.0002905283049191121, + "loss": 0.0327, "step": 24360 }, { - "epoch": 0.12, - "learning_rate": 0.0002815575321248568, - "loss": 0.0286, + "epoch": 0.06, + "learning_rate": 0.0002905244167027407, + "loss": 0.0349, "step": 24370 }, { - "epoch": 0.12, - "learning_rate": 0.00028154996443184284, - "loss": 0.0275, + "epoch": 0.06, + "learning_rate": 0.0002905205284863692, + "loss": 0.034, "step": 24380 }, { - "epoch": 0.12, - "learning_rate": 0.0002815423967388288, - "loss": 0.0355, + "epoch": 0.06, + "learning_rate": 0.0002905166402699977, + "loss": 0.0361, "step": 24390 }, { - "epoch": 0.12, - "learning_rate": 0.0002815348290458148, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.00029051275205362623, + "loss": 0.0444, "step": 24400 }, { - "epoch": 0.12, - "learning_rate": 0.0002815272613528008, - "loss": 0.0293, + "epoch": 0.06, + "learning_rate": 0.0002905088638372548, + "loss": 0.036, "step": 24410 }, { - "epoch": 0.12, - "learning_rate": 0.00028151969365978677, - "loss": 0.0315, + "epoch": 0.06, + "learning_rate": 0.0002905049756208833, + "loss": 0.0334, "step": 24420 }, { - "epoch": 0.12, - "learning_rate": 0.00028151212596677275, - "loss": 0.0235, + "epoch": 0.06, + "learning_rate": 0.0002905010874045119, + "loss": 0.0348, "step": 24430 }, { - "epoch": 0.12, - "learning_rate": 0.0002815045582737588, - "loss": 0.0301, + "epoch": 0.06, + "learning_rate": 0.0002904971991881404, + "loss": 0.0389, "step": 24440 }, { - "epoch": 0.12, - "learning_rate": 0.00028149699058074477, - "loss": 0.029, + "epoch": 0.06, + "learning_rate": 0.00029049331097176896, + "loss": 0.0367, "step": 24450 }, { - "epoch": 0.12, - "learning_rate": 0.00028148942288773075, - "loss": 0.0302, + "epoch": 0.06, + "learning_rate": 0.0002904894227553975, + "loss": 0.0363, "step": 24460 }, { - "epoch": 0.12, - "learning_rate": 0.00028148185519471673, - "loss": 0.0273, + "epoch": 0.06, + "learning_rate": 0.000290485534539026, + "loss": 0.0428, "step": 24470 }, { - "epoch": 0.12, - "learning_rate": 0.0002814742875017027, - "loss": 0.0269, + "epoch": 0.06, + "learning_rate": 0.0002904816463226545, + "loss": 0.0314, "step": 24480 }, { - "epoch": 0.12, - "learning_rate": 0.0002814667198086887, - "loss": 0.0247, + "epoch": 0.06, + "learning_rate": 0.0002904777581062831, + "loss": 0.0357, "step": 24490 }, { - "epoch": 0.12, - "learning_rate": 0.00028145915211567473, - "loss": 0.026, + "epoch": 0.06, + "learning_rate": 0.0002904738698899116, + "loss": 0.0733, "step": 24500 }, { - "epoch": 0.12, - "learning_rate": 0.00028145158442266066, - "loss": 0.0294, + "epoch": 0.06, + "learning_rate": 0.00029046998167354016, + "loss": 0.0377, "step": 24510 }, { - "epoch": 0.12, - "learning_rate": 0.00028144401672964664, - "loss": 0.0272, + "epoch": 0.06, + "learning_rate": 0.0002904660934571687, + "loss": 0.0396, "step": 24520 }, { - "epoch": 0.12, - "learning_rate": 0.0002814364490366326, - "loss": 0.0217, + "epoch": 0.06, + "learning_rate": 0.00029046220524079724, + "loss": 0.0404, "step": 24530 }, { - "epoch": 0.12, - "learning_rate": 0.00028142888134361865, - "loss": 0.0293, + "epoch": 0.06, + "learning_rate": 0.00029045831702442576, + "loss": 0.0347, "step": 24540 }, { - "epoch": 0.12, - "learning_rate": 0.00028142131365060464, - "loss": 0.0248, + "epoch": 0.06, + "learning_rate": 0.00029045442880805427, + "loss": 0.0387, "step": 24550 }, { - "epoch": 0.12, - "learning_rate": 0.0002814137459575906, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.0002904505405916828, + "loss": 0.0359, "step": 24560 }, { - "epoch": 0.12, - "learning_rate": 0.0002814061782645766, - "loss": 0.0301, + "epoch": 0.06, + "learning_rate": 0.00029044665237531135, + "loss": 0.0341, "step": 24570 }, { - "epoch": 0.12, - "learning_rate": 0.0002813986105715626, - "loss": 0.027, + "epoch": 0.06, + "learning_rate": 0.0002904427641589399, + "loss": 0.035, "step": 24580 }, { - "epoch": 0.12, - "learning_rate": 0.00028139104287854856, - "loss": 0.0261, + "epoch": 0.06, + "learning_rate": 0.00029043887594256844, + "loss": 0.0327, "step": 24590 }, { - "epoch": 0.12, - "learning_rate": 0.00028138347518553454, - "loss": 0.034, + "epoch": 0.06, + "learning_rate": 0.00029043498772619695, + "loss": 0.0543, "step": 24600 }, { - "epoch": 0.12, - "learning_rate": 0.0002813759074925206, - "loss": 0.028, + "epoch": 0.06, + "learning_rate": 0.00029043109950982547, + "loss": 0.0431, "step": 24610 }, { - "epoch": 0.12, - "learning_rate": 0.00028136833979950656, - "loss": 0.0271, + "epoch": 0.06, + "learning_rate": 0.00029042721129345404, + "loss": 0.0408, "step": 24620 }, { - "epoch": 0.12, - "learning_rate": 0.00028136077210649254, - "loss": 0.0243, + "epoch": 0.06, + "learning_rate": 0.00029042332307708255, + "loss": 0.0399, "step": 24630 }, { - "epoch": 0.12, - "learning_rate": 0.0002813532044134785, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.0002904194348607111, + "loss": 0.0351, "step": 24640 }, { - "epoch": 0.12, - "learning_rate": 0.0002813456367204645, - "loss": 0.0321, + "epoch": 0.06, + "learning_rate": 0.00029041554664433963, + "loss": 0.0339, "step": 24650 }, { - "epoch": 0.12, - "learning_rate": 0.0002813380690274505, - "loss": 0.0278, + "epoch": 0.06, + "learning_rate": 0.0002904116584279682, + "loss": 0.0366, "step": 24660 }, { - "epoch": 0.12, - "learning_rate": 0.0002813305013344365, - "loss": 0.0268, + "epoch": 0.06, + "learning_rate": 0.0002904077702115967, + "loss": 0.037, "step": 24670 }, { - "epoch": 0.12, - "learning_rate": 0.0002813229336414225, - "loss": 0.0261, + "epoch": 0.06, + "learning_rate": 0.00029040388199522523, + "loss": 0.0321, "step": 24680 }, { - "epoch": 0.12, - "learning_rate": 0.0002813153659484085, - "loss": 0.0272, + "epoch": 0.06, + "learning_rate": 0.00029039999377885375, + "loss": 0.0378, "step": 24690 }, { - "epoch": 0.12, - "learning_rate": 0.00028130779825539447, - "loss": 0.0261, + "epoch": 0.06, + "learning_rate": 0.0002903961055624823, + "loss": 0.0398, "step": 24700 }, { - "epoch": 0.12, - "learning_rate": 0.00028130023056238045, - "loss": 0.0262, + "epoch": 0.06, + "learning_rate": 0.00029039221734611083, + "loss": 0.0322, "step": 24710 }, { - "epoch": 0.12, - "learning_rate": 0.00028129266286936643, - "loss": 0.0257, + "epoch": 0.06, + "learning_rate": 0.0002903883291297394, + "loss": 0.0359, "step": 24720 }, { - "epoch": 0.12, - "learning_rate": 0.00028128509517635246, - "loss": 0.0253, + "epoch": 0.06, + "learning_rate": 0.0002903844409133679, + "loss": 0.043, "step": 24730 }, { - "epoch": 0.12, - "learning_rate": 0.00028127752748333845, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.0002903805526969965, + "loss": 0.0356, "step": 24740 }, { - "epoch": 0.12, - "learning_rate": 0.0002812699597903244, - "loss": 0.0277, + "epoch": 0.06, + "learning_rate": 0.000290376664480625, + "loss": 0.0279, "step": 24750 }, { - "epoch": 0.12, - "learning_rate": 0.0002812623920973104, - "loss": 0.0255, + "epoch": 0.06, + "learning_rate": 0.0002903727762642535, + "loss": 0.0325, "step": 24760 }, { - "epoch": 0.12, - "learning_rate": 0.0002812548244042964, - "loss": 0.0246, + "epoch": 0.06, + "learning_rate": 0.0002903688880478821, + "loss": 0.0365, "step": 24770 }, { - "epoch": 0.13, - "learning_rate": 0.00028124725671128237, - "loss": 0.0251, + "epoch": 0.06, + "learning_rate": 0.0002903649998315106, + "loss": 0.027, "step": 24780 }, { - "epoch": 0.13, - "learning_rate": 0.00028123968901826835, - "loss": 0.0291, + "epoch": 0.06, + "learning_rate": 0.00029036111161513916, + "loss": 0.031, "step": 24790 }, { - "epoch": 0.13, - "learning_rate": 0.0002812321213252544, - "loss": 0.0275, + "epoch": 0.06, + "learning_rate": 0.0002903572233987677, + "loss": 0.0348, "step": 24800 }, { - "epoch": 0.13, - "learning_rate": 0.00028122455363224037, - "loss": 0.0207, + "epoch": 0.06, + "learning_rate": 0.0002903533351823962, + "loss": 0.0312, "step": 24810 }, { - "epoch": 0.13, - "learning_rate": 0.00028121698593922635, - "loss": 0.023, + "epoch": 0.06, + "learning_rate": 0.0002903494469660247, + "loss": 0.038, "step": 24820 }, { - "epoch": 0.13, - "learning_rate": 0.00028120941824621233, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.0002903455587496533, + "loss": 0.0326, "step": 24830 }, { - "epoch": 0.13, - "learning_rate": 0.0002812018505531983, - "loss": 0.0243, + "epoch": 0.06, + "learning_rate": 0.0002903416705332818, + "loss": 0.0385, "step": 24840 }, { - "epoch": 0.13, - "learning_rate": 0.0002811942828601843, - "loss": 0.0252, + "epoch": 0.06, + "learning_rate": 0.00029033778231691036, + "loss": 0.0322, "step": 24850 }, { - "epoch": 0.13, - "learning_rate": 0.00028118671516717033, - "loss": 0.0266, + "epoch": 0.06, + "learning_rate": 0.00029033389410053887, + "loss": 0.0375, "step": 24860 }, { - "epoch": 0.13, - "learning_rate": 0.0002811791474741563, - "loss": 0.0278, + "epoch": 0.06, + "learning_rate": 0.00029033000588416744, + "loss": 0.0401, "step": 24870 }, { - "epoch": 0.13, - "learning_rate": 0.0002811715797811423, - "loss": 0.0258, + "epoch": 0.06, + "learning_rate": 0.00029032611766779596, + "loss": 0.0332, "step": 24880 }, { - "epoch": 0.13, - "learning_rate": 0.0002811640120881283, - "loss": 0.0303, + "epoch": 0.06, + "learning_rate": 0.00029032222945142447, + "loss": 0.0376, "step": 24890 }, { - "epoch": 0.13, - "learning_rate": 0.00028115644439511426, - "loss": 0.0255, + "epoch": 0.06, + "learning_rate": 0.000290318341235053, + "loss": 0.0359, "step": 24900 }, { - "epoch": 0.13, - "learning_rate": 0.00028114887670210024, - "loss": 0.0287, + "epoch": 0.06, + "learning_rate": 0.00029031445301868155, + "loss": 0.0294, "step": 24910 }, { - "epoch": 0.13, - "learning_rate": 0.0002811413090090862, - "loss": 0.0292, + "epoch": 0.06, + "learning_rate": 0.0002903105648023101, + "loss": 0.0352, "step": 24920 }, { - "epoch": 0.13, - "learning_rate": 0.00028113374131607226, - "loss": 0.0314, + "epoch": 0.06, + "learning_rate": 0.00029030667658593864, + "loss": 0.0338, "step": 24930 }, { - "epoch": 0.13, - "learning_rate": 0.00028112617362305824, - "loss": 0.0283, + "epoch": 0.06, + "learning_rate": 0.00029030278836956715, + "loss": 0.0333, "step": 24940 }, { - "epoch": 0.13, - "learning_rate": 0.0002811186059300442, - "loss": 0.0254, + "epoch": 0.06, + "learning_rate": 0.0002902989001531957, + "loss": 0.0507, "step": 24950 }, { - "epoch": 0.13, - "learning_rate": 0.0002811110382370302, - "loss": 0.0273, + "epoch": 0.06, + "learning_rate": 0.00029029501193682423, + "loss": 0.0395, "step": 24960 }, { - "epoch": 0.13, - "learning_rate": 0.0002811034705440162, - "loss": 0.0274, + "epoch": 0.06, + "learning_rate": 0.00029029112372045275, + "loss": 0.0346, "step": 24970 }, { - "epoch": 0.13, - "learning_rate": 0.00028109590285100216, - "loss": 0.0304, + "epoch": 0.06, + "learning_rate": 0.0002902872355040813, + "loss": 0.0448, "step": 24980 }, { - "epoch": 0.13, - "learning_rate": 0.0002810883351579882, - "loss": 0.0299, + "epoch": 0.06, + "learning_rate": 0.00029028334728770983, + "loss": 0.0373, "step": 24990 }, { - "epoch": 0.13, - "learning_rate": 0.0002810807674649742, - "loss": 0.0289, + "epoch": 0.06, + "learning_rate": 0.0002902794590713384, + "loss": 0.0422, "step": 25000 }, { - "epoch": 0.13, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.01934368908405304, - "eval_runtime": 117.2646, - "eval_samples_per_second": 17.055, - "eval_steps_per_second": 4.264, + "epoch": 0.06, + "eval_cer": 0.8817572721636008, + "eval_loss": 0.02701452560722828, + "eval_runtime": 107.7133, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, "step": 25000 }, { - "epoch": 0.13, - "learning_rate": 0.00028107319977196016, - "loss": 0.032, + "epoch": 0.06, + "learning_rate": 0.0002902755708549669, + "loss": 0.0373, "step": 25010 }, { - "epoch": 0.13, - "learning_rate": 0.00028106563207894614, - "loss": 0.0244, + "epoch": 0.06, + "learning_rate": 0.00029027168263859543, + "loss": 0.0321, "step": 25020 }, { - "epoch": 0.13, - "learning_rate": 0.0002810580643859321, - "loss": 0.0296, + "epoch": 0.06, + "learning_rate": 0.000290267794422224, + "loss": 0.0294, "step": 25030 }, { - "epoch": 0.13, - "learning_rate": 0.0002810504966929181, - "loss": 0.0274, + "epoch": 0.06, + "learning_rate": 0.0002902639062058525, + "loss": 0.0417, "step": 25040 }, { - "epoch": 0.13, - "learning_rate": 0.00028104292899990414, - "loss": 0.0288, + "epoch": 0.06, + "learning_rate": 0.00029026001798948103, + "loss": 0.0475, "step": 25050 }, { - "epoch": 0.13, - "learning_rate": 0.0002810353613068901, - "loss": 0.0311, + "epoch": 0.06, + "learning_rate": 0.0002902561297731096, + "loss": 0.0352, "step": 25060 }, { - "epoch": 0.13, - "learning_rate": 0.0002810277936138761, - "loss": 0.0269, + "epoch": 0.06, + "learning_rate": 0.0002902522415567381, + "loss": 0.0366, "step": 25070 }, { - "epoch": 0.13, - "learning_rate": 0.0002810202259208621, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.0002902483533403667, + "loss": 0.0311, "step": 25080 }, { - "epoch": 0.13, - "learning_rate": 0.00028101265822784807, - "loss": 0.0299, + "epoch": 0.07, + "learning_rate": 0.0002902444651239952, + "loss": 0.0345, "step": 25090 }, { - "epoch": 0.13, - "learning_rate": 0.00028100509053483405, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.0002902405769076237, + "loss": 0.0367, "step": 25100 }, { - "epoch": 0.13, - "learning_rate": 0.00028099752284182003, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.0002902366886912522, + "loss": 0.0324, "step": 25110 }, { - "epoch": 0.13, - "learning_rate": 0.00028098995514880607, - "loss": 0.031, + "epoch": 0.07, + "learning_rate": 0.0002902328004748808, + "loss": 0.0297, "step": 25120 }, { - "epoch": 0.13, - "learning_rate": 0.00028098238745579205, - "loss": 0.028, + "epoch": 0.07, + "learning_rate": 0.00029022891225850936, + "loss": 0.0319, "step": 25130 }, { - "epoch": 0.13, - "learning_rate": 0.00028097481976277803, - "loss": 0.025, + "epoch": 0.07, + "learning_rate": 0.0002902250240421379, + "loss": 0.0395, "step": 25140 }, { - "epoch": 0.13, - "learning_rate": 0.000280967252069764, - "loss": 0.0181, + "epoch": 0.07, + "learning_rate": 0.0002902211358257664, + "loss": 0.0356, "step": 25150 }, { - "epoch": 0.13, - "learning_rate": 0.00028095968437675, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.00029021724760939496, + "loss": 0.0357, "step": 25160 }, { - "epoch": 0.13, - "learning_rate": 0.00028095211668373597, - "loss": 0.0255, + "epoch": 0.07, + "learning_rate": 0.0002902133593930235, + "loss": 0.0358, "step": 25170 }, { - "epoch": 0.13, - "learning_rate": 0.000280944548990722, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.000290209471176652, + "loss": 0.0391, "step": 25180 }, { - "epoch": 0.13, - "learning_rate": 0.000280936981297708, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.00029020558296028056, + "loss": 0.0336, "step": 25190 }, { - "epoch": 0.13, - "learning_rate": 0.00028092941360469397, - "loss": 0.0306, + "epoch": 0.07, + "learning_rate": 0.00029020169474390907, + "loss": 0.0365, "step": 25200 }, { - "epoch": 0.13, - "learning_rate": 0.00028092184591167995, - "loss": 0.0282, + "epoch": 0.07, + "learning_rate": 0.00029019780652753764, + "loss": 0.0317, "step": 25210 }, { - "epoch": 0.13, - "learning_rate": 0.00028091427821866593, - "loss": 0.0253, + "epoch": 0.07, + "learning_rate": 0.00029019391831116615, + "loss": 0.032, "step": 25220 }, { - "epoch": 0.13, - "learning_rate": 0.0002809067105256519, - "loss": 0.0256, + "epoch": 0.07, + "learning_rate": 0.00029019003009479467, + "loss": 0.0358, "step": 25230 }, { - "epoch": 0.13, - "learning_rate": 0.00028089914283263795, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.00029018614187842324, + "loss": 0.0365, "step": 25240 }, { - "epoch": 0.13, - "learning_rate": 0.00028089157513962393, - "loss": 0.0256, + "epoch": 0.07, + "learning_rate": 0.00029018225366205175, + "loss": 0.0332, "step": 25250 }, { - "epoch": 0.13, - "learning_rate": 0.0002808840074466099, - "loss": 0.0257, + "epoch": 0.07, + "learning_rate": 0.00029017836544568027, + "loss": 0.0307, "step": 25260 }, { - "epoch": 0.13, - "learning_rate": 0.0002808764397535959, - "loss": 0.0248, + "epoch": 0.07, + "learning_rate": 0.00029017447722930884, + "loss": 0.0353, "step": 25270 }, { - "epoch": 0.13, - "learning_rate": 0.0002808688720605819, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.0002901705890129374, + "loss": 0.0405, "step": 25280 }, { - "epoch": 0.13, - "learning_rate": 0.00028086130436756786, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.0002901667007965659, + "loss": 0.0326, "step": 25290 }, { - "epoch": 0.13, - "learning_rate": 0.00028085373667455384, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.00029016281258019443, + "loss": 0.0387, "step": 25300 }, { - "epoch": 0.13, - "learning_rate": 0.0002808461689815399, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.00029015892436382295, + "loss": 0.0313, "step": 25310 }, { - "epoch": 0.13, - "learning_rate": 0.00028083860128852586, - "loss": 0.0215, + "epoch": 0.07, + "learning_rate": 0.0002901550361474515, + "loss": 0.0332, "step": 25320 }, { - "epoch": 0.13, - "learning_rate": 0.00028083103359551184, - "loss": 0.0299, + "epoch": 0.07, + "learning_rate": 0.00029015114793108003, + "loss": 0.0324, "step": 25330 }, { - "epoch": 0.13, - "learning_rate": 0.0002808234659024978, - "loss": 0.0243, + "epoch": 0.07, + "learning_rate": 0.0002901472597147086, + "loss": 0.0318, "step": 25340 }, { - "epoch": 0.13, - "learning_rate": 0.0002808158982094838, - "loss": 0.0348, + "epoch": 0.07, + "learning_rate": 0.0002901433714983371, + "loss": 0.0352, "step": 25350 }, { - "epoch": 0.13, - "learning_rate": 0.0002808083305164698, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.00029013948328196563, + "loss": 0.0319, "step": 25360 }, { - "epoch": 0.13, - "learning_rate": 0.0002808007628234558, - "loss": 0.0305, + "epoch": 0.07, + "learning_rate": 0.0002901355950655942, + "loss": 0.0372, "step": 25370 }, { - "epoch": 0.13, - "learning_rate": 0.0002807931951304418, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.0002901317068492227, + "loss": 0.0371, "step": 25380 }, { - "epoch": 0.13, - "learning_rate": 0.0002807856274374278, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00029012781863285123, + "loss": 0.034, "step": 25390 }, { - "epoch": 0.13, - "learning_rate": 0.00028077805974441376, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.0002901239304164798, + "loss": 0.0368, "step": 25400 }, { - "epoch": 0.13, - "learning_rate": 0.00028077049205139974, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.00029012004220010836, + "loss": 0.0325, "step": 25410 }, { - "epoch": 0.13, - "learning_rate": 0.0002807629243583857, - "loss": 0.0247, + "epoch": 0.07, + "learning_rate": 0.0002901161539837369, + "loss": 0.0379, "step": 25420 }, { - "epoch": 0.13, - "learning_rate": 0.0002807553566653717, - "loss": 0.0282, + "epoch": 0.07, + "learning_rate": 0.0002901122657673654, + "loss": 0.0327, "step": 25430 }, { - "epoch": 0.13, - "learning_rate": 0.00028074778897235774, - "loss": 0.0228, + "epoch": 0.07, + "learning_rate": 0.0002901083775509939, + "loss": 0.0344, "step": 25440 }, { - "epoch": 0.13, - "learning_rate": 0.0002807402212793437, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.0002901044893346225, + "loss": 0.0385, "step": 25450 }, { - "epoch": 0.13, - "learning_rate": 0.0002807326535863297, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.000290100601118251, + "loss": 0.034, "step": 25460 }, { - "epoch": 0.13, - "learning_rate": 0.0002807250858933157, - "loss": 0.0284, + "epoch": 0.07, + "learning_rate": 0.00029009671290187956, + "loss": 0.0345, "step": 25470 }, { - "epoch": 0.13, - "learning_rate": 0.00028071751820030167, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.0002900928246855081, + "loss": 0.0333, "step": 25480 }, { - "epoch": 0.13, - "learning_rate": 0.00028070995050728765, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00029008893646913664, + "loss": 0.0377, "step": 25490 }, { - "epoch": 0.13, - "learning_rate": 0.0002807023828142737, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.00029008504825276516, + "loss": 0.0362, "step": 25500 }, { - "epoch": 0.13, - "learning_rate": 0.00028069481512125967, - "loss": 0.0282, + "epoch": 0.07, + "learning_rate": 0.00029008116003639367, + "loss": 0.0311, "step": 25510 }, { - "epoch": 0.13, - "learning_rate": 0.00028068724742824565, - "loss": 0.0257, + "epoch": 0.07, + "learning_rate": 0.0002900772718200222, + "loss": 0.0361, "step": 25520 }, { - "epoch": 0.13, - "learning_rate": 0.00028067967973523163, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.00029007338360365076, + "loss": 0.0378, "step": 25530 }, { - "epoch": 0.13, - "learning_rate": 0.0002806721120422176, - "loss": 0.0248, + "epoch": 0.07, + "learning_rate": 0.00029006949538727927, + "loss": 0.036, "step": 25540 }, { - "epoch": 0.13, - "learning_rate": 0.0002806645443492036, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.00029006560717090784, + "loss": 0.0353, "step": 25550 }, { - "epoch": 0.13, - "learning_rate": 0.00028065697665618963, - "loss": 0.0278, + "epoch": 0.07, + "learning_rate": 0.00029006171895453635, + "loss": 0.0397, "step": 25560 }, { - "epoch": 0.13, - "learning_rate": 0.0002806494089631756, - "loss": 0.0305, + "epoch": 0.07, + "learning_rate": 0.00029005783073816487, + "loss": 0.0317, "step": 25570 }, { - "epoch": 0.13, - "learning_rate": 0.0002806418412701616, - "loss": 0.0253, + "epoch": 0.07, + "learning_rate": 0.00029005394252179344, + "loss": 0.0372, "step": 25580 }, { - "epoch": 0.13, - "learning_rate": 0.00028063427357714757, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.00029005005430542195, + "loss": 0.0342, "step": 25590 }, { - "epoch": 0.13, - "learning_rate": 0.00028062670588413355, - "loss": 0.0312, + "epoch": 0.07, + "learning_rate": 0.00029004616608905047, + "loss": 0.043, "step": 25600 }, { - "epoch": 0.13, - "learning_rate": 0.00028061913819111954, - "loss": 0.0293, + "epoch": 0.07, + "learning_rate": 0.00029004227787267903, + "loss": 0.0406, "step": 25610 }, { - "epoch": 0.13, - "learning_rate": 0.0002806115704981055, - "loss": 0.0286, + "epoch": 0.07, + "learning_rate": 0.0002900383896563076, + "loss": 0.0318, "step": 25620 }, { - "epoch": 0.13, - "learning_rate": 0.00028060400280509155, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.0002900345014399361, + "loss": 0.0329, "step": 25630 }, { - "epoch": 0.13, - "learning_rate": 0.00028059643511207753, - "loss": 0.0245, + "epoch": 0.07, + "learning_rate": 0.00029003061322356463, + "loss": 0.0394, "step": 25640 }, { - "epoch": 0.13, - "learning_rate": 0.0002805888674190635, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00029002672500719315, + "loss": 0.0391, "step": 25650 }, { - "epoch": 0.13, - "learning_rate": 0.0002805812997260495, - "loss": 0.0281, + "epoch": 0.07, + "learning_rate": 0.0002900228367908217, + "loss": 0.0311, "step": 25660 }, { - "epoch": 0.13, - "learning_rate": 0.0002805737320330355, - "loss": 0.0347, + "epoch": 0.07, + "learning_rate": 0.00029001894857445023, + "loss": 0.0319, "step": 25670 }, { - "epoch": 0.13, - "learning_rate": 0.00028056616434002146, - "loss": 0.0276, + "epoch": 0.07, + "learning_rate": 0.0002900150603580788, + "loss": 0.0367, "step": 25680 }, { - "epoch": 0.13, - "learning_rate": 0.0002805585966470075, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.0002900111721417073, + "loss": 0.0434, "step": 25690 }, { - "epoch": 0.13, - "learning_rate": 0.0002805510289539935, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002900072839253359, + "loss": 0.0338, "step": 25700 }, { - "epoch": 0.13, - "learning_rate": 0.00028054346126097946, - "loss": 0.0377, + "epoch": 0.07, + "learning_rate": 0.0002900033957089644, + "loss": 0.0317, "step": 25710 }, { - "epoch": 0.13, - "learning_rate": 0.00028053589356796544, - "loss": 0.0605, + "epoch": 0.07, + "learning_rate": 0.0002899995074925929, + "loss": 0.035, "step": 25720 }, { - "epoch": 0.13, - "learning_rate": 0.0002805283258749514, - "loss": 0.032, + "epoch": 0.07, + "learning_rate": 0.0002899956192762214, + "loss": 0.0325, "step": 25730 }, { - "epoch": 0.13, - "learning_rate": 0.0002805207581819374, - "loss": 0.0337, + "epoch": 0.07, + "learning_rate": 0.00028999173105985, + "loss": 0.0321, "step": 25740 }, { - "epoch": 0.13, - "learning_rate": 0.00028051319048892344, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002899878428434785, + "loss": 0.033, "step": 25750 }, { - "epoch": 0.13, - "learning_rate": 0.0002805056227959094, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.0002899839546271071, + "loss": 0.0314, "step": 25760 }, { - "epoch": 0.13, - "learning_rate": 0.00028049805510289535, - "loss": 0.0249, + "epoch": 0.07, + "learning_rate": 0.0002899800664107356, + "loss": 0.0327, "step": 25770 }, { - "epoch": 0.13, - "learning_rate": 0.00028049048740988133, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.00028997617819436416, + "loss": 0.0327, "step": 25780 }, { - "epoch": 0.13, - "learning_rate": 0.00028048291971686736, - "loss": 0.0345, + "epoch": 0.07, + "learning_rate": 0.0002899722899779927, + "loss": 0.0316, "step": 25790 }, { - "epoch": 0.13, - "learning_rate": 0.00028047535202385335, - "loss": 0.0284, + "epoch": 0.07, + "learning_rate": 0.0002899684017616212, + "loss": 0.0346, "step": 25800 }, { - "epoch": 0.13, - "learning_rate": 0.00028046778433083933, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00028996451354524976, + "loss": 0.0316, "step": 25810 }, { - "epoch": 0.13, - "learning_rate": 0.0002804602166378253, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002899606253288783, + "loss": 0.0307, "step": 25820 }, { - "epoch": 0.13, - "learning_rate": 0.0002804526489448113, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028995673711250684, + "loss": 0.0454, "step": 25830 }, { - "epoch": 0.13, - "learning_rate": 0.00028044508125179727, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00028995284889613536, + "loss": 0.0352, "step": 25840 }, { - "epoch": 0.13, - "learning_rate": 0.00028043751355878325, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00028994896067976387, + "loss": 0.0362, "step": 25850 }, { - "epoch": 0.13, - "learning_rate": 0.0002804299458657693, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.0002899450724633924, + "loss": 0.0352, "step": 25860 }, { - "epoch": 0.13, - "learning_rate": 0.00028042237817275527, - "loss": 0.024, + "epoch": 0.07, + "learning_rate": 0.00028994118424702095, + "loss": 0.0371, "step": 25870 }, { - "epoch": 0.13, - "learning_rate": 0.00028041481047974125, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028993729603064947, + "loss": 0.0364, "step": 25880 }, { - "epoch": 0.13, - "learning_rate": 0.00028040724278672723, - "loss": 0.0284, + "epoch": 0.07, + "learning_rate": 0.00028993340781427804, + "loss": 0.0386, "step": 25890 }, { - "epoch": 0.13, - "learning_rate": 0.0002803996750937132, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.00028992951959790655, + "loss": 0.0342, "step": 25900 }, { - "epoch": 0.13, - "learning_rate": 0.0002803921074006992, - "loss": 0.0398, + "epoch": 0.07, + "learning_rate": 0.0002899256313815351, + "loss": 0.0301, "step": 25910 }, { - "epoch": 0.13, - "learning_rate": 0.00028038453970768523, - "loss": 0.0498, + "epoch": 0.07, + "learning_rate": 0.00028992174316516364, + "loss": 0.0284, "step": 25920 }, { - "epoch": 0.13, - "learning_rate": 0.0002803769720146712, - "loss": 0.03, + "epoch": 0.07, + "learning_rate": 0.00028991785494879215, + "loss": 0.0371, "step": 25930 }, { - "epoch": 0.13, - "learning_rate": 0.0002803694043216572, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.00028991396673242066, + "loss": 0.0315, "step": 25940 }, { - "epoch": 0.13, - "learning_rate": 0.0002803618366286432, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.00028991007851604923, + "loss": 0.0365, "step": 25950 }, { - "epoch": 0.13, - "learning_rate": 0.00028035426893562916, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.0002899061902996778, + "loss": 0.0318, "step": 25960 }, { - "epoch": 0.13, - "learning_rate": 0.00028034670124261514, - "loss": 0.0237, + "epoch": 0.07, + "learning_rate": 0.0002899023020833063, + "loss": 0.0324, "step": 25970 }, { - "epoch": 0.13, - "learning_rate": 0.0002803391335496011, - "loss": 0.0255, + "epoch": 0.07, + "learning_rate": 0.00028989841386693483, + "loss": 0.0333, "step": 25980 }, { - "epoch": 0.13, - "learning_rate": 0.00028033156585658716, - "loss": 0.0223, + "epoch": 0.07, + "learning_rate": 0.0002898945256505634, + "loss": 0.0352, "step": 25990 }, { - "epoch": 0.13, - "learning_rate": 0.00028032399816357314, - "loss": 0.0258, + "epoch": 0.07, + "learning_rate": 0.0002898906374341919, + "loss": 0.0374, "step": 26000 }, { - "epoch": 0.13, - "eval_cer": 0.9144799598644162, - "eval_loss": 0.019629212096333504, - "eval_runtime": 117.332, - "eval_samples_per_second": 17.046, - "eval_steps_per_second": 4.261, + "epoch": 0.07, + "eval_cer": 0.881813257640968, + "eval_loss": 0.026022659614682198, + "eval_runtime": 107.6573, + "eval_samples_per_second": 18.577, + "eval_steps_per_second": 4.644, "step": 26000 }, { - "epoch": 0.13, - "learning_rate": 0.0002803164304705591, - "loss": 0.0294, + "epoch": 0.07, + "learning_rate": 0.00028988674921782043, + "loss": 0.035, "step": 26010 }, { - "epoch": 0.13, - "learning_rate": 0.0002803088627775451, - "loss": 0.028, + "epoch": 0.07, + "learning_rate": 0.000289882861001449, + "loss": 0.0385, "step": 26020 }, { - "epoch": 0.13, - "learning_rate": 0.0002803012950845311, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002898789727850775, + "loss": 0.0352, "step": 26030 }, { - "epoch": 0.13, - "learning_rate": 0.00028029372739151706, - "loss": 0.0292, + "epoch": 0.07, + "learning_rate": 0.0002898750845687061, + "loss": 0.0372, "step": 26040 }, { - "epoch": 0.13, - "learning_rate": 0.0002802861596985031, - "loss": 0.0327, + "epoch": 0.07, + "learning_rate": 0.0002898711963523346, + "loss": 0.035, "step": 26050 }, { - "epoch": 0.13, - "learning_rate": 0.0002802785920054891, - "loss": 0.0273, + "epoch": 0.07, + "learning_rate": 0.0002898673081359631, + "loss": 0.0335, "step": 26060 }, { - "epoch": 0.13, - "learning_rate": 0.00028027102431247506, - "loss": 0.0342, + "epoch": 0.07, + "learning_rate": 0.0002898634199195916, + "loss": 0.039, "step": 26070 }, { - "epoch": 0.13, - "learning_rate": 0.00028026345661946104, - "loss": 0.0319, + "epoch": 0.07, + "learning_rate": 0.0002898595317032202, + "loss": 0.0349, "step": 26080 }, { - "epoch": 0.13, - "learning_rate": 0.000280255888926447, - "loss": 0.031, + "epoch": 0.07, + "learning_rate": 0.0002898556434868487, + "loss": 0.0357, "step": 26090 }, { - "epoch": 0.13, - "learning_rate": 0.000280248321233433, - "loss": 0.0213, + "epoch": 0.07, + "learning_rate": 0.0002898517552704773, + "loss": 0.0339, "step": 26100 }, { - "epoch": 0.13, - "learning_rate": 0.00028024075354041904, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002898478670541058, + "loss": 0.0368, "step": 26110 }, { - "epoch": 0.13, - "learning_rate": 0.000280233185847405, - "loss": 0.0279, + "epoch": 0.07, + "learning_rate": 0.00028984397883773436, + "loss": 0.0325, "step": 26120 }, { - "epoch": 0.13, - "learning_rate": 0.000280225618154391, - "loss": 0.0244, + "epoch": 0.07, + "learning_rate": 0.0002898400906213629, + "loss": 0.0362, "step": 26130 }, { - "epoch": 0.13, - "learning_rate": 0.000280218050461377, - "loss": 0.0294, + "epoch": 0.07, + "learning_rate": 0.0002898362024049914, + "loss": 0.0374, "step": 26140 }, { - "epoch": 0.13, - "learning_rate": 0.00028021048276836297, - "loss": 0.0253, + "epoch": 0.07, + "learning_rate": 0.0002898323141886199, + "loss": 0.0433, "step": 26150 }, { - "epoch": 0.13, - "learning_rate": 0.00028020291507534895, - "loss": 0.0221, + "epoch": 0.07, + "learning_rate": 0.00028982842597224847, + "loss": 0.0362, "step": 26160 }, { - "epoch": 0.13, - "learning_rate": 0.00028019534738233493, - "loss": 0.0235, + "epoch": 0.07, + "learning_rate": 0.00028982453775587704, + "loss": 0.0322, "step": 26170 }, { - "epoch": 0.13, - "learning_rate": 0.00028018777968932097, - "loss": 0.0256, + "epoch": 0.07, + "learning_rate": 0.00028982064953950556, + "loss": 0.038, "step": 26180 }, { - "epoch": 0.13, - "learning_rate": 0.00028018021199630695, - "loss": 0.0281, + "epoch": 0.07, + "learning_rate": 0.00028981676132313407, + "loss": 0.0332, "step": 26190 }, { - "epoch": 0.13, - "learning_rate": 0.00028017264430329293, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00028981287310676264, + "loss": 0.0311, "step": 26200 }, { - "epoch": 0.13, - "learning_rate": 0.0002801650766102789, - "loss": 0.0247, + "epoch": 0.07, + "learning_rate": 0.00028980898489039115, + "loss": 0.0396, "step": 26210 }, { - "epoch": 0.13, - "learning_rate": 0.0002801575089172649, - "loss": 0.0251, + "epoch": 0.07, + "learning_rate": 0.00028980509667401967, + "loss": 0.0351, "step": 26220 }, { - "epoch": 0.13, - "learning_rate": 0.0002801499412242509, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.00028980120845764824, + "loss": 0.0349, "step": 26230 }, { - "epoch": 0.13, - "learning_rate": 0.0002801423735312369, - "loss": 0.0286, + "epoch": 0.07, + "learning_rate": 0.00028979732024127675, + "loss": 0.0309, "step": 26240 }, { - "epoch": 0.13, - "learning_rate": 0.0002801348058382229, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.0002897934320249053, + "loss": 0.0354, "step": 26250 }, { - "epoch": 0.13, - "learning_rate": 0.00028012723814520887, - "loss": 0.0265, + "epoch": 0.07, + "learning_rate": 0.00028978954380853383, + "loss": 0.0324, "step": 26260 }, { - "epoch": 0.13, - "learning_rate": 0.00028011967045219485, - "loss": 0.0294, + "epoch": 0.07, + "learning_rate": 0.00028978565559216235, + "loss": 0.0281, "step": 26270 }, { - "epoch": 0.13, - "learning_rate": 0.00028011210275918083, + "epoch": 0.07, + "learning_rate": 0.0002897817673757909, "loss": 0.0306, "step": 26280 }, { - "epoch": 0.13, - "learning_rate": 0.0002801045350661668, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00028977787915941943, + "loss": 0.0299, "step": 26290 }, { - "epoch": 0.13, - "learning_rate": 0.00028009696737315285, - "loss": 0.0307, + "epoch": 0.07, + "learning_rate": 0.00028977399094304795, + "loss": 0.0325, "step": 26300 }, { - "epoch": 0.13, - "learning_rate": 0.00028008939968013883, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.0002897701027266765, + "loss": 0.0416, "step": 26310 }, { - "epoch": 0.13, - "learning_rate": 0.0002800818319871248, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.00028976621451030503, + "loss": 0.0288, "step": 26320 }, { - "epoch": 0.13, - "learning_rate": 0.0002800742642941108, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.0002897623262939336, + "loss": 0.0392, "step": 26330 }, { - "epoch": 0.13, - "learning_rate": 0.0002800666966010968, - "loss": 0.0258, + "epoch": 0.07, + "learning_rate": 0.0002897584380775621, + "loss": 0.0374, "step": 26340 }, { - "epoch": 0.13, - "learning_rate": 0.00028005912890808276, - "loss": 0.0311, + "epoch": 0.07, + "learning_rate": 0.00028975454986119063, + "loss": 0.0349, "step": 26350 }, { - "epoch": 0.13, - "learning_rate": 0.00028005156121506874, - "loss": 0.0253, + "epoch": 0.07, + "learning_rate": 0.0002897506616448192, + "loss": 0.0373, "step": 26360 }, { - "epoch": 0.13, - "learning_rate": 0.0002800439935220548, - "loss": 0.0236, + "epoch": 0.07, + "learning_rate": 0.0002897467734284477, + "loss": 0.0336, "step": 26370 }, { - "epoch": 0.13, - "learning_rate": 0.00028003642582904076, - "loss": 0.0235, + "epoch": 0.07, + "learning_rate": 0.0002897428852120763, + "loss": 0.0351, "step": 26380 }, { - "epoch": 0.13, - "learning_rate": 0.00028002885813602674, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002897389969957048, + "loss": 0.0354, "step": 26390 }, { - "epoch": 0.13, - "learning_rate": 0.0002800212904430127, - "loss": 0.0229, + "epoch": 0.07, + "learning_rate": 0.0002897351087793333, + "loss": 0.036, "step": 26400 }, { - "epoch": 0.13, - "learning_rate": 0.0002800137227499987, - "loss": 0.0255, + "epoch": 0.07, + "learning_rate": 0.0002897312205629619, + "loss": 0.0383, "step": 26410 }, { - "epoch": 0.13, - "learning_rate": 0.0002800061550569847, - "loss": 0.0301, + "epoch": 0.07, + "learning_rate": 0.0002897273323465904, + "loss": 0.0336, "step": 26420 }, { - "epoch": 0.13, - "learning_rate": 0.0002799985873639707, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.0002897234441302189, + "loss": 0.0367, "step": 26430 }, { - "epoch": 0.13, - "learning_rate": 0.0002799910196709567, - "loss": 0.0226, + "epoch": 0.07, + "learning_rate": 0.0002897195559138475, + "loss": 0.0347, "step": 26440 }, { - "epoch": 0.13, - "learning_rate": 0.0002799834519779427, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.000289715667697476, + "loss": 0.0349, "step": 26450 }, { - "epoch": 0.13, - "learning_rate": 0.00027997588428492866, - "loss": 0.0286, + "epoch": 0.07, + "learning_rate": 0.00028971177948110456, + "loss": 0.0411, "step": 26460 }, { - "epoch": 0.13, - "learning_rate": 0.00027996831659191464, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.0002897078912647331, + "loss": 0.0333, "step": 26470 }, { - "epoch": 0.13, - "learning_rate": 0.0002799607488989006, - "loss": 0.0276, + "epoch": 0.07, + "learning_rate": 0.0002897040030483616, + "loss": 0.0306, "step": 26480 }, { - "epoch": 0.13, - "learning_rate": 0.0002799531812058866, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.00028970011483199016, + "loss": 0.0342, "step": 26490 }, { - "epoch": 0.13, - "learning_rate": 0.00027994561351287264, - "loss": 0.0327, + "epoch": 0.07, + "learning_rate": 0.00028969622661561867, + "loss": 0.0316, "step": 26500 }, { - "epoch": 0.13, - "learning_rate": 0.0002799380458198586, - "loss": 0.0265, + "epoch": 0.07, + "learning_rate": 0.00028969233839924724, + "loss": 0.0351, "step": 26510 }, { - "epoch": 0.13, - "learning_rate": 0.0002799304781268446, - "loss": 0.0286, + "epoch": 0.07, + "learning_rate": 0.00028968845018287575, + "loss": 0.0394, "step": 26520 }, { - "epoch": 0.13, - "learning_rate": 0.0002799229104338306, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.0002896845619665043, + "loss": 0.0353, "step": 26530 }, { - "epoch": 0.13, - "learning_rate": 0.00027991534274081657, - "loss": 0.0244, + "epoch": 0.07, + "learning_rate": 0.00028968067375013284, + "loss": 0.0306, "step": 26540 }, { - "epoch": 0.13, - "learning_rate": 0.00027990777504780255, - "loss": 0.0262, + "epoch": 0.07, + "learning_rate": 0.00028967678553376135, + "loss": 0.0342, "step": 26550 }, { - "epoch": 0.13, - "learning_rate": 0.0002799002073547886, - "loss": 0.0246, + "epoch": 0.07, + "learning_rate": 0.00028967289731738987, + "loss": 0.0328, "step": 26560 }, { - "epoch": 0.13, - "learning_rate": 0.00027989263966177457, - "loss": 0.0241, + "epoch": 0.07, + "learning_rate": 0.00028966900910101844, + "loss": 0.0311, "step": 26570 }, { - "epoch": 0.13, - "learning_rate": 0.00027988507196876055, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00028966512088464695, + "loss": 0.0351, "step": 26580 }, { - "epoch": 0.13, - "learning_rate": 0.00027987750427574653, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002896612326682755, + "loss": 0.0317, "step": 26590 }, { - "epoch": 0.13, - "learning_rate": 0.0002798699365827325, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.00028965734445190403, + "loss": 0.0341, "step": 26600 }, { - "epoch": 0.13, - "learning_rate": 0.0002798623688897185, - "loss": 0.0224, + "epoch": 0.07, + "learning_rate": 0.00028965345623553255, + "loss": 0.0319, "step": 26610 }, { - "epoch": 0.13, - "learning_rate": 0.00027985480119670453, - "loss": 0.0345, + "epoch": 0.07, + "learning_rate": 0.0002896495680191611, + "loss": 0.0304, "step": 26620 }, { - "epoch": 0.13, - "learning_rate": 0.0002798472335036905, - "loss": 0.0268, + "epoch": 0.07, + "learning_rate": 0.00028964567980278963, + "loss": 0.0272, "step": 26630 }, { - "epoch": 0.13, - "learning_rate": 0.0002798396658106765, - "loss": 0.0274, + "epoch": 0.07, + "learning_rate": 0.00028964179158641815, + "loss": 0.0341, "step": 26640 }, { - "epoch": 0.13, - "learning_rate": 0.0002798320981176625, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002896379033700467, + "loss": 0.03, "step": 26650 }, { - "epoch": 0.13, - "learning_rate": 0.00027982453042464845, - "loss": 0.0246, + "epoch": 0.07, + "learning_rate": 0.0002896340151536753, + "loss": 0.0326, "step": 26660 }, { - "epoch": 0.13, - "learning_rate": 0.00027981696273163444, - "loss": 0.0257, + "epoch": 0.07, + "learning_rate": 0.0002896301269373038, + "loss": 0.0306, "step": 26670 }, { - "epoch": 0.13, - "learning_rate": 0.0002798093950386204, - "loss": 0.0251, + "epoch": 0.07, + "learning_rate": 0.0002896262387209323, + "loss": 0.0325, "step": 26680 }, { - "epoch": 0.13, - "learning_rate": 0.00027980182734560645, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.0002896223505045608, + "loss": 0.0294, "step": 26690 }, { - "epoch": 0.13, - "learning_rate": 0.00027979425965259243, - "loss": 0.0317, + "epoch": 0.07, + "learning_rate": 0.0002896184622881894, + "loss": 0.0329, "step": 26700 }, { - "epoch": 0.13, - "learning_rate": 0.0002797866919595784, - "loss": 0.029, + "epoch": 0.07, + "learning_rate": 0.0002896145740718179, + "loss": 0.0288, "step": 26710 }, { - "epoch": 0.13, - "learning_rate": 0.0002797791242665644, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.0002896106858554465, + "loss": 0.0319, "step": 26720 }, { - "epoch": 0.13, - "learning_rate": 0.0002797715565735504, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.000289606797639075, + "loss": 0.04, "step": 26730 }, { - "epoch": 0.13, - "learning_rate": 0.00027976398888053636, - "loss": 0.0233, + "epoch": 0.07, + "learning_rate": 0.00028960290942270356, + "loss": 0.0396, "step": 26740 }, { - "epoch": 0.13, - "learning_rate": 0.0002797564211875224, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.0002895990212063321, + "loss": 0.0302, "step": 26750 }, { - "epoch": 0.14, - "learning_rate": 0.0002797488534945084, - "loss": 0.0241, + "epoch": 0.07, + "learning_rate": 0.0002895951329899606, + "loss": 0.0364, "step": 26760 }, { - "epoch": 0.14, - "learning_rate": 0.00027974128580149436, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.0002895912447735891, + "loss": 0.0368, "step": 26770 }, { - "epoch": 0.14, - "learning_rate": 0.00027973371810848034, - "loss": 0.0314, + "epoch": 0.07, + "learning_rate": 0.0002895873565572177, + "loss": 0.0342, "step": 26780 }, { - "epoch": 0.14, - "learning_rate": 0.0002797261504154663, - "loss": 0.0305, + "epoch": 0.07, + "learning_rate": 0.0002895834683408462, + "loss": 0.0284, "step": 26790 }, { - "epoch": 0.14, - "learning_rate": 0.0002797185827224523, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.00028957958012447476, + "loss": 0.0342, "step": 26800 }, { - "epoch": 0.14, - "learning_rate": 0.00027971101502943834, - "loss": 0.0316, + "epoch": 0.07, + "learning_rate": 0.00028957569190810327, + "loss": 0.0314, "step": 26810 }, { - "epoch": 0.14, - "learning_rate": 0.0002797034473364243, - "loss": 0.0237, + "epoch": 0.07, + "learning_rate": 0.0002895718036917318, + "loss": 0.0313, "step": 26820 }, { - "epoch": 0.14, - "learning_rate": 0.0002796958796434103, - "loss": 0.0287, + "epoch": 0.07, + "learning_rate": 0.00028956791547536036, + "loss": 0.0385, "step": 26830 }, { - "epoch": 0.14, - "learning_rate": 0.0002796883119503963, - "loss": 0.024, + "epoch": 0.07, + "learning_rate": 0.00028956402725898887, + "loss": 0.0329, "step": 26840 }, { - "epoch": 0.14, - "learning_rate": 0.00027968074425738226, - "loss": 0.0314, + "epoch": 0.07, + "learning_rate": 0.0002895601390426174, + "loss": 0.0337, "step": 26850 }, { - "epoch": 0.14, - "learning_rate": 0.00027967317656436825, - "loss": 0.0315, + "epoch": 0.07, + "learning_rate": 0.00028955625082624595, + "loss": 0.0347, "step": 26860 }, { - "epoch": 0.14, - "learning_rate": 0.00027966560887135423, - "loss": 0.0268, + "epoch": 0.07, + "learning_rate": 0.0002895523626098745, + "loss": 0.0368, "step": 26870 }, { - "epoch": 0.14, - "learning_rate": 0.00027965804117834026, - "loss": 0.0279, + "epoch": 0.07, + "learning_rate": 0.00028954847439350304, + "loss": 0.0302, "step": 26880 }, { - "epoch": 0.14, - "learning_rate": 0.00027965047348532624, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.00028954458617713155, + "loss": 0.0334, "step": 26890 }, { - "epoch": 0.14, - "learning_rate": 0.0002796429057923122, - "loss": 0.0249, + "epoch": 0.07, + "learning_rate": 0.00028954069796076007, + "loss": 0.037, "step": 26900 }, { - "epoch": 0.14, - "learning_rate": 0.0002796353380992982, - "loss": 0.0301, + "epoch": 0.07, + "learning_rate": 0.00028953680974438863, + "loss": 0.0365, "step": 26910 }, { - "epoch": 0.14, - "learning_rate": 0.0002796277704062842, - "loss": 0.0246, + "epoch": 0.07, + "learning_rate": 0.00028953292152801715, + "loss": 0.0287, "step": 26920 }, { - "epoch": 0.14, - "learning_rate": 0.00027962020271327017, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.0002895290333116457, + "loss": 0.0257, "step": 26930 }, { - "epoch": 0.14, - "learning_rate": 0.0002796126350202562, - "loss": 0.0264, + "epoch": 0.07, + "learning_rate": 0.00028952514509527423, + "loss": 0.0266, "step": 26940 }, { - "epoch": 0.14, - "learning_rate": 0.0002796050673272422, - "loss": 0.0234, + "epoch": 0.07, + "learning_rate": 0.0002895212568789028, + "loss": 0.0342, "step": 26950 }, { - "epoch": 0.14, - "learning_rate": 0.00027959749963422817, - "loss": 0.0335, + "epoch": 0.07, + "learning_rate": 0.0002895173686625313, + "loss": 0.0419, "step": 26960 }, { - "epoch": 0.14, - "learning_rate": 0.00027958993194121415, - "loss": 0.0256, + "epoch": 0.07, + "learning_rate": 0.00028951348044615983, + "loss": 0.0388, "step": 26970 }, { - "epoch": 0.14, - "learning_rate": 0.00027958236424820013, - "loss": 0.0356, + "epoch": 0.07, + "learning_rate": 0.00028950959222978834, + "loss": 0.0325, "step": 26980 }, { - "epoch": 0.14, - "learning_rate": 0.0002795747965551861, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.0002895057040134169, + "loss": 0.0393, "step": 26990 }, { - "epoch": 0.14, - "learning_rate": 0.0002795672288621721, - "loss": 0.0255, + "epoch": 0.07, + "learning_rate": 0.0002895018157970455, + "loss": 0.037, "step": 27000 }, { - "epoch": 0.14, - "eval_cer": 0.9144469663961525, - "eval_loss": 0.020766137167811394, - "eval_runtime": 117.1709, - "eval_samples_per_second": 17.069, - "eval_steps_per_second": 4.267, + "epoch": 0.07, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.02456413209438324, + "eval_runtime": 107.6789, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, "step": 27000 }, { - "epoch": 0.14, - "learning_rate": 0.00027955966116915813, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.000289497927580674, + "loss": 0.0335, "step": 27010 }, { - "epoch": 0.14, - "learning_rate": 0.0002795520934761441, - "loss": 0.0345, + "epoch": 0.07, + "learning_rate": 0.0002894940393643025, + "loss": 0.0275, "step": 27020 }, { - "epoch": 0.14, - "learning_rate": 0.00027954452578313004, - "loss": 0.0293, + "epoch": 0.07, + "learning_rate": 0.0002894901511479311, + "loss": 0.0362, "step": 27030 }, { - "epoch": 0.14, - "learning_rate": 0.0002795369580901161, - "loss": 0.0293, + "epoch": 0.07, + "learning_rate": 0.0002894862629315596, + "loss": 0.0328, "step": 27040 }, { - "epoch": 0.14, - "learning_rate": 0.00027952939039710206, - "loss": 0.0265, + "epoch": 0.07, + "learning_rate": 0.0002894823747151881, + "loss": 0.0327, "step": 27050 }, { - "epoch": 0.14, - "learning_rate": 0.00027952182270408804, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002894784864988167, + "loss": 0.0287, "step": 27060 }, { - "epoch": 0.14, - "learning_rate": 0.000279514255011074, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.0002894745982824452, + "loss": 0.0298, "step": 27070 }, { - "epoch": 0.14, - "learning_rate": 0.00027950668731806, - "loss": 0.0241, + "epoch": 0.07, + "learning_rate": 0.00028947071006607376, + "loss": 0.0335, "step": 27080 }, { - "epoch": 0.14, - "learning_rate": 0.000279499119625046, - "loss": 0.0265, + "epoch": 0.07, + "learning_rate": 0.0002894668218497023, + "loss": 0.032, "step": 27090 }, { - "epoch": 0.14, - "learning_rate": 0.00027949155193203196, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002894629336333308, + "loss": 0.0295, "step": 27100 }, { - "epoch": 0.14, - "learning_rate": 0.000279483984239018, - "loss": 0.033, + "epoch": 0.07, + "learning_rate": 0.0002894590454169593, + "loss": 0.0311, "step": 27110 }, { - "epoch": 0.14, - "learning_rate": 0.000279476416546004, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.0002894551572005879, + "loss": 0.0332, "step": 27120 }, { - "epoch": 0.14, - "learning_rate": 0.00027946884885298996, - "loss": 0.0311, + "epoch": 0.07, + "learning_rate": 0.0002894512689842164, + "loss": 0.0339, "step": 27130 }, { - "epoch": 0.14, - "learning_rate": 0.00027946128115997594, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.00028944738076784496, + "loss": 0.0314, "step": 27140 }, { - "epoch": 0.14, - "learning_rate": 0.0002794537134669619, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.00028944349255147347, + "loss": 0.0325, "step": 27150 }, { - "epoch": 0.14, - "learning_rate": 0.0002794461457739479, - "loss": 0.0238, + "epoch": 0.07, + "learning_rate": 0.00028943960433510204, + "loss": 0.0342, "step": 27160 }, { - "epoch": 0.14, - "learning_rate": 0.00027943857808093394, - "loss": 0.0255, + "epoch": 0.07, + "learning_rate": 0.00028943571611873055, + "loss": 0.0355, "step": 27170 }, { - "epoch": 0.14, - "learning_rate": 0.0002794310103879199, - "loss": 0.0229, + "epoch": 0.07, + "learning_rate": 0.00028943182790235907, + "loss": 0.0386, "step": 27180 }, { - "epoch": 0.14, - "learning_rate": 0.0002794234426949059, - "loss": 0.026, + "epoch": 0.07, + "learning_rate": 0.0002894279396859876, + "loss": 0.0285, "step": 27190 }, { - "epoch": 0.14, - "learning_rate": 0.0002794158750018919, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028942405146961615, + "loss": 0.0305, "step": 27200 }, { - "epoch": 0.14, - "learning_rate": 0.00027940830730887787, - "loss": 0.0264, + "epoch": 0.07, + "learning_rate": 0.0002894201632532447, + "loss": 0.0341, "step": 27210 }, { - "epoch": 0.14, - "learning_rate": 0.00027940073961586385, - "loss": 0.0274, + "epoch": 0.07, + "learning_rate": 0.00028941627503687324, + "loss": 0.0358, "step": 27220 }, { - "epoch": 0.14, - "learning_rate": 0.00027939317192284983, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.00028941238682050175, + "loss": 0.0342, "step": 27230 }, { - "epoch": 0.14, - "learning_rate": 0.00027938560422983587, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.0002894084986041303, + "loss": 0.0336, "step": 27240 }, { - "epoch": 0.14, - "learning_rate": 0.00027937803653682185, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.00028940461038775883, + "loss": 0.0313, "step": 27250 }, { - "epoch": 0.14, - "learning_rate": 0.00027937046884380783, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.00028940072217138735, + "loss": 0.0362, "step": 27260 }, { - "epoch": 0.14, - "learning_rate": 0.0002793629011507938, - "loss": 0.023, + "epoch": 0.07, + "learning_rate": 0.0002893968339550159, + "loss": 0.035, "step": 27270 }, { - "epoch": 0.14, - "learning_rate": 0.0002793553334577798, - "loss": 0.0264, + "epoch": 0.07, + "learning_rate": 0.00028939294573864443, + "loss": 0.0319, "step": 27280 }, { - "epoch": 0.14, - "learning_rate": 0.0002793477657647658, - "loss": 0.0249, + "epoch": 0.07, + "learning_rate": 0.000289389057522273, + "loss": 0.0364, "step": 27290 }, { - "epoch": 0.14, - "learning_rate": 0.0002793401980717518, - "loss": 0.0292, + "epoch": 0.07, + "learning_rate": 0.0002893851693059015, + "loss": 0.0341, "step": 27300 }, { - "epoch": 0.14, - "learning_rate": 0.0002793326303787378, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.00028938128108953003, + "loss": 0.0383, "step": 27310 }, { - "epoch": 0.14, - "learning_rate": 0.00027932506268572377, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.00028937739287315854, + "loss": 0.0351, "step": 27320 }, { - "epoch": 0.14, - "learning_rate": 0.00027931749499270975, - "loss": 0.0293, + "epoch": 0.07, + "learning_rate": 0.0002893735046567871, + "loss": 0.0324, "step": 27330 }, { - "epoch": 0.14, - "learning_rate": 0.00027930992729969573, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.0002893696164404156, + "loss": 0.0386, "step": 27340 }, { - "epoch": 0.14, - "learning_rate": 0.0002793023596066817, - "loss": 0.0279, + "epoch": 0.07, + "learning_rate": 0.0002893657282240442, + "loss": 0.0321, "step": 27350 }, { - "epoch": 0.14, - "learning_rate": 0.00027929479191366775, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.0002893618400076727, + "loss": 0.035, "step": 27360 }, { - "epoch": 0.14, - "learning_rate": 0.00027928722422065373, - "loss": 0.0384, + "epoch": 0.07, + "learning_rate": 0.0002893579517913013, + "loss": 0.0381, "step": 27370 }, { - "epoch": 0.14, - "learning_rate": 0.0002792796565276397, - "loss": 0.0245, + "epoch": 0.07, + "learning_rate": 0.0002893540635749298, + "loss": 0.035, "step": 27380 }, { - "epoch": 0.14, - "learning_rate": 0.0002792720888346257, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.0002893501753585583, + "loss": 0.0346, "step": 27390 }, { - "epoch": 0.14, - "learning_rate": 0.0002792645211416117, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.0002893462871421869, + "loss": 0.0354, "step": 27400 }, { - "epoch": 0.14, - "learning_rate": 0.00027925695344859766, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002893423989258154, + "loss": 0.0323, "step": 27410 }, { - "epoch": 0.14, - "learning_rate": 0.00027924938575558364, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028933851070944396, + "loss": 0.0372, "step": 27420 }, { - "epoch": 0.14, - "learning_rate": 0.0002792418180625697, - "loss": 0.0229, + "epoch": 0.07, + "learning_rate": 0.0002893346224930725, + "loss": 0.0361, "step": 27430 }, { - "epoch": 0.14, - "learning_rate": 0.00027923425036955566, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.000289330734276701, + "loss": 0.053, "step": 27440 }, { - "epoch": 0.14, - "learning_rate": 0.00027922668267654164, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.00028932684606032956, + "loss": 0.032, "step": 27450 }, { - "epoch": 0.14, - "learning_rate": 0.0002792191149835276, - "loss": 0.0283, + "epoch": 0.07, + "learning_rate": 0.00028932295784395807, + "loss": 0.0357, "step": 27460 }, { - "epoch": 0.14, - "learning_rate": 0.0002792115472905136, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.0002893190696275866, + "loss": 0.0399, "step": 27470 }, { - "epoch": 0.14, - "learning_rate": 0.0002792039795974996, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.00028931518141121516, + "loss": 0.0398, "step": 27480 }, { - "epoch": 0.14, - "learning_rate": 0.0002791964119044856, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.00028931129319484367, + "loss": 0.0398, "step": 27490 }, { - "epoch": 0.14, - "learning_rate": 0.0002791888442114716, - "loss": 0.0313, + "epoch": 0.07, + "learning_rate": 0.00028930740497847224, + "loss": 0.0303, "step": 27500 }, { - "epoch": 0.14, - "learning_rate": 0.0002791812765184576, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00028930351676210075, + "loss": 0.0415, "step": 27510 }, { - "epoch": 0.14, - "learning_rate": 0.00027917370882544356, - "loss": 0.0307, + "epoch": 0.07, + "learning_rate": 0.00028929962854572927, + "loss": 0.0326, "step": 27520 }, { - "epoch": 0.14, - "learning_rate": 0.00027916614113242954, - "loss": 0.0735, + "epoch": 0.07, + "learning_rate": 0.00028929574032935784, + "loss": 0.0299, "step": 27530 }, { - "epoch": 0.14, - "learning_rate": 0.0002791585734394155, - "loss": 0.0338, + "epoch": 0.07, + "learning_rate": 0.00028929185211298635, + "loss": 0.0301, "step": 27540 }, { - "epoch": 0.14, - "learning_rate": 0.00027915100574640156, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.0002892879638966149, + "loss": 0.0317, "step": 27550 }, { - "epoch": 0.14, - "learning_rate": 0.00027914343805338754, - "loss": 0.036, + "epoch": 0.07, + "learning_rate": 0.00028928407568024343, + "loss": 0.0326, "step": 27560 }, { - "epoch": 0.14, - "learning_rate": 0.0002791358703603735, - "loss": 0.0325, + "epoch": 0.07, + "learning_rate": 0.00028928018746387195, + "loss": 0.0353, "step": 27570 }, { - "epoch": 0.14, - "learning_rate": 0.0002791283026673595, - "loss": 0.0392, + "epoch": 0.07, + "learning_rate": 0.0002892762992475005, + "loss": 0.0322, "step": 27580 }, { - "epoch": 0.14, - "learning_rate": 0.0002791207349743455, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.00028927241103112903, + "loss": 0.0308, "step": 27590 }, { - "epoch": 0.14, - "learning_rate": 0.00027911316728133147, - "loss": 0.0372, + "epoch": 0.07, + "learning_rate": 0.00028926852281475755, + "loss": 0.035, "step": 27600 }, { - "epoch": 0.14, - "learning_rate": 0.00027910559958831745, - "loss": 0.0293, + "epoch": 0.07, + "learning_rate": 0.0002892646345983861, + "loss": 0.0303, "step": 27610 }, { - "epoch": 0.14, - "learning_rate": 0.0002790980318953035, - "loss": 0.0353, + "epoch": 0.07, + "learning_rate": 0.00028926074638201463, + "loss": 0.0347, "step": 27620 }, { - "epoch": 0.14, - "learning_rate": 0.00027909046420228947, - "loss": 0.0362, + "epoch": 0.07, + "learning_rate": 0.0002892568581656432, + "loss": 0.0482, "step": 27630 }, { - "epoch": 0.14, - "learning_rate": 0.00027908289650927545, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.0002892529699492717, + "loss": 0.0316, "step": 27640 }, { - "epoch": 0.14, - "learning_rate": 0.00027907532881626143, - "loss": 0.0336, + "epoch": 0.07, + "learning_rate": 0.00028924908173290023, + "loss": 0.0404, "step": 27650 }, { - "epoch": 0.14, - "learning_rate": 0.0002790677611232474, - "loss": 0.0239, + "epoch": 0.07, + "learning_rate": 0.0002892451935165288, + "loss": 0.0306, "step": 27660 }, { - "epoch": 0.14, - "learning_rate": 0.0002790601934302334, - "loss": 0.0268, + "epoch": 0.07, + "learning_rate": 0.0002892413053001573, + "loss": 0.0321, "step": 27670 }, { - "epoch": 0.14, - "learning_rate": 0.00027905262573721943, - "loss": 0.026, + "epoch": 0.07, + "learning_rate": 0.0002892374170837858, + "loss": 0.032, "step": 27680 }, { - "epoch": 0.14, - "learning_rate": 0.0002790450580442054, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.0002892335288674144, + "loss": 0.029, "step": 27690 }, { - "epoch": 0.14, - "learning_rate": 0.0002790374903511914, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028922964065104296, + "loss": 0.0425, "step": 27700 }, { - "epoch": 0.14, - "learning_rate": 0.0002790299226581774, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.0002892257524346715, + "loss": 0.0343, "step": 27710 }, { - "epoch": 0.14, - "learning_rate": 0.00027902235496516335, - "loss": 0.0229, + "epoch": 0.07, + "learning_rate": 0.0002892218642183, + "loss": 0.0358, "step": 27720 }, { - "epoch": 0.14, - "learning_rate": 0.00027901478727214934, - "loss": 0.0303, + "epoch": 0.07, + "learning_rate": 0.0002892179760019285, + "loss": 0.0361, "step": 27730 }, { - "epoch": 0.14, - "learning_rate": 0.0002790072195791353, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.0002892140877855571, + "loss": 0.0378, "step": 27740 }, { - "epoch": 0.14, - "learning_rate": 0.00027899965188612135, - "loss": 0.0317, + "epoch": 0.07, + "learning_rate": 0.0002892101995691856, + "loss": 0.0409, "step": 27750 }, { - "epoch": 0.14, - "learning_rate": 0.00027899208419310733, - "loss": 0.028, + "epoch": 0.07, + "learning_rate": 0.00028920631135281416, + "loss": 0.0355, "step": 27760 }, { - "epoch": 0.14, - "learning_rate": 0.0002789845165000933, - "loss": 0.0281, + "epoch": 0.07, + "learning_rate": 0.0002892024231364427, + "loss": 0.0429, "step": 27770 }, { - "epoch": 0.14, - "learning_rate": 0.0002789769488070793, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028919853492007124, + "loss": 0.039, "step": 27780 }, { - "epoch": 0.14, - "learning_rate": 0.0002789693811140653, - "loss": 0.0308, + "epoch": 0.07, + "learning_rate": 0.00028919464670369976, + "loss": 0.0479, "step": 27790 }, { - "epoch": 0.14, - "learning_rate": 0.00027896181342105126, - "loss": 0.0301, + "epoch": 0.07, + "learning_rate": 0.00028919075848732827, + "loss": 0.0405, "step": 27800 }, { - "epoch": 0.14, - "learning_rate": 0.0002789542457280373, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.0002891868702709568, + "loss": 0.0421, "step": 27810 }, { - "epoch": 0.14, - "learning_rate": 0.0002789466780350233, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.00028918298205458535, + "loss": 0.037, "step": 27820 }, { - "epoch": 0.14, - "learning_rate": 0.00027893911034200926, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.00028917909383821387, + "loss": 0.0369, "step": 27830 }, { - "epoch": 0.14, - "learning_rate": 0.00027893154264899524, - "loss": 0.022, + "epoch": 0.07, + "learning_rate": 0.00028917520562184244, + "loss": 0.0393, "step": 27840 }, { - "epoch": 0.14, - "learning_rate": 0.0002789239749559812, - "loss": 0.0281, + "epoch": 0.07, + "learning_rate": 0.00028917131740547095, + "loss": 0.0407, "step": 27850 }, { - "epoch": 0.14, - "learning_rate": 0.0002789164072629672, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.00028916742918909947, + "loss": 0.0313, "step": 27860 }, { - "epoch": 0.14, - "learning_rate": 0.00027890883956995324, - "loss": 0.0222, + "epoch": 0.07, + "learning_rate": 0.00028916354097272804, + "loss": 0.0363, "step": 27870 }, { - "epoch": 0.14, - "learning_rate": 0.0002789012718769392, - "loss": 0.0244, + "epoch": 0.07, + "learning_rate": 0.00028915965275635655, + "loss": 0.0338, "step": 27880 }, { - "epoch": 0.14, - "learning_rate": 0.0002788937041839252, - "loss": 0.023, + "epoch": 0.07, + "learning_rate": 0.00028915576453998506, + "loss": 0.038, "step": 27890 }, { - "epoch": 0.14, - "learning_rate": 0.0002788861364909112, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.00028915187632361363, + "loss": 0.0322, "step": 27900 }, { - "epoch": 0.14, - "learning_rate": 0.00027887856879789716, - "loss": 0.025, + "epoch": 0.07, + "learning_rate": 0.0002891479881072422, + "loss": 0.0338, "step": 27910 }, { - "epoch": 0.14, - "learning_rate": 0.00027887100110488315, - "loss": 0.0321, + "epoch": 0.07, + "learning_rate": 0.0002891440998908707, + "loss": 0.032, "step": 27920 }, { - "epoch": 0.14, - "learning_rate": 0.00027886343341186913, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.00028914021167449923, + "loss": 0.0371, "step": 27930 }, { - "epoch": 0.14, - "learning_rate": 0.00027885586571885516, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.00028913632345812775, + "loss": 0.0339, "step": 27940 }, { - "epoch": 0.14, - "learning_rate": 0.00027884829802584114, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.0002891324352417563, + "loss": 0.0333, "step": 27950 }, { - "epoch": 0.14, - "learning_rate": 0.0002788407303328271, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.00028912854702538483, + "loss": 0.0331, "step": 27960 }, { - "epoch": 0.14, - "learning_rate": 0.0002788331626398131, - "loss": 0.0243, + "epoch": 0.07, + "learning_rate": 0.0002891246588090134, + "loss": 0.0361, "step": 27970 }, { - "epoch": 0.14, - "learning_rate": 0.0002788255949467991, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002891207705926419, + "loss": 0.0316, "step": 27980 }, { - "epoch": 0.14, - "learning_rate": 0.00027881802725378507, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.0002891168823762705, + "loss": 0.0386, "step": 27990 }, { - "epoch": 0.14, - "learning_rate": 0.0002788104595607711, - "loss": 0.0278, + "epoch": 0.07, + "learning_rate": 0.000289112994159899, + "loss": 0.0344, "step": 28000 }, { - "epoch": 0.14, - "eval_cer": 0.9144489071884033, - "eval_loss": 0.019581960514187813, - "eval_runtime": 117.2391, - "eval_samples_per_second": 17.059, - "eval_steps_per_second": 4.265, + "epoch": 0.07, + "eval_cer": 0.8817950623608236, + "eval_loss": 0.024856723845005035, + "eval_runtime": 107.5236, + "eval_samples_per_second": 18.601, + "eval_steps_per_second": 4.65, "step": 28000 }, { - "epoch": 0.14, - "learning_rate": 0.0002788028918677571, - "loss": 0.026, + "epoch": 0.07, + "learning_rate": 0.0002891091059435275, + "loss": 0.0365, "step": 28010 }, { - "epoch": 0.14, - "learning_rate": 0.00027879532417474307, - "loss": 0.0265, + "epoch": 0.07, + "learning_rate": 0.000289105217727156, + "loss": 0.0353, "step": 28020 }, { - "epoch": 0.14, - "learning_rate": 0.00027878775648172905, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.0002891013295107846, + "loss": 0.0339, "step": 28030 }, { - "epoch": 0.14, - "learning_rate": 0.00027878018878871503, - "loss": 0.0244, + "epoch": 0.07, + "learning_rate": 0.0002890974412944131, + "loss": 0.0346, "step": 28040 }, { - "epoch": 0.14, - "learning_rate": 0.000278772621095701, - "loss": 0.026, + "epoch": 0.07, + "learning_rate": 0.0002890935530780417, + "loss": 0.0321, "step": 28050 }, { - "epoch": 0.14, - "learning_rate": 0.000278765053402687, - "loss": 0.0308, + "epoch": 0.07, + "learning_rate": 0.0002890896648616702, + "loss": 0.0319, "step": 28060 }, { - "epoch": 0.14, - "learning_rate": 0.00027875748570967303, - "loss": 0.0273, + "epoch": 0.07, + "learning_rate": 0.0002890857766452987, + "loss": 0.0321, "step": 28070 }, { - "epoch": 0.14, - "learning_rate": 0.000278749918016659, - "loss": 0.0355, + "epoch": 0.07, + "learning_rate": 0.0002890818884289273, + "loss": 0.0357, "step": 28080 }, { - "epoch": 0.14, - "learning_rate": 0.000278742350323645, - "loss": 0.0232, + "epoch": 0.07, + "learning_rate": 0.0002890780002125558, + "loss": 0.0356, "step": 28090 }, { - "epoch": 0.14, - "learning_rate": 0.000278734782630631, - "loss": 0.0242, + "epoch": 0.07, + "learning_rate": 0.00028907411199618436, + "loss": 0.0343, "step": 28100 }, { - "epoch": 0.14, - "learning_rate": 0.00027872721493761696, - "loss": 0.024, + "epoch": 0.07, + "learning_rate": 0.00028907022377981287, + "loss": 0.0389, "step": 28110 }, { - "epoch": 0.14, - "learning_rate": 0.00027871964724460294, - "loss": 0.0248, + "epoch": 0.07, + "learning_rate": 0.00028906633556344144, + "loss": 0.0303, "step": 28120 }, { - "epoch": 0.14, - "learning_rate": 0.000278712079551589, - "loss": 0.0276, + "epoch": 0.07, + "learning_rate": 0.00028906244734706996, + "loss": 0.0359, "step": 28130 }, { - "epoch": 0.14, - "learning_rate": 0.00027870451185857495, - "loss": 0.0257, + "epoch": 0.07, + "learning_rate": 0.00028905855913069847, + "loss": 0.0319, "step": 28140 }, { - "epoch": 0.14, - "learning_rate": 0.00027869694416556094, - "loss": 0.0262, + "epoch": 0.07, + "learning_rate": 0.000289054670914327, + "loss": 0.0268, "step": 28150 }, { - "epoch": 0.14, - "learning_rate": 0.0002786893764725469, - "loss": 0.0285, + "epoch": 0.07, + "learning_rate": 0.00028905078269795555, + "loss": 0.0301, "step": 28160 }, { - "epoch": 0.14, - "learning_rate": 0.0002786818087795329, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00028904689448158407, + "loss": 0.0348, "step": 28170 }, { - "epoch": 0.14, - "learning_rate": 0.0002786742410865189, - "loss": 0.0282, + "epoch": 0.07, + "learning_rate": 0.00028904300626521264, + "loss": 0.0315, "step": 28180 }, { - "epoch": 0.14, - "learning_rate": 0.0002786666733935049, - "loss": 0.0276, + "epoch": 0.07, + "learning_rate": 0.00028903911804884115, + "loss": 0.0329, "step": 28190 }, { - "epoch": 0.14, - "learning_rate": 0.0002786591057004909, - "loss": 0.0262, + "epoch": 0.07, + "learning_rate": 0.0002890352298324697, + "loss": 0.0283, "step": 28200 }, { - "epoch": 0.14, - "learning_rate": 0.0002786515380074769, - "loss": 0.0309, + "epoch": 0.07, + "learning_rate": 0.00028903134161609823, + "loss": 0.0328, "step": 28210 }, { - "epoch": 0.14, - "learning_rate": 0.00027864397031446286, - "loss": 0.027, + "epoch": 0.07, + "learning_rate": 0.00028902745339972675, + "loss": 0.0257, "step": 28220 }, { - "epoch": 0.14, - "learning_rate": 0.00027863640262144884, - "loss": 0.028, + "epoch": 0.07, + "learning_rate": 0.00028902356518335526, + "loss": 0.0321, "step": 28230 }, { - "epoch": 0.14, - "learning_rate": 0.0002786288349284348, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028901967696698383, + "loss": 0.0426, "step": 28240 }, { - "epoch": 0.14, - "learning_rate": 0.0002786212672354208, - "loss": 0.0252, + "epoch": 0.07, + "learning_rate": 0.0002890157887506124, + "loss": 0.0314, "step": 28250 }, { - "epoch": 0.14, - "learning_rate": 0.00027861369954240684, - "loss": 0.0231, + "epoch": 0.07, + "learning_rate": 0.0002890119005342409, + "loss": 0.0341, "step": 28260 }, { - "epoch": 0.14, - "learning_rate": 0.0002786061318493928, - "loss": 0.0324, + "epoch": 0.07, + "learning_rate": 0.00028900801231786943, + "loss": 0.0303, "step": 28270 }, { - "epoch": 0.14, - "learning_rate": 0.00027859856415637875, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.000289004124101498, + "loss": 0.0337, "step": 28280 }, { - "epoch": 0.14, - "learning_rate": 0.00027859099646336473, - "loss": 0.0323, + "epoch": 0.07, + "learning_rate": 0.0002890002358851265, + "loss": 0.0356, "step": 28290 }, { - "epoch": 0.14, - "learning_rate": 0.00027858342877035077, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028899634766875503, + "loss": 0.0282, "step": 28300 }, { - "epoch": 0.14, - "learning_rate": 0.00027857586107733675, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.0002889924594523836, + "loss": 0.0354, "step": 28310 }, { - "epoch": 0.14, - "learning_rate": 0.00027856829338432273, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.0002889885712360121, + "loss": 0.0336, "step": 28320 }, { - "epoch": 0.14, - "learning_rate": 0.0002785607256913087, - "loss": 0.0289, + "epoch": 0.07, + "learning_rate": 0.0002889846830196407, + "loss": 0.0272, "step": 28330 }, { - "epoch": 0.14, - "learning_rate": 0.0002785531579982947, - "loss": 0.0295, + "epoch": 0.07, + "learning_rate": 0.0002889807948032692, + "loss": 0.039, "step": 28340 }, { - "epoch": 0.14, - "learning_rate": 0.0002785455903052807, - "loss": 0.0278, + "epoch": 0.07, + "learning_rate": 0.0002889769065868977, + "loss": 0.0331, "step": 28350 }, { - "epoch": 0.14, - "learning_rate": 0.0002785380226122667, - "loss": 0.0243, + "epoch": 0.07, + "learning_rate": 0.0002889730183705262, + "loss": 0.0309, "step": 28360 }, { - "epoch": 0.14, - "learning_rate": 0.0002785304549192527, - "loss": 0.0245, + "epoch": 0.07, + "learning_rate": 0.0002889691301541548, + "loss": 0.0328, "step": 28370 }, { - "epoch": 0.14, - "learning_rate": 0.00027852288722623867, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.0002889652419377833, + "loss": 0.0331, "step": 28380 }, { - "epoch": 0.14, - "learning_rate": 0.00027851531953322465, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.0002889613537214119, + "loss": 0.0305, "step": 28390 }, { - "epoch": 0.14, - "learning_rate": 0.00027850775184021064, - "loss": 0.0339, + "epoch": 0.07, + "learning_rate": 0.0002889574655050404, + "loss": 0.0328, "step": 28400 }, { - "epoch": 0.14, - "learning_rate": 0.0002785001841471966, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.00028895357728866896, + "loss": 0.0326, "step": 28410 }, { - "epoch": 0.14, - "learning_rate": 0.00027849261645418265, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.0002889496890722975, + "loss": 0.0326, "step": 28420 }, { - "epoch": 0.14, - "learning_rate": 0.00027848504876116863, - "loss": 0.0304, + "epoch": 0.07, + "learning_rate": 0.000288945800855926, + "loss": 0.0333, "step": 28430 }, { - "epoch": 0.14, - "learning_rate": 0.0002784774810681546, - "loss": 0.0308, + "epoch": 0.07, + "learning_rate": 0.0002889419126395545, + "loss": 0.0292, "step": 28440 }, { - "epoch": 0.14, - "learning_rate": 0.0002784699133751406, - "loss": 0.0263, + "epoch": 0.07, + "learning_rate": 0.00028893802442318307, + "loss": 0.0374, "step": 28450 }, { - "epoch": 0.14, - "learning_rate": 0.0002784623456821266, - "loss": 0.0257, + "epoch": 0.07, + "learning_rate": 0.00028893413620681164, + "loss": 0.0346, "step": 28460 }, { - "epoch": 0.14, - "learning_rate": 0.00027845477798911256, - "loss": 0.0271, + "epoch": 0.07, + "learning_rate": 0.00028893024799044015, + "loss": 0.0338, "step": 28470 }, { - "epoch": 0.14, - "learning_rate": 0.00027844721029609854, - "loss": 0.0242, + "epoch": 0.07, + "learning_rate": 0.00028892635977406867, + "loss": 0.032, "step": 28480 }, { - "epoch": 0.14, - "learning_rate": 0.0002784396426030846, - "loss": 0.0299, + "epoch": 0.07, + "learning_rate": 0.00028892247155769724, + "loss": 0.0345, "step": 28490 }, { - "epoch": 0.14, - "learning_rate": 0.00027843207491007056, - "loss": 0.0269, + "epoch": 0.07, + "learning_rate": 0.00028891858334132575, + "loss": 0.0358, "step": 28500 }, { - "epoch": 0.14, - "learning_rate": 0.00027842450721705654, - "loss": 0.0218, + "epoch": 0.07, + "learning_rate": 0.00028891469512495427, + "loss": 0.0346, "step": 28510 }, { - "epoch": 0.14, - "learning_rate": 0.0002784169395240425, - "loss": 0.0264, + "epoch": 0.07, + "learning_rate": 0.00028891080690858284, + "loss": 0.0403, "step": 28520 }, { - "epoch": 0.14, - "learning_rate": 0.0002784093718310285, - "loss": 0.0277, + "epoch": 0.07, + "learning_rate": 0.00028890691869221135, + "loss": 0.0347, "step": 28530 }, { - "epoch": 0.14, - "learning_rate": 0.0002784018041380145, - "loss": 0.022, + "epoch": 0.07, + "learning_rate": 0.0002889030304758399, + "loss": 0.0312, "step": 28540 }, { - "epoch": 0.14, - "learning_rate": 0.0002783942364450005, - "loss": 0.0259, + "epoch": 0.07, + "learning_rate": 0.00028889914225946843, + "loss": 0.0315, "step": 28550 }, { - "epoch": 0.14, - "learning_rate": 0.0002783866687519865, - "loss": 0.0247, + "epoch": 0.07, + "learning_rate": 0.00028889525404309695, + "loss": 0.0325, "step": 28560 }, { - "epoch": 0.14, - "learning_rate": 0.0002783791010589725, - "loss": 0.0326, + "epoch": 0.07, + "learning_rate": 0.00028889136582672546, + "loss": 0.0344, "step": 28570 }, { - "epoch": 0.14, - "learning_rate": 0.00027837153336595846, - "loss": 0.0264, + "epoch": 0.07, + "learning_rate": 0.00028888747761035403, + "loss": 0.0315, "step": 28580 }, { - "epoch": 0.14, - "learning_rate": 0.00027836396567294445, - "loss": 0.0302, + "epoch": 0.07, + "learning_rate": 0.0002888835893939826, + "loss": 0.0466, "step": 28590 }, { - "epoch": 0.14, - "learning_rate": 0.0002783563979799304, - "loss": 0.0238, + "epoch": 0.07, + "learning_rate": 0.0002888797011776111, + "loss": 0.0387, "step": 28600 }, { - "epoch": 0.14, - "learning_rate": 0.00027834883028691646, - "loss": 0.0248, + "epoch": 0.07, + "learning_rate": 0.00028887581296123963, + "loss": 0.03, "step": 28610 }, { - "epoch": 0.14, - "learning_rate": 0.00027834126259390244, - "loss": 0.0241, + "epoch": 0.07, + "learning_rate": 0.0002888719247448682, + "loss": 0.0335, "step": 28620 }, { - "epoch": 0.14, - "learning_rate": 0.0002783336949008884, - "loss": 0.0256, + "epoch": 0.07, + "learning_rate": 0.0002888680365284967, + "loss": 0.0349, "step": 28630 }, { - "epoch": 0.14, - "learning_rate": 0.0002783261272078744, - "loss": 0.0241, + "epoch": 0.07, + "learning_rate": 0.0002888641483121252, + "loss": 0.0327, "step": 28640 }, { - "epoch": 0.14, - "learning_rate": 0.0002783185595148604, - "loss": 0.0243, + "epoch": 0.07, + "learning_rate": 0.0002888602600957538, + "loss": 0.0487, "step": 28650 }, { - "epoch": 0.14, - "learning_rate": 0.00027831099182184637, - "loss": 0.0278, + "epoch": 0.07, + "learning_rate": 0.0002888563718793823, + "loss": 0.0422, "step": 28660 }, { - "epoch": 0.14, - "learning_rate": 0.00027830342412883235, - "loss": 0.0215, + "epoch": 0.07, + "learning_rate": 0.0002888524836630109, + "loss": 0.0338, "step": 28670 }, { - "epoch": 0.14, - "learning_rate": 0.0002782958564358184, - "loss": 0.0272, + "epoch": 0.07, + "learning_rate": 0.0002888485954466394, + "loss": 0.0331, "step": 28680 }, { - "epoch": 0.14, - "learning_rate": 0.00027828828874280437, - "loss": 0.0275, + "epoch": 0.07, + "learning_rate": 0.0002888447072302679, + "loss": 0.0352, "step": 28690 }, { - "epoch": 0.14, - "learning_rate": 0.00027828072104979035, - "loss": 0.0244, + "epoch": 0.07, + "learning_rate": 0.0002888408190138965, + "loss": 0.0318, "step": 28700 }, { - "epoch": 0.14, - "learning_rate": 0.00027827315335677633, - "loss": 0.0249, + "epoch": 0.07, + "learning_rate": 0.000288836930797525, + "loss": 0.0325, "step": 28710 }, { - "epoch": 0.14, - "learning_rate": 0.0002782655856637623, - "loss": 0.0267, + "epoch": 0.07, + "learning_rate": 0.0002888330425811535, + "loss": 0.0363, "step": 28720 }, { - "epoch": 0.14, - "learning_rate": 0.0002782580179707483, - "loss": 0.0328, + "epoch": 0.07, + "learning_rate": 0.0002888291543647821, + "loss": 0.0294, "step": 28730 }, { - "epoch": 0.14, - "learning_rate": 0.00027825045027773433, - "loss": 0.0308, + "epoch": 0.07, + "learning_rate": 0.00028882526614841064, + "loss": 0.0366, "step": 28740 }, { - "epoch": 0.15, - "learning_rate": 0.0002782428825847203, - "loss": 0.0261, + "epoch": 0.07, + "learning_rate": 0.00028882137793203916, + "loss": 0.0347, "step": 28750 }, { - "epoch": 0.15, - "learning_rate": 0.0002782353148917063, - "loss": 0.0326, + "epoch": 0.07, + "learning_rate": 0.00028881748971566767, + "loss": 0.0305, "step": 28760 }, { - "epoch": 0.15, - "learning_rate": 0.0002782277471986923, - "loss": 0.0281, + "epoch": 0.07, + "learning_rate": 0.0002888136014992962, + "loss": 0.0282, "step": 28770 }, { - "epoch": 0.15, - "learning_rate": 0.00027822017950567826, - "loss": 0.0258, + "epoch": 0.07, + "learning_rate": 0.00028880971328292476, + "loss": 0.0287, "step": 28780 }, { - "epoch": 0.15, - "learning_rate": 0.00027821261181266424, - "loss": 0.0279, + "epoch": 0.07, + "learning_rate": 0.00028880582506655327, + "loss": 0.029, "step": 28790 }, { - "epoch": 0.15, - "learning_rate": 0.0002782050441196502, - "loss": 0.0553, + "epoch": 0.07, + "learning_rate": 0.00028880193685018184, + "loss": 0.0328, "step": 28800 }, { - "epoch": 0.15, - "learning_rate": 0.00027819747642663625, - "loss": 0.0291, + "epoch": 0.07, + "learning_rate": 0.00028879804863381035, + "loss": 0.0293, "step": 28810 }, { - "epoch": 0.15, - "learning_rate": 0.00027818990873362224, - "loss": 0.0254, + "epoch": 0.07, + "learning_rate": 0.00028879416041743887, + "loss": 0.0347, "step": 28820 }, { - "epoch": 0.15, - "learning_rate": 0.0002781823410406082, - "loss": 0.0298, + "epoch": 0.07, + "learning_rate": 0.00028879027220106744, + "loss": 0.0318, "step": 28830 }, { - "epoch": 0.15, - "learning_rate": 0.0002781747733475942, - "loss": 0.0266, + "epoch": 0.07, + "learning_rate": 0.00028878638398469595, + "loss": 0.0332, "step": 28840 }, { - "epoch": 0.15, - "learning_rate": 0.0002781672056545802, - "loss": 0.025, + "epoch": 0.07, + "learning_rate": 0.00028878249576832447, + "loss": 0.0395, "step": 28850 }, { - "epoch": 0.15, - "learning_rate": 0.00027815963796156616, - "loss": 0.0223, + "epoch": 0.07, + "learning_rate": 0.00028877860755195303, + "loss": 0.0373, "step": 28860 }, { - "epoch": 0.15, - "learning_rate": 0.0002781520702685522, - "loss": 0.0274, + "epoch": 0.07, + "learning_rate": 0.00028877471933558155, + "loss": 0.0273, "step": 28870 }, { - "epoch": 0.15, - "learning_rate": 0.0002781445025755382, - "loss": 0.0294, + "epoch": 0.07, + "learning_rate": 0.0002887708311192101, + "loss": 0.0367, "step": 28880 }, { - "epoch": 0.15, - "learning_rate": 0.00027813693488252416, - "loss": 0.021, + "epoch": 0.07, + "learning_rate": 0.00028876694290283863, + "loss": 0.0304, "step": 28890 }, { - "epoch": 0.15, - "learning_rate": 0.00027812936718951014, - "loss": 0.0343, + "epoch": 0.07, + "learning_rate": 0.00028876305468646715, + "loss": 0.0342, "step": 28900 }, { - "epoch": 0.15, - "learning_rate": 0.0002781217994964961, - "loss": 0.0349, + "epoch": 0.07, + "learning_rate": 0.0002887591664700957, + "loss": 0.0293, "step": 28910 }, { - "epoch": 0.15, - "learning_rate": 0.0002781142318034821, - "loss": 0.028, + "epoch": 0.07, + "learning_rate": 0.00028875527825372423, + "loss": 0.0299, "step": 28920 }, { - "epoch": 0.15, - "learning_rate": 0.00027810666411046814, - "loss": 0.0245, + "epoch": 0.07, + "learning_rate": 0.00028875139003735274, + "loss": 0.0288, "step": 28930 }, { - "epoch": 0.15, - "learning_rate": 0.0002780990964174541, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.0002887475018209813, + "loss": 0.0382, "step": 28940 }, { - "epoch": 0.15, - "learning_rate": 0.0002780915287244401, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.0002887436136046099, + "loss": 0.0306, "step": 28950 }, { - "epoch": 0.15, - "learning_rate": 0.0002780839610314261, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.0002887397253882384, + "loss": 0.038, "step": 28960 }, { - "epoch": 0.15, - "learning_rate": 0.00027807639333841207, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002887358371718669, + "loss": 0.0357, "step": 28970 }, { - "epoch": 0.15, - "learning_rate": 0.00027806882564539805, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.0002887319489554954, + "loss": 0.0379, "step": 28980 }, { - "epoch": 0.15, - "learning_rate": 0.00027806125795238403, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.000288728060739124, + "loss": 0.0357, "step": 28990 }, { - "epoch": 0.15, - "learning_rate": 0.00027805369025937006, - "loss": 0.0245, + "epoch": 0.08, + "learning_rate": 0.0002887241725227525, + "loss": 0.0386, "step": 29000 }, { - "epoch": 0.15, - "eval_cer": 0.914481900656667, - "eval_loss": 0.019330712035298347, - "eval_runtime": 117.3753, - "eval_samples_per_second": 17.039, - "eval_steps_per_second": 4.26, + "epoch": 0.08, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.025074917823076248, + "eval_runtime": 107.6332, + "eval_samples_per_second": 18.582, + "eval_steps_per_second": 4.645, "step": 29000 }, { - "epoch": 0.15, - "learning_rate": 0.00027804612256635605, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.0002887202843063811, + "loss": 0.0372, "step": 29010 }, { - "epoch": 0.15, - "learning_rate": 0.000278038554873342, - "loss": 0.0276, + "epoch": 0.08, + "learning_rate": 0.0002887163960900096, + "loss": 0.0475, "step": 29020 }, { - "epoch": 0.15, - "learning_rate": 0.000278030987180328, - "loss": 0.0246, + "epoch": 0.08, + "learning_rate": 0.0002887125078736381, + "loss": 0.0303, "step": 29030 }, { - "epoch": 0.15, - "learning_rate": 0.000278023419487314, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.0002887086196572667, + "loss": 0.0469, "step": 29040 }, { - "epoch": 0.15, - "learning_rate": 0.00027801585179429997, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002887047314408952, + "loss": 0.0362, "step": 29050 }, { - "epoch": 0.15, - "learning_rate": 0.000278008284101286, - "loss": 0.0284, + "epoch": 0.08, + "learning_rate": 0.0002887008432245237, + "loss": 0.0339, "step": 29060 }, { - "epoch": 0.15, - "learning_rate": 0.000278000716408272, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.0002886969550081523, + "loss": 0.0362, "step": 29070 }, { - "epoch": 0.15, - "learning_rate": 0.00027799314871525797, - "loss": 0.0235, + "epoch": 0.08, + "learning_rate": 0.0002886930667917808, + "loss": 0.0383, "step": 29080 }, { - "epoch": 0.15, - "learning_rate": 0.00027798558102224395, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.00028868917857540936, + "loss": 0.0317, "step": 29090 }, { - "epoch": 0.15, - "learning_rate": 0.00027797801332922993, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.00028868529035903787, + "loss": 0.037, "step": 29100 }, { - "epoch": 0.15, - "learning_rate": 0.0002779704456362159, - "loss": 0.0223, + "epoch": 0.08, + "learning_rate": 0.0002886814021426664, + "loss": 0.0378, "step": 29110 }, { - "epoch": 0.15, - "learning_rate": 0.00027796287794320195, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.00028867751392629495, + "loss": 0.032, "step": 29120 }, { - "epoch": 0.15, - "learning_rate": 0.00027795531025018793, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.00028867362570992347, + "loss": 0.035, "step": 29130 }, { - "epoch": 0.15, - "learning_rate": 0.0002779477425571739, - "loss": 0.0279, + "epoch": 0.08, + "learning_rate": 0.00028866973749355204, + "loss": 0.0373, "step": 29140 }, { - "epoch": 0.15, - "learning_rate": 0.0002779401748641599, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.00028866584927718055, + "loss": 0.0312, "step": 29150 }, { - "epoch": 0.15, - "learning_rate": 0.0002779326071711459, - "loss": 0.0221, + "epoch": 0.08, + "learning_rate": 0.0002886619610608091, + "loss": 0.0383, "step": 29160 }, { - "epoch": 0.15, - "learning_rate": 0.00027792503947813186, - "loss": 0.0285, + "epoch": 0.08, + "learning_rate": 0.00028865807284443764, + "loss": 0.0414, "step": 29170 }, { - "epoch": 0.15, - "learning_rate": 0.00027791747178511784, - "loss": 0.0282, + "epoch": 0.08, + "learning_rate": 0.00028865418462806615, + "loss": 0.0331, "step": 29180 }, { - "epoch": 0.15, - "learning_rate": 0.0002779099040921039, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028865029641169466, + "loss": 0.0357, "step": 29190 }, { - "epoch": 0.15, - "learning_rate": 0.00027790233639908986, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028864640819532323, + "loss": 0.0307, "step": 29200 }, { - "epoch": 0.15, - "learning_rate": 0.00027789476870607584, - "loss": 0.0211, + "epoch": 0.08, + "learning_rate": 0.00028864251997895175, + "loss": 0.0375, "step": 29210 }, { - "epoch": 0.15, - "learning_rate": 0.0002778872010130618, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.0002886386317625803, + "loss": 0.0391, "step": 29220 }, { - "epoch": 0.15, - "learning_rate": 0.0002778796333200478, - "loss": 0.0257, + "epoch": 0.08, + "learning_rate": 0.00028863474354620883, + "loss": 0.0402, "step": 29230 }, { - "epoch": 0.15, - "learning_rate": 0.0002778720656270338, - "loss": 0.0246, + "epoch": 0.08, + "learning_rate": 0.0002886308553298374, + "loss": 0.0324, "step": 29240 }, { - "epoch": 0.15, - "learning_rate": 0.0002778644979340198, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.0002886269671134659, + "loss": 0.034, "step": 29250 }, { - "epoch": 0.15, - "learning_rate": 0.0002778569302410058, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028862307889709443, + "loss": 0.0355, "step": 29260 }, { - "epoch": 0.15, - "learning_rate": 0.0002778493625479918, - "loss": 0.0322, + "epoch": 0.08, + "learning_rate": 0.00028861919068072294, + "loss": 0.0317, "step": 29270 }, { - "epoch": 0.15, - "learning_rate": 0.00027784179485497776, - "loss": 0.0275, + "epoch": 0.08, + "learning_rate": 0.0002886153024643515, + "loss": 0.0336, "step": 29280 }, { - "epoch": 0.15, - "learning_rate": 0.00027783422716196374, - "loss": 0.038, + "epoch": 0.08, + "learning_rate": 0.0002886114142479801, + "loss": 0.0366, "step": 29290 }, { - "epoch": 0.15, - "learning_rate": 0.0002778266594689497, - "loss": 0.0285, + "epoch": 0.08, + "learning_rate": 0.0002886075260316086, + "loss": 0.0272, "step": 29300 }, { - "epoch": 0.15, - "learning_rate": 0.0002778190917759357, - "loss": 0.0286, + "epoch": 0.08, + "learning_rate": 0.0002886036378152371, + "loss": 0.0328, "step": 29310 }, { - "epoch": 0.15, - "learning_rate": 0.00027781152408292174, - "loss": 0.0296, + "epoch": 0.08, + "learning_rate": 0.0002885997495988656, + "loss": 0.0319, "step": 29320 }, { - "epoch": 0.15, - "learning_rate": 0.0002778039563899077, - "loss": 0.0242, + "epoch": 0.08, + "learning_rate": 0.0002885958613824942, + "loss": 0.0321, "step": 29330 }, { - "epoch": 0.15, - "learning_rate": 0.0002777963886968937, - "loss": 0.0275, + "epoch": 0.08, + "learning_rate": 0.0002885919731661227, + "loss": 0.0425, "step": 29340 }, { - "epoch": 0.15, - "learning_rate": 0.0002777888210038797, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002885880849497513, + "loss": 0.0501, "step": 29350 }, { - "epoch": 0.15, - "learning_rate": 0.00027778125331086567, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002885841967333798, + "loss": 0.0415, "step": 29360 }, { - "epoch": 0.15, - "learning_rate": 0.00027777368561785165, - "loss": 0.0303, + "epoch": 0.08, + "learning_rate": 0.00028858030851700836, + "loss": 0.0321, "step": 29370 }, { - "epoch": 0.15, - "learning_rate": 0.0002777661179248377, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002885764203006369, + "loss": 0.0336, "step": 29380 }, { - "epoch": 0.15, - "learning_rate": 0.00027775855023182367, - "loss": 0.0271, + "epoch": 0.08, + "learning_rate": 0.0002885725320842654, + "loss": 0.0342, "step": 29390 }, { - "epoch": 0.15, - "learning_rate": 0.00027775098253880965, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.0002885686438678939, + "loss": 0.0331, "step": 29400 }, { - "epoch": 0.15, - "learning_rate": 0.00027774341484579563, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.00028856475565152247, + "loss": 0.0329, "step": 29410 }, { - "epoch": 0.15, - "learning_rate": 0.0002777358471527816, - "loss": 0.023, + "epoch": 0.08, + "learning_rate": 0.000288560867435151, + "loss": 0.0275, "step": 29420 }, { - "epoch": 0.15, - "learning_rate": 0.0002777282794597676, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.00028855697921877956, + "loss": 0.031, "step": 29430 }, { - "epoch": 0.15, - "learning_rate": 0.0002777207117667536, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.00028855309100240807, + "loss": 0.0302, "step": 29440 }, { - "epoch": 0.15, - "learning_rate": 0.0002777131440737396, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.00028854920278603664, + "loss": 0.0327, "step": 29450 }, { - "epoch": 0.15, - "learning_rate": 0.0002777055763807256, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.00028854531456966515, + "loss": 0.0299, "step": 29460 }, { - "epoch": 0.15, - "learning_rate": 0.00027769800868771157, - "loss": 0.0234, + "epoch": 0.08, + "learning_rate": 0.00028854142635329367, + "loss": 0.0373, "step": 29470 }, { - "epoch": 0.15, - "learning_rate": 0.00027769044099469755, - "loss": 0.0261, + "epoch": 0.08, + "learning_rate": 0.0002885375381369222, + "loss": 0.0286, "step": 29480 }, { - "epoch": 0.15, - "learning_rate": 0.00027768287330168353, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.00028853364992055075, + "loss": 0.0327, "step": 29490 }, { - "epoch": 0.15, - "learning_rate": 0.0002776753056086695, - "loss": 0.0213, + "epoch": 0.08, + "learning_rate": 0.0002885297617041793, + "loss": 0.0321, "step": 29500 }, { - "epoch": 0.15, - "learning_rate": 0.00027766773791565555, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.00028852587348780783, + "loss": 0.0366, "step": 29510 }, { - "epoch": 0.15, - "learning_rate": 0.00027766017022264153, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.00028852198527143635, + "loss": 0.0285, "step": 29520 }, { - "epoch": 0.15, - "learning_rate": 0.0002776526025296275, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.00028851809705506486, + "loss": 0.0406, "step": 29530 }, { - "epoch": 0.15, - "learning_rate": 0.00027764503483661344, - "loss": 0.0273, + "epoch": 0.08, + "learning_rate": 0.00028851420883869343, + "loss": 0.0319, "step": 29540 }, { - "epoch": 0.15, - "learning_rate": 0.0002776374671435995, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.00028851032062232195, + "loss": 0.0315, "step": 29550 }, { - "epoch": 0.15, - "learning_rate": 0.00027762989945058546, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.0002885064324059505, + "loss": 0.025, "step": 29560 }, { - "epoch": 0.15, - "learning_rate": 0.00027762233175757144, - "loss": 0.0302, + "epoch": 0.08, + "learning_rate": 0.00028850254418957903, + "loss": 0.0294, "step": 29570 }, { - "epoch": 0.15, - "learning_rate": 0.0002776147640645574, - "loss": 0.034, + "epoch": 0.08, + "learning_rate": 0.0002884986559732076, + "loss": 0.0326, "step": 29580 }, { - "epoch": 0.15, - "learning_rate": 0.0002776071963715434, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.0002884947677568361, + "loss": 0.0372, "step": 29590 }, { - "epoch": 0.15, - "learning_rate": 0.0002775996286785294, - "loss": 0.0234, + "epoch": 0.08, + "learning_rate": 0.00028849087954046463, + "loss": 0.0328, "step": 29600 }, { - "epoch": 0.15, - "learning_rate": 0.0002775920609855154, - "loss": 0.0261, + "epoch": 0.08, + "learning_rate": 0.00028848699132409314, + "loss": 0.0367, "step": 29610 }, { - "epoch": 0.15, - "learning_rate": 0.0002775844932925014, - "loss": 0.0279, + "epoch": 0.08, + "learning_rate": 0.0002884831031077217, + "loss": 0.0265, "step": 29620 }, { - "epoch": 0.15, - "learning_rate": 0.0002775769255994874, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.0002884792148913502, + "loss": 0.0367, "step": 29630 }, { - "epoch": 0.15, - "learning_rate": 0.00027756935790647336, - "loss": 0.0304, + "epoch": 0.08, + "learning_rate": 0.0002884753266749788, + "loss": 0.0323, "step": 29640 }, { - "epoch": 0.15, - "learning_rate": 0.00027756179021345935, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.0002884714384586073, + "loss": 0.0297, "step": 29650 }, { - "epoch": 0.15, - "learning_rate": 0.0002775542225204453, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.0002884675502422359, + "loss": 0.0381, "step": 29660 }, { - "epoch": 0.15, - "learning_rate": 0.00027754665482743136, - "loss": 0.0304, + "epoch": 0.08, + "learning_rate": 0.0002884636620258644, + "loss": 0.0275, "step": 29670 }, { - "epoch": 0.15, - "learning_rate": 0.00027753908713441734, - "loss": 0.024, + "epoch": 0.08, + "learning_rate": 0.0002884597738094929, + "loss": 0.0308, "step": 29680 }, { - "epoch": 0.15, - "learning_rate": 0.0002775315194414033, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.0002884558855931215, + "loss": 0.035, "step": 29690 }, { - "epoch": 0.15, - "learning_rate": 0.0002775239517483893, - "loss": 0.0217, + "epoch": 0.08, + "learning_rate": 0.00028845199737675, + "loss": 0.0338, "step": 29700 }, { - "epoch": 0.15, - "learning_rate": 0.0002775163840553753, - "loss": 0.0248, + "epoch": 0.08, + "learning_rate": 0.00028844810916037856, + "loss": 0.0297, "step": 29710 }, { - "epoch": 0.15, - "learning_rate": 0.00027750881636236127, - "loss": 0.0237, + "epoch": 0.08, + "learning_rate": 0.0002884442209440071, + "loss": 0.0256, "step": 29720 }, { - "epoch": 0.15, - "learning_rate": 0.00027750124866934725, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.0002884403327276356, + "loss": 0.0324, "step": 29730 }, { - "epoch": 0.15, - "learning_rate": 0.0002774936809763333, - "loss": 0.0284, + "epoch": 0.08, + "learning_rate": 0.00028843644451126416, + "loss": 0.0384, "step": 29740 }, { - "epoch": 0.15, - "learning_rate": 0.00027748611328331927, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028843255629489267, + "loss": 0.0324, "step": 29750 }, { - "epoch": 0.15, - "learning_rate": 0.00027747854559030525, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.0002884286680785212, + "loss": 0.0379, "step": 29760 }, { - "epoch": 0.15, - "learning_rate": 0.00027747097789729123, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.00028842477986214975, + "loss": 0.0283, "step": 29770 }, { - "epoch": 0.15, - "learning_rate": 0.0002774634102042772, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.00028842089164577827, + "loss": 0.0356, "step": 29780 }, { - "epoch": 0.15, - "learning_rate": 0.0002774558425112632, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028841700342940684, + "loss": 0.0307, "step": 29790 }, { - "epoch": 0.15, - "learning_rate": 0.00027744827481824923, - "loss": 0.0196, + "epoch": 0.08, + "learning_rate": 0.00028841311521303535, + "loss": 0.0298, "step": 29800 }, { - "epoch": 0.15, - "learning_rate": 0.0002774407071252352, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.00028840922699666387, + "loss": 0.0293, "step": 29810 }, { - "epoch": 0.15, - "learning_rate": 0.0002774331394322212, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.0002884053387802924, + "loss": 0.0339, "step": 29820 }, { - "epoch": 0.15, - "learning_rate": 0.0002774255717392072, - "loss": 0.0261, + "epoch": 0.08, + "learning_rate": 0.00028840145056392095, + "loss": 0.0323, "step": 29830 }, { - "epoch": 0.15, - "learning_rate": 0.00027741800404619316, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.0002883975623475495, + "loss": 0.0314, "step": 29840 }, { - "epoch": 0.15, - "learning_rate": 0.00027741043635317914, - "loss": 0.0293, + "epoch": 0.08, + "learning_rate": 0.00028839367413117803, + "loss": 0.0357, "step": 29850 }, { - "epoch": 0.15, - "learning_rate": 0.0002774028686601651, - "loss": 0.0241, + "epoch": 0.08, + "learning_rate": 0.00028838978591480655, + "loss": 0.0256, "step": 29860 }, { - "epoch": 0.15, - "learning_rate": 0.00027739530096715115, - "loss": 0.0231, + "epoch": 0.08, + "learning_rate": 0.0002883858976984351, + "loss": 0.0299, "step": 29870 }, { - "epoch": 0.15, - "learning_rate": 0.00027738773327413714, - "loss": 0.0228, + "epoch": 0.08, + "learning_rate": 0.00028838200948206363, + "loss": 0.0372, "step": 29880 }, { - "epoch": 0.15, - "learning_rate": 0.0002773801655811231, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.00028837812126569215, + "loss": 0.0332, "step": 29890 }, { - "epoch": 0.15, - "learning_rate": 0.0002773725978881091, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.0002883742330493207, + "loss": 0.0286, "step": 29900 }, { - "epoch": 0.15, - "learning_rate": 0.0002773650301950951, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.00028837034483294923, + "loss": 0.0302, "step": 29910 }, { - "epoch": 0.15, - "learning_rate": 0.00027735746250208106, - "loss": 0.0291, + "epoch": 0.08, + "learning_rate": 0.0002883664566165778, + "loss": 0.0327, "step": 29920 }, { - "epoch": 0.15, - "learning_rate": 0.0002773498948090671, - "loss": 0.0242, + "epoch": 0.08, + "learning_rate": 0.0002883625684002063, + "loss": 0.0326, "step": 29930 }, { - "epoch": 0.15, - "learning_rate": 0.0002773423271160531, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.0002883586801838348, + "loss": 0.0315, "step": 29940 }, { - "epoch": 0.15, - "learning_rate": 0.00027733475942303906, - "loss": 0.0286, + "epoch": 0.08, + "learning_rate": 0.0002883547919674634, + "loss": 0.0438, "step": 29950 }, { - "epoch": 0.15, - "learning_rate": 0.00027732719173002504, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.0002883509037510919, + "loss": 0.0303, "step": 29960 }, { - "epoch": 0.15, - "learning_rate": 0.000277319624037011, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.0002883470155347204, + "loss": 0.0308, "step": 29970 }, { - "epoch": 0.15, - "learning_rate": 0.000277312056343997, - "loss": 0.0295, + "epoch": 0.08, + "learning_rate": 0.000288343127318349, + "loss": 0.0305, "step": 29980 }, { - "epoch": 0.15, - "learning_rate": 0.00027730448865098304, - "loss": 0.0313, + "epoch": 0.08, + "learning_rate": 0.00028833923910197756, + "loss": 0.0316, "step": 29990 }, { - "epoch": 0.15, - "learning_rate": 0.000277296920957969, - "loss": 0.0226, + "epoch": 0.08, + "learning_rate": 0.0002883353508856061, + "loss": 0.0343, "step": 30000 }, { - "epoch": 0.15, - "eval_cer": 0.9144518183767796, - "eval_loss": 0.019204232841730118, - "eval_runtime": 117.3422, - "eval_samples_per_second": 17.044, - "eval_steps_per_second": 4.261, + "epoch": 0.08, + "eval_cer": 0.8817922630869552, + "eval_loss": 0.025351664051413536, + "eval_runtime": 107.6228, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 30000 }, { - "epoch": 0.15, - "learning_rate": 0.000277289353264955, - "loss": 0.0214, + "epoch": 0.08, + "learning_rate": 0.0002883314626692346, + "loss": 0.0313, "step": 30010 }, { - "epoch": 0.15, - "learning_rate": 0.000277281785571941, - "loss": 0.0318, + "epoch": 0.08, + "learning_rate": 0.0002883275744528631, + "loss": 0.0321, "step": 30020 }, { - "epoch": 0.15, - "learning_rate": 0.00027727421787892697, - "loss": 0.0273, + "epoch": 0.08, + "learning_rate": 0.0002883236862364916, + "loss": 0.0361, "step": 30030 }, { - "epoch": 0.15, - "learning_rate": 0.00027726665018591295, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002883197980201202, + "loss": 0.0415, "step": 30040 }, { - "epoch": 0.15, - "learning_rate": 0.00027725908249289893, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.00028831590980374876, + "loss": 0.0308, "step": 30050 }, { - "epoch": 0.15, - "learning_rate": 0.00027725151479988496, - "loss": 0.0308, + "epoch": 0.08, + "learning_rate": 0.00028831202158737727, + "loss": 0.0352, "step": 30060 }, { - "epoch": 0.15, - "learning_rate": 0.00027724394710687095, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.0002883081333710058, + "loss": 0.0298, "step": 30070 }, { - "epoch": 0.15, - "learning_rate": 0.0002772363794138569, - "loss": 0.0299, + "epoch": 0.08, + "learning_rate": 0.00028830424515463436, + "loss": 0.0322, "step": 30080 }, { - "epoch": 0.15, - "learning_rate": 0.0002772288117208429, - "loss": 0.03, + "epoch": 0.08, + "learning_rate": 0.00028830035693826287, + "loss": 0.0335, "step": 30090 }, { - "epoch": 0.15, - "learning_rate": 0.0002772212440278289, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.0002882964687218914, + "loss": 0.0322, "step": 30100 }, { - "epoch": 0.15, - "learning_rate": 0.00027721367633481487, - "loss": 0.0316, + "epoch": 0.08, + "learning_rate": 0.00028829258050551995, + "loss": 0.0349, "step": 30110 }, { - "epoch": 0.15, - "learning_rate": 0.0002772061086418009, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.00028828869228914847, + "loss": 0.0306, "step": 30120 }, { - "epoch": 0.15, - "learning_rate": 0.0002771985409487869, - "loss": 0.0273, + "epoch": 0.08, + "learning_rate": 0.00028828480407277704, + "loss": 0.0318, "step": 30130 }, { - "epoch": 0.15, - "learning_rate": 0.00027719097325577287, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.00028828091585640555, + "loss": 0.033, "step": 30140 }, { - "epoch": 0.15, - "learning_rate": 0.00027718340556275885, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.00028827702764003407, + "loss": 0.031, "step": 30150 }, { - "epoch": 0.15, - "learning_rate": 0.00027717583786974483, - "loss": 0.0293, + "epoch": 0.08, + "learning_rate": 0.00028827313942366263, + "loss": 0.0318, "step": 30160 }, { - "epoch": 0.15, - "learning_rate": 0.0002771682701767308, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.00028826925120729115, + "loss": 0.031, "step": 30170 }, { - "epoch": 0.15, - "learning_rate": 0.00027716070248371685, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.0002882653629909197, + "loss": 0.0347, "step": 30180 }, { - "epoch": 0.15, - "learning_rate": 0.00027715313479070283, - "loss": 0.0224, + "epoch": 0.08, + "learning_rate": 0.00028826147477454823, + "loss": 0.0335, "step": 30190 }, { - "epoch": 0.15, - "learning_rate": 0.0002771455670976888, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.0002882575865581768, + "loss": 0.033, "step": 30200 }, { - "epoch": 0.15, - "learning_rate": 0.0002771379994046748, - "loss": 0.0284, + "epoch": 0.08, + "learning_rate": 0.0002882536983418053, + "loss": 0.0303, "step": 30210 }, { - "epoch": 0.15, - "learning_rate": 0.0002771304317116608, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.00028824981012543383, + "loss": 0.031, "step": 30220 }, { - "epoch": 0.15, - "learning_rate": 0.00027712286401864676, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.00028824592190906234, + "loss": 0.0387, "step": 30230 }, { - "epoch": 0.15, - "learning_rate": 0.00027711529632563274, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.0002882420336926909, + "loss": 0.0299, "step": 30240 }, { - "epoch": 0.15, - "learning_rate": 0.0002771077286326188, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.00028823814547631943, + "loss": 0.034, "step": 30250 }, { - "epoch": 0.15, - "learning_rate": 0.00027710016093960476, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.000288234257259948, + "loss": 0.0368, "step": 30260 }, { - "epoch": 0.15, - "learning_rate": 0.00027709259324659074, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.0002882303690435765, + "loss": 0.0399, "step": 30270 }, { - "epoch": 0.15, - "learning_rate": 0.0002770850255535767, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.000288226480827205, + "loss": 0.0332, "step": 30280 }, { - "epoch": 0.15, - "learning_rate": 0.0002770774578605627, - "loss": 0.0328, + "epoch": 0.08, + "learning_rate": 0.0002882225926108336, + "loss": 0.0335, "step": 30290 }, { - "epoch": 0.15, - "learning_rate": 0.0002770698901675487, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.0002882187043944621, + "loss": 0.0334, "step": 30300 }, { - "epoch": 0.15, - "learning_rate": 0.0002770623224745347, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.0002882148161780906, + "loss": 0.0371, "step": 30310 }, { - "epoch": 0.15, - "learning_rate": 0.0002770547547815207, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.0002882109279617192, + "loss": 0.0328, "step": 30320 }, { - "epoch": 0.15, - "learning_rate": 0.0002770471870885067, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.00028820703974534776, + "loss": 0.0317, "step": 30330 }, { - "epoch": 0.15, - "learning_rate": 0.00027703961939549266, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.0002882031515289763, + "loss": 0.039, "step": 30340 }, { - "epoch": 0.15, - "learning_rate": 0.00027703205170247864, - "loss": 0.0257, + "epoch": 0.08, + "learning_rate": 0.0002881992633126048, + "loss": 0.0291, "step": 30350 }, { - "epoch": 0.15, - "learning_rate": 0.0002770244840094646, - "loss": 0.031, + "epoch": 0.08, + "learning_rate": 0.0002881953750962333, + "loss": 0.0364, "step": 30360 }, { - "epoch": 0.15, - "learning_rate": 0.0002770169163164506, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.00028819148687986187, + "loss": 0.0346, "step": 30370 }, { - "epoch": 0.15, - "learning_rate": 0.00027700934862343664, - "loss": 0.0271, + "epoch": 0.08, + "learning_rate": 0.0002881875986634904, + "loss": 0.0317, "step": 30380 }, { - "epoch": 0.15, - "learning_rate": 0.0002770017809304226, - "loss": 0.0275, + "epoch": 0.08, + "learning_rate": 0.00028818371044711896, + "loss": 0.0364, "step": 30390 }, { - "epoch": 0.15, - "learning_rate": 0.0002769942132374086, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.00028817982223074747, + "loss": 0.0364, "step": 30400 }, { - "epoch": 0.15, - "learning_rate": 0.0002769866455443946, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.00028817593401437604, + "loss": 0.0307, "step": 30410 }, { - "epoch": 0.15, - "learning_rate": 0.00027697907785138057, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028817204579800455, + "loss": 0.0359, "step": 30420 }, { - "epoch": 0.15, - "learning_rate": 0.00027697151015836655, - "loss": 0.039, + "epoch": 0.08, + "learning_rate": 0.00028816815758163307, + "loss": 0.0347, "step": 30430 }, { - "epoch": 0.15, - "learning_rate": 0.0002769639424653526, - "loss": 0.0278, + "epoch": 0.08, + "learning_rate": 0.0002881642693652616, + "loss": 0.0341, "step": 30440 }, { - "epoch": 0.15, - "learning_rate": 0.00027695637477233857, - "loss": 0.0306, + "epoch": 0.08, + "learning_rate": 0.00028816038114889015, + "loss": 0.0381, "step": 30450 }, { - "epoch": 0.15, - "learning_rate": 0.00027694880707932455, - "loss": 0.0284, + "epoch": 0.08, + "learning_rate": 0.00028815649293251867, + "loss": 0.0294, "step": 30460 }, { - "epoch": 0.15, - "learning_rate": 0.00027694123938631053, - "loss": 0.0228, + "epoch": 0.08, + "learning_rate": 0.00028815260471614723, + "loss": 0.0411, "step": 30470 }, { - "epoch": 0.15, - "learning_rate": 0.0002769336716932965, - "loss": 0.0214, + "epoch": 0.08, + "learning_rate": 0.00028814871649977575, + "loss": 0.033, "step": 30480 }, { - "epoch": 0.15, - "learning_rate": 0.0002769261040002825, - "loss": 0.0261, + "epoch": 0.08, + "learning_rate": 0.0002881448282834043, + "loss": 0.0317, "step": 30490 }, { - "epoch": 0.15, - "learning_rate": 0.0002769185363072685, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.00028814094006703283, + "loss": 0.028, "step": 30500 }, { - "epoch": 0.15, - "learning_rate": 0.0002769109686142545, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.00028813705185066135, + "loss": 0.0338, "step": 30510 }, { - "epoch": 0.15, - "learning_rate": 0.0002769034009212405, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.00028813316363428986, + "loss": 0.0351, "step": 30520 }, { - "epoch": 0.15, - "learning_rate": 0.00027689583322822647, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.00028812927541791843, + "loss": 0.028, "step": 30530 }, { - "epoch": 0.15, - "learning_rate": 0.00027688826553521245, - "loss": 0.0211, + "epoch": 0.08, + "learning_rate": 0.000288125387201547, + "loss": 0.0345, "step": 30540 }, { - "epoch": 0.15, - "learning_rate": 0.00027688069784219843, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.0002881214989851755, + "loss": 0.0317, "step": 30550 }, { - "epoch": 0.15, - "learning_rate": 0.0002768731301491844, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.00028811761076880403, + "loss": 0.0353, "step": 30560 }, { - "epoch": 0.15, - "learning_rate": 0.00027686556245617045, - "loss": 0.0195, + "epoch": 0.08, + "learning_rate": 0.00028811372255243254, + "loss": 0.031, "step": 30570 }, { - "epoch": 0.15, - "learning_rate": 0.00027685799476315643, - "loss": 0.0276, + "epoch": 0.08, + "learning_rate": 0.0002881098343360611, + "loss": 0.0313, "step": 30580 }, { - "epoch": 0.15, - "learning_rate": 0.0002768504270701424, - "loss": 0.0213, + "epoch": 0.08, + "learning_rate": 0.0002881059461196896, + "loss": 0.0326, "step": 30590 }, { - "epoch": 0.15, - "learning_rate": 0.0002768428593771284, - "loss": 0.0234, + "epoch": 0.08, + "learning_rate": 0.0002881020579033182, + "loss": 0.0322, "step": 30600 }, { - "epoch": 0.15, - "learning_rate": 0.0002768352916841144, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.0002880981696869467, + "loss": 0.0293, "step": 30610 }, { - "epoch": 0.15, - "learning_rate": 0.00027682772399110036, - "loss": 0.0246, + "epoch": 0.08, + "learning_rate": 0.0002880942814705753, + "loss": 0.0309, "step": 30620 }, { - "epoch": 0.15, - "learning_rate": 0.0002768201562980864, - "loss": 0.0295, + "epoch": 0.08, + "learning_rate": 0.0002880903932542038, + "loss": 0.0354, "step": 30630 }, { - "epoch": 0.15, - "learning_rate": 0.0002768125886050724, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002880865050378323, + "loss": 0.0312, "step": 30640 }, { - "epoch": 0.15, - "learning_rate": 0.00027680502091205836, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002880826168214608, + "loss": 0.0271, "step": 30650 }, { - "epoch": 0.15, - "learning_rate": 0.00027679745321904434, - "loss": 0.0241, + "epoch": 0.08, + "learning_rate": 0.0002880787286050894, + "loss": 0.0303, "step": 30660 }, { - "epoch": 0.15, - "learning_rate": 0.0002767898855260303, - "loss": 0.0441, + "epoch": 0.08, + "learning_rate": 0.0002880748403887179, + "loss": 0.036, "step": 30670 }, { - "epoch": 0.15, - "learning_rate": 0.0002767823178330163, - "loss": 0.0257, + "epoch": 0.08, + "learning_rate": 0.0002880709521723465, + "loss": 0.0343, "step": 30680 }, { - "epoch": 0.15, - "learning_rate": 0.00027677475014000234, - "loss": 0.029, + "epoch": 0.08, + "learning_rate": 0.000288067063955975, + "loss": 0.0343, "step": 30690 }, { - "epoch": 0.15, - "learning_rate": 0.0002767671824469883, - "loss": 0.0312, + "epoch": 0.08, + "learning_rate": 0.00028806317573960356, + "loss": 0.0337, "step": 30700 }, { - "epoch": 0.15, - "learning_rate": 0.0002767596147539743, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.00028805928752323207, + "loss": 0.0365, "step": 30710 }, { - "epoch": 0.15, - "learning_rate": 0.0002767520470609603, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.0002880553993068606, + "loss": 0.0289, "step": 30720 }, { - "epoch": 0.16, - "learning_rate": 0.00027674447936794626, - "loss": 0.0235, + "epoch": 0.08, + "learning_rate": 0.00028805151109048915, + "loss": 0.0342, "step": 30730 }, { - "epoch": 0.16, - "learning_rate": 0.00027673691167493224, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.00028804762287411767, + "loss": 0.0331, "step": 30740 }, { - "epoch": 0.16, - "learning_rate": 0.0002767293439819182, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028804373465774624, + "loss": 0.0298, "step": 30750 }, { - "epoch": 0.16, - "learning_rate": 0.00027672177628890426, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.00028803984644137475, + "loss": 0.0297, "step": 30760 }, { - "epoch": 0.16, - "learning_rate": 0.00027671420859589024, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.00028803595822500327, + "loss": 0.032, "step": 30770 }, { - "epoch": 0.16, - "learning_rate": 0.0002767066409028762, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.0002880320700086318, + "loss": 0.032, "step": 30780 }, { - "epoch": 0.16, - "learning_rate": 0.0002766990732098622, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.00028802818179226035, + "loss": 0.0379, "step": 30790 }, { - "epoch": 0.16, - "learning_rate": 0.0002766915055168482, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.00028802429357588887, + "loss": 0.0366, "step": 30800 }, { - "epoch": 0.16, - "learning_rate": 0.00027668393782383417, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.00028802040535951743, + "loss": 0.0324, "step": 30810 }, { - "epoch": 0.16, - "learning_rate": 0.00027667637013082015, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.00028801651714314595, + "loss": 0.0296, "step": 30820 }, { - "epoch": 0.16, - "learning_rate": 0.00027666880243780613, - "loss": 0.0303, + "epoch": 0.08, + "learning_rate": 0.0002880126289267745, + "loss": 0.0352, "step": 30830 }, { - "epoch": 0.16, - "learning_rate": 0.0002766612347447921, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028800874071040303, + "loss": 0.0351, "step": 30840 }, { - "epoch": 0.16, - "learning_rate": 0.0002766536670517781, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.00028800485249403155, + "loss": 0.0305, "step": 30850 }, { - "epoch": 0.16, - "learning_rate": 0.00027664609935876413, - "loss": 0.0243, + "epoch": 0.08, + "learning_rate": 0.00028800096427766006, + "loss": 0.0295, "step": 30860 }, { - "epoch": 0.16, - "learning_rate": 0.0002766385316657501, - "loss": 0.0242, + "epoch": 0.08, + "learning_rate": 0.00028799707606128863, + "loss": 0.0255, "step": 30870 }, { - "epoch": 0.16, - "learning_rate": 0.0002766309639727361, - "loss": 0.0213, + "epoch": 0.08, + "learning_rate": 0.0002879931878449172, + "loss": 0.0359, "step": 30880 }, { - "epoch": 0.16, - "learning_rate": 0.0002766233962797221, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.0002879892996285457, + "loss": 0.0283, "step": 30890 }, { - "epoch": 0.16, - "learning_rate": 0.00027661582858670806, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.00028798541141217423, + "loss": 0.0315, "step": 30900 }, { - "epoch": 0.16, - "learning_rate": 0.00027660826089369404, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.0002879815231958028, + "loss": 0.0365, "step": 30910 }, { - "epoch": 0.16, - "learning_rate": 0.00027660069320068007, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.0002879776349794313, + "loss": 0.0342, "step": 30920 }, { - "epoch": 0.16, - "learning_rate": 0.00027659312550766605, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.0002879737467630598, + "loss": 0.0349, "step": 30930 }, { - "epoch": 0.16, - "learning_rate": 0.00027658555781465204, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.0002879698585466884, + "loss": 0.037, "step": 30940 }, { - "epoch": 0.16, - "learning_rate": 0.000276577990121638, - "loss": 0.0231, + "epoch": 0.08, + "learning_rate": 0.0002879659703303169, + "loss": 0.0346, "step": 30950 }, { - "epoch": 0.16, - "learning_rate": 0.000276570422428624, - "loss": 0.0243, + "epoch": 0.08, + "learning_rate": 0.0002879620821139455, + "loss": 0.0316, "step": 30960 }, { - "epoch": 0.16, - "learning_rate": 0.00027656285473561, - "loss": 0.032, + "epoch": 0.08, + "learning_rate": 0.000287958193897574, + "loss": 0.0305, "step": 30970 }, { - "epoch": 0.16, - "learning_rate": 0.00027655528704259596, - "loss": 0.0222, + "epoch": 0.08, + "learning_rate": 0.0002879543056812025, + "loss": 0.0367, "step": 30980 }, { - "epoch": 0.16, - "learning_rate": 0.000276547719349582, - "loss": 0.0229, + "epoch": 0.08, + "learning_rate": 0.0002879504174648311, + "loss": 0.0339, "step": 30990 }, { - "epoch": 0.16, - "learning_rate": 0.000276540151656568, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.0002879465292484596, + "loss": 0.03, "step": 31000 }, { - "epoch": 0.16, - "eval_cer": 0.914447936792278, - "eval_loss": 0.018999282270669937, - "eval_runtime": 117.1152, - "eval_samples_per_second": 17.077, - "eval_steps_per_second": 4.269, + "epoch": 0.08, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.023973068222403526, + "eval_runtime": 107.5545, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, "step": 31000 }, { - "epoch": 0.16, - "learning_rate": 0.00027653258396355396, - "loss": 0.0254, + "epoch": 0.08, + "learning_rate": 0.0002879426410320881, + "loss": 0.0354, "step": 31010 }, { - "epoch": 0.16, - "learning_rate": 0.00027652501627053994, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028793875281571667, + "loss": 0.0306, "step": 31020 }, { - "epoch": 0.16, - "learning_rate": 0.0002765174485775259, - "loss": 0.0342, + "epoch": 0.08, + "learning_rate": 0.0002879348645993452, + "loss": 0.0324, "step": 31030 }, { - "epoch": 0.16, - "learning_rate": 0.0002765098808845119, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.00028793097638297376, + "loss": 0.0316, "step": 31040 }, { - "epoch": 0.16, - "learning_rate": 0.00027650231319149794, - "loss": 0.0225, + "epoch": 0.08, + "learning_rate": 0.00028792708816660227, + "loss": 0.0367, "step": 31050 }, { - "epoch": 0.16, - "learning_rate": 0.0002764947454984839, - "loss": 0.0251, + "epoch": 0.08, + "learning_rate": 0.0002879231999502308, + "loss": 0.0393, "step": 31060 }, { - "epoch": 0.16, - "learning_rate": 0.0002764871778054699, - "loss": 0.0287, + "epoch": 0.08, + "learning_rate": 0.0002879193117338593, + "loss": 0.0355, "step": 31070 }, { - "epoch": 0.16, - "learning_rate": 0.0002764796101124559, - "loss": 0.0304, + "epoch": 0.08, + "learning_rate": 0.00028791542351748787, + "loss": 0.0279, "step": 31080 }, { - "epoch": 0.16, - "learning_rate": 0.00027647204241944187, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.00028791153530111644, + "loss": 0.0308, "step": 31090 }, { - "epoch": 0.16, - "learning_rate": 0.00027646447472642785, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.00028790764708474495, + "loss": 0.0329, "step": 31100 }, { - "epoch": 0.16, - "learning_rate": 0.00027645690703341383, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028790375886837347, + "loss": 0.032, "step": 31110 }, { - "epoch": 0.16, - "learning_rate": 0.00027644933934039986, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.00028789987065200203, + "loss": 0.0361, "step": 31120 }, { - "epoch": 0.16, - "learning_rate": 0.00027644177164738585, - "loss": 0.0222, + "epoch": 0.08, + "learning_rate": 0.00028789598243563055, + "loss": 0.0338, "step": 31130 }, { - "epoch": 0.16, - "learning_rate": 0.0002764342039543718, - "loss": 0.0196, + "epoch": 0.08, + "learning_rate": 0.00028789209421925906, + "loss": 0.0334, "step": 31140 }, { - "epoch": 0.16, - "learning_rate": 0.0002764266362613578, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.00028788820600288763, + "loss": 0.0287, "step": 31150 }, { - "epoch": 0.16, - "learning_rate": 0.0002764190685683438, - "loss": 0.024, + "epoch": 0.08, + "learning_rate": 0.00028788431778651615, + "loss": 0.0313, "step": 31160 }, { - "epoch": 0.16, - "learning_rate": 0.00027641150087532977, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.0002878804295701447, + "loss": 0.0306, "step": 31170 }, { - "epoch": 0.16, - "learning_rate": 0.0002764039331823158, - "loss": 0.0208, + "epoch": 0.08, + "learning_rate": 0.00028787654135377323, + "loss": 0.0385, "step": 31180 }, { - "epoch": 0.16, - "learning_rate": 0.0002763963654893018, - "loss": 0.024, + "epoch": 0.08, + "learning_rate": 0.00028787265313740174, + "loss": 0.0339, "step": 31190 }, { - "epoch": 0.16, - "learning_rate": 0.00027638879779628777, - "loss": 0.0275, + "epoch": 0.08, + "learning_rate": 0.0002878687649210303, + "loss": 0.0334, "step": 31200 }, { - "epoch": 0.16, - "learning_rate": 0.00027638123010327375, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.00028786487670465883, + "loss": 0.0439, "step": 31210 }, { - "epoch": 0.16, - "learning_rate": 0.00027637366241025973, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.00028786098848828734, + "loss": 0.0324, "step": 31220 }, { - "epoch": 0.16, - "learning_rate": 0.0002763660947172457, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002878571002719159, + "loss": 0.0353, "step": 31230 }, { - "epoch": 0.16, - "learning_rate": 0.00027635852702423175, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.0002878532120555445, + "loss": 0.0402, "step": 31240 }, { - "epoch": 0.16, - "learning_rate": 0.00027635095933121773, - "loss": 0.0244, + "epoch": 0.08, + "learning_rate": 0.000287849323839173, + "loss": 0.0371, "step": 31250 }, { - "epoch": 0.16, - "learning_rate": 0.0002763433916382037, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.0002878454356228015, + "loss": 0.0288, "step": 31260 }, { - "epoch": 0.16, - "learning_rate": 0.0002763358239451897, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028784154740643, + "loss": 0.0303, "step": 31270 }, { - "epoch": 0.16, - "learning_rate": 0.0002763282562521757, - "loss": 0.0286, + "epoch": 0.08, + "learning_rate": 0.0002878376591900586, + "loss": 0.0383, "step": 31280 }, { - "epoch": 0.16, - "learning_rate": 0.00027632068855916166, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.0002878337709736871, + "loss": 0.0335, "step": 31290 }, { - "epoch": 0.16, - "learning_rate": 0.00027631312086614764, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.0002878298827573157, + "loss": 0.0322, "step": 31300 }, { - "epoch": 0.16, - "learning_rate": 0.0002763055531731337, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.0002878259945409442, + "loss": 0.0329, "step": 31310 }, { - "epoch": 0.16, - "learning_rate": 0.00027629798548011966, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.0002878221063245727, + "loss": 0.0316, "step": 31320 }, { - "epoch": 0.16, - "learning_rate": 0.00027629041778710564, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.0002878182181082013, + "loss": 0.0339, "step": 31330 }, { - "epoch": 0.16, - "learning_rate": 0.0002762828500940916, - "loss": 0.0199, + "epoch": 0.08, + "learning_rate": 0.0002878143298918298, + "loss": 0.0365, "step": 31340 }, { - "epoch": 0.16, - "learning_rate": 0.0002762752824010776, - "loss": 0.024, + "epoch": 0.08, + "learning_rate": 0.0002878104416754583, + "loss": 0.0339, "step": 31350 }, { - "epoch": 0.16, - "learning_rate": 0.0002762677147080636, - "loss": 0.0228, + "epoch": 0.08, + "learning_rate": 0.00028780655345908687, + "loss": 0.0332, "step": 31360 }, { - "epoch": 0.16, - "learning_rate": 0.0002762601470150496, - "loss": 0.0392, + "epoch": 0.08, + "learning_rate": 0.00028780266524271544, + "loss": 0.035, "step": 31370 }, { - "epoch": 0.16, - "learning_rate": 0.0002762525793220356, - "loss": 0.0231, + "epoch": 0.08, + "learning_rate": 0.00028779877702634395, + "loss": 0.0298, "step": 31380 }, { - "epoch": 0.16, - "learning_rate": 0.0002762450116290216, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.00028779488880997247, + "loss": 0.0298, "step": 31390 }, { - "epoch": 0.16, - "learning_rate": 0.00027623744393600756, - "loss": 0.0354, + "epoch": 0.08, + "learning_rate": 0.000287791000593601, + "loss": 0.0271, "step": 31400 }, { - "epoch": 0.16, - "learning_rate": 0.00027622987624299354, - "loss": 0.0284, + "epoch": 0.08, + "learning_rate": 0.00028778711237722955, + "loss": 0.0337, "step": 31410 }, { - "epoch": 0.16, - "learning_rate": 0.0002762223085499795, - "loss": 0.0366, + "epoch": 0.08, + "learning_rate": 0.00028778322416085807, + "loss": 0.0319, "step": 31420 }, { - "epoch": 0.16, - "learning_rate": 0.00027621474085696556, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.00028777933594448664, + "loss": 0.0292, "step": 31430 }, { - "epoch": 0.16, - "learning_rate": 0.00027620717316395154, - "loss": 0.0294, + "epoch": 0.08, + "learning_rate": 0.00028777544772811515, + "loss": 0.0343, "step": 31440 }, { - "epoch": 0.16, - "learning_rate": 0.0002761996054709375, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.0002877715595117437, + "loss": 0.026, "step": 31450 }, { - "epoch": 0.16, - "learning_rate": 0.0002761920377779235, - "loss": 0.0317, + "epoch": 0.08, + "learning_rate": 0.00028776767129537223, + "loss": 0.0295, "step": 31460 }, { - "epoch": 0.16, - "learning_rate": 0.0002761844700849095, - "loss": 0.0279, + "epoch": 0.08, + "learning_rate": 0.00028776378307900075, + "loss": 0.0339, "step": 31470 }, { - "epoch": 0.16, - "learning_rate": 0.00027617690239189547, - "loss": 0.0217, + "epoch": 0.08, + "learning_rate": 0.00028775989486262926, + "loss": 0.0352, "step": 31480 }, { - "epoch": 0.16, - "learning_rate": 0.00027616933469888145, - "loss": 0.0259, + "epoch": 0.08, + "learning_rate": 0.00028775600664625783, + "loss": 0.0302, "step": 31490 }, { - "epoch": 0.16, - "learning_rate": 0.0002761617670058675, - "loss": 0.0209, + "epoch": 0.08, + "learning_rate": 0.00028775211842988635, + "loss": 0.0315, "step": 31500 }, { - "epoch": 0.16, - "learning_rate": 0.00027615419931285347, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.0002877482302135149, + "loss": 0.0315, "step": 31510 }, { - "epoch": 0.16, - "learning_rate": 0.00027614663161983945, - "loss": 0.0325, + "epoch": 0.08, + "learning_rate": 0.00028774434199714343, + "loss": 0.0312, "step": 31520 }, { - "epoch": 0.16, - "learning_rate": 0.00027613906392682543, - "loss": 0.0311, + "epoch": 0.08, + "learning_rate": 0.00028774045378077194, + "loss": 0.0338, "step": 31530 }, { - "epoch": 0.16, - "learning_rate": 0.0002761314962338114, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.0002877365655644005, + "loss": 0.0351, "step": 31540 }, { - "epoch": 0.16, - "learning_rate": 0.0002761239285407974, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.000287732677348029, + "loss": 0.029, "step": 31550 }, { - "epoch": 0.16, - "learning_rate": 0.00027611636084778343, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.00028772878913165754, + "loss": 0.0308, "step": 31560 }, { - "epoch": 0.16, - "learning_rate": 0.0002761087931547694, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.0002877249009152861, + "loss": 0.0329, "step": 31570 }, { - "epoch": 0.16, - "learning_rate": 0.0002761012254617554, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.0002877210126989147, + "loss": 0.0364, "step": 31580 }, { - "epoch": 0.16, - "learning_rate": 0.00027609365776874137, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002877171244825432, + "loss": 0.0328, "step": 31590 }, { - "epoch": 0.16, - "learning_rate": 0.00027608609007572735, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002877132362661717, + "loss": 0.032, "step": 31600 }, { - "epoch": 0.16, - "learning_rate": 0.00027607852238271333, - "loss": 0.0265, + "epoch": 0.08, + "learning_rate": 0.0002877093480498002, + "loss": 0.0311, "step": 31610 }, { - "epoch": 0.16, - "learning_rate": 0.0002760709546896993, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002877054598334288, + "loss": 0.0403, "step": 31620 }, { - "epoch": 0.16, - "learning_rate": 0.00027606338699668535, - "loss": 0.0225, + "epoch": 0.08, + "learning_rate": 0.0002877015716170573, + "loss": 0.0307, "step": 31630 }, { - "epoch": 0.16, - "learning_rate": 0.00027605581930367133, - "loss": 0.0229, + "epoch": 0.08, + "learning_rate": 0.0002876976834006859, + "loss": 0.029, "step": 31640 }, { - "epoch": 0.16, - "learning_rate": 0.0002760482516106573, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.0002876937951843144, + "loss": 0.0379, "step": 31650 }, { - "epoch": 0.16, - "learning_rate": 0.0002760406839176433, - "loss": 0.0216, + "epoch": 0.08, + "learning_rate": 0.00028768990696794296, + "loss": 0.0394, "step": 31660 }, { - "epoch": 0.16, - "learning_rate": 0.0002760331162246293, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.00028768601875157147, + "loss": 0.0378, "step": 31670 }, { - "epoch": 0.16, - "learning_rate": 0.00027602554853161526, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.0002876821305352, + "loss": 0.0393, "step": 31680 }, { - "epoch": 0.16, - "learning_rate": 0.0002760179808386013, - "loss": 0.0241, + "epoch": 0.08, + "learning_rate": 0.0002876782423188285, + "loss": 0.0278, "step": 31690 }, { - "epoch": 0.16, - "learning_rate": 0.0002760104131455873, - "loss": 0.0282, + "epoch": 0.08, + "learning_rate": 0.00028767435410245707, + "loss": 0.0379, "step": 31700 }, { - "epoch": 0.16, - "learning_rate": 0.00027600284545257326, - "loss": 0.0242, + "epoch": 0.08, + "learning_rate": 0.0002876704658860856, + "loss": 0.0393, "step": 31710 }, { - "epoch": 0.16, - "learning_rate": 0.00027599527775955924, - "loss": 0.0243, + "epoch": 0.08, + "learning_rate": 0.00028766657766971415, + "loss": 0.0372, "step": 31720 }, { - "epoch": 0.16, - "learning_rate": 0.0002759877100665452, - "loss": 0.027, + "epoch": 0.08, + "learning_rate": 0.00028766268945334267, + "loss": 0.0287, "step": 31730 }, { - "epoch": 0.16, - "learning_rate": 0.0002759801423735312, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028765880123697124, + "loss": 0.0295, "step": 31740 }, { - "epoch": 0.16, - "learning_rate": 0.00027597257468051724, - "loss": 0.0339, + "epoch": 0.08, + "learning_rate": 0.00028765491302059975, + "loss": 0.0311, "step": 31750 }, { - "epoch": 0.16, - "learning_rate": 0.0002759650069875032, - "loss": 0.0257, + "epoch": 0.08, + "learning_rate": 0.00028765102480422827, + "loss": 0.0326, "step": 31760 }, { - "epoch": 0.16, - "learning_rate": 0.0002759574392944892, - "loss": 0.0305, + "epoch": 0.08, + "learning_rate": 0.00028764713658785683, + "loss": 0.0271, "step": 31770 }, { - "epoch": 0.16, - "learning_rate": 0.0002759498716014752, - "loss": 0.0229, + "epoch": 0.08, + "learning_rate": 0.00028764324837148535, + "loss": 0.0331, "step": 31780 }, { - "epoch": 0.16, - "learning_rate": 0.00027594230390846116, - "loss": 0.0226, + "epoch": 0.08, + "learning_rate": 0.0002876393601551139, + "loss": 0.0262, "step": 31790 }, { - "epoch": 0.16, - "learning_rate": 0.00027593473621544714, - "loss": 0.0289, + "epoch": 0.08, + "learning_rate": 0.00028763547193874243, + "loss": 0.0293, "step": 31800 }, { - "epoch": 0.16, - "learning_rate": 0.0002759271685224331, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028763158372237095, + "loss": 0.0293, "step": 31810 }, { - "epoch": 0.16, - "learning_rate": 0.00027591960082941916, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.00028762769550599946, + "loss": 0.035, "step": 31820 }, { - "epoch": 0.16, - "learning_rate": 0.00027591203313640514, - "loss": 0.0242, + "epoch": 0.08, + "learning_rate": 0.00028762380728962803, + "loss": 0.0363, "step": 31830 }, { - "epoch": 0.16, - "learning_rate": 0.0002759044654433911, - "loss": 0.0299, + "epoch": 0.08, + "learning_rate": 0.00028761991907325654, + "loss": 0.0354, "step": 31840 }, { - "epoch": 0.16, - "learning_rate": 0.0002758968977503771, - "loss": 0.0288, + "epoch": 0.08, + "learning_rate": 0.0002876160308568851, + "loss": 0.0243, "step": 31850 }, { - "epoch": 0.16, - "learning_rate": 0.0002758893300573631, - "loss": 0.0235, + "epoch": 0.08, + "learning_rate": 0.00028761214264051363, + "loss": 0.0381, "step": 31860 }, { - "epoch": 0.16, - "learning_rate": 0.00027588176236434907, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.0002876082544241422, + "loss": 0.0334, "step": 31870 }, { - "epoch": 0.16, - "learning_rate": 0.0002758741946713351, - "loss": 0.0336, + "epoch": 0.08, + "learning_rate": 0.0002876043662077707, + "loss": 0.0345, "step": 31880 }, { - "epoch": 0.16, - "learning_rate": 0.0002758666269783211, - "loss": 0.0238, + "epoch": 0.08, + "learning_rate": 0.0002876004779913992, + "loss": 0.0329, "step": 31890 }, { - "epoch": 0.16, - "learning_rate": 0.00027585905928530707, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.00028759658977502774, + "loss": 0.0262, "step": 31900 }, { - "epoch": 0.16, - "learning_rate": 0.00027585149159229305, - "loss": 0.0237, + "epoch": 0.08, + "learning_rate": 0.0002875927015586563, + "loss": 0.0255, "step": 31910 }, { - "epoch": 0.16, - "learning_rate": 0.00027584392389927903, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.0002875888133422849, + "loss": 0.0292, "step": 31920 }, { - "epoch": 0.16, - "learning_rate": 0.000275836356206265, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.0002875849251259134, + "loss": 0.0303, "step": 31930 }, { - "epoch": 0.16, - "learning_rate": 0.000275828788513251, - "loss": 0.0271, + "epoch": 0.08, + "learning_rate": 0.0002875810369095419, + "loss": 0.0283, "step": 31940 }, { - "epoch": 0.16, - "learning_rate": 0.00027582122082023703, - "loss": 0.0268, + "epoch": 0.08, + "learning_rate": 0.0002875771486931705, + "loss": 0.0312, "step": 31950 }, { - "epoch": 0.16, - "learning_rate": 0.000275813653127223, - "loss": 0.0238, + "epoch": 0.08, + "learning_rate": 0.000287573260476799, + "loss": 0.0283, "step": 31960 }, { - "epoch": 0.16, - "learning_rate": 0.000275806085434209, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002875693722604275, + "loss": 0.0326, "step": 31970 }, { - "epoch": 0.16, - "learning_rate": 0.000275798517741195, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.0002875654840440561, + "loss": 0.0305, "step": 31980 }, { - "epoch": 0.16, - "learning_rate": 0.00027579095004818095, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.0002875615958276846, + "loss": 0.0384, "step": 31990 }, { - "epoch": 0.16, - "learning_rate": 0.00027578338235516694, - "loss": 0.0273, + "epoch": 0.08, + "learning_rate": 0.00028755770761131316, + "loss": 0.0307, "step": 32000 }, { - "epoch": 0.16, - "eval_cer": 0.9144896638256703, - "eval_loss": 0.017893997952342033, - "eval_runtime": 117.1916, - "eval_samples_per_second": 17.066, - "eval_steps_per_second": 4.267, + "epoch": 0.08, + "eval_cer": 0.8818356518319148, + "eval_loss": 0.023202601820230484, + "eval_runtime": 107.5432, + "eval_samples_per_second": 18.597, + "eval_steps_per_second": 4.649, "step": 32000 }, { - "epoch": 0.16, - "learning_rate": 0.00027577581466215297, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.00028755381939494167, + "loss": 0.033, "step": 32010 }, { - "epoch": 0.16, - "learning_rate": 0.00027576824696913895, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.0002875499311785702, + "loss": 0.0317, "step": 32020 }, { - "epoch": 0.16, - "learning_rate": 0.00027576067927612493, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002875460429621987, + "loss": 0.0327, "step": 32030 }, { - "epoch": 0.16, - "learning_rate": 0.0002757531115831109, - "loss": 0.0208, + "epoch": 0.08, + "learning_rate": 0.00028754215474582727, + "loss": 0.0276, "step": 32040 }, { - "epoch": 0.16, - "learning_rate": 0.0002757455438900969, - "loss": 0.025, + "epoch": 0.08, + "learning_rate": 0.0002875382665294558, + "loss": 0.0281, "step": 32050 }, { - "epoch": 0.16, - "learning_rate": 0.0002757379761970829, - "loss": 0.023, + "epoch": 0.08, + "learning_rate": 0.00028753437831308435, + "loss": 0.031, "step": 32060 }, { - "epoch": 0.16, - "learning_rate": 0.00027573040850406886, - "loss": 0.0272, + "epoch": 0.08, + "learning_rate": 0.00028753049009671287, + "loss": 0.0366, "step": 32070 }, { - "epoch": 0.16, - "learning_rate": 0.00027572284081105484, - "loss": 0.0225, + "epoch": 0.08, + "learning_rate": 0.00028752660188034144, + "loss": 0.0353, "step": 32080 }, { - "epoch": 0.16, - "learning_rate": 0.0002757152731180408, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.00028752271366396995, + "loss": 0.0351, "step": 32090 }, { - "epoch": 0.16, - "learning_rate": 0.0002757077054250268, - "loss": 0.0251, + "epoch": 0.08, + "learning_rate": 0.00028751882544759846, + "loss": 0.0293, "step": 32100 }, { - "epoch": 0.16, - "learning_rate": 0.00027570013773201284, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.000287514937231227, + "loss": 0.0291, "step": 32110 }, { - "epoch": 0.16, - "learning_rate": 0.0002756925700389988, - "loss": 0.0257, + "epoch": 0.08, + "learning_rate": 0.00028751104901485555, + "loss": 0.0267, "step": 32120 }, { - "epoch": 0.16, - "learning_rate": 0.0002756850023459848, - "loss": 0.0245, + "epoch": 0.08, + "learning_rate": 0.0002875071607984841, + "loss": 0.0338, "step": 32130 }, { - "epoch": 0.16, - "learning_rate": 0.0002756774346529708, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028750327258211263, + "loss": 0.034, "step": 32140 }, { - "epoch": 0.16, - "learning_rate": 0.00027566986695995677, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.00028749938436574115, + "loss": 0.0325, "step": 32150 }, { - "epoch": 0.16, - "learning_rate": 0.00027566229926694275, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.0002874954961493697, + "loss": 0.0282, "step": 32160 }, { - "epoch": 0.16, - "learning_rate": 0.00027565473157392873, - "loss": 0.0344, + "epoch": 0.08, + "learning_rate": 0.00028749160793299823, + "loss": 0.031, "step": 32170 }, { - "epoch": 0.16, - "learning_rate": 0.00027564716388091476, - "loss": 0.0269, + "epoch": 0.08, + "learning_rate": 0.00028748771971662674, + "loss": 0.0295, "step": 32180 }, { - "epoch": 0.16, - "learning_rate": 0.00027563959618790075, - "loss": 0.0241, + "epoch": 0.08, + "learning_rate": 0.0002874838315002553, + "loss": 0.0346, "step": 32190 }, { - "epoch": 0.16, - "learning_rate": 0.00027563202849488673, - "loss": 0.0234, + "epoch": 0.08, + "learning_rate": 0.0002874799432838838, + "loss": 0.0336, "step": 32200 }, { - "epoch": 0.16, - "learning_rate": 0.0002756244608018727, - "loss": 0.028, + "epoch": 0.08, + "learning_rate": 0.0002874760550675124, + "loss": 0.0409, "step": 32210 }, { - "epoch": 0.16, - "learning_rate": 0.0002756168931088587, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.0002874721668511409, + "loss": 0.0342, "step": 32220 }, { - "epoch": 0.16, - "learning_rate": 0.00027560932541584467, - "loss": 0.0261, + "epoch": 0.08, + "learning_rate": 0.0002874682786347694, + "loss": 0.0307, "step": 32230 }, { - "epoch": 0.16, - "learning_rate": 0.0002756017577228307, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.000287464390418398, + "loss": 0.0332, "step": 32240 }, { - "epoch": 0.16, - "learning_rate": 0.0002755941900298167, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.0002874605022020265, + "loss": 0.0323, "step": 32250 }, { - "epoch": 0.16, - "learning_rate": 0.00027558662233680267, - "loss": 0.0309, + "epoch": 0.08, + "learning_rate": 0.000287456613985655, + "loss": 0.045, "step": 32260 }, { - "epoch": 0.16, - "learning_rate": 0.00027557905464378865, - "loss": 0.0308, + "epoch": 0.08, + "learning_rate": 0.0002874527257692836, + "loss": 0.0573, "step": 32270 }, { - "epoch": 0.16, - "learning_rate": 0.00027557148695077463, - "loss": 0.0274, + "epoch": 0.08, + "learning_rate": 0.0002874488375529121, + "loss": 0.032, "step": 32280 }, { - "epoch": 0.16, - "learning_rate": 0.0002755639192577606, - "loss": 0.0283, + "epoch": 0.08, + "learning_rate": 0.0002874449493365407, + "loss": 0.0495, "step": 32290 }, { - "epoch": 0.16, - "learning_rate": 0.00027555635156474665, - "loss": 0.0241, + "epoch": 0.08, + "learning_rate": 0.0002874410611201692, + "loss": 0.0366, "step": 32300 }, { - "epoch": 0.16, - "learning_rate": 0.00027554878387173263, - "loss": 0.0299, + "epoch": 0.08, + "learning_rate": 0.0002874371729037977, + "loss": 0.0432, "step": 32310 }, { - "epoch": 0.16, - "learning_rate": 0.0002755412161787186, - "loss": 0.0252, + "epoch": 0.08, + "learning_rate": 0.00028743328468742627, + "loss": 0.0371, "step": 32320 }, { - "epoch": 0.16, - "learning_rate": 0.0002755336484857046, - "loss": 0.0258, + "epoch": 0.08, + "learning_rate": 0.0002874293964710548, + "loss": 0.0369, "step": 32330 }, { - "epoch": 0.16, - "learning_rate": 0.0002755260807926906, - "loss": 0.0216, + "epoch": 0.08, + "learning_rate": 0.00028742550825468336, + "loss": 0.0288, "step": 32340 }, { - "epoch": 0.16, - "learning_rate": 0.00027551851309967656, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028742162003831187, + "loss": 0.0353, "step": 32350 }, { - "epoch": 0.16, - "learning_rate": 0.00027551094540666254, - "loss": 0.0251, + "epoch": 0.08, + "learning_rate": 0.0002874177318219404, + "loss": 0.0327, "step": 32360 }, { - "epoch": 0.16, - "learning_rate": 0.0002755033777136486, - "loss": 0.0318, + "epoch": 0.08, + "learning_rate": 0.00028741384360556895, + "loss": 0.0323, "step": 32370 }, { - "epoch": 0.16, - "learning_rate": 0.00027549581002063456, - "loss": 0.0237, + "epoch": 0.08, + "learning_rate": 0.00028740995538919747, + "loss": 0.0359, "step": 32380 }, { - "epoch": 0.16, - "learning_rate": 0.00027548824232762054, - "loss": 0.0221, + "epoch": 0.08, + "learning_rate": 0.000287406067172826, + "loss": 0.0355, "step": 32390 }, { - "epoch": 0.16, - "learning_rate": 0.0002754806746346065, - "loss": 0.0226, + "epoch": 0.08, + "learning_rate": 0.00028740217895645455, + "loss": 0.0327, "step": 32400 }, { - "epoch": 0.16, - "learning_rate": 0.0002754731069415925, - "loss": 0.0262, + "epoch": 0.08, + "learning_rate": 0.00028739829074008307, + "loss": 0.0384, "step": 32410 }, { - "epoch": 0.16, - "learning_rate": 0.0002754655392485785, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.00028739440252371163, + "loss": 0.0356, "step": 32420 }, { - "epoch": 0.16, - "learning_rate": 0.0002754579715555645, - "loss": 0.0227, + "epoch": 0.08, + "learning_rate": 0.00028739051430734015, + "loss": 0.036, "step": 32430 }, { - "epoch": 0.16, - "learning_rate": 0.0002754504038625505, - "loss": 0.0267, + "epoch": 0.08, + "learning_rate": 0.00028738662609096866, + "loss": 0.0294, "step": 32440 }, { - "epoch": 0.16, - "learning_rate": 0.0002754428361695365, - "loss": 0.0282, + "epoch": 0.08, + "learning_rate": 0.00028738273787459723, + "loss": 0.033, "step": 32450 }, { - "epoch": 0.16, - "learning_rate": 0.00027543526847652246, - "loss": 0.0243, + "epoch": 0.08, + "learning_rate": 0.00028737884965822575, + "loss": 0.0361, "step": 32460 }, { - "epoch": 0.16, - "learning_rate": 0.00027542770078350844, - "loss": 0.0223, + "epoch": 0.08, + "learning_rate": 0.0002873749614418543, + "loss": 0.0327, "step": 32470 }, { - "epoch": 0.16, - "learning_rate": 0.0002754201330904944, - "loss": 0.0243, + "epoch": 0.08, + "learning_rate": 0.00028737107322548283, + "loss": 0.0336, "step": 32480 }, { - "epoch": 0.16, - "learning_rate": 0.00027541256539748046, - "loss": 0.0246, + "epoch": 0.08, + "learning_rate": 0.0002873671850091114, + "loss": 0.0345, "step": 32490 }, { - "epoch": 0.16, - "learning_rate": 0.00027540499770446644, - "loss": 0.0247, + "epoch": 0.08, + "learning_rate": 0.0002873632967927399, + "loss": 0.0411, "step": 32500 }, { - "epoch": 0.16, - "learning_rate": 0.0002753974300114524, - "loss": 0.0245, + "epoch": 0.08, + "learning_rate": 0.00028735940857636843, + "loss": 0.0387, "step": 32510 }, { - "epoch": 0.16, - "learning_rate": 0.0002753898623184384, - "loss": 0.0256, + "epoch": 0.08, + "learning_rate": 0.00028735552035999694, + "loss": 0.0329, "step": 32520 }, { - "epoch": 0.16, - "learning_rate": 0.0002753822946254244, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.0002873516321436255, + "loss": 0.0352, "step": 32530 }, { - "epoch": 0.16, - "learning_rate": 0.00027537472693241037, - "loss": 0.0264, + "epoch": 0.08, + "learning_rate": 0.000287347743927254, + "loss": 0.03, "step": 32540 }, { - "epoch": 0.16, - "learning_rate": 0.00027536715923939635, - "loss": 0.024, + "epoch": 0.08, + "learning_rate": 0.0002873438557108826, + "loss": 0.0287, "step": 32550 }, { - "epoch": 0.16, - "learning_rate": 0.0002753595915463824, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.0002873399674945111, + "loss": 0.0328, "step": 32560 }, { - "epoch": 0.16, - "learning_rate": 0.00027535202385336837, - "loss": 0.0236, + "epoch": 0.08, + "learning_rate": 0.0002873360792781396, + "loss": 0.0363, "step": 32570 }, { - "epoch": 0.16, - "learning_rate": 0.00027534445616035435, - "loss": 0.0233, + "epoch": 0.08, + "learning_rate": 0.0002873321910617682, + "loss": 0.0316, "step": 32580 }, { - "epoch": 0.16, - "learning_rate": 0.00027533688846734033, - "loss": 0.0288, + "epoch": 0.08, + "learning_rate": 0.0002873283028453967, + "loss": 0.0301, "step": 32590 }, { - "epoch": 0.16, - "learning_rate": 0.0002753293207743263, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.0002873244146290252, + "loss": 0.0346, "step": 32600 }, { - "epoch": 0.16, - "learning_rate": 0.0002753217530813123, - "loss": 0.0255, + "epoch": 0.08, + "learning_rate": 0.0002873205264126538, + "loss": 0.035, "step": 32610 }, { - "epoch": 0.16, - "learning_rate": 0.00027531418538829833, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028731663819628236, + "loss": 0.0339, "step": 32620 }, { - "epoch": 0.16, - "learning_rate": 0.0002753066176952843, - "loss": 0.0249, + "epoch": 0.08, + "learning_rate": 0.0002873127499799109, + "loss": 0.0302, "step": 32630 }, { - "epoch": 0.16, - "learning_rate": 0.0002752990500022703, - "loss": 0.0277, + "epoch": 0.08, + "learning_rate": 0.0002873088617635394, + "loss": 0.0285, "step": 32640 }, { - "epoch": 0.16, - "learning_rate": 0.00027529148230925627, - "loss": 0.0321, + "epoch": 0.08, + "learning_rate": 0.0002873049735471679, + "loss": 0.0342, "step": 32650 }, { - "epoch": 0.16, - "learning_rate": 0.00027528391461624225, - "loss": 0.026, + "epoch": 0.08, + "learning_rate": 0.00028730108533079647, + "loss": 0.0297, "step": 32660 }, { - "epoch": 0.16, - "learning_rate": 0.00027527634692322823, - "loss": 0.0227, + "epoch": 0.08, + "learning_rate": 0.000287297197114425, + "loss": 0.0369, "step": 32670 }, { - "epoch": 0.16, - "learning_rate": 0.0002752687792302142, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028729330889805355, + "loss": 0.0314, "step": 32680 }, { - "epoch": 0.16, - "learning_rate": 0.00027526121153720025, - "loss": 0.0263, + "epoch": 0.08, + "learning_rate": 0.00028728942068168207, + "loss": 0.0362, "step": 32690 }, { - "epoch": 0.16, - "learning_rate": 0.00027525364384418623, - "loss": 0.0239, + "epoch": 0.08, + "learning_rate": 0.00028728553246531064, + "loss": 0.0354, "step": 32700 }, { - "epoch": 0.17, - "learning_rate": 0.0002752460761511722, - "loss": 0.0281, + "epoch": 0.08, + "learning_rate": 0.00028728164424893915, + "loss": 0.0336, "step": 32710 }, { - "epoch": 0.17, - "learning_rate": 0.0002752385084581582, - "loss": 0.0254, + "epoch": 0.08, + "learning_rate": 0.00028727775603256767, + "loss": 0.0311, "step": 32720 }, { - "epoch": 0.17, - "learning_rate": 0.0002752309407651442, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.0002872738678161962, + "loss": 0.0296, "step": 32730 }, { - "epoch": 0.17, - "learning_rate": 0.00027522337307213016, - "loss": 0.0253, + "epoch": 0.08, + "learning_rate": 0.00028726997959982475, + "loss": 0.0322, "step": 32740 }, { - "epoch": 0.17, - "learning_rate": 0.0002752158053791162, - "loss": 0.0266, + "epoch": 0.08, + "learning_rate": 0.00028726609138345326, + "loss": 0.0319, "step": 32750 }, { - "epoch": 0.17, - "learning_rate": 0.0002752082376861022, - "loss": 0.028, + "epoch": 0.08, + "learning_rate": 0.00028726220316708183, + "loss": 0.0274, "step": 32760 }, { - "epoch": 0.17, - "learning_rate": 0.00027520066999308816, - "loss": 0.0268, + "epoch": 0.08, + "learning_rate": 0.00028725831495071035, + "loss": 0.0307, "step": 32770 }, { - "epoch": 0.17, - "learning_rate": 0.00027519310230007414, - "loss": 0.0232, + "epoch": 0.08, + "learning_rate": 0.00028725442673433886, + "loss": 0.0315, "step": 32780 }, { - "epoch": 0.17, - "learning_rate": 0.0002751855346070601, - "loss": 0.0297, + "epoch": 0.08, + "learning_rate": 0.00028725053851796743, + "loss": 0.0315, "step": 32790 }, { - "epoch": 0.17, - "learning_rate": 0.0002751779669140461, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.00028724665030159595, + "loss": 0.039, "step": 32800 }, { - "epoch": 0.17, - "learning_rate": 0.00027517039922103214, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.00028724276208522446, + "loss": 0.0286, "step": 32810 }, { - "epoch": 0.17, - "learning_rate": 0.0002751628315280181, - "loss": 0.03, + "epoch": 0.09, + "learning_rate": 0.00028723887386885303, + "loss": 0.0323, "step": 32820 }, { - "epoch": 0.17, - "learning_rate": 0.0002751552638350041, - "loss": 0.0269, + "epoch": 0.09, + "learning_rate": 0.0002872349856524816, + "loss": 0.0329, "step": 32830 }, { - "epoch": 0.17, - "learning_rate": 0.0002751476961419901, - "loss": 0.0339, + "epoch": 0.09, + "learning_rate": 0.0002872310974361101, + "loss": 0.0308, "step": 32840 }, { - "epoch": 0.17, - "learning_rate": 0.00027514012844897606, - "loss": 0.0306, + "epoch": 0.09, + "learning_rate": 0.0002872272092197386, + "loss": 0.0288, "step": 32850 }, { - "epoch": 0.17, - "learning_rate": 0.00027513256075596204, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028722332100336714, + "loss": 0.036, "step": 32860 }, { - "epoch": 0.17, - "learning_rate": 0.000275124993062948, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.0002872194327869957, + "loss": 0.0312, "step": 32870 }, { - "epoch": 0.17, - "learning_rate": 0.00027511742536993406, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002872155445706242, + "loss": 0.0365, "step": 32880 }, { - "epoch": 0.17, - "learning_rate": 0.00027510985767692004, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.0002872116563542528, + "loss": 0.0306, "step": 32890 }, { - "epoch": 0.17, - "learning_rate": 0.000275102289983906, - "loss": 0.0251, + "epoch": 0.09, + "learning_rate": 0.0002872077681378813, + "loss": 0.0303, "step": 32900 }, { - "epoch": 0.17, - "learning_rate": 0.000275094722290892, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.0002872038799215099, + "loss": 0.0298, "step": 32910 }, { - "epoch": 0.17, - "learning_rate": 0.000275087154597878, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.0002871999917051384, + "loss": 0.0312, "step": 32920 }, { - "epoch": 0.17, - "learning_rate": 0.00027507958690486397, - "loss": 0.0261, + "epoch": 0.09, + "learning_rate": 0.0002871961034887669, + "loss": 0.0349, "step": 32930 }, { - "epoch": 0.17, - "learning_rate": 0.00027507201921185, - "loss": 0.0416, + "epoch": 0.09, + "learning_rate": 0.0002871922152723954, + "loss": 0.0328, "step": 32940 }, { - "epoch": 0.17, - "learning_rate": 0.000275064451518836, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.000287188327056024, + "loss": 0.0277, "step": 32950 }, { - "epoch": 0.17, - "learning_rate": 0.00027505688382582197, - "loss": 0.0251, + "epoch": 0.09, + "learning_rate": 0.00028718443883965256, + "loss": 0.0347, "step": 32960 }, { - "epoch": 0.17, - "learning_rate": 0.00027504931613280795, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.00028718055062328107, + "loss": 0.0461, "step": 32970 }, { - "epoch": 0.17, - "learning_rate": 0.00027504174843979393, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.0002871766624069096, + "loss": 0.0306, "step": 32980 }, { - "epoch": 0.17, - "learning_rate": 0.0002750341807467799, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.00028717277419053816, + "loss": 0.0336, "step": 32990 }, { - "epoch": 0.17, - "learning_rate": 0.00027502661305376595, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.00028716888597416667, + "loss": 0.0394, "step": 33000 }, { - "epoch": 0.17, - "eval_cer": 0.9144838414489178, - "eval_loss": 0.018402038142085075, - "eval_runtime": 117.2116, - "eval_samples_per_second": 17.063, - "eval_steps_per_second": 4.266, + "epoch": 0.09, + "eval_cer": 0.8818328525580464, + "eval_loss": 0.023882215842604637, + "eval_runtime": 107.6564, + "eval_samples_per_second": 18.578, + "eval_steps_per_second": 4.644, "step": 33000 }, { - "epoch": 0.17, - "learning_rate": 0.00027501904536075193, - "loss": 0.0259, + "epoch": 0.09, + "learning_rate": 0.0002871649977577952, + "loss": 0.0326, "step": 33010 }, { - "epoch": 0.17, - "learning_rate": 0.0002750114776677379, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028716110954142375, + "loss": 0.029, "step": 33020 }, { - "epoch": 0.17, - "learning_rate": 0.0002750039099747239, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.00028715722132505227, + "loss": 0.033, "step": 33030 }, { - "epoch": 0.17, - "learning_rate": 0.0002749963422817099, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.00028715333310868084, + "loss": 0.0307, "step": 33040 }, { - "epoch": 0.17, - "learning_rate": 0.00027498877458869585, - "loss": 0.0211, + "epoch": 0.09, + "learning_rate": 0.00028714944489230935, + "loss": 0.0291, "step": 33050 }, { - "epoch": 0.17, - "learning_rate": 0.00027498120689568184, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.00028714555667593787, + "loss": 0.0328, "step": 33060 }, { - "epoch": 0.17, - "learning_rate": 0.00027497363920266787, - "loss": 0.0223, + "epoch": 0.09, + "learning_rate": 0.0002871416684595664, + "loss": 0.0315, "step": 33070 }, { - "epoch": 0.17, - "learning_rate": 0.00027496607150965385, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.00028713778024319495, + "loss": 0.0304, "step": 33080 }, { - "epoch": 0.17, - "learning_rate": 0.00027495850381663983, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028713389202682346, + "loss": 0.0315, "step": 33090 }, { - "epoch": 0.17, - "learning_rate": 0.0002749509361236258, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.00028713000381045203, + "loss": 0.0404, "step": 33100 }, { - "epoch": 0.17, - "learning_rate": 0.0002749433684306118, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.00028712611559408055, + "loss": 0.0391, "step": 33110 }, { - "epoch": 0.17, - "learning_rate": 0.0002749358007375978, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.0002871222273777091, + "loss": 0.0296, "step": 33120 }, { - "epoch": 0.17, - "learning_rate": 0.0002749282330445838, - "loss": 0.0317, + "epoch": 0.09, + "learning_rate": 0.00028711833916133763, + "loss": 0.0303, "step": 33130 }, { - "epoch": 0.17, - "learning_rate": 0.0002749206653515698, - "loss": 0.0236, + "epoch": 0.09, + "learning_rate": 0.00028711445094496614, + "loss": 0.0335, "step": 33140 }, { - "epoch": 0.17, - "learning_rate": 0.0002749130976585558, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.00028711056272859466, + "loss": 0.0321, "step": 33150 }, { - "epoch": 0.17, - "learning_rate": 0.00027490552996554176, - "loss": 0.0312, + "epoch": 0.09, + "learning_rate": 0.00028710667451222323, + "loss": 0.0279, "step": 33160 }, { - "epoch": 0.17, - "learning_rate": 0.00027489796227252774, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.0002871027862958518, + "loss": 0.0261, "step": 33170 }, { - "epoch": 0.17, - "learning_rate": 0.0002748903945795137, - "loss": 0.0219, + "epoch": 0.09, + "learning_rate": 0.0002870988980794803, + "loss": 0.0291, "step": 33180 }, { - "epoch": 0.17, - "learning_rate": 0.0002748828268864997, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.0002870950098631088, + "loss": 0.0313, "step": 33190 }, { - "epoch": 0.17, - "learning_rate": 0.00027487525919348574, - "loss": 0.0482, + "epoch": 0.09, + "learning_rate": 0.0002870911216467374, + "loss": 0.0384, "step": 33200 }, { - "epoch": 0.17, - "learning_rate": 0.0002748676915004717, - "loss": 0.0344, + "epoch": 0.09, + "learning_rate": 0.0002870872334303659, + "loss": 0.0365, "step": 33210 }, { - "epoch": 0.17, - "learning_rate": 0.0002748601238074577, - "loss": 0.0282, + "epoch": 0.09, + "learning_rate": 0.0002870833452139944, + "loss": 0.0316, "step": 33220 }, { - "epoch": 0.17, - "learning_rate": 0.0002748525561144437, - "loss": 0.0291, + "epoch": 0.09, + "learning_rate": 0.000287079456997623, + "loss": 0.0352, "step": 33230 }, { - "epoch": 0.17, - "learning_rate": 0.00027484498842142966, - "loss": 0.0255, + "epoch": 0.09, + "learning_rate": 0.0002870755687812515, + "loss": 0.0312, "step": 33240 }, { - "epoch": 0.17, - "learning_rate": 0.00027483742072841565, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002870716805648801, + "loss": 0.0288, "step": 33250 }, { - "epoch": 0.17, - "learning_rate": 0.0002748298530354017, - "loss": 0.0304, + "epoch": 0.09, + "learning_rate": 0.0002870677923485086, + "loss": 0.0325, "step": 33260 }, { - "epoch": 0.17, - "learning_rate": 0.00027482228534238766, - "loss": 0.0233, + "epoch": 0.09, + "learning_rate": 0.0002870639041321371, + "loss": 0.033, "step": 33270 }, { - "epoch": 0.17, - "learning_rate": 0.00027481471764937364, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.0002870600159157656, + "loss": 0.0323, "step": 33280 }, { - "epoch": 0.17, - "learning_rate": 0.0002748071499563596, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002870561276993942, + "loss": 0.0279, "step": 33290 }, { - "epoch": 0.17, - "learning_rate": 0.0002747995822633456, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.0002870522394830227, + "loss": 0.0306, "step": 33300 }, { - "epoch": 0.17, - "learning_rate": 0.0002747920145703316, - "loss": 0.0461, + "epoch": 0.09, + "learning_rate": 0.00028704835126665127, + "loss": 0.0351, "step": 33310 }, { - "epoch": 0.17, - "learning_rate": 0.00027478444687731757, - "loss": 0.0418, + "epoch": 0.09, + "learning_rate": 0.0002870444630502798, + "loss": 0.0497, "step": 33320 }, { - "epoch": 0.17, - "learning_rate": 0.00027477687918430355, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.00028704057483390835, + "loss": 0.0317, "step": 33330 }, { - "epoch": 0.17, - "learning_rate": 0.00027476931149128953, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.00028703668661753687, + "loss": 0.0278, "step": 33340 }, { - "epoch": 0.17, - "learning_rate": 0.0002747617437982755, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.0002870327984011654, + "loss": 0.0333, "step": 33350 }, { - "epoch": 0.17, - "learning_rate": 0.00027475417610526155, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.00028702891018479395, + "loss": 0.0301, "step": 33360 }, { - "epoch": 0.17, - "learning_rate": 0.00027474660841224753, - "loss": 0.0233, + "epoch": 0.09, + "learning_rate": 0.00028702502196842247, + "loss": 0.0316, "step": 33370 }, { - "epoch": 0.17, - "learning_rate": 0.0002747390407192335, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.00028702113375205104, + "loss": 0.0333, "step": 33380 }, { - "epoch": 0.17, - "learning_rate": 0.0002747314730262195, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.00028701724553567955, + "loss": 0.0299, "step": 33390 }, { - "epoch": 0.17, - "learning_rate": 0.0002747239053332055, - "loss": 0.0259, + "epoch": 0.09, + "learning_rate": 0.00028701335731930806, + "loss": 0.0354, "step": 33400 }, { - "epoch": 0.17, - "learning_rate": 0.00027471633764019146, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.00028700946910293663, + "loss": 0.0288, "step": 33410 }, { - "epoch": 0.17, - "learning_rate": 0.00027470876994717744, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.00028700558088656515, + "loss": 0.0303, "step": 33420 }, { - "epoch": 0.17, - "learning_rate": 0.0002747012022541635, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.00028700169267019366, + "loss": 0.0297, "step": 33430 }, { - "epoch": 0.17, - "learning_rate": 0.00027469363456114946, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028699780445382223, + "loss": 0.0298, "step": 33440 }, { - "epoch": 0.17, - "learning_rate": 0.00027468606686813544, - "loss": 0.031, + "epoch": 0.09, + "learning_rate": 0.00028699391623745075, + "loss": 0.0323, "step": 33450 }, { - "epoch": 0.17, - "learning_rate": 0.0002746784991751214, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.0002869900280210793, + "loss": 0.0319, "step": 33460 }, { - "epoch": 0.17, - "learning_rate": 0.0002746709314821074, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028698613980470783, + "loss": 0.036, "step": 33470 }, { - "epoch": 0.17, - "learning_rate": 0.0002746633637890934, - "loss": 0.0261, + "epoch": 0.09, + "learning_rate": 0.00028698225158833634, + "loss": 0.0271, "step": 33480 }, { - "epoch": 0.17, - "learning_rate": 0.0002746557960960794, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.0002869783633719649, + "loss": 0.0328, "step": 33490 }, { - "epoch": 0.17, - "learning_rate": 0.0002746482284030654, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002869744751555934, + "loss": 0.0286, "step": 33500 }, { - "epoch": 0.17, - "learning_rate": 0.0002746406607100514, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.000286970586939222, + "loss": 0.0378, "step": 33510 }, { - "epoch": 0.17, - "learning_rate": 0.00027463309301703736, - "loss": 0.0218, + "epoch": 0.09, + "learning_rate": 0.0002869666987228505, + "loss": 0.0305, "step": 33520 }, { - "epoch": 0.17, - "learning_rate": 0.00027462552532402334, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.000286962810506479, + "loss": 0.0308, "step": 33530 }, { - "epoch": 0.17, - "learning_rate": 0.0002746179576310093, - "loss": 0.0267, + "epoch": 0.09, + "learning_rate": 0.0002869589222901076, + "loss": 0.0266, "step": 33540 }, { - "epoch": 0.17, - "learning_rate": 0.00027461038993799536, - "loss": 0.0298, + "epoch": 0.09, + "learning_rate": 0.0002869550340737361, + "loss": 0.0338, "step": 33550 }, { - "epoch": 0.17, - "learning_rate": 0.00027460282224498134, - "loss": 0.0277, + "epoch": 0.09, + "learning_rate": 0.0002869511458573646, + "loss": 0.0331, "step": 33560 }, { - "epoch": 0.17, - "learning_rate": 0.0002745952545519673, - "loss": 0.0324, + "epoch": 0.09, + "learning_rate": 0.0002869472576409932, + "loss": 0.0367, "step": 33570 }, { - "epoch": 0.17, - "learning_rate": 0.0002745876868589533, - "loss": 0.0339, + "epoch": 0.09, + "learning_rate": 0.0002869433694246217, + "loss": 0.0282, "step": 33580 }, { - "epoch": 0.17, - "learning_rate": 0.0002745801191659393, - "loss": 0.0385, + "epoch": 0.09, + "learning_rate": 0.0002869394812082503, + "loss": 0.033, "step": 33590 }, { - "epoch": 0.17, - "learning_rate": 0.00027457255147292527, - "loss": 0.0297, + "epoch": 0.09, + "learning_rate": 0.0002869355929918788, + "loss": 0.0286, "step": 33600 }, { - "epoch": 0.17, - "learning_rate": 0.00027456498377991125, - "loss": 0.0355, + "epoch": 0.09, + "learning_rate": 0.0002869317047755073, + "loss": 0.0301, "step": 33610 }, { - "epoch": 0.17, - "learning_rate": 0.0002745574160868973, - "loss": 0.0277, + "epoch": 0.09, + "learning_rate": 0.00028692781655913587, + "loss": 0.0323, "step": 33620 }, { - "epoch": 0.17, - "learning_rate": 0.00027454984839388327, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.0002869239283427644, + "loss": 0.0329, "step": 33630 }, { - "epoch": 0.17, - "learning_rate": 0.00027454228070086925, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002869200401263929, + "loss": 0.0284, "step": 33640 }, { - "epoch": 0.17, - "learning_rate": 0.00027453471300785523, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.00028691615191002147, + "loss": 0.0356, "step": 33650 }, { - "epoch": 0.17, - "learning_rate": 0.0002745271453148412, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.00028691226369365004, + "loss": 0.0388, "step": 33660 }, { - "epoch": 0.17, - "learning_rate": 0.0002745195776218272, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.00028690837547727855, + "loss": 0.069, "step": 33670 }, { - "epoch": 0.17, - "learning_rate": 0.00027451200992881323, - "loss": 0.0293, + "epoch": 0.09, + "learning_rate": 0.00028690448726090707, + "loss": 0.0371, "step": 33680 }, { - "epoch": 0.17, - "learning_rate": 0.0002745044422357992, - "loss": 0.031, + "epoch": 0.09, + "learning_rate": 0.0002869005990445356, + "loss": 0.0328, "step": 33690 }, { - "epoch": 0.17, - "learning_rate": 0.0002744968745427852, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.00028689671082816415, + "loss": 0.037, "step": 33700 }, { - "epoch": 0.17, - "learning_rate": 0.00027448930684977117, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.00028689282261179267, + "loss": 0.0314, "step": 33710 }, { - "epoch": 0.17, - "learning_rate": 0.00027448173915675715, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.00028688893439542123, + "loss": 0.1216, "step": 33720 }, { - "epoch": 0.17, - "learning_rate": 0.00027447417146374313, - "loss": 0.0239, + "epoch": 0.09, + "learning_rate": 0.00028688504617904975, + "loss": 0.0316, "step": 33730 }, { - "epoch": 0.17, - "learning_rate": 0.0002744666037707291, - "loss": 0.0254, + "epoch": 0.09, + "learning_rate": 0.0002868811579626783, + "loss": 0.0441, "step": 33740 }, { - "epoch": 0.17, - "learning_rate": 0.00027445903607771515, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.00028687726974630683, + "loss": 0.0281, "step": 33750 }, { - "epoch": 0.17, - "learning_rate": 0.00027445146838470113, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028687338152993535, + "loss": 0.0325, "step": 33760 }, { - "epoch": 0.17, - "learning_rate": 0.0002744439006916871, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.00028686949331356386, + "loss": 0.0315, "step": 33770 }, { - "epoch": 0.17, - "learning_rate": 0.0002744363329986731, - "loss": 0.0282, + "epoch": 0.09, + "learning_rate": 0.00028686560509719243, + "loss": 0.036, "step": 33780 }, { - "epoch": 0.17, - "learning_rate": 0.0002744287653056591, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.00028686171688082094, + "loss": 0.028, "step": 33790 }, { - "epoch": 0.17, - "learning_rate": 0.00027442119761264506, - "loss": 0.0207, + "epoch": 0.09, + "learning_rate": 0.0002868578286644495, + "loss": 0.0285, "step": 33800 }, { - "epoch": 0.17, - "learning_rate": 0.0002744136299196311, - "loss": 0.0308, + "epoch": 0.09, + "learning_rate": 0.00028685394044807803, + "loss": 0.033, "step": 33810 }, { - "epoch": 0.17, - "learning_rate": 0.0002744060622266171, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.00028685005223170654, + "loss": 0.0301, "step": 33820 }, { - "epoch": 0.17, - "learning_rate": 0.00027439849453360306, - "loss": 0.0252, + "epoch": 0.09, + "learning_rate": 0.0002868461640153351, + "loss": 0.0344, "step": 33830 }, { - "epoch": 0.17, - "learning_rate": 0.00027439092684058904, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.0002868422757989636, + "loss": 0.0335, "step": 33840 }, { - "epoch": 0.17, - "learning_rate": 0.000274383359147575, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028683838758259214, + "loss": 0.0314, "step": 33850 }, { - "epoch": 0.17, - "learning_rate": 0.000274375791454561, - "loss": 0.0229, + "epoch": 0.09, + "learning_rate": 0.0002868344993662207, + "loss": 0.0339, "step": 33860 }, { - "epoch": 0.17, - "learning_rate": 0.00027436822376154704, - "loss": 0.027, + "epoch": 0.09, + "learning_rate": 0.0002868306111498493, + "loss": 0.0257, "step": 33870 }, { - "epoch": 0.17, - "learning_rate": 0.000274360656068533, - "loss": 0.028, + "epoch": 0.09, + "learning_rate": 0.0002868267229334778, + "loss": 0.0361, "step": 33880 }, { - "epoch": 0.17, - "learning_rate": 0.000274353088375519, - "loss": 0.0222, + "epoch": 0.09, + "learning_rate": 0.0002868228347171063, + "loss": 0.0263, "step": 33890 }, { - "epoch": 0.17, - "learning_rate": 0.000274345520682505, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.0002868189465007348, + "loss": 0.0232, "step": 33900 }, { - "epoch": 0.17, - "learning_rate": 0.00027433795298949096, - "loss": 0.029, + "epoch": 0.09, + "learning_rate": 0.0002868150582843634, + "loss": 0.0308, "step": 33910 }, { - "epoch": 0.17, - "learning_rate": 0.00027433038529647694, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.0002868111700679919, + "loss": 0.0342, "step": 33920 }, { - "epoch": 0.17, - "learning_rate": 0.0002743228176034629, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.0002868072818516205, + "loss": 0.0294, "step": 33930 }, { - "epoch": 0.17, - "learning_rate": 0.00027431524991044896, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.000286803393635249, + "loss": 0.0492, "step": 33940 }, { - "epoch": 0.17, - "learning_rate": 0.00027430768221743494, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028679950541887756, + "loss": 0.0311, "step": 33950 }, { - "epoch": 0.17, - "learning_rate": 0.0002743001145244209, - "loss": 0.0215, + "epoch": 0.09, + "learning_rate": 0.00028679561720250607, + "loss": 0.0352, "step": 33960 }, { - "epoch": 0.17, - "learning_rate": 0.0002742925468314069, - "loss": 0.0234, + "epoch": 0.09, + "learning_rate": 0.0002867917289861346, + "loss": 0.0396, "step": 33970 }, { - "epoch": 0.17, - "learning_rate": 0.0002742849791383929, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.0002867878407697631, + "loss": 0.0353, "step": 33980 }, { - "epoch": 0.17, - "learning_rate": 0.00027427741144537887, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.00028678395255339167, + "loss": 0.0274, "step": 33990 }, { - "epoch": 0.17, - "learning_rate": 0.0002742698437523649, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.0002867800643370202, + "loss": 0.0357, "step": 34000 }, { - "epoch": 0.17, - "eval_cer": 0.9144916046179211, - "eval_loss": 0.017292475327849388, - "eval_runtime": 117.3012, - "eval_samples_per_second": 17.05, - "eval_steps_per_second": 4.263, + "epoch": 0.09, + "eval_cer": 0.8817866645392185, + "eval_loss": 0.023611877113580704, + "eval_runtime": 107.9395, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, "step": 34000 }, { - "epoch": 0.17, - "learning_rate": 0.0002742622760593509, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.00028677617612064875, + "loss": 0.0383, "step": 34010 }, { - "epoch": 0.17, - "learning_rate": 0.00027425470836633687, - "loss": 0.0193, + "epoch": 0.09, + "learning_rate": 0.00028677228790427727, + "loss": 0.0348, "step": 34020 }, { - "epoch": 0.17, - "learning_rate": 0.00027424714067332285, - "loss": 0.0214, + "epoch": 0.09, + "learning_rate": 0.0002867683996879058, + "loss": 0.0358, "step": 34030 }, { - "epoch": 0.17, - "learning_rate": 0.00027423957298030883, - "loss": 0.0213, + "epoch": 0.09, + "learning_rate": 0.00028676451147153435, + "loss": 0.0304, "step": 34040 }, { - "epoch": 0.17, - "learning_rate": 0.0002742320052872948, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028676062325516286, + "loss": 0.031, "step": 34050 }, { - "epoch": 0.17, - "learning_rate": 0.00027422443759428085, - "loss": 0.0271, + "epoch": 0.09, + "learning_rate": 0.00028675673503879143, + "loss": 0.034, "step": 34060 }, { - "epoch": 0.17, - "learning_rate": 0.00027421686990126683, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.00028675284682241995, + "loss": 0.0355, "step": 34070 }, { - "epoch": 0.17, - "learning_rate": 0.0002742093022082528, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002867489586060485, + "loss": 0.038, "step": 34080 }, { - "epoch": 0.17, - "learning_rate": 0.0002742017345152388, - "loss": 0.0283, + "epoch": 0.09, + "learning_rate": 0.00028674507038967703, + "loss": 0.0641, "step": 34090 }, { - "epoch": 0.17, - "learning_rate": 0.0002741941668222248, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.00028674118217330555, + "loss": 0.0373, "step": 34100 }, { - "epoch": 0.17, - "learning_rate": 0.00027418659912921075, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028673729395693406, + "loss": 0.0295, "step": 34110 }, { - "epoch": 0.17, - "learning_rate": 0.00027417903143619674, - "loss": 0.032, + "epoch": 0.09, + "learning_rate": 0.00028673340574056263, + "loss": 0.0351, "step": 34120 }, { - "epoch": 0.17, - "learning_rate": 0.00027417146374318277, - "loss": 0.0216, + "epoch": 0.09, + "learning_rate": 0.00028672951752419114, + "loss": 0.0314, "step": 34130 }, { - "epoch": 0.17, - "learning_rate": 0.00027416389605016875, - "loss": 0.0195, + "epoch": 0.09, + "learning_rate": 0.0002867256293078197, + "loss": 0.0331, "step": 34140 }, { - "epoch": 0.17, - "learning_rate": 0.00027415632835715473, - "loss": 0.0229, + "epoch": 0.09, + "learning_rate": 0.0002867217410914482, + "loss": 0.038, "step": 34150 }, { - "epoch": 0.17, - "learning_rate": 0.0002741487606641407, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.0002867178528750768, + "loss": 0.0367, "step": 34160 }, { - "epoch": 0.17, - "learning_rate": 0.0002741411929711267, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.0002867139646587053, + "loss": 0.0297, "step": 34170 }, { - "epoch": 0.17, - "learning_rate": 0.0002741336252781127, - "loss": 0.0255, + "epoch": 0.09, + "learning_rate": 0.0002867100764423338, + "loss": 0.0313, "step": 34180 }, { - "epoch": 0.17, - "learning_rate": 0.0002741260575850987, - "loss": 0.0225, + "epoch": 0.09, + "learning_rate": 0.00028670618822596234, + "loss": 0.0955, "step": 34190 }, { - "epoch": 0.17, - "learning_rate": 0.0002741184898920847, - "loss": 0.0278, + "epoch": 0.09, + "learning_rate": 0.0002867023000095909, + "loss": 0.0364, "step": 34200 }, { - "epoch": 0.17, - "learning_rate": 0.0002741109221990707, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.0002866984117932195, + "loss": 0.025, "step": 34210 }, { - "epoch": 0.17, - "learning_rate": 0.00027410335450605666, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.000286694523576848, + "loss": 0.0329, "step": 34220 }, { - "epoch": 0.17, - "learning_rate": 0.00027409578681304264, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.0002866906353604765, + "loss": 0.0296, "step": 34230 }, { - "epoch": 0.17, - "learning_rate": 0.0002740882191200286, - "loss": 0.0223, + "epoch": 0.09, + "learning_rate": 0.000286686747144105, + "loss": 0.0349, "step": 34240 }, { - "epoch": 0.17, - "learning_rate": 0.0002740806514270146, - "loss": 0.0229, + "epoch": 0.09, + "learning_rate": 0.0002866828589277336, + "loss": 0.0629, "step": 34250 }, { - "epoch": 0.17, - "learning_rate": 0.00027407308373400064, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.0002866789707113621, + "loss": 0.033, "step": 34260 }, { - "epoch": 0.17, - "learning_rate": 0.0002740655160409866, - "loss": 0.0233, + "epoch": 0.09, + "learning_rate": 0.00028667508249499067, + "loss": 0.0349, "step": 34270 }, { - "epoch": 0.17, - "learning_rate": 0.0002740579483479726, - "loss": 0.0288, + "epoch": 0.09, + "learning_rate": 0.0002866711942786192, + "loss": 0.0357, "step": 34280 }, { - "epoch": 0.17, - "learning_rate": 0.0002740503806549586, - "loss": 0.0272, + "epoch": 0.09, + "learning_rate": 0.00028666730606224776, + "loss": 0.0318, "step": 34290 }, { - "epoch": 0.17, - "learning_rate": 0.00027404281296194457, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.00028666341784587627, + "loss": 0.0318, "step": 34300 }, { - "epoch": 0.17, - "learning_rate": 0.00027403524526893055, - "loss": 0.0286, + "epoch": 0.09, + "learning_rate": 0.0002866595296295048, + "loss": 0.0316, "step": 34310 }, { - "epoch": 0.17, - "learning_rate": 0.0002740276775759166, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.0002866556414131333, + "loss": 0.0368, "step": 34320 }, { - "epoch": 0.17, - "learning_rate": 0.00027402010988290256, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.00028665175319676187, + "loss": 0.0302, "step": 34330 }, { - "epoch": 0.17, - "learning_rate": 0.00027401254218988854, - "loss": 0.0323, + "epoch": 0.09, + "learning_rate": 0.0002866478649803904, + "loss": 0.0298, "step": 34340 }, { - "epoch": 0.17, - "learning_rate": 0.0002740049744968745, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.00028664397676401895, + "loss": 0.0325, "step": 34350 }, { - "epoch": 0.17, - "learning_rate": 0.0002739974068038605, - "loss": 0.0277, + "epoch": 0.09, + "learning_rate": 0.00028664008854764747, + "loss": 0.0331, "step": 34360 }, { - "epoch": 0.17, - "learning_rate": 0.0002739898391108465, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.00028663620033127603, + "loss": 0.0473, "step": 34370 }, { - "epoch": 0.17, - "learning_rate": 0.0002739822714178325, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.00028663231211490455, + "loss": 0.0404, "step": 34380 }, { - "epoch": 0.17, - "learning_rate": 0.0002739747037248185, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.00028662842389853306, + "loss": 0.0357, "step": 34390 }, { - "epoch": 0.17, - "learning_rate": 0.0002739671360318045, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.0002866245356821616, + "loss": 0.0317, "step": 34400 }, { - "epoch": 0.17, - "learning_rate": 0.00027395956833879047, - "loss": 0.0213, + "epoch": 0.09, + "learning_rate": 0.00028662064746579015, + "loss": 0.0334, "step": 34410 }, { - "epoch": 0.17, - "learning_rate": 0.00027395200064577645, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.0002866167592494187, + "loss": 0.0366, "step": 34420 }, { - "epoch": 0.17, - "learning_rate": 0.00027394443295276243, - "loss": 0.0225, + "epoch": 0.09, + "learning_rate": 0.00028661287103304723, + "loss": 0.0337, "step": 34430 }, { - "epoch": 0.17, - "learning_rate": 0.0002739368652597484, - "loss": 0.0276, + "epoch": 0.09, + "learning_rate": 0.00028660898281667574, + "loss": 0.0334, "step": 34440 }, { - "epoch": 0.17, - "learning_rate": 0.00027392929756673445, - "loss": 0.0242, + "epoch": 0.09, + "learning_rate": 0.0002866050946003043, + "loss": 0.0324, "step": 34450 }, { - "epoch": 0.17, - "learning_rate": 0.00027392172987372043, - "loss": 0.0296, + "epoch": 0.09, + "learning_rate": 0.00028660120638393283, + "loss": 0.0362, "step": 34460 }, { - "epoch": 0.17, - "learning_rate": 0.0002739141621807064, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.00028659731816756134, + "loss": 0.0342, "step": 34470 }, { - "epoch": 0.17, - "learning_rate": 0.0002739065944876924, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.0002865934299511899, + "loss": 0.0281, "step": 34480 }, { - "epoch": 0.17, - "learning_rate": 0.0002738990267946784, - "loss": 0.0237, + "epoch": 0.09, + "learning_rate": 0.0002865895417348184, + "loss": 0.0316, "step": 34490 }, { - "epoch": 0.17, - "learning_rate": 0.00027389145910166436, - "loss": 0.0226, + "epoch": 0.09, + "learning_rate": 0.000286585653518447, + "loss": 0.0301, "step": 34500 }, { - "epoch": 0.17, - "learning_rate": 0.0002738838914086504, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.0002865817653020755, + "loss": 0.0347, "step": 34510 }, { - "epoch": 0.17, - "learning_rate": 0.0002738763237156364, - "loss": 0.0301, + "epoch": 0.09, + "learning_rate": 0.000286577877085704, + "loss": 0.0344, "step": 34520 }, { - "epoch": 0.17, - "learning_rate": 0.00027386875602262236, - "loss": 0.0272, + "epoch": 0.09, + "learning_rate": 0.00028657398886933254, + "loss": 0.0392, "step": 34530 }, { - "epoch": 0.17, - "learning_rate": 0.00027386118832960834, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.0002865701006529611, + "loss": 0.0526, "step": 34540 }, { - "epoch": 0.17, - "learning_rate": 0.0002738536206365943, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.0002865662124365897, + "loss": 0.0416, "step": 34550 }, { - "epoch": 0.17, - "learning_rate": 0.0002738460529435803, - "loss": 0.0228, + "epoch": 0.09, + "learning_rate": 0.0002865623242202182, + "loss": 0.0348, "step": 34560 }, { - "epoch": 0.17, - "learning_rate": 0.0002738384852505663, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.0002865584360038467, + "loss": 0.0352, "step": 34570 }, { - "epoch": 0.17, - "learning_rate": 0.00027383091755755226, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.0002865545477874753, + "loss": 0.0297, "step": 34580 }, { - "epoch": 0.17, - "learning_rate": 0.00027382334986453824, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.0002865506595711038, + "loss": 0.0363, "step": 34590 }, { - "epoch": 0.17, - "learning_rate": 0.0002738157821715242, - "loss": 0.0313, + "epoch": 0.09, + "learning_rate": 0.0002865467713547323, + "loss": 0.0632, "step": 34600 }, { - "epoch": 0.17, - "learning_rate": 0.00027380821447851026, - "loss": 0.0229, + "epoch": 0.09, + "learning_rate": 0.00028654288313836087, + "loss": 0.0357, "step": 34610 }, { - "epoch": 0.17, - "learning_rate": 0.00027380064678549624, - "loss": 0.0182, + "epoch": 0.09, + "learning_rate": 0.0002865389949219894, + "loss": 0.0312, "step": 34620 }, { - "epoch": 0.17, - "learning_rate": 0.0002737930790924822, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028653510670561795, + "loss": 0.0295, "step": 34630 }, { - "epoch": 0.17, - "learning_rate": 0.0002737855113994682, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028653121848924647, + "loss": 0.0305, "step": 34640 }, { - "epoch": 0.17, - "learning_rate": 0.0002737779437064542, - "loss": 0.0218, + "epoch": 0.09, + "learning_rate": 0.000286527330272875, + "loss": 0.0392, "step": 34650 }, { - "epoch": 0.17, - "learning_rate": 0.00027377037601344017, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.00028652344205650355, + "loss": 0.0279, "step": 34660 }, { - "epoch": 0.17, - "learning_rate": 0.00027376280832042615, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.00028651955384013207, + "loss": 0.037, "step": 34670 }, { - "epoch": 0.17, - "learning_rate": 0.0002737552406274122, - "loss": 0.0192, + "epoch": 0.09, + "learning_rate": 0.0002865156656237606, + "loss": 0.0366, "step": 34680 }, { - "epoch": 0.18, - "learning_rate": 0.00027374767293439817, - "loss": 0.0239, + "epoch": 0.09, + "learning_rate": 0.00028651177740738915, + "loss": 0.031, "step": 34690 }, { - "epoch": 0.18, - "learning_rate": 0.00027374010524138415, - "loss": 0.0198, + "epoch": 0.09, + "learning_rate": 0.0002865078891910177, + "loss": 0.032, "step": 34700 }, { - "epoch": 0.18, - "learning_rate": 0.00027373253754837013, - "loss": 0.0267, + "epoch": 0.09, + "learning_rate": 0.00028650400097464623, + "loss": 0.0319, "step": 34710 }, { - "epoch": 0.18, - "learning_rate": 0.0002737249698553561, - "loss": 0.0285, + "epoch": 0.09, + "learning_rate": 0.00028650011275827475, + "loss": 0.0321, "step": 34720 }, { - "epoch": 0.18, - "learning_rate": 0.0002737174021623421, - "loss": 0.0223, + "epoch": 0.09, + "learning_rate": 0.00028649622454190326, + "loss": 0.0305, "step": 34730 }, { - "epoch": 0.18, - "learning_rate": 0.00027370983446932813, - "loss": 0.0228, + "epoch": 0.09, + "learning_rate": 0.0002864923363255318, + "loss": 0.0333, "step": 34740 }, { - "epoch": 0.18, - "learning_rate": 0.0002737022667763141, - "loss": 0.0204, + "epoch": 0.09, + "learning_rate": 0.00028648844810916035, + "loss": 0.0372, "step": 34750 }, { - "epoch": 0.18, - "learning_rate": 0.0002736946990833001, - "loss": 0.0211, + "epoch": 0.09, + "learning_rate": 0.0002864845598927889, + "loss": 0.0374, "step": 34760 }, { - "epoch": 0.18, - "learning_rate": 0.00027368713139028607, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.00028648067167641743, + "loss": 0.0301, "step": 34770 }, { - "epoch": 0.18, - "learning_rate": 0.00027367956369727205, - "loss": 0.0251, + "epoch": 0.09, + "learning_rate": 0.00028647678346004594, + "loss": 0.0296, "step": 34780 }, { - "epoch": 0.18, - "learning_rate": 0.00027367199600425804, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.0002864728952436745, + "loss": 0.0301, "step": 34790 }, { - "epoch": 0.18, - "learning_rate": 0.00027366442831124407, - "loss": 0.0338, + "epoch": 0.09, + "learning_rate": 0.000286469007027303, + "loss": 0.0389, "step": 34800 }, { - "epoch": 0.18, - "learning_rate": 0.00027365686061823005, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028646511881093154, + "loss": 0.034, "step": 34810 }, { - "epoch": 0.18, - "learning_rate": 0.00027364929292521603, - "loss": 0.0304, + "epoch": 0.09, + "learning_rate": 0.0002864612305945601, + "loss": 0.0327, "step": 34820 }, { - "epoch": 0.18, - "learning_rate": 0.000273641725232202, - "loss": 0.0239, + "epoch": 0.09, + "learning_rate": 0.0002864573423781886, + "loss": 0.034, "step": 34830 }, { - "epoch": 0.18, - "learning_rate": 0.000273634157539188, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.0002864534541618172, + "loss": 0.0349, "step": 34840 }, { - "epoch": 0.18, - "learning_rate": 0.000273626589846174, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.0002864495659454457, + "loss": 0.0327, "step": 34850 }, { - "epoch": 0.18, - "learning_rate": 0.00027361902215315996, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.0002864456777290742, + "loss": 0.0286, "step": 34860 }, { - "epoch": 0.18, - "learning_rate": 0.000273611454460146, - "loss": 0.0213, + "epoch": 0.09, + "learning_rate": 0.0002864417895127028, + "loss": 0.0297, "step": 34870 }, { - "epoch": 0.18, - "learning_rate": 0.000273603886767132, - "loss": 0.0225, + "epoch": 0.09, + "learning_rate": 0.0002864379012963313, + "loss": 0.0224, "step": 34880 }, { - "epoch": 0.18, - "learning_rate": 0.00027359631907411796, - "loss": 0.0259, + "epoch": 0.09, + "learning_rate": 0.0002864340130799598, + "loss": 0.0296, "step": 34890 }, { - "epoch": 0.18, - "learning_rate": 0.00027358875138110394, - "loss": 0.0226, + "epoch": 0.09, + "learning_rate": 0.0002864301248635884, + "loss": 0.0295, "step": 34900 }, { - "epoch": 0.18, - "learning_rate": 0.0002735811836880899, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.00028642623664721696, + "loss": 0.0271, "step": 34910 }, { - "epoch": 0.18, - "learning_rate": 0.0002735736159950759, - "loss": 0.0255, + "epoch": 0.09, + "learning_rate": 0.00028642234843084547, + "loss": 0.0348, "step": 34920 }, { - "epoch": 0.18, - "learning_rate": 0.00027356604830206194, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.000286418460214474, + "loss": 0.0335, "step": 34930 }, { - "epoch": 0.18, - "learning_rate": 0.0002735584806090479, - "loss": 0.0275, + "epoch": 0.09, + "learning_rate": 0.0002864145719981025, + "loss": 0.0311, "step": 34940 }, { - "epoch": 0.18, - "learning_rate": 0.0002735509129160339, - "loss": 0.0252, + "epoch": 0.09, + "learning_rate": 0.00028641068378173107, + "loss": 0.031, "step": 34950 }, { - "epoch": 0.18, - "learning_rate": 0.0002735433452230199, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.0002864067955653596, + "loss": 0.0303, "step": 34960 }, { - "epoch": 0.18, - "learning_rate": 0.00027353577753000586, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.00028640290734898815, + "loss": 0.0375, "step": 34970 }, { - "epoch": 0.18, - "learning_rate": 0.00027352820983699185, - "loss": 0.0299, + "epoch": 0.09, + "learning_rate": 0.00028639901913261667, + "loss": 0.0322, "step": 34980 }, { - "epoch": 0.18, - "learning_rate": 0.0002735206421439778, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.0002863951309162452, + "loss": 0.0291, "step": 34990 }, { - "epoch": 0.18, - "learning_rate": 0.00027351307445096386, - "loss": 0.0209, + "epoch": 0.09, + "learning_rate": 0.00028639124269987375, + "loss": 0.0372, "step": 35000 }, { - "epoch": 0.18, - "eval_cer": 0.9144683151109114, - "eval_loss": 0.01787448488175869, - "eval_runtime": 117.4101, - "eval_samples_per_second": 17.034, - "eval_steps_per_second": 4.259, + "epoch": 0.09, + "eval_cer": 0.8818622449336642, + "eval_loss": 0.023330524563789368, + "eval_runtime": 107.4947, + "eval_samples_per_second": 18.606, + "eval_steps_per_second": 4.651, "step": 35000 }, { - "epoch": 0.18, - "learning_rate": 0.00027350550675794984, - "loss": 0.0287, + "epoch": 0.09, + "learning_rate": 0.00028638735448350227, + "loss": 0.0309, "step": 35010 }, { - "epoch": 0.18, - "learning_rate": 0.0002734979390649358, - "loss": 0.0266, + "epoch": 0.09, + "learning_rate": 0.0002863834662671308, + "loss": 0.0395, "step": 35020 }, { - "epoch": 0.18, - "learning_rate": 0.0002734903713719218, - "loss": 0.0211, + "epoch": 0.09, + "learning_rate": 0.00028637957805075935, + "loss": 0.0353, "step": 35030 }, { - "epoch": 0.18, - "learning_rate": 0.0002734828036789078, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028637568983438786, + "loss": 0.0329, "step": 35040 }, { - "epoch": 0.18, - "learning_rate": 0.00027347523598589377, - "loss": 0.0237, + "epoch": 0.09, + "learning_rate": 0.00028637180161801643, + "loss": 0.035, "step": 35050 }, { - "epoch": 0.18, - "learning_rate": 0.0002734676682928798, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.00028636791340164495, + "loss": 0.0342, "step": 35060 }, { - "epoch": 0.18, - "learning_rate": 0.0002734601005998658, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.00028636402518527346, + "loss": 0.0281, "step": 35070 }, { - "epoch": 0.18, - "learning_rate": 0.00027345253290685177, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.00028636013696890203, + "loss": 0.0355, "step": 35080 }, { - "epoch": 0.18, - "learning_rate": 0.00027344496521383775, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.00028635624875253054, + "loss": 0.0348, "step": 35090 }, { - "epoch": 0.18, - "learning_rate": 0.00027343739752082373, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.0002863523605361591, + "loss": 0.0323, "step": 35100 }, { - "epoch": 0.18, - "learning_rate": 0.0002734298298278097, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028634847231978763, + "loss": 0.0315, "step": 35110 }, { - "epoch": 0.18, - "learning_rate": 0.00027342226213479575, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.0002863445841034162, + "loss": 0.0297, "step": 35120 }, { - "epoch": 0.18, - "learning_rate": 0.00027341469444178173, - "loss": 0.0251, + "epoch": 0.09, + "learning_rate": 0.0002863406958870447, + "loss": 0.0361, "step": 35130 }, { - "epoch": 0.18, - "learning_rate": 0.0002734071267487677, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.0002863368076706732, + "loss": 0.0356, "step": 35140 }, { - "epoch": 0.18, - "learning_rate": 0.0002733995590557537, - "loss": 0.0239, + "epoch": 0.09, + "learning_rate": 0.00028633291945430174, + "loss": 0.0347, "step": 35150 }, { - "epoch": 0.18, - "learning_rate": 0.0002733919913627397, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002863290312379303, + "loss": 0.028, "step": 35160 }, { - "epoch": 0.18, - "learning_rate": 0.00027338442366972566, - "loss": 0.0257, - "step": 35170 + "epoch": 0.09, + "learning_rate": 0.0002863251430215588, + "loss": 0.0314, + "step": 35170 }, { - "epoch": 0.18, - "learning_rate": 0.00027337685597671164, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002863212548051874, + "loss": 0.0365, "step": 35180 }, { - "epoch": 0.18, - "learning_rate": 0.00027336928828369767, - "loss": 0.0274, + "epoch": 0.09, + "learning_rate": 0.0002863173665888159, + "loss": 0.0377, "step": 35190 }, { - "epoch": 0.18, - "learning_rate": 0.00027336172059068365, - "loss": 0.0238, + "epoch": 0.09, + "learning_rate": 0.0002863134783724445, + "loss": 0.0276, "step": 35200 }, { - "epoch": 0.18, - "learning_rate": 0.00027335415289766964, - "loss": 0.0302, + "epoch": 0.09, + "learning_rate": 0.000286309590156073, + "loss": 0.0345, "step": 35210 }, { - "epoch": 0.18, - "learning_rate": 0.0002733465852046556, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.0002863057019397015, + "loss": 0.0278, "step": 35220 }, { - "epoch": 0.18, - "learning_rate": 0.0002733390175116416, - "loss": 0.0286, + "epoch": 0.09, + "learning_rate": 0.00028630181372333, + "loss": 0.0336, "step": 35230 }, { - "epoch": 0.18, - "learning_rate": 0.0002733314498186276, - "loss": 0.028, + "epoch": 0.09, + "learning_rate": 0.0002862979255069586, + "loss": 0.0361, "step": 35240 }, { - "epoch": 0.18, - "learning_rate": 0.0002733238821256136, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.00028629403729058716, + "loss": 0.0316, "step": 35250 }, { - "epoch": 0.18, - "learning_rate": 0.0002733163144325996, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.00028629014907421567, + "loss": 0.041, "step": 35260 }, { - "epoch": 0.18, - "learning_rate": 0.0002733087467395856, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.0002862862608578442, + "loss": 0.0273, "step": 35270 }, { - "epoch": 0.18, - "learning_rate": 0.00027330117904657156, - "loss": 0.0198, + "epoch": 0.09, + "learning_rate": 0.0002862823726414727, + "loss": 0.0333, "step": 35280 }, { - "epoch": 0.18, - "learning_rate": 0.00027329361135355754, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.00028627848442510127, + "loss": 0.0311, "step": 35290 }, { - "epoch": 0.18, - "learning_rate": 0.0002732860436605435, - "loss": 0.0212, + "epoch": 0.09, + "learning_rate": 0.0002862745962087298, + "loss": 0.0359, "step": 35300 }, { - "epoch": 0.18, - "learning_rate": 0.00027327847596752956, - "loss": 0.0283, + "epoch": 0.09, + "learning_rate": 0.00028627070799235835, + "loss": 0.0289, "step": 35310 }, { - "epoch": 0.18, - "learning_rate": 0.00027327090827451554, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028626681977598687, + "loss": 0.0288, "step": 35320 }, { - "epoch": 0.18, - "learning_rate": 0.0002732633405815015, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.00028626293155961544, + "loss": 0.0372, "step": 35330 }, { - "epoch": 0.18, - "learning_rate": 0.0002732557728884875, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.00028625904334324395, + "loss": 0.0263, "step": 35340 }, { - "epoch": 0.18, - "learning_rate": 0.0002732482051954735, - "loss": 0.0209, + "epoch": 0.09, + "learning_rate": 0.00028625515512687246, + "loss": 0.0221, "step": 35350 }, { - "epoch": 0.18, - "learning_rate": 0.00027324063750245947, - "loss": 0.0215, + "epoch": 0.09, + "learning_rate": 0.000286251266910501, + "loss": 0.0304, "step": 35360 }, { - "epoch": 0.18, - "learning_rate": 0.00027323306980944545, - "loss": 0.0196, + "epoch": 0.09, + "learning_rate": 0.00028624737869412955, + "loss": 0.0283, "step": 35370 }, { - "epoch": 0.18, - "learning_rate": 0.0002732255021164315, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028624349047775806, + "loss": 0.0278, "step": 35380 }, { - "epoch": 0.18, - "learning_rate": 0.00027321793442341746, - "loss": 0.0289, + "epoch": 0.09, + "learning_rate": 0.00028623960226138663, + "loss": 0.0317, "step": 35390 }, { - "epoch": 0.18, - "learning_rate": 0.00027321036673040345, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028623571404501515, + "loss": 0.0385, "step": 35400 }, { - "epoch": 0.18, - "learning_rate": 0.0002732027990373894, - "loss": 0.0211, + "epoch": 0.09, + "learning_rate": 0.0002862318258286437, + "loss": 0.0314, "step": 35410 }, { - "epoch": 0.18, - "learning_rate": 0.0002731952313443754, - "loss": 0.025, + "epoch": 0.09, + "learning_rate": 0.00028622793761227223, + "loss": 0.033, "step": 35420 }, { - "epoch": 0.18, - "learning_rate": 0.0002731876636513614, - "loss": 0.0214, + "epoch": 0.09, + "learning_rate": 0.00028622404939590074, + "loss": 0.0306, "step": 35430 }, { - "epoch": 0.18, - "learning_rate": 0.0002731800959583474, - "loss": 0.0198, + "epoch": 0.09, + "learning_rate": 0.00028622016117952926, + "loss": 0.0333, "step": 35440 }, { - "epoch": 0.18, - "learning_rate": 0.0002731725282653334, - "loss": 0.0235, + "epoch": 0.09, + "learning_rate": 0.0002862162729631578, + "loss": 0.0344, "step": 35450 }, { - "epoch": 0.18, - "learning_rate": 0.0002731649605723194, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.0002862123847467864, + "loss": 0.0276, "step": 35460 }, { - "epoch": 0.18, - "learning_rate": 0.00027315739287930537, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.0002862084965304149, + "loss": 0.0299, "step": 35470 }, { - "epoch": 0.18, - "learning_rate": 0.00027314982518629135, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.0002862046083140434, + "loss": 0.0278, "step": 35480 }, { - "epoch": 0.18, - "learning_rate": 0.00027314225749327733, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.00028620072009767194, + "loss": 0.0278, "step": 35490 }, { - "epoch": 0.18, - "learning_rate": 0.0002731346898002633, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.0002861968318813005, + "loss": 0.0301, "step": 35500 }, { - "epoch": 0.18, - "learning_rate": 0.00027312712210724935, - "loss": 0.0291, + "epoch": 0.09, + "learning_rate": 0.000286192943664929, + "loss": 0.035, "step": 35510 }, { - "epoch": 0.18, - "learning_rate": 0.00027311955441423533, - "loss": 0.0322, + "epoch": 0.09, + "learning_rate": 0.0002861890554485576, + "loss": 0.032, "step": 35520 }, { - "epoch": 0.18, - "learning_rate": 0.0002731119867212213, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.0002861851672321861, + "loss": 0.0361, "step": 35530 }, { - "epoch": 0.18, - "learning_rate": 0.0002731044190282073, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.0002861812790158147, + "loss": 0.0395, "step": 35540 }, { - "epoch": 0.18, - "learning_rate": 0.0002730968513351933, - "loss": 0.0252, + "epoch": 0.09, + "learning_rate": 0.0002861773907994432, + "loss": 0.0301, "step": 35550 }, { - "epoch": 0.18, - "learning_rate": 0.00027308928364217926, - "loss": 0.0342, + "epoch": 0.09, + "learning_rate": 0.0002861735025830717, + "loss": 0.0344, "step": 35560 }, { - "epoch": 0.18, - "learning_rate": 0.0002730817159491653, - "loss": 0.0298, + "epoch": 0.09, + "learning_rate": 0.0002861696143667002, + "loss": 0.029, "step": 35570 }, { - "epoch": 0.18, - "learning_rate": 0.0002730741482561513, - "loss": 0.0258, + "epoch": 0.09, + "learning_rate": 0.0002861657261503288, + "loss": 0.0337, "step": 35580 }, { - "epoch": 0.18, - "learning_rate": 0.00027306658056313726, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.0002861618379339573, + "loss": 0.0277, "step": 35590 }, { - "epoch": 0.18, - "learning_rate": 0.00027305901287012324, - "loss": 0.0302, + "epoch": 0.09, + "learning_rate": 0.00028615794971758587, + "loss": 0.0283, "step": 35600 }, { - "epoch": 0.18, - "learning_rate": 0.0002730514451771092, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.0002861540615012144, + "loss": 0.0341, "step": 35610 }, { - "epoch": 0.18, - "learning_rate": 0.0002730438774840952, - "loss": 0.0255, + "epoch": 0.09, + "learning_rate": 0.00028615017328484295, + "loss": 0.0324, "step": 35620 }, { - "epoch": 0.18, - "learning_rate": 0.00027303630979108124, - "loss": 0.0271, + "epoch": 0.09, + "learning_rate": 0.00028614628506847147, + "loss": 0.0267, "step": 35630 }, { - "epoch": 0.18, - "learning_rate": 0.0002730287420980672, - "loss": 0.0264, + "epoch": 0.09, + "learning_rate": 0.0002861423968521, + "loss": 0.0308, "step": 35640 }, { - "epoch": 0.18, - "learning_rate": 0.0002730211744050532, - "loss": 0.0195, + "epoch": 0.09, + "learning_rate": 0.00028613850863572855, + "loss": 0.0315, "step": 35650 }, { - "epoch": 0.18, - "learning_rate": 0.0002730136067120392, - "loss": 0.0241, + "epoch": 0.09, + "learning_rate": 0.00028613462041935707, + "loss": 0.028, "step": 35660 }, { - "epoch": 0.18, - "learning_rate": 0.00027300603901902516, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.00028613073220298563, + "loss": 0.0361, "step": 35670 }, { - "epoch": 0.18, - "learning_rate": 0.00027299847132601114, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.00028612684398661415, + "loss": 0.0362, "step": 35680 }, { - "epoch": 0.18, - "learning_rate": 0.0002729909036329971, - "loss": 0.0234, + "epoch": 0.09, + "learning_rate": 0.00028612295577024266, + "loss": 0.0338, "step": 35690 }, { - "epoch": 0.18, - "learning_rate": 0.00027298333593998316, - "loss": 0.0209, + "epoch": 0.09, + "learning_rate": 0.00028611906755387123, + "loss": 0.0311, "step": 35700 }, { - "epoch": 0.18, - "learning_rate": 0.00027297576824696914, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.00028611517933749975, + "loss": 0.0286, "step": 35710 }, { - "epoch": 0.18, - "learning_rate": 0.0002729682005539551, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028611129112112826, + "loss": 0.0324, "step": 35720 }, { - "epoch": 0.18, - "learning_rate": 0.0002729606328609411, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.00028610740290475683, + "loss": 0.0299, "step": 35730 }, { - "epoch": 0.18, - "learning_rate": 0.0002729530651679271, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028610351468838534, + "loss": 0.0268, "step": 35740 }, { - "epoch": 0.18, - "learning_rate": 0.00027294549747491307, - "loss": 0.0195, + "epoch": 0.09, + "learning_rate": 0.0002860996264720139, + "loss": 0.0258, "step": 35750 }, { - "epoch": 0.18, - "learning_rate": 0.0002729379297818991, - "loss": 0.0239, + "epoch": 0.09, + "learning_rate": 0.00028609573825564243, + "loss": 0.0281, "step": 35760 }, { - "epoch": 0.18, - "learning_rate": 0.0002729303620888851, - "loss": 0.0248, + "epoch": 0.09, + "learning_rate": 0.00028609185003927094, + "loss": 0.028, "step": 35770 }, { - "epoch": 0.18, - "learning_rate": 0.00027292279439587107, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.00028608796182289946, + "loss": 0.0323, "step": 35780 }, { - "epoch": 0.18, - "learning_rate": 0.00027291522670285705, - "loss": 0.0179, + "epoch": 0.09, + "learning_rate": 0.000286084073606528, + "loss": 0.0346, "step": 35790 }, { - "epoch": 0.18, - "learning_rate": 0.00027290765900984303, - "loss": 0.0221, + "epoch": 0.09, + "learning_rate": 0.0002860801853901566, + "loss": 0.0326, "step": 35800 }, { - "epoch": 0.18, - "learning_rate": 0.000272900091316829, - "loss": 0.0205, + "epoch": 0.09, + "learning_rate": 0.0002860762971737851, + "loss": 0.0301, "step": 35810 }, { - "epoch": 0.18, - "learning_rate": 0.000272892523623815, - "loss": 0.0231, + "epoch": 0.09, + "learning_rate": 0.0002860724089574136, + "loss": 0.0346, "step": 35820 }, { - "epoch": 0.18, - "learning_rate": 0.00027288495593080097, - "loss": 0.0268, + "epoch": 0.09, + "learning_rate": 0.0002860685207410422, + "loss": 0.0287, "step": 35830 }, { - "epoch": 0.18, - "learning_rate": 0.00027287738823778695, - "loss": 0.0242, + "epoch": 0.09, + "learning_rate": 0.0002860646325246707, + "loss": 0.0321, "step": 35840 }, { - "epoch": 0.18, - "learning_rate": 0.00027286982054477294, - "loss": 0.0212, + "epoch": 0.09, + "learning_rate": 0.0002860607443082992, + "loss": 0.0401, "step": 35850 }, { - "epoch": 0.18, - "learning_rate": 0.00027286225285175897, - "loss": 0.0261, + "epoch": 0.09, + "learning_rate": 0.0002860568560919278, + "loss": 0.0338, "step": 35860 }, { - "epoch": 0.18, - "learning_rate": 0.00027285468515874495, - "loss": 0.0323, + "epoch": 0.09, + "learning_rate": 0.0002860529678755563, + "loss": 0.0291, "step": 35870 }, { - "epoch": 0.18, - "learning_rate": 0.00027284711746573093, - "loss": 0.0225, + "epoch": 0.09, + "learning_rate": 0.00028604907965918487, + "loss": 0.0344, "step": 35880 }, { - "epoch": 0.18, - "learning_rate": 0.0002728395497727169, - "loss": 0.0265, + "epoch": 0.09, + "learning_rate": 0.0002860451914428134, + "loss": 0.0319, "step": 35890 }, { - "epoch": 0.18, - "learning_rate": 0.0002728319820797029, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.0002860413032264419, + "loss": 0.0288, "step": 35900 }, { - "epoch": 0.18, - "learning_rate": 0.0002728244143866889, - "loss": 0.0237, + "epoch": 0.09, + "learning_rate": 0.00028603741501007047, + "loss": 0.029, "step": 35910 }, { - "epoch": 0.18, - "learning_rate": 0.00027281684669367486, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.000286033526793699, + "loss": 0.0317, "step": 35920 }, { - "epoch": 0.18, - "learning_rate": 0.0002728092790006609, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002860296385773275, + "loss": 0.0317, "step": 35930 }, { - "epoch": 0.18, - "learning_rate": 0.0002728017113076469, - "loss": 0.0273, + "epoch": 0.09, + "learning_rate": 0.00028602575036095607, + "loss": 0.0344, "step": 35940 }, { - "epoch": 0.18, - "learning_rate": 0.00027279414361463286, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.00028602186214458464, + "loss": 0.0313, "step": 35950 }, { - "epoch": 0.18, - "learning_rate": 0.00027278657592161884, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.00028601797392821315, + "loss": 0.0289, "step": 35960 }, { - "epoch": 0.18, - "learning_rate": 0.0002727790082286048, - "loss": 0.0257, + "epoch": 0.09, + "learning_rate": 0.00028601408571184167, + "loss": 0.0288, "step": 35970 }, { - "epoch": 0.18, - "learning_rate": 0.0002727714405355908, - "loss": 0.0219, + "epoch": 0.09, + "learning_rate": 0.0002860101974954702, + "loss": 0.0304, "step": 35980 }, { - "epoch": 0.18, - "learning_rate": 0.00027276387284257684, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.0002860063092790987, + "loss": 0.0291, "step": 35990 }, { - "epoch": 0.18, - "learning_rate": 0.0002727563051495628, - "loss": 0.0288, + "epoch": 0.09, + "learning_rate": 0.00028600242106272726, + "loss": 0.0372, "step": 36000 }, { - "epoch": 0.18, - "eval_cer": 0.9144993677869243, - "eval_loss": 0.017736734822392464, - "eval_runtime": 117.3015, - "eval_samples_per_second": 17.05, - "eval_steps_per_second": 4.263, + "epoch": 0.09, + "eval_cer": 0.8818356518319148, + "eval_loss": 0.022460658103227615, + "eval_runtime": 107.7073, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, "step": 36000 }, { - "epoch": 0.18, - "learning_rate": 0.0002727487374565488, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.00028599853284635583, + "loss": 0.034, "step": 36010 }, { - "epoch": 0.18, - "learning_rate": 0.0002727411697635348, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.00028599464462998435, + "loss": 0.032, "step": 36020 }, { - "epoch": 0.18, - "learning_rate": 0.00027273360207052076, - "loss": 0.0304, + "epoch": 0.09, + "learning_rate": 0.00028599075641361286, + "loss": 0.0327, "step": 36030 }, { - "epoch": 0.18, - "learning_rate": 0.00027272603437750675, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.00028598686819724143, + "loss": 0.0305, "step": 36040 }, { - "epoch": 0.18, - "learning_rate": 0.0002727184666844927, - "loss": 0.0254, + "epoch": 0.09, + "learning_rate": 0.00028598297998086995, + "loss": 0.0342, "step": 36050 }, { - "epoch": 0.18, - "learning_rate": 0.00027271089899147876, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.00028597909176449846, + "loss": 0.0327, "step": 36060 }, { - "epoch": 0.18, - "learning_rate": 0.00027270333129846474, - "loss": 0.0275, + "epoch": 0.09, + "learning_rate": 0.00028597520354812703, + "loss": 0.0262, "step": 36070 }, { - "epoch": 0.18, - "learning_rate": 0.0002726957636054507, - "loss": 0.0228, + "epoch": 0.09, + "learning_rate": 0.00028597131533175554, + "loss": 0.0342, "step": 36080 }, { - "epoch": 0.18, - "learning_rate": 0.0002726881959124367, - "loss": 0.0233, + "epoch": 0.09, + "learning_rate": 0.0002859674271153841, + "loss": 0.028, "step": 36090 }, { - "epoch": 0.18, - "learning_rate": 0.0002726806282194227, - "loss": 0.0226, + "epoch": 0.09, + "learning_rate": 0.0002859635388990126, + "loss": 0.0308, "step": 36100 }, { - "epoch": 0.18, - "learning_rate": 0.00027267306052640867, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.00028595965068264114, + "loss": 0.0296, "step": 36110 }, { - "epoch": 0.18, - "learning_rate": 0.0002726654928333947, - "loss": 0.0246, + "epoch": 0.09, + "learning_rate": 0.0002859557624662697, + "loss": 0.0303, "step": 36120 }, { - "epoch": 0.18, - "learning_rate": 0.0002726579251403807, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.0002859518742498982, + "loss": 0.0283, "step": 36130 }, { - "epoch": 0.18, - "learning_rate": 0.00027265035744736667, - "loss": 0.0262, + "epoch": 0.09, + "learning_rate": 0.0002859479860335268, + "loss": 0.0245, "step": 36140 }, { - "epoch": 0.18, - "learning_rate": 0.00027264278975435265, - "loss": 0.0247, + "epoch": 0.09, + "learning_rate": 0.0002859440978171553, + "loss": 0.0319, "step": 36150 }, { - "epoch": 0.18, - "learning_rate": 0.00027263522206133863, - "loss": 0.0173, + "epoch": 0.09, + "learning_rate": 0.0002859402096007839, + "loss": 0.0341, "step": 36160 }, { - "epoch": 0.18, - "learning_rate": 0.0002726276543683246, + "epoch": 0.09, + "learning_rate": 0.0002859363213844124, "loss": 0.0275, "step": 36170 }, { - "epoch": 0.18, - "learning_rate": 0.00027262008667531065, - "loss": 0.0216, + "epoch": 0.09, + "learning_rate": 0.0002859324331680409, + "loss": 0.0256, "step": 36180 }, { - "epoch": 0.18, - "learning_rate": 0.00027261251898229663, - "loss": 0.0252, + "epoch": 0.09, + "learning_rate": 0.0002859285449516694, + "loss": 0.0579, "step": 36190 }, { - "epoch": 0.18, - "learning_rate": 0.0002726049512892826, - "loss": 0.0233, + "epoch": 0.09, + "learning_rate": 0.000285924656735298, + "loss": 0.0266, "step": 36200 }, { - "epoch": 0.18, - "learning_rate": 0.0002725973835962686, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.0002859207685189265, + "loss": 0.0296, "step": 36210 }, { - "epoch": 0.18, - "learning_rate": 0.0002725898159032546, - "loss": 0.0275, + "epoch": 0.09, + "learning_rate": 0.00028591688030255507, + "loss": 0.0374, "step": 36220 }, { - "epoch": 0.18, - "learning_rate": 0.00027258224821024056, - "loss": 0.0284, + "epoch": 0.09, + "learning_rate": 0.0002859129920861836, + "loss": 0.0298, "step": 36230 }, { - "epoch": 0.18, - "learning_rate": 0.00027257468051722654, - "loss": 0.034, + "epoch": 0.09, + "learning_rate": 0.0002859091038698121, + "loss": 0.0305, "step": 36240 }, { - "epoch": 0.18, - "learning_rate": 0.00027256711282421257, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.00028590521565344067, + "loss": 0.0346, "step": 36250 }, { - "epoch": 0.18, - "learning_rate": 0.00027255954513119855, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.0002859013274370692, + "loss": 0.028, "step": 36260 }, { - "epoch": 0.18, - "learning_rate": 0.00027255197743818454, - "loss": 0.0238, + "epoch": 0.09, + "learning_rate": 0.0002858974392206977, + "loss": 0.031, "step": 36270 }, { - "epoch": 0.18, - "learning_rate": 0.0002725444097451705, - "loss": 0.0279, + "epoch": 0.09, + "learning_rate": 0.00028589355100432627, + "loss": 0.025, "step": 36280 }, { - "epoch": 0.18, - "learning_rate": 0.0002725368420521565, - "loss": 0.0303, + "epoch": 0.09, + "learning_rate": 0.00028588966278795484, + "loss": 0.0344, "step": 36290 }, { - "epoch": 0.18, - "learning_rate": 0.0002725292743591425, - "loss": 0.0305, + "epoch": 0.09, + "learning_rate": 0.00028588577457158335, + "loss": 0.0286, "step": 36300 }, { - "epoch": 0.18, - "learning_rate": 0.0002725217066661285, - "loss": 0.0226, + "epoch": 0.09, + "learning_rate": 0.00028588188635521187, + "loss": 0.0284, "step": 36310 }, { - "epoch": 0.18, - "learning_rate": 0.0002725141389731145, - "loss": 0.0211, + "epoch": 0.09, + "learning_rate": 0.0002858779981388404, + "loss": 0.0237, "step": 36320 }, { - "epoch": 0.18, - "learning_rate": 0.0002725065712801005, - "loss": 0.0224, + "epoch": 0.09, + "learning_rate": 0.00028587410992246895, + "loss": 0.0293, "step": 36330 }, { - "epoch": 0.18, - "learning_rate": 0.00027249900358708646, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.00028587022170609746, + "loss": 0.0281, "step": 36340 }, { - "epoch": 0.18, - "learning_rate": 0.00027249143589407244, + "epoch": 0.09, + "learning_rate": 0.00028586633348972603, "loss": 0.0276, "step": 36350 }, { - "epoch": 0.18, - "learning_rate": 0.0002724838682010584, - "loss": 0.0245, + "epoch": 0.09, + "learning_rate": 0.00028586244527335455, + "loss": 0.0321, "step": 36360 }, { - "epoch": 0.18, - "learning_rate": 0.00027247630050804446, - "loss": 0.024, + "epoch": 0.09, + "learning_rate": 0.0002858585570569831, + "loss": 0.0316, "step": 36370 }, { - "epoch": 0.18, - "learning_rate": 0.00027246873281503044, - "loss": 0.0213, + "epoch": 0.09, + "learning_rate": 0.00028585466884061163, + "loss": 0.0259, "step": 36380 }, { - "epoch": 0.18, - "learning_rate": 0.0002724611651220164, - "loss": 0.0307, + "epoch": 0.09, + "learning_rate": 0.00028585078062424014, + "loss": 0.0289, "step": 36390 }, { - "epoch": 0.18, - "learning_rate": 0.0002724535974290024, - "loss": 0.0263, + "epoch": 0.09, + "learning_rate": 0.00028584689240786866, + "loss": 0.0255, "step": 36400 }, { - "epoch": 0.18, - "learning_rate": 0.0002724460297359884, - "loss": 0.0227, + "epoch": 0.09, + "learning_rate": 0.00028584300419149723, + "loss": 0.0272, "step": 36410 }, { - "epoch": 0.18, - "learning_rate": 0.00027243846204297437, - "loss": 0.0236, + "epoch": 0.09, + "learning_rate": 0.00028583911597512574, + "loss": 0.0289, "step": 36420 }, { - "epoch": 0.18, - "learning_rate": 0.00027243089434996035, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.0002858352277587543, + "loss": 0.0277, "step": 36430 }, { - "epoch": 0.18, - "learning_rate": 0.0002724233266569464, - "loss": 0.0254, + "epoch": 0.09, + "learning_rate": 0.0002858313395423828, + "loss": 0.0284, "step": 36440 }, { - "epoch": 0.18, - "learning_rate": 0.00027241575896393236, - "loss": 0.0281, + "epoch": 0.09, + "learning_rate": 0.0002858274513260114, + "loss": 0.0298, "step": 36450 }, { - "epoch": 0.18, - "learning_rate": 0.00027240819127091835, - "loss": 0.0232, + "epoch": 0.09, + "learning_rate": 0.0002858235631096399, + "loss": 0.026, "step": 36460 }, { - "epoch": 0.18, - "learning_rate": 0.0002724006235779043, - "loss": 0.0223, + "epoch": 0.09, + "learning_rate": 0.0002858196748932684, + "loss": 0.0295, "step": 36470 }, { - "epoch": 0.18, - "learning_rate": 0.0002723930558848903, - "loss": 0.0208, + "epoch": 0.09, + "learning_rate": 0.00028581578667689694, + "loss": 0.0297, "step": 36480 }, { - "epoch": 0.18, - "learning_rate": 0.0002723854881918763, - "loss": 0.0249, + "epoch": 0.09, + "learning_rate": 0.0002858118984605255, + "loss": 0.0267, "step": 36490 }, { - "epoch": 0.18, - "learning_rate": 0.0002723779204988623, - "loss": 0.023, + "epoch": 0.09, + "learning_rate": 0.0002858080102441541, + "loss": 0.0366, "step": 36500 }, { - "epoch": 0.18, - "learning_rate": 0.0002723703528058483, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.0002858041220277826, + "loss": 0.0315, "step": 36510 }, { - "epoch": 0.18, - "learning_rate": 0.0002723627851128343, - "loss": 0.03, + "epoch": 0.09, + "learning_rate": 0.0002858002338114111, + "loss": 0.0275, "step": 36520 }, { - "epoch": 0.18, - "learning_rate": 0.00027235521741982027, - "loss": 0.0234, + "epoch": 0.09, + "learning_rate": 0.0002857963455950396, + "loss": 0.0272, "step": 36530 }, { - "epoch": 0.18, - "learning_rate": 0.00027234764972680625, - "loss": 0.0242, + "epoch": 0.09, + "learning_rate": 0.0002857924573786682, + "loss": 0.032, "step": 36540 }, { - "epoch": 0.18, - "learning_rate": 0.00027234008203379223, - "loss": 0.0294, + "epoch": 0.09, + "learning_rate": 0.0002857885691622967, + "loss": 0.0262, "step": 36550 }, { - "epoch": 0.18, - "learning_rate": 0.0002723325143407782, - "loss": 0.0256, + "epoch": 0.09, + "learning_rate": 0.00028578468094592527, + "loss": 0.0332, "step": 36560 }, { - "epoch": 0.18, - "learning_rate": 0.00027232494664776425, - "loss": 0.021, + "epoch": 0.09, + "learning_rate": 0.0002857807927295538, + "loss": 0.0296, "step": 36570 }, { - "epoch": 0.18, - "learning_rate": 0.00027231737895475023, - "loss": 0.0243, + "epoch": 0.09, + "learning_rate": 0.00028577690451318235, + "loss": 0.0298, "step": 36580 }, { - "epoch": 0.18, - "learning_rate": 0.0002723098112617362, - "loss": 0.028, + "epoch": 0.09, + "learning_rate": 0.00028577301629681087, + "loss": 0.0333, "step": 36590 }, { - "epoch": 0.18, - "learning_rate": 0.0002723022435687222, - "loss": 0.0244, + "epoch": 0.09, + "learning_rate": 0.0002857691280804394, + "loss": 0.0276, "step": 36600 }, { - "epoch": 0.18, - "learning_rate": 0.0002722946758757082, - "loss": 0.0219, + "epoch": 0.09, + "learning_rate": 0.0002857652398640679, + "loss": 0.034, "step": 36610 }, { - "epoch": 0.18, - "learning_rate": 0.00027228710818269416, - "loss": 0.026, + "epoch": 0.09, + "learning_rate": 0.00028576135164769647, + "loss": 0.0351, "step": 36620 }, { - "epoch": 0.18, - "learning_rate": 0.0002722795404896802, - "loss": 0.0216, + "epoch": 0.09, + "learning_rate": 0.000285757463431325, + "loss": 0.032, "step": 36630 }, { - "epoch": 0.18, - "learning_rate": 0.0002722719727966662, - "loss": 0.0226, + "epoch": 0.09, + "learning_rate": 0.00028575357521495355, + "loss": 0.0305, "step": 36640 }, { - "epoch": 0.18, - "learning_rate": 0.00027226440510365216, - "loss": 0.0201, + "epoch": 0.1, + "learning_rate": 0.00028574968699858206, + "loss": 0.0288, "step": 36650 }, { - "epoch": 0.18, - "learning_rate": 0.00027225683741063814, - "loss": 0.0263, + "epoch": 0.1, + "learning_rate": 0.00028574579878221063, + "loss": 0.0332, "step": 36660 }, { - "epoch": 0.19, - "learning_rate": 0.0002722492697176241, - "loss": 0.0205, + "epoch": 0.1, + "learning_rate": 0.00028574191056583915, + "loss": 0.0299, "step": 36670 }, { - "epoch": 0.19, - "learning_rate": 0.0002722417020246101, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.00028573802234946766, + "loss": 0.0318, "step": 36680 }, { - "epoch": 0.19, - "learning_rate": 0.00027223413433159614, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.00028573413413309623, + "loss": 0.0247, "step": 36690 }, { - "epoch": 0.19, - "learning_rate": 0.0002722265666385821, - "loss": 0.0249, + "epoch": 0.1, + "learning_rate": 0.00028573024591672475, + "loss": 0.0333, "step": 36700 }, { - "epoch": 0.19, - "learning_rate": 0.0002722189989455681, - "loss": 0.0224, + "epoch": 0.1, + "learning_rate": 0.0002857263577003533, + "loss": 0.0323, "step": 36710 }, { - "epoch": 0.19, - "learning_rate": 0.0002722114312525541, - "loss": 0.0221, + "epoch": 0.1, + "learning_rate": 0.00028572246948398183, + "loss": 0.0277, "step": 36720 }, { - "epoch": 0.19, - "learning_rate": 0.00027220386355954006, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.00028571858126761034, + "loss": 0.03, "step": 36730 }, { - "epoch": 0.19, - "learning_rate": 0.00027219629586652604, - "loss": 0.0195, + "epoch": 0.1, + "learning_rate": 0.00028571469305123886, + "loss": 0.0312, "step": 36740 }, { - "epoch": 0.19, - "learning_rate": 0.000272188728173512, - "loss": 0.0206, + "epoch": 0.1, + "learning_rate": 0.0002857108048348674, + "loss": 0.0307, "step": 36750 }, { - "epoch": 0.19, - "learning_rate": 0.00027218116048049806, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.00028570691661849594, + "loss": 0.0284, "step": 36760 }, { - "epoch": 0.19, - "learning_rate": 0.00027217359278748404, - "loss": 0.0263, + "epoch": 0.1, + "learning_rate": 0.0002857030284021245, + "loss": 0.029, "step": 36770 }, { - "epoch": 0.19, - "learning_rate": 0.00027216602509447, - "loss": 0.0195, + "epoch": 0.1, + "learning_rate": 0.000285699140185753, + "loss": 0.0252, "step": 36780 }, { - "epoch": 0.19, - "learning_rate": 0.000272158457401456, - "loss": 0.0277, + "epoch": 0.1, + "learning_rate": 0.0002856952519693816, + "loss": 0.0301, "step": 36790 }, { - "epoch": 0.19, - "learning_rate": 0.000272150889708442, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.0002856913637530101, + "loss": 0.0351, "step": 36800 }, { - "epoch": 0.19, - "learning_rate": 0.00027214332201542797, - "loss": 0.0289, + "epoch": 0.1, + "learning_rate": 0.0002856874755366386, + "loss": 0.033, "step": 36810 }, { - "epoch": 0.19, - "learning_rate": 0.000272135754322414, - "loss": 0.0276, + "epoch": 0.1, + "learning_rate": 0.00028568358732026714, + "loss": 0.0307, "step": 36820 }, { - "epoch": 0.19, - "learning_rate": 0.0002721281866294, - "loss": 0.0266, + "epoch": 0.1, + "learning_rate": 0.0002856796991038957, + "loss": 0.0361, "step": 36830 }, { - "epoch": 0.19, - "learning_rate": 0.00027212061893638597, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.0002856758108875243, + "loss": 0.0343, "step": 36840 }, { - "epoch": 0.19, - "learning_rate": 0.00027211305124337195, - "loss": 0.0262, + "epoch": 0.1, + "learning_rate": 0.0002856719226711528, + "loss": 0.0289, "step": 36850 }, { - "epoch": 0.19, - "learning_rate": 0.00027210548355035793, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.0002856680344547813, + "loss": 0.0337, "step": 36860 }, { - "epoch": 0.19, - "learning_rate": 0.0002720979158573439, - "loss": 0.028, + "epoch": 0.1, + "learning_rate": 0.00028566414623840987, + "loss": 0.0312, "step": 36870 }, { - "epoch": 0.19, - "learning_rate": 0.00027209034816432995, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.0002856602580220384, + "loss": 0.0296, "step": 36880 }, { - "epoch": 0.19, - "learning_rate": 0.0002720827804713159, - "loss": 0.0191, + "epoch": 0.1, + "learning_rate": 0.0002856563698056669, + "loss": 0.0514, "step": 36890 }, { - "epoch": 0.19, - "learning_rate": 0.0002720752127783019, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028565248158929547, + "loss": 0.0326, "step": 36900 }, { - "epoch": 0.19, - "learning_rate": 0.0002720676450852879, - "loss": 0.0195, + "epoch": 0.1, + "learning_rate": 0.000285648593372924, + "loss": 0.033, "step": 36910 }, { - "epoch": 0.19, - "learning_rate": 0.00027206007739227387, - "loss": 0.0199, + "epoch": 0.1, + "learning_rate": 0.00028564470515655255, + "loss": 0.0338, "step": 36920 }, { - "epoch": 0.19, - "learning_rate": 0.00027205250969925985, - "loss": 0.02, + "epoch": 0.1, + "learning_rate": 0.00028564081694018107, + "loss": 0.0336, "step": 36930 }, { - "epoch": 0.19, - "learning_rate": 0.00027204494200624583, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.0002856369287238096, + "loss": 0.031, "step": 36940 }, { - "epoch": 0.19, - "learning_rate": 0.00027203737431323187, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028563304050743815, + "loss": 0.0262, "step": 36950 }, { - "epoch": 0.19, - "learning_rate": 0.00027202980662021785, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028562915229106666, + "loss": 0.032, "step": 36960 }, { - "epoch": 0.19, - "learning_rate": 0.00027202223892720383, - "loss": 0.0295, + "epoch": 0.1, + "learning_rate": 0.0002856252640746952, + "loss": 0.0305, "step": 36970 }, { - "epoch": 0.19, - "learning_rate": 0.0002720146712341898, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.00028562137585832375, + "loss": 0.0383, "step": 36980 }, { - "epoch": 0.19, - "learning_rate": 0.0002720071035411758, - "loss": 0.0301, + "epoch": 0.1, + "learning_rate": 0.00028561748764195226, + "loss": 0.0298, "step": 36990 }, { - "epoch": 0.19, - "learning_rate": 0.0002719995358481618, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.00028561359942558083, + "loss": 0.03, "step": 37000 }, { - "epoch": 0.19, - "eval_cer": 0.9144654039225352, - "eval_loss": 0.018076682463288307, - "eval_runtime": 117.2546, - "eval_samples_per_second": 17.057, - "eval_steps_per_second": 4.264, + "epoch": 0.1, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.02250346727669239, + "eval_runtime": 107.7374, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 37000 }, { - "epoch": 0.19, - "learning_rate": 0.0002719919681551478, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.00028560971120920935, + "loss": 0.0322, "step": 37010 }, { - "epoch": 0.19, - "learning_rate": 0.0002719844004621338, - "loss": 0.0248, + "epoch": 0.1, + "learning_rate": 0.00028560582299283786, + "loss": 0.0336, "step": 37020 }, { - "epoch": 0.19, - "learning_rate": 0.0002719768327691198, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.0002856019347764664, + "loss": 0.0268, "step": 37030 }, { - "epoch": 0.19, - "learning_rate": 0.00027196926507610576, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.00028559804656009494, + "loss": 0.0301, "step": 37040 }, { - "epoch": 0.19, - "learning_rate": 0.00027196169738309174, - "loss": 0.022, + "epoch": 0.1, + "learning_rate": 0.0002855941583437235, + "loss": 0.0341, "step": 37050 }, { - "epoch": 0.19, - "learning_rate": 0.0002719541296900777, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.00028559027012735203, + "loss": 0.0292, "step": 37060 }, { - "epoch": 0.19, - "learning_rate": 0.0002719465619970637, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028558638191098054, + "loss": 0.0333, "step": 37070 }, { - "epoch": 0.19, - "learning_rate": 0.0002719389943040497, - "loss": 0.0225, + "epoch": 0.1, + "learning_rate": 0.0002855824936946091, + "loss": 0.0304, "step": 37080 }, { - "epoch": 0.19, - "learning_rate": 0.00027193142661103566, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.0002855786054782376, + "loss": 0.0321, "step": 37090 }, { - "epoch": 0.19, - "learning_rate": 0.00027192385891802165, - "loss": 0.0285, + "epoch": 0.1, + "learning_rate": 0.00028557471726186614, + "loss": 0.0288, "step": 37100 }, { - "epoch": 0.19, - "learning_rate": 0.00027191629122500763, - "loss": 0.0269, + "epoch": 0.1, + "learning_rate": 0.0002855708290454947, + "loss": 0.0275, "step": 37110 }, { - "epoch": 0.19, - "learning_rate": 0.00027190872353199366, - "loss": 0.0351, + "epoch": 0.1, + "learning_rate": 0.0002855669408291232, + "loss": 0.0328, "step": 37120 }, { - "epoch": 0.19, - "learning_rate": 0.00027190115583897964, - "loss": 0.022, + "epoch": 0.1, + "learning_rate": 0.0002855630526127518, + "loss": 0.0338, "step": 37130 }, { - "epoch": 0.19, - "learning_rate": 0.0002718935881459656, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.0002855591643963803, + "loss": 0.0276, "step": 37140 }, { - "epoch": 0.19, - "learning_rate": 0.0002718860204529516, - "loss": 0.0259, + "epoch": 0.1, + "learning_rate": 0.0002855552761800088, + "loss": 0.032, "step": 37150 }, { - "epoch": 0.19, - "learning_rate": 0.0002718784527599376, - "loss": 0.0287, + "epoch": 0.1, + "learning_rate": 0.0002855513879636374, + "loss": 0.0378, "step": 37160 }, { - "epoch": 0.19, - "learning_rate": 0.00027187088506692357, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.0002855474997472659, + "loss": 0.0328, "step": 37170 }, { - "epoch": 0.19, - "learning_rate": 0.0002718633173739096, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.0002855436115308944, + "loss": 0.032, "step": 37180 }, { - "epoch": 0.19, - "learning_rate": 0.0002718557496808956, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.000285539723314523, + "loss": 0.032, "step": 37190 }, { - "epoch": 0.19, - "learning_rate": 0.00027184818198788157, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028553583509815156, + "loss": 0.0383, "step": 37200 }, { - "epoch": 0.19, - "learning_rate": 0.00027184061429486755, - "loss": 0.0209, + "epoch": 0.1, + "learning_rate": 0.00028553194688178007, + "loss": 0.0316, "step": 37210 }, { - "epoch": 0.19, - "learning_rate": 0.00027183304660185353, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.0002855280586654086, + "loss": 0.035, "step": 37220 }, { - "epoch": 0.19, - "learning_rate": 0.0002718254789088395, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.0002855241704490371, + "loss": 0.0316, "step": 37230 }, { - "epoch": 0.19, - "learning_rate": 0.00027181791121582555, - "loss": 0.0243, + "epoch": 0.1, + "learning_rate": 0.00028552028223266567, + "loss": 0.027, "step": 37240 }, { - "epoch": 0.19, - "learning_rate": 0.00027181034352281153, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.0002855163940162942, + "loss": 0.0265, "step": 37250 }, { - "epoch": 0.19, - "learning_rate": 0.0002718027758297975, - "loss": 0.0268, + "epoch": 0.1, + "learning_rate": 0.00028551250579992275, + "loss": 0.0335, "step": 37260 }, { - "epoch": 0.19, - "learning_rate": 0.0002717952081367835, - "loss": 0.0252, + "epoch": 0.1, + "learning_rate": 0.00028550861758355127, + "loss": 0.0256, "step": 37270 }, { - "epoch": 0.19, - "learning_rate": 0.0002717876404437695, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002855047293671798, + "loss": 0.0276, "step": 37280 }, { - "epoch": 0.19, - "learning_rate": 0.00027178007275075546, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.00028550084115080835, + "loss": 0.0314, "step": 37290 }, { - "epoch": 0.19, - "learning_rate": 0.00027177250505774144, - "loss": 0.0274, + "epoch": 0.1, + "learning_rate": 0.00028549695293443686, + "loss": 0.0337, "step": 37300 }, { - "epoch": 0.19, - "learning_rate": 0.00027176493736472747, - "loss": 0.0264, + "epoch": 0.1, + "learning_rate": 0.0002854930647180654, + "loss": 0.0308, "step": 37310 }, { - "epoch": 0.19, - "learning_rate": 0.00027175736967171345, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028548917650169395, + "loss": 0.0299, "step": 37320 }, { - "epoch": 0.19, - "learning_rate": 0.00027174980197869944, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.0002854852882853225, + "loss": 0.0302, "step": 37330 }, { - "epoch": 0.19, - "learning_rate": 0.0002717422342856854, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.00028548140006895103, + "loss": 0.0315, "step": 37340 }, { - "epoch": 0.19, - "learning_rate": 0.0002717346665926714, - "loss": 0.0207, + "epoch": 0.1, + "learning_rate": 0.00028547751185257954, + "loss": 0.0273, "step": 37350 }, { - "epoch": 0.19, - "learning_rate": 0.0002717270988996574, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.00028547362363620806, + "loss": 0.0298, "step": 37360 }, { - "epoch": 0.19, - "learning_rate": 0.0002717195312066434, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028546973541983663, + "loss": 0.0329, "step": 37370 }, { - "epoch": 0.19, - "learning_rate": 0.0002717119635136294, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028546584720346514, + "loss": 0.0343, "step": 37380 }, { - "epoch": 0.19, - "learning_rate": 0.0002717043958206154, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.0002854619589870937, + "loss": 0.0472, "step": 37390 }, { - "epoch": 0.19, - "learning_rate": 0.00027169682812760136, - "loss": 0.0215, + "epoch": 0.1, + "learning_rate": 0.0002854580707707222, + "loss": 0.0341, "step": 37400 }, { - "epoch": 0.19, - "learning_rate": 0.00027168926043458734, - "loss": 0.0285, + "epoch": 0.1, + "learning_rate": 0.0002854541825543508, + "loss": 0.0344, "step": 37410 }, { - "epoch": 0.19, - "learning_rate": 0.0002716816927415733, - "loss": 0.0205, + "epoch": 0.1, + "learning_rate": 0.0002854502943379793, + "loss": 0.031, "step": 37420 }, { - "epoch": 0.19, - "learning_rate": 0.00027167412504855936, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.0002854464061216078, + "loss": 0.0344, "step": 37430 }, { - "epoch": 0.19, - "learning_rate": 0.00027166655735554534, - "loss": 0.0243, + "epoch": 0.1, + "learning_rate": 0.00028544251790523634, + "loss": 0.0331, "step": 37440 }, { - "epoch": 0.19, - "learning_rate": 0.0002716589896625313, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.0002854386296888649, + "loss": 0.0265, "step": 37450 }, { - "epoch": 0.19, - "learning_rate": 0.0002716514219695173, - "loss": 0.0223, + "epoch": 0.1, + "learning_rate": 0.0002854347414724934, + "loss": 0.0249, "step": 37460 }, { - "epoch": 0.19, - "learning_rate": 0.0002716438542765033, - "loss": 0.0222, + "epoch": 0.1, + "learning_rate": 0.000285430853256122, + "loss": 0.0341, "step": 37470 }, { - "epoch": 0.19, - "learning_rate": 0.00027163628658348927, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.0002854269650397505, + "loss": 0.0334, "step": 37480 }, { - "epoch": 0.19, - "learning_rate": 0.00027162871889047525, - "loss": 0.0225, + "epoch": 0.1, + "learning_rate": 0.000285423076823379, + "loss": 0.0287, "step": 37490 }, { - "epoch": 0.19, - "learning_rate": 0.0002716211511974613, - "loss": 0.0236, + "epoch": 0.1, + "learning_rate": 0.0002854191886070076, + "loss": 0.0327, "step": 37500 }, { - "epoch": 0.19, - "learning_rate": 0.00027161358350444726, - "loss": 0.0356, + "epoch": 0.1, + "learning_rate": 0.0002854153003906361, + "loss": 0.0408, "step": 37510 }, { - "epoch": 0.19, - "learning_rate": 0.00027160601581143325, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.0002854114121742646, + "loss": 0.0322, "step": 37520 }, { - "epoch": 0.19, - "learning_rate": 0.00027159844811841923, - "loss": 0.0573, + "epoch": 0.1, + "learning_rate": 0.0002854075239578932, + "loss": 0.0328, "step": 37530 }, { - "epoch": 0.19, - "learning_rate": 0.0002715908804254052, - "loss": 0.0224, + "epoch": 0.1, + "learning_rate": 0.00028540363574152175, + "loss": 0.0287, "step": 37540 }, { - "epoch": 0.19, - "learning_rate": 0.0002715833127323912, - "loss": 0.029, + "epoch": 0.1, + "learning_rate": 0.00028539974752515027, + "loss": 0.034, "step": 37550 }, { - "epoch": 0.19, - "learning_rate": 0.0002715757450393772, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.0002853958593087788, + "loss": 0.0364, "step": 37560 }, { - "epoch": 0.19, - "learning_rate": 0.0002715681773463632, - "loss": 0.0277, + "epoch": 0.1, + "learning_rate": 0.0002853919710924073, + "loss": 0.0293, "step": 37570 }, { - "epoch": 0.19, - "learning_rate": 0.0002715606096533492, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.00028538808287603587, + "loss": 0.0333, "step": 37580 }, { - "epoch": 0.19, - "learning_rate": 0.00027155304196033517, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.0002853841946596644, + "loss": 0.0338, "step": 37590 }, { - "epoch": 0.19, - "learning_rate": 0.00027154547426732115, - "loss": 0.0249, + "epoch": 0.1, + "learning_rate": 0.00028538030644329295, + "loss": 0.0333, "step": 37600 }, { - "epoch": 0.19, - "learning_rate": 0.00027153790657430713, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028537641822692146, + "loss": 0.0276, "step": 37610 }, { - "epoch": 0.19, - "learning_rate": 0.0002715303388812931, - "loss": 0.0274, + "epoch": 0.1, + "learning_rate": 0.00028537253001055003, + "loss": 0.0341, "step": 37620 }, { - "epoch": 0.19, - "learning_rate": 0.00027152277118827915, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.00028536864179417855, + "loss": 0.0269, "step": 37630 }, { - "epoch": 0.19, - "learning_rate": 0.00027151520349526513, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.00028536475357780706, + "loss": 0.0295, "step": 37640 }, { - "epoch": 0.19, - "learning_rate": 0.0002715076358022511, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.0002853608653614356, + "loss": 0.0314, "step": 37650 }, { - "epoch": 0.19, - "learning_rate": 0.0002715000681092371, - "loss": 0.0254, + "epoch": 0.1, + "learning_rate": 0.00028535697714506415, + "loss": 0.0314, "step": 37660 }, { - "epoch": 0.19, - "learning_rate": 0.0002714925004162231, - "loss": 0.0251, + "epoch": 0.1, + "learning_rate": 0.00028535308892869266, + "loss": 0.0303, "step": 37670 }, { - "epoch": 0.19, - "learning_rate": 0.00027148493272320906, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.00028534920071232123, + "loss": 0.0468, "step": 37680 }, { - "epoch": 0.19, - "learning_rate": 0.0002714773650301951, - "loss": 0.0204, + "epoch": 0.1, + "learning_rate": 0.00028534531249594974, + "loss": 0.0265, "step": 37690 }, { - "epoch": 0.19, - "learning_rate": 0.0002714697973371811, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.0002853414242795783, + "loss": 0.0257, "step": 37700 }, { - "epoch": 0.19, - "learning_rate": 0.00027146222964416706, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.0002853375360632068, + "loss": 0.0313, "step": 37710 }, { - "epoch": 0.19, - "learning_rate": 0.00027145466195115304, - "loss": 0.0314, + "epoch": 0.1, + "learning_rate": 0.00028533364784683534, + "loss": 0.0317, "step": 37720 }, { - "epoch": 0.19, - "learning_rate": 0.000271447094258139, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.0002853297596304639, + "loss": 0.0322, "step": 37730 }, { - "epoch": 0.19, - "learning_rate": 0.000271439526565125, - "loss": 0.0268, + "epoch": 0.1, + "learning_rate": 0.0002853258714140924, + "loss": 0.0383, "step": 37740 }, { - "epoch": 0.19, - "learning_rate": 0.00027143195887211104, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.000285321983197721, + "loss": 0.0301, "step": 37750 }, { - "epoch": 0.19, - "learning_rate": 0.000271424391179097, - "loss": 0.0201, + "epoch": 0.1, + "learning_rate": 0.0002853180949813495, + "loss": 0.0298, "step": 37760 }, { - "epoch": 0.19, - "learning_rate": 0.000271416823486083, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.000285314206764978, + "loss": 0.032, "step": 37770 }, { - "epoch": 0.19, - "learning_rate": 0.000271409255793069, - "loss": 0.0236, + "epoch": 0.1, + "learning_rate": 0.00028531031854860654, + "loss": 0.0334, "step": 37780 }, { - "epoch": 0.19, - "learning_rate": 0.00027140168810005496, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.0002853064303322351, + "loss": 0.0304, "step": 37790 }, { - "epoch": 0.19, - "learning_rate": 0.00027139412040704094, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.0002853025421158636, + "loss": 0.0345, "step": 37800 }, { - "epoch": 0.19, - "learning_rate": 0.0002713865527140269, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.0002852986538994922, + "loss": 0.0326, "step": 37810 }, { - "epoch": 0.19, - "learning_rate": 0.00027137898502101296, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.0002852947656831207, + "loss": 0.0311, "step": 37820 }, { - "epoch": 0.19, - "learning_rate": 0.00027137141732799894, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.00028529087746674927, + "loss": 0.0332, "step": 37830 }, { - "epoch": 0.19, - "learning_rate": 0.0002713638496349849, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.0002852869892503778, + "loss": 0.0292, "step": 37840 }, { - "epoch": 0.19, - "learning_rate": 0.0002713562819419709, - "loss": 0.0286, + "epoch": 0.1, + "learning_rate": 0.0002852831010340063, + "loss": 0.0429, "step": 37850 }, { - "epoch": 0.19, - "learning_rate": 0.0002713487142489569, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.0002852792128176348, + "loss": 0.033, "step": 37860 }, { - "epoch": 0.19, - "learning_rate": 0.00027134114655594287, - "loss": 0.0217, + "epoch": 0.1, + "learning_rate": 0.0002852753246012634, + "loss": 0.0322, "step": 37870 }, { - "epoch": 0.19, - "learning_rate": 0.0002713335788629289, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.00028527143638489195, + "loss": 0.0347, "step": 37880 }, { - "epoch": 0.19, - "learning_rate": 0.0002713260111699149, - "loss": 0.0218, + "epoch": 0.1, + "learning_rate": 0.00028526754816852047, + "loss": 0.0276, "step": 37890 }, { - "epoch": 0.19, - "learning_rate": 0.00027131844347690087, - "loss": 0.0275, + "epoch": 0.1, + "learning_rate": 0.000285263659952149, + "loss": 0.0364, "step": 37900 }, { - "epoch": 0.19, - "learning_rate": 0.00027131087578388685, - "loss": 0.0215, + "epoch": 0.1, + "learning_rate": 0.00028525977173577755, + "loss": 0.0331, "step": 37910 }, { - "epoch": 0.19, - "learning_rate": 0.00027130330809087283, - "loss": 0.0254, + "epoch": 0.1, + "learning_rate": 0.00028525588351940607, + "loss": 0.0336, "step": 37920 }, { - "epoch": 0.19, - "learning_rate": 0.0002712957403978588, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.0002852519953030346, + "loss": 0.0293, "step": 37930 }, { - "epoch": 0.19, - "learning_rate": 0.00027128817270484485, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.00028524810708666315, + "loss": 0.028, "step": 37940 }, { - "epoch": 0.19, - "learning_rate": 0.00027128060501183083, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.00028524421887029166, + "loss": 0.035, "step": 37950 }, { - "epoch": 0.19, - "learning_rate": 0.0002712730373188168, - "loss": 0.0263, + "epoch": 0.1, + "learning_rate": 0.00028524033065392023, + "loss": 0.0305, "step": 37960 }, { - "epoch": 0.19, - "learning_rate": 0.0002712654696258028, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.00028523644243754875, + "loss": 0.0321, "step": 37970 }, { - "epoch": 0.19, - "learning_rate": 0.00027125790193278877, - "loss": 0.028, + "epoch": 0.1, + "learning_rate": 0.00028523255422117726, + "loss": 0.0342, "step": 37980 }, { - "epoch": 0.19, - "learning_rate": 0.00027125033423977475, - "loss": 0.0321, + "epoch": 0.1, + "learning_rate": 0.0002852286660048058, + "loss": 0.0324, "step": 37990 }, { - "epoch": 0.19, - "learning_rate": 0.00027124276654676073, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.00028522477778843434, + "loss": 0.0355, "step": 38000 }, { - "epoch": 0.19, - "eval_cer": 0.9144780190721654, - "eval_loss": 0.018160896375775337, - "eval_runtime": 117.0624, - "eval_samples_per_second": 17.085, - "eval_steps_per_second": 4.271, + "epoch": 0.1, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.021771151572465897, + "eval_runtime": 107.8634, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, "step": 38000 }, { - "epoch": 0.19, - "learning_rate": 0.00027123519885374677, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.00028522088957206286, + "loss": 0.0256, "step": 38010 }, { - "epoch": 0.19, - "learning_rate": 0.00027122763116073275, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.00028521700135569143, + "loss": 0.0292, "step": 38020 }, { - "epoch": 0.19, - "learning_rate": 0.00027122006346771873, - "loss": 0.0204, + "epoch": 0.1, + "learning_rate": 0.00028521311313931994, + "loss": 0.0239, "step": 38030 }, { - "epoch": 0.19, - "learning_rate": 0.0002712124957747047, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.0002852092249229485, + "loss": 0.0332, "step": 38040 }, { - "epoch": 0.19, - "learning_rate": 0.0002712049280816907, - "loss": 0.0324, + "epoch": 0.1, + "learning_rate": 0.000285205336706577, + "loss": 0.0325, "step": 38050 }, { - "epoch": 0.19, - "learning_rate": 0.0002711973603886767, - "loss": 0.0269, + "epoch": 0.1, + "learning_rate": 0.00028520144849020554, + "loss": 0.0322, "step": 38060 }, { - "epoch": 0.19, - "learning_rate": 0.0002711897926956627, - "loss": 0.0237, + "epoch": 0.1, + "learning_rate": 0.00028519756027383405, + "loss": 0.0298, "step": 38070 }, { - "epoch": 0.19, - "learning_rate": 0.0002711822250026487, - "loss": 0.0293, + "epoch": 0.1, + "learning_rate": 0.0002851936720574626, + "loss": 0.031, "step": 38080 }, { - "epoch": 0.19, - "learning_rate": 0.0002711746573096347, - "loss": 0.0288, + "epoch": 0.1, + "learning_rate": 0.0002851897838410912, + "loss": 0.0345, "step": 38090 }, { - "epoch": 0.19, - "learning_rate": 0.00027116708961662066, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.0002851858956247197, + "loss": 0.0301, "step": 38100 }, { - "epoch": 0.19, - "learning_rate": 0.00027115952192360664, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.0002851820074083482, + "loss": 0.0325, "step": 38110 }, { - "epoch": 0.19, - "learning_rate": 0.0002711519542305926, - "loss": 0.0203, + "epoch": 0.1, + "learning_rate": 0.0002851781191919768, + "loss": 0.0318, "step": 38120 }, { - "epoch": 0.19, - "learning_rate": 0.0002711443865375786, - "loss": 0.0267, + "epoch": 0.1, + "learning_rate": 0.0002851742309756053, + "loss": 0.0281, "step": 38130 }, { - "epoch": 0.19, - "learning_rate": 0.00027113681884456464, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.0002851703427592338, + "loss": 0.0284, "step": 38140 }, { - "epoch": 0.19, - "learning_rate": 0.0002711292511515506, - "loss": 0.0211, + "epoch": 0.1, + "learning_rate": 0.0002851664545428624, + "loss": 0.0275, "step": 38150 }, { - "epoch": 0.19, - "learning_rate": 0.0002711216834585366, - "loss": 0.0251, + "epoch": 0.1, + "learning_rate": 0.0002851625663264909, + "loss": 0.0334, "step": 38160 }, { - "epoch": 0.19, - "learning_rate": 0.0002711141157655226, - "loss": 0.0225, + "epoch": 0.1, + "learning_rate": 0.00028515867811011947, + "loss": 0.0368, "step": 38170 }, { - "epoch": 0.19, - "learning_rate": 0.00027110654807250856, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.000285154789893748, + "loss": 0.0311, "step": 38180 }, { - "epoch": 0.19, - "learning_rate": 0.00027109898037949454, - "loss": 0.0287, + "epoch": 0.1, + "learning_rate": 0.0002851509016773765, + "loss": 0.0318, "step": 38190 }, { - "epoch": 0.19, - "learning_rate": 0.0002710914126864806, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.00028514701346100507, + "loss": 0.0351, "step": 38200 }, { - "epoch": 0.19, - "learning_rate": 0.00027108384499346656, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.0002851431252446336, + "loss": 0.0384, "step": 38210 }, { - "epoch": 0.19, - "learning_rate": 0.00027107627730045254, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.0002851392370282621, + "loss": 0.0378, "step": 38220 }, { - "epoch": 0.19, - "learning_rate": 0.0002710687096074385, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.00028513534881189067, + "loss": 0.0335, "step": 38230 }, { - "epoch": 0.19, - "learning_rate": 0.0002710611419144245, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.0002851314605955192, + "loss": 0.0279, "step": 38240 }, { - "epoch": 0.19, - "learning_rate": 0.0002710535742214105, - "loss": 0.0211, + "epoch": 0.1, + "learning_rate": 0.00028512757237914775, + "loss": 0.0381, "step": 38250 }, { - "epoch": 0.19, - "learning_rate": 0.0002710460065283965, - "loss": 0.0203, + "epoch": 0.1, + "learning_rate": 0.00028512368416277626, + "loss": 0.0287, "step": 38260 }, { - "epoch": 0.19, - "learning_rate": 0.0002710384388353825, - "loss": 0.0245, + "epoch": 0.1, + "learning_rate": 0.0002851197959464048, + "loss": 0.0275, "step": 38270 }, { - "epoch": 0.19, - "learning_rate": 0.0002710308711423685, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.00028511590773003335, + "loss": 0.0266, "step": 38280 }, { - "epoch": 0.19, - "learning_rate": 0.00027102330344935447, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.00028511201951366186, + "loss": 0.0359, "step": 38290 }, { - "epoch": 0.19, - "learning_rate": 0.00027101573575634045, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028510813129729043, + "loss": 0.0344, "step": 38300 }, { - "epoch": 0.19, - "learning_rate": 0.00027100816806332643, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028510424308091895, + "loss": 0.0307, "step": 38310 }, { - "epoch": 0.19, - "learning_rate": 0.0002710006003703124, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028510035486454746, + "loss": 0.0303, "step": 38320 }, { - "epoch": 0.19, - "learning_rate": 0.00027099303267729845, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.00028509646664817603, + "loss": 0.0276, "step": 38330 }, { - "epoch": 0.19, - "learning_rate": 0.0002709854649842844, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.00028509257843180454, + "loss": 0.0309, "step": 38340 }, { - "epoch": 0.19, - "learning_rate": 0.00027097789729127036, - "loss": 0.0277, + "epoch": 0.1, + "learning_rate": 0.00028508869021543306, + "loss": 0.0281, "step": 38350 }, { - "epoch": 0.19, - "learning_rate": 0.00027097032959825634, - "loss": 0.0221, + "epoch": 0.1, + "learning_rate": 0.0002850848019990616, + "loss": 0.0303, "step": 38360 }, { - "epoch": 0.19, - "learning_rate": 0.0002709627619052424, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.00028508091378269014, + "loss": 0.0337, "step": 38370 }, { - "epoch": 0.19, - "learning_rate": 0.00027095519421222835, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.0002850770255663187, + "loss": 0.0322, "step": 38380 }, { - "epoch": 0.19, - "learning_rate": 0.00027094762651921434, - "loss": 0.0213, + "epoch": 0.1, + "learning_rate": 0.0002850731373499472, + "loss": 0.0342, "step": 38390 }, { - "epoch": 0.19, - "learning_rate": 0.0002709400588262003, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.00028506924913357574, + "loss": 0.0296, "step": 38400 }, { - "epoch": 0.19, - "learning_rate": 0.0002709324911331863, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.0002850653609172043, + "loss": 0.0332, "step": 38410 }, { - "epoch": 0.19, - "learning_rate": 0.0002709249234401723, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.0002850614727008328, + "loss": 0.0285, "step": 38420 }, { - "epoch": 0.19, - "learning_rate": 0.0002709173557471583, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002850575844844614, + "loss": 0.0282, "step": 38430 }, { - "epoch": 0.19, - "learning_rate": 0.0002709097880541443, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.0002850536962680899, + "loss": 0.0321, "step": 38440 }, { - "epoch": 0.19, - "learning_rate": 0.0002709022203611303, - "loss": 0.0203, + "epoch": 0.1, + "learning_rate": 0.0002850498080517185, + "loss": 0.0287, "step": 38450 }, { - "epoch": 0.19, - "learning_rate": 0.00027089465266811626, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.000285045919835347, + "loss": 0.033, "step": 38460 }, { - "epoch": 0.19, - "learning_rate": 0.00027088708497510224, - "loss": 0.0275, + "epoch": 0.1, + "learning_rate": 0.0002850420316189755, + "loss": 0.0252, "step": 38470 }, { - "epoch": 0.19, - "learning_rate": 0.0002708795172820882, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.000285038143402604, + "loss": 0.0287, "step": 38480 }, { - "epoch": 0.19, - "learning_rate": 0.00027087194958907426, - "loss": 0.0208, + "epoch": 0.1, + "learning_rate": 0.0002850342551862326, + "loss": 0.0332, "step": 38490 }, { - "epoch": 0.19, - "learning_rate": 0.00027086438189606024, - "loss": 0.027, + "epoch": 0.1, + "learning_rate": 0.0002850303669698611, + "loss": 0.0268, "step": 38500 }, { - "epoch": 0.19, - "learning_rate": 0.0002708568142030462, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.00028502647875348967, + "loss": 0.0328, "step": 38510 }, { - "epoch": 0.19, - "learning_rate": 0.0002708492465100322, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.0002850225905371182, + "loss": 0.0238, "step": 38520 }, { - "epoch": 0.19, - "learning_rate": 0.0002708416788170182, - "loss": 0.0218, + "epoch": 0.1, + "learning_rate": 0.0002850187023207467, + "loss": 0.0267, "step": 38530 }, { - "epoch": 0.19, - "learning_rate": 0.00027083411112400417, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028501481410437527, + "loss": 0.0326, "step": 38540 }, { - "epoch": 0.19, - "learning_rate": 0.00027082654343099015, - "loss": 0.0222, + "epoch": 0.1, + "learning_rate": 0.0002850109258880038, + "loss": 0.0312, "step": 38550 }, { - "epoch": 0.19, - "learning_rate": 0.0002708189757379762, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.0002850070376716323, + "loss": 0.0255, "step": 38560 }, { - "epoch": 0.19, - "learning_rate": 0.00027081140804496216, - "loss": 0.026, + "epoch": 0.1, + "learning_rate": 0.00028500314945526087, + "loss": 0.0318, "step": 38570 }, { - "epoch": 0.19, - "learning_rate": 0.00027080384035194815, - "loss": 0.0221, + "epoch": 0.1, + "learning_rate": 0.00028499926123888943, + "loss": 0.0277, "step": 38580 }, { - "epoch": 0.19, - "learning_rate": 0.00027079627265893413, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.00028499537302251795, + "loss": 0.03, "step": 38590 }, { - "epoch": 0.19, - "learning_rate": 0.0002707887049659201, - "loss": 0.0223, + "epoch": 0.1, + "learning_rate": 0.00028499148480614646, + "loss": 0.0332, "step": 38600 }, { - "epoch": 0.19, - "learning_rate": 0.0002707811372729061, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.000284987596589775, + "loss": 0.0313, "step": 38610 }, { - "epoch": 0.19, - "learning_rate": 0.0002707735695798921, - "loss": 0.0237, + "epoch": 0.1, + "learning_rate": 0.00028498370837340355, + "loss": 0.03, "step": 38620 }, { - "epoch": 0.19, - "learning_rate": 0.0002707660018868781, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.00028497982015703206, + "loss": 0.0259, "step": 38630 }, { - "epoch": 0.19, - "learning_rate": 0.0002707584341938641, - "loss": 0.0358, + "epoch": 0.1, + "learning_rate": 0.00028497593194066063, + "loss": 0.0337, "step": 38640 }, { - "epoch": 0.19, - "learning_rate": 0.00027075086650085007, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028497204372428914, + "loss": 0.0317, "step": 38650 }, { - "epoch": 0.2, - "learning_rate": 0.00027074329880783605, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.0002849681555079177, + "loss": 0.0346, "step": 38660 }, { - "epoch": 0.2, - "learning_rate": 0.00027073573111482203, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028496426729154623, + "loss": 0.0352, "step": 38670 }, { - "epoch": 0.2, - "learning_rate": 0.00027072816342180807, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.00028496037907517474, + "loss": 0.0281, "step": 38680 }, { - "epoch": 0.2, - "learning_rate": 0.00027072059572879405, - "loss": 0.0218, + "epoch": 0.1, + "learning_rate": 0.00028495649085880326, + "loss": 0.0263, "step": 38690 }, { - "epoch": 0.2, - "learning_rate": 0.00027071302803578003, - "loss": 0.0213, + "epoch": 0.1, + "learning_rate": 0.0002849526026424318, + "loss": 0.0351, "step": 38700 }, { - "epoch": 0.2, - "learning_rate": 0.000270705460342766, - "loss": 0.0222, + "epoch": 0.1, + "learning_rate": 0.00028494871442606034, + "loss": 0.0329, "step": 38710 }, { - "epoch": 0.2, - "learning_rate": 0.000270697892649752, - "loss": 0.0201, + "epoch": 0.1, + "learning_rate": 0.0002849448262096889, + "loss": 0.0275, "step": 38720 }, { - "epoch": 0.2, - "learning_rate": 0.000270690324956738, - "loss": 0.0257, + "epoch": 0.1, + "learning_rate": 0.0002849409379933174, + "loss": 0.034, "step": 38730 }, { - "epoch": 0.2, - "learning_rate": 0.00027068275726372396, - "loss": 0.0273, + "epoch": 0.1, + "learning_rate": 0.00028493704977694594, + "loss": 0.0297, "step": 38740 }, { - "epoch": 0.2, - "learning_rate": 0.00027067518957071, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.0002849331615605745, + "loss": 0.0285, "step": 38750 }, { - "epoch": 0.2, - "learning_rate": 0.000270667621877696, - "loss": 0.0204, + "epoch": 0.1, + "learning_rate": 0.000284929273344203, + "loss": 0.0289, "step": 38760 }, { - "epoch": 0.2, - "learning_rate": 0.00027066005418468196, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.00028492538512783154, + "loss": 0.0331, "step": 38770 }, { - "epoch": 0.2, - "learning_rate": 0.00027065248649166794, - "loss": 0.0281, + "epoch": 0.1, + "learning_rate": 0.0002849214969114601, + "loss": 0.0282, "step": 38780 }, { - "epoch": 0.2, - "learning_rate": 0.0002706449187986539, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.0002849176086950887, + "loss": 0.0304, "step": 38790 }, { - "epoch": 0.2, - "learning_rate": 0.0002706373511056399, - "loss": 0.0248, + "epoch": 0.1, + "learning_rate": 0.0002849137204787172, + "loss": 0.0279, "step": 38800 }, { - "epoch": 0.2, - "learning_rate": 0.00027062978341262594, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.0002849098322623457, + "loss": 0.0342, "step": 38810 }, { - "epoch": 0.2, - "learning_rate": 0.0002706222157196119, - "loss": 0.022, + "epoch": 0.1, + "learning_rate": 0.0002849059440459742, + "loss": 0.0346, "step": 38820 }, { - "epoch": 0.2, - "learning_rate": 0.0002706146480265979, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.0002849020558296028, + "loss": 0.0327, "step": 38830 }, { - "epoch": 0.2, - "learning_rate": 0.0002706070803335839, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.0002848981676132313, + "loss": 0.0335, "step": 38840 }, { - "epoch": 0.2, - "learning_rate": 0.00027059951264056986, - "loss": 0.0249, + "epoch": 0.1, + "learning_rate": 0.00028489427939685987, + "loss": 0.0272, "step": 38850 }, { - "epoch": 0.2, - "learning_rate": 0.00027059194494755584, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.0002848903911804884, + "loss": 0.027, "step": 38860 }, { - "epoch": 0.2, - "learning_rate": 0.0002705843772545418, - "loss": 0.0215, + "epoch": 0.1, + "learning_rate": 0.00028488650296411695, + "loss": 0.0305, "step": 38870 }, { - "epoch": 0.2, - "learning_rate": 0.00027057680956152786, - "loss": 0.0224, + "epoch": 0.1, + "learning_rate": 0.00028488261474774547, + "loss": 0.0309, "step": 38880 }, { - "epoch": 0.2, - "learning_rate": 0.00027056924186851384, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.000284878726531374, + "loss": 0.0306, "step": 38890 }, { - "epoch": 0.2, - "learning_rate": 0.0002705616741754998, - "loss": 0.0223, + "epoch": 0.1, + "learning_rate": 0.0002848748383150025, + "loss": 0.0338, "step": 38900 }, { - "epoch": 0.2, - "learning_rate": 0.0002705541064824858, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.00028487095009863106, + "loss": 0.0293, "step": 38910 }, { - "epoch": 0.2, - "learning_rate": 0.0002705465387894718, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.0002848670618822596, + "loss": 0.0275, "step": 38920 }, { - "epoch": 0.2, - "learning_rate": 0.00027053897109645777, - "loss": 0.0203, + "epoch": 0.1, + "learning_rate": 0.00028486317366588815, + "loss": 0.0313, "step": 38930 }, { - "epoch": 0.2, - "learning_rate": 0.0002705314034034438, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028485928544951666, + "loss": 0.0314, "step": 38940 }, { - "epoch": 0.2, - "learning_rate": 0.0002705238357104298, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.00028485539723314523, + "loss": 0.0304, "step": 38950 }, { - "epoch": 0.2, - "learning_rate": 0.00027051626801741577, - "loss": 0.0212, + "epoch": 0.1, + "learning_rate": 0.00028485150901677375, + "loss": 0.0325, "step": 38960 }, { - "epoch": 0.2, - "learning_rate": 0.00027050870032440175, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.00028484762080040226, + "loss": 0.0333, "step": 38970 }, { - "epoch": 0.2, - "learning_rate": 0.00027050113263138773, - "loss": 0.0266, + "epoch": 0.1, + "learning_rate": 0.00028484373258403083, + "loss": 0.0292, "step": 38980 }, { - "epoch": 0.2, - "learning_rate": 0.0002704935649383737, - "loss": 0.0206, + "epoch": 0.1, + "learning_rate": 0.00028483984436765934, + "loss": 0.0328, "step": 38990 }, { - "epoch": 0.2, - "learning_rate": 0.00027048599724535975, - "loss": 0.0195, + "epoch": 0.1, + "learning_rate": 0.0002848359561512879, + "loss": 0.0246, "step": 39000 }, { - "epoch": 0.2, - "eval_cer": 0.9144702559031622, - "eval_loss": 0.017209572717547417, - "eval_runtime": 117.1365, - "eval_samples_per_second": 17.074, - "eval_steps_per_second": 4.269, + "epoch": 0.1, + "eval_cer": 0.8818440496535199, + "eval_loss": 0.02235816977918148, + "eval_runtime": 107.7775, + "eval_samples_per_second": 18.557, + "eval_steps_per_second": 4.639, "step": 39000 }, { - "epoch": 0.2, - "learning_rate": 0.00027047842955234573, - "loss": 0.0312, + "epoch": 0.1, + "learning_rate": 0.0002848320679349164, + "loss": 0.0275, "step": 39010 }, { - "epoch": 0.2, - "learning_rate": 0.0002704708618593317, - "loss": 0.0205, + "epoch": 0.1, + "learning_rate": 0.00028482817971854494, + "loss": 0.0276, "step": 39020 }, { - "epoch": 0.2, - "learning_rate": 0.0002704632941663177, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028482429150217346, + "loss": 0.036, "step": 39030 }, { - "epoch": 0.2, - "learning_rate": 0.00027045572647330367, - "loss": 0.0261, + "epoch": 0.1, + "learning_rate": 0.000284820403285802, + "loss": 0.0324, "step": 39040 }, { - "epoch": 0.2, - "learning_rate": 0.00027044815878028965, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.00028481651506943054, + "loss": 0.0348, "step": 39050 }, { - "epoch": 0.2, - "learning_rate": 0.00027044059108727563, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.0002848126268530591, + "loss": 0.0296, "step": 39060 }, { - "epoch": 0.2, - "learning_rate": 0.00027043302339426167, - "loss": 0.02, + "epoch": 0.1, + "learning_rate": 0.0002848087386366876, + "loss": 0.0348, "step": 39070 }, { - "epoch": 0.2, - "learning_rate": 0.00027042545570124765, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.0002848048504203162, + "loss": 0.0315, "step": 39080 }, { - "epoch": 0.2, - "learning_rate": 0.00027041788800823363, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002848009622039447, + "loss": 0.0303, "step": 39090 }, { - "epoch": 0.2, - "learning_rate": 0.0002704103203152196, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.0002847970739875732, + "loss": 0.0276, "step": 39100 }, { - "epoch": 0.2, - "learning_rate": 0.0002704027526222056, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.00028479318577120173, + "loss": 0.0277, "step": 39110 }, { - "epoch": 0.2, - "learning_rate": 0.0002703951849291916, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.0002847892975548303, + "loss": 0.0327, "step": 39120 }, { - "epoch": 0.2, - "learning_rate": 0.0002703876172361776, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.00028478540933845887, + "loss": 0.0329, "step": 39130 }, { - "epoch": 0.2, - "learning_rate": 0.0002703800495431636, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.0002847815211220874, + "loss": 0.0293, "step": 39140 }, { - "epoch": 0.2, - "learning_rate": 0.0002703724818501496, - "loss": 0.0223, + "epoch": 0.1, + "learning_rate": 0.0002847776329057159, + "loss": 0.0371, "step": 39150 }, { - "epoch": 0.2, - "learning_rate": 0.00027036491415713556, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.00028477374468934447, + "loss": 0.0287, "step": 39160 }, { - "epoch": 0.2, - "learning_rate": 0.00027035734646412154, - "loss": 0.0252, + "epoch": 0.1, + "learning_rate": 0.000284769856472973, + "loss": 0.0404, "step": 39170 }, { - "epoch": 0.2, - "learning_rate": 0.0002703497787711075, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.0002847659682566015, + "loss": 0.0294, "step": 39180 }, { - "epoch": 0.2, - "learning_rate": 0.00027034221107809356, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.00028476208004023007, + "loss": 0.0288, "step": 39190 }, { - "epoch": 0.2, - "learning_rate": 0.00027033464338507954, - "loss": 0.0259, + "epoch": 0.1, + "learning_rate": 0.0002847581918238586, + "loss": 0.0261, "step": 39200 }, { - "epoch": 0.2, - "learning_rate": 0.0002703270756920655, - "loss": 0.0266, + "epoch": 0.1, + "learning_rate": 0.00028475430360748715, + "loss": 0.0405, "step": 39210 }, { - "epoch": 0.2, - "learning_rate": 0.0002703195079990515, - "loss": 0.0246, + "epoch": 0.1, + "learning_rate": 0.00028475041539111567, + "loss": 0.0286, "step": 39220 }, { - "epoch": 0.2, - "learning_rate": 0.0002703119403060375, - "loss": 0.0243, + "epoch": 0.1, + "learning_rate": 0.0002847465271747442, + "loss": 0.03, "step": 39230 }, { - "epoch": 0.2, - "learning_rate": 0.00027030437261302346, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.0002847426389583727, + "loss": 0.0284, "step": 39240 }, { - "epoch": 0.2, - "learning_rate": 0.00027029680492000944, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028473875074200126, + "loss": 0.0267, "step": 39250 }, { - "epoch": 0.2, - "learning_rate": 0.0002702892372269955, - "loss": 0.0294, + "epoch": 0.1, + "learning_rate": 0.0002847348625256298, + "loss": 0.0326, "step": 39260 }, { - "epoch": 0.2, - "learning_rate": 0.00027028166953398146, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.00028473097430925835, + "loss": 0.0301, "step": 39270 }, { - "epoch": 0.2, - "learning_rate": 0.00027027410184096744, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.00028472708609288686, + "loss": 0.0312, "step": 39280 }, { - "epoch": 0.2, - "learning_rate": 0.0002702665341479534, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.00028472319787651543, + "loss": 0.0335, "step": 39290 }, { - "epoch": 0.2, - "learning_rate": 0.0002702589664549394, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028471930966014394, + "loss": 0.0272, "step": 39300 }, { - "epoch": 0.2, - "learning_rate": 0.0002702513987619254, - "loss": 0.0287, + "epoch": 0.1, + "learning_rate": 0.00028471542144377246, + "loss": 0.0278, "step": 39310 }, { - "epoch": 0.2, - "learning_rate": 0.0002702438310689114, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.00028471153322740103, + "loss": 0.0315, "step": 39320 }, { - "epoch": 0.2, - "learning_rate": 0.0002702362633758974, - "loss": 0.0206, + "epoch": 0.1, + "learning_rate": 0.00028470764501102954, + "loss": 0.0341, "step": 39330 }, { - "epoch": 0.2, - "learning_rate": 0.0002702286956828834, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.0002847037567946581, + "loss": 0.0305, "step": 39340 }, { - "epoch": 0.2, - "learning_rate": 0.00027022112798986937, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.0002846998685782866, + "loss": 0.0275, "step": 39350 }, { - "epoch": 0.2, - "learning_rate": 0.00027021356029685535, - "loss": 0.0273, + "epoch": 0.1, + "learning_rate": 0.00028469598036191514, + "loss": 0.03, "step": 39360 }, { - "epoch": 0.2, - "learning_rate": 0.00027020599260384133, - "loss": 0.0271, + "epoch": 0.1, + "learning_rate": 0.0002846920921455437, + "loss": 0.0229, "step": 39370 }, { - "epoch": 0.2, - "learning_rate": 0.0002701984249108273, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.0002846882039291722, + "loss": 0.0297, "step": 39380 }, { - "epoch": 0.2, - "learning_rate": 0.00027019085721781335, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.00028468431571280074, + "loss": 0.0358, "step": 39390 }, { - "epoch": 0.2, - "learning_rate": 0.00027018328952479933, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002846804274964293, + "loss": 0.031, "step": 39400 }, { - "epoch": 0.2, - "learning_rate": 0.0002701757218317853, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.0002846765392800578, + "loss": 0.0367, "step": 39410 }, { - "epoch": 0.2, - "learning_rate": 0.0002701681541387713, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.0002846726510636864, + "loss": 0.0347, "step": 39420 }, { - "epoch": 0.2, - "learning_rate": 0.0002701605864457573, - "loss": 0.0249, + "epoch": 0.1, + "learning_rate": 0.0002846687628473149, + "loss": 0.0286, "step": 39430 }, { - "epoch": 0.2, - "learning_rate": 0.00027015301875274325, - "loss": 0.0284, + "epoch": 0.1, + "learning_rate": 0.0002846648746309434, + "loss": 0.0445, "step": 39440 }, { - "epoch": 0.2, - "learning_rate": 0.0002701454510597293, - "loss": 0.0252, + "epoch": 0.1, + "learning_rate": 0.00028466098641457193, + "loss": 0.0323, "step": 39450 }, { - "epoch": 0.2, - "learning_rate": 0.00027013788336671527, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.0002846570981982005, + "loss": 0.0269, "step": 39460 }, { - "epoch": 0.2, - "learning_rate": 0.00027013031567370125, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028465320998182907, + "loss": 0.0386, "step": 39470 }, { - "epoch": 0.2, - "learning_rate": 0.00027012274798068723, - "loss": 0.025, + "epoch": 0.1, + "learning_rate": 0.0002846493217654576, + "loss": 0.033, "step": 39480 }, { - "epoch": 0.2, - "learning_rate": 0.0002701151802876732, - "loss": 0.0308, + "epoch": 0.1, + "learning_rate": 0.0002846454335490861, + "loss": 0.0264, "step": 39490 }, { - "epoch": 0.2, - "learning_rate": 0.0002701076125946592, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.00028464154533271467, + "loss": 0.0302, "step": 39500 }, { - "epoch": 0.2, - "learning_rate": 0.00027010004490164523, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.0002846376571163432, + "loss": 0.0324, "step": 39510 }, { - "epoch": 0.2, - "learning_rate": 0.0002700924772086312, - "loss": 0.0216, + "epoch": 0.1, + "learning_rate": 0.0002846337688999717, + "loss": 0.0285, "step": 39520 }, { - "epoch": 0.2, - "learning_rate": 0.0002700849095156172, - "loss": 0.0224, + "epoch": 0.1, + "learning_rate": 0.00028462988068360027, + "loss": 0.0301, "step": 39530 }, { - "epoch": 0.2, - "learning_rate": 0.0002700773418226032, - "loss": 0.0296, + "epoch": 0.1, + "learning_rate": 0.0002846259924672288, + "loss": 0.029, "step": 39540 }, { - "epoch": 0.2, - "learning_rate": 0.00027006977412958916, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028462210425085735, + "loss": 0.0306, "step": 39550 }, { - "epoch": 0.2, - "learning_rate": 0.00027006220643657514, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.00028461821603448586, + "loss": 0.0271, "step": 39560 }, { - "epoch": 0.2, - "learning_rate": 0.0002700546387435611, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.0002846143278181144, + "loss": 0.0278, "step": 39570 }, { - "epoch": 0.2, - "learning_rate": 0.00027004707105054716, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.00028461043960174295, + "loss": 0.0255, "step": 39580 }, { - "epoch": 0.2, - "learning_rate": 0.00027003950335753314, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.00028460655138537146, + "loss": 0.0313, "step": 39590 }, { - "epoch": 0.2, - "learning_rate": 0.00027003193566451907, - "loss": 0.0265, + "epoch": 0.1, + "learning_rate": 0.000284602663169, + "loss": 0.0303, "step": 39600 }, { - "epoch": 0.2, - "learning_rate": 0.00027002436797150505, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.00028459877495262855, + "loss": 0.0315, "step": 39610 }, { - "epoch": 0.2, - "learning_rate": 0.0002700168002784911, - "loss": 0.0259, + "epoch": 0.1, + "learning_rate": 0.0002845948867362571, + "loss": 0.0272, "step": 39620 }, { - "epoch": 0.2, - "learning_rate": 0.00027000923258547706, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028459099851988563, + "loss": 0.0344, "step": 39630 }, { - "epoch": 0.2, - "learning_rate": 0.00027000166489246305, - "loss": 0.0199, + "epoch": 0.1, + "learning_rate": 0.00028458711030351414, + "loss": 0.0323, "step": 39640 }, { - "epoch": 0.2, - "learning_rate": 0.00026999409719944903, - "loss": 0.0248, + "epoch": 0.1, + "learning_rate": 0.00028458322208714266, + "loss": 0.0306, "step": 39650 }, { - "epoch": 0.2, - "learning_rate": 0.000269986529506435, - "loss": 0.0259, + "epoch": 0.1, + "learning_rate": 0.0002845793338707712, + "loss": 0.0327, "step": 39660 }, { - "epoch": 0.2, - "learning_rate": 0.000269978961813421, - "loss": 0.0222, + "epoch": 0.1, + "learning_rate": 0.00028457544565439974, + "loss": 0.0354, "step": 39670 }, { - "epoch": 0.2, - "learning_rate": 0.000269971394120407, - "loss": 0.0292, + "epoch": 0.1, + "learning_rate": 0.0002845715574380283, + "loss": 0.034, "step": 39680 }, { - "epoch": 0.2, - "learning_rate": 0.000269963826427393, - "loss": 0.0235, + "epoch": 0.1, + "learning_rate": 0.0002845676692216568, + "loss": 0.0307, "step": 39690 }, { - "epoch": 0.2, - "learning_rate": 0.000269956258734379, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.00028456378100528534, + "loss": 0.027, "step": 39700 }, { - "epoch": 0.2, - "learning_rate": 0.00026994869104136497, - "loss": 0.0204, + "epoch": 0.1, + "learning_rate": 0.0002845598927889139, + "loss": 0.0289, "step": 39710 }, { - "epoch": 0.2, - "learning_rate": 0.00026994112334835095, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.0002845560045725424, + "loss": 0.0325, "step": 39720 }, { - "epoch": 0.2, - "learning_rate": 0.00026993355565533693, - "loss": 0.0252, + "epoch": 0.1, + "learning_rate": 0.00028455211635617094, + "loss": 0.0302, "step": 39730 }, { - "epoch": 0.2, - "learning_rate": 0.00026992598796232297, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.0002845482281397995, + "loss": 0.0358, "step": 39740 }, { - "epoch": 0.2, - "learning_rate": 0.00026991842026930895, - "loss": 0.0288, + "epoch": 0.1, + "learning_rate": 0.000284544339923428, + "loss": 0.0296, "step": 39750 }, { - "epoch": 0.2, - "learning_rate": 0.00026991085257629493, - "loss": 0.0283, + "epoch": 0.1, + "learning_rate": 0.0002845404517070566, + "loss": 0.0301, "step": 39760 }, { - "epoch": 0.2, - "learning_rate": 0.0002699032848832809, - "loss": 0.0258, + "epoch": 0.1, + "learning_rate": 0.0002845365634906851, + "loss": 0.0334, "step": 39770 }, { - "epoch": 0.2, - "learning_rate": 0.0002698957171902669, - "loss": 0.0237, + "epoch": 0.1, + "learning_rate": 0.0002845326752743136, + "loss": 0.0274, "step": 39780 }, { - "epoch": 0.2, - "learning_rate": 0.0002698881494972529, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.0002845287870579422, + "loss": 0.0336, "step": 39790 }, { - "epoch": 0.2, - "learning_rate": 0.00026988058180423886, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.0002845248988415707, + "loss": 0.0319, "step": 39800 }, { - "epoch": 0.2, - "learning_rate": 0.0002698730141112249, - "loss": 0.0241, + "epoch": 0.1, + "learning_rate": 0.0002845210106251992, + "loss": 0.0263, "step": 39810 }, { - "epoch": 0.2, - "learning_rate": 0.0002698654464182109, - "loss": 0.0213, + "epoch": 0.1, + "learning_rate": 0.0002845171224088278, + "loss": 0.0309, "step": 39820 }, { - "epoch": 0.2, - "learning_rate": 0.00026985787872519686, - "loss": 0.0202, + "epoch": 0.1, + "learning_rate": 0.00028451323419245635, + "loss": 0.0287, "step": 39830 }, { - "epoch": 0.2, - "learning_rate": 0.00026985031103218284, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.00028450934597608487, + "loss": 0.0281, "step": 39840 }, { - "epoch": 0.2, - "learning_rate": 0.0002698427433391688, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002845054577597134, + "loss": 0.0271, "step": 39850 }, { - "epoch": 0.2, - "learning_rate": 0.0002698351756461548, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.0002845015695433419, + "loss": 0.0331, "step": 39860 }, { - "epoch": 0.2, - "learning_rate": 0.00026982760795314084, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.00028449768132697047, + "loss": 0.0324, "step": 39870 }, { - "epoch": 0.2, - "learning_rate": 0.0002698200402601268, - "loss": 0.0255, + "epoch": 0.1, + "learning_rate": 0.000284493793110599, + "loss": 0.0356, "step": 39880 }, { - "epoch": 0.2, - "learning_rate": 0.0002698124725671128, - "loss": 0.0256, + "epoch": 0.1, + "learning_rate": 0.00028448990489422755, + "loss": 0.0268, "step": 39890 }, { - "epoch": 0.2, - "learning_rate": 0.0002698049048740988, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.00028448601667785606, + "loss": 0.0351, "step": 39900 }, { - "epoch": 0.2, - "learning_rate": 0.00026979733718108476, - "loss": 0.0215, + "epoch": 0.1, + "learning_rate": 0.00028448212846148463, + "loss": 0.0314, "step": 39910 }, { - "epoch": 0.2, - "learning_rate": 0.00026978976948807074, - "loss": 0.0348, + "epoch": 0.1, + "learning_rate": 0.00028447824024511315, + "loss": 0.0313, "step": 39920 }, { - "epoch": 0.2, - "learning_rate": 0.0002697822017950567, - "loss": 0.0344, + "epoch": 0.1, + "learning_rate": 0.00028447435202874166, + "loss": 0.0259, "step": 39930 }, { - "epoch": 0.2, - "learning_rate": 0.00026977463410204276, - "loss": 0.0237, + "epoch": 0.1, + "learning_rate": 0.0002844704638123702, + "loss": 0.0296, "step": 39940 }, { - "epoch": 0.2, - "learning_rate": 0.00026976706640902874, - "loss": 0.0288, + "epoch": 0.1, + "learning_rate": 0.00028446657559599874, + "loss": 0.0262, "step": 39950 }, { - "epoch": 0.2, - "learning_rate": 0.0002697594987160147, - "loss": 0.0227, + "epoch": 0.1, + "learning_rate": 0.00028446268737962726, + "loss": 0.0349, "step": 39960 }, { - "epoch": 0.2, - "learning_rate": 0.0002697519310230007, - "loss": 0.0276, + "epoch": 0.1, + "learning_rate": 0.00028445879916325583, + "loss": 0.0335, "step": 39970 }, { - "epoch": 0.2, - "learning_rate": 0.0002697443633299867, - "loss": 0.0226, + "epoch": 0.1, + "learning_rate": 0.00028445491094688434, + "loss": 0.0311, "step": 39980 }, { - "epoch": 0.2, - "learning_rate": 0.00026973679563697267, - "loss": 0.0191, + "epoch": 0.1, + "learning_rate": 0.00028445102273051286, + "loss": 0.027, "step": 39990 }, { - "epoch": 0.2, - "learning_rate": 0.0002697292279439587, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.0002844471345141414, + "loss": 0.026, "step": 40000 }, { - "epoch": 0.2, - "eval_cer": 0.9144896638256703, - "eval_loss": 0.017527606338262558, - "eval_runtime": 117.0438, - "eval_samples_per_second": 17.088, - "eval_steps_per_second": 4.272, + "epoch": 0.1, + "eval_cer": 0.8818636445705984, + "eval_loss": 0.021385852247476578, + "eval_runtime": 107.7355, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 40000 }, { - "epoch": 0.2, - "learning_rate": 0.0002697216602509447, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.00028444324629776994, + "loss": 0.0295, "step": 40010 }, { - "epoch": 0.2, - "learning_rate": 0.00026971409255793067, - "loss": 0.024, + "epoch": 0.1, + "learning_rate": 0.0002844393580813985, + "loss": 0.0276, "step": 40020 }, { - "epoch": 0.2, - "learning_rate": 0.00026970652486491665, - "loss": 0.0232, + "epoch": 0.1, + "learning_rate": 0.000284435469865027, + "loss": 0.0319, "step": 40030 }, { - "epoch": 0.2, - "learning_rate": 0.00026969895717190263, - "loss": 0.0238, + "epoch": 0.1, + "learning_rate": 0.0002844315816486556, + "loss": 0.0306, "step": 40040 }, { - "epoch": 0.2, - "learning_rate": 0.0002696913894788886, - "loss": 0.0242, + "epoch": 0.1, + "learning_rate": 0.0002844276934322841, + "loss": 0.028, "step": 40050 }, { - "epoch": 0.2, - "learning_rate": 0.00026968382178587465, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.0002844238052159126, + "loss": 0.0282, "step": 40060 }, { - "epoch": 0.2, - "learning_rate": 0.00026967625409286063, - "loss": 0.0212, + "epoch": 0.1, + "learning_rate": 0.00028441991699954114, + "loss": 0.0311, "step": 40070 }, { - "epoch": 0.2, - "learning_rate": 0.0002696686863998466, - "loss": 0.0224, + "epoch": 0.1, + "learning_rate": 0.0002844160287831697, + "loss": 0.0329, "step": 40080 }, { - "epoch": 0.2, - "learning_rate": 0.0002696611187068326, - "loss": 0.0264, + "epoch": 0.1, + "learning_rate": 0.0002844121405667982, + "loss": 0.0337, "step": 40090 }, { - "epoch": 0.2, - "learning_rate": 0.00026965355101381857, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.0002844082523504268, + "loss": 0.0276, "step": 40100 }, { - "epoch": 0.2, - "learning_rate": 0.00026964598332080455, - "loss": 0.0193, + "epoch": 0.1, + "learning_rate": 0.0002844043641340553, + "loss": 0.0268, "step": 40110 }, { - "epoch": 0.2, - "learning_rate": 0.00026963841562779054, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.00028440047591768387, + "loss": 0.0316, "step": 40120 }, { - "epoch": 0.2, - "learning_rate": 0.00026963084793477657, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.0002843965877013124, + "loss": 0.0298, "step": 40130 }, { - "epoch": 0.2, - "learning_rate": 0.00026962328024176255, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.0002843926994849409, + "loss": 0.0266, "step": 40140 }, { - "epoch": 0.2, - "learning_rate": 0.00026961571254874853, - "loss": 0.0225, + "epoch": 0.1, + "learning_rate": 0.0002843888112685694, + "loss": 0.0247, "step": 40150 }, { - "epoch": 0.2, - "learning_rate": 0.0002696081448557345, - "loss": 0.0234, + "epoch": 0.1, + "learning_rate": 0.000284384923052198, + "loss": 0.0309, "step": 40160 }, { - "epoch": 0.2, - "learning_rate": 0.0002696005771627205, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.00028438103483582655, + "loss": 0.0235, "step": 40170 }, { - "epoch": 0.2, - "learning_rate": 0.0002695930094697065, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028437714661945507, + "loss": 0.0284, "step": 40180 }, { - "epoch": 0.2, - "learning_rate": 0.0002695854417766925, - "loss": 0.0198, + "epoch": 0.1, + "learning_rate": 0.0002843732584030836, + "loss": 0.0255, "step": 40190 }, { - "epoch": 0.2, - "learning_rate": 0.0002695778740836785, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.0002843693701867121, + "loss": 0.0324, "step": 40200 }, { - "epoch": 0.2, - "learning_rate": 0.0002695703063906645, - "loss": 0.0218, + "epoch": 0.1, + "learning_rate": 0.00028436548197034066, + "loss": 0.0328, "step": 40210 }, { - "epoch": 0.2, - "learning_rate": 0.00026956273869765046, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.0002843615937539692, + "loss": 0.0286, "step": 40220 }, { - "epoch": 0.2, - "learning_rate": 0.00026955517100463644, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028435770553759775, + "loss": 0.0269, "step": 40230 }, { - "epoch": 0.2, - "learning_rate": 0.0002695476033116224, - "loss": 0.0228, + "epoch": 0.1, + "learning_rate": 0.00028435381732122626, + "loss": 0.0279, "step": 40240 }, { - "epoch": 0.2, - "learning_rate": 0.00026954003561860846, - "loss": 0.018, + "epoch": 0.1, + "learning_rate": 0.00028434992910485483, + "loss": 0.0304, "step": 40250 }, { - "epoch": 0.2, - "learning_rate": 0.00026953246792559444, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.00028434604088848335, + "loss": 0.0279, "step": 40260 }, { - "epoch": 0.2, - "learning_rate": 0.0002695249002325804, - "loss": 0.0248, - "step": 40270 + "epoch": 0.1, + "learning_rate": 0.00028434215267211186, + "loss": 0.0428, + "step": 40270 }, { - "epoch": 0.2, - "learning_rate": 0.0002695173325395664, - "loss": 0.0231, + "epoch": 0.1, + "learning_rate": 0.0002843382644557404, + "loss": 0.028, "step": 40280 }, { - "epoch": 0.2, - "learning_rate": 0.0002695097648465524, - "loss": 0.0194, + "epoch": 0.1, + "learning_rate": 0.00028433437623936894, + "loss": 0.0275, "step": 40290 }, { - "epoch": 0.2, - "learning_rate": 0.00026950219715353836, - "loss": 0.0268, + "epoch": 0.1, + "learning_rate": 0.00028433048802299746, + "loss": 0.0412, "step": 40300 }, { - "epoch": 0.2, - "learning_rate": 0.00026949462946052435, - "loss": 0.0225, + "epoch": 0.1, + "learning_rate": 0.000284326599806626, + "loss": 0.0324, "step": 40310 }, { - "epoch": 0.2, - "learning_rate": 0.0002694870617675104, - "loss": 0.021, + "epoch": 0.1, + "learning_rate": 0.00028432271159025454, + "loss": 0.0407, "step": 40320 }, { - "epoch": 0.2, - "learning_rate": 0.00026947949407449636, - "loss": 0.0212, + "epoch": 0.1, + "learning_rate": 0.0002843188233738831, + "loss": 0.0344, "step": 40330 }, { - "epoch": 0.2, - "learning_rate": 0.00026947192638148234, - "loss": 0.0196, + "epoch": 0.1, + "learning_rate": 0.0002843149351575116, + "loss": 0.0359, "step": 40340 }, { - "epoch": 0.2, - "learning_rate": 0.0002694643586884683, - "loss": 0.0207, + "epoch": 0.1, + "learning_rate": 0.00028431104694114014, + "loss": 0.0333, "step": 40350 }, { - "epoch": 0.2, - "learning_rate": 0.0002694567909954543, - "loss": 0.0239, + "epoch": 0.1, + "learning_rate": 0.00028430715872476865, + "loss": 0.0334, "step": 40360 }, { - "epoch": 0.2, - "learning_rate": 0.0002694492233024403, - "loss": 0.0247, + "epoch": 0.1, + "learning_rate": 0.0002843032705083972, + "loss": 0.0357, "step": 40370 }, { - "epoch": 0.2, - "learning_rate": 0.0002694416556094263, - "loss": 0.0192, + "epoch": 0.1, + "learning_rate": 0.0002842993822920258, + "loss": 0.0295, "step": 40380 }, { - "epoch": 0.2, - "learning_rate": 0.0002694340879164123, - "loss": 0.023, + "epoch": 0.1, + "learning_rate": 0.0002842954940756543, + "loss": 0.0316, "step": 40390 }, { - "epoch": 0.2, - "learning_rate": 0.0002694265202233983, - "loss": 0.0229, + "epoch": 0.1, + "learning_rate": 0.0002842916058592828, + "loss": 0.0302, "step": 40400 }, { - "epoch": 0.2, - "learning_rate": 0.00026941895253038427, - "loss": 0.0219, + "epoch": 0.1, + "learning_rate": 0.0002842877176429114, + "loss": 0.0393, "step": 40410 }, { - "epoch": 0.2, - "learning_rate": 0.00026941138483737025, - "loss": 0.0203, + "epoch": 0.1, + "learning_rate": 0.0002842838294265399, + "loss": 0.0333, "step": 40420 }, { - "epoch": 0.2, - "learning_rate": 0.00026940381714435623, - "loss": 0.0248, + "epoch": 0.1, + "learning_rate": 0.0002842799412101684, + "loss": 0.0307, "step": 40430 }, { - "epoch": 0.2, - "learning_rate": 0.0002693962494513422, - "loss": 0.0201, + "epoch": 0.1, + "learning_rate": 0.000284276052993797, + "loss": 0.0377, "step": 40440 }, { - "epoch": 0.2, - "learning_rate": 0.00026938868175832825, - "loss": 0.0244, + "epoch": 0.1, + "learning_rate": 0.0002842721647774255, + "loss": 0.0407, "step": 40450 }, { - "epoch": 0.2, - "learning_rate": 0.00026938111406531423, - "loss": 0.0253, + "epoch": 0.1, + "learning_rate": 0.00028426827656105407, + "loss": 0.029, "step": 40460 }, { - "epoch": 0.2, - "learning_rate": 0.0002693735463723002, - "loss": 0.0213, + "epoch": 0.1, + "learning_rate": 0.0002842643883446826, + "loss": 0.0357, "step": 40470 }, { - "epoch": 0.2, - "learning_rate": 0.0002693659786792862, - "loss": 0.0182, + "epoch": 0.1, + "learning_rate": 0.0002842605001283111, + "loss": 0.0327, "step": 40480 }, { - "epoch": 0.2, - "learning_rate": 0.0002693584109862722, - "loss": 0.0214, + "epoch": 0.1, + "learning_rate": 0.0002842566119119396, + "loss": 0.0365, "step": 40490 }, { - "epoch": 0.2, - "learning_rate": 0.00026935084329325816, - "loss": 0.0233, + "epoch": 0.1, + "learning_rate": 0.0002842527236955682, + "loss": 0.0325, "step": 40500 }, { - "epoch": 0.2, - "learning_rate": 0.0002693432756002442, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.0002842488354791967, + "loss": 0.0313, "step": 40510 }, { - "epoch": 0.2, - "learning_rate": 0.00026933570790723017, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.00028424494726282527, + "loss": 0.0333, "step": 40520 }, { - "epoch": 0.2, - "learning_rate": 0.00026932814021421615, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.0002842410590464538, + "loss": 0.049, "step": 40530 }, { - "epoch": 0.2, - "learning_rate": 0.00026932057252120214, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028423717083008235, + "loss": 0.0323, "step": 40540 }, { - "epoch": 0.2, - "learning_rate": 0.0002693130048281881, - "loss": 0.027, + "epoch": 0.11, + "learning_rate": 0.00028423328261371086, + "loss": 0.0306, "step": 40550 }, { - "epoch": 0.2, - "learning_rate": 0.0002693054371351741, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.0002842293943973394, + "loss": 0.0267, "step": 40560 }, { - "epoch": 0.2, - "learning_rate": 0.00026929786944216013, - "loss": 0.0266, + "epoch": 0.11, + "learning_rate": 0.00028422550618096795, + "loss": 0.0278, "step": 40570 }, { - "epoch": 0.2, - "learning_rate": 0.0002692903017491461, - "loss": 0.0279, + "epoch": 0.11, + "learning_rate": 0.00028422161796459646, + "loss": 0.0314, "step": 40580 }, { - "epoch": 0.2, - "learning_rate": 0.0002692827340561321, - "loss": 0.0205, + "epoch": 0.11, + "learning_rate": 0.00028421772974822503, + "loss": 0.0352, "step": 40590 }, { - "epoch": 0.2, - "learning_rate": 0.0002692751663631181, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.00028421384153185354, + "loss": 0.029, "step": 40600 }, { - "epoch": 0.2, - "learning_rate": 0.00026926759867010406, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.00028420995331548206, + "loss": 0.027, "step": 40610 }, { - "epoch": 0.2, - "learning_rate": 0.00026926003097709004, - "loss": 0.0262, + "epoch": 0.11, + "learning_rate": 0.00028420606509911063, + "loss": 0.0341, "step": 40620 }, { - "epoch": 0.2, - "learning_rate": 0.000269252463284076, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.00028420217688273914, + "loss": 0.0319, "step": 40630 }, { - "epoch": 0.21, - "learning_rate": 0.00026924489559106206, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.00028419828866636766, + "loss": 0.0291, "step": 40640 }, { - "epoch": 0.21, - "learning_rate": 0.00026923732789804804, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.0002841944004499962, + "loss": 0.0287, "step": 40650 }, { - "epoch": 0.21, - "learning_rate": 0.000269229760205034, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.0002841905122336248, + "loss": 0.0222, "step": 40660 }, { - "epoch": 0.21, - "learning_rate": 0.00026922219251202, - "loss": 0.0278, + "epoch": 0.11, + "learning_rate": 0.0002841866240172533, + "loss": 0.0276, "step": 40670 }, { - "epoch": 0.21, - "learning_rate": 0.000269214624819006, - "loss": 0.0184, + "epoch": 0.11, + "learning_rate": 0.0002841827358008818, + "loss": 0.0278, "step": 40680 }, { - "epoch": 0.21, - "learning_rate": 0.00026920705712599197, - "loss": 0.0232, + "epoch": 0.11, + "learning_rate": 0.00028417884758451034, + "loss": 0.0241, "step": 40690 }, { - "epoch": 0.21, - "learning_rate": 0.000269199489432978, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.00028417495936813885, + "loss": 0.0363, "step": 40700 }, { - "epoch": 0.21, - "learning_rate": 0.000269191921739964, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002841710711517674, + "loss": 0.0301, "step": 40710 }, { - "epoch": 0.21, - "learning_rate": 0.00026918435404694996, - "loss": 0.0192, + "epoch": 0.11, + "learning_rate": 0.000284167182935396, + "loss": 0.0317, "step": 40720 }, { - "epoch": 0.21, - "learning_rate": 0.00026917678635393595, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002841632947190245, + "loss": 0.029, "step": 40730 }, { - "epoch": 0.21, - "learning_rate": 0.0002691692186609219, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.000284159406502653, + "loss": 0.0256, "step": 40740 }, { - "epoch": 0.21, - "learning_rate": 0.0002691616509679079, - "loss": 0.0259, + "epoch": 0.11, + "learning_rate": 0.0002841555182862816, + "loss": 0.0302, "step": 40750 }, { - "epoch": 0.21, - "learning_rate": 0.00026915408327489394, - "loss": 0.0215, + "epoch": 0.11, + "learning_rate": 0.0002841516300699101, + "loss": 0.0325, "step": 40760 }, { - "epoch": 0.21, - "learning_rate": 0.0002691465155818799, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002841477418535386, + "loss": 0.0277, "step": 40770 }, { - "epoch": 0.21, - "learning_rate": 0.0002691389478888659, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002841438536371672, + "loss": 0.0359, "step": 40780 }, { - "epoch": 0.21, - "learning_rate": 0.0002691313801958519, - "loss": 0.0194, + "epoch": 0.11, + "learning_rate": 0.0002841399654207957, + "loss": 0.0309, "step": 40790 }, { - "epoch": 0.21, - "learning_rate": 0.00026912381250283787, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.00028413607720442427, + "loss": 0.0382, "step": 40800 }, { - "epoch": 0.21, - "learning_rate": 0.00026911624480982385, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.0002841321889880528, + "loss": 0.0288, "step": 40810 }, { - "epoch": 0.21, - "learning_rate": 0.00026910867711680983, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.0002841283007716813, + "loss": 0.0356, "step": 40820 }, { - "epoch": 0.21, - "learning_rate": 0.00026910110942379587, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.00028412441255530987, + "loss": 0.0288, "step": 40830 }, { - "epoch": 0.21, - "learning_rate": 0.00026909354173078185, - "loss": 0.0255, + "epoch": 0.11, + "learning_rate": 0.0002841205243389384, + "loss": 0.0284, "step": 40840 }, { - "epoch": 0.21, - "learning_rate": 0.0002690859740377678, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.0002841166361225669, + "loss": 0.0347, "step": 40850 }, { - "epoch": 0.21, - "learning_rate": 0.00026907840634475376, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.00028411274790619546, + "loss": 0.0309, "step": 40860 }, { - "epoch": 0.21, - "learning_rate": 0.0002690708386517398, - "loss": 0.0216, + "epoch": 0.11, + "learning_rate": 0.00028410885968982403, + "loss": 0.031, "step": 40870 }, { - "epoch": 0.21, - "learning_rate": 0.0002690632709587258, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.00028410497147345255, + "loss": 0.0314, "step": 40880 }, { - "epoch": 0.21, - "learning_rate": 0.00026905570326571176, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.00028410108325708106, + "loss": 0.0338, "step": 40890 }, { - "epoch": 0.21, - "learning_rate": 0.00026904813557269774, - "loss": 0.024, + "epoch": 0.11, + "learning_rate": 0.0002840971950407096, + "loss": 0.0299, "step": 40900 }, { - "epoch": 0.21, - "learning_rate": 0.0002690405678796837, - "loss": 0.0252, + "epoch": 0.11, + "learning_rate": 0.00028409330682433815, + "loss": 0.0261, "step": 40910 }, { - "epoch": 0.21, - "learning_rate": 0.0002690330001866697, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.00028408941860796666, + "loss": 0.0303, "step": 40920 }, { - "epoch": 0.21, - "learning_rate": 0.00026902543249365574, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.00028408553039159523, + "loss": 0.0382, "step": 40930 }, { - "epoch": 0.21, - "learning_rate": 0.0002690178648006417, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.00028408164217522374, + "loss": 0.0284, "step": 40940 }, { - "epoch": 0.21, - "learning_rate": 0.0002690102971076277, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.00028407775395885226, + "loss": 0.0329, "step": 40950 }, { - "epoch": 0.21, - "learning_rate": 0.0002690027294146137, - "loss": 0.0267, + "epoch": 0.11, + "learning_rate": 0.0002840738657424808, + "loss": 0.0319, "step": 40960 }, { - "epoch": 0.21, - "learning_rate": 0.00026899516172159966, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.00028406997752610934, + "loss": 0.0302, "step": 40970 }, { - "epoch": 0.21, - "learning_rate": 0.00026898759402858564, - "loss": 0.025, + "epoch": 0.11, + "learning_rate": 0.00028406608930973786, + "loss": 0.0452, "step": 40980 }, { - "epoch": 0.21, - "learning_rate": 0.0002689800263355716, - "loss": 0.0233, + "epoch": 0.11, + "learning_rate": 0.0002840622010933664, + "loss": 0.0274, "step": 40990 }, { - "epoch": 0.21, - "learning_rate": 0.00026897245864255766, - "loss": 0.0207, + "epoch": 0.11, + "learning_rate": 0.00028405831287699494, + "loss": 0.0318, "step": 41000 }, { - "epoch": 0.21, - "eval_cer": 0.914467344714786, - "eval_loss": 0.01699613220989704, - "eval_runtime": 117.194, - "eval_samples_per_second": 17.066, - "eval_steps_per_second": 4.266, + "epoch": 0.11, + "eval_cer": 0.8817656699852059, + "eval_loss": 0.021903902292251587, + "eval_runtime": 107.5953, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 41000 }, { - "epoch": 0.21, - "learning_rate": 0.00026896489094954364, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.0002840544246606235, + "loss": 0.0273, "step": 41010 }, { - "epoch": 0.21, - "learning_rate": 0.0002689573232565296, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.000284050536444252, + "loss": 0.0282, "step": 41020 }, { - "epoch": 0.21, - "learning_rate": 0.0002689497555635156, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.00028404664822788054, + "loss": 0.0419, "step": 41030 }, { - "epoch": 0.21, - "learning_rate": 0.0002689421878705016, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002840427600115091, + "loss": 0.0402, "step": 41040 }, { - "epoch": 0.21, - "learning_rate": 0.00026893462017748757, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002840388717951376, + "loss": 0.0249, "step": 41050 }, { - "epoch": 0.21, - "learning_rate": 0.0002689270524844736, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.0002840349835787662, + "loss": 0.0277, "step": 41060 }, { - "epoch": 0.21, - "learning_rate": 0.0002689194847914596, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002840310953623947, + "loss": 0.0476, "step": 41070 }, { - "epoch": 0.21, - "learning_rate": 0.00026891191709844557, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.00028402720714602327, + "loss": 0.0341, "step": 41080 }, { - "epoch": 0.21, - "learning_rate": 0.00026890434940543155, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002840233189296518, + "loss": 0.029, "step": 41090 }, { - "epoch": 0.21, - "learning_rate": 0.00026889678171241753, - "loss": 0.0216, + "epoch": 0.11, + "learning_rate": 0.0002840194307132803, + "loss": 0.0277, "step": 41100 }, { - "epoch": 0.21, - "learning_rate": 0.0002688892140194035, - "loss": 0.0208, + "epoch": 0.11, + "learning_rate": 0.0002840155424969088, + "loss": 0.0313, "step": 41110 }, { - "epoch": 0.21, - "learning_rate": 0.00026888164632638955, - "loss": 0.0247, + "epoch": 0.11, + "learning_rate": 0.0002840116542805374, + "loss": 0.0384, "step": 41120 }, { - "epoch": 0.21, - "learning_rate": 0.00026887407863337553, - "loss": 0.0211, + "epoch": 0.11, + "learning_rate": 0.0002840077660641659, + "loss": 0.0338, "step": 41130 }, { - "epoch": 0.21, - "learning_rate": 0.0002688665109403615, - "loss": 0.0257, + "epoch": 0.11, + "learning_rate": 0.00028400387784779447, + "loss": 0.0266, "step": 41140 }, { - "epoch": 0.21, - "learning_rate": 0.0002688589432473475, - "loss": 0.025, + "epoch": 0.11, + "learning_rate": 0.000283999989631423, + "loss": 0.0282, "step": 41150 }, { - "epoch": 0.21, - "learning_rate": 0.00026885137555433347, - "loss": 0.0201, + "epoch": 0.11, + "learning_rate": 0.00028399610141505155, + "loss": 0.0289, "step": 41160 }, { - "epoch": 0.21, - "learning_rate": 0.00026884380786131945, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.00028399221319868007, + "loss": 0.0283, "step": 41170 }, { - "epoch": 0.21, - "learning_rate": 0.00026883624016830544, - "loss": 0.0261, + "epoch": 0.11, + "learning_rate": 0.0002839883249823086, + "loss": 0.0336, "step": 41180 }, { - "epoch": 0.21, - "learning_rate": 0.00026882867247529147, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002839844367659371, + "loss": 0.0297, "step": 41190 }, { - "epoch": 0.21, - "learning_rate": 0.00026882110478227745, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028398054854956566, + "loss": 0.0293, "step": 41200 }, { - "epoch": 0.21, - "learning_rate": 0.00026881353708926343, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.00028397666033319423, + "loss": 0.0285, "step": 41210 }, { - "epoch": 0.21, - "learning_rate": 0.0002688059693962494, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.00028397277211682275, + "loss": 0.0361, "step": 41220 }, { - "epoch": 0.21, - "learning_rate": 0.0002687984017032354, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.00028396888390045126, + "loss": 0.0385, "step": 41230 }, { - "epoch": 0.21, - "learning_rate": 0.0002687908340102214, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002839649956840798, + "loss": 0.0343, "step": 41240 }, { - "epoch": 0.21, - "learning_rate": 0.0002687832663172074, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028396110746770834, + "loss": 0.0273, "step": 41250 }, { - "epoch": 0.21, - "learning_rate": 0.0002687756986241934, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.00028395721925133686, + "loss": 0.0335, "step": 41260 }, { - "epoch": 0.21, - "learning_rate": 0.0002687681309311794, - "loss": 0.0283, + "epoch": 0.11, + "learning_rate": 0.00028395333103496543, + "loss": 0.0348, "step": 41270 }, { - "epoch": 0.21, - "learning_rate": 0.00026876056323816536, - "loss": 0.0257, + "epoch": 0.11, + "learning_rate": 0.00028394944281859394, + "loss": 0.0277, "step": 41280 }, { - "epoch": 0.21, - "learning_rate": 0.00026875299554515134, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.0002839455546022225, + "loss": 0.0299, "step": 41290 }, { - "epoch": 0.21, - "learning_rate": 0.0002687454278521373, - "loss": 0.0202, + "epoch": 0.11, + "learning_rate": 0.000283941666385851, + "loss": 0.0232, "step": 41300 }, { - "epoch": 0.21, - "learning_rate": 0.00026873786015912336, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.00028393777816947954, + "loss": 0.0273, "step": 41310 }, { - "epoch": 0.21, - "learning_rate": 0.00026873029246610934, - "loss": 0.029, + "epoch": 0.11, + "learning_rate": 0.00028393388995310805, + "loss": 0.0396, "step": 41320 }, { - "epoch": 0.21, - "learning_rate": 0.0002687227247730953, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.0002839300017367366, + "loss": 0.034, "step": 41330 }, { - "epoch": 0.21, - "learning_rate": 0.0002687151570800813, - "loss": 0.024, + "epoch": 0.11, + "learning_rate": 0.00028392611352036514, + "loss": 0.0325, "step": 41340 }, { - "epoch": 0.21, - "learning_rate": 0.0002687075893870673, - "loss": 0.0215, + "epoch": 0.11, + "learning_rate": 0.0002839222253039937, + "loss": 0.0282, "step": 41350 }, { - "epoch": 0.21, - "learning_rate": 0.00026870002169405326, - "loss": 0.0202, + "epoch": 0.11, + "learning_rate": 0.0002839183370876222, + "loss": 0.0296, "step": 41360 }, { - "epoch": 0.21, - "learning_rate": 0.00026869245400103925, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002839144488712508, + "loss": 0.0303, "step": 41370 }, { - "epoch": 0.21, - "learning_rate": 0.0002686848863080253, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002839105606548793, + "loss": 0.0312, "step": 41380 }, { - "epoch": 0.21, - "learning_rate": 0.00026867731861501126, - "loss": 0.0239, + "epoch": 0.11, + "learning_rate": 0.0002839066724385078, + "loss": 0.0268, "step": 41390 }, { - "epoch": 0.21, - "learning_rate": 0.00026866975092199724, - "loss": 0.0218, + "epoch": 0.11, + "learning_rate": 0.00028390278422213633, + "loss": 0.0451, "step": 41400 }, { - "epoch": 0.21, - "learning_rate": 0.0002686621832289832, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.0002838988960057649, + "loss": 0.0574, "step": 41410 }, { - "epoch": 0.21, - "learning_rate": 0.0002686546155359692, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.00028389500778939347, + "loss": 0.0366, "step": 41420 }, { - "epoch": 0.21, - "learning_rate": 0.0002686470478429552, - "loss": 0.0188, + "epoch": 0.11, + "learning_rate": 0.000283891119573022, + "loss": 0.0339, "step": 41430 }, { - "epoch": 0.21, - "learning_rate": 0.0002686394801499412, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.0002838872313566505, + "loss": 0.034, "step": 41440 }, { - "epoch": 0.21, - "learning_rate": 0.0002686319124569272, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.000283883343140279, + "loss": 0.0261, "step": 41450 }, { - "epoch": 0.21, - "learning_rate": 0.0002686243447639132, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.0002838794549239076, + "loss": 0.0342, "step": 41460 }, { - "epoch": 0.21, - "learning_rate": 0.00026861677707089917, - "loss": 0.02, + "epoch": 0.11, + "learning_rate": 0.0002838755667075361, + "loss": 0.0331, "step": 41470 }, { - "epoch": 0.21, - "learning_rate": 0.00026860920937788515, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.00028387167849116467, + "loss": 0.0402, "step": 41480 }, { - "epoch": 0.21, - "learning_rate": 0.00026860164168487113, - "loss": 0.0202, + "epoch": 0.11, + "learning_rate": 0.0002838677902747932, + "loss": 0.0346, "step": 41490 }, { - "epoch": 0.21, - "learning_rate": 0.0002685940739918571, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028386390205842175, + "loss": 0.0287, "step": 41500 }, { - "epoch": 0.21, - "learning_rate": 0.00026858650629884315, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.00028386001384205026, + "loss": 0.0288, "step": 41510 }, { - "epoch": 0.21, - "learning_rate": 0.00026857893860582913, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.0002838561256256788, + "loss": 0.0298, "step": 41520 }, { - "epoch": 0.21, - "learning_rate": 0.0002685713709128151, - "loss": 0.0223, + "epoch": 0.11, + "learning_rate": 0.0002838522374093073, + "loss": 0.028, "step": 41530 }, { - "epoch": 0.21, - "learning_rate": 0.0002685638032198011, - "loss": 0.0314, + "epoch": 0.11, + "learning_rate": 0.00028384834919293586, + "loss": 0.0305, "step": 41540 }, { - "epoch": 0.21, - "learning_rate": 0.0002685562355267871, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.0002838444609765644, + "loss": 0.0319, "step": 41550 }, { - "epoch": 0.21, - "learning_rate": 0.00026854866783377306, - "loss": 0.0286, + "epoch": 0.11, + "learning_rate": 0.00028384057276019295, + "loss": 0.0295, "step": 41560 }, { - "epoch": 0.21, - "learning_rate": 0.0002685411001407591, - "loss": 0.0293, + "epoch": 0.11, + "learning_rate": 0.00028383668454382146, + "loss": 0.0277, "step": 41570 }, { - "epoch": 0.21, - "learning_rate": 0.00026853353244774507, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.00028383279632745003, + "loss": 0.0274, "step": 41580 }, { - "epoch": 0.21, - "learning_rate": 0.00026852596475473105, - "loss": 0.0232, + "epoch": 0.11, + "learning_rate": 0.00028382890811107854, + "loss": 0.032, "step": 41590 }, { - "epoch": 0.21, - "learning_rate": 0.00026851839706171704, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.00028382501989470706, + "loss": 0.0369, "step": 41600 }, { - "epoch": 0.21, - "learning_rate": 0.000268510829368703, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.0002838211316783356, + "loss": 0.0296, "step": 41610 }, { - "epoch": 0.21, - "learning_rate": 0.000268503261675689, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028381724346196414, + "loss": 0.0256, "step": 41620 }, { - "epoch": 0.21, - "learning_rate": 0.00026849569398267503, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.0002838133552455927, + "loss": 0.0282, "step": 41630 }, { - "epoch": 0.21, - "learning_rate": 0.000268488126289661, - "loss": 0.0277, + "epoch": 0.11, + "learning_rate": 0.0002838094670292212, + "loss": 0.0269, "step": 41640 }, { - "epoch": 0.21, - "learning_rate": 0.000268480558596647, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028380557881284974, + "loss": 0.029, "step": 41650 }, { - "epoch": 0.21, - "learning_rate": 0.000268472990903633, - "loss": 0.0216, + "epoch": 0.11, + "learning_rate": 0.0002838016905964783, + "loss": 0.0286, "step": 41660 }, { - "epoch": 0.21, - "learning_rate": 0.00026846542321061896, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.0002837978023801068, + "loss": 0.0286, "step": 41670 }, { - "epoch": 0.21, - "learning_rate": 0.00026845785551760494, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.00028379391416373534, + "loss": 0.0315, "step": 41680 }, { - "epoch": 0.21, - "learning_rate": 0.0002684502878245909, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.0002837900259473639, + "loss": 0.0336, "step": 41690 }, { - "epoch": 0.21, - "learning_rate": 0.00026844272013157696, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002837861377309924, + "loss": 0.0297, "step": 41700 }, { - "epoch": 0.21, - "learning_rate": 0.00026843515243856294, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.000283782249514621, + "loss": 0.0372, "step": 41710 }, { - "epoch": 0.21, - "learning_rate": 0.0002684275847455489, - "loss": 0.0195, + "epoch": 0.11, + "learning_rate": 0.0002837783612982495, + "loss": 0.0326, "step": 41720 }, { - "epoch": 0.21, - "learning_rate": 0.0002684200170525349, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.000283774473081878, + "loss": 0.0365, "step": 41730 }, { - "epoch": 0.21, - "learning_rate": 0.0002684124493595209, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.00028377058486550653, + "loss": 0.0522, "step": 41740 }, { - "epoch": 0.21, - "learning_rate": 0.00026840488166650687, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002837666966491351, + "loss": 0.0514, "step": 41750 }, { - "epoch": 0.21, - "learning_rate": 0.0002683973139734929, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028376280843276367, + "loss": 0.0338, "step": 41760 }, { - "epoch": 0.21, - "learning_rate": 0.0002683897462804789, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.0002837589202163922, + "loss": 0.0357, "step": 41770 }, { - "epoch": 0.21, - "learning_rate": 0.00026838217858746486, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.0002837550320000207, + "loss": 0.0431, "step": 41780 }, { - "epoch": 0.21, - "learning_rate": 0.00026837461089445085, - "loss": 0.0263, + "epoch": 0.11, + "learning_rate": 0.00028375114378364927, + "loss": 0.0317, "step": 41790 }, { - "epoch": 0.21, - "learning_rate": 0.0002683670432014368, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.0002837472555672778, + "loss": 0.0376, "step": 41800 }, { - "epoch": 0.21, - "learning_rate": 0.0002683594755084228, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.0002837433673509063, + "loss": 0.0296, "step": 41810 }, { - "epoch": 0.21, - "learning_rate": 0.00026835190781540884, - "loss": 0.0203, + "epoch": 0.11, + "learning_rate": 0.00028373947913453487, + "loss": 0.0338, "step": 41820 }, { - "epoch": 0.21, - "learning_rate": 0.0002683443401223948, - "loss": 0.0245, + "epoch": 0.11, + "learning_rate": 0.0002837355909181634, + "loss": 0.0276, "step": 41830 }, { - "epoch": 0.21, - "learning_rate": 0.0002683367724293808, - "loss": 0.0206, + "epoch": 0.11, + "learning_rate": 0.00028373170270179195, + "loss": 0.0262, "step": 41840 }, { - "epoch": 0.21, - "learning_rate": 0.0002683292047363668, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028372781448542046, + "loss": 0.0261, "step": 41850 }, { - "epoch": 0.21, - "learning_rate": 0.00026832163704335277, - "loss": 0.0256, + "epoch": 0.11, + "learning_rate": 0.000283723926269049, + "loss": 0.0226, "step": 41860 }, { - "epoch": 0.21, - "learning_rate": 0.00026831406935033875, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028372003805267755, + "loss": 0.0252, "step": 41870 }, { - "epoch": 0.21, - "learning_rate": 0.00026830650165732473, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.00028371614983630606, + "loss": 0.0305, "step": 41880 }, { - "epoch": 0.21, - "learning_rate": 0.00026829893396431077, - "loss": 0.0211, + "epoch": 0.11, + "learning_rate": 0.0002837122616199346, + "loss": 0.0301, "step": 41890 }, { - "epoch": 0.21, - "learning_rate": 0.00026829136627129675, - "loss": 0.0196, + "epoch": 0.11, + "learning_rate": 0.00028370837340356314, + "loss": 0.0268, "step": 41900 }, { - "epoch": 0.21, - "learning_rate": 0.00026828379857828273, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002837044851871917, + "loss": 0.0303, "step": 41910 }, { - "epoch": 0.21, - "learning_rate": 0.0002682762308852687, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.00028370059697082023, + "loss": 0.0286, "step": 41920 }, { - "epoch": 0.21, - "learning_rate": 0.0002682686631922547, - "loss": 0.0218, + "epoch": 0.11, + "learning_rate": 0.00028369670875444874, + "loss": 0.0286, "step": 41930 }, { - "epoch": 0.21, - "learning_rate": 0.0002682610954992407, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.00028369282053807726, + "loss": 0.0263, "step": 41940 }, { - "epoch": 0.21, - "learning_rate": 0.0002682535278062267, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.00028368893232170577, + "loss": 0.0313, "step": 41950 }, { - "epoch": 0.21, - "learning_rate": 0.0002682459601132127, - "loss": 0.0307, + "epoch": 0.11, + "learning_rate": 0.00028368504410533434, + "loss": 0.0275, "step": 41960 }, { - "epoch": 0.21, - "learning_rate": 0.0002682383924201987, - "loss": 0.0334, + "epoch": 0.11, + "learning_rate": 0.0002836811558889629, + "loss": 0.0372, "step": 41970 }, { - "epoch": 0.21, - "learning_rate": 0.00026823082472718466, - "loss": 0.0275, + "epoch": 0.11, + "learning_rate": 0.0002836772676725914, + "loss": 0.0287, "step": 41980 }, { - "epoch": 0.21, - "learning_rate": 0.00026822325703417064, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.00028367337945621994, + "loss": 0.0279, "step": 41990 }, { - "epoch": 0.21, - "learning_rate": 0.0002682156893411566, - "loss": 0.0311, + "epoch": 0.11, + "learning_rate": 0.0002836694912398485, + "loss": 0.0328, "step": 42000 }, { - "epoch": 0.21, - "eval_cer": 0.9144421144155256, - "eval_loss": 0.01655089110136032, - "eval_runtime": 117.2639, - "eval_samples_per_second": 17.056, - "eval_steps_per_second": 4.264, + "epoch": 0.11, + "eval_cer": 0.8818510478381908, + "eval_loss": 0.021058108657598495, + "eval_runtime": 107.6507, + "eval_samples_per_second": 18.579, + "eval_steps_per_second": 4.645, "step": 42000 }, { - "epoch": 0.21, - "learning_rate": 0.0002682081216481426, - "loss": 0.0264, + "epoch": 0.11, + "learning_rate": 0.000283665603023477, + "loss": 0.0316, "step": 42010 }, { - "epoch": 0.21, - "learning_rate": 0.00026820055395512864, - "loss": 0.0291, + "epoch": 0.11, + "learning_rate": 0.00028366171480710554, + "loss": 0.0273, "step": 42020 }, { - "epoch": 0.21, - "learning_rate": 0.0002681929862621146, - "loss": 0.0261, + "epoch": 0.11, + "learning_rate": 0.0002836578265907341, + "loss": 0.028, "step": 42030 }, { - "epoch": 0.21, - "learning_rate": 0.0002681854185691006, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.0002836539383743626, + "loss": 0.0314, "step": 42040 }, { - "epoch": 0.21, - "learning_rate": 0.0002681778508760866, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.0002836500501579912, + "loss": 0.0286, "step": 42050 }, { - "epoch": 0.21, - "learning_rate": 0.00026817028318307256, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002836461619416197, + "loss": 0.029, "step": 42060 }, { - "epoch": 0.21, - "learning_rate": 0.00026816271549005854, - "loss": 0.0239, + "epoch": 0.11, + "learning_rate": 0.0002836422737252482, + "loss": 0.0283, "step": 42070 }, { - "epoch": 0.21, - "learning_rate": 0.0002681551477970446, - "loss": 0.0293, + "epoch": 0.11, + "learning_rate": 0.0002836383855088768, + "loss": 0.0291, "step": 42080 }, { - "epoch": 0.21, - "learning_rate": 0.00026814758010403056, - "loss": 0.0192, + "epoch": 0.11, + "learning_rate": 0.0002836344972925053, + "loss": 0.0267, "step": 42090 }, { - "epoch": 0.21, - "learning_rate": 0.00026814001241101654, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.0002836306090761338, + "loss": 0.0297, "step": 42100 }, { - "epoch": 0.21, - "learning_rate": 0.00026813244471800247, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.0002836267208597624, + "loss": 0.0268, "step": 42110 }, { - "epoch": 0.21, - "learning_rate": 0.0002681248770249885, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028362283264339095, + "loss": 0.0276, "step": 42120 }, { - "epoch": 0.21, - "learning_rate": 0.0002681173093319745, - "loss": 0.024, + "epoch": 0.11, + "learning_rate": 0.00028361894442701947, + "loss": 0.0341, "step": 42130 }, { - "epoch": 0.21, - "learning_rate": 0.00026810974163896047, - "loss": 0.0257, + "epoch": 0.11, + "learning_rate": 0.000283615056210648, + "loss": 0.0344, "step": 42140 }, { - "epoch": 0.21, - "learning_rate": 0.00026810217394594645, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002836111679942765, + "loss": 0.0328, "step": 42150 }, { - "epoch": 0.21, - "learning_rate": 0.00026809460625293243, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028360727977790506, + "loss": 0.0322, "step": 42160 }, { - "epoch": 0.21, - "learning_rate": 0.0002680870385599184, - "loss": 0.0223, + "epoch": 0.11, + "learning_rate": 0.0002836033915615336, + "loss": 0.0313, "step": 42170 }, { - "epoch": 0.21, - "learning_rate": 0.00026807947086690445, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028359950334516215, + "loss": 0.0338, "step": 42180 }, { - "epoch": 0.21, - "learning_rate": 0.00026807190317389043, - "loss": 0.02, + "epoch": 0.11, + "learning_rate": 0.00028359561512879066, + "loss": 0.0277, "step": 42190 }, { - "epoch": 0.21, - "learning_rate": 0.0002680643354808764, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.0002835917269124192, + "loss": 0.0323, "step": 42200 }, { - "epoch": 0.21, - "learning_rate": 0.0002680567677878624, - "loss": 0.0179, + "epoch": 0.11, + "learning_rate": 0.00028358783869604775, + "loss": 0.0229, "step": 42210 }, { - "epoch": 0.21, - "learning_rate": 0.00026804920009484837, - "loss": 0.0194, + "epoch": 0.11, + "learning_rate": 0.00028358395047967626, + "loss": 0.0256, "step": 42220 }, { - "epoch": 0.21, - "learning_rate": 0.00026804163240183435, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.0002835800622633048, + "loss": 0.0296, "step": 42230 }, { - "epoch": 0.21, - "learning_rate": 0.00026803406470882034, - "loss": 0.018, + "epoch": 0.11, + "learning_rate": 0.00028357617404693334, + "loss": 0.0357, "step": 42240 }, { - "epoch": 0.21, - "learning_rate": 0.00026802649701580637, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.0002835722858305619, + "loss": 0.0308, "step": 42250 }, { - "epoch": 0.21, - "learning_rate": 0.00026801892932279235, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.0002835683976141904, + "loss": 0.0284, "step": 42260 }, { - "epoch": 0.21, - "learning_rate": 0.00026801136162977833, - "loss": 0.0258, + "epoch": 0.11, + "learning_rate": 0.00028356450939781894, + "loss": 0.033, "step": 42270 }, { - "epoch": 0.21, - "learning_rate": 0.0002680037939367643, - "loss": 0.0204, + "epoch": 0.11, + "learning_rate": 0.00028356062118144746, + "loss": 0.0296, "step": 42280 }, { - "epoch": 0.21, - "learning_rate": 0.0002679962262437503, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.000283556732965076, + "loss": 0.0311, "step": 42290 }, { - "epoch": 0.21, - "learning_rate": 0.0002679886585507363, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.00028355284474870454, + "loss": 0.0243, "step": 42300 }, { - "epoch": 0.21, - "learning_rate": 0.0002679810908577223, - "loss": 0.0187, + "epoch": 0.11, + "learning_rate": 0.0002835489565323331, + "loss": 0.0288, "step": 42310 }, { - "epoch": 0.21, - "learning_rate": 0.0002679735231647083, - "loss": 0.019, + "epoch": 0.11, + "learning_rate": 0.0002835450683159616, + "loss": 0.0271, "step": 42320 }, { - "epoch": 0.21, - "learning_rate": 0.0002679659554716943, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002835411800995902, + "loss": 0.0281, "step": 42330 }, { - "epoch": 0.21, - "learning_rate": 0.00026795838777868026, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002835372918832187, + "loss": 0.0293, "step": 42340 }, { - "epoch": 0.21, - "learning_rate": 0.00026795082008566624, - "loss": 0.0202, + "epoch": 0.11, + "learning_rate": 0.0002835334036668472, + "loss": 0.0308, "step": 42350 }, { - "epoch": 0.21, - "learning_rate": 0.0002679432523926522, - "loss": 0.0223, + "epoch": 0.11, + "learning_rate": 0.00028352951545047573, + "loss": 0.0275, "step": 42360 }, { - "epoch": 0.21, - "learning_rate": 0.00026793568469963826, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.0002835256272341043, + "loss": 0.0265, "step": 42370 }, { - "epoch": 0.21, - "learning_rate": 0.00026792811700662424, - "loss": 0.0199, + "epoch": 0.11, + "learning_rate": 0.0002835217390177328, + "loss": 0.0283, "step": 42380 }, { - "epoch": 0.21, - "learning_rate": 0.0002679205493136102, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.0002835178508013614, + "loss": 0.0291, "step": 42390 }, { - "epoch": 0.21, - "learning_rate": 0.0002679129816205962, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.0002835139625849899, + "loss": 0.0306, "step": 42400 }, { - "epoch": 0.21, - "learning_rate": 0.0002679054139275822, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.00028351007436861847, + "loss": 0.0271, "step": 42410 }, { - "epoch": 0.21, - "learning_rate": 0.00026789784623456816, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.000283506186152247, + "loss": 0.034, "step": 42420 }, { - "epoch": 0.21, - "learning_rate": 0.00026789027854155415, - "loss": 0.0213, + "epoch": 0.11, + "learning_rate": 0.0002835022979358755, + "loss": 0.0371, "step": 42430 }, { - "epoch": 0.21, - "learning_rate": 0.0002678827108485402, - "loss": 0.0188, + "epoch": 0.11, + "learning_rate": 0.000283498409719504, + "loss": 0.0263, "step": 42440 }, { - "epoch": 0.21, - "learning_rate": 0.00026787514315552616, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.0002834945215031326, + "loss": 0.0301, "step": 42450 }, { - "epoch": 0.21, - "learning_rate": 0.00026786757546251214, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028349063328676115, + "loss": 0.0298, "step": 42460 }, { - "epoch": 0.21, - "learning_rate": 0.0002678600077694981, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028348674507038967, + "loss": 0.024, "step": 42470 }, { - "epoch": 0.21, - "learning_rate": 0.0002678524400764841, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002834828568540182, + "loss": 0.0288, "step": 42480 }, { - "epoch": 0.21, - "learning_rate": 0.0002678448723834701, - "loss": 0.0195, + "epoch": 0.11, + "learning_rate": 0.0002834789686376467, + "loss": 0.0472, "step": 42490 }, { - "epoch": 0.21, - "learning_rate": 0.0002678373046904561, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.00028347508042127526, + "loss": 0.0345, "step": 42500 }, { - "epoch": 0.21, - "learning_rate": 0.0002678297369974421, - "loss": 0.0203, + "epoch": 0.11, + "learning_rate": 0.0002834711922049038, + "loss": 0.0334, "step": 42510 }, { - "epoch": 0.21, - "learning_rate": 0.0002678221693044281, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.00028346730398853235, + "loss": 0.0276, "step": 42520 }, { - "epoch": 0.21, - "learning_rate": 0.00026781460161141407, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.00028346341577216086, + "loss": 0.0272, "step": 42530 }, { - "epoch": 0.21, - "learning_rate": 0.00026780703391840005, - "loss": 0.0261, + "epoch": 0.11, + "learning_rate": 0.00028345952755578943, + "loss": 0.0251, "step": 42540 }, { - "epoch": 0.21, - "learning_rate": 0.00026779946622538603, - "loss": 0.0243, + "epoch": 0.11, + "learning_rate": 0.00028345563933941794, + "loss": 0.0258, "step": 42550 }, { - "epoch": 0.21, - "learning_rate": 0.00026779189853237207, - "loss": 0.0204, + "epoch": 0.11, + "learning_rate": 0.00028345175112304646, + "loss": 0.0294, "step": 42560 }, { - "epoch": 0.21, - "learning_rate": 0.00026778433083935805, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.000283447862906675, + "loss": 0.0338, "step": 42570 }, { - "epoch": 0.21, - "learning_rate": 0.00026777676314634403, - "loss": 0.0189, + "epoch": 0.11, + "learning_rate": 0.00028344397469030354, + "loss": 0.0319, "step": 42580 }, { - "epoch": 0.21, - "learning_rate": 0.00026776919545333, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.00028344008647393206, + "loss": 0.0287, "step": 42590 }, { - "epoch": 0.21, - "learning_rate": 0.000267761627760316, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002834361982575606, + "loss": 0.0253, "step": 42600 }, { - "epoch": 0.21, - "learning_rate": 0.000267754060067302, - "loss": 0.0232, + "epoch": 0.11, + "learning_rate": 0.00028343231004118914, + "loss": 0.031, "step": 42610 }, { - "epoch": 0.22, - "learning_rate": 0.00026774649237428796, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002834284218248177, + "loss": 0.0294, "step": 42620 }, { - "epoch": 0.22, - "learning_rate": 0.000267738924681274, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.0002834245336084462, + "loss": 0.0276, "step": 42630 }, { - "epoch": 0.22, - "learning_rate": 0.00026773135698825997, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.00028342064539207474, + "loss": 0.0299, "step": 42640 }, { - "epoch": 0.22, - "learning_rate": 0.00026772378929524595, - "loss": 0.0223, + "epoch": 0.11, + "learning_rate": 0.0002834167571757033, + "loss": 0.031, "step": 42650 }, { - "epoch": 0.22, - "learning_rate": 0.00026771622160223194, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002834128689593318, + "loss": 0.026, "step": 42660 }, { - "epoch": 0.22, - "learning_rate": 0.0002677086539092179, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.0002834089807429604, + "loss": 0.0259, "step": 42670 }, { - "epoch": 0.22, - "learning_rate": 0.0002677010862162039, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.0002834050925265889, + "loss": 0.0279, "step": 42680 }, { - "epoch": 0.22, - "learning_rate": 0.00026769351852318993, - "loss": 0.0256, + "epoch": 0.11, + "learning_rate": 0.0002834012043102174, + "loss": 0.0292, "step": 42690 }, { - "epoch": 0.22, - "learning_rate": 0.0002676859508301759, - "loss": 0.0274, + "epoch": 0.11, + "learning_rate": 0.00028339731609384593, + "loss": 0.0269, "step": 42700 }, { - "epoch": 0.22, - "learning_rate": 0.0002676783831371619, - "loss": 0.024, + "epoch": 0.11, + "learning_rate": 0.0002833934278774745, + "loss": 0.0286, "step": 42710 }, { - "epoch": 0.22, - "learning_rate": 0.0002676708154441479, - "loss": 0.0265, + "epoch": 0.11, + "learning_rate": 0.000283389539661103, + "loss": 0.0314, "step": 42720 }, { - "epoch": 0.22, - "learning_rate": 0.00026766324775113386, - "loss": 0.0192, + "epoch": 0.11, + "learning_rate": 0.0002833856514447316, + "loss": 0.0348, "step": 42730 }, { - "epoch": 0.22, - "learning_rate": 0.00026765568005811984, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.0002833817632283601, + "loss": 0.0255, "step": 42740 }, { - "epoch": 0.22, - "learning_rate": 0.0002676481123651058, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.00028337787501198867, + "loss": 0.0318, "step": 42750 }, { - "epoch": 0.22, - "learning_rate": 0.00026764054467209186, - "loss": 0.0211, + "epoch": 0.11, + "learning_rate": 0.0002833739867956172, + "loss": 0.0276, "step": 42760 }, { - "epoch": 0.22, - "learning_rate": 0.00026763297697907784, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.0002833700985792457, + "loss": 0.0303, "step": 42770 }, { - "epoch": 0.22, - "learning_rate": 0.0002676254092860638, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002833662103628742, + "loss": 0.0301, "step": 42780 }, { - "epoch": 0.22, - "learning_rate": 0.0002676178415930498, - "loss": 0.0222, + "epoch": 0.11, + "learning_rate": 0.0002833623221465028, + "loss": 0.0336, "step": 42790 }, { - "epoch": 0.22, - "learning_rate": 0.0002676102739000358, - "loss": 0.0208, + "epoch": 0.11, + "learning_rate": 0.00028335843393013135, + "loss": 0.0304, "step": 42800 }, { - "epoch": 0.22, - "learning_rate": 0.00026760270620702177, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.00028335454571375986, + "loss": 0.0244, "step": 42810 }, { - "epoch": 0.22, - "learning_rate": 0.0002675951385140078, - "loss": 0.0195, + "epoch": 0.11, + "learning_rate": 0.0002833506574973884, + "loss": 0.0318, "step": 42820 }, { - "epoch": 0.22, - "learning_rate": 0.0002675875708209938, - "loss": 0.0269, + "epoch": 0.11, + "learning_rate": 0.00028334676928101695, + "loss": 0.026, "step": 42830 }, { - "epoch": 0.22, - "learning_rate": 0.00026758000312797976, - "loss": 0.0266, + "epoch": 0.11, + "learning_rate": 0.00028334288106464546, + "loss": 0.0327, "step": 42840 }, { - "epoch": 0.22, - "learning_rate": 0.00026757243543496575, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.000283338992848274, + "loss": 0.0325, "step": 42850 }, { - "epoch": 0.22, - "learning_rate": 0.00026756486774195173, - "loss": 0.0231, + "epoch": 0.11, + "learning_rate": 0.00028333510463190254, + "loss": 0.028, "step": 42860 }, { - "epoch": 0.22, - "learning_rate": 0.0002675573000489377, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.00028333121641553106, + "loss": 0.0374, "step": 42870 }, { - "epoch": 0.22, - "learning_rate": 0.00026754973235592374, - "loss": 0.0207, + "epoch": 0.11, + "learning_rate": 0.00028332732819915963, + "loss": 0.0341, "step": 42880 }, { - "epoch": 0.22, - "learning_rate": 0.0002675421646629097, - "loss": 0.0204, + "epoch": 0.11, + "learning_rate": 0.00028332343998278814, + "loss": 0.0304, "step": 42890 }, { - "epoch": 0.22, - "learning_rate": 0.0002675345969698957, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.00028331955176641666, + "loss": 0.0458, "step": 42900 }, { - "epoch": 0.22, - "learning_rate": 0.0002675270292768817, - "loss": 0.0285, + "epoch": 0.11, + "learning_rate": 0.0002833156635500452, + "loss": 0.0376, "step": 42910 }, { - "epoch": 0.22, - "learning_rate": 0.00026751946158386767, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.00028331177533367374, + "loss": 0.0365, "step": 42920 }, { - "epoch": 0.22, - "learning_rate": 0.00026751189389085365, - "loss": 0.0294, + "epoch": 0.11, + "learning_rate": 0.00028330788711730226, + "loss": 0.0309, "step": 42930 }, { - "epoch": 0.22, - "learning_rate": 0.00026750432619783963, - "loss": 0.0213, + "epoch": 0.11, + "learning_rate": 0.0002833039989009308, + "loss": 0.0263, "step": 42940 }, { - "epoch": 0.22, - "learning_rate": 0.00026749675850482567, - "loss": 0.0254, + "epoch": 0.11, + "learning_rate": 0.00028330011068455934, + "loss": 0.0353, "step": 42950 }, { - "epoch": 0.22, - "learning_rate": 0.00026748919081181165, - "loss": 0.0196, + "epoch": 0.11, + "learning_rate": 0.0002832962224681879, + "loss": 0.0337, "step": 42960 }, { - "epoch": 0.22, - "learning_rate": 0.00026748162311879763, - "loss": 0.0287, + "epoch": 0.11, + "learning_rate": 0.0002832923342518164, + "loss": 0.0267, "step": 42970 }, { - "epoch": 0.22, - "learning_rate": 0.0002674740554257836, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.00028328844603544494, + "loss": 0.0302, "step": 42980 }, { - "epoch": 0.22, - "learning_rate": 0.0002674664877327696, - "loss": 0.0244, + "epoch": 0.11, + "learning_rate": 0.00028328455781907345, + "loss": 0.0297, "step": 42990 }, { - "epoch": 0.22, - "learning_rate": 0.0002674589200397556, - "loss": 0.024, + "epoch": 0.11, + "learning_rate": 0.000283280669602702, + "loss": 0.0374, "step": 43000 }, { - "epoch": 0.22, - "eval_cer": 0.9144954862024227, - "eval_loss": 0.01679139770567417, - "eval_runtime": 117.1853, - "eval_samples_per_second": 17.067, - "eval_steps_per_second": 4.267, + "epoch": 0.11, + "eval_cer": 0.8818090587301654, + "eval_loss": 0.02232929691672325, + "eval_runtime": 107.3768, + "eval_samples_per_second": 18.626, + "eval_steps_per_second": 4.657, "step": 43000 }, { - "epoch": 0.22, - "learning_rate": 0.0002674513523467416, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.0002832767813863306, + "loss": 0.0275, "step": 43010 }, { - "epoch": 0.22, - "learning_rate": 0.0002674437846537276, - "loss": 0.0265, + "epoch": 0.11, + "learning_rate": 0.0002832728931699591, + "loss": 0.0277, "step": 43020 }, { - "epoch": 0.22, - "learning_rate": 0.0002674362169607136, - "loss": 0.0239, + "epoch": 0.11, + "learning_rate": 0.0002832690049535876, + "loss": 0.0287, "step": 43030 }, { - "epoch": 0.22, - "learning_rate": 0.00026742864926769956, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.0002832651167372162, + "loss": 0.0317, "step": 43040 }, { - "epoch": 0.22, - "learning_rate": 0.00026742108157468554, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.0002832612285208447, + "loss": 0.0281, "step": 43050 }, { - "epoch": 0.22, - "learning_rate": 0.0002674135138816715, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.0002832573403044732, + "loss": 0.0234, "step": 43060 }, { - "epoch": 0.22, - "learning_rate": 0.00026740594618865755, - "loss": 0.0221, + "epoch": 0.11, + "learning_rate": 0.0002832534520881018, + "loss": 0.0339, "step": 43070 }, { - "epoch": 0.22, - "learning_rate": 0.00026739837849564354, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.0002832495638717303, + "loss": 0.0329, "step": 43080 }, { - "epoch": 0.22, - "learning_rate": 0.0002673908108026295, - "loss": 0.02, + "epoch": 0.11, + "learning_rate": 0.00028324567565535887, + "loss": 0.0299, "step": 43090 }, { - "epoch": 0.22, - "learning_rate": 0.0002673832431096155, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.0002832417874389874, + "loss": 0.0307, "step": 43100 }, { - "epoch": 0.22, - "learning_rate": 0.0002673756754166015, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.0002832378992226159, + "loss": 0.0258, "step": 43110 }, { - "epoch": 0.22, - "learning_rate": 0.00026736810772358746, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.00028323401100624446, + "loss": 0.0375, "step": 43120 }, { - "epoch": 0.22, - "learning_rate": 0.00026736054003057344, - "loss": 0.0192, + "epoch": 0.11, + "learning_rate": 0.000283230122789873, + "loss": 0.0275, "step": 43130 }, { - "epoch": 0.22, - "learning_rate": 0.0002673529723375595, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002832262345735015, + "loss": 0.0349, "step": 43140 }, { - "epoch": 0.22, - "learning_rate": 0.00026734540464454546, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.00028322234635713006, + "loss": 0.042, "step": 43150 }, { - "epoch": 0.22, - "learning_rate": 0.00026733783695153144, - "loss": 0.0224, + "epoch": 0.11, + "learning_rate": 0.00028321845814075863, + "loss": 0.0289, "step": 43160 }, { - "epoch": 0.22, - "learning_rate": 0.0002673302692585174, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.00028321456992438715, + "loss": 0.0303, "step": 43170 }, { - "epoch": 0.22, - "learning_rate": 0.0002673227015655034, - "loss": 0.025, + "epoch": 0.11, + "learning_rate": 0.00028321068170801566, + "loss": 0.0291, "step": 43180 }, { - "epoch": 0.22, - "learning_rate": 0.0002673151338724894, - "loss": 0.0229, + "epoch": 0.11, + "learning_rate": 0.0002832067934916442, + "loss": 0.0276, "step": 43190 }, { - "epoch": 0.22, - "learning_rate": 0.0002673075661794754, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.00028320290527527274, + "loss": 0.0328, "step": 43200 }, { - "epoch": 0.22, - "learning_rate": 0.0002672999984864614, - "loss": 0.0209, + "epoch": 0.11, + "learning_rate": 0.00028319901705890126, + "loss": 0.029, "step": 43210 }, { - "epoch": 0.22, - "learning_rate": 0.0002672924307934474, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.00028319512884252983, + "loss": 0.0264, "step": 43220 }, { - "epoch": 0.22, - "learning_rate": 0.00026728486310043337, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.00028319124062615834, + "loss": 0.0308, "step": 43230 }, { - "epoch": 0.22, - "learning_rate": 0.00026727729540741935, - "loss": 0.0241, + "epoch": 0.11, + "learning_rate": 0.00028318735240978686, + "loss": 0.03, "step": 43240 }, { - "epoch": 0.22, - "learning_rate": 0.00026726972771440533, - "loss": 0.0254, + "epoch": 0.11, + "learning_rate": 0.0002831834641934154, + "loss": 0.0335, "step": 43250 }, { - "epoch": 0.22, - "learning_rate": 0.0002672621600213913, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.00028317957597704394, + "loss": 0.0259, "step": 43260 }, { - "epoch": 0.22, - "learning_rate": 0.00026725459232837735, - "loss": 0.0281, + "epoch": 0.11, + "learning_rate": 0.00028317568776067245, + "loss": 0.0306, "step": 43270 }, { - "epoch": 0.22, - "learning_rate": 0.00026724702463536333, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.000283171799544301, + "loss": 0.0323, "step": 43280 }, { - "epoch": 0.22, - "learning_rate": 0.0002672394569423493, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.00028316791132792954, + "loss": 0.0304, "step": 43290 }, { - "epoch": 0.22, - "learning_rate": 0.0002672318892493353, - "loss": 0.0235, + "epoch": 0.11, + "learning_rate": 0.0002831640231115581, + "loss": 0.0278, "step": 43300 }, { - "epoch": 0.22, - "learning_rate": 0.00026722432155632127, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.0002831601348951866, + "loss": 0.0264, "step": 43310 }, { - "epoch": 0.22, - "learning_rate": 0.00026721675386330725, - "loss": 0.0237, + "epoch": 0.11, + "learning_rate": 0.00028315624667881514, + "loss": 0.0258, "step": 43320 }, { - "epoch": 0.22, - "learning_rate": 0.0002672091861702933, - "loss": 0.0194, + "epoch": 0.11, + "learning_rate": 0.0002831523584624437, + "loss": 0.0279, "step": 43330 }, { - "epoch": 0.22, - "learning_rate": 0.00026720161847727927, - "loss": 0.0216, + "epoch": 0.11, + "learning_rate": 0.0002831484702460722, + "loss": 0.0271, "step": 43340 }, { - "epoch": 0.22, - "learning_rate": 0.00026719405078426525, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.0002831445820297008, + "loss": 0.0225, "step": 43350 }, { - "epoch": 0.22, - "learning_rate": 0.00026718648309125123, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.0002831406938133293, + "loss": 0.0287, "step": 43360 }, { - "epoch": 0.22, - "learning_rate": 0.0002671789153982372, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.00028313680559695787, + "loss": 0.0308, "step": 43370 }, { - "epoch": 0.22, - "learning_rate": 0.0002671713477052232, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002831329173805864, + "loss": 0.0239, "step": 43380 }, { - "epoch": 0.22, - "learning_rate": 0.0002671637800122092, - "loss": 0.0223, + "epoch": 0.11, + "learning_rate": 0.0002831290291642149, + "loss": 0.0283, "step": 43390 }, { - "epoch": 0.22, - "learning_rate": 0.00026715621231919516, - "loss": 0.0216, + "epoch": 0.11, + "learning_rate": 0.0002831251409478434, + "loss": 0.025, "step": 43400 }, { - "epoch": 0.22, - "learning_rate": 0.00026714864462618114, - "loss": 0.0199, + "epoch": 0.11, + "learning_rate": 0.000283121252731472, + "loss": 0.025, "step": 43410 }, { - "epoch": 0.22, - "learning_rate": 0.0002671410769331671, - "loss": 0.0257, + "epoch": 0.11, + "learning_rate": 0.0002831173645151005, + "loss": 0.0256, "step": 43420 }, { - "epoch": 0.22, - "learning_rate": 0.00026713350924015316, - "loss": 0.0252, + "epoch": 0.11, + "learning_rate": 0.00028311347629872907, + "loss": 0.0251, "step": 43430 }, { - "epoch": 0.22, - "learning_rate": 0.00026712594154713914, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002831095880823576, + "loss": 0.0298, "step": 43440 }, { - "epoch": 0.22, - "learning_rate": 0.0002671183738541251, - "loss": 0.0199, + "epoch": 0.11, + "learning_rate": 0.0002831056998659861, + "loss": 0.0307, "step": 43450 }, { - "epoch": 0.22, - "learning_rate": 0.0002671108061611111, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.00028310181164961466, + "loss": 0.0296, "step": 43460 }, { - "epoch": 0.22, - "learning_rate": 0.0002671032384680971, - "loss": 0.0195, + "epoch": 0.11, + "learning_rate": 0.0002830979234332432, + "loss": 0.0355, "step": 43470 }, { - "epoch": 0.22, - "learning_rate": 0.00026709567077508306, - "loss": 0.0232, + "epoch": 0.11, + "learning_rate": 0.0002830940352168717, + "loss": 0.0314, "step": 43480 }, { - "epoch": 0.22, - "learning_rate": 0.00026708810308206905, - "loss": 0.0198, + "epoch": 0.11, + "learning_rate": 0.00028309014700050026, + "loss": 0.0292, "step": 43490 }, { - "epoch": 0.22, - "learning_rate": 0.0002670805353890551, - "loss": 0.0285, + "epoch": 0.11, + "learning_rate": 0.00028308625878412883, + "loss": 0.0326, "step": 43500 }, { - "epoch": 0.22, - "learning_rate": 0.00026707296769604106, - "loss": 0.0255, + "epoch": 0.11, + "learning_rate": 0.00028308237056775734, + "loss": 0.024, "step": 43510 }, { - "epoch": 0.22, - "learning_rate": 0.00026706540000302704, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.00028307848235138586, + "loss": 0.0304, "step": 43520 }, { - "epoch": 0.22, - "learning_rate": 0.000267057832310013, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.0002830745941350144, + "loss": 0.0283, "step": 43530 }, { - "epoch": 0.22, - "learning_rate": 0.000267050264616999, - "loss": 0.0227, + "epoch": 0.11, + "learning_rate": 0.00028307070591864294, + "loss": 0.0279, "step": 43540 }, { - "epoch": 0.22, - "learning_rate": 0.000267042696923985, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.00028306681770227146, + "loss": 0.0288, "step": 43550 }, { - "epoch": 0.22, - "learning_rate": 0.000267035129230971, - "loss": 0.0207, + "epoch": 0.11, + "learning_rate": 0.0002830629294859, + "loss": 0.0277, "step": 43560 }, { - "epoch": 0.22, - "learning_rate": 0.000267027561537957, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.00028305904126952854, + "loss": 0.0321, "step": 43570 }, { - "epoch": 0.22, - "learning_rate": 0.000267019993844943, - "loss": 0.0204, + "epoch": 0.11, + "learning_rate": 0.0002830551530531571, + "loss": 0.034, "step": 43580 }, { - "epoch": 0.22, - "learning_rate": 0.00026701242615192897, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.0002830512648367856, + "loss": 0.035, "step": 43590 }, { - "epoch": 0.22, - "learning_rate": 0.00026700485845891495, - "loss": 0.022, + "epoch": 0.11, + "learning_rate": 0.00028304737662041414, + "loss": 0.0304, "step": 43600 }, { - "epoch": 0.22, - "learning_rate": 0.00026699729076590093, - "loss": 0.0504, + "epoch": 0.11, + "learning_rate": 0.00028304348840404265, + "loss": 0.0259, "step": 43610 }, { - "epoch": 0.22, - "learning_rate": 0.00026698972307288697, - "loss": 0.0199, + "epoch": 0.11, + "learning_rate": 0.0002830396001876712, + "loss": 0.0285, "step": 43620 }, { - "epoch": 0.22, - "learning_rate": 0.00026698215537987295, - "loss": 0.0281, + "epoch": 0.11, + "learning_rate": 0.00028303571197129974, + "loss": 0.03, "step": 43630 }, { - "epoch": 0.22, - "learning_rate": 0.00026697458768685893, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.0002830318237549283, + "loss": 0.0308, "step": 43640 }, { - "epoch": 0.22, - "learning_rate": 0.0002669670199938449, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002830279355385568, + "loss": 0.0274, "step": 43650 }, { - "epoch": 0.22, - "learning_rate": 0.0002669594523008309, - "loss": 0.0211, + "epoch": 0.11, + "learning_rate": 0.0002830240473221854, + "loss": 0.0285, "step": 43660 }, { - "epoch": 0.22, - "learning_rate": 0.0002669518846078169, - "loss": 0.0208, + "epoch": 0.11, + "learning_rate": 0.0002830201591058139, + "loss": 0.0318, "step": 43670 }, { - "epoch": 0.22, - "learning_rate": 0.00026694431691480286, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.0002830162708894424, + "loss": 0.0249, "step": 43680 }, { - "epoch": 0.22, - "learning_rate": 0.0002669367492217889, - "loss": 0.0202, + "epoch": 0.11, + "learning_rate": 0.00028301238267307093, + "loss": 0.0261, "step": 43690 }, { - "epoch": 0.22, - "learning_rate": 0.0002669291815287749, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.0002830084944566995, + "loss": 0.0241, "step": 43700 }, { - "epoch": 0.22, - "learning_rate": 0.00026692161383576085, - "loss": 0.0259, + "epoch": 0.11, + "learning_rate": 0.00028300460624032807, + "loss": 0.0317, "step": 43710 }, { - "epoch": 0.22, - "learning_rate": 0.00026691404614274684, - "loss": 0.0252, + "epoch": 0.11, + "learning_rate": 0.0002830007180239566, + "loss": 0.035, "step": 43720 }, { - "epoch": 0.22, - "learning_rate": 0.0002669064784497328, - "loss": 0.0236, + "epoch": 0.11, + "learning_rate": 0.0002829968298075851, + "loss": 0.0293, "step": 43730 }, { - "epoch": 0.22, - "learning_rate": 0.0002668989107567188, - "loss": 0.0253, + "epoch": 0.11, + "learning_rate": 0.0002829929415912136, + "loss": 0.0277, "step": 43740 }, { - "epoch": 0.22, - "learning_rate": 0.00026689134306370483, - "loss": 0.0205, + "epoch": 0.11, + "learning_rate": 0.0002829890533748422, + "loss": 0.0304, "step": 43750 }, { - "epoch": 0.22, - "learning_rate": 0.0002668837753706908, - "loss": 0.0192, + "epoch": 0.11, + "learning_rate": 0.0002829851651584707, + "loss": 0.0278, "step": 43760 }, { - "epoch": 0.22, - "learning_rate": 0.0002668762076776768, - "loss": 0.0189, + "epoch": 0.11, + "learning_rate": 0.00028298127694209926, + "loss": 0.0293, "step": 43770 }, { - "epoch": 0.22, - "learning_rate": 0.0002668686399846628, - "loss": 0.0208, + "epoch": 0.11, + "learning_rate": 0.0002829773887257278, + "loss": 0.0331, "step": 43780 }, { - "epoch": 0.22, - "learning_rate": 0.00026686107229164876, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.00028297350050935635, + "loss": 0.0267, "step": 43790 }, { - "epoch": 0.22, - "learning_rate": 0.00026685350459863474, - "loss": 0.0204, + "epoch": 0.11, + "learning_rate": 0.00028296961229298486, + "loss": 0.0265, "step": 43800 }, { - "epoch": 0.22, - "learning_rate": 0.0002668459369056207, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.0002829657240766134, + "loss": 0.0371, "step": 43810 }, { - "epoch": 0.22, - "learning_rate": 0.00026683836921260676, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.0002829618358602419, + "loss": 0.0293, "step": 43820 }, { - "epoch": 0.22, - "learning_rate": 0.00026683080151959274, - "loss": 0.0263, + "epoch": 0.11, + "learning_rate": 0.00028295794764387046, + "loss": 0.0276, "step": 43830 }, { - "epoch": 0.22, - "learning_rate": 0.0002668232338265787, - "loss": 0.0205, + "epoch": 0.11, + "learning_rate": 0.00028295405942749903, + "loss": 0.0315, "step": 43840 }, { - "epoch": 0.22, - "learning_rate": 0.0002668156661335647, + "epoch": 0.11, + "learning_rate": 0.00028295017121112754, "loss": 0.0266, "step": 43850 }, { - "epoch": 0.22, - "learning_rate": 0.0002668080984405507, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028294628299475606, + "loss": 0.0315, "step": 43860 }, { - "epoch": 0.22, - "learning_rate": 0.00026680053074753667, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002829423947783846, + "loss": 0.0337, "step": 43870 }, { - "epoch": 0.22, - "learning_rate": 0.0002667929630545227, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.00028293850656201314, + "loss": 0.0277, "step": 43880 }, { - "epoch": 0.22, - "learning_rate": 0.0002667853953615087, - "loss": 0.0225, + "epoch": 0.11, + "learning_rate": 0.00028293461834564166, + "loss": 0.0306, "step": 43890 }, { - "epoch": 0.22, - "learning_rate": 0.00026677782766849466, - "loss": 0.0233, + "epoch": 0.11, + "learning_rate": 0.0002829307301292702, + "loss": 0.0292, "step": 43900 }, { - "epoch": 0.22, - "learning_rate": 0.00026677025997548065, - "loss": 0.0208, + "epoch": 0.11, + "learning_rate": 0.00028292684191289874, + "loss": 0.038, "step": 43910 }, { - "epoch": 0.22, - "learning_rate": 0.00026676269228246663, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.0002829229536965273, + "loss": 0.0258, "step": 43920 }, { - "epoch": 0.22, - "learning_rate": 0.0002667551245894526, - "loss": 0.0218, + "epoch": 0.11, + "learning_rate": 0.0002829190654801558, + "loss": 0.0453, "step": 43930 }, { - "epoch": 0.22, - "learning_rate": 0.00026674755689643864, - "loss": 0.02, + "epoch": 0.11, + "learning_rate": 0.00028291517726378434, + "loss": 0.0287, "step": 43940 }, { - "epoch": 0.22, - "learning_rate": 0.0002667399892034246, - "loss": 0.0161, + "epoch": 0.11, + "learning_rate": 0.00028291128904741285, + "loss": 0.0278, "step": 43950 }, { - "epoch": 0.22, - "learning_rate": 0.0002667324215104106, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.0002829074008310414, + "loss": 0.0318, "step": 43960 }, { - "epoch": 0.22, - "learning_rate": 0.0002667248538173966, - "loss": 0.0182, + "epoch": 0.11, + "learning_rate": 0.00028290351261466993, + "loss": 0.0292, "step": 43970 }, { - "epoch": 0.22, - "learning_rate": 0.00026671728612438257, - "loss": 0.0228, + "epoch": 0.11, + "learning_rate": 0.0002828996243982985, + "loss": 0.0281, "step": 43980 }, { - "epoch": 0.22, - "learning_rate": 0.00026670971843136855, - "loss": 0.0189, + "epoch": 0.11, + "learning_rate": 0.000282895736181927, + "loss": 0.0261, "step": 43990 }, { - "epoch": 0.22, - "learning_rate": 0.00026670215073835453, - "loss": 0.0206, + "epoch": 0.11, + "learning_rate": 0.0002828918479655556, + "loss": 0.03, "step": 44000 }, { - "epoch": 0.22, - "eval_cer": 0.914452788772905, - "eval_loss": 0.01625337265431881, - "eval_runtime": 117.269, - "eval_samples_per_second": 17.055, - "eval_steps_per_second": 4.264, + "epoch": 0.11, + "eval_cer": 0.8818090587301654, + "eval_loss": 0.021903708577156067, + "eval_runtime": 107.4337, + "eval_samples_per_second": 18.616, + "eval_steps_per_second": 4.654, "step": 44000 }, { - "epoch": 0.22, - "learning_rate": 0.00026669458304534057, - "loss": 0.0252, + "epoch": 0.11, + "learning_rate": 0.0002828879597491841, + "loss": 0.0297, "step": 44010 }, { - "epoch": 0.22, - "learning_rate": 0.00026668701535232655, - "loss": 0.026, + "epoch": 0.11, + "learning_rate": 0.0002828840715328126, + "loss": 0.0263, "step": 44020 }, { - "epoch": 0.22, - "learning_rate": 0.00026667944765931253, - "loss": 0.0212, + "epoch": 0.11, + "learning_rate": 0.00028288018331644113, + "loss": 0.0313, "step": 44030 }, { - "epoch": 0.22, - "learning_rate": 0.0002666718799662985, - "loss": 0.0205, + "epoch": 0.11, + "learning_rate": 0.0002828762951000697, + "loss": 0.0305, "step": 44040 }, { - "epoch": 0.22, - "learning_rate": 0.0002666643122732845, - "loss": 0.0271, + "epoch": 0.11, + "learning_rate": 0.00028287240688369827, + "loss": 0.0283, "step": 44050 }, { - "epoch": 0.22, - "learning_rate": 0.0002666567445802705, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.0002828685186673268, + "loss": 0.028, "step": 44060 }, { - "epoch": 0.22, - "learning_rate": 0.0002666491768872565, - "loss": 0.0242, + "epoch": 0.11, + "learning_rate": 0.0002828646304509553, + "loss": 0.0352, "step": 44070 }, { - "epoch": 0.22, - "learning_rate": 0.0002666416091942425, - "loss": 0.0203, + "epoch": 0.11, + "learning_rate": 0.00028286074223458387, + "loss": 0.0306, "step": 44080 }, { - "epoch": 0.22, - "learning_rate": 0.0002666340415012285, - "loss": 0.0196, + "epoch": 0.11, + "learning_rate": 0.0002828568540182124, + "loss": 0.0267, "step": 44090 }, { - "epoch": 0.22, - "learning_rate": 0.00026662647380821446, - "loss": 0.0214, + "epoch": 0.11, + "learning_rate": 0.0002828529658018409, + "loss": 0.0222, "step": 44100 }, { - "epoch": 0.22, - "learning_rate": 0.00026661890611520044, - "loss": 0.0276, + "epoch": 0.11, + "learning_rate": 0.00028284907758546946, + "loss": 0.0327, "step": 44110 }, { - "epoch": 0.22, - "learning_rate": 0.0002666113384221864, - "loss": 0.0215, + "epoch": 0.11, + "learning_rate": 0.000282845189369098, + "loss": 0.0406, "step": 44120 }, { - "epoch": 0.22, - "learning_rate": 0.00026660377072917245, - "loss": 0.0233, + "epoch": 0.11, + "learning_rate": 0.00028284130115272655, + "loss": 0.0248, "step": 44130 }, { - "epoch": 0.22, - "learning_rate": 0.00026659620303615844, - "loss": 0.0246, + "epoch": 0.11, + "learning_rate": 0.00028283741293635506, + "loss": 0.03, "step": 44140 }, { - "epoch": 0.22, - "learning_rate": 0.0002665886353431444, - "loss": 0.0191, + "epoch": 0.11, + "learning_rate": 0.0002828335247199836, + "loss": 0.0296, "step": 44150 }, { - "epoch": 0.22, - "learning_rate": 0.0002665810676501304, - "loss": 0.0241, + "epoch": 0.11, + "learning_rate": 0.00028282963650361214, + "loss": 0.0326, "step": 44160 }, { - "epoch": 0.22, - "learning_rate": 0.0002665734999571164, - "loss": 0.0196, + "epoch": 0.11, + "learning_rate": 0.00028282574828724066, + "loss": 0.0277, "step": 44170 }, { - "epoch": 0.22, - "learning_rate": 0.00026656593226410236, - "loss": 0.0297, + "epoch": 0.11, + "learning_rate": 0.0002828218600708692, + "loss": 0.0342, "step": 44180 }, { - "epoch": 0.22, - "learning_rate": 0.00026655836457108834, - "loss": 0.0272, + "epoch": 0.11, + "learning_rate": 0.00028281797185449774, + "loss": 0.0285, "step": 44190 }, { - "epoch": 0.22, - "learning_rate": 0.0002665507968780744, - "loss": 0.0298, + "epoch": 0.11, + "learning_rate": 0.00028281408363812626, + "loss": 0.0311, "step": 44200 }, { - "epoch": 0.22, - "learning_rate": 0.00026654322918506036, - "loss": 0.0241, + "epoch": 0.11, + "learning_rate": 0.0002828101954217548, + "loss": 0.0301, "step": 44210 }, { - "epoch": 0.22, - "learning_rate": 0.00026653566149204634, - "loss": 0.0249, + "epoch": 0.11, + "learning_rate": 0.00028280630720538334, + "loss": 0.0303, "step": 44220 }, { - "epoch": 0.22, - "learning_rate": 0.0002665280937990323, - "loss": 0.0265, + "epoch": 0.11, + "learning_rate": 0.00028280241898901185, + "loss": 0.0254, "step": 44230 }, { - "epoch": 0.22, - "learning_rate": 0.0002665205261060183, - "loss": 0.021, + "epoch": 0.11, + "learning_rate": 0.0002827985307726404, + "loss": 0.0236, "step": 44240 }, { - "epoch": 0.22, - "learning_rate": 0.0002665129584130043, - "loss": 0.0226, + "epoch": 0.11, + "learning_rate": 0.00028279464255626894, + "loss": 0.0321, "step": 44250 }, { - "epoch": 0.22, - "learning_rate": 0.0002665053907199903, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002827907543398975, + "loss": 0.0271, "step": 44260 }, { - "epoch": 0.22, - "learning_rate": 0.0002664978230269763, - "loss": 0.0364, + "epoch": 0.11, + "learning_rate": 0.000282786866123526, + "loss": 0.0267, "step": 44270 }, { - "epoch": 0.22, - "learning_rate": 0.0002664902553339623, - "loss": 0.0259, + "epoch": 0.11, + "learning_rate": 0.00028278297790715454, + "loss": 0.027, "step": 44280 }, { - "epoch": 0.22, - "learning_rate": 0.00026648268764094827, - "loss": 0.0238, + "epoch": 0.11, + "learning_rate": 0.0002827790896907831, + "loss": 0.0272, "step": 44290 }, { - "epoch": 0.22, - "learning_rate": 0.00026647511994793425, - "loss": 0.0234, + "epoch": 0.11, + "learning_rate": 0.0002827752014744116, + "loss": 0.0353, "step": 44300 }, { - "epoch": 0.22, - "learning_rate": 0.00026646755225492023, - "loss": 0.0217, + "epoch": 0.11, + "learning_rate": 0.00028277131325804013, + "loss": 0.0283, "step": 44310 }, { - "epoch": 0.22, - "learning_rate": 0.0002664599845619062, - "loss": 0.0233, + "epoch": 0.11, + "learning_rate": 0.0002827674250416687, + "loss": 0.0268, "step": 44320 }, { - "epoch": 0.22, - "learning_rate": 0.00026645241686889225, - "loss": 0.023, + "epoch": 0.11, + "learning_rate": 0.0002827635368252972, + "loss": 0.0412, "step": 44330 }, { - "epoch": 0.22, - "learning_rate": 0.00026644484917587823, - "loss": 0.0219, + "epoch": 0.11, + "learning_rate": 0.0002827596486089258, + "loss": 0.0309, "step": 44340 }, { - "epoch": 0.22, - "learning_rate": 0.0002664372814828642, - "loss": 0.0251, + "epoch": 0.11, + "learning_rate": 0.0002827557603925543, + "loss": 0.036, "step": 44350 }, { - "epoch": 0.22, - "learning_rate": 0.0002664297137898502, - "loss": 0.0248, + "epoch": 0.11, + "learning_rate": 0.0002827518721761828, + "loss": 0.03, "step": 44360 }, { - "epoch": 0.22, - "learning_rate": 0.00026642214609683617, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.0002827479839598114, + "loss": 0.0266, "step": 44370 }, { - "epoch": 0.22, - "learning_rate": 0.00026641457840382215, - "loss": 0.0293, + "epoch": 0.12, + "learning_rate": 0.0002827440957434399, + "loss": 0.0283, "step": 44380 }, { - "epoch": 0.22, - "learning_rate": 0.0002664070107108082, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.00028274020752706847, + "loss": 0.0257, "step": 44390 }, { - "epoch": 0.22, - "learning_rate": 0.00026639944301779417, - "loss": 0.0255, + "epoch": 0.12, + "learning_rate": 0.000282736319310697, + "loss": 0.0322, "step": 44400 }, { - "epoch": 0.22, - "learning_rate": 0.00026639187532478015, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.00028273243109432555, + "loss": 0.0314, "step": 44410 }, { - "epoch": 0.22, - "learning_rate": 0.00026638430763176613, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028272854287795406, + "loss": 0.0296, "step": 44420 }, { - "epoch": 0.22, - "learning_rate": 0.0002663767399387521, - "loss": 0.0215, + "epoch": 0.12, + "learning_rate": 0.0002827246546615826, + "loss": 0.034, "step": 44430 }, { - "epoch": 0.22, - "learning_rate": 0.0002663691722457381, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.0002827207664452111, + "loss": 0.0361, "step": 44440 }, { - "epoch": 0.22, - "learning_rate": 0.00026636160455272413, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028271687822883966, + "loss": 0.0273, "step": 44450 }, { - "epoch": 0.22, - "learning_rate": 0.0002663540368597101, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002827129900124682, + "loss": 0.0284, "step": 44460 }, { - "epoch": 0.22, - "learning_rate": 0.0002663464691666961, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.00028270910179609675, + "loss": 0.0249, "step": 44470 }, { - "epoch": 0.22, - "learning_rate": 0.0002663389014736821, - "loss": 0.0173, + "epoch": 0.12, + "learning_rate": 0.00028270521357972526, + "loss": 0.0281, "step": 44480 }, { - "epoch": 0.22, - "learning_rate": 0.00026633133378066806, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.0002827013253633538, + "loss": 0.0287, "step": 44490 }, { - "epoch": 0.22, - "learning_rate": 0.00026632376608765404, - "loss": 0.0256, + "epoch": 0.12, + "learning_rate": 0.00028269743714698234, + "loss": 0.0246, "step": 44500 }, { - "epoch": 0.22, - "learning_rate": 0.00026631619839464, - "loss": 0.0221, + "epoch": 0.12, + "learning_rate": 0.00028269354893061086, + "loss": 0.0291, "step": 44510 }, { - "epoch": 0.22, - "learning_rate": 0.00026630863070162606, - "loss": 0.0248, + "epoch": 0.12, + "learning_rate": 0.00028268966071423937, + "loss": 0.0314, "step": 44520 }, { - "epoch": 0.22, - "learning_rate": 0.00026630106300861204, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.00028268577249786794, + "loss": 0.0271, "step": 44530 }, { - "epoch": 0.22, - "learning_rate": 0.000266293495315598, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002826818842814965, + "loss": 0.0297, "step": 44540 }, { - "epoch": 0.22, - "learning_rate": 0.000266285927622584, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.000282677996065125, + "loss": 0.0317, "step": 44550 }, { - "epoch": 0.22, - "learning_rate": 0.00026627835992957, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.00028267410784875354, + "loss": 0.0274, "step": 44560 }, { - "epoch": 0.22, - "learning_rate": 0.00026627079223655596, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.00028267021963238205, + "loss": 0.031, "step": 44570 }, { - "epoch": 0.22, - "learning_rate": 0.000266263224543542, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002826663314160106, + "loss": 0.022, "step": 44580 }, { - "epoch": 0.22, - "learning_rate": 0.000266255656850528, - "loss": 0.0189, + "epoch": 0.12, + "learning_rate": 0.00028266244319963914, + "loss": 0.0351, "step": 44590 }, { - "epoch": 0.23, - "learning_rate": 0.00026624808915751396, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.0002826585549832677, + "loss": 0.031, "step": 44600 }, { - "epoch": 0.23, - "learning_rate": 0.00026624052146449994, - "loss": 0.0242, + "epoch": 0.12, + "learning_rate": 0.0002826546667668962, + "loss": 0.0264, "step": 44610 }, { - "epoch": 0.23, - "learning_rate": 0.0002662329537714859, - "loss": 0.0203, + "epoch": 0.12, + "learning_rate": 0.0002826507785505248, + "loss": 0.0335, "step": 44620 }, { - "epoch": 0.23, - "learning_rate": 0.0002662253860784719, - "loss": 0.025, + "epoch": 0.12, + "learning_rate": 0.0002826468903341533, + "loss": 0.0289, "step": 44630 }, { - "epoch": 0.23, - "learning_rate": 0.0002662178183854579, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002826430021177818, + "loss": 0.0288, "step": 44640 }, { - "epoch": 0.23, - "learning_rate": 0.00026621025069244387, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.00028263911390141033, + "loss": 0.0301, "step": 44650 }, { - "epoch": 0.23, - "learning_rate": 0.00026620268299942985, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002826352256850389, + "loss": 0.0327, "step": 44660 }, { - "epoch": 0.23, - "learning_rate": 0.00026619511530641583, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.0002826313374686674, + "loss": 0.0264, "step": 44670 }, { - "epoch": 0.23, - "learning_rate": 0.00026618754761340187, - "loss": 0.0193, + "epoch": 0.12, + "learning_rate": 0.000282627449252296, + "loss": 0.0274, "step": 44680 }, { - "epoch": 0.23, - "learning_rate": 0.00026617997992038785, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.0002826235610359245, + "loss": 0.0264, "step": 44690 }, { - "epoch": 0.23, - "learning_rate": 0.00026617241222737383, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.000282619672819553, + "loss": 0.031, "step": 44700 }, { - "epoch": 0.23, - "learning_rate": 0.0002661648445343598, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002826157846031816, + "loss": 0.0238, "step": 44710 }, { - "epoch": 0.23, - "learning_rate": 0.0002661572768413458, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002826118963868101, + "loss": 0.0283, "step": 44720 }, { - "epoch": 0.23, - "learning_rate": 0.0002661497091483318, - "loss": 0.0232, + "epoch": 0.12, + "learning_rate": 0.0002826080081704386, + "loss": 0.0308, "step": 44730 }, { - "epoch": 0.23, - "learning_rate": 0.00026614214145531776, - "loss": 0.0252, + "epoch": 0.12, + "learning_rate": 0.0002826041199540672, + "loss": 0.0235, "step": 44740 }, { - "epoch": 0.23, - "learning_rate": 0.0002661345737623038, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028260023173769575, + "loss": 0.0365, "step": 44750 }, { - "epoch": 0.23, - "learning_rate": 0.0002661270060692898, - "loss": 0.0239, + "epoch": 0.12, + "learning_rate": 0.00028259634352132426, + "loss": 0.0329, "step": 44760 }, { - "epoch": 0.23, - "learning_rate": 0.00026611943837627575, - "loss": 0.0185, + "epoch": 0.12, + "learning_rate": 0.0002825924553049528, + "loss": 0.0331, "step": 44770 }, { - "epoch": 0.23, - "learning_rate": 0.00026611187068326174, - "loss": 0.0217, + "epoch": 0.12, + "learning_rate": 0.0002825885670885813, + "loss": 0.0272, "step": 44780 }, { - "epoch": 0.23, - "learning_rate": 0.0002661043029902477, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.00028258467887220986, + "loss": 0.0353, "step": 44790 }, { - "epoch": 0.23, - "learning_rate": 0.0002660967352972337, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.0002825807906558384, + "loss": 0.0306, "step": 44800 }, { - "epoch": 0.23, - "learning_rate": 0.00026608916760421973, + "epoch": 0.12, + "learning_rate": 0.00028257690243946694, "loss": 0.0278, "step": 44810 }, { - "epoch": 0.23, - "learning_rate": 0.0002660815999112057, - "loss": 0.0196, + "epoch": 0.12, + "learning_rate": 0.00028257301422309546, + "loss": 0.0354, "step": 44820 }, { - "epoch": 0.23, - "learning_rate": 0.0002660740322181917, - "loss": 0.0175, + "epoch": 0.12, + "learning_rate": 0.00028256912600672403, + "loss": 0.0241, "step": 44830 }, { - "epoch": 0.23, - "learning_rate": 0.0002660664645251777, - "loss": 0.0179, + "epoch": 0.12, + "learning_rate": 0.00028256523779035254, + "loss": 0.0307, "step": 44840 }, { - "epoch": 0.23, - "learning_rate": 0.00026605889683216366, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.00028256134957398106, + "loss": 0.0252, "step": 44850 }, { - "epoch": 0.23, - "learning_rate": 0.00026605132913914964, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.00028255746135760957, + "loss": 0.0263, "step": 44860 }, { - "epoch": 0.23, - "learning_rate": 0.0002660437614461356, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028255357314123814, + "loss": 0.0267, "step": 44870 }, { - "epoch": 0.23, - "learning_rate": 0.00026603619375312166, - "loss": 0.0186, + "epoch": 0.12, + "learning_rate": 0.00028254968492486665, + "loss": 0.0255, "step": 44880 }, { - "epoch": 0.23, - "learning_rate": 0.00026602862606010764, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.0002825457967084952, + "loss": 0.0259, "step": 44890 }, { - "epoch": 0.23, - "learning_rate": 0.0002660210583670936, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.00028254190849212374, + "loss": 0.0291, "step": 44900 }, { - "epoch": 0.23, - "learning_rate": 0.0002660134906740796, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028253802027575225, + "loss": 0.0322, "step": 44910 }, { - "epoch": 0.23, - "learning_rate": 0.0002660059229810656, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002825341320593808, + "loss": 0.0335, "step": 44920 }, { - "epoch": 0.23, - "learning_rate": 0.00026599835528805157, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028253024384300934, + "loss": 0.0328, "step": 44930 }, { - "epoch": 0.23, - "learning_rate": 0.0002659907875950376, - "loss": 0.02, + "epoch": 0.12, + "learning_rate": 0.0002825263556266379, + "loss": 0.0301, "step": 44940 }, { - "epoch": 0.23, - "learning_rate": 0.0002659832199020236, - "loss": 0.0213, + "epoch": 0.12, + "learning_rate": 0.0002825224674102664, + "loss": 0.0332, "step": 44950 }, { - "epoch": 0.23, - "learning_rate": 0.00026597565220900956, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.000282518579193895, + "loss": 0.0337, "step": 44960 }, { - "epoch": 0.23, - "learning_rate": 0.00026596808451599555, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002825146909775235, + "loss": 0.0315, "step": 44970 }, { - "epoch": 0.23, - "learning_rate": 0.00026596051682298153, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.000282510802761152, + "loss": 0.0344, "step": 44980 }, { - "epoch": 0.23, - "learning_rate": 0.0002659529491299675, - "loss": 0.0202, + "epoch": 0.12, + "learning_rate": 0.00028250691454478053, + "loss": 0.0285, "step": 44990 }, { - "epoch": 0.23, - "learning_rate": 0.00026594538143695354, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.0002825030263284091, + "loss": 0.0283, "step": 45000 }, { - "epoch": 0.23, - "eval_cer": 0.9144896638256703, - "eval_loss": 0.016492534428834915, - "eval_runtime": 117.0086, - "eval_samples_per_second": 17.093, - "eval_steps_per_second": 4.273, + "epoch": 0.12, + "eval_cer": 0.8818104583670996, + "eval_loss": 0.022675270214676857, + "eval_runtime": 107.7182, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, "step": 45000 }, { - "epoch": 0.23, - "learning_rate": 0.0002659378137439395, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002824991381120376, + "loss": 0.0301, "step": 45010 }, { - "epoch": 0.23, - "learning_rate": 0.0002659302460509255, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002824952498956662, + "loss": 0.0281, "step": 45020 }, { - "epoch": 0.23, - "learning_rate": 0.0002659226783579115, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.0002824913616792947, + "loss": 0.0262, "step": 45030 }, { - "epoch": 0.23, - "learning_rate": 0.00026591511066489747, - "loss": 0.0202, + "epoch": 0.12, + "learning_rate": 0.00028248747346292327, + "loss": 0.0351, "step": 45040 }, { - "epoch": 0.23, - "learning_rate": 0.00026590754297188345, - "loss": 0.0213, + "epoch": 0.12, + "learning_rate": 0.0002824835852465518, + "loss": 0.0307, "step": 45050 }, { - "epoch": 0.23, - "learning_rate": 0.00026589997527886943, - "loss": 0.019, + "epoch": 0.12, + "learning_rate": 0.0002824796970301803, + "loss": 0.0333, "step": 45060 }, { - "epoch": 0.23, - "learning_rate": 0.00026589240758585547, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002824758088138088, + "loss": 0.0274, "step": 45070 }, { - "epoch": 0.23, - "learning_rate": 0.00026588483989284145, - "loss": 0.0309, + "epoch": 0.12, + "learning_rate": 0.0002824719205974374, + "loss": 0.0271, "step": 45080 }, { - "epoch": 0.23, - "learning_rate": 0.00026587727219982743, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.00028246803238106595, + "loss": 0.0355, "step": 45090 }, { - "epoch": 0.23, - "learning_rate": 0.0002658697045068134, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.00028246414416469446, + "loss": 0.0275, "step": 45100 }, { - "epoch": 0.23, - "learning_rate": 0.0002658621368137994, - "loss": 0.0203, + "epoch": 0.12, + "learning_rate": 0.000282460255948323, + "loss": 0.0341, "step": 45110 }, { - "epoch": 0.23, - "learning_rate": 0.0002658545691207854, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028245636773195155, + "loss": 0.0319, "step": 45120 }, { - "epoch": 0.23, - "learning_rate": 0.0002658470014277714, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.00028245247951558006, + "loss": 0.0303, "step": 45130 }, { - "epoch": 0.23, - "learning_rate": 0.0002658394337347574, - "loss": 0.0204, + "epoch": 0.12, + "learning_rate": 0.0002824485912992086, + "loss": 0.0306, "step": 45140 }, { - "epoch": 0.23, - "learning_rate": 0.0002658318660417434, - "loss": 0.0221, + "epoch": 0.12, + "learning_rate": 0.00028244470308283714, + "loss": 0.0303, "step": 45150 }, { - "epoch": 0.23, - "learning_rate": 0.00026582429834872936, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.00028244081486646566, + "loss": 0.0303, "step": 45160 }, { - "epoch": 0.23, - "learning_rate": 0.00026581673065571534, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002824369266500942, + "loss": 0.0304, "step": 45170 }, { - "epoch": 0.23, - "learning_rate": 0.0002658091629627013, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.00028243303843372274, + "loss": 0.0306, "step": 45180 }, { - "epoch": 0.23, - "learning_rate": 0.00026580159526968735, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.00028242915021735126, + "loss": 0.0296, "step": 45190 }, { - "epoch": 0.23, - "learning_rate": 0.00026579402757667334, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.00028242526200097977, + "loss": 0.0291, "step": 45200 }, { - "epoch": 0.23, - "learning_rate": 0.0002657864598836593, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028242137378460834, + "loss": 0.0305, "step": 45210 }, { - "epoch": 0.23, - "learning_rate": 0.0002657788921906453, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.00028241748556823685, + "loss": 0.0361, "step": 45220 }, { - "epoch": 0.23, - "learning_rate": 0.0002657713244976313, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002824135973518654, + "loss": 0.032, "step": 45230 }, { - "epoch": 0.23, - "learning_rate": 0.00026576375680461726, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028240970913549394, + "loss": 0.0316, "step": 45240 }, { - "epoch": 0.23, - "learning_rate": 0.00026575618911160324, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.0002824058209191225, + "loss": 0.0272, "step": 45250 }, { - "epoch": 0.23, - "learning_rate": 0.0002657486214185893, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.000282401932702751, + "loss": 0.0317, "step": 45260 }, { - "epoch": 0.23, - "learning_rate": 0.00026574105372557526, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.00028239804448637953, + "loss": 0.0307, "step": 45270 }, { - "epoch": 0.23, - "learning_rate": 0.00026573348603256124, - "loss": 0.0253, + "epoch": 0.12, + "learning_rate": 0.00028239415627000805, + "loss": 0.0262, "step": 45280 }, { - "epoch": 0.23, - "learning_rate": 0.0002657259183395472, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002823902680536366, + "loss": 0.0356, "step": 45290 }, { - "epoch": 0.23, - "learning_rate": 0.0002657183506465332, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002823863798372652, + "loss": 0.0297, "step": 45300 }, { - "epoch": 0.23, - "learning_rate": 0.0002657107829535192, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002823824916208937, + "loss": 0.0297, "step": 45310 }, { - "epoch": 0.23, - "learning_rate": 0.0002657032152605052, - "loss": 0.0265, + "epoch": 0.12, + "learning_rate": 0.0002823786034045222, + "loss": 0.032, "step": 45320 }, { - "epoch": 0.23, - "learning_rate": 0.0002656956475674912, - "loss": 0.0194, + "epoch": 0.12, + "learning_rate": 0.0002823747151881508, + "loss": 0.0413, "step": 45330 }, { - "epoch": 0.23, - "learning_rate": 0.0002656880798744772, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.0002823708269717793, + "loss": 0.0324, "step": 45340 }, { - "epoch": 0.23, - "learning_rate": 0.00026568051218146317, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.0002823669387554078, + "loss": 0.0331, "step": 45350 }, { - "epoch": 0.23, - "learning_rate": 0.00026567294448844915, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002823630505390364, + "loss": 0.0358, "step": 45360 }, { - "epoch": 0.23, - "learning_rate": 0.00026566537679543513, - "loss": 0.0268, - "step": 45370 + "epoch": 0.12, + "learning_rate": 0.0002823591623226649, + "loss": 0.027, + "step": 45370 }, { - "epoch": 0.23, - "learning_rate": 0.0002656578091024211, - "loss": 0.0272, + "epoch": 0.12, + "learning_rate": 0.00028235527410629347, + "loss": 0.027, "step": 45380 }, { - "epoch": 0.23, - "learning_rate": 0.00026565024140940715, - "loss": 0.021, + "epoch": 0.12, + "learning_rate": 0.000282351385889922, + "loss": 0.032, "step": 45390 }, { - "epoch": 0.23, - "learning_rate": 0.00026564267371639313, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002823474976735505, + "loss": 0.0284, "step": 45400 }, { - "epoch": 0.23, - "learning_rate": 0.0002656351060233791, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.000282343609457179, + "loss": 0.032, "step": 45410 }, { - "epoch": 0.23, - "learning_rate": 0.0002656275383303651, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.0002823397212408076, + "loss": 0.0277, "step": 45420 }, { - "epoch": 0.23, - "learning_rate": 0.00026561997063735107, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.00028233583302443615, + "loss": 0.0298, "step": 45430 }, { - "epoch": 0.23, - "learning_rate": 0.00026561240294433705, - "loss": 0.0266, + "epoch": 0.12, + "learning_rate": 0.00028233194480806466, + "loss": 0.0326, "step": 45440 }, { - "epoch": 0.23, - "learning_rate": 0.0002656048352513231, - "loss": 0.0282, + "epoch": 0.12, + "learning_rate": 0.0002823280565916932, + "loss": 0.0313, "step": 45450 }, { - "epoch": 0.23, - "learning_rate": 0.00026559726755830907, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.00028232416837532174, + "loss": 0.0301, "step": 45460 }, { - "epoch": 0.23, - "learning_rate": 0.00026558969986529505, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.00028232028015895026, + "loss": 0.034, "step": 45470 }, { - "epoch": 0.23, - "learning_rate": 0.00026558213217228103, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.0002823163919425788, + "loss": 0.027, "step": 45480 }, { - "epoch": 0.23, - "learning_rate": 0.000265574564479267, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.00028231250372620734, + "loss": 0.0292, "step": 45490 }, { - "epoch": 0.23, - "learning_rate": 0.000265566996786253, - "loss": 0.0232, + "epoch": 0.12, + "learning_rate": 0.00028230861550983586, + "loss": 0.0306, "step": 45500 }, { - "epoch": 0.23, - "learning_rate": 0.00026555942909323903, - "loss": 0.0253, + "epoch": 0.12, + "learning_rate": 0.0002823047272934644, + "loss": 0.0268, "step": 45510 }, { - "epoch": 0.23, - "learning_rate": 0.000265551861400225, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.00028230083907709294, + "loss": 0.0359, "step": 45520 }, { - "epoch": 0.23, - "learning_rate": 0.000265544293707211, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.00028229695086072145, + "loss": 0.0326, "step": 45530 }, { - "epoch": 0.23, - "learning_rate": 0.000265536726014197, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.00028229306264435, + "loss": 0.0294, "step": 45540 }, { - "epoch": 0.23, - "learning_rate": 0.00026552915832118296, - "loss": 0.0195, + "epoch": 0.12, + "learning_rate": 0.00028228917442797854, + "loss": 0.0288, "step": 45550 }, { - "epoch": 0.23, - "learning_rate": 0.00026552159062816894, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028228528621160705, + "loss": 0.03, "step": 45560 }, { - "epoch": 0.23, - "learning_rate": 0.0002655140229351549, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002822813979952356, + "loss": 0.0289, "step": 45570 }, { - "epoch": 0.23, - "learning_rate": 0.00026550645524214096, - "loss": 0.0243, + "epoch": 0.12, + "learning_rate": 0.0002822775097788642, + "loss": 0.0303, "step": 45580 }, { - "epoch": 0.23, - "learning_rate": 0.00026549888754912694, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002822736215624927, + "loss": 0.0327, "step": 45590 }, { - "epoch": 0.23, - "learning_rate": 0.0002654913198561129, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.0002822697333461212, + "loss": 0.0327, "step": 45600 }, { - "epoch": 0.23, - "learning_rate": 0.0002654837521630989, - "loss": 0.0198, + "epoch": 0.12, + "learning_rate": 0.00028226584512974973, + "loss": 0.0294, "step": 45610 }, { - "epoch": 0.23, - "learning_rate": 0.0002654761844700849, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002822619569133783, + "loss": 0.0287, "step": 45620 }, { - "epoch": 0.23, - "learning_rate": 0.00026546861677707086, - "loss": 0.0186, + "epoch": 0.12, + "learning_rate": 0.0002822580686970068, + "loss": 0.0318, "step": 45630 }, { - "epoch": 0.23, - "learning_rate": 0.0002654610490840569, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.0002822541804806354, + "loss": 0.032, "step": 45640 }, { - "epoch": 0.23, - "learning_rate": 0.0002654534813910429, - "loss": 0.0279, + "epoch": 0.12, + "learning_rate": 0.0002822502922642639, + "loss": 0.0259, "step": 45650 }, { - "epoch": 0.23, - "learning_rate": 0.00026544591369802886, - "loss": 0.0211, + "epoch": 0.12, + "learning_rate": 0.0002822464040478924, + "loss": 0.0351, "step": 45660 }, { - "epoch": 0.23, - "learning_rate": 0.00026543834600501484, - "loss": 0.019, + "epoch": 0.12, + "learning_rate": 0.000282242515831521, + "loss": 0.0298, "step": 45670 }, { - "epoch": 0.23, - "learning_rate": 0.0002654307783120008, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.0002822386276151495, + "loss": 0.0294, "step": 45680 }, { - "epoch": 0.23, - "learning_rate": 0.0002654232106189868, - "loss": 0.0187, + "epoch": 0.12, + "learning_rate": 0.000282234739398778, + "loss": 0.0252, "step": 45690 }, { - "epoch": 0.23, - "learning_rate": 0.00026541564292597284, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.0002822308511824066, + "loss": 0.03, "step": 45700 }, { - "epoch": 0.23, - "learning_rate": 0.0002654080752329588, - "loss": 0.0282, + "epoch": 0.12, + "learning_rate": 0.0002822269629660351, + "loss": 0.0287, "step": 45710 }, { - "epoch": 0.23, - "learning_rate": 0.0002654005075399448, - "loss": 0.0182, + "epoch": 0.12, + "learning_rate": 0.00028222307474966366, + "loss": 0.0287, "step": 45720 }, { - "epoch": 0.23, - "learning_rate": 0.0002653929398469308, - "loss": 0.0236, + "epoch": 0.12, + "learning_rate": 0.0002822191865332922, + "loss": 0.0261, "step": 45730 }, { - "epoch": 0.23, - "learning_rate": 0.00026538537215391677, - "loss": 0.0195, + "epoch": 0.12, + "learning_rate": 0.0002822152983169207, + "loss": 0.0248, "step": 45740 }, { - "epoch": 0.23, - "learning_rate": 0.00026537780446090275, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.00028221141010054926, + "loss": 0.0268, "step": 45750 }, { - "epoch": 0.23, - "learning_rate": 0.00026537023676788873, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.0002822075218841778, + "loss": 0.0305, "step": 45760 }, { - "epoch": 0.23, - "learning_rate": 0.00026536266907487477, - "loss": 0.0218, + "epoch": 0.12, + "learning_rate": 0.0002822036336678063, + "loss": 0.0302, "step": 45770 }, { - "epoch": 0.23, - "learning_rate": 0.00026535510138186075, - "loss": 0.0249, + "epoch": 0.12, + "learning_rate": 0.00028219974545143486, + "loss": 0.0481, "step": 45780 }, { - "epoch": 0.23, - "learning_rate": 0.00026534753368884673, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028219585723506343, + "loss": 0.0333, "step": 45790 }, { - "epoch": 0.23, - "learning_rate": 0.0002653399659958327, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028219196901869194, + "loss": 0.0333, "step": 45800 }, { - "epoch": 0.23, - "learning_rate": 0.0002653323983028187, - "loss": 0.0184, + "epoch": 0.12, + "learning_rate": 0.00028218808080232046, + "loss": 0.0279, "step": 45810 }, { - "epoch": 0.23, - "learning_rate": 0.0002653248306098047, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.00028218419258594897, + "loss": 0.0329, "step": 45820 }, { - "epoch": 0.23, - "learning_rate": 0.0002653172629167907, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.00028218030436957754, + "loss": 0.0272, "step": 45830 }, { - "epoch": 0.23, - "learning_rate": 0.0002653096952237767, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028217641615320606, + "loss": 0.0295, "step": 45840 }, { - "epoch": 0.23, - "learning_rate": 0.00026530212753076267, - "loss": 0.0254, + "epoch": 0.12, + "learning_rate": 0.0002821725279368346, + "loss": 0.0339, "step": 45850 }, { - "epoch": 0.23, - "learning_rate": 0.00026529455983774865, - "loss": 0.0221, + "epoch": 0.12, + "learning_rate": 0.00028216863972046314, + "loss": 0.0275, "step": 45860 }, { - "epoch": 0.23, - "learning_rate": 0.00026528699214473463, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.0002821647515040917, + "loss": 0.0287, "step": 45870 }, { - "epoch": 0.23, - "learning_rate": 0.0002652794244517206, - "loss": 0.0242, + "epoch": 0.12, + "learning_rate": 0.0002821608632877202, + "loss": 0.0248, "step": 45880 }, { - "epoch": 0.23, - "learning_rate": 0.0002652718567587066, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.00028215697507134874, + "loss": 0.0258, "step": 45890 }, { - "epoch": 0.23, - "learning_rate": 0.0002652642890656926, - "loss": 0.0223, + "epoch": 0.12, + "learning_rate": 0.00028215308685497725, + "loss": 0.0278, "step": 45900 }, { - "epoch": 0.23, - "learning_rate": 0.00026525672137267856, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002821491986386058, + "loss": 0.0287, "step": 45910 }, { - "epoch": 0.23, - "learning_rate": 0.00026524915367966454, - "loss": 0.0258, + "epoch": 0.12, + "learning_rate": 0.00028214531042223433, + "loss": 0.0326, "step": 45920 }, { - "epoch": 0.23, - "learning_rate": 0.0002652415859866506, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002821414222058629, + "loss": 0.0274, "step": 45930 }, { - "epoch": 0.23, - "learning_rate": 0.00026523401829363656, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002821375339894914, + "loss": 0.0359, "step": 45940 }, { - "epoch": 0.23, - "learning_rate": 0.00026522645060062254, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.00028213364577311993, + "loss": 0.0237, "step": 45950 }, { - "epoch": 0.23, - "learning_rate": 0.0002652188829076085, - "loss": 0.0182, + "epoch": 0.12, + "learning_rate": 0.0002821297575567485, + "loss": 0.0273, "step": 45960 }, { - "epoch": 0.23, - "learning_rate": 0.0002652113152145945, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.000282125869340377, + "loss": 0.0334, "step": 45970 }, { - "epoch": 0.23, - "learning_rate": 0.0002652037475215805, - "loss": 0.0192, + "epoch": 0.12, + "learning_rate": 0.0002821219811240056, + "loss": 0.0267, "step": 45980 }, { - "epoch": 0.23, - "learning_rate": 0.00026519617982856647, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002821180929076341, + "loss": 0.0267, "step": 45990 }, { - "epoch": 0.23, - "learning_rate": 0.0002651886121355525, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028211420469126267, + "loss": 0.0273, "step": 46000 }, { - "epoch": 0.23, - "eval_cer": 0.9144877230334195, - "eval_loss": 0.016304470598697662, - "eval_runtime": 117.0909, - "eval_samples_per_second": 17.081, - "eval_steps_per_second": 4.27, + "epoch": 0.12, + "eval_cer": 0.8817810659914818, + "eval_loss": 0.020111197605729103, + "eval_runtime": 107.811, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, "step": 46000 }, { - "epoch": 0.23, - "learning_rate": 0.0002651810444425385, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002821103164748912, + "loss": 0.0337, "step": 46010 }, { - "epoch": 0.23, - "learning_rate": 0.00026517347674952447, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002821064282585197, + "loss": 0.0304, "step": 46020 }, { - "epoch": 0.23, - "learning_rate": 0.00026516590905651045, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002821025400421482, + "loss": 0.0265, "step": 46030 }, { - "epoch": 0.23, - "learning_rate": 0.00026515834136349643, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002820986518257768, + "loss": 0.0301, "step": 46040 }, { - "epoch": 0.23, - "learning_rate": 0.0002651507736704824, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002820947636094053, + "loss": 0.0251, "step": 46050 }, { - "epoch": 0.23, - "learning_rate": 0.00026514320597746845, - "loss": 0.0197, + "epoch": 0.12, + "learning_rate": 0.00028209087539303386, + "loss": 0.0269, "step": 46060 }, { - "epoch": 0.23, - "learning_rate": 0.0002651356382844544, - "loss": 0.0191, + "epoch": 0.12, + "learning_rate": 0.0002820869871766624, + "loss": 0.0322, "step": 46070 }, { - "epoch": 0.23, - "learning_rate": 0.0002651280705914404, - "loss": 0.0204, + "epoch": 0.12, + "learning_rate": 0.00028208309896029095, + "loss": 0.0335, "step": 46080 }, { - "epoch": 0.23, - "learning_rate": 0.0002651205028984264, - "loss": 0.0198, + "epoch": 0.12, + "learning_rate": 0.00028207921074391946, + "loss": 0.0328, "step": 46090 }, { - "epoch": 0.23, - "learning_rate": 0.00026511293520541237, - "loss": 0.0197, + "epoch": 0.12, + "learning_rate": 0.000282075322527548, + "loss": 0.028, "step": 46100 }, { - "epoch": 0.23, - "learning_rate": 0.00026510536751239835, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.0002820714343111765, + "loss": 0.0333, "step": 46110 }, { - "epoch": 0.23, - "learning_rate": 0.00026509779981938433, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028206754609480506, + "loss": 0.0302, "step": 46120 }, { - "epoch": 0.23, - "learning_rate": 0.00026509023212637037, - "loss": 0.0263, + "epoch": 0.12, + "learning_rate": 0.00028206365787843363, + "loss": 0.0294, "step": 46130 }, { - "epoch": 0.23, - "learning_rate": 0.00026508266443335635, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028205976966206214, + "loss": 0.0319, "step": 46140 }, { - "epoch": 0.23, - "learning_rate": 0.00026507509674034233, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.00028205588144569066, + "loss": 0.0258, "step": 46150 }, { - "epoch": 0.23, - "learning_rate": 0.0002650675290473283, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.00028205199322931917, + "loss": 0.0267, "step": 46160 }, { - "epoch": 0.23, - "learning_rate": 0.0002650599613543143, - "loss": 0.0249, + "epoch": 0.12, + "learning_rate": 0.00028204810501294774, + "loss": 0.0381, "step": 46170 }, { - "epoch": 0.23, - "learning_rate": 0.0002650523936613003, - "loss": 0.0269, + "epoch": 0.12, + "learning_rate": 0.00028204421679657625, + "loss": 0.0276, "step": 46180 }, { - "epoch": 0.23, - "learning_rate": 0.0002650448259682863, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.0002820403285802048, + "loss": 0.0291, "step": 46190 }, { - "epoch": 0.23, - "learning_rate": 0.0002650372582752723, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028203644036383334, + "loss": 0.0263, "step": 46200 }, { - "epoch": 0.23, - "learning_rate": 0.0002650296905822583, - "loss": 0.0305, + "epoch": 0.12, + "learning_rate": 0.0002820325521474619, + "loss": 0.0387, "step": 46210 }, { - "epoch": 0.23, - "learning_rate": 0.00026502212288924426, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002820286639310904, + "loss": 0.0258, "step": 46220 }, { - "epoch": 0.23, - "learning_rate": 0.00026501455519623024, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.00028202477571471894, + "loss": 0.0281, "step": 46230 }, { - "epoch": 0.23, - "learning_rate": 0.0002650069875032162, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.00028202088749834745, + "loss": 0.0356, "step": 46240 }, { - "epoch": 0.23, - "learning_rate": 0.00026499941981020226, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.000282016999281976, + "loss": 0.0301, "step": 46250 }, { - "epoch": 0.23, - "learning_rate": 0.00026499185211718824, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028201311106560453, + "loss": 0.0267, "step": 46260 }, { - "epoch": 0.23, - "learning_rate": 0.0002649842844241742, - "loss": 0.0191, + "epoch": 0.12, + "learning_rate": 0.0002820092228492331, + "loss": 0.0322, "step": 46270 }, { - "epoch": 0.23, - "learning_rate": 0.0002649767167311602, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.0002820053346328616, + "loss": 0.0226, "step": 46280 }, { - "epoch": 0.23, - "learning_rate": 0.0002649691490381462, - "loss": 0.0187, + "epoch": 0.12, + "learning_rate": 0.0002820014464164902, + "loss": 0.0276, "step": 46290 }, { - "epoch": 0.23, - "learning_rate": 0.00026496158134513216, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.0002819975582001187, + "loss": 0.0239, "step": 46300 }, { - "epoch": 0.23, - "learning_rate": 0.00026495401365211814, - "loss": 0.0185, + "epoch": 0.12, + "learning_rate": 0.0002819936699837472, + "loss": 0.0373, "step": 46310 }, { - "epoch": 0.23, - "learning_rate": 0.0002649464459591042, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028198978176737573, + "loss": 0.0328, "step": 46320 }, { - "epoch": 0.23, - "learning_rate": 0.00026493887826609016, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002819858935510043, + "loss": 0.029, "step": 46330 }, { - "epoch": 0.23, - "learning_rate": 0.00026493131057307614, - "loss": 0.0189, + "epoch": 0.12, + "learning_rate": 0.00028198200533463287, + "loss": 0.0305, "step": 46340 }, { - "epoch": 0.23, - "learning_rate": 0.0002649237428800621, - "loss": 0.0188, + "epoch": 0.12, + "learning_rate": 0.0002819781171182614, + "loss": 0.0274, "step": 46350 }, { - "epoch": 0.23, - "learning_rate": 0.0002649161751870481, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.0002819742289018899, + "loss": 0.0275, "step": 46360 }, { - "epoch": 0.23, - "learning_rate": 0.0002649086074940341, - "loss": 0.0203, + "epoch": 0.12, + "learning_rate": 0.00028197034068551846, + "loss": 0.0285, "step": 46370 }, { - "epoch": 0.23, - "learning_rate": 0.0002649010398010201, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.000281966452469147, + "loss": 0.0266, "step": 46380 }, { - "epoch": 0.23, - "learning_rate": 0.0002648934721080061, - "loss": 0.0184, + "epoch": 0.12, + "learning_rate": 0.0002819625642527755, + "loss": 0.0407, "step": 46390 }, { - "epoch": 0.23, - "learning_rate": 0.0002648859044149921, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.00028195867603640406, + "loss": 0.0296, "step": 46400 }, { - "epoch": 0.23, - "learning_rate": 0.00026487833672197807, - "loss": 0.0194, + "epoch": 0.12, + "learning_rate": 0.0002819547878200326, + "loss": 0.0303, "step": 46410 }, { - "epoch": 0.23, - "learning_rate": 0.00026487076902896405, - "loss": 0.0244, + "epoch": 0.12, + "learning_rate": 0.00028195089960366115, + "loss": 0.0289, "step": 46420 }, { - "epoch": 0.23, - "learning_rate": 0.00026486320133595003, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.00028194701138728966, + "loss": 0.0238, "step": 46430 }, { - "epoch": 0.23, - "learning_rate": 0.00026485563364293607, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.0002819431231709182, + "loss": 0.0265, "step": 46440 }, { - "epoch": 0.23, - "learning_rate": 0.00026484806594992205, - "loss": 0.0217, + "epoch": 0.12, + "learning_rate": 0.0002819392349545467, + "loss": 0.0262, "step": 46450 }, { - "epoch": 0.23, - "learning_rate": 0.00026484049825690803, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.00028193534673817526, + "loss": 0.0257, "step": 46460 }, { - "epoch": 0.23, - "learning_rate": 0.000264832930563894, - "loss": 0.0162, + "epoch": 0.12, + "learning_rate": 0.00028193145852180377, + "loss": 0.0289, "step": 46470 }, { - "epoch": 0.23, - "learning_rate": 0.00026482536287088, - "loss": 0.0231, + "epoch": 0.12, + "learning_rate": 0.00028192757030543234, + "loss": 0.0309, "step": 46480 }, { - "epoch": 0.23, - "learning_rate": 0.00026481779517786597, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028192368208906086, + "loss": 0.0263, "step": 46490 }, { - "epoch": 0.23, - "learning_rate": 0.00026481022748485195, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002819197938726894, + "loss": 0.0262, "step": 46500 }, { - "epoch": 0.23, - "learning_rate": 0.000264802659791838, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.00028191590565631794, + "loss": 0.0211, "step": 46510 }, { - "epoch": 0.23, - "learning_rate": 0.00026479509209882397, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.00028191201743994645, + "loss": 0.0271, "step": 46520 }, { - "epoch": 0.23, - "learning_rate": 0.00026478752440580995, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.000281908129223575, + "loss": 0.0327, "step": 46530 }, { - "epoch": 0.23, - "learning_rate": 0.00026477995671279593, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028190424100720354, + "loss": 0.029, "step": 46540 }, { - "epoch": 0.23, - "learning_rate": 0.0002647723890197819, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.0002819003527908321, + "loss": 0.0336, "step": 46550 }, { - "epoch": 0.23, - "learning_rate": 0.0002647648213267679, - "loss": 0.0276, + "epoch": 0.12, + "learning_rate": 0.0002818964645744606, + "loss": 0.0295, "step": 46560 }, { - "epoch": 0.23, - "learning_rate": 0.00026475725363375393, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.00028189257635808913, + "loss": 0.0346, "step": 46570 }, { - "epoch": 0.24, - "learning_rate": 0.0002647496859407399, - "loss": 0.0196, + "epoch": 0.12, + "learning_rate": 0.0002818886881417177, + "loss": 0.0261, "step": 46580 }, { - "epoch": 0.24, - "learning_rate": 0.0002647421182477259, - "loss": 0.0196, + "epoch": 0.12, + "learning_rate": 0.0002818847999253462, + "loss": 0.0323, "step": 46590 }, { - "epoch": 0.24, - "learning_rate": 0.0002647345505547119, - "loss": 0.0203, + "epoch": 0.12, + "learning_rate": 0.00028188091170897473, + "loss": 0.0311, "step": 46600 }, { - "epoch": 0.24, - "learning_rate": 0.00026472698286169786, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002818770234926033, + "loss": 0.03, "step": 46610 }, { - "epoch": 0.24, - "learning_rate": 0.00026471941516868384, - "loss": 0.0217, + "epoch": 0.12, + "learning_rate": 0.00028187313527623187, + "loss": 0.0279, "step": 46620 }, { - "epoch": 0.24, - "learning_rate": 0.0002647118474756698, - "loss": 0.0185, + "epoch": 0.12, + "learning_rate": 0.0002818692470598604, + "loss": 0.0281, "step": 46630 }, { - "epoch": 0.24, - "learning_rate": 0.00026470427978265586, - "loss": 0.0215, + "epoch": 0.12, + "learning_rate": 0.0002818653588434889, + "loss": 0.0268, "step": 46640 }, { - "epoch": 0.24, - "learning_rate": 0.00026469671208964184, - "loss": 0.0194, + "epoch": 0.12, + "learning_rate": 0.0002818614706271174, + "loss": 0.0356, "step": 46650 }, { - "epoch": 0.24, - "learning_rate": 0.0002646891443966278, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028185758241074593, + "loss": 0.0254, "step": 46660 }, { - "epoch": 0.24, - "learning_rate": 0.0002646815767036138, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.0002818536941943745, + "loss": 0.0273, "step": 46670 }, { - "epoch": 0.24, - "learning_rate": 0.0002646740090105998, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.00028184980597800307, + "loss": 0.0293, "step": 46680 }, { - "epoch": 0.24, - "learning_rate": 0.00026466644131758576, - "loss": 0.0189, + "epoch": 0.12, + "learning_rate": 0.0002818459177616316, + "loss": 0.031, "step": 46690 }, { - "epoch": 0.24, - "learning_rate": 0.0002646588736245718, - "loss": 0.0191, + "epoch": 0.12, + "learning_rate": 0.0002818420295452601, + "loss": 0.0308, "step": 46700 }, { - "epoch": 0.24, - "learning_rate": 0.0002646513059315578, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028183814132888866, + "loss": 0.0258, "step": 46710 }, { - "epoch": 0.24, - "learning_rate": 0.00026464373823854376, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.0002818342531125172, + "loss": 0.0277, "step": 46720 }, { - "epoch": 0.24, - "learning_rate": 0.00026463617054552974, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.0002818303648961457, + "loss": 0.0291, "step": 46730 }, { - "epoch": 0.24, - "learning_rate": 0.0002646286028525157, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.00028182647667977426, + "loss": 0.0226, "step": 46740 }, { - "epoch": 0.24, - "learning_rate": 0.0002646210351595017, - "loss": 0.0259, + "epoch": 0.12, + "learning_rate": 0.0002818225884634028, + "loss": 0.0295, "step": 46750 }, { - "epoch": 0.24, - "learning_rate": 0.00026461346746648774, - "loss": 0.0206, + "epoch": 0.12, + "learning_rate": 0.00028181870024703134, + "loss": 0.0288, "step": 46760 }, { - "epoch": 0.24, - "learning_rate": 0.0002646058997734737, - "loss": 0.0267, + "epoch": 0.12, + "learning_rate": 0.00028181481203065986, + "loss": 0.0289, "step": 46770 }, { - "epoch": 0.24, - "learning_rate": 0.0002645983320804597, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.0002818109238142884, + "loss": 0.0343, "step": 46780 }, { - "epoch": 0.24, - "learning_rate": 0.0002645907643874457, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.00028180703559791694, + "loss": 0.0333, "step": 46790 }, { - "epoch": 0.24, - "learning_rate": 0.00026458319669443167, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028180314738154546, + "loss": 0.0305, "step": 46800 }, { - "epoch": 0.24, - "learning_rate": 0.00026457562900141765, - "loss": 0.0181, + "epoch": 0.12, + "learning_rate": 0.00028179925916517397, + "loss": 0.0304, "step": 46810 }, { - "epoch": 0.24, - "learning_rate": 0.00026456806130840363, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.00028179537094880254, + "loss": 0.029, "step": 46820 }, { - "epoch": 0.24, - "learning_rate": 0.00026456049361538967, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.0002817914827324311, + "loss": 0.0281, "step": 46830 }, { - "epoch": 0.24, - "learning_rate": 0.00026455292592237565, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.0002817875945160596, + "loss": 0.0312, "step": 46840 }, { - "epoch": 0.24, - "learning_rate": 0.00026454535822936163, - "loss": 0.0234, + "epoch": 0.12, + "learning_rate": 0.00028178370629968814, + "loss": 0.0259, "step": 46850 }, { - "epoch": 0.24, - "learning_rate": 0.0002645377905363476, - "loss": 0.0178, + "epoch": 0.12, + "learning_rate": 0.00028177981808331665, + "loss": 0.0311, "step": 46860 }, { - "epoch": 0.24, - "learning_rate": 0.0002645302228433336, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002817759298669452, + "loss": 0.0267, "step": 46870 }, { - "epoch": 0.24, - "learning_rate": 0.0002645226551503196, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.00028177204165057374, + "loss": 0.0283, "step": 46880 }, { - "epoch": 0.24, - "learning_rate": 0.0002645150874573056, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.0002817681534342023, + "loss": 0.0283, "step": 46890 }, { - "epoch": 0.24, - "learning_rate": 0.0002645075197642916, - "loss": 0.0211, + "epoch": 0.12, + "learning_rate": 0.0002817642652178308, + "loss": 0.0253, "step": 46900 }, { - "epoch": 0.24, - "learning_rate": 0.00026449995207127757, - "loss": 0.0274, + "epoch": 0.12, + "learning_rate": 0.00028176037700145933, + "loss": 0.028, "step": 46910 }, { - "epoch": 0.24, - "learning_rate": 0.00026449238437826355, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002817564887850879, + "loss": 0.0301, "step": 46920 }, { - "epoch": 0.24, - "learning_rate": 0.00026448481668524954, - "loss": 0.0243, + "epoch": 0.12, + "learning_rate": 0.0002817526005687164, + "loss": 0.0294, "step": 46930 }, { - "epoch": 0.24, - "learning_rate": 0.0002644772489922355, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028174871235234493, + "loss": 0.028, "step": 46940 }, { - "epoch": 0.24, - "learning_rate": 0.00026446968129922155, - "loss": 0.0171, + "epoch": 0.12, + "learning_rate": 0.0002817448241359735, + "loss": 0.0311, "step": 46950 }, { - "epoch": 0.24, - "learning_rate": 0.00026446211360620753, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.000281740935919602, + "loss": 0.0291, "step": 46960 }, { - "epoch": 0.24, - "learning_rate": 0.0002644545459131935, - "loss": 0.0197, + "epoch": 0.12, + "learning_rate": 0.0002817370477032306, + "loss": 0.024, "step": 46970 }, { - "epoch": 0.24, - "learning_rate": 0.0002644469782201795, - "loss": 0.0285, + "epoch": 0.12, + "learning_rate": 0.0002817331594868591, + "loss": 0.025, "step": 46980 }, { - "epoch": 0.24, - "learning_rate": 0.0002644394105271655, - "loss": 0.0208, + "epoch": 0.12, + "learning_rate": 0.0002817292712704876, + "loss": 0.0316, "step": 46990 }, { - "epoch": 0.24, - "learning_rate": 0.00026443184283415146, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.0002817253830541162, + "loss": 0.0307, "step": 47000 }, { - "epoch": 0.24, - "eval_cer": 0.9145042197675514, - "eval_loss": 0.01637718454003334, - "eval_runtime": 117.1859, - "eval_samples_per_second": 17.067, - "eval_steps_per_second": 4.267, + "epoch": 0.12, + "eval_cer": 0.8818650442075325, + "eval_loss": 0.02089322730898857, + "eval_runtime": 107.6372, + "eval_samples_per_second": 18.581, + "eval_steps_per_second": 4.645, "step": 47000 }, { - "epoch": 0.24, - "learning_rate": 0.00026442427514113744, - "loss": 0.0188, + "epoch": 0.12, + "learning_rate": 0.0002817214948377447, + "loss": 0.0258, "step": 47010 }, { - "epoch": 0.24, - "learning_rate": 0.0002644167074481235, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.00028171760662137326, + "loss": 0.0238, "step": 47020 }, { - "epoch": 0.24, - "learning_rate": 0.00026440913975510946, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.0002817137184050018, + "loss": 0.0305, "step": 47030 }, { - "epoch": 0.24, - "learning_rate": 0.00026440157206209544, - "loss": 0.0211, + "epoch": 0.12, + "learning_rate": 0.00028170983018863035, + "loss": 0.0248, "step": 47040 }, { - "epoch": 0.24, - "learning_rate": 0.0002643940043690814, - "loss": 0.0213, + "epoch": 0.12, + "learning_rate": 0.00028170594197225886, + "loss": 0.034, "step": 47050 }, { - "epoch": 0.24, - "learning_rate": 0.0002643864366760674, - "loss": 0.0222, + "epoch": 0.12, + "learning_rate": 0.0002817020537558874, + "loss": 0.024, "step": 47060 }, { - "epoch": 0.24, - "learning_rate": 0.0002643788689830534, - "loss": 0.0188, + "epoch": 0.12, + "learning_rate": 0.0002816981655395159, + "loss": 0.031, "step": 47070 }, { - "epoch": 0.24, - "learning_rate": 0.0002643713012900394, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028169427732314446, + "loss": 0.0247, "step": 47080 }, { - "epoch": 0.24, - "learning_rate": 0.0002643637335970254, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.000281690389106773, + "loss": 0.0263, "step": 47090 }, { - "epoch": 0.24, - "learning_rate": 0.0002643561659040114, - "loss": 0.0182, + "epoch": 0.12, + "learning_rate": 0.00028168650089040154, + "loss": 0.0316, "step": 47100 }, { - "epoch": 0.24, - "learning_rate": 0.00026434859821099736, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028168261267403006, + "loss": 0.0308, "step": 47110 }, { - "epoch": 0.24, - "learning_rate": 0.00026434103051798335, - "loss": 0.0206, + "epoch": 0.12, + "learning_rate": 0.0002816787244576586, + "loss": 0.0297, "step": 47120 }, { - "epoch": 0.24, - "learning_rate": 0.0002643334628249693, - "loss": 0.0196, + "epoch": 0.12, + "learning_rate": 0.00028167483624128714, + "loss": 0.028, "step": 47130 }, { - "epoch": 0.24, - "learning_rate": 0.0002643258951319553, - "loss": 0.0266, + "epoch": 0.12, + "learning_rate": 0.00028167094802491566, + "loss": 0.0303, "step": 47140 }, { - "epoch": 0.24, - "learning_rate": 0.0002643183274389413, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.00028166705980854417, + "loss": 0.0303, "step": 47150 }, { - "epoch": 0.24, - "learning_rate": 0.00026431075974592727, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.00028166317159217274, + "loss": 0.0348, "step": 47160 }, { - "epoch": 0.24, - "learning_rate": 0.00026430319205291325, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.0002816592833758013, + "loss": 0.0326, "step": 47170 }, { - "epoch": 0.24, - "learning_rate": 0.00026429562435989923, - "loss": 0.0187, + "epoch": 0.12, + "learning_rate": 0.0002816553951594298, + "loss": 0.0305, "step": 47180 }, { - "epoch": 0.24, - "learning_rate": 0.00026428805666688527, - "loss": 0.0233, + "epoch": 0.12, + "learning_rate": 0.00028165150694305834, + "loss": 0.0253, "step": 47190 }, { - "epoch": 0.24, - "learning_rate": 0.00026428048897387125, - "loss": 0.0248, + "epoch": 0.12, + "learning_rate": 0.00028164761872668685, + "loss": 0.0233, "step": 47200 }, { - "epoch": 0.24, - "learning_rate": 0.00026427292128085723, - "loss": 0.0197, + "epoch": 0.12, + "learning_rate": 0.0002816437305103154, + "loss": 0.0277, "step": 47210 }, { - "epoch": 0.24, - "learning_rate": 0.0002642653535878432, - "loss": 0.027, + "epoch": 0.12, + "learning_rate": 0.00028163984229394393, + "loss": 0.0305, "step": 47220 }, { - "epoch": 0.24, - "learning_rate": 0.0002642577858948292, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.0002816359540775725, + "loss": 0.0285, "step": 47230 }, { - "epoch": 0.24, - "learning_rate": 0.0002642502182018152, - "loss": 0.0343, + "epoch": 0.12, + "learning_rate": 0.000281632065861201, + "loss": 0.0248, "step": 47240 }, { - "epoch": 0.24, - "learning_rate": 0.0002642426505088012, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.0002816281776448296, + "loss": 0.0286, "step": 47250 }, { - "epoch": 0.24, - "learning_rate": 0.0002642350828157872, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002816242894284581, + "loss": 0.0276, "step": 47260 }, { - "epoch": 0.24, - "learning_rate": 0.0002642275151227732, - "loss": 0.0239, + "epoch": 0.12, + "learning_rate": 0.0002816204012120866, + "loss": 0.0283, "step": 47270 }, { - "epoch": 0.24, - "learning_rate": 0.00026421994742975916, - "loss": 0.0241, + "epoch": 0.12, + "learning_rate": 0.00028161651299571513, + "loss": 0.0307, "step": 47280 }, { - "epoch": 0.24, - "learning_rate": 0.00026421237973674514, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.0002816126247793437, + "loss": 0.0289, "step": 47290 }, { - "epoch": 0.24, - "learning_rate": 0.0002642048120437311, - "loss": 0.0254, + "epoch": 0.12, + "learning_rate": 0.0002816087365629722, + "loss": 0.0319, "step": 47300 }, { - "epoch": 0.24, - "learning_rate": 0.00026419724435071716, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.0002816048483466008, + "loss": 0.0227, "step": 47310 }, { - "epoch": 0.24, - "learning_rate": 0.00026418967665770314, - "loss": 0.019, + "epoch": 0.12, + "learning_rate": 0.0002816009601302293, + "loss": 0.026, "step": 47320 }, { - "epoch": 0.24, - "learning_rate": 0.0002641821089646891, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.00028159707191385787, + "loss": 0.0254, "step": 47330 }, { - "epoch": 0.24, - "learning_rate": 0.0002641745412716751, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.0002815931836974864, + "loss": 0.0296, "step": 47340 }, { - "epoch": 0.24, - "learning_rate": 0.0002641669735786611, - "loss": 0.0224, + "epoch": 0.12, + "learning_rate": 0.0002815892954811149, + "loss": 0.0248, "step": 47350 }, { - "epoch": 0.24, - "learning_rate": 0.00026415940588564706, - "loss": 0.0274, + "epoch": 0.12, + "learning_rate": 0.0002815854072647434, + "loss": 0.0279, "step": 47360 }, { - "epoch": 0.24, - "learning_rate": 0.00026415183819263304, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.000281581519048372, + "loss": 0.0297, "step": 47370 }, { - "epoch": 0.24, - "learning_rate": 0.0002641442704996191, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028157763083200055, + "loss": 0.0295, "step": 47380 }, { - "epoch": 0.24, - "learning_rate": 0.00026413670280660506, - "loss": 0.0193, + "epoch": 0.12, + "learning_rate": 0.00028157374261562906, + "loss": 0.0248, "step": 47390 }, { - "epoch": 0.24, - "learning_rate": 0.00026412913511359104, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.0002815698543992576, + "loss": 0.0293, "step": 47400 }, { - "epoch": 0.24, - "learning_rate": 0.000264121567420577, - "loss": 0.0196, + "epoch": 0.12, + "learning_rate": 0.0002815659661828861, + "loss": 0.0307, "step": 47410 }, { - "epoch": 0.24, - "learning_rate": 0.000264113999727563, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.00028156207796651466, + "loss": 0.0279, "step": 47420 }, { - "epoch": 0.24, - "learning_rate": 0.000264106432034549, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002815581897501432, + "loss": 0.0323, "step": 47430 }, { - "epoch": 0.24, - "learning_rate": 0.000264098864341535, - "loss": 0.0207, + "epoch": 0.12, + "learning_rate": 0.00028155430153377174, + "loss": 0.0361, "step": 47440 }, { - "epoch": 0.24, - "learning_rate": 0.000264091296648521, - "loss": 0.0191, + "epoch": 0.12, + "learning_rate": 0.00028155041331740026, + "loss": 0.0246, "step": 47450 }, { - "epoch": 0.24, - "learning_rate": 0.000264083728955507, - "loss": 0.0182, + "epoch": 0.12, + "learning_rate": 0.0002815465251010288, + "loss": 0.0361, "step": 47460 }, { - "epoch": 0.24, - "learning_rate": 0.00026407616126249297, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.00028154263688465734, + "loss": 0.0318, "step": 47470 }, { - "epoch": 0.24, - "learning_rate": 0.00026406859356947895, - "loss": 0.02, + "epoch": 0.12, + "learning_rate": 0.00028153874866828585, + "loss": 0.0314, "step": 47480 }, { - "epoch": 0.24, - "learning_rate": 0.00026406102587646493, - "loss": 0.0159, + "epoch": 0.12, + "learning_rate": 0.00028153486045191437, + "loss": 0.0273, "step": 47490 }, { - "epoch": 0.24, - "learning_rate": 0.00026405345818345097, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028153097223554294, + "loss": 0.029, "step": 47500 }, { - "epoch": 0.24, - "learning_rate": 0.00026404589049043695, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.00028152708401917145, + "loss": 0.0278, "step": 47510 }, { - "epoch": 0.24, - "learning_rate": 0.00026403832279742293, - "loss": 0.0201, + "epoch": 0.12, + "learning_rate": 0.0002815231958028, + "loss": 0.0287, "step": 47520 }, { - "epoch": 0.24, - "learning_rate": 0.0002640307551044089, - "loss": 0.0164, + "epoch": 0.12, + "learning_rate": 0.00028151930758642854, + "loss": 0.0312, "step": 47530 }, { - "epoch": 0.24, - "learning_rate": 0.0002640231874113949, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002815154193700571, + "loss": 0.0244, "step": 47540 }, { - "epoch": 0.24, - "learning_rate": 0.00026401561971838087, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.0002815115311536856, + "loss": 0.0266, "step": 47550 }, { - "epoch": 0.24, - "learning_rate": 0.00026400805202536685, - "loss": 0.0194, + "epoch": 0.12, + "learning_rate": 0.00028150764293731413, + "loss": 0.0312, "step": 47560 }, { - "epoch": 0.24, - "learning_rate": 0.0002640004843323529, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002815037547209427, + "loss": 0.0281, "step": 47570 }, { - "epoch": 0.24, - "learning_rate": 0.00026399291663933887, - "loss": 0.0188, + "epoch": 0.12, + "learning_rate": 0.0002814998665045712, + "loss": 0.0292, "step": 47580 }, { - "epoch": 0.24, - "learning_rate": 0.00026398534894632485, - "loss": 0.0244, + "epoch": 0.12, + "learning_rate": 0.0002814959782881998, + "loss": 0.0256, "step": 47590 }, { - "epoch": 0.24, - "learning_rate": 0.00026397778125331083, - "loss": 0.0197, + "epoch": 0.12, + "learning_rate": 0.0002814920900718283, + "loss": 0.0293, "step": 47600 }, { - "epoch": 0.24, - "learning_rate": 0.0002639702135602968, - "loss": 0.0221, + "epoch": 0.12, + "learning_rate": 0.0002814882018554568, + "loss": 0.0283, "step": 47610 }, { - "epoch": 0.24, - "learning_rate": 0.0002639626458672828, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002814843136390854, + "loss": 0.03, "step": 47620 }, { - "epoch": 0.24, - "learning_rate": 0.00026395507817426883, - "loss": 0.0227, + "epoch": 0.12, + "learning_rate": 0.0002814804254227139, + "loss": 0.0246, "step": 47630 }, { - "epoch": 0.24, - "learning_rate": 0.0002639475104812548, - "loss": 0.0247, + "epoch": 0.12, + "learning_rate": 0.0002814765372063424, + "loss": 0.024, "step": 47640 }, { - "epoch": 0.24, - "learning_rate": 0.0002639399427882408, - "loss": 0.0204, + "epoch": 0.12, + "learning_rate": 0.000281472648989971, + "loss": 0.0301, "step": 47650 }, { - "epoch": 0.24, - "learning_rate": 0.0002639323750952268, - "loss": 0.026, + "epoch": 0.12, + "learning_rate": 0.0002814687607735995, + "loss": 0.0262, "step": 47660 }, { - "epoch": 0.24, - "learning_rate": 0.00026392480740221276, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.00028146487255722806, + "loss": 0.0239, "step": 47670 }, { - "epoch": 0.24, - "learning_rate": 0.00026391723970919874, - "loss": 0.022, + "epoch": 0.12, + "learning_rate": 0.0002814609843408566, + "loss": 0.0255, "step": 47680 }, { - "epoch": 0.24, - "learning_rate": 0.0002639096720161847, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002814570961244851, + "loss": 0.0311, "step": 47690 }, { - "epoch": 0.24, - "learning_rate": 0.00026390210432317076, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.0002814532079081136, + "loss": 0.0281, "step": 47700 }, { - "epoch": 0.24, - "learning_rate": 0.00026389453663015674, - "loss": 0.0277, + "epoch": 0.12, + "learning_rate": 0.0002814493196917422, + "loss": 0.0296, "step": 47710 }, { - "epoch": 0.24, - "learning_rate": 0.0002638869689371427, - "loss": 0.0262, + "epoch": 0.12, + "learning_rate": 0.00028144543147537075, + "loss": 0.025, "step": 47720 }, { - "epoch": 0.24, - "learning_rate": 0.0002638794012441287, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028144154325899926, + "loss": 0.0343, "step": 47730 }, { - "epoch": 0.24, - "learning_rate": 0.0002638718335511147, - "loss": 0.0265, + "epoch": 0.12, + "learning_rate": 0.0002814376550426278, + "loss": 0.0263, "step": 47740 }, { - "epoch": 0.24, - "learning_rate": 0.00026386426585810066, - "loss": 0.0204, + "epoch": 0.12, + "learning_rate": 0.00028143376682625634, + "loss": 0.0259, "step": 47750 }, { - "epoch": 0.24, - "learning_rate": 0.0002638566981650867, - "loss": 0.0244, + "epoch": 0.12, + "learning_rate": 0.00028142987860988486, + "loss": 0.0297, "step": 47760 }, { - "epoch": 0.24, - "learning_rate": 0.0002638491304720727, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.00028142599039351337, + "loss": 0.0241, "step": 47770 }, { - "epoch": 0.24, - "learning_rate": 0.00026384156277905866, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028142210217714194, + "loss": 0.0332, "step": 47780 }, { - "epoch": 0.24, - "learning_rate": 0.00026383399508604464, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028141821396077046, + "loss": 0.0379, "step": 47790 }, { - "epoch": 0.24, - "learning_rate": 0.0002638264273930306, - "loss": 0.0253, + "epoch": 0.12, + "learning_rate": 0.000281414325744399, + "loss": 0.0292, "step": 47800 }, { - "epoch": 0.24, - "learning_rate": 0.0002638188597000166, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.00028141043752802754, + "loss": 0.0324, "step": 47810 }, { - "epoch": 0.24, - "learning_rate": 0.00026381129200700264, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.00028140654931165605, + "loss": 0.035, "step": 47820 }, { - "epoch": 0.24, - "learning_rate": 0.0002638037243139886, - "loss": 0.0198, + "epoch": 0.12, + "learning_rate": 0.0002814026610952846, + "loss": 0.0326, "step": 47830 }, { - "epoch": 0.24, - "learning_rate": 0.0002637961566209746, - "loss": 0.0209, + "epoch": 0.12, + "learning_rate": 0.00028139877287891314, + "loss": 0.0324, "step": 47840 }, { - "epoch": 0.24, - "learning_rate": 0.0002637885889279606, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.00028139488466254165, + "loss": 0.0317, "step": 47850 }, { - "epoch": 0.24, - "learning_rate": 0.00026378102123494657, - "loss": 0.0185, + "epoch": 0.12, + "learning_rate": 0.0002813909964461702, + "loss": 0.03, "step": 47860 }, { - "epoch": 0.24, - "learning_rate": 0.00026377345354193255, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.0002813871082297988, + "loss": 0.0272, "step": 47870 }, { - "epoch": 0.24, - "learning_rate": 0.00026376588584891853, - "loss": 0.0234, + "epoch": 0.12, + "learning_rate": 0.0002813832200134273, + "loss": 0.025, "step": 47880 }, { - "epoch": 0.24, - "learning_rate": 0.00026375831815590457, - "loss": 0.0225, + "epoch": 0.12, + "learning_rate": 0.0002813793317970558, + "loss": 0.027, "step": 47890 }, { - "epoch": 0.24, - "learning_rate": 0.00026375075046289055, - "loss": 0.0246, + "epoch": 0.12, + "learning_rate": 0.00028137544358068433, + "loss": 0.026, "step": 47900 }, { - "epoch": 0.24, - "learning_rate": 0.00026374318276987653, - "loss": 0.0237, + "epoch": 0.12, + "learning_rate": 0.00028137155536431285, + "loss": 0.0281, "step": 47910 }, { - "epoch": 0.24, - "learning_rate": 0.0002637356150768625, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002813676671479414, + "loss": 0.0295, "step": 47920 }, { - "epoch": 0.24, - "learning_rate": 0.0002637280473838485, - "loss": 0.0238, + "epoch": 0.12, + "learning_rate": 0.00028136377893157, + "loss": 0.0275, "step": 47930 }, { - "epoch": 0.24, - "learning_rate": 0.0002637204796908345, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.0002813598907151985, + "loss": 0.028, "step": 47940 }, { - "epoch": 0.24, - "learning_rate": 0.0002637129119978205, - "loss": 0.0245, + "epoch": 0.12, + "learning_rate": 0.000281356002498827, + "loss": 0.0316, "step": 47950 }, { - "epoch": 0.24, - "learning_rate": 0.0002637053443048065, - "loss": 0.024, + "epoch": 0.12, + "learning_rate": 0.0002813521142824556, + "loss": 0.0295, "step": 47960 }, { - "epoch": 0.24, - "learning_rate": 0.00026369777661179247, - "loss": 0.0206, + "epoch": 0.12, + "learning_rate": 0.0002813482260660841, + "loss": 0.0303, "step": 47970 }, { - "epoch": 0.24, - "learning_rate": 0.00026369020891877845, - "loss": 0.0229, + "epoch": 0.12, + "learning_rate": 0.0002813443378497126, + "loss": 0.0277, "step": 47980 }, { - "epoch": 0.24, - "learning_rate": 0.00026368264122576444, - "loss": 0.0198, + "epoch": 0.12, + "learning_rate": 0.0002813404496333412, + "loss": 0.035, "step": 47990 }, { - "epoch": 0.24, - "learning_rate": 0.0002636750735327504, - "loss": 0.0226, + "epoch": 0.12, + "learning_rate": 0.0002813365614169697, + "loss": 0.0302, "step": 48000 }, { - "epoch": 0.24, - "eval_cer": 0.9144945158062973, - "eval_loss": 0.015514707192778587, - "eval_runtime": 117.0856, - "eval_samples_per_second": 17.082, - "eval_steps_per_second": 4.27, + "epoch": 0.12, + "eval_cer": 0.8818804402138085, + "eval_loss": 0.022080879658460617, + "eval_runtime": 107.5098, + "eval_samples_per_second": 18.603, + "eval_steps_per_second": 4.651, "step": 48000 }, { - "epoch": 0.24, - "learning_rate": 0.00026366750583973645, - "loss": 0.0243, + "epoch": 0.12, + "learning_rate": 0.00028133267320059826, + "loss": 0.0361, "step": 48010 }, { - "epoch": 0.24, - "learning_rate": 0.00026365993814672243, - "loss": 0.0214, + "epoch": 0.12, + "learning_rate": 0.0002813287849842268, + "loss": 0.0382, "step": 48020 }, { - "epoch": 0.24, - "learning_rate": 0.0002636523704537084, - "loss": 0.0243, + "epoch": 0.12, + "learning_rate": 0.0002813248967678553, + "loss": 0.035, "step": 48030 }, { - "epoch": 0.24, - "learning_rate": 0.0002636448027606944, - "loss": 0.0254, + "epoch": 0.12, + "learning_rate": 0.00028132100855148386, + "loss": 0.0309, "step": 48040 }, { - "epoch": 0.24, - "learning_rate": 0.0002636372350676804, - "loss": 0.023, + "epoch": 0.12, + "learning_rate": 0.0002813171203351124, + "loss": 0.0334, "step": 48050 }, { - "epoch": 0.24, - "learning_rate": 0.00026362966737466636, - "loss": 0.0218, + "epoch": 0.12, + "learning_rate": 0.0002813132321187409, + "loss": 0.0357, "step": 48060 }, { - "epoch": 0.24, - "learning_rate": 0.00026362209968165234, - "loss": 0.0228, + "epoch": 0.12, + "learning_rate": 0.00028130934390236946, + "loss": 0.0288, "step": 48070 }, { - "epoch": 0.24, - "learning_rate": 0.0002636145319886384, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.00028130545568599803, + "loss": 0.0278, "step": 48080 }, { - "epoch": 0.24, - "learning_rate": 0.00026360696429562436, - "loss": 0.0156, + "epoch": 0.12, + "learning_rate": 0.00028130156746962654, + "loss": 0.0275, "step": 48090 }, { - "epoch": 0.24, - "learning_rate": 0.00026359939660261034, - "loss": 0.0239, + "epoch": 0.12, + "learning_rate": 0.00028129767925325506, + "loss": 0.0322, "step": 48100 }, { - "epoch": 0.24, - "learning_rate": 0.0002635918289095963, - "loss": 0.0257, + "epoch": 0.12, + "learning_rate": 0.00028129379103688357, + "loss": 0.0331, "step": 48110 }, { - "epoch": 0.24, - "learning_rate": 0.0002635842612165823, - "loss": 0.0211, + "epoch": 0.12, + "learning_rate": 0.00028128990282051214, + "loss": 0.0265, "step": 48120 }, { - "epoch": 0.24, - "learning_rate": 0.0002635766935235683, - "loss": 0.0273, + "epoch": 0.12, + "learning_rate": 0.00028128601460414065, + "loss": 0.0345, "step": 48130 }, { - "epoch": 0.24, - "learning_rate": 0.0002635691258305543, - "loss": 0.0219, + "epoch": 0.12, + "learning_rate": 0.0002812821263877692, + "loss": 0.0296, "step": 48140 }, { - "epoch": 0.24, - "learning_rate": 0.0002635615581375403, - "loss": 0.0251, + "epoch": 0.12, + "learning_rate": 0.00028127823817139774, + "loss": 0.0284, "step": 48150 }, { - "epoch": 0.24, - "learning_rate": 0.0002635539904445263, - "loss": 0.0212, + "epoch": 0.12, + "learning_rate": 0.00028127434995502625, + "loss": 0.0307, "step": 48160 }, { - "epoch": 0.24, - "learning_rate": 0.00026354642275151226, - "loss": 0.0205, + "epoch": 0.12, + "learning_rate": 0.0002812704617386548, + "loss": 0.0248, "step": 48170 }, { - "epoch": 0.24, - "learning_rate": 0.00026353885505849825, - "loss": 0.0199, + "epoch": 0.12, + "learning_rate": 0.00028126657352228334, + "loss": 0.027, "step": 48180 }, { - "epoch": 0.24, - "learning_rate": 0.0002635312873654842, - "loss": 0.0203, + "epoch": 0.12, + "learning_rate": 0.00028126268530591185, + "loss": 0.0269, "step": 48190 }, { - "epoch": 0.24, - "learning_rate": 0.0002635237196724702, - "loss": 0.0216, + "epoch": 0.12, + "learning_rate": 0.0002812587970895404, + "loss": 0.0261, "step": 48200 }, { - "epoch": 0.24, - "learning_rate": 0.00026351615197945624, - "loss": 0.0198, + "epoch": 0.12, + "learning_rate": 0.000281254908873169, + "loss": 0.0284, "step": 48210 }, { - "epoch": 0.24, - "learning_rate": 0.0002635085842864422, - "loss": 0.0235, + "epoch": 0.12, + "learning_rate": 0.0002812510206567975, + "loss": 0.0282, "step": 48220 }, { - "epoch": 0.24, - "learning_rate": 0.0002635010165934282, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.000281247132440426, + "loss": 0.0316, "step": 48230 }, { - "epoch": 0.24, - "learning_rate": 0.0002634934489004142, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00028124324422405453, + "loss": 0.0289, "step": 48240 }, { - "epoch": 0.24, - "learning_rate": 0.00026348588120740017, - "loss": 0.0189, + "epoch": 0.13, + "learning_rate": 0.0002812393560076831, + "loss": 0.0227, "step": 48250 }, { - "epoch": 0.24, - "learning_rate": 0.00026347831351438615, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.0002812354677913116, + "loss": 0.0289, "step": 48260 }, { - "epoch": 0.24, - "learning_rate": 0.0002634707458213722, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.0002812315795749402, + "loss": 0.0284, "step": 48270 }, { - "epoch": 0.24, - "learning_rate": 0.00026346317812835817, - "loss": 0.024, + "epoch": 0.13, + "learning_rate": 0.0002812276913585687, + "loss": 0.0277, "step": 48280 }, { - "epoch": 0.24, - "learning_rate": 0.00026345561043534415, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.00028122380314219727, + "loss": 0.0284, "step": 48290 }, { - "epoch": 0.24, - "learning_rate": 0.00026344804274233013, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002812199149258258, + "loss": 0.0313, "step": 48300 }, { - "epoch": 0.24, - "learning_rate": 0.0002634404750493161, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002812160267094543, + "loss": 0.0291, "step": 48310 }, { - "epoch": 0.24, - "learning_rate": 0.0002634329073563021, - "loss": 0.0354, + "epoch": 0.13, + "learning_rate": 0.0002812121384930828, + "loss": 0.0306, "step": 48320 }, { - "epoch": 0.24, - "learning_rate": 0.00026342533966328813, - "loss": 0.0351, + "epoch": 0.13, + "learning_rate": 0.0002812082502767114, + "loss": 0.0282, "step": 48330 }, { - "epoch": 0.24, - "learning_rate": 0.0002634177719702741, - "loss": 0.0239, + "epoch": 0.13, + "learning_rate": 0.0002812043620603399, + "loss": 0.0255, "step": 48340 }, { - "epoch": 0.24, - "learning_rate": 0.0002634102042772601, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.00028120047384396846, + "loss": 0.0291, "step": 48350 }, { - "epoch": 0.24, - "learning_rate": 0.0002634026365842461, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.000281196585627597, + "loss": 0.0329, "step": 48360 }, { - "epoch": 0.24, - "learning_rate": 0.00026339506889123206, - "loss": 0.0282, + "epoch": 0.13, + "learning_rate": 0.00028119269741122555, + "loss": 0.0359, "step": 48370 }, { - "epoch": 0.24, - "learning_rate": 0.00026338750119821804, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.00028118880919485406, + "loss": 0.0247, "step": 48380 }, { - "epoch": 0.24, - "learning_rate": 0.000263379933505204, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.0002811849209784826, + "loss": 0.0338, "step": 48390 }, { - "epoch": 0.24, - "learning_rate": 0.00026337236581219, - "loss": 0.0243, + "epoch": 0.13, + "learning_rate": 0.0002811810327621111, + "loss": 0.0289, "step": 48400 }, { - "epoch": 0.24, - "learning_rate": 0.000263364798119176, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.00028117714454573966, + "loss": 0.0311, "step": 48410 }, { - "epoch": 0.24, - "learning_rate": 0.00026335723042616196, - "loss": 0.0195, + "epoch": 0.13, + "learning_rate": 0.0002811732563293682, + "loss": 0.0247, "step": 48420 }, { - "epoch": 0.24, - "learning_rate": 0.00026334966273314794, - "loss": 0.0169, + "epoch": 0.13, + "learning_rate": 0.00028116936811299674, + "loss": 0.0291, "step": 48430 }, { - "epoch": 0.24, - "learning_rate": 0.000263342095040134, - "loss": 0.0239, + "epoch": 0.13, + "learning_rate": 0.00028116547989662526, + "loss": 0.0283, "step": 48440 }, { - "epoch": 0.24, - "learning_rate": 0.00026333452734711996, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.00028116159168025377, + "loss": 0.0268, "step": 48450 }, { - "epoch": 0.24, - "learning_rate": 0.00026332695965410594, - "loss": 0.0185, + "epoch": 0.13, + "learning_rate": 0.00028115770346388234, + "loss": 0.0244, "step": 48460 }, { - "epoch": 0.24, - "learning_rate": 0.0002633193919610919, - "loss": 0.0182, + "epoch": 0.13, + "learning_rate": 0.00028115381524751085, + "loss": 0.0248, "step": 48470 }, { - "epoch": 0.24, - "learning_rate": 0.0002633118242680779, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.0002811499270311394, + "loss": 0.0289, "step": 48480 }, { - "epoch": 0.24, - "learning_rate": 0.0002633042565750639, - "loss": 0.0188, + "epoch": 0.13, + "learning_rate": 0.00028114603881476794, + "loss": 0.0285, "step": 48490 }, { - "epoch": 0.24, - "learning_rate": 0.0002632966888820499, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.0002811421505983965, + "loss": 0.0285, "step": 48500 }, { - "epoch": 0.24, - "learning_rate": 0.0002632891211890359, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.000281138262382025, + "loss": 0.0267, "step": 48510 }, { - "epoch": 0.24, - "learning_rate": 0.0002632815534960219, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00028113437416565353, + "loss": 0.0342, "step": 48520 }, { - "epoch": 0.24, - "learning_rate": 0.00026327398580300787, - "loss": 0.0176, + "epoch": 0.13, + "learning_rate": 0.00028113048594928205, + "loss": 0.0265, "step": 48530 }, { - "epoch": 0.24, - "learning_rate": 0.00026326641810999385, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002811265977329106, + "loss": 0.029, "step": 48540 }, { - "epoch": 0.24, - "learning_rate": 0.00026325885041697983, - "loss": 0.0193, + "epoch": 0.13, + "learning_rate": 0.00028112270951653913, + "loss": 0.0251, "step": 48550 }, { - "epoch": 0.24, - "learning_rate": 0.00026325128272396587, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.0002811188213001677, + "loss": 0.0317, "step": 48560 }, { - "epoch": 0.25, - "learning_rate": 0.00026324371503095185, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002811149330837962, + "loss": 0.031, "step": 48570 }, { - "epoch": 0.25, - "learning_rate": 0.00026323614733793783, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002811110448674248, + "loss": 0.0264, "step": 48580 }, { - "epoch": 0.25, - "learning_rate": 0.0002632285796449238, - "loss": 0.0161, + "epoch": 0.13, + "learning_rate": 0.0002811071566510533, + "loss": 0.0299, "step": 48590 }, { - "epoch": 0.25, - "learning_rate": 0.0002632210119519098, - "loss": 0.0273, + "epoch": 0.13, + "learning_rate": 0.0002811032684346818, + "loss": 0.0243, "step": 48600 }, { - "epoch": 0.25, - "learning_rate": 0.00026321344425889577, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.0002810993802183104, + "loss": 0.031, "step": 48610 }, { - "epoch": 0.25, - "learning_rate": 0.00026320587656588175, - "loss": 0.0217, + "epoch": 0.13, + "learning_rate": 0.0002810954920019389, + "loss": 0.0336, "step": 48620 }, { - "epoch": 0.25, - "learning_rate": 0.0002631983088728678, - "loss": 0.0256, + "epoch": 0.13, + "learning_rate": 0.00028109160378556747, + "loss": 0.0308, "step": 48630 }, { - "epoch": 0.25, - "learning_rate": 0.00026319074117985377, - "loss": 0.0195, + "epoch": 0.13, + "learning_rate": 0.000281087715569196, + "loss": 0.03, "step": 48640 }, { - "epoch": 0.25, - "learning_rate": 0.00026318317348683975, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.0002810838273528245, + "loss": 0.0256, "step": 48650 }, { - "epoch": 0.25, - "learning_rate": 0.00026317560579382573, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.000281079939136453, + "loss": 0.0254, "step": 48660 }, { - "epoch": 0.25, - "learning_rate": 0.0002631680381008117, - "loss": 0.0292, + "epoch": 0.13, + "learning_rate": 0.0002810760509200816, + "loss": 0.0291, "step": 48670 }, { - "epoch": 0.25, - "learning_rate": 0.0002631604704077977, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.0002810721627037101, + "loss": 0.0263, "step": 48680 }, { - "epoch": 0.25, - "learning_rate": 0.00026315290271478373, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00028106827448733866, + "loss": 0.0332, "step": 48690 }, { - "epoch": 0.25, - "learning_rate": 0.0002631453350217697, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.0002810643862709672, + "loss": 0.0293, "step": 48700 }, { - "epoch": 0.25, - "learning_rate": 0.0002631377673287557, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.00028106049805459574, + "loss": 0.0271, "step": 48710 }, { - "epoch": 0.25, - "learning_rate": 0.0002631301996357417, - "loss": 0.0198, + "epoch": 0.13, + "learning_rate": 0.00028105660983822426, + "loss": 0.0298, "step": 48720 }, { - "epoch": 0.25, - "learning_rate": 0.00026312263194272766, - "loss": 0.0239, + "epoch": 0.13, + "learning_rate": 0.0002810527216218528, + "loss": 0.0304, "step": 48730 }, { - "epoch": 0.25, - "learning_rate": 0.00026311506424971364, - "loss": 0.0193, + "epoch": 0.13, + "learning_rate": 0.0002810488334054813, + "loss": 0.0308, "step": 48740 }, { - "epoch": 0.25, - "learning_rate": 0.0002631074965566996, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.00028104494518910986, + "loss": 0.031, "step": 48750 }, { - "epoch": 0.25, - "learning_rate": 0.00026309992886368566, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.0002810410569727384, + "loss": 0.0335, "step": 48760 }, { - "epoch": 0.25, - "learning_rate": 0.00026309236117067164, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.00028103716875636694, + "loss": 0.0317, "step": 48770 }, { - "epoch": 0.25, - "learning_rate": 0.0002630847934776576, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.00028103328053999545, + "loss": 0.0321, "step": 48780 }, { - "epoch": 0.25, - "learning_rate": 0.0002630772257846436, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.000281029392323624, + "loss": 0.0397, "step": 48790 }, { - "epoch": 0.25, - "learning_rate": 0.0002630696580916296, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.00028102550410725254, + "loss": 0.0366, "step": 48800 }, { - "epoch": 0.25, - "learning_rate": 0.00026306209039861556, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.00028102161589088105, + "loss": 0.0299, "step": 48810 }, { - "epoch": 0.25, - "learning_rate": 0.0002630545227056016, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.0002810177276745096, + "loss": 0.0304, "step": 48820 }, { - "epoch": 0.25, - "learning_rate": 0.0002630469550125876, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.00028101383945813814, + "loss": 0.0324, "step": 48830 }, { - "epoch": 0.25, - "learning_rate": 0.00026303938731957356, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.0002810099512417667, + "loss": 0.0282, "step": 48840 }, { - "epoch": 0.25, - "learning_rate": 0.00026303181962655954, - "loss": 0.0193, + "epoch": 0.13, + "learning_rate": 0.0002810060630253952, + "loss": 0.035, "step": 48850 }, { - "epoch": 0.25, - "learning_rate": 0.0002630242519335455, - "loss": 0.0174, + "epoch": 0.13, + "learning_rate": 0.00028100217480902373, + "loss": 0.0211, "step": 48860 }, { - "epoch": 0.25, - "learning_rate": 0.0002630166842405315, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.0002809982865926523, + "loss": 0.0299, "step": 48870 }, { - "epoch": 0.25, - "learning_rate": 0.00026300911654751754, - "loss": 0.0255, + "epoch": 0.13, + "learning_rate": 0.0002809943983762808, + "loss": 0.025, "step": 48880 }, { - "epoch": 0.25, - "learning_rate": 0.0002630015488545035, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.00028099051015990933, + "loss": 0.0299, "step": 48890 }, { - "epoch": 0.25, - "learning_rate": 0.0002629939811614895, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.0002809866219435379, + "loss": 0.025, "step": 48900 }, { - "epoch": 0.25, - "learning_rate": 0.0002629864134684755, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.0002809827337271664, + "loss": 0.0307, "step": 48910 }, { - "epoch": 0.25, - "learning_rate": 0.00026297884577546147, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.000280978845510795, + "loss": 0.0284, "step": 48920 }, { - "epoch": 0.25, - "learning_rate": 0.00026297127808244745, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002809749572944235, + "loss": 0.0309, "step": 48930 }, { - "epoch": 0.25, - "learning_rate": 0.00026296371038943343, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.000280971069078052, + "loss": 0.0274, "step": 48940 }, { - "epoch": 0.25, - "learning_rate": 0.00026295614269641947, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.0002809671808616805, + "loss": 0.0312, "step": 48950 }, { - "epoch": 0.25, - "learning_rate": 0.00026294857500340545, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.0002809632926453091, + "loss": 0.0292, "step": 48960 }, { - "epoch": 0.25, - "learning_rate": 0.00026294100731039143, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00028095940442893766, + "loss": 0.0294, "step": 48970 }, { - "epoch": 0.25, - "learning_rate": 0.0002629334396173774, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.0002809555162125662, + "loss": 0.0323, "step": 48980 }, { - "epoch": 0.25, - "learning_rate": 0.0002629258719243634, - "loss": 0.0226, + "epoch": 0.13, + "learning_rate": 0.0002809516279961947, + "loss": 0.0294, "step": 48990 }, { - "epoch": 0.25, - "learning_rate": 0.0002629183042313494, - "loss": 0.0171, + "epoch": 0.13, + "learning_rate": 0.00028094773977982326, + "loss": 0.0309, "step": 49000 }, { - "epoch": 0.25, - "eval_cer": 0.914452788772905, - "eval_loss": 0.01547841913998127, - "eval_runtime": 116.9106, - "eval_samples_per_second": 17.107, - "eval_steps_per_second": 4.277, + "epoch": 0.13, + "eval_cer": 0.881806259456297, + "eval_loss": 0.021124470978975296, + "eval_runtime": 107.4686, + "eval_samples_per_second": 18.61, + "eval_steps_per_second": 4.653, "step": 49000 }, { - "epoch": 0.25, - "learning_rate": 0.0002629107365383354, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002809438515634518, + "loss": 0.0327, "step": 49010 }, { - "epoch": 0.25, - "learning_rate": 0.0002629031688453214, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.0002809399633470803, + "loss": 0.025, "step": 49020 }, { - "epoch": 0.25, - "learning_rate": 0.0002628956011523074, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.00028093607513070886, + "loss": 0.0292, "step": 49030 }, { - "epoch": 0.25, - "learning_rate": 0.00026288803345929335, - "loss": 0.0224, + "epoch": 0.13, + "learning_rate": 0.0002809321869143374, + "loss": 0.0272, "step": 49040 }, { - "epoch": 0.25, - "learning_rate": 0.00026288046576627934, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.00028092829869796594, + "loss": 0.0309, "step": 49050 }, { - "epoch": 0.25, - "learning_rate": 0.0002628728980732653, - "loss": 0.02, + "epoch": 0.13, + "learning_rate": 0.00028092441048159446, + "loss": 0.0352, "step": 49060 }, { - "epoch": 0.25, - "learning_rate": 0.00026286533038025135, - "loss": 0.0183, + "epoch": 0.13, + "learning_rate": 0.00028092052226522297, + "loss": 0.0299, "step": 49070 }, { - "epoch": 0.25, - "learning_rate": 0.00026285776268723733, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028091663404885154, + "loss": 0.0306, "step": 49080 }, { - "epoch": 0.25, - "learning_rate": 0.0002628501949942233, - "loss": 0.0184, + "epoch": 0.13, + "learning_rate": 0.00028091274583248006, + "loss": 0.0239, "step": 49090 }, { - "epoch": 0.25, - "learning_rate": 0.0002628426273012093, - "loss": 0.0265, + "epoch": 0.13, + "learning_rate": 0.00028090885761610857, + "loss": 0.0272, "step": 49100 }, { - "epoch": 0.25, - "learning_rate": 0.0002628350596081953, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028090496939973714, + "loss": 0.0276, "step": 49110 }, { - "epoch": 0.25, - "learning_rate": 0.00026282749191518126, - "loss": 0.0267, + "epoch": 0.13, + "learning_rate": 0.0002809010811833657, + "loss": 0.0355, "step": 49120 }, { - "epoch": 0.25, - "learning_rate": 0.00026281992422216724, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.0002808971929669942, + "loss": 0.0292, "step": 49130 }, { - "epoch": 0.25, - "learning_rate": 0.0002628123565291533, - "loss": 0.0201, + "epoch": 0.13, + "learning_rate": 0.00028089330475062274, + "loss": 0.0361, "step": 49140 }, { - "epoch": 0.25, - "learning_rate": 0.00026280478883613926, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028088941653425125, + "loss": 0.0298, "step": 49150 }, { - "epoch": 0.25, - "learning_rate": 0.00026279722114312524, - "loss": 0.0224, + "epoch": 0.13, + "learning_rate": 0.0002808855283178798, + "loss": 0.0257, "step": 49160 }, { - "epoch": 0.25, - "learning_rate": 0.0002627896534501112, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.00028088164010150833, + "loss": 0.0259, "step": 49170 }, { - "epoch": 0.25, - "learning_rate": 0.0002627820857570972, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.0002808777518851369, + "loss": 0.0255, "step": 49180 }, { - "epoch": 0.25, - "learning_rate": 0.0002627745180640832, - "loss": 0.0164, + "epoch": 0.13, + "learning_rate": 0.0002808738636687654, + "loss": 0.0277, "step": 49190 }, { - "epoch": 0.25, - "learning_rate": 0.0002627669503710692, - "loss": 0.018, + "epoch": 0.13, + "learning_rate": 0.00028086997545239393, + "loss": 0.0282, "step": 49200 }, { - "epoch": 0.25, - "learning_rate": 0.0002627593826780552, - "loss": 0.0173, + "epoch": 0.13, + "learning_rate": 0.0002808660872360225, + "loss": 0.0269, "step": 49210 }, { - "epoch": 0.25, - "learning_rate": 0.0002627518149850412, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.000280862199019651, + "loss": 0.0293, "step": 49220 }, { - "epoch": 0.25, - "learning_rate": 0.00026274424729202716, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.00028085831080327953, + "loss": 0.0295, "step": 49230 }, { - "epoch": 0.25, - "learning_rate": 0.00026273667959901315, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002808544225869081, + "loss": 0.0243, "step": 49240 }, { - "epoch": 0.25, - "learning_rate": 0.00026272911190599913, - "loss": 0.0169, + "epoch": 0.13, + "learning_rate": 0.0002808505343705366, + "loss": 0.0281, "step": 49250 }, { - "epoch": 0.25, - "learning_rate": 0.0002627215442129851, - "loss": 0.0187, + "epoch": 0.13, + "learning_rate": 0.0002808466461541652, + "loss": 0.0358, "step": 49260 }, { - "epoch": 0.25, - "learning_rate": 0.00026271397651997114, - "loss": 0.0195, + "epoch": 0.13, + "learning_rate": 0.0002808427579377937, + "loss": 0.0275, "step": 49270 }, { - "epoch": 0.25, - "learning_rate": 0.0002627064088269571, - "loss": 0.0175, + "epoch": 0.13, + "learning_rate": 0.0002808388697214222, + "loss": 0.0269, "step": 49280 }, { - "epoch": 0.25, - "learning_rate": 0.0002626988411339431, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002808349815050508, + "loss": 0.0233, "step": 49290 }, { - "epoch": 0.25, - "learning_rate": 0.0002626912734409291, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002808310932886793, + "loss": 0.0294, "step": 49300 }, { - "epoch": 0.25, - "learning_rate": 0.00026268370574791507, - "loss": 0.0264, + "epoch": 0.13, + "learning_rate": 0.00028082720507230786, + "loss": 0.0313, "step": 49310 }, { - "epoch": 0.25, - "learning_rate": 0.00026267613805490105, - "loss": 0.0278, + "epoch": 0.13, + "learning_rate": 0.0002808233168559364, + "loss": 0.0321, "step": 49320 }, { - "epoch": 0.25, - "learning_rate": 0.0002626685703618871, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00028081942863956495, + "loss": 0.0236, "step": 49330 }, { - "epoch": 0.25, - "learning_rate": 0.00026266100266887307, - "loss": 0.0231, + "epoch": 0.13, + "learning_rate": 0.00028081554042319346, + "loss": 0.0271, "step": 49340 }, { - "epoch": 0.25, - "learning_rate": 0.00026265343497585905, - "loss": 0.0239, + "epoch": 0.13, + "learning_rate": 0.000280811652206822, + "loss": 0.0241, "step": 49350 }, { - "epoch": 0.25, - "learning_rate": 0.00026264586728284503, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002808077639904505, + "loss": 0.0263, "step": 49360 }, { - "epoch": 0.25, - "learning_rate": 0.000262638299589831, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.00028080387577407906, + "loss": 0.028, "step": 49370 }, { - "epoch": 0.25, - "learning_rate": 0.000262630731896817, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028079998755770757, + "loss": 0.0303, "step": 49380 }, { - "epoch": 0.25, - "learning_rate": 0.00026262316420380303, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.00028079609934133614, + "loss": 0.0297, "step": 49390 }, { - "epoch": 0.25, - "learning_rate": 0.000262615596510789, - "loss": 0.02, + "epoch": 0.13, + "learning_rate": 0.00028079221112496466, + "loss": 0.0262, "step": 49400 }, { - "epoch": 0.25, - "learning_rate": 0.000262608028817775, - "loss": 0.0201, + "epoch": 0.13, + "learning_rate": 0.00028078832290859317, + "loss": 0.0301, "step": 49410 }, { - "epoch": 0.25, - "learning_rate": 0.000262600461124761, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.00028078443469222174, + "loss": 0.0276, "step": 49420 }, { - "epoch": 0.25, - "learning_rate": 0.00026259289343174696, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.00028078054647585025, + "loss": 0.0287, "step": 49430 }, { - "epoch": 0.25, - "learning_rate": 0.00026258532573873294, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.00028077665825947877, + "loss": 0.0292, "step": 49440 }, { - "epoch": 0.25, - "learning_rate": 0.0002625777580457189, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028077277004310734, + "loss": 0.0295, "step": 49450 }, { - "epoch": 0.25, - "learning_rate": 0.00026257019035270495, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.0002807688818267359, + "loss": 0.028, "step": 49460 }, { - "epoch": 0.25, - "learning_rate": 0.00026256262265969094, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002807649936103644, + "loss": 0.0276, "step": 49470 }, { - "epoch": 0.25, - "learning_rate": 0.0002625550549666769, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.00028076110539399294, + "loss": 0.0265, "step": 49480 }, { - "epoch": 0.25, - "learning_rate": 0.0002625474872736629, - "loss": 0.0181, + "epoch": 0.13, + "learning_rate": 0.00028075721717762145, + "loss": 0.0309, "step": 49490 }, { - "epoch": 0.25, - "learning_rate": 0.0002625399195806489, - "loss": 0.0182, + "epoch": 0.13, + "learning_rate": 0.00028075332896125, + "loss": 0.0311, "step": 49500 }, { - "epoch": 0.25, - "learning_rate": 0.00026253235188763486, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00028074944074487853, + "loss": 0.0545, "step": 49510 }, { - "epoch": 0.25, - "learning_rate": 0.0002625247841946209, - "loss": 0.0301, + "epoch": 0.13, + "learning_rate": 0.0002807455525285071, + "loss": 0.0313, "step": 49520 }, { - "epoch": 0.25, - "learning_rate": 0.0002625172165016069, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.0002807416643121356, + "loss": 0.0258, "step": 49530 }, { - "epoch": 0.25, - "learning_rate": 0.00026250964880859286, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.0002807377760957642, + "loss": 0.0303, "step": 49540 }, { - "epoch": 0.25, - "learning_rate": 0.00026250208111557884, - "loss": 0.0226, + "epoch": 0.13, + "learning_rate": 0.0002807338878793927, + "loss": 0.0289, "step": 49550 }, { - "epoch": 0.25, - "learning_rate": 0.0002624945134225648, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.0002807299996630212, + "loss": 0.0299, "step": 49560 }, { - "epoch": 0.25, - "learning_rate": 0.0002624869457295508, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.00028072611144664973, + "loss": 0.0301, "step": 49570 }, { - "epoch": 0.25, - "learning_rate": 0.00026247937803653684, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.0002807222232302783, + "loss": 0.0313, "step": 49580 }, { - "epoch": 0.25, - "learning_rate": 0.0002624718103435228, - "loss": 0.02, + "epoch": 0.13, + "learning_rate": 0.0002807183350139068, + "loss": 0.024, "step": 49590 }, { - "epoch": 0.25, - "learning_rate": 0.0002624642426505088, - "loss": 0.0189, + "epoch": 0.13, + "learning_rate": 0.0002807144467975354, + "loss": 0.0261, "step": 49600 }, { - "epoch": 0.25, - "learning_rate": 0.0002624566749574948, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.0002807105585811639, + "loss": 0.0333, "step": 49610 }, { - "epoch": 0.25, - "learning_rate": 0.00026244910726448077, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.00028070667036479246, + "loss": 0.0305, "step": 49620 }, { - "epoch": 0.25, - "learning_rate": 0.00026244153957146675, - "loss": 0.0176, + "epoch": 0.13, + "learning_rate": 0.000280702782148421, + "loss": 0.0272, "step": 49630 }, { - "epoch": 0.25, - "learning_rate": 0.00026243397187845273, - "loss": 0.0277, + "epoch": 0.13, + "learning_rate": 0.0002806988939320495, + "loss": 0.0264, "step": 49640 }, { - "epoch": 0.25, - "learning_rate": 0.0002624264041854387, - "loss": 0.0259, + "epoch": 0.13, + "learning_rate": 0.000280695005715678, + "loss": 0.031, "step": 49650 }, { - "epoch": 0.25, - "learning_rate": 0.0002624188364924247, - "loss": 0.0293, + "epoch": 0.13, + "learning_rate": 0.0002806911174993066, + "loss": 0.0265, "step": 49660 }, { - "epoch": 0.25, - "learning_rate": 0.0002624112687994107, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00028068722928293514, + "loss": 0.0313, "step": 49670 }, { - "epoch": 0.25, - "learning_rate": 0.00026240370110639665, - "loss": 0.0198, + "epoch": 0.13, + "learning_rate": 0.00028068334106656366, + "loss": 0.0324, "step": 49680 }, { - "epoch": 0.25, - "learning_rate": 0.0002623961334133827, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002806794528501922, + "loss": 0.0316, "step": 49690 }, { - "epoch": 0.25, - "learning_rate": 0.00026238856572036867, - "loss": 0.0217, + "epoch": 0.13, + "learning_rate": 0.0002806755646338207, + "loss": 0.027, "step": 49700 }, { - "epoch": 0.25, - "learning_rate": 0.00026238099802735465, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.00028067167641744926, + "loss": 0.0375, "step": 49710 }, { - "epoch": 0.25, - "learning_rate": 0.00026237343033434063, - "loss": 0.0174, + "epoch": 0.13, + "learning_rate": 0.00028066778820107777, + "loss": 0.0281, "step": 49720 }, { - "epoch": 0.25, - "learning_rate": 0.0002623658626413266, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.00028066389998470634, + "loss": 0.0231, "step": 49730 }, { - "epoch": 0.25, - "learning_rate": 0.0002623582949483126, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.00028066001176833485, + "loss": 0.0346, "step": 49740 }, { - "epoch": 0.25, - "learning_rate": 0.00026235072725529863, - "loss": 0.0189, + "epoch": 0.13, + "learning_rate": 0.0002806561235519634, + "loss": 0.0316, "step": 49750 }, { - "epoch": 0.25, - "learning_rate": 0.0002623431595622846, - "loss": 0.019, + "epoch": 0.13, + "learning_rate": 0.00028065223533559194, + "loss": 0.0265, "step": 49760 }, { - "epoch": 0.25, - "learning_rate": 0.0002623355918692706, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028064834711922045, + "loss": 0.0267, "step": 49770 }, { - "epoch": 0.25, - "learning_rate": 0.0002623280241762566, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00028064445890284897, + "loss": 0.03, "step": 49780 }, { - "epoch": 0.25, - "learning_rate": 0.00026232045648324256, - "loss": 0.0243, + "epoch": 0.13, + "learning_rate": 0.00028064057068647754, + "loss": 0.0275, "step": 49790 }, { - "epoch": 0.25, - "learning_rate": 0.00026231288879022854, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.0002806366824701061, + "loss": 0.0276, "step": 49800 }, { - "epoch": 0.25, - "learning_rate": 0.0002623053210972146, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.0002806327942537346, + "loss": 0.0302, "step": 49810 }, { - "epoch": 0.25, - "learning_rate": 0.00026229775340420056, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.00028062890603736313, + "loss": 0.041, "step": 49820 }, { - "epoch": 0.25, - "learning_rate": 0.00026229018571118654, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002806250178209917, + "loss": 0.029, "step": 49830 }, { - "epoch": 0.25, - "learning_rate": 0.0002622826180181725, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.0002806211296046202, + "loss": 0.0273, "step": 49840 }, { - "epoch": 0.25, - "learning_rate": 0.0002622750503251585, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.00028061724138824873, + "loss": 0.0328, "step": 49850 }, { - "epoch": 0.25, - "learning_rate": 0.0002622674826321445, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.0002806133531718773, + "loss": 0.0269, "step": 49860 }, { - "epoch": 0.25, - "learning_rate": 0.00026225991493913046, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.0002806094649555058, + "loss": 0.0333, "step": 49870 }, { - "epoch": 0.25, - "learning_rate": 0.0002622523472461165, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.0002806055767391344, + "loss": 0.0357, "step": 49880 }, { - "epoch": 0.25, - "learning_rate": 0.0002622447795531025, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.0002806016885227629, + "loss": 0.0299, "step": 49890 }, { - "epoch": 0.25, - "learning_rate": 0.00026223721186008846, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.0002805978003063914, + "loss": 0.0313, "step": 49900 }, { - "epoch": 0.25, - "learning_rate": 0.00026222964416707444, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.00028059391209001993, + "loss": 0.0323, "step": 49910 }, { - "epoch": 0.25, - "learning_rate": 0.0002622220764740604, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.0002805900238736485, + "loss": 0.0291, "step": 49920 }, { - "epoch": 0.25, - "learning_rate": 0.0002622145087810464, - "loss": 0.0262, + "epoch": 0.13, + "learning_rate": 0.000280586135657277, + "loss": 0.0295, "step": 49930 }, { - "epoch": 0.25, - "learning_rate": 0.00026220694108803244, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.0002805822474409056, + "loss": 0.0317, "step": 49940 }, { - "epoch": 0.25, - "learning_rate": 0.0002621993733950184, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002805783592245341, + "loss": 0.0314, "step": 49950 }, { - "epoch": 0.25, - "learning_rate": 0.0002621918057020044, - "loss": 0.0185, + "epoch": 0.13, + "learning_rate": 0.00028057447100816266, + "loss": 0.0293, "step": 49960 }, { - "epoch": 0.25, - "learning_rate": 0.0002621842380089904, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.0002805705827917912, + "loss": 0.027, "step": 49970 }, { - "epoch": 0.25, - "learning_rate": 0.00026217667031597637, - "loss": 0.0246, + "epoch": 0.13, + "learning_rate": 0.0002805666945754197, + "loss": 0.0279, "step": 49980 }, { - "epoch": 0.25, - "learning_rate": 0.00026216910262296235, - "loss": 0.0191, + "epoch": 0.13, + "learning_rate": 0.0002805628063590482, + "loss": 0.0253, "step": 49990 }, { - "epoch": 0.25, - "learning_rate": 0.00026216153492994833, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.0002805589181426768, + "loss": 0.0373, "step": 50000 }, { - "epoch": 0.25, - "eval_cer": 0.9144683151109114, - "eval_loss": 0.015245326794683933, - "eval_runtime": 117.0207, - "eval_samples_per_second": 17.091, - "eval_steps_per_second": 4.273, + "epoch": 0.13, + "eval_cer": 0.881797861634692, + "eval_loss": 0.021269751712679863, + "eval_runtime": 107.6876, + "eval_samples_per_second": 18.572, + "eval_steps_per_second": 4.643, "step": 50000 }, { - "epoch": 0.25, - "learning_rate": 0.00026215396723693437, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.00028055502992630534, + "loss": 0.028, "step": 50010 }, { - "epoch": 0.25, - "learning_rate": 0.00026214639954392035, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.00028055114170993386, + "loss": 0.0291, "step": 50020 }, { - "epoch": 0.25, - "learning_rate": 0.00026213883185090633, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.00028054725349356237, + "loss": 0.0269, "step": 50030 }, { - "epoch": 0.25, - "learning_rate": 0.0002621312641578923, - "loss": 0.0178, + "epoch": 0.13, + "learning_rate": 0.00028054336527719094, + "loss": 0.0263, "step": 50040 }, { - "epoch": 0.25, - "learning_rate": 0.0002621236964648783, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028053947706081946, + "loss": 0.034, "step": 50050 }, { - "epoch": 0.25, - "learning_rate": 0.0002621161287718643, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00028053558884444797, + "loss": 0.0332, "step": 50060 }, { - "epoch": 0.25, - "learning_rate": 0.0002621085610788503, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00028053170062807654, + "loss": 0.0274, "step": 50070 }, { - "epoch": 0.25, - "learning_rate": 0.0002621009933858363, - "loss": 0.0188, + "epoch": 0.13, + "learning_rate": 0.00028052781241170505, + "loss": 0.0248, "step": 50080 }, { - "epoch": 0.25, - "learning_rate": 0.0002620934256928223, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.0002805239241953336, + "loss": 0.0263, "step": 50090 }, { - "epoch": 0.25, - "learning_rate": 0.00026208585799980825, - "loss": 0.0258, + "epoch": 0.13, + "learning_rate": 0.00028052003597896214, + "loss": 0.0294, "step": 50100 }, { - "epoch": 0.25, - "learning_rate": 0.00026207829030679424, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.00028051614776259065, + "loss": 0.0294, "step": 50110 }, { - "epoch": 0.25, - "learning_rate": 0.0002620707226137802, - "loss": 0.0217, + "epoch": 0.13, + "learning_rate": 0.00028051225954621917, + "loss": 0.0273, "step": 50120 }, { - "epoch": 0.25, - "learning_rate": 0.00026206315492076625, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.00028050837132984773, + "loss": 0.0308, "step": 50130 }, { - "epoch": 0.25, - "learning_rate": 0.00026205558722775223, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.00028050448311347625, + "loss": 0.0288, "step": 50140 }, { - "epoch": 0.25, - "learning_rate": 0.0002620480195347382, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.0002805005948971048, + "loss": 0.0287, "step": 50150 }, { - "epoch": 0.25, - "learning_rate": 0.0002620404518417242, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00028049670668073333, + "loss": 0.0277, "step": 50160 }, { - "epoch": 0.25, - "learning_rate": 0.0002620328841487102, - "loss": 0.0217, + "epoch": 0.13, + "learning_rate": 0.0002804928184643619, + "loss": 0.0346, "step": 50170 }, { - "epoch": 0.25, - "learning_rate": 0.00026202531645569616, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.0002804889302479904, + "loss": 0.029, "step": 50180 }, { - "epoch": 0.25, - "learning_rate": 0.00026201774876268214, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.00028048504203161893, + "loss": 0.028, "step": 50190 }, { - "epoch": 0.25, - "learning_rate": 0.0002620101810696682, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002804811538152475, + "loss": 0.0286, "step": 50200 }, { - "epoch": 0.25, - "learning_rate": 0.00026200261337665416, - "loss": 0.0253, + "epoch": 0.13, + "learning_rate": 0.000280477265598876, + "loss": 0.0264, "step": 50210 }, { - "epoch": 0.25, - "learning_rate": 0.00026199504568364014, - "loss": 0.0251, + "epoch": 0.13, + "learning_rate": 0.0002804733773825046, + "loss": 0.0299, "step": 50220 }, { - "epoch": 0.25, - "learning_rate": 0.0002619874779906261, - "loss": 0.02, + "epoch": 0.13, + "learning_rate": 0.0002804694891661331, + "loss": 0.0304, "step": 50230 }, { - "epoch": 0.25, - "learning_rate": 0.0002619799102976121, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002804656009497616, + "loss": 0.0308, "step": 50240 }, { - "epoch": 0.25, - "learning_rate": 0.0002619723426045981, - "loss": 0.0262, + "epoch": 0.13, + "learning_rate": 0.0002804617127333902, + "loss": 0.028, "step": 50250 }, { - "epoch": 0.25, - "learning_rate": 0.0002619647749115841, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.0002804578245170187, + "loss": 0.0283, "step": 50260 }, { - "epoch": 0.25, - "learning_rate": 0.0002619572072185701, - "loss": 0.0235, + "epoch": 0.13, + "learning_rate": 0.0002804539363006472, + "loss": 0.0331, "step": 50270 }, { - "epoch": 0.25, - "learning_rate": 0.0002619496395255561, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.0002804500480842758, + "loss": 0.0288, "step": 50280 }, { - "epoch": 0.25, - "learning_rate": 0.00026194207183254206, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.0002804461598679043, + "loss": 0.0278, "step": 50290 }, { - "epoch": 0.25, - "learning_rate": 0.00026193450413952805, - "loss": 0.019, + "epoch": 0.13, + "learning_rate": 0.00028044227165153286, + "loss": 0.0298, "step": 50300 }, { - "epoch": 0.25, - "learning_rate": 0.00026192693644651403, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002804383834351614, + "loss": 0.0261, "step": 50310 }, { - "epoch": 0.25, - "learning_rate": 0.00026191936875350006, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002804344952187899, + "loss": 0.0255, "step": 50320 }, { - "epoch": 0.25, - "learning_rate": 0.00026191180106048604, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00028043060700241846, + "loss": 0.0331, "step": 50330 }, { - "epoch": 0.25, - "learning_rate": 0.000261904233367472, - "loss": 0.0252, + "epoch": 0.13, + "learning_rate": 0.000280426718786047, + "loss": 0.031, "step": 50340 }, { - "epoch": 0.25, - "learning_rate": 0.000261896665674458, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.00028042283056967554, + "loss": 0.0292, "step": 50350 }, { - "epoch": 0.25, - "learning_rate": 0.000261889097981444, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.00028041894235330406, + "loss": 0.0299, "step": 50360 }, { - "epoch": 0.25, - "learning_rate": 0.00026188153028842997, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.00028041505413693257, + "loss": 0.0222, "step": 50370 }, { - "epoch": 0.25, - "learning_rate": 0.00026187396259541595, + "epoch": 0.13, + "learning_rate": 0.00028041116592056114, "loss": 0.0233, "step": 50380 }, { - "epoch": 0.25, - "learning_rate": 0.000261866394902402, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.00028040727770418965, + "loss": 0.0307, "step": 50390 }, { - "epoch": 0.25, - "learning_rate": 0.00026185882720938797, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.00028040338948781817, + "loss": 0.0248, "step": 50400 }, { - "epoch": 0.25, - "learning_rate": 0.00026185125951637395, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.00028039950127144674, + "loss": 0.0288, "step": 50410 }, { - "epoch": 0.25, - "learning_rate": 0.00026184369182335993, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.00028039561305507525, + "loss": 0.0296, "step": 50420 }, { - "epoch": 0.25, - "learning_rate": 0.0002618361241303459, - "loss": 0.0183, + "epoch": 0.13, + "learning_rate": 0.0002803917248387038, + "loss": 0.0241, "step": 50430 }, { - "epoch": 0.25, - "learning_rate": 0.0002618285564373319, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.00028038783662233234, + "loss": 0.0219, "step": 50440 }, { - "epoch": 0.25, - "learning_rate": 0.00026182098874431793, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.00028038394840596085, + "loss": 0.026, "step": 50450 }, { - "epoch": 0.25, - "learning_rate": 0.0002618134210513039, - "loss": 0.019, + "epoch": 0.13, + "learning_rate": 0.0002803800601895894, + "loss": 0.0288, "step": 50460 }, { - "epoch": 0.25, - "learning_rate": 0.0002618058533582899, - "loss": 0.0195, + "epoch": 0.13, + "learning_rate": 0.00028037617197321793, + "loss": 0.0256, "step": 50470 }, { - "epoch": 0.25, - "learning_rate": 0.0002617982856652759, - "loss": 0.0182, + "epoch": 0.13, + "learning_rate": 0.00028037228375684645, + "loss": 0.0286, "step": 50480 }, { - "epoch": 0.25, - "learning_rate": 0.00026179071797226186, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.000280368395540475, + "loss": 0.0282, "step": 50490 }, { - "epoch": 0.25, - "learning_rate": 0.00026178315027924784, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.0002803645073241036, + "loss": 0.0251, "step": 50500 }, { - "epoch": 0.25, - "learning_rate": 0.0002617755825862338, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.0002803606191077321, + "loss": 0.0281, "step": 50510 }, { - "epoch": 0.25, - "learning_rate": 0.00026176801489321985, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.0002803567308913606, + "loss": 0.028, "step": 50520 }, { - "epoch": 0.25, - "learning_rate": 0.00026176044720020584, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.00028035284267498913, + "loss": 0.0279, "step": 50530 }, { - "epoch": 0.25, - "learning_rate": 0.0002617528795071918, - "loss": 0.0167, + "epoch": 0.13, + "learning_rate": 0.0002803489544586177, + "loss": 0.0272, "step": 50540 }, { - "epoch": 0.26, - "learning_rate": 0.0002617453118141778, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.0002803450662422462, + "loss": 0.029, "step": 50550 }, { - "epoch": 0.26, - "learning_rate": 0.0002617377441211638, - "loss": 0.0187, + "epoch": 0.13, + "learning_rate": 0.0002803411780258748, + "loss": 0.028, "step": 50560 }, { - "epoch": 0.26, - "learning_rate": 0.00026173017642814976, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002803372898095033, + "loss": 0.0258, "step": 50570 }, { - "epoch": 0.26, - "learning_rate": 0.0002617226087351358, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.00028033340159313186, + "loss": 0.0269, "step": 50580 }, { - "epoch": 0.26, - "learning_rate": 0.0002617150410421218, - "loss": 0.0193, + "epoch": 0.13, + "learning_rate": 0.0002803295133767604, + "loss": 0.0291, "step": 50590 }, { - "epoch": 0.26, - "learning_rate": 0.00026170747334910776, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.0002803256251603889, + "loss": 0.0243, "step": 50600 }, { - "epoch": 0.26, - "learning_rate": 0.00026169990565609374, - "loss": 0.0174, + "epoch": 0.13, + "learning_rate": 0.0002803217369440174, + "loss": 0.0269, "step": 50610 }, { - "epoch": 0.26, - "learning_rate": 0.0002616923379630797, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.000280317848727646, + "loss": 0.0329, "step": 50620 }, { - "epoch": 0.26, - "learning_rate": 0.0002616847702700657, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.0002803139605112745, + "loss": 0.0312, "step": 50630 }, { - "epoch": 0.26, - "learning_rate": 0.00026167720257705174, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00028031007229490306, + "loss": 0.0294, "step": 50640 }, { - "epoch": 0.26, - "learning_rate": 0.0002616696348840377, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.0002803061840785316, + "loss": 0.0263, "step": 50650 }, { - "epoch": 0.26, - "learning_rate": 0.0002616620671910237, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.0002803022958621601, + "loss": 0.0208, "step": 50660 }, { - "epoch": 0.26, - "learning_rate": 0.0002616544994980097, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.00028029840764578866, + "loss": 0.0259, "step": 50670 }, { - "epoch": 0.26, - "learning_rate": 0.00026164693180499567, - "loss": 0.0222, + "epoch": 0.13, + "learning_rate": 0.00028029451942941717, + "loss": 0.0322, "step": 50680 }, { - "epoch": 0.26, - "learning_rate": 0.00026163936411198165, - "loss": 0.024, + "epoch": 0.13, + "learning_rate": 0.0002802906312130457, + "loss": 0.0251, "step": 50690 }, { - "epoch": 0.26, - "learning_rate": 0.00026163179641896763, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.00028028674299667426, + "loss": 0.0364, "step": 50700 }, { - "epoch": 0.26, - "learning_rate": 0.00026162422872595366, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.0002802828547803028, + "loss": 0.0249, "step": 50710 }, { - "epoch": 0.26, - "learning_rate": 0.00026161666103293965, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.00028027896656393134, + "loss": 0.0241, "step": 50720 }, { - "epoch": 0.26, - "learning_rate": 0.00026160909333992563, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.00028027507834755985, + "loss": 0.0314, "step": 50730 }, { - "epoch": 0.26, - "learning_rate": 0.0002616015256469116, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.00028027119013118837, + "loss": 0.0283, "step": 50740 }, { - "epoch": 0.26, - "learning_rate": 0.0002615939579538976, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.00028026730191481694, + "loss": 0.027, "step": 50750 }, { - "epoch": 0.26, - "learning_rate": 0.00026158639026088357, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.00028026341369844545, + "loss": 0.0269, "step": 50760 }, { - "epoch": 0.26, - "learning_rate": 0.0002615788225678696, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.000280259525482074, + "loss": 0.0276, "step": 50770 }, { - "epoch": 0.26, - "learning_rate": 0.0002615712548748556, - "loss": 0.0254, + "epoch": 0.13, + "learning_rate": 0.00028025563726570253, + "loss": 0.028, "step": 50780 }, { - "epoch": 0.26, - "learning_rate": 0.00026156368718184157, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.0002802517490493311, + "loss": 0.0344, "step": 50790 }, { - "epoch": 0.26, - "learning_rate": 0.00026155611948882755, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.0002802478608329596, + "loss": 0.0257, "step": 50800 }, { - "epoch": 0.26, - "learning_rate": 0.00026154855179581353, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028024397261658813, + "loss": 0.0267, "step": 50810 }, { - "epoch": 0.26, - "learning_rate": 0.0002615409841027995, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.00028024008440021665, + "loss": 0.0282, "step": 50820 }, { - "epoch": 0.26, - "learning_rate": 0.00026153341640978555, - "loss": 0.0193, + "epoch": 0.13, + "learning_rate": 0.0002802361961838452, + "loss": 0.0238, "step": 50830 }, { - "epoch": 0.26, - "learning_rate": 0.00026152584871677153, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.00028023230796747373, + "loss": 0.0294, "step": 50840 }, { - "epoch": 0.26, - "learning_rate": 0.0002615182810237575, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002802284197511023, + "loss": 0.0288, "step": 50850 }, { - "epoch": 0.26, - "learning_rate": 0.0002615107133307435, - "loss": 0.021, + "epoch": 0.13, + "learning_rate": 0.0002802245315347308, + "loss": 0.0303, "step": 50860 }, { - "epoch": 0.26, - "learning_rate": 0.0002615031456377295, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028022064331835933, + "loss": 0.0335, "step": 50870 }, { - "epoch": 0.26, - "learning_rate": 0.00026149557794471546, - "loss": 0.0209, + "epoch": 0.13, + "learning_rate": 0.0002802167551019879, + "loss": 0.0314, "step": 50880 }, { - "epoch": 0.26, - "learning_rate": 0.00026148801025170144, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.0002802128668856164, + "loss": 0.0256, "step": 50890 }, { - "epoch": 0.26, - "learning_rate": 0.0002614804425586875, - "loss": 0.0198, + "epoch": 0.13, + "learning_rate": 0.000280208978669245, + "loss": 0.0281, "step": 50900 }, { - "epoch": 0.26, - "learning_rate": 0.0002614728748656734, - "loss": 0.0215, + "epoch": 0.13, + "learning_rate": 0.0002802050904528735, + "loss": 0.0309, "step": 50910 }, { - "epoch": 0.26, - "learning_rate": 0.0002614653071726594, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.00028020120223650206, + "loss": 0.0277, "step": 50920 }, { - "epoch": 0.26, - "learning_rate": 0.00026145773947964536, - "loss": 0.0217, + "epoch": 0.13, + "learning_rate": 0.0002801973140201306, + "loss": 0.0313, "step": 50930 }, { - "epoch": 0.26, - "learning_rate": 0.0002614501717866314, - "loss": 0.0229, + "epoch": 0.13, + "learning_rate": 0.0002801934258037591, + "loss": 0.0286, "step": 50940 }, { - "epoch": 0.26, - "learning_rate": 0.0002614426040936174, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.0002801895375873876, + "loss": 0.0263, "step": 50950 }, { - "epoch": 0.26, - "learning_rate": 0.00026143503640060336, - "loss": 0.018, + "epoch": 0.13, + "learning_rate": 0.0002801856493710162, + "loss": 0.0297, "step": 50960 }, { - "epoch": 0.26, - "learning_rate": 0.00026142746870758934, - "loss": 0.0183, + "epoch": 0.13, + "learning_rate": 0.0002801817611546447, + "loss": 0.0256, "step": 50970 }, { - "epoch": 0.26, - "learning_rate": 0.0002614199010145753, - "loss": 0.018, + "epoch": 0.13, + "learning_rate": 0.00028017787293827326, + "loss": 0.0248, "step": 50980 }, { - "epoch": 0.26, - "learning_rate": 0.0002614123333215613, - "loss": 0.0205, + "epoch": 0.13, + "learning_rate": 0.0002801739847219018, + "loss": 0.0314, "step": 50990 }, { - "epoch": 0.26, - "learning_rate": 0.00026140476562854734, - "loss": 0.022, + "epoch": 0.13, + "learning_rate": 0.00028017009650553034, + "loss": 0.0292, "step": 51000 }, { - "epoch": 0.26, - "eval_cer": 0.9144770486760401, - "eval_loss": 0.01605140045285225, - "eval_runtime": 117.035, - "eval_samples_per_second": 17.089, - "eval_steps_per_second": 4.272, + "epoch": 0.13, + "eval_cer": 0.8818202558256388, + "eval_loss": 0.020461125299334526, + "eval_runtime": 107.4733, + "eval_samples_per_second": 18.609, + "eval_steps_per_second": 4.652, "step": 51000 }, { - "epoch": 0.26, - "learning_rate": 0.0002613971979355333, - "loss": 0.019, + "epoch": 0.13, + "learning_rate": 0.00028016620828915886, + "loss": 0.028, "step": 51010 }, { - "epoch": 0.26, - "learning_rate": 0.0002613896302425193, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.00028016232007278737, + "loss": 0.0323, "step": 51020 }, { - "epoch": 0.26, - "learning_rate": 0.0002613820625495053, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.0002801584318564159, + "loss": 0.0288, "step": 51030 }, { - "epoch": 0.26, - "learning_rate": 0.00026137449485649127, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00028015454364004445, + "loss": 0.0278, "step": 51040 }, { - "epoch": 0.26, - "learning_rate": 0.00026136692716347725, - "loss": 0.017, + "epoch": 0.13, + "learning_rate": 0.000280150655423673, + "loss": 0.0249, "step": 51050 }, { - "epoch": 0.26, - "learning_rate": 0.00026135935947046323, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.00028014676720730154, + "loss": 0.0273, "step": 51060 }, { - "epoch": 0.26, - "learning_rate": 0.00026135179177744927, - "loss": 0.02, + "epoch": 0.13, + "learning_rate": 0.00028014287899093005, + "loss": 0.0278, "step": 51070 }, { - "epoch": 0.26, - "learning_rate": 0.00026134422408443525, - "loss": 0.0178, + "epoch": 0.13, + "learning_rate": 0.0002801389907745586, + "loss": 0.0275, "step": 51080 }, { - "epoch": 0.26, - "learning_rate": 0.00026133665639142123, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.00028013510255818714, + "loss": 0.0269, "step": 51090 }, { - "epoch": 0.26, - "learning_rate": 0.0002613290886984072, - "loss": 0.0243, + "epoch": 0.13, + "learning_rate": 0.00028013121434181565, + "loss": 0.0232, "step": 51100 }, { - "epoch": 0.26, - "learning_rate": 0.0002613215210053932, - "loss": 0.0243, + "epoch": 0.13, + "learning_rate": 0.0002801273261254442, + "loss": 0.0294, "step": 51110 }, { - "epoch": 0.26, - "learning_rate": 0.0002613139533123792, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.00028012343790907273, + "loss": 0.0274, "step": 51120 }, { - "epoch": 0.26, - "learning_rate": 0.0002613063856193652, - "loss": 0.0265, + "epoch": 0.13, + "learning_rate": 0.0002801195496927013, + "loss": 0.0305, "step": 51130 }, { - "epoch": 0.26, - "learning_rate": 0.0002612988179263512, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002801156614763298, + "loss": 0.0256, "step": 51140 }, { - "epoch": 0.26, - "learning_rate": 0.0002612912502333372, - "loss": 0.0224, + "epoch": 0.13, + "learning_rate": 0.00028011177325995833, + "loss": 0.0367, "step": 51150 }, { - "epoch": 0.26, - "learning_rate": 0.00026128368254032315, - "loss": 0.0209, + "epoch": 0.13, + "learning_rate": 0.00028010788504358685, + "loss": 0.027, "step": 51160 }, { - "epoch": 0.26, - "learning_rate": 0.00026127611484730914, - "loss": 0.0192, + "epoch": 0.13, + "learning_rate": 0.0002801039968272154, + "loss": 0.0288, "step": 51170 }, { - "epoch": 0.26, - "learning_rate": 0.0002612685471542951, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.00028010010861084393, + "loss": 0.0298, "step": 51180 }, { - "epoch": 0.26, - "learning_rate": 0.00026126097946128115, - "loss": 0.023, + "epoch": 0.13, + "learning_rate": 0.0002800962203944725, + "loss": 0.0238, "step": 51190 }, { - "epoch": 0.26, - "learning_rate": 0.00026125341176826713, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.000280092332178101, + "loss": 0.0255, "step": 51200 }, { - "epoch": 0.26, - "learning_rate": 0.0002612458440752531, - "loss": 0.0201, + "epoch": 0.13, + "learning_rate": 0.0002800884439617296, + "loss": 0.0274, "step": 51210 }, { - "epoch": 0.26, - "learning_rate": 0.0002612382763822391, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.0002800845557453581, + "loss": 0.0322, "step": 51220 }, { - "epoch": 0.26, - "learning_rate": 0.0002612307086892251, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.0002800806675289866, + "loss": 0.0251, "step": 51230 }, { - "epoch": 0.26, - "learning_rate": 0.00026122314099621106, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.0002800767793126151, + "loss": 0.0273, "step": 51240 }, { - "epoch": 0.26, - "learning_rate": 0.00026121557330319704, - "loss": 0.0187, + "epoch": 0.13, + "learning_rate": 0.0002800728910962437, + "loss": 0.0275, "step": 51250 }, { - "epoch": 0.26, - "learning_rate": 0.0002612080056101831, - "loss": 0.0227, + "epoch": 0.13, + "learning_rate": 0.00028006900287987226, + "loss": 0.0223, "step": 51260 }, { - "epoch": 0.26, - "learning_rate": 0.00026120043791716906, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.0002800651146635008, + "loss": 0.0266, "step": 51270 }, { - "epoch": 0.26, - "learning_rate": 0.00026119287022415504, - "loss": 0.0226, + "epoch": 0.13, + "learning_rate": 0.0002800612264471293, + "loss": 0.0312, "step": 51280 }, { - "epoch": 0.26, - "learning_rate": 0.000261185302531141, - "loss": 0.0201, + "epoch": 0.13, + "learning_rate": 0.00028005733823075786, + "loss": 0.028, "step": 51290 }, { - "epoch": 0.26, - "learning_rate": 0.000261177734838127, - "loss": 0.0182, + "epoch": 0.13, + "learning_rate": 0.0002800534500143864, + "loss": 0.0317, "step": 51300 }, { - "epoch": 0.26, - "learning_rate": 0.000261170167145113, - "loss": 0.0282, + "epoch": 0.13, + "learning_rate": 0.0002800495617980149, + "loss": 0.0269, "step": 51310 }, { - "epoch": 0.26, - "learning_rate": 0.000261162599452099, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.00028004567358164346, + "loss": 0.0353, "step": 51320 }, { - "epoch": 0.26, - "learning_rate": 0.000261155031759085, - "loss": 0.0216, + "epoch": 0.13, + "learning_rate": 0.00028004178536527197, + "loss": 0.0361, "step": 51330 }, { - "epoch": 0.26, - "learning_rate": 0.000261147464066071, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.00028003789714890054, + "loss": 0.0274, "step": 51340 }, { - "epoch": 0.26, - "learning_rate": 0.00026113989637305696, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.00028003400893252906, + "loss": 0.0253, "step": 51350 }, { - "epoch": 0.26, - "learning_rate": 0.00026113232868004295, - "loss": 0.0178, + "epoch": 0.13, + "learning_rate": 0.00028003012071615757, + "loss": 0.0251, "step": 51360 }, { - "epoch": 0.26, - "learning_rate": 0.00026112476098702893, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.0002800262324997861, + "loss": 0.0277, "step": 51370 }, { - "epoch": 0.26, - "learning_rate": 0.00026111719329401496, - "loss": 0.0244, + "epoch": 0.13, + "learning_rate": 0.00028002234428341465, + "loss": 0.0279, "step": 51380 }, { - "epoch": 0.26, - "learning_rate": 0.00026110962560100094, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.0002800184560670432, + "loss": 0.0306, "step": 51390 }, { - "epoch": 0.26, - "learning_rate": 0.0002611020579079869, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.00028001456785067174, + "loss": 0.0273, "step": 51400 }, { - "epoch": 0.26, - "learning_rate": 0.0002610944902149729, - "loss": 0.0206, + "epoch": 0.13, + "learning_rate": 0.00028001067963430025, + "loss": 0.0254, "step": 51410 }, { - "epoch": 0.26, - "learning_rate": 0.0002610869225219589, - "loss": 0.0204, + "epoch": 0.13, + "learning_rate": 0.0002800067914179288, + "loss": 0.0327, "step": 51420 }, { - "epoch": 0.26, - "learning_rate": 0.00026107935482894487, - "loss": 0.0269, + "epoch": 0.13, + "learning_rate": 0.00028000290320155733, + "loss": 0.0243, "step": 51430 }, { - "epoch": 0.26, - "learning_rate": 0.00026107178713593085, - "loss": 0.0278, + "epoch": 0.13, + "learning_rate": 0.00027999901498518585, + "loss": 0.0327, "step": 51440 }, { - "epoch": 0.26, - "learning_rate": 0.0002610642194429169, - "loss": 0.0228, + "epoch": 0.13, + "learning_rate": 0.0002799951267688144, + "loss": 0.0299, "step": 51450 }, { - "epoch": 0.26, - "learning_rate": 0.00026105665174990287, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.00027999123855244293, + "loss": 0.0243, "step": 51460 }, { - "epoch": 0.26, - "learning_rate": 0.00026104908405688885, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.0002799873503360715, + "loss": 0.0336, "step": 51470 }, { - "epoch": 0.26, - "learning_rate": 0.00026104151636387483, - "loss": 0.0218, + "epoch": 0.13, + "learning_rate": 0.0002799834621197, + "loss": 0.0253, "step": 51480 }, { - "epoch": 0.26, - "learning_rate": 0.0002610339486708608, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.00027997957390332853, + "loss": 0.0293, "step": 51490 }, { - "epoch": 0.26, - "learning_rate": 0.0002610263809778468, - "loss": 0.0209, + "epoch": 0.13, + "learning_rate": 0.0002799756856869571, + "loss": 0.0309, "step": 51500 }, { - "epoch": 0.26, - "learning_rate": 0.00026101881328483283, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.0002799717974705856, + "loss": 0.0287, "step": 51510 }, { - "epoch": 0.26, - "learning_rate": 0.0002610112455918188, - "loss": 0.0222, + "epoch": 0.13, + "learning_rate": 0.00027996790925421413, + "loss": 0.0306, "step": 51520 }, { - "epoch": 0.26, - "learning_rate": 0.0002610036778988048, - "loss": 0.0191, + "epoch": 0.13, + "learning_rate": 0.0002799640210378427, + "loss": 0.0288, "step": 51530 }, { - "epoch": 0.26, - "learning_rate": 0.0002609961102057908, - "loss": 0.0196, + "epoch": 0.13, + "learning_rate": 0.00027996013282147127, + "loss": 0.0249, "step": 51540 }, { - "epoch": 0.26, - "learning_rate": 0.00026098854251277676, - "loss": 0.0214, + "epoch": 0.13, + "learning_rate": 0.0002799562446050998, + "loss": 0.0277, "step": 51550 }, { - "epoch": 0.26, - "learning_rate": 0.00026098097481976274, - "loss": 0.016, + "epoch": 0.13, + "learning_rate": 0.0002799523563887283, + "loss": 0.0294, "step": 51560 }, { - "epoch": 0.26, - "learning_rate": 0.0002609734071267487, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002799484681723568, + "loss": 0.0297, "step": 51570 }, { - "epoch": 0.26, - "learning_rate": 0.00026096583943373475, - "loss": 0.0242, + "epoch": 0.13, + "learning_rate": 0.0002799445799559854, + "loss": 0.029, "step": 51580 }, { - "epoch": 0.26, - "learning_rate": 0.00026095827174072074, - "loss": 0.018, + "epoch": 0.13, + "learning_rate": 0.0002799406917396139, + "loss": 0.0294, "step": 51590 }, { - "epoch": 0.26, - "learning_rate": 0.0002609507040477067, - "loss": 0.0201, + "epoch": 0.13, + "learning_rate": 0.00027993680352324246, + "loss": 0.0252, "step": 51600 }, { - "epoch": 0.26, - "learning_rate": 0.0002609431363546927, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.000279932915306871, + "loss": 0.0259, "step": 51610 }, { - "epoch": 0.26, - "learning_rate": 0.0002609355686616787, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.0002799290270904995, + "loss": 0.0261, "step": 51620 }, { - "epoch": 0.26, - "learning_rate": 0.00026092800096866466, - "loss": 0.0198, + "epoch": 0.13, + "learning_rate": 0.00027992513887412806, + "loss": 0.0277, "step": 51630 }, { - "epoch": 0.26, - "learning_rate": 0.0002609204332756507, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.0002799212506577566, + "loss": 0.0225, "step": 51640 }, { - "epoch": 0.26, - "learning_rate": 0.0002609128655826367, - "loss": 0.0186, + "epoch": 0.13, + "learning_rate": 0.0002799173624413851, + "loss": 0.031, "step": 51650 }, { - "epoch": 0.26, - "learning_rate": 0.00026090529788962266, - "loss": 0.019, + "epoch": 0.13, + "learning_rate": 0.00027991347422501366, + "loss": 0.0316, "step": 51660 }, { - "epoch": 0.26, - "learning_rate": 0.00026089773019660864, - "loss": 0.0186, + "epoch": 0.13, + "learning_rate": 0.00027990958600864217, + "loss": 0.026, "step": 51670 }, { - "epoch": 0.26, - "learning_rate": 0.0002608901625035946, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.00027990569779227074, + "loss": 0.031, "step": 51680 }, { - "epoch": 0.26, - "learning_rate": 0.0002608825948105806, - "loss": 0.0175, + "epoch": 0.13, + "learning_rate": 0.00027990180957589925, + "loss": 0.0294, "step": 51690 }, { - "epoch": 0.26, - "learning_rate": 0.00026087502711756664, - "loss": 0.0212, + "epoch": 0.13, + "learning_rate": 0.00027989792135952777, + "loss": 0.0216, "step": 51700 }, { - "epoch": 0.26, - "learning_rate": 0.0002608674594245526, - "loss": 0.0241, + "epoch": 0.13, + "learning_rate": 0.00027989403314315634, + "loss": 0.0308, "step": 51710 }, { - "epoch": 0.26, - "learning_rate": 0.0002608598917315386, - "loss": 0.0191, + "epoch": 0.13, + "learning_rate": 0.00027989014492678485, + "loss": 0.0441, "step": 51720 }, { - "epoch": 0.26, - "learning_rate": 0.0002608523240385246, - "loss": 0.0188, + "epoch": 0.13, + "learning_rate": 0.00027988625671041337, + "loss": 0.0328, "step": 51730 }, { - "epoch": 0.26, - "learning_rate": 0.00026084475634551057, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.00027988236849404194, + "loss": 0.0343, "step": 51740 }, { - "epoch": 0.26, - "learning_rate": 0.00026083718865249655, - "loss": 0.0202, + "epoch": 0.13, + "learning_rate": 0.0002798784802776705, + "loss": 0.0302, "step": 51750 }, { - "epoch": 0.26, - "learning_rate": 0.00026082962095948253, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.000279874592061299, + "loss": 0.0296, "step": 51760 }, { - "epoch": 0.26, - "learning_rate": 0.00026082205326646856, - "loss": 0.0393, + "epoch": 0.13, + "learning_rate": 0.00027987070384492753, + "loss": 0.0279, "step": 51770 }, { - "epoch": 0.26, - "learning_rate": 0.00026081448557345455, - "loss": 0.0419, + "epoch": 0.13, + "learning_rate": 0.00027986681562855605, + "loss": 0.0276, "step": 51780 }, { - "epoch": 0.26, - "learning_rate": 0.00026080691788044053, - "loss": 0.0159, + "epoch": 0.13, + "learning_rate": 0.0002798629274121846, + "loss": 0.0312, "step": 51790 }, { - "epoch": 0.26, - "learning_rate": 0.0002607993501874265, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.00027985903919581313, + "loss": 0.0278, "step": 51800 }, { - "epoch": 0.26, - "learning_rate": 0.0002607917824944125, - "loss": 0.0199, + "epoch": 0.13, + "learning_rate": 0.0002798551509794417, + "loss": 0.0274, "step": 51810 }, { - "epoch": 0.26, - "learning_rate": 0.00026078421480139847, - "loss": 0.0203, + "epoch": 0.13, + "learning_rate": 0.0002798512627630702, + "loss": 0.026, "step": 51820 }, { - "epoch": 0.26, - "learning_rate": 0.0002607766471083845, - "loss": 0.0208, + "epoch": 0.13, + "learning_rate": 0.0002798473745466988, + "loss": 0.0344, "step": 51830 }, { - "epoch": 0.26, - "learning_rate": 0.0002607690794153705, - "loss": 0.0246, + "epoch": 0.13, + "learning_rate": 0.0002798434863303273, + "loss": 0.0263, "step": 51840 }, { - "epoch": 0.26, - "learning_rate": 0.00026076151172235647, - "loss": 0.0209, + "epoch": 0.13, + "learning_rate": 0.0002798395981139558, + "loss": 0.0309, "step": 51850 }, { - "epoch": 0.26, - "learning_rate": 0.00026075394402934245, - "loss": 0.0238, + "epoch": 0.13, + "learning_rate": 0.0002798357098975843, + "loss": 0.0266, "step": 51860 }, { - "epoch": 0.26, - "learning_rate": 0.00026074637633632843, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.0002798318216812129, + "loss": 0.0297, "step": 51870 }, { - "epoch": 0.26, - "learning_rate": 0.0002607388086433144, - "loss": 0.0247, + "epoch": 0.13, + "learning_rate": 0.0002798279334648414, + "loss": 0.0284, "step": 51880 }, { - "epoch": 0.26, - "learning_rate": 0.00026073124095030045, - "loss": 0.0211, + "epoch": 0.13, + "learning_rate": 0.00027982404524847, + "loss": 0.0326, "step": 51890 }, { - "epoch": 0.26, - "learning_rate": 0.00026072367325728643, - "loss": 0.0167, + "epoch": 0.13, + "learning_rate": 0.0002798201570320985, + "loss": 0.0276, "step": 51900 }, { - "epoch": 0.26, - "learning_rate": 0.0002607161055642724, - "loss": 0.0237, + "epoch": 0.13, + "learning_rate": 0.000279816268815727, + "loss": 0.0303, "step": 51910 }, { - "epoch": 0.26, - "learning_rate": 0.0002607085378712584, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.0002798123805993556, + "loss": 0.0332, "step": 51920 }, { - "epoch": 0.26, - "learning_rate": 0.0002607009701782444, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.0002798084923829841, + "loss": 0.0305, "step": 51930 }, { - "epoch": 0.26, - "learning_rate": 0.00026069340248523036, - "loss": 0.0232, + "epoch": 0.13, + "learning_rate": 0.00027980460416661266, + "loss": 0.0308, "step": 51940 }, { - "epoch": 0.26, - "learning_rate": 0.00026068583479221634, - "loss": 0.0213, + "epoch": 0.13, + "learning_rate": 0.0002798007159502412, + "loss": 0.0275, "step": 51950 }, { - "epoch": 0.26, - "learning_rate": 0.0002606782670992024, - "loss": 0.0221, + "epoch": 0.13, + "learning_rate": 0.00027979682773386974, + "loss": 0.0318, "step": 51960 }, { - "epoch": 0.26, - "learning_rate": 0.00026067069940618836, - "loss": 0.0236, + "epoch": 0.13, + "learning_rate": 0.00027979293951749826, + "loss": 0.0323, "step": 51970 }, { - "epoch": 0.26, - "learning_rate": 0.00026066313171317434, - "loss": 0.0219, + "epoch": 0.13, + "learning_rate": 0.00027978905130112677, + "loss": 0.0259, "step": 51980 }, { - "epoch": 0.26, - "learning_rate": 0.0002606555640201603, - "loss": 0.0223, + "epoch": 0.13, + "learning_rate": 0.0002797851630847553, + "loss": 0.0316, "step": 51990 }, { - "epoch": 0.26, - "learning_rate": 0.0002606479963271463, - "loss": 0.0231, + "epoch": 0.13, + "learning_rate": 0.00027978127486838386, + "loss": 0.0273, "step": 52000 }, { - "epoch": 0.26, - "eval_cer": 0.9145013085791751, - "eval_loss": 0.015823883935809135, - "eval_runtime": 116.6377, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.13, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.019722141325473785, + "eval_runtime": 107.1814, + "eval_samples_per_second": 18.66, + "eval_steps_per_second": 4.665, "step": 52000 }, { - "epoch": 0.26, - "learning_rate": 0.0002606404286341323, - "loss": 0.0225, + "epoch": 0.13, + "learning_rate": 0.00027977738665201237, + "loss": 0.0406, "step": 52010 }, { - "epoch": 0.26, - "learning_rate": 0.0002606328609411183, - "loss": 0.0197, + "epoch": 0.13, + "learning_rate": 0.00027977349843564094, + "loss": 0.0343, "step": 52020 }, { - "epoch": 0.26, - "learning_rate": 0.0002606252932481043, - "loss": 0.0207, + "epoch": 0.13, + "learning_rate": 0.00027976961021926945, + "loss": 0.0278, "step": 52030 }, { - "epoch": 0.26, - "learning_rate": 0.0002606177255550903, - "loss": 0.0181, + "epoch": 0.13, + "learning_rate": 0.000279765722002898, + "loss": 0.0293, "step": 52040 }, { - "epoch": 0.26, - "learning_rate": 0.00026061015786207626, - "loss": 0.0194, + "epoch": 0.13, + "learning_rate": 0.00027976183378652654, + "loss": 0.0307, "step": 52050 }, { - "epoch": 0.26, - "learning_rate": 0.00026060259016906224, - "loss": 0.0248, + "epoch": 0.13, + "learning_rate": 0.00027975794557015505, + "loss": 0.0325, "step": 52060 }, { - "epoch": 0.26, - "learning_rate": 0.0002605950224760482, - "loss": 0.0233, + "epoch": 0.13, + "learning_rate": 0.00027975405735378357, + "loss": 0.0264, "step": 52070 }, { - "epoch": 0.26, - "learning_rate": 0.0002605874547830342, - "loss": 0.0234, + "epoch": 0.13, + "learning_rate": 0.00027975016913741213, + "loss": 0.0306, "step": 52080 }, { - "epoch": 0.26, - "learning_rate": 0.00026057988709002024, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.0002797462809210407, + "loss": 0.0297, "step": 52090 }, { - "epoch": 0.26, - "learning_rate": 0.0002605723193970062, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.0002797423927046692, + "loss": 0.0268, "step": 52100 }, { - "epoch": 0.26, - "learning_rate": 0.0002605647517039922, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.00027973850448829773, + "loss": 0.0286, "step": 52110 }, { - "epoch": 0.26, - "learning_rate": 0.0002605571840109782, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.00027973461627192625, + "loss": 0.0286, "step": 52120 }, { - "epoch": 0.26, - "learning_rate": 0.00026054961631796417, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.0002797307280555548, + "loss": 0.023, "step": 52130 }, { - "epoch": 0.26, - "learning_rate": 0.00026054204862495015, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.00027972683983918333, + "loss": 0.0258, "step": 52140 }, { - "epoch": 0.26, - "learning_rate": 0.0002605344809319362, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002797229516228119, + "loss": 0.0292, "step": 52150 }, { - "epoch": 0.26, - "learning_rate": 0.00026052691323892217, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.0002797190634064404, + "loss": 0.0272, "step": 52160 }, { - "epoch": 0.26, - "learning_rate": 0.0002605193455459081, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.000279715175190069, + "loss": 0.0306, "step": 52170 }, { - "epoch": 0.26, - "learning_rate": 0.0002605117778528941, - "loss": 0.0268, + "epoch": 0.14, + "learning_rate": 0.0002797112869736975, + "loss": 0.027, "step": 52180 }, { - "epoch": 0.26, - "learning_rate": 0.0002605042101598801, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.000279707398757326, + "loss": 0.0263, "step": 52190 }, { - "epoch": 0.26, - "learning_rate": 0.0002604966424668661, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.0002797035105409545, + "loss": 0.0296, "step": 52200 }, { - "epoch": 0.26, - "learning_rate": 0.0002604890747738521, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.0002796996223245831, + "loss": 0.0246, "step": 52210 }, { - "epoch": 0.26, - "learning_rate": 0.00026048150708083806, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.0002796957341082116, + "loss": 0.0272, "step": 52220 }, { - "epoch": 0.26, - "learning_rate": 0.00026047393938782404, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.0002796918458918402, + "loss": 0.0306, "step": 52230 }, { - "epoch": 0.26, - "learning_rate": 0.00026046637169481, - "loss": 0.0238, + "epoch": 0.14, + "learning_rate": 0.0002796879576754687, + "loss": 0.0287, "step": 52240 }, { - "epoch": 0.26, - "learning_rate": 0.00026045880400179605, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027968406945909726, + "loss": 0.0206, "step": 52250 }, { - "epoch": 0.26, - "learning_rate": 0.00026045123630878204, - "loss": 0.0217, + "epoch": 0.14, + "learning_rate": 0.0002796801812427258, + "loss": 0.0282, "step": 52260 }, { - "epoch": 0.26, - "learning_rate": 0.000260443668615768, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.0002796762930263543, + "loss": 0.0304, "step": 52270 }, { - "epoch": 0.26, - "learning_rate": 0.000260436100922754, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.0002796724048099828, + "loss": 0.0236, "step": 52280 }, { - "epoch": 0.26, - "learning_rate": 0.00026042853322974, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.0002796685165936114, + "loss": 0.0356, "step": 52290 }, { - "epoch": 0.26, - "learning_rate": 0.00026042096553672596, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.00027966462837723994, + "loss": 0.0268, "step": 52300 }, { - "epoch": 0.26, - "learning_rate": 0.00026041339784371194, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.00027966074016086846, + "loss": 0.0241, "step": 52310 }, { - "epoch": 0.26, - "learning_rate": 0.000260405830150698, - "loss": 0.0196, + "epoch": 0.14, + "learning_rate": 0.00027965685194449697, + "loss": 0.0315, "step": 52320 }, { - "epoch": 0.26, - "learning_rate": 0.00026039826245768396, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.00027965296372812554, + "loss": 0.0294, "step": 52330 }, { - "epoch": 0.26, - "learning_rate": 0.00026039069476466994, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.00027964907551175405, + "loss": 0.0247, "step": 52340 }, { - "epoch": 0.26, - "learning_rate": 0.0002603831270716559, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.00027964518729538257, + "loss": 0.0254, "step": 52350 }, { - "epoch": 0.26, - "learning_rate": 0.0002603755593786419, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.00027964129907901114, + "loss": 0.0323, "step": 52360 }, { - "epoch": 0.26, - "learning_rate": 0.0002603679916856279, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.00027963741086263965, + "loss": 0.0249, "step": 52370 }, { - "epoch": 0.26, - "learning_rate": 0.0002603604239926139, - "loss": 0.0292, + "epoch": 0.14, + "learning_rate": 0.0002796335226462682, + "loss": 0.0249, "step": 52380 }, { - "epoch": 0.26, - "learning_rate": 0.0002603528562995999, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.00027962963442989674, + "loss": 0.0357, "step": 52390 }, { - "epoch": 0.26, - "learning_rate": 0.0002603452886065859, - "loss": 0.0249, + "epoch": 0.14, + "learning_rate": 0.00027962574621352525, + "loss": 0.027, "step": 52400 }, { - "epoch": 0.26, - "learning_rate": 0.00026033772091357187, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.00027962185799715376, + "loss": 0.0332, "step": 52410 }, { - "epoch": 0.26, - "learning_rate": 0.00026033015322055785, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.00027961796978078233, + "loss": 0.0262, "step": 52420 }, { - "epoch": 0.26, - "learning_rate": 0.00026032258552754383, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027961408156441085, + "loss": 0.0225, "step": 52430 }, { - "epoch": 0.26, - "learning_rate": 0.00026031501783452986, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.0002796101933480394, + "loss": 0.0284, "step": 52440 }, { - "epoch": 0.26, - "learning_rate": 0.00026030745014151585, - "loss": 0.0258, + "epoch": 0.14, + "learning_rate": 0.00027960630513166793, + "loss": 0.0239, "step": 52450 }, { - "epoch": 0.26, - "learning_rate": 0.0002602998824485018, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.0002796024169152965, + "loss": 0.0265, "step": 52460 }, { - "epoch": 0.26, - "learning_rate": 0.0002602923147554878, - "loss": 0.0185, + "epoch": 0.14, + "learning_rate": 0.000279598528698925, + "loss": 0.0358, "step": 52470 }, { - "epoch": 0.26, - "learning_rate": 0.0002602847470624738, - "loss": 0.0182, + "epoch": 0.14, + "learning_rate": 0.00027959464048255353, + "loss": 0.0269, "step": 52480 }, { - "epoch": 0.26, - "learning_rate": 0.00026027717936945977, - "loss": 0.0181, + "epoch": 0.14, + "learning_rate": 0.0002795907522661821, + "loss": 0.0314, "step": 52490 }, { - "epoch": 0.26, - "learning_rate": 0.00026026961167644575, - "loss": 0.0193, + "epoch": 0.14, + "learning_rate": 0.0002795868640498106, + "loss": 0.0262, "step": 52500 }, { - "epoch": 0.26, - "learning_rate": 0.0002602620439834318, - "loss": 0.0241, + "epoch": 0.14, + "learning_rate": 0.0002795829758334392, + "loss": 0.0306, "step": 52510 }, { - "epoch": 0.26, - "learning_rate": 0.00026025447629041777, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.0002795790876170677, + "loss": 0.0272, "step": 52520 }, { - "epoch": 0.27, - "learning_rate": 0.00026024690859740375, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.0002795751994006962, + "loss": 0.0287, "step": 52530 }, { - "epoch": 0.27, - "learning_rate": 0.00026023934090438973, - "loss": 0.0189, + "epoch": 0.14, + "learning_rate": 0.0002795713111843248, + "loss": 0.0269, "step": 52540 }, { - "epoch": 0.27, - "learning_rate": 0.0002602317732113757, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.0002795674229679533, + "loss": 0.0289, "step": 52550 }, { - "epoch": 0.27, - "learning_rate": 0.0002602242055183617, - "loss": 0.0214, + "epoch": 0.14, + "learning_rate": 0.0002795635347515818, + "loss": 0.026, "step": 52560 }, { - "epoch": 0.27, - "learning_rate": 0.00026021663782534773, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.0002795596465352104, + "loss": 0.0259, "step": 52570 }, { - "epoch": 0.27, - "learning_rate": 0.0002602090701323337, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.00027955575831883895, + "loss": 0.0306, "step": 52580 }, { - "epoch": 0.27, - "learning_rate": 0.0002602015024393197, - "loss": 0.0285, + "epoch": 0.14, + "learning_rate": 0.00027955187010246746, + "loss": 0.0282, "step": 52590 }, { - "epoch": 0.27, - "learning_rate": 0.0002601939347463057, - "loss": 0.0269, + "epoch": 0.14, + "learning_rate": 0.000279547981886096, + "loss": 0.0276, "step": 52600 }, { - "epoch": 0.27, - "learning_rate": 0.00026018636705329166, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002795440936697245, + "loss": 0.0306, "step": 52610 }, { - "epoch": 0.27, - "learning_rate": 0.00026017879936027764, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.000279540205453353, + "loss": 0.0253, "step": 52620 }, { - "epoch": 0.27, - "learning_rate": 0.0002601712316672636, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027953631723698157, + "loss": 0.0317, "step": 52630 }, { - "epoch": 0.27, - "learning_rate": 0.00026016366397424966, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.00027953242902061014, + "loss": 0.0285, "step": 52640 }, { - "epoch": 0.27, - "learning_rate": 0.00026015609628123564, - "loss": 0.0206, + "epoch": 0.14, + "learning_rate": 0.00027952854080423866, + "loss": 0.0237, "step": 52650 }, { - "epoch": 0.27, - "learning_rate": 0.0002601485285882216, - "loss": 0.0181, + "epoch": 0.14, + "learning_rate": 0.00027952465258786717, + "loss": 0.0256, "step": 52660 }, { - "epoch": 0.27, - "learning_rate": 0.0002601409608952076, - "loss": 0.0177, + "epoch": 0.14, + "learning_rate": 0.00027952076437149574, + "loss": 0.0275, "step": 52670 }, { - "epoch": 0.27, - "learning_rate": 0.0002601333932021936, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027951687615512425, + "loss": 0.0261, "step": 52680 }, { - "epoch": 0.27, - "learning_rate": 0.00026012582550917956, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.00027951298793875277, + "loss": 0.0256, "step": 52690 }, { - "epoch": 0.27, - "learning_rate": 0.0002601182578161656, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027950909972238134, + "loss": 0.0246, "step": 52700 }, { - "epoch": 0.27, - "learning_rate": 0.0002601106901231516, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.00027950521150600985, + "loss": 0.0341, "step": 52710 }, { - "epoch": 0.27, - "learning_rate": 0.00026010312243013756, - "loss": 0.0172, + "epoch": 0.14, + "learning_rate": 0.0002795013232896384, + "loss": 0.0258, "step": 52720 }, { - "epoch": 0.27, - "learning_rate": 0.00026009555473712354, - "loss": 0.0181, + "epoch": 0.14, + "learning_rate": 0.00027949743507326693, + "loss": 0.0322, "step": 52730 }, { - "epoch": 0.27, - "learning_rate": 0.0002600879870441095, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.00027949354685689545, + "loss": 0.0261, "step": 52740 }, { - "epoch": 0.27, - "learning_rate": 0.0002600804193510955, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.000279489658640524, + "loss": 0.0232, "step": 52750 }, { - "epoch": 0.27, - "learning_rate": 0.00026007285165808154, - "loss": 0.0196, + "epoch": 0.14, + "learning_rate": 0.00027948577042415253, + "loss": 0.0271, "step": 52760 }, { - "epoch": 0.27, - "learning_rate": 0.0002600652839650675, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.00027948188220778105, + "loss": 0.0307, "step": 52770 }, { - "epoch": 0.27, - "learning_rate": 0.0002600577162720535, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.0002794779939914096, + "loss": 0.0267, "step": 52780 }, { - "epoch": 0.27, - "learning_rate": 0.0002600501485790395, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002794741057750382, + "loss": 0.021, "step": 52790 }, { - "epoch": 0.27, - "learning_rate": 0.00026004258088602547, - "loss": 0.0178, + "epoch": 0.14, + "learning_rate": 0.0002794702175586667, + "loss": 0.0284, "step": 52800 }, { - "epoch": 0.27, - "learning_rate": 0.00026003501319301145, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.0002794663293422952, + "loss": 0.0262, "step": 52810 }, { - "epoch": 0.27, - "learning_rate": 0.00026002744549999743, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.00027946244112592373, + "loss": 0.0275, "step": 52820 }, { - "epoch": 0.27, - "learning_rate": 0.00026001987780698347, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.0002794585529095523, + "loss": 0.0279, "step": 52830 }, { - "epoch": 0.27, - "learning_rate": 0.00026001231011396945, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.0002794546646931808, + "loss": 0.0372, "step": 52840 }, { - "epoch": 0.27, - "learning_rate": 0.00026000474242095543, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.0002794507764768094, + "loss": 0.0284, "step": 52850 }, { - "epoch": 0.27, - "learning_rate": 0.0002599971747279414, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002794468882604379, + "loss": 0.024, "step": 52860 }, { - "epoch": 0.27, - "learning_rate": 0.0002599896070349274, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002794430000440664, + "loss": 0.03, "step": 52870 }, { - "epoch": 0.27, - "learning_rate": 0.00025998203934191337, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.000279439111827695, + "loss": 0.0271, "step": 52880 }, { - "epoch": 0.27, - "learning_rate": 0.0002599744716488994, - "loss": 0.023, + "epoch": 0.14, + "learning_rate": 0.0002794352236113235, + "loss": 0.0279, "step": 52890 }, { - "epoch": 0.27, - "learning_rate": 0.0002599669039558854, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.000279431335394952, + "loss": 0.0286, "step": 52900 }, { - "epoch": 0.27, - "learning_rate": 0.00025995933626287137, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.0002794274471785806, + "loss": 0.0233, "step": 52910 }, { - "epoch": 0.27, - "learning_rate": 0.00025995176856985735, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.0002794235589622091, + "loss": 0.0276, "step": 52920 }, { - "epoch": 0.27, - "learning_rate": 0.00025994420087684333, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.00027941967074583766, + "loss": 0.0199, "step": 52930 }, { - "epoch": 0.27, - "learning_rate": 0.0002599366331838293, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.0002794157825294662, + "loss": 0.0299, "step": 52940 }, { - "epoch": 0.27, - "learning_rate": 0.00025992906549081535, - "loss": 0.0185, + "epoch": 0.14, + "learning_rate": 0.0002794118943130947, + "loss": 0.0275, "step": 52950 }, { - "epoch": 0.27, - "learning_rate": 0.00025992149779780133, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.00027940800609672326, + "loss": 0.0238, "step": 52960 }, { - "epoch": 0.27, - "learning_rate": 0.0002599139301047873, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027940411788035177, + "loss": 0.04, "step": 52970 }, { - "epoch": 0.27, - "learning_rate": 0.0002599063624117733, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.00027940022966398034, + "loss": 0.0266, "step": 52980 }, { - "epoch": 0.27, - "learning_rate": 0.0002598987947187593, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.00027939634144760885, + "loss": 0.0243, "step": 52990 }, { - "epoch": 0.27, - "learning_rate": 0.00025989122702574526, - "loss": 0.0175, + "epoch": 0.14, + "learning_rate": 0.0002793924532312374, + "loss": 0.0283, "step": 53000 }, { - "epoch": 0.27, - "eval_cer": 0.9145139237288054, - "eval_loss": 0.015266528353095055, - "eval_runtime": 115.681, - "eval_samples_per_second": 17.289, - "eval_steps_per_second": 4.322, + "epoch": 0.14, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.020349837839603424, + "eval_runtime": 107.4292, + "eval_samples_per_second": 18.617, + "eval_steps_per_second": 4.654, "step": 53000 }, { - "epoch": 0.27, - "learning_rate": 0.00025988365933273124, - "loss": 0.0195, - "step": 53010 + "epoch": 0.14, + "learning_rate": 0.00027938856501486594, + "loss": 0.0208, + "step": 53010 }, { - "epoch": 0.27, - "learning_rate": 0.0002598760916397173, - "loss": 0.0184, + "epoch": 0.14, + "learning_rate": 0.00027938467679849445, + "loss": 0.0279, "step": 53020 }, { - "epoch": 0.27, - "learning_rate": 0.00025986852394670326, - "loss": 0.0241, + "epoch": 0.14, + "learning_rate": 0.00027938078858212297, + "loss": 0.026, "step": 53030 }, { - "epoch": 0.27, - "learning_rate": 0.00025986095625368924, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.00027937690036575154, + "loss": 0.0276, "step": 53040 }, { - "epoch": 0.27, - "learning_rate": 0.0002598533885606752, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.00027937301214938005, + "loss": 0.0284, "step": 53050 }, { - "epoch": 0.27, - "learning_rate": 0.0002598458208676612, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.0002793691239330086, + "loss": 0.0289, "step": 53060 }, { - "epoch": 0.27, - "learning_rate": 0.0002598382531746472, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027936523571663713, + "loss": 0.0238, "step": 53070 }, { - "epoch": 0.27, - "learning_rate": 0.0002598306854816332, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.0002793613475002657, + "loss": 0.0247, "step": 53080 }, { - "epoch": 0.27, - "learning_rate": 0.0002598231177886192, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.0002793574592838942, + "loss": 0.023, "step": 53090 }, { - "epoch": 0.27, - "learning_rate": 0.0002598155500956052, - "loss": 0.0176, + "epoch": 0.14, + "learning_rate": 0.00027935357106752273, + "loss": 0.0326, "step": 53100 }, { - "epoch": 0.27, - "learning_rate": 0.00025980798240259116, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.00027934968285115125, + "loss": 0.0278, "step": 53110 }, { - "epoch": 0.27, - "learning_rate": 0.00025980041470957714, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.0002793457946347798, + "loss": 0.0372, "step": 53120 }, { - "epoch": 0.27, - "learning_rate": 0.0002597928470165631, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002793419064184084, + "loss": 0.0275, "step": 53130 }, { - "epoch": 0.27, - "learning_rate": 0.0002597852793235491, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002793380182020369, + "loss": 0.0295, "step": 53140 }, { - "epoch": 0.27, - "learning_rate": 0.00025977771163053514, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002793341299856654, + "loss": 0.0253, "step": 53150 }, { - "epoch": 0.27, - "learning_rate": 0.0002597701439375211, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.0002793302417692939, + "loss": 0.0303, "step": 53160 }, { - "epoch": 0.27, - "learning_rate": 0.0002597625762445071, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.0002793263535529225, + "loss": 0.0257, "step": 53170 }, { - "epoch": 0.27, - "learning_rate": 0.0002597550085514931, - "loss": 0.0261, + "epoch": 0.14, + "learning_rate": 0.000279322465336551, + "loss": 0.028, "step": 53180 }, { - "epoch": 0.27, - "learning_rate": 0.00025974744085847907, - "loss": 0.0254, + "epoch": 0.14, + "learning_rate": 0.0002793185771201796, + "loss": 0.0219, "step": 53190 }, { - "epoch": 0.27, - "learning_rate": 0.00025973987316546505, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.0002793146889038081, + "loss": 0.0224, "step": 53200 }, { - "epoch": 0.27, - "learning_rate": 0.0002597323054724511, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.00027931080068743666, + "loss": 0.0261, "step": 53210 }, { - "epoch": 0.27, - "learning_rate": 0.00025972473777943707, - "loss": 0.0167, + "epoch": 0.14, + "learning_rate": 0.0002793069124710652, + "loss": 0.0321, "step": 53220 }, { - "epoch": 0.27, - "learning_rate": 0.00025971717008642305, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.0002793030242546937, + "loss": 0.0288, "step": 53230 }, { - "epoch": 0.27, - "learning_rate": 0.00025970960239340903, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002792991360383222, + "loss": 0.0248, "step": 53240 }, { - "epoch": 0.27, - "learning_rate": 0.000259702034700395, - "loss": 0.0243, + "epoch": 0.14, + "learning_rate": 0.0002792952478219508, + "loss": 0.0248, "step": 53250 }, { - "epoch": 0.27, - "learning_rate": 0.000259694467007381, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002792913596055793, + "loss": 0.0246, "step": 53260 }, { - "epoch": 0.27, - "learning_rate": 0.00025968689931436703, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.00027928747138920786, + "loss": 0.0273, "step": 53270 }, { - "epoch": 0.27, - "learning_rate": 0.000259679331621353, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027928358317283637, + "loss": 0.025, "step": 53280 }, { - "epoch": 0.27, - "learning_rate": 0.000259671763928339, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.00027927969495646494, + "loss": 0.0269, "step": 53290 }, { - "epoch": 0.27, - "learning_rate": 0.00025966419623532497, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.00027927580674009346, + "loss": 0.0237, "step": 53300 }, { - "epoch": 0.27, - "learning_rate": 0.00025965662854231095, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.00027927191852372197, + "loss": 0.0304, "step": 53310 }, { - "epoch": 0.27, - "learning_rate": 0.00025964906084929694, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.0002792680303073505, + "loss": 0.0289, "step": 53320 }, { - "epoch": 0.27, - "learning_rate": 0.0002596414931562829, - "loss": 0.0193, + "epoch": 0.14, + "learning_rate": 0.00027926414209097905, + "loss": 0.0296, "step": 53330 }, { - "epoch": 0.27, - "learning_rate": 0.00025963392546326895, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.0002792602538746076, + "loss": 0.028, "step": 53340 }, { - "epoch": 0.27, - "learning_rate": 0.00025962635777025493, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.00027925636565823614, + "loss": 0.0249, "step": 53350 }, { - "epoch": 0.27, - "learning_rate": 0.0002596187900772409, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027925247744186465, + "loss": 0.0297, "step": 53360 }, { - "epoch": 0.27, - "learning_rate": 0.0002596112223842269, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027924858922549317, + "loss": 0.0312, "step": 53370 }, { - "epoch": 0.27, - "learning_rate": 0.0002596036546912129, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.00027924470100912173, + "loss": 0.0266, "step": 53380 }, { - "epoch": 0.27, - "learning_rate": 0.00025959608699819886, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.00027924081279275025, + "loss": 0.0266, "step": 53390 }, { - "epoch": 0.27, - "learning_rate": 0.0002595885193051849, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002792369245763788, + "loss": 0.0334, "step": 53400 }, { - "epoch": 0.27, - "learning_rate": 0.0002595809516121709, - "loss": 0.0195, + "epoch": 0.14, + "learning_rate": 0.00027923303636000733, + "loss": 0.027, "step": 53410 }, { - "epoch": 0.27, - "learning_rate": 0.0002595733839191568, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.0002792291481436359, + "loss": 0.0301, "step": 53420 }, { - "epoch": 0.27, - "learning_rate": 0.0002595658162261428, - "loss": 0.0177, + "epoch": 0.14, + "learning_rate": 0.0002792252599272644, + "loss": 0.0268, "step": 53430 }, { - "epoch": 0.27, - "learning_rate": 0.0002595582485331288, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.00027922137171089293, + "loss": 0.0275, "step": 53440 }, { - "epoch": 0.27, - "learning_rate": 0.0002595506808401148, - "loss": 0.0245, + "epoch": 0.14, + "learning_rate": 0.00027921748349452144, + "loss": 0.0273, "step": 53450 }, { - "epoch": 0.27, - "learning_rate": 0.0002595431131471008, - "loss": 0.0175, + "epoch": 0.14, + "learning_rate": 0.00027921359527815, + "loss": 0.0315, "step": 53460 }, { - "epoch": 0.27, - "learning_rate": 0.00025953554545408677, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.00027920970706177853, + "loss": 0.0252, "step": 53470 }, { - "epoch": 0.27, - "learning_rate": 0.00025952797776107275, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.0002792058188454071, + "loss": 0.0251, "step": 53480 }, { - "epoch": 0.27, - "learning_rate": 0.00025952041006805873, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.0002792019306290356, + "loss": 0.0304, "step": 53490 }, { - "epoch": 0.27, - "learning_rate": 0.00025951284237504476, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.0002791980424126642, + "loss": 0.0264, "step": 53500 }, { - "epoch": 0.27, - "learning_rate": 0.00025950527468203075, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.0002791941541962927, + "loss": 0.03, "step": 53510 }, { - "epoch": 0.27, - "learning_rate": 0.0002594977069890167, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.0002791902659799212, + "loss": 0.0276, "step": 53520 }, { - "epoch": 0.27, - "learning_rate": 0.0002594901392960027, - "loss": 0.0182, + "epoch": 0.14, + "learning_rate": 0.0002791863777635498, + "loss": 0.0242, "step": 53530 }, { - "epoch": 0.27, - "learning_rate": 0.0002594825716029887, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002791824895471783, + "loss": 0.0283, "step": 53540 }, { - "epoch": 0.27, - "learning_rate": 0.00025947500390997467, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.00027917860133080686, + "loss": 0.0299, "step": 53550 }, { - "epoch": 0.27, - "learning_rate": 0.00025946743621696065, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.0002791747131144354, + "loss": 0.0294, "step": 53560 }, { - "epoch": 0.27, - "learning_rate": 0.0002594598685239467, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.0002791708248980639, + "loss": 0.0317, "step": 53570 }, { - "epoch": 0.27, - "learning_rate": 0.00025945230083093267, - "loss": 0.0185, + "epoch": 0.14, + "learning_rate": 0.00027916693668169246, + "loss": 0.0282, "step": 53580 }, { - "epoch": 0.27, - "learning_rate": 0.00025944473313791865, - "loss": 0.0217, + "epoch": 0.14, + "learning_rate": 0.000279163048465321, + "loss": 0.0258, "step": 53590 }, { - "epoch": 0.27, - "learning_rate": 0.00025943716544490463, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002791591602489495, + "loss": 0.0248, "step": 53600 }, { - "epoch": 0.27, - "learning_rate": 0.0002594295977518906, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.00027915527203257806, + "loss": 0.0225, "step": 53610 }, { - "epoch": 0.27, - "learning_rate": 0.0002594220300588766, - "loss": 0.0195, + "epoch": 0.14, + "learning_rate": 0.00027915138381620657, + "loss": 0.0363, "step": 53620 }, { - "epoch": 0.27, - "learning_rate": 0.00025941446236586263, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027914749559983514, + "loss": 0.0251, "step": 53630 }, { - "epoch": 0.27, - "learning_rate": 0.0002594068946728486, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.00027914360738346365, + "loss": 0.0259, "step": 53640 }, { - "epoch": 0.27, - "learning_rate": 0.0002593993269798346, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.00027913971916709217, + "loss": 0.0321, "step": 53650 }, { - "epoch": 0.27, - "learning_rate": 0.0002593917592868206, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.0002791358309507207, + "loss": 0.023, "step": 53660 }, { - "epoch": 0.27, - "learning_rate": 0.00025938419159380656, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.00027913194273434925, + "loss": 0.0282, "step": 53670 }, { - "epoch": 0.27, - "learning_rate": 0.00025937662390079254, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.0002791280545179778, + "loss": 0.0234, "step": 53680 }, { - "epoch": 0.27, - "learning_rate": 0.0002593690562077786, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.00027912416630160634, + "loss": 0.0338, "step": 53690 }, { - "epoch": 0.27, - "learning_rate": 0.00025936148851476456, - "loss": 0.0237, + "epoch": 0.14, + "learning_rate": 0.00027912027808523485, + "loss": 0.0284, "step": 53700 }, { - "epoch": 0.27, - "learning_rate": 0.00025935392082175054, - "loss": 0.0247, + "epoch": 0.14, + "learning_rate": 0.0002791163898688634, + "loss": 0.0284, "step": 53710 }, { - "epoch": 0.27, - "learning_rate": 0.0002593463531287365, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027911250165249193, + "loss": 0.0309, "step": 53720 }, { - "epoch": 0.27, - "learning_rate": 0.0002593387854357225, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.00027910861343612045, + "loss": 0.0338, "step": 53730 }, { - "epoch": 0.27, - "learning_rate": 0.0002593312177427085, - "loss": 0.023, + "epoch": 0.14, + "learning_rate": 0.000279104725219749, + "loss": 0.0288, "step": 53740 }, { - "epoch": 0.27, - "learning_rate": 0.00025932365004969446, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.00027910083700337753, + "loss": 0.0241, "step": 53750 }, { - "epoch": 0.27, - "learning_rate": 0.0002593160823566805, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.0002790969487870061, + "loss": 0.0306, "step": 53760 }, { - "epoch": 0.27, - "learning_rate": 0.0002593085146636665, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.0002790930605706346, + "loss": 0.0242, "step": 53770 }, { - "epoch": 0.27, - "learning_rate": 0.00025930094697065246, - "loss": 0.018, + "epoch": 0.14, + "learning_rate": 0.00027908917235426313, + "loss": 0.0248, "step": 53780 }, { - "epoch": 0.27, - "learning_rate": 0.00025929337927763844, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.0002790852841378917, + "loss": 0.0295, "step": 53790 }, { - "epoch": 0.27, - "learning_rate": 0.0002592858115846244, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002790813959215202, + "loss": 0.0266, "step": 53800 }, { - "epoch": 0.27, - "learning_rate": 0.0002592782438916104, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.0002790775077051487, + "loss": 0.0224, "step": 53810 }, { - "epoch": 0.27, - "learning_rate": 0.00025927067619859644, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.0002790736194887773, + "loss": 0.029, "step": 53820 }, { - "epoch": 0.27, - "learning_rate": 0.0002592631085055824, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.00027906973127240586, + "loss": 0.0346, "step": 53830 }, { - "epoch": 0.27, - "learning_rate": 0.0002592555408125684, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.0002790658430560344, + "loss": 0.0281, "step": 53840 }, { - "epoch": 0.27, - "learning_rate": 0.0002592479731195544, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.0002790619548396629, + "loss": 0.0242, "step": 53850 }, { - "epoch": 0.27, - "learning_rate": 0.00025924040542654037, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002790580666232914, + "loss": 0.032, "step": 53860 }, { - "epoch": 0.27, - "learning_rate": 0.00025923283773352635, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002790541784069199, + "loss": 0.0319, "step": 53870 }, { - "epoch": 0.27, - "learning_rate": 0.00025922527004051233, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002790502901905485, + "loss": 0.0296, "step": 53880 }, { - "epoch": 0.27, - "learning_rate": 0.00025921770234749837, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.00027904640197417706, + "loss": 0.0288, "step": 53890 }, { - "epoch": 0.27, - "learning_rate": 0.00025921013465448435, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.0002790425137578056, + "loss": 0.0279, "step": 53900 }, { - "epoch": 0.27, - "learning_rate": 0.00025920256696147033, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.0002790386255414341, + "loss": 0.0271, "step": 53910 }, { - "epoch": 0.27, - "learning_rate": 0.0002591949992684563, - "loss": 0.0166, + "epoch": 0.14, + "learning_rate": 0.00027903473732506266, + "loss": 0.025, "step": 53920 }, { - "epoch": 0.27, - "learning_rate": 0.0002591874315754423, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.00027903084910869117, + "loss": 0.0272, "step": 53930 }, { - "epoch": 0.27, - "learning_rate": 0.00025917986388242827, - "loss": 0.0161, + "epoch": 0.14, + "learning_rate": 0.0002790269608923197, + "loss": 0.0277, "step": 53940 }, { - "epoch": 0.27, - "learning_rate": 0.0002591722961894143, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.00027902307267594826, + "loss": 0.0297, "step": 53950 }, { - "epoch": 0.27, - "learning_rate": 0.0002591647284964003, - "loss": 0.0214, + "epoch": 0.14, + "learning_rate": 0.00027901918445957677, + "loss": 0.0205, "step": 53960 }, { - "epoch": 0.27, - "learning_rate": 0.00025915716080338627, - "loss": 0.0167, + "epoch": 0.14, + "learning_rate": 0.00027901529624320534, + "loss": 0.0264, "step": 53970 }, { - "epoch": 0.27, - "learning_rate": 0.00025914959311037225, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.00027901140802683385, + "loss": 0.031, "step": 53980 }, { - "epoch": 0.27, - "learning_rate": 0.00025914202541735823, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.00027900751981046237, + "loss": 0.0285, "step": 53990 }, { - "epoch": 0.27, - "learning_rate": 0.0002591344577243442, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.00027900363159409094, + "loss": 0.0264, "step": 54000 }, { - "epoch": 0.27, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.014917539432644844, - "eval_runtime": 115.9864, - "eval_samples_per_second": 17.243, - "eval_steps_per_second": 4.311, + "epoch": 0.14, + "eval_cer": 0.8818370514688489, + "eval_loss": 0.02024264447391033, + "eval_runtime": 108.1973, + "eval_samples_per_second": 18.485, + "eval_steps_per_second": 4.621, "step": 54000 }, { - "epoch": 0.27, - "learning_rate": 0.00025912689003133025, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.00027899974337771945, + "loss": 0.0249, "step": 54010 }, { - "epoch": 0.27, - "learning_rate": 0.00025911932233831623, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.00027899585516134797, + "loss": 0.03, "step": 54020 }, { - "epoch": 0.27, - "learning_rate": 0.0002591117546453022, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.00027899196694497653, + "loss": 0.0298, "step": 54030 }, { - "epoch": 0.27, - "learning_rate": 0.0002591041869522882, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002789880787286051, + "loss": 0.0303, "step": 54040 }, { - "epoch": 0.27, - "learning_rate": 0.0002590966192592742, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.0002789841905122336, + "loss": 0.0265, "step": 54050 }, { - "epoch": 0.27, - "learning_rate": 0.00025908905156626016, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.00027898030229586213, + "loss": 0.028, "step": 54060 }, { - "epoch": 0.27, - "learning_rate": 0.00025908148387324614, - "loss": 0.0279, + "epoch": 0.14, + "learning_rate": 0.00027897641407949065, + "loss": 0.0231, "step": 54070 }, { - "epoch": 0.27, - "learning_rate": 0.0002590739161802322, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.0002789725258631192, + "loss": 0.0276, "step": 54080 }, { - "epoch": 0.27, - "learning_rate": 0.00025906634848721816, - "loss": 0.0769, + "epoch": 0.14, + "learning_rate": 0.00027896863764674773, + "loss": 0.0264, "step": 54090 }, { - "epoch": 0.27, - "learning_rate": 0.00025905878079420414, - "loss": 0.0249, + "epoch": 0.14, + "learning_rate": 0.0002789647494303763, + "loss": 0.0235, "step": 54100 }, { - "epoch": 0.27, - "learning_rate": 0.0002590512131011901, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.0002789608612140048, + "loss": 0.0299, "step": 54110 }, { - "epoch": 0.27, - "learning_rate": 0.0002590436454081761, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027895697299763333, + "loss": 0.0258, "step": 54120 }, { - "epoch": 0.27, - "learning_rate": 0.0002590360777151621, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.0002789530847812619, + "loss": 0.028, "step": 54130 }, { - "epoch": 0.27, - "learning_rate": 0.0002590285100221481, - "loss": 0.0341, + "epoch": 0.14, + "learning_rate": 0.0002789491965648904, + "loss": 0.0259, "step": 54140 }, { - "epoch": 0.27, - "learning_rate": 0.0002590209423291341, - "loss": 0.0182, + "epoch": 0.14, + "learning_rate": 0.0002789453083485189, + "loss": 0.0242, "step": 54150 }, { - "epoch": 0.27, - "learning_rate": 0.0002590133746361201, - "loss": 0.0226, + "epoch": 0.14, + "learning_rate": 0.0002789414201321475, + "loss": 0.0272, "step": 54160 }, { - "epoch": 0.27, - "learning_rate": 0.00025900580694310606, - "loss": 0.0229, + "epoch": 0.14, + "learning_rate": 0.000278937531915776, + "loss": 0.0273, "step": 54170 }, { - "epoch": 0.27, - "learning_rate": 0.00025899823925009204, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.0002789336436994046, + "loss": 0.0258, "step": 54180 }, { - "epoch": 0.27, - "learning_rate": 0.000258990671557078, - "loss": 0.0165, + "epoch": 0.14, + "learning_rate": 0.0002789297554830331, + "loss": 0.0296, "step": 54190 }, { - "epoch": 0.27, - "learning_rate": 0.00025898310386406406, + "epoch": 0.14, + "learning_rate": 0.0002789258672666616, "loss": 0.0272, "step": 54200 }, { - "epoch": 0.27, - "learning_rate": 0.00025897553617105004, - "loss": 0.0251, + "epoch": 0.14, + "learning_rate": 0.0002789219790502902, + "loss": 0.0248, "step": 54210 }, { - "epoch": 0.27, - "learning_rate": 0.000258967968478036, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.0002789180908339187, + "loss": 0.0284, "step": 54220 }, { - "epoch": 0.27, - "learning_rate": 0.000258960400785022, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.00027891420261754726, + "loss": 0.0257, "step": 54230 }, { - "epoch": 0.27, - "learning_rate": 0.000258952833092008, - "loss": 0.0248, + "epoch": 0.14, + "learning_rate": 0.0002789103144011758, + "loss": 0.0261, "step": 54240 }, { - "epoch": 0.27, - "learning_rate": 0.00025894526539899397, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.00027890642618480434, + "loss": 0.0293, "step": 54250 }, { - "epoch": 0.27, - "learning_rate": 0.00025893769770597995, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.00027890253796843286, + "loss": 0.0233, "step": 54260 }, { - "epoch": 0.27, - "learning_rate": 0.000258930130012966, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.00027889864975206137, + "loss": 0.0297, "step": 54270 }, { - "epoch": 0.27, - "learning_rate": 0.00025892256231995197, - "loss": 0.0206, + "epoch": 0.14, + "learning_rate": 0.0002788947615356899, + "loss": 0.0333, "step": 54280 }, { - "epoch": 0.27, - "learning_rate": 0.00025891499462693795, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.00027889087331931845, + "loss": 0.0267, "step": 54290 }, { - "epoch": 0.27, - "learning_rate": 0.00025890742693392393, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.00027888698510294697, + "loss": 0.0313, "step": 54300 }, { - "epoch": 0.27, - "learning_rate": 0.0002588998592409099, - "loss": 0.0159, + "epoch": 0.14, + "learning_rate": 0.00027888309688657554, + "loss": 0.0264, "step": 54310 }, { - "epoch": 0.27, - "learning_rate": 0.0002588922915478959, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.00027887920867020405, + "loss": 0.028, "step": 54320 }, { - "epoch": 0.27, - "learning_rate": 0.00025888472385488193, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.0002788753204538326, + "loss": 0.0311, "step": 54330 }, { - "epoch": 0.27, - "learning_rate": 0.0002588771561618679, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027887143223746114, + "loss": 0.0268, "step": 54340 }, { - "epoch": 0.27, - "learning_rate": 0.0002588695884688539, - "loss": 0.0184, + "epoch": 0.14, + "learning_rate": 0.00027886754402108965, + "loss": 0.0298, "step": 54350 }, { - "epoch": 0.27, - "learning_rate": 0.00025886202077583987, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.00027886365580471816, + "loss": 0.0248, "step": 54360 }, { - "epoch": 0.27, - "learning_rate": 0.00025885445308282585, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027885976758834673, + "loss": 0.0289, "step": 54370 }, { - "epoch": 0.27, - "learning_rate": 0.00025884688538981184, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.0002788558793719753, + "loss": 0.0236, "step": 54380 }, { - "epoch": 0.27, - "learning_rate": 0.0002588393176967978, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.0002788519911556038, + "loss": 0.0311, "step": 54390 }, { - "epoch": 0.27, - "learning_rate": 0.00025883175000378385, - "loss": 0.0253, + "epoch": 0.14, + "learning_rate": 0.00027884810293923233, + "loss": 0.0295, "step": 54400 }, { - "epoch": 0.27, - "learning_rate": 0.00025882418231076983, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.00027884421472286085, + "loss": 0.0223, "step": 54410 }, { - "epoch": 0.27, - "learning_rate": 0.0002588166146177558, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002788403265064894, + "loss": 0.0294, "step": 54420 }, { - "epoch": 0.27, - "learning_rate": 0.0002588090469247418, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.00027883643829011793, + "loss": 0.0312, "step": 54430 }, { - "epoch": 0.27, - "learning_rate": 0.0002588014792317278, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.0002788325500737465, + "loss": 0.0252, "step": 54440 }, { - "epoch": 0.27, - "learning_rate": 0.00025879391153871376, - "loss": 0.0228, + "epoch": 0.14, + "learning_rate": 0.000278828661857375, + "loss": 0.0241, "step": 54450 }, { - "epoch": 0.27, - "learning_rate": 0.0002587863438456998, - "loss": 0.0173, + "epoch": 0.14, + "learning_rate": 0.0002788247736410036, + "loss": 0.0263, "step": 54460 }, { - "epoch": 0.27, - "learning_rate": 0.0002587787761526858, - "loss": 0.0179, + "epoch": 0.14, + "learning_rate": 0.0002788208854246321, + "loss": 0.0316, "step": 54470 }, { - "epoch": 0.27, - "learning_rate": 0.00025877120845967176, - "loss": 0.0294, + "epoch": 0.14, + "learning_rate": 0.0002788169972082606, + "loss": 0.0284, "step": 54480 }, { - "epoch": 0.27, - "learning_rate": 0.00025876364076665774, - "loss": 0.023, + "epoch": 0.14, + "learning_rate": 0.0002788131089918891, + "loss": 0.0258, "step": 54490 }, { - "epoch": 0.27, - "learning_rate": 0.0002587560730736437, - "loss": 0.0196, + "epoch": 0.14, + "learning_rate": 0.0002788092207755177, + "loss": 0.0238, "step": 54500 }, { - "epoch": 0.28, - "learning_rate": 0.0002587485053806297, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.0002788053325591462, + "loss": 0.0301, "step": 54510 }, { - "epoch": 0.28, - "learning_rate": 0.00025874093768761574, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002788014443427748, + "loss": 0.029, "step": 54520 }, { - "epoch": 0.28, - "learning_rate": 0.0002587333699946017, - "loss": 0.0189, + "epoch": 0.14, + "learning_rate": 0.0002787975561264033, + "loss": 0.0262, "step": 54530 }, { - "epoch": 0.28, - "learning_rate": 0.0002587258023015877, - "loss": 0.022, + "epoch": 0.14, + "learning_rate": 0.00027879366791003186, + "loss": 0.0293, "step": 54540 }, { - "epoch": 0.28, - "learning_rate": 0.0002587182346085737, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.0002787897796936604, + "loss": 0.0256, "step": 54550 }, { - "epoch": 0.28, - "learning_rate": 0.00025871066691555966, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.0002787858914772889, + "loss": 0.0244, "step": 54560 }, { - "epoch": 0.28, - "learning_rate": 0.00025870309922254565, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.00027878200326091746, + "loss": 0.0242, "step": 54570 }, { - "epoch": 0.28, - "learning_rate": 0.00025869553152953163, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.00027877811504454597, + "loss": 0.0308, "step": 54580 }, { - "epoch": 0.28, - "learning_rate": 0.00025868796383651766, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027877422682817454, + "loss": 0.0271, "step": 54590 }, { - "epoch": 0.28, - "learning_rate": 0.00025868039614350364, - "loss": 0.0253, + "epoch": 0.14, + "learning_rate": 0.00027877033861180306, + "loss": 0.028, "step": 54600 }, { - "epoch": 0.28, - "learning_rate": 0.0002586728284504896, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.00027876645039543157, + "loss": 0.0256, "step": 54610 }, { - "epoch": 0.28, - "learning_rate": 0.0002586652607574756, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.0002787625621790601, + "loss": 0.0297, "step": 54620 }, { - "epoch": 0.28, - "learning_rate": 0.0002586576930644616, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.00027875867396268865, + "loss": 0.0266, "step": 54630 }, { - "epoch": 0.28, - "learning_rate": 0.00025865012537144757, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027875478574631717, + "loss": 0.0247, "step": 54640 }, { - "epoch": 0.28, - "learning_rate": 0.0002586425576784336, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.00027875089752994574, + "loss": 0.0288, "step": 54650 }, { - "epoch": 0.28, - "learning_rate": 0.0002586349899854196, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027874700931357425, + "loss": 0.0288, "step": 54660 }, { - "epoch": 0.28, - "learning_rate": 0.00025862742229240557, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002787431210972028, + "loss": 0.0273, "step": 54670 }, { - "epoch": 0.28, - "learning_rate": 0.0002586198545993915, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.00027873923288083133, + "loss": 0.0334, "step": 54680 }, { - "epoch": 0.28, - "learning_rate": 0.00025861228690637753, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.00027873534466445985, + "loss": 0.0261, "step": 54690 }, { - "epoch": 0.28, - "learning_rate": 0.0002586047192133635, - "loss": 0.0227, + "epoch": 0.14, + "learning_rate": 0.00027873145644808836, + "loss": 0.0263, "step": 54700 }, { - "epoch": 0.28, - "learning_rate": 0.0002585971515203495, - "loss": 0.0164, + "epoch": 0.14, + "learning_rate": 0.00027872756823171693, + "loss": 0.0279, "step": 54710 }, { - "epoch": 0.28, - "learning_rate": 0.0002585895838273355, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.0002787236800153455, + "loss": 0.0281, "step": 54720 }, { - "epoch": 0.28, - "learning_rate": 0.00025858201613432146, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.000278719791798974, + "loss": 0.0227, "step": 54730 }, { - "epoch": 0.28, - "learning_rate": 0.00025857444844130744, - "loss": 0.0213, + "epoch": 0.14, + "learning_rate": 0.00027871590358260253, + "loss": 0.025, "step": 54740 }, { - "epoch": 0.28, - "learning_rate": 0.0002585668807482935, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.0002787120153662311, + "loss": 0.0274, "step": 54750 }, { - "epoch": 0.28, - "learning_rate": 0.00025855931305527946, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.0002787081271498596, + "loss": 0.0281, "step": 54760 }, { - "epoch": 0.28, - "learning_rate": 0.00025855174536226544, - "loss": 0.0232, + "epoch": 0.14, + "learning_rate": 0.00027870423893348813, + "loss": 0.0291, "step": 54770 }, { - "epoch": 0.28, - "learning_rate": 0.0002585441776692514, - "loss": 0.0258, + "epoch": 0.14, + "learning_rate": 0.0002787003507171167, + "loss": 0.0305, "step": 54780 }, { - "epoch": 0.28, - "learning_rate": 0.0002585366099762374, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002786964625007452, + "loss": 0.0258, "step": 54790 }, { - "epoch": 0.28, - "learning_rate": 0.0002585290422832234, - "loss": 0.0201, + "epoch": 0.14, + "learning_rate": 0.0002786925742843738, + "loss": 0.0268, "step": 54800 }, { - "epoch": 0.28, - "learning_rate": 0.00025852147459020936, - "loss": 0.0246, + "epoch": 0.14, + "learning_rate": 0.0002786886860680023, + "loss": 0.0278, "step": 54810 }, { - "epoch": 0.28, - "learning_rate": 0.0002585139068971954, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.0002786847978516308, + "loss": 0.0316, "step": 54820 }, { - "epoch": 0.28, - "learning_rate": 0.0002585063392041814, - "loss": 0.0237, + "epoch": 0.14, + "learning_rate": 0.0002786809096352594, + "loss": 0.0279, "step": 54830 }, { - "epoch": 0.28, - "learning_rate": 0.00025849877151116736, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002786770214188879, + "loss": 0.0246, "step": 54840 }, { - "epoch": 0.28, - "learning_rate": 0.00025849120381815334, - "loss": 0.0289, + "epoch": 0.14, + "learning_rate": 0.0002786731332025164, + "loss": 0.0288, "step": 54850 }, { - "epoch": 0.28, - "learning_rate": 0.0002584836361251393, - "loss": 0.0304, + "epoch": 0.14, + "learning_rate": 0.000278669244986145, + "loss": 0.0266, "step": 54860 }, { - "epoch": 0.28, - "learning_rate": 0.0002584760684321253, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.0002786653567697735, + "loss": 0.0304, "step": 54870 }, { - "epoch": 0.28, - "learning_rate": 0.00025846850073911134, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.00027866146855340206, + "loss": 0.0289, "step": 54880 }, { - "epoch": 0.28, - "learning_rate": 0.0002584609330460973, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.0002786575803370306, + "loss": 0.0261, "step": 54890 }, { - "epoch": 0.28, - "learning_rate": 0.0002584533653530833, - "loss": 0.0176, + "epoch": 0.14, + "learning_rate": 0.0002786536921206591, + "loss": 0.0237, "step": 54900 }, { - "epoch": 0.28, - "learning_rate": 0.0002584457976600693, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.0002786498039042876, + "loss": 0.0234, "step": 54910 }, { - "epoch": 0.28, - "learning_rate": 0.00025843822996705527, - "loss": 0.0249, + "epoch": 0.14, + "learning_rate": 0.00027864591568791617, + "loss": 0.0295, "step": 54920 }, { - "epoch": 0.28, - "learning_rate": 0.00025843066227404125, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.00027864202747154474, + "loss": 0.0272, "step": 54930 }, { - "epoch": 0.28, - "learning_rate": 0.00025842309458102723, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027863813925517325, + "loss": 0.0233, "step": 54940 }, { - "epoch": 0.28, - "learning_rate": 0.00025841552688801327, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.00027863425103880177, + "loss": 0.0316, "step": 54950 }, { - "epoch": 0.28, - "learning_rate": 0.00025840795919499925, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.00027863036282243034, + "loss": 0.0307, "step": 54960 }, { - "epoch": 0.28, - "learning_rate": 0.00025840039150198523, - "loss": 0.0214, + "epoch": 0.14, + "learning_rate": 0.00027862647460605885, + "loss": 0.0311, "step": 54970 }, { - "epoch": 0.28, - "learning_rate": 0.0002583928238089712, - "loss": 0.0222, + "epoch": 0.14, + "learning_rate": 0.00027862258638968737, + "loss": 0.0273, "step": 54980 }, { - "epoch": 0.28, - "learning_rate": 0.0002583852561159572, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027861869817331594, + "loss": 0.0253, "step": 54990 }, { - "epoch": 0.28, - "learning_rate": 0.0002583776884229432, - "loss": 0.0218, + "epoch": 0.14, + "learning_rate": 0.00027861480995694445, + "loss": 0.0254, "step": 55000 }, { - "epoch": 0.28, - "eval_cer": 0.914472196695413, - "eval_loss": 0.014595328830182552, - "eval_runtime": 116.9041, - "eval_samples_per_second": 17.108, - "eval_steps_per_second": 4.277, + "epoch": 0.14, + "eval_cer": 0.881821655462573, + "eval_loss": 0.02109946869313717, + "eval_runtime": 108.1363, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 4.624, "step": 55000 }, { - "epoch": 0.28, - "learning_rate": 0.0002583701207299292, - "loss": 0.019, + "epoch": 0.14, + "learning_rate": 0.000278610921740573, + "loss": 0.0242, "step": 55010 }, { - "epoch": 0.28, - "learning_rate": 0.0002583625530369152, - "loss": 0.0263, + "epoch": 0.14, + "learning_rate": 0.00027860703352420153, + "loss": 0.0291, "step": 55020 }, { - "epoch": 0.28, - "learning_rate": 0.00025835498534390117, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.00027860314530783005, + "loss": 0.0259, "step": 55030 }, { - "epoch": 0.28, - "learning_rate": 0.00025834741765088715, - "loss": 0.0189, + "epoch": 0.14, + "learning_rate": 0.0002785992570914586, + "loss": 0.0267, "step": 55040 }, { - "epoch": 0.28, - "learning_rate": 0.00025833984995787313, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.00027859536887508713, + "loss": 0.0314, "step": 55050 }, { - "epoch": 0.28, - "learning_rate": 0.0002583322822648591, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.00027859148065871565, + "loss": 0.0352, "step": 55060 }, { - "epoch": 0.28, - "learning_rate": 0.00025832471457184515, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.0002785875924423442, + "loss": 0.0326, "step": 55070 }, { - "epoch": 0.28, - "learning_rate": 0.00025831714687883113, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.00027858370422597273, + "loss": 0.0299, "step": 55080 }, { - "epoch": 0.28, - "learning_rate": 0.0002583095791858171, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.0002785798160096013, + "loss": 0.031, "step": 55090 }, { - "epoch": 0.28, - "learning_rate": 0.0002583020114928031, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.0002785759277932298, + "loss": 0.0238, "step": 55100 }, { - "epoch": 0.28, - "learning_rate": 0.0002582944437997891, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.0002785720395768583, + "loss": 0.0287, "step": 55110 }, { - "epoch": 0.28, - "learning_rate": 0.00025828687610677506, - "loss": 0.0173, + "epoch": 0.14, + "learning_rate": 0.0002785681513604869, + "loss": 0.0305, "step": 55120 }, { - "epoch": 0.28, - "learning_rate": 0.00025827930841376104, - "loss": 0.0308, + "epoch": 0.14, + "learning_rate": 0.0002785642631441154, + "loss": 0.0259, "step": 55130 }, { - "epoch": 0.28, - "learning_rate": 0.0002582717407207471, - "loss": 0.0244, + "epoch": 0.14, + "learning_rate": 0.000278560374927744, + "loss": 0.0293, "step": 55140 }, { - "epoch": 0.28, - "learning_rate": 0.00025826417302773306, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.0002785564867113725, + "loss": 0.0296, "step": 55150 }, { - "epoch": 0.28, - "learning_rate": 0.00025825660533471904, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.000278552598495001, + "loss": 0.028, "step": 55160 }, { - "epoch": 0.28, - "learning_rate": 0.000258249037641705, - "loss": 0.0309, + "epoch": 0.14, + "learning_rate": 0.0002785487102786296, + "loss": 0.0301, "step": 55170 }, { - "epoch": 0.28, - "learning_rate": 0.000258241469948691, - "loss": 0.024, + "epoch": 0.14, + "learning_rate": 0.0002785448220622581, + "loss": 0.0271, "step": 55180 }, { - "epoch": 0.28, - "learning_rate": 0.000258233902255677, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.0002785409338458866, + "loss": 0.0272, "step": 55190 }, { - "epoch": 0.28, - "learning_rate": 0.000258226334562663, - "loss": 0.0193, + "epoch": 0.14, + "learning_rate": 0.0002785370456295152, + "loss": 0.0272, "step": 55200 }, { - "epoch": 0.28, - "learning_rate": 0.000258218766869649, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.0002785331574131437, + "loss": 0.0304, "step": 55210 }, { - "epoch": 0.28, - "learning_rate": 0.000258211199176635, - "loss": 0.02, + "epoch": 0.14, + "learning_rate": 0.00027852926919677226, + "loss": 0.028, "step": 55220 }, { - "epoch": 0.28, - "learning_rate": 0.00025820363148362096, - "loss": 0.0266, + "epoch": 0.14, + "learning_rate": 0.00027852538098040077, + "loss": 0.0258, "step": 55230 }, { - "epoch": 0.28, - "learning_rate": 0.00025819606379060694, - "loss": 0.0234, + "epoch": 0.14, + "learning_rate": 0.0002785214927640293, + "loss": 0.0265, "step": 55240 }, { - "epoch": 0.28, - "learning_rate": 0.0002581884960975929, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.00027851760454765786, + "loss": 0.0239, "step": 55250 }, { - "epoch": 0.28, - "learning_rate": 0.00025818092840457896, - "loss": 0.0241, + "epoch": 0.14, + "learning_rate": 0.00027851371633128637, + "loss": 0.0218, "step": 55260 }, { - "epoch": 0.28, - "learning_rate": 0.00025817336071156494, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.00027850982811491494, + "loss": 0.0293, "step": 55270 }, { - "epoch": 0.28, - "learning_rate": 0.0002581657930185509, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.00027850593989854345, + "loss": 0.0278, "step": 55280 }, { - "epoch": 0.28, - "learning_rate": 0.0002581582253255369, - "loss": 0.0206, + "epoch": 0.14, + "learning_rate": 0.000278502051682172, + "loss": 0.0247, "step": 55290 }, { - "epoch": 0.28, - "learning_rate": 0.0002581506576325229, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027849816346580054, + "loss": 0.03, "step": 55300 }, { - "epoch": 0.28, - "learning_rate": 0.00025814308993950887, - "loss": 0.0211, + "epoch": 0.14, + "learning_rate": 0.00027849427524942905, + "loss": 0.0294, "step": 55310 }, { - "epoch": 0.28, - "learning_rate": 0.00025813552224649485, - "loss": 0.0247, + "epoch": 0.14, + "learning_rate": 0.00027849038703305757, + "loss": 0.0237, "step": 55320 }, { - "epoch": 0.28, - "learning_rate": 0.0002581279545534809, - "loss": 0.0197, + "epoch": 0.14, + "learning_rate": 0.00027848649881668613, + "loss": 0.0271, "step": 55330 }, { - "epoch": 0.28, - "learning_rate": 0.00025812038686046687, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.00027848261060031465, + "loss": 0.0272, "step": 55340 }, { - "epoch": 0.28, - "learning_rate": 0.00025811281916745285, - "loss": 0.0182, + "epoch": 0.14, + "learning_rate": 0.0002784787223839432, + "loss": 0.027, "step": 55350 }, { - "epoch": 0.28, - "learning_rate": 0.00025810525147443883, - "loss": 0.0203, + "epoch": 0.14, + "learning_rate": 0.00027847483416757173, + "loss": 0.0265, "step": 55360 }, { - "epoch": 0.28, - "learning_rate": 0.0002580976837814248, - "loss": 0.018, + "epoch": 0.14, + "learning_rate": 0.00027847094595120025, + "loss": 0.0304, "step": 55370 }, { - "epoch": 0.28, - "learning_rate": 0.0002580901160884108, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.0002784670577348288, + "loss": 0.0313, "step": 55380 }, { - "epoch": 0.28, - "learning_rate": 0.00025808254839539683, - "loss": 0.0196, + "epoch": 0.14, + "learning_rate": 0.00027846316951845733, + "loss": 0.0259, "step": 55390 }, { - "epoch": 0.28, - "learning_rate": 0.0002580749807023828, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.00027845928130208584, + "loss": 0.0366, "step": 55400 }, { - "epoch": 0.28, - "learning_rate": 0.0002580674130093688, - "loss": 0.025, + "epoch": 0.14, + "learning_rate": 0.0002784553930857144, + "loss": 0.0232, "step": 55410 }, { - "epoch": 0.28, - "learning_rate": 0.0002580598453163548, - "loss": 0.0202, + "epoch": 0.14, + "learning_rate": 0.000278451504869343, + "loss": 0.0275, "step": 55420 }, { - "epoch": 0.28, - "learning_rate": 0.00025805227762334075, - "loss": 0.0212, + "epoch": 0.14, + "learning_rate": 0.0002784476166529715, + "loss": 0.0275, "step": 55430 }, { - "epoch": 0.28, - "learning_rate": 0.00025804470993032674, - "loss": 0.0207, + "epoch": 0.14, + "learning_rate": 0.0002784437284366, + "loss": 0.0243, "step": 55440 }, { - "epoch": 0.28, - "learning_rate": 0.0002580371422373127, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.0002784398402202285, + "loss": 0.0304, "step": 55450 }, { - "epoch": 0.28, - "learning_rate": 0.00025802957454429875, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.0002784359520038571, + "loss": 0.0289, "step": 55460 }, { - "epoch": 0.28, - "learning_rate": 0.00025802200685128473, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.0002784320637874856, + "loss": 0.027, "step": 55470 }, { - "epoch": 0.28, - "learning_rate": 0.0002580144391582707, - "loss": 0.0219, + "epoch": 0.14, + "learning_rate": 0.0002784281755711142, + "loss": 0.026, "step": 55480 }, { - "epoch": 0.28, - "learning_rate": 0.0002580068714652567, - "loss": 0.0261, + "epoch": 0.14, + "learning_rate": 0.0002784242873547427, + "loss": 0.0303, "step": 55490 }, { - "epoch": 0.28, - "learning_rate": 0.0002579993037722427, - "loss": 0.0177, + "epoch": 0.14, + "learning_rate": 0.00027842039913837126, + "loss": 0.0218, "step": 55500 }, { - "epoch": 0.28, - "learning_rate": 0.00025799173607922866, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.0002784165109219998, + "loss": 0.0262, "step": 55510 }, { - "epoch": 0.28, - "learning_rate": 0.0002579841683862147, - "loss": 0.0184, + "epoch": 0.14, + "learning_rate": 0.0002784126227056283, + "loss": 0.0268, "step": 55520 }, { - "epoch": 0.28, - "learning_rate": 0.0002579766006932007, - "loss": 0.021, + "epoch": 0.14, + "learning_rate": 0.0002784087344892568, + "loss": 0.0276, "step": 55530 }, { - "epoch": 0.28, - "learning_rate": 0.00025796903300018666, - "loss": 0.0221, + "epoch": 0.14, + "learning_rate": 0.00027840484627288537, + "loss": 0.0285, "step": 55540 }, { - "epoch": 0.28, - "learning_rate": 0.00025796146530717264, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.0002784009580565139, + "loss": 0.0295, "step": 55550 }, { - "epoch": 0.28, - "learning_rate": 0.0002579538976141586, - "loss": 0.0187, - "step": 55560 + "epoch": 0.14, + "learning_rate": 0.00027839706984014246, + "loss": 0.0271, + "step": 55560 }, { - "epoch": 0.28, - "learning_rate": 0.0002579463299211446, - "loss": 0.0199, + "epoch": 0.14, + "learning_rate": 0.00027839318162377097, + "loss": 0.0258, "step": 55570 }, { - "epoch": 0.28, - "learning_rate": 0.00025793876222813064, - "loss": 0.0181, + "epoch": 0.14, + "learning_rate": 0.0002783892934073995, + "loss": 0.0302, "step": 55580 }, { - "epoch": 0.28, - "learning_rate": 0.0002579311945351166, - "loss": 0.0181, + "epoch": 0.14, + "learning_rate": 0.00027838540519102805, + "loss": 0.024, "step": 55590 }, { - "epoch": 0.28, - "learning_rate": 0.0002579236268421026, - "loss": 0.0198, + "epoch": 0.14, + "learning_rate": 0.00027838151697465657, + "loss": 0.0267, "step": 55600 }, { - "epoch": 0.28, - "learning_rate": 0.0002579160591490886, - "loss": 0.0223, + "epoch": 0.14, + "learning_rate": 0.0002783776287582851, + "loss": 0.022, "step": 55610 }, { - "epoch": 0.28, - "learning_rate": 0.00025790849145607456, - "loss": 0.0208, + "epoch": 0.14, + "learning_rate": 0.00027837374054191365, + "loss": 0.0253, "step": 55620 }, { - "epoch": 0.28, - "learning_rate": 0.00025790092376306055, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.0002783698523255422, + "loss": 0.0271, "step": 55630 }, { - "epoch": 0.28, - "learning_rate": 0.00025789335607004653, - "loss": 0.0182, + "epoch": 0.14, + "learning_rate": 0.00027836596410917073, + "loss": 0.0259, "step": 55640 }, { - "epoch": 0.28, - "learning_rate": 0.00025788578837703256, - "loss": 0.0224, + "epoch": 0.14, + "learning_rate": 0.00027836207589279925, + "loss": 0.0312, "step": 55650 }, { - "epoch": 0.28, - "learning_rate": 0.00025787822068401854, - "loss": 0.0204, + "epoch": 0.14, + "learning_rate": 0.00027835818767642776, + "loss": 0.0251, "step": 55660 }, { - "epoch": 0.28, - "learning_rate": 0.0002578706529910045, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.00027835429946005633, + "loss": 0.0289, "step": 55670 }, { - "epoch": 0.28, - "learning_rate": 0.0002578630852979905, - "loss": 0.023, + "epoch": 0.14, + "learning_rate": 0.00027835041124368485, + "loss": 0.033, "step": 55680 }, { - "epoch": 0.28, - "learning_rate": 0.0002578555176049765, - "loss": 0.0216, + "epoch": 0.14, + "learning_rate": 0.0002783465230273134, + "loss": 0.0286, "step": 55690 }, { - "epoch": 0.28, - "learning_rate": 0.00025784794991196247, - "loss": 0.0186, + "epoch": 0.14, + "learning_rate": 0.00027834263481094193, + "loss": 0.0254, "step": 55700 }, { - "epoch": 0.28, - "learning_rate": 0.0002578403822189485, - "loss": 0.0194, + "epoch": 0.14, + "learning_rate": 0.0002783387465945705, + "loss": 0.0237, "step": 55710 }, { - "epoch": 0.28, - "learning_rate": 0.0002578328145259345, - "loss": 0.0233, + "epoch": 0.14, + "learning_rate": 0.000278334858378199, + "loss": 0.0239, "step": 55720 }, { - "epoch": 0.28, - "learning_rate": 0.00025782524683292047, - "loss": 0.0215, + "epoch": 0.14, + "learning_rate": 0.00027833097016182753, + "loss": 0.0207, "step": 55730 }, { - "epoch": 0.28, - "learning_rate": 0.00025781767913990645, - "loss": 0.0178, + "epoch": 0.14, + "learning_rate": 0.00027832708194545604, + "loss": 0.0277, "step": 55740 }, { - "epoch": 0.28, - "learning_rate": 0.00025781011144689243, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.0002783231937290846, + "loss": 0.0256, "step": 55750 }, { - "epoch": 0.28, - "learning_rate": 0.0002578025437538784, - "loss": 0.0231, + "epoch": 0.14, + "learning_rate": 0.0002783193055127131, + "loss": 0.0277, "step": 55760 }, { - "epoch": 0.28, - "learning_rate": 0.00025779497606086445, - "loss": 0.0192, + "epoch": 0.14, + "learning_rate": 0.0002783154172963417, + "loss": 0.0232, "step": 55770 }, { - "epoch": 0.28, - "learning_rate": 0.00025778740836785043, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002783115290799702, + "loss": 0.0303, "step": 55780 }, { - "epoch": 0.28, - "learning_rate": 0.0002577798406748364, - "loss": 0.0225, + "epoch": 0.14, + "learning_rate": 0.0002783076408635988, + "loss": 0.0273, "step": 55790 }, { - "epoch": 0.28, - "learning_rate": 0.0002577722729818224, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.0002783037526472273, + "loss": 0.029, "step": 55800 }, { - "epoch": 0.28, - "learning_rate": 0.0002577647052888084, - "loss": 0.0206, + "epoch": 0.14, + "learning_rate": 0.0002782998644308558, + "loss": 0.0389, "step": 55810 }, { - "epoch": 0.28, - "learning_rate": 0.00025775713759579436, - "loss": 0.0156, + "epoch": 0.14, + "learning_rate": 0.0002782959762144844, + "loss": 0.025, "step": 55820 }, { - "epoch": 0.28, - "learning_rate": 0.00025774956990278034, - "loss": 0.0205, + "epoch": 0.14, + "learning_rate": 0.0002782920879981129, + "loss": 0.0285, "step": 55830 }, { - "epoch": 0.28, - "learning_rate": 0.0002577420022097664, - "loss": 0.0191, + "epoch": 0.14, + "learning_rate": 0.00027828819978174146, + "loss": 0.0303, "step": 55840 }, { - "epoch": 0.28, - "learning_rate": 0.00025773443451675235, - "loss": 0.0242, + "epoch": 0.14, + "learning_rate": 0.00027828431156537, + "loss": 0.0269, "step": 55850 }, { - "epoch": 0.28, - "learning_rate": 0.00025772686682373834, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.0002782804233489985, + "loss": 0.036, "step": 55860 }, { - "epoch": 0.28, - "learning_rate": 0.0002577192991307243, - "loss": 0.0188, + "epoch": 0.14, + "learning_rate": 0.000278276535132627, + "loss": 0.0322, "step": 55870 }, { - "epoch": 0.28, - "learning_rate": 0.0002577117314377103, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027827264691625557, + "loss": 0.0303, "step": 55880 }, { - "epoch": 0.28, - "learning_rate": 0.0002577041637446963, - "loss": 0.0209, + "epoch": 0.14, + "learning_rate": 0.0002782687586998841, + "loss": 0.0244, "step": 55890 }, { - "epoch": 0.28, - "learning_rate": 0.0002576965960516823, - "loss": 0.0239, + "epoch": 0.14, + "learning_rate": 0.00027826487048351265, + "loss": 0.0295, "step": 55900 }, { - "epoch": 0.28, - "learning_rate": 0.0002576890283586683, - "loss": 0.0183, + "epoch": 0.14, + "learning_rate": 0.00027826098226714117, + "loss": 0.0312, "step": 55910 }, { - "epoch": 0.28, - "learning_rate": 0.0002576814606656543, - "loss": 0.0171, + "epoch": 0.14, + "learning_rate": 0.00027825709405076974, + "loss": 0.0245, "step": 55920 }, { - "epoch": 0.28, - "learning_rate": 0.00025767389297264026, - "loss": 0.0187, + "epoch": 0.14, + "learning_rate": 0.00027825320583439825, + "loss": 0.0291, "step": 55930 }, { - "epoch": 0.28, - "learning_rate": 0.00025766632527962624, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027824931761802677, + "loss": 0.0426, "step": 55940 }, { - "epoch": 0.28, - "learning_rate": 0.0002576587575866122, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.0002782454294016553, + "loss": 0.0298, "step": 55950 }, { - "epoch": 0.28, - "learning_rate": 0.0002576511898935982, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.00027824154118528385, + "loss": 0.0274, "step": 55960 }, { - "epoch": 0.28, - "learning_rate": 0.0002576436222005842, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.0002782376529689124, + "loss": 0.0271, "step": 55970 }, { - "epoch": 0.28, - "learning_rate": 0.00025763605450757017, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.00027823376475254093, + "loss": 0.0384, "step": 55980 }, { - "epoch": 0.28, - "learning_rate": 0.00025762848681455615, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.00027822987653616945, + "loss": 0.0299, "step": 55990 }, { - "epoch": 0.28, - "learning_rate": 0.0002576209191215422, - "loss": 0.0231, + "epoch": 0.15, + "learning_rate": 0.000278225988319798, + "loss": 0.0241, "step": 56000 }, { - "epoch": 0.28, - "eval_cer": 0.9144886934295449, - "eval_loss": 0.014846866950392723, - "eval_runtime": 116.7024, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.284, + "epoch": 0.15, + "eval_cer": 0.8818426500165857, + "eval_loss": 0.020007161423563957, + "eval_runtime": 108.0119, + "eval_samples_per_second": 18.516, + "eval_steps_per_second": 4.629, "step": 56000 }, { - "epoch": 0.28, - "learning_rate": 0.00025761335142852817, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.00027822210010342653, + "loss": 0.0327, "step": 56010 }, { - "epoch": 0.28, - "learning_rate": 0.00025760578373551415, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027821821188705505, + "loss": 0.0303, "step": 56020 }, { - "epoch": 0.28, - "learning_rate": 0.00025759821604250013, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.0002782143236706836, + "loss": 0.0272, "step": 56030 }, { - "epoch": 0.28, - "learning_rate": 0.0002575906483494861, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027821043545431213, + "loss": 0.0292, "step": 56040 }, { - "epoch": 0.28, - "learning_rate": 0.0002575830806564721, - "loss": 0.0159, + "epoch": 0.15, + "learning_rate": 0.0002782065472379407, + "loss": 0.0261, "step": 56050 }, { - "epoch": 0.28, - "learning_rate": 0.0002575755129634581, - "loss": 0.0219, + "epoch": 0.15, + "learning_rate": 0.0002782026590215692, + "loss": 0.0303, "step": 56060 }, { - "epoch": 0.28, - "learning_rate": 0.0002575679452704441, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027819877080519773, + "loss": 0.0298, "step": 56070 }, { - "epoch": 0.28, - "learning_rate": 0.0002575603775774301, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.00027819488258882624, + "loss": 0.0248, "step": 56080 }, { - "epoch": 0.28, - "learning_rate": 0.00025755280988441607, - "loss": 0.0166, + "epoch": 0.15, + "learning_rate": 0.0002781909943724548, + "loss": 0.0269, "step": 56090 }, { - "epoch": 0.28, - "learning_rate": 0.00025754524219140205, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.0002781871061560833, + "loss": 0.0291, "step": 56100 }, { - "epoch": 0.28, - "learning_rate": 0.00025753767449838803, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.0002781832179397119, + "loss": 0.0246, "step": 56110 }, { - "epoch": 0.28, - "learning_rate": 0.000257530106805374, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.0002781793297233404, + "loss": 0.0282, "step": 56120 }, { - "epoch": 0.28, - "learning_rate": 0.00025752253911236005, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.000278175441506969, + "loss": 0.0294, "step": 56130 }, { - "epoch": 0.28, - "learning_rate": 0.00025751497141934603, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.0002781715532905975, + "loss": 0.029, "step": 56140 }, { - "epoch": 0.28, - "learning_rate": 0.000257507403726332, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.000278167665074226, + "loss": 0.0283, "step": 56150 }, { - "epoch": 0.28, - "learning_rate": 0.000257499836033318, - "loss": 0.0181, + "epoch": 0.15, + "learning_rate": 0.0002781637768578546, + "loss": 0.036, "step": 56160 }, { - "epoch": 0.28, - "learning_rate": 0.000257492268340304, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.0002781598886414831, + "loss": 0.0245, "step": 56170 }, { - "epoch": 0.28, - "learning_rate": 0.00025748470064728996, - "loss": 0.0231, + "epoch": 0.15, + "learning_rate": 0.00027815600042511166, + "loss": 0.0371, "step": 56180 }, { - "epoch": 0.28, - "learning_rate": 0.00025747713295427594, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.00027815211220874017, + "loss": 0.0281, "step": 56190 }, { - "epoch": 0.28, - "learning_rate": 0.000257469565261262, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.0002781482239923687, + "loss": 0.0245, "step": 56200 }, { - "epoch": 0.28, - "learning_rate": 0.00025746199756824796, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027814433577599726, + "loss": 0.0276, "step": 56210 }, { - "epoch": 0.28, - "learning_rate": 0.00025745442987523394, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.00027814044755962577, + "loss": 0.0325, "step": 56220 }, { - "epoch": 0.28, - "learning_rate": 0.0002574468621822199, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002781365593432543, + "loss": 0.0291, "step": 56230 }, { - "epoch": 0.28, - "learning_rate": 0.0002574392944892059, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.00027813267112688285, + "loss": 0.0312, "step": 56240 }, { - "epoch": 0.28, - "learning_rate": 0.0002574317267961919, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027812878291051137, + "loss": 0.0254, "step": 56250 }, { - "epoch": 0.28, - "learning_rate": 0.0002574241591031779, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.00027812489469413994, + "loss": 0.0322, "step": 56260 }, { - "epoch": 0.28, - "learning_rate": 0.0002574165914101639, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.00027812100647776845, + "loss": 0.0256, "step": 56270 }, { - "epoch": 0.28, - "learning_rate": 0.0002574090237171499, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.00027811711826139697, + "loss": 0.0283, "step": 56280 }, { - "epoch": 0.28, - "learning_rate": 0.00025740145602413586, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.00027811323004502553, + "loss": 0.0231, "step": 56290 }, { - "epoch": 0.28, - "learning_rate": 0.00025739388833112184, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.00027810934182865405, + "loss": 0.0205, "step": 56300 }, { - "epoch": 0.28, - "learning_rate": 0.0002573863206381078, - "loss": 0.0243, + "epoch": 0.15, + "learning_rate": 0.0002781054536122826, + "loss": 0.0273, "step": 56310 }, { - "epoch": 0.28, - "learning_rate": 0.00025737875294509386, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.00027810156539591113, + "loss": 0.0252, "step": 56320 }, { - "epoch": 0.28, - "learning_rate": 0.00025737118525207984, - "loss": 0.0221, + "epoch": 0.15, + "learning_rate": 0.00027809767717953965, + "loss": 0.0249, "step": 56330 }, { - "epoch": 0.28, - "learning_rate": 0.0002573636175590658, - "loss": 0.0257, + "epoch": 0.15, + "learning_rate": 0.0002780937889631682, + "loss": 0.0308, "step": 56340 }, { - "epoch": 0.28, - "learning_rate": 0.0002573560498660518, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.00027808990074679673, + "loss": 0.0273, "step": 56350 }, { - "epoch": 0.28, - "learning_rate": 0.0002573484821730378, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.00027808601253042525, + "loss": 0.0259, "step": 56360 }, { - "epoch": 0.28, - "learning_rate": 0.00025734091448002377, - "loss": 0.0191, + "epoch": 0.15, + "learning_rate": 0.0002780821243140538, + "loss": 0.0275, "step": 56370 }, { - "epoch": 0.28, - "learning_rate": 0.00025733334678700975, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027807823609768233, + "loss": 0.0267, "step": 56380 }, { - "epoch": 0.28, - "learning_rate": 0.0002573257790939958, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.0002780743478813109, + "loss": 0.0259, "step": 56390 }, { - "epoch": 0.28, - "learning_rate": 0.00025731821140098177, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.0002780704596649394, + "loss": 0.0284, "step": 56400 }, { - "epoch": 0.28, - "learning_rate": 0.00025731064370796775, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.0002780665714485679, + "loss": 0.0261, "step": 56410 }, { - "epoch": 0.28, - "learning_rate": 0.00025730307601495373, - "loss": 0.0271, + "epoch": 0.15, + "learning_rate": 0.0002780626832321965, + "loss": 0.0305, "step": 56420 }, { - "epoch": 0.28, - "learning_rate": 0.0002572955083219397, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.000278058795015825, + "loss": 0.0438, "step": 56430 }, { - "epoch": 0.28, - "learning_rate": 0.0002572879406289257, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.0002780549067994535, + "loss": 0.0279, "step": 56440 }, { - "epoch": 0.28, - "learning_rate": 0.00025728037293591173, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002780510185830821, + "loss": 0.0401, "step": 56450 }, { - "epoch": 0.28, - "learning_rate": 0.0002572728052428977, - "loss": 0.037, + "epoch": 0.15, + "learning_rate": 0.00027804713036671066, + "loss": 0.0323, "step": 56460 }, { - "epoch": 0.28, - "learning_rate": 0.0002572652375498837, - "loss": 0.0182, + "epoch": 0.15, + "learning_rate": 0.0002780432421503392, + "loss": 0.0336, "step": 56470 }, { - "epoch": 0.28, - "learning_rate": 0.0002572576698568697, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.0002780393539339677, + "loss": 0.0274, "step": 56480 }, { - "epoch": 0.28, - "learning_rate": 0.00025725010216385565, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.0002780354657175962, + "loss": 0.0306, "step": 56490 }, { - "epoch": 0.29, - "learning_rate": 0.00025724253447084164, - "loss": 0.0252, + "epoch": 0.15, + "learning_rate": 0.0002780315775012248, + "loss": 0.0284, "step": 56500 }, { - "epoch": 0.29, - "learning_rate": 0.0002572349667778276, - "loss": 0.0242, + "epoch": 0.15, + "learning_rate": 0.0002780276892848533, + "loss": 0.0277, "step": 56510 }, { - "epoch": 0.29, - "learning_rate": 0.00025722739908481365, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.00027802380106848186, + "loss": 0.0322, "step": 56520 }, { - "epoch": 0.29, - "learning_rate": 0.00025721983139179963, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.00027801991285211037, + "loss": 0.0315, "step": 56530 }, { - "epoch": 0.29, - "learning_rate": 0.0002572122636987856, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.00027801602463573894, + "loss": 0.0295, "step": 56540 }, { - "epoch": 0.29, - "learning_rate": 0.0002572046960057716, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.00027801213641936745, + "loss": 0.026, "step": 56550 }, { - "epoch": 0.29, - "learning_rate": 0.0002571971283127576, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027800824820299597, + "loss": 0.0237, "step": 56560 }, { - "epoch": 0.29, - "learning_rate": 0.00025718956061974356, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.0002780043599866245, + "loss": 0.0287, "step": 56570 }, { - "epoch": 0.29, - "learning_rate": 0.0002571819929267296, - "loss": 0.0183, + "epoch": 0.15, + "learning_rate": 0.00027800047177025305, + "loss": 0.0281, "step": 56580 }, { - "epoch": 0.29, - "learning_rate": 0.0002571744252337156, - "loss": 0.0237, + "epoch": 0.15, + "learning_rate": 0.00027799658355388157, + "loss": 0.024, "step": 56590 }, { - "epoch": 0.29, - "learning_rate": 0.00025716685754070156, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027799269533751014, + "loss": 0.0312, "step": 56600 }, { - "epoch": 0.29, - "learning_rate": 0.00025715928984768754, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.00027798880712113865, + "loss": 0.0261, "step": 56610 }, { - "epoch": 0.29, - "learning_rate": 0.0002571517221546735, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027798491890476716, + "loss": 0.0261, "step": 56620 }, { - "epoch": 0.29, - "learning_rate": 0.0002571441544616595, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.00027798103068839573, + "loss": 0.0282, "step": 56630 }, { - "epoch": 0.29, - "learning_rate": 0.00025713658676864554, - "loss": 0.0181, + "epoch": 0.15, + "learning_rate": 0.00027797714247202425, + "loss": 0.03, "step": 56640 }, { - "epoch": 0.29, - "learning_rate": 0.0002571290190756315, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.00027797325425565276, + "loss": 0.0283, "step": 56650 }, { - "epoch": 0.29, - "learning_rate": 0.0002571214513826175, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027796936603928133, + "loss": 0.0225, "step": 56660 }, { - "epoch": 0.29, - "learning_rate": 0.0002571138836896035, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.0002779654778229099, + "loss": 0.0279, "step": 56670 }, { - "epoch": 0.29, - "learning_rate": 0.00025710631599658946, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.0002779615896065384, + "loss": 0.0243, "step": 56680 }, { - "epoch": 0.29, - "learning_rate": 0.00025709874830357545, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027795770139016693, + "loss": 0.0286, "step": 56690 }, { - "epoch": 0.29, - "learning_rate": 0.00025709118061056143, - "loss": 0.0234, + "epoch": 0.15, + "learning_rate": 0.00027795381317379544, + "loss": 0.0258, "step": 56700 }, { - "epoch": 0.29, - "learning_rate": 0.00025708361291754746, - "loss": 0.027, + "epoch": 0.15, + "learning_rate": 0.000277949924957424, + "loss": 0.0305, "step": 56710 }, { - "epoch": 0.29, - "learning_rate": 0.00025707604522453344, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.00027794603674105253, + "loss": 0.0384, "step": 56720 }, { - "epoch": 0.29, - "learning_rate": 0.0002570684775315194, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.0002779421485246811, + "loss": 0.0287, "step": 56730 }, { - "epoch": 0.29, - "learning_rate": 0.0002570609098385054, - "loss": 0.0168, + "epoch": 0.15, + "learning_rate": 0.0002779382603083096, + "loss": 0.0336, "step": 56740 }, { - "epoch": 0.29, - "learning_rate": 0.0002570533421454914, - "loss": 0.0177, + "epoch": 0.15, + "learning_rate": 0.0002779343720919382, + "loss": 0.0268, "step": 56750 }, { - "epoch": 0.29, - "learning_rate": 0.00025704577445247737, - "loss": 0.0176, + "epoch": 0.15, + "learning_rate": 0.0002779304838755667, + "loss": 0.0294, "step": 56760 }, { - "epoch": 0.29, - "learning_rate": 0.0002570382067594634, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.0002779265956591952, + "loss": 0.0268, "step": 56770 }, { - "epoch": 0.29, - "learning_rate": 0.0002570306390664494, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.0002779227074428237, + "loss": 0.0287, "step": 56780 }, { - "epoch": 0.29, - "learning_rate": 0.00025702307137343537, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.0002779188192264523, + "loss": 0.0226, "step": 56790 }, { - "epoch": 0.29, - "learning_rate": 0.00025701550368042135, - "loss": 0.0257, + "epoch": 0.15, + "learning_rate": 0.0002779149310100808, + "loss": 0.0305, "step": 56800 }, { - "epoch": 0.29, - "learning_rate": 0.00025700793598740733, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.0002779110427937094, + "loss": 0.0281, "step": 56810 }, { - "epoch": 0.29, - "learning_rate": 0.0002570003682943933, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.0002779071545773379, + "loss": 0.0256, "step": 56820 }, { - "epoch": 0.29, - "learning_rate": 0.00025699280060137935, + "epoch": 0.15, + "learning_rate": 0.0002779032663609664, "loss": 0.0229, "step": 56830 }, { - "epoch": 0.29, - "learning_rate": 0.00025698523290836533, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.00027789937814459497, + "loss": 0.0258, "step": 56840 }, { - "epoch": 0.29, - "learning_rate": 0.0002569776652153513, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.0002778954899282235, + "loss": 0.0283, "step": 56850 }, { - "epoch": 0.29, - "learning_rate": 0.0002569700975223373, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.00027789160171185206, + "loss": 0.0366, "step": 56860 }, { - "epoch": 0.29, - "learning_rate": 0.0002569625298293233, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.00027788771349548057, + "loss": 0.0334, "step": 56870 }, { - "epoch": 0.29, - "learning_rate": 0.00025695496213630926, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.00027788382527910914, + "loss": 0.0329, "step": 56880 }, { - "epoch": 0.29, - "learning_rate": 0.00025694739444329524, - "loss": 0.017, + "epoch": 0.15, + "learning_rate": 0.00027787993706273765, + "loss": 0.0277, "step": 56890 }, { - "epoch": 0.29, - "learning_rate": 0.0002569398267502813, - "loss": 0.0427, + "epoch": 0.15, + "learning_rate": 0.00027787604884636617, + "loss": 0.0304, "step": 56900 }, { - "epoch": 0.29, - "learning_rate": 0.00025693225905726725, - "loss": 0.0221, + "epoch": 0.15, + "learning_rate": 0.0002778721606299947, + "loss": 0.0268, "step": 56910 }, { - "epoch": 0.29, - "learning_rate": 0.00025692469136425324, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027786827241362325, + "loss": 0.0311, "step": 56920 }, { - "epoch": 0.29, - "learning_rate": 0.0002569171236712392, - "loss": 0.03, + "epoch": 0.15, + "learning_rate": 0.00027786438419725177, + "loss": 0.0267, "step": 56930 }, { - "epoch": 0.29, - "learning_rate": 0.0002569095559782252, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027786049598088033, + "loss": 0.0317, "step": 56940 }, { - "epoch": 0.29, - "learning_rate": 0.0002569019882852112, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.00027785660776450885, + "loss": 0.0263, "step": 56950 }, { - "epoch": 0.29, - "learning_rate": 0.0002568944205921972, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002778527195481374, + "loss": 0.0246, "step": 56960 }, { - "epoch": 0.29, - "learning_rate": 0.0002568868528991832, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.00027784883133176593, + "loss": 0.029, "step": 56970 }, { - "epoch": 0.29, - "learning_rate": 0.0002568792852061692, - "loss": 0.028, + "epoch": 0.15, + "learning_rate": 0.00027784494311539445, + "loss": 0.0297, "step": 56980 }, { - "epoch": 0.29, - "learning_rate": 0.00025687171751315516, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027784105489902296, + "loss": 0.0256, "step": 56990 }, { - "epoch": 0.29, - "learning_rate": 0.00025686414982014114, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.00027783716668265153, + "loss": 0.0255, "step": 57000 }, { - "epoch": 0.29, - "eval_cer": 0.9144644335264098, - "eval_loss": 0.014634103514254093, - "eval_runtime": 116.5702, - "eval_samples_per_second": 17.157, - "eval_steps_per_second": 4.289, + "epoch": 0.15, + "eval_cer": 0.8818160569148363, + "eval_loss": 0.019956447184085846, + "eval_runtime": 108.1102, + "eval_samples_per_second": 18.5, + "eval_steps_per_second": 4.625, "step": 57000 }, { - "epoch": 0.29, - "learning_rate": 0.0002568565821271271, - "loss": 0.0183, + "epoch": 0.15, + "learning_rate": 0.0002778332784662801, + "loss": 0.0228, "step": 57010 }, { - "epoch": 0.29, - "learning_rate": 0.0002568490144341131, - "loss": 0.0169, + "epoch": 0.15, + "learning_rate": 0.0002778293902499086, + "loss": 0.0259, "step": 57020 }, { - "epoch": 0.29, - "learning_rate": 0.00025684144674109914, - "loss": 0.0273, + "epoch": 0.15, + "learning_rate": 0.00027782550203353713, + "loss": 0.0268, "step": 57030 }, { - "epoch": 0.29, - "learning_rate": 0.0002568338790480851, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.0002778216138171657, + "loss": 0.0231, "step": 57040 }, { - "epoch": 0.29, - "learning_rate": 0.0002568263113550711, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.0002778177256007942, + "loss": 0.0226, "step": 57050 }, { - "epoch": 0.29, - "learning_rate": 0.0002568187436620571, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.0002778138373844227, + "loss": 0.0271, "step": 57060 }, { - "epoch": 0.29, - "learning_rate": 0.00025681117596904307, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.0002778099491680513, + "loss": 0.025, "step": 57070 }, { - "epoch": 0.29, - "learning_rate": 0.00025680360827602905, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.0002778060609516798, + "loss": 0.0199, "step": 57080 }, { - "epoch": 0.29, - "learning_rate": 0.0002567960405830151, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.0002778021727353084, + "loss": 0.0268, "step": 57090 }, { - "epoch": 0.29, - "learning_rate": 0.00025678847289000106, - "loss": 0.0243, + "epoch": 0.15, + "learning_rate": 0.0002777982845189369, + "loss": 0.0276, "step": 57100 }, { - "epoch": 0.29, - "learning_rate": 0.00025678090519698705, - "loss": 0.0207, + "epoch": 0.15, + "learning_rate": 0.0002777943963025654, + "loss": 0.0268, "step": 57110 }, { - "epoch": 0.29, - "learning_rate": 0.00025677333750397303, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.0002777905080861939, + "loss": 0.0247, "step": 57120 }, { - "epoch": 0.29, - "learning_rate": 0.000256765769810959, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.0002777866198698225, + "loss": 0.0251, "step": 57130 }, { - "epoch": 0.29, - "learning_rate": 0.000256758202117945, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.000277782731653451, + "loss": 0.0292, "step": 57140 }, { - "epoch": 0.29, - "learning_rate": 0.000256750634424931, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.0002777788434370796, + "loss": 0.0312, "step": 57150 }, { - "epoch": 0.29, - "learning_rate": 0.000256743066731917, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.0002777749552207081, + "loss": 0.0261, "step": 57160 }, { - "epoch": 0.29, - "learning_rate": 0.000256735499038903, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027777106700433666, + "loss": 0.0274, "step": 57170 }, { - "epoch": 0.29, - "learning_rate": 0.00025672793134588897, - "loss": 0.0185, + "epoch": 0.15, + "learning_rate": 0.00027776717878796517, + "loss": 0.0243, "step": 57180 }, { - "epoch": 0.29, - "learning_rate": 0.00025672036365287495, - "loss": 0.0251, + "epoch": 0.15, + "learning_rate": 0.0002777632905715937, + "loss": 0.0315, "step": 57190 }, { - "epoch": 0.29, - "learning_rate": 0.00025671279595986093, - "loss": 0.0174, + "epoch": 0.15, + "learning_rate": 0.0002777594023552222, + "loss": 0.0331, "step": 57200 }, { - "epoch": 0.29, - "learning_rate": 0.0002567052282668469, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.00027775551413885077, + "loss": 0.028, "step": 57210 }, { - "epoch": 0.29, - "learning_rate": 0.0002566976605738329, - "loss": 0.0242, + "epoch": 0.15, + "learning_rate": 0.00027775162592247934, + "loss": 0.0277, "step": 57220 }, { - "epoch": 0.29, - "learning_rate": 0.0002566900928808189, - "loss": 0.0263, + "epoch": 0.15, + "learning_rate": 0.00027774773770610785, + "loss": 0.0275, "step": 57230 }, { - "epoch": 0.29, - "learning_rate": 0.00025668252518780486, - "loss": 0.0278, + "epoch": 0.15, + "learning_rate": 0.00027774384948973637, + "loss": 0.0303, "step": 57240 }, { - "epoch": 0.29, - "learning_rate": 0.00025667495749479084, - "loss": 0.0207, + "epoch": 0.15, + "learning_rate": 0.00027773996127336494, + "loss": 0.0311, "step": 57250 }, { - "epoch": 0.29, - "learning_rate": 0.0002566673898017769, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027773607305699345, + "loss": 0.0248, "step": 57260 }, { - "epoch": 0.29, - "learning_rate": 0.00025665982210876286, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027773218484062196, + "loss": 0.0287, "step": 57270 }, { - "epoch": 0.29, - "learning_rate": 0.00025665225441574884, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027772829662425053, + "loss": 0.0336, "step": 57280 }, { - "epoch": 0.29, - "learning_rate": 0.0002566446867227348, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.00027772440840787905, + "loss": 0.0283, "step": 57290 }, { - "epoch": 0.29, - "learning_rate": 0.0002566371190297208, - "loss": 0.0245, + "epoch": 0.15, + "learning_rate": 0.0002777205201915076, + "loss": 0.0257, "step": 57300 }, { - "epoch": 0.29, - "learning_rate": 0.0002566295513367068, - "loss": 0.0265, + "epoch": 0.15, + "learning_rate": 0.00027771663197513613, + "loss": 0.0238, "step": 57310 }, { - "epoch": 0.29, - "learning_rate": 0.0002566219836436928, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.00027771274375876465, + "loss": 0.028, "step": 57320 }, { - "epoch": 0.29, - "learning_rate": 0.0002566144159506788, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.00027770885554239316, + "loss": 0.0286, "step": 57330 }, { - "epoch": 0.29, - "learning_rate": 0.0002566068482576648, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.00027770496732602173, + "loss": 0.0318, "step": 57340 }, { - "epoch": 0.29, - "learning_rate": 0.00025659928056465076, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.00027770107910965024, + "loss": 0.0303, "step": 57350 }, { - "epoch": 0.29, - "learning_rate": 0.00025659171287163674, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.0002776971908932788, + "loss": 0.0283, "step": 57360 }, { - "epoch": 0.29, - "learning_rate": 0.0002565841451786227, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.0002776933026769073, + "loss": 0.0254, "step": 57370 }, { - "epoch": 0.29, - "learning_rate": 0.00025657657748560876, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.0002776894144605359, + "loss": 0.0278, "step": 57380 }, { - "epoch": 0.29, - "learning_rate": 0.00025656900979259474, - "loss": 0.0241, + "epoch": 0.15, + "learning_rate": 0.0002776855262441644, + "loss": 0.0253, "step": 57390 }, { - "epoch": 0.29, - "learning_rate": 0.0002565614420995807, - "loss": 0.0166, + "epoch": 0.15, + "learning_rate": 0.0002776816380277929, + "loss": 0.03, "step": 57400 }, { - "epoch": 0.29, - "learning_rate": 0.0002565538744065667, - "loss": 0.0163, + "epoch": 0.15, + "learning_rate": 0.0002776777498114215, + "loss": 0.0273, "step": 57410 }, { - "epoch": 0.29, - "learning_rate": 0.0002565463067135527, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.00027767386159505, + "loss": 0.0253, "step": 57420 }, { - "epoch": 0.29, - "learning_rate": 0.00025653873902053867, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.0002776699733786786, + "loss": 0.0267, "step": 57430 }, { - "epoch": 0.29, - "learning_rate": 0.00025653117132752465, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002776660851623071, + "loss": 0.0416, "step": 57440 }, { - "epoch": 0.29, - "learning_rate": 0.0002565236036345107, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.0002776621969459356, + "loss": 0.0365, "step": 57450 }, { - "epoch": 0.29, - "learning_rate": 0.00025651603594149667, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.0002776583087295642, + "loss": 0.0286, "step": 57460 }, { - "epoch": 0.29, - "learning_rate": 0.00025650846824848265, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.0002776544205131927, + "loss": 0.0269, "step": 57470 }, { - "epoch": 0.29, - "learning_rate": 0.00025650090055546863, - "loss": 0.0219, + "epoch": 0.15, + "learning_rate": 0.0002776505322968212, + "loss": 0.0345, "step": 57480 }, { - "epoch": 0.29, - "learning_rate": 0.0002564933328624546, - "loss": 0.0249, + "epoch": 0.15, + "learning_rate": 0.00027764664408044977, + "loss": 0.0265, "step": 57490 }, { - "epoch": 0.29, - "learning_rate": 0.0002564857651694406, - "loss": 0.0168, + "epoch": 0.15, + "learning_rate": 0.00027764275586407834, + "loss": 0.0281, "step": 57500 }, { - "epoch": 0.29, - "learning_rate": 0.00025647819747642663, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.00027763886764770686, + "loss": 0.0258, "step": 57510 }, { - "epoch": 0.29, - "learning_rate": 0.0002564706297834126, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027763497943133537, + "loss": 0.0558, "step": 57520 }, { - "epoch": 0.29, - "learning_rate": 0.0002564630620903986, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.0002776310912149639, + "loss": 0.0267, "step": 57530 }, { - "epoch": 0.29, - "learning_rate": 0.0002564554943973846, - "loss": 0.0201, + "epoch": 0.15, + "learning_rate": 0.00027762720299859245, + "loss": 0.0245, "step": 57540 }, { - "epoch": 0.29, - "learning_rate": 0.00025644792670437056, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027762331478222097, + "loss": 0.0244, "step": 57550 }, { - "epoch": 0.29, - "learning_rate": 0.00025644035901135654, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.00027761942656584954, + "loss": 0.0315, "step": 57560 }, { - "epoch": 0.29, - "learning_rate": 0.00025643279131834257, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.00027761553834947805, + "loss": 0.0246, "step": 57570 }, { - "epoch": 0.29, - "learning_rate": 0.00025642522362532855, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.00027761165013310657, + "loss": 0.0295, "step": 57580 }, { - "epoch": 0.29, - "learning_rate": 0.00025641765593231454, - "loss": 0.0191, + "epoch": 0.15, + "learning_rate": 0.00027760776191673513, + "loss": 0.0295, "step": 57590 }, { - "epoch": 0.29, - "learning_rate": 0.0002564100882393005, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.00027760387370036365, + "loss": 0.0249, "step": 57600 }, { - "epoch": 0.29, - "learning_rate": 0.0002564025205462865, - "loss": 0.0176, + "epoch": 0.15, + "learning_rate": 0.00027759998548399216, + "loss": 0.0266, "step": 57610 }, { - "epoch": 0.29, - "learning_rate": 0.0002563949528532725, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027759609726762073, + "loss": 0.0261, "step": 57620 }, { - "epoch": 0.29, - "learning_rate": 0.00025638738516025846, - "loss": 0.0181, + "epoch": 0.15, + "learning_rate": 0.00027759220905124925, + "loss": 0.0277, "step": 57630 }, { - "epoch": 0.29, - "learning_rate": 0.0002563798174672445, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.0002775883208348778, + "loss": 0.0275, "step": 57640 }, { - "epoch": 0.29, - "learning_rate": 0.0002563722497742305, - "loss": 0.0235, + "epoch": 0.15, + "learning_rate": 0.00027758443261850633, + "loss": 0.0242, "step": 57650 }, { - "epoch": 0.29, - "learning_rate": 0.00025636468208121646, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027758054440213484, + "loss": 0.0286, "step": 57660 }, { - "epoch": 0.29, - "learning_rate": 0.00025635711438820244, - "loss": 0.017, + "epoch": 0.15, + "learning_rate": 0.0002775766561857634, + "loss": 0.0274, "step": 57670 }, { - "epoch": 0.29, - "learning_rate": 0.0002563495466951884, - "loss": 0.0178, + "epoch": 0.15, + "learning_rate": 0.00027757276796939193, + "loss": 0.0266, "step": 57680 }, { - "epoch": 0.29, - "learning_rate": 0.0002563419790021744, - "loss": 0.0167, + "epoch": 0.15, + "learning_rate": 0.00027756887975302044, + "loss": 0.0261, "step": 57690 }, { - "epoch": 0.29, - "learning_rate": 0.00025633441130916044, - "loss": 0.017, + "epoch": 0.15, + "learning_rate": 0.000277564991536649, + "loss": 0.0243, "step": 57700 }, { - "epoch": 0.29, - "learning_rate": 0.0002563268436161464, - "loss": 0.0176, + "epoch": 0.15, + "learning_rate": 0.0002775611033202776, + "loss": 0.0273, "step": 57710 }, { - "epoch": 0.29, - "learning_rate": 0.0002563192759231324, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.0002775572151039061, + "loss": 0.0258, "step": 57720 }, { - "epoch": 0.29, - "learning_rate": 0.0002563117082301184, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.0002775533268875346, + "loss": 0.0257, "step": 57730 }, { - "epoch": 0.29, - "learning_rate": 0.00025630414053710437, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.0002775494386711631, + "loss": 0.0265, "step": 57740 }, { - "epoch": 0.29, - "learning_rate": 0.00025629657284409035, - "loss": 0.0136, + "epoch": 0.15, + "learning_rate": 0.0002775455504547917, + "loss": 0.0281, "step": 57750 }, { - "epoch": 0.29, - "learning_rate": 0.00025628900515107633, - "loss": 0.0175, + "epoch": 0.15, + "learning_rate": 0.0002775416622384202, + "loss": 0.0263, "step": 57760 }, { - "epoch": 0.29, - "learning_rate": 0.00025628143745806236, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002775377740220488, + "loss": 0.0285, "step": 57770 }, { - "epoch": 0.29, - "learning_rate": 0.00025627386976504835, - "loss": 0.0175, + "epoch": 0.15, + "learning_rate": 0.0002775338858056773, + "loss": 0.0228, "step": 57780 }, { - "epoch": 0.29, - "learning_rate": 0.0002562663020720343, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.00027752999758930586, + "loss": 0.0251, "step": 57790 }, { - "epoch": 0.29, - "learning_rate": 0.0002562587343790203, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.0002775261093729344, + "loss": 0.0255, "step": 57800 }, { - "epoch": 0.29, - "learning_rate": 0.0002562511666860063, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.0002775222211565629, + "loss": 0.0277, "step": 57810 }, { - "epoch": 0.29, - "learning_rate": 0.00025624359899299227, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.0002775183329401914, + "loss": 0.0368, "step": 57820 }, { - "epoch": 0.29, - "learning_rate": 0.0002562360312999783, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.00027751444472381997, + "loss": 0.0335, "step": 57830 }, { - "epoch": 0.29, - "learning_rate": 0.0002562284636069643, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002775105565074485, + "loss": 0.0301, "step": 57840 }, { - "epoch": 0.29, - "learning_rate": 0.00025622089591395027, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027750666829107705, + "loss": 0.0249, "step": 57850 }, { - "epoch": 0.29, - "learning_rate": 0.00025621332822093625, - "loss": 0.017, + "epoch": 0.15, + "learning_rate": 0.00027750278007470557, + "loss": 0.0249, "step": 57860 }, { - "epoch": 0.29, - "learning_rate": 0.00025620576052792223, - "loss": 0.0177, + "epoch": 0.15, + "learning_rate": 0.0002774988918583341, + "loss": 0.0253, "step": 57870 }, { - "epoch": 0.29, - "learning_rate": 0.0002561981928349082, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027749500364196265, + "loss": 0.0253, "step": 57880 }, { - "epoch": 0.29, - "learning_rate": 0.00025619062514189425, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027749111542559117, + "loss": 0.0274, "step": 57890 }, { - "epoch": 0.29, - "learning_rate": 0.00025618305744888023, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.00027748722720921974, + "loss": 0.0368, "step": 57900 }, { - "epoch": 0.29, - "learning_rate": 0.0002561754897558662, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.00027748333899284825, + "loss": 0.0268, "step": 57910 }, { - "epoch": 0.29, - "learning_rate": 0.0002561679220628522, - "loss": 0.0172, + "epoch": 0.15, + "learning_rate": 0.0002774794507764768, + "loss": 0.0258, "step": 57920 }, { - "epoch": 0.29, - "learning_rate": 0.0002561603543698382, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.00027747556256010533, + "loss": 0.0239, "step": 57930 }, { - "epoch": 0.29, - "learning_rate": 0.00025615278667682416, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.00027747167434373385, + "loss": 0.0275, "step": 57940 }, { - "epoch": 0.29, - "learning_rate": 0.00025614521898381014, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.00027746778612736236, + "loss": 0.0253, "step": 57950 }, { - "epoch": 0.29, - "learning_rate": 0.0002561376512907962, - "loss": 0.0268, + "epoch": 0.15, + "learning_rate": 0.00027746389791099093, + "loss": 0.026, "step": 57960 }, { - "epoch": 0.29, - "learning_rate": 0.00025613008359778216, - "loss": 0.0231, + "epoch": 0.15, + "learning_rate": 0.00027746000969461945, + "loss": 0.0269, "step": 57970 }, { - "epoch": 0.29, - "learning_rate": 0.00025612251590476814, - "loss": 0.0186, + "epoch": 0.15, + "learning_rate": 0.000277456121478248, + "loss": 0.0267, "step": 57980 }, { - "epoch": 0.29, - "learning_rate": 0.0002561149482117541, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.00027745223326187653, + "loss": 0.0265, "step": 57990 }, { - "epoch": 0.29, - "learning_rate": 0.0002561073805187401, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.0002774483450455051, + "loss": 0.0277, "step": 58000 }, { - "epoch": 0.29, - "eval_cer": 0.914472196695413, - "eval_loss": 0.014296288602054119, - "eval_runtime": 116.695, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.15, + "eval_cer": 0.881845449290454, + "eval_loss": 0.01981378346681595, + "eval_runtime": 107.9556, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.632, "step": 58000 }, { - "epoch": 0.29, - "learning_rate": 0.0002560998128257261, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.0002774444568291336, + "loss": 0.0355, "step": 58010 }, { - "epoch": 0.29, - "learning_rate": 0.0002560922451327121, - "loss": 0.0204, + "epoch": 0.15, + "learning_rate": 0.0002774405686127621, + "loss": 0.028, "step": 58020 }, { - "epoch": 0.29, - "learning_rate": 0.0002560846774396981, - "loss": 0.015, + "epoch": 0.15, + "learning_rate": 0.00027743668039639064, + "loss": 0.0293, "step": 58030 }, { - "epoch": 0.29, - "learning_rate": 0.0002560771097466841, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002774327921800192, + "loss": 0.0288, "step": 58040 }, { - "epoch": 0.29, - "learning_rate": 0.00025606954205367006, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.0002774289039636478, + "loss": 0.0322, "step": 58050 }, { - "epoch": 0.29, - "learning_rate": 0.00025606197436065604, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.0002774250157472763, + "loss": 0.023, "step": 58060 }, { - "epoch": 0.29, - "learning_rate": 0.000256054406667642, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.0002774211275309048, + "loss": 0.0285, "step": 58070 }, { - "epoch": 0.29, - "learning_rate": 0.00025604683897462806, - "loss": 0.0193, + "epoch": 0.15, + "learning_rate": 0.0002774172393145333, + "loss": 0.031, "step": 58080 }, { - "epoch": 0.29, - "learning_rate": 0.00025603927128161404, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.0002774133510981619, + "loss": 0.0254, "step": 58090 }, { - "epoch": 0.29, - "learning_rate": 0.0002560317035886, - "loss": 0.0174, + "epoch": 0.15, + "learning_rate": 0.0002774094628817904, + "loss": 0.0268, "step": 58100 }, { - "epoch": 0.29, - "learning_rate": 0.000256024135895586, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.000277405574665419, + "loss": 0.0285, "step": 58110 }, { - "epoch": 0.29, - "learning_rate": 0.000256016568202572, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.0002774016864490475, + "loss": 0.0243, "step": 58120 }, { - "epoch": 0.29, - "learning_rate": 0.00025600900050955797, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.00027739779823267606, + "loss": 0.025, "step": 58130 }, { - "epoch": 0.29, - "learning_rate": 0.00025600143281654395, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027739391001630457, + "loss": 0.024, "step": 58140 }, { - "epoch": 0.29, - "learning_rate": 0.00025599386512353, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.0002773900217999331, + "loss": 0.0292, "step": 58150 }, { - "epoch": 0.29, - "learning_rate": 0.00025598629743051597, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.0002773861335835616, + "loss": 0.0305, "step": 58160 }, { - "epoch": 0.29, - "learning_rate": 0.00025597872973750195, - "loss": 0.0255, + "epoch": 0.15, + "learning_rate": 0.00027738224536719017, + "loss": 0.0285, "step": 58170 }, { - "epoch": 0.29, - "learning_rate": 0.00025597116204448793, - "loss": 0.0201, + "epoch": 0.15, + "learning_rate": 0.0002773783571508187, + "loss": 0.0235, "step": 58180 }, { - "epoch": 0.29, - "learning_rate": 0.0002559635943514739, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.00027737446893444725, + "loss": 0.0289, "step": 58190 }, { - "epoch": 0.29, - "learning_rate": 0.0002559560266584599, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.00027737058071807577, + "loss": 0.0297, "step": 58200 }, { - "epoch": 0.29, - "learning_rate": 0.0002559484589654459, - "loss": 0.0221, + "epoch": 0.15, + "learning_rate": 0.00027736669250170434, + "loss": 0.0265, "step": 58210 }, { - "epoch": 0.29, - "learning_rate": 0.0002559408912724319, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027736280428533285, + "loss": 0.0344, "step": 58220 }, { - "epoch": 0.29, - "learning_rate": 0.0002559333235794179, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.00027735891606896137, + "loss": 0.0283, "step": 58230 }, { - "epoch": 0.29, - "learning_rate": 0.00025592575588640387, - "loss": 0.0174, + "epoch": 0.15, + "learning_rate": 0.0002773550278525899, + "loss": 0.0264, "step": 58240 }, { - "epoch": 0.29, - "learning_rate": 0.00025591818819338985, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.00027735113963621845, + "loss": 0.0321, "step": 58250 }, { - "epoch": 0.29, - "learning_rate": 0.00025591062050037583, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.000277347251419847, + "loss": 0.0273, "step": 58260 }, { - "epoch": 0.29, - "learning_rate": 0.0002559030528073618, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.00027734336320347553, + "loss": 0.0232, "step": 58270 }, { - "epoch": 0.29, - "learning_rate": 0.00025589548511434785, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.00027733947498710405, + "loss": 0.0315, "step": 58280 }, { - "epoch": 0.29, - "learning_rate": 0.00025588791742133383, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.0002773355867707326, + "loss": 0.0298, "step": 58290 }, { - "epoch": 0.29, - "learning_rate": 0.0002558803497283198, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.00027733169855436113, + "loss": 0.0253, "step": 58300 }, { - "epoch": 0.29, - "learning_rate": 0.0002558727820353058, - "loss": 0.0201, + "epoch": 0.15, + "learning_rate": 0.00027732781033798964, + "loss": 0.0244, "step": 58310 }, { - "epoch": 0.29, - "learning_rate": 0.0002558652143422918, - "loss": 0.0253, + "epoch": 0.15, + "learning_rate": 0.0002773239221216182, + "loss": 0.022, "step": 58320 }, { - "epoch": 0.29, - "learning_rate": 0.00025585764664927776, - "loss": 0.018, + "epoch": 0.15, + "learning_rate": 0.00027732003390524673, + "loss": 0.0304, "step": 58330 }, { - "epoch": 0.29, - "learning_rate": 0.0002558500789562638, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002773161456888753, + "loss": 0.025, "step": 58340 }, { - "epoch": 0.29, - "learning_rate": 0.0002558425112632498, - "loss": 0.0159, + "epoch": 0.15, + "learning_rate": 0.0002773122574725038, + "loss": 0.0272, "step": 58350 }, { - "epoch": 0.29, - "learning_rate": 0.00025583494357023576, - "loss": 0.0183, + "epoch": 0.15, + "learning_rate": 0.0002773083692561323, + "loss": 0.0251, "step": 58360 }, { - "epoch": 0.29, - "learning_rate": 0.00025582737587722174, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.00027730448103976084, + "loss": 0.0292, "step": 58370 }, { - "epoch": 0.29, - "learning_rate": 0.0002558198081842077, - "loss": 0.018, + "epoch": 0.15, + "learning_rate": 0.0002773005928233894, + "loss": 0.0281, "step": 58380 }, { - "epoch": 0.29, - "learning_rate": 0.0002558122404911937, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.0002772967046070179, + "loss": 0.0314, "step": 58390 }, { - "epoch": 0.29, - "learning_rate": 0.00025580467279817974, - "loss": 0.0199, + "epoch": 0.15, + "learning_rate": 0.0002772928163906465, + "loss": 0.0265, "step": 58400 }, { - "epoch": 0.29, - "learning_rate": 0.0002557971051051657, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.000277288928174275, + "loss": 0.0289, "step": 58410 }, { - "epoch": 0.29, - "learning_rate": 0.0002557895374121517, - "loss": 0.0298, + "epoch": 0.15, + "learning_rate": 0.0002772850399579036, + "loss": 0.0273, "step": 58420 }, { - "epoch": 0.29, - "learning_rate": 0.0002557819697191377, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.0002772811517415321, + "loss": 0.0215, "step": 58430 }, { - "epoch": 0.29, - "learning_rate": 0.00025577440202612366, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.0002772772635251606, + "loss": 0.0237, "step": 58440 }, { - "epoch": 0.29, - "learning_rate": 0.00025576683433310964, - "loss": 0.0182, + "epoch": 0.15, + "learning_rate": 0.0002772733753087892, + "loss": 0.0271, "step": 58450 }, { - "epoch": 0.29, - "learning_rate": 0.0002557592666400956, - "loss": 0.0166, + "epoch": 0.15, + "learning_rate": 0.0002772694870924177, + "loss": 0.0295, "step": 58460 }, { - "epoch": 0.29, - "learning_rate": 0.0002557516989470816, - "loss": 0.0229, + "epoch": 0.15, + "learning_rate": 0.00027726559887604626, + "loss": 0.0223, "step": 58470 }, { - "epoch": 0.3, - "learning_rate": 0.0002557441312540676, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027726171065967477, + "loss": 0.0261, "step": 58480 }, { - "epoch": 0.3, - "learning_rate": 0.00025573656356105357, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.0002772578224433033, + "loss": 0.0266, "step": 58490 }, { - "epoch": 0.3, - "learning_rate": 0.00025572899586803955, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.00027725393422693185, + "loss": 0.0265, "step": 58500 }, { - "epoch": 0.3, - "learning_rate": 0.0002557214281750256, - "loss": 0.0191, + "epoch": 0.15, + "learning_rate": 0.00027725004601056037, + "loss": 0.0318, "step": 58510 }, { - "epoch": 0.3, - "learning_rate": 0.00025571386048201157, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.0002772461577941889, + "loss": 0.0267, "step": 58520 }, { - "epoch": 0.3, - "learning_rate": 0.00025570629278899755, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.00027724226957781745, + "loss": 0.027, "step": 58530 }, { - "epoch": 0.3, - "learning_rate": 0.00025569872509598353, - "loss": 0.0174, + "epoch": 0.15, + "learning_rate": 0.00027723838136144597, + "loss": 0.0265, "step": 58540 }, { - "epoch": 0.3, - "learning_rate": 0.0002556911574029695, - "loss": 0.0252, + "epoch": 0.15, + "learning_rate": 0.00027723449314507454, + "loss": 0.0267, "step": 58550 }, { - "epoch": 0.3, - "learning_rate": 0.0002556835897099555, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027723060492870305, + "loss": 0.0196, "step": 58560 }, { - "epoch": 0.3, - "learning_rate": 0.00025567602201694153, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.00027722671671233156, + "loss": 0.0299, "step": 58570 }, { - "epoch": 0.3, - "learning_rate": 0.0002556684543239275, - "loss": 0.018, + "epoch": 0.15, + "learning_rate": 0.0002772228284959601, + "loss": 0.0221, "step": 58580 }, { - "epoch": 0.3, - "learning_rate": 0.0002556608866309135, - "loss": 0.0187, + "epoch": 0.15, + "learning_rate": 0.00027721894027958865, + "loss": 0.0315, "step": 58590 }, { - "epoch": 0.3, - "learning_rate": 0.0002556533189378995, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.0002772150520632172, + "loss": 0.0251, "step": 58600 }, { - "epoch": 0.3, - "learning_rate": 0.00025564575124488546, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027721116384684573, + "loss": 0.0281, "step": 58610 }, { - "epoch": 0.3, - "learning_rate": 0.00025563818355187144, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.00027720727563047425, + "loss": 0.0292, "step": 58620 }, { - "epoch": 0.3, - "learning_rate": 0.00025563061585885747, - "loss": 0.0226, + "epoch": 0.15, + "learning_rate": 0.0002772033874141028, + "loss": 0.0258, "step": 58630 }, { - "epoch": 0.3, - "learning_rate": 0.00025562304816584345, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027719949919773133, + "loss": 0.0275, "step": 58640 }, { - "epoch": 0.3, - "learning_rate": 0.00025561548047282944, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027719561098135984, + "loss": 0.0281, "step": 58650 }, { - "epoch": 0.3, - "learning_rate": 0.0002556079127798154, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.0002771917227649884, + "loss": 0.0288, "step": 58660 }, { - "epoch": 0.3, - "learning_rate": 0.0002556003450868014, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002771878345486169, + "loss": 0.0264, "step": 58670 }, { - "epoch": 0.3, - "learning_rate": 0.0002555927773937874, - "loss": 0.0227, + "epoch": 0.15, + "learning_rate": 0.0002771839463322455, + "loss": 0.0291, "step": 58680 }, { - "epoch": 0.3, - "learning_rate": 0.00025558520970077336, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.000277180058115874, + "loss": 0.0261, "step": 58690 }, { - "epoch": 0.3, - "learning_rate": 0.0002555776420077594, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.0002771761698995025, + "loss": 0.0267, "step": 58700 }, { - "epoch": 0.3, - "learning_rate": 0.0002555700743147454, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.0002771722816831311, + "loss": 0.0273, "step": 58710 }, { - "epoch": 0.3, - "learning_rate": 0.00025556250662173136, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.0002771683934667596, + "loss": 0.0261, "step": 58720 }, { - "epoch": 0.3, - "learning_rate": 0.00025555493892871734, - "loss": 0.0195, + "epoch": 0.15, + "learning_rate": 0.0002771645052503881, + "loss": 0.0251, "step": 58730 }, { - "epoch": 0.3, - "learning_rate": 0.0002555473712357033, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002771606170340167, + "loss": 0.0278, "step": 58740 }, { - "epoch": 0.3, - "learning_rate": 0.0002555398035426893, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.00027715672881764526, + "loss": 0.0247, "step": 58750 }, { - "epoch": 0.3, - "learning_rate": 0.00025553223584967534, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.0002771528406012738, + "loss": 0.0295, "step": 58760 }, { - "epoch": 0.3, - "learning_rate": 0.0002555246681566613, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.0002771489523849023, + "loss": 0.0252, "step": 58770 }, { - "epoch": 0.3, - "learning_rate": 0.0002555171004636473, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.0002771450641685308, + "loss": 0.0308, "step": 58780 }, { - "epoch": 0.3, - "learning_rate": 0.0002555095327706333, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027714117595215937, + "loss": 0.0279, "step": 58790 }, { - "epoch": 0.3, - "learning_rate": 0.00025550196507761927, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.0002771372877357879, + "loss": 0.0316, "step": 58800 }, { - "epoch": 0.3, - "learning_rate": 0.00025549439738460525, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.00027713339951941646, + "loss": 0.0331, "step": 58810 }, { - "epoch": 0.3, - "learning_rate": 0.00025548682969159123, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.00027712951130304497, + "loss": 0.0241, "step": 58820 }, { - "epoch": 0.3, - "learning_rate": 0.00025547926199857726, - "loss": 0.0188, + "epoch": 0.15, + "learning_rate": 0.0002771256230866735, + "loss": 0.0315, "step": 58830 }, { - "epoch": 0.3, - "learning_rate": 0.00025547169430556325, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.00027712173487030205, + "loss": 0.0278, "step": 58840 }, { - "epoch": 0.3, - "learning_rate": 0.0002554641266125492, - "loss": 0.0244, + "epoch": 0.15, + "learning_rate": 0.00027711784665393057, + "loss": 0.0322, "step": 58850 }, { - "epoch": 0.3, - "learning_rate": 0.0002554565589195352, - "loss": 0.053, + "epoch": 0.15, + "learning_rate": 0.0002771139584375591, + "loss": 0.0269, "step": 58860 }, { - "epoch": 0.3, - "learning_rate": 0.0002554489912265212, - "loss": 0.0232, + "epoch": 0.15, + "learning_rate": 0.00027711007022118765, + "loss": 0.0257, "step": 58870 }, { - "epoch": 0.3, - "learning_rate": 0.00025544142353350717, - "loss": 0.0183, + "epoch": 0.15, + "learning_rate": 0.00027710618200481617, + "loss": 0.0303, "step": 58880 }, { - "epoch": 0.3, - "learning_rate": 0.0002554338558404932, - "loss": 0.0426, + "epoch": 0.15, + "learning_rate": 0.00027710229378844473, + "loss": 0.0245, "step": 58890 }, { - "epoch": 0.3, - "learning_rate": 0.0002554262881474792, - "loss": 0.0177, + "epoch": 0.15, + "learning_rate": 0.00027709840557207325, + "loss": 0.0301, "step": 58900 }, { - "epoch": 0.3, - "learning_rate": 0.00025541872045446517, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.00027709451735570176, + "loss": 0.0221, "step": 58910 }, { - "epoch": 0.3, - "learning_rate": 0.00025541115276145115, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.00027709062913933033, + "loss": 0.0262, "step": 58920 }, { - "epoch": 0.3, - "learning_rate": 0.00025540358506843713, - "loss": 0.0236, + "epoch": 0.15, + "learning_rate": 0.00027708674092295885, + "loss": 0.0275, "step": 58930 }, { - "epoch": 0.3, - "learning_rate": 0.0002553960173754231, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.00027708285270658736, + "loss": 0.0291, "step": 58940 }, { - "epoch": 0.3, - "learning_rate": 0.00025538844968240915, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.00027707896449021593, + "loss": 0.031, "step": 58950 }, { - "epoch": 0.3, - "learning_rate": 0.00025538088198939513, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.0002770750762738445, + "loss": 0.0265, "step": 58960 }, { - "epoch": 0.3, - "learning_rate": 0.0002553733142963811, - "loss": 0.0185, + "epoch": 0.15, + "learning_rate": 0.000277071188057473, + "loss": 0.0246, "step": 58970 }, { - "epoch": 0.3, - "learning_rate": 0.0002553657466033671, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.00027706729984110153, + "loss": 0.0278, "step": 58980 }, { - "epoch": 0.3, - "learning_rate": 0.0002553581789103531, - "loss": 0.0176, + "epoch": 0.15, + "learning_rate": 0.00027706341162473004, + "loss": 0.031, "step": 58990 }, { - "epoch": 0.3, - "learning_rate": 0.00025535061121733906, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.0002770595234083586, + "loss": 0.0268, "step": 59000 }, { - "epoch": 0.3, - "eval_cer": 0.9144916046179211, - "eval_loss": 0.014513496309518814, - "eval_runtime": 116.7004, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.284, + "epoch": 0.15, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.0200749970972538, + "eval_runtime": 108.3189, + "eval_samples_per_second": 18.464, + "eval_steps_per_second": 4.616, "step": 59000 }, { - "epoch": 0.3, - "learning_rate": 0.00025534304352432504, - "loss": 0.024, + "epoch": 0.15, + "learning_rate": 0.0002770556351919871, + "loss": 0.0253, "step": 59010 }, { - "epoch": 0.3, - "learning_rate": 0.0002553354758313111, - "loss": 0.0185, + "epoch": 0.15, + "learning_rate": 0.0002770517469756157, + "loss": 0.0222, "step": 59020 }, { - "epoch": 0.3, - "learning_rate": 0.00025532790813829706, - "loss": 0.0185, + "epoch": 0.15, + "learning_rate": 0.0002770478587592442, + "loss": 0.0317, "step": 59030 }, { - "epoch": 0.3, - "learning_rate": 0.00025532034044528304, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002770439705428728, + "loss": 0.0278, "step": 59040 }, { - "epoch": 0.3, - "learning_rate": 0.000255312772752269, - "loss": 0.0171, + "epoch": 0.15, + "learning_rate": 0.0002770400823265013, + "loss": 0.027, "step": 59050 }, { - "epoch": 0.3, - "learning_rate": 0.000255305205059255, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002770361941101298, + "loss": 0.0349, "step": 59060 }, { - "epoch": 0.3, - "learning_rate": 0.000255297637366241, - "loss": 0.0191, + "epoch": 0.15, + "learning_rate": 0.0002770323058937583, + "loss": 0.0242, "step": 59070 }, { - "epoch": 0.3, - "learning_rate": 0.000255290069673227, - "loss": 0.0181, + "epoch": 0.15, + "learning_rate": 0.0002770284176773869, + "loss": 0.0218, "step": 59080 }, { - "epoch": 0.3, - "learning_rate": 0.000255282501980213, - "loss": 0.019, + "epoch": 0.15, + "learning_rate": 0.00027702452946101546, + "loss": 0.0219, "step": 59090 }, { - "epoch": 0.3, - "learning_rate": 0.000255274934287199, - "loss": 0.0217, + "epoch": 0.15, + "learning_rate": 0.000277020641244644, + "loss": 0.0258, "step": 59100 }, { - "epoch": 0.3, - "learning_rate": 0.00025526736659418496, - "loss": 0.0169, + "epoch": 0.15, + "learning_rate": 0.0002770167530282725, + "loss": 0.03, "step": 59110 }, { - "epoch": 0.3, - "learning_rate": 0.00025525979890117094, - "loss": 0.0203, + "epoch": 0.15, + "learning_rate": 0.000277012864811901, + "loss": 0.0311, "step": 59120 }, { - "epoch": 0.3, - "learning_rate": 0.0002552522312081569, - "loss": 0.0228, + "epoch": 0.15, + "learning_rate": 0.00027700897659552957, + "loss": 0.0279, "step": 59130 }, { - "epoch": 0.3, - "learning_rate": 0.00025524466351514296, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.0002770050883791581, + "loss": 0.0255, "step": 59140 }, { - "epoch": 0.3, - "learning_rate": 0.00025523709582212894, - "loss": 0.025, + "epoch": 0.15, + "learning_rate": 0.00027700120016278665, + "loss": 0.0285, "step": 59150 }, { - "epoch": 0.3, - "learning_rate": 0.0002552295281291149, - "loss": 0.0197, + "epoch": 0.15, + "learning_rate": 0.00027699731194641517, + "loss": 0.0235, "step": 59160 }, { - "epoch": 0.3, - "learning_rate": 0.0002552219604361009, - "loss": 0.0191, + "epoch": 0.15, + "learning_rate": 0.00027699342373004374, + "loss": 0.0264, "step": 59170 }, { - "epoch": 0.3, - "learning_rate": 0.0002552143927430869, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.00027698953551367225, + "loss": 0.035, "step": 59180 }, { - "epoch": 0.3, - "learning_rate": 0.00025520682505007287, - "loss": 0.0202, + "epoch": 0.15, + "learning_rate": 0.00027698564729730077, + "loss": 0.0274, "step": 59190 }, { - "epoch": 0.3, - "learning_rate": 0.00025519925735705885, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.0002769817590809293, + "loss": 0.0267, "step": 59200 }, { - "epoch": 0.3, - "learning_rate": 0.0002551916896640449, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.00027697787086455785, + "loss": 0.0358, "step": 59210 }, { - "epoch": 0.3, - "learning_rate": 0.00025518412197103087, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.00027697398264818636, + "loss": 0.0288, "step": 59220 }, { - "epoch": 0.3, - "learning_rate": 0.00025517655427801685, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.00027697009443181493, + "loss": 0.0429, "step": 59230 }, { - "epoch": 0.3, - "learning_rate": 0.00025516898658500283, - "loss": 0.0189, + "epoch": 0.15, + "learning_rate": 0.00027696620621544345, + "loss": 0.026, "step": 59240 }, { - "epoch": 0.3, - "learning_rate": 0.0002551614188919888, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.000276962317999072, + "loss": 0.0264, "step": 59250 }, { - "epoch": 0.3, - "learning_rate": 0.0002551538511989748, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.00027695842978270053, + "loss": 0.0238, "step": 59260 }, { - "epoch": 0.3, - "learning_rate": 0.0002551462835059608, - "loss": 0.0212, + "epoch": 0.15, + "learning_rate": 0.00027695454156632905, + "loss": 0.0304, "step": 59270 }, { - "epoch": 0.3, - "learning_rate": 0.0002551387158129468, - "loss": 0.0223, + "epoch": 0.15, + "learning_rate": 0.00027695065334995756, + "loss": 0.0257, "step": 59280 }, { - "epoch": 0.3, - "learning_rate": 0.0002551311481199328, - "loss": 0.0205, + "epoch": 0.15, + "learning_rate": 0.00027694676513358613, + "loss": 0.0252, "step": 59290 }, { - "epoch": 0.3, - "learning_rate": 0.00025512358042691877, - "loss": 0.0179, + "epoch": 0.15, + "learning_rate": 0.0002769428769172147, + "loss": 0.0239, "step": 59300 }, { - "epoch": 0.3, - "learning_rate": 0.00025511601273390475, - "loss": 0.0182, + "epoch": 0.15, + "learning_rate": 0.0002769389887008432, + "loss": 0.0357, "step": 59310 }, { - "epoch": 0.3, - "learning_rate": 0.00025510844504089073, - "loss": 0.0184, + "epoch": 0.15, + "learning_rate": 0.0002769351004844717, + "loss": 0.0269, "step": 59320 }, { - "epoch": 0.3, - "learning_rate": 0.0002551008773478767, - "loss": 0.0181, + "epoch": 0.15, + "learning_rate": 0.00027693121226810024, + "loss": 0.028, "step": 59330 }, { - "epoch": 0.3, - "learning_rate": 0.00025509330965486275, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.0002769273240517288, + "loss": 0.0247, "step": 59340 }, { - "epoch": 0.3, - "learning_rate": 0.00025508574196184873, - "loss": 0.0164, + "epoch": 0.15, + "learning_rate": 0.0002769234358353573, + "loss": 0.0244, "step": 59350 }, { - "epoch": 0.3, - "learning_rate": 0.0002550781742688347, - "loss": 0.0216, + "epoch": 0.15, + "learning_rate": 0.0002769195476189859, + "loss": 0.0275, "step": 59360 }, { - "epoch": 0.3, - "learning_rate": 0.0002550706065758207, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002769156594026144, + "loss": 0.027, "step": 59370 }, { - "epoch": 0.3, - "learning_rate": 0.0002550630388828067, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.000276911771186243, + "loss": 0.0288, "step": 59380 }, { - "epoch": 0.3, - "learning_rate": 0.00025505547118979266, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.0002769078829698715, + "loss": 0.0224, "step": 59390 }, { - "epoch": 0.3, - "learning_rate": 0.0002550479034967787, - "loss": 0.0233, + "epoch": 0.15, + "learning_rate": 0.0002769039947535, + "loss": 0.0296, "step": 59400 }, { - "epoch": 0.3, - "learning_rate": 0.0002550403358037647, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002769001065371285, + "loss": 0.0206, "step": 59410 }, { - "epoch": 0.3, - "learning_rate": 0.00025503276811075066, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.0002768962183207571, + "loss": 0.0241, "step": 59420 }, { - "epoch": 0.3, - "learning_rate": 0.00025502520041773664, - "loss": 0.0208, + "epoch": 0.15, + "learning_rate": 0.0002768923301043856, + "loss": 0.0233, "step": 59430 }, { - "epoch": 0.3, - "learning_rate": 0.0002550176327247226, - "loss": 0.0222, + "epoch": 0.15, + "learning_rate": 0.00027688844188801417, + "loss": 0.0301, "step": 59440 }, { - "epoch": 0.3, - "learning_rate": 0.0002550100650317086, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002768845536716427, + "loss": 0.0383, "step": 59450 }, { - "epoch": 0.3, - "learning_rate": 0.00025500249733869464, - "loss": 0.0329, + "epoch": 0.15, + "learning_rate": 0.00027688066545527126, + "loss": 0.0316, "step": 59460 }, { - "epoch": 0.3, - "learning_rate": 0.0002549949296456806, - "loss": 0.0242, + "epoch": 0.15, + "learning_rate": 0.00027687677723889977, + "loss": 0.0251, "step": 59470 }, { - "epoch": 0.3, - "learning_rate": 0.0002549873619526666, - "loss": 0.0266, + "epoch": 0.15, + "learning_rate": 0.0002768728890225283, + "loss": 0.0253, "step": 59480 }, { - "epoch": 0.3, - "learning_rate": 0.0002549797942596526, - "loss": 0.0795, + "epoch": 0.15, + "learning_rate": 0.00027686900080615685, + "loss": 0.0246, "step": 59490 }, { - "epoch": 0.3, - "learning_rate": 0.00025497222656663856, - "loss": 0.0277, + "epoch": 0.15, + "learning_rate": 0.00027686511258978537, + "loss": 0.0247, "step": 59500 }, { - "epoch": 0.3, - "learning_rate": 0.00025496465887362454, - "loss": 0.02, + "epoch": 0.15, + "learning_rate": 0.00027686122437341394, + "loss": 0.0303, "step": 59510 }, { - "epoch": 0.3, - "learning_rate": 0.0002549570911806105, - "loss": 0.0209, + "epoch": 0.15, + "learning_rate": 0.00027685733615704245, + "loss": 0.0277, "step": 59520 }, { - "epoch": 0.3, - "learning_rate": 0.00025494952348759656, - "loss": 0.0174, + "epoch": 0.15, + "learning_rate": 0.00027685344794067097, + "loss": 0.032, "step": 59530 }, { - "epoch": 0.3, - "learning_rate": 0.00025494195579458254, - "loss": 0.0194, + "epoch": 0.15, + "learning_rate": 0.00027684955972429953, + "loss": 0.0234, "step": 59540 }, { - "epoch": 0.3, - "learning_rate": 0.0002549343881015685, - "loss": 0.0272, + "epoch": 0.15, + "learning_rate": 0.00027684567150792805, + "loss": 0.026, "step": 59550 }, { - "epoch": 0.3, - "learning_rate": 0.0002549268204085545, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.00027684178329155656, + "loss": 0.0293, "step": 59560 }, { - "epoch": 0.3, - "learning_rate": 0.0002549192527155405, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.00027683789507518513, + "loss": 0.0252, "step": 59570 }, { - "epoch": 0.3, - "learning_rate": 0.00025491168502252647, - "loss": 0.0221, + "epoch": 0.15, + "learning_rate": 0.00027683400685881365, + "loss": 0.0272, "step": 59580 }, { - "epoch": 0.3, - "learning_rate": 0.0002549041173295125, - "loss": 0.0304, + "epoch": 0.15, + "learning_rate": 0.0002768301186424422, + "loss": 0.0248, "step": 59590 }, { - "epoch": 0.3, - "learning_rate": 0.0002548965496364985, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.00027682623042607073, + "loss": 0.0325, "step": 59600 }, { - "epoch": 0.3, - "learning_rate": 0.00025488898194348447, - "loss": 0.0246, + "epoch": 0.15, + "learning_rate": 0.00027682234220969924, + "loss": 0.0271, "step": 59610 }, { - "epoch": 0.3, - "learning_rate": 0.00025488141425047045, - "loss": 0.0211, + "epoch": 0.15, + "learning_rate": 0.00027681845399332776, + "loss": 0.0263, "step": 59620 }, { - "epoch": 0.3, - "learning_rate": 0.00025487384655745643, - "loss": 0.0215, + "epoch": 0.15, + "learning_rate": 0.00027681456577695633, + "loss": 0.0285, "step": 59630 }, { - "epoch": 0.3, - "learning_rate": 0.0002548662788644424, - "loss": 0.0218, + "epoch": 0.15, + "learning_rate": 0.0002768106775605849, + "loss": 0.0295, "step": 59640 }, { - "epoch": 0.3, - "learning_rate": 0.00025485871117142845, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002768067893442134, + "loss": 0.0252, "step": 59650 }, { - "epoch": 0.3, - "learning_rate": 0.00025485114347841443, - "loss": 0.0248, + "epoch": 0.15, + "learning_rate": 0.0002768029011278419, + "loss": 0.0303, "step": 59660 }, { - "epoch": 0.3, - "learning_rate": 0.0002548435757854004, - "loss": 0.022, + "epoch": 0.15, + "learning_rate": 0.0002767990129114705, + "loss": 0.0281, "step": 59670 }, { - "epoch": 0.3, - "learning_rate": 0.0002548360080923864, - "loss": 0.0206, + "epoch": 0.15, + "learning_rate": 0.000276795124695099, + "loss": 0.0277, "step": 59680 }, { - "epoch": 0.3, - "learning_rate": 0.00025482844039937237, - "loss": 0.0213, + "epoch": 0.15, + "learning_rate": 0.0002767912364787275, + "loss": 0.0271, "step": 59690 }, { - "epoch": 0.3, - "learning_rate": 0.00025482087270635835, - "loss": 0.0178, + "epoch": 0.15, + "learning_rate": 0.0002767873482623561, + "loss": 0.0294, "step": 59700 }, { - "epoch": 0.3, - "learning_rate": 0.00025481330501334434, - "loss": 0.0318, + "epoch": 0.15, + "learning_rate": 0.0002767834600459846, + "loss": 0.0227, "step": 59710 }, { - "epoch": 0.3, - "learning_rate": 0.0002548057373203303, - "loss": 0.0239, + "epoch": 0.15, + "learning_rate": 0.0002767795718296132, + "loss": 0.0233, "step": 59720 }, { - "epoch": 0.3, - "learning_rate": 0.0002547981696273163, - "loss": 0.0198, + "epoch": 0.15, + "learning_rate": 0.0002767756836132417, + "loss": 0.0245, "step": 59730 }, { - "epoch": 0.3, - "learning_rate": 0.0002547906019343023, - "loss": 0.0214, + "epoch": 0.15, + "learning_rate": 0.0002767717953968702, + "loss": 0.0296, "step": 59740 }, { - "epoch": 0.3, - "learning_rate": 0.00025478303424128826, - "loss": 0.0176, + "epoch": 0.15, + "learning_rate": 0.0002767679071804988, + "loss": 0.0276, "step": 59750 }, { - "epoch": 0.3, - "learning_rate": 0.0002547754665482743, - "loss": 0.021, + "epoch": 0.15, + "learning_rate": 0.0002767640189641273, + "loss": 0.0249, "step": 59760 }, { - "epoch": 0.3, - "learning_rate": 0.0002547678988552603, - "loss": 0.0196, + "epoch": 0.15, + "learning_rate": 0.0002767601307477558, + "loss": 0.0292, "step": 59770 }, { - "epoch": 0.3, - "learning_rate": 0.00025476033116224626, - "loss": 0.0192, + "epoch": 0.15, + "learning_rate": 0.00027675624253138437, + "loss": 0.0272, "step": 59780 }, { - "epoch": 0.3, - "learning_rate": 0.00025475276346923224, - "loss": 0.025, + "epoch": 0.15, + "learning_rate": 0.00027675235431501294, + "loss": 0.0258, "step": 59790 }, { - "epoch": 0.3, - "learning_rate": 0.0002547451957762182, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.00027674846609864145, + "loss": 0.0257, "step": 59800 }, { - "epoch": 0.3, - "learning_rate": 0.0002547376280832042, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.00027674457788226997, + "loss": 0.0243, "step": 59810 }, { - "epoch": 0.3, - "learning_rate": 0.00025473006039019024, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002767406896658985, + "loss": 0.026, "step": 59820 }, { - "epoch": 0.3, - "learning_rate": 0.0002547224926971762, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.000276736801449527, + "loss": 0.0263, "step": 59830 }, { - "epoch": 0.3, - "learning_rate": 0.0002547149250041622, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.00027673291323315557, + "loss": 0.0296, "step": 59840 }, { - "epoch": 0.3, - "learning_rate": 0.0002547073573111482, - "loss": 0.016, + "epoch": 0.16, + "learning_rate": 0.00027672902501678414, + "loss": 0.0266, "step": 59850 }, { - "epoch": 0.3, - "learning_rate": 0.00025469978961813417, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.00027672513680041265, + "loss": 0.0276, "step": 59860 }, { - "epoch": 0.3, - "learning_rate": 0.00025469222192512015, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.00027672124858404116, + "loss": 0.0268, "step": 59870 }, { - "epoch": 0.3, - "learning_rate": 0.0002546846542321062, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027671736036766973, + "loss": 0.0285, "step": 59880 }, { - "epoch": 0.3, - "learning_rate": 0.00025467708653909216, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.00027671347215129825, + "loss": 0.026, "step": 59890 }, { - "epoch": 0.3, - "learning_rate": 0.00025466951884607815, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.00027670958393492676, + "loss": 0.0262, "step": 59900 }, { - "epoch": 0.3, - "learning_rate": 0.0002546619511530641, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.00027670569571855533, + "loss": 0.0349, "step": 59910 }, { - "epoch": 0.3, - "learning_rate": 0.0002546543834600501, - "loss": 0.0191, + "epoch": 0.16, + "learning_rate": 0.00027670180750218385, + "loss": 0.0277, "step": 59920 }, { - "epoch": 0.3, - "learning_rate": 0.0002546468157670361, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.0002766979192858124, + "loss": 0.0278, "step": 59930 }, { - "epoch": 0.3, - "learning_rate": 0.00025463924807402207, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027669403106944093, + "loss": 0.0327, "step": 59940 }, { - "epoch": 0.3, - "learning_rate": 0.0002546316803810081, - "loss": 0.0267, + "epoch": 0.16, + "learning_rate": 0.00027669014285306944, + "loss": 0.0287, "step": 59950 }, { - "epoch": 0.3, - "learning_rate": 0.0002546241126879941, - "loss": 0.0264, + "epoch": 0.16, + "learning_rate": 0.000276686254636698, + "loss": 0.0251, "step": 59960 }, { - "epoch": 0.3, - "learning_rate": 0.00025461654499498007, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.0002766823664203265, + "loss": 0.0294, "step": 59970 }, { - "epoch": 0.3, - "learning_rate": 0.00025460897730196605, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.00027667847820395504, + "loss": 0.0298, "step": 59980 }, { - "epoch": 0.3, - "learning_rate": 0.00025460140960895203, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002766745899875836, + "loss": 0.0255, "step": 59990 }, { - "epoch": 0.3, - "learning_rate": 0.000254593841915938, - "loss": 0.0241, + "epoch": 0.16, + "learning_rate": 0.0002766707017712122, + "loss": 0.0276, "step": 60000 }, { - "epoch": 0.3, - "eval_cer": 0.9145197461055578, - "eval_loss": 0.01466525811702013, - "eval_runtime": 116.7343, - "eval_samples_per_second": 17.133, - "eval_steps_per_second": 4.283, + "epoch": 0.16, + "eval_cer": 0.8818426500165857, + "eval_loss": 0.01959504745900631, + "eval_runtime": 108.0446, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, "step": 60000 }, { - "epoch": 0.3, - "learning_rate": 0.00025458627422292405, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.0002766668135548407, + "loss": 0.0247, "step": 60010 }, { - "epoch": 0.3, - "learning_rate": 0.00025457870652991003, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.0002766629253384692, + "loss": 0.0283, "step": 60020 }, { - "epoch": 0.3, - "learning_rate": 0.000254571138836896, - "loss": 0.025, + "epoch": 0.16, + "learning_rate": 0.0002766590371220977, + "loss": 0.0262, "step": 60030 }, { - "epoch": 0.3, - "learning_rate": 0.000254563571143882, - "loss": 0.0254, + "epoch": 0.16, + "learning_rate": 0.0002766551489057263, + "loss": 0.0234, "step": 60040 }, { - "epoch": 0.3, - "learning_rate": 0.000254556003450868, - "loss": 0.0161, + "epoch": 0.16, + "learning_rate": 0.0002766512606893548, + "loss": 0.0299, "step": 60050 }, { - "epoch": 0.3, - "learning_rate": 0.00025454843575785396, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.0002766473724729834, + "loss": 0.0319, "step": 60060 }, { - "epoch": 0.3, - "learning_rate": 0.00025454086806483994, - "loss": 0.0249, + "epoch": 0.16, + "learning_rate": 0.0002766434842566119, + "loss": 0.0294, "step": 60070 }, { - "epoch": 0.3, - "learning_rate": 0.000254533300371826, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.0002766395960402404, + "loss": 0.027, "step": 60080 }, { - "epoch": 0.3, - "learning_rate": 0.00025452573267881196, - "loss": 0.0251, + "epoch": 0.16, + "learning_rate": 0.00027663570782386897, + "loss": 0.0289, "step": 60090 }, { - "epoch": 0.3, - "learning_rate": 0.00025451816498579794, - "loss": 0.0184, + "epoch": 0.16, + "learning_rate": 0.0002766318196074975, + "loss": 0.0263, "step": 60100 }, { - "epoch": 0.3, - "learning_rate": 0.0002545105972927839, - "loss": 0.0202, + "epoch": 0.16, + "learning_rate": 0.000276627931391126, + "loss": 0.0258, "step": 60110 }, { - "epoch": 0.3, - "learning_rate": 0.0002545030295997699, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.00027662404317475457, + "loss": 0.0313, "step": 60120 }, { - "epoch": 0.3, - "learning_rate": 0.0002544954619067559, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.0002766201549583831, + "loss": 0.0317, "step": 60130 }, { - "epoch": 0.3, - "learning_rate": 0.0002544878942137419, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.00027661626674201165, + "loss": 0.0316, "step": 60140 }, { - "epoch": 0.3, - "learning_rate": 0.0002544803265207279, - "loss": 0.0158, + "epoch": 0.16, + "learning_rate": 0.00027661237852564017, + "loss": 0.0224, "step": 60150 }, { - "epoch": 0.3, - "learning_rate": 0.0002544727588277139, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.0002766084903092687, + "loss": 0.025, "step": 60160 }, { - "epoch": 0.3, - "learning_rate": 0.00025446519113469986, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.00027660460209289725, + "loss": 0.0259, "step": 60170 }, { - "epoch": 0.3, - "learning_rate": 0.00025445762344168584, - "loss": 0.0174, + "epoch": 0.16, + "learning_rate": 0.00027660071387652577, + "loss": 0.0275, "step": 60180 }, { - "epoch": 0.3, - "learning_rate": 0.0002544500557486718, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027659682566015433, + "loss": 0.0258, "step": 60190 }, { - "epoch": 0.3, - "learning_rate": 0.00025444248805565786, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027659293744378285, + "loss": 0.0209, "step": 60200 }, { - "epoch": 0.3, - "learning_rate": 0.00025443492036264384, - "loss": 0.0172, + "epoch": 0.16, + "learning_rate": 0.0002765890492274114, + "loss": 0.0296, "step": 60210 }, { - "epoch": 0.3, - "learning_rate": 0.0002544273526696298, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.00027658516101103993, + "loss": 0.0258, "step": 60220 }, { - "epoch": 0.3, - "learning_rate": 0.0002544197849766158, - "loss": 0.0178, + "epoch": 0.16, + "learning_rate": 0.00027658127279466845, + "loss": 0.0322, "step": 60230 }, { - "epoch": 0.3, - "learning_rate": 0.0002544122172836018, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.00027657738457829696, + "loss": 0.0231, "step": 60240 }, { - "epoch": 0.3, - "learning_rate": 0.00025440464959058777, - "loss": 0.0244, + "epoch": 0.16, + "learning_rate": 0.00027657349636192553, + "loss": 0.0259, "step": 60250 }, { - "epoch": 0.3, - "learning_rate": 0.00025439708189757375, - "loss": 0.0236, + "epoch": 0.16, + "learning_rate": 0.00027656960814555404, + "loss": 0.0231, "step": 60260 }, { - "epoch": 0.3, - "learning_rate": 0.0002543895142045598, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002765657199291826, + "loss": 0.0237, "step": 60270 }, { - "epoch": 0.3, - "learning_rate": 0.00025438194651154577, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.00027656183171281113, + "loss": 0.0218, "step": 60280 }, { - "epoch": 0.3, - "learning_rate": 0.00025437437881853175, - "loss": 0.0232, + "epoch": 0.16, + "learning_rate": 0.00027655794349643964, + "loss": 0.0258, "step": 60290 }, { - "epoch": 0.3, - "learning_rate": 0.00025436681112551773, - "loss": 0.0174, + "epoch": 0.16, + "learning_rate": 0.0002765540552800682, + "loss": 0.0267, "step": 60300 }, { - "epoch": 0.3, - "learning_rate": 0.0002543592434325037, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002765501670636967, + "loss": 0.0226, "step": 60310 }, { - "epoch": 0.3, - "learning_rate": 0.0002543516757394897, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.00027654627884732524, + "loss": 0.0233, "step": 60320 }, { - "epoch": 0.3, - "learning_rate": 0.0002543441080464757, - "loss": 0.0178, + "epoch": 0.16, + "learning_rate": 0.0002765423906309538, + "loss": 0.0207, "step": 60330 }, { - "epoch": 0.3, - "learning_rate": 0.0002543365403534617, - "loss": 0.0174, + "epoch": 0.16, + "learning_rate": 0.0002765385024145824, + "loss": 0.0277, "step": 60340 }, { - "epoch": 0.3, - "learning_rate": 0.0002543289726604477, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.0002765346141982109, + "loss": 0.0268, "step": 60350 }, { - "epoch": 0.3, - "learning_rate": 0.00025432140496743367, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002765307259818394, + "loss": 0.0253, "step": 60360 }, { - "epoch": 0.3, - "learning_rate": 0.00025431383727441965, - "loss": 0.0151, + "epoch": 0.16, + "learning_rate": 0.0002765268377654679, + "loss": 0.0211, "step": 60370 }, { - "epoch": 0.3, - "learning_rate": 0.00025430626958140563, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.0002765229495490965, + "loss": 0.0266, "step": 60380 }, { - "epoch": 0.3, - "learning_rate": 0.0002542987018883916, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.000276519061332725, + "loss": 0.0229, "step": 60390 }, { - "epoch": 0.3, - "learning_rate": 0.00025429113419537765, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.0002765151731163536, + "loss": 0.0271, "step": 60400 }, { - "epoch": 0.3, - "learning_rate": 0.00025428356650236363, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.0002765112848999821, + "loss": 0.0263, "step": 60410 }, { - "epoch": 0.3, - "learning_rate": 0.0002542759988093496, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027650739668361066, + "loss": 0.0251, "step": 60420 }, { - "epoch": 0.3, - "learning_rate": 0.0002542684311163356, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.00027650350846723917, + "loss": 0.0364, "step": 60430 }, { - "epoch": 0.3, - "learning_rate": 0.0002542608634233216, - "loss": 0.0154, + "epoch": 0.16, + "learning_rate": 0.0002764996202508677, + "loss": 0.0299, "step": 60440 }, { - "epoch": 0.3, - "learning_rate": 0.00025425329573030756, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.0002764957320344962, + "loss": 0.0271, "step": 60450 }, { - "epoch": 0.31, - "learning_rate": 0.0002542457280372936, - "loss": 0.0172, + "epoch": 0.16, + "learning_rate": 0.00027649184381812477, + "loss": 0.0295, "step": 60460 }, { - "epoch": 0.31, - "learning_rate": 0.0002542381603442796, - "loss": 0.0191, + "epoch": 0.16, + "learning_rate": 0.0002764879556017533, + "loss": 0.0292, "step": 60470 }, { - "epoch": 0.31, - "learning_rate": 0.00025423059265126556, - "loss": 0.0174, + "epoch": 0.16, + "learning_rate": 0.00027648406738538185, + "loss": 0.0293, "step": 60480 }, { - "epoch": 0.31, - "learning_rate": 0.00025422302495825154, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.00027648017916901037, + "loss": 0.0244, "step": 60490 }, { - "epoch": 0.31, - "learning_rate": 0.0002542154572652375, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027647629095263894, + "loss": 0.0296, "step": 60500 }, { - "epoch": 0.31, - "learning_rate": 0.0002542078895722235, - "loss": 0.0244, + "epoch": 0.16, + "learning_rate": 0.00027647240273626745, + "loss": 0.0283, "step": 60510 }, { - "epoch": 0.31, - "learning_rate": 0.00025420032187920954, - "loss": 0.0176, + "epoch": 0.16, + "learning_rate": 0.00027646851451989596, + "loss": 0.0242, "step": 60520 }, { - "epoch": 0.31, - "learning_rate": 0.0002541927541861955, - "loss": 0.0243, + "epoch": 0.16, + "learning_rate": 0.0002764646263035245, + "loss": 0.0274, "step": 60530 }, { - "epoch": 0.31, - "learning_rate": 0.0002541851864931815, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.00027646073808715305, + "loss": 0.0298, "step": 60540 }, { - "epoch": 0.31, - "learning_rate": 0.0002541776188001675, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.0002764568498707816, + "loss": 0.0303, "step": 60550 }, { - "epoch": 0.31, - "learning_rate": 0.00025417005110715346, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.00027645296165441013, + "loss": 0.0305, "step": 60560 }, { - "epoch": 0.31, - "learning_rate": 0.00025416248341413944, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.00027644907343803865, + "loss": 0.0231, "step": 60570 }, { - "epoch": 0.31, - "learning_rate": 0.0002541549157211254, - "loss": 0.0238, + "epoch": 0.16, + "learning_rate": 0.00027644518522166716, + "loss": 0.0301, "step": 60580 }, { - "epoch": 0.31, - "learning_rate": 0.00025414734802811146, - "loss": 0.0173, + "epoch": 0.16, + "learning_rate": 0.00027644129700529573, + "loss": 0.029, "step": 60590 }, { - "epoch": 0.31, - "learning_rate": 0.00025413978033509744, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.00027643740878892424, + "loss": 0.0223, "step": 60600 }, { - "epoch": 0.31, - "learning_rate": 0.0002541322126420834, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.0002764335205725528, + "loss": 0.0274, "step": 60610 }, { - "epoch": 0.31, - "learning_rate": 0.0002541246449490694, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.0002764296323561813, + "loss": 0.0257, "step": 60620 }, { - "epoch": 0.31, - "learning_rate": 0.0002541170772560554, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.0002764257441398099, + "loss": 0.0287, "step": 60630 }, { - "epoch": 0.31, - "learning_rate": 0.00025410950956304137, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.0002764218559234384, + "loss": 0.0335, "step": 60640 }, { - "epoch": 0.31, - "learning_rate": 0.0002541019418700274, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.0002764179677070669, + "loss": 0.025, "step": 60650 }, { - "epoch": 0.31, - "learning_rate": 0.0002540943741770134, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.00027641407949069544, + "loss": 0.0271, "step": 60660 }, { - "epoch": 0.31, - "learning_rate": 0.00025408680648399937, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.000276410191274324, + "loss": 0.0265, "step": 60670 }, { - "epoch": 0.31, - "learning_rate": 0.00025407923879098535, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.0002764063030579526, + "loss": 0.0291, "step": 60680 }, { - "epoch": 0.31, - "learning_rate": 0.00025407167109797133, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.0002764024148415811, + "loss": 0.0241, "step": 60690 }, { - "epoch": 0.31, - "learning_rate": 0.0002540641034049573, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002763985266252096, + "loss": 0.0251, "step": 60700 }, { - "epoch": 0.31, - "learning_rate": 0.00025405653571194335, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.0002763946384088382, + "loss": 0.0203, "step": 60710 }, { - "epoch": 0.31, - "learning_rate": 0.00025404896801892933, - "loss": 0.0173, + "epoch": 0.16, + "learning_rate": 0.0002763907501924667, + "loss": 0.0278, "step": 60720 }, { - "epoch": 0.31, - "learning_rate": 0.0002540414003259153, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.0002763868619760952, + "loss": 0.0324, "step": 60730 }, { - "epoch": 0.31, - "learning_rate": 0.0002540338326329013, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.00027638297375972377, + "loss": 0.0273, "step": 60740 }, { - "epoch": 0.31, - "learning_rate": 0.0002540262649398873, - "loss": 0.0158, + "epoch": 0.16, + "learning_rate": 0.0002763790855433523, + "loss": 0.0352, "step": 60750 }, { - "epoch": 0.31, - "learning_rate": 0.00025401869724687325, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.00027637519732698086, + "loss": 0.0265, "step": 60760 }, { - "epoch": 0.31, - "learning_rate": 0.00025401112955385924, - "loss": 0.018, + "epoch": 0.16, + "learning_rate": 0.00027637130911060937, + "loss": 0.0235, "step": 60770 }, { - "epoch": 0.31, - "learning_rate": 0.00025400356186084527, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.0002763674208942379, + "loss": 0.0247, "step": 60780 }, { - "epoch": 0.31, - "learning_rate": 0.00025399599416783125, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.0002763635326778664, + "loss": 0.0265, "step": 60790 }, { - "epoch": 0.31, - "learning_rate": 0.00025398842647481723, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.00027635964446149497, + "loss": 0.0272, "step": 60800 }, { - "epoch": 0.31, - "learning_rate": 0.0002539808587818032, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002763557562451235, + "loss": 0.0235, "step": 60810 }, { - "epoch": 0.31, - "learning_rate": 0.0002539732910887892, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.00027635186802875205, + "loss": 0.0265, "step": 60820 }, { - "epoch": 0.31, - "learning_rate": 0.0002539657233957752, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.00027634797981238057, + "loss": 0.0268, "step": 60830 }, { - "epoch": 0.31, - "learning_rate": 0.0002539581557027612, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.00027634409159600913, + "loss": 0.0237, "step": 60840 }, { - "epoch": 0.31, - "learning_rate": 0.0002539505880097472, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.00027634020337963765, + "loss": 0.0257, "step": 60850 }, { - "epoch": 0.31, - "learning_rate": 0.0002539430203167332, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.00027633631516326616, + "loss": 0.0231, "step": 60860 }, { - "epoch": 0.31, - "learning_rate": 0.00025393545262371916, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.0002763324269468947, + "loss": 0.0306, "step": 60870 }, { - "epoch": 0.31, - "learning_rate": 0.00025392788493070514, - "loss": 0.0246, + "epoch": 0.16, + "learning_rate": 0.00027632853873052325, + "loss": 0.0213, "step": 60880 }, { - "epoch": 0.31, - "learning_rate": 0.0002539203172376911, - "loss": 0.0224, + "epoch": 0.16, + "learning_rate": 0.0002763246505141518, + "loss": 0.0235, "step": 60890 }, { - "epoch": 0.31, - "learning_rate": 0.0002539127495446771, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.00027632076229778033, + "loss": 0.021, "step": 60900 }, { - "epoch": 0.31, - "learning_rate": 0.00025390518185166314, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027631687408140884, + "loss": 0.0308, "step": 60910 }, { - "epoch": 0.31, - "learning_rate": 0.0002538976141586491, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.0002763129858650374, + "loss": 0.0208, "step": 60920 }, { - "epoch": 0.31, - "learning_rate": 0.0002538900464656351, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.00027630909764866593, + "loss": 0.0252, "step": 60930 }, { - "epoch": 0.31, - "learning_rate": 0.0002538824787726211, - "loss": 0.0187, + "epoch": 0.16, + "learning_rate": 0.00027630520943229444, + "loss": 0.0225, "step": 60940 }, { - "epoch": 0.31, - "learning_rate": 0.00025387491107960706, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.000276301321215923, + "loss": 0.0268, "step": 60950 }, { - "epoch": 0.31, - "learning_rate": 0.00025386734338659305, - "loss": 0.0174, + "epoch": 0.16, + "learning_rate": 0.0002762974329995515, + "loss": 0.0253, "step": 60960 }, { - "epoch": 0.31, - "learning_rate": 0.00025385977569357903, - "loss": 0.018, + "epoch": 0.16, + "learning_rate": 0.0002762935447831801, + "loss": 0.0256, "step": 60970 }, { - "epoch": 0.31, - "learning_rate": 0.000253852208000565, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.0002762896565668086, + "loss": 0.0266, "step": 60980 }, { - "epoch": 0.31, - "learning_rate": 0.000253844640307551, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.0002762857683504371, + "loss": 0.0265, "step": 60990 }, { - "epoch": 0.31, - "learning_rate": 0.00025383707261453697, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.0002762818801340657, + "loss": 0.0256, "step": 61000 }, { - "epoch": 0.31, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.01344729121774435, - "eval_runtime": 116.7714, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.16, + "eval_cer": 0.8818818398507428, + "eval_loss": 0.01873914897441864, + "eval_runtime": 107.4676, + "eval_samples_per_second": 18.61, + "eval_steps_per_second": 4.653, "step": 61000 }, { - "epoch": 0.31, - "learning_rate": 0.000253829504921523, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.0002762779919176942, + "loss": 0.0292, "step": 61010 }, { - "epoch": 0.31, - "learning_rate": 0.000253821937228509, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.0002762741037013227, + "loss": 0.0257, "step": 61020 }, { - "epoch": 0.31, - "learning_rate": 0.00025381436953549497, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.0002762702154849513, + "loss": 0.0312, "step": 61030 }, { - "epoch": 0.31, - "learning_rate": 0.00025380680184248095, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.0002762663272685798, + "loss": 0.0251, "step": 61040 }, { - "epoch": 0.31, - "learning_rate": 0.00025379923414946693, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.00027626243905220837, + "loss": 0.0263, "step": 61050 }, { - "epoch": 0.31, - "learning_rate": 0.0002537916664564529, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.0002762585508358369, + "loss": 0.023, "step": 61060 }, { - "epoch": 0.31, - "learning_rate": 0.00025378409876343895, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002762546626194654, + "loss": 0.0265, "step": 61070 }, { - "epoch": 0.31, - "learning_rate": 0.00025377653107042493, - "loss": 0.0202, + "epoch": 0.16, + "learning_rate": 0.00027625077440309397, + "loss": 0.0332, "step": 61080 }, { - "epoch": 0.31, - "learning_rate": 0.0002537689633774109, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.0002762468861867225, + "loss": 0.0207, "step": 61090 }, { - "epoch": 0.31, - "learning_rate": 0.0002537613956843969, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027624299797035105, + "loss": 0.0291, "step": 61100 }, { - "epoch": 0.31, - "learning_rate": 0.0002537538279913829, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027623910975397957, + "loss": 0.0322, "step": 61110 }, { - "epoch": 0.31, - "learning_rate": 0.00025374626029836886, - "loss": 0.0154, + "epoch": 0.16, + "learning_rate": 0.0002762352215376081, + "loss": 0.0253, "step": 61120 }, { - "epoch": 0.31, - "learning_rate": 0.00025373869260535484, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.00027623133332123665, + "loss": 0.0258, "step": 61130 }, { - "epoch": 0.31, - "learning_rate": 0.0002537311249123409, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.00027622744510486517, + "loss": 0.0297, "step": 61140 }, { - "epoch": 0.31, - "learning_rate": 0.00025372355721932686, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002762235568884937, + "loss": 0.0251, "step": 61150 }, { - "epoch": 0.31, - "learning_rate": 0.00025371598952631284, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027621966867212225, + "loss": 0.0242, "step": 61160 }, { - "epoch": 0.31, - "learning_rate": 0.0002537084218332988, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.00027621578045575076, + "loss": 0.0253, "step": 61170 }, { - "epoch": 0.31, - "learning_rate": 0.0002537008541402848, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.00027621189223937933, + "loss": 0.0224, "step": 61180 }, { - "epoch": 0.31, - "learning_rate": 0.0002536932864472708, - "loss": 0.0142, + "epoch": 0.16, + "learning_rate": 0.00027620800402300785, + "loss": 0.0306, "step": 61190 }, { - "epoch": 0.31, - "learning_rate": 0.0002536857187542568, - "loss": 0.0162, + "epoch": 0.16, + "learning_rate": 0.00027620411580663636, + "loss": 0.031, "step": 61200 }, { - "epoch": 0.31, - "learning_rate": 0.0002536781510612428, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.00027620022759026493, + "loss": 0.0303, "step": 61210 }, { - "epoch": 0.31, - "learning_rate": 0.0002536705833682288, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027619633937389345, + "loss": 0.0243, "step": 61220 }, { - "epoch": 0.31, - "learning_rate": 0.00025366301567521476, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.000276192451157522, + "loss": 0.0259, "step": 61230 }, { - "epoch": 0.31, - "learning_rate": 0.00025365544798220074, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.00027618856294115053, + "loss": 0.0276, "step": 61240 }, { - "epoch": 0.31, - "learning_rate": 0.0002536478802891867, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.0002761846747247791, + "loss": 0.0316, "step": 61250 }, { - "epoch": 0.31, - "learning_rate": 0.00025364031259617276, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.0002761807865084076, + "loss": 0.029, "step": 61260 }, { - "epoch": 0.31, - "learning_rate": 0.00025363274490315874, - "loss": 0.021, + "epoch": 0.16, + "learning_rate": 0.0002761768982920361, + "loss": 0.0299, "step": 61270 }, { - "epoch": 0.31, - "learning_rate": 0.0002536251772101447, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.00027617301007566464, + "loss": 0.0275, "step": 61280 }, { - "epoch": 0.31, - "learning_rate": 0.0002536176095171307, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.0002761691218592932, + "loss": 0.0279, "step": 61290 }, { - "epoch": 0.31, - "learning_rate": 0.0002536100418241167, - "loss": 0.0178, + "epoch": 0.16, + "learning_rate": 0.0002761652336429217, + "loss": 0.0204, "step": 61300 }, { - "epoch": 0.31, - "learning_rate": 0.00025360247413110267, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.0002761613454265503, + "loss": 0.034, "step": 61310 }, { - "epoch": 0.31, - "learning_rate": 0.00025359490643808865, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002761574572101788, + "loss": 0.0285, "step": 61320 }, { - "epoch": 0.31, - "learning_rate": 0.0002535873387450747, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002761535689938073, + "loss": 0.0228, "step": 61330 }, { - "epoch": 0.31, - "learning_rate": 0.00025357977105206067, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.0002761496807774359, + "loss": 0.0285, "step": 61340 }, { - "epoch": 0.31, - "learning_rate": 0.00025357220335904665, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002761457925610644, + "loss": 0.0247, "step": 61350 }, { - "epoch": 0.31, - "learning_rate": 0.00025356463566603263, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002761419043446929, + "loss": 0.0285, "step": 61360 }, { - "epoch": 0.31, - "learning_rate": 0.0002535570679730186, - "loss": 0.0226, + "epoch": 0.16, + "learning_rate": 0.0002761380161283215, + "loss": 0.0313, "step": 61370 }, { - "epoch": 0.31, - "learning_rate": 0.0002535495002800046, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.00027613412791195006, + "loss": 0.0329, "step": 61380 }, { - "epoch": 0.31, - "learning_rate": 0.00025354193258699063, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027613023969557857, + "loss": 0.0258, "step": 61390 }, { - "epoch": 0.31, - "learning_rate": 0.0002535343648939766, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.0002761263514792071, + "loss": 0.0229, "step": 61400 }, { - "epoch": 0.31, - "learning_rate": 0.0002535267972009626, - "loss": 0.0229, + "epoch": 0.16, + "learning_rate": 0.0002761224632628356, + "loss": 0.0275, "step": 61410 }, { - "epoch": 0.31, - "learning_rate": 0.00025351922950794857, - "loss": 0.0246, + "epoch": 0.16, + "learning_rate": 0.00027611857504646417, + "loss": 0.0273, "step": 61420 }, { - "epoch": 0.31, - "learning_rate": 0.00025351166181493455, - "loss": 0.0162, + "epoch": 0.16, + "learning_rate": 0.0002761146868300927, + "loss": 0.0265, "step": 61430 }, { - "epoch": 0.31, - "learning_rate": 0.00025350409412192053, - "loss": 0.0236, + "epoch": 0.16, + "learning_rate": 0.00027611079861372125, + "loss": 0.0336, "step": 61440 }, { - "epoch": 0.31, - "learning_rate": 0.00025349652642890657, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027610691039734977, + "loss": 0.0306, "step": 61450 }, { - "epoch": 0.31, - "learning_rate": 0.00025348895873589255, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.00027610302218097834, + "loss": 0.0322, "step": 61460 }, { - "epoch": 0.31, - "learning_rate": 0.00025348139104287853, - "loss": 0.0222, + "epoch": 0.16, + "learning_rate": 0.00027609913396460685, + "loss": 0.0274, "step": 61470 }, { - "epoch": 0.31, - "learning_rate": 0.0002534738233498645, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.00027609524574823537, + "loss": 0.027, "step": 61480 }, { - "epoch": 0.31, - "learning_rate": 0.0002534662556568505, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.0002760913575318639, + "loss": 0.0229, "step": 61490 }, { - "epoch": 0.31, - "learning_rate": 0.0002534586879638365, - "loss": 0.0163, + "epoch": 0.16, + "learning_rate": 0.00027608746931549245, + "loss": 0.0282, "step": 61500 }, { - "epoch": 0.31, - "learning_rate": 0.00025345112027082246, - "loss": 0.0176, + "epoch": 0.16, + "learning_rate": 0.00027608358109912096, + "loss": 0.0301, "step": 61510 }, { - "epoch": 0.31, - "learning_rate": 0.0002534435525778085, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027607969288274953, + "loss": 0.0297, "step": 61520 }, { - "epoch": 0.31, - "learning_rate": 0.0002534359848847945, - "loss": 0.017, + "epoch": 0.16, + "learning_rate": 0.00027607580466637805, + "loss": 0.0321, "step": 61530 }, { - "epoch": 0.31, - "learning_rate": 0.00025342841719178046, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.00027607191645000656, + "loss": 0.0362, "step": 61540 }, { - "epoch": 0.31, - "learning_rate": 0.00025342084949876644, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.00027606802823363513, + "loss": 0.029, "step": 61550 }, { - "epoch": 0.31, - "learning_rate": 0.0002534132818057524, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.00027606414001726364, + "loss": 0.0211, "step": 61560 }, { - "epoch": 0.31, - "learning_rate": 0.0002534057141127384, - "loss": 0.0209, + "epoch": 0.16, + "learning_rate": 0.00027606025180089216, + "loss": 0.0226, "step": 61570 }, { - "epoch": 0.31, - "learning_rate": 0.00025339814641972444, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.00027605636358452073, + "loss": 0.0274, "step": 61580 }, { - "epoch": 0.31, - "learning_rate": 0.0002533905787267104, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.0002760524753681493, + "loss": 0.0259, "step": 61590 }, { - "epoch": 0.31, - "learning_rate": 0.0002533830110336964, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.0002760485871517778, + "loss": 0.0238, "step": 61600 }, { - "epoch": 0.31, - "learning_rate": 0.0002533754433406824, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002760446989354063, + "loss": 0.0272, "step": 61610 }, { - "epoch": 0.31, - "learning_rate": 0.00025336787564766836, - "loss": 0.0169, + "epoch": 0.16, + "learning_rate": 0.00027604081071903484, + "loss": 0.0208, "step": 61620 }, { - "epoch": 0.31, - "learning_rate": 0.00025336030795465434, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002760369225026634, + "loss": 0.0267, "step": 61630 }, { - "epoch": 0.31, - "learning_rate": 0.0002533527402616403, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002760330342862919, + "loss": 0.0266, "step": 61640 }, { - "epoch": 0.31, - "learning_rate": 0.00025334517256862636, - "loss": 0.0171, + "epoch": 0.16, + "learning_rate": 0.0002760291460699205, + "loss": 0.0246, "step": 61650 }, { - "epoch": 0.31, - "learning_rate": 0.00025333760487561234, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.000276025257853549, + "loss": 0.0324, "step": 61660 }, { - "epoch": 0.31, - "learning_rate": 0.0002533300371825983, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002760213696371776, + "loss": 0.0311, "step": 61670 }, { - "epoch": 0.31, - "learning_rate": 0.0002533224694895843, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.0002760174814208061, + "loss": 0.0251, "step": 61680 }, { - "epoch": 0.31, - "learning_rate": 0.0002533149017965703, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002760135932044346, + "loss": 0.0263, "step": 61690 }, { - "epoch": 0.31, - "learning_rate": 0.00025330733410355627, - "loss": 0.021, + "epoch": 0.16, + "learning_rate": 0.0002760097049880631, + "loss": 0.0284, "step": 61700 }, { - "epoch": 0.31, - "learning_rate": 0.0002532997664105423, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002760058167716917, + "loss": 0.0242, "step": 61710 }, { - "epoch": 0.31, - "learning_rate": 0.0002532921987175283, - "loss": 0.024, + "epoch": 0.16, + "learning_rate": 0.0002760019285553202, + "loss": 0.0273, "step": 61720 }, { - "epoch": 0.31, - "learning_rate": 0.00025328463102451427, - "loss": 0.018, + "epoch": 0.16, + "learning_rate": 0.00027599804033894877, + "loss": 0.0321, "step": 61730 }, { - "epoch": 0.31, - "learning_rate": 0.00025327706333150025, - "loss": 0.0191, + "epoch": 0.16, + "learning_rate": 0.0002759941521225773, + "loss": 0.0251, "step": 61740 }, { - "epoch": 0.31, - "learning_rate": 0.00025326949563848623, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.00027599026390620585, + "loss": 0.0264, "step": 61750 }, { - "epoch": 0.31, - "learning_rate": 0.0002532619279454722, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027598637568983437, + "loss": 0.0254, "step": 61760 }, { - "epoch": 0.31, - "learning_rate": 0.00025325436025245825, - "loss": 0.0175, + "epoch": 0.16, + "learning_rate": 0.0002759824874734629, + "loss": 0.0242, "step": 61770 }, { - "epoch": 0.31, - "learning_rate": 0.00025324679255944423, - "loss": 0.0175, + "epoch": 0.16, + "learning_rate": 0.00027597859925709145, + "loss": 0.0265, "step": 61780 }, { - "epoch": 0.31, - "learning_rate": 0.0002532392248664302, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.00027597471104071997, + "loss": 0.0285, "step": 61790 }, { - "epoch": 0.31, - "learning_rate": 0.0002532316571734162, - "loss": 0.0211, + "epoch": 0.16, + "learning_rate": 0.00027597082282434853, + "loss": 0.0272, "step": 61800 }, { - "epoch": 0.31, - "learning_rate": 0.0002532240894804022, - "loss": 0.0191, + "epoch": 0.16, + "learning_rate": 0.00027596693460797705, + "loss": 0.0256, "step": 61810 }, { - "epoch": 0.31, - "learning_rate": 0.00025321652178738815, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.00027596304639160556, + "loss": 0.0233, "step": 61820 }, { - "epoch": 0.31, - "learning_rate": 0.00025320895409437414, - "loss": 0.0227, + "epoch": 0.16, + "learning_rate": 0.0002759591581752341, + "loss": 0.0261, "step": 61830 }, { - "epoch": 0.31, - "learning_rate": 0.00025320138640136017, - "loss": 0.0221, + "epoch": 0.16, + "learning_rate": 0.00027595526995886265, + "loss": 0.0269, "step": 61840 }, { - "epoch": 0.31, - "learning_rate": 0.00025319381870834615, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027595138174249116, + "loss": 0.029, "step": 61850 }, { - "epoch": 0.31, - "learning_rate": 0.00025318625101533213, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.00027594749352611973, + "loss": 0.0199, "step": 61860 }, { - "epoch": 0.31, - "learning_rate": 0.0002531786833223181, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027594360530974825, + "loss": 0.0327, "step": 61870 }, { - "epoch": 0.31, - "learning_rate": 0.0002531711156293041, - "loss": 0.0242, + "epoch": 0.16, + "learning_rate": 0.0002759397170933768, + "loss": 0.0215, "step": 61880 }, { - "epoch": 0.31, - "learning_rate": 0.0002531635479362901, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027593582887700533, + "loss": 0.0264, "step": 61890 }, { - "epoch": 0.31, - "learning_rate": 0.0002531559802432761, - "loss": 0.0158, + "epoch": 0.16, + "learning_rate": 0.00027593194066063384, + "loss": 0.0233, "step": 61900 }, { - "epoch": 0.31, - "learning_rate": 0.0002531484125502621, - "loss": 0.0187, + "epoch": 0.16, + "learning_rate": 0.00027592805244426236, + "loss": 0.031, "step": 61910 }, { - "epoch": 0.31, - "learning_rate": 0.0002531408448572481, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.0002759241642278909, + "loss": 0.0286, "step": 61920 }, { - "epoch": 0.31, - "learning_rate": 0.00025313327716423406, + "epoch": 0.16, + "learning_rate": 0.0002759202760115195, "loss": 0.0252, "step": 61930 }, { - "epoch": 0.31, - "learning_rate": 0.00025312570947122004, - "loss": 0.0224, + "epoch": 0.16, + "learning_rate": 0.000275916387795148, + "loss": 0.0302, "step": 61940 }, { - "epoch": 0.31, - "learning_rate": 0.000253118141778206, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.0002759124995787765, + "loss": 0.0252, "step": 61950 }, { - "epoch": 0.31, - "learning_rate": 0.00025311057408519206, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002759086113624051, + "loss": 0.0249, "step": 61960 }, { - "epoch": 0.31, - "learning_rate": 0.00025310300639217804, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002759047231460336, + "loss": 0.0222, "step": 61970 }, { - "epoch": 0.31, - "learning_rate": 0.000253095438699164, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.0002759008349296621, + "loss": 0.0317, "step": 61980 }, { - "epoch": 0.31, - "learning_rate": 0.00025308787100615, - "loss": 0.0169, + "epoch": 0.16, + "learning_rate": 0.0002758969467132907, + "loss": 0.0284, "step": 61990 }, { - "epoch": 0.31, - "learning_rate": 0.000253080303313136, - "loss": 0.024, + "epoch": 0.16, + "learning_rate": 0.0002758930584969192, + "loss": 0.0285, "step": 62000 }, { - "epoch": 0.31, - "eval_cer": 0.9144838414489178, - "eval_loss": 0.014024483039975166, - "eval_runtime": 116.7957, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.16, + "eval_cer": 0.8818426500165857, + "eval_loss": 0.019648298621177673, + "eval_runtime": 107.6017, + "eval_samples_per_second": 18.587, + "eval_steps_per_second": 4.647, "step": 62000 }, { - "epoch": 0.31, - "learning_rate": 0.00025307273562012196, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.0002758891702805478, + "loss": 0.0248, "step": 62010 }, { - "epoch": 0.31, - "learning_rate": 0.00025306516792710795, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.0002758852820641763, + "loss": 0.0273, "step": 62020 }, { - "epoch": 0.31, - "learning_rate": 0.000253057600234094, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.0002758813938478048, + "loss": 0.024, "step": 62030 }, { - "epoch": 0.31, - "learning_rate": 0.00025305003254107996, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.0002758775056314333, + "loss": 0.0296, "step": 62040 }, { - "epoch": 0.31, - "learning_rate": 0.00025304246484806594, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.0002758736174150619, + "loss": 0.0298, "step": 62050 }, { - "epoch": 0.31, - "learning_rate": 0.0002530348971550519, - "loss": 0.0228, + "epoch": 0.16, + "learning_rate": 0.0002758697291986904, + "loss": 0.0245, "step": 62060 }, { - "epoch": 0.31, - "learning_rate": 0.0002530273294620379, - "loss": 0.022, + "epoch": 0.16, + "learning_rate": 0.00027586584098231897, + "loss": 0.0359, "step": 62070 }, { - "epoch": 0.31, - "learning_rate": 0.0002530197617690239, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.0002758619527659475, + "loss": 0.0327, "step": 62080 }, { - "epoch": 0.31, - "learning_rate": 0.0002530121940760099, - "loss": 0.0275, + "epoch": 0.16, + "learning_rate": 0.00027585806454957605, + "loss": 0.0267, "step": 62090 }, { - "epoch": 0.31, - "learning_rate": 0.0002530046263829959, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.00027585417633320457, + "loss": 0.0293, "step": 62100 }, { - "epoch": 0.31, - "learning_rate": 0.0002529970586899819, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002758502881168331, + "loss": 0.0269, "step": 62110 }, { - "epoch": 0.31, - "learning_rate": 0.00025298949099696787, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002758463999004616, + "loss": 0.0266, "step": 62120 }, { - "epoch": 0.31, - "learning_rate": 0.00025298192330395385, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.00027584251168409017, + "loss": 0.028, "step": 62130 }, { - "epoch": 0.31, - "learning_rate": 0.00025297435561093983, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.00027583862346771873, + "loss": 0.0241, "step": 62140 }, { - "epoch": 0.31, - "learning_rate": 0.0002529667879179258, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.00027583473525134725, + "loss": 0.0287, "step": 62150 }, { - "epoch": 0.31, - "learning_rate": 0.00025295922022491185, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.00027583084703497576, + "loss": 0.0248, "step": 62160 }, { - "epoch": 0.31, - "learning_rate": 0.00025295165253189783, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.00027582695881860433, + "loss": 0.0303, "step": 62170 }, { - "epoch": 0.31, - "learning_rate": 0.0002529440848388838, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027582307060223285, + "loss": 0.0273, "step": 62180 }, { - "epoch": 0.31, - "learning_rate": 0.0002529365171458698, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.00027581918238586136, + "loss": 0.0284, "step": 62190 }, { - "epoch": 0.31, - "learning_rate": 0.0002529289494528558, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027581529416948993, + "loss": 0.0233, "step": 62200 }, { - "epoch": 0.31, - "learning_rate": 0.00025292138175984176, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.00027581140595311844, + "loss": 0.028, "step": 62210 }, { - "epoch": 0.31, - "learning_rate": 0.00025291381406682774, - "loss": 0.0237, + "epoch": 0.16, + "learning_rate": 0.000275807517736747, + "loss": 0.023, "step": 62220 }, { - "epoch": 0.31, - "learning_rate": 0.0002529062463738137, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.00027580362952037553, + "loss": 0.0239, "step": 62230 }, { - "epoch": 0.31, - "learning_rate": 0.0002528986786807997, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.00027579974130400404, + "loss": 0.027, "step": 62240 }, { - "epoch": 0.31, - "learning_rate": 0.0002528911109877857, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.0002757958530876326, + "loss": 0.022, "step": 62250 }, { - "epoch": 0.31, - "learning_rate": 0.0002528835432947717, - "loss": 0.0231, + "epoch": 0.16, + "learning_rate": 0.0002757919648712611, + "loss": 0.0208, "step": 62260 }, { - "epoch": 0.31, - "learning_rate": 0.0002528759756017577, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.0002757880766548897, + "loss": 0.0277, "step": 62270 }, { - "epoch": 0.31, - "learning_rate": 0.0002528684079087437, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002757841884385182, + "loss": 0.0259, "step": 62280 }, { - "epoch": 0.31, - "learning_rate": 0.00025286084021572966, - "loss": 0.0176, + "epoch": 0.16, + "learning_rate": 0.0002757803002221467, + "loss": 0.0204, "step": 62290 }, { - "epoch": 0.31, - "learning_rate": 0.00025285327252271564, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002757764120057753, + "loss": 0.0294, "step": 62300 }, { - "epoch": 0.31, - "learning_rate": 0.0002528457048297016, - "loss": 0.0173, + "epoch": 0.16, + "learning_rate": 0.0002757725237894038, + "loss": 0.0282, "step": 62310 }, { - "epoch": 0.31, - "learning_rate": 0.00025283813713668766, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002757686355730323, + "loss": 0.0234, "step": 62320 }, { - "epoch": 0.31, - "learning_rate": 0.00025283056944367364, - "loss": 0.0228, + "epoch": 0.16, + "learning_rate": 0.0002757647473566609, + "loss": 0.0227, "step": 62330 }, { - "epoch": 0.31, - "learning_rate": 0.0002528230017506596, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.0002757608591402894, + "loss": 0.0266, "step": 62340 }, { - "epoch": 0.31, - "learning_rate": 0.0002528154340576456, - "loss": 0.0232, + "epoch": 0.16, + "learning_rate": 0.00027575697092391797, + "loss": 0.0288, "step": 62350 }, { - "epoch": 0.31, - "learning_rate": 0.0002528078663646316, - "loss": 0.0159, + "epoch": 0.16, + "learning_rate": 0.0002757530827075465, + "loss": 0.0238, "step": 62360 }, { - "epoch": 0.31, - "learning_rate": 0.00025280029867161757, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.000275749194491175, + "loss": 0.0267, "step": 62370 }, { - "epoch": 0.31, - "learning_rate": 0.00025279273097860355, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027574530627480357, + "loss": 0.0227, "step": 62380 }, { - "epoch": 0.31, - "learning_rate": 0.0002527851632855896, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.0002757414180584321, + "loss": 0.0236, "step": 62390 }, { - "epoch": 0.31, - "learning_rate": 0.00025277759559257557, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.0002757375298420606, + "loss": 0.0182, "step": 62400 }, { - "epoch": 0.31, - "learning_rate": 0.00025277002789956155, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.00027573364162568917, + "loss": 0.0221, "step": 62410 }, { - "epoch": 0.31, - "learning_rate": 0.00025276246020654753, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.00027572975340931774, + "loss": 0.0257, "step": 62420 }, { - "epoch": 0.31, - "learning_rate": 0.0002527548925135335, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027572586519294625, + "loss": 0.0237, "step": 62430 }, { - "epoch": 0.32, - "learning_rate": 0.0002527473248205195, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.00027572197697657477, + "loss": 0.0242, "step": 62440 }, { - "epoch": 0.32, - "learning_rate": 0.00025273975712750553, - "loss": 0.0245, + "epoch": 0.16, + "learning_rate": 0.0002757180887602033, + "loss": 0.0282, "step": 62450 }, { - "epoch": 0.32, - "learning_rate": 0.0002527321894344915, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027571420054383185, + "loss": 0.0231, "step": 62460 }, { - "epoch": 0.32, - "learning_rate": 0.0002527246217414775, - "loss": 0.0215, + "epoch": 0.16, + "learning_rate": 0.00027571031232746036, + "loss": 0.0287, "step": 62470 }, { - "epoch": 0.32, - "learning_rate": 0.00025271705404846347, - "loss": 0.0223, + "epoch": 0.16, + "learning_rate": 0.00027570642411108893, + "loss": 0.0286, "step": 62480 }, { - "epoch": 0.32, - "learning_rate": 0.00025270948635544945, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.00027570253589471745, + "loss": 0.026, "step": 62490 }, { - "epoch": 0.32, - "learning_rate": 0.00025270191866243543, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.000275698647678346, + "loss": 0.0264, "step": 62500 }, { - "epoch": 0.32, - "learning_rate": 0.00025269435096942147, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.00027569475946197453, + "loss": 0.0237, "step": 62510 }, { - "epoch": 0.32, - "learning_rate": 0.00025268678327640745, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.00027569087124560304, + "loss": 0.0246, "step": 62520 }, { - "epoch": 0.32, - "learning_rate": 0.00025267921558339343, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.00027568698302923156, + "loss": 0.0248, "step": 62530 }, { - "epoch": 0.32, - "learning_rate": 0.0002526716478903794, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027568309481286013, + "loss": 0.0283, "step": 62540 }, { - "epoch": 0.32, - "learning_rate": 0.0002526640801973654, - "loss": 0.0155, + "epoch": 0.16, + "learning_rate": 0.00027567920659648864, + "loss": 0.0263, "step": 62550 }, { - "epoch": 0.32, - "learning_rate": 0.0002526565125043514, - "loss": 0.0229, + "epoch": 0.16, + "learning_rate": 0.0002756753183801172, + "loss": 0.0284, "step": 62560 }, { - "epoch": 0.32, - "learning_rate": 0.00025264894481133736, - "loss": 0.0238, + "epoch": 0.16, + "learning_rate": 0.0002756714301637457, + "loss": 0.0251, "step": 62570 }, { - "epoch": 0.32, - "learning_rate": 0.0002526413771183234, - "loss": 0.0245, + "epoch": 0.16, + "learning_rate": 0.00027566754194737424, + "loss": 0.0244, "step": 62580 }, { - "epoch": 0.32, - "learning_rate": 0.0002526338094253094, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002756636537310028, + "loss": 0.0269, "step": 62590 }, { - "epoch": 0.32, - "learning_rate": 0.00025262624173229536, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.0002756597655146313, + "loss": 0.0209, "step": 62600 }, { - "epoch": 0.32, - "learning_rate": 0.00025261867403928134, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027565587729825984, + "loss": 0.0225, "step": 62610 }, { - "epoch": 0.32, - "learning_rate": 0.0002526111063462673, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.0002756519890818884, + "loss": 0.0275, "step": 62620 }, { - "epoch": 0.32, - "learning_rate": 0.0002526035386532533, - "loss": 0.0173, + "epoch": 0.16, + "learning_rate": 0.000275648100865517, + "loss": 0.027, "step": 62630 }, { - "epoch": 0.32, - "learning_rate": 0.00025259597096023934, - "loss": 0.0172, + "epoch": 0.16, + "learning_rate": 0.0002756442126491455, + "loss": 0.0224, "step": 62640 }, { - "epoch": 0.32, - "learning_rate": 0.0002525884032672253, - "loss": 0.0247, + "epoch": 0.16, + "learning_rate": 0.000275640324432774, + "loss": 0.0238, "step": 62650 }, { - "epoch": 0.32, - "learning_rate": 0.0002525808355742113, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.0002756364362164025, + "loss": 0.0244, "step": 62660 }, { - "epoch": 0.32, - "learning_rate": 0.0002525732678811973, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.0002756325480000311, + "loss": 0.0273, "step": 62670 }, { - "epoch": 0.32, - "learning_rate": 0.00025256570018818326, - "loss": 0.0188, + "epoch": 0.16, + "learning_rate": 0.0002756286597836596, + "loss": 0.0261, "step": 62680 }, { - "epoch": 0.32, - "learning_rate": 0.00025255813249516924, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.00027562477156728817, + "loss": 0.0263, "step": 62690 }, { - "epoch": 0.32, - "learning_rate": 0.0002525505648021552, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002756208833509167, + "loss": 0.0275, "step": 62700 }, { - "epoch": 0.32, - "learning_rate": 0.00025254299710914126, - "loss": 0.0178, + "epoch": 0.16, + "learning_rate": 0.00027561699513454525, + "loss": 0.0275, "step": 62710 }, { - "epoch": 0.32, - "learning_rate": 0.00025253542941612724, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.00027561310691817377, + "loss": 0.0265, "step": 62720 }, { - "epoch": 0.32, - "learning_rate": 0.0002525278617231132, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.0002756092187018023, + "loss": 0.0225, "step": 62730 }, { - "epoch": 0.32, - "learning_rate": 0.0002525202940300992, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002756053304854308, + "loss": 0.0264, "step": 62740 }, { - "epoch": 0.32, - "learning_rate": 0.0002525127263370852, - "loss": 0.0273, + "epoch": 0.16, + "learning_rate": 0.00027560144226905937, + "loss": 0.0224, "step": 62750 }, { - "epoch": 0.32, - "learning_rate": 0.00025250515864407117, - "loss": 0.0189, + "epoch": 0.16, + "learning_rate": 0.0002755975540526879, + "loss": 0.0265, "step": 62760 }, { - "epoch": 0.32, - "learning_rate": 0.0002524975909510572, - "loss": 0.0171, + "epoch": 0.16, + "learning_rate": 0.00027559366583631645, + "loss": 0.026, "step": 62770 }, { - "epoch": 0.32, - "learning_rate": 0.0002524900232580432, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027558977761994496, + "loss": 0.0277, "step": 62780 }, { - "epoch": 0.32, - "learning_rate": 0.00025248245556502917, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.0002755858894035735, + "loss": 0.0247, "step": 62790 }, { - "epoch": 0.32, - "learning_rate": 0.00025247488787201515, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.00027558200118720205, + "loss": 0.0303, "step": 62800 }, { - "epoch": 0.32, - "learning_rate": 0.00025246732017900113, - "loss": 0.0176, + "epoch": 0.16, + "learning_rate": 0.00027557811297083056, + "loss": 0.021, "step": 62810 }, { - "epoch": 0.32, - "learning_rate": 0.0002524597524859871, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027557422475445913, + "loss": 0.021, "step": 62820 }, { - "epoch": 0.32, - "learning_rate": 0.00025245218479297315, - "loss": 0.0213, + "epoch": 0.16, + "learning_rate": 0.00027557033653808765, + "loss": 0.0234, "step": 62830 }, { - "epoch": 0.32, - "learning_rate": 0.00025244461709995913, - "loss": 0.0184, + "epoch": 0.16, + "learning_rate": 0.0002755664483217162, + "loss": 0.0216, "step": 62840 }, { - "epoch": 0.32, - "learning_rate": 0.0002524370494069451, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.00027556256010534473, + "loss": 0.0305, "step": 62850 }, { - "epoch": 0.32, - "learning_rate": 0.0002524294817139311, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027555867188897324, + "loss": 0.0251, "step": 62860 }, { - "epoch": 0.32, - "learning_rate": 0.0002524219140209171, - "loss": 0.0198, + "epoch": 0.16, + "learning_rate": 0.00027555478367260176, + "loss": 0.0249, "step": 62870 }, { - "epoch": 0.32, - "learning_rate": 0.00025241434632790305, - "loss": 0.0249, + "epoch": 0.16, + "learning_rate": 0.0002755508954562303, + "loss": 0.026, "step": 62880 }, { - "epoch": 0.32, - "learning_rate": 0.00025240677863488904, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.00027554700723985884, + "loss": 0.0329, "step": 62890 }, { - "epoch": 0.32, - "learning_rate": 0.00025239921094187507, - "loss": 0.0195, + "epoch": 0.16, + "learning_rate": 0.0002755431190234874, + "loss": 0.0272, "step": 62900 }, { - "epoch": 0.32, - "learning_rate": 0.00025239164324886105, - "loss": 0.0169, + "epoch": 0.16, + "learning_rate": 0.0002755392308071159, + "loss": 0.0276, "step": 62910 }, { - "epoch": 0.32, - "learning_rate": 0.00025238407555584703, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.0002755353425907445, + "loss": 0.0329, "step": 62920 }, { - "epoch": 0.32, - "learning_rate": 0.000252376507862833, - "loss": 0.0181, + "epoch": 0.16, + "learning_rate": 0.000275531454374373, + "loss": 0.0223, "step": 62930 }, { - "epoch": 0.32, - "learning_rate": 0.000252368940169819, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002755275661580015, + "loss": 0.0293, "step": 62940 }, { - "epoch": 0.32, - "learning_rate": 0.000252361372476805, - "loss": 0.0204, + "epoch": 0.16, + "learning_rate": 0.00027552367794163004, + "loss": 0.0323, "step": 62950 }, { - "epoch": 0.32, - "learning_rate": 0.000252353804783791, - "loss": 0.0172, + "epoch": 0.16, + "learning_rate": 0.0002755197897252586, + "loss": 0.0246, "step": 62960 }, { - "epoch": 0.32, - "learning_rate": 0.000252346237090777, - "loss": 0.0169, + "epoch": 0.16, + "learning_rate": 0.0002755159015088872, + "loss": 0.0205, "step": 62970 }, { - "epoch": 0.32, - "learning_rate": 0.000252338669397763, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.0002755120132925157, + "loss": 0.0242, "step": 62980 }, { - "epoch": 0.32, - "learning_rate": 0.00025233110170474896, - "loss": 0.0192, + "epoch": 0.16, + "learning_rate": 0.0002755081250761442, + "loss": 0.028, "step": 62990 }, { - "epoch": 0.32, - "learning_rate": 0.00025232353401173494, - "loss": 0.0175, + "epoch": 0.16, + "learning_rate": 0.00027550423685977277, + "loss": 0.0253, "step": 63000 }, { - "epoch": 0.32, - "eval_cer": 0.9144712262992877, - "eval_loss": 0.013699725270271301, - "eval_runtime": 116.7034, - "eval_samples_per_second": 17.137, - "eval_steps_per_second": 4.284, + "epoch": 0.16, + "eval_cer": 0.8818356518319148, + "eval_loss": 0.018866481259465218, + "eval_runtime": 107.714, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, "step": 63000 }, { - "epoch": 0.32, - "learning_rate": 0.0002523159663187209, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002755003486434013, + "loss": 0.0263, "step": 63010 }, { - "epoch": 0.32, - "learning_rate": 0.00025230839862570696, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.0002754964604270298, + "loss": 0.0276, "step": 63020 }, { - "epoch": 0.32, - "learning_rate": 0.00025230083093269294, - "loss": 0.0214, + "epoch": 0.16, + "learning_rate": 0.00027549257221065837, + "loss": 0.0318, "step": 63030 }, { - "epoch": 0.32, - "learning_rate": 0.0002522932632396789, - "loss": 0.0225, + "epoch": 0.16, + "learning_rate": 0.0002754886839942869, + "loss": 0.0266, "step": 63040 }, { - "epoch": 0.32, - "learning_rate": 0.0002522856955466649, - "loss": 0.0154, + "epoch": 0.16, + "learning_rate": 0.00027548479577791545, + "loss": 0.0235, "step": 63050 }, { - "epoch": 0.32, - "learning_rate": 0.0002522781278536509, - "loss": 0.0199, + "epoch": 0.16, + "learning_rate": 0.00027548090756154397, + "loss": 0.026, "step": 63060 }, { - "epoch": 0.32, - "learning_rate": 0.00025227056016063686, - "loss": 0.017, + "epoch": 0.16, + "learning_rate": 0.0002754770193451725, + "loss": 0.0332, "step": 63070 }, { - "epoch": 0.32, - "learning_rate": 0.00025226299246762285, - "loss": 0.0253, + "epoch": 0.16, + "learning_rate": 0.000275473131128801, + "loss": 0.0296, "step": 63080 }, { - "epoch": 0.32, - "learning_rate": 0.0002522554247746089, - "loss": 0.0208, + "epoch": 0.16, + "learning_rate": 0.00027546924291242957, + "loss": 0.0264, "step": 63090 }, { - "epoch": 0.32, - "learning_rate": 0.00025224785708159486, - "loss": 0.0201, + "epoch": 0.16, + "learning_rate": 0.0002754653546960581, + "loss": 0.0284, "step": 63100 }, { - "epoch": 0.32, - "learning_rate": 0.00025224028938858084, - "loss": 0.0207, + "epoch": 0.16, + "learning_rate": 0.00027546146647968665, + "loss": 0.033, "step": 63110 }, { - "epoch": 0.32, - "learning_rate": 0.0002522327216955668, - "loss": 0.0171, + "epoch": 0.16, + "learning_rate": 0.00027545757826331516, + "loss": 0.0239, "step": 63120 }, { - "epoch": 0.32, - "learning_rate": 0.0002522251540025528, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.00027545369004694373, + "loss": 0.0235, "step": 63130 }, { - "epoch": 0.32, - "learning_rate": 0.0002522175863095388, - "loss": 0.0175, + "epoch": 0.16, + "learning_rate": 0.00027544980183057225, + "loss": 0.0327, "step": 63140 }, { - "epoch": 0.32, - "learning_rate": 0.0002522100186165248, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027544591361420076, + "loss": 0.0312, "step": 63150 }, { - "epoch": 0.32, - "learning_rate": 0.0002522024509235108, - "loss": 0.0233, + "epoch": 0.16, + "learning_rate": 0.0002754420253978293, + "loss": 0.0286, "step": 63160 }, { - "epoch": 0.32, - "learning_rate": 0.0002521948832304968, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.00027543813718145784, + "loss": 0.0312, "step": 63170 }, { - "epoch": 0.32, - "learning_rate": 0.00025218731553748277, - "loss": 0.018, + "epoch": 0.16, + "learning_rate": 0.0002754342489650864, + "loss": 0.0279, "step": 63180 }, { - "epoch": 0.32, - "learning_rate": 0.00025217974784446875, - "loss": 0.0212, + "epoch": 0.16, + "learning_rate": 0.00027543036074871493, + "loss": 0.0279, "step": 63190 }, { - "epoch": 0.32, - "learning_rate": 0.00025217218015145473, - "loss": 0.0184, + "epoch": 0.16, + "learning_rate": 0.00027542647253234344, + "loss": 0.0277, "step": 63200 }, { - "epoch": 0.32, - "learning_rate": 0.0002521646124584407, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.000275422584315972, + "loss": 0.0268, "step": 63210 }, { - "epoch": 0.32, - "learning_rate": 0.00025215704476542675, - "loss": 0.0268, + "epoch": 0.16, + "learning_rate": 0.0002754186960996005, + "loss": 0.0261, "step": 63220 }, { - "epoch": 0.32, - "learning_rate": 0.00025214947707241273, - "loss": 0.0197, + "epoch": 0.16, + "learning_rate": 0.00027541480788322904, + "loss": 0.0263, "step": 63230 }, { - "epoch": 0.32, - "learning_rate": 0.0002521419093793987, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.0002754109196668576, + "loss": 0.0303, "step": 63240 }, { - "epoch": 0.32, - "learning_rate": 0.0002521343416863847, - "loss": 0.0178, + "epoch": 0.16, + "learning_rate": 0.0002754070314504861, + "loss": 0.0272, "step": 63250 }, { - "epoch": 0.32, - "learning_rate": 0.0002521267739933707, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.0002754031432341147, + "loss": 0.0268, "step": 63260 }, { - "epoch": 0.32, - "learning_rate": 0.00025211920630035666, - "loss": 0.0217, + "epoch": 0.16, + "learning_rate": 0.0002753992550177432, + "loss": 0.0267, "step": 63270 }, { - "epoch": 0.32, - "learning_rate": 0.0002521116386073427, - "loss": 0.0218, + "epoch": 0.16, + "learning_rate": 0.0002753953668013717, + "loss": 0.0275, "step": 63280 }, { - "epoch": 0.32, - "learning_rate": 0.0002521040709143287, - "loss": 0.02, + "epoch": 0.16, + "learning_rate": 0.00027539147858500024, + "loss": 0.0348, "step": 63290 }, { - "epoch": 0.32, - "learning_rate": 0.00025209650322131465, - "loss": 0.0262, + "epoch": 0.16, + "learning_rate": 0.0002753875903686288, + "loss": 0.0329, "step": 63300 }, { - "epoch": 0.32, - "learning_rate": 0.00025208893552830064, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.0002753837021522573, + "loss": 0.0228, "step": 63310 }, { - "epoch": 0.32, - "learning_rate": 0.0002520813678352866, - "loss": 0.019, + "epoch": 0.16, + "learning_rate": 0.0002753798139358859, + "loss": 0.0277, "step": 63320 }, { - "epoch": 0.32, - "learning_rate": 0.0002520738001422726, - "loss": 0.017, + "epoch": 0.16, + "learning_rate": 0.0002753759257195144, + "loss": 0.028, "step": 63330 }, { - "epoch": 0.32, - "learning_rate": 0.00025206623244925863, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027537203750314297, + "loss": 0.026, "step": 63340 }, { - "epoch": 0.32, - "learning_rate": 0.0002520586647562446, - "loss": 0.0183, + "epoch": 0.16, + "learning_rate": 0.0002753681492867715, + "loss": 0.02, "step": 63350 }, { - "epoch": 0.32, - "learning_rate": 0.0002520510970632306, - "loss": 0.018, + "epoch": 0.16, + "learning_rate": 0.0002753642610704, + "loss": 0.0251, "step": 63360 }, { - "epoch": 0.32, - "learning_rate": 0.0002520435293702166, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.00027536037285402857, + "loss": 0.0275, "step": 63370 }, { - "epoch": 0.32, - "learning_rate": 0.00025203596167720256, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.0002753564846376571, + "loss": 0.0266, "step": 63380 }, { - "epoch": 0.32, - "learning_rate": 0.00025202839398418854, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027535259642128565, + "loss": 0.023, "step": 63390 }, { - "epoch": 0.32, - "learning_rate": 0.0002520208262911745, - "loss": 0.0273, + "epoch": 0.16, + "learning_rate": 0.00027534870820491417, + "loss": 0.0268, "step": 63400 }, { - "epoch": 0.32, - "learning_rate": 0.00025201325859816056, - "loss": 0.0179, + "epoch": 0.16, + "learning_rate": 0.0002753448199885427, + "loss": 0.0251, "step": 63410 }, { - "epoch": 0.32, - "learning_rate": 0.00025200569090514654, - "loss": 0.0242, + "epoch": 0.16, + "learning_rate": 0.00027534093177217125, + "loss": 0.027, "step": 63420 }, { - "epoch": 0.32, - "learning_rate": 0.0002519981232121325, - "loss": 0.0193, + "epoch": 0.16, + "learning_rate": 0.00027533704355579976, + "loss": 0.0268, "step": 63430 }, { - "epoch": 0.32, - "learning_rate": 0.0002519905555191185, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.0002753331553394283, + "loss": 0.0329, "step": 63440 }, { - "epoch": 0.32, - "learning_rate": 0.0002519829878261045, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.00027532926712305685, + "loss": 0.0252, "step": 63450 }, { - "epoch": 0.32, - "learning_rate": 0.00025197542013309047, - "loss": 0.0206, + "epoch": 0.16, + "learning_rate": 0.0002753253789066854, + "loss": 0.0243, "step": 63460 }, { - "epoch": 0.32, - "learning_rate": 0.0002519678524400765, - "loss": 0.0165, + "epoch": 0.16, + "learning_rate": 0.00027532149069031393, + "loss": 0.0221, "step": 63470 }, { - "epoch": 0.32, - "learning_rate": 0.00025196028474706243, - "loss": 0.0186, + "epoch": 0.16, + "learning_rate": 0.00027531760247394245, + "loss": 0.0275, "step": 63480 }, { - "epoch": 0.32, - "learning_rate": 0.0002519527170540484, - "loss": 0.0216, + "epoch": 0.16, + "learning_rate": 0.00027531371425757096, + "loss": 0.0262, "step": 63490 }, { - "epoch": 0.32, - "learning_rate": 0.0002519451493610344, - "loss": 0.0175, + "epoch": 0.16, + "learning_rate": 0.00027530982604119953, + "loss": 0.0242, "step": 63500 }, { - "epoch": 0.32, - "learning_rate": 0.00025193758166802043, - "loss": 0.0144, + "epoch": 0.16, + "learning_rate": 0.00027530593782482804, + "loss": 0.0245, "step": 63510 }, { - "epoch": 0.32, - "learning_rate": 0.0002519300139750064, - "loss": 0.0219, + "epoch": 0.16, + "learning_rate": 0.0002753020496084566, + "loss": 0.0283, "step": 63520 }, { - "epoch": 0.32, - "learning_rate": 0.0002519224462819924, - "loss": 0.0196, + "epoch": 0.16, + "learning_rate": 0.0002752981613920851, + "loss": 0.0261, "step": 63530 }, { - "epoch": 0.32, - "learning_rate": 0.00025191487858897837, - "loss": 0.0194, + "epoch": 0.16, + "learning_rate": 0.00027529427317571364, + "loss": 0.0288, "step": 63540 }, { - "epoch": 0.32, - "learning_rate": 0.00025190731089596435, - "loss": 0.0176, + "epoch": 0.16, + "learning_rate": 0.0002752903849593422, + "loss": 0.0249, "step": 63550 }, { - "epoch": 0.32, - "learning_rate": 0.00025189974320295034, - "loss": 0.0203, + "epoch": 0.16, + "learning_rate": 0.0002752864967429707, + "loss": 0.0302, "step": 63560 }, { - "epoch": 0.32, - "learning_rate": 0.00025189217550993637, - "loss": 0.0162, + "epoch": 0.16, + "learning_rate": 0.00027528260852659924, + "loss": 0.0242, "step": 63570 }, { - "epoch": 0.32, - "learning_rate": 0.00025188460781692235, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.0002752787203102278, + "loss": 0.0252, "step": 63580 }, { - "epoch": 0.32, - "learning_rate": 0.00025187704012390833, - "loss": 0.0205, + "epoch": 0.16, + "learning_rate": 0.0002752748320938563, + "loss": 0.0258, "step": 63590 }, { - "epoch": 0.32, - "learning_rate": 0.0002518694724308943, - "loss": 0.023, + "epoch": 0.16, + "learning_rate": 0.0002752709438774849, + "loss": 0.0233, "step": 63600 }, { - "epoch": 0.32, - "learning_rate": 0.0002518619047378803, - "loss": 0.0245, + "epoch": 0.16, + "learning_rate": 0.0002752670556611134, + "loss": 0.0321, "step": 63610 }, { - "epoch": 0.32, - "learning_rate": 0.0002518543370448663, - "loss": 0.0177, + "epoch": 0.16, + "learning_rate": 0.0002752631674447419, + "loss": 0.0242, "step": 63620 }, { - "epoch": 0.32, - "learning_rate": 0.00025184676935185226, - "loss": 0.0182, + "epoch": 0.16, + "learning_rate": 0.0002752592792283705, + "loss": 0.0584, "step": 63630 }, { - "epoch": 0.32, - "learning_rate": 0.0002518392016588383, - "loss": 0.0235, + "epoch": 0.16, + "learning_rate": 0.000275255391011999, + "loss": 0.0265, "step": 63640 }, { - "epoch": 0.32, - "learning_rate": 0.0002518316339658243, - "loss": 0.0185, + "epoch": 0.16, + "learning_rate": 0.0002752515027956275, + "loss": 0.0271, "step": 63650 }, { - "epoch": 0.32, - "learning_rate": 0.00025182406627281026, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.0002752476145792561, + "loss": 0.0306, "step": 63660 }, { - "epoch": 0.32, - "learning_rate": 0.00025181649857979624, - "loss": 0.0162, + "epoch": 0.17, + "learning_rate": 0.00027524372636288466, + "loss": 0.0429, "step": 63670 }, { - "epoch": 0.32, - "learning_rate": 0.0002518089308867822, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027523983814651317, + "loss": 0.0229, "step": 63680 }, { - "epoch": 0.32, - "learning_rate": 0.0002518013631937682, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002752359499301417, + "loss": 0.0288, "step": 63690 }, { - "epoch": 0.32, - "learning_rate": 0.00025179379550075424, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002752320617137702, + "loss": 0.0421, "step": 63700 }, { - "epoch": 0.32, - "learning_rate": 0.0002517862278077402, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.00027522817349739877, + "loss": 0.0224, "step": 63710 }, { - "epoch": 0.32, - "learning_rate": 0.0002517786601147262, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.0002752242852810273, + "loss": 0.024, "step": 63720 }, { - "epoch": 0.32, - "learning_rate": 0.0002517710924217122, - "loss": 0.0245, + "epoch": 0.17, + "learning_rate": 0.00027522039706465585, + "loss": 0.0271, "step": 63730 }, { - "epoch": 0.32, - "learning_rate": 0.00025176352472869816, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.00027521650884828437, + "loss": 0.0318, "step": 63740 }, { - "epoch": 0.32, - "learning_rate": 0.00025175595703568415, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.00027521262063191293, + "loss": 0.0251, "step": 63750 }, { - "epoch": 0.32, - "learning_rate": 0.0002517483893426702, - "loss": 0.026, + "epoch": 0.17, + "learning_rate": 0.00027520873241554145, + "loss": 0.0245, "step": 63760 }, { - "epoch": 0.32, - "learning_rate": 0.00025174082164965616, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.00027520484419916996, + "loss": 0.0247, "step": 63770 }, { - "epoch": 0.32, - "learning_rate": 0.00025173325395664214, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002752009559827985, + "loss": 0.0263, "step": 63780 }, { - "epoch": 0.32, - "learning_rate": 0.0002517256862636281, - "loss": 0.026, + "epoch": 0.17, + "learning_rate": 0.00027519706776642705, + "loss": 0.0275, "step": 63790 }, { - "epoch": 0.32, - "learning_rate": 0.0002517181185706141, - "loss": 0.0196, + "epoch": 0.17, + "learning_rate": 0.00027519317955005556, + "loss": 0.032, "step": 63800 }, { - "epoch": 0.32, - "learning_rate": 0.0002517105508776001, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.00027518929133368413, + "loss": 0.0243, "step": 63810 }, { - "epoch": 0.32, - "learning_rate": 0.00025170298318458607, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.00027518540311731264, + "loss": 0.031, "step": 63820 }, { - "epoch": 0.32, - "learning_rate": 0.0002516954154915721, - "loss": 0.0167, + "epoch": 0.17, + "learning_rate": 0.00027518151490094116, + "loss": 0.0237, "step": 63830 }, { - "epoch": 0.32, - "learning_rate": 0.0002516878477985581, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.00027517762668456973, + "loss": 0.0221, "step": 63840 }, { - "epoch": 0.32, - "learning_rate": 0.00025168028010554407, - "loss": 0.0162, + "epoch": 0.17, + "learning_rate": 0.00027517373846819824, + "loss": 0.0221, "step": 63850 }, { - "epoch": 0.32, - "learning_rate": 0.00025167271241253005, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002751698502518268, + "loss": 0.0277, "step": 63860 }, { - "epoch": 0.32, - "learning_rate": 0.00025166514471951603, - "loss": 0.0227, + "epoch": 0.17, + "learning_rate": 0.0002751659620354553, + "loss": 0.0251, "step": 63870 }, { - "epoch": 0.32, - "learning_rate": 0.000251657577026502, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.0002751620738190839, + "loss": 0.0268, "step": 63880 }, { - "epoch": 0.32, - "learning_rate": 0.00025165000933348805, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.0002751581856027124, + "loss": 0.0249, "step": 63890 }, { - "epoch": 0.32, - "learning_rate": 0.00025164244164047403, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.0002751542973863409, + "loss": 0.0273, "step": 63900 }, { - "epoch": 0.32, - "learning_rate": 0.00025163487394746, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.00027515040916996944, + "loss": 0.027, "step": 63910 }, { - "epoch": 0.32, - "learning_rate": 0.000251627306254446, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.000275146520953598, + "loss": 0.0246, "step": 63920 }, { - "epoch": 0.32, - "learning_rate": 0.000251619738561432, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.0002751426327372265, + "loss": 0.0269, "step": 63930 }, { - "epoch": 0.32, - "learning_rate": 0.00025161217086841796, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.0002751387445208551, + "loss": 0.022, "step": 63940 }, { - "epoch": 0.32, - "learning_rate": 0.00025160460317540394, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.0002751348563044836, + "loss": 0.0288, "step": 63950 }, { - "epoch": 0.32, - "learning_rate": 0.00025159703548238997, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.0002751309680881122, + "loss": 0.0265, "step": 63960 }, { - "epoch": 0.32, - "learning_rate": 0.00025158946778937595, - "loss": 0.026, + "epoch": 0.17, + "learning_rate": 0.0002751270798717407, + "loss": 0.0233, "step": 63970 }, { - "epoch": 0.32, - "learning_rate": 0.00025158190009636194, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.0002751231916553692, + "loss": 0.0273, "step": 63980 }, { - "epoch": 0.32, - "learning_rate": 0.0002515743324033479, - "loss": 0.0206, + "epoch": 0.17, + "learning_rate": 0.0002751193034389977, + "loss": 0.0279, "step": 63990 }, { - "epoch": 0.32, - "learning_rate": 0.0002515667647103339, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.0002751154152226263, + "loss": 0.0284, "step": 64000 }, { - "epoch": 0.32, - "eval_cer": 0.9144692855070369, - "eval_loss": 0.01427229680120945, - "eval_runtime": 116.7184, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.17, + "eval_cer": 0.8818384511057832, + "eval_loss": 0.018597625195980072, + "eval_runtime": 108.1781, + "eval_samples_per_second": 18.488, + "eval_steps_per_second": 4.622, "step": 64000 }, { - "epoch": 0.32, - "learning_rate": 0.0002515591970173199, - "loss": 0.0165, + "epoch": 0.17, + "learning_rate": 0.00027511152700625485, + "loss": 0.0261, "step": 64010 }, { - "epoch": 0.32, - "learning_rate": 0.0002515516293243059, - "loss": 0.0222, + "epoch": 0.17, + "learning_rate": 0.00027510763878988337, + "loss": 0.0258, "step": 64020 }, { - "epoch": 0.32, - "learning_rate": 0.0002515440616312919, - "loss": 0.0173, + "epoch": 0.17, + "learning_rate": 0.0002751037505735119, + "loss": 0.0294, "step": 64030 }, { - "epoch": 0.32, - "learning_rate": 0.0002515364939382779, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002750998623571404, + "loss": 0.0255, "step": 64040 }, { - "epoch": 0.32, - "learning_rate": 0.00025152892624526386, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027509597414076897, + "loss": 0.031, "step": 64050 }, { - "epoch": 0.32, - "learning_rate": 0.00025152135855224984, - "loss": 0.0208, + "epoch": 0.17, + "learning_rate": 0.0002750920859243975, + "loss": 0.0274, "step": 64060 }, { - "epoch": 0.32, - "learning_rate": 0.0002515137908592358, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.00027508819770802605, + "loss": 0.0303, "step": 64070 }, { - "epoch": 0.32, - "learning_rate": 0.00025150622316622186, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.00027508430949165456, + "loss": 0.0212, "step": 64080 }, { - "epoch": 0.32, - "learning_rate": 0.00025149865547320784, - "loss": 0.0217, + "epoch": 0.17, + "learning_rate": 0.00027508042127528313, + "loss": 0.0259, "step": 64090 }, { - "epoch": 0.32, - "learning_rate": 0.0002514910877801938, - "loss": 0.0243, + "epoch": 0.17, + "learning_rate": 0.00027507653305891165, + "loss": 0.0248, "step": 64100 }, { - "epoch": 0.32, - "learning_rate": 0.0002514835200871798, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027507264484254016, + "loss": 0.0264, "step": 64110 }, { - "epoch": 0.32, - "learning_rate": 0.0002514759523941658, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.0002750687566261687, + "loss": 0.025, "step": 64120 }, { - "epoch": 0.32, - "learning_rate": 0.00025146838470115177, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027506486840979725, + "loss": 0.0237, "step": 64130 }, { - "epoch": 0.32, - "learning_rate": 0.00025146081700813775, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.00027506098019342576, + "loss": 0.0234, "step": 64140 }, { - "epoch": 0.32, - "learning_rate": 0.0002514532493151238, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027505709197705433, + "loss": 0.0264, "step": 64150 }, { - "epoch": 0.32, - "learning_rate": 0.00025144568162210976, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027505320376068284, + "loss": 0.0264, "step": 64160 }, { - "epoch": 0.32, - "learning_rate": 0.00025143811392909575, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.0002750493155443114, + "loss": 0.0233, "step": 64170 }, { - "epoch": 0.32, - "learning_rate": 0.0002514305462360817, - "loss": 0.0184, + "epoch": 0.17, + "learning_rate": 0.0002750454273279399, + "loss": 0.0258, "step": 64180 }, { - "epoch": 0.32, - "learning_rate": 0.0002514229785430677, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.00027504153911156844, + "loss": 0.0301, "step": 64190 }, { - "epoch": 0.32, - "learning_rate": 0.0002514154108500537, - "loss": 0.025, + "epoch": 0.17, + "learning_rate": 0.00027503765089519696, + "loss": 0.0313, "step": 64200 }, { - "epoch": 0.32, - "learning_rate": 0.0002514078431570397, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.0002750337626788255, + "loss": 0.0259, "step": 64210 }, { - "epoch": 0.32, - "learning_rate": 0.0002514002754640257, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.0002750298744624541, + "loss": 0.0273, "step": 64220 }, { - "epoch": 0.32, - "learning_rate": 0.0002513927077710117, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002750259862460826, + "loss": 0.0283, "step": 64230 }, { - "epoch": 0.32, - "learning_rate": 0.00025138514007799767, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.0002750220980297111, + "loss": 0.0263, "step": 64240 }, { - "epoch": 0.32, - "learning_rate": 0.00025137757238498365, - "loss": 0.0217, + "epoch": 0.17, + "learning_rate": 0.0002750182098133397, + "loss": 0.0256, "step": 64250 }, { - "epoch": 0.32, - "learning_rate": 0.00025137000469196963, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.0002750143215969682, + "loss": 0.0214, "step": 64260 }, { - "epoch": 0.32, - "learning_rate": 0.0002513624369989556, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002750104333805967, + "loss": 0.0282, "step": 64270 }, { - "epoch": 0.32, - "learning_rate": 0.00025135486930594165, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.0002750065451642253, + "loss": 0.0258, "step": 64280 }, { - "epoch": 0.32, - "learning_rate": 0.00025134730161292763, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.0002750026569478538, + "loss": 0.0301, "step": 64290 }, { - "epoch": 0.32, - "learning_rate": 0.0002513397339199136, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.00027499876873148237, + "loss": 0.0254, "step": 64300 }, { - "epoch": 0.32, - "learning_rate": 0.0002513321662268996, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.0002749948805151109, + "loss": 0.0218, "step": 64310 }, { - "epoch": 0.32, - "learning_rate": 0.0002513245985338856, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.0002749909922987394, + "loss": 0.0278, "step": 64320 }, { - "epoch": 0.32, - "learning_rate": 0.00025131703084087156, - "loss": 0.0173, + "epoch": 0.17, + "learning_rate": 0.0002749871040823679, + "loss": 0.0279, "step": 64330 }, { - "epoch": 0.32, - "learning_rate": 0.0002513094631478576, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.0002749832158659965, + "loss": 0.0325, "step": 64340 }, { - "epoch": 0.32, - "learning_rate": 0.0002513018954548436, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.000274979327649625, + "loss": 0.0253, "step": 64350 }, { - "epoch": 0.32, - "learning_rate": 0.00025129432776182956, - "loss": 0.0264, + "epoch": 0.17, + "learning_rate": 0.00027497543943325357, + "loss": 0.024, "step": 64360 }, { - "epoch": 0.32, - "learning_rate": 0.00025128676006881554, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.0002749715512168821, + "loss": 0.0245, "step": 64370 }, { - "epoch": 0.32, - "learning_rate": 0.0002512791923758015, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.00027496766300051065, + "loss": 0.0221, "step": 64380 }, { - "epoch": 0.32, - "learning_rate": 0.0002512716246827875, - "loss": 0.0248, + "epoch": 0.17, + "learning_rate": 0.00027496377478413917, + "loss": 0.0277, "step": 64390 }, { - "epoch": 0.32, - "learning_rate": 0.00025126405698977354, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002749598865677677, + "loss": 0.0284, "step": 64400 }, { - "epoch": 0.32, - "learning_rate": 0.0002512564892967595, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.00027495599835139625, + "loss": 0.0265, "step": 64410 }, { - "epoch": 0.33, - "learning_rate": 0.0002512489216037455, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027495211013502476, + "loss": 0.0267, "step": 64420 }, { - "epoch": 0.33, - "learning_rate": 0.0002512413539107315, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.00027494822191865333, + "loss": 0.0267, "step": 64430 }, { - "epoch": 0.33, - "learning_rate": 0.00025123378621771746, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.00027494433370228185, + "loss": 0.0266, "step": 64440 }, { - "epoch": 0.33, - "learning_rate": 0.00025122621852470344, - "loss": 0.0293, + "epoch": 0.17, + "learning_rate": 0.00027494044548591036, + "loss": 0.0265, "step": 64450 }, { - "epoch": 0.33, - "learning_rate": 0.0002512186508316894, - "loss": 0.0289, + "epoch": 0.17, + "learning_rate": 0.00027493655726953893, + "loss": 0.027, "step": 64460 }, { - "epoch": 0.33, - "learning_rate": 0.00025121108313867546, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027493266905316744, + "loss": 0.0246, "step": 64470 }, { - "epoch": 0.33, - "learning_rate": 0.00025120351544566144, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.00027492878083679596, + "loss": 0.0293, "step": 64480 }, { - "epoch": 0.33, - "learning_rate": 0.0002511959477526474, - "loss": 0.0162, + "epoch": 0.17, + "learning_rate": 0.00027492489262042453, + "loss": 0.026, "step": 64490 }, { - "epoch": 0.33, - "learning_rate": 0.0002511883800596334, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.00027492100440405304, + "loss": 0.0191, "step": 64500 }, { - "epoch": 0.33, - "learning_rate": 0.0002511808123666194, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.0002749171161876816, + "loss": 0.0247, "step": 64510 }, { - "epoch": 0.33, - "learning_rate": 0.00025117324467360537, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.0002749132279713101, + "loss": 0.0205, "step": 64520 }, { - "epoch": 0.33, - "learning_rate": 0.0002511656769805914, - "loss": 0.0168, + "epoch": 0.17, + "learning_rate": 0.00027490933975493864, + "loss": 0.0273, "step": 64530 }, { - "epoch": 0.33, - "learning_rate": 0.0002511581092875774, - "loss": 0.0238, + "epoch": 0.17, + "learning_rate": 0.00027490545153856715, + "loss": 0.0248, "step": 64540 }, { - "epoch": 0.33, - "learning_rate": 0.00025115054159456337, - "loss": 0.0161, + "epoch": 0.17, + "learning_rate": 0.0002749015633221957, + "loss": 0.0281, "step": 64550 }, { - "epoch": 0.33, - "learning_rate": 0.00025114297390154935, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002748976751058243, + "loss": 0.0248, "step": 64560 }, { - "epoch": 0.33, - "learning_rate": 0.00025113540620853533, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.0002748937868894528, + "loss": 0.0246, "step": 64570 }, { - "epoch": 0.33, - "learning_rate": 0.0002511278385155213, - "loss": 0.0244, + "epoch": 0.17, + "learning_rate": 0.0002748898986730813, + "loss": 0.0262, "step": 64580 }, { - "epoch": 0.33, - "learning_rate": 0.00025112027082250735, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002748860104567099, + "loss": 0.0312, "step": 64590 }, { - "epoch": 0.33, - "learning_rate": 0.0002511127031294933, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.0002748821222403384, + "loss": 0.0202, "step": 64600 }, { - "epoch": 0.33, - "learning_rate": 0.0002511051354364793, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002748782340239669, + "loss": 0.0259, "step": 64610 }, { - "epoch": 0.33, - "learning_rate": 0.0002510975677434653, - "loss": 0.0247, + "epoch": 0.17, + "learning_rate": 0.0002748743458075955, + "loss": 0.0266, "step": 64620 }, { - "epoch": 0.33, - "learning_rate": 0.00025109000005045127, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.000274870457591224, + "loss": 0.027, "step": 64630 }, { - "epoch": 0.33, - "learning_rate": 0.00025108243235743725, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.00027486656937485257, + "loss": 0.0333, "step": 64640 }, { - "epoch": 0.33, - "learning_rate": 0.00025107486466442323, - "loss": 0.0221, + "epoch": 0.17, + "learning_rate": 0.0002748626811584811, + "loss": 0.022, "step": 64650 }, { - "epoch": 0.33, - "learning_rate": 0.00025106729697140927, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.0002748587929421096, + "loss": 0.0242, "step": 64660 }, { - "epoch": 0.33, - "learning_rate": 0.00025105972927839525, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.00027485490472573817, + "loss": 0.0283, "step": 64670 }, { - "epoch": 0.33, - "learning_rate": 0.00025105216158538123, - "loss": 0.0156, + "epoch": 0.17, + "learning_rate": 0.0002748510165093667, + "loss": 0.0289, "step": 64680 }, { - "epoch": 0.33, - "learning_rate": 0.0002510445938923672, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002748471282929952, + "loss": 0.0288, "step": 64690 }, { - "epoch": 0.33, - "learning_rate": 0.0002510370261993532, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.00027484324007662377, + "loss": 0.0247, "step": 64700 }, { - "epoch": 0.33, - "learning_rate": 0.0002510294585063392, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.00027483935186025234, + "loss": 0.0241, "step": 64710 }, { - "epoch": 0.33, - "learning_rate": 0.0002510218908133252, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.00027483546364388085, + "loss": 0.0298, "step": 64720 }, { - "epoch": 0.33, - "learning_rate": 0.00025101432312031114, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.00027483157542750936, + "loss": 0.03, "step": 64730 }, { - "epoch": 0.33, - "learning_rate": 0.0002510067554272971, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002748276872111379, + "loss": 0.0253, "step": 64740 }, { - "epoch": 0.33, - "learning_rate": 0.0002509991877342831, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027482379899476645, + "loss": 0.0283, "step": 64750 }, { - "epoch": 0.33, - "learning_rate": 0.00025099162004126914, - "loss": 0.0206, + "epoch": 0.17, + "learning_rate": 0.00027481991077839496, + "loss": 0.0256, "step": 64760 }, { - "epoch": 0.33, - "learning_rate": 0.0002509840523482551, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027481602256202353, + "loss": 0.0206, "step": 64770 }, { - "epoch": 0.33, - "learning_rate": 0.0002509764846552411, - "loss": 0.0167, + "epoch": 0.17, + "learning_rate": 0.00027481213434565205, + "loss": 0.0265, "step": 64780 }, { - "epoch": 0.33, - "learning_rate": 0.0002509689169622271, - "loss": 0.0165, + "epoch": 0.17, + "learning_rate": 0.00027480824612928056, + "loss": 0.0283, "step": 64790 }, { - "epoch": 0.33, - "learning_rate": 0.00025096134926921306, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027480435791290913, + "loss": 0.0224, "step": 64800 }, { - "epoch": 0.33, - "learning_rate": 0.00025095378157619905, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.00027480046969653764, + "loss": 0.0224, "step": 64810 }, { - "epoch": 0.33, - "learning_rate": 0.0002509462138831851, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.00027479658148016616, + "loss": 0.0237, "step": 64820 }, { - "epoch": 0.33, - "learning_rate": 0.00025093864619017106, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.0002747926932637947, + "loss": 0.025, "step": 64830 }, { - "epoch": 0.33, - "learning_rate": 0.00025093107849715704, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027478880504742324, + "loss": 0.0228, "step": 64840 }, { - "epoch": 0.33, - "learning_rate": 0.000250923510804143, - "loss": 0.015, + "epoch": 0.17, + "learning_rate": 0.0002747849168310518, + "loss": 0.0251, "step": 64850 }, { - "epoch": 0.33, - "learning_rate": 0.000250915943111129, - "loss": 0.0222, + "epoch": 0.17, + "learning_rate": 0.0002747810286146803, + "loss": 0.0255, "step": 64860 }, { - "epoch": 0.33, - "learning_rate": 0.000250908375418115, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027477714039830884, + "loss": 0.0273, "step": 64870 }, { - "epoch": 0.33, - "learning_rate": 0.00025090080772510097, - "loss": 0.0169, + "epoch": 0.17, + "learning_rate": 0.0002747732521819374, + "loss": 0.0296, "step": 64880 }, { - "epoch": 0.33, - "learning_rate": 0.000250893240032087, - "loss": 0.0217, + "epoch": 0.17, + "learning_rate": 0.0002747693639655659, + "loss": 0.0263, "step": 64890 }, { - "epoch": 0.33, - "learning_rate": 0.000250885672339073, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.00027476547574919444, + "loss": 0.0279, "step": 64900 }, { - "epoch": 0.33, - "learning_rate": 0.00025087810464605897, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.000274761587532823, + "loss": 0.0305, "step": 64910 }, { - "epoch": 0.33, - "learning_rate": 0.00025087053695304495, - "loss": 0.0171, + "epoch": 0.17, + "learning_rate": 0.0002747576993164516, + "loss": 0.0248, "step": 64920 }, { - "epoch": 0.33, - "learning_rate": 0.00025086296926003093, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002747538111000801, + "loss": 0.0212, "step": 64930 }, { - "epoch": 0.33, - "learning_rate": 0.0002508554015670169, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002747499228837086, + "loss": 0.0241, "step": 64940 }, { - "epoch": 0.33, - "learning_rate": 0.00025084783387400295, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002747460346673371, + "loss": 0.0242, "step": 64950 }, { - "epoch": 0.33, - "learning_rate": 0.00025084026618098893, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.0002747421464509657, + "loss": 0.0305, "step": 64960 }, { - "epoch": 0.33, - "learning_rate": 0.0002508326984879749, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.0002747382582345942, + "loss": 0.0241, "step": 64970 }, { - "epoch": 0.33, - "learning_rate": 0.0002508251307949609, - "loss": 0.0263, + "epoch": 0.17, + "learning_rate": 0.00027473437001822277, + "loss": 0.0277, "step": 64980 }, { - "epoch": 0.33, - "learning_rate": 0.0002508175631019469, - "loss": 0.0171, + "epoch": 0.17, + "learning_rate": 0.0002747304818018513, + "loss": 0.0225, "step": 64990 }, { - "epoch": 0.33, - "learning_rate": 0.00025080999540893286, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.00027472659358547985, + "loss": 0.0214, "step": 65000 }, { - "epoch": 0.33, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.013442865572869778, - "eval_runtime": 116.7164, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.17, + "eval_cer": 0.8818076590932312, + "eval_loss": 0.01859799586236477, + "eval_runtime": 108.2159, + "eval_samples_per_second": 18.482, + "eval_steps_per_second": 4.62, "step": 65000 }, { - "epoch": 0.33, - "learning_rate": 0.00025080242771591884, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.00027472270536910837, + "loss": 0.025, "step": 65010 }, { - "epoch": 0.33, - "learning_rate": 0.00025079486002290487, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.0002747188171527369, + "loss": 0.0277, "step": 65020 }, { - "epoch": 0.33, - "learning_rate": 0.00025078729232989085, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.0002747149289363654, + "loss": 0.0265, "step": 65030 }, { - "epoch": 0.33, - "learning_rate": 0.00025077972463687684, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.00027471104071999397, + "loss": 0.0267, "step": 65040 }, { - "epoch": 0.33, - "learning_rate": 0.0002507721569438628, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.00027470715250362253, + "loss": 0.0231, "step": 65050 }, { - "epoch": 0.33, - "learning_rate": 0.0002507645892508488, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.00027470326428725105, + "loss": 0.0262, "step": 65060 }, { - "epoch": 0.33, - "learning_rate": 0.0002507570215578348, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.00027469937607087956, + "loss": 0.0302, "step": 65070 }, { - "epoch": 0.33, - "learning_rate": 0.0002507494538648208, - "loss": 0.0166, + "epoch": 0.17, + "learning_rate": 0.0002746954878545081, + "loss": 0.0231, "step": 65080 }, { - "epoch": 0.33, - "learning_rate": 0.0002507418861718068, - "loss": 0.0141, + "epoch": 0.17, + "learning_rate": 0.00027469159963813665, + "loss": 0.028, "step": 65090 }, { - "epoch": 0.33, - "learning_rate": 0.0002507343184787928, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.00027468771142176516, + "loss": 0.0265, "step": 65100 }, { - "epoch": 0.33, - "learning_rate": 0.00025072675078577876, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.00027468382320539373, + "loss": 0.0236, "step": 65110 }, { - "epoch": 0.33, - "learning_rate": 0.00025071918309276474, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.00027467993498902224, + "loss": 0.0311, "step": 65120 }, { - "epoch": 0.33, - "learning_rate": 0.0002507116153997507, - "loss": 0.0147, + "epoch": 0.17, + "learning_rate": 0.0002746760467726508, + "loss": 0.0234, "step": 65130 }, { - "epoch": 0.33, - "learning_rate": 0.00025070404770673676, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.00027467215855627933, + "loss": 0.0255, "step": 65140 }, { - "epoch": 0.33, - "learning_rate": 0.00025069648001372274, - "loss": 0.0168, + "epoch": 0.17, + "learning_rate": 0.00027466827033990784, + "loss": 0.0277, "step": 65150 }, { - "epoch": 0.33, - "learning_rate": 0.0002506889123207087, - "loss": 0.0155, + "epoch": 0.17, + "learning_rate": 0.00027466438212353636, + "loss": 0.0282, "step": 65160 }, { - "epoch": 0.33, - "learning_rate": 0.0002506813446276947, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002746604939071649, + "loss": 0.0267, "step": 65170 }, { - "epoch": 0.33, - "learning_rate": 0.0002506737769346807, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.00027465660569079344, + "loss": 0.027, "step": 65180 }, { - "epoch": 0.33, - "learning_rate": 0.00025066620924166667, - "loss": 0.0169, + "epoch": 0.17, + "learning_rate": 0.000274652717474422, + "loss": 0.0255, "step": 65190 }, { - "epoch": 0.33, - "learning_rate": 0.00025065864154865265, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.0002746488292580505, + "loss": 0.0267, "step": 65200 }, { - "epoch": 0.33, - "learning_rate": 0.0002506510738556387, - "loss": 0.0235, + "epoch": 0.17, + "learning_rate": 0.0002746449410416791, + "loss": 0.0258, "step": 65210 }, { - "epoch": 0.33, - "learning_rate": 0.00025064350616262466, - "loss": 0.016, + "epoch": 0.17, + "learning_rate": 0.0002746410528253076, + "loss": 0.0233, "step": 65220 }, { - "epoch": 0.33, - "learning_rate": 0.00025063593846961065, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.0002746371646089361, + "loss": 0.0289, "step": 65230 }, { - "epoch": 0.33, - "learning_rate": 0.0002506283707765966, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027463327639256464, + "loss": 0.0288, "step": 65240 }, { - "epoch": 0.33, - "learning_rate": 0.0002506208030835826, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.0002746293881761932, + "loss": 0.0235, "step": 65250 }, { - "epoch": 0.33, - "learning_rate": 0.0002506132353905686, - "loss": 0.0207, + "epoch": 0.17, + "learning_rate": 0.0002746254999598218, + "loss": 0.0218, "step": 65260 }, { - "epoch": 0.33, - "learning_rate": 0.0002506056676975546, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.0002746216117434503, + "loss": 0.0259, "step": 65270 }, { - "epoch": 0.33, - "learning_rate": 0.0002505981000045406, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.0002746177235270788, + "loss": 0.0287, "step": 65280 }, { - "epoch": 0.33, - "learning_rate": 0.0002505905323115266, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.0002746138353107073, + "loss": 0.0262, "step": 65290 }, { - "epoch": 0.33, - "learning_rate": 0.00025058296461851257, - "loss": 0.0265, + "epoch": 0.17, + "learning_rate": 0.0002746099470943359, + "loss": 0.0246, "step": 65300 }, { - "epoch": 0.33, - "learning_rate": 0.00025057539692549855, - "loss": 0.0166, + "epoch": 0.17, + "learning_rate": 0.0002746060588779644, + "loss": 0.0204, "step": 65310 }, { - "epoch": 0.33, - "learning_rate": 0.00025056782923248453, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.00027460217066159297, + "loss": 0.0184, "step": 65320 }, { - "epoch": 0.33, - "learning_rate": 0.00025056026153947057, - "loss": 0.016, + "epoch": 0.17, + "learning_rate": 0.0002745982824452215, + "loss": 0.0363, "step": 65330 }, { - "epoch": 0.33, - "learning_rate": 0.00025055269384645655, - "loss": 0.0151, + "epoch": 0.17, + "learning_rate": 0.00027459439422885005, + "loss": 0.0258, "step": 65340 }, { - "epoch": 0.33, - "learning_rate": 0.00025054512615344253, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.00027459050601247857, + "loss": 0.0224, "step": 65350 }, { - "epoch": 0.33, - "learning_rate": 0.0002505375584604285, - "loss": 0.0159, + "epoch": 0.17, + "learning_rate": 0.0002745866177961071, + "loss": 0.0294, "step": 65360 }, { - "epoch": 0.33, - "learning_rate": 0.0002505299907674145, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.0002745827295797356, + "loss": 0.0231, "step": 65370 }, { - "epoch": 0.33, - "learning_rate": 0.0002505224230744005, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.00027457884136336416, + "loss": 0.0283, "step": 65380 }, { - "epoch": 0.33, - "learning_rate": 0.00025051485538138646, - "loss": 0.0228, + "epoch": 0.17, + "learning_rate": 0.0002745749531469927, + "loss": 0.0257, "step": 65390 }, { - "epoch": 0.33, - "learning_rate": 0.0002505072876883725, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.00027457106493062125, + "loss": 0.0227, "step": 65400 }, { - "epoch": 0.33, - "learning_rate": 0.0002504997199953585, - "loss": 0.0173, + "epoch": 0.17, + "learning_rate": 0.00027456717671424976, + "loss": 0.0276, "step": 65410 }, { - "epoch": 0.33, - "learning_rate": 0.00025049215230234446, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.00027456328849787833, + "loss": 0.0265, "step": 65420 }, { - "epoch": 0.33, - "learning_rate": 0.00025048458460933044, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.00027455940028150685, + "loss": 0.0295, "step": 65430 }, { - "epoch": 0.33, - "learning_rate": 0.0002504770169163164, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027455551206513536, + "loss": 0.0237, "step": 65440 }, { - "epoch": 0.33, - "learning_rate": 0.0002504694492233024, - "loss": 0.0222, + "epoch": 0.17, + "learning_rate": 0.00027455162384876393, + "loss": 0.0249, "step": 65450 }, { - "epoch": 0.33, - "learning_rate": 0.00025046188153028844, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.00027454773563239244, + "loss": 0.0223, "step": 65460 }, { - "epoch": 0.33, - "learning_rate": 0.0002504543138372744, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.000274543847416021, + "loss": 0.0236, "step": 65470 }, { - "epoch": 0.33, - "learning_rate": 0.0002504467461442604, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.0002745399591996495, + "loss": 0.0227, "step": 65480 }, { - "epoch": 0.33, - "learning_rate": 0.0002504391784512464, - "loss": 0.0168, + "epoch": 0.17, + "learning_rate": 0.00027453607098327804, + "loss": 0.0263, "step": 65490 }, { - "epoch": 0.33, - "learning_rate": 0.00025043161075823236, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002745321827669066, + "loss": 0.0275, "step": 65500 }, { - "epoch": 0.33, - "learning_rate": 0.00025042404306521834, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.0002745282945505351, + "loss": 0.0243, "step": 65510 }, { - "epoch": 0.33, - "learning_rate": 0.0002504164753722043, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.00027452440633416364, + "loss": 0.0242, "step": 65520 }, { - "epoch": 0.33, - "learning_rate": 0.00025040890767919036, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002745205181177922, + "loss": 0.0266, "step": 65530 }, { - "epoch": 0.33, - "learning_rate": 0.00025040133998617634, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002745166299014207, + "loss": 0.0181, "step": 65540 }, { - "epoch": 0.33, - "learning_rate": 0.0002503937722931623, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.0002745127416850493, + "loss": 0.023, "step": 65550 }, { - "epoch": 0.33, - "learning_rate": 0.0002503862046001483, - "loss": 0.0307, + "epoch": 0.17, + "learning_rate": 0.0002745088534686778, + "loss": 0.0269, "step": 65560 }, { - "epoch": 0.33, - "learning_rate": 0.0002503786369071343, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.0002745049652523063, + "loss": 0.0315, "step": 65570 }, { - "epoch": 0.33, - "learning_rate": 0.00025037106921412027, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.00027450107703593483, + "loss": 0.0225, "step": 65580 }, { - "epoch": 0.33, - "learning_rate": 0.0002503635015211063, - "loss": 0.0171, + "epoch": 0.17, + "learning_rate": 0.0002744971888195634, + "loss": 0.0246, "step": 65590 }, { - "epoch": 0.33, - "learning_rate": 0.0002503559338280923, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.00027449330060319197, + "loss": 0.0248, "step": 65600 }, { - "epoch": 0.33, - "learning_rate": 0.00025034836613507827, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.0002744894123868205, + "loss": 0.0247, "step": 65610 }, { - "epoch": 0.33, - "learning_rate": 0.00025034079844206425, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.000274485524170449, + "loss": 0.0263, "step": 65620 }, { - "epoch": 0.33, - "learning_rate": 0.00025033323074905023, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.00027448163595407757, + "loss": 0.0229, "step": 65630 }, { - "epoch": 0.33, - "learning_rate": 0.0002503256630560362, - "loss": 0.0196, + "epoch": 0.17, + "learning_rate": 0.0002744777477377061, + "loss": 0.0253, "step": 65640 }, { - "epoch": 0.33, - "learning_rate": 0.00025031809536302225, - "loss": 0.0177, + "epoch": 0.17, + "learning_rate": 0.0002744738595213346, + "loss": 0.0288, "step": 65650 }, { - "epoch": 0.33, - "learning_rate": 0.0002503105276700082, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.00027446997130496317, + "loss": 0.0243, "step": 65660 }, { - "epoch": 0.33, - "learning_rate": 0.0002503029599769942, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.0002744660830885917, + "loss": 0.0315, "step": 65670 }, { - "epoch": 0.33, - "learning_rate": 0.0002502953922839802, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.00027446219487222025, + "loss": 0.0247, "step": 65680 }, { - "epoch": 0.33, - "learning_rate": 0.00025028782459096617, - "loss": 0.0224, + "epoch": 0.17, + "learning_rate": 0.00027445830665584877, + "loss": 0.0216, "step": 65690 }, { - "epoch": 0.33, - "learning_rate": 0.00025028025689795215, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.0002744544184394773, + "loss": 0.0254, "step": 65700 }, { - "epoch": 0.33, - "learning_rate": 0.00025027268920493813, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027445053022310585, + "loss": 0.0276, "step": 65710 }, { - "epoch": 0.33, - "learning_rate": 0.00025026512151192417, - "loss": 0.0159, + "epoch": 0.17, + "learning_rate": 0.00027444664200673436, + "loss": 0.0233, "step": 65720 }, { - "epoch": 0.33, - "learning_rate": 0.00025025755381891015, - "loss": 0.0251, + "epoch": 0.17, + "learning_rate": 0.0002744427537903629, + "loss": 0.0396, "step": 65730 }, { - "epoch": 0.33, - "learning_rate": 0.00025024998612589613, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027443886557399145, + "loss": 0.0263, "step": 65740 }, { - "epoch": 0.33, - "learning_rate": 0.0002502424184328821, - "loss": 0.0168, + "epoch": 0.17, + "learning_rate": 0.00027443497735761996, + "loss": 0.0271, "step": 65750 }, { - "epoch": 0.33, - "learning_rate": 0.0002502348507398681, - "loss": 0.019, - "step": 65760 + "epoch": 0.17, + "learning_rate": 0.00027443108914124853, + "loss": 0.0301, + "step": 65760 }, { - "epoch": 0.33, - "learning_rate": 0.0002502272830468541, - "loss": 0.0175, + "epoch": 0.17, + "learning_rate": 0.00027442720092487704, + "loss": 0.0237, "step": 65770 }, { - "epoch": 0.33, - "learning_rate": 0.0002502197153538401, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.00027442331270850556, + "loss": 0.0264, "step": 65780 }, { - "epoch": 0.33, - "learning_rate": 0.0002502121476608261, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002744194244921341, + "loss": 0.0264, "step": 65790 }, { - "epoch": 0.33, - "learning_rate": 0.0002502045799678121, - "loss": 0.023, + "epoch": 0.17, + "learning_rate": 0.00027441553627576264, + "loss": 0.0298, "step": 65800 }, { - "epoch": 0.33, - "learning_rate": 0.00025019701227479806, - "loss": 0.0184, + "epoch": 0.17, + "learning_rate": 0.0002744116480593912, + "loss": 0.0225, "step": 65810 }, { - "epoch": 0.33, - "learning_rate": 0.00025018944458178404, - "loss": 0.0244, + "epoch": 0.17, + "learning_rate": 0.0002744077598430197, + "loss": 0.026, "step": 65820 }, { - "epoch": 0.33, - "learning_rate": 0.00025018187688877, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.00027440387162664824, + "loss": 0.0318, "step": 65830 }, { - "epoch": 0.33, - "learning_rate": 0.00025017430919575606, - "loss": 0.0162, + "epoch": 0.17, + "learning_rate": 0.0002743999834102768, + "loss": 0.0239, "step": 65840 }, { - "epoch": 0.33, - "learning_rate": 0.00025016674150274204, - "loss": 0.0206, + "epoch": 0.17, + "learning_rate": 0.0002743960951939053, + "loss": 0.0249, "step": 65850 }, { - "epoch": 0.33, - "learning_rate": 0.000250159173809728, - "loss": 0.015, + "epoch": 0.17, + "learning_rate": 0.00027439220697753384, + "loss": 0.0241, "step": 65860 }, { - "epoch": 0.33, - "learning_rate": 0.000250151606116714, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002743883187611624, + "loss": 0.0218, "step": 65870 }, { - "epoch": 0.33, - "learning_rate": 0.0002501440384237, - "loss": 0.0303, + "epoch": 0.17, + "learning_rate": 0.0002743844305447909, + "loss": 0.0328, "step": 65880 }, { - "epoch": 0.33, - "learning_rate": 0.00025013647073068596, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.0002743805423284195, + "loss": 0.0286, "step": 65890 }, { - "epoch": 0.33, - "learning_rate": 0.00025012890303767194, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.000274376654112048, + "loss": 0.0223, "step": 65900 }, { - "epoch": 0.33, - "learning_rate": 0.000250121335344658, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.0002743727658956765, + "loss": 0.0273, "step": 65910 }, { - "epoch": 0.33, - "learning_rate": 0.00025011376765164396, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.0002743688776793051, + "loss": 0.0296, "step": 65920 }, { - "epoch": 0.33, - "learning_rate": 0.00025010619995862994, - "loss": 0.0211, + "epoch": 0.17, + "learning_rate": 0.0002743649894629336, + "loss": 0.0274, "step": 65930 }, { - "epoch": 0.33, - "learning_rate": 0.0002500986322656159, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.0002743611012465621, + "loss": 0.0317, "step": 65940 }, { - "epoch": 0.33, - "learning_rate": 0.0002500910645726019, - "loss": 0.0166, + "epoch": 0.17, + "learning_rate": 0.0002743572130301907, + "loss": 0.0261, "step": 65950 }, { - "epoch": 0.33, - "learning_rate": 0.0002500834968795879, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.00027435332481381925, + "loss": 0.025, "step": 65960 }, { - "epoch": 0.33, - "learning_rate": 0.0002500759291865739, - "loss": 0.0177, + "epoch": 0.17, + "learning_rate": 0.00027434943659744777, + "loss": 0.025, "step": 65970 }, { - "epoch": 0.33, - "learning_rate": 0.0002500683614935599, - "loss": 0.0149, + "epoch": 0.17, + "learning_rate": 0.0002743455483810763, + "loss": 0.0216, "step": 65980 }, { - "epoch": 0.33, - "learning_rate": 0.00025006079380054583, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002743416601647048, + "loss": 0.0246, "step": 65990 }, { - "epoch": 0.33, - "learning_rate": 0.0002500532261075318, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.00027433777194833337, + "loss": 0.0272, "step": 66000 }, { - "epoch": 0.33, - "eval_cer": 0.9144324104542716, - "eval_loss": 0.01361939124763012, - "eval_runtime": 116.6985, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.285, + "epoch": 0.17, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.018492352217435837, + "eval_runtime": 108.0625, + "eval_samples_per_second": 18.508, + "eval_steps_per_second": 4.627, "step": 66000 }, { - "epoch": 0.33, - "learning_rate": 0.00025004565841451785, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.0002743338837319619, + "loss": 0.0291, "step": 66010 }, { - "epoch": 0.33, - "learning_rate": 0.00025003809072150383, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.00027432999551559045, + "loss": 0.0265, "step": 66020 }, { - "epoch": 0.33, - "learning_rate": 0.0002500305230284898, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.00027432610729921896, + "loss": 0.0258, "step": 66030 }, { - "epoch": 0.33, - "learning_rate": 0.0002500229553354758, - "loss": 0.0169, + "epoch": 0.17, + "learning_rate": 0.0002743222190828475, + "loss": 0.0287, "step": 66040 }, { - "epoch": 0.33, - "learning_rate": 0.0002500153876424618, - "loss": 0.0237, + "epoch": 0.17, + "learning_rate": 0.00027431833086647605, + "loss": 0.0267, "step": 66050 }, { - "epoch": 0.33, - "learning_rate": 0.00025000781994944776, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.00027431444265010456, + "loss": 0.0273, "step": 66060 }, { - "epoch": 0.33, - "learning_rate": 0.00025000025225643374, - "loss": 0.0148, + "epoch": 0.17, + "learning_rate": 0.0002743105544337331, + "loss": 0.0247, "step": 66070 }, { - "epoch": 0.33, - "learning_rate": 0.00024999268456341977, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027430666621736165, + "loss": 0.025, "step": 66080 }, { - "epoch": 0.33, - "learning_rate": 0.00024998511687040575, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.00027430277800099016, + "loss": 0.032, "step": 66090 }, { - "epoch": 0.33, - "learning_rate": 0.00024997754917739174, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.00027429888978461873, + "loss": 0.0281, "step": 66100 }, { - "epoch": 0.33, - "learning_rate": 0.0002499699814843777, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.00027429500156824724, + "loss": 0.0244, "step": 66110 }, { - "epoch": 0.33, - "learning_rate": 0.0002499624137913637, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.00027429111335187576, + "loss": 0.0295, "step": 66120 }, { - "epoch": 0.33, - "learning_rate": 0.0002499548460983497, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.0002742872251355043, + "loss": 0.0241, "step": 66130 }, { - "epoch": 0.33, - "learning_rate": 0.0002499472784053357, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.00027428333691913284, + "loss": 0.0253, "step": 66140 }, { - "epoch": 0.33, - "learning_rate": 0.0002499397107123217, - "loss": 0.0175, + "epoch": 0.17, + "learning_rate": 0.0002742794487027614, + "loss": 0.0279, "step": 66150 }, { - "epoch": 0.33, - "learning_rate": 0.0002499321430193077, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.0002742755604863899, + "loss": 0.025, "step": 66160 }, { - "epoch": 0.33, - "learning_rate": 0.00024992457532629366, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.0002742716722700185, + "loss": 0.0307, "step": 66170 }, { - "epoch": 0.33, - "learning_rate": 0.00024991700763327964, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.000274267784053647, + "loss": 0.0261, "step": 66180 }, { - "epoch": 0.33, - "learning_rate": 0.0002499094399402656, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002742638958372755, + "loss": 0.0228, "step": 66190 }, { - "epoch": 0.33, - "learning_rate": 0.00024990187224725166, - "loss": 0.0175, + "epoch": 0.17, + "learning_rate": 0.00027426000762090404, + "loss": 0.0253, "step": 66200 }, { - "epoch": 0.33, - "learning_rate": 0.00024989430455423764, - "loss": 0.0204, + "epoch": 0.17, + "learning_rate": 0.0002742561194045326, + "loss": 0.0254, "step": 66210 }, { - "epoch": 0.33, - "learning_rate": 0.0002498867368612236, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.0002742522311881611, + "loss": 0.0245, "step": 66220 }, { - "epoch": 0.33, - "learning_rate": 0.0002498791691682096, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002742483429717897, + "loss": 0.0238, "step": 66230 }, { - "epoch": 0.33, - "learning_rate": 0.0002498716014751956, - "loss": 0.0247, + "epoch": 0.17, + "learning_rate": 0.0002742444547554182, + "loss": 0.0209, "step": 66240 }, { - "epoch": 0.33, - "learning_rate": 0.00024986403378218157, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.0002742405665390467, + "loss": 0.027, "step": 66250 }, { - "epoch": 0.33, - "learning_rate": 0.00024985646608916755, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.0002742366783226753, + "loss": 0.0257, "step": 66260 }, { - "epoch": 0.33, - "learning_rate": 0.0002498488983961536, - "loss": 0.0232, + "epoch": 0.17, + "learning_rate": 0.0002742327901063038, + "loss": 0.0275, "step": 66270 }, { - "epoch": 0.33, - "learning_rate": 0.00024984133070313956, - "loss": 0.0173, + "epoch": 0.17, + "learning_rate": 0.0002742289018899323, + "loss": 0.0254, "step": 66280 }, { - "epoch": 0.33, - "learning_rate": 0.00024983376301012555, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.0002742250136735609, + "loss": 0.0282, "step": 66290 }, { - "epoch": 0.33, - "learning_rate": 0.00024982619531711153, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.00027422112545718945, + "loss": 0.0222, "step": 66300 }, { - "epoch": 0.33, - "learning_rate": 0.0002498186276240975, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.00027421723724081797, + "loss": 0.026, "step": 66310 }, { - "epoch": 0.33, - "learning_rate": 0.0002498110599310835, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.0002742133490244465, + "loss": 0.029, "step": 66320 }, { - "epoch": 0.33, - "learning_rate": 0.0002498034922380695, - "loss": 0.0159, + "epoch": 0.17, + "learning_rate": 0.000274209460808075, + "loss": 0.0267, "step": 66330 }, { - "epoch": 0.33, - "learning_rate": 0.0002497959245450555, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027420557259170357, + "loss": 0.0304, "step": 66340 }, { - "epoch": 0.33, - "learning_rate": 0.0002497883568520415, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.0002742016843753321, + "loss": 0.0245, "step": 66350 }, { - "epoch": 0.33, - "learning_rate": 0.00024978078915902747, - "loss": 0.0234, + "epoch": 0.17, + "learning_rate": 0.00027419779615896065, + "loss": 0.0246, "step": 66360 }, { - "epoch": 0.33, - "learning_rate": 0.00024977322146601345, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.00027419390794258916, + "loss": 0.0285, "step": 66370 }, { - "epoch": 0.33, - "learning_rate": 0.00024976565377299943, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.00027419001972621773, + "loss": 0.0258, "step": 66380 }, { - "epoch": 0.33, - "learning_rate": 0.00024975808607998547, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.00027418613150984625, + "loss": 0.0251, "step": 66390 }, { - "epoch": 0.33, - "learning_rate": 0.00024975051838697145, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.00027418224329347476, + "loss": 0.0299, "step": 66400 }, { - "epoch": 0.34, - "learning_rate": 0.00024974295069395743, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.0002741783550771033, + "loss": 0.0239, "step": 66410 }, { - "epoch": 0.34, - "learning_rate": 0.0002497353830009434, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.00027417446686073184, + "loss": 0.0284, "step": 66420 }, { - "epoch": 0.34, - "learning_rate": 0.0002497278153079294, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.00027417057864436036, + "loss": 0.0256, "step": 66430 }, { - "epoch": 0.34, - "learning_rate": 0.0002497202476149154, - "loss": 0.0188, + "epoch": 0.17, + "learning_rate": 0.00027416669042798893, + "loss": 0.0265, "step": 66440 }, { - "epoch": 0.34, - "learning_rate": 0.00024971267992190136, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.00027416280221161744, + "loss": 0.031, "step": 66450 }, { - "epoch": 0.34, - "learning_rate": 0.0002497051122288874, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.000274158913995246, + "loss": 0.0381, "step": 66460 }, { - "epoch": 0.34, - "learning_rate": 0.0002496975445358734, - "loss": 0.0144, + "epoch": 0.17, + "learning_rate": 0.0002741550257788745, + "loss": 0.0308, "step": 66470 }, { - "epoch": 0.34, - "learning_rate": 0.00024968997684285936, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.00027415113756250304, + "loss": 0.0336, "step": 66480 }, { - "epoch": 0.34, - "learning_rate": 0.00024968240914984534, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.00027414724934613155, + "loss": 0.0305, "step": 66490 }, { - "epoch": 0.34, - "learning_rate": 0.0002496748414568313, - "loss": 0.0167, + "epoch": 0.17, + "learning_rate": 0.0002741433611297601, + "loss": 0.0261, "step": 66500 }, { - "epoch": 0.34, - "learning_rate": 0.0002496672737638173, - "loss": 0.0173, + "epoch": 0.17, + "learning_rate": 0.0002741394729133887, + "loss": 0.0229, "step": 66510 }, { - "epoch": 0.34, - "learning_rate": 0.00024965970607080334, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.0002741355846970172, + "loss": 0.033, "step": 66520 }, { - "epoch": 0.34, - "learning_rate": 0.0002496521383777893, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.0002741316964806457, + "loss": 0.0273, "step": 66530 }, { - "epoch": 0.34, - "learning_rate": 0.0002496445706847753, - "loss": 0.0283, + "epoch": 0.17, + "learning_rate": 0.00027412780826427424, + "loss": 0.0289, "step": 66540 }, { - "epoch": 0.34, - "learning_rate": 0.0002496370029917613, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002741239200479028, + "loss": 0.0232, "step": 66550 }, { - "epoch": 0.34, - "learning_rate": 0.00024962943529874726, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.0002741200318315313, + "loss": 0.0274, "step": 66560 }, { - "epoch": 0.34, - "learning_rate": 0.00024962186760573324, - "loss": 0.0156, + "epoch": 0.17, + "learning_rate": 0.0002741161436151599, + "loss": 0.0227, "step": 66570 }, { - "epoch": 0.34, - "learning_rate": 0.0002496142999127192, - "loss": 0.0211, + "epoch": 0.17, + "learning_rate": 0.0002741122553987884, + "loss": 0.0303, "step": 66580 }, { - "epoch": 0.34, - "learning_rate": 0.00024960673221970526, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027410836718241697, + "loss": 0.0241, "step": 66590 }, { - "epoch": 0.34, - "learning_rate": 0.00024959916452669124, - "loss": 0.0197, + "epoch": 0.17, + "learning_rate": 0.0002741044789660455, + "loss": 0.0288, "step": 66600 }, { - "epoch": 0.34, - "learning_rate": 0.0002495915968336772, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.000274100590749674, + "loss": 0.0293, "step": 66610 }, { - "epoch": 0.34, - "learning_rate": 0.0002495840291406632, - "loss": 0.0154, + "epoch": 0.17, + "learning_rate": 0.0002740967025333025, + "loss": 0.0273, "step": 66620 }, { - "epoch": 0.34, - "learning_rate": 0.0002495764614476492, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.0002740928143169311, + "loss": 0.022, "step": 66630 }, { - "epoch": 0.34, - "learning_rate": 0.00024956889375463517, - "loss": 0.0215, + "epoch": 0.17, + "learning_rate": 0.00027408892610055965, + "loss": 0.03, "step": 66640 }, { - "epoch": 0.34, - "learning_rate": 0.0002495613260616212, - "loss": 0.0231, + "epoch": 0.17, + "learning_rate": 0.00027408503788418817, + "loss": 0.0228, "step": 66650 }, { - "epoch": 0.34, - "learning_rate": 0.0002495537583686072, - "loss": 0.0234, + "epoch": 0.17, + "learning_rate": 0.0002740811496678167, + "loss": 0.0278, "step": 66660 }, { - "epoch": 0.34, - "learning_rate": 0.00024954619067559317, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.00027407726145144525, + "loss": 0.0326, "step": 66670 }, { - "epoch": 0.34, - "learning_rate": 0.00024953862298257915, - "loss": 0.0206, + "epoch": 0.17, + "learning_rate": 0.00027407337323507376, + "loss": 0.0262, "step": 66680 }, { - "epoch": 0.34, - "learning_rate": 0.00024953105528956513, - "loss": 0.0227, + "epoch": 0.17, + "learning_rate": 0.0002740694850187023, + "loss": 0.0205, "step": 66690 }, { - "epoch": 0.34, - "learning_rate": 0.0002495234875965511, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027406559680233085, + "loss": 0.0227, "step": 66700 }, { - "epoch": 0.34, - "learning_rate": 0.00024951591990353715, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027406170858595936, + "loss": 0.0257, "step": 66710 }, { - "epoch": 0.34, - "learning_rate": 0.00024950835221052313, - "loss": 0.018, + "epoch": 0.17, + "learning_rate": 0.00027405782036958793, + "loss": 0.0218, "step": 66720 }, { - "epoch": 0.34, - "learning_rate": 0.0002495007845175091, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.00027405393215321645, + "loss": 0.0243, "step": 66730 }, { - "epoch": 0.34, - "learning_rate": 0.0002494932168244951, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.00027405004393684496, + "loss": 0.024, "step": 66740 }, { - "epoch": 0.34, - "learning_rate": 0.00024948564913148107, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.0002740461557204735, + "loss": 0.0274, "step": 66750 }, { - "epoch": 0.34, - "learning_rate": 0.00024947808143846705, - "loss": 0.0216, + "epoch": 0.17, + "learning_rate": 0.00027404226750410204, + "loss": 0.022, "step": 66760 }, { - "epoch": 0.34, - "learning_rate": 0.00024947051374545303, - "loss": 0.0171, + "epoch": 0.17, + "learning_rate": 0.00027403837928773056, + "loss": 0.0271, "step": 66770 }, { - "epoch": 0.34, - "learning_rate": 0.00024946294605243907, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.0002740344910713591, + "loss": 0.0261, "step": 66780 }, { - "epoch": 0.34, - "learning_rate": 0.00024945537835942505, - "loss": 0.0214, + "epoch": 0.17, + "learning_rate": 0.00027403060285498764, + "loss": 0.0293, "step": 66790 }, { - "epoch": 0.34, - "learning_rate": 0.00024944781066641103, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.0002740267146386162, + "loss": 0.0312, "step": 66800 }, { - "epoch": 0.34, - "learning_rate": 0.000249440242973397, - "loss": 0.0166, + "epoch": 0.17, + "learning_rate": 0.0002740228264222447, + "loss": 0.0282, "step": 66810 }, { - "epoch": 0.34, - "learning_rate": 0.000249432675280383, - "loss": 0.0183, + "epoch": 0.17, + "learning_rate": 0.00027401893820587324, + "loss": 0.0271, "step": 66820 }, { - "epoch": 0.34, - "learning_rate": 0.000249425107587369, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.00027401504998950175, + "loss": 0.0308, "step": 66830 }, { - "epoch": 0.34, - "learning_rate": 0.000249417539894355, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.0002740111617731303, + "loss": 0.0227, "step": 66840 }, { - "epoch": 0.34, - "learning_rate": 0.000249409972201341, - "loss": 0.0244, + "epoch": 0.17, + "learning_rate": 0.0002740072735567589, + "loss": 0.0252, "step": 66850 }, { - "epoch": 0.34, - "learning_rate": 0.000249402404508327, - "loss": 0.0206, + "epoch": 0.17, + "learning_rate": 0.0002740033853403874, + "loss": 0.0303, "step": 66860 }, { - "epoch": 0.34, - "learning_rate": 0.00024939483681531296, - "loss": 0.0177, + "epoch": 0.17, + "learning_rate": 0.0002739994971240159, + "loss": 0.027, "step": 66870 }, { - "epoch": 0.34, - "learning_rate": 0.00024938726912229894, - "loss": 0.0174, + "epoch": 0.17, + "learning_rate": 0.0002739956089076445, + "loss": 0.0312, "step": 66880 }, { - "epoch": 0.34, - "learning_rate": 0.0002493797014292849, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.000273991720691273, + "loss": 0.0241, "step": 66890 }, { - "epoch": 0.34, - "learning_rate": 0.00024937213373627096, - "loss": 0.0209, + "epoch": 0.17, + "learning_rate": 0.0002739878324749015, + "loss": 0.0225, "step": 66900 }, { - "epoch": 0.34, - "learning_rate": 0.00024936456604325694, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.0002739839442585301, + "loss": 0.0244, "step": 66910 }, { - "epoch": 0.34, - "learning_rate": 0.0002493569983502429, - "loss": 0.0161, + "epoch": 0.17, + "learning_rate": 0.0002739800560421586, + "loss": 0.0294, "step": 66920 }, { - "epoch": 0.34, - "learning_rate": 0.0002493494306572289, - "loss": 0.0236, + "epoch": 0.17, + "learning_rate": 0.00027397616782578717, + "loss": 0.0251, "step": 66930 }, { - "epoch": 0.34, - "learning_rate": 0.0002493418629642149, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.0002739722796094157, + "loss": 0.0347, "step": 66940 }, { - "epoch": 0.34, - "learning_rate": 0.00024933429527120086, - "loss": 0.0189, + "epoch": 0.17, + "learning_rate": 0.0002739683913930442, + "loss": 0.0246, "step": 66950 }, { - "epoch": 0.34, - "learning_rate": 0.00024932672757818684, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.00027396450317667277, + "loss": 0.0295, "step": 66960 }, { - "epoch": 0.34, - "learning_rate": 0.0002493191598851729, - "loss": 0.0196, + "epoch": 0.17, + "learning_rate": 0.0002739606149603013, + "loss": 0.0274, "step": 66970 }, { - "epoch": 0.34, - "learning_rate": 0.00024931159219215886, - "loss": 0.0187, + "epoch": 0.17, + "learning_rate": 0.0002739567267439298, + "loss": 0.0297, "step": 66980 }, { - "epoch": 0.34, - "learning_rate": 0.00024930402449914484, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.00027395283852755837, + "loss": 0.0259, "step": 66990 }, { - "epoch": 0.34, - "learning_rate": 0.0002492964568061308, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.0002739489503111869, + "loss": 0.0232, "step": 67000 }, { - "epoch": 0.34, - "eval_cer": 0.9144518183767796, - "eval_loss": 0.013345795683562756, - "eval_runtime": 116.5962, - "eval_samples_per_second": 17.153, - "eval_steps_per_second": 4.288, + "epoch": 0.17, + "eval_cer": 0.8818006609085604, + "eval_loss": 0.018520452082157135, + "eval_runtime": 107.7331, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 67000 }, { - "epoch": 0.34, - "learning_rate": 0.0002492888891131168, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.00027394506209481545, + "loss": 0.0253, "step": 67010 }, { - "epoch": 0.34, - "learning_rate": 0.0002492813214201028, - "loss": 0.0234, + "epoch": 0.17, + "learning_rate": 0.00027394117387844396, + "loss": 0.0284, "step": 67020 }, { - "epoch": 0.34, - "learning_rate": 0.0002492737537270888, - "loss": 0.0155, + "epoch": 0.17, + "learning_rate": 0.0002739372856620725, + "loss": 0.0239, "step": 67030 }, { - "epoch": 0.34, - "learning_rate": 0.0002492661860340748, - "loss": 0.0181, + "epoch": 0.17, + "learning_rate": 0.00027393339744570105, + "loss": 0.0325, "step": 67040 }, { - "epoch": 0.34, - "learning_rate": 0.0002492586183410608, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.00027392950922932956, + "loss": 0.0328, "step": 67050 }, { - "epoch": 0.34, - "learning_rate": 0.00024925105064804677, - "loss": 0.0213, + "epoch": 0.17, + "learning_rate": 0.00027392562101295813, + "loss": 0.0247, "step": 67060 }, { - "epoch": 0.34, - "learning_rate": 0.00024924348295503275, - "loss": 0.019, + "epoch": 0.17, + "learning_rate": 0.00027392173279658664, + "loss": 0.0337, "step": 67070 }, { - "epoch": 0.34, - "learning_rate": 0.00024923591526201873, - "loss": 0.0205, + "epoch": 0.17, + "learning_rate": 0.00027391784458021516, + "loss": 0.027, "step": 67080 }, { - "epoch": 0.34, - "learning_rate": 0.0002492283475690047, - "loss": 0.024, + "epoch": 0.17, + "learning_rate": 0.00027391395636384373, + "loss": 0.0277, "step": 67090 }, { - "epoch": 0.34, - "learning_rate": 0.00024922077987599075, - "loss": 0.0229, + "epoch": 0.17, + "learning_rate": 0.00027391006814747224, + "loss": 0.0272, "step": 67100 }, { - "epoch": 0.34, - "learning_rate": 0.00024921321218297673, - "loss": 0.0218, + "epoch": 0.17, + "learning_rate": 0.00027390617993110076, + "loss": 0.0258, "step": 67110 }, { - "epoch": 0.34, - "learning_rate": 0.0002492056444899627, - "loss": 0.0178, + "epoch": 0.17, + "learning_rate": 0.0002739022917147293, + "loss": 0.0243, "step": 67120 }, { - "epoch": 0.34, - "learning_rate": 0.0002491980767969487, - "loss": 0.021, + "epoch": 0.17, + "learning_rate": 0.00027389840349835784, + "loss": 0.0256, "step": 67130 }, { - "epoch": 0.34, - "learning_rate": 0.0002491905091039347, - "loss": 0.0172, + "epoch": 0.17, + "learning_rate": 0.0002738945152819864, + "loss": 0.0268, "step": 67140 }, { - "epoch": 0.34, - "learning_rate": 0.00024918294141092065, - "loss": 0.0164, + "epoch": 0.17, + "learning_rate": 0.0002738906270656149, + "loss": 0.025, "step": 67150 }, { - "epoch": 0.34, - "learning_rate": 0.0002491753737179067, - "loss": 0.0202, + "epoch": 0.17, + "learning_rate": 0.00027388673884924344, + "loss": 0.0288, "step": 67160 }, { - "epoch": 0.34, - "learning_rate": 0.00024916780602489267, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.000273882850632872, + "loss": 0.0276, "step": 67170 }, { - "epoch": 0.34, - "learning_rate": 0.00024916023833187865, - "loss": 0.0182, + "epoch": 0.17, + "learning_rate": 0.0002738789624165005, + "loss": 0.0277, "step": 67180 }, { - "epoch": 0.34, - "learning_rate": 0.00024915267063886463, - "loss": 0.0179, + "epoch": 0.17, + "learning_rate": 0.0002738750742001291, + "loss": 0.0253, "step": 67190 }, { - "epoch": 0.34, - "learning_rate": 0.0002491451029458506, - "loss": 0.0194, + "epoch": 0.17, + "learning_rate": 0.0002738711859837576, + "loss": 0.0278, "step": 67200 }, { - "epoch": 0.34, - "learning_rate": 0.0002491375352528366, - "loss": 0.0171, + "epoch": 0.17, + "learning_rate": 0.00027386729776738617, + "loss": 0.0261, "step": 67210 }, { - "epoch": 0.34, - "learning_rate": 0.00024912996755982263, - "loss": 0.0198, + "epoch": 0.17, + "learning_rate": 0.0002738634095510147, + "loss": 0.0272, "step": 67220 }, { - "epoch": 0.34, - "learning_rate": 0.0002491223998668086, - "loss": 0.0203, + "epoch": 0.17, + "learning_rate": 0.0002738595213346432, + "loss": 0.0268, "step": 67230 }, { - "epoch": 0.34, - "learning_rate": 0.0002491148321737946, - "loss": 0.0192, + "epoch": 0.17, + "learning_rate": 0.0002738556331182717, + "loss": 0.03, "step": 67240 }, { - "epoch": 0.34, - "learning_rate": 0.0002491072644807805, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002738517449019003, + "loss": 0.0273, "step": 67250 }, { - "epoch": 0.34, - "learning_rate": 0.00024909969678776656, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.0002738478566855288, + "loss": 0.0264, "step": 67260 }, { - "epoch": 0.34, - "learning_rate": 0.00024909212909475254, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.00027384396846915737, + "loss": 0.0257, "step": 67270 }, { - "epoch": 0.34, - "learning_rate": 0.0002490845614017385, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.0002738400802527859, + "loss": 0.0239, "step": 67280 }, { - "epoch": 0.34, - "learning_rate": 0.0002490769937087245, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.0002738361920364144, + "loss": 0.0264, "step": 67290 }, { - "epoch": 0.34, - "learning_rate": 0.0002490694260157105, - "loss": 0.0186, + "epoch": 0.17, + "learning_rate": 0.00027383230382004297, + "loss": 0.0259, "step": 67300 }, { - "epoch": 0.34, - "learning_rate": 0.00024906185832269647, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.0002738284156036715, + "loss": 0.0277, "step": 67310 }, { - "epoch": 0.34, - "learning_rate": 0.00024905429062968245, - "loss": 0.0191, + "epoch": 0.17, + "learning_rate": 0.0002738245273873, + "loss": 0.0231, "step": 67320 }, { - "epoch": 0.34, - "learning_rate": 0.0002490467229366685, - "loss": 0.0148, + "epoch": 0.17, + "learning_rate": 0.00027382063917092856, + "loss": 0.0211, "step": 67330 }, { - "epoch": 0.34, - "learning_rate": 0.00024903915524365446, - "loss": 0.0195, + "epoch": 0.17, + "learning_rate": 0.00027381675095455713, + "loss": 0.0212, "step": 67340 }, { - "epoch": 0.34, - "learning_rate": 0.00024903158755064045, - "loss": 0.0175, + "epoch": 0.17, + "learning_rate": 0.00027381286273818565, + "loss": 0.0278, "step": 67350 }, { - "epoch": 0.34, - "learning_rate": 0.00024902401985762643, - "loss": 0.017, + "epoch": 0.17, + "learning_rate": 0.00027380897452181416, + "loss": 0.021, "step": 67360 }, { - "epoch": 0.34, - "learning_rate": 0.0002490164521646124, - "loss": 0.022, + "epoch": 0.17, + "learning_rate": 0.0002738050863054427, + "loss": 0.0265, "step": 67370 }, { - "epoch": 0.34, - "learning_rate": 0.0002490088844715984, - "loss": 0.02, + "epoch": 0.17, + "learning_rate": 0.00027380119808907125, + "loss": 0.0272, "step": 67380 }, { - "epoch": 0.34, - "learning_rate": 0.0002490013167785844, - "loss": 0.0252, + "epoch": 0.17, + "learning_rate": 0.00027379730987269976, + "loss": 0.0248, "step": 67390 }, { - "epoch": 0.34, - "learning_rate": 0.0002489937490855704, - "loss": 0.0201, + "epoch": 0.17, + "learning_rate": 0.00027379342165632833, + "loss": 0.0305, "step": 67400 }, { - "epoch": 0.34, - "learning_rate": 0.0002489861813925564, - "loss": 0.0216, + "epoch": 0.17, + "learning_rate": 0.00027378953343995684, + "loss": 0.028, "step": 67410 }, { - "epoch": 0.34, - "learning_rate": 0.00024897861369954237, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.0002737856452235854, + "loss": 0.0269, "step": 67420 }, { - "epoch": 0.34, - "learning_rate": 0.00024897104600652835, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.0002737817570072139, + "loss": 0.0284, "step": 67430 }, { - "epoch": 0.34, - "learning_rate": 0.00024896347831351433, - "loss": 0.0193, + "epoch": 0.17, + "learning_rate": 0.00027377786879084244, + "loss": 0.0239, "step": 67440 }, { - "epoch": 0.34, - "learning_rate": 0.00024895591062050037, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.00027377398057447096, + "loss": 0.0236, "step": 67450 }, { - "epoch": 0.34, - "learning_rate": 0.00024894834292748635, - "loss": 0.0163, + "epoch": 0.17, + "learning_rate": 0.0002737700923580995, + "loss": 0.022, "step": 67460 }, { - "epoch": 0.34, - "learning_rate": 0.00024894077523447233, - "loss": 0.0185, + "epoch": 0.17, + "learning_rate": 0.00027376620414172804, + "loss": 0.0296, "step": 67470 }, { - "epoch": 0.34, - "learning_rate": 0.0002489332075414583, - "loss": 0.0225, + "epoch": 0.17, + "learning_rate": 0.0002737623159253566, + "loss": 0.0234, "step": 67480 }, { - "epoch": 0.34, - "learning_rate": 0.0002489256398484443, - "loss": 0.0176, + "epoch": 0.17, + "learning_rate": 0.0002737584277089851, + "loss": 0.029, "step": 67490 }, { - "epoch": 0.34, - "learning_rate": 0.0002489180721554303, - "loss": 0.0166, + "epoch": 0.17, + "learning_rate": 0.00027375453949261364, + "loss": 0.0277, "step": 67500 }, { - "epoch": 0.34, - "learning_rate": 0.00024891050446241626, - "loss": 0.0199, + "epoch": 0.17, + "learning_rate": 0.0002737506512762422, + "loss": 0.0246, "step": 67510 }, { - "epoch": 0.34, - "learning_rate": 0.0002489029367694023, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.0002737467630598707, + "loss": 0.0275, "step": 67520 }, { - "epoch": 0.34, - "learning_rate": 0.0002488953690763883, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.00027374287484349923, + "loss": 0.0246, "step": 67530 }, { - "epoch": 0.34, - "learning_rate": 0.00024888780138337426, - "loss": 0.0173, + "epoch": 0.18, + "learning_rate": 0.0002737389866271278, + "loss": 0.03, "step": 67540 }, { - "epoch": 0.34, - "learning_rate": 0.00024888023369036024, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.00027373509841075637, + "loss": 0.0228, "step": 67550 }, { - "epoch": 0.34, - "learning_rate": 0.0002488726659973462, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.0002737312101943849, + "loss": 0.0251, "step": 67560 }, { - "epoch": 0.34, - "learning_rate": 0.0002488650983043322, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.0002737273219780134, + "loss": 0.0265, "step": 67570 }, { - "epoch": 0.34, - "learning_rate": 0.00024885753061131824, - "loss": 0.015, + "epoch": 0.18, + "learning_rate": 0.0002737234337616419, + "loss": 0.026, "step": 67580 }, { - "epoch": 0.34, - "learning_rate": 0.0002488499629183042, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.0002737195455452705, + "loss": 0.0213, "step": 67590 }, { - "epoch": 0.34, - "learning_rate": 0.0002488423952252902, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.000273715657328899, + "loss": 0.0212, "step": 67600 }, { - "epoch": 0.34, - "learning_rate": 0.0002488348275322762, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.00027371176911252757, + "loss": 0.0247, "step": 67610 }, { - "epoch": 0.34, - "learning_rate": 0.00024882725983926216, - "loss": 0.0203, + "epoch": 0.18, + "learning_rate": 0.0002737078808961561, + "loss": 0.0256, "step": 67620 }, { - "epoch": 0.34, - "learning_rate": 0.00024881969214624814, - "loss": 0.0142, + "epoch": 0.18, + "learning_rate": 0.00027370399267978465, + "loss": 0.0247, "step": 67630 }, { - "epoch": 0.34, - "learning_rate": 0.0002488121244532342, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.00027370010446341317, + "loss": 0.0259, "step": 67640 }, { - "epoch": 0.34, - "learning_rate": 0.00024880455676022016, - "loss": 0.0195, + "epoch": 0.18, + "learning_rate": 0.0002736962162470417, + "loss": 0.0303, "step": 67650 }, { - "epoch": 0.34, - "learning_rate": 0.00024879698906720614, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.0002736923280306702, + "loss": 0.0227, "step": 67660 }, { - "epoch": 0.34, - "learning_rate": 0.0002487894213741921, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027368843981429876, + "loss": 0.0273, "step": 67670 }, { - "epoch": 0.34, - "learning_rate": 0.0002487818536811781, - "loss": 0.0162, + "epoch": 0.18, + "learning_rate": 0.0002736845515979273, + "loss": 0.0304, "step": 67680 }, { - "epoch": 0.34, - "learning_rate": 0.0002487742859881641, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027368066338155585, + "loss": 0.0272, "step": 67690 }, { - "epoch": 0.34, - "learning_rate": 0.00024876671829515007, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.00027367677516518436, + "loss": 0.0238, "step": 67700 }, { - "epoch": 0.34, - "learning_rate": 0.0002487591506021361, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.00027367288694881293, + "loss": 0.0231, "step": 67710 }, { - "epoch": 0.34, - "learning_rate": 0.0002487515829091221, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.00027366899873244144, + "loss": 0.0278, "step": 67720 }, { - "epoch": 0.34, - "learning_rate": 0.00024874401521610807, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.00027366511051606996, + "loss": 0.029, "step": 67730 }, { - "epoch": 0.34, - "learning_rate": 0.00024873644752309405, - "loss": 0.0148, + "epoch": 0.18, + "learning_rate": 0.00027366122229969853, + "loss": 0.0254, "step": 67740 }, { - "epoch": 0.34, - "learning_rate": 0.00024872887983008003, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.00027365733408332704, + "loss": 0.0247, "step": 67750 }, { - "epoch": 0.34, - "learning_rate": 0.000248721312137066, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002736534458669556, + "loss": 0.0227, "step": 67760 }, { - "epoch": 0.34, - "learning_rate": 0.00024871374444405205, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.0002736495576505841, + "loss": 0.0299, "step": 67770 }, { - "epoch": 0.34, - "learning_rate": 0.00024870617675103803, - "loss": 0.0261, + "epoch": 0.18, + "learning_rate": 0.00027364566943421264, + "loss": 0.0267, "step": 67780 }, { - "epoch": 0.34, - "learning_rate": 0.000248698609058024, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027364178121784115, + "loss": 0.0257, "step": 67790 }, { - "epoch": 0.34, - "learning_rate": 0.00024869104136501, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.0002736378930014697, + "loss": 0.025, "step": 67800 }, { - "epoch": 0.34, - "learning_rate": 0.00024868347367199597, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.00027363400478509824, + "loss": 0.0256, "step": 67810 }, { - "epoch": 0.34, - "learning_rate": 0.00024867590597898195, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.0002736301165687268, + "loss": 0.0219, "step": 67820 }, { - "epoch": 0.34, - "learning_rate": 0.00024866833828596793, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.0002736262283523553, + "loss": 0.0261, "step": 67830 }, { - "epoch": 0.34, - "learning_rate": 0.00024866077059295397, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002736223401359839, + "loss": 0.0294, "step": 67840 }, { - "epoch": 0.34, - "learning_rate": 0.00024865320289993995, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002736184519196124, + "loss": 0.0253, "step": 67850 }, { - "epoch": 0.34, - "learning_rate": 0.00024864563520692593, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.0002736145637032409, + "loss": 0.03, "step": 67860 }, { - "epoch": 0.34, - "learning_rate": 0.0002486380675139119, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027361067548686943, + "loss": 0.0211, "step": 67870 }, { - "epoch": 0.34, - "learning_rate": 0.0002486304998208979, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.000273606787270498, + "loss": 0.0237, "step": 67880 }, { - "epoch": 0.34, - "learning_rate": 0.0002486229321278839, - "loss": 0.0155, + "epoch": 0.18, + "learning_rate": 0.00027360289905412657, + "loss": 0.0248, "step": 67890 }, { - "epoch": 0.34, - "learning_rate": 0.0002486153644348699, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002735990108377551, + "loss": 0.0281, "step": 67900 }, { - "epoch": 0.34, - "learning_rate": 0.0002486077967418559, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.0002735951226213836, + "loss": 0.0272, "step": 67910 }, { - "epoch": 0.34, - "learning_rate": 0.0002486002290488419, - "loss": 0.0227, + "epoch": 0.18, + "learning_rate": 0.00027359123440501217, + "loss": 0.0248, "step": 67920 }, { - "epoch": 0.34, - "learning_rate": 0.00024859266135582786, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.0002735873461886407, + "loss": 0.0271, "step": 67930 }, { - "epoch": 0.34, - "learning_rate": 0.00024858509366281384, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.0002735834579722692, + "loss": 0.0277, "step": 67940 }, { - "epoch": 0.34, - "learning_rate": 0.0002485775259697998, - "loss": 0.0154, + "epoch": 0.18, + "learning_rate": 0.00027357956975589777, + "loss": 0.022, "step": 67950 }, { - "epoch": 0.34, - "learning_rate": 0.00024856995827678586, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.0002735756815395263, + "loss": 0.0331, "step": 67960 }, { - "epoch": 0.34, - "learning_rate": 0.00024856239058377184, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027357179332315485, + "loss": 0.0221, "step": 67970 }, { - "epoch": 0.34, - "learning_rate": 0.0002485548228907578, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.00027356790510678336, + "loss": 0.0254, "step": 67980 }, { - "epoch": 0.34, - "learning_rate": 0.0002485472551977438, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.0002735640168904119, + "loss": 0.029, "step": 67990 }, { - "epoch": 0.34, - "learning_rate": 0.0002485396875047298, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002735601286740404, + "loss": 0.024, "step": 68000 }, { - "epoch": 0.34, - "eval_cer": 0.9144692855070369, - "eval_loss": 0.013180240988731384, - "eval_runtime": 116.7123, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.18, + "eval_cer": 0.8818412503796516, + "eval_loss": 0.018042191863059998, + "eval_runtime": 107.7307, + "eval_samples_per_second": 18.565, + "eval_steps_per_second": 4.641, "step": 68000 }, { - "epoch": 0.34, - "learning_rate": 0.00024853211981171576, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.00027355624045766896, + "loss": 0.0292, "step": 68010 }, { - "epoch": 0.34, - "learning_rate": 0.00024852455211870174, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002735523522412975, + "loss": 0.0249, "step": 68020 }, { - "epoch": 0.34, - "learning_rate": 0.0002485169844256878, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.00027354846402492605, + "loss": 0.0307, "step": 68030 }, { - "epoch": 0.34, - "learning_rate": 0.00024850941673267376, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027354457580855456, + "loss": 0.0248, "step": 68040 }, { - "epoch": 0.34, - "learning_rate": 0.00024850184903965974, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.00027354068759218313, + "loss": 0.0259, "step": 68050 }, { - "epoch": 0.34, - "learning_rate": 0.0002484942813466457, - "loss": 0.015, + "epoch": 0.18, + "learning_rate": 0.00027353679937581164, + "loss": 0.0192, "step": 68060 }, { - "epoch": 0.34, - "learning_rate": 0.0002484867136536317, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027353291115944016, + "loss": 0.0284, "step": 68070 }, { - "epoch": 0.34, - "learning_rate": 0.0002484791459606177, - "loss": 0.0203, + "epoch": 0.18, + "learning_rate": 0.00027352902294306867, + "loss": 0.0231, "step": 68080 }, { - "epoch": 0.34, - "learning_rate": 0.0002484715782676037, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.00027352513472669724, + "loss": 0.0287, "step": 68090 }, { - "epoch": 0.34, - "learning_rate": 0.0002484640105745897, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.0002735212465103258, + "loss": 0.0274, "step": 68100 }, { - "epoch": 0.34, - "learning_rate": 0.0002484564428815757, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.0002735173582939543, + "loss": 0.0262, "step": 68110 }, { - "epoch": 0.34, - "learning_rate": 0.00024844887518856167, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027351347007758284, + "loss": 0.0282, "step": 68120 }, { - "epoch": 0.34, - "learning_rate": 0.00024844130749554765, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.0002735095818612114, + "loss": 0.0245, "step": 68130 }, { - "epoch": 0.34, - "learning_rate": 0.00024843373980253363, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.0002735056936448399, + "loss": 0.0254, "step": 68140 }, { - "epoch": 0.34, - "learning_rate": 0.0002484261721095196, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027350180542846844, + "loss": 0.0272, "step": 68150 }, { - "epoch": 0.34, - "learning_rate": 0.00024841860441650565, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.000273497917212097, + "loss": 0.0253, "step": 68160 }, { - "epoch": 0.34, - "learning_rate": 0.00024841103672349163, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.0002734940289957255, + "loss": 0.0253, "step": 68170 }, { - "epoch": 0.34, - "learning_rate": 0.0002484034690304776, - "loss": 0.0244, + "epoch": 0.18, + "learning_rate": 0.0002734901407793541, + "loss": 0.0338, "step": 68180 }, { - "epoch": 0.34, - "learning_rate": 0.0002483959013374636, - "loss": 0.0239, + "epoch": 0.18, + "learning_rate": 0.0002734862525629826, + "loss": 0.0253, "step": 68190 }, { - "epoch": 0.34, - "learning_rate": 0.0002483883336444496, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.0002734823643466111, + "loss": 0.0255, "step": 68200 }, { - "epoch": 0.34, - "learning_rate": 0.00024838076595143555, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002734784761302397, + "loss": 0.0275, "step": 68210 }, { - "epoch": 0.34, - "learning_rate": 0.0002483731982584216, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.0002734745879138682, + "loss": 0.0244, "step": 68220 }, { - "epoch": 0.34, - "learning_rate": 0.00024836563056540757, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.00027347069969749677, + "loss": 0.0256, "step": 68230 }, { - "epoch": 0.34, - "learning_rate": 0.00024835806287239355, - "loss": 0.0246, + "epoch": 0.18, + "learning_rate": 0.0002734668114811253, + "loss": 0.0275, "step": 68240 }, { - "epoch": 0.34, - "learning_rate": 0.00024835049517937953, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.0002734629232647538, + "loss": 0.0271, "step": 68250 }, { - "epoch": 0.34, - "learning_rate": 0.0002483429274863655, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.00027345903504838237, + "loss": 0.0233, "step": 68260 }, { - "epoch": 0.34, - "learning_rate": 0.0002483353597933515, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.0002734551468320109, + "loss": 0.0226, "step": 68270 }, { - "epoch": 0.34, - "learning_rate": 0.00024832779210033753, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002734512586156394, + "loss": 0.0227, "step": 68280 }, { - "epoch": 0.34, - "learning_rate": 0.0002483202244073235, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.00027344737039926796, + "loss": 0.025, "step": 68290 }, { - "epoch": 0.34, - "learning_rate": 0.0002483126567143095, - "loss": 0.0207, - "step": 68300 + "epoch": 0.18, + "learning_rate": 0.0002734434821828965, + "loss": 0.0235, + "step": 68300 }, { - "epoch": 0.34, - "learning_rate": 0.0002483050890212955, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.00027343959396652505, + "loss": 0.0275, "step": 68310 }, { - "epoch": 0.34, - "learning_rate": 0.00024829752132828146, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027343570575015356, + "loss": 0.0264, "step": 68320 }, { - "epoch": 0.34, - "learning_rate": 0.00024828995363526744, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.0002734318175337821, + "loss": 0.0203, "step": 68330 }, { - "epoch": 0.34, - "learning_rate": 0.0002482823859422534, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.00027342792931741065, + "loss": 0.0284, "step": 68340 }, { - "epoch": 0.34, - "learning_rate": 0.00024827481824923946, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.00027342404110103916, + "loss": 0.0246, "step": 68350 }, { - "epoch": 0.34, - "learning_rate": 0.00024826725055622544, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002734201528846677, + "loss": 0.0221, "step": 68360 }, { - "epoch": 0.34, - "learning_rate": 0.0002482596828632114, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.00027341626466829624, + "loss": 0.0284, "step": 68370 }, { - "epoch": 0.34, - "learning_rate": 0.0002482521151701974, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002734123764519248, + "loss": 0.0295, "step": 68380 }, { - "epoch": 0.35, - "learning_rate": 0.0002482445474771834, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.00027340848823555333, + "loss": 0.0304, "step": 68390 }, { - "epoch": 0.35, - "learning_rate": 0.00024823697978416936, - "loss": 0.0167, + "epoch": 0.18, + "learning_rate": 0.00027340460001918184, + "loss": 0.0323, "step": 68400 }, { - "epoch": 0.35, - "learning_rate": 0.0002482294120911554, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027340071180281036, + "loss": 0.0307, "step": 68410 }, { - "epoch": 0.35, - "learning_rate": 0.0002482218443981414, - "loss": 0.0226, + "epoch": 0.18, + "learning_rate": 0.0002733968235864389, + "loss": 0.0283, "step": 68420 }, { - "epoch": 0.35, - "learning_rate": 0.00024821427670512736, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.00027339293537006744, + "loss": 0.024, "step": 68430 }, { - "epoch": 0.35, - "learning_rate": 0.00024820670901211334, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.000273389047153696, + "loss": 0.0223, "step": 68440 }, { - "epoch": 0.35, - "learning_rate": 0.0002481991413190993, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.0002733851589373245, + "loss": 0.0249, "step": 68450 }, { - "epoch": 0.35, - "learning_rate": 0.0002481915736260853, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.0002733812707209531, + "loss": 0.0258, "step": 68460 }, { - "epoch": 0.35, - "learning_rate": 0.00024818400593307134, - "loss": 0.0159, + "epoch": 0.18, + "learning_rate": 0.0002733773825045816, + "loss": 0.0233, "step": 68470 }, { - "epoch": 0.35, - "learning_rate": 0.0002481764382400573, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.0002733734942882101, + "loss": 0.0307, "step": 68480 }, { - "epoch": 0.35, - "learning_rate": 0.0002481688705470433, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027336960607183864, + "loss": 0.03, "step": 68490 }, { - "epoch": 0.35, - "learning_rate": 0.0002481613028540293, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002733657178554672, + "loss": 0.0241, "step": 68500 }, { - "epoch": 0.35, - "learning_rate": 0.00024815373516101527, - "loss": 0.0162, + "epoch": 0.18, + "learning_rate": 0.0002733618296390957, + "loss": 0.022, "step": 68510 }, { - "epoch": 0.35, - "learning_rate": 0.00024814616746800125, - "loss": 0.0233, + "epoch": 0.18, + "learning_rate": 0.0002733579414227243, + "loss": 0.0266, "step": 68520 }, { - "epoch": 0.35, - "learning_rate": 0.00024813859977498723, - "loss": 0.0157, + "epoch": 0.18, + "learning_rate": 0.0002733540532063528, + "loss": 0.0242, "step": 68530 }, { - "epoch": 0.35, - "learning_rate": 0.0002481310320819732, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002733501649899813, + "loss": 0.0295, "step": 68540 }, { - "epoch": 0.35, - "learning_rate": 0.0002481234643889592, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.0002733462767736099, + "loss": 0.0272, "step": 68550 }, { - "epoch": 0.35, - "learning_rate": 0.0002481158966959452, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.0002733423885572384, + "loss": 0.0257, "step": 68560 }, { - "epoch": 0.35, - "learning_rate": 0.00024810832900293116, - "loss": 0.014, + "epoch": 0.18, + "learning_rate": 0.0002733385003408669, + "loss": 0.0253, "step": 68570 }, { - "epoch": 0.35, - "learning_rate": 0.0002481007613099172, - "loss": 0.0164, + "epoch": 0.18, + "learning_rate": 0.0002733346121244955, + "loss": 0.0235, "step": 68580 }, { - "epoch": 0.35, - "learning_rate": 0.0002480931936169032, - "loss": 0.0158, + "epoch": 0.18, + "learning_rate": 0.00027333072390812405, + "loss": 0.0259, "step": 68590 }, { - "epoch": 0.35, - "learning_rate": 0.00024808562592388916, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.00027332683569175257, + "loss": 0.0221, "step": 68600 }, { - "epoch": 0.35, - "learning_rate": 0.00024807805823087514, - "loss": 0.0215, + "epoch": 0.18, + "learning_rate": 0.0002733229474753811, + "loss": 0.0235, "step": 68610 }, { - "epoch": 0.35, - "learning_rate": 0.0002480704905378611, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.0002733190592590096, + "loss": 0.0274, "step": 68620 }, { - "epoch": 0.35, - "learning_rate": 0.0002480629228448471, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027331517104263816, + "loss": 0.0256, "step": 68630 }, { - "epoch": 0.35, - "learning_rate": 0.00024805535515183314, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.0002733112828262667, + "loss": 0.0251, "step": 68640 }, { - "epoch": 0.35, - "learning_rate": 0.0002480477874588191, - "loss": 0.0185, + "epoch": 0.18, + "learning_rate": 0.00027330739460989525, + "loss": 0.0255, "step": 68650 }, { - "epoch": 0.35, - "learning_rate": 0.0002480402197658051, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.00027330350639352376, + "loss": 0.027, "step": 68660 }, { - "epoch": 0.35, - "learning_rate": 0.0002480326520727911, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027329961817715233, + "loss": 0.025, "step": 68670 }, { - "epoch": 0.35, - "learning_rate": 0.00024802508437977706, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027329572996078084, + "loss": 0.0265, "step": 68680 }, { - "epoch": 0.35, - "learning_rate": 0.00024801751668676304, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.00027329184174440936, + "loss": 0.0246, "step": 68690 }, { - "epoch": 0.35, - "learning_rate": 0.0002480099489937491, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.0002732879535280379, + "loss": 0.024, "step": 68700 }, { - "epoch": 0.35, - "learning_rate": 0.00024800238130073506, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027328406531166644, + "loss": 0.0287, "step": 68710 }, { - "epoch": 0.35, - "learning_rate": 0.00024799481360772104, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.00027328017709529496, + "loss": 0.0282, "step": 68720 }, { - "epoch": 0.35, - "learning_rate": 0.000247987245914707, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.0002732762888789235, + "loss": 0.0261, "step": 68730 }, { - "epoch": 0.35, - "learning_rate": 0.000247979678221693, - "loss": 0.0159, + "epoch": 0.18, + "learning_rate": 0.00027327240066255204, + "loss": 0.0263, "step": 68740 }, { - "epoch": 0.35, - "learning_rate": 0.000247972110528679, - "loss": 0.0246, + "epoch": 0.18, + "learning_rate": 0.00027326851244618056, + "loss": 0.024, "step": 68750 }, { - "epoch": 0.35, - "learning_rate": 0.00024796454283566497, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002732646242298091, + "loss": 0.0249, "step": 68760 }, { - "epoch": 0.35, - "learning_rate": 0.000247956975142651, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027326073601343764, + "loss": 0.0278, "step": 68770 }, { - "epoch": 0.35, - "learning_rate": 0.000247949407449637, - "loss": 0.0139, + "epoch": 0.18, + "learning_rate": 0.0002732568477970662, + "loss": 0.0229, "step": 68780 }, { - "epoch": 0.35, - "learning_rate": 0.00024794183975662297, - "loss": 0.0155, + "epoch": 0.18, + "learning_rate": 0.0002732529595806947, + "loss": 0.0269, "step": 68790 }, { - "epoch": 0.35, - "learning_rate": 0.00024793427206360895, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002732490713643233, + "loss": 0.0317, "step": 68800 }, { - "epoch": 0.35, - "learning_rate": 0.00024792670437059493, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.0002732451831479518, + "loss": 0.0278, "step": 68810 }, { - "epoch": 0.35, - "learning_rate": 0.0002479191366775809, - "loss": 0.0352, + "epoch": 0.18, + "learning_rate": 0.0002732412949315803, + "loss": 0.028, "step": 68820 }, { - "epoch": 0.35, - "learning_rate": 0.00024791156898456695, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.00027323740671520883, + "loss": 0.0262, "step": 68830 }, { - "epoch": 0.35, - "learning_rate": 0.00024790400129155293, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.0002732335184988374, + "loss": 0.0289, "step": 68840 }, { - "epoch": 0.35, - "learning_rate": 0.0002478964335985389, - "loss": 0.0245, + "epoch": 0.18, + "learning_rate": 0.0002732296302824659, + "loss": 0.0257, "step": 68850 }, { - "epoch": 0.35, - "learning_rate": 0.0002478888659055249, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002732257420660945, + "loss": 0.0245, "step": 68860 }, { - "epoch": 0.35, - "learning_rate": 0.00024788129821251087, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.000273221853849723, + "loss": 0.0272, "step": 68870 }, { - "epoch": 0.35, - "learning_rate": 0.00024787373051949685, - "loss": 0.022, + "epoch": 0.18, + "learning_rate": 0.00027321796563335157, + "loss": 0.0257, "step": 68880 }, { - "epoch": 0.35, - "learning_rate": 0.00024786616282648283, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.0002732140774169801, + "loss": 0.028, "step": 68890 }, { - "epoch": 0.35, - "learning_rate": 0.00024785859513346887, + "epoch": 0.18, + "learning_rate": 0.0002732101892006086, "loss": 0.0228, "step": 68900 }, { - "epoch": 0.35, - "learning_rate": 0.00024785102744045485, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.0002732063009842371, + "loss": 0.0276, "step": 68910 }, { - "epoch": 0.35, - "learning_rate": 0.00024784345974744083, - "loss": 0.0238, + "epoch": 0.18, + "learning_rate": 0.0002732024127678657, + "loss": 0.0257, "step": 68920 }, { - "epoch": 0.35, - "learning_rate": 0.0002478358920544268, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.00027319852455149425, + "loss": 0.0274, "step": 68930 }, { - "epoch": 0.35, - "learning_rate": 0.0002478283243614128, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027319463633512276, + "loss": 0.0231, "step": 68940 }, { - "epoch": 0.35, - "learning_rate": 0.0002478207566683988, - "loss": 0.0207, + "epoch": 0.18, + "learning_rate": 0.0002731907481187513, + "loss": 0.0222, "step": 68950 }, { - "epoch": 0.35, - "learning_rate": 0.0002478131889753848, - "loss": 0.0246, + "epoch": 0.18, + "learning_rate": 0.00027318685990237985, + "loss": 0.0253, "step": 68960 }, { - "epoch": 0.35, - "learning_rate": 0.0002478056212823708, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.00027318297168600836, + "loss": 0.0268, "step": 68970 }, { - "epoch": 0.35, - "learning_rate": 0.0002477980535893568, - "loss": 0.0235, + "epoch": 0.18, + "learning_rate": 0.0002731790834696369, + "loss": 0.0241, "step": 68980 }, { - "epoch": 0.35, - "learning_rate": 0.00024779048589634276, - "loss": 0.0227, + "epoch": 0.18, + "learning_rate": 0.00027317519525326545, + "loss": 0.0266, "step": 68990 }, { - "epoch": 0.35, - "learning_rate": 0.00024778291820332874, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.00027317130703689396, + "loss": 0.0215, "step": 69000 }, { - "epoch": 0.35, - "eval_cer": 0.9145119829365546, - "eval_loss": 0.014301990158855915, - "eval_runtime": 116.8153, - "eval_samples_per_second": 17.121, - "eval_steps_per_second": 4.28, + "epoch": 0.18, + "eval_cer": 0.8818076590932312, + "eval_loss": 0.018843624740839005, + "eval_runtime": 108.0702, + "eval_samples_per_second": 18.506, + "eval_steps_per_second": 4.627, "step": 69000 }, { - "epoch": 0.35, - "learning_rate": 0.0002477753505103147, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027316741882052253, + "loss": 0.0239, "step": 69010 }, { - "epoch": 0.35, - "learning_rate": 0.00024776778281730076, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.00027316353060415104, + "loss": 0.0228, "step": 69020 }, { - "epoch": 0.35, - "learning_rate": 0.00024776021512428674, - "loss": 0.0158, + "epoch": 0.18, + "learning_rate": 0.00027315964238777956, + "loss": 0.0217, "step": 69030 }, { - "epoch": 0.35, - "learning_rate": 0.0002477526474312727, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027315575417140807, + "loss": 0.0292, "step": 69040 }, { - "epoch": 0.35, - "learning_rate": 0.0002477450797382587, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.00027315186595503664, + "loss": 0.0241, "step": 69050 }, { - "epoch": 0.35, - "learning_rate": 0.0002477375120452447, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.00027314797773866516, + "loss": 0.0256, "step": 69060 }, { - "epoch": 0.35, - "learning_rate": 0.00024772994435223066, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002731440895222937, + "loss": 0.0302, "step": 69070 }, { - "epoch": 0.35, - "learning_rate": 0.00024772237665921665, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027314020130592224, + "loss": 0.0222, "step": 69080 }, { - "epoch": 0.35, - "learning_rate": 0.0002477148089662027, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002731363130895508, + "loss": 0.0275, "step": 69090 }, { - "epoch": 0.35, - "learning_rate": 0.00024770724127318866, - "loss": 0.0244, + "epoch": 0.18, + "learning_rate": 0.0002731324248731793, + "loss": 0.0257, "step": 69100 }, { - "epoch": 0.35, - "learning_rate": 0.00024769967358017464, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.00027312853665680784, + "loss": 0.0312, "step": 69110 }, { - "epoch": 0.35, - "learning_rate": 0.0002476921058871606, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027312464844043635, + "loss": 0.033, "step": 69120 }, { - "epoch": 0.35, - "learning_rate": 0.0002476845381941466, - "loss": 0.0234, + "epoch": 0.18, + "learning_rate": 0.0002731207602240649, + "loss": 0.0272, "step": 69130 }, { - "epoch": 0.35, - "learning_rate": 0.0002476769705011326, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.0002731168720076935, + "loss": 0.0382, "step": 69140 }, { - "epoch": 0.35, - "learning_rate": 0.0002476694028081186, - "loss": 0.0201, + "epoch": 0.18, + "learning_rate": 0.000273112983791322, + "loss": 0.0329, "step": 69150 }, { - "epoch": 0.35, - "learning_rate": 0.0002476618351151046, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.0002731090955749505, + "loss": 0.0305, "step": 69160 }, { - "epoch": 0.35, - "learning_rate": 0.0002476542674220906, - "loss": 0.0224, + "epoch": 0.18, + "learning_rate": 0.0002731052073585791, + "loss": 0.0268, "step": 69170 }, { - "epoch": 0.35, - "learning_rate": 0.00024764669972907657, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002731013191422076, + "loss": 0.0268, "step": 69180 }, { - "epoch": 0.35, - "learning_rate": 0.00024763913203606255, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.0002730974309258361, + "loss": 0.0238, "step": 69190 }, { - "epoch": 0.35, - "learning_rate": 0.00024763156434304853, - "loss": 0.0215, + "epoch": 0.18, + "learning_rate": 0.0002730935427094647, + "loss": 0.0283, "step": 69200 }, { - "epoch": 0.35, - "learning_rate": 0.00024762399665003457, - "loss": 0.016, + "epoch": 0.18, + "learning_rate": 0.0002730896544930932, + "loss": 0.0247, "step": 69210 }, { - "epoch": 0.35, - "learning_rate": 0.00024761642895702055, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027308576627672177, + "loss": 0.0231, "step": 69220 }, { - "epoch": 0.35, - "learning_rate": 0.00024760886126400653, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.0002730818780603503, + "loss": 0.0276, "step": 69230 }, { - "epoch": 0.35, - "learning_rate": 0.0002476012935709925, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.0002730779898439788, + "loss": 0.0193, "step": 69240 }, { - "epoch": 0.35, - "learning_rate": 0.0002475937258779785, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.0002730741016276073, + "loss": 0.0286, "step": 69250 }, { - "epoch": 0.35, - "learning_rate": 0.0002475861581849645, - "loss": 0.016, + "epoch": 0.18, + "learning_rate": 0.0002730702134112359, + "loss": 0.0225, "step": 69260 }, { - "epoch": 0.35, - "learning_rate": 0.00024757859049195046, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.0002730663251948644, + "loss": 0.024, "step": 69270 }, { - "epoch": 0.35, - "learning_rate": 0.0002475710227989365, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.00027306243697849296, + "loss": 0.0238, "step": 69280 }, { - "epoch": 0.35, - "learning_rate": 0.00024756345510592247, - "loss": 0.0179, + "epoch": 0.18, + "learning_rate": 0.0002730585487621215, + "loss": 0.0257, "step": 69290 }, { - "epoch": 0.35, - "learning_rate": 0.00024755588741290845, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.00027305466054575005, + "loss": 0.0229, "step": 69300 }, { - "epoch": 0.35, - "learning_rate": 0.00024754831971989444, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.00027305077232937856, + "loss": 0.0236, "step": 69310 }, { - "epoch": 0.35, - "learning_rate": 0.0002475407520268804, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002730468841130071, + "loss": 0.0285, "step": 69320 }, { - "epoch": 0.35, - "learning_rate": 0.0002475331843338664, - "loss": 0.0214, + "epoch": 0.18, + "learning_rate": 0.00027304299589663564, + "loss": 0.0273, "step": 69330 }, { - "epoch": 0.35, - "learning_rate": 0.00024752561664085243, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.00027303910768026416, + "loss": 0.02, "step": 69340 }, { - "epoch": 0.35, - "learning_rate": 0.0002475180489478384, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.00027303521946389273, + "loss": 0.0206, "step": 69350 }, { - "epoch": 0.35, - "learning_rate": 0.0002475104812548244, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.00027303133124752124, + "loss": 0.028, "step": 69360 }, { - "epoch": 0.35, - "learning_rate": 0.0002475029135618104, - "loss": 0.0237, + "epoch": 0.18, + "learning_rate": 0.00027302744303114976, + "loss": 0.0276, "step": 69370 }, { - "epoch": 0.35, - "learning_rate": 0.00024749534586879636, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002730235548147783, + "loss": 0.0259, "step": 69380 }, { - "epoch": 0.35, - "learning_rate": 0.00024748777817578234, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.00027301966659840684, + "loss": 0.0245, "step": 69390 }, { - "epoch": 0.35, - "learning_rate": 0.0002474802104827683, - "loss": 0.0231, + "epoch": 0.18, + "learning_rate": 0.00027301577838203535, + "loss": 0.0289, "step": 69400 }, { - "epoch": 0.35, - "learning_rate": 0.00024747264278975436, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002730118901656639, + "loss": 0.0215, "step": 69410 }, { - "epoch": 0.35, - "learning_rate": 0.00024746507509674034, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.00027300800194929244, + "loss": 0.0276, "step": 69420 }, { - "epoch": 0.35, - "learning_rate": 0.0002474575074037263, - "loss": 0.0446, + "epoch": 0.18, + "learning_rate": 0.000273004113732921, + "loss": 0.023, "step": 69430 }, { - "epoch": 0.35, - "learning_rate": 0.0002474499397107123, - "loss": 0.0461, + "epoch": 0.18, + "learning_rate": 0.0002730002255165495, + "loss": 0.0266, "step": 69440 }, { - "epoch": 0.35, - "learning_rate": 0.0002474423720176983, - "loss": 0.0163, + "epoch": 0.18, + "learning_rate": 0.00027299633730017804, + "loss": 0.0277, "step": 69450 }, { - "epoch": 0.35, - "learning_rate": 0.00024743480432468427, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002729924490838066, + "loss": 0.0264, "step": 69460 }, { - "epoch": 0.35, - "learning_rate": 0.0002474272366316703, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.0002729885608674351, + "loss": 0.0231, "step": 69470 }, { - "epoch": 0.35, - "learning_rate": 0.0002474196689386563, - "loss": 0.0231, + "epoch": 0.18, + "learning_rate": 0.0002729846726510637, + "loss": 0.0239, "step": 69480 }, { - "epoch": 0.35, - "learning_rate": 0.00024741210124564226, - "loss": 0.017, + "epoch": 0.18, + "learning_rate": 0.0002729807844346922, + "loss": 0.0263, "step": 69490 }, { - "epoch": 0.35, - "learning_rate": 0.00024740453355262825, - "loss": 0.0185, + "epoch": 0.18, + "learning_rate": 0.0002729768962183207, + "loss": 0.0314, "step": 69500 }, { - "epoch": 0.35, - "learning_rate": 0.0002473969658596142, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002729730080019493, + "loss": 0.025, "step": 69510 }, { - "epoch": 0.35, - "learning_rate": 0.0002473893981666002, - "loss": 0.0238, + "epoch": 0.18, + "learning_rate": 0.0002729691197855778, + "loss": 0.0225, "step": 69520 }, { - "epoch": 0.35, - "learning_rate": 0.00024738183047358624, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.0002729652315692063, + "loss": 0.0219, "step": 69530 }, { - "epoch": 0.35, - "learning_rate": 0.0002473742627805722, - "loss": 0.0167, + "epoch": 0.18, + "learning_rate": 0.0002729613433528349, + "loss": 0.0223, "step": 69540 }, { - "epoch": 0.35, - "learning_rate": 0.0002473666950875582, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.0002729574551364634, + "loss": 0.0226, "step": 69550 }, { - "epoch": 0.35, - "learning_rate": 0.0002473591273945442, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.00027295356692009197, + "loss": 0.0248, "step": 69560 }, { - "epoch": 0.35, - "learning_rate": 0.00024735155970153017, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.0002729496787037205, + "loss": 0.0244, "step": 69570 }, { - "epoch": 0.35, - "learning_rate": 0.00024734399200851615, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.000272945790487349, + "loss": 0.0253, "step": 69580 }, { - "epoch": 0.35, - "learning_rate": 0.00024733642431550213, - "loss": 0.018, + "epoch": 0.18, + "learning_rate": 0.00027294190227097756, + "loss": 0.0246, "step": 69590 }, { - "epoch": 0.35, - "learning_rate": 0.00024732885662248817, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002729380140546061, + "loss": 0.028, "step": 69600 }, { - "epoch": 0.35, - "learning_rate": 0.00024732128892947415, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.0002729341258382346, + "loss": 0.0262, "step": 69610 }, { - "epoch": 0.35, - "learning_rate": 0.00024731372123646013, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.00027293023762186316, + "loss": 0.0274, "step": 69620 }, { - "epoch": 0.35, - "learning_rate": 0.0002473061535434461, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.00027292634940549173, + "loss": 0.0261, "step": 69630 }, { - "epoch": 0.35, - "learning_rate": 0.0002472985858504321, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.00027292246118912025, + "loss": 0.0303, "step": 69640 }, { - "epoch": 0.35, - "learning_rate": 0.0002472910181574181, - "loss": 0.0162, + "epoch": 0.18, + "learning_rate": 0.00027291857297274876, + "loss": 0.0253, "step": 69650 }, { - "epoch": 0.35, - "learning_rate": 0.0002472834504644041, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.0002729146847563773, + "loss": 0.028, "step": 69660 }, { - "epoch": 0.35, - "learning_rate": 0.0002472758827713901, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.00027291079654000584, + "loss": 0.025, "step": 69670 }, { - "epoch": 0.35, - "learning_rate": 0.0002472683150783761, - "loss": 0.0283, + "epoch": 0.18, + "learning_rate": 0.00027290690832363436, + "loss": 0.0302, "step": 69680 }, { - "epoch": 0.35, - "learning_rate": 0.00024726074738536206, - "loss": 0.0173, + "epoch": 0.18, + "learning_rate": 0.0002729030201072629, + "loss": 0.0208, "step": 69690 }, { - "epoch": 0.35, - "learning_rate": 0.00024725317969234804, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.00027289913189089144, + "loss": 0.0267, "step": 69700 }, { - "epoch": 0.35, - "learning_rate": 0.000247245611999334, - "loss": 0.0161, + "epoch": 0.18, + "learning_rate": 0.00027289524367452, + "loss": 0.0238, "step": 69710 }, { - "epoch": 0.35, - "learning_rate": 0.00024723804430632005, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.0002728913554581485, + "loss": 0.0236, "step": 69720 }, { - "epoch": 0.35, - "learning_rate": 0.00024723047661330604, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.00027288746724177704, + "loss": 0.0322, "step": 69730 }, { - "epoch": 0.35, - "learning_rate": 0.000247222908920292, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.00027288357902540555, + "loss": 0.0254, "step": 69740 }, { - "epoch": 0.35, - "learning_rate": 0.000247215341227278, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.0002728796908090341, + "loss": 0.0264, "step": 69750 }, { - "epoch": 0.35, - "learning_rate": 0.000247207773534264, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.00027287580259266264, + "loss": 0.02, "step": 69760 }, { - "epoch": 0.35, - "learning_rate": 0.00024720020584124996, - "loss": 0.0157, + "epoch": 0.18, + "learning_rate": 0.0002728719143762912, + "loss": 0.0294, "step": 69770 }, { - "epoch": 0.35, - "learning_rate": 0.00024719263814823594, - "loss": 0.017, + "epoch": 0.18, + "learning_rate": 0.0002728680261599197, + "loss": 0.0253, "step": 69780 }, { - "epoch": 0.35, - "learning_rate": 0.0002471850704552219, - "loss": 0.0225, + "epoch": 0.18, + "learning_rate": 0.00027286413794354823, + "loss": 0.0257, "step": 69790 }, { - "epoch": 0.35, - "learning_rate": 0.0002471775027622079, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002728602497271768, + "loss": 0.0253, "step": 69800 }, { - "epoch": 0.35, - "learning_rate": 0.0002471699350691939, - "loss": 0.0204, + "epoch": 0.18, + "learning_rate": 0.0002728563615108053, + "loss": 0.0279, "step": 69810 }, { - "epoch": 0.35, - "learning_rate": 0.00024716236737617987, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002728524732944339, + "loss": 0.0262, "step": 69820 }, { - "epoch": 0.35, - "learning_rate": 0.0002471547996831659, - "loss": 0.0211, + "epoch": 0.18, + "learning_rate": 0.0002728485850780624, + "loss": 0.0284, "step": 69830 }, { - "epoch": 0.35, - "learning_rate": 0.0002471472319901519, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.00027284469686169097, + "loss": 0.0247, "step": 69840 }, { - "epoch": 0.35, - "learning_rate": 0.00024713966429713787, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.0002728408086453195, + "loss": 0.0251, "step": 69850 }, { - "epoch": 0.35, - "learning_rate": 0.00024713209660412385, - "loss": 0.0153, + "epoch": 0.18, + "learning_rate": 0.000272836920428948, + "loss": 0.026, "step": 69860 }, { - "epoch": 0.35, - "learning_rate": 0.00024712452891110983, - "loss": 0.0213, + "epoch": 0.18, + "learning_rate": 0.0002728330322125765, + "loss": 0.0267, "step": 69870 }, { - "epoch": 0.35, - "learning_rate": 0.0002471169612180958, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.0002728291439962051, + "loss": 0.0333, "step": 69880 }, { - "epoch": 0.35, - "learning_rate": 0.00024710939352508185, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.0002728252557798336, + "loss": 0.023, "step": 69890 }, { - "epoch": 0.35, - "learning_rate": 0.00024710182583206783, - "loss": 0.0185, + "epoch": 0.18, + "learning_rate": 0.00027282136756346217, + "loss": 0.0273, "step": 69900 }, { - "epoch": 0.35, - "learning_rate": 0.0002470942581390538, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.0002728174793470907, + "loss": 0.0298, "step": 69910 }, { - "epoch": 0.35, - "learning_rate": 0.0002470866904460398, - "loss": 0.0167, + "epoch": 0.18, + "learning_rate": 0.00027281359113071925, + "loss": 0.0236, "step": 69920 }, { - "epoch": 0.35, - "learning_rate": 0.00024707912275302577, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.00027280970291434776, + "loss": 0.0246, "step": 69930 }, { - "epoch": 0.35, - "learning_rate": 0.00024707155506001175, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.0002728058146979763, + "loss": 0.0234, "step": 69940 }, { - "epoch": 0.35, - "learning_rate": 0.00024706398736699774, - "loss": 0.0167, + "epoch": 0.18, + "learning_rate": 0.0002728019264816048, + "loss": 0.0255, "step": 69950 }, { - "epoch": 0.35, - "learning_rate": 0.00024705641967398377, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027279803826523336, + "loss": 0.0211, "step": 69960 }, { - "epoch": 0.35, - "learning_rate": 0.00024704885198096975, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.00027279415004886193, + "loss": 0.0312, "step": 69970 }, { - "epoch": 0.35, - "learning_rate": 0.00024704128428795573, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027279026183249044, + "loss": 0.0303, "step": 69980 }, { - "epoch": 0.35, - "learning_rate": 0.0002470337165949417, - "loss": 0.0218, + "epoch": 0.18, + "learning_rate": 0.00027278637361611896, + "loss": 0.0208, "step": 69990 }, { - "epoch": 0.35, - "learning_rate": 0.0002470261489019277, - "loss": 0.018, + "epoch": 0.18, + "learning_rate": 0.0002727824853997475, + "loss": 0.0227, "step": 70000 }, { - "epoch": 0.35, - "eval_cer": 0.9144508479806542, - "eval_loss": 0.013182277791202068, - "eval_runtime": 116.7197, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.18, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.018043356016278267, + "eval_runtime": 107.6403, + "eval_samples_per_second": 18.58, + "eval_steps_per_second": 4.645, "step": 70000 }, { - "epoch": 0.35, - "learning_rate": 0.0002470185812089137, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.00027277859718337604, + "loss": 0.0231, "step": 70010 }, { - "epoch": 0.35, - "learning_rate": 0.0002470110135158997, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.00027277470896700456, + "loss": 0.0225, "step": 70020 }, { - "epoch": 0.35, - "learning_rate": 0.0002470034458228857, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.0002727708207506331, + "loss": 0.0296, "step": 70030 }, { - "epoch": 0.35, - "learning_rate": 0.0002469958781298717, - "loss": 0.0319, + "epoch": 0.18, + "learning_rate": 0.00027276693253426164, + "loss": 0.0258, "step": 70040 }, { - "epoch": 0.35, - "learning_rate": 0.00024698831043685766, - "loss": 0.0164, + "epoch": 0.18, + "learning_rate": 0.0002727630443178902, + "loss": 0.0214, "step": 70050 }, { - "epoch": 0.35, - "learning_rate": 0.00024698074274384364, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.0002727591561015187, + "loss": 0.0262, "step": 70060 }, { - "epoch": 0.35, - "learning_rate": 0.0002469731750508296, - "loss": 0.0208, + "epoch": 0.18, + "learning_rate": 0.00027275526788514724, + "loss": 0.0263, "step": 70070 }, { - "epoch": 0.35, - "learning_rate": 0.00024696560735781566, - "loss": 0.0216, + "epoch": 0.18, + "learning_rate": 0.00027275137966877575, + "loss": 0.0296, "step": 70080 }, { - "epoch": 0.35, - "learning_rate": 0.00024695803966480164, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.0002727474914524043, + "loss": 0.0283, "step": 70090 }, { - "epoch": 0.35, - "learning_rate": 0.0002469504719717876, - "loss": 0.024, + "epoch": 0.18, + "learning_rate": 0.00027274360323603284, + "loss": 0.0255, "step": 70100 }, { - "epoch": 0.35, - "learning_rate": 0.0002469429042787736, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.0002727397150196614, + "loss": 0.024, "step": 70110 }, { - "epoch": 0.35, - "learning_rate": 0.0002469353365857596, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002727358268032899, + "loss": 0.0333, "step": 70120 }, { - "epoch": 0.35, - "learning_rate": 0.00024692776889274556, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.0002727319385869185, + "loss": 0.0253, "step": 70130 }, { - "epoch": 0.35, - "learning_rate": 0.00024692020119973155, - "loss": 0.0241, + "epoch": 0.18, + "learning_rate": 0.000272728050370547, + "loss": 0.022, "step": 70140 }, { - "epoch": 0.35, - "learning_rate": 0.0002469126335067176, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.0002727241621541755, + "loss": 0.0259, "step": 70150 }, { - "epoch": 0.35, - "learning_rate": 0.00024690506581370356, - "loss": 0.0185, + "epoch": 0.18, + "learning_rate": 0.00027272027393780403, + "loss": 0.027, "step": 70160 }, { - "epoch": 0.35, - "learning_rate": 0.00024689749812068954, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.0002727163857214326, + "loss": 0.0287, "step": 70170 }, { - "epoch": 0.35, - "learning_rate": 0.0002468899304276755, - "loss": 0.0179, + "epoch": 0.18, + "learning_rate": 0.00027271249750506117, + "loss": 0.0286, "step": 70180 }, { - "epoch": 0.35, - "learning_rate": 0.0002468823627346615, - "loss": 0.0232, + "epoch": 0.18, + "learning_rate": 0.0002727086092886897, + "loss": 0.023, "step": 70190 }, { - "epoch": 0.35, - "learning_rate": 0.0002468747950416475, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.0002727047210723182, + "loss": 0.0229, "step": 70200 }, { - "epoch": 0.35, - "learning_rate": 0.0002468672273486335, - "loss": 0.0163, + "epoch": 0.18, + "learning_rate": 0.00027270083285594677, + "loss": 0.0233, "step": 70210 }, { - "epoch": 0.35, - "learning_rate": 0.0002468596596556195, - "loss": 0.0159, + "epoch": 0.18, + "learning_rate": 0.0002726969446395753, + "loss": 0.029, "step": 70220 }, { - "epoch": 0.35, - "learning_rate": 0.0002468520919626055, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002726930564232038, + "loss": 0.026, "step": 70230 }, { - "epoch": 0.35, - "learning_rate": 0.00024684452426959147, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.00027268916820683236, + "loss": 0.0238, "step": 70240 }, { - "epoch": 0.35, - "learning_rate": 0.00024683695657657745, - "loss": 0.0212, + "epoch": 0.18, + "learning_rate": 0.0002726852799904609, + "loss": 0.0225, "step": 70250 }, { - "epoch": 0.35, - "learning_rate": 0.00024682938888356343, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027268139177408945, + "loss": 0.0245, "step": 70260 }, { - "epoch": 0.35, - "learning_rate": 0.00024682182119054947, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.00027267750355771796, + "loss": 0.0263, "step": 70270 }, { - "epoch": 0.35, - "learning_rate": 0.00024681425349753545, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.0002726736153413465, + "loss": 0.024, "step": 70280 }, { - "epoch": 0.35, - "learning_rate": 0.00024680668580452143, - "loss": 0.0196, + "epoch": 0.18, + "learning_rate": 0.000272669727124975, + "loss": 0.0256, "step": 70290 }, { - "epoch": 0.35, - "learning_rate": 0.0002467991181115074, - "loss": 0.0184, + "epoch": 0.18, + "learning_rate": 0.00027266583890860356, + "loss": 0.025, "step": 70300 }, { - "epoch": 0.35, - "learning_rate": 0.0002467915504184934, - "loss": 0.0172, + "epoch": 0.18, + "learning_rate": 0.0002726619506922321, + "loss": 0.0233, "step": 70310 }, { - "epoch": 0.35, - "learning_rate": 0.0002467839827254794, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.00027265806247586064, + "loss": 0.021, "step": 70320 }, { - "epoch": 0.35, - "learning_rate": 0.00024677641503246536, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.00027265417425948916, + "loss": 0.0252, "step": 70330 }, { - "epoch": 0.35, - "learning_rate": 0.0002467688473394514, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.0002726502860431177, + "loss": 0.0227, "step": 70340 }, { - "epoch": 0.35, - "learning_rate": 0.00024676127964643737, - "loss": 0.017, + "epoch": 0.18, + "learning_rate": 0.00027264639782674624, + "loss": 0.0283, "step": 70350 }, { - "epoch": 0.35, - "learning_rate": 0.00024675371195342335, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.00027264250961037476, + "loss": 0.0275, "step": 70360 }, { - "epoch": 0.36, - "learning_rate": 0.00024674614426040934, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002726386213940033, + "loss": 0.0248, "step": 70370 }, { - "epoch": 0.36, - "learning_rate": 0.0002467385765673953, - "loss": 0.0163, + "epoch": 0.18, + "learning_rate": 0.00027263473317763184, + "loss": 0.0253, "step": 70380 }, { - "epoch": 0.36, - "learning_rate": 0.0002467310088743813, - "loss": 0.0163, + "epoch": 0.18, + "learning_rate": 0.0002726308449612604, + "loss": 0.0222, "step": 70390 }, { - "epoch": 0.36, - "learning_rate": 0.00024672344118136733, - "loss": 0.0186, + "epoch": 0.18, + "learning_rate": 0.0002726269567448889, + "loss": 0.0266, "step": 70400 }, { - "epoch": 0.36, - "learning_rate": 0.0002467158734883533, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027262306852851744, + "loss": 0.0232, "step": 70410 }, { - "epoch": 0.36, - "learning_rate": 0.0002467083057953393, - "loss": 0.0164, + "epoch": 0.18, + "learning_rate": 0.000272619180312146, + "loss": 0.0293, "step": 70420 }, { - "epoch": 0.36, - "learning_rate": 0.0002467007381023253, - "loss": 0.0178, + "epoch": 0.18, + "learning_rate": 0.0002726152920957745, + "loss": 0.0266, "step": 70430 }, { - "epoch": 0.36, - "learning_rate": 0.00024669317040931126, - "loss": 0.021, + "epoch": 0.18, + "learning_rate": 0.00027261140387940303, + "loss": 0.0235, "step": 70440 }, { - "epoch": 0.36, - "learning_rate": 0.00024668560271629724, - "loss": 0.0229, + "epoch": 0.18, + "learning_rate": 0.0002726075156630316, + "loss": 0.0231, "step": 70450 }, { - "epoch": 0.36, - "learning_rate": 0.0002466780350232832, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.0002726036274466601, + "loss": 0.0241, "step": 70460 }, { - "epoch": 0.36, - "learning_rate": 0.00024667046733026926, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002725997392302887, + "loss": 0.0235, "step": 70470 }, { - "epoch": 0.36, - "learning_rate": 0.00024666289963725524, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002725958510139172, + "loss": 0.0288, "step": 70480 }, { - "epoch": 0.36, - "learning_rate": 0.0002466553319442412, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002725919627975457, + "loss": 0.0276, "step": 70490 }, { - "epoch": 0.36, - "learning_rate": 0.0002466477642512272, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.00027258807458117423, + "loss": 0.0282, "step": 70500 }, { - "epoch": 0.36, - "learning_rate": 0.0002466401965582132, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002725841863648028, + "loss": 0.0244, "step": 70510 }, { - "epoch": 0.36, - "learning_rate": 0.00024663262886519917, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027258029814843137, + "loss": 0.0259, "step": 70520 }, { - "epoch": 0.36, - "learning_rate": 0.0002466250611721852, - "loss": 0.0221, + "epoch": 0.18, + "learning_rate": 0.0002725764099320599, + "loss": 0.0247, "step": 70530 }, { - "epoch": 0.36, - "learning_rate": 0.0002466174934791712, - "loss": 0.0203, + "epoch": 0.18, + "learning_rate": 0.0002725725217156884, + "loss": 0.0283, "step": 70540 }, { - "epoch": 0.36, - "learning_rate": 0.00024660992578615716, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.00027256863349931697, + "loss": 0.029, "step": 70550 }, { - "epoch": 0.36, - "learning_rate": 0.00024660235809314315, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.0002725647452829455, + "loss": 0.0201, "step": 70560 }, { - "epoch": 0.36, - "learning_rate": 0.0002465947904001291, - "loss": 0.0157, + "epoch": 0.18, + "learning_rate": 0.000272560857066574, + "loss": 0.0241, "step": 70570 }, { - "epoch": 0.36, - "learning_rate": 0.0002465872227071151, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.00027255696885020256, + "loss": 0.0225, "step": 70580 }, { - "epoch": 0.36, - "learning_rate": 0.00024657965501410114, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.0002725530806338311, + "loss": 0.0304, "step": 70590 }, { - "epoch": 0.36, - "learning_rate": 0.0002465720873210871, - "loss": 0.0168, + "epoch": 0.18, + "learning_rate": 0.00027254919241745965, + "loss": 0.024, "step": 70600 }, { - "epoch": 0.36, - "learning_rate": 0.0002465645196280731, - "loss": 0.0155, + "epoch": 0.18, + "learning_rate": 0.00027254530420108816, + "loss": 0.025, "step": 70610 }, { - "epoch": 0.36, - "learning_rate": 0.0002465569519350591, - "loss": 0.0235, + "epoch": 0.18, + "learning_rate": 0.0002725414159847167, + "loss": 0.03, "step": 70620 }, { - "epoch": 0.36, - "learning_rate": 0.00024654938424204507, - "loss": 0.0158, + "epoch": 0.18, + "learning_rate": 0.00027253752776834524, + "loss": 0.0248, "step": 70630 }, { - "epoch": 0.36, - "learning_rate": 0.00024654181654903105, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027253363955197376, + "loss": 0.025, "step": 70640 }, { - "epoch": 0.36, - "learning_rate": 0.00024653424885601703, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.0002725297513356023, + "loss": 0.0302, "step": 70650 }, { - "epoch": 0.36, - "learning_rate": 0.00024652668116300307, - "loss": 0.0156, + "epoch": 0.18, + "learning_rate": 0.00027252586311923084, + "loss": 0.024, "step": 70660 }, { - "epoch": 0.36, - "learning_rate": 0.00024651911346998905, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.0002725219749028594, + "loss": 0.0189, "step": 70670 }, { - "epoch": 0.36, - "learning_rate": 0.00024651154577697503, - "loss": 0.0187, + "epoch": 0.18, + "learning_rate": 0.0002725180866864879, + "loss": 0.0284, "step": 70680 }, { - "epoch": 0.36, - "learning_rate": 0.000246503978083961, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.00027251419847011644, + "loss": 0.0274, "step": 70690 }, { - "epoch": 0.36, - "learning_rate": 0.000246496410390947, - "loss": 0.0217, + "epoch": 0.18, + "learning_rate": 0.00027251031025374495, + "loss": 0.0262, "step": 70700 }, { - "epoch": 0.36, - "learning_rate": 0.000246488842697933, - "loss": 0.0209, + "epoch": 0.18, + "learning_rate": 0.0002725064220373735, + "loss": 0.0214, "step": 70710 }, { - "epoch": 0.36, - "learning_rate": 0.000246481275004919, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.00027250253382100204, + "loss": 0.0293, "step": 70720 }, { - "epoch": 0.36, - "learning_rate": 0.000246473707311905, - "loss": 0.0153, + "epoch": 0.18, + "learning_rate": 0.0002724986456046306, + "loss": 0.0256, "step": 70730 }, { - "epoch": 0.36, - "learning_rate": 0.000246466139618891, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.0002724947573882591, + "loss": 0.0253, "step": 70740 }, { - "epoch": 0.36, - "learning_rate": 0.00024645857192587696, - "loss": 0.0173, + "epoch": 0.18, + "learning_rate": 0.00027249086917188764, + "loss": 0.0279, "step": 70750 }, { - "epoch": 0.36, - "learning_rate": 0.00024645100423286294, - "loss": 0.0176, + "epoch": 0.18, + "learning_rate": 0.0002724869809555162, + "loss": 0.0271, "step": 70760 }, { - "epoch": 0.36, - "learning_rate": 0.0002464434365398489, - "loss": 0.0163, + "epoch": 0.18, + "learning_rate": 0.0002724830927391447, + "loss": 0.025, "step": 70770 }, { - "epoch": 0.36, - "learning_rate": 0.00024643586884683495, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.00027247920452277323, + "loss": 0.0229, "step": 70780 }, { - "epoch": 0.36, - "learning_rate": 0.00024642830115382094, - "loss": 0.0138, + "epoch": 0.18, + "learning_rate": 0.0002724753163064018, + "loss": 0.0223, "step": 70790 }, { - "epoch": 0.36, - "learning_rate": 0.0002464207334608069, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.0002724714280900303, + "loss": 0.0248, "step": 70800 }, { - "epoch": 0.36, - "learning_rate": 0.0002464131657677929, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.0002724675398736589, + "loss": 0.0301, "step": 70810 }, { - "epoch": 0.36, - "learning_rate": 0.0002464055980747789, - "loss": 0.0188, + "epoch": 0.18, + "learning_rate": 0.0002724636516572874, + "loss": 0.0287, "step": 70820 }, { - "epoch": 0.36, - "learning_rate": 0.00024639803038176486, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002724597634409159, + "loss": 0.021, "step": 70830 }, { - "epoch": 0.36, - "learning_rate": 0.00024639046268875084, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002724558752245445, + "loss": 0.0273, "step": 70840 }, { - "epoch": 0.36, - "learning_rate": 0.0002463828949957369, - "loss": 0.0182, - "step": 70850 + "epoch": 0.18, + "learning_rate": 0.000272451987008173, + "loss": 0.0256, + "step": 70850 }, { - "epoch": 0.36, - "learning_rate": 0.00024637532730272286, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002724480987918015, + "loss": 0.0272, "step": 70860 }, { - "epoch": 0.36, - "learning_rate": 0.00024636775960970884, - "loss": 0.0165, + "epoch": 0.18, + "learning_rate": 0.0002724442105754301, + "loss": 0.0217, "step": 70870 }, { - "epoch": 0.36, - "learning_rate": 0.0002463601919166948, - "loss": 0.0154, + "epoch": 0.18, + "learning_rate": 0.00027244032235905865, + "loss": 0.0211, "step": 70880 }, { - "epoch": 0.36, - "learning_rate": 0.0002463526242236808, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.00027243643414268716, + "loss": 0.027, "step": 70890 }, { - "epoch": 0.36, - "learning_rate": 0.0002463450565306668, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.0002724325459263157, + "loss": 0.0255, "step": 70900 }, { - "epoch": 0.36, - "learning_rate": 0.0002463374888376528, - "loss": 0.0181, + "epoch": 0.18, + "learning_rate": 0.0002724286577099442, + "loss": 0.0289, "step": 70910 }, { - "epoch": 0.36, - "learning_rate": 0.0002463299211446388, - "loss": 0.0174, + "epoch": 0.18, + "learning_rate": 0.00027242476949357276, + "loss": 0.0258, "step": 70920 }, { - "epoch": 0.36, - "learning_rate": 0.0002463223534516248, - "loss": 0.0202, + "epoch": 0.18, + "learning_rate": 0.0002724208812772013, + "loss": 0.0269, "step": 70930 }, { - "epoch": 0.36, - "learning_rate": 0.00024631478575861077, - "loss": 0.0203, + "epoch": 0.18, + "learning_rate": 0.00027241699306082985, + "loss": 0.0267, "step": 70940 }, { - "epoch": 0.36, - "learning_rate": 0.00024630721806559675, - "loss": 0.0189, + "epoch": 0.18, + "learning_rate": 0.00027241310484445836, + "loss": 0.0251, "step": 70950 }, { - "epoch": 0.36, - "learning_rate": 0.00024629965037258273, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.0002724092166280869, + "loss": 0.0276, "step": 70960 }, { - "epoch": 0.36, - "learning_rate": 0.0002462920826795687, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.00027240532841171544, + "loss": 0.024, "step": 70970 }, { - "epoch": 0.36, - "learning_rate": 0.00024628451498655475, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.00027240144019534396, + "loss": 0.0263, "step": 70980 }, { - "epoch": 0.36, - "learning_rate": 0.0002462769472935407, - "loss": 0.0164, + "epoch": 0.18, + "learning_rate": 0.00027239755197897247, + "loss": 0.0249, "step": 70990 }, { - "epoch": 0.36, - "learning_rate": 0.0002462693796005267, - "loss": 0.0199, + "epoch": 0.18, + "learning_rate": 0.00027239366376260104, + "loss": 0.0223, "step": 71000 }, { - "epoch": 0.36, - "eval_cer": 0.9145042197675514, - "eval_loss": 0.013640601187944412, - "eval_runtime": 116.7174, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.18, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.018395202234387398, + "eval_runtime": 107.9247, + "eval_samples_per_second": 18.531, + "eval_steps_per_second": 4.633, "step": 71000 }, { - "epoch": 0.36, - "learning_rate": 0.0002462618119075127, - "loss": 0.0179, + "epoch": 0.18, + "learning_rate": 0.00027238977554622956, + "loss": 0.0266, "step": 71010 }, { - "epoch": 0.36, - "learning_rate": 0.00024625424421449867, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.0002723858873298581, + "loss": 0.0295, "step": 71020 }, { - "epoch": 0.36, - "learning_rate": 0.00024624667652148465, - "loss": 0.019, + "epoch": 0.18, + "learning_rate": 0.00027238199911348664, + "loss": 0.0319, "step": 71030 }, { - "epoch": 0.36, - "learning_rate": 0.00024623910882847063, - "loss": 0.0206, + "epoch": 0.18, + "learning_rate": 0.00027237811089711515, + "loss": 0.0221, "step": 71040 }, { - "epoch": 0.36, - "learning_rate": 0.0002462315411354566, - "loss": 0.0143, + "epoch": 0.18, + "learning_rate": 0.0002723742226807437, + "loss": 0.0247, "step": 71050 }, { - "epoch": 0.36, - "learning_rate": 0.0002462239734424426, - "loss": 0.0205, + "epoch": 0.18, + "learning_rate": 0.00027237033446437224, + "loss": 0.0252, "step": 71060 }, { - "epoch": 0.36, - "learning_rate": 0.0002462164057494286, - "loss": 0.0194, + "epoch": 0.18, + "learning_rate": 0.0002723664462480008, + "loss": 0.0236, "step": 71070 }, { - "epoch": 0.36, - "learning_rate": 0.0002462088380564146, - "loss": 0.0177, + "epoch": 0.18, + "learning_rate": 0.0002723625580316293, + "loss": 0.0266, "step": 71080 }, { - "epoch": 0.36, - "learning_rate": 0.0002462012703634006, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.0002723586698152579, + "loss": 0.0239, "step": 71090 }, { - "epoch": 0.36, - "learning_rate": 0.0002461937026703866, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002723547815988864, + "loss": 0.0283, "step": 71100 }, { - "epoch": 0.36, - "learning_rate": 0.00024618613497737256, - "loss": 0.0183, + "epoch": 0.18, + "learning_rate": 0.0002723508933825149, + "loss": 0.0235, "step": 71110 }, { - "epoch": 0.36, - "learning_rate": 0.00024617856728435854, - "loss": 0.0222, + "epoch": 0.18, + "learning_rate": 0.00027234700516614343, + "loss": 0.0249, "step": 71120 }, { - "epoch": 0.36, - "learning_rate": 0.0002461709995913445, - "loss": 0.0175, + "epoch": 0.18, + "learning_rate": 0.000272343116949772, + "loss": 0.0268, "step": 71130 }, { - "epoch": 0.36, - "learning_rate": 0.00024616343189833056, - "loss": 0.0197, + "epoch": 0.18, + "learning_rate": 0.0002723392287334005, + "loss": 0.027, "step": 71140 }, { - "epoch": 0.36, - "learning_rate": 0.00024615586420531654, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.0002723353405170291, + "loss": 0.025, "step": 71150 }, { - "epoch": 0.36, - "learning_rate": 0.0002461482965123025, - "loss": 0.0152, + "epoch": 0.18, + "learning_rate": 0.0002723314523006576, + "loss": 0.0329, "step": 71160 }, { - "epoch": 0.36, - "learning_rate": 0.0002461407288192885, - "loss": 0.0192, + "epoch": 0.18, + "learning_rate": 0.00027232756408428617, + "loss": 0.0262, "step": 71170 }, { - "epoch": 0.36, - "learning_rate": 0.0002461331611262745, - "loss": 0.0223, + "epoch": 0.18, + "learning_rate": 0.0002723236758679147, + "loss": 0.0227, "step": 71180 }, { - "epoch": 0.36, - "learning_rate": 0.00024612559343326046, - "loss": 0.0179, + "epoch": 0.18, + "learning_rate": 0.0002723197876515432, + "loss": 0.0232, "step": 71190 }, { - "epoch": 0.36, - "learning_rate": 0.00024611802574024645, - "loss": 0.0198, + "epoch": 0.18, + "learning_rate": 0.0002723158994351717, + "loss": 0.0228, "step": 71200 }, { - "epoch": 0.36, - "learning_rate": 0.0002461104580472325, - "loss": 0.0182, + "epoch": 0.18, + "learning_rate": 0.0002723120112188003, + "loss": 0.0254, "step": 71210 }, { - "epoch": 0.36, - "learning_rate": 0.00024610289035421846, - "loss": 0.0168, + "epoch": 0.18, + "learning_rate": 0.00027230812300242885, + "loss": 0.0231, "step": 71220 }, { - "epoch": 0.36, - "learning_rate": 0.00024609532266120444, - "loss": 0.0191, + "epoch": 0.18, + "learning_rate": 0.00027230423478605736, + "loss": 0.0236, "step": 71230 }, { - "epoch": 0.36, - "learning_rate": 0.0002460877549681904, - "loss": 0.0171, + "epoch": 0.18, + "learning_rate": 0.0002723003465696859, + "loss": 0.0235, "step": 71240 }, { - "epoch": 0.36, - "learning_rate": 0.0002460801872751764, - "loss": 0.0154, + "epoch": 0.18, + "learning_rate": 0.0002722964583533144, + "loss": 0.0299, "step": 71250 }, { - "epoch": 0.36, - "learning_rate": 0.0002460726195821624, - "loss": 0.0173, + "epoch": 0.18, + "learning_rate": 0.00027229257013694296, + "loss": 0.0242, "step": 71260 }, { - "epoch": 0.36, - "learning_rate": 0.0002460650518891484, - "loss": 0.018, + "epoch": 0.18, + "learning_rate": 0.0002722886819205715, + "loss": 0.0258, "step": 71270 }, { - "epoch": 0.36, - "learning_rate": 0.0002460574841961344, - "loss": 0.018, + "epoch": 0.18, + "learning_rate": 0.00027228479370420004, + "loss": 0.0276, "step": 71280 }, { - "epoch": 0.36, - "learning_rate": 0.0002460499165031204, - "loss": 0.0166, + "epoch": 0.18, + "learning_rate": 0.00027228090548782856, + "loss": 0.0312, "step": 71290 }, { - "epoch": 0.36, - "learning_rate": 0.00024604234881010637, - "loss": 0.02, + "epoch": 0.18, + "learning_rate": 0.00027227701727145713, + "loss": 0.0292, "step": 71300 }, { - "epoch": 0.36, - "learning_rate": 0.00024603478111709235, - "loss": 0.0157, + "epoch": 0.18, + "learning_rate": 0.00027227312905508564, + "loss": 0.0282, "step": 71310 }, { - "epoch": 0.36, - "learning_rate": 0.00024602721342407833, - "loss": 0.0169, + "epoch": 0.18, + "learning_rate": 0.00027226924083871416, + "loss": 0.0364, "step": 71320 }, { - "epoch": 0.36, - "learning_rate": 0.00024601964573106437, - "loss": 0.0161, + "epoch": 0.18, + "learning_rate": 0.00027226535262234267, + "loss": 0.029, "step": 71330 }, { - "epoch": 0.36, - "learning_rate": 0.00024601207803805035, - "loss": 0.0164, + "epoch": 0.18, + "learning_rate": 0.00027226146440597124, + "loss": 0.035, "step": 71340 }, { - "epoch": 0.36, - "learning_rate": 0.00024600451034503633, - "loss": 0.0193, + "epoch": 0.18, + "learning_rate": 0.00027225757618959975, + "loss": 0.0239, "step": 71350 }, { - "epoch": 0.36, - "learning_rate": 0.0002459969426520223, - "loss": 0.0161, + "epoch": 0.18, + "learning_rate": 0.0002722536879732283, + "loss": 0.0236, "step": 71360 }, { - "epoch": 0.36, - "learning_rate": 0.0002459893749590083, - "loss": 0.0136, + "epoch": 0.19, + "learning_rate": 0.00027224979975685684, + "loss": 0.0246, "step": 71370 }, { - "epoch": 0.36, - "learning_rate": 0.0002459818072659943, - "loss": 0.0146, + "epoch": 0.19, + "learning_rate": 0.0002722459115404854, + "loss": 0.0244, "step": 71380 }, { - "epoch": 0.36, - "learning_rate": 0.00024597423957298026, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002722420233241139, + "loss": 0.0295, "step": 71390 }, { - "epoch": 0.36, - "learning_rate": 0.0002459666718799663, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.00027223813510774244, + "loss": 0.0222, "step": 71400 }, { - "epoch": 0.36, - "learning_rate": 0.00024595910418695227, - "loss": 0.015, + "epoch": 0.19, + "learning_rate": 0.000272234246891371, + "loss": 0.0234, "step": 71410 }, { - "epoch": 0.36, - "learning_rate": 0.00024595153649393825, - "loss": 0.0234, + "epoch": 0.19, + "learning_rate": 0.0002722303586749995, + "loss": 0.0245, "step": 71420 }, { - "epoch": 0.36, - "learning_rate": 0.00024594396880092424, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.0002722264704586281, + "loss": 0.0281, "step": 71430 }, { - "epoch": 0.36, - "learning_rate": 0.0002459364011079102, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.0002722225822422566, + "loss": 0.0317, "step": 71440 }, { - "epoch": 0.36, - "learning_rate": 0.0002459288334148962, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002722186940258851, + "loss": 0.03, "step": 71450 }, { - "epoch": 0.36, - "learning_rate": 0.00024592126572188223, - "loss": 0.0142, + "epoch": 0.19, + "learning_rate": 0.00027221480580951363, + "loss": 0.0288, "step": 71460 }, { - "epoch": 0.36, - "learning_rate": 0.0002459136980288682, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.0002722109175931422, + "loss": 0.0248, "step": 71470 }, { - "epoch": 0.36, - "learning_rate": 0.0002459061303358542, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002722070293767707, + "loss": 0.0243, "step": 71480 }, { - "epoch": 0.36, - "learning_rate": 0.0002458985626428402, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.0002722031411603993, + "loss": 0.0296, "step": 71490 }, { - "epoch": 0.36, - "learning_rate": 0.00024589099494982616, - "loss": 0.0148, + "epoch": 0.19, + "learning_rate": 0.0002721992529440278, + "loss": 0.0226, "step": 71500 }, { - "epoch": 0.36, - "learning_rate": 0.00024588342725681214, - "loss": 0.0154, + "epoch": 0.19, + "learning_rate": 0.00027219536472765637, + "loss": 0.0257, "step": 71510 }, { - "epoch": 0.36, - "learning_rate": 0.0002458758595637982, - "loss": 0.0158, + "epoch": 0.19, + "learning_rate": 0.0002721914765112849, + "loss": 0.0286, "step": 71520 }, { - "epoch": 0.36, - "learning_rate": 0.00024586829187078416, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002721875882949134, + "loss": 0.026, "step": 71530 }, { - "epoch": 0.36, - "learning_rate": 0.00024586072417777014, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002721837000785419, + "loss": 0.0317, "step": 71540 }, { - "epoch": 0.36, - "learning_rate": 0.0002458531564847561, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.0002721798118621705, + "loss": 0.0327, "step": 71550 }, { - "epoch": 0.36, - "learning_rate": 0.0002458455887917421, - "loss": 0.0136, + "epoch": 0.19, + "learning_rate": 0.00027217592364579905, + "loss": 0.023, "step": 71560 }, { - "epoch": 0.36, - "learning_rate": 0.0002458380210987281, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.00027217203542942756, + "loss": 0.024, "step": 71570 }, { - "epoch": 0.36, - "learning_rate": 0.00024583045340571407, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002721681472130561, + "loss": 0.028, "step": 71580 }, { - "epoch": 0.36, - "learning_rate": 0.0002458228857127001, - "loss": 0.0199, + "epoch": 0.19, + "learning_rate": 0.00027216425899668465, + "loss": 0.0226, "step": 71590 }, { - "epoch": 0.36, - "learning_rate": 0.0002458153180196861, - "loss": 0.0157, + "epoch": 0.19, + "learning_rate": 0.00027216037078031316, + "loss": 0.0252, "step": 71600 }, { - "epoch": 0.36, - "learning_rate": 0.00024580775032667206, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.0002721564825639417, + "loss": 0.0245, "step": 71610 }, { - "epoch": 0.36, - "learning_rate": 0.00024580018263365805, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.00027215259434757024, + "loss": 0.0229, "step": 71620 }, { - "epoch": 0.36, - "learning_rate": 0.000245792614940644, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.00027214870613119876, + "loss": 0.0209, "step": 71630 }, { - "epoch": 0.36, - "learning_rate": 0.00024578504724763, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002721448179148273, + "loss": 0.0253, "step": 71640 }, { - "epoch": 0.36, - "learning_rate": 0.00024577747955461604, - "loss": 0.0222, + "epoch": 0.19, + "learning_rate": 0.00027214092969845584, + "loss": 0.0194, "step": 71650 }, { - "epoch": 0.36, - "learning_rate": 0.000245769911861602, - "loss": 0.0182, + "epoch": 0.19, + "learning_rate": 0.00027213704148208436, + "loss": 0.0219, "step": 71660 }, { - "epoch": 0.36, - "learning_rate": 0.000245762344168588, - "loss": 0.0146, + "epoch": 0.19, + "learning_rate": 0.0002721331532657129, + "loss": 0.028, "step": 71670 }, { - "epoch": 0.36, - "learning_rate": 0.000245754776475574, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.00027212926504934144, + "loss": 0.0312, "step": 71680 }, { - "epoch": 0.36, - "learning_rate": 0.00024574720878255997, - "loss": 0.0151, + "epoch": 0.19, + "learning_rate": 0.00027212537683296995, + "loss": 0.0244, "step": 71690 }, { - "epoch": 0.36, - "learning_rate": 0.00024573964108954595, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.0002721214886165985, + "loss": 0.0225, "step": 71700 }, { - "epoch": 0.36, - "learning_rate": 0.00024573207339653193, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027211760040022704, + "loss": 0.0233, "step": 71710 }, { - "epoch": 0.36, - "learning_rate": 0.00024572450570351797, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.0002721137121838556, + "loss": 0.0271, "step": 71720 }, { - "epoch": 0.36, - "learning_rate": 0.00024571693801050395, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.0002721098239674841, + "loss": 0.0228, "step": 71730 }, { - "epoch": 0.36, - "learning_rate": 0.00024570937031748993, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.00027210593575111263, + "loss": 0.0287, "step": 71740 }, { - "epoch": 0.36, - "learning_rate": 0.0002457018026244759, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.00027210204753474115, + "loss": 0.0256, "step": 71750 }, { - "epoch": 0.36, - "learning_rate": 0.0002456942349314619, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002720981593183697, + "loss": 0.0236, "step": 71760 }, { - "epoch": 0.36, - "learning_rate": 0.0002456866672384479, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002720942711019983, + "loss": 0.031, "step": 71770 }, { - "epoch": 0.36, - "learning_rate": 0.0002456790995454339, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.0002720903828856268, + "loss": 0.0268, "step": 71780 }, { - "epoch": 0.36, - "learning_rate": 0.0002456715318524199, - "loss": 0.0152, + "epoch": 0.19, + "learning_rate": 0.0002720864946692553, + "loss": 0.0238, "step": 71790 }, { - "epoch": 0.36, - "learning_rate": 0.0002456639641594059, - "loss": 0.0157, + "epoch": 0.19, + "learning_rate": 0.0002720826064528839, + "loss": 0.0247, "step": 71800 }, { - "epoch": 0.36, - "learning_rate": 0.00024565639646639186, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.0002720787182365124, + "loss": 0.028, "step": 71810 }, { - "epoch": 0.36, - "learning_rate": 0.00024564882877337784, - "loss": 0.0197, + "epoch": 0.19, + "learning_rate": 0.0002720748300201409, + "loss": 0.0289, "step": 71820 }, { - "epoch": 0.36, - "learning_rate": 0.0002456412610803638, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.0002720709418037695, + "loss": 0.0246, "step": 71830 }, { - "epoch": 0.36, - "learning_rate": 0.00024563369338734985, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.000272067053587398, + "loss": 0.0284, "step": 71840 }, { - "epoch": 0.36, - "learning_rate": 0.00024562612569433584, - "loss": 0.0259, + "epoch": 0.19, + "learning_rate": 0.00027206316537102657, + "loss": 0.0241, "step": 71850 }, { - "epoch": 0.36, - "learning_rate": 0.0002456185580013218, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002720592771546551, + "loss": 0.0271, "step": 71860 }, { - "epoch": 0.36, - "learning_rate": 0.0002456109903083078, - "loss": 0.0149, + "epoch": 0.19, + "learning_rate": 0.0002720553889382836, + "loss": 0.0204, "step": 71870 }, { - "epoch": 0.36, - "learning_rate": 0.0002456034226152938, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.00027205150072191216, + "loss": 0.0252, "step": 71880 }, { - "epoch": 0.36, - "learning_rate": 0.00024559585492227976, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002720476125055407, + "loss": 0.0263, "step": 71890 }, { - "epoch": 0.36, - "learning_rate": 0.00024558828722926574, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.0002720437242891692, + "loss": 0.0269, "step": 71900 }, { - "epoch": 0.36, - "learning_rate": 0.0002455807195362518, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.00027203983607279776, + "loss": 0.0371, "step": 71910 }, { - "epoch": 0.36, - "learning_rate": 0.00024557315184323776, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.00027203594785642633, + "loss": 0.022, "step": 71920 }, { - "epoch": 0.36, - "learning_rate": 0.00024556558415022374, - "loss": 0.0226, + "epoch": 0.19, + "learning_rate": 0.00027203205964005484, + "loss": 0.0208, "step": 71930 }, { - "epoch": 0.36, - "learning_rate": 0.0002455580164572097, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027202817142368336, + "loss": 0.0248, "step": 71940 }, { - "epoch": 0.36, - "learning_rate": 0.0002455504487641957, - "loss": 0.0139, + "epoch": 0.19, + "learning_rate": 0.0002720242832073119, + "loss": 0.0213, "step": 71950 }, { - "epoch": 0.36, - "learning_rate": 0.0002455428810711817, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027202039499094044, + "loss": 0.0282, "step": 71960 }, { - "epoch": 0.36, - "learning_rate": 0.0002455353133781677, - "loss": 0.0159, + "epoch": 0.19, + "learning_rate": 0.00027201650677456896, + "loss": 0.025, "step": 71970 }, { - "epoch": 0.36, - "learning_rate": 0.0002455277456851537, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.0002720126185581975, + "loss": 0.0241, "step": 71980 }, { - "epoch": 0.36, - "learning_rate": 0.0002455201779921397, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.00027200873034182604, + "loss": 0.0236, "step": 71990 }, { - "epoch": 0.36, - "learning_rate": 0.00024551261029912567, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027200484212545455, + "loss": 0.0262, "step": 72000 }, { - "epoch": 0.36, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.013233224861323833, - "eval_runtime": 116.7335, - "eval_samples_per_second": 17.133, - "eval_steps_per_second": 4.283, + "epoch": 0.19, + "eval_cer": 0.8818034601824287, + "eval_loss": 0.017536072060465813, + "eval_runtime": 107.8637, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, "step": 72000 }, { - "epoch": 0.36, - "learning_rate": 0.00024550504260611165, - "loss": 0.0232, + "epoch": 0.19, + "learning_rate": 0.0002720009539090831, + "loss": 0.0243, "step": 72010 }, { - "epoch": 0.36, - "learning_rate": 0.00024549747491309763, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.00027199706569271164, + "loss": 0.0249, "step": 72020 }, { - "epoch": 0.36, - "learning_rate": 0.0002454899072200836, - "loss": 0.0155, + "epoch": 0.19, + "learning_rate": 0.00027199317747634015, + "loss": 0.0276, "step": 72030 }, { - "epoch": 0.36, - "learning_rate": 0.00024548233952706965, - "loss": 0.0159, + "epoch": 0.19, + "learning_rate": 0.0002719892892599687, + "loss": 0.0289, "step": 72040 }, { - "epoch": 0.36, - "learning_rate": 0.00024547477183405563, + "epoch": 0.19, + "learning_rate": 0.00027198540104359724, "loss": 0.0276, "step": 72050 }, { - "epoch": 0.36, - "learning_rate": 0.0002454672041410416, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.0002719815128272258, + "loss": 0.0213, "step": 72060 }, { - "epoch": 0.36, - "learning_rate": 0.0002454596364480276, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002719776246108543, + "loss": 0.0212, "step": 72070 }, { - "epoch": 0.36, - "learning_rate": 0.00024545206875501357, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.00027197373639448283, + "loss": 0.0258, "step": 72080 }, { - "epoch": 0.36, - "learning_rate": 0.00024544450106199955, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.0002719698481781114, + "loss": 0.02, "step": 72090 }, { - "epoch": 0.36, - "learning_rate": 0.0002454369333689856, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.0002719659599617399, + "loss": 0.0279, "step": 72100 }, { - "epoch": 0.36, - "learning_rate": 0.00024542936567597157, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002719620717453685, + "loss": 0.0279, "step": 72110 }, { - "epoch": 0.36, - "learning_rate": 0.00024542179798295755, - "loss": 0.0223, + "epoch": 0.19, + "learning_rate": 0.000271958183528997, + "loss": 0.0213, "step": 72120 }, { - "epoch": 0.36, - "learning_rate": 0.00024541423028994353, - "loss": 0.016, + "epoch": 0.19, + "learning_rate": 0.00027195429531262557, + "loss": 0.0213, "step": 72130 }, { - "epoch": 0.36, - "learning_rate": 0.0002454066625969295, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002719504070962541, + "loss": 0.0195, "step": 72140 }, { - "epoch": 0.36, - "learning_rate": 0.0002453990949039155, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.0002719465188798826, + "loss": 0.0314, "step": 72150 }, { - "epoch": 0.36, - "learning_rate": 0.00024539152721090153, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002719426306635111, + "loss": 0.0227, "step": 72160 }, { - "epoch": 0.36, - "learning_rate": 0.0002453839595178875, - "loss": 0.0159, + "epoch": 0.19, + "learning_rate": 0.0002719387424471397, + "loss": 0.0253, "step": 72170 }, { - "epoch": 0.36, - "learning_rate": 0.0002453763918248735, - "loss": 0.0234, + "epoch": 0.19, + "learning_rate": 0.0002719348542307682, + "loss": 0.0216, "step": 72180 }, { - "epoch": 0.36, - "learning_rate": 0.0002453688241318595, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027193096601439676, + "loss": 0.0229, "step": 72190 }, { - "epoch": 0.36, - "learning_rate": 0.00024536125643884546, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002719270777980253, + "loss": 0.0207, "step": 72200 }, { - "epoch": 0.36, - "learning_rate": 0.00024535368874583144, - "loss": 0.0159, + "epoch": 0.19, + "learning_rate": 0.0002719231895816538, + "loss": 0.0263, "step": 72210 }, { - "epoch": 0.36, - "learning_rate": 0.0002453461210528174, - "loss": 0.0206, + "epoch": 0.19, + "learning_rate": 0.00027191930136528236, + "loss": 0.0246, "step": 72220 }, { - "epoch": 0.36, - "learning_rate": 0.00024533855335980346, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.0002719154131489109, + "loss": 0.0273, "step": 72230 }, { - "epoch": 0.36, - "learning_rate": 0.00024533098566678944, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002719115249325394, + "loss": 0.0212, "step": 72240 }, { - "epoch": 0.36, - "learning_rate": 0.0002453234179737754, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027190763671616796, + "loss": 0.0273, "step": 72250 }, { - "epoch": 0.36, - "learning_rate": 0.0002453158502807614, - "loss": 0.0214, + "epoch": 0.19, + "learning_rate": 0.00027190374849979653, + "loss": 0.0264, "step": 72260 }, { - "epoch": 0.36, - "learning_rate": 0.0002453082825877474, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027189986028342504, + "loss": 0.0251, "step": 72270 }, { - "epoch": 0.36, - "learning_rate": 0.00024530071489473336, - "loss": 0.022, + "epoch": 0.19, + "learning_rate": 0.00027189597206705356, + "loss": 0.0223, "step": 72280 }, { - "epoch": 0.36, - "learning_rate": 0.00024529314720171934, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.00027189208385068207, + "loss": 0.0229, "step": 72290 }, { - "epoch": 0.36, - "learning_rate": 0.0002452855795087053, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.00027188819563431064, + "loss": 0.0206, "step": 72300 }, { - "epoch": 0.36, - "learning_rate": 0.0002452780118156913, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.00027188430741793916, + "loss": 0.0302, "step": 72310 }, { - "epoch": 0.36, - "learning_rate": 0.0002452704441226773, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.0002718804192015677, + "loss": 0.0233, "step": 72320 }, { - "epoch": 0.36, - "learning_rate": 0.0002452628764296633, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.00027187653098519624, + "loss": 0.031, "step": 72330 }, { - "epoch": 0.36, - "learning_rate": 0.0002452553087366493, - "loss": 0.0206, + "epoch": 0.19, + "learning_rate": 0.0002718726427688248, + "loss": 0.0289, "step": 72340 }, { - "epoch": 0.37, - "learning_rate": 0.0002452477410436353, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.0002718687545524533, + "loss": 0.022, "step": 72350 }, { - "epoch": 0.37, - "learning_rate": 0.00024524017335062127, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.00027186486633608184, + "loss": 0.0194, "step": 72360 }, { - "epoch": 0.37, - "learning_rate": 0.00024523260565760725, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.00027186097811971035, + "loss": 0.0236, "step": 72370 }, { - "epoch": 0.37, - "learning_rate": 0.00024522503796459323, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.0002718570899033389, + "loss": 0.0274, "step": 72380 }, { - "epoch": 0.37, - "learning_rate": 0.00024521747027157927, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027185320168696743, + "loss": 0.0198, "step": 72390 }, { - "epoch": 0.37, - "learning_rate": 0.00024520990257856525, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.000271849313470596, + "loss": 0.0251, "step": 72400 }, { - "epoch": 0.37, - "learning_rate": 0.00024520233488555123, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.0002718454252542245, + "loss": 0.0277, "step": 72410 }, { - "epoch": 0.37, - "learning_rate": 0.0002451947671925372, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.0002718415370378531, + "loss": 0.025, "step": 72420 }, { - "epoch": 0.37, - "learning_rate": 0.0002451871994995232, - "loss": 0.0172, + "epoch": 0.19, + "learning_rate": 0.0002718376488214816, + "loss": 0.0239, "step": 72430 }, { - "epoch": 0.37, - "learning_rate": 0.0002451796318065092, - "loss": 0.014, + "epoch": 0.19, + "learning_rate": 0.0002718337606051101, + "loss": 0.0236, "step": 72440 }, { - "epoch": 0.37, - "learning_rate": 0.00024517206411349516, - "loss": 0.0155, + "epoch": 0.19, + "learning_rate": 0.00027182987238873863, + "loss": 0.0201, "step": 72450 }, { - "epoch": 0.37, - "learning_rate": 0.0002451644964204812, - "loss": 0.0216, + "epoch": 0.19, + "learning_rate": 0.0002718259841723672, + "loss": 0.0253, "step": 72460 }, { - "epoch": 0.37, - "learning_rate": 0.0002451569287274672, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.00027182209595599577, + "loss": 0.0237, "step": 72470 }, { - "epoch": 0.37, - "learning_rate": 0.00024514936103445315, - "loss": 0.0172, + "epoch": 0.19, + "learning_rate": 0.0002718182077396243, + "loss": 0.0224, "step": 72480 }, { - "epoch": 0.37, - "learning_rate": 0.00024514179334143914, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.0002718143195232528, + "loss": 0.0219, "step": 72490 }, { - "epoch": 0.37, - "learning_rate": 0.0002451342256484251, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002718104313068813, + "loss": 0.026, "step": 72500 }, { - "epoch": 0.37, - "learning_rate": 0.0002451266579554111, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.0002718065430905099, + "loss": 0.0227, "step": 72510 }, { - "epoch": 0.37, - "learning_rate": 0.00024511909026239713, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002718026548741384, + "loss": 0.0285, "step": 72520 }, { - "epoch": 0.37, - "learning_rate": 0.0002451115225693831, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.00027179876665776696, + "loss": 0.0261, "step": 72530 }, { - "epoch": 0.37, - "learning_rate": 0.0002451039548763691, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.0002717948784413955, + "loss": 0.0258, "step": 72540 }, { - "epoch": 0.37, - "learning_rate": 0.0002450963871833551, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.00027179099022502405, + "loss": 0.0329, "step": 72550 }, { - "epoch": 0.37, - "learning_rate": 0.00024508881949034106, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.00027178710200865256, + "loss": 0.0234, "step": 72560 }, { - "epoch": 0.37, - "learning_rate": 0.00024508125179732704, - "loss": 0.0172, + "epoch": 0.19, + "learning_rate": 0.0002717832137922811, + "loss": 0.0279, "step": 72570 }, { - "epoch": 0.37, - "learning_rate": 0.0002450736841043131, - "loss": 0.0167, + "epoch": 0.19, + "learning_rate": 0.0002717793255759096, + "loss": 0.0297, "step": 72580 }, { - "epoch": 0.37, - "learning_rate": 0.00024506611641129906, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.00027177543735953816, + "loss": 0.0264, "step": 72590 }, { - "epoch": 0.37, - "learning_rate": 0.00024505854871828504, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.0002717715491431667, + "loss": 0.0297, "step": 72600 }, { - "epoch": 0.37, - "learning_rate": 0.000245050981025271, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027176766092679524, + "loss": 0.0237, "step": 72610 }, { - "epoch": 0.37, - "learning_rate": 0.000245043413332257, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.00027176377271042376, + "loss": 0.0294, "step": 72620 }, { - "epoch": 0.37, - "learning_rate": 0.000245035845639243, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.0002717598844940523, + "loss": 0.0236, "step": 72630 }, { - "epoch": 0.37, - "learning_rate": 0.00024502827794622897, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.00027175599627768084, + "loss": 0.03, "step": 72640 }, { - "epoch": 0.37, - "learning_rate": 0.000245020710253215, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.00027175210806130935, + "loss": 0.0274, "step": 72650 }, { - "epoch": 0.37, - "learning_rate": 0.000245013142560201, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.0002717482198449379, + "loss": 0.0272, "step": 72660 }, { - "epoch": 0.37, - "learning_rate": 0.00024500557486718696, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.00027174433162856644, + "loss": 0.0296, "step": 72670 }, { - "epoch": 0.37, - "learning_rate": 0.00024499800717417295, - "loss": 0.0239, + "epoch": 0.19, + "learning_rate": 0.000271740443412195, + "loss": 0.0211, "step": 72680 }, { - "epoch": 0.37, - "learning_rate": 0.00024499043948115893, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.0002717365551958235, + "loss": 0.0235, "step": 72690 }, { - "epoch": 0.37, - "learning_rate": 0.0002449828717881449, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027173266697945204, + "loss": 0.0234, "step": 72700 }, { - "epoch": 0.37, - "learning_rate": 0.00024497530409513094, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027172877876308055, + "loss": 0.0282, "step": 72710 }, { - "epoch": 0.37, - "learning_rate": 0.0002449677364021169, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002717248905467091, + "loss": 0.0283, "step": 72720 }, { - "epoch": 0.37, - "learning_rate": 0.0002449601687091029, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.00027172100233033763, + "loss": 0.0239, "step": 72730 }, { - "epoch": 0.37, - "learning_rate": 0.0002449526010160889, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002717171141139662, + "loss": 0.0273, "step": 72740 }, { - "epoch": 0.37, - "learning_rate": 0.00024494503332307487, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002717132258975947, + "loss": 0.0243, "step": 72750 }, { - "epoch": 0.37, - "learning_rate": 0.00024493746563006085, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002717093376812233, + "loss": 0.0236, "step": 72760 }, { - "epoch": 0.37, - "learning_rate": 0.00024492989793704683, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002717054494648518, + "loss": 0.0244, "step": 72770 }, { - "epoch": 0.37, - "learning_rate": 0.00024492233024403287, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002717015612484803, + "loss": 0.0239, "step": 72780 }, { - "epoch": 0.37, - "learning_rate": 0.00024491476255101885, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027169767303210883, + "loss": 0.032, "step": 72790 }, { - "epoch": 0.37, - "learning_rate": 0.00024490719485800483, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.0002716937848157374, + "loss": 0.0278, "step": 72800 }, { - "epoch": 0.37, - "learning_rate": 0.0002448996271649908, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.00027168989659936597, + "loss": 0.022, "step": 72810 }, { - "epoch": 0.37, - "learning_rate": 0.0002448920594719768, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.0002716860083829945, + "loss": 0.0232, "step": 72820 }, { - "epoch": 0.37, - "learning_rate": 0.0002448844917789628, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.000271682120166623, + "loss": 0.0312, "step": 72830 }, { - "epoch": 0.37, - "learning_rate": 0.0002448769240859488, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027167823195025156, + "loss": 0.0208, "step": 72840 }, { - "epoch": 0.37, - "learning_rate": 0.0002448693563929348, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.0002716743437338801, + "loss": 0.0289, "step": 72850 }, { - "epoch": 0.37, - "learning_rate": 0.0002448617886999208, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002716704555175086, + "loss": 0.0228, "step": 72860 }, { - "epoch": 0.37, - "learning_rate": 0.00024485422100690676, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027166656730113716, + "loss": 0.0246, "step": 72870 }, { - "epoch": 0.37, - "learning_rate": 0.00024484665331389274, - "loss": 0.0232, + "epoch": 0.19, + "learning_rate": 0.0002716626790847657, + "loss": 0.023, "step": 72880 }, { - "epoch": 0.37, - "learning_rate": 0.0002448390856208787, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.00027165879086839425, + "loss": 0.028, "step": 72890 }, { - "epoch": 0.37, - "learning_rate": 0.00024483151792786475, - "loss": 0.0167, + "epoch": 0.19, + "learning_rate": 0.00027165490265202276, + "loss": 0.02, "step": 72900 }, { - "epoch": 0.37, - "learning_rate": 0.00024482395023485074, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.0002716510144356513, + "loss": 0.0226, "step": 72910 }, { - "epoch": 0.37, - "learning_rate": 0.0002448163825418367, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.00027164712621927984, + "loss": 0.0234, "step": 72920 }, { - "epoch": 0.37, - "learning_rate": 0.0002448088148488227, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027164323800290836, + "loss": 0.0267, "step": 72930 }, { - "epoch": 0.37, - "learning_rate": 0.0002448012471558087, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.00027163934978653687, + "loss": 0.0315, "step": 72940 }, { - "epoch": 0.37, - "learning_rate": 0.00024479367946279466, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.00027163546157016544, + "loss": 0.0257, "step": 72950 }, { - "epoch": 0.37, - "learning_rate": 0.00024478611176978064, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.00027163157335379396, + "loss": 0.0262, "step": 72960 }, { - "epoch": 0.37, - "learning_rate": 0.0002447785440767667, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.0002716276851374225, + "loss": 0.0246, "step": 72970 }, { - "epoch": 0.37, - "learning_rate": 0.00024477097638375266, - "loss": 0.0158, + "epoch": 0.19, + "learning_rate": 0.00027162379692105104, + "loss": 0.0295, "step": 72980 }, { - "epoch": 0.37, - "learning_rate": 0.00024476340869073864, - "loss": 0.0159, + "epoch": 0.19, + "learning_rate": 0.00027161990870467955, + "loss": 0.0236, "step": 72990 }, { - "epoch": 0.37, - "learning_rate": 0.0002447558409977246, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.0002716160204883081, + "loss": 0.0234, "step": 73000 }, { - "epoch": 0.37, - "eval_cer": 0.9145197461055578, - "eval_loss": 0.013241157867014408, - "eval_runtime": 116.696, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.19, + "eval_cer": 0.88176706962214, + "eval_loss": 0.018438469618558884, + "eval_runtime": 107.9064, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, "step": 73000 }, { - "epoch": 0.37, - "learning_rate": 0.0002447482733047106, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027161213227193664, + "loss": 0.0253, "step": 73010 }, { - "epoch": 0.37, - "learning_rate": 0.0002447407056116966, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.0002716082440555652, + "loss": 0.0262, "step": 73020 }, { - "epoch": 0.37, - "learning_rate": 0.0002447331379186826, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.0002716043558391937, + "loss": 0.059, "step": 73030 }, { - "epoch": 0.37, - "learning_rate": 0.0002447255702256686, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.00027160046762282223, + "loss": 0.0958, "step": 73040 }, { - "epoch": 0.37, - "learning_rate": 0.0002447180025326546, - "loss": 0.0232, + "epoch": 0.19, + "learning_rate": 0.0002715965794064508, + "loss": 0.0285, "step": 73050 }, { - "epoch": 0.37, - "learning_rate": 0.00024471043483964057, - "loss": 0.0167, + "epoch": 0.19, + "learning_rate": 0.0002715926911900793, + "loss": 0.0338, "step": 73060 }, { - "epoch": 0.37, - "learning_rate": 0.00024470286714662655, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.00027158880297370783, + "loss": 0.0242, "step": 73070 }, { - "epoch": 0.37, - "learning_rate": 0.00024469529945361253, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.0002715849147573364, + "loss": 0.0243, "step": 73080 }, { - "epoch": 0.37, - "learning_rate": 0.00024468773176059856, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.0002715810265409649, + "loss": 0.0243, "step": 73090 }, { - "epoch": 0.37, - "learning_rate": 0.00024468016406758455, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002715771383245935, + "loss": 0.0256, "step": 73100 }, { - "epoch": 0.37, - "learning_rate": 0.00024467259637457053, - "loss": 0.0291, + "epoch": 0.19, + "learning_rate": 0.000271573250108222, + "loss": 0.0281, "step": 73110 }, { - "epoch": 0.37, - "learning_rate": 0.0002446650286815565, - "loss": 0.0198, + "epoch": 0.19, + "learning_rate": 0.0002715693618918505, + "loss": 0.0276, "step": 73120 }, { - "epoch": 0.37, - "learning_rate": 0.0002446574609885425, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002715654736754791, + "loss": 0.027, "step": 73130 }, { - "epoch": 0.37, - "learning_rate": 0.00024464989329552847, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002715615854591076, + "loss": 0.0202, "step": 73140 }, { - "epoch": 0.37, - "learning_rate": 0.00024464232560251445, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027155769724273617, + "loss": 0.0324, "step": 73150 }, { - "epoch": 0.37, - "learning_rate": 0.0002446347579095005, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.0002715538090263647, + "loss": 0.0307, "step": 73160 }, { - "epoch": 0.37, - "learning_rate": 0.00024462719021648647, - "loss": 0.0233, + "epoch": 0.19, + "learning_rate": 0.00027154992080999325, + "loss": 0.0325, "step": 73170 }, { - "epoch": 0.37, - "learning_rate": 0.00024461962252347245, - "loss": 0.0152, + "epoch": 0.19, + "learning_rate": 0.00027154603259362176, + "loss": 0.0237, "step": 73180 }, { - "epoch": 0.37, - "learning_rate": 0.00024461205483045843, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002715421443772503, + "loss": 0.0225, "step": 73190 }, { - "epoch": 0.37, - "learning_rate": 0.0002446044871374444, - "loss": 0.0244, + "epoch": 0.19, + "learning_rate": 0.0002715382561608788, + "loss": 0.0251, "step": 73200 }, { - "epoch": 0.37, - "learning_rate": 0.0002445969194444304, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.00027153436794450736, + "loss": 0.0284, "step": 73210 }, { - "epoch": 0.37, - "learning_rate": 0.00024458935175141643, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002715304797281359, + "loss": 0.0257, "step": 73220 }, { - "epoch": 0.37, - "learning_rate": 0.0002445817840584024, - "loss": 0.0149, + "epoch": 0.19, + "learning_rate": 0.00027152659151176444, + "loss": 0.0231, "step": 73230 }, { - "epoch": 0.37, - "learning_rate": 0.0002445742163653884, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027152270329539296, + "loss": 0.0222, "step": 73240 }, { - "epoch": 0.37, - "learning_rate": 0.0002445666486723744, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.0002715188150790215, + "loss": 0.0268, "step": 73250 }, { - "epoch": 0.37, - "learning_rate": 0.00024455908097936036, - "loss": 0.0158, + "epoch": 0.19, + "learning_rate": 0.00027151492686265004, + "loss": 0.0214, "step": 73260 }, { - "epoch": 0.37, - "learning_rate": 0.00024455151328634634, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.00027151103864627856, + "loss": 0.0233, "step": 73270 }, { - "epoch": 0.37, - "learning_rate": 0.0002445439455933323, - "loss": 0.014, + "epoch": 0.19, + "learning_rate": 0.00027150715042990707, + "loss": 0.0486, "step": 73280 }, { - "epoch": 0.37, - "learning_rate": 0.00024453637790031836, - "loss": 0.0207, + "epoch": 0.19, + "learning_rate": 0.00027150326221353564, + "loss": 0.0237, "step": 73290 }, { - "epoch": 0.37, - "learning_rate": 0.00024452881020730434, - "loss": 0.0232, + "epoch": 0.19, + "learning_rate": 0.0002714993739971642, + "loss": 0.019, "step": 73300 }, { - "epoch": 0.37, - "learning_rate": 0.0002445212425142903, - "loss": 0.0151, + "epoch": 0.19, + "learning_rate": 0.0002714954857807927, + "loss": 0.0259, "step": 73310 }, { - "epoch": 0.37, - "learning_rate": 0.0002445136748212763, - "loss": 0.0191, + "epoch": 0.19, + "learning_rate": 0.00027149159756442124, + "loss": 0.0289, "step": 73320 }, { - "epoch": 0.37, - "learning_rate": 0.0002445061071282623, - "loss": 0.021, + "epoch": 0.19, + "learning_rate": 0.00027148770934804975, + "loss": 0.0238, "step": 73330 }, { - "epoch": 0.37, - "learning_rate": 0.00024449853943524826, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.0002714838211316783, + "loss": 0.0284, "step": 73340 }, { - "epoch": 0.37, - "learning_rate": 0.0002444909717422343, - "loss": 0.0135, + "epoch": 0.19, + "learning_rate": 0.00027147993291530684, + "loss": 0.0258, "step": 73350 }, { - "epoch": 0.37, - "learning_rate": 0.0002444834040492203, - "loss": 0.0145, + "epoch": 0.19, + "learning_rate": 0.0002714760446989354, + "loss": 0.0265, "step": 73360 }, { - "epoch": 0.37, - "learning_rate": 0.00024447583635620626, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.0002714721564825639, + "loss": 0.0241, "step": 73370 }, { - "epoch": 0.37, - "learning_rate": 0.00024446826866319224, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.0002714682682661925, + "loss": 0.0312, "step": 73380 }, { - "epoch": 0.37, - "learning_rate": 0.0002444607009701782, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.000271464380049821, + "loss": 0.0221, "step": 73390 }, { - "epoch": 0.37, - "learning_rate": 0.0002444531332771642, - "loss": 0.0139, + "epoch": 0.19, + "learning_rate": 0.0002714604918334495, + "loss": 0.0209, "step": 73400 }, { - "epoch": 0.37, - "learning_rate": 0.00024444556558415024, - "loss": 0.014, + "epoch": 0.19, + "learning_rate": 0.00027145660361707803, + "loss": 0.026, "step": 73410 }, { - "epoch": 0.37, - "learning_rate": 0.0002444379978911362, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002714527154007066, + "loss": 0.0232, "step": 73420 }, { - "epoch": 0.37, - "learning_rate": 0.0002444304301981222, - "loss": 0.0149, + "epoch": 0.19, + "learning_rate": 0.0002714488271843351, + "loss": 0.0195, "step": 73430 }, { - "epoch": 0.37, - "learning_rate": 0.0002444228625051082, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002714449389679637, + "loss": 0.0285, "step": 73440 }, { - "epoch": 0.37, - "learning_rate": 0.00024441529481209417, - "loss": 0.0219, + "epoch": 0.19, + "learning_rate": 0.0002714410507515922, + "loss": 0.0213, "step": 73450 }, { - "epoch": 0.37, - "learning_rate": 0.00024440772711908015, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002714371625352207, + "loss": 0.027, "step": 73460 }, { - "epoch": 0.37, - "learning_rate": 0.00024440015942606613, - "loss": 0.0198, + "epoch": 0.19, + "learning_rate": 0.0002714332743188493, + "loss": 0.0263, "step": 73470 }, { - "epoch": 0.37, - "learning_rate": 0.00024439259173305217, - "loss": 0.0182, + "epoch": 0.19, + "learning_rate": 0.0002714293861024778, + "loss": 0.0242, "step": 73480 }, { - "epoch": 0.37, - "learning_rate": 0.00024438502404003815, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.0002714254978861063, + "loss": 0.0189, "step": 73490 }, { - "epoch": 0.37, - "learning_rate": 0.00024437745634702413, - "loss": 0.024, + "epoch": 0.19, + "learning_rate": 0.0002714216096697349, + "loss": 0.026, "step": 73500 }, { - "epoch": 0.37, - "learning_rate": 0.0002443698886540101, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.00027141772145336345, + "loss": 0.028, "step": 73510 }, { - "epoch": 0.37, - "learning_rate": 0.0002443623209609961, - "loss": 0.0212, + "epoch": 0.19, + "learning_rate": 0.00027141383323699196, + "loss": 0.0284, "step": 73520 }, { - "epoch": 0.37, - "learning_rate": 0.0002443547532679821, - "loss": 0.0182, + "epoch": 0.19, + "learning_rate": 0.0002714099450206205, + "loss": 0.0267, "step": 73530 }, { - "epoch": 0.37, - "learning_rate": 0.00024434718557496805, - "loss": 0.0156, + "epoch": 0.19, + "learning_rate": 0.000271406056804249, + "loss": 0.0253, "step": 73540 }, { - "epoch": 0.37, - "learning_rate": 0.00024433961788195404, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.00027140216858787756, + "loss": 0.0196, "step": 73550 }, { - "epoch": 0.37, - "learning_rate": 0.00024433205018894, - "loss": 0.0374, + "epoch": 0.19, + "learning_rate": 0.0002713982803715061, + "loss": 0.0249, "step": 73560 }, { - "epoch": 0.37, - "learning_rate": 0.000244324482495926, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.00027139439215513464, + "loss": 0.0271, "step": 73570 }, { - "epoch": 0.37, - "learning_rate": 0.00024431691480291203, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027139050393876316, + "loss": 0.0269, "step": 73580 }, { - "epoch": 0.37, - "learning_rate": 0.000244309347109898, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.0002713866157223917, + "loss": 0.0262, "step": 73590 }, { - "epoch": 0.37, - "learning_rate": 0.000244301779416884, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027138272750602024, + "loss": 0.0298, "step": 73600 }, { - "epoch": 0.37, - "learning_rate": 0.00024429421172387, - "loss": 0.0218, + "epoch": 0.19, + "learning_rate": 0.00027137883928964876, + "loss": 0.0231, "step": 73610 }, { - "epoch": 0.37, - "learning_rate": 0.00024428664403085596, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027137495107327727, + "loss": 0.0229, "step": 73620 }, { - "epoch": 0.37, - "learning_rate": 0.00024427907633784194, - "loss": 0.0197, + "epoch": 0.19, + "learning_rate": 0.00027137106285690584, + "loss": 0.0335, "step": 73630 }, { - "epoch": 0.37, - "learning_rate": 0.000244271508644828, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.00027136717464053435, + "loss": 0.0243, "step": 73640 }, { - "epoch": 0.37, - "learning_rate": 0.00024426394095181396, - "loss": 0.0201, + "epoch": 0.19, + "learning_rate": 0.0002713632864241629, + "loss": 0.026, "step": 73650 }, { - "epoch": 0.37, - "learning_rate": 0.00024425637325879994, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.00027135939820779144, + "loss": 0.0323, "step": 73660 }, { - "epoch": 0.37, - "learning_rate": 0.0002442488055657859, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027135550999142, + "loss": 0.023, "step": 73670 }, { - "epoch": 0.37, - "learning_rate": 0.0002442412378727719, - "loss": 0.0148, + "epoch": 0.19, + "learning_rate": 0.0002713516217750485, + "loss": 0.0251, "step": 73680 }, { - "epoch": 0.37, - "learning_rate": 0.0002442336701797579, - "loss": 0.0149, + "epoch": 0.19, + "learning_rate": 0.00027134773355867703, + "loss": 0.0235, "step": 73690 }, { - "epoch": 0.37, - "learning_rate": 0.00024422610248674387, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.0002713438453423056, + "loss": 0.0256, "step": 73700 }, { - "epoch": 0.37, - "learning_rate": 0.0002442185347937299, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.0002713399571259341, + "loss": 0.0254, "step": 73710 }, { - "epoch": 0.37, - "learning_rate": 0.0002442109671007159, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.0002713360689095627, + "loss": 0.0187, "step": 73720 }, { - "epoch": 0.37, - "learning_rate": 0.00024420339940770186, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002713321806931912, + "loss": 0.0275, "step": 73730 }, { - "epoch": 0.37, - "learning_rate": 0.00024419583171468785, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002713282924768197, + "loss": 0.0239, "step": 73740 }, { - "epoch": 0.37, - "learning_rate": 0.00024418826402167383, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.00027132440426044823, + "loss": 0.0231, "step": 73750 }, { - "epoch": 0.37, - "learning_rate": 0.0002441806963286598, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002713205160440768, + "loss": 0.0223, "step": 73760 }, { - "epoch": 0.37, - "learning_rate": 0.00024417312863564584, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002713166278277053, + "loss": 0.0248, "step": 73770 }, { - "epoch": 0.37, - "learning_rate": 0.0002441655609426318, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.0002713127396113339, + "loss": 0.0278, "step": 73780 }, { - "epoch": 0.37, - "learning_rate": 0.0002441579932496178, - "loss": 0.0153, + "epoch": 0.19, + "learning_rate": 0.0002713088513949624, + "loss": 0.026, "step": 73790 }, { - "epoch": 0.37, - "learning_rate": 0.0002441504255566038, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.00027130496317859097, + "loss": 0.0189, "step": 73800 }, { - "epoch": 0.37, - "learning_rate": 0.00024414285786358977, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002713010749622195, + "loss": 0.0219, "step": 73810 }, { - "epoch": 0.37, - "learning_rate": 0.00024413529017057578, - "loss": 0.0177, + "epoch": 0.19, + "learning_rate": 0.000271297186745848, + "loss": 0.026, "step": 73820 }, { - "epoch": 0.37, - "learning_rate": 0.00024412772247756176, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.0002712932985294765, + "loss": 0.0217, "step": 73830 }, { - "epoch": 0.37, - "learning_rate": 0.00024412015478454774, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.0002712894103131051, + "loss": 0.0218, "step": 73840 }, { - "epoch": 0.37, - "learning_rate": 0.00024411258709153375, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.00027128552209673365, + "loss": 0.0312, "step": 73850 }, { - "epoch": 0.37, - "learning_rate": 0.00024410501939851973, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.00027128163388036216, + "loss": 0.0279, "step": 73860 }, { - "epoch": 0.37, - "learning_rate": 0.0002440974517055057, - "loss": 0.0192, + "epoch": 0.19, + "learning_rate": 0.0002712777456639907, + "loss": 0.0234, "step": 73870 }, { - "epoch": 0.37, - "learning_rate": 0.00024408988401249172, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.00027127385744761924, + "loss": 0.0232, "step": 73880 }, { - "epoch": 0.37, - "learning_rate": 0.0002440823163194777, - "loss": 0.015, + "epoch": 0.19, + "learning_rate": 0.00027126996923124776, + "loss": 0.0226, "step": 73890 }, { - "epoch": 0.37, - "learning_rate": 0.00024407474862646368, - "loss": 0.0198, + "epoch": 0.19, + "learning_rate": 0.0002712660810148763, + "loss": 0.0224, "step": 73900 }, { - "epoch": 0.37, - "learning_rate": 0.00024406718093344967, - "loss": 0.0203, + "epoch": 0.19, + "learning_rate": 0.00027126219279850484, + "loss": 0.0251, "step": 73910 }, { - "epoch": 0.37, - "learning_rate": 0.00024405961324043567, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.00027125830458213336, + "loss": 0.0315, "step": 73920 }, { - "epoch": 0.37, - "learning_rate": 0.00024405204554742166, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002712544163657619, + "loss": 0.0274, "step": 73930 }, { - "epoch": 0.37, - "learning_rate": 0.00024404447785440764, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.00027125052814939044, + "loss": 0.026, "step": 73940 }, { - "epoch": 0.37, - "learning_rate": 0.00024403691016139365, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027124663993301895, + "loss": 0.0312, "step": 73950 }, { - "epoch": 0.37, - "learning_rate": 0.00024402934246837963, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.00027124275171664747, + "loss": 0.0209, "step": 73960 }, { - "epoch": 0.37, - "learning_rate": 0.0002440217747753656, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.00027123886350027604, + "loss": 0.0228, "step": 73970 }, { - "epoch": 0.37, - "learning_rate": 0.00024401420708235162, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.00027123497528390455, + "loss": 0.023, "step": 73980 }, { - "epoch": 0.37, - "learning_rate": 0.0002440066393893376, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.0002712310870675331, + "loss": 0.024, "step": 73990 }, { - "epoch": 0.37, - "learning_rate": 0.00024399907169632358, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027122719885116164, + "loss": 0.0253, "step": 74000 }, { - "epoch": 0.37, - "eval_cer": 0.9144848118450433, - "eval_loss": 0.012880527414381504, - "eval_runtime": 116.6543, - "eval_samples_per_second": 17.145, - "eval_steps_per_second": 4.286, + "epoch": 0.19, + "eval_cer": 0.8818370514688489, + "eval_loss": 0.018291616812348366, + "eval_runtime": 108.0408, + "eval_samples_per_second": 18.512, + "eval_steps_per_second": 4.628, "step": 74000 }, { - "epoch": 0.37, - "learning_rate": 0.0002439915040033096, - "loss": 0.0215, + "epoch": 0.19, + "learning_rate": 0.0002712233106347902, + "loss": 0.0218, "step": 74010 }, { - "epoch": 0.37, - "learning_rate": 0.00024398393631029557, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.0002712194224184187, + "loss": 0.03, "step": 74020 }, { - "epoch": 0.37, - "learning_rate": 0.00024397636861728155, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027121553420204723, + "loss": 0.025, "step": 74030 }, { - "epoch": 0.37, - "learning_rate": 0.00024396880092426756, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.00027121164598567575, + "loss": 0.0264, "step": 74040 }, { - "epoch": 0.37, - "learning_rate": 0.00024396123323125354, - "loss": 0.0164, + "epoch": 0.19, + "learning_rate": 0.0002712077577693043, + "loss": 0.0199, "step": 74050 }, { - "epoch": 0.37, - "learning_rate": 0.00024395366553823952, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.0002712038695529329, + "loss": 0.029, "step": 74060 }, { - "epoch": 0.37, - "learning_rate": 0.00024394609784522553, - "loss": 0.016, + "epoch": 0.19, + "learning_rate": 0.0002711999813365614, + "loss": 0.0227, "step": 74070 }, { - "epoch": 0.37, - "learning_rate": 0.0002439385301522115, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002711960931201899, + "loss": 0.0317, "step": 74080 }, { - "epoch": 0.37, - "learning_rate": 0.0002439309624591975, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.0002711922049038185, + "loss": 0.0344, "step": 74090 }, { - "epoch": 0.37, - "learning_rate": 0.00024392339476618348, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.000271188316687447, + "loss": 0.0263, "step": 74100 }, { - "epoch": 0.37, - "learning_rate": 0.00024391582707316948, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.0002711844284710755, + "loss": 0.0234, "step": 74110 }, { - "epoch": 0.37, - "learning_rate": 0.00024390825938015547, - "loss": 0.0197, + "epoch": 0.19, + "learning_rate": 0.0002711805402547041, + "loss": 0.0211, "step": 74120 }, { - "epoch": 0.37, - "learning_rate": 0.00024390069168714145, - "loss": 0.0172, + "epoch": 0.19, + "learning_rate": 0.0002711766520383326, + "loss": 0.0246, "step": 74130 }, { - "epoch": 0.37, - "learning_rate": 0.00024389312399412746, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.00027117276382196116, + "loss": 0.0197, "step": 74140 }, { - "epoch": 0.37, - "learning_rate": 0.00024388555630111344, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.0002711688756055897, + "loss": 0.0255, "step": 74150 }, { - "epoch": 0.37, - "learning_rate": 0.00024387798860809942, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.0002711649873892182, + "loss": 0.0242, "step": 74160 }, { - "epoch": 0.37, - "learning_rate": 0.00024387042091508543, - "loss": 0.015, + "epoch": 0.19, + "learning_rate": 0.00027116109917284676, + "loss": 0.0246, "step": 74170 }, { - "epoch": 0.37, - "learning_rate": 0.0002438628532220714, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.0002711572109564753, + "loss": 0.0192, "step": 74180 }, { - "epoch": 0.37, - "learning_rate": 0.0002438552855290574, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.0002711533227401038, + "loss": 0.0227, "step": 74190 }, { - "epoch": 0.37, - "learning_rate": 0.0002438477178360434, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.00027114943452373236, + "loss": 0.0238, "step": 74200 }, { - "epoch": 0.37, - "learning_rate": 0.00024384015014302938, - "loss": 0.0182, + "epoch": 0.19, + "learning_rate": 0.0002711455463073609, + "loss": 0.0252, "step": 74210 }, { - "epoch": 0.37, - "learning_rate": 0.00024383258245001536, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027114165809098944, + "loss": 0.024, "step": 74220 }, { - "epoch": 0.37, - "learning_rate": 0.00024382501475700137, - "loss": 0.0242, + "epoch": 0.19, + "learning_rate": 0.00027113776987461796, + "loss": 0.0205, "step": 74230 }, { - "epoch": 0.37, - "learning_rate": 0.00024381744706398735, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.00027113388165824647, + "loss": 0.0236, "step": 74240 }, { - "epoch": 0.37, - "learning_rate": 0.00024380987937097333, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027112999344187504, + "loss": 0.0231, "step": 74250 }, { - "epoch": 0.37, - "learning_rate": 0.00024380231167795931, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.00027112610522550356, + "loss": 0.0226, "step": 74260 }, { - "epoch": 0.37, - "learning_rate": 0.00024379474398494532, - "loss": 0.0148, + "epoch": 0.19, + "learning_rate": 0.0002711222170091321, + "loss": 0.0251, "step": 74270 }, { - "epoch": 0.37, - "learning_rate": 0.0002437871762919313, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027111832879276064, + "loss": 0.024, "step": 74280 }, { - "epoch": 0.37, - "learning_rate": 0.00024377960859891729, - "loss": 0.0166, + "epoch": 0.19, + "learning_rate": 0.00027111444057638915, + "loss": 0.0223, "step": 74290 }, { - "epoch": 0.37, - "learning_rate": 0.0002437720409059033, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002711105523600177, + "loss": 0.0217, "step": 74300 }, { - "epoch": 0.37, - "learning_rate": 0.00024376447321288928, - "loss": 0.0141, + "epoch": 0.19, + "learning_rate": 0.00027110666414364624, + "loss": 0.0252, "step": 74310 }, { - "epoch": 0.37, - "learning_rate": 0.00024375690551987526, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027110277592727475, + "loss": 0.0228, "step": 74320 }, { - "epoch": 0.38, - "learning_rate": 0.00024374933782686127, - "loss": 0.0209, + "epoch": 0.19, + "learning_rate": 0.0002710988877109033, + "loss": 0.0239, "step": 74330 }, { - "epoch": 0.38, - "learning_rate": 0.00024374177013384725, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.0002710949994945319, + "loss": 0.0257, "step": 74340 }, { - "epoch": 0.38, - "learning_rate": 0.00024373420244083323, - "loss": 0.0157, + "epoch": 0.19, + "learning_rate": 0.0002710911112781604, + "loss": 0.0287, "step": 74350 }, { - "epoch": 0.38, - "learning_rate": 0.00024372663474781924, - "loss": 0.0167, + "epoch": 0.19, + "learning_rate": 0.0002710872230617889, + "loss": 0.0217, "step": 74360 }, { - "epoch": 0.38, - "learning_rate": 0.00024371906705480522, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.00027108333484541743, + "loss": 0.0289, "step": 74370 }, { - "epoch": 0.38, - "learning_rate": 0.0002437114993617912, - "loss": 0.0158, + "epoch": 0.19, + "learning_rate": 0.000271079446629046, + "loss": 0.0211, "step": 74380 }, { - "epoch": 0.38, - "learning_rate": 0.0002437039316687772, - "loss": 0.0216, + "epoch": 0.19, + "learning_rate": 0.0002710755584126745, + "loss": 0.0262, "step": 74390 }, { - "epoch": 0.38, - "learning_rate": 0.0002436963639757632, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.0002710716701963031, + "loss": 0.0212, "step": 74400 }, { - "epoch": 0.38, - "learning_rate": 0.00024368879628274917, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.0002710677819799316, + "loss": 0.0295, "step": 74410 }, { - "epoch": 0.38, - "learning_rate": 0.00024368122858973515, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.00027106389376356017, + "loss": 0.0229, "step": 74420 }, { - "epoch": 0.38, - "learning_rate": 0.00024367366089672116, - "loss": 0.0231, + "epoch": 0.19, + "learning_rate": 0.0002710600055471887, + "loss": 0.0237, "step": 74430 }, { - "epoch": 0.38, - "learning_rate": 0.00024366609320370714, - "loss": 0.0163, + "epoch": 0.19, + "learning_rate": 0.0002710561173308172, + "loss": 0.022, "step": 74440 }, { - "epoch": 0.38, - "learning_rate": 0.00024365852551069312, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002710522291144457, + "loss": 0.0258, "step": 74450 }, { - "epoch": 0.38, - "learning_rate": 0.00024365095781767913, + "epoch": 0.19, + "learning_rate": 0.0002710483408980743, "loss": 0.0225, "step": 74460 }, { - "epoch": 0.38, - "learning_rate": 0.00024364339012466511, - "loss": 0.0206, + "epoch": 0.19, + "learning_rate": 0.0002710444526817028, + "loss": 0.0241, "step": 74470 }, { - "epoch": 0.38, - "learning_rate": 0.0002436358224316511, - "loss": 0.0202, + "epoch": 0.19, + "learning_rate": 0.00027104056446533136, + "loss": 0.0224, "step": 74480 }, { - "epoch": 0.38, - "learning_rate": 0.0002436282547386371, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.0002710366762489599, + "loss": 0.0221, "step": 74490 }, { - "epoch": 0.38, - "learning_rate": 0.00024362068704562309, - "loss": 0.0195, + "epoch": 0.19, + "learning_rate": 0.0002710327880325884, + "loss": 0.0256, "step": 74500 }, { - "epoch": 0.38, - "learning_rate": 0.00024361311935260907, - "loss": 0.0196, + "epoch": 0.19, + "learning_rate": 0.00027102889981621696, + "loss": 0.0215, "step": 74510 }, { - "epoch": 0.38, - "learning_rate": 0.00024360555165959508, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002710250115998455, + "loss": 0.0243, "step": 74520 }, { - "epoch": 0.38, - "learning_rate": 0.00024359798396658106, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.000271021123383474, + "loss": 0.0276, "step": 74530 }, { - "epoch": 0.38, - "learning_rate": 0.00024359041627356704, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.00027101723516710256, + "loss": 0.0257, "step": 74540 }, { - "epoch": 0.38, - "learning_rate": 0.00024358284858055305, - "loss": 0.0216, + "epoch": 0.19, + "learning_rate": 0.0002710133469507311, + "loss": 0.0221, "step": 74550 }, { - "epoch": 0.38, - "learning_rate": 0.00024357528088753903, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.00027100945873435964, + "loss": 0.0205, "step": 74560 }, { - "epoch": 0.38, - "learning_rate": 0.000243567713194525, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027100557051798816, + "loss": 0.0243, "step": 74570 }, { - "epoch": 0.38, - "learning_rate": 0.00024356014550151102, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.00027100168230161667, + "loss": 0.0241, "step": 74580 }, { - "epoch": 0.38, - "learning_rate": 0.000243552577808497, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027099779408524524, + "loss": 0.0225, "step": 74590 }, { - "epoch": 0.38, - "learning_rate": 0.00024354501011548298, - "loss": 0.0183, + "epoch": 0.19, + "learning_rate": 0.00027099390586887375, + "loss": 0.0258, "step": 74600 }, { - "epoch": 0.38, - "learning_rate": 0.00024353744242246896, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.0002709900176525023, + "loss": 0.0232, "step": 74610 }, { - "epoch": 0.38, - "learning_rate": 0.00024352987472945497, - "loss": 0.0213, + "epoch": 0.19, + "learning_rate": 0.00027098612943613084, + "loss": 0.0261, "step": 74620 }, { - "epoch": 0.38, - "learning_rate": 0.00024352230703644095, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.0002709822412197594, + "loss": 0.0293, "step": 74630 }, { - "epoch": 0.38, - "learning_rate": 0.00024351473934342693, - "loss": 0.0194, + "epoch": 0.19, + "learning_rate": 0.0002709783530033879, + "loss": 0.0216, "step": 74640 }, { - "epoch": 0.38, - "learning_rate": 0.00024350717165041294, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027097446478701644, + "loss": 0.0237, "step": 74650 }, { - "epoch": 0.38, - "learning_rate": 0.00024349960395739892, - "loss": 0.0214, + "epoch": 0.19, + "learning_rate": 0.00027097057657064495, + "loss": 0.0264, "step": 74660 }, { - "epoch": 0.38, - "learning_rate": 0.0002434920362643849, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002709666883542735, + "loss": 0.0215, "step": 74670 }, { - "epoch": 0.38, - "learning_rate": 0.00024348446857137091, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.00027096280013790203, + "loss": 0.026, "step": 74680 }, { - "epoch": 0.38, - "learning_rate": 0.0002434769008783569, - "loss": 0.0165, + "epoch": 0.19, + "learning_rate": 0.0002709589119215306, + "loss": 0.0278, "step": 74690 }, { - "epoch": 0.38, - "learning_rate": 0.00024346933318534288, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.0002709550237051591, + "loss": 0.0263, "step": 74700 }, { - "epoch": 0.38, - "learning_rate": 0.00024346176549232889, - "loss": 0.0171, + "epoch": 0.19, + "learning_rate": 0.00027095113548878763, + "loss": 0.0221, "step": 74710 }, { - "epoch": 0.38, - "learning_rate": 0.00024345419779931487, - "loss": 0.0178, + "epoch": 0.19, + "learning_rate": 0.0002709472472724162, + "loss": 0.0199, "step": 74720 }, { - "epoch": 0.38, - "learning_rate": 0.00024344663010630085, - "loss": 0.017, + "epoch": 0.19, + "learning_rate": 0.0002709433590560447, + "loss": 0.0344, "step": 74730 }, { - "epoch": 0.38, - "learning_rate": 0.00024343906241328686, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002709394708396733, + "loss": 0.0208, "step": 74740 }, { - "epoch": 0.38, - "learning_rate": 0.00024343149472027284, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.0002709355826233018, + "loss": 0.0255, "step": 74750 }, { - "epoch": 0.38, - "learning_rate": 0.00024342392702725882, - "loss": 0.0185, + "epoch": 0.19, + "learning_rate": 0.00027093169440693037, + "loss": 0.0226, "step": 74760 }, { - "epoch": 0.38, - "learning_rate": 0.0002434163593342448, - "loss": 0.0179, + "epoch": 0.19, + "learning_rate": 0.0002709278061905589, + "loss": 0.0227, "step": 74770 }, { - "epoch": 0.38, - "learning_rate": 0.0002434087916412308, - "loss": 0.0176, + "epoch": 0.19, + "learning_rate": 0.0002709239179741874, + "loss": 0.03, "step": 74780 }, { - "epoch": 0.38, - "learning_rate": 0.00024340122394821676, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002709200297578159, + "loss": 0.0244, "step": 74790 }, { - "epoch": 0.38, - "learning_rate": 0.00024339365625520275, - "loss": 0.0175, + "epoch": 0.19, + "learning_rate": 0.0002709161415414445, + "loss": 0.024, "step": 74800 }, { - "epoch": 0.38, - "learning_rate": 0.00024338608856218873, - "loss": 0.0168, + "epoch": 0.19, + "learning_rate": 0.000270912253325073, + "loss": 0.0225, "step": 74810 }, { - "epoch": 0.38, - "learning_rate": 0.00024337852086917474, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.00027090836510870156, + "loss": 0.0248, "step": 74820 }, { - "epoch": 0.38, - "learning_rate": 0.00024337095317616072, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.0002709044768923301, + "loss": 0.027, "step": 74830 }, { - "epoch": 0.38, - "learning_rate": 0.0002433633854831467, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.00027090058867595864, + "loss": 0.0234, "step": 74840 }, { - "epoch": 0.38, - "learning_rate": 0.0002433558177901327, - "loss": 0.0167, + "epoch": 0.19, + "learning_rate": 0.00027089670045958716, + "loss": 0.0226, "step": 74850 }, { - "epoch": 0.38, - "learning_rate": 0.0002433482500971187, - "loss": 0.0211, + "epoch": 0.19, + "learning_rate": 0.0002708928122432157, + "loss": 0.0232, "step": 74860 }, { - "epoch": 0.38, - "learning_rate": 0.00024334068240410467, - "loss": 0.0193, + "epoch": 0.19, + "learning_rate": 0.0002708889240268442, + "loss": 0.0217, "step": 74870 }, { - "epoch": 0.38, - "learning_rate": 0.00024333311471109068, - "loss": 0.0197, + "epoch": 0.19, + "learning_rate": 0.00027088503581047276, + "loss": 0.0247, "step": 74880 }, { - "epoch": 0.38, - "learning_rate": 0.00024332554701807666, - "loss": 0.0151, + "epoch": 0.19, + "learning_rate": 0.0002708811475941013, + "loss": 0.025, "step": 74890 }, { - "epoch": 0.38, - "learning_rate": 0.00024331797932506264, - "loss": 0.0191, + "epoch": 0.19, + "learning_rate": 0.00027087725937772984, + "loss": 0.0283, "step": 74900 }, { - "epoch": 0.38, - "learning_rate": 0.00024331041163204865, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.00027087337116135836, + "loss": 0.0281, "step": 74910 }, { - "epoch": 0.38, - "learning_rate": 0.00024330284393903463, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.0002708694829449869, + "loss": 0.0219, "step": 74920 }, { - "epoch": 0.38, - "learning_rate": 0.00024329527624602061, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.00027086559472861544, + "loss": 0.0246, "step": 74930 }, { - "epoch": 0.38, - "learning_rate": 0.00024328770855300662, - "loss": 0.0187, + "epoch": 0.19, + "learning_rate": 0.00027086170651224395, + "loss": 0.0287, "step": 74940 }, { - "epoch": 0.38, - "learning_rate": 0.0002432801408599926, - "loss": 0.0184, + "epoch": 0.19, + "learning_rate": 0.0002708578182958725, + "loss": 0.0302, "step": 74950 }, { - "epoch": 0.38, - "learning_rate": 0.00024327257316697859, - "loss": 0.0186, + "epoch": 0.19, + "learning_rate": 0.00027085393007950104, + "loss": 0.0209, "step": 74960 }, { - "epoch": 0.38, - "learning_rate": 0.0002432650054739646, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.0002708500418631296, + "loss": 0.0235, "step": 74970 }, { - "epoch": 0.38, - "learning_rate": 0.00024325743778095058, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.0002708461536467581, + "loss": 0.0288, "step": 74980 }, { - "epoch": 0.38, - "learning_rate": 0.00024324987008793656, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027084226543038663, + "loss": 0.0222, "step": 74990 }, { - "epoch": 0.38, - "learning_rate": 0.00024324230239492254, - "loss": 0.0191, + "epoch": 0.19, + "learning_rate": 0.00027083837721401515, + "loss": 0.0261, "step": 75000 }, { - "epoch": 0.38, - "eval_cer": 0.9144935454101719, - "eval_loss": 0.013869182206690311, - "eval_runtime": 116.7861, - "eval_samples_per_second": 17.125, - "eval_steps_per_second": 4.281, + "epoch": 0.19, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.017617717385292053, + "eval_runtime": 107.5409, + "eval_samples_per_second": 18.598, + "eval_steps_per_second": 4.649, "step": 75000 }, { - "epoch": 0.38, - "learning_rate": 0.00024323473470190855, - "loss": 0.0208, + "epoch": 0.19, + "learning_rate": 0.0002708344889976437, + "loss": 0.0273, "step": 75010 }, { - "epoch": 0.38, - "learning_rate": 0.00024322716700889453, - "loss": 0.0217, + "epoch": 0.19, + "learning_rate": 0.00027083060078127223, + "loss": 0.0304, "step": 75020 }, { - "epoch": 0.38, - "learning_rate": 0.0002432195993158805, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002708267125649008, + "loss": 0.0268, "step": 75030 }, { - "epoch": 0.38, - "learning_rate": 0.00024321203162286652, - "loss": 0.0162, + "epoch": 0.19, + "learning_rate": 0.0002708228243485293, + "loss": 0.0246, "step": 75040 }, { - "epoch": 0.38, - "learning_rate": 0.0002432044639298525, - "loss": 0.0242, + "epoch": 0.19, + "learning_rate": 0.0002708189361321579, + "loss": 0.0229, "step": 75050 }, { - "epoch": 0.38, - "learning_rate": 0.00024319689623683848, - "loss": 0.019, + "epoch": 0.19, + "learning_rate": 0.0002708150479157864, + "loss": 0.0187, "step": 75060 }, { - "epoch": 0.38, - "learning_rate": 0.0002431893285438245, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.0002708111596994149, + "loss": 0.021, "step": 75070 }, { - "epoch": 0.38, - "learning_rate": 0.00024318176085081047, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.00027080727148304343, + "loss": 0.0253, "step": 75080 }, { - "epoch": 0.38, - "learning_rate": 0.00024317419315779645, - "loss": 0.0173, + "epoch": 0.19, + "learning_rate": 0.000270803383266672, + "loss": 0.0316, "step": 75090 }, { - "epoch": 0.38, - "learning_rate": 0.00024316662546478246, - "loss": 0.0189, + "epoch": 0.19, + "learning_rate": 0.00027079949505030056, + "loss": 0.0222, "step": 75100 }, { - "epoch": 0.38, - "learning_rate": 0.00024315905777176844, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.0002707956068339291, + "loss": 0.0262, "step": 75110 }, { - "epoch": 0.38, - "learning_rate": 0.00024315149007875442, - "loss": 0.0204, + "epoch": 0.19, + "learning_rate": 0.0002707917186175576, + "loss": 0.0212, "step": 75120 }, { - "epoch": 0.38, - "learning_rate": 0.00024314392238574043, - "loss": 0.0199, + "epoch": 0.19, + "learning_rate": 0.00027078783040118616, + "loss": 0.0282, "step": 75130 }, { - "epoch": 0.38, - "learning_rate": 0.00024313635469272641, - "loss": 0.0169, + "epoch": 0.19, + "learning_rate": 0.0002707839421848147, + "loss": 0.0218, "step": 75140 }, { - "epoch": 0.38, - "learning_rate": 0.0002431287869997124, - "loss": 0.0174, + "epoch": 0.19, + "learning_rate": 0.0002707800539684432, + "loss": 0.0212, "step": 75150 }, { - "epoch": 0.38, - "learning_rate": 0.00024312121930669838, - "loss": 0.02, + "epoch": 0.19, + "learning_rate": 0.00027077616575207176, + "loss": 0.0256, "step": 75160 }, { - "epoch": 0.38, - "learning_rate": 0.00024311365161368439, - "loss": 0.0205, + "epoch": 0.19, + "learning_rate": 0.0002707722775357003, + "loss": 0.0209, "step": 75170 }, { - "epoch": 0.38, - "learning_rate": 0.00024310608392067037, - "loss": 0.0188, + "epoch": 0.19, + "learning_rate": 0.00027076838931932884, + "loss": 0.0254, "step": 75180 }, { - "epoch": 0.38, - "learning_rate": 0.00024309851622765635, - "loss": 0.0221, + "epoch": 0.19, + "learning_rate": 0.00027076450110295736, + "loss": 0.0281, "step": 75190 }, { - "epoch": 0.38, - "learning_rate": 0.00024309094853464236, - "loss": 0.0181, + "epoch": 0.19, + "learning_rate": 0.00027076061288658587, + "loss": 0.027, "step": 75200 }, { - "epoch": 0.38, - "learning_rate": 0.00024308338084162834, - "loss": 0.018, + "epoch": 0.19, + "learning_rate": 0.0002707567246702144, + "loss": 0.0245, "step": 75210 }, { - "epoch": 0.38, - "learning_rate": 0.00024307581314861432, - "loss": 0.0225, + "epoch": 0.19, + "learning_rate": 0.00027075283645384296, + "loss": 0.0248, "step": 75220 }, { - "epoch": 0.38, - "learning_rate": 0.00024306824545560033, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.00027074894823747147, + "loss": 0.0269, "step": 75230 }, { - "epoch": 0.38, - "learning_rate": 0.0002430606777625863, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027074506002110004, + "loss": 0.0242, "step": 75240 }, { - "epoch": 0.38, - "learning_rate": 0.0002430531100695723, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00027074117180472855, + "loss": 0.0269, "step": 75250 }, { - "epoch": 0.38, - "learning_rate": 0.0002430455423765583, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.0002707372835883571, + "loss": 0.026, "step": 75260 }, { - "epoch": 0.38, - "learning_rate": 0.00024303797468354428, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.00027073339537198564, + "loss": 0.0225, "step": 75270 }, { - "epoch": 0.38, - "learning_rate": 0.00024303040699053026, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.00027072950715561415, + "loss": 0.0253, "step": 75280 }, { - "epoch": 0.38, - "learning_rate": 0.00024302283929751627, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002707256189392427, + "loss": 0.0256, "step": 75290 }, { - "epoch": 0.38, - "learning_rate": 0.00024301527160450225, - "loss": 0.0194, + "epoch": 0.2, + "learning_rate": 0.00027072173072287123, + "loss": 0.0255, "step": 75300 }, { - "epoch": 0.38, - "learning_rate": 0.00024300770391148823, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.0002707178425064998, + "loss": 0.0228, "step": 75310 }, { - "epoch": 0.38, - "learning_rate": 0.00024300013621847422, - "loss": 0.0145, + "epoch": 0.2, + "learning_rate": 0.0002707139542901283, + "loss": 0.026, "step": 75320 }, { - "epoch": 0.38, - "learning_rate": 0.00024299256852546022, - "loss": 0.0141, + "epoch": 0.2, + "learning_rate": 0.00027071006607375683, + "loss": 0.0263, "step": 75330 }, { - "epoch": 0.38, - "learning_rate": 0.0002429850008324462, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.0002707061778573854, + "loss": 0.0239, "step": 75340 }, { - "epoch": 0.38, - "learning_rate": 0.0002429774331394322, - "loss": 0.0232, + "epoch": 0.2, + "learning_rate": 0.0002707022896410139, + "loss": 0.0314, "step": 75350 }, { - "epoch": 0.38, - "learning_rate": 0.0002429698654464182, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.00027069840142464243, + "loss": 0.0213, "step": 75360 }, { - "epoch": 0.38, - "learning_rate": 0.00024296229775340418, - "loss": 0.0148, + "epoch": 0.2, + "learning_rate": 0.000270694513208271, + "loss": 0.0265, "step": 75370 }, { - "epoch": 0.38, - "learning_rate": 0.00024295473006039016, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002706906249918995, + "loss": 0.025, "step": 75380 }, { - "epoch": 0.38, - "learning_rate": 0.00024294716236737617, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.0002706867367755281, + "loss": 0.0244, "step": 75390 }, { - "epoch": 0.38, - "learning_rate": 0.00024293959467436215, - "loss": 0.0162, + "epoch": 0.2, + "learning_rate": 0.0002706828485591566, + "loss": 0.0243, "step": 75400 }, { - "epoch": 0.38, - "learning_rate": 0.00024293202698134813, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002706789603427851, + "loss": 0.0262, "step": 75410 }, { - "epoch": 0.38, - "learning_rate": 0.00024292445928833414, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002706750721264137, + "loss": 0.0208, "step": 75420 }, { - "epoch": 0.38, - "learning_rate": 0.00024291689159532012, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002706711839100422, + "loss": 0.0218, "step": 75430 }, { - "epoch": 0.38, - "learning_rate": 0.0002429093239023061, - "loss": 0.0187, + "epoch": 0.2, + "learning_rate": 0.00027066729569367076, + "loss": 0.0266, "step": 75440 }, { - "epoch": 0.38, - "learning_rate": 0.0002429017562092921, - "loss": 0.0137, + "epoch": 0.2, + "learning_rate": 0.0002706634074772993, + "loss": 0.0226, "step": 75450 }, { - "epoch": 0.38, - "learning_rate": 0.0002428941885162781, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.0002706595192609278, + "loss": 0.0269, "step": 75460 }, { - "epoch": 0.38, - "learning_rate": 0.00024288662082326407, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.00027065563104455636, + "loss": 0.0266, "step": 75470 }, { - "epoch": 0.38, - "learning_rate": 0.00024287905313025008, - "loss": 0.0231, + "epoch": 0.2, + "learning_rate": 0.0002706517428281849, + "loss": 0.0259, "step": 75480 }, { - "epoch": 0.38, - "learning_rate": 0.00024287148543723606, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.0002706478546118134, + "loss": 0.0221, "step": 75490 }, { - "epoch": 0.38, - "learning_rate": 0.00024286391774422204, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.00027064396639544196, + "loss": 0.0263, "step": 75500 }, { - "epoch": 0.38, - "learning_rate": 0.00024285635005120803, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.0002706400781790705, + "loss": 0.0281, "step": 75510 }, { - "epoch": 0.38, - "learning_rate": 0.00024284878235819403, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.00027063618996269904, + "loss": 0.0217, "step": 75520 }, { - "epoch": 0.38, - "learning_rate": 0.00024284121466518002, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.00027063230174632756, + "loss": 0.0242, "step": 75530 }, { - "epoch": 0.38, - "learning_rate": 0.000242833646972166, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027062841352995607, + "loss": 0.026, "step": 75540 }, { - "epoch": 0.38, - "learning_rate": 0.000242826079279152, - "loss": 0.0158, + "epoch": 0.2, + "learning_rate": 0.00027062452531358464, + "loss": 0.0252, "step": 75550 }, { - "epoch": 0.38, - "learning_rate": 0.000242818511586138, - "loss": 0.0201, + "epoch": 0.2, + "learning_rate": 0.00027062063709721315, + "loss": 0.0263, "step": 75560 }, { - "epoch": 0.38, - "learning_rate": 0.00024281094389312397, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.00027061674888084167, + "loss": 0.021, "step": 75570 }, { - "epoch": 0.38, - "learning_rate": 0.00024280337620010998, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.00027061286066447024, + "loss": 0.0246, "step": 75580 }, { - "epoch": 0.38, - "learning_rate": 0.00024279580850709596, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.0002706089724480988, + "loss": 0.0261, "step": 75590 }, { - "epoch": 0.38, - "learning_rate": 0.00024278824081408194, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002706050842317273, + "loss": 0.0371, "step": 75600 }, { - "epoch": 0.38, - "learning_rate": 0.00024278067312106795, - "loss": 0.0191, + "epoch": 0.2, + "learning_rate": 0.00027060119601535584, + "loss": 0.0294, "step": 75610 }, { - "epoch": 0.38, - "learning_rate": 0.00024277310542805393, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00027059730779898435, + "loss": 0.0215, "step": 75620 }, { - "epoch": 0.38, - "learning_rate": 0.0002427655377350399, - "loss": 0.0191, + "epoch": 0.2, + "learning_rate": 0.0002705934195826129, + "loss": 0.0237, "step": 75630 }, { - "epoch": 0.38, - "learning_rate": 0.00024275797004202592, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00027058953136624143, + "loss": 0.0228, "step": 75640 }, { - "epoch": 0.38, - "learning_rate": 0.0002427504023490119, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.00027058564314987, + "loss": 0.0233, "step": 75650 }, { - "epoch": 0.38, - "learning_rate": 0.00024274283465599788, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.0002705817549334985, + "loss": 0.0231, "step": 75660 }, { - "epoch": 0.38, - "learning_rate": 0.00024273526696298386, - "loss": 0.0238, + "epoch": 0.2, + "learning_rate": 0.0002705778667171271, + "loss": 0.0231, "step": 75670 }, { - "epoch": 0.38, - "learning_rate": 0.00024272769926996987, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.0002705739785007556, + "loss": 0.0245, "step": 75680 }, { - "epoch": 0.38, - "learning_rate": 0.00024272013157695585, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.0002705700902843841, + "loss": 0.0199, "step": 75690 }, { - "epoch": 0.38, - "learning_rate": 0.00024271256388394184, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.00027056620206801263, + "loss": 0.0215, "step": 75700 }, { - "epoch": 0.38, - "learning_rate": 0.00024270499619092784, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.0002705623138516412, + "loss": 0.0222, "step": 75710 }, { - "epoch": 0.38, - "learning_rate": 0.00024269742849791383, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.0002705584256352697, + "loss": 0.0256, "step": 75720 }, { - "epoch": 0.38, - "learning_rate": 0.0002426898608048998, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.0002705545374188983, + "loss": 0.024, "step": 75730 }, { - "epoch": 0.38, - "learning_rate": 0.00024268229311188582, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002705506492025268, + "loss": 0.0255, "step": 75740 }, { - "epoch": 0.38, - "learning_rate": 0.0002426747254188718, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002705467609861553, + "loss": 0.0294, "step": 75750 }, { - "epoch": 0.38, - "learning_rate": 0.00024266715772585778, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002705428727697839, + "loss": 0.0229, "step": 75760 }, { - "epoch": 0.38, - "learning_rate": 0.0002426595900328438, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.0002705389845534124, + "loss": 0.0271, "step": 75770 }, { - "epoch": 0.38, - "learning_rate": 0.00024265202233982977, - "loss": 0.0161, + "epoch": 0.2, + "learning_rate": 0.0002705350963370409, + "loss": 0.0217, "step": 75780 }, { - "epoch": 0.38, - "learning_rate": 0.00024264445464681575, - "loss": 0.0233, + "epoch": 0.2, + "learning_rate": 0.0002705312081206695, + "loss": 0.0213, "step": 75790 }, { - "epoch": 0.38, - "learning_rate": 0.00024263688695380176, - "loss": 0.0207, + "epoch": 0.2, + "learning_rate": 0.00027052731990429805, + "loss": 0.0218, "step": 75800 }, { - "epoch": 0.38, - "learning_rate": 0.00024262931926078774, - "loss": 0.0291, + "epoch": 0.2, + "learning_rate": 0.00027052343168792656, + "loss": 0.0227, "step": 75810 }, { - "epoch": 0.38, - "learning_rate": 0.00024262175156777372, - "loss": 0.0234, + "epoch": 0.2, + "learning_rate": 0.0002705195434715551, + "loss": 0.0246, "step": 75820 }, { - "epoch": 0.38, - "learning_rate": 0.0002426141838747597, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002705156552551836, + "loss": 0.0255, "step": 75830 }, { - "epoch": 0.38, - "learning_rate": 0.0002426066161817457, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.00027051176703881216, + "loss": 0.0242, "step": 75840 }, { - "epoch": 0.38, - "learning_rate": 0.0002425990484887317, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00027050787882244067, + "loss": 0.0202, "step": 75850 }, { - "epoch": 0.38, - "learning_rate": 0.00024259148079571767, - "loss": 0.0199, + "epoch": 0.2, + "learning_rate": 0.00027050399060606924, + "loss": 0.0232, "step": 75860 }, { - "epoch": 0.38, - "learning_rate": 0.00024258391310270368, - "loss": 0.014, + "epoch": 0.2, + "learning_rate": 0.00027050010238969776, + "loss": 0.0248, "step": 75870 }, { - "epoch": 0.38, - "learning_rate": 0.00024257634540968966, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.0002704962141733263, + "loss": 0.0217, "step": 75880 }, { - "epoch": 0.38, - "learning_rate": 0.00024256877771667565, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.00027049232595695484, + "loss": 0.0251, "step": 75890 }, { - "epoch": 0.38, - "learning_rate": 0.00024256121002366165, - "loss": 0.017, + "epoch": 0.2, + "learning_rate": 0.00027048843774058335, + "loss": 0.0356, "step": 75900 }, { - "epoch": 0.38, - "learning_rate": 0.00024255364233064764, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.00027048454952421187, + "loss": 0.0193, "step": 75910 }, { - "epoch": 0.38, - "learning_rate": 0.00024254607463763362, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00027048066130784044, + "loss": 0.0293, "step": 75920 }, { - "epoch": 0.38, - "learning_rate": 0.00024253850694461963, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.000270476773091469, + "loss": 0.0324, "step": 75930 }, { - "epoch": 0.38, - "learning_rate": 0.0002425309392516056, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002704728848750975, + "loss": 0.0213, "step": 75940 }, { - "epoch": 0.38, - "learning_rate": 0.0002425233715585916, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00027046899665872603, + "loss": 0.0238, "step": 75950 }, { - "epoch": 0.38, - "learning_rate": 0.0002425158038655776, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00027046510844235455, + "loss": 0.025, "step": 75960 }, { - "epoch": 0.38, - "learning_rate": 0.00024250823617256358, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.0002704612202259831, + "loss": 0.0213, "step": 75970 }, { - "epoch": 0.38, - "learning_rate": 0.00024250066847954956, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027045733200961163, + "loss": 0.0241, "step": 75980 }, { - "epoch": 0.38, - "learning_rate": 0.00024249310078653557, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.0002704534437932402, + "loss": 0.0274, "step": 75990 }, { - "epoch": 0.38, - "learning_rate": 0.00024248553309352155, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.0002704495555768687, + "loss": 0.0284, "step": 76000 }, { - "epoch": 0.38, - "eval_cer": 0.9144925750140465, - "eval_loss": 0.012879201211035252, - "eval_runtime": 116.6021, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.2, + "eval_cer": 0.8817768670806793, + "eval_loss": 0.01834818534553051, + "eval_runtime": 107.643, + "eval_samples_per_second": 18.58, + "eval_steps_per_second": 4.645, "step": 76000 }, { - "epoch": 0.38, - "learning_rate": 0.00024247796540050753, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.0002704456673604973, + "loss": 0.0234, "step": 76010 }, { - "epoch": 0.38, - "learning_rate": 0.0002424703977074935, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.0002704417791441258, + "loss": 0.0233, "step": 76020 }, { - "epoch": 0.38, - "learning_rate": 0.00024246283001447952, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002704378909277543, + "loss": 0.0239, "step": 76030 }, { - "epoch": 0.38, - "learning_rate": 0.0002424552623214655, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00027043400271138283, + "loss": 0.0215, "step": 76040 }, { - "epoch": 0.38, - "learning_rate": 0.00024244769462845146, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.0002704301144950114, + "loss": 0.022, "step": 76050 }, { - "epoch": 0.38, - "learning_rate": 0.00024244012693543744, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.0002704262262786399, + "loss": 0.0293, "step": 76060 }, { - "epoch": 0.38, - "learning_rate": 0.00024243255924242345, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002704223380622685, + "loss": 0.0302, "step": 76070 }, { - "epoch": 0.38, - "learning_rate": 0.00024242499154940943, - "loss": 0.0219, + "epoch": 0.2, + "learning_rate": 0.000270418449845897, + "loss": 0.0194, "step": 76080 }, { - "epoch": 0.38, - "learning_rate": 0.0002424174238563954, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.00027041456162952556, + "loss": 0.0285, "step": 76090 }, { - "epoch": 0.38, - "learning_rate": 0.00024240985616338142, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.0002704106734131541, + "loss": 0.0267, "step": 76100 }, { - "epoch": 0.38, - "learning_rate": 0.0002424022884703674, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.0002704067851967826, + "loss": 0.0225, "step": 76110 }, { - "epoch": 0.38, - "learning_rate": 0.00024239472077735338, - "loss": 0.0205, + "epoch": 0.2, + "learning_rate": 0.0002704028969804111, + "loss": 0.0238, "step": 76120 }, { - "epoch": 0.38, - "learning_rate": 0.0002423871530843394, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.0002703990087640397, + "loss": 0.0276, "step": 76130 }, { - "epoch": 0.38, - "learning_rate": 0.00024237958539132537, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027039512054766824, + "loss": 0.0308, "step": 76140 }, { - "epoch": 0.38, - "learning_rate": 0.00024237201769831135, - "loss": 0.0143, + "epoch": 0.2, + "learning_rate": 0.00027039123233129676, + "loss": 0.0212, "step": 76150 }, { - "epoch": 0.38, - "learning_rate": 0.00024236445000529736, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002703873441149253, + "loss": 0.0248, "step": 76160 }, { - "epoch": 0.38, - "learning_rate": 0.00024235688231228334, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002703834558985538, + "loss": 0.0292, "step": 76170 }, { - "epoch": 0.38, - "learning_rate": 0.00024234931461926932, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00027037956768218236, + "loss": 0.023, "step": 76180 }, { - "epoch": 0.38, - "learning_rate": 0.00024234174692625533, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00027037567946581087, + "loss": 0.0233, "step": 76190 }, { - "epoch": 0.38, - "learning_rate": 0.00024233417923324131, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.00027037179124943944, + "loss": 0.0208, "step": 76200 }, { - "epoch": 0.38, - "learning_rate": 0.0002423266115402273, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00027036790303306795, + "loss": 0.0249, "step": 76210 }, { - "epoch": 0.38, - "learning_rate": 0.00024231904384721328, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002703640148166965, + "loss": 0.0288, "step": 76220 }, { - "epoch": 0.38, - "learning_rate": 0.00024231147615419929, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00027036012660032504, + "loss": 0.0227, "step": 76230 }, { - "epoch": 0.38, - "learning_rate": 0.00024230390846118527, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.00027035623838395355, + "loss": 0.0211, "step": 76240 }, { - "epoch": 0.38, - "learning_rate": 0.00024229634076817125, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.00027035235016758207, + "loss": 0.0218, "step": 76250 }, { - "epoch": 0.38, - "learning_rate": 0.00024228877307515726, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.00027034846195121064, + "loss": 0.0211, "step": 76260 }, { - "epoch": 0.38, - "learning_rate": 0.00024228120538214324, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00027034457373483915, + "loss": 0.0323, "step": 76270 }, { - "epoch": 0.38, - "learning_rate": 0.00024227363768912922, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.0002703406855184677, + "loss": 0.0256, "step": 76280 }, { - "epoch": 0.38, - "learning_rate": 0.00024226606999611523, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.00027033679730209623, + "loss": 0.0237, "step": 76290 }, { - "epoch": 0.38, - "learning_rate": 0.0002422585023031012, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.0002703329090857248, + "loss": 0.0209, "step": 76300 }, { - "epoch": 0.38, - "learning_rate": 0.0002422509346100872, - "loss": 0.0154, + "epoch": 0.2, + "learning_rate": 0.0002703290208693533, + "loss": 0.0264, "step": 76310 }, { - "epoch": 0.39, - "learning_rate": 0.0002422433669170732, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.00027032513265298183, + "loss": 0.0264, "step": 76320 }, { - "epoch": 0.39, - "learning_rate": 0.00024223579922405918, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002703212444366104, + "loss": 0.0307, "step": 76330 }, { - "epoch": 0.39, - "learning_rate": 0.00024222823153104516, - "loss": 0.0238, + "epoch": 0.2, + "learning_rate": 0.0002703173562202389, + "loss": 0.0252, "step": 76340 }, { - "epoch": 0.39, - "learning_rate": 0.00024222066383803117, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.0002703134680038675, + "loss": 0.0228, "step": 76350 }, { - "epoch": 0.39, - "learning_rate": 0.00024221309614501715, - "loss": 0.0149, + "epoch": 0.2, + "learning_rate": 0.000270309579787496, + "loss": 0.0238, "step": 76360 }, { - "epoch": 0.39, - "learning_rate": 0.00024220552845200313, - "loss": 0.0194, + "epoch": 0.2, + "learning_rate": 0.0002703056915711245, + "loss": 0.0247, "step": 76370 }, { - "epoch": 0.39, - "learning_rate": 0.00024219796075898914, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.0002703018033547531, + "loss": 0.0238, "step": 76380 }, { - "epoch": 0.39, - "learning_rate": 0.00024219039306597512, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002702979151383816, + "loss": 0.0234, "step": 76390 }, { - "epoch": 0.39, - "learning_rate": 0.0002421828253729611, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.0002702940269220101, + "loss": 0.0269, "step": 76400 }, { - "epoch": 0.39, - "learning_rate": 0.0002421752576799471, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.0002702901387056387, + "loss": 0.0253, "step": 76410 }, { - "epoch": 0.39, - "learning_rate": 0.0002421676899869331, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.0002702862504892672, + "loss": 0.0252, "step": 76420 }, { - "epoch": 0.39, - "learning_rate": 0.00024216012229391908, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.00027028236227289576, + "loss": 0.0273, "step": 76430 }, { - "epoch": 0.39, - "learning_rate": 0.00024215255460090506, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002702784740565243, + "loss": 0.0265, "step": 76440 }, { - "epoch": 0.39, - "learning_rate": 0.00024214498690789107, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.0002702745858401528, + "loss": 0.0297, "step": 76450 }, { - "epoch": 0.39, - "learning_rate": 0.00024213741921487705, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002702706976237813, + "loss": 0.031, "step": 76460 }, { - "epoch": 0.39, - "learning_rate": 0.00024212985152186303, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.0002702668094074099, + "loss": 0.0296, "step": 76470 }, { - "epoch": 0.39, - "learning_rate": 0.00024212228382884904, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00027026292119103844, + "loss": 0.0238, "step": 76480 }, { - "epoch": 0.39, - "learning_rate": 0.00024211471613583502, - "loss": 0.016, + "epoch": 0.2, + "learning_rate": 0.00027025903297466696, + "loss": 0.0253, "step": 76490 }, { - "epoch": 0.39, - "learning_rate": 0.000242107148442821, - "loss": 0.0139, + "epoch": 0.2, + "learning_rate": 0.00027025514475829547, + "loss": 0.0237, "step": 76500 }, { - "epoch": 0.39, - "learning_rate": 0.000242099580749807, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00027025125654192404, + "loss": 0.0183, "step": 76510 }, { - "epoch": 0.39, - "learning_rate": 0.000242092013056793, - "loss": 0.0215, + "epoch": 0.2, + "learning_rate": 0.00027024736832555256, + "loss": 0.0271, "step": 76520 }, { - "epoch": 0.39, - "learning_rate": 0.00024208444536377897, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00027024348010918107, + "loss": 0.0244, "step": 76530 }, { - "epoch": 0.39, - "learning_rate": 0.00024207687767076498, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00027023959189280964, + "loss": 0.0218, "step": 76540 }, { - "epoch": 0.39, - "learning_rate": 0.00024206930997775096, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00027023570367643815, + "loss": 0.0185, "step": 76550 }, { - "epoch": 0.39, - "learning_rate": 0.00024206174228473694, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002702318154600667, + "loss": 0.0285, "step": 76560 }, { - "epoch": 0.39, - "learning_rate": 0.00024205417459172293, - "loss": 0.055, + "epoch": 0.2, + "learning_rate": 0.00027022792724369524, + "loss": 0.0186, "step": 76570 }, { - "epoch": 0.39, - "learning_rate": 0.00024204660689870893, - "loss": 0.0154, + "epoch": 0.2, + "learning_rate": 0.00027022403902732375, + "loss": 0.0271, "step": 76580 }, { - "epoch": 0.39, - "learning_rate": 0.00024203903920569492, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002702201508109523, + "loss": 0.0243, "step": 76590 }, { - "epoch": 0.39, - "learning_rate": 0.0002420314715126809, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.00027021626259458083, + "loss": 0.0316, "step": 76600 }, { - "epoch": 0.39, - "learning_rate": 0.0002420239038196669, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.00027021237437820935, + "loss": 0.0297, "step": 76610 }, { - "epoch": 0.39, - "learning_rate": 0.0002420163361266529, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.0002702084861618379, + "loss": 0.0279, "step": 76620 }, { - "epoch": 0.39, - "learning_rate": 0.00024200876843363887, - "loss": 0.0205, + "epoch": 0.2, + "learning_rate": 0.0002702045979454665, + "loss": 0.0243, "step": 76630 }, { - "epoch": 0.39, - "learning_rate": 0.00024200120074062488, - "loss": 0.0199, + "epoch": 0.2, + "learning_rate": 0.000270200709729095, + "loss": 0.0257, "step": 76640 }, { - "epoch": 0.39, - "learning_rate": 0.00024199363304761086, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002701968215127235, + "loss": 0.0271, "step": 76650 }, { - "epoch": 0.39, - "learning_rate": 0.00024198606535459684, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.00027019293329635203, + "loss": 0.0259, "step": 76660 }, { - "epoch": 0.39, - "learning_rate": 0.00024197849766158285, - "loss": 0.0187, + "epoch": 0.2, + "learning_rate": 0.00027018904507998054, + "loss": 0.0311, "step": 76670 }, { - "epoch": 0.39, - "learning_rate": 0.00024197092996856883, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.0002701851568636091, + "loss": 0.034, "step": 76680 }, { - "epoch": 0.39, - "learning_rate": 0.0002419633622755548, - "loss": 0.0145, + "epoch": 0.2, + "learning_rate": 0.0002701812686472377, + "loss": 0.0346, "step": 76690 }, { - "epoch": 0.39, - "learning_rate": 0.00024195579458254082, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.0002701773804308662, + "loss": 0.0285, "step": 76700 }, { - "epoch": 0.39, - "learning_rate": 0.0002419482268895268, - "loss": 0.0168, + "epoch": 0.2, + "learning_rate": 0.0002701734922144947, + "loss": 0.0245, "step": 76710 }, { - "epoch": 0.39, - "learning_rate": 0.00024194065919651278, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002701696039981233, + "loss": 0.0274, "step": 76720 }, { - "epoch": 0.39, - "learning_rate": 0.00024193309150349876, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002701657157817518, + "loss": 0.0248, "step": 76730 }, { - "epoch": 0.39, - "learning_rate": 0.00024192552381048477, - "loss": 0.0141, + "epoch": 0.2, + "learning_rate": 0.0002701618275653803, + "loss": 0.0272, "step": 76740 }, { - "epoch": 0.39, - "learning_rate": 0.00024191795611747075, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.0002701579393490089, + "loss": 0.0239, "step": 76750 }, { - "epoch": 0.39, - "learning_rate": 0.00024191038842445674, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.0002701540511326374, + "loss": 0.0291, "step": 76760 }, { - "epoch": 0.39, - "learning_rate": 0.00024190282073144274, - "loss": 0.0201, + "epoch": 0.2, + "learning_rate": 0.00027015016291626596, + "loss": 0.0234, "step": 76770 }, { - "epoch": 0.39, - "learning_rate": 0.00024189525303842873, - "loss": 0.0201, + "epoch": 0.2, + "learning_rate": 0.0002701462746998945, + "loss": 0.0256, "step": 76780 }, { - "epoch": 0.39, - "learning_rate": 0.0002418876853454147, - "loss": 0.0148, + "epoch": 0.2, + "learning_rate": 0.000270142386483523, + "loss": 0.0239, "step": 76790 }, { - "epoch": 0.39, - "learning_rate": 0.00024188011765240072, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.00027013849826715156, + "loss": 0.0302, "step": 76800 }, { - "epoch": 0.39, - "learning_rate": 0.0002418725499593867, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.0002701346100507801, + "loss": 0.0246, "step": 76810 }, { - "epoch": 0.39, - "learning_rate": 0.00024186498226637268, - "loss": 0.0161, + "epoch": 0.2, + "learning_rate": 0.0002701307218344086, + "loss": 0.0244, "step": 76820 }, { - "epoch": 0.39, - "learning_rate": 0.0002418574145733587, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00027012683361803716, + "loss": 0.0242, "step": 76830 }, { - "epoch": 0.39, - "learning_rate": 0.00024184984688034467, - "loss": 0.0152, + "epoch": 0.2, + "learning_rate": 0.0002701229454016657, + "loss": 0.0282, "step": 76840 }, { - "epoch": 0.39, - "learning_rate": 0.00024184227918733065, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.00027011905718529424, + "loss": 0.023, "step": 76850 }, { - "epoch": 0.39, - "learning_rate": 0.00024183471149431666, - "loss": 0.0214, + "epoch": 0.2, + "learning_rate": 0.00027011516896892275, + "loss": 0.0275, "step": 76860 }, { - "epoch": 0.39, - "learning_rate": 0.00024182714380130264, - "loss": 0.0268, + "epoch": 0.2, + "learning_rate": 0.00027011128075255127, + "loss": 0.0283, "step": 76870 }, { - "epoch": 0.39, - "learning_rate": 0.00024181957610828862, - "loss": 0.0213, + "epoch": 0.2, + "learning_rate": 0.00027010739253617984, + "loss": 0.0184, "step": 76880 }, { - "epoch": 0.39, - "learning_rate": 0.00024181200841527463, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00027010350431980835, + "loss": 0.0268, "step": 76890 }, { - "epoch": 0.39, - "learning_rate": 0.0002418044407222606, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002700996161034369, + "loss": 0.0282, "step": 76900 }, { - "epoch": 0.39, - "learning_rate": 0.0002417968730292466, - "loss": 0.0206, + "epoch": 0.2, + "learning_rate": 0.00027009572788706544, + "loss": 0.0222, "step": 76910 }, { - "epoch": 0.39, - "learning_rate": 0.00024178930533623257, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.00027009183967069395, + "loss": 0.0248, "step": 76920 }, { - "epoch": 0.39, - "learning_rate": 0.00024178173764321858, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002700879514543225, + "loss": 0.0254, "step": 76930 }, { - "epoch": 0.39, - "learning_rate": 0.00024177416995020456, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00027008406323795103, + "loss": 0.0246, "step": 76940 }, { - "epoch": 0.39, - "learning_rate": 0.00024176660225719055, - "loss": 0.0224, + "epoch": 0.2, + "learning_rate": 0.00027008017502157955, + "loss": 0.024, "step": 76950 }, { - "epoch": 0.39, - "learning_rate": 0.00024175903456417655, - "loss": 0.0219, + "epoch": 0.2, + "learning_rate": 0.0002700762868052081, + "loss": 0.0265, "step": 76960 }, { - "epoch": 0.39, - "learning_rate": 0.00024175146687116254, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.00027007239858883663, + "loss": 0.0252, "step": 76970 }, { - "epoch": 0.39, - "learning_rate": 0.00024174389917814852, - "loss": 0.0131, + "epoch": 0.2, + "learning_rate": 0.0002700685103724652, + "loss": 0.0282, "step": 76980 }, { - "epoch": 0.39, - "learning_rate": 0.00024173633148513453, - "loss": 0.0148, + "epoch": 0.2, + "learning_rate": 0.0002700646221560937, + "loss": 0.0246, "step": 76990 }, { - "epoch": 0.39, - "learning_rate": 0.0002417287637921205, - "loss": 0.0143, + "epoch": 0.2, + "learning_rate": 0.00027006073393972223, + "loss": 0.028, "step": 77000 }, { - "epoch": 0.39, - "eval_cer": 0.9144974269946735, - "eval_loss": 0.012495556846261024, - "eval_runtime": 116.5435, - "eval_samples_per_second": 17.161, - "eval_steps_per_second": 4.29, + "epoch": 0.2, + "eval_cer": 0.8818398507427173, + "eval_loss": 0.01785467006266117, + "eval_runtime": 107.5617, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.648, "step": 77000 }, { - "epoch": 0.39, - "learning_rate": 0.0002417211960991065, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.0002700568457233508, + "loss": 0.025, "step": 77010 }, { - "epoch": 0.39, - "learning_rate": 0.0002417136284060925, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002700529575069793, + "loss": 0.0253, "step": 77020 }, { - "epoch": 0.39, - "learning_rate": 0.00024170606071307848, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.0002700490692906079, + "loss": 0.0227, "step": 77030 }, { - "epoch": 0.39, - "learning_rate": 0.00024169849302006446, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002700451810742364, + "loss": 0.0252, "step": 77040 }, { - "epoch": 0.39, - "learning_rate": 0.00024169092532705047, - "loss": 0.0164, + "epoch": 0.2, + "learning_rate": 0.00027004129285786496, + "loss": 0.0235, "step": 77050 }, { - "epoch": 0.39, - "learning_rate": 0.00024168335763403645, - "loss": 0.0151, + "epoch": 0.2, + "learning_rate": 0.0002700374046414935, + "loss": 0.0248, "step": 77060 }, { - "epoch": 0.39, - "learning_rate": 0.00024167578994102243, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.000270033516425122, + "loss": 0.0287, "step": 77070 }, { - "epoch": 0.39, - "learning_rate": 0.0002416682222480084, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002700296282087505, + "loss": 0.0279, "step": 77080 }, { - "epoch": 0.39, - "learning_rate": 0.00024166065455499442, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.0002700257399923791, + "loss": 0.0249, "step": 77090 }, { - "epoch": 0.39, - "learning_rate": 0.0002416530868619804, - "loss": 0.0245, + "epoch": 0.2, + "learning_rate": 0.0002700218517760076, + "loss": 0.0236, "step": 77100 }, { - "epoch": 0.39, - "learning_rate": 0.00024164551916896638, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.00027001796355963616, + "loss": 0.0214, "step": 77110 }, { - "epoch": 0.39, - "learning_rate": 0.0002416379514759524, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.0002700140753432647, + "loss": 0.0204, "step": 77120 }, { - "epoch": 0.39, - "learning_rate": 0.00024163038378293837, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.00027001018712689324, + "loss": 0.0287, "step": 77130 }, { - "epoch": 0.39, - "learning_rate": 0.00024162281608992436, - "loss": 0.0153, + "epoch": 0.2, + "learning_rate": 0.00027000629891052176, + "loss": 0.0271, "step": 77140 }, { - "epoch": 0.39, - "learning_rate": 0.00024161524839691036, - "loss": 0.0219, + "epoch": 0.2, + "learning_rate": 0.00027000241069415027, + "loss": 0.0312, "step": 77150 }, { - "epoch": 0.39, - "learning_rate": 0.00024160768070389635, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.0002699985224777788, + "loss": 0.0255, "step": 77160 }, { - "epoch": 0.39, - "learning_rate": 0.00024160011301088233, - "loss": 0.0222, + "epoch": 0.2, + "learning_rate": 0.00026999463426140736, + "loss": 0.025, "step": 77170 }, { - "epoch": 0.39, - "learning_rate": 0.00024159254531786834, - "loss": 0.0227, + "epoch": 0.2, + "learning_rate": 0.0002699907460450359, + "loss": 0.0225, "step": 77180 }, { - "epoch": 0.39, - "learning_rate": 0.00024158497762485432, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.00026998685782866444, + "loss": 0.0278, "step": 77190 }, { - "epoch": 0.39, - "learning_rate": 0.0002415774099318403, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00026998296961229295, + "loss": 0.0221, "step": 77200 }, { - "epoch": 0.39, - "learning_rate": 0.0002415698422388263, - "loss": 0.0127, + "epoch": 0.2, + "learning_rate": 0.00026997908139592147, + "loss": 0.0267, "step": 77210 }, { - "epoch": 0.39, - "learning_rate": 0.0002415622745458123, - "loss": 0.0152, + "epoch": 0.2, + "learning_rate": 0.00026997519317955004, + "loss": 0.0254, "step": 77220 }, { - "epoch": 0.39, - "learning_rate": 0.00024155470685279827, - "loss": 0.0163, + "epoch": 0.2, + "learning_rate": 0.00026997130496317855, + "loss": 0.0251, "step": 77230 }, { - "epoch": 0.39, - "learning_rate": 0.00024154713915978425, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002699674167468071, + "loss": 0.0195, "step": 77240 }, { - "epoch": 0.39, - "learning_rate": 0.00024153957146677026, - "loss": 0.0155, + "epoch": 0.2, + "learning_rate": 0.00026996352853043563, + "loss": 0.0225, "step": 77250 }, { - "epoch": 0.39, - "learning_rate": 0.00024153200377375624, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002699596403140642, + "loss": 0.032, "step": 77260 }, { - "epoch": 0.39, - "learning_rate": 0.00024152443608074222, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002699557520976927, + "loss": 0.0241, "step": 77270 }, { - "epoch": 0.39, - "learning_rate": 0.00024151686838772823, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00026995186388132123, + "loss": 0.0248, "step": 77280 }, { - "epoch": 0.39, - "learning_rate": 0.0002415093006947142, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.00026994797566494975, + "loss": 0.0246, "step": 77290 }, { - "epoch": 0.39, - "learning_rate": 0.00024150173300170017, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.0002699440874485783, + "loss": 0.0283, "step": 77300 }, { - "epoch": 0.39, - "learning_rate": 0.00024149416530868615, - "loss": 0.0131, + "epoch": 0.2, + "learning_rate": 0.00026994019923220683, + "loss": 0.024, "step": 77310 }, { - "epoch": 0.39, - "learning_rate": 0.00024148659761567216, - "loss": 0.0155, + "epoch": 0.2, + "learning_rate": 0.0002699363110158354, + "loss": 0.0241, "step": 77320 }, { - "epoch": 0.39, - "learning_rate": 0.00024147902992265814, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.0002699324227994639, + "loss": 0.023, "step": 77330 }, { - "epoch": 0.39, - "learning_rate": 0.00024147146222964412, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002699285345830925, + "loss": 0.025, "step": 77340 }, { - "epoch": 0.39, - "learning_rate": 0.00024146389453663013, - "loss": 0.0167, + "epoch": 0.2, + "learning_rate": 0.000269924646366721, + "loss": 0.0244, "step": 77350 }, { - "epoch": 0.39, - "learning_rate": 0.0002414563268436161, - "loss": 0.0167, + "epoch": 0.2, + "learning_rate": 0.0002699207581503495, + "loss": 0.0269, "step": 77360 }, { - "epoch": 0.39, - "learning_rate": 0.0002414487591506021, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.000269916869933978, + "loss": 0.0267, "step": 77370 }, { - "epoch": 0.39, - "learning_rate": 0.0002414411914575881, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.0002699129817176066, + "loss": 0.0249, "step": 77380 }, { - "epoch": 0.39, - "learning_rate": 0.00024143362376457408, - "loss": 0.0167, + "epoch": 0.2, + "learning_rate": 0.00026990909350123516, + "loss": 0.0237, "step": 77390 }, { - "epoch": 0.39, - "learning_rate": 0.00024142605607156006, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.0002699052052848637, + "loss": 0.0225, "step": 77400 }, { - "epoch": 0.39, - "learning_rate": 0.00024141848837854607, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002699013170684922, + "loss": 0.0258, "step": 77410 }, { - "epoch": 0.39, - "learning_rate": 0.00024141092068553205, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.0002698974288521207, + "loss": 0.0317, "step": 77420 }, { - "epoch": 0.39, - "learning_rate": 0.00024140335299251803, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.0002698935406357493, + "loss": 0.0248, "step": 77430 }, { - "epoch": 0.39, - "learning_rate": 0.00024139578529950404, - "loss": 0.0234, + "epoch": 0.2, + "learning_rate": 0.0002698896524193778, + "loss": 0.0236, "step": 77440 }, { - "epoch": 0.39, - "learning_rate": 0.00024138821760649002, - "loss": 0.0164, + "epoch": 0.2, + "learning_rate": 0.00026988576420300636, + "loss": 0.0233, "step": 77450 }, { - "epoch": 0.39, - "learning_rate": 0.000241380649913476, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002698818759866349, + "loss": 0.0254, "step": 77460 }, { - "epoch": 0.39, - "learning_rate": 0.000241373082220462, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00026987798777026344, + "loss": 0.0346, "step": 77470 }, { - "epoch": 0.39, - "learning_rate": 0.000241365514527448, - "loss": 0.0161, + "epoch": 0.2, + "learning_rate": 0.00026987409955389196, + "loss": 0.0269, "step": 77480 }, { - "epoch": 0.39, - "learning_rate": 0.00024135794683443398, - "loss": 0.0137, + "epoch": 0.2, + "learning_rate": 0.00026987021133752047, + "loss": 0.0207, "step": 77490 }, { - "epoch": 0.39, - "learning_rate": 0.00024135037914141996, - "loss": 0.0194, + "epoch": 0.2, + "learning_rate": 0.000269866323121149, + "loss": 0.0267, "step": 77500 }, { - "epoch": 0.39, - "learning_rate": 0.00024134281144840597, - "loss": 0.021, + "epoch": 0.2, + "learning_rate": 0.00026986243490477755, + "loss": 0.0226, "step": 77510 }, { - "epoch": 0.39, - "learning_rate": 0.00024133524375539195, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.0002698585466884061, + "loss": 0.0266, "step": 77520 }, { - "epoch": 0.39, - "learning_rate": 0.00024132767606237793, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00026985465847203464, + "loss": 0.0226, "step": 77530 }, { - "epoch": 0.39, - "learning_rate": 0.00024132010836936394, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00026985077025566315, + "loss": 0.0217, "step": 77540 }, { - "epoch": 0.39, - "learning_rate": 0.00024131254067634992, - "loss": 0.017, + "epoch": 0.2, + "learning_rate": 0.0002698468820392917, + "loss": 0.0256, "step": 77550 }, { - "epoch": 0.39, - "learning_rate": 0.0002413049729833359, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.00026984299382292024, + "loss": 0.0305, "step": 77560 }, { - "epoch": 0.39, - "learning_rate": 0.0002412974052903219, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.00026983910560654875, + "loss": 0.0263, "step": 77570 }, { - "epoch": 0.39, - "learning_rate": 0.0002412898375973079, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.0002698352173901773, + "loss": 0.0222, "step": 77580 }, { - "epoch": 0.39, - "learning_rate": 0.00024128226990429387, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.00026983132917380583, + "loss": 0.0276, "step": 77590 }, { - "epoch": 0.39, - "learning_rate": 0.00024127470221127988, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002698274409574344, + "loss": 0.0266, "step": 77600 }, { - "epoch": 0.39, - "learning_rate": 0.00024126713451826586, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002698235527410629, + "loss": 0.0298, "step": 77610 }, { - "epoch": 0.39, - "learning_rate": 0.00024125956682525184, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.00026981966452469143, + "loss": 0.0228, "step": 77620 }, { - "epoch": 0.39, - "learning_rate": 0.00024125199913223783, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.00026981577630832, + "loss": 0.0256, "step": 77630 }, { - "epoch": 0.39, - "learning_rate": 0.00024124443143922383, - "loss": 0.02, + "epoch": 0.2, + "learning_rate": 0.0002698118880919485, + "loss": 0.0304, "step": 77640 }, { - "epoch": 0.39, - "learning_rate": 0.00024123686374620982, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00026980799987557703, + "loss": 0.0246, "step": 77650 }, { - "epoch": 0.39, - "learning_rate": 0.0002412292960531958, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002698041116592056, + "loss": 0.0246, "step": 77660 }, { - "epoch": 0.39, - "learning_rate": 0.0002412217283601818, - "loss": 0.0242, + "epoch": 0.2, + "learning_rate": 0.0002698002234428341, + "loss": 0.0281, "step": 77670 }, { - "epoch": 0.39, - "learning_rate": 0.0002412141606671678, - "loss": 0.0186, + "epoch": 0.2, + "learning_rate": 0.0002697963352264627, + "loss": 0.0175, "step": 77680 }, { - "epoch": 0.39, - "learning_rate": 0.00024120659297415377, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.0002697924470100912, + "loss": 0.0241, "step": 77690 }, { - "epoch": 0.39, - "learning_rate": 0.00024119902528113978, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.0002697885587937197, + "loss": 0.0256, "step": 77700 }, { - "epoch": 0.39, - "learning_rate": 0.00024119145758812576, - "loss": 0.0163, + "epoch": 0.2, + "learning_rate": 0.0002697846705773482, + "loss": 0.0268, "step": 77710 }, { - "epoch": 0.39, - "learning_rate": 0.00024118388989511174, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.0002697807823609768, + "loss": 0.029, "step": 77720 }, { - "epoch": 0.39, - "learning_rate": 0.00024117632220209775, - "loss": 0.0169, + "epoch": 0.2, + "learning_rate": 0.00026977689414460536, + "loss": 0.021, "step": 77730 }, { - "epoch": 0.39, - "learning_rate": 0.00024116875450908373, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.0002697730059282339, + "loss": 0.0181, "step": 77740 }, { - "epoch": 0.39, - "learning_rate": 0.0002411611868160697, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.0002697691177118624, + "loss": 0.0237, "step": 77750 }, { - "epoch": 0.39, - "learning_rate": 0.00024115361912305572, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.00026976522949549096, + "loss": 0.0266, "step": 77760 }, { - "epoch": 0.39, - "learning_rate": 0.0002411460514300417, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002697613412791195, + "loss": 0.0244, "step": 77770 }, { - "epoch": 0.39, - "learning_rate": 0.00024113848373702768, - "loss": 0.0193, + "epoch": 0.2, + "learning_rate": 0.000269757453062748, + "loss": 0.0185, "step": 77780 }, { - "epoch": 0.39, - "learning_rate": 0.00024113091604401366, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00026975356484637656, + "loss": 0.0228, "step": 77790 }, { - "epoch": 0.39, - "learning_rate": 0.00024112334835099967, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.00026974967663000507, + "loss": 0.0242, "step": 77800 }, { - "epoch": 0.39, - "learning_rate": 0.00024111578065798565, - "loss": 0.0158, + "epoch": 0.2, + "learning_rate": 0.00026974578841363364, + "loss": 0.0216, "step": 77810 }, { - "epoch": 0.39, - "learning_rate": 0.00024110821296497164, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.00026974190019726216, + "loss": 0.0216, "step": 77820 }, { - "epoch": 0.39, - "learning_rate": 0.00024110064527195764, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00026973801198089067, + "loss": 0.0239, "step": 77830 }, { - "epoch": 0.39, - "learning_rate": 0.00024109307757894363, - "loss": 0.0158, + "epoch": 0.2, + "learning_rate": 0.00026973412376451924, + "loss": 0.0254, "step": 77840 }, { - "epoch": 0.39, - "learning_rate": 0.0002410855098859296, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.00026973023554814775, + "loss": 0.0238, "step": 77850 }, { - "epoch": 0.39, - "learning_rate": 0.00024107794219291562, - "loss": 0.0149, + "epoch": 0.2, + "learning_rate": 0.00026972634733177627, + "loss": 0.0256, "step": 77860 }, { - "epoch": 0.39, - "learning_rate": 0.0002410703744999016, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.00026972245911540484, + "loss": 0.0232, "step": 77870 }, { - "epoch": 0.39, - "learning_rate": 0.00024106280680688758, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002697185708990334, + "loss": 0.0287, "step": 77880 }, { - "epoch": 0.39, - "learning_rate": 0.0002410552391138736, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.0002697146826826619, + "loss": 0.0219, "step": 77890 }, { - "epoch": 0.39, - "learning_rate": 0.00024104767142085957, - "loss": 0.0159, + "epoch": 0.2, + "learning_rate": 0.00026971079446629043, + "loss": 0.0214, "step": 77900 }, { - "epoch": 0.39, - "learning_rate": 0.00024104010372784555, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00026970690624991895, + "loss": 0.0218, "step": 77910 }, { - "epoch": 0.39, - "learning_rate": 0.00024103253603483156, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002697030180335475, + "loss": 0.0287, "step": 77920 }, { - "epoch": 0.39, - "learning_rate": 0.00024102496834181754, - "loss": 0.017, + "epoch": 0.2, + "learning_rate": 0.00026969912981717603, + "loss": 0.0268, "step": 77930 }, { - "epoch": 0.39, - "learning_rate": 0.00024101740064880352, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.0002696952416008046, + "loss": 0.025, "step": 77940 }, { - "epoch": 0.39, - "learning_rate": 0.00024100983295578953, - "loss": 0.015, + "epoch": 0.2, + "learning_rate": 0.0002696913533844331, + "loss": 0.0256, "step": 77950 }, { - "epoch": 0.39, - "learning_rate": 0.0002410022652627755, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.00026968746516806163, + "loss": 0.0193, "step": 77960 }, { - "epoch": 0.39, - "learning_rate": 0.0002409946975697615, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002696835769516902, + "loss": 0.0234, "step": 77970 }, { - "epoch": 0.39, - "learning_rate": 0.00024098712987674747, - "loss": 0.0163, + "epoch": 0.2, + "learning_rate": 0.0002696796887353187, + "loss": 0.0241, "step": 77980 }, { - "epoch": 0.39, - "learning_rate": 0.00024097956218373348, - "loss": 0.0163, + "epoch": 0.2, + "learning_rate": 0.00026967580051894723, + "loss": 0.0197, "step": 77990 }, { - "epoch": 0.39, - "learning_rate": 0.00024097199449071946, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002696719123025758, + "loss": 0.0258, "step": 78000 }, { - "epoch": 0.39, - "eval_cer": 0.9145148941249307, - "eval_loss": 0.012463193386793137, - "eval_runtime": 116.5238, - "eval_samples_per_second": 17.164, - "eval_steps_per_second": 4.291, + "epoch": 0.2, + "eval_cer": 0.8817250805141147, + "eval_loss": 0.01774117723107338, + "eval_runtime": 107.8059, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, "step": 78000 }, { - "epoch": 0.39, - "learning_rate": 0.00024096442679770545, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002696680240862043, + "loss": 0.0261, "step": 78010 }, { - "epoch": 0.39, - "learning_rate": 0.00024095685910469145, - "loss": 0.016, + "epoch": 0.2, + "learning_rate": 0.0002696641358698329, + "loss": 0.0231, "step": 78020 }, { - "epoch": 0.39, - "learning_rate": 0.00024094929141167744, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002696602476534614, + "loss": 0.0281, "step": 78030 }, { - "epoch": 0.39, - "learning_rate": 0.00024094172371866342, - "loss": 0.0137, + "epoch": 0.2, + "learning_rate": 0.0002696563594370899, + "loss": 0.0205, "step": 78040 }, { - "epoch": 0.39, - "learning_rate": 0.00024093415602564943, - "loss": 0.0163, + "epoch": 0.2, + "learning_rate": 0.0002696524712207185, + "loss": 0.0233, "step": 78050 }, { - "epoch": 0.39, - "learning_rate": 0.0002409265883326354, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.000269648583004347, + "loss": 0.0248, "step": 78060 }, { - "epoch": 0.39, - "learning_rate": 0.0002409190206396214, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00026964469478797556, + "loss": 0.0262, "step": 78070 }, { - "epoch": 0.39, - "learning_rate": 0.0002409114529466074, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.0002696408065716041, + "loss": 0.0312, "step": 78080 }, { - "epoch": 0.39, - "learning_rate": 0.00024090388525359338, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.00026963691835523264, + "loss": 0.0224, "step": 78090 }, { - "epoch": 0.39, - "learning_rate": 0.00024089631756057936, - "loss": 0.0183, + "epoch": 0.2, + "learning_rate": 0.00026963303013886116, + "loss": 0.0233, "step": 78100 }, { - "epoch": 0.39, - "learning_rate": 0.00024088874986756537, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.0002696291419224897, + "loss": 0.0242, "step": 78110 }, { - "epoch": 0.39, - "learning_rate": 0.00024088118217455135, - "loss": 0.0204, + "epoch": 0.2, + "learning_rate": 0.0002696252537061182, + "loss": 0.0223, "step": 78120 }, { - "epoch": 0.39, - "learning_rate": 0.00024087361448153733, - "loss": 0.0167, + "epoch": 0.2, + "learning_rate": 0.00026962136548974676, + "loss": 0.027, "step": 78130 }, { - "epoch": 0.39, - "learning_rate": 0.0002408660467885233, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00026961747727337527, + "loss": 0.024, "step": 78140 }, { - "epoch": 0.39, - "learning_rate": 0.00024085847909550932, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.00026961358905700384, + "loss": 0.0219, "step": 78150 }, { - "epoch": 0.39, - "learning_rate": 0.0002408509114024953, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00026960970084063235, + "loss": 0.0213, "step": 78160 }, { - "epoch": 0.39, - "learning_rate": 0.00024084334370948128, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.00026960581262426087, + "loss": 0.0249, "step": 78170 }, { - "epoch": 0.39, - "learning_rate": 0.0002408357760164673, - "loss": 0.0162, + "epoch": 0.2, + "learning_rate": 0.00026960192440788944, + "loss": 0.0232, "step": 78180 }, { - "epoch": 0.39, - "learning_rate": 0.00024082820832345327, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.00026959803619151795, + "loss": 0.0221, "step": 78190 }, { - "epoch": 0.39, - "learning_rate": 0.00024082064063043926, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.00026959414797514647, + "loss": 0.0252, "step": 78200 }, { - "epoch": 0.39, - "learning_rate": 0.00024081307293742526, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.00026959025975877504, + "loss": 0.0314, "step": 78210 }, { - "epoch": 0.39, - "learning_rate": 0.00024080550524441125, - "loss": 0.0202, + "epoch": 0.2, + "learning_rate": 0.0002695863715424036, + "loss": 0.0235, "step": 78220 }, { - "epoch": 0.39, - "learning_rate": 0.00024079793755139723, - "loss": 0.015, + "epoch": 0.2, + "learning_rate": 0.0002695824833260321, + "loss": 0.0234, "step": 78230 }, { - "epoch": 0.39, - "learning_rate": 0.00024079036985838324, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.00026957859510966063, + "loss": 0.0224, "step": 78240 }, { - "epoch": 0.39, - "learning_rate": 0.00024078280216536922, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00026957470689328915, + "loss": 0.0231, "step": 78250 }, { - "epoch": 0.39, - "learning_rate": 0.0002407752344723552, - "loss": 0.015, + "epoch": 0.2, + "learning_rate": 0.0002695708186769177, + "loss": 0.0229, "step": 78260 }, { - "epoch": 0.39, - "learning_rate": 0.0002407676667793412, - "loss": 0.017, + "epoch": 0.2, + "learning_rate": 0.00026956693046054623, + "loss": 0.0235, "step": 78270 }, { - "epoch": 0.39, - "learning_rate": 0.0002407600990863272, - "loss": 0.0243, + "epoch": 0.2, + "learning_rate": 0.0002695630422441748, + "loss": 0.0225, "step": 78280 }, { - "epoch": 0.39, - "learning_rate": 0.00024075253139331317, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.0002695591540278033, + "loss": 0.0276, "step": 78290 }, { - "epoch": 0.4, - "learning_rate": 0.00024074496370029915, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002695552658114319, + "loss": 0.0275, "step": 78300 }, { - "epoch": 0.4, - "learning_rate": 0.00024073739600728516, - "loss": 0.0185, + "epoch": 0.2, + "learning_rate": 0.0002695513775950604, + "loss": 0.0263, "step": 78310 }, { - "epoch": 0.4, - "learning_rate": 0.00024072982831427114, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.0002695474893786889, + "loss": 0.0213, "step": 78320 }, { - "epoch": 0.4, - "learning_rate": 0.00024072226062125712, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002695436011623174, + "loss": 0.0244, "step": 78330 }, { - "epoch": 0.4, - "learning_rate": 0.00024071469292824313, - "loss": 0.0224, + "epoch": 0.2, + "learning_rate": 0.000269539712945946, + "loss": 0.0234, "step": 78340 }, { - "epoch": 0.4, - "learning_rate": 0.0002407071252352291, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.0002695358247295745, + "loss": 0.0252, "step": 78350 }, { - "epoch": 0.4, - "learning_rate": 0.0002406995575422151, - "loss": 0.0187, + "epoch": 0.2, + "learning_rate": 0.0002695319365132031, + "loss": 0.0204, "step": 78360 }, { - "epoch": 0.4, - "learning_rate": 0.0002406919898492011, - "loss": 0.0203, + "epoch": 0.2, + "learning_rate": 0.0002695280482968316, + "loss": 0.0205, "step": 78370 }, { - "epoch": 0.4, - "learning_rate": 0.00024068442215618708, - "loss": 0.0144, + "epoch": 0.2, + "learning_rate": 0.00026952416008046016, + "loss": 0.0267, "step": 78380 }, { - "epoch": 0.4, - "learning_rate": 0.00024067685446317307, - "loss": 0.016, + "epoch": 0.2, + "learning_rate": 0.0002695202718640887, + "loss": 0.0332, "step": 78390 }, { - "epoch": 0.4, - "learning_rate": 0.00024066928677015907, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002695163836477172, + "loss": 0.0212, "step": 78400 }, { - "epoch": 0.4, - "learning_rate": 0.00024066171907714506, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002695124954313457, + "loss": 0.0268, "step": 78410 }, { - "epoch": 0.4, - "learning_rate": 0.00024065415138413104, - "loss": 0.0146, + "epoch": 0.2, + "learning_rate": 0.0002695086072149743, + "loss": 0.028, "step": 78420 }, { - "epoch": 0.4, - "learning_rate": 0.00024064658369111705, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.00026950471899860284, + "loss": 0.0267, "step": 78430 }, { - "epoch": 0.4, - "learning_rate": 0.00024063901599810303, - "loss": 0.0161, + "epoch": 0.2, + "learning_rate": 0.00026950083078223136, + "loss": 0.024, "step": 78440 }, { - "epoch": 0.4, - "learning_rate": 0.000240631448305089, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.00026949694256585987, + "loss": 0.0244, "step": 78450 }, { - "epoch": 0.4, - "learning_rate": 0.00024062388061207502, - "loss": 0.0152, + "epoch": 0.2, + "learning_rate": 0.0002694930543494884, + "loss": 0.0251, "step": 78460 }, { - "epoch": 0.4, - "learning_rate": 0.000240616312919061, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.00026948916613311696, + "loss": 0.0189, "step": 78470 }, { - "epoch": 0.4, - "learning_rate": 0.00024060874522604698, - "loss": 0.0223, + "epoch": 0.2, + "learning_rate": 0.00026948527791674547, + "loss": 0.0274, "step": 78480 }, { - "epoch": 0.4, - "learning_rate": 0.00024060117753303296, - "loss": 0.027, + "epoch": 0.2, + "learning_rate": 0.00026948138970037404, + "loss": 0.0277, "step": 78490 }, { - "epoch": 0.4, - "learning_rate": 0.00024059360984001897, - "loss": 0.0212, + "epoch": 0.2, + "learning_rate": 0.00026947750148400255, + "loss": 0.0319, "step": 78500 }, { - "epoch": 0.4, - "learning_rate": 0.00024058604214700495, - "loss": 0.0158, + "epoch": 0.2, + "learning_rate": 0.0002694736132676311, + "loss": 0.0239, "step": 78510 }, { - "epoch": 0.4, - "learning_rate": 0.00024057847445399093, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.00026946972505125964, + "loss": 0.0296, "step": 78520 }, { - "epoch": 0.4, - "learning_rate": 0.00024057090676097694, - "loss": 0.0138, + "epoch": 0.2, + "learning_rate": 0.00026946583683488815, + "loss": 0.0329, "step": 78530 }, { - "epoch": 0.4, - "learning_rate": 0.00024056333906796292, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.00026946194861851667, + "loss": 0.0314, "step": 78540 }, { - "epoch": 0.4, - "learning_rate": 0.0002405557713749489, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.00026945806040214523, + "loss": 0.0246, "step": 78550 }, { - "epoch": 0.4, - "learning_rate": 0.00024054820368193486, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.00026945417218577375, + "loss": 0.0223, "step": 78560 }, { - "epoch": 0.4, - "learning_rate": 0.00024054063598892087, - "loss": 0.0217, + "epoch": 0.2, + "learning_rate": 0.0002694502839694023, + "loss": 0.0225, "step": 78570 }, { - "epoch": 0.4, - "learning_rate": 0.00024053306829590685, - "loss": 0.0209, + "epoch": 0.2, + "learning_rate": 0.00026944639575303083, + "loss": 0.0274, "step": 78580 }, { - "epoch": 0.4, - "learning_rate": 0.00024052550060289283, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.0002694425075366594, + "loss": 0.0273, "step": 78590 }, { - "epoch": 0.4, - "learning_rate": 0.00024051793290987884, - "loss": 0.0198, + "epoch": 0.2, + "learning_rate": 0.0002694386193202879, + "loss": 0.0247, "step": 78600 }, { - "epoch": 0.4, - "learning_rate": 0.00024051036521686482, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00026943473110391643, + "loss": 0.0216, "step": 78610 }, { - "epoch": 0.4, - "learning_rate": 0.0002405027975238508, - "loss": 0.0174, + "epoch": 0.2, + "learning_rate": 0.000269430842887545, + "loss": 0.0239, "step": 78620 }, { - "epoch": 0.4, - "learning_rate": 0.0002404952298308368, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.0002694269546711735, + "loss": 0.0266, "step": 78630 }, { - "epoch": 0.4, - "learning_rate": 0.0002404876621378228, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.0002694230664548021, + "loss": 0.0243, "step": 78640 }, { - "epoch": 0.4, - "learning_rate": 0.00024048009444480877, - "loss": 0.0177, + "epoch": 0.2, + "learning_rate": 0.0002694191782384306, + "loss": 0.0271, "step": 78650 }, { - "epoch": 0.4, - "learning_rate": 0.00024047252675179478, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002694152900220591, + "loss": 0.0225, "step": 78660 }, { - "epoch": 0.4, - "learning_rate": 0.00024046495905878076, - "loss": 0.0197, + "epoch": 0.2, + "learning_rate": 0.0002694114018056876, + "loss": 0.0286, "step": 78670 }, { - "epoch": 0.4, - "learning_rate": 0.00024045739136576674, - "loss": 0.0211, + "epoch": 0.2, + "learning_rate": 0.0002694075135893162, + "loss": 0.0242, "step": 78680 }, { - "epoch": 0.4, - "learning_rate": 0.00024044982367275273, - "loss": 0.0175, + "epoch": 0.2, + "learning_rate": 0.0002694036253729447, + "loss": 0.033, "step": 78690 }, { - "epoch": 0.4, - "learning_rate": 0.00024044225597973873, - "loss": 0.0195, + "epoch": 0.2, + "learning_rate": 0.0002693997371565733, + "loss": 0.0265, "step": 78700 }, { - "epoch": 0.4, - "learning_rate": 0.00024043468828672472, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.0002693958489402018, + "loss": 0.025, "step": 78710 }, { - "epoch": 0.4, - "learning_rate": 0.0002404271205937107, - "loss": 0.0165, + "epoch": 0.2, + "learning_rate": 0.00026939196072383036, + "loss": 0.021, "step": 78720 }, { - "epoch": 0.4, - "learning_rate": 0.0002404195529006967, - "loss": 0.0172, + "epoch": 0.2, + "learning_rate": 0.0002693880725074589, + "loss": 0.0214, "step": 78730 }, { - "epoch": 0.4, - "learning_rate": 0.0002404119852076827, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002693841842910874, + "loss": 0.0197, "step": 78740 }, { - "epoch": 0.4, - "learning_rate": 0.00024040441751466867, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.0002693802960747159, + "loss": 0.0263, "step": 78750 }, { - "epoch": 0.4, - "learning_rate": 0.00024039684982165468, - "loss": 0.0156, + "epoch": 0.2, + "learning_rate": 0.0002693764078583445, + "loss": 0.0234, "step": 78760 }, { - "epoch": 0.4, - "learning_rate": 0.00024038928212864066, - "loss": 0.0173, + "epoch": 0.2, + "learning_rate": 0.00026937251964197304, + "loss": 0.025, "step": 78770 }, { - "epoch": 0.4, - "learning_rate": 0.00024038171443562664, - "loss": 0.0184, + "epoch": 0.2, + "learning_rate": 0.00026936863142560156, + "loss": 0.0254, "step": 78780 }, { - "epoch": 0.4, - "learning_rate": 0.00024037414674261265, - "loss": 0.0189, + "epoch": 0.2, + "learning_rate": 0.00026936474320923007, + "loss": 0.0284, "step": 78790 }, { - "epoch": 0.4, - "learning_rate": 0.00024036657904959863, - "loss": 0.0171, + "epoch": 0.2, + "learning_rate": 0.00026936085499285864, + "loss": 0.0228, "step": 78800 }, { - "epoch": 0.4, - "learning_rate": 0.0002403590113565846, - "loss": 0.0196, + "epoch": 0.2, + "learning_rate": 0.00026935696677648715, + "loss": 0.0291, "step": 78810 }, { - "epoch": 0.4, - "learning_rate": 0.00024035144366357062, - "loss": 0.0153, + "epoch": 0.2, + "learning_rate": 0.00026935307856011567, + "loss": 0.0255, "step": 78820 }, { - "epoch": 0.4, - "learning_rate": 0.0002403438759705566, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.00026934919034374424, + "loss": 0.0222, "step": 78830 }, { - "epoch": 0.4, - "learning_rate": 0.00024033630827754258, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.00026934530212737275, + "loss": 0.0222, "step": 78840 }, { - "epoch": 0.4, - "learning_rate": 0.0002403287405845286, - "loss": 0.0221, + "epoch": 0.2, + "learning_rate": 0.0002693414139110013, + "loss": 0.0233, "step": 78850 }, { - "epoch": 0.4, - "learning_rate": 0.00024032117289151457, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.00026933752569462984, + "loss": 0.0219, "step": 78860 }, { - "epoch": 0.4, - "learning_rate": 0.00024031360519850055, - "loss": 0.0216, + "epoch": 0.2, + "learning_rate": 0.00026933363747825835, + "loss": 0.0258, "step": 78870 }, { - "epoch": 0.4, - "learning_rate": 0.00024030603750548654, - "loss": 0.0176, + "epoch": 0.2, + "learning_rate": 0.0002693297492618869, + "loss": 0.0276, "step": 78880 }, { - "epoch": 0.4, - "learning_rate": 0.00024029846981247254, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.00026932586104551543, + "loss": 0.0231, "step": 78890 }, { - "epoch": 0.4, - "learning_rate": 0.00024029090211945853, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.00026932197282914395, + "loss": 0.0262, "step": 78900 }, { - "epoch": 0.4, - "learning_rate": 0.0002402833344264445, - "loss": 0.0208, + "epoch": 0.2, + "learning_rate": 0.0002693180846127725, + "loss": 0.0211, "step": 78910 }, { - "epoch": 0.4, - "learning_rate": 0.00024027576673343052, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.00026931419639640103, + "loss": 0.0238, "step": 78920 }, { - "epoch": 0.4, - "learning_rate": 0.0002402681990404165, - "loss": 0.0192, + "epoch": 0.2, + "learning_rate": 0.0002693103081800296, + "loss": 0.0312, "step": 78930 }, { - "epoch": 0.4, - "learning_rate": 0.00024026063134740248, - "loss": 0.0141, + "epoch": 0.2, + "learning_rate": 0.0002693064199636581, + "loss": 0.0219, "step": 78940 }, { - "epoch": 0.4, - "learning_rate": 0.0002402530636543885, - "loss": 0.0166, + "epoch": 0.2, + "learning_rate": 0.00026930253174728663, + "loss": 0.0204, "step": 78950 }, { - "epoch": 0.4, - "learning_rate": 0.00024024549596137447, - "loss": 0.0179, + "epoch": 0.2, + "learning_rate": 0.00026929864353091514, + "loss": 0.0251, "step": 78960 }, { - "epoch": 0.4, - "learning_rate": 0.00024023792826836045, - "loss": 0.0154, + "epoch": 0.2, + "learning_rate": 0.0002692947553145437, + "loss": 0.0263, "step": 78970 }, { - "epoch": 0.4, - "learning_rate": 0.00024023036057534646, - "loss": 0.0157, + "epoch": 0.2, + "learning_rate": 0.0002692908670981723, + "loss": 0.0219, "step": 78980 }, { - "epoch": 0.4, - "learning_rate": 0.00024022279288233244, - "loss": 0.0167, + "epoch": 0.2, + "learning_rate": 0.0002692869788818008, + "loss": 0.0273, "step": 78990 }, { - "epoch": 0.4, - "learning_rate": 0.00024021522518931842, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002692830906654293, + "loss": 0.0241, "step": 79000 }, { - "epoch": 0.4, - "eval_cer": 0.914508101352053, - "eval_loss": 0.012615088373422623, - "eval_runtime": 116.5859, - "eval_samples_per_second": 17.155, - "eval_steps_per_second": 4.289, + "epoch": 0.2, + "eval_cer": 0.8817754674437451, + "eval_loss": 0.017790012061595917, + "eval_runtime": 107.9618, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, "step": 79000 }, { - "epoch": 0.4, - "learning_rate": 0.00024020765749630443, - "loss": 0.0181, + "epoch": 0.2, + "learning_rate": 0.0002692792024490579, + "loss": 0.0259, "step": 79010 }, { - "epoch": 0.4, - "learning_rate": 0.0002402000898032904, - "loss": 0.0182, + "epoch": 0.2, + "learning_rate": 0.0002692753142326864, + "loss": 0.0266, "step": 79020 }, { - "epoch": 0.4, - "learning_rate": 0.0002401925221102764, - "loss": 0.0178, + "epoch": 0.2, + "learning_rate": 0.0002692714260163149, + "loss": 0.027, "step": 79030 }, { - "epoch": 0.4, - "learning_rate": 0.00024018495441726237, - "loss": 0.019, + "epoch": 0.2, + "learning_rate": 0.0002692675377999435, + "loss": 0.0262, "step": 79040 }, { - "epoch": 0.4, - "learning_rate": 0.00024017738672424838, - "loss": 0.0146, + "epoch": 0.2, + "learning_rate": 0.000269263649583572, + "loss": 0.0243, "step": 79050 }, { - "epoch": 0.4, - "learning_rate": 0.00024016981903123436, - "loss": 0.0158, + "epoch": 0.2, + "learning_rate": 0.00026925976136720056, + "loss": 0.0239, "step": 79060 }, { - "epoch": 0.4, - "learning_rate": 0.00024016225133822035, - "loss": 0.018, + "epoch": 0.2, + "learning_rate": 0.0002692558731508291, + "loss": 0.0233, "step": 79070 }, { - "epoch": 0.4, - "learning_rate": 0.00024015468364520635, - "loss": 0.0188, + "epoch": 0.2, + "learning_rate": 0.0002692519849344576, + "loss": 0.0212, "step": 79080 }, { - "epoch": 0.4, - "learning_rate": 0.00024014711595219234, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026924809671808616, + "loss": 0.0258, "step": 79090 }, { - "epoch": 0.4, - "learning_rate": 0.00024013954825917832, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026924420850171467, + "loss": 0.0214, "step": 79100 }, { - "epoch": 0.4, - "learning_rate": 0.00024013198056616433, - "loss": 0.0146, + "epoch": 0.21, + "learning_rate": 0.00026924032028534324, + "loss": 0.025, "step": 79110 }, { - "epoch": 0.4, - "learning_rate": 0.0002401244128731503, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026923643206897176, + "loss": 0.0282, "step": 79120 }, { - "epoch": 0.4, - "learning_rate": 0.0002401168451801363, - "loss": 0.0132, + "epoch": 0.21, + "learning_rate": 0.0002692325438526003, + "loss": 0.0258, "step": 79130 }, { - "epoch": 0.4, - "learning_rate": 0.0002401092774871223, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.00026922865563622884, + "loss": 0.0238, "step": 79140 }, { - "epoch": 0.4, - "learning_rate": 0.00024010170979410828, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026922476741985735, + "loss": 0.0249, "step": 79150 }, { - "epoch": 0.4, - "learning_rate": 0.00024009414210109426, - "loss": 0.022, + "epoch": 0.21, + "learning_rate": 0.00026922087920348587, + "loss": 0.0255, "step": 79160 }, { - "epoch": 0.4, - "learning_rate": 0.00024008657440808027, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026921699098711444, + "loss": 0.0265, "step": 79170 }, { - "epoch": 0.4, - "learning_rate": 0.00024007900671506625, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.00026921310277074295, + "loss": 0.0283, "step": 79180 }, { - "epoch": 0.4, - "learning_rate": 0.00024007143902205223, - "loss": 0.0208, + "epoch": 0.21, + "learning_rate": 0.0002692092145543715, + "loss": 0.0265, "step": 79190 }, { - "epoch": 0.4, - "learning_rate": 0.0002400638713290382, - "loss": 0.0177, + "epoch": 0.21, + "learning_rate": 0.00026920532633800003, + "loss": 0.0229, "step": 79200 }, { - "epoch": 0.4, - "learning_rate": 0.00024005630363602422, - "loss": 0.0155, + "epoch": 0.21, + "learning_rate": 0.00026920143812162855, + "loss": 0.0229, "step": 79210 }, { - "epoch": 0.4, - "learning_rate": 0.0002400487359430102, - "loss": 0.0171, + "epoch": 0.21, + "learning_rate": 0.0002691975499052571, + "loss": 0.0223, "step": 79220 }, { - "epoch": 0.4, - "learning_rate": 0.00024004116824999618, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.00026919366168888563, + "loss": 0.0247, "step": 79230 }, { - "epoch": 0.4, - "learning_rate": 0.0002400336005569822, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.00026918977347251415, + "loss": 0.0247, "step": 79240 }, { - "epoch": 0.4, - "learning_rate": 0.00024002603286396817, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.0002691858852561427, + "loss": 0.031, "step": 79250 }, { - "epoch": 0.4, - "learning_rate": 0.00024001846517095416, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.0002691819970397713, + "loss": 0.0256, "step": 79260 }, { - "epoch": 0.4, - "learning_rate": 0.00024001089747794016, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.0002691781088233998, + "loss": 0.02, "step": 79270 }, { - "epoch": 0.4, - "learning_rate": 0.00024000332978492615, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.0002691742206070283, + "loss": 0.0285, "step": 79280 }, { - "epoch": 0.4, - "learning_rate": 0.00023999576209191213, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026917033239065683, + "loss": 0.0251, "step": 79290 }, { - "epoch": 0.4, - "learning_rate": 0.00023998819439889814, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.0002691664441742854, + "loss": 0.0223, "step": 79300 }, { - "epoch": 0.4, - "learning_rate": 0.00023998062670588412, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.0002691625559579139, + "loss": 0.0252, "step": 79310 }, { - "epoch": 0.4, - "learning_rate": 0.0002399730590128701, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002691586677415425, + "loss": 0.0218, "step": 79320 }, { - "epoch": 0.4, - "learning_rate": 0.0002399654913198561, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.000269154779525171, + "loss": 0.0254, "step": 79330 }, { - "epoch": 0.4, - "learning_rate": 0.0002399579236268421, - "loss": 0.0147, + "epoch": 0.21, + "learning_rate": 0.00026915089130879956, + "loss": 0.0257, "step": 79340 }, { - "epoch": 0.4, - "learning_rate": 0.00023995035593382807, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.0002691470030924281, + "loss": 0.0242, "step": 79350 }, { - "epoch": 0.4, - "learning_rate": 0.00023994278824081408, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.0002691431148760566, + "loss": 0.0252, "step": 79360 }, { - "epoch": 0.4, - "learning_rate": 0.00023993522054780006, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.0002691392266596851, + "loss": 0.0261, "step": 79370 }, { - "epoch": 0.4, - "learning_rate": 0.00023992765285478604, - "loss": 0.0152, + "epoch": 0.21, + "learning_rate": 0.0002691353384433137, + "loss": 0.027, "step": 79380 }, { - "epoch": 0.4, - "learning_rate": 0.00023992008516177202, - "loss": 0.0155, + "epoch": 0.21, + "learning_rate": 0.0002691314502269422, + "loss": 0.0243, "step": 79390 }, { - "epoch": 0.4, - "learning_rate": 0.00023991251746875803, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.00026912756201057076, + "loss": 0.0222, "step": 79400 }, { - "epoch": 0.4, - "learning_rate": 0.000239904949775744, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.0002691236737941993, + "loss": 0.024, "step": 79410 }, { - "epoch": 0.4, - "learning_rate": 0.00023989738208273, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.0002691197855778278, + "loss": 0.0287, "step": 79420 }, { - "epoch": 0.4, - "learning_rate": 0.000239889814389716, - "loss": 0.0262, + "epoch": 0.21, + "learning_rate": 0.00026911589736145636, + "loss": 0.0185, "step": 79430 }, { - "epoch": 0.4, - "learning_rate": 0.00023988224669670198, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026911200914508487, + "loss": 0.0211, "step": 79440 }, { - "epoch": 0.4, - "learning_rate": 0.00023987467900368797, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.0002691081209287134, + "loss": 0.0209, "step": 79450 }, { - "epoch": 0.4, - "learning_rate": 0.00023986711131067397, - "loss": 0.0218, + "epoch": 0.21, + "learning_rate": 0.00026910423271234195, + "loss": 0.0275, "step": 79460 }, { - "epoch": 0.4, - "learning_rate": 0.00023985954361765996, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.0002691003444959705, + "loss": 0.0258, "step": 79470 }, { - "epoch": 0.4, - "learning_rate": 0.00023985197592464594, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026909645627959904, + "loss": 0.0275, "step": 79480 }, { - "epoch": 0.4, - "learning_rate": 0.00023984440823163195, - "loss": 0.0144, + "epoch": 0.21, + "learning_rate": 0.00026909256806322755, + "loss": 0.0215, "step": 79490 }, { - "epoch": 0.4, - "learning_rate": 0.00023983684053861793, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026908867984685607, + "loss": 0.0251, "step": 79500 }, { - "epoch": 0.4, - "learning_rate": 0.0002398292728456039, - "loss": 0.0156, + "epoch": 0.21, + "learning_rate": 0.00026908479163048464, + "loss": 0.025, "step": 79510 }, { - "epoch": 0.4, - "learning_rate": 0.00023982170515258992, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.00026908090341411315, + "loss": 0.0206, "step": 79520 }, { - "epoch": 0.4, - "learning_rate": 0.0002398141374595759, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002690770151977417, + "loss": 0.0224, "step": 79530 }, { - "epoch": 0.4, - "learning_rate": 0.00023980656976656188, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.00026907312698137023, + "loss": 0.0213, "step": 79540 }, { - "epoch": 0.4, - "learning_rate": 0.00023979900207354786, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.0002690692387649988, + "loss": 0.021, "step": 79550 }, { - "epoch": 0.4, - "learning_rate": 0.00023979143438053387, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.0002690653505486273, + "loss": 0.0197, "step": 79560 }, { - "epoch": 0.4, - "learning_rate": 0.00023978386668751985, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.00026906146233225583, + "loss": 0.0188, "step": 79570 }, { - "epoch": 0.4, - "learning_rate": 0.00023977629899450583, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.00026905757411588435, + "loss": 0.0249, "step": 79580 }, { - "epoch": 0.4, - "learning_rate": 0.00023976873130149184, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.0002690536858995129, + "loss": 0.0222, "step": 79590 }, { - "epoch": 0.4, - "learning_rate": 0.00023976116360847782, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.00026904979768314143, + "loss": 0.0225, "step": 79600 }, { - "epoch": 0.4, - "learning_rate": 0.0002397535959154638, - "loss": 0.0217, + "epoch": 0.21, + "learning_rate": 0.00026904590946677, + "loss": 0.0253, "step": 79610 }, { - "epoch": 0.4, - "learning_rate": 0.0002397460282224498, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.0002690420212503985, + "loss": 0.0293, "step": 79620 }, { - "epoch": 0.4, - "learning_rate": 0.0002397384605294358, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.0002690381330340271, + "loss": 0.0268, "step": 79630 }, { - "epoch": 0.4, - "learning_rate": 0.00023973089283642178, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.0002690342448176556, + "loss": 0.0221, "step": 79640 }, { - "epoch": 0.4, - "learning_rate": 0.00023972332514340778, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002690303566012841, + "loss": 0.0226, "step": 79650 }, { - "epoch": 0.4, - "learning_rate": 0.00023971575745039377, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.0002690264683849127, + "loss": 0.027, "step": 79660 }, { - "epoch": 0.4, - "learning_rate": 0.00023970818975737975, - "loss": 0.0147, + "epoch": 0.21, + "learning_rate": 0.0002690225801685412, + "loss": 0.026, "step": 79670 }, { - "epoch": 0.4, - "learning_rate": 0.00023970062206436576, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026901869195216976, + "loss": 0.0233, "step": 79680 }, { - "epoch": 0.4, - "learning_rate": 0.00023969305437135174, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.0002690148037357983, + "loss": 0.0224, "step": 79690 }, { - "epoch": 0.4, - "learning_rate": 0.00023968548667833772, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002690109155194268, + "loss": 0.0222, "step": 79700 }, { - "epoch": 0.4, - "learning_rate": 0.0002396779189853237, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002690070273030553, + "loss": 0.0287, "step": 79710 }, { - "epoch": 0.4, - "learning_rate": 0.0002396703512923097, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.0002690031390866839, + "loss": 0.0246, "step": 79720 }, { - "epoch": 0.4, - "learning_rate": 0.0002396627835992957, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.0002689992508703124, + "loss": 0.0276, "step": 79730 }, { - "epoch": 0.4, - "learning_rate": 0.00023965521590628167, - "loss": 0.0141, + "epoch": 0.21, + "learning_rate": 0.00026899536265394096, + "loss": 0.0239, "step": 79740 }, { - "epoch": 0.4, - "learning_rate": 0.00023964764821326768, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.00026899147443756947, + "loss": 0.0272, "step": 79750 }, { - "epoch": 0.4, - "learning_rate": 0.00023964008052025366, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.00026898758622119804, + "loss": 0.023, "step": 79760 }, { - "epoch": 0.4, - "learning_rate": 0.00023963251282723964, - "loss": 0.0156, + "epoch": 0.21, + "learning_rate": 0.00026898369800482656, + "loss": 0.0254, "step": 79770 }, { - "epoch": 0.4, - "learning_rate": 0.00023962494513422565, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.00026897980978845507, + "loss": 0.0278, "step": 79780 }, { - "epoch": 0.4, - "learning_rate": 0.00023961737744121163, - "loss": 0.0144, + "epoch": 0.21, + "learning_rate": 0.0002689759215720836, + "loss": 0.0205, "step": 79790 }, { - "epoch": 0.4, - "learning_rate": 0.00023960980974819761, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.00026897203335571215, + "loss": 0.0228, "step": 79800 }, { - "epoch": 0.4, - "learning_rate": 0.00023960224205518362, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.0002689681451393407, + "loss": 0.026, "step": 79810 }, { - "epoch": 0.4, - "learning_rate": 0.00023959467436216958, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026896425692296924, + "loss": 0.0258, "step": 79820 }, { - "epoch": 0.4, - "learning_rate": 0.00023958710666915556, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.00026896036870659775, + "loss": 0.0226, "step": 79830 }, { - "epoch": 0.4, - "learning_rate": 0.00023957953897614154, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002689564804902263, + "loss": 0.0205, "step": 79840 }, { - "epoch": 0.4, - "learning_rate": 0.00023957197128312755, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.00026895259227385483, + "loss": 0.0295, "step": 79850 }, { - "epoch": 0.4, - "learning_rate": 0.00023956440359011353, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.00026894870405748335, + "loss": 0.025, "step": 79860 }, { - "epoch": 0.4, - "learning_rate": 0.0002395568358970995, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.0002689448158411119, + "loss": 0.0289, "step": 79870 }, { - "epoch": 0.4, - "learning_rate": 0.00023954926820408552, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.00026894092762474043, + "loss": 0.0245, "step": 79880 }, { - "epoch": 0.4, - "learning_rate": 0.0002395417005110715, - "loss": 0.0226, + "epoch": 0.21, + "learning_rate": 0.000268937039408369, + "loss": 0.0288, "step": 79890 }, { - "epoch": 0.4, - "learning_rate": 0.00023953413281805748, - "loss": 0.0207, + "epoch": 0.21, + "learning_rate": 0.0002689331511919975, + "loss": 0.0215, "step": 79900 }, { - "epoch": 0.4, - "learning_rate": 0.0002395265651250435, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026892926297562603, + "loss": 0.0312, "step": 79910 }, { - "epoch": 0.4, - "learning_rate": 0.00023951899743202947, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.00026892537475925454, + "loss": 0.0261, "step": 79920 }, { - "epoch": 0.4, - "learning_rate": 0.00023951142973901545, - "loss": 0.0228, + "epoch": 0.21, + "learning_rate": 0.0002689214865428831, + "loss": 0.0219, "step": 79930 }, { - "epoch": 0.4, - "learning_rate": 0.00023950386204600144, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026891759832651163, + "loss": 0.0242, "step": 79940 }, { - "epoch": 0.4, - "learning_rate": 0.00023949629435298744, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002689137101101402, + "loss": 0.0259, "step": 79950 }, { - "epoch": 0.4, - "learning_rate": 0.00023948872665997343, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002689098218937687, + "loss": 0.0296, "step": 79960 }, { - "epoch": 0.4, - "learning_rate": 0.0002394811589669594, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002689059336773973, + "loss": 0.0249, "step": 79970 }, { - "epoch": 0.4, - "learning_rate": 0.00023947359127394542, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.0002689020454610258, + "loss": 0.0232, "step": 79980 }, { - "epoch": 0.4, - "learning_rate": 0.0002394660235809314, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.0002688981572446543, + "loss": 0.0199, "step": 79990 }, { - "epoch": 0.4, - "learning_rate": 0.00023945845588791738, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.0002688942690282828, + "loss": 0.0253, "step": 80000 }, { - "epoch": 0.4, - "eval_cer": 0.9145207165016832, - "eval_loss": 0.012683646753430367, - "eval_runtime": 116.5374, - "eval_samples_per_second": 17.162, - "eval_steps_per_second": 4.29, + "epoch": 0.21, + "eval_cer": 0.8818090587301654, + "eval_loss": 0.01771540753543377, + "eval_runtime": 108.1716, + "eval_samples_per_second": 18.489, + "eval_steps_per_second": 4.622, "step": 80000 }, { - "epoch": 0.4, - "learning_rate": 0.0002394508881949034, - "loss": 0.021, + "epoch": 0.21, + "learning_rate": 0.0002688903808119114, + "loss": 0.0206, "step": 80010 }, { - "epoch": 0.4, - "learning_rate": 0.00023944332050188937, - "loss": 0.0137, + "epoch": 0.21, + "learning_rate": 0.00026888649259553996, + "loss": 0.0233, "step": 80020 }, { - "epoch": 0.4, - "learning_rate": 0.00023943575280887535, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002688826043791685, + "loss": 0.0202, "step": 80030 }, { - "epoch": 0.4, - "learning_rate": 0.00023942818511586136, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.000268878716162797, + "loss": 0.0244, "step": 80040 }, { - "epoch": 0.4, - "learning_rate": 0.00023942061742284734, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.00026887482794642556, + "loss": 0.0195, "step": 80050 }, { - "epoch": 0.4, - "learning_rate": 0.00023941304972983332, - "loss": 0.0149, + "epoch": 0.21, + "learning_rate": 0.0002688709397300541, + "loss": 0.0162, "step": 80060 }, { - "epoch": 0.4, - "learning_rate": 0.00023940548203681933, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002688670515136826, + "loss": 0.0295, "step": 80070 }, { - "epoch": 0.4, - "learning_rate": 0.0002393979143438053, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026886316329731116, + "loss": 0.0213, "step": 80080 }, { - "epoch": 0.4, - "learning_rate": 0.0002393903466507913, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.00026885927508093967, + "loss": 0.021, "step": 80090 }, { - "epoch": 0.4, - "learning_rate": 0.00023938277895777727, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026885538686456824, + "loss": 0.0259, "step": 80100 }, { - "epoch": 0.4, - "learning_rate": 0.00023937521126476328, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.00026885149864819675, + "loss": 0.0232, "step": 80110 }, { - "epoch": 0.4, - "learning_rate": 0.00023936764357174926, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026884761043182527, + "loss": 0.0244, "step": 80120 }, { - "epoch": 0.4, - "learning_rate": 0.00023936007587873525, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026884372221545384, + "loss": 0.0244, "step": 80130 }, { - "epoch": 0.4, - "learning_rate": 0.00023935250818572125, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026883983399908235, + "loss": 0.0239, "step": 80140 }, { - "epoch": 0.4, - "learning_rate": 0.00023934494049270724, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.00026883594578271087, + "loss": 0.0205, "step": 80150 }, { - "epoch": 0.4, - "learning_rate": 0.00023933737279969322, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.00026883205756633944, + "loss": 0.0288, "step": 80160 }, { - "epoch": 0.4, - "learning_rate": 0.00023932980510667923, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.00026882816934996795, + "loss": 0.0231, "step": 80170 }, { - "epoch": 0.4, - "learning_rate": 0.0002393222374136652, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002688242811335965, + "loss": 0.0256, "step": 80180 }, { - "epoch": 0.4, - "learning_rate": 0.0002393146697206512, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026882039291722503, + "loss": 0.028, "step": 80190 }, { - "epoch": 0.4, - "learning_rate": 0.0002393071020276372, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.00026881650470085355, + "loss": 0.0248, "step": 80200 }, { - "epoch": 0.4, - "learning_rate": 0.00023929953433462318, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.0002688126164844821, + "loss": 0.0229, "step": 80210 }, { - "epoch": 0.4, - "learning_rate": 0.00023929196664160916, - "loss": 0.0128, + "epoch": 0.21, + "learning_rate": 0.00026880872826811063, + "loss": 0.0225, "step": 80220 }, { - "epoch": 0.4, - "learning_rate": 0.00023928439894859517, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002688048400517392, + "loss": 0.0298, "step": 80230 }, { - "epoch": 0.4, - "learning_rate": 0.00023927683125558115, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.0002688009518353677, + "loss": 0.0234, "step": 80240 }, { - "epoch": 0.4, - "learning_rate": 0.00023926926356256713, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.00026879706361899623, + "loss": 0.0267, "step": 80250 }, { - "epoch": 0.4, - "learning_rate": 0.00023926169586955314, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.0002687931754026248, + "loss": 0.022, "step": 80260 }, { - "epoch": 0.4, - "learning_rate": 0.00023925412817653912, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.0002687892871862533, + "loss": 0.0261, "step": 80270 }, { - "epoch": 0.41, - "learning_rate": 0.0002392465604835251, - "loss": 0.0347, + "epoch": 0.21, + "learning_rate": 0.0002687853989698818, + "loss": 0.0239, "step": 80280 }, { - "epoch": 0.41, - "learning_rate": 0.00023923899279051108, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002687815107535104, + "loss": 0.0229, "step": 80290 }, { - "epoch": 0.41, - "learning_rate": 0.0002392314250974971, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.00026877762253713896, + "loss": 0.0238, "step": 80300 }, { - "epoch": 0.41, - "learning_rate": 0.00023922385740448307, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.0002687737343207675, + "loss": 0.0266, "step": 80310 }, { - "epoch": 0.41, - "learning_rate": 0.00023921628971146906, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.000268769846104396, + "loss": 0.0316, "step": 80320 }, { - "epoch": 0.41, - "learning_rate": 0.00023920872201845506, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002687659578880245, + "loss": 0.0255, "step": 80330 }, { - "epoch": 0.41, - "learning_rate": 0.00023920115432544105, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002687620696716531, + "loss": 0.0261, "step": 80340 }, { - "epoch": 0.41, - "learning_rate": 0.00023919358663242703, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.0002687581814552816, + "loss": 0.0289, "step": 80350 }, { - "epoch": 0.41, - "learning_rate": 0.00023918601893941304, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.00026875429323891016, + "loss": 0.0235, "step": 80360 }, { - "epoch": 0.41, - "learning_rate": 0.00023917845124639902, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.0002687504050225387, + "loss": 0.0204, "step": 80370 }, { - "epoch": 0.41, - "learning_rate": 0.000239170883553385, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026874651680616724, + "loss": 0.021, "step": 80380 }, { - "epoch": 0.41, - "learning_rate": 0.000239163315860371, - "loss": 0.0207, + "epoch": 0.21, + "learning_rate": 0.00026874262858979576, + "loss": 0.0264, "step": 80390 }, { - "epoch": 0.41, - "learning_rate": 0.000239155748167357, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026873874037342427, + "loss": 0.0289, "step": 80400 }, { - "epoch": 0.41, - "learning_rate": 0.00023914818047434297, - "loss": 0.0211, + "epoch": 0.21, + "learning_rate": 0.0002687348521570528, + "loss": 0.0291, "step": 80410 }, { - "epoch": 0.41, - "learning_rate": 0.00023914061278132898, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.00026873096394068136, + "loss": 0.0233, "step": 80420 }, { - "epoch": 0.41, - "learning_rate": 0.00023913304508831496, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026872707572430987, + "loss": 0.0228, "step": 80430 }, { - "epoch": 0.41, - "learning_rate": 0.00023912547739530094, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026872318750793844, + "loss": 0.0233, "step": 80440 }, { - "epoch": 0.41, - "learning_rate": 0.00023911790970228692, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.00026871929929156695, + "loss": 0.0229, "step": 80450 }, { - "epoch": 0.41, - "learning_rate": 0.00023911034200927293, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.00026871541107519547, + "loss": 0.0239, "step": 80460 }, { - "epoch": 0.41, - "learning_rate": 0.0002391027743162589, - "loss": 0.0227, + "epoch": 0.21, + "learning_rate": 0.00026871152285882404, + "loss": 0.0268, "step": 80470 }, { - "epoch": 0.41, - "learning_rate": 0.0002390952066232449, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.00026870763464245255, + "loss": 0.0241, "step": 80480 }, { - "epoch": 0.41, - "learning_rate": 0.0002390876389302309, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.00026870374642608107, + "loss": 0.0224, "step": 80490 }, { - "epoch": 0.41, - "learning_rate": 0.00023908007123721688, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.00026869985820970963, + "loss": 0.0305, "step": 80500 }, { - "epoch": 0.41, - "learning_rate": 0.00023907250354420287, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.0002686959699933382, + "loss": 0.0272, "step": 80510 }, { - "epoch": 0.41, - "learning_rate": 0.00023906493585118887, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002686920817769667, + "loss": 0.0247, "step": 80520 }, { - "epoch": 0.41, - "learning_rate": 0.00023905736815817486, - "loss": 0.0196, + "epoch": 0.21, + "learning_rate": 0.00026868819356059523, + "loss": 0.0258, "step": 80530 }, { - "epoch": 0.41, - "learning_rate": 0.00023904980046516084, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026868430534422375, + "loss": 0.0274, "step": 80540 }, { - "epoch": 0.41, - "learning_rate": 0.00023904223277214685, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002686804171278523, + "loss": 0.0269, "step": 80550 }, { - "epoch": 0.41, - "learning_rate": 0.00023903466507913283, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.00026867652891148083, + "loss": 0.0221, "step": 80560 }, { - "epoch": 0.41, - "learning_rate": 0.0002390270973861188, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002686726406951094, + "loss": 0.0266, "step": 80570 }, { - "epoch": 0.41, - "learning_rate": 0.00023901952969310482, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.0002686687524787379, + "loss": 0.0226, "step": 80580 }, { - "epoch": 0.41, - "learning_rate": 0.0002390119620000908, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.0002686648642623665, + "loss": 0.0207, "step": 80590 }, { - "epoch": 0.41, - "learning_rate": 0.00023900439430707678, - "loss": 0.0153, + "epoch": 0.21, + "learning_rate": 0.000268660976045995, + "loss": 0.0244, "step": 80600 }, { - "epoch": 0.41, - "learning_rate": 0.00023899682661406276, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.0002686570878296235, + "loss": 0.0246, "step": 80610 }, { - "epoch": 0.41, - "learning_rate": 0.00023898925892104877, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.000268653199613252, + "loss": 0.0276, "step": 80620 }, { - "epoch": 0.41, - "learning_rate": 0.00023898169122803475, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002686493113968806, + "loss": 0.0243, "step": 80630 }, { - "epoch": 0.41, - "learning_rate": 0.00023897412353502073, - "loss": 0.015, + "epoch": 0.21, + "learning_rate": 0.0002686454231805091, + "loss": 0.0217, "step": 80640 }, { - "epoch": 0.41, - "learning_rate": 0.00023896655584200674, - "loss": 0.0205, + "epoch": 0.21, + "learning_rate": 0.0002686415349641377, + "loss": 0.0237, "step": 80650 }, { - "epoch": 0.41, - "learning_rate": 0.00023895898814899272, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.0002686376467477662, + "loss": 0.0202, "step": 80660 }, { - "epoch": 0.41, - "learning_rate": 0.0002389514204559787, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002686337585313947, + "loss": 0.0207, "step": 80670 }, { - "epoch": 0.41, - "learning_rate": 0.0002389438527629647, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002686298703150233, + "loss": 0.021, "step": 80680 }, { - "epoch": 0.41, - "learning_rate": 0.0002389362850699507, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.0002686259820986518, + "loss": 0.0253, "step": 80690 }, { - "epoch": 0.41, - "learning_rate": 0.00023892871737693668, - "loss": 0.015, + "epoch": 0.21, + "learning_rate": 0.00026862209388228036, + "loss": 0.0223, "step": 80700 }, { - "epoch": 0.41, - "learning_rate": 0.00023892114968392268, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026861820566590887, + "loss": 0.0203, "step": 80710 }, { - "epoch": 0.41, - "learning_rate": 0.00023891358199090867, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.00026861431744953744, + "loss": 0.0216, "step": 80720 }, { - "epoch": 0.41, - "learning_rate": 0.00023890601429789465, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026861042923316596, + "loss": 0.0259, "step": 80730 }, { - "epoch": 0.41, - "learning_rate": 0.00023889844660488066, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.00026860654101679447, + "loss": 0.025, "step": 80740 }, { - "epoch": 0.41, - "learning_rate": 0.00023889087891186664, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.000268602652800423, + "loss": 0.0214, "step": 80750 }, { - "epoch": 0.41, - "learning_rate": 0.00023888331121885262, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.00026859876458405155, + "loss": 0.0232, "step": 80760 }, { - "epoch": 0.41, - "learning_rate": 0.00023887574352583863, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.00026859487636768007, + "loss": 0.0255, "step": 80770 }, { - "epoch": 0.41, - "learning_rate": 0.0002388681758328246, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.00026859098815130864, + "loss": 0.0276, "step": 80780 }, { - "epoch": 0.41, - "learning_rate": 0.0002388606081398106, - "loss": 0.0165, + "epoch": 0.21, + "learning_rate": 0.00026858709993493715, + "loss": 0.026, "step": 80790 }, { - "epoch": 0.41, - "learning_rate": 0.00023885304044679657, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.0002685832117185657, + "loss": 0.0273, "step": 80800 }, { - "epoch": 0.41, - "learning_rate": 0.00023884547275378258, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.00026857932350219424, + "loss": 0.0227, "step": 80810 }, { - "epoch": 0.41, - "learning_rate": 0.00023883790506076856, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.00026857543528582275, + "loss": 0.0215, "step": 80820 }, { - "epoch": 0.41, - "learning_rate": 0.00023883033736775454, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.00026857154706945126, + "loss": 0.025, "step": 80830 }, { - "epoch": 0.41, - "learning_rate": 0.00023882276967474055, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.00026856765885307983, + "loss": 0.0265, "step": 80840 }, { - "epoch": 0.41, - "learning_rate": 0.00023881520198172653, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.0002685637706367084, + "loss": 0.0239, "step": 80850 }, { - "epoch": 0.41, - "learning_rate": 0.00023880763428871252, - "loss": 0.0255, + "epoch": 0.21, + "learning_rate": 0.0002685598824203369, + "loss": 0.0307, "step": 80860 }, { - "epoch": 0.41, - "learning_rate": 0.00023880006659569852, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.00026855599420396543, + "loss": 0.0375, "step": 80870 }, { - "epoch": 0.41, - "learning_rate": 0.0002387924989026845, - "loss": 0.0139, + "epoch": 0.21, + "learning_rate": 0.000268552105987594, + "loss": 0.0256, "step": 80880 }, { - "epoch": 0.41, - "learning_rate": 0.0002387849312096705, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.0002685482177712225, + "loss": 0.0243, "step": 80890 }, { - "epoch": 0.41, - "learning_rate": 0.0002387773635166565, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.00026854432955485103, + "loss": 0.0195, "step": 80900 }, { - "epoch": 0.41, - "learning_rate": 0.00023876979582364248, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.0002685404413384796, + "loss": 0.0251, "step": 80910 }, { - "epoch": 0.41, - "learning_rate": 0.00023876222813062846, - "loss": 0.0137, + "epoch": 0.21, + "learning_rate": 0.0002685365531221081, + "loss": 0.0241, "step": 80920 }, { - "epoch": 0.41, - "learning_rate": 0.00023875466043761447, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002685326649057367, + "loss": 0.0263, "step": 80930 }, { - "epoch": 0.41, - "learning_rate": 0.00023874709274460045, - "loss": 0.015, + "epoch": 0.21, + "learning_rate": 0.0002685287766893652, + "loss": 0.0248, "step": 80940 }, { - "epoch": 0.41, - "learning_rate": 0.00023873952505158643, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.0002685248884729937, + "loss": 0.0218, "step": 80950 }, { - "epoch": 0.41, - "learning_rate": 0.0002387319573585724, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002685210002566222, + "loss": 0.0239, "step": 80960 }, { - "epoch": 0.41, - "learning_rate": 0.00023872438966555842, - "loss": 0.0209, + "epoch": 0.21, + "learning_rate": 0.0002685171120402508, + "loss": 0.0267, "step": 80970 }, { - "epoch": 0.41, - "learning_rate": 0.0002387168219725444, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.0002685132238238793, + "loss": 0.0225, "step": 80980 }, { - "epoch": 0.41, - "learning_rate": 0.00023870925427953038, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.0002685093356075079, + "loss": 0.0234, "step": 80990 }, { - "epoch": 0.41, - "learning_rate": 0.0002387016865865164, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.0002685054473911364, + "loss": 0.0252, "step": 81000 }, { - "epoch": 0.41, - "eval_cer": 0.9145090717481783, - "eval_loss": 0.012487111613154411, - "eval_runtime": 116.7617, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.21, + "eval_cer": 0.8817964619977577, + "eval_loss": 0.017585597932338715, + "eval_runtime": 107.7913, + "eval_samples_per_second": 18.554, + "eval_steps_per_second": 4.639, "step": 81000 }, { - "epoch": 0.41, - "learning_rate": 0.00023869411889350237, - "loss": 0.0197, + "epoch": 0.21, + "learning_rate": 0.00026850155917476496, + "loss": 0.0256, "step": 81010 }, { - "epoch": 0.41, - "learning_rate": 0.00023868655120048835, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.0002684976709583935, + "loss": 0.021, "step": 81020 }, { - "epoch": 0.41, - "learning_rate": 0.00023867898350747436, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.000268493782742022, + "loss": 0.0247, "step": 81030 }, { - "epoch": 0.41, - "learning_rate": 0.00023867141581446034, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.0002684898945256505, + "loss": 0.0239, "step": 81040 }, { - "epoch": 0.41, - "learning_rate": 0.00023866384812144633, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.00026848600630927907, + "loss": 0.0215, "step": 81050 }, { - "epoch": 0.41, - "learning_rate": 0.00023865628042843233, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.00026848211809290764, + "loss": 0.0254, "step": 81060 }, { - "epoch": 0.41, - "learning_rate": 0.0002386487127354183, - "loss": 0.0177, + "epoch": 0.21, + "learning_rate": 0.00026847822987653615, + "loss": 0.0208, "step": 81070 }, { - "epoch": 0.41, - "learning_rate": 0.00023864114504240427, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026847434166016467, + "loss": 0.0251, "step": 81080 }, { - "epoch": 0.41, - "learning_rate": 0.00023863357734939025, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026847045344379324, + "loss": 0.0246, "step": 81090 }, { - "epoch": 0.41, - "learning_rate": 0.00023862600965637626, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.00026846656522742175, + "loss": 0.0216, "step": 81100 }, { - "epoch": 0.41, - "learning_rate": 0.00023861844196336224, - "loss": 0.0203, + "epoch": 0.21, + "learning_rate": 0.00026846267701105027, + "loss": 0.0236, "step": 81110 }, { - "epoch": 0.41, - "learning_rate": 0.00023861087427034822, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026845878879467884, + "loss": 0.0222, "step": 81120 }, { - "epoch": 0.41, - "learning_rate": 0.00023860330657733423, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.00026845490057830735, + "loss": 0.0254, "step": 81130 }, { - "epoch": 0.41, - "learning_rate": 0.0002385957388843202, - "loss": 0.0222, + "epoch": 0.21, + "learning_rate": 0.0002684510123619359, + "loss": 0.0267, "step": 81140 }, { - "epoch": 0.41, - "learning_rate": 0.0002385881711913062, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.00026844712414556443, + "loss": 0.0208, "step": 81150 }, { - "epoch": 0.41, - "learning_rate": 0.0002385806034982922, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026844323592919295, + "loss": 0.0276, "step": 81160 }, { - "epoch": 0.41, - "learning_rate": 0.00023857303580527818, - "loss": 0.0206, + "epoch": 0.21, + "learning_rate": 0.00026843934771282146, + "loss": 0.0233, "step": 81170 }, { - "epoch": 0.41, - "learning_rate": 0.00023856546811226417, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.00026843545949645003, + "loss": 0.0253, "step": 81180 }, { - "epoch": 0.41, - "learning_rate": 0.00023855790041925015, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026843157128007855, + "loss": 0.0213, "step": 81190 }, { - "epoch": 0.41, - "learning_rate": 0.00023855033272623616, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.0002684276830637071, + "loss": 0.0192, "step": 81200 }, { - "epoch": 0.41, - "learning_rate": 0.00023854276503322214, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.00026842379484733563, + "loss": 0.0233, "step": 81210 }, { - "epoch": 0.41, - "learning_rate": 0.00023853519734020812, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.0002684199066309642, + "loss": 0.0222, "step": 81220 }, { - "epoch": 0.41, - "learning_rate": 0.00023852762964719413, - "loss": 0.0163, + "epoch": 0.21, + "learning_rate": 0.0002684160184145927, + "loss": 0.0248, "step": 81230 }, { - "epoch": 0.41, - "learning_rate": 0.0002385200619541801, - "loss": 0.0138, + "epoch": 0.21, + "learning_rate": 0.00026841213019822123, + "loss": 0.024, "step": 81240 }, { - "epoch": 0.41, - "learning_rate": 0.0002385124942611661, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.0002684082419818498, + "loss": 0.0213, "step": 81250 }, { - "epoch": 0.41, - "learning_rate": 0.0002385049265681521, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.0002684043537654783, + "loss": 0.0247, "step": 81260 }, { - "epoch": 0.41, - "learning_rate": 0.00023849735887513808, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.0002684004655491069, + "loss": 0.0267, "step": 81270 }, { - "epoch": 0.41, - "learning_rate": 0.00023848979118212406, - "loss": 0.0228, + "epoch": 0.21, + "learning_rate": 0.0002683965773327354, + "loss": 0.027, "step": 81280 }, { - "epoch": 0.41, - "learning_rate": 0.00023848222348911007, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.0002683926891163639, + "loss": 0.0223, "step": 81290 }, { - "epoch": 0.41, - "learning_rate": 0.00023847465579609605, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.0002683888008999925, + "loss": 0.0214, "step": 81300 }, { - "epoch": 0.41, - "learning_rate": 0.00023846708810308203, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.000268384912683621, + "loss": 0.0241, "step": 81310 }, { - "epoch": 0.41, - "learning_rate": 0.00023845952041006804, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.0002683810244672495, + "loss": 0.0242, "step": 81320 }, { - "epoch": 0.41, - "learning_rate": 0.00023845195271705402, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.0002683771362508781, + "loss": 0.024, "step": 81330 }, { - "epoch": 0.41, - "learning_rate": 0.00023844438502404, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.0002683732480345066, + "loss": 0.0239, "step": 81340 }, { - "epoch": 0.41, - "learning_rate": 0.00023843681733102599, - "loss": 0.0149, + "epoch": 0.21, + "learning_rate": 0.00026836935981813516, + "loss": 0.0229, "step": 81350 }, { - "epoch": 0.41, - "learning_rate": 0.000238429249638012, - "loss": 0.0195, + "epoch": 0.21, + "learning_rate": 0.00026836547160176367, + "loss": 0.0264, "step": 81360 }, { - "epoch": 0.41, - "learning_rate": 0.00023842168194499798, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.0002683615833853922, + "loss": 0.0273, "step": 81370 }, { - "epoch": 0.41, - "learning_rate": 0.00023841411425198396, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.0002683576951690207, + "loss": 0.0276, "step": 81380 }, { - "epoch": 0.41, - "learning_rate": 0.00023840654655896997, - "loss": 0.0145, + "epoch": 0.21, + "learning_rate": 0.00026835380695264927, + "loss": 0.0302, "step": 81390 }, { - "epoch": 0.41, - "learning_rate": 0.00023839897886595595, - "loss": 0.0149, + "epoch": 0.21, + "learning_rate": 0.00026834991873627784, + "loss": 0.0264, "step": 81400 }, { - "epoch": 0.41, - "learning_rate": 0.00023839141117294193, - "loss": 0.0151, + "epoch": 0.21, + "learning_rate": 0.00026834603051990635, + "loss": 0.0287, "step": 81410 }, { - "epoch": 0.41, - "learning_rate": 0.00023838384347992794, - "loss": 0.0137, + "epoch": 0.21, + "learning_rate": 0.00026834214230353487, + "loss": 0.0202, "step": 81420 }, { - "epoch": 0.41, - "learning_rate": 0.00023837627578691392, - "loss": 0.0121, + "epoch": 0.21, + "learning_rate": 0.00026833825408716344, + "loss": 0.022, "step": 81430 }, { - "epoch": 0.41, - "learning_rate": 0.0002383687080938999, - "loss": 0.0143, + "epoch": 0.21, + "learning_rate": 0.00026833436587079195, + "loss": 0.0267, "step": 81440 }, { - "epoch": 0.41, - "learning_rate": 0.0002383611404008859, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.00026833047765442047, + "loss": 0.0245, "step": 81450 }, { - "epoch": 0.41, - "learning_rate": 0.0002383535727078719, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.00026832658943804903, + "loss": 0.0255, "step": 81460 }, { - "epoch": 0.41, - "learning_rate": 0.00023834600501485787, - "loss": 0.0186, + "epoch": 0.21, + "learning_rate": 0.00026832270122167755, + "loss": 0.0183, "step": 81470 }, { - "epoch": 0.41, - "learning_rate": 0.00023833843732184388, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.0002683188130053061, + "loss": 0.0253, "step": 81480 }, { - "epoch": 0.41, - "learning_rate": 0.00023833086962882986, - "loss": 0.013, + "epoch": 0.21, + "learning_rate": 0.00026831492478893463, + "loss": 0.0228, "step": 81490 }, { - "epoch": 0.41, - "learning_rate": 0.00023832330193581584, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.00026831103657256315, + "loss": 0.0243, "step": 81500 }, { - "epoch": 0.41, - "learning_rate": 0.00023831573424280182, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.0002683071483561917, + "loss": 0.0286, "step": 81510 }, { - "epoch": 0.41, - "learning_rate": 0.00023830816654978783, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.00026830326013982023, + "loss": 0.023, "step": 81520 }, { - "epoch": 0.41, - "learning_rate": 0.00023830059885677381, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.00026829937192344875, + "loss": 0.0234, "step": 81530 }, { - "epoch": 0.41, - "learning_rate": 0.0002382930311637598, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.0002682954837070773, + "loss": 0.0261, "step": 81540 }, { - "epoch": 0.41, - "learning_rate": 0.0002382854634707458, - "loss": 0.0143, + "epoch": 0.21, + "learning_rate": 0.0002682915954907059, + "loss": 0.0257, "step": 81550 }, { - "epoch": 0.41, - "learning_rate": 0.00023827789577773179, - "loss": 0.0163, + "epoch": 0.21, + "learning_rate": 0.0002682877072743344, + "loss": 0.0252, "step": 81560 }, { - "epoch": 0.41, - "learning_rate": 0.00023827032808471777, - "loss": 0.0148, + "epoch": 0.21, + "learning_rate": 0.0002682838190579629, + "loss": 0.0249, "step": 81570 }, { - "epoch": 0.41, - "learning_rate": 0.00023826276039170378, - "loss": 0.0155, + "epoch": 0.21, + "learning_rate": 0.0002682799308415914, + "loss": 0.0251, "step": 81580 }, { - "epoch": 0.41, - "learning_rate": 0.00023825519269868976, - "loss": 0.0201, + "epoch": 0.21, + "learning_rate": 0.00026827604262522, + "loss": 0.0195, "step": 81590 }, { - "epoch": 0.41, - "learning_rate": 0.00023824762500567574, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.0002682721544088485, + "loss": 0.0234, "step": 81600 }, { - "epoch": 0.41, - "learning_rate": 0.00023824005731266175, - "loss": 0.0149, + "epoch": 0.21, + "learning_rate": 0.0002682682661924771, + "loss": 0.0253, "step": 81610 }, { - "epoch": 0.41, - "learning_rate": 0.00023823248961964773, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.0002682643779761056, + "loss": 0.0239, "step": 81620 }, { - "epoch": 0.41, - "learning_rate": 0.0002382249219266337, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.0002682604897597341, + "loss": 0.0254, "step": 81630 }, { - "epoch": 0.41, - "learning_rate": 0.00023821735423361972, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.0002682566015433627, + "loss": 0.0237, "step": 81640 }, { - "epoch": 0.41, - "learning_rate": 0.0002382097865406057, - "loss": 0.0236, + "epoch": 0.21, + "learning_rate": 0.0002682527133269912, + "loss": 0.0226, "step": 81650 }, { - "epoch": 0.41, - "learning_rate": 0.00023820221884759168, - "loss": 0.0255, + "epoch": 0.21, + "learning_rate": 0.0002682488251106197, + "loss": 0.0201, "step": 81660 }, { - "epoch": 0.41, - "learning_rate": 0.00023819465115457766, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.0002682449368942483, + "loss": 0.0238, "step": 81670 }, { - "epoch": 0.41, - "learning_rate": 0.00023818708346156367, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.0002682410486778768, + "loss": 0.0276, "step": 81680 }, { - "epoch": 0.41, - "learning_rate": 0.00023817951576854965, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026823716046150536, + "loss": 0.0334, "step": 81690 }, { - "epoch": 0.41, - "learning_rate": 0.00023817194807553563, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026823327224513387, + "loss": 0.0405, "step": 81700 }, { - "epoch": 0.41, - "learning_rate": 0.00023816438038252164, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.0002682293840287624, + "loss": 0.053, "step": 81710 }, { - "epoch": 0.41, - "learning_rate": 0.00023815681268950762, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.00026822549581239095, + "loss": 0.0338, "step": 81720 }, { - "epoch": 0.41, - "learning_rate": 0.0002381492449964936, - "loss": 0.0171, + "epoch": 0.21, + "learning_rate": 0.00026822160759601947, + "loss": 0.0381, "step": 81730 }, { - "epoch": 0.41, - "learning_rate": 0.00023814167730347961, - "loss": 0.0189, + "epoch": 0.21, + "learning_rate": 0.000268217719379648, + "loss": 0.0248, "step": 81740 }, { - "epoch": 0.41, - "learning_rate": 0.0002381341096104656, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026821383116327655, + "loss": 0.0251, "step": 81750 }, { - "epoch": 0.41, - "learning_rate": 0.00023812654191745158, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.0002682099429469051, + "loss": 0.0318, "step": 81760 }, { - "epoch": 0.41, - "learning_rate": 0.00023811897422443759, - "loss": 0.0141, + "epoch": 0.21, + "learning_rate": 0.00026820605473053364, + "loss": 0.0243, "step": 81770 }, { - "epoch": 0.41, - "learning_rate": 0.00023811140653142357, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.00026820216651416215, + "loss": 0.0267, "step": 81780 }, { - "epoch": 0.41, - "learning_rate": 0.00023810383883840955, - "loss": 0.0135, + "epoch": 0.21, + "learning_rate": 0.00026819827829779066, + "loss": 0.0327, "step": 81790 }, { - "epoch": 0.41, - "learning_rate": 0.00023809627114539556, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.00026819439008141923, + "loss": 0.0303, "step": 81800 }, { - "epoch": 0.41, - "learning_rate": 0.00023808870345238154, - "loss": 0.0172, + "epoch": 0.21, + "learning_rate": 0.00026819050186504775, + "loss": 0.0281, "step": 81810 }, { - "epoch": 0.41, - "learning_rate": 0.00023808113575936752, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.0002681866136486763, + "loss": 0.0204, "step": 81820 }, { - "epoch": 0.41, - "learning_rate": 0.00023807356806635353, - "loss": 0.0211, + "epoch": 0.21, + "learning_rate": 0.00026818272543230483, + "loss": 0.0226, "step": 81830 }, { - "epoch": 0.41, - "learning_rate": 0.0002380660003733395, - "loss": 0.0167, + "epoch": 0.21, + "learning_rate": 0.0002681788372159334, + "loss": 0.0277, "step": 81840 }, { - "epoch": 0.41, - "learning_rate": 0.0002380584326803255, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.0002681749489995619, + "loss": 0.0238, "step": 81850 }, { - "epoch": 0.41, - "learning_rate": 0.00023805086498731147, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026817106078319043, + "loss": 0.0246, "step": 81860 }, { - "epoch": 0.41, - "learning_rate": 0.00023804329729429748, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.00026816717256681894, + "loss": 0.0247, "step": 81870 }, { - "epoch": 0.41, - "learning_rate": 0.00023803572960128346, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.0002681632843504475, + "loss": 0.0205, "step": 81880 }, { - "epoch": 0.41, - "learning_rate": 0.00023802816190826944, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.0002681593961340761, + "loss": 0.0256, "step": 81890 }, { - "epoch": 0.41, - "learning_rate": 0.00023802059421525545, - "loss": 0.0191, + "epoch": 0.21, + "learning_rate": 0.0002681555079177046, + "loss": 0.0251, "step": 81900 }, { - "epoch": 0.41, - "learning_rate": 0.00023801302652224143, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.0002681516197013331, + "loss": 0.0245, "step": 81910 }, { - "epoch": 0.41, - "learning_rate": 0.00023800545882922742, - "loss": 0.0177, + "epoch": 0.21, + "learning_rate": 0.0002681477314849616, + "loss": 0.0272, "step": 81920 }, { - "epoch": 0.41, - "learning_rate": 0.00023799789113621342, - "loss": 0.0173, + "epoch": 0.21, + "learning_rate": 0.0002681438432685902, + "loss": 0.0229, "step": 81930 }, { - "epoch": 0.41, - "learning_rate": 0.0002379903234431994, - "loss": 0.0204, + "epoch": 0.21, + "learning_rate": 0.0002681399550522187, + "loss": 0.0256, "step": 81940 }, { - "epoch": 0.41, - "learning_rate": 0.0002379827557501854, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.0002681360668358473, + "loss": 0.022, "step": 81950 }, { - "epoch": 0.41, - "learning_rate": 0.0002379751880571714, - "loss": 0.015, + "epoch": 0.21, + "learning_rate": 0.0002681321786194758, + "loss": 0.0225, "step": 81960 }, { - "epoch": 0.41, - "learning_rate": 0.00023796762036415738, - "loss": 0.0147, + "epoch": 0.21, + "learning_rate": 0.00026812829040310436, + "loss": 0.0209, "step": 81970 }, { - "epoch": 0.41, - "learning_rate": 0.00023796005267114336, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.0002681244021867329, + "loss": 0.0273, "step": 81980 }, { - "epoch": 0.41, - "learning_rate": 0.00023795248497812937, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.0002681205139703614, + "loss": 0.0267, "step": 81990 }, { - "epoch": 0.41, - "learning_rate": 0.00023794491728511535, - "loss": 0.0146, + "epoch": 0.21, + "learning_rate": 0.0002681166257539899, + "loss": 0.0225, "step": 82000 }, { - "epoch": 0.41, - "eval_cer": 0.9144935454101719, - "eval_loss": 0.012472189962863922, - "eval_runtime": 116.6656, - "eval_samples_per_second": 17.143, - "eval_steps_per_second": 4.286, + "epoch": 0.21, + "eval_cer": 0.8817264801510488, + "eval_loss": 0.017370792105793953, + "eval_runtime": 108.1353, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 4.624, "step": 82000 }, { - "epoch": 0.41, - "learning_rate": 0.00023793734959210133, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.00026811273753761847, + "loss": 0.0232, "step": 82010 }, { - "epoch": 0.41, - "learning_rate": 0.0002379297818990873, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.000268108849321247, + "loss": 0.0268, "step": 82020 }, { - "epoch": 0.41, - "learning_rate": 0.00023792221420607332, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026810496110487556, + "loss": 0.0222, "step": 82030 }, { - "epoch": 0.41, - "learning_rate": 0.0002379146465130593, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.00026810107288850407, + "loss": 0.0364, "step": 82040 }, { - "epoch": 0.41, - "learning_rate": 0.00023790707882004528, - "loss": 0.0302, + "epoch": 0.21, + "learning_rate": 0.00026809718467213264, + "loss": 0.0216, "step": 82050 }, { - "epoch": 0.41, - "learning_rate": 0.0002378995111270313, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.00026809329645576115, + "loss": 0.0272, "step": 82060 }, { - "epoch": 0.41, - "learning_rate": 0.00023789194343401727, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026808940823938967, + "loss": 0.0251, "step": 82070 }, { - "epoch": 0.41, - "learning_rate": 0.00023788437574100325, - "loss": 0.0202, + "epoch": 0.21, + "learning_rate": 0.0002680855200230182, + "loss": 0.0244, "step": 82080 }, { - "epoch": 0.41, - "learning_rate": 0.00023787680804798926, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.00026808163180664675, + "loss": 0.0249, "step": 82090 }, { - "epoch": 0.41, - "learning_rate": 0.00023786924035497524, - "loss": 0.023, + "epoch": 0.21, + "learning_rate": 0.0002680777435902753, + "loss": 0.024, "step": 82100 }, { - "epoch": 0.41, - "learning_rate": 0.00023786167266196123, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.00026807385537390383, + "loss": 0.0209, "step": 82110 }, { - "epoch": 0.41, - "learning_rate": 0.00023785410496894723, - "loss": 0.0151, + "epoch": 0.21, + "learning_rate": 0.00026806996715753235, + "loss": 0.0302, "step": 82120 }, { - "epoch": 0.41, - "learning_rate": 0.00023784653727593322, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.00026806607894116086, + "loss": 0.028, "step": 82130 }, { - "epoch": 0.41, - "learning_rate": 0.0002378389695829192, - "loss": 0.0253, + "epoch": 0.21, + "learning_rate": 0.00026806219072478943, + "loss": 0.0233, "step": 82140 }, { - "epoch": 0.41, - "learning_rate": 0.0002378314018899052, - "loss": 0.0196, + "epoch": 0.21, + "learning_rate": 0.00026805830250841795, + "loss": 0.0238, "step": 82150 }, { - "epoch": 0.41, - "learning_rate": 0.0002378238341968912, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.0002680544142920465, + "loss": 0.0252, "step": 82160 }, { - "epoch": 0.41, - "learning_rate": 0.00023781626650387717, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.00026805052607567503, + "loss": 0.0247, "step": 82170 }, { - "epoch": 0.41, - "learning_rate": 0.00023780869881086315, - "loss": 0.0148, + "epoch": 0.21, + "learning_rate": 0.0002680466378593036, + "loss": 0.0246, "step": 82180 }, { - "epoch": 0.41, - "learning_rate": 0.00023780113111784916, - "loss": 0.0206, + "epoch": 0.21, + "learning_rate": 0.0002680427496429321, + "loss": 0.0252, "step": 82190 }, { - "epoch": 0.41, - "learning_rate": 0.00023779356342483514, - "loss": 0.0171, + "epoch": 0.21, + "learning_rate": 0.00026803886142656063, + "loss": 0.0223, "step": 82200 }, { - "epoch": 0.41, - "learning_rate": 0.00023778599573182112, - "loss": 0.0161, + "epoch": 0.21, + "learning_rate": 0.00026803497321018914, + "loss": 0.0213, "step": 82210 }, { - "epoch": 0.41, - "learning_rate": 0.00023777842803880713, - "loss": 0.0177, + "epoch": 0.21, + "learning_rate": 0.0002680310849938177, + "loss": 0.0224, "step": 82220 }, { - "epoch": 0.41, - "learning_rate": 0.0002377708603457931, - "loss": 0.0166, + "epoch": 0.21, + "learning_rate": 0.0002680271967774462, + "loss": 0.0222, "step": 82230 }, { - "epoch": 0.41, - "learning_rate": 0.0002377632926527791, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.0002680233085610748, + "loss": 0.0258, "step": 82240 }, { - "epoch": 0.41, - "learning_rate": 0.0002377557249597651, - "loss": 0.0222, + "epoch": 0.21, + "learning_rate": 0.0002680194203447033, + "loss": 0.0231, "step": 82250 }, { - "epoch": 0.42, - "learning_rate": 0.00023774815726675108, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.0002680155321283319, + "loss": 0.0266, "step": 82260 }, { - "epoch": 0.42, - "learning_rate": 0.00023774058957373706, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.0002680116439119604, + "loss": 0.0216, "step": 82270 }, { - "epoch": 0.42, - "learning_rate": 0.00023773302188072307, - "loss": 0.0222, + "epoch": 0.21, + "learning_rate": 0.0002680077556955889, + "loss": 0.024, "step": 82280 }, { - "epoch": 0.42, - "learning_rate": 0.00023772545418770905, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002680038674792175, + "loss": 0.0274, "step": 82290 }, { - "epoch": 0.42, - "learning_rate": 0.00023771788649469504, - "loss": 0.0132, + "epoch": 0.21, + "learning_rate": 0.000267999979262846, + "loss": 0.0234, "step": 82300 }, { - "epoch": 0.42, - "learning_rate": 0.00023771031880168104, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026799609104647456, + "loss": 0.0218, "step": 82310 }, { - "epoch": 0.42, - "learning_rate": 0.00023770275110866703, - "loss": 0.0154, + "epoch": 0.21, + "learning_rate": 0.0002679922028301031, + "loss": 0.0206, "step": 82320 }, { - "epoch": 0.42, - "learning_rate": 0.00023769518341565298, - "loss": 0.0219, + "epoch": 0.21, + "learning_rate": 0.0002679883146137316, + "loss": 0.0179, "step": 82330 }, { - "epoch": 0.42, - "learning_rate": 0.00023768761572263896, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.00026798442639736016, + "loss": 0.0233, "step": 82340 }, { - "epoch": 0.42, - "learning_rate": 0.00023768004802962497, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026798053818098867, + "loss": 0.0247, "step": 82350 }, { - "epoch": 0.42, - "learning_rate": 0.00023767248033661095, - "loss": 0.0175, + "epoch": 0.21, + "learning_rate": 0.0002679766499646172, + "loss": 0.0311, "step": 82360 }, { - "epoch": 0.42, - "learning_rate": 0.00023766491264359693, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.00026797276174824575, + "loss": 0.0234, "step": 82370 }, { - "epoch": 0.42, - "learning_rate": 0.00023765734495058294, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.00026796887353187427, + "loss": 0.0249, "step": 82380 }, { - "epoch": 0.42, - "learning_rate": 0.00023764977725756892, - "loss": 0.0176, + "epoch": 0.21, + "learning_rate": 0.00026796498531550284, + "loss": 0.0234, "step": 82390 }, { - "epoch": 0.42, - "learning_rate": 0.0002376422095645549, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.00026796109709913135, + "loss": 0.026, "step": 82400 }, { - "epoch": 0.42, - "learning_rate": 0.00023763464187154089, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026795720888275987, + "loss": 0.0307, "step": 82410 }, { - "epoch": 0.42, - "learning_rate": 0.0002376270741785269, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002679533206663884, + "loss": 0.029, "step": 82420 }, { - "epoch": 0.42, - "learning_rate": 0.00023761950648551288, - "loss": 0.0212, + "epoch": 0.21, + "learning_rate": 0.00026794943245001695, + "loss": 0.0259, "step": 82430 }, { - "epoch": 0.42, - "learning_rate": 0.00023761193879249886, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002679455442336455, + "loss": 0.0244, "step": 82440 }, { - "epoch": 0.42, - "learning_rate": 0.00023760437109948487, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.00026794165601727403, + "loss": 0.0216, "step": 82450 }, { - "epoch": 0.42, - "learning_rate": 0.00023759680340647085, - "loss": 0.0241, + "epoch": 0.21, + "learning_rate": 0.00026793776780090255, + "loss": 0.0268, "step": 82460 }, { - "epoch": 0.42, - "learning_rate": 0.00023758923571345683, - "loss": 0.0181, + "epoch": 0.21, + "learning_rate": 0.0002679338795845311, + "loss": 0.0214, "step": 82470 }, { - "epoch": 0.42, - "learning_rate": 0.00023758166802044284, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.00026792999136815963, + "loss": 0.021, "step": 82480 }, { - "epoch": 0.42, - "learning_rate": 0.00023757410032742882, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.00026792610315178815, + "loss": 0.0217, "step": 82490 }, { - "epoch": 0.42, - "learning_rate": 0.0002375665326344148, - "loss": 0.0213, + "epoch": 0.21, + "learning_rate": 0.0002679222149354167, + "loss": 0.0223, "step": 82500 }, { - "epoch": 0.42, - "learning_rate": 0.0002375589649414008, - "loss": 0.02, + "epoch": 0.21, + "learning_rate": 0.00026791832671904523, + "loss": 0.0261, "step": 82510 }, { - "epoch": 0.42, - "learning_rate": 0.0002375513972483868, - "loss": 0.0183, + "epoch": 0.21, + "learning_rate": 0.0002679144385026738, + "loss": 0.023, "step": 82520 }, { - "epoch": 0.42, - "learning_rate": 0.00023754382955537277, - "loss": 0.022, + "epoch": 0.21, + "learning_rate": 0.0002679105502863023, + "loss": 0.0281, "step": 82530 }, { - "epoch": 0.42, - "learning_rate": 0.00023753626186235878, - "loss": 0.0179, + "epoch": 0.21, + "learning_rate": 0.0002679066620699308, + "loss": 0.0275, "step": 82540 }, { - "epoch": 0.42, - "learning_rate": 0.00023752869416934476, - "loss": 0.0168, + "epoch": 0.21, + "learning_rate": 0.0002679027738535594, + "loss": 0.0303, "step": 82550 }, { - "epoch": 0.42, - "learning_rate": 0.00023752112647633074, - "loss": 0.0143, + "epoch": 0.21, + "learning_rate": 0.0002678988856371879, + "loss": 0.0251, "step": 82560 }, { - "epoch": 0.42, - "learning_rate": 0.00023751355878331672, - "loss": 0.0146, + "epoch": 0.21, + "learning_rate": 0.0002678949974208164, + "loss": 0.0245, "step": 82570 }, { - "epoch": 0.42, - "learning_rate": 0.00023750599109030273, - "loss": 0.0178, + "epoch": 0.21, + "learning_rate": 0.000267891109204445, + "loss": 0.0239, "step": 82580 }, { - "epoch": 0.42, - "learning_rate": 0.00023749842339728871, - "loss": 0.0188, + "epoch": 0.21, + "learning_rate": 0.00026788722098807356, + "loss": 0.0248, "step": 82590 }, { - "epoch": 0.42, - "learning_rate": 0.0002374908557042747, - "loss": 0.0206, + "epoch": 0.21, + "learning_rate": 0.0002678833327717021, + "loss": 0.0245, "step": 82600 }, { - "epoch": 0.42, - "learning_rate": 0.0002374832880112607, - "loss": 0.0159, + "epoch": 0.21, + "learning_rate": 0.0002678794445553306, + "loss": 0.025, "step": 82610 }, { - "epoch": 0.42, - "learning_rate": 0.00023747572031824669, - "loss": 0.014, + "epoch": 0.21, + "learning_rate": 0.0002678755563389591, + "loss": 0.025, "step": 82620 }, { - "epoch": 0.42, - "learning_rate": 0.00023746815262523267, - "loss": 0.016, + "epoch": 0.21, + "learning_rate": 0.0002678716681225876, + "loss": 0.0234, "step": 82630 }, { - "epoch": 0.42, - "learning_rate": 0.00023746058493221868, - "loss": 0.0213, + "epoch": 0.21, + "learning_rate": 0.0002678677799062162, + "loss": 0.0258, "step": 82640 }, { - "epoch": 0.42, - "learning_rate": 0.00023745301723920466, - "loss": 0.0156, + "epoch": 0.21, + "learning_rate": 0.00026786389168984476, + "loss": 0.0279, "step": 82650 }, { - "epoch": 0.42, - "learning_rate": 0.00023744544954619064, - "loss": 0.0224, + "epoch": 0.21, + "learning_rate": 0.00026786000347347327, + "loss": 0.0216, "step": 82660 }, { - "epoch": 0.42, - "learning_rate": 0.00023743788185317665, - "loss": 0.0151, + "epoch": 0.21, + "learning_rate": 0.0002678561152571018, + "loss": 0.0217, "step": 82670 }, { - "epoch": 0.42, - "learning_rate": 0.00023743031416016263, - "loss": 0.0174, + "epoch": 0.21, + "learning_rate": 0.00026785222704073036, + "loss": 0.0248, "step": 82680 }, { - "epoch": 0.42, - "learning_rate": 0.0002374227464671486, - "loss": 0.0157, + "epoch": 0.21, + "learning_rate": 0.00026784833882435887, + "loss": 0.0234, "step": 82690 }, { - "epoch": 0.42, - "learning_rate": 0.00023741517877413462, - "loss": 0.0215, + "epoch": 0.21, + "learning_rate": 0.0002678444506079874, + "loss": 0.0258, "step": 82700 }, { - "epoch": 0.42, - "learning_rate": 0.0002374076110811206, - "loss": 0.0198, + "epoch": 0.21, + "learning_rate": 0.00026784056239161595, + "loss": 0.0237, "step": 82710 }, { - "epoch": 0.42, - "learning_rate": 0.00023740004338810658, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.00026783667417524447, + "loss": 0.0189, "step": 82720 }, { - "epoch": 0.42, - "learning_rate": 0.0002373924756950926, - "loss": 0.0185, + "epoch": 0.21, + "learning_rate": 0.00026783278595887304, + "loss": 0.024, "step": 82730 }, { - "epoch": 0.42, - "learning_rate": 0.00023738490800207857, - "loss": 0.0238, + "epoch": 0.21, + "learning_rate": 0.00026782889774250155, + "loss": 0.0214, "step": 82740 }, { - "epoch": 0.42, - "learning_rate": 0.00023737734030906455, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.00026782500952613007, + "loss": 0.0244, "step": 82750 }, { - "epoch": 0.42, - "learning_rate": 0.00023736977261605053, - "loss": 0.0216, + "epoch": 0.21, + "learning_rate": 0.00026782112130975863, + "loss": 0.0249, "step": 82760 }, { - "epoch": 0.42, - "learning_rate": 0.00023736220492303654, - "loss": 0.0214, + "epoch": 0.21, + "learning_rate": 0.00026781723309338715, + "loss": 0.0243, "step": 82770 }, { - "epoch": 0.42, - "learning_rate": 0.00023735463723002252, - "loss": 0.0169, + "epoch": 0.21, + "learning_rate": 0.00026781334487701566, + "loss": 0.022, "step": 82780 }, { - "epoch": 0.42, - "learning_rate": 0.0002373470695370085, - "loss": 0.0182, + "epoch": 0.21, + "learning_rate": 0.00026780945666064423, + "loss": 0.0192, "step": 82790 }, { - "epoch": 0.42, - "learning_rate": 0.00023733950184399451, - "loss": 0.017, + "epoch": 0.21, + "learning_rate": 0.0002678055684442728, + "loss": 0.0182, "step": 82800 }, { - "epoch": 0.42, - "learning_rate": 0.0002373319341509805, - "loss": 0.0162, + "epoch": 0.21, + "learning_rate": 0.0002678016802279013, + "loss": 0.0244, "step": 82810 }, { - "epoch": 0.42, - "learning_rate": 0.00023732436645796648, - "loss": 0.0156, + "epoch": 0.21, + "learning_rate": 0.00026779779201152983, + "loss": 0.0276, "step": 82820 }, { - "epoch": 0.42, - "learning_rate": 0.00023731679876495249, - "loss": 0.0242, + "epoch": 0.21, + "learning_rate": 0.00026779390379515834, + "loss": 0.0227, "step": 82830 }, { - "epoch": 0.42, - "learning_rate": 0.00023730923107193847, - "loss": 0.0193, + "epoch": 0.21, + "learning_rate": 0.0002677900155787869, + "loss": 0.0231, "step": 82840 }, { - "epoch": 0.42, - "learning_rate": 0.00023730166337892445, - "loss": 0.0184, + "epoch": 0.21, + "learning_rate": 0.00026778612736241543, + "loss": 0.023, "step": 82850 }, { - "epoch": 0.42, - "learning_rate": 0.00023729409568591046, - "loss": 0.019, + "epoch": 0.21, + "learning_rate": 0.000267782239146044, + "loss": 0.0219, "step": 82860 }, { - "epoch": 0.42, - "learning_rate": 0.00023728652799289644, - "loss": 0.018, + "epoch": 0.21, + "learning_rate": 0.0002677783509296725, + "loss": 0.0242, "step": 82870 }, { - "epoch": 0.42, - "learning_rate": 0.00023727896029988242, - "loss": 0.0199, + "epoch": 0.21, + "learning_rate": 0.000267774462713301, + "loss": 0.0256, "step": 82880 }, { - "epoch": 0.42, - "learning_rate": 0.00023727139260686843, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.0002677705744969296, + "loss": 0.0262, "step": 82890 }, { - "epoch": 0.42, - "learning_rate": 0.0002372638249138544, - "loss": 0.0187, + "epoch": 0.21, + "learning_rate": 0.0002677666862805581, + "loss": 0.0232, "step": 82900 }, { - "epoch": 0.42, - "learning_rate": 0.0002372562572208404, - "loss": 0.0158, + "epoch": 0.21, + "learning_rate": 0.0002677627980641866, + "loss": 0.0279, "step": 82910 }, { - "epoch": 0.42, - "learning_rate": 0.00023724868952782637, - "loss": 0.0192, + "epoch": 0.21, + "learning_rate": 0.0002677589098478152, + "loss": 0.0253, "step": 82920 }, { - "epoch": 0.42, - "learning_rate": 0.00023724112183481238, - "loss": 0.0194, + "epoch": 0.21, + "learning_rate": 0.0002677550216314437, + "loss": 0.0207, "step": 82930 }, { - "epoch": 0.42, - "learning_rate": 0.00023723355414179836, - "loss": 0.0164, + "epoch": 0.21, + "learning_rate": 0.0002677511334150723, + "loss": 0.0234, "step": 82940 }, { - "epoch": 0.42, - "learning_rate": 0.00023722598644878434, - "loss": 0.0245, + "epoch": 0.22, + "learning_rate": 0.0002677472451987008, + "loss": 0.0211, "step": 82950 }, { - "epoch": 0.42, - "learning_rate": 0.00023721841875577035, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.0002677433569823293, + "loss": 0.0269, "step": 82960 }, { - "epoch": 0.42, - "learning_rate": 0.00023721085106275633, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.0002677394687659579, + "loss": 0.0197, "step": 82970 }, { - "epoch": 0.42, - "learning_rate": 0.00023720328336974232, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002677355805495864, + "loss": 0.0216, "step": 82980 }, { - "epoch": 0.42, - "learning_rate": 0.00023719571567672832, - "loss": 0.0156, + "epoch": 0.22, + "learning_rate": 0.00026773169233321496, + "loss": 0.0202, "step": 82990 }, { - "epoch": 0.42, - "learning_rate": 0.0002371881479837143, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.00026772780411684347, + "loss": 0.0236, "step": 83000 }, { - "epoch": 0.42, - "eval_cer": 0.9144954862024227, - "eval_loss": 0.012444199062883854, - "eval_runtime": 116.798, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.22, + "eval_cer": 0.881797861634692, + "eval_loss": 0.017287341877818108, + "eval_runtime": 108.0739, + "eval_samples_per_second": 18.506, + "eval_steps_per_second": 4.626, "step": 83000 }, { - "epoch": 0.42, - "learning_rate": 0.0002371805802907003, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.00026772391590047204, + "loss": 0.0273, "step": 83010 }, { - "epoch": 0.42, - "learning_rate": 0.0002371730125976863, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.00026772002768410055, + "loss": 0.0227, "step": 83020 }, { - "epoch": 0.42, - "learning_rate": 0.00023716544490467228, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026771613946772907, + "loss": 0.0252, "step": 83030 }, { - "epoch": 0.42, - "learning_rate": 0.00023715787721165826, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.0002677122512513576, + "loss": 0.0159, "step": 83040 }, { - "epoch": 0.42, - "learning_rate": 0.00023715030951864427, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026770836303498615, + "loss": 0.0257, "step": 83050 }, { - "epoch": 0.42, - "learning_rate": 0.00023714274182563025, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.00026770447481861467, + "loss": 0.0197, "step": 83060 }, { - "epoch": 0.42, - "learning_rate": 0.00023713517413261623, - "loss": 0.0178, + "epoch": 0.22, + "learning_rate": 0.00026770058660224324, + "loss": 0.0199, "step": 83070 }, { - "epoch": 0.42, - "learning_rate": 0.0002371276064396022, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.00026769669838587175, + "loss": 0.0243, "step": 83080 }, { - "epoch": 0.42, - "learning_rate": 0.00023712003874658822, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002676928101695003, + "loss": 0.0239, "step": 83090 }, { - "epoch": 0.42, - "learning_rate": 0.0002371124710535742, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026768892195312883, + "loss": 0.0248, "step": 83100 }, { - "epoch": 0.42, - "learning_rate": 0.00023710490336056018, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.00026768503373675735, + "loss": 0.0243, "step": 83110 }, { - "epoch": 0.42, - "learning_rate": 0.0002370973356675462, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.00026768114552038586, + "loss": 0.0253, "step": 83120 }, { - "epoch": 0.42, - "learning_rate": 0.00023708976797453217, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026767725730401443, + "loss": 0.0228, "step": 83130 }, { - "epoch": 0.42, - "learning_rate": 0.00023708220028151815, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.000267673369087643, + "loss": 0.023, "step": 83140 }, { - "epoch": 0.42, - "learning_rate": 0.00023707463258850416, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002676694808712715, + "loss": 0.0217, "step": 83150 }, { - "epoch": 0.42, - "learning_rate": 0.00023706706489549014, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.00026766559265490003, + "loss": 0.025, "step": 83160 }, { - "epoch": 0.42, - "learning_rate": 0.00023705949720247613, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.00026766170443852854, + "loss": 0.024, "step": 83170 }, { - "epoch": 0.42, - "learning_rate": 0.00023705192950946213, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002676578162221571, + "loss": 0.0237, "step": 83180 }, { - "epoch": 0.42, - "learning_rate": 0.00023704436181644812, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.0002676539280057856, + "loss": 0.0236, "step": 83190 }, { - "epoch": 0.42, - "learning_rate": 0.0002370367941234341, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002676500397894142, + "loss": 0.0214, "step": 83200 }, { - "epoch": 0.42, - "learning_rate": 0.0002370292264304201, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002676461515730427, + "loss": 0.0226, "step": 83210 }, { - "epoch": 0.42, - "learning_rate": 0.0002370216587374061, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.0002676422633566713, + "loss": 0.0259, "step": 83220 }, { - "epoch": 0.42, - "learning_rate": 0.00023701409104439207, - "loss": 0.0147, + "epoch": 0.22, + "learning_rate": 0.0002676383751402998, + "loss": 0.0232, "step": 83230 }, { - "epoch": 0.42, - "learning_rate": 0.00023700652335137808, - "loss": 0.0153, + "epoch": 0.22, + "learning_rate": 0.0002676344869239283, + "loss": 0.0196, "step": 83240 }, { - "epoch": 0.42, - "learning_rate": 0.00023699895565836406, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.0002676305987075568, + "loss": 0.0255, "step": 83250 }, { - "epoch": 0.42, - "learning_rate": 0.00023699138796535004, - "loss": 0.0157, + "epoch": 0.22, + "learning_rate": 0.0002676267104911854, + "loss": 0.0233, "step": 83260 }, { - "epoch": 0.42, - "learning_rate": 0.00023698382027233602, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.0002676228222748139, + "loss": 0.0232, "step": 83270 }, { - "epoch": 0.42, - "learning_rate": 0.00023697625257932203, - "loss": 0.0229, + "epoch": 0.22, + "learning_rate": 0.0002676189340584425, + "loss": 0.0239, "step": 83280 }, { - "epoch": 0.42, - "learning_rate": 0.000236968684886308, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.000267615045842071, + "loss": 0.0239, "step": 83290 }, { - "epoch": 0.42, - "learning_rate": 0.000236961117193294, - "loss": 0.0156, + "epoch": 0.22, + "learning_rate": 0.00026761115762569956, + "loss": 0.0247, "step": 83300 }, { - "epoch": 0.42, - "learning_rate": 0.00023695354950028, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.00026760726940932807, + "loss": 0.0216, "step": 83310 }, { - "epoch": 0.42, - "learning_rate": 0.00023694598180726598, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002676033811929566, + "loss": 0.032, "step": 83320 }, { - "epoch": 0.42, - "learning_rate": 0.00023693841411425196, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.0002675994929765851, + "loss": 0.0268, "step": 83330 }, { - "epoch": 0.42, - "learning_rate": 0.00023693084642123797, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026759560476021367, + "loss": 0.0257, "step": 83340 }, { - "epoch": 0.42, - "learning_rate": 0.00023692327872822395, - "loss": 0.0136, + "epoch": 0.22, + "learning_rate": 0.00026759171654384224, + "loss": 0.027, "step": 83350 }, { - "epoch": 0.42, - "learning_rate": 0.00023691571103520994, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026758782832747075, + "loss": 0.019, "step": 83360 }, { - "epoch": 0.42, - "learning_rate": 0.00023690814334219594, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.00026758394011109927, + "loss": 0.0247, "step": 83370 }, { - "epoch": 0.42, - "learning_rate": 0.00023690057564918193, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002675800518947278, + "loss": 0.0209, "step": 83380 }, { - "epoch": 0.42, - "learning_rate": 0.0002368930079561679, - "loss": 0.0157, + "epoch": 0.22, + "learning_rate": 0.00026757616367835635, + "loss": 0.0182, "step": 83390 }, { - "epoch": 0.42, - "learning_rate": 0.00023688544026315392, - "loss": 0.0207, + "epoch": 0.22, + "learning_rate": 0.00026757227546198487, + "loss": 0.0215, "step": 83400 }, { - "epoch": 0.42, - "learning_rate": 0.0002368778725701399, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.00026756838724561343, + "loss": 0.0241, "step": 83410 }, { - "epoch": 0.42, - "learning_rate": 0.00023687030487712588, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.00026756449902924195, + "loss": 0.02, "step": 83420 }, { - "epoch": 0.42, - "learning_rate": 0.00023686273718411186, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002675606108128705, + "loss": 0.0284, "step": 83430 }, { - "epoch": 0.42, - "learning_rate": 0.00023685516949109787, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.00026755672259649903, + "loss": 0.021, "step": 83440 }, { - "epoch": 0.42, - "learning_rate": 0.00023684760179808385, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.00026755283438012755, + "loss": 0.021, "step": 83450 }, { - "epoch": 0.42, - "learning_rate": 0.00023684003410506983, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.00026754894616375606, + "loss": 0.0297, "step": 83460 }, { - "epoch": 0.42, - "learning_rate": 0.00023683246641205584, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.00026754505794738463, + "loss": 0.0278, "step": 83470 }, { - "epoch": 0.42, - "learning_rate": 0.00023682489871904182, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002675411697310132, + "loss": 0.0225, "step": 83480 }, { - "epoch": 0.42, - "learning_rate": 0.0002368173310260278, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002675372815146417, + "loss": 0.0237, "step": 83490 }, { - "epoch": 0.42, - "learning_rate": 0.0002368097633330138, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.00026753339329827023, + "loss": 0.0244, "step": 83500 }, { - "epoch": 0.42, - "learning_rate": 0.0002368021956399998, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.0002675295050818988, + "loss": 0.0223, "step": 83510 }, { - "epoch": 0.42, - "learning_rate": 0.00023679462794698577, - "loss": 0.0145, + "epoch": 0.22, + "learning_rate": 0.0002675256168655273, + "loss": 0.0288, "step": 83520 }, { - "epoch": 0.42, - "learning_rate": 0.00023678706025397178, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002675217286491558, + "loss": 0.0206, "step": 83530 }, { - "epoch": 0.42, - "learning_rate": 0.00023677949256095776, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002675178404327844, + "loss": 0.0254, "step": 83540 }, { - "epoch": 0.42, - "learning_rate": 0.00023677192486794375, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.0002675139522164129, + "loss": 0.0242, "step": 83550 }, { - "epoch": 0.42, - "learning_rate": 0.00023676435717492975, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.0002675100640000415, + "loss": 0.0279, "step": 83560 }, { - "epoch": 0.42, - "learning_rate": 0.00023675678948191574, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026750617578367, + "loss": 0.023, "step": 83570 }, { - "epoch": 0.42, - "learning_rate": 0.00023674922178890172, - "loss": 0.022, + "epoch": 0.22, + "learning_rate": 0.0002675022875672985, + "loss": 0.0221, "step": 83580 }, { - "epoch": 0.42, - "learning_rate": 0.00023674165409588767, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002674983993509271, + "loss": 0.0229, "step": 83590 }, { - "epoch": 0.42, - "learning_rate": 0.00023673408640287368, - "loss": 0.035, + "epoch": 0.22, + "learning_rate": 0.0002674945111345556, + "loss": 0.0234, "step": 83600 }, { - "epoch": 0.42, - "learning_rate": 0.00023672651870985966, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.0002674906229181841, + "loss": 0.021, "step": 83610 }, { - "epoch": 0.42, - "learning_rate": 0.00023671895101684564, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002674867347018127, + "loss": 0.0223, "step": 83620 }, { - "epoch": 0.42, - "learning_rate": 0.00023671138332383165, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.0002674828464854412, + "loss": 0.0217, "step": 83630 }, { - "epoch": 0.42, - "learning_rate": 0.00023670381563081763, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026747895826906976, + "loss": 0.0206, "step": 83640 }, { - "epoch": 0.42, - "learning_rate": 0.00023669624793780361, - "loss": 0.0148, + "epoch": 0.22, + "learning_rate": 0.00026747507005269827, + "loss": 0.0212, "step": 83650 }, { - "epoch": 0.42, - "learning_rate": 0.0002366886802447896, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.0002674711818363268, + "loss": 0.0233, "step": 83660 }, { - "epoch": 0.42, - "learning_rate": 0.0002366811125517756, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.0002674672936199553, + "loss": 0.0218, "step": 83670 }, { - "epoch": 0.42, - "learning_rate": 0.00023667354485876159, - "loss": 0.0138, + "epoch": 0.22, + "learning_rate": 0.00026746340540358387, + "loss": 0.017, "step": 83680 }, { - "epoch": 0.42, - "learning_rate": 0.00023666597716574757, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026745951718721244, + "loss": 0.0264, "step": 83690 }, { - "epoch": 0.42, - "learning_rate": 0.00023665840947273358, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026745562897084095, + "loss": 0.0213, "step": 83700 }, { - "epoch": 0.42, - "learning_rate": 0.00023665084177971956, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.00026745174075446947, + "loss": 0.0224, "step": 83710 }, { - "epoch": 0.42, - "learning_rate": 0.00023664327408670554, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.00026744785253809804, + "loss": 0.022, "step": 83720 }, { - "epoch": 0.42, - "learning_rate": 0.00023663570639369155, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026744396432172655, + "loss": 0.0255, "step": 83730 }, { - "epoch": 0.42, - "learning_rate": 0.00023662813870067753, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.00026744007610535506, + "loss": 0.0242, "step": 83740 }, { - "epoch": 0.42, - "learning_rate": 0.0002366205710076635, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026743618788898363, + "loss": 0.024, "step": 83750 }, { - "epoch": 0.42, - "learning_rate": 0.00023661300331464952, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026743229967261215, + "loss": 0.0228, "step": 83760 }, { - "epoch": 0.42, - "learning_rate": 0.0002366054356216355, - "loss": 0.0223, + "epoch": 0.22, + "learning_rate": 0.0002674284114562407, + "loss": 0.0167, "step": 83770 }, { - "epoch": 0.42, - "learning_rate": 0.00023659786792862148, - "loss": 0.0146, + "epoch": 0.22, + "learning_rate": 0.00026742452323986923, + "loss": 0.0229, "step": 83780 }, { - "epoch": 0.42, - "learning_rate": 0.0002365903002356075, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.00026742063502349775, + "loss": 0.0249, "step": 83790 }, { - "epoch": 0.42, - "learning_rate": 0.00023658273254259347, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.0002674167468071263, + "loss": 0.0289, "step": 83800 }, { - "epoch": 0.42, - "learning_rate": 0.00023657516484957945, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.00026741285859075483, + "loss": 0.0249, "step": 83810 }, { - "epoch": 0.42, - "learning_rate": 0.00023656759715656543, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026740897037438334, + "loss": 0.0228, "step": 83820 }, { - "epoch": 0.42, - "learning_rate": 0.00023656002946355144, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.0002674050821580119, + "loss": 0.0296, "step": 83830 }, { - "epoch": 0.42, - "learning_rate": 0.00023655246177053742, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002674011939416405, + "loss": 0.0269, "step": 83840 }, { - "epoch": 0.42, - "learning_rate": 0.0002365448940775234, - "loss": 0.0143, + "epoch": 0.22, + "learning_rate": 0.000267397305725269, + "loss": 0.0248, "step": 83850 }, { - "epoch": 0.42, - "learning_rate": 0.00023653732638450941, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002673934175088975, + "loss": 0.0205, "step": 83860 }, { - "epoch": 0.42, - "learning_rate": 0.0002365297586914954, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.000267389529292526, + "loss": 0.023, "step": 83870 }, { - "epoch": 0.42, - "learning_rate": 0.00023652219099848138, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.0002673856410761546, + "loss": 0.0248, "step": 83880 }, { - "epoch": 0.42, - "learning_rate": 0.00023651462330546739, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.0002673817528597831, + "loss": 0.0212, "step": 83890 }, { - "epoch": 0.42, - "learning_rate": 0.00023650705561245337, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.0002673778646434117, + "loss": 0.0241, "step": 83900 }, { - "epoch": 0.42, - "learning_rate": 0.00023649948791943935, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002673739764270402, + "loss": 0.0207, "step": 83910 }, { - "epoch": 0.42, - "learning_rate": 0.00023649192022642536, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.0002673700882106687, + "loss": 0.0293, "step": 83920 }, { - "epoch": 0.42, - "learning_rate": 0.00023648435253341134, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.0002673661999942973, + "loss": 0.0247, "step": 83930 }, { - "epoch": 0.42, - "learning_rate": 0.00023647678484039732, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.0002673623117779258, + "loss": 0.0251, "step": 83940 }, { - "epoch": 0.42, - "learning_rate": 0.00023646921714738333, - "loss": 0.0219, + "epoch": 0.22, + "learning_rate": 0.0002673584235615543, + "loss": 0.0196, "step": 83950 }, { - "epoch": 0.42, - "learning_rate": 0.0002364616494543693, - "loss": 0.0189, + "epoch": 0.22, + "learning_rate": 0.00026735453534518287, + "loss": 0.0231, "step": 83960 }, { - "epoch": 0.42, - "learning_rate": 0.0002364540817613553, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.0002673506471288114, + "loss": 0.0242, "step": 83970 }, { - "epoch": 0.42, - "learning_rate": 0.00023644651406834127, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.00026734675891243996, + "loss": 0.0296, "step": 83980 }, { - "epoch": 0.42, - "learning_rate": 0.00023643894637532728, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.00026734287069606847, + "loss": 0.0224, "step": 83990 }, { - "epoch": 0.42, - "learning_rate": 0.00023643137868231326, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.000267338982479697, + "loss": 0.0256, "step": 84000 }, { - "epoch": 0.42, - "eval_cer": 0.9144935454101719, - "eval_loss": 0.012893411330878735, - "eval_runtime": 116.7828, - "eval_samples_per_second": 17.126, - "eval_steps_per_second": 4.281, + "epoch": 0.22, + "eval_cer": 0.8817796663545476, + "eval_loss": 0.017041249200701714, + "eval_runtime": 108.2013, + "eval_samples_per_second": 18.484, + "eval_steps_per_second": 4.621, "step": 84000 }, { - "epoch": 0.42, - "learning_rate": 0.00023642381098929924, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026733509426332555, + "loss": 0.0181, "step": 84010 }, { - "epoch": 0.42, - "learning_rate": 0.00023641624329628525, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026733120604695407, + "loss": 0.0207, "step": 84020 }, { - "epoch": 0.42, - "learning_rate": 0.00023640867560327123, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026732731783058264, + "loss": 0.0231, "step": 84030 }, { - "epoch": 0.42, - "learning_rate": 0.00023640110791025722, - "loss": 0.0153, + "epoch": 0.22, + "learning_rate": 0.00026732342961421115, + "loss": 0.0226, "step": 84040 }, { - "epoch": 0.42, - "learning_rate": 0.00023639354021724322, - "loss": 0.0116, + "epoch": 0.22, + "learning_rate": 0.0002673195413978397, + "loss": 0.0216, "step": 84050 }, { - "epoch": 0.42, - "learning_rate": 0.0002363859725242292, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026731565318146823, + "loss": 0.0223, "step": 84060 }, { - "epoch": 0.42, - "learning_rate": 0.0002363784048312152, - "loss": 0.0144, + "epoch": 0.22, + "learning_rate": 0.00026731176496509675, + "loss": 0.0222, "step": 84070 }, { - "epoch": 0.42, - "learning_rate": 0.0002363708371382012, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026730787674872526, + "loss": 0.0187, "step": 84080 }, { - "epoch": 0.42, - "learning_rate": 0.00023636326944518718, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026730398853235383, + "loss": 0.0238, "step": 84090 }, { - "epoch": 0.42, - "learning_rate": 0.00023635570175217316, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026730010031598235, + "loss": 0.0211, "step": 84100 }, { - "epoch": 0.42, - "learning_rate": 0.00023634813405915917, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.0002672962120996109, + "loss": 0.0271, "step": 84110 }, { - "epoch": 0.42, - "learning_rate": 0.00023634056636614515, - "loss": 0.0232, + "epoch": 0.22, + "learning_rate": 0.00026729232388323943, + "loss": 0.0261, "step": 84120 }, { - "epoch": 0.42, - "learning_rate": 0.00023633299867313113, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.00026728843566686794, + "loss": 0.0178, "step": 84130 }, { - "epoch": 0.42, - "learning_rate": 0.00023632543098011714, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002672845474504965, + "loss": 0.0259, "step": 84140 }, { - "epoch": 0.42, - "learning_rate": 0.00023631786328710312, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026728065923412503, + "loss": 0.0198, "step": 84150 }, { - "epoch": 0.42, - "learning_rate": 0.0002363102955940891, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.00026727677101775354, + "loss": 0.0205, "step": 84160 }, { - "epoch": 0.42, - "learning_rate": 0.00023630272790107508, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.0002672728828013821, + "loss": 0.0233, "step": 84170 }, { - "epoch": 0.42, - "learning_rate": 0.0002362951602080611, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.0002672689945850107, + "loss": 0.0219, "step": 84180 }, { - "epoch": 0.42, - "learning_rate": 0.00023628759251504707, - "loss": 0.015, + "epoch": 0.22, + "learning_rate": 0.0002672651063686392, + "loss": 0.0272, "step": 84190 }, { - "epoch": 0.42, - "learning_rate": 0.00023628002482203305, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.0002672612181522677, + "loss": 0.0217, "step": 84200 }, { - "epoch": 0.42, - "learning_rate": 0.00023627245712901906, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.0002672573299358962, + "loss": 0.0192, "step": 84210 }, { - "epoch": 0.42, - "learning_rate": 0.00023626488943600504, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.0002672534417195248, + "loss": 0.0277, "step": 84220 }, { - "epoch": 0.42, - "learning_rate": 0.00023625732174299103, - "loss": 0.0144, + "epoch": 0.22, + "learning_rate": 0.0002672495535031533, + "loss": 0.0225, "step": 84230 }, { - "epoch": 0.42, - "learning_rate": 0.00023624975404997703, - "loss": 0.0189, + "epoch": 0.22, + "learning_rate": 0.0002672456652867819, + "loss": 0.0214, "step": 84240 }, { - "epoch": 0.43, - "learning_rate": 0.00023624218635696302, - "loss": 0.0212, + "epoch": 0.22, + "learning_rate": 0.0002672417770704104, + "loss": 0.0306, "step": 84250 }, { - "epoch": 0.43, - "learning_rate": 0.000236234618663949, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.00026723788885403896, + "loss": 0.0198, "step": 84260 }, { - "epoch": 0.43, - "learning_rate": 0.000236227050970935, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.0002672340006376675, + "loss": 0.0214, "step": 84270 }, { - "epoch": 0.43, - "learning_rate": 0.000236219483277921, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.000267230112421296, + "loss": 0.0236, "step": 84280 }, { - "epoch": 0.43, - "learning_rate": 0.00023621191558490697, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002672262242049245, + "loss": 0.023, "step": 84290 }, { - "epoch": 0.43, - "learning_rate": 0.00023620434789189298, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.00026722233598855307, + "loss": 0.021, "step": 84300 }, { - "epoch": 0.43, - "learning_rate": 0.00023619678019887896, - "loss": 0.0189, + "epoch": 0.22, + "learning_rate": 0.0002672184477721816, + "loss": 0.0321, "step": 84310 }, { - "epoch": 0.43, - "learning_rate": 0.00023618921250586494, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026721455955581015, + "loss": 0.0218, "step": 84320 }, { - "epoch": 0.43, - "learning_rate": 0.00023618164481285092, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.00026721067133943867, + "loss": 0.0262, "step": 84330 }, { - "epoch": 0.43, - "learning_rate": 0.00023617407711983693, - "loss": 0.0146, + "epoch": 0.22, + "learning_rate": 0.00026720678312306724, + "loss": 0.0248, "step": 84340 }, { - "epoch": 0.43, - "learning_rate": 0.0002361665094268229, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.00026720289490669575, + "loss": 0.0222, "step": 84350 }, { - "epoch": 0.43, - "learning_rate": 0.0002361589417338089, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.00026719900669032427, + "loss": 0.0263, "step": 84360 }, { - "epoch": 0.43, - "learning_rate": 0.0002361513740407949, - "loss": 0.0148, + "epoch": 0.22, + "learning_rate": 0.0002671951184739528, + "loss": 0.0282, "step": 84370 }, { - "epoch": 0.43, - "learning_rate": 0.00023614380634778088, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026719123025758135, + "loss": 0.0238, "step": 84380 }, { - "epoch": 0.43, - "learning_rate": 0.00023613623865476686, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.0002671873420412099, + "loss": 0.0216, "step": 84390 }, { - "epoch": 0.43, - "learning_rate": 0.00023612867096175287, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026718345382483843, + "loss": 0.0263, "step": 84400 }, { - "epoch": 0.43, - "learning_rate": 0.00023612110326873885, - "loss": 0.0207, + "epoch": 0.22, + "learning_rate": 0.00026717956560846695, + "loss": 0.0235, "step": 84410 }, { - "epoch": 0.43, - "learning_rate": 0.00023611353557572484, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.00026717567739209546, + "loss": 0.0241, "step": 84420 }, { - "epoch": 0.43, - "learning_rate": 0.00023610596788271084, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.00026717178917572403, + "loss": 0.0208, "step": 84430 }, { - "epoch": 0.43, - "learning_rate": 0.00023609840018969683, - "loss": 0.0189, + "epoch": 0.22, + "learning_rate": 0.00026716790095935255, + "loss": 0.0195, "step": 84440 }, { - "epoch": 0.43, - "learning_rate": 0.0002360908324966828, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002671640127429811, + "loss": 0.0238, "step": 84450 }, { - "epoch": 0.43, - "learning_rate": 0.00023608326480366882, - "loss": 0.021, + "epoch": 0.22, + "learning_rate": 0.00026716012452660963, + "loss": 0.0274, "step": 84460 }, { - "epoch": 0.43, - "learning_rate": 0.0002360756971106548, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.0002671562363102382, + "loss": 0.0219, "step": 84470 }, { - "epoch": 0.43, - "learning_rate": 0.00023606812941764078, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.0002671523480938667, + "loss": 0.0259, "step": 84480 }, { - "epoch": 0.43, - "learning_rate": 0.00023606056172462676, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.0002671484598774952, + "loss": 0.0235, "step": 84490 }, { - "epoch": 0.43, - "learning_rate": 0.00023605299403161277, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.00026714457166112374, + "loss": 0.0226, "step": 84500 }, { - "epoch": 0.43, - "learning_rate": 0.00023604542633859875, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.0002671406834447523, + "loss": 0.02, "step": 84510 }, { - "epoch": 0.43, - "learning_rate": 0.00023603785864558473, - "loss": 0.015, + "epoch": 0.22, + "learning_rate": 0.0002671367952283808, + "loss": 0.0261, "step": 84520 }, { - "epoch": 0.43, - "learning_rate": 0.00023603029095257074, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.0002671329070120094, + "loss": 0.0226, "step": 84530 }, { - "epoch": 0.43, - "learning_rate": 0.00023602272325955672, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.0002671290187956379, + "loss": 0.0231, "step": 84540 }, { - "epoch": 0.43, - "learning_rate": 0.0002360151555665427, - "loss": 0.0156, + "epoch": 0.22, + "learning_rate": 0.0002671251305792665, + "loss": 0.0191, "step": 84550 }, { - "epoch": 0.43, - "learning_rate": 0.0002360075878735287, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.000267121242362895, + "loss": 0.0236, "step": 84560 }, { - "epoch": 0.43, - "learning_rate": 0.0002360000201805147, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.0002671173541465235, + "loss": 0.024, "step": 84570 }, { - "epoch": 0.43, - "learning_rate": 0.00023599245248750067, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.0002671134659301521, + "loss": 0.0221, "step": 84580 }, { - "epoch": 0.43, - "learning_rate": 0.00023598488479448668, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.0002671095777137806, + "loss": 0.0253, "step": 84590 }, { - "epoch": 0.43, - "learning_rate": 0.00023597731710147266, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.00026710568949740916, + "loss": 0.0212, "step": 84600 }, { - "epoch": 0.43, - "learning_rate": 0.00023596974940845865, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.00026710180128103767, + "loss": 0.0243, "step": 84610 }, { - "epoch": 0.43, - "learning_rate": 0.00023596218171544465, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.0002670979130646662, + "loss": 0.0235, "step": 84620 }, { - "epoch": 0.43, - "learning_rate": 0.00023595461402243064, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.0002670940248482947, + "loss": 0.0226, "step": 84630 }, { - "epoch": 0.43, - "learning_rate": 0.00023594704632941662, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026709013663192327, + "loss": 0.0206, "step": 84640 }, { - "epoch": 0.43, - "learning_rate": 0.00023593947863640263, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.0002670862484155518, + "loss": 0.0299, "step": 84650 }, { - "epoch": 0.43, - "learning_rate": 0.0002359319109433886, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.00026708236019918035, + "loss": 0.0224, "step": 84660 }, { - "epoch": 0.43, - "learning_rate": 0.0002359243432503746, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.00026707847198280887, + "loss": 0.0321, "step": 84670 }, { - "epoch": 0.43, - "learning_rate": 0.00023591677555736057, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.00026707458376643744, + "loss": 0.0238, "step": 84680 }, { - "epoch": 0.43, - "learning_rate": 0.00023590920786434658, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026707069555006595, + "loss": 0.025, "step": 84690 }, { - "epoch": 0.43, - "learning_rate": 0.00023590164017133256, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.00026706680733369447, + "loss": 0.0226, "step": 84700 }, { - "epoch": 0.43, - "learning_rate": 0.00023589407247831854, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.000267062919117323, + "loss": 0.0234, "step": 84710 }, { - "epoch": 0.43, - "learning_rate": 0.00023588650478530455, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026705903090095155, + "loss": 0.0303, "step": 84720 }, { - "epoch": 0.43, - "learning_rate": 0.00023587893709229053, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002670551426845801, + "loss": 0.0172, "step": 84730 }, { - "epoch": 0.43, - "learning_rate": 0.0002358713693992765, - "loss": 0.0136, + "epoch": 0.22, + "learning_rate": 0.00026705125446820863, + "loss": 0.0247, "step": 84740 }, { - "epoch": 0.43, - "learning_rate": 0.00023586380170626252, - "loss": 0.015, + "epoch": 0.22, + "learning_rate": 0.00026704736625183715, + "loss": 0.0246, "step": 84750 }, { - "epoch": 0.43, - "learning_rate": 0.0002358562340132485, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.0002670434780354657, + "loss": 0.0255, "step": 84760 }, { - "epoch": 0.43, - "learning_rate": 0.00023584866632023448, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.00026703958981909423, + "loss": 0.023, "step": 84770 }, { - "epoch": 0.43, - "learning_rate": 0.0002358410986272205, - "loss": 0.0197, + "epoch": 0.22, + "learning_rate": 0.00026703570160272274, + "loss": 0.0277, "step": 84780 }, { - "epoch": 0.43, - "learning_rate": 0.00023583353093420647, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.0002670318133863513, + "loss": 0.0267, "step": 84790 }, { - "epoch": 0.43, - "learning_rate": 0.00023582596324119246, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026702792516997983, + "loss": 0.0235, "step": 84800 }, { - "epoch": 0.43, - "learning_rate": 0.00023581839554817846, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.0002670240369536084, + "loss": 0.0277, "step": 84810 }, { - "epoch": 0.43, - "learning_rate": 0.00023581082785516445, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.0002670201487372369, + "loss": 0.0231, "step": 84820 }, { - "epoch": 0.43, - "learning_rate": 0.00023580326016215043, - "loss": 0.0206, + "epoch": 0.22, + "learning_rate": 0.0002670162605208654, + "loss": 0.0226, "step": 84830 }, { - "epoch": 0.43, - "learning_rate": 0.00023579569246913638, - "loss": 0.0149, + "epoch": 0.22, + "learning_rate": 0.000267012372304494, + "loss": 0.0237, "step": 84840 }, { - "epoch": 0.43, - "learning_rate": 0.0002357881247761224, - "loss": 0.0203, + "epoch": 0.22, + "learning_rate": 0.0002670084840881225, + "loss": 0.0245, "step": 84850 }, { - "epoch": 0.43, - "learning_rate": 0.00023578055708310837, - "loss": 0.018, + "epoch": 0.22, + "learning_rate": 0.000267004595871751, + "loss": 0.0229, "step": 84860 }, { - "epoch": 0.43, - "learning_rate": 0.00023577298939009435, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.0002670007076553796, + "loss": 0.0195, "step": 84870 }, { - "epoch": 0.43, - "learning_rate": 0.00023576542169708033, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.0002669968194390081, + "loss": 0.0256, "step": 84880 }, { - "epoch": 0.43, - "learning_rate": 0.00023575785400406634, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002669929312226367, + "loss": 0.0237, "step": 84890 }, { - "epoch": 0.43, - "learning_rate": 0.00023575028631105232, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002669890430062652, + "loss": 0.0219, "step": 84900 }, { - "epoch": 0.43, - "learning_rate": 0.0002357427186180383, - "loss": 0.0219, + "epoch": 0.22, + "learning_rate": 0.0002669851547898937, + "loss": 0.0272, "step": 84910 }, { - "epoch": 0.43, - "learning_rate": 0.00023573515092502431, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.0002669812665735222, + "loss": 0.0224, "step": 84920 }, { - "epoch": 0.43, - "learning_rate": 0.0002357275832320103, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.0002669773783571508, + "loss": 0.0248, "step": 84930 }, { - "epoch": 0.43, - "learning_rate": 0.00023572001553899628, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.00026697349014077936, + "loss": 0.018, "step": 84940 }, { - "epoch": 0.43, - "learning_rate": 0.00023571244784598229, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.00026696960192440787, + "loss": 0.031, "step": 84950 }, { - "epoch": 0.43, - "learning_rate": 0.00023570488015296827, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.0002669657137080364, + "loss": 0.0223, "step": 84960 }, { - "epoch": 0.43, - "learning_rate": 0.00023569731245995425, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.00026696182549166495, + "loss": 0.0245, "step": 84970 }, { - "epoch": 0.43, - "learning_rate": 0.00023568974476694026, - "loss": 0.0209, + "epoch": 0.22, + "learning_rate": 0.00026695793727529347, + "loss": 0.0246, "step": 84980 }, { - "epoch": 0.43, - "learning_rate": 0.00023568217707392624, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.000266954049058922, + "loss": 0.0211, "step": 84990 }, { - "epoch": 0.43, - "learning_rate": 0.00023567460938091222, - "loss": 0.014, + "epoch": 0.22, + "learning_rate": 0.00026695016084255055, + "loss": 0.0232, "step": 85000 }, { - "epoch": 0.43, - "eval_cer": 0.9145236276900593, - "eval_loss": 0.01236006710678339, - "eval_runtime": 116.6924, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.22, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.017778005450963974, + "eval_runtime": 108.2093, + "eval_samples_per_second": 18.483, + "eval_steps_per_second": 4.621, "step": 85000 }, { - "epoch": 0.43, - "learning_rate": 0.00023566704168789823, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.00026694627262617907, + "loss": 0.0212, "step": 85010 }, { - "epoch": 0.43, - "learning_rate": 0.0002356594739948842, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.00026694238440980764, + "loss": 0.0298, "step": 85020 }, { - "epoch": 0.43, - "learning_rate": 0.0002356519063018702, - "loss": 0.0167, + "epoch": 0.22, + "learning_rate": 0.00026693849619343615, + "loss": 0.0245, "step": 85030 }, { - "epoch": 0.43, - "learning_rate": 0.0002356443386088562, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026693460797706466, + "loss": 0.0234, "step": 85040 }, { - "epoch": 0.43, - "learning_rate": 0.00023563677091584218, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.00026693071976069323, + "loss": 0.0232, "step": 85050 }, { - "epoch": 0.43, - "learning_rate": 0.00023562920322282816, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.00026692683154432175, + "loss": 0.0186, "step": 85060 }, { - "epoch": 0.43, - "learning_rate": 0.00023562163552981414, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.0002669229433279503, + "loss": 0.0321, "step": 85070 }, { - "epoch": 0.43, - "learning_rate": 0.00023561406783680015, - "loss": 0.0224, + "epoch": 0.22, + "learning_rate": 0.00026691905511157883, + "loss": 0.0247, "step": 85080 }, { - "epoch": 0.43, - "learning_rate": 0.00023560650014378613, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002669151668952074, + "loss": 0.0245, "step": 85090 }, { - "epoch": 0.43, - "learning_rate": 0.00023559893245077212, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.0002669112786788359, + "loss": 0.0263, "step": 85100 }, { - "epoch": 0.43, - "learning_rate": 0.00023559136475775812, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026690739046246443, + "loss": 0.0235, "step": 85110 }, { - "epoch": 0.43, - "learning_rate": 0.0002355837970647441, - "loss": 0.0232, + "epoch": 0.22, + "learning_rate": 0.00026690350224609294, + "loss": 0.0194, "step": 85120 }, { - "epoch": 0.43, - "learning_rate": 0.0002355762293717301, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002668996140297215, + "loss": 0.023, "step": 85130 }, { - "epoch": 0.43, - "learning_rate": 0.0002355686616787161, - "loss": 0.0187, + "epoch": 0.22, + "learning_rate": 0.00026689572581335, + "loss": 0.0212, "step": 85140 }, { - "epoch": 0.43, - "learning_rate": 0.00023556109398570208, - "loss": 0.0213, + "epoch": 0.22, + "learning_rate": 0.0002668918375969786, + "loss": 0.0245, "step": 85150 }, { - "epoch": 0.43, - "learning_rate": 0.00023555352629268806, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.0002668879493806071, + "loss": 0.0223, "step": 85160 }, { - "epoch": 0.43, - "learning_rate": 0.00023554595859967407, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002668840611642356, + "loss": 0.0277, "step": 85170 }, { - "epoch": 0.43, - "learning_rate": 0.00023553839090666005, - "loss": 0.0219, + "epoch": 0.22, + "learning_rate": 0.0002668801729478642, + "loss": 0.0267, "step": 85180 }, { - "epoch": 0.43, - "learning_rate": 0.00023553082321364603, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.0002668762847314927, + "loss": 0.0233, "step": 85190 }, { - "epoch": 0.43, - "learning_rate": 0.00023552325552063204, - "loss": 0.0119, + "epoch": 0.22, + "learning_rate": 0.0002668723965151212, + "loss": 0.0211, "step": 85200 }, { - "epoch": 0.43, - "learning_rate": 0.00023551568782761802, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.0002668685082987498, + "loss": 0.0263, "step": 85210 }, { - "epoch": 0.43, - "learning_rate": 0.000235508120134604, - "loss": 0.0229, + "epoch": 0.22, + "learning_rate": 0.00026686462008237836, + "loss": 0.025, "step": 85220 }, { - "epoch": 0.43, - "learning_rate": 0.00023550055244158998, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002668607318660069, + "loss": 0.0248, "step": 85230 }, { - "epoch": 0.43, - "learning_rate": 0.000235492984748576, - "loss": 0.0147, + "epoch": 0.22, + "learning_rate": 0.0002668568436496354, + "loss": 0.0232, "step": 85240 }, { - "epoch": 0.43, - "learning_rate": 0.00023548541705556197, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.0002668529554332639, + "loss": 0.0227, "step": 85250 }, { - "epoch": 0.43, - "learning_rate": 0.00023547784936254795, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.00026684906721689247, + "loss": 0.0302, "step": 85260 }, { - "epoch": 0.43, - "learning_rate": 0.00023547028166953396, - "loss": 0.0185, + "epoch": 0.22, + "learning_rate": 0.000266845179000521, + "loss": 0.0242, "step": 85270 }, { - "epoch": 0.43, - "learning_rate": 0.00023546271397651994, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026684129078414956, + "loss": 0.029, "step": 85280 }, { - "epoch": 0.43, - "learning_rate": 0.00023545514628350593, - "loss": 0.0205, + "epoch": 0.22, + "learning_rate": 0.00026683740256777807, + "loss": 0.0237, "step": 85290 }, { - "epoch": 0.43, - "learning_rate": 0.00023544757859049193, - "loss": 0.0212, + "epoch": 0.22, + "learning_rate": 0.00026683351435140664, + "loss": 0.0255, "step": 85300 }, { - "epoch": 0.43, - "learning_rate": 0.00023544001089747792, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.00026682962613503515, + "loss": 0.0204, "step": 85310 }, { - "epoch": 0.43, - "learning_rate": 0.0002354324432044639, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026682573791866367, + "loss": 0.0251, "step": 85320 }, { - "epoch": 0.43, - "learning_rate": 0.0002354248755114499, - "loss": 0.0301, + "epoch": 0.22, + "learning_rate": 0.0002668218497022922, + "loss": 0.0263, "step": 85330 }, { - "epoch": 0.43, - "learning_rate": 0.0002354173078184359, - "loss": 0.0199, + "epoch": 0.22, + "learning_rate": 0.00026681796148592075, + "loss": 0.0208, "step": 85340 }, { - "epoch": 0.43, - "learning_rate": 0.00023540974012542187, - "loss": 0.0149, + "epoch": 0.22, + "learning_rate": 0.00026681407326954927, + "loss": 0.0253, "step": 85350 }, { - "epoch": 0.43, - "learning_rate": 0.00023540217243240788, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.00026681018505317783, + "loss": 0.0274, "step": 85360 }, { - "epoch": 0.43, - "learning_rate": 0.00023539460473939386, - "loss": 0.0229, + "epoch": 0.22, + "learning_rate": 0.00026680629683680635, + "loss": 0.0217, "step": 85370 }, { - "epoch": 0.43, - "learning_rate": 0.00023538703704637984, - "loss": 0.0135, + "epoch": 0.22, + "learning_rate": 0.00026680240862043486, + "loss": 0.0241, "step": 85380 }, { - "epoch": 0.43, - "learning_rate": 0.00023537946935336582, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.00026679852040406343, + "loss": 0.028, "step": 85390 }, { - "epoch": 0.43, - "learning_rate": 0.00023537190166035183, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.00026679463218769195, + "loss": 0.0222, "step": 85400 }, { - "epoch": 0.43, - "learning_rate": 0.0002353643339673378, - "loss": 0.0154, + "epoch": 0.22, + "learning_rate": 0.00026679074397132046, + "loss": 0.0296, "step": 85410 }, { - "epoch": 0.43, - "learning_rate": 0.0002353567662743238, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026678685575494903, + "loss": 0.0244, "step": 85420 }, { - "epoch": 0.43, - "learning_rate": 0.0002353491985813098, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.0002667829675385776, + "loss": 0.0251, "step": 85430 }, { - "epoch": 0.43, - "learning_rate": 0.00023534163088829578, - "loss": 0.0134, + "epoch": 0.22, + "learning_rate": 0.0002667790793222061, + "loss": 0.028, "step": 85440 }, { - "epoch": 0.43, - "learning_rate": 0.00023533406319528176, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.00026677519110583463, + "loss": 0.0236, "step": 85450 }, { - "epoch": 0.43, - "learning_rate": 0.00023532649550226777, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.00026677130288946314, + "loss": 0.0242, "step": 85460 }, { - "epoch": 0.43, - "learning_rate": 0.00023531892780925375, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.0002667674146730917, + "loss": 0.0287, "step": 85470 }, { - "epoch": 0.43, - "learning_rate": 0.00023531136011623974, - "loss": 0.0146, + "epoch": 0.22, + "learning_rate": 0.0002667635264567202, + "loss": 0.0222, "step": 85480 }, { - "epoch": 0.43, - "learning_rate": 0.00023530379242322574, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.0002667596382403488, + "loss": 0.0236, "step": 85490 }, { - "epoch": 0.43, - "learning_rate": 0.00023529622473021173, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.0002667557500239773, + "loss": 0.024, "step": 85500 }, { - "epoch": 0.43, - "learning_rate": 0.0002352886570371977, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.0002667518618076059, + "loss": 0.0204, "step": 85510 }, { - "epoch": 0.43, - "learning_rate": 0.00023528108934418372, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002667479735912344, + "loss": 0.0264, "step": 85520 }, { - "epoch": 0.43, - "learning_rate": 0.0002352735216511697, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002667440853748629, + "loss": 0.0227, "step": 85530 }, { - "epoch": 0.43, - "learning_rate": 0.00023526595395815568, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002667401971584914, + "loss": 0.021, "step": 85540 }, { - "epoch": 0.43, - "learning_rate": 0.00023525838626514166, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.00026673630894212, + "loss": 0.0225, "step": 85550 }, { - "epoch": 0.43, - "learning_rate": 0.00023525081857212767, - "loss": 0.0123, + "epoch": 0.22, + "learning_rate": 0.0002667324207257485, + "loss": 0.0245, "step": 85560 }, { - "epoch": 0.43, - "learning_rate": 0.00023524325087911365, - "loss": 0.0198, + "epoch": 0.22, + "learning_rate": 0.0002667285325093771, + "loss": 0.0172, "step": 85570 }, { - "epoch": 0.43, - "learning_rate": 0.00023523568318609963, - "loss": 0.0272, + "epoch": 0.22, + "learning_rate": 0.0002667246442930056, + "loss": 0.0195, "step": 85580 }, { - "epoch": 0.43, - "learning_rate": 0.00023522811549308564, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026672075607663416, + "loss": 0.0277, "step": 85590 }, { - "epoch": 0.43, - "learning_rate": 0.00023522054780007162, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.00026671686786026267, + "loss": 0.0222, "step": 85600 }, { - "epoch": 0.43, - "learning_rate": 0.0002352129801070576, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.0002667129796438912, + "loss": 0.0225, "step": 85610 }, { - "epoch": 0.43, - "learning_rate": 0.0002352054124140436, - "loss": 0.0219, + "epoch": 0.22, + "learning_rate": 0.00026670909142751975, + "loss": 0.0213, "step": 85620 }, { - "epoch": 0.43, - "learning_rate": 0.0002351978447210296, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.00026670520321114827, + "loss": 0.0245, "step": 85630 }, { - "epoch": 0.43, - "learning_rate": 0.00023519027702801557, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.00026670131499477684, + "loss": 0.0247, "step": 85640 }, { - "epoch": 0.43, - "learning_rate": 0.00023518270933500158, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.00026669742677840535, + "loss": 0.0261, "step": 85650 }, { - "epoch": 0.43, - "learning_rate": 0.00023517514164198756, - "loss": 0.0149, + "epoch": 0.22, + "learning_rate": 0.00026669353856203387, + "loss": 0.0244, "step": 85660 }, { - "epoch": 0.43, - "learning_rate": 0.00023516757394897355, - "loss": 0.0168, + "epoch": 0.22, + "learning_rate": 0.0002666896503456624, + "loss": 0.0318, "step": 85670 }, { - "epoch": 0.43, - "learning_rate": 0.00023516000625595955, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026668576212929095, + "loss": 0.0236, "step": 85680 }, { - "epoch": 0.43, - "learning_rate": 0.00023515243856294554, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.00026668187391291946, + "loss": 0.0216, "step": 85690 }, { - "epoch": 0.43, - "learning_rate": 0.00023514487086993152, - "loss": 0.0115, + "epoch": 0.22, + "learning_rate": 0.00026667798569654803, + "loss": 0.0239, "step": 85700 }, { - "epoch": 0.43, - "learning_rate": 0.00023513730317691753, - "loss": 0.0178, + "epoch": 0.22, + "learning_rate": 0.00026667409748017655, + "loss": 0.0245, "step": 85710 }, { - "epoch": 0.43, - "learning_rate": 0.0002351297354839035, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.0002666702092638051, + "loss": 0.026, "step": 85720 }, { - "epoch": 0.43, - "learning_rate": 0.0002351221677908895, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026666632104743363, + "loss": 0.0292, "step": 85730 }, { - "epoch": 0.43, - "learning_rate": 0.00023511460009787547, - "loss": 0.0182, + "epoch": 0.22, + "learning_rate": 0.00026666243283106215, + "loss": 0.0255, "step": 85740 }, { - "epoch": 0.43, - "learning_rate": 0.00023510703240486148, - "loss": 0.0233, + "epoch": 0.22, + "learning_rate": 0.00026665854461469066, + "loss": 0.023, "step": 85750 }, { - "epoch": 0.43, - "learning_rate": 0.00023509946471184746, - "loss": 0.0231, + "epoch": 0.22, + "learning_rate": 0.00026665465639831923, + "loss": 0.0191, "step": 85760 }, { - "epoch": 0.43, - "learning_rate": 0.00023509189701883344, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.0002666507681819478, + "loss": 0.025, "step": 85770 }, { - "epoch": 0.43, - "learning_rate": 0.00023508432932581945, - "loss": 0.0201, + "epoch": 0.22, + "learning_rate": 0.0002666468799655763, + "loss": 0.0227, "step": 85780 }, { - "epoch": 0.43, - "learning_rate": 0.00023507676163280543, - "loss": 0.023, + "epoch": 0.22, + "learning_rate": 0.0002666429917492048, + "loss": 0.0275, "step": 85790 }, { - "epoch": 0.43, - "learning_rate": 0.0002350691939397914, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002666391035328334, + "loss": 0.0272, "step": 85800 }, { - "epoch": 0.43, - "learning_rate": 0.00023506162624677742, - "loss": 0.023, + "epoch": 0.22, + "learning_rate": 0.0002666352153164619, + "loss": 0.0245, "step": 85810 }, { - "epoch": 0.43, - "learning_rate": 0.0002350540585537634, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.0002666313271000904, + "loss": 0.0241, "step": 85820 }, { - "epoch": 0.43, - "learning_rate": 0.00023504649086074938, - "loss": 0.0202, + "epoch": 0.22, + "learning_rate": 0.000266627438883719, + "loss": 0.0236, "step": 85830 }, { - "epoch": 0.43, - "learning_rate": 0.0002350389231677354, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002666235506673475, + "loss": 0.0206, "step": 85840 }, { - "epoch": 0.43, - "learning_rate": 0.00023503135547472137, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002666196624509761, + "loss": 0.0258, "step": 85850 }, { - "epoch": 0.43, - "learning_rate": 0.00023502378778170736, - "loss": 0.0139, + "epoch": 0.22, + "learning_rate": 0.0002666157742346046, + "loss": 0.0255, "step": 85860 }, { - "epoch": 0.43, - "learning_rate": 0.00023501622008869336, - "loss": 0.0157, + "epoch": 0.22, + "learning_rate": 0.0002666118860182331, + "loss": 0.0197, "step": 85870 }, { - "epoch": 0.43, - "learning_rate": 0.00023500865239567935, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002666079978018616, + "loss": 0.0233, "step": 85880 }, { - "epoch": 0.43, - "learning_rate": 0.00023500108470266533, - "loss": 0.0174, + "epoch": 0.22, + "learning_rate": 0.0002666041095854902, + "loss": 0.0262, "step": 85890 }, { - "epoch": 0.43, - "learning_rate": 0.0002349935170096513, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.0002666002213691187, + "loss": 0.0266, "step": 85900 }, { - "epoch": 0.43, - "learning_rate": 0.00023498594931663732, - "loss": 0.0237, + "epoch": 0.22, + "learning_rate": 0.00026659633315274727, + "loss": 0.0248, "step": 85910 }, { - "epoch": 0.43, - "learning_rate": 0.0002349783816236233, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002665924449363758, + "loss": 0.0244, "step": 85920 }, { - "epoch": 0.43, - "learning_rate": 0.00023497081393060928, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026658855672000436, + "loss": 0.0233, "step": 85930 }, { - "epoch": 0.43, - "learning_rate": 0.0002349632462375953, - "loss": 0.0175, + "epoch": 0.22, + "learning_rate": 0.00026658466850363287, + "loss": 0.0227, "step": 85940 }, { - "epoch": 0.43, - "learning_rate": 0.00023495567854458127, - "loss": 0.0183, + "epoch": 0.22, + "learning_rate": 0.0002665807802872614, + "loss": 0.0238, "step": 85950 }, { - "epoch": 0.43, - "learning_rate": 0.00023494811085156725, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.0002665768920708899, + "loss": 0.0257, "step": 85960 }, { - "epoch": 0.43, - "learning_rate": 0.00023494054315855326, - "loss": 0.0143, + "epoch": 0.22, + "learning_rate": 0.00026657300385451847, + "loss": 0.0241, "step": 85970 }, { - "epoch": 0.43, - "learning_rate": 0.00023493297546553924, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026656911563814704, + "loss": 0.021, "step": 85980 }, { - "epoch": 0.43, - "learning_rate": 0.00023492540777252522, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026656522742177555, + "loss": 0.0232, "step": 85990 }, { - "epoch": 0.43, - "learning_rate": 0.00023491784007951123, - "loss": 0.0186, + "epoch": 0.22, + "learning_rate": 0.00026656133920540407, + "loss": 0.0236, "step": 86000 }, { - "epoch": 0.43, - "eval_cer": 0.9144702559031622, - "eval_loss": 0.012443006969988346, - "eval_runtime": 116.6618, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.22, + "eval_cer": 0.8817950623608236, + "eval_loss": 0.017185769975185394, + "eval_runtime": 107.5803, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, "step": 86000 }, { - "epoch": 0.43, - "learning_rate": 0.0002349102723864972, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026655745098903263, + "loss": 0.0215, "step": 86010 }, { - "epoch": 0.43, - "learning_rate": 0.0002349027046934832, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026655356277266115, + "loss": 0.032, "step": 86020 }, { - "epoch": 0.43, - "learning_rate": 0.0002348951370004692, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.00026654967455628966, + "loss": 0.0219, "step": 86030 }, { - "epoch": 0.43, - "learning_rate": 0.00023488756930745518, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026654578633991823, + "loss": 0.0273, "step": 86040 }, { - "epoch": 0.43, - "learning_rate": 0.00023488000161444117, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026654189812354675, + "loss": 0.0252, "step": 86050 }, { - "epoch": 0.43, - "learning_rate": 0.00023487243392142715, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002665380099071753, + "loss": 0.0206, "step": 86060 }, { - "epoch": 0.43, - "learning_rate": 0.00023486486622841316, - "loss": 0.0178, + "epoch": 0.22, + "learning_rate": 0.00026653412169080383, + "loss": 0.0244, "step": 86070 }, { - "epoch": 0.43, - "learning_rate": 0.00023485729853539914, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.00026653023347443234, + "loss": 0.0289, "step": 86080 }, { - "epoch": 0.43, - "learning_rate": 0.00023484973084238512, - "loss": 0.0184, + "epoch": 0.22, + "learning_rate": 0.0002665263452580609, + "loss": 0.0235, "step": 86090 }, { - "epoch": 0.43, - "learning_rate": 0.0002348421631493711, - "loss": 0.017, + "epoch": 0.22, + "learning_rate": 0.00026652245704168943, + "loss": 0.0226, "step": 86100 }, { - "epoch": 0.43, - "learning_rate": 0.00023483459545635708, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.00026651856882531794, + "loss": 0.0278, "step": 86110 }, { - "epoch": 0.43, - "learning_rate": 0.00023482702776334306, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002665146806089465, + "loss": 0.0233, "step": 86120 }, { - "epoch": 0.43, - "learning_rate": 0.00023481946007032904, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.000266510792392575, + "loss": 0.0228, "step": 86130 }, { - "epoch": 0.43, - "learning_rate": 0.00023481189237731505, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.0002665069041762036, + "loss": 0.0224, "step": 86140 }, { - "epoch": 0.43, - "learning_rate": 0.00023480432468430103, - "loss": 0.021, + "epoch": 0.22, + "learning_rate": 0.0002665030159598321, + "loss": 0.0263, "step": 86150 }, { - "epoch": 0.43, - "learning_rate": 0.00023479675699128702, - "loss": 0.0153, + "epoch": 0.22, + "learning_rate": 0.0002664991277434606, + "loss": 0.0269, "step": 86160 }, { - "epoch": 0.43, - "learning_rate": 0.00023478918929827302, - "loss": 0.0155, + "epoch": 0.22, + "learning_rate": 0.0002664952395270892, + "loss": 0.0238, "step": 86170 }, { - "epoch": 0.43, - "learning_rate": 0.000234781621605259, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.0002664913513107177, + "loss": 0.026, "step": 86180 }, { - "epoch": 0.43, - "learning_rate": 0.000234774053912245, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.0002664874630943463, + "loss": 0.0211, "step": 86190 }, { - "epoch": 0.43, - "learning_rate": 0.000234766486219231, - "loss": 0.0251, + "epoch": 0.22, + "learning_rate": 0.0002664835748779748, + "loss": 0.0215, "step": 86200 }, { - "epoch": 0.43, - "learning_rate": 0.00023475891852621698, - "loss": 0.0162, + "epoch": 0.22, + "learning_rate": 0.0002664796866616033, + "loss": 0.0246, "step": 86210 }, { - "epoch": 0.43, - "learning_rate": 0.00023475135083320296, - "loss": 0.0194, + "epoch": 0.22, + "learning_rate": 0.0002664757984452319, + "loss": 0.0254, "step": 86220 }, { - "epoch": 0.44, - "learning_rate": 0.00023474378314018897, - "loss": 0.0236, + "epoch": 0.22, + "learning_rate": 0.0002664719102288604, + "loss": 0.0253, "step": 86230 }, { - "epoch": 0.44, - "learning_rate": 0.00023473621544717495, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002664680220124889, + "loss": 0.0195, "step": 86240 }, { - "epoch": 0.44, - "learning_rate": 0.00023472864775416093, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.00026646413379611747, + "loss": 0.0259, "step": 86250 }, { - "epoch": 0.44, - "learning_rate": 0.00023472108006114694, - "loss": 0.0137, + "epoch": 0.22, + "learning_rate": 0.000266460245579746, + "loss": 0.024, "step": 86260 }, { - "epoch": 0.44, - "learning_rate": 0.00023471351236813292, - "loss": 0.0157, + "epoch": 0.22, + "learning_rate": 0.00026645635736337455, + "loss": 0.0219, "step": 86270 }, { - "epoch": 0.44, - "learning_rate": 0.0002347059446751189, - "loss": 0.0172, + "epoch": 0.22, + "learning_rate": 0.00026645246914700307, + "loss": 0.0189, "step": 86280 }, { - "epoch": 0.44, - "learning_rate": 0.00023469837698210488, - "loss": 0.0181, + "epoch": 0.22, + "learning_rate": 0.0002664485809306316, + "loss": 0.0269, "step": 86290 }, { - "epoch": 0.44, - "learning_rate": 0.0002346908092890909, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.00026644469271426015, + "loss": 0.0334, "step": 86300 }, { - "epoch": 0.44, - "learning_rate": 0.00023468324159607687, - "loss": 0.0136, + "epoch": 0.22, + "learning_rate": 0.00026644080449788867, + "loss": 0.0241, "step": 86310 }, { - "epoch": 0.44, - "learning_rate": 0.00023467567390306285, - "loss": 0.016, + "epoch": 0.22, + "learning_rate": 0.00026643691628151724, + "loss": 0.0214, "step": 86320 }, { - "epoch": 0.44, - "learning_rate": 0.00023466810621004886, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.00026643302806514575, + "loss": 0.0231, "step": 86330 }, { - "epoch": 0.44, - "learning_rate": 0.00023466053851703484, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.0002664291398487743, + "loss": 0.0268, "step": 86340 }, { - "epoch": 0.44, - "learning_rate": 0.00023465297082402083, - "loss": 0.0159, + "epoch": 0.22, + "learning_rate": 0.00026642525163240283, + "loss": 0.0226, "step": 86350 }, { - "epoch": 0.44, - "learning_rate": 0.00023464540313100683, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026642136341603135, + "loss": 0.0248, "step": 86360 }, { - "epoch": 0.44, - "learning_rate": 0.00023463783543799282, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.00026641747519965986, + "loss": 0.0222, "step": 86370 }, { - "epoch": 0.44, - "learning_rate": 0.0002346302677449788, - "loss": 0.014, + "epoch": 0.22, + "learning_rate": 0.00026641358698328843, + "loss": 0.0253, "step": 86380 }, { - "epoch": 0.44, - "learning_rate": 0.0002346227000519648, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.00026640969876691695, + "loss": 0.0222, "step": 86390 }, { - "epoch": 0.44, - "learning_rate": 0.0002346151323589508, - "loss": 0.019, + "epoch": 0.22, + "learning_rate": 0.0002664058105505455, + "loss": 0.0197, "step": 86400 }, { - "epoch": 0.44, - "learning_rate": 0.00023460756466593677, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.00026640192233417403, + "loss": 0.0207, "step": 86410 }, { - "epoch": 0.44, - "learning_rate": 0.00023459999697292278, - "loss": 0.0169, + "epoch": 0.22, + "learning_rate": 0.00026639803411780254, + "loss": 0.0242, "step": 86420 }, { - "epoch": 0.44, - "learning_rate": 0.00023459242927990876, - "loss": 0.0149, + "epoch": 0.22, + "learning_rate": 0.0002663941459014311, + "loss": 0.0238, "step": 86430 }, { - "epoch": 0.44, - "learning_rate": 0.00023458486158689474, - "loss": 0.0163, + "epoch": 0.22, + "learning_rate": 0.0002663902576850596, + "loss": 0.0212, "step": 86440 }, { - "epoch": 0.44, - "learning_rate": 0.00023457729389388072, - "loss": 0.0152, + "epoch": 0.22, + "learning_rate": 0.00026638636946868814, + "loss": 0.0186, "step": 86450 }, { - "epoch": 0.44, - "learning_rate": 0.00023456972620086673, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.0002663824812523167, + "loss": 0.0233, "step": 86460 }, { - "epoch": 0.44, - "learning_rate": 0.0002345621585078527, - "loss": 0.0149, + "epoch": 0.22, + "learning_rate": 0.0002663785930359453, + "loss": 0.026, "step": 86470 }, { - "epoch": 0.44, - "learning_rate": 0.0002345545908148387, - "loss": 0.0228, + "epoch": 0.22, + "learning_rate": 0.0002663747048195738, + "loss": 0.0218, "step": 86480 }, { - "epoch": 0.44, - "learning_rate": 0.0002345470231218247, - "loss": 0.0214, + "epoch": 0.22, + "learning_rate": 0.0002663708166032023, + "loss": 0.0253, "step": 86490 }, { - "epoch": 0.44, - "learning_rate": 0.00023453945542881068, - "loss": 0.0142, + "epoch": 0.22, + "learning_rate": 0.0002663669283868308, + "loss": 0.0236, "step": 86500 }, { - "epoch": 0.44, - "learning_rate": 0.00023453188773579667, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.0002663630401704594, + "loss": 0.0227, "step": 86510 }, { - "epoch": 0.44, - "learning_rate": 0.00023452432004278267, - "loss": 0.0293, + "epoch": 0.22, + "learning_rate": 0.0002663591519540879, + "loss": 0.0213, "step": 86520 }, { - "epoch": 0.44, - "learning_rate": 0.00023451675234976865, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.0002663552637377165, + "loss": 0.0287, "step": 86530 }, { - "epoch": 0.44, - "learning_rate": 0.00023450918465675464, - "loss": 0.0191, + "epoch": 0.22, + "learning_rate": 0.000266351375521345, + "loss": 0.025, "step": 86540 }, { - "epoch": 0.44, - "learning_rate": 0.00023450161696374064, - "loss": 0.015, + "epoch": 0.22, + "learning_rate": 0.00026634748730497356, + "loss": 0.0259, "step": 86550 }, { - "epoch": 0.44, - "learning_rate": 0.00023449404927072663, - "loss": 0.02, + "epoch": 0.22, + "learning_rate": 0.00026634359908860207, + "loss": 0.0219, "step": 86560 }, { - "epoch": 0.44, - "learning_rate": 0.0002344864815777126, - "loss": 0.0195, + "epoch": 0.22, + "learning_rate": 0.0002663397108722306, + "loss": 0.0208, "step": 86570 }, { - "epoch": 0.44, - "learning_rate": 0.00023447891388469862, - "loss": 0.0164, + "epoch": 0.22, + "learning_rate": 0.0002663358226558591, + "loss": 0.0216, "step": 86580 }, { - "epoch": 0.44, - "learning_rate": 0.0002344713461916846, - "loss": 0.0173, + "epoch": 0.22, + "learning_rate": 0.00026633193443948767, + "loss": 0.0231, "step": 86590 }, { - "epoch": 0.44, - "learning_rate": 0.00023446377849867058, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002663280462231162, + "loss": 0.0241, "step": 86600 }, { - "epoch": 0.44, - "learning_rate": 0.0002344562108056566, - "loss": 0.0161, + "epoch": 0.22, + "learning_rate": 0.00026632415800674475, + "loss": 0.0268, "step": 86610 }, { - "epoch": 0.44, - "learning_rate": 0.00023444864311264257, - "loss": 0.0179, + "epoch": 0.22, + "learning_rate": 0.00026632026979037327, + "loss": 0.0232, "step": 86620 }, { - "epoch": 0.44, - "learning_rate": 0.00023444107541962855, - "loss": 0.0188, + "epoch": 0.22, + "learning_rate": 0.0002663163815740018, + "loss": 0.0248, "step": 86630 }, { - "epoch": 0.44, - "learning_rate": 0.00023443350772661453, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.00026631249335763035, + "loss": 0.026, "step": 86640 }, { - "epoch": 0.44, - "learning_rate": 0.00023442594003360054, - "loss": 0.0145, + "epoch": 0.22, + "learning_rate": 0.00026630860514125887, + "loss": 0.0222, "step": 86650 }, { - "epoch": 0.44, - "learning_rate": 0.00023441837234058652, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.00026630471692488743, + "loss": 0.0265, "step": 86660 }, { - "epoch": 0.44, - "learning_rate": 0.0002344108046475725, - "loss": 0.0158, + "epoch": 0.22, + "learning_rate": 0.00026630082870851595, + "loss": 0.0216, "step": 86670 }, { - "epoch": 0.44, - "learning_rate": 0.0002344032369545585, - "loss": 0.0177, + "epoch": 0.22, + "learning_rate": 0.0002662969404921445, + "loss": 0.0262, "step": 86680 }, { - "epoch": 0.44, - "learning_rate": 0.0002343956692615445, - "loss": 0.0147, + "epoch": 0.22, + "learning_rate": 0.00026629305227577303, + "loss": 0.0245, "step": 86690 }, { - "epoch": 0.44, - "learning_rate": 0.00023438810156853048, - "loss": 0.0143, + "epoch": 0.22, + "learning_rate": 0.00026628916405940155, + "loss": 0.0211, "step": 86700 }, { - "epoch": 0.44, - "learning_rate": 0.00023438053387551648, - "loss": 0.0138, + "epoch": 0.22, + "learning_rate": 0.00026628527584303006, + "loss": 0.0246, "step": 86710 }, { - "epoch": 0.44, - "learning_rate": 0.00023437296618250247, - "loss": 0.0211, + "epoch": 0.22, + "learning_rate": 0.00026628138762665863, + "loss": 0.026, "step": 86720 }, { - "epoch": 0.44, - "learning_rate": 0.00023436539848948845, - "loss": 0.0192, + "epoch": 0.22, + "learning_rate": 0.00026627749941028714, + "loss": 0.02, "step": 86730 }, { - "epoch": 0.44, - "learning_rate": 0.00023435783079647446, - "loss": 0.0151, + "epoch": 0.22, + "learning_rate": 0.0002662736111939157, + "loss": 0.0186, "step": 86740 }, { - "epoch": 0.44, - "learning_rate": 0.00023435026310346044, - "loss": 0.0171, + "epoch": 0.22, + "learning_rate": 0.00026626972297754423, + "loss": 0.0265, "step": 86750 }, { - "epoch": 0.44, - "learning_rate": 0.00023434269541044642, - "loss": 0.0155, + "epoch": 0.22, + "learning_rate": 0.0002662658347611728, + "loss": 0.0197, "step": 86760 }, { - "epoch": 0.44, - "learning_rate": 0.00023433512771743243, - "loss": 0.0193, + "epoch": 0.22, + "learning_rate": 0.0002662619465448013, + "loss": 0.0199, "step": 86770 }, { - "epoch": 0.44, - "learning_rate": 0.0002343275600244184, - "loss": 0.0165, + "epoch": 0.22, + "learning_rate": 0.0002662580583284298, + "loss": 0.0193, "step": 86780 }, { - "epoch": 0.44, - "learning_rate": 0.0002343199923314044, - "loss": 0.0176, + "epoch": 0.22, + "learning_rate": 0.00026625417011205834, + "loss": 0.0254, "step": 86790 }, { - "epoch": 0.44, - "learning_rate": 0.00023431242463839037, - "loss": 0.0166, + "epoch": 0.22, + "learning_rate": 0.0002662502818956869, + "loss": 0.0278, "step": 86800 }, { - "epoch": 0.44, - "learning_rate": 0.00023430485694537638, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.0002662463936793155, + "loss": 0.0232, "step": 86810 }, { - "epoch": 0.44, - "learning_rate": 0.00023429728925236236, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.000266242505462944, + "loss": 0.0222, "step": 86820 }, { - "epoch": 0.44, - "learning_rate": 0.00023428972155934834, - "loss": 0.0147, + "epoch": 0.23, + "learning_rate": 0.0002662386172465725, + "loss": 0.0206, "step": 86830 }, { - "epoch": 0.44, - "learning_rate": 0.00023428215386633435, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.000266234729030201, + "loss": 0.0219, "step": 86840 }, { - "epoch": 0.44, - "learning_rate": 0.00023427458617332033, - "loss": 0.0196, + "epoch": 0.23, + "learning_rate": 0.0002662308408138296, + "loss": 0.0205, "step": 86850 }, { - "epoch": 0.44, - "learning_rate": 0.00023426701848030631, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.0002662269525974581, + "loss": 0.0208, "step": 86860 }, { - "epoch": 0.44, - "learning_rate": 0.00023425945078729232, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026622306438108667, + "loss": 0.0203, "step": 86870 }, { - "epoch": 0.44, - "learning_rate": 0.0002342518830942783, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.0002662191761647152, + "loss": 0.0225, "step": 86880 }, { - "epoch": 0.44, - "learning_rate": 0.00023424431540126429, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.00026621528794834376, + "loss": 0.0265, "step": 86890 }, { - "epoch": 0.44, - "learning_rate": 0.0002342367477082503, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.00026621139973197227, + "loss": 0.0268, "step": 86900 }, { - "epoch": 0.44, - "learning_rate": 0.00023422918001523628, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.0002662075115156008, + "loss": 0.0244, "step": 86910 }, { - "epoch": 0.44, - "learning_rate": 0.00023422161232222226, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.0002662036232992293, + "loss": 0.0228, "step": 86920 }, { - "epoch": 0.44, - "learning_rate": 0.00023421404462920827, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.00026619973508285787, + "loss": 0.0203, "step": 86930 }, { - "epoch": 0.44, - "learning_rate": 0.00023420647693619425, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002661958468664864, + "loss": 0.0226, "step": 86940 }, { - "epoch": 0.44, - "learning_rate": 0.00023419890924318023, - "loss": 0.0196, + "epoch": 0.23, + "learning_rate": 0.00026619195865011495, + "loss": 0.0195, "step": 86950 }, { - "epoch": 0.44, - "learning_rate": 0.0002341913415501662, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026618807043374347, + "loss": 0.0263, "step": 86960 }, { - "epoch": 0.44, - "learning_rate": 0.00023418377385715222, - "loss": 0.0243, + "epoch": 0.23, + "learning_rate": 0.00026618418221737203, + "loss": 0.0193, "step": 86970 }, { - "epoch": 0.44, - "learning_rate": 0.0002341762061641382, - "loss": 0.0139, + "epoch": 0.23, + "learning_rate": 0.00026618029400100055, + "loss": 0.0186, "step": 86980 }, { - "epoch": 0.44, - "learning_rate": 0.00023416863847112418, - "loss": 0.0147, + "epoch": 0.23, + "learning_rate": 0.00026617640578462906, + "loss": 0.0222, "step": 86990 }, { - "epoch": 0.44, - "learning_rate": 0.0002341610707781102, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002661725175682576, + "loss": 0.0225, "step": 87000 }, { - "epoch": 0.44, - "eval_cer": 0.9144848118450433, - "eval_loss": 0.012073654681444168, - "eval_runtime": 116.8061, - "eval_samples_per_second": 17.122, - "eval_steps_per_second": 4.281, + "epoch": 0.23, + "eval_cer": 0.8817950623608236, + "eval_loss": 0.017446931451559067, + "eval_runtime": 107.4054, + "eval_samples_per_second": 18.621, + "eval_steps_per_second": 4.655, "step": 87000 }, { - "epoch": 0.44, - "learning_rate": 0.00023415350308509617, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.00026616862935188615, + "loss": 0.0236, "step": 87010 }, { - "epoch": 0.44, - "learning_rate": 0.00023414593539208215, - "loss": 0.022, + "epoch": 0.23, + "learning_rate": 0.0002661647411355147, + "loss": 0.024, "step": 87020 }, { - "epoch": 0.44, - "learning_rate": 0.00023413836769906816, - "loss": 0.0149, + "epoch": 0.23, + "learning_rate": 0.00026616085291914323, + "loss": 0.0211, "step": 87030 }, { - "epoch": 0.44, - "learning_rate": 0.00023413080000605414, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.00026615696470277175, + "loss": 0.0237, "step": 87040 }, { - "epoch": 0.44, - "learning_rate": 0.00023412323231304012, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002661530764864003, + "loss": 0.0267, "step": 87050 }, { - "epoch": 0.44, - "learning_rate": 0.00023411566462002613, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.00026614918827002883, + "loss": 0.0251, "step": 87060 }, { - "epoch": 0.44, - "learning_rate": 0.00023410809692701211, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.00026614530005365734, + "loss": 0.0212, "step": 87070 }, { - "epoch": 0.44, - "learning_rate": 0.0002341005292339981, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002661414118372859, + "loss": 0.0268, "step": 87080 }, { - "epoch": 0.44, - "learning_rate": 0.0002340929615409841, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.0002661375236209144, + "loss": 0.026, "step": 87090 }, { - "epoch": 0.44, - "learning_rate": 0.00023408539384797009, - "loss": 0.024, + "epoch": 0.23, + "learning_rate": 0.000266133635404543, + "loss": 0.0206, "step": 87100 }, { - "epoch": 0.44, - "learning_rate": 0.00023407782615495607, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002661297471881715, + "loss": 0.0271, "step": 87110 }, { - "epoch": 0.44, - "learning_rate": 0.00023407025846194208, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.0002661258589718, + "loss": 0.0241, "step": 87120 }, { - "epoch": 0.44, - "learning_rate": 0.00023406269076892806, - "loss": 0.012, + "epoch": 0.23, + "learning_rate": 0.00026612197075542854, + "loss": 0.0321, "step": 87130 }, { - "epoch": 0.44, - "learning_rate": 0.00023405512307591404, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002661180825390571, + "loss": 0.0255, "step": 87140 }, { - "epoch": 0.44, - "learning_rate": 0.00023404755538290002, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002661141943226856, + "loss": 0.024, "step": 87150 }, { - "epoch": 0.44, - "learning_rate": 0.00023403998768988603, - "loss": 0.0223, + "epoch": 0.23, + "learning_rate": 0.0002661103061063142, + "loss": 0.0217, "step": 87160 }, { - "epoch": 0.44, - "learning_rate": 0.000234032419996872, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.0002661064178899427, + "loss": 0.025, "step": 87170 }, { - "epoch": 0.44, - "learning_rate": 0.000234024852303858, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.0002661025296735713, + "loss": 0.0264, "step": 87180 }, { - "epoch": 0.44, - "learning_rate": 0.000234017284610844, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.0002660986414571998, + "loss": 0.0302, "step": 87190 }, { - "epoch": 0.44, - "learning_rate": 0.00023400971691782998, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002660947532408283, + "loss": 0.0263, "step": 87200 }, { - "epoch": 0.44, - "learning_rate": 0.00023400214922481596, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.00026609086502445687, + "loss": 0.0264, "step": 87210 }, { - "epoch": 0.44, - "learning_rate": 0.00023399458153180197, - "loss": 0.02, + "epoch": 0.23, + "learning_rate": 0.0002660869768080854, + "loss": 0.0297, "step": 87220 }, { - "epoch": 0.44, - "learning_rate": 0.00023398701383878795, - "loss": 0.0151, + "epoch": 0.23, + "learning_rate": 0.00026608308859171395, + "loss": 0.0233, "step": 87230 }, { - "epoch": 0.44, - "learning_rate": 0.00023397944614577393, - "loss": 0.0207, + "epoch": 0.23, + "learning_rate": 0.00026607920037534247, + "loss": 0.0222, "step": 87240 }, { - "epoch": 0.44, - "learning_rate": 0.00023397187845275994, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.000266075312158971, + "loss": 0.0302, "step": 87250 }, { - "epoch": 0.44, - "learning_rate": 0.00023396431075974592, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026607142394259955, + "loss": 0.0211, "step": 87260 }, { - "epoch": 0.44, - "learning_rate": 0.0002339567430667319, - "loss": 0.021, + "epoch": 0.23, + "learning_rate": 0.00026606753572622807, + "loss": 0.0216, "step": 87270 }, { - "epoch": 0.44, - "learning_rate": 0.00023394917537371791, - "loss": 0.0132, + "epoch": 0.23, + "learning_rate": 0.0002660636475098566, + "loss": 0.0228, "step": 87280 }, { - "epoch": 0.44, - "learning_rate": 0.0002339416076807039, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.00026605975929348515, + "loss": 0.0228, "step": 87290 }, { - "epoch": 0.44, - "learning_rate": 0.00023393403998768988, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.00026605587107711367, + "loss": 0.0226, "step": 87300 }, { - "epoch": 0.44, - "learning_rate": 0.00023392647229467586, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026605198286074223, + "loss": 0.0197, "step": 87310 }, { - "epoch": 0.44, - "learning_rate": 0.00023391890460166187, - "loss": 0.0159, + "epoch": 0.23, + "learning_rate": 0.00026604809464437075, + "loss": 0.0256, "step": 87320 }, { - "epoch": 0.44, - "learning_rate": 0.00023391133690864785, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026604420642799926, + "loss": 0.0252, "step": 87330 }, { - "epoch": 0.44, - "learning_rate": 0.00023390376921563383, - "loss": 0.0198, + "epoch": 0.23, + "learning_rate": 0.0002660403182116278, + "loss": 0.0274, "step": 87340 }, { - "epoch": 0.44, - "learning_rate": 0.00023389620152261984, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026603642999525635, + "loss": 0.0263, "step": 87350 }, { - "epoch": 0.44, - "learning_rate": 0.0002338886338296058, - "loss": 0.0222, + "epoch": 0.23, + "learning_rate": 0.0002660325417788849, + "loss": 0.0255, "step": 87360 }, { - "epoch": 0.44, - "learning_rate": 0.00023388106613659177, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026602865356251343, + "loss": 0.0268, "step": 87370 }, { - "epoch": 0.44, - "learning_rate": 0.00023387349844357776, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.00026602476534614194, + "loss": 0.0247, "step": 87380 }, { - "epoch": 0.44, - "learning_rate": 0.00023386593075056376, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.0002660208771297705, + "loss": 0.0262, "step": 87390 }, { - "epoch": 0.44, - "learning_rate": 0.00023385836305754975, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026601698891339903, + "loss": 0.0247, "step": 87400 }, { - "epoch": 0.44, - "learning_rate": 0.00023385079536453573, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026601310069702754, + "loss": 0.0249, "step": 87410 }, { - "epoch": 0.44, - "learning_rate": 0.00023384322767152174, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.0002660092124806561, + "loss": 0.0328, "step": 87420 }, { - "epoch": 0.44, - "learning_rate": 0.00023383565997850772, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002660053242642846, + "loss": 0.0305, "step": 87430 }, { - "epoch": 0.44, - "learning_rate": 0.0002338280922854937, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.0002660014360479132, + "loss": 0.0216, "step": 87440 }, { - "epoch": 0.44, - "learning_rate": 0.0002338205245924797, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.0002659975478315417, + "loss": 0.02, "step": 87450 }, { - "epoch": 0.44, - "learning_rate": 0.0002338129568994657, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.0002659936596151702, + "loss": 0.0247, "step": 87460 }, { - "epoch": 0.44, - "learning_rate": 0.00023380538920645167, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002659897713987988, + "loss": 0.031, "step": 87470 }, { - "epoch": 0.44, - "learning_rate": 0.00023379782151343768, - "loss": 0.0149, + "epoch": 0.23, + "learning_rate": 0.0002659858831824273, + "loss": 0.0235, "step": 87480 }, { - "epoch": 0.44, - "learning_rate": 0.00023379025382042366, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.0002659819949660558, + "loss": 0.0243, "step": 87490 }, { - "epoch": 0.44, - "learning_rate": 0.00023378268612740964, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002659781067496844, + "loss": 0.0237, "step": 87500 }, { - "epoch": 0.44, - "learning_rate": 0.00023377511843439565, - "loss": 0.0138, + "epoch": 0.23, + "learning_rate": 0.00026597421853331296, + "loss": 0.0248, "step": 87510 }, { - "epoch": 0.44, - "learning_rate": 0.00023376755074138163, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026597033031694147, + "loss": 0.0258, "step": 87520 }, { - "epoch": 0.44, - "learning_rate": 0.0002337599830483676, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.00026596644210057, + "loss": 0.0231, "step": 87530 }, { - "epoch": 0.44, - "learning_rate": 0.0002337524153553536, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002659625538841985, + "loss": 0.0214, "step": 87540 }, { - "epoch": 0.44, - "learning_rate": 0.0002337448476623396, - "loss": 0.0217, + "epoch": 0.23, + "learning_rate": 0.00026595866566782707, + "loss": 0.0255, "step": 87550 }, { - "epoch": 0.44, - "learning_rate": 0.00023373727996932558, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.0002659547774514556, + "loss": 0.0251, "step": 87560 }, { - "epoch": 0.44, - "learning_rate": 0.00023372971227631157, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.00026595088923508415, + "loss": 0.0335, "step": 87570 }, { - "epoch": 0.44, - "learning_rate": 0.00023372214458329757, - "loss": 0.02, + "epoch": 0.23, + "learning_rate": 0.00026594700101871267, + "loss": 0.0243, "step": 87580 }, { - "epoch": 0.44, - "learning_rate": 0.00023371457689028356, - "loss": 0.0147, + "epoch": 0.23, + "learning_rate": 0.0002659431128023412, + "loss": 0.019, "step": 87590 }, { - "epoch": 0.44, - "learning_rate": 0.00023370700919726954, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.00026593922458596975, + "loss": 0.0243, "step": 87600 }, { - "epoch": 0.44, - "learning_rate": 0.00023369944150425555, - "loss": 0.0147, + "epoch": 0.23, + "learning_rate": 0.00026593533636959827, + "loss": 0.0281, "step": 87610 }, { - "epoch": 0.44, - "learning_rate": 0.00023369187381124153, - "loss": 0.0226, + "epoch": 0.23, + "learning_rate": 0.0002659314481532268, + "loss": 0.0213, "step": 87620 }, { - "epoch": 0.44, - "learning_rate": 0.0002336843061182275, - "loss": 0.0209, + "epoch": 0.23, + "learning_rate": 0.00026592755993685535, + "loss": 0.0245, "step": 87630 }, { - "epoch": 0.44, - "learning_rate": 0.00023367673842521352, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.00026592367172048386, + "loss": 0.0185, "step": 87640 }, { - "epoch": 0.44, - "learning_rate": 0.0002336691707321995, - "loss": 0.0218, + "epoch": 0.23, + "learning_rate": 0.00026591978350411243, + "loss": 0.0232, "step": 87650 }, { - "epoch": 0.44, - "learning_rate": 0.00023366160303918548, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.00026591589528774095, + "loss": 0.0183, "step": 87660 }, { - "epoch": 0.44, - "learning_rate": 0.0002336540353461715, - "loss": 0.0139, + "epoch": 0.23, + "learning_rate": 0.00026591200707136946, + "loss": 0.0258, "step": 87670 }, { - "epoch": 0.44, - "learning_rate": 0.00023364646765315747, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.00026590811885499803, + "loss": 0.0211, "step": 87680 }, { - "epoch": 0.44, - "learning_rate": 0.00023363889996014345, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.00026590423063862654, + "loss": 0.025, "step": 87690 }, { - "epoch": 0.44, - "learning_rate": 0.00023363133226712943, - "loss": 0.0135, + "epoch": 0.23, + "learning_rate": 0.00026590034242225506, + "loss": 0.0242, "step": 87700 }, { - "epoch": 0.44, - "learning_rate": 0.00023362376457411544, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026589645420588363, + "loss": 0.0207, "step": 87710 }, { - "epoch": 0.44, - "learning_rate": 0.00023361619688110142, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.0002658925659895122, + "loss": 0.0225, "step": 87720 }, { - "epoch": 0.44, - "learning_rate": 0.0002336086291880874, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002658886777731407, + "loss": 0.0244, "step": 87730 }, { - "epoch": 0.44, - "learning_rate": 0.0002336010614950734, - "loss": 0.0213, + "epoch": 0.23, + "learning_rate": 0.0002658847895567692, + "loss": 0.0228, "step": 87740 }, { - "epoch": 0.44, - "learning_rate": 0.0002335934938020594, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.00026588090134039774, + "loss": 0.0259, "step": 87750 }, { - "epoch": 0.44, - "learning_rate": 0.00023358592610904538, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.0002658770131240263, + "loss": 0.0217, "step": 87760 }, { - "epoch": 0.44, - "learning_rate": 0.00023357835841603138, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002658731249076548, + "loss": 0.02, "step": 87770 }, { - "epoch": 0.44, - "learning_rate": 0.00023357079072301737, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002658692366912834, + "loss": 0.0208, "step": 87780 }, { - "epoch": 0.44, - "learning_rate": 0.00023356322303000335, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.0002658653484749119, + "loss": 0.0268, "step": 87790 }, { - "epoch": 0.44, - "learning_rate": 0.00023355565533698936, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.0002658614602585405, + "loss": 0.0224, "step": 87800 }, { - "epoch": 0.44, - "learning_rate": 0.00023354808764397534, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.000265857572042169, + "loss": 0.0203, "step": 87810 }, { - "epoch": 0.44, - "learning_rate": 0.00023354051995096132, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.0002658536838257975, + "loss": 0.0258, "step": 87820 }, { - "epoch": 0.44, - "learning_rate": 0.00023353295225794733, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.000265849795609426, + "loss": 0.0247, "step": 87830 }, { - "epoch": 0.44, - "learning_rate": 0.0002335253845649333, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002658459073930546, + "loss": 0.026, "step": 87840 }, { - "epoch": 0.44, - "learning_rate": 0.0002335178168719193, - "loss": 0.0151, + "epoch": 0.23, + "learning_rate": 0.0002658420191766831, + "loss": 0.0189, "step": 87850 }, { - "epoch": 0.44, - "learning_rate": 0.00023351024917890527, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.00026583813096031167, + "loss": 0.026, "step": 87860 }, { - "epoch": 0.44, - "learning_rate": 0.00023350268148589128, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.0002658342427439402, + "loss": 0.0228, "step": 87870 }, { - "epoch": 0.44, - "learning_rate": 0.00023349511379287726, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.0002658303545275687, + "loss": 0.025, "step": 87880 }, { - "epoch": 0.44, - "learning_rate": 0.00023348754609986324, - "loss": 0.0159, + "epoch": 0.23, + "learning_rate": 0.00026582646631119727, + "loss": 0.0237, "step": 87890 }, { - "epoch": 0.44, - "learning_rate": 0.00023347997840684925, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002658225780948258, + "loss": 0.0246, "step": 87900 }, { - "epoch": 0.44, - "learning_rate": 0.00023347241071383523, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026581868987845435, + "loss": 0.0247, "step": 87910 }, { - "epoch": 0.44, - "learning_rate": 0.00023346484302082121, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.00026581480166208287, + "loss": 0.0216, "step": 87920 }, { - "epoch": 0.44, - "learning_rate": 0.00023345727532780722, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026581091344571144, + "loss": 0.0244, "step": 87930 }, { - "epoch": 0.44, - "learning_rate": 0.0002334497076347932, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026580702522933995, + "loss": 0.0251, "step": 87940 }, { - "epoch": 0.44, - "learning_rate": 0.00023344213994177919, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.00026580313701296846, + "loss": 0.038, "step": 87950 }, { - "epoch": 0.44, - "learning_rate": 0.0002334345722487652, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.000265799248796597, + "loss": 0.0268, "step": 87960 }, { - "epoch": 0.44, - "learning_rate": 0.00023342700455575118, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.00026579536058022555, + "loss": 0.0212, "step": 87970 }, { - "epoch": 0.44, - "learning_rate": 0.00023341943686273716, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026579147236385406, + "loss": 0.0237, "step": 87980 }, { - "epoch": 0.44, - "learning_rate": 0.00023341186916972317, - "loss": 0.0205, + "epoch": 0.23, + "learning_rate": 0.00026578758414748263, + "loss": 0.025, "step": 87990 }, { - "epoch": 0.44, - "learning_rate": 0.00023340430147670915, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.00026578369593111115, + "loss": 0.0223, "step": 88000 }, { - "epoch": 0.44, - "eval_cer": 0.9145042197675514, - "eval_loss": 0.011925076134502888, - "eval_runtime": 116.6489, - "eval_samples_per_second": 17.145, - "eval_steps_per_second": 4.286, + "epoch": 0.23, + "eval_cer": 0.8818174565517705, + "eval_loss": 0.016908327117562294, + "eval_runtime": 107.5726, + "eval_samples_per_second": 18.592, + "eval_steps_per_second": 4.648, "step": 88000 }, { - "epoch": 0.44, - "learning_rate": 0.00023339673378369513, - "loss": 0.0132, + "epoch": 0.23, + "learning_rate": 0.0002657798077147397, + "loss": 0.0258, "step": 88010 }, { - "epoch": 0.44, - "learning_rate": 0.00023338916609068114, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.00026577591949836823, + "loss": 0.0243, "step": 88020 }, { - "epoch": 0.44, - "learning_rate": 0.00023338159839766712, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.00026577203128199674, + "loss": 0.0249, "step": 88030 }, { - "epoch": 0.44, - "learning_rate": 0.0002333740307046531, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.00026576814306562526, + "loss": 0.0247, "step": 88040 }, { - "epoch": 0.44, - "learning_rate": 0.00023336646301163908, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.0002657642548492538, + "loss": 0.0197, "step": 88050 }, { - "epoch": 0.44, - "learning_rate": 0.0002333588953186251, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002657603666328824, + "loss": 0.0195, "step": 88060 }, { - "epoch": 0.44, - "learning_rate": 0.00023335132762561107, - "loss": 0.0207, + "epoch": 0.23, + "learning_rate": 0.0002657564784165109, + "loss": 0.0263, "step": 88070 }, { - "epoch": 0.44, - "learning_rate": 0.00023334375993259705, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.0002657525902001394, + "loss": 0.0211, "step": 88080 }, { - "epoch": 0.44, - "learning_rate": 0.00023333619223958306, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.00026574870198376794, + "loss": 0.0204, "step": 88090 }, { - "epoch": 0.44, - "learning_rate": 0.00023332862454656904, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002657448137673965, + "loss": 0.0286, "step": 88100 }, { - "epoch": 0.44, - "learning_rate": 0.00023332105685355502, - "loss": 0.0205, + "epoch": 0.23, + "learning_rate": 0.000265740925551025, + "loss": 0.0279, "step": 88110 }, { - "epoch": 0.44, - "learning_rate": 0.00023331348916054103, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002657370373346536, + "loss": 0.0252, "step": 88120 }, { - "epoch": 0.44, - "learning_rate": 0.00023330592146752701, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.0002657331491182821, + "loss": 0.0224, "step": 88130 }, { - "epoch": 0.44, - "learning_rate": 0.000233298353774513, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002657292609019107, + "loss": 0.0267, "step": 88140 }, { - "epoch": 0.44, - "learning_rate": 0.000233290786081499, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002657253726855392, + "loss": 0.0192, "step": 88150 }, { - "epoch": 0.44, - "learning_rate": 0.00023328321838848499, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.0002657214844691677, + "loss": 0.0229, "step": 88160 }, { - "epoch": 0.44, - "learning_rate": 0.00023327565069547097, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.0002657175962527962, + "loss": 0.0232, "step": 88170 }, { - "epoch": 0.44, - "learning_rate": 0.00023326808300245698, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.0002657137080364248, + "loss": 0.0207, "step": 88180 }, { - "epoch": 0.44, - "learning_rate": 0.00023326051530944296, - "loss": 0.0132, + "epoch": 0.23, + "learning_rate": 0.0002657098198200533, + "loss": 0.024, "step": 88190 }, { - "epoch": 0.44, - "learning_rate": 0.00023325294761642894, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026570593160368187, + "loss": 0.0221, "step": 88200 }, { - "epoch": 0.45, - "learning_rate": 0.00023324537992341492, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.0002657020433873104, + "loss": 0.02, "step": 88210 }, { - "epoch": 0.45, - "learning_rate": 0.00023323781223040093, - "loss": 0.0136, + "epoch": 0.23, + "learning_rate": 0.00026569815517093895, + "loss": 0.0225, "step": 88220 }, { - "epoch": 0.45, - "learning_rate": 0.0002332302445373869, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026569426695456747, + "loss": 0.0172, "step": 88230 }, { - "epoch": 0.45, - "learning_rate": 0.0002332226768443729, - "loss": 0.0184, + "epoch": 0.23, + "learning_rate": 0.000265690378738196, + "loss": 0.0252, "step": 88240 }, { - "epoch": 0.45, - "learning_rate": 0.0002332151091513589, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.00026568649052182455, + "loss": 0.0227, "step": 88250 }, { - "epoch": 0.45, - "learning_rate": 0.00023320754145834488, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.00026568260230545307, + "loss": 0.017, "step": 88260 }, { - "epoch": 0.45, - "learning_rate": 0.00023319997376533086, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026567871408908163, + "loss": 0.0235, "step": 88270 }, { - "epoch": 0.45, - "learning_rate": 0.00023319240607231687, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026567482587271015, + "loss": 0.0203, "step": 88280 }, { - "epoch": 0.45, - "learning_rate": 0.00023318483837930285, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.00026567093765633866, + "loss": 0.026, "step": 88290 }, { - "epoch": 0.45, - "learning_rate": 0.00023317727068628883, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.00026566704943996723, + "loss": 0.0215, "step": 88300 }, { - "epoch": 0.45, - "learning_rate": 0.00023316970299327484, - "loss": 0.0203, + "epoch": 0.23, + "learning_rate": 0.00026566316122359575, + "loss": 0.025, "step": 88310 }, { - "epoch": 0.45, - "learning_rate": 0.00023316213530026082, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.00026565927300722426, + "loss": 0.0221, "step": 88320 }, { - "epoch": 0.45, - "learning_rate": 0.0002331545676072468, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026565538479085283, + "loss": 0.02, "step": 88330 }, { - "epoch": 0.45, - "learning_rate": 0.00023314699991423281, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.00026565149657448134, + "loss": 0.0222, "step": 88340 }, { - "epoch": 0.45, - "learning_rate": 0.0002331394322212188, - "loss": 0.0159, + "epoch": 0.23, + "learning_rate": 0.0002656476083581099, + "loss": 0.0228, "step": 88350 }, { - "epoch": 0.45, - "learning_rate": 0.00023313186452820478, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026564372014173843, + "loss": 0.0211, "step": 88360 }, { - "epoch": 0.45, - "learning_rate": 0.00023312429683519076, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.00026563983192536694, + "loss": 0.0244, "step": 88370 }, { - "epoch": 0.45, - "learning_rate": 0.00023311672914217677, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026563594370899546, + "loss": 0.0256, "step": 88380 }, { - "epoch": 0.45, - "learning_rate": 0.00023310916144916275, - "loss": 0.0198, + "epoch": 0.23, + "learning_rate": 0.000265632055492624, + "loss": 0.0229, "step": 88390 }, { - "epoch": 0.45, - "learning_rate": 0.00023310159375614873, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.0002656281672762526, + "loss": 0.025, "step": 88400 }, { - "epoch": 0.45, - "learning_rate": 0.00023309402606313474, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002656242790598811, + "loss": 0.0193, "step": 88410 }, { - "epoch": 0.45, - "learning_rate": 0.00023308645837012072, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.0002656203908435096, + "loss": 0.0205, "step": 88420 }, { - "epoch": 0.45, - "learning_rate": 0.0002330788906771067, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.0002656165026271382, + "loss": 0.0235, "step": 88430 }, { - "epoch": 0.45, - "learning_rate": 0.0002330713229840927, - "loss": 0.0205, + "epoch": 0.23, + "learning_rate": 0.0002656126144107667, + "loss": 0.0248, "step": 88440 }, { - "epoch": 0.45, - "learning_rate": 0.0002330637552910787, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.0002656087261943952, + "loss": 0.0188, "step": 88450 }, { - "epoch": 0.45, - "learning_rate": 0.00023305618759806467, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.0002656048379780238, + "loss": 0.0269, "step": 88460 }, { - "epoch": 0.45, - "learning_rate": 0.00023304861990505068, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.0002656009497616523, + "loss": 0.023, "step": 88470 }, { - "epoch": 0.45, - "learning_rate": 0.00023304105221203666, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002655970615452809, + "loss": 0.0264, "step": 88480 }, { - "epoch": 0.45, - "learning_rate": 0.00023303348451902264, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002655931733289094, + "loss": 0.0214, "step": 88490 }, { - "epoch": 0.45, - "learning_rate": 0.00023302591682600865, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.0002655892851125379, + "loss": 0.0237, "step": 88500 }, { - "epoch": 0.45, - "learning_rate": 0.00023301834913299463, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.00026558539689616647, + "loss": 0.0211, "step": 88510 }, { - "epoch": 0.45, - "learning_rate": 0.00023301078143998062, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.000265581508679795, + "loss": 0.0235, "step": 88520 }, { - "epoch": 0.45, - "learning_rate": 0.00023300321374696662, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002655776204634235, + "loss": 0.0257, "step": 88530 }, { - "epoch": 0.45, - "learning_rate": 0.0002329956460539526, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.00026557373224705207, + "loss": 0.0251, "step": 88540 }, { - "epoch": 0.45, - "learning_rate": 0.0002329880783609386, - "loss": 0.0197, + "epoch": 0.23, + "learning_rate": 0.00026556984403068064, + "loss": 0.0271, "step": 88550 }, { - "epoch": 0.45, - "learning_rate": 0.00023298051066792457, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.00026556595581430915, + "loss": 0.0292, "step": 88560 }, { - "epoch": 0.45, - "learning_rate": 0.00023297294297491058, - "loss": 0.0136, + "epoch": 0.23, + "learning_rate": 0.00026556206759793767, + "loss": 0.0197, "step": 88570 }, { - "epoch": 0.45, - "learning_rate": 0.00023296537528189656, - "loss": 0.0144, + "epoch": 0.23, + "learning_rate": 0.0002655581793815662, + "loss": 0.0228, "step": 88580 }, { - "epoch": 0.45, - "learning_rate": 0.00023295780758888254, - "loss": 0.0136, + "epoch": 0.23, + "learning_rate": 0.0002655542911651947, + "loss": 0.023, "step": 88590 }, { - "epoch": 0.45, - "learning_rate": 0.00023295023989586855, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.00026555040294882326, + "loss": 0.0259, "step": 88600 }, { - "epoch": 0.45, - "learning_rate": 0.00023294267220285453, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026554651473245183, + "loss": 0.0251, "step": 88610 }, { - "epoch": 0.45, - "learning_rate": 0.00023293510450984048, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026554262651608035, + "loss": 0.0218, "step": 88620 }, { - "epoch": 0.45, - "learning_rate": 0.00023292753681682647, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.00026553873829970886, + "loss": 0.0241, "step": 88630 }, { - "epoch": 0.45, - "learning_rate": 0.00023291996912381247, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026553485008333743, + "loss": 0.0239, "step": 88640 }, { - "epoch": 0.45, - "learning_rate": 0.00023291240143079846, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.00026553096186696595, + "loss": 0.0217, "step": 88650 }, { - "epoch": 0.45, - "learning_rate": 0.00023290483373778444, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.00026552707365059446, + "loss": 0.0206, "step": 88660 }, { - "epoch": 0.45, - "learning_rate": 0.00023289726604477045, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026552318543422303, + "loss": 0.0261, "step": 88670 }, { - "epoch": 0.45, - "learning_rate": 0.00023288969835175643, - "loss": 0.014, + "epoch": 0.23, + "learning_rate": 0.00026551929721785154, + "loss": 0.0253, "step": 88680 }, { - "epoch": 0.45, - "learning_rate": 0.0002328821306587424, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002655154090014801, + "loss": 0.0197, "step": 88690 }, { - "epoch": 0.45, - "learning_rate": 0.00023287456296572842, - "loss": 0.0229, + "epoch": 0.23, + "learning_rate": 0.0002655115207851086, + "loss": 0.0256, "step": 88700 }, { - "epoch": 0.45, - "learning_rate": 0.0002328669952727144, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026550763256873714, + "loss": 0.0227, "step": 88710 }, { - "epoch": 0.45, - "learning_rate": 0.00023285942757970038, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.0002655037443523657, + "loss": 0.021, "step": 88720 }, { - "epoch": 0.45, - "learning_rate": 0.0002328518598866864, - "loss": 0.0206, + "epoch": 0.23, + "learning_rate": 0.0002654998561359942, + "loss": 0.0266, "step": 88730 }, { - "epoch": 0.45, - "learning_rate": 0.00023284429219367237, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.00026549596791962274, + "loss": 0.0228, "step": 88740 }, { - "epoch": 0.45, - "learning_rate": 0.00023283672450065835, - "loss": 0.014, + "epoch": 0.23, + "learning_rate": 0.0002654920797032513, + "loss": 0.0268, "step": 88750 }, { - "epoch": 0.45, - "learning_rate": 0.00023282915680764433, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.0002654881914868799, + "loss": 0.0274, "step": 88760 }, { - "epoch": 0.45, - "learning_rate": 0.00023282158911463034, - "loss": 0.0184, + "epoch": 0.23, + "learning_rate": 0.0002654843032705084, + "loss": 0.0243, "step": 88770 }, { - "epoch": 0.45, - "learning_rate": 0.00023281402142161632, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.0002654804150541369, + "loss": 0.0223, "step": 88780 }, { - "epoch": 0.45, - "learning_rate": 0.0002328064537286023, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.0002654765268377654, + "loss": 0.0212, "step": 88790 }, { - "epoch": 0.45, - "learning_rate": 0.0002327988860355883, - "loss": 0.0208, + "epoch": 0.23, + "learning_rate": 0.000265472638621394, + "loss": 0.0233, "step": 88800 }, { - "epoch": 0.45, - "learning_rate": 0.0002327913183425743, - "loss": 0.0166, + "epoch": 0.23, + "learning_rate": 0.0002654687504050225, + "loss": 0.0243, "step": 88810 }, { - "epoch": 0.45, - "learning_rate": 0.00023278375064956028, - "loss": 0.0134, + "epoch": 0.23, + "learning_rate": 0.00026546486218865107, + "loss": 0.0226, "step": 88820 }, { - "epoch": 0.45, - "learning_rate": 0.00023277618295654628, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.0002654609739722796, + "loss": 0.0213, "step": 88830 }, { - "epoch": 0.45, - "learning_rate": 0.00023276861526353227, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002654570857559081, + "loss": 0.0223, "step": 88840 }, { - "epoch": 0.45, - "learning_rate": 0.00023276104757051825, - "loss": 0.0149, + "epoch": 0.23, + "learning_rate": 0.00026545319753953667, + "loss": 0.024, "step": 88850 }, { - "epoch": 0.45, - "learning_rate": 0.00023275347987750426, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002654493093231652, + "loss": 0.0198, "step": 88860 }, { - "epoch": 0.45, - "learning_rate": 0.00023274591218449024, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.0002654454211067937, + "loss": 0.0244, "step": 88870 }, { - "epoch": 0.45, - "learning_rate": 0.00023273834449147622, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.00026544153289042227, + "loss": 0.0219, "step": 88880 }, { - "epoch": 0.45, - "learning_rate": 0.00023273077679846223, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002654376446740508, + "loss": 0.0232, "step": 88890 }, { - "epoch": 0.45, - "learning_rate": 0.0002327232091054482, - "loss": 0.0216, + "epoch": 0.23, + "learning_rate": 0.00026543375645767935, + "loss": 0.0213, "step": 88900 }, { - "epoch": 0.45, - "learning_rate": 0.0002327156414124342, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.00026542986824130787, + "loss": 0.025, "step": 88910 }, { - "epoch": 0.45, - "learning_rate": 0.0002327080737194202, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002654259800249364, + "loss": 0.0254, "step": 88920 }, { - "epoch": 0.45, - "learning_rate": 0.00023270050602640618, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.00026542209180856495, + "loss": 0.0191, "step": 88930 }, { - "epoch": 0.45, - "learning_rate": 0.00023269293833339216, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.00026541820359219346, + "loss": 0.0238, "step": 88940 }, { - "epoch": 0.45, - "learning_rate": 0.00023268537064037814, - "loss": 0.023, + "epoch": 0.23, + "learning_rate": 0.00026541431537582203, + "loss": 0.0318, "step": 88950 }, { - "epoch": 0.45, - "learning_rate": 0.00023267780294736415, - "loss": 0.0185, + "epoch": 0.23, + "learning_rate": 0.00026541042715945055, + "loss": 0.03, "step": 88960 }, { - "epoch": 0.45, - "learning_rate": 0.00023267023525435013, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002654065389430791, + "loss": 0.0256, "step": 88970 }, { - "epoch": 0.45, - "learning_rate": 0.00023266266756133611, - "loss": 0.0144, + "epoch": 0.23, + "learning_rate": 0.00026540265072670763, + "loss": 0.0204, "step": 88980 }, { - "epoch": 0.45, - "learning_rate": 0.00023265509986832212, - "loss": 0.0162, + "epoch": 0.23, + "learning_rate": 0.00026539876251033614, + "loss": 0.0232, "step": 88990 }, { - "epoch": 0.45, - "learning_rate": 0.0002326475321753081, - "loss": 0.0146, + "epoch": 0.23, + "learning_rate": 0.00026539487429396466, + "loss": 0.0214, "step": 89000 }, { - "epoch": 0.45, - "eval_cer": 0.9144906342217957, - "eval_loss": 0.01203860528767109, - "eval_runtime": 116.6624, - "eval_samples_per_second": 17.143, - "eval_steps_per_second": 4.286, + "epoch": 0.23, + "eval_cer": 0.8818370514688489, + "eval_loss": 0.017352329567074776, + "eval_runtime": 107.8338, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, "step": 89000 }, { - "epoch": 0.45, - "learning_rate": 0.00023263996448229409, - "loss": 0.0206, + "epoch": 0.23, + "learning_rate": 0.00026539098607759323, + "loss": 0.0279, "step": 89010 }, { - "epoch": 0.45, - "learning_rate": 0.0002326323967892801, - "loss": 0.0151, + "epoch": 0.23, + "learning_rate": 0.00026538709786122174, + "loss": 0.0255, "step": 89020 }, { - "epoch": 0.45, - "learning_rate": 0.00023262482909626608, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002653832096448503, + "loss": 0.0242, "step": 89030 }, { - "epoch": 0.45, - "learning_rate": 0.00023261726140325206, - "loss": 0.0193, + "epoch": 0.23, + "learning_rate": 0.0002653793214284788, + "loss": 0.0247, "step": 89040 }, { - "epoch": 0.45, - "learning_rate": 0.00023260969371023807, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.0002653754332121074, + "loss": 0.0216, "step": 89050 }, { - "epoch": 0.45, - "learning_rate": 0.00023260212601722405, - "loss": 0.0126, + "epoch": 0.23, + "learning_rate": 0.0002653715449957359, + "loss": 0.0241, "step": 89060 }, { - "epoch": 0.45, - "learning_rate": 0.00023259455832421003, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.0002653676567793644, + "loss": 0.0189, "step": 89070 }, { - "epoch": 0.45, - "learning_rate": 0.00023258699063119604, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.00026536376856299294, + "loss": 0.028, "step": 89080 }, { - "epoch": 0.45, - "learning_rate": 0.00023257942293818202, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.0002653598803466215, + "loss": 0.0288, "step": 89090 }, { - "epoch": 0.45, - "learning_rate": 0.000232571855245168, - "loss": 0.0183, + "epoch": 0.23, + "learning_rate": 0.0002653559921302501, + "loss": 0.0241, "step": 89100 }, { - "epoch": 0.45, - "learning_rate": 0.00023256428755215398, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.0002653521039138786, + "loss": 0.0254, "step": 89110 }, { - "epoch": 0.45, - "learning_rate": 0.00023255671985914, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.0002653482156975071, + "loss": 0.0269, "step": 89120 }, { - "epoch": 0.45, - "learning_rate": 0.00023254915216612597, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.0002653443274811356, + "loss": 0.034, "step": 89130 }, { - "epoch": 0.45, - "learning_rate": 0.00023254158447311195, - "loss": 0.0146, + "epoch": 0.23, + "learning_rate": 0.0002653404392647642, + "loss": 0.0245, "step": 89140 }, { - "epoch": 0.45, - "learning_rate": 0.00023253401678009796, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.0002653365510483927, + "loss": 0.031, "step": 89150 }, { - "epoch": 0.45, - "learning_rate": 0.00023252644908708394, - "loss": 0.0179, + "epoch": 0.23, + "learning_rate": 0.00026533266283202127, + "loss": 0.0258, "step": 89160 }, { - "epoch": 0.45, - "learning_rate": 0.00023251888139406992, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.0002653287746156498, + "loss": 0.027, "step": 89170 }, { - "epoch": 0.45, - "learning_rate": 0.00023251131370105593, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.00026532488639927835, + "loss": 0.0232, "step": 89180 }, { - "epoch": 0.45, - "learning_rate": 0.00023250374600804191, - "loss": 0.0164, + "epoch": 0.23, + "learning_rate": 0.00026532099818290687, + "loss": 0.0256, "step": 89190 }, { - "epoch": 0.45, - "learning_rate": 0.0002324961783150279, - "loss": 0.0138, + "epoch": 0.23, + "learning_rate": 0.0002653171099665354, + "loss": 0.0192, "step": 89200 }, { - "epoch": 0.45, - "learning_rate": 0.0002324886106220139, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.0002653132217501639, + "loss": 0.0295, "step": 89210 }, { - "epoch": 0.45, - "learning_rate": 0.00023248104292899989, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026530933353379247, + "loss": 0.0272, "step": 89220 }, { - "epoch": 0.45, - "learning_rate": 0.00023247347523598587, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.000265305445317421, + "loss": 0.0266, "step": 89230 }, { - "epoch": 0.45, - "learning_rate": 0.00023246590754297188, - "loss": 0.0216, + "epoch": 0.23, + "learning_rate": 0.00026530155710104955, + "loss": 0.0196, "step": 89240 }, { - "epoch": 0.45, - "learning_rate": 0.00023245833984995786, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.00026529766888467806, + "loss": 0.0235, "step": 89250 }, { - "epoch": 0.45, - "learning_rate": 0.00023245077215694384, - "loss": 0.0187, + "epoch": 0.23, + "learning_rate": 0.00026529378066830663, + "loss": 0.0195, "step": 89260 }, { - "epoch": 0.45, - "learning_rate": 0.00023244320446392982, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026528989245193515, + "loss": 0.0224, "step": 89270 }, { - "epoch": 0.45, - "learning_rate": 0.00023243563677091583, - "loss": 0.0155, + "epoch": 0.23, + "learning_rate": 0.00026528600423556366, + "loss": 0.0279, "step": 89280 }, { - "epoch": 0.45, - "learning_rate": 0.0002324280690779018, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.0002652821160191922, + "loss": 0.0232, "step": 89290 }, { - "epoch": 0.45, - "learning_rate": 0.0002324205013848878, - "loss": 0.0177, + "epoch": 0.23, + "learning_rate": 0.00026527822780282075, + "loss": 0.0271, "step": 89300 }, { - "epoch": 0.45, - "learning_rate": 0.0002324129336918738, - "loss": 0.0223, + "epoch": 0.23, + "learning_rate": 0.0002652743395864493, + "loss": 0.0241, "step": 89310 }, { - "epoch": 0.45, - "learning_rate": 0.00023240536599885978, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026527045137007783, + "loss": 0.0247, "step": 89320 }, { - "epoch": 0.45, - "learning_rate": 0.00023239779830584576, - "loss": 0.0197, + "epoch": 0.23, + "learning_rate": 0.00026526656315370634, + "loss": 0.0229, "step": 89330 }, { - "epoch": 0.45, - "learning_rate": 0.00023239023061283177, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.00026526267493733486, + "loss": 0.0221, "step": 89340 }, { - "epoch": 0.45, - "learning_rate": 0.00023238266291981775, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002652587867209634, + "loss": 0.024, "step": 89350 }, { - "epoch": 0.45, - "learning_rate": 0.00023237509522680373, - "loss": 0.0146, + "epoch": 0.23, + "learning_rate": 0.00026525489850459194, + "loss": 0.0245, "step": 89360 }, { - "epoch": 0.45, - "learning_rate": 0.00023236752753378974, - "loss": 0.0138, + "epoch": 0.23, + "learning_rate": 0.0002652510102882205, + "loss": 0.0196, "step": 89370 }, { - "epoch": 0.45, - "learning_rate": 0.00023235995984077572, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.000265247122071849, + "loss": 0.0232, "step": 89380 }, { - "epoch": 0.45, - "learning_rate": 0.0002323523921477617, - "loss": 0.0192, + "epoch": 0.23, + "learning_rate": 0.0002652432338554776, + "loss": 0.0187, "step": 89390 }, { - "epoch": 0.45, - "learning_rate": 0.00023234482445474771, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.0002652393456391061, + "loss": 0.0218, "step": 89400 }, { - "epoch": 0.45, - "learning_rate": 0.0002323372567617337, - "loss": 0.0165, + "epoch": 0.23, + "learning_rate": 0.0002652354574227346, + "loss": 0.0266, "step": 89410 }, { - "epoch": 0.45, - "learning_rate": 0.00023232968906871968, - "loss": 0.016, + "epoch": 0.23, + "learning_rate": 0.00026523156920636314, + "loss": 0.0218, "step": 89420 }, { - "epoch": 0.45, - "learning_rate": 0.00023232212137570566, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002652276809899917, + "loss": 0.0229, "step": 89430 }, { - "epoch": 0.45, - "learning_rate": 0.00023231455368269167, - "loss": 0.0133, + "epoch": 0.23, + "learning_rate": 0.0002652237927736202, + "loss": 0.0211, "step": 89440 }, { - "epoch": 0.45, - "learning_rate": 0.00023230698598967765, - "loss": 0.0127, + "epoch": 0.23, + "learning_rate": 0.0002652199045572488, + "loss": 0.0227, "step": 89450 }, { - "epoch": 0.45, - "learning_rate": 0.00023229941829666363, - "loss": 0.0155, + "epoch": 0.23, + "learning_rate": 0.0002652160163408773, + "loss": 0.026, "step": 89460 }, { - "epoch": 0.45, - "learning_rate": 0.00023229185060364964, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.00026521212812450587, + "loss": 0.0218, "step": 89470 }, { - "epoch": 0.45, - "learning_rate": 0.00023228428291063562, - "loss": 0.0136, + "epoch": 0.23, + "learning_rate": 0.0002652082399081344, + "loss": 0.0222, "step": 89480 }, { - "epoch": 0.45, - "learning_rate": 0.0002322767152176216, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.0002652043516917629, + "loss": 0.0207, "step": 89490 }, { - "epoch": 0.45, - "learning_rate": 0.0002322691475246076, - "loss": 0.0151, + "epoch": 0.23, + "learning_rate": 0.00026520046347539147, + "loss": 0.0222, "step": 89500 }, { - "epoch": 0.45, - "learning_rate": 0.0002322615798315936, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.00026519657525902, + "loss": 0.0214, "step": 89510 }, { - "epoch": 0.45, - "learning_rate": 0.00023225401213857957, - "loss": 0.0214, + "epoch": 0.23, + "learning_rate": 0.00026519268704264855, + "loss": 0.0189, "step": 89520 }, { - "epoch": 0.45, - "learning_rate": 0.00023224644444556558, - "loss": 0.0207, + "epoch": 0.23, + "learning_rate": 0.00026518879882627707, + "loss": 0.0243, "step": 89530 }, { - "epoch": 0.45, - "learning_rate": 0.00023223887675255156, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002651849106099056, + "loss": 0.0208, "step": 89540 }, { - "epoch": 0.45, - "learning_rate": 0.00023223130905953754, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.00026518102239353415, + "loss": 0.0213, "step": 89550 }, { - "epoch": 0.45, - "learning_rate": 0.00023222374136652355, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.00026517713417716267, + "loss": 0.0214, "step": 89560 }, { - "epoch": 0.45, - "learning_rate": 0.00023221617367350953, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002651732459607912, + "loss": 0.0227, "step": 89570 }, { - "epoch": 0.45, - "learning_rate": 0.00023220860598049552, - "loss": 0.0153, + "epoch": 0.23, + "learning_rate": 0.00026516935774441975, + "loss": 0.0286, "step": 89580 }, { - "epoch": 0.45, - "learning_rate": 0.00023220103828748152, - "loss": 0.0172, + "epoch": 0.23, + "learning_rate": 0.00026516546952804826, + "loss": 0.0222, "step": 89590 }, { - "epoch": 0.45, - "learning_rate": 0.0002321934705944675, - "loss": 0.0229, + "epoch": 0.23, + "learning_rate": 0.00026516158131167683, + "loss": 0.028, "step": 89600 }, { - "epoch": 0.45, - "learning_rate": 0.0002321859029014535, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.00026515769309530535, + "loss": 0.0208, "step": 89610 }, { - "epoch": 0.45, - "learning_rate": 0.00023217833520843947, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.00026515380487893386, + "loss": 0.0227, "step": 89620 }, { - "epoch": 0.45, - "learning_rate": 0.00023217076751542548, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.0002651499166625624, + "loss": 0.02, "step": 89630 }, { - "epoch": 0.45, - "learning_rate": 0.00023216319982241146, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.00026514602844619094, + "loss": 0.024, "step": 89640 }, { - "epoch": 0.45, - "learning_rate": 0.00023215563212939744, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002651421402298195, + "loss": 0.0233, "step": 89650 }, { - "epoch": 0.45, - "learning_rate": 0.00023214806443638345, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.00026513825201344803, + "loss": 0.0219, "step": 89660 }, { - "epoch": 0.45, - "learning_rate": 0.00023214049674336943, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.00026513436379707654, + "loss": 0.0228, "step": 89670 }, { - "epoch": 0.45, - "learning_rate": 0.0002321329290503554, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.0002651304755807051, + "loss": 0.0218, "step": 89680 }, { - "epoch": 0.45, - "learning_rate": 0.00023212536135734142, - "loss": 0.0139, + "epoch": 0.23, + "learning_rate": 0.0002651265873643336, + "loss": 0.0248, "step": 89690 }, { - "epoch": 0.45, - "learning_rate": 0.0002321177936643274, - "loss": 0.0133, + "epoch": 0.23, + "learning_rate": 0.00026512269914796214, + "loss": 0.0289, "step": 89700 }, { - "epoch": 0.45, - "learning_rate": 0.00023211022597131338, - "loss": 0.0133, + "epoch": 0.23, + "learning_rate": 0.0002651188109315907, + "loss": 0.023, "step": 89710 }, { - "epoch": 0.45, - "learning_rate": 0.0002321026582782994, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.0002651149227152192, + "loss": 0.0194, "step": 89720 }, { - "epoch": 0.45, - "learning_rate": 0.00023209509058528537, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.0002651110344988478, + "loss": 0.0206, "step": 89730 }, { - "epoch": 0.45, - "learning_rate": 0.00023208752289227135, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.0002651071462824763, + "loss": 0.0258, "step": 89740 }, { - "epoch": 0.45, - "learning_rate": 0.00023207995519925736, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002651032580661048, + "loss": 0.0208, "step": 89750 }, { - "epoch": 0.45, - "learning_rate": 0.00023207238750624334, - "loss": 0.0197, + "epoch": 0.23, + "learning_rate": 0.0002650993698497334, + "loss": 0.0228, "step": 89760 }, { - "epoch": 0.45, - "learning_rate": 0.00023206481981322933, - "loss": 0.0126, + "epoch": 0.23, + "learning_rate": 0.0002650954816333619, + "loss": 0.0232, "step": 89770 }, { - "epoch": 0.45, - "learning_rate": 0.0002320572521202153, - "loss": 0.0146, + "epoch": 0.23, + "learning_rate": 0.0002650915934169904, + "loss": 0.0242, "step": 89780 }, { - "epoch": 0.45, - "learning_rate": 0.00023204968442720132, - "loss": 0.0126, + "epoch": 0.23, + "learning_rate": 0.000265087705200619, + "loss": 0.0218, "step": 89790 }, { - "epoch": 0.45, - "learning_rate": 0.0002320421167341873, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.00026508381698424756, + "loss": 0.0228, "step": 89800 }, { - "epoch": 0.45, - "learning_rate": 0.00023203454904117328, - "loss": 0.0147, + "epoch": 0.23, + "learning_rate": 0.00026507992876787607, + "loss": 0.0245, "step": 89810 }, { - "epoch": 0.45, - "learning_rate": 0.0002320269813481593, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002650760405515046, + "loss": 0.024, "step": 89820 }, { - "epoch": 0.45, - "learning_rate": 0.00023201941365514527, - "loss": 0.0202, + "epoch": 0.23, + "learning_rate": 0.0002650721523351331, + "loss": 0.0252, "step": 89830 }, { - "epoch": 0.45, - "learning_rate": 0.00023201184596213125, - "loss": 0.0135, + "epoch": 0.23, + "learning_rate": 0.0002650682641187616, + "loss": 0.0286, "step": 89840 }, { - "epoch": 0.45, - "learning_rate": 0.00023200427826911726, - "loss": 0.0138, + "epoch": 0.23, + "learning_rate": 0.0002650643759023902, + "loss": 0.0223, "step": 89850 }, { - "epoch": 0.45, - "learning_rate": 0.00023199671057610324, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.00026506048768601875, + "loss": 0.0191, "step": 89860 }, { - "epoch": 0.45, - "learning_rate": 0.0002319891428830892, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.00026505659946964727, + "loss": 0.0219, "step": 89870 }, { - "epoch": 0.45, - "learning_rate": 0.00023198157519007518, - "loss": 0.0149, + "epoch": 0.23, + "learning_rate": 0.0002650527112532758, + "loss": 0.0276, "step": 89880 }, { - "epoch": 0.45, - "learning_rate": 0.00023197400749706118, - "loss": 0.0162, + "epoch": 0.23, + "learning_rate": 0.00026504882303690435, + "loss": 0.0242, "step": 89890 }, { - "epoch": 0.45, - "learning_rate": 0.00023196643980404717, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.00026504493482053286, + "loss": 0.0239, "step": 89900 }, { - "epoch": 0.45, - "learning_rate": 0.00023195887211103315, - "loss": 0.0146, + "epoch": 0.23, + "learning_rate": 0.0002650410466041614, + "loss": 0.0223, "step": 89910 }, { - "epoch": 0.45, - "learning_rate": 0.00023195130441801916, - "loss": 0.0142, + "epoch": 0.23, + "learning_rate": 0.00026503715838778995, + "loss": 0.0198, "step": 89920 }, { - "epoch": 0.45, - "learning_rate": 0.00023194373672500514, - "loss": 0.0144, + "epoch": 0.23, + "learning_rate": 0.00026503327017141846, + "loss": 0.0223, "step": 89930 }, { - "epoch": 0.45, - "learning_rate": 0.00023193616903199112, - "loss": 0.0159, + "epoch": 0.23, + "learning_rate": 0.00026502938195504703, + "loss": 0.028, "step": 89940 }, { - "epoch": 0.45, - "learning_rate": 0.00023192860133897713, - "loss": 0.0333, + "epoch": 0.23, + "learning_rate": 0.00026502549373867555, + "loss": 0.0261, "step": 89950 }, { - "epoch": 0.45, - "learning_rate": 0.0002319210336459631, - "loss": 0.0643, + "epoch": 0.23, + "learning_rate": 0.00026502160552230406, + "loss": 0.0237, "step": 89960 }, { - "epoch": 0.45, - "learning_rate": 0.0002319134659529491, - "loss": 0.0249, + "epoch": 0.23, + "learning_rate": 0.00026501771730593263, + "loss": 0.025, "step": 89970 }, { - "epoch": 0.45, - "learning_rate": 0.0002319058982599351, - "loss": 0.0134, + "epoch": 0.23, + "learning_rate": 0.00026501382908956114, + "loss": 0.0226, "step": 89980 }, { - "epoch": 0.45, - "learning_rate": 0.00023189833056692108, - "loss": 0.0211, + "epoch": 0.23, + "learning_rate": 0.0002650099408731897, + "loss": 0.0293, "step": 89990 }, { - "epoch": 0.45, - "learning_rate": 0.00023189076287390706, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.0002650060526568182, + "loss": 0.0216, "step": 90000 }, { - "epoch": 0.45, - "eval_cer": 0.9144983973907989, - "eval_loss": 0.0122450590133667, - "eval_runtime": 116.807, - "eval_samples_per_second": 17.122, - "eval_steps_per_second": 4.281, + "epoch": 0.23, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.016553279012441635, + "eval_runtime": 107.9226, + "eval_samples_per_second": 18.532, + "eval_steps_per_second": 4.633, "step": 90000 }, { - "epoch": 0.45, - "learning_rate": 0.00023188319518089304, - "loss": 0.0216, + "epoch": 0.23, + "learning_rate": 0.0002650021644404468, + "loss": 0.0248, "step": 90010 }, { - "epoch": 0.45, - "learning_rate": 0.00023187562748787905, - "loss": 0.0186, + "epoch": 0.23, + "learning_rate": 0.0002649982762240753, + "loss": 0.0222, "step": 90020 }, { - "epoch": 0.45, - "learning_rate": 0.00023186805979486503, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.0002649943880077038, + "loss": 0.0301, "step": 90030 }, { - "epoch": 0.45, - "learning_rate": 0.00023186049210185101, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.00026499049979133234, + "loss": 0.0276, "step": 90040 }, { - "epoch": 0.45, - "learning_rate": 0.00023185292440883702, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.0002649866115749609, + "loss": 0.0208, "step": 90050 }, { - "epoch": 0.45, - "learning_rate": 0.000231845356715823, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.0002649827233585894, + "loss": 0.0272, "step": 90060 }, { - "epoch": 0.45, - "learning_rate": 0.00023183778902280899, - "loss": 0.0145, + "epoch": 0.23, + "learning_rate": 0.000264978835142218, + "loss": 0.025, "step": 90070 }, { - "epoch": 0.45, - "learning_rate": 0.000231830221329795, - "loss": 0.0184, + "epoch": 0.23, + "learning_rate": 0.0002649749469258465, + "loss": 0.0236, "step": 90080 }, { - "epoch": 0.45, - "learning_rate": 0.00023182265363678098, - "loss": 0.0175, + "epoch": 0.23, + "learning_rate": 0.000264971058709475, + "loss": 0.02, "step": 90090 }, { - "epoch": 0.45, - "learning_rate": 0.00023181508594376696, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.0002649671704931036, + "loss": 0.0234, "step": 90100 }, { - "epoch": 0.45, - "learning_rate": 0.00023180751825075297, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.0002649632822767321, + "loss": 0.0252, "step": 90110 }, { - "epoch": 0.45, - "learning_rate": 0.00023179995055773895, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.0002649593940603606, + "loss": 0.0217, "step": 90120 }, { - "epoch": 0.45, - "learning_rate": 0.00023179238286472493, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.0002649555058439892, + "loss": 0.0208, "step": 90130 }, { - "epoch": 0.45, - "learning_rate": 0.00023178481517171094, - "loss": 0.017, + "epoch": 0.23, + "learning_rate": 0.00026495161762761776, + "loss": 0.0267, "step": 90140 }, { - "epoch": 0.45, - "learning_rate": 0.00023177724747869692, - "loss": 0.0173, + "epoch": 0.23, + "learning_rate": 0.00026494772941124627, + "loss": 0.0237, "step": 90150 }, { - "epoch": 0.45, - "learning_rate": 0.0002317696797856829, - "loss": 0.0188, + "epoch": 0.23, + "learning_rate": 0.0002649438411948748, + "loss": 0.0224, "step": 90160 }, { - "epoch": 0.45, - "learning_rate": 0.00023176211209266888, - "loss": 0.0174, + "epoch": 0.23, + "learning_rate": 0.0002649399529785033, + "loss": 0.0245, "step": 90170 }, { - "epoch": 0.45, - "learning_rate": 0.0002317545443996549, - "loss": 0.0222, + "epoch": 0.23, + "learning_rate": 0.00026493606476213187, + "loss": 0.0193, "step": 90180 }, { - "epoch": 0.46, - "learning_rate": 0.00023174697670664087, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002649321765457604, + "loss": 0.0224, "step": 90190 }, { - "epoch": 0.46, - "learning_rate": 0.00023173940901362685, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.00026492828832938895, + "loss": 0.0214, "step": 90200 }, { - "epoch": 0.46, - "learning_rate": 0.00023173184132061286, - "loss": 0.0191, + "epoch": 0.23, + "learning_rate": 0.00026492440011301747, + "loss": 0.0257, "step": 90210 }, { - "epoch": 0.46, - "learning_rate": 0.00023172427362759884, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.00026492051189664603, + "loss": 0.0214, "step": 90220 }, { - "epoch": 0.46, - "learning_rate": 0.00023171670593458482, - "loss": 0.0176, + "epoch": 0.23, + "learning_rate": 0.00026491662368027455, + "loss": 0.0227, "step": 90230 }, { - "epoch": 0.46, - "learning_rate": 0.00023170913824157083, - "loss": 0.0167, + "epoch": 0.23, + "learning_rate": 0.00026491273546390306, + "loss": 0.0307, "step": 90240 }, { - "epoch": 0.46, - "learning_rate": 0.00023170157054855681, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.0002649088472475316, + "loss": 0.0233, "step": 90250 }, { - "epoch": 0.46, - "learning_rate": 0.0002316940028555428, - "loss": 0.0155, + "epoch": 0.23, + "learning_rate": 0.00026490495903116015, + "loss": 0.0292, "step": 90260 }, { - "epoch": 0.46, - "learning_rate": 0.0002316864351625288, - "loss": 0.0184, + "epoch": 0.23, + "learning_rate": 0.00026490107081478866, + "loss": 0.0223, "step": 90270 }, { - "epoch": 0.46, - "learning_rate": 0.00023167886746951479, - "loss": 0.019, + "epoch": 0.23, + "learning_rate": 0.00026489718259841723, + "loss": 0.0219, "step": 90280 }, { - "epoch": 0.46, - "learning_rate": 0.00023167129977650077, - "loss": 0.0158, + "epoch": 0.23, + "learning_rate": 0.00026489329438204574, + "loss": 0.0218, "step": 90290 }, { - "epoch": 0.46, - "learning_rate": 0.00023166373208348678, - "loss": 0.0136, + "epoch": 0.23, + "learning_rate": 0.0002648894061656743, + "loss": 0.0248, "step": 90300 }, { - "epoch": 0.46, - "learning_rate": 0.00023165616439047276, - "loss": 0.0182, + "epoch": 0.23, + "learning_rate": 0.00026488551794930283, + "loss": 0.0229, "step": 90310 }, { - "epoch": 0.46, - "learning_rate": 0.00023164859669745874, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.00026488162973293134, + "loss": 0.0276, "step": 90320 }, { - "epoch": 0.46, - "learning_rate": 0.00023164102900444472, - "loss": 0.0161, + "epoch": 0.23, + "learning_rate": 0.00026487774151655986, + "loss": 0.0322, "step": 90330 }, { - "epoch": 0.46, - "learning_rate": 0.00023163346131143073, - "loss": 0.0169, + "epoch": 0.23, + "learning_rate": 0.0002648738533001884, + "loss": 0.025, "step": 90340 }, { - "epoch": 0.46, - "learning_rate": 0.0002316258936184167, - "loss": 0.0159, + "epoch": 0.23, + "learning_rate": 0.000264869965083817, + "loss": 0.0259, "step": 90350 }, { - "epoch": 0.46, - "learning_rate": 0.0002316183259254027, - "loss": 0.0181, + "epoch": 0.23, + "learning_rate": 0.0002648660768674455, + "loss": 0.0236, "step": 90360 }, { - "epoch": 0.46, - "learning_rate": 0.0002316107582323887, - "loss": 0.0152, + "epoch": 0.23, + "learning_rate": 0.000264862188651074, + "loss": 0.0214, "step": 90370 }, { - "epoch": 0.46, - "learning_rate": 0.00023160319053937468, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026485830043470254, + "loss": 0.0258, "step": 90380 }, { - "epoch": 0.46, - "learning_rate": 0.00023159562284636066, - "loss": 0.018, + "epoch": 0.23, + "learning_rate": 0.0002648544122183311, + "loss": 0.0252, "step": 90390 }, { - "epoch": 0.46, - "learning_rate": 0.00023158805515334667, - "loss": 0.0143, + "epoch": 0.23, + "learning_rate": 0.0002648505240019596, + "loss": 0.0248, "step": 90400 }, { - "epoch": 0.46, - "learning_rate": 0.00023158048746033265, - "loss": 0.0194, + "epoch": 0.23, + "learning_rate": 0.0002648466357855882, + "loss": 0.0182, "step": 90410 }, { - "epoch": 0.46, - "learning_rate": 0.00023157291976731863, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002648427475692167, + "loss": 0.0244, "step": 90420 }, { - "epoch": 0.46, - "learning_rate": 0.00023156535207430464, - "loss": 0.0149, + "epoch": 0.23, + "learning_rate": 0.0002648388593528453, + "loss": 0.0302, "step": 90430 }, { - "epoch": 0.46, - "learning_rate": 0.00023155778438129062, - "loss": 0.0148, + "epoch": 0.23, + "learning_rate": 0.0002648349711364738, + "loss": 0.0194, "step": 90440 }, { - "epoch": 0.46, - "learning_rate": 0.0002315502166882766, - "loss": 0.0171, + "epoch": 0.23, + "learning_rate": 0.0002648310829201023, + "loss": 0.0249, "step": 90450 }, { - "epoch": 0.46, - "learning_rate": 0.00023154264899526261, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002648271947037308, + "loss": 0.0208, "step": 90460 }, { - "epoch": 0.46, - "learning_rate": 0.0002315350813022486, - "loss": 0.0168, + "epoch": 0.23, + "learning_rate": 0.0002648233064873594, + "loss": 0.0227, "step": 90470 }, { - "epoch": 0.46, - "learning_rate": 0.00023152751360923458, - "loss": 0.0157, + "epoch": 0.23, + "learning_rate": 0.0002648194182709879, + "loss": 0.0315, "step": 90480 }, { - "epoch": 0.46, - "learning_rate": 0.00023151994591622059, - "loss": 0.0178, + "epoch": 0.23, + "learning_rate": 0.00026481553005461647, + "loss": 0.0255, "step": 90490 }, { - "epoch": 0.46, - "learning_rate": 0.00023151237822320657, - "loss": 0.013, + "epoch": 0.23, + "learning_rate": 0.000264811641838245, + "loss": 0.0182, "step": 90500 }, { - "epoch": 0.46, - "learning_rate": 0.00023150481053019255, - "loss": 0.0145, + "epoch": 0.23, + "learning_rate": 0.00026480775362187355, + "loss": 0.024, "step": 90510 }, { - "epoch": 0.46, - "learning_rate": 0.00023149724283717853, - "loss": 0.0141, + "epoch": 0.23, + "learning_rate": 0.00026480386540550207, + "loss": 0.0215, "step": 90520 }, { - "epoch": 0.46, - "learning_rate": 0.00023148967514416454, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.0002647999771891306, + "loss": 0.0251, "step": 90530 }, { - "epoch": 0.46, - "learning_rate": 0.00023148210745115052, - "loss": 0.0154, + "epoch": 0.23, + "learning_rate": 0.00026479608897275915, + "loss": 0.0241, "step": 90540 }, { - "epoch": 0.46, - "learning_rate": 0.0002314745397581365, - "loss": 0.0155, + "epoch": 0.23, + "learning_rate": 0.00026479220075638766, + "loss": 0.0233, "step": 90550 }, { - "epoch": 0.46, - "learning_rate": 0.0002314669720651225, - "loss": 0.0163, + "epoch": 0.23, + "learning_rate": 0.00026478831254001623, + "loss": 0.023, "step": 90560 }, { - "epoch": 0.46, - "learning_rate": 0.0002314594043721085, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026478442432364475, + "loss": 0.0267, "step": 90570 }, { - "epoch": 0.46, - "learning_rate": 0.00023145183667909447, - "loss": 0.014, + "epoch": 0.23, + "learning_rate": 0.00026478053610727326, + "loss": 0.0205, "step": 90580 }, { - "epoch": 0.46, - "learning_rate": 0.00023144426898608048, - "loss": 0.0141, + "epoch": 0.23, + "learning_rate": 0.0002647766478909018, + "loss": 0.0202, "step": 90590 }, { - "epoch": 0.46, - "learning_rate": 0.00023143670129306646, - "loss": 0.0144, + "epoch": 0.23, + "learning_rate": 0.00026477275967453035, + "loss": 0.0228, "step": 90600 }, { - "epoch": 0.46, - "learning_rate": 0.00023142913360005244, - "loss": 0.0135, + "epoch": 0.23, + "learning_rate": 0.00026476887145815886, + "loss": 0.0229, "step": 90610 }, { - "epoch": 0.46, - "learning_rate": 0.00023142156590703845, - "loss": 0.0189, + "epoch": 0.23, + "learning_rate": 0.00026476498324178743, + "loss": 0.0302, "step": 90620 }, { - "epoch": 0.46, - "learning_rate": 0.00023141399821402443, - "loss": 0.0156, + "epoch": 0.23, + "learning_rate": 0.00026476109502541594, + "loss": 0.0241, "step": 90630 }, { - "epoch": 0.46, - "learning_rate": 0.00023140643052101042, - "loss": 0.0198, + "epoch": 0.23, + "learning_rate": 0.0002647572068090445, + "loss": 0.0227, "step": 90640 }, { - "epoch": 0.46, - "learning_rate": 0.00023139886282799642, - "loss": 0.015, + "epoch": 0.23, + "learning_rate": 0.000264753318592673, + "loss": 0.024, "step": 90650 }, { - "epoch": 0.46, - "learning_rate": 0.0002313912951349824, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026474943037630154, + "loss": 0.0269, "step": 90660 }, { - "epoch": 0.46, - "learning_rate": 0.0002313837274419684, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.00026474554215993006, + "loss": 0.0262, "step": 90670 }, { - "epoch": 0.46, - "learning_rate": 0.00023137615974895437, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.0002647416539435586, + "loss": 0.0245, "step": 90680 }, { - "epoch": 0.46, - "learning_rate": 0.00023136859205594038, - "loss": 0.0194, + "epoch": 0.24, + "learning_rate": 0.0002647377657271872, + "loss": 0.0231, "step": 90690 }, { - "epoch": 0.46, - "learning_rate": 0.00023136102436292636, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.0002647338775108157, + "loss": 0.0242, "step": 90700 }, { - "epoch": 0.46, - "learning_rate": 0.00023135345666991234, - "loss": 0.0119, + "epoch": 0.24, + "learning_rate": 0.0002647299892944442, + "loss": 0.0248, "step": 90710 }, { - "epoch": 0.46, - "learning_rate": 0.00023134588897689835, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.0002647261010780728, + "loss": 0.0253, "step": 90720 }, { - "epoch": 0.46, - "learning_rate": 0.00023133832128388433, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.0002647222128617013, + "loss": 0.0251, "step": 90730 }, { - "epoch": 0.46, - "learning_rate": 0.0002313307535908703, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.0002647183246453298, + "loss": 0.0212, "step": 90740 }, { - "epoch": 0.46, - "learning_rate": 0.00023132318589785632, - "loss": 0.0151, + "epoch": 0.24, + "learning_rate": 0.0002647144364289584, + "loss": 0.0184, "step": 90750 }, { - "epoch": 0.46, - "learning_rate": 0.0002313156182048423, - "loss": 0.0207, + "epoch": 0.24, + "learning_rate": 0.0002647105482125869, + "loss": 0.0244, "step": 90760 }, { - "epoch": 0.46, - "learning_rate": 0.00023130805051182828, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026470665999621547, + "loss": 0.0194, "step": 90770 }, { - "epoch": 0.46, - "learning_rate": 0.0002313004828188143, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.000264702771779844, + "loss": 0.0215, "step": 90780 }, { - "epoch": 0.46, - "learning_rate": 0.00023129291512580027, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.0002646988835634725, + "loss": 0.021, "step": 90790 }, { - "epoch": 0.46, - "learning_rate": 0.00023128534743278625, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.00026469499534710107, + "loss": 0.0274, "step": 90800 }, { - "epoch": 0.46, - "learning_rate": 0.00023127777973977226, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002646911071307296, + "loss": 0.0228, "step": 90810 }, { - "epoch": 0.46, - "learning_rate": 0.00023127021204675824, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002646872189143581, + "loss": 0.0266, "step": 90820 }, { - "epoch": 0.46, - "learning_rate": 0.00023126264435374423, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026468333069798667, + "loss": 0.0224, "step": 90830 }, { - "epoch": 0.46, - "learning_rate": 0.0002312550766607302, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.0002646794424816152, + "loss": 0.0233, "step": 90840 }, { - "epoch": 0.46, - "learning_rate": 0.00023124750896771622, - "loss": 0.0134, + "epoch": 0.24, + "learning_rate": 0.00026467555426524375, + "loss": 0.0257, "step": 90850 }, { - "epoch": 0.46, - "learning_rate": 0.0002312399412747022, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.00026467166604887227, + "loss": 0.0223, "step": 90860 }, { - "epoch": 0.46, - "learning_rate": 0.00023123237358168818, - "loss": 0.0211, + "epoch": 0.24, + "learning_rate": 0.0002646677778325008, + "loss": 0.0226, "step": 90870 }, { - "epoch": 0.46, - "learning_rate": 0.0002312248058886742, - "loss": 0.0192, + "epoch": 0.24, + "learning_rate": 0.0002646638896161293, + "loss": 0.0302, "step": 90880 }, { - "epoch": 0.46, - "learning_rate": 0.00023121723819566017, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.00026466000139975786, + "loss": 0.0241, "step": 90890 }, { - "epoch": 0.46, - "learning_rate": 0.00023120967050264615, - "loss": 0.0156, + "epoch": 0.24, + "learning_rate": 0.00026465611318338643, + "loss": 0.0209, "step": 90900 }, { - "epoch": 0.46, - "learning_rate": 0.00023120210280963216, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026465222496701495, + "loss": 0.0247, "step": 90910 }, { - "epoch": 0.46, - "learning_rate": 0.00023119453511661814, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.00026464833675064346, + "loss": 0.0226, "step": 90920 }, { - "epoch": 0.46, - "learning_rate": 0.00023118696742360412, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.00026464444853427203, + "loss": 0.0227, "step": 90930 }, { - "epoch": 0.46, - "learning_rate": 0.00023117939973059013, - "loss": 0.0145, + "epoch": 0.24, + "learning_rate": 0.00026464056031790054, + "loss": 0.0215, "step": 90940 }, { - "epoch": 0.46, - "learning_rate": 0.0002311718320375761, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.00026463667210152906, + "loss": 0.0187, "step": 90950 }, { - "epoch": 0.46, - "learning_rate": 0.0002311642643445621, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.00026463278388515763, + "loss": 0.0236, "step": 90960 }, { - "epoch": 0.46, - "learning_rate": 0.0002311566966515481, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.00026462889566878614, + "loss": 0.0259, "step": 90970 }, { - "epoch": 0.46, - "learning_rate": 0.00023114912895853408, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002646250074524147, + "loss": 0.0225, "step": 90980 }, { - "epoch": 0.46, - "learning_rate": 0.00023114156126552006, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002646211192360432, + "loss": 0.0193, "step": 90990 }, { - "epoch": 0.46, - "learning_rate": 0.00023113399357250607, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026461723101967174, + "loss": 0.0276, "step": 91000 }, { - "epoch": 0.46, - "eval_cer": 0.9145022789753005, - "eval_loss": 0.01197886560112238, - "eval_runtime": 116.7595, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.24, + "eval_cer": 0.8817712685329425, + "eval_loss": 0.01665649563074112, + "eval_runtime": 107.8663, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, "step": 91000 }, { - "epoch": 0.46, - "learning_rate": 0.00023112642587949205, - "loss": 0.0226, + "epoch": 0.24, + "learning_rate": 0.0002646133428033003, + "loss": 0.0229, "step": 91010 }, { - "epoch": 0.46, - "learning_rate": 0.00023111885818647804, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.0002646094545869288, + "loss": 0.0249, "step": 91020 }, { - "epoch": 0.46, - "learning_rate": 0.00023111129049346402, - "loss": 0.0138, + "epoch": 0.24, + "learning_rate": 0.00026460556637055734, + "loss": 0.0241, "step": 91030 }, { - "epoch": 0.46, - "learning_rate": 0.00023110372280045003, - "loss": 0.0222, + "epoch": 0.24, + "learning_rate": 0.0002646016781541859, + "loss": 0.024, "step": 91040 }, { - "epoch": 0.46, - "learning_rate": 0.000231096155107436, - "loss": 0.0136, + "epoch": 0.24, + "learning_rate": 0.0002645977899378145, + "loss": 0.0218, "step": 91050 }, { - "epoch": 0.46, - "learning_rate": 0.000231088587414422, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.000264593901721443, + "loss": 0.0206, "step": 91060 }, { - "epoch": 0.46, - "learning_rate": 0.000231081019721408, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.0002645900135050715, + "loss": 0.0247, "step": 91070 }, { - "epoch": 0.46, - "learning_rate": 0.00023107345202839398, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002645861252887, + "loss": 0.027, "step": 91080 }, { - "epoch": 0.46, - "learning_rate": 0.00023106588433537996, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.0002645822370723286, + "loss": 0.0251, "step": 91090 }, { - "epoch": 0.46, - "learning_rate": 0.00023105831664236597, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.0002645783488559571, + "loss": 0.0222, "step": 91100 }, { - "epoch": 0.46, - "learning_rate": 0.00023105074894935195, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.00026457446063958567, + "loss": 0.0186, "step": 91110 }, { - "epoch": 0.46, - "learning_rate": 0.00023104318125633793, + "epoch": 0.24, + "learning_rate": 0.0002645705724232142, "loss": 0.0212, "step": 91120 }, { - "epoch": 0.46, - "learning_rate": 0.00023103561356332389, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002645666842068427, + "loss": 0.0225, "step": 91130 }, { - "epoch": 0.46, - "learning_rate": 0.0002310280458703099, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026456279599047127, + "loss": 0.0313, "step": 91140 }, { - "epoch": 0.46, - "learning_rate": 0.00023102047817729588, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.0002645589077740998, + "loss": 0.0237, "step": 91150 }, { - "epoch": 0.46, - "learning_rate": 0.00023101291048428186, - "loss": 0.014, + "epoch": 0.24, + "learning_rate": 0.0002645550195577283, + "loss": 0.0196, "step": 91160 }, { - "epoch": 0.46, - "learning_rate": 0.00023100534279126787, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.00026455113134135687, + "loss": 0.0213, "step": 91170 }, { - "epoch": 0.46, - "learning_rate": 0.00023099777509825385, - "loss": 0.019, + "epoch": 0.24, + "learning_rate": 0.00026454724312498544, + "loss": 0.0243, "step": 91180 }, { - "epoch": 0.46, - "learning_rate": 0.00023099020740523983, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.00026454335490861395, + "loss": 0.0213, "step": 91190 }, { - "epoch": 0.46, - "learning_rate": 0.00023098263971222584, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026453946669224246, + "loss": 0.0206, "step": 91200 }, { - "epoch": 0.46, - "learning_rate": 0.00023097507201921182, - "loss": 0.0221, + "epoch": 0.24, + "learning_rate": 0.000264535578475871, + "loss": 0.0234, "step": 91210 }, { - "epoch": 0.46, - "learning_rate": 0.0002309675043261978, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.00026453169025949955, + "loss": 0.0234, "step": 91220 }, { - "epoch": 0.46, - "learning_rate": 0.00023095993663318378, - "loss": 0.0129, + "epoch": 0.24, + "learning_rate": 0.00026452780204312806, + "loss": 0.0281, "step": 91230 }, { - "epoch": 0.46, - "learning_rate": 0.0002309523689401698, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.00026452391382675663, + "loss": 0.0243, "step": 91240 }, { - "epoch": 0.46, - "learning_rate": 0.00023094480124715577, - "loss": 0.0123, + "epoch": 0.24, + "learning_rate": 0.00026452002561038515, + "loss": 0.0278, "step": 91250 }, { - "epoch": 0.46, - "learning_rate": 0.00023093723355414175, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.0002645161373940137, + "loss": 0.0222, "step": 91260 }, { - "epoch": 0.46, - "learning_rate": 0.00023092966586112776, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026451224917764223, + "loss": 0.0227, "step": 91270 }, { - "epoch": 0.46, - "learning_rate": 0.00023092209816811374, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.00026450836096127074, + "loss": 0.0222, "step": 91280 }, { - "epoch": 0.46, - "learning_rate": 0.00023091453047509972, - "loss": 0.0165, + "epoch": 0.24, + "learning_rate": 0.00026450447274489926, + "loss": 0.0293, "step": 91290 }, { - "epoch": 0.46, - "learning_rate": 0.00023090696278208573, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.0002645005845285278, + "loss": 0.023, "step": 91300 }, { - "epoch": 0.46, - "learning_rate": 0.00023089939508907171, - "loss": 0.0194, + "epoch": 0.24, + "learning_rate": 0.00026449669631215634, + "loss": 0.0244, "step": 91310 }, { - "epoch": 0.46, - "learning_rate": 0.0002308918273960577, - "loss": 0.022, + "epoch": 0.24, + "learning_rate": 0.0002644928080957849, + "loss": 0.0232, "step": 91320 }, { - "epoch": 0.46, - "learning_rate": 0.0002308842597030437, - "loss": 0.0215, + "epoch": 0.24, + "learning_rate": 0.0002644889198794134, + "loss": 0.0254, "step": 91330 }, { - "epoch": 0.46, - "learning_rate": 0.00023087669201002969, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.00026448503166304194, + "loss": 0.0213, "step": 91340 }, { - "epoch": 0.46, - "learning_rate": 0.00023086912431701567, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002644811434466705, + "loss": 0.0227, "step": 91350 }, { - "epoch": 0.46, - "learning_rate": 0.00023086155662400168, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.000264477255230299, + "loss": 0.0255, "step": 91360 }, { - "epoch": 0.46, - "learning_rate": 0.00023085398893098766, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.00026447336701392754, + "loss": 0.0234, "step": 91370 }, { - "epoch": 0.46, - "learning_rate": 0.00023084642123797364, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002644694787975561, + "loss": 0.0234, "step": 91380 }, { - "epoch": 0.46, - "learning_rate": 0.00023083885354495965, - "loss": 0.0251, + "epoch": 0.24, + "learning_rate": 0.0002644655905811847, + "loss": 0.0242, "step": 91390 }, { - "epoch": 0.46, - "learning_rate": 0.00023083128585194563, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002644617023648132, + "loss": 0.0236, "step": 91400 }, { - "epoch": 0.46, - "learning_rate": 0.0002308237181589316, - "loss": 0.022, + "epoch": 0.24, + "learning_rate": 0.0002644578141484417, + "loss": 0.0179, "step": 91410 }, { - "epoch": 0.46, - "learning_rate": 0.0002308161504659176, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002644539259320702, + "loss": 0.0289, "step": 91420 }, { - "epoch": 0.46, - "learning_rate": 0.0002308085827729036, - "loss": 0.0198, + "epoch": 0.24, + "learning_rate": 0.0002644500377156988, + "loss": 0.0207, "step": 91430 }, { - "epoch": 0.46, - "learning_rate": 0.00023080101507988958, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.0002644461494993273, + "loss": 0.0259, "step": 91440 }, { - "epoch": 0.46, - "learning_rate": 0.00023079344738687556, - "loss": 0.0196, + "epoch": 0.24, + "learning_rate": 0.00026444226128295587, + "loss": 0.0192, "step": 91450 }, { - "epoch": 0.46, - "learning_rate": 0.00023078587969386157, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002644383730665844, + "loss": 0.0186, "step": 91460 }, { - "epoch": 0.46, - "learning_rate": 0.00023077831200084755, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.00026443448485021295, + "loss": 0.0195, "step": 91470 }, { - "epoch": 0.46, - "learning_rate": 0.00023077074430783353, - "loss": 0.0145, + "epoch": 0.24, + "learning_rate": 0.00026443059663384147, + "loss": 0.0201, "step": 91480 }, { - "epoch": 0.46, - "learning_rate": 0.00023076317661481954, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026442670841747, + "loss": 0.0207, "step": 91490 }, { - "epoch": 0.46, - "learning_rate": 0.00023075560892180552, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.0002644228202010985, + "loss": 0.0218, "step": 91500 }, { - "epoch": 0.46, - "learning_rate": 0.0002307480412287915, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026441893198472707, + "loss": 0.0231, "step": 91510 }, { - "epoch": 0.46, - "learning_rate": 0.00023074047353577751, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002644150437683556, + "loss": 0.0226, "step": 91520 }, { - "epoch": 0.46, - "learning_rate": 0.0002307329058427635, - "loss": 0.0138, + "epoch": 0.24, + "learning_rate": 0.00026441115555198415, + "loss": 0.022, "step": 91530 }, { - "epoch": 0.46, - "learning_rate": 0.00023072533814974948, - "loss": 0.0204, + "epoch": 0.24, + "learning_rate": 0.00026440726733561266, + "loss": 0.0249, "step": 91540 }, { - "epoch": 0.46, - "learning_rate": 0.00023071777045673549, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.00026440337911924123, + "loss": 0.0238, "step": 91550 }, { - "epoch": 0.46, - "learning_rate": 0.00023071020276372147, - "loss": 0.0135, + "epoch": 0.24, + "learning_rate": 0.00026439949090286975, + "loss": 0.0216, "step": 91560 }, { - "epoch": 0.46, - "learning_rate": 0.00023070263507070745, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.00026439560268649826, + "loss": 0.0273, "step": 91570 }, { - "epoch": 0.46, - "learning_rate": 0.00023069506737769343, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.00026439171447012683, + "loss": 0.0245, "step": 91580 }, { - "epoch": 0.46, - "learning_rate": 0.00023068749968467944, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.00026438782625375534, + "loss": 0.02, "step": 91590 }, { - "epoch": 0.46, - "learning_rate": 0.00023067993199166542, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.0002643839380373839, + "loss": 0.0192, "step": 91600 }, { - "epoch": 0.46, - "learning_rate": 0.0002306723642986514, - "loss": 0.0202, + "epoch": 0.24, + "learning_rate": 0.00026438004982101243, + "loss": 0.0261, "step": 91610 }, { - "epoch": 0.46, - "learning_rate": 0.0002306647966056374, - "loss": 0.0194, + "epoch": 0.24, + "learning_rate": 0.00026437616160464094, + "loss": 0.0234, "step": 91620 }, { - "epoch": 0.46, - "learning_rate": 0.0002306572289126234, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.00026437227338826946, + "loss": 0.0193, "step": 91630 }, { - "epoch": 0.46, - "learning_rate": 0.00023064966121960937, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.000264368385171898, + "loss": 0.0206, "step": 91640 }, { - "epoch": 0.46, - "learning_rate": 0.00023064209352659538, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026436449695552654, + "loss": 0.0219, "step": 91650 }, { - "epoch": 0.46, - "learning_rate": 0.00023063452583358136, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.0002643606087391551, + "loss": 0.0233, "step": 91660 }, { - "epoch": 0.46, - "learning_rate": 0.00023062695814056734, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002643567205227836, + "loss": 0.0254, "step": 91670 }, { - "epoch": 0.46, - "learning_rate": 0.00023061939044755335, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002643528323064122, + "loss": 0.0265, "step": 91680 }, { - "epoch": 0.46, - "learning_rate": 0.00023061182275453933, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002643489440900407, + "loss": 0.0223, "step": 91690 }, { - "epoch": 0.46, - "learning_rate": 0.00023060425506152532, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002643450558736692, + "loss": 0.0236, "step": 91700 }, { - "epoch": 0.46, - "learning_rate": 0.00023059668736851132, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.00026434116765729774, + "loss": 0.0263, "step": 91710 }, { - "epoch": 0.46, - "learning_rate": 0.0002305891196754973, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002643372794409263, + "loss": 0.0239, "step": 91720 }, { - "epoch": 0.46, - "learning_rate": 0.0002305815519824833, - "loss": 0.0165, + "epoch": 0.24, + "learning_rate": 0.0002643333912245549, + "loss": 0.0206, "step": 91730 }, { - "epoch": 0.46, - "learning_rate": 0.00023057398428946927, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002643295030081834, + "loss": 0.0224, "step": 91740 }, { - "epoch": 0.46, - "learning_rate": 0.00023056641659645528, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.0002643256147918119, + "loss": 0.0244, "step": 91750 }, { - "epoch": 0.46, - "learning_rate": 0.00023055884890344126, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.00026432172657544047, + "loss": 0.0227, "step": 91760 }, { - "epoch": 0.46, - "learning_rate": 0.00023055128121042724, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.000264317838359069, + "loss": 0.0255, "step": 91770 }, { - "epoch": 0.46, - "learning_rate": 0.00023054371351741325, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.0002643139501426975, + "loss": 0.0223, "step": 91780 }, { - "epoch": 0.46, - "learning_rate": 0.00023053614582439923, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.00026431006192632607, + "loss": 0.0219, "step": 91790 }, { - "epoch": 0.46, - "learning_rate": 0.0002305285781313852, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.0002643061737099546, + "loss": 0.0253, "step": 91800 }, { - "epoch": 0.46, - "learning_rate": 0.00023052101043837122, - "loss": 0.0141, + "epoch": 0.24, + "learning_rate": 0.00026430228549358315, + "loss": 0.0257, "step": 91810 }, { - "epoch": 0.46, - "learning_rate": 0.0002305134427453572, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.00026429839727721167, + "loss": 0.0213, "step": 91820 }, { - "epoch": 0.46, - "learning_rate": 0.00023050587505234318, - "loss": 0.0146, + "epoch": 0.24, + "learning_rate": 0.0002642945090608402, + "loss": 0.0212, "step": 91830 }, { - "epoch": 0.46, - "learning_rate": 0.0002304983073593292, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.0002642906208444687, + "loss": 0.022, "step": 91840 }, { - "epoch": 0.46, - "learning_rate": 0.00023049073966631517, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.00026428673262809726, + "loss": 0.0252, "step": 91850 }, { - "epoch": 0.46, - "learning_rate": 0.00023048317197330115, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.0002642828444117258, + "loss": 0.0264, "step": 91860 }, { - "epoch": 0.46, - "learning_rate": 0.00023047560428028716, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026427895619535435, + "loss": 0.0204, "step": 91870 }, { - "epoch": 0.46, - "learning_rate": 0.00023046803658727314, - "loss": 0.0133, + "epoch": 0.24, + "learning_rate": 0.00026427506797898286, + "loss": 0.0252, "step": 91880 }, { - "epoch": 0.46, - "learning_rate": 0.00023046046889425913, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026427117976261143, + "loss": 0.0242, "step": 91890 }, { - "epoch": 0.46, - "learning_rate": 0.00023045290120124513, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.00026426729154623995, + "loss": 0.0243, "step": 91900 }, { - "epoch": 0.46, - "learning_rate": 0.00023044533350823112, - "loss": 0.0262, + "epoch": 0.24, + "learning_rate": 0.00026426340332986846, + "loss": 0.0231, "step": 91910 }, { - "epoch": 0.46, - "learning_rate": 0.0002304377658152171, - "loss": 0.0167, + "epoch": 0.24, + "learning_rate": 0.000264259515113497, + "loss": 0.0237, "step": 91920 }, { - "epoch": 0.46, - "learning_rate": 0.00023043019812220308, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.00026425562689712554, + "loss": 0.0241, "step": 91930 }, { - "epoch": 0.46, - "learning_rate": 0.0002304226304291891, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.0002642517386807541, + "loss": 0.0211, "step": 91940 }, { - "epoch": 0.46, - "learning_rate": 0.00023041506273617507, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002642478504643826, + "loss": 0.0227, "step": 91950 }, { - "epoch": 0.46, - "learning_rate": 0.00023040749504316105, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.00026424396224801114, + "loss": 0.0242, "step": 91960 }, { - "epoch": 0.46, - "learning_rate": 0.00023039992735014706, - "loss": 0.0129, + "epoch": 0.24, + "learning_rate": 0.0002642400740316397, + "loss": 0.0209, "step": 91970 }, { - "epoch": 0.46, - "learning_rate": 0.00023039235965713304, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002642361858152682, + "loss": 0.025, "step": 91980 }, { - "epoch": 0.46, - "learning_rate": 0.00023038479196411902, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.00026423229759889674, + "loss": 0.0241, "step": 91990 }, { - "epoch": 0.46, - "learning_rate": 0.00023037722427110503, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.0002642284093825253, + "loss": 0.021, "step": 92000 }, { - "epoch": 0.46, - "eval_cer": 0.9144974269946735, - "eval_loss": 0.011690773069858551, - "eval_runtime": 116.7969, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.24, + "eval_cer": 0.881813257640968, + "eval_loss": 0.01661667600274086, + "eval_runtime": 108.0448, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, "step": 92000 }, { - "epoch": 0.46, - "learning_rate": 0.000230369656578091, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002642245211661538, + "loss": 0.023, "step": 92010 }, { - "epoch": 0.46, - "learning_rate": 0.000230362088885077, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002642206329497824, + "loss": 0.0262, "step": 92020 }, { - "epoch": 0.46, - "learning_rate": 0.000230354521192063, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.0002642167447334109, + "loss": 0.0172, "step": 92030 }, { - "epoch": 0.46, - "learning_rate": 0.00023034695349904898, - "loss": 0.0254, + "epoch": 0.24, + "learning_rate": 0.0002642128565170394, + "loss": 0.0251, "step": 92040 }, { - "epoch": 0.46, - "learning_rate": 0.00023033938580603496, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.00026420896830066793, + "loss": 0.0206, "step": 92050 }, { - "epoch": 0.46, - "learning_rate": 0.00023033181811302097, - "loss": 0.0218, + "epoch": 0.24, + "learning_rate": 0.0002642050800842965, + "loss": 0.0226, "step": 92060 }, { - "epoch": 0.46, - "learning_rate": 0.00023032425042000695, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.000264201191867925, + "loss": 0.0262, "step": 92070 }, { - "epoch": 0.46, - "learning_rate": 0.00023031668272699294, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002641973036515536, + "loss": 0.0224, "step": 92080 }, { - "epoch": 0.46, - "learning_rate": 0.00023030911503397892, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.0002641934154351821, + "loss": 0.0252, "step": 92090 }, { - "epoch": 0.46, - "learning_rate": 0.00023030154734096493, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026418952721881067, + "loss": 0.0276, "step": 92100 }, { - "epoch": 0.46, - "learning_rate": 0.0002302939796479509, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.0002641856390024392, + "loss": 0.0239, "step": 92110 }, { - "epoch": 0.46, - "learning_rate": 0.0002302864119549369, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.0002641817507860677, + "loss": 0.0231, "step": 92120 }, { - "epoch": 0.46, - "learning_rate": 0.0002302788442619229, - "loss": 0.019, + "epoch": 0.24, + "learning_rate": 0.00026417786256969627, + "loss": 0.029, "step": 92130 }, { - "epoch": 0.46, - "learning_rate": 0.00023027127656890888, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002641739743533248, + "loss": 0.0256, "step": 92140 }, { - "epoch": 0.46, - "learning_rate": 0.00023026370887589486, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.00026417008613695335, + "loss": 0.0206, "step": 92150 }, { - "epoch": 0.46, - "learning_rate": 0.00023025614118288087, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.00026416619792058187, + "loss": 0.0234, "step": 92160 }, { - "epoch": 0.47, - "learning_rate": 0.00023024857348986685, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002641623097042104, + "loss": 0.0239, "step": 92170 }, { - "epoch": 0.47, - "learning_rate": 0.00023024100579685283, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.00026415842148783895, + "loss": 0.0247, "step": 92180 }, { - "epoch": 0.47, - "learning_rate": 0.00023023343810383884, - "loss": 0.0141, + "epoch": 0.24, + "learning_rate": 0.00026415453327146746, + "loss": 0.028, "step": 92190 }, { - "epoch": 0.47, - "learning_rate": 0.00023022587041082482, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.000264150645055096, + "loss": 0.023, "step": 92200 }, { - "epoch": 0.47, - "learning_rate": 0.0002302183027178108, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026414675683872455, + "loss": 0.027, "step": 92210 }, { - "epoch": 0.47, - "learning_rate": 0.0002302107350247968, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026414286862235306, + "loss": 0.0219, "step": 92220 }, { - "epoch": 0.47, - "learning_rate": 0.0002302031673317828, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.00026413898040598163, + "loss": 0.0177, "step": 92230 }, { - "epoch": 0.47, - "learning_rate": 0.00023019559963876877, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.00026413509218961014, + "loss": 0.0214, "step": 92240 }, { - "epoch": 0.47, - "learning_rate": 0.00023018803194575476, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026413120397323866, + "loss": 0.0281, "step": 92250 }, { - "epoch": 0.47, - "learning_rate": 0.00023018046425274076, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026412731575686723, + "loss": 0.025, "step": 92260 }, { - "epoch": 0.47, - "learning_rate": 0.00023017289655972675, - "loss": 0.0177, + "epoch": 0.24, + "learning_rate": 0.00026412342754049574, + "loss": 0.0286, "step": 92270 }, { - "epoch": 0.47, - "learning_rate": 0.00023016532886671273, - "loss": 0.0205, + "epoch": 0.24, + "learning_rate": 0.0002641195393241243, + "loss": 0.0233, "step": 92280 }, { - "epoch": 0.47, - "learning_rate": 0.00023015776117369874, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002641156511077528, + "loss": 0.0201, "step": 92290 }, { - "epoch": 0.47, - "learning_rate": 0.00023015019348068472, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.00026411176289138134, + "loss": 0.0218, "step": 92300 }, { - "epoch": 0.47, - "learning_rate": 0.0002301426257876707, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.0002641078746750099, + "loss": 0.0286, "step": 92310 }, { - "epoch": 0.47, - "learning_rate": 0.0002301350580946567, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.0002641039864586384, + "loss": 0.0216, "step": 92320 }, { - "epoch": 0.47, - "learning_rate": 0.0002301274904016427, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026410009824226694, + "loss": 0.0227, "step": 92330 }, { - "epoch": 0.47, - "learning_rate": 0.00023011992270862867, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002640962100258955, + "loss": 0.0204, "step": 92340 }, { - "epoch": 0.47, - "learning_rate": 0.00023011235501561468, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.000264092321809524, + "loss": 0.0247, "step": 92350 }, { - "epoch": 0.47, - "learning_rate": 0.00023010478732260066, - "loss": 0.0132, + "epoch": 0.24, + "learning_rate": 0.0002640884335931526, + "loss": 0.0253, "step": 92360 }, { - "epoch": 0.47, - "learning_rate": 0.00023009721962958664, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.0002640845453767811, + "loss": 0.0197, "step": 92370 }, { - "epoch": 0.47, - "learning_rate": 0.00023008965193657265, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.0002640806571604096, + "loss": 0.0221, "step": 92380 }, { - "epoch": 0.47, - "learning_rate": 0.0002300820842435586, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.0002640767689440382, + "loss": 0.0203, "step": 92390 }, { - "epoch": 0.47, - "learning_rate": 0.0002300745165505446, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002640728807276667, + "loss": 0.0251, "step": 92400 }, { - "epoch": 0.47, - "learning_rate": 0.00023006694885753057, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.0002640689925112952, + "loss": 0.0241, "step": 92410 }, { - "epoch": 0.47, - "learning_rate": 0.00023005938116451658, - "loss": 0.0182, + "epoch": 0.24, + "learning_rate": 0.0002640651042949238, + "loss": 0.0233, "step": 92420 }, { - "epoch": 0.47, - "learning_rate": 0.00023005181347150256, - "loss": 0.0189, + "epoch": 0.24, + "learning_rate": 0.00026406121607855235, + "loss": 0.0187, "step": 92430 }, { - "epoch": 0.47, - "learning_rate": 0.00023004424577848854, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.00026405732786218087, + "loss": 0.0242, "step": 92440 }, { - "epoch": 0.47, - "learning_rate": 0.00023003667808547455, - "loss": 0.0221, + "epoch": 0.24, + "learning_rate": 0.0002640534396458094, + "loss": 0.0235, "step": 92450 }, { - "epoch": 0.47, - "learning_rate": 0.00023002911039246053, - "loss": 0.0119, + "epoch": 0.24, + "learning_rate": 0.0002640495514294379, + "loss": 0.0201, "step": 92460 }, { - "epoch": 0.47, - "learning_rate": 0.0002300215426994465, - "loss": 0.0139, + "epoch": 0.24, + "learning_rate": 0.00026404566321306647, + "loss": 0.0241, "step": 92470 }, { - "epoch": 0.47, - "learning_rate": 0.0002300139750064325, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.000264041774996695, + "loss": 0.0288, "step": 92480 }, { - "epoch": 0.47, - "learning_rate": 0.0002300064073134185, - "loss": 0.0151, + "epoch": 0.24, + "learning_rate": 0.00026403788678032355, + "loss": 0.0239, "step": 92490 }, { - "epoch": 0.47, - "learning_rate": 0.00022999883962040448, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.00026403399856395206, + "loss": 0.0253, "step": 92500 }, { - "epoch": 0.47, - "learning_rate": 0.00022999127192739046, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.00026403011034758063, + "loss": 0.0206, "step": 92510 }, { - "epoch": 0.47, - "learning_rate": 0.00022998370423437647, - "loss": 0.0209, + "epoch": 0.24, + "learning_rate": 0.00026402622213120915, + "loss": 0.0185, "step": 92520 }, { - "epoch": 0.47, - "learning_rate": 0.00022997613654136245, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026402233391483766, + "loss": 0.0201, "step": 92530 }, { - "epoch": 0.47, - "learning_rate": 0.00022996856884834844, - "loss": 0.0165, + "epoch": 0.24, + "learning_rate": 0.0002640184456984662, + "loss": 0.0264, "step": 92540 }, { - "epoch": 0.47, - "learning_rate": 0.00022996100115533444, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.00026401455748209475, + "loss": 0.0254, "step": 92550 }, { - "epoch": 0.47, - "learning_rate": 0.00022995343346232043, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026401066926572326, + "loss": 0.0217, "step": 92560 }, { - "epoch": 0.47, - "learning_rate": 0.0002299458657693064, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026400678104935183, + "loss": 0.0203, "step": 92570 }, { - "epoch": 0.47, - "learning_rate": 0.00022993829807629242, - "loss": 0.0194, + "epoch": 0.24, + "learning_rate": 0.00026400289283298034, + "loss": 0.029, "step": 92580 }, { - "epoch": 0.47, - "learning_rate": 0.0002299307303832784, - "loss": 0.0141, + "epoch": 0.24, + "learning_rate": 0.00026399900461660886, + "loss": 0.024, "step": 92590 }, { - "epoch": 0.47, - "learning_rate": 0.00022992316269026438, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002639951164002374, + "loss": 0.0231, "step": 92600 }, { - "epoch": 0.47, - "learning_rate": 0.0002299155949972504, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.00026399122818386594, + "loss": 0.0295, "step": 92610 }, { - "epoch": 0.47, - "learning_rate": 0.00022990802730423637, - "loss": 0.0131, + "epoch": 0.24, + "learning_rate": 0.00026398733996749446, + "loss": 0.0231, "step": 92620 }, { - "epoch": 0.47, - "learning_rate": 0.00022990045961122235, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.000263983451751123, + "loss": 0.0224, "step": 92630 }, { - "epoch": 0.47, - "learning_rate": 0.00022989289191820833, - "loss": 0.0124, + "epoch": 0.24, + "learning_rate": 0.0002639795635347516, + "loss": 0.0256, "step": 92640 }, { - "epoch": 0.47, - "learning_rate": 0.00022988532422519434, - "loss": 0.0141, + "epoch": 0.24, + "learning_rate": 0.0002639756753183801, + "loss": 0.0254, "step": 92650 }, { - "epoch": 0.47, - "learning_rate": 0.00022987775653218032, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.0002639717871020086, + "loss": 0.0232, "step": 92660 }, { - "epoch": 0.47, - "learning_rate": 0.0002298701888391663, - "loss": 0.0133, + "epoch": 0.24, + "learning_rate": 0.00026396789888563714, + "loss": 0.0192, "step": 92670 }, { - "epoch": 0.47, - "learning_rate": 0.0002298626211461523, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.0002639640106692657, + "loss": 0.0297, "step": 92680 }, { - "epoch": 0.47, - "learning_rate": 0.0002298550534531383, - "loss": 0.0207, + "epoch": 0.24, + "learning_rate": 0.0002639601224528942, + "loss": 0.0254, "step": 92690 }, { - "epoch": 0.47, - "learning_rate": 0.00022984748576012427, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.0002639562342365228, + "loss": 0.0223, "step": 92700 }, { - "epoch": 0.47, - "learning_rate": 0.00022983991806711028, - "loss": 0.0129, + "epoch": 0.24, + "learning_rate": 0.0002639523460201513, + "loss": 0.0215, "step": 92710 }, { - "epoch": 0.47, - "learning_rate": 0.00022983235037409626, - "loss": 0.0137, + "epoch": 0.24, + "learning_rate": 0.00026394845780377987, + "loss": 0.0241, "step": 92720 }, { - "epoch": 0.47, - "learning_rate": 0.00022982478268108225, - "loss": 0.0151, + "epoch": 0.24, + "learning_rate": 0.0002639445695874084, + "loss": 0.0244, "step": 92730 }, { - "epoch": 0.47, - "learning_rate": 0.00022981721498806825, - "loss": 0.0135, + "epoch": 0.24, + "learning_rate": 0.0002639406813710369, + "loss": 0.021, "step": 92740 }, { - "epoch": 0.47, - "learning_rate": 0.00022980964729505424, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.0002639367931546654, + "loss": 0.0221, "step": 92750 }, { - "epoch": 0.47, - "learning_rate": 0.00022980207960204022, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.000263932904938294, + "loss": 0.0234, "step": 92760 }, { - "epoch": 0.47, - "learning_rate": 0.00022979451190902623, - "loss": 0.0157, + "epoch": 0.24, + "learning_rate": 0.00026392901672192255, + "loss": 0.0228, "step": 92770 }, { - "epoch": 0.47, - "learning_rate": 0.0002297869442160122, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026392512850555107, + "loss": 0.0207, "step": 92780 }, { - "epoch": 0.47, - "learning_rate": 0.0002297793765229982, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002639212402891796, + "loss": 0.0211, "step": 92790 }, { - "epoch": 0.47, - "learning_rate": 0.0002297718088299842, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.0002639173520728081, + "loss": 0.0221, "step": 92800 }, { - "epoch": 0.47, - "learning_rate": 0.00022976424113697018, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.00026391346385643667, + "loss": 0.02, "step": 92810 }, { - "epoch": 0.47, - "learning_rate": 0.00022975667344395616, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002639095756400652, + "loss": 0.0174, "step": 92820 }, { - "epoch": 0.47, - "learning_rate": 0.00022974910575094214, - "loss": 0.0156, + "epoch": 0.24, + "learning_rate": 0.00026390568742369375, + "loss": 0.0253, "step": 92830 }, { - "epoch": 0.47, - "learning_rate": 0.00022974153805792815, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.00026390179920732226, + "loss": 0.026, "step": 92840 }, { - "epoch": 0.47, - "learning_rate": 0.00022973397036491413, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026389791099095083, + "loss": 0.024, "step": 92850 }, { - "epoch": 0.47, - "learning_rate": 0.0002297264026719001, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.00026389402277457935, + "loss": 0.0203, "step": 92860 }, { - "epoch": 0.47, - "learning_rate": 0.00022971883497888612, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.00026389013455820786, + "loss": 0.0233, "step": 92870 }, { - "epoch": 0.47, - "learning_rate": 0.0002297112672858721, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002638862463418364, + "loss": 0.0219, "step": 92880 }, { - "epoch": 0.47, - "learning_rate": 0.00022970369959285808, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026388235812546494, + "loss": 0.0217, "step": 92890 }, { - "epoch": 0.47, - "learning_rate": 0.0002296961318998441, - "loss": 0.0174, + "epoch": 0.24, + "learning_rate": 0.00026387846990909346, + "loss": 0.0199, "step": 92900 }, { - "epoch": 0.47, - "learning_rate": 0.00022968856420683007, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.00026387458169272203, + "loss": 0.0192, "step": 92910 }, { - "epoch": 0.47, - "learning_rate": 0.00022968099651381606, - "loss": 0.0147, + "epoch": 0.24, + "learning_rate": 0.00026387069347635054, + "loss": 0.0264, "step": 92920 }, { - "epoch": 0.47, - "learning_rate": 0.00022967342882080206, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.0002638668052599791, + "loss": 0.0237, "step": 92930 }, { - "epoch": 0.47, - "learning_rate": 0.00022966586112778805, - "loss": 0.0139, + "epoch": 0.24, + "learning_rate": 0.0002638629170436076, + "loss": 0.0223, "step": 92940 }, { - "epoch": 0.47, - "learning_rate": 0.00022965829343477403, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.00026385902882723614, + "loss": 0.0233, "step": 92950 }, { - "epoch": 0.47, - "learning_rate": 0.00022965072574176004, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026385514061086465, + "loss": 0.017, "step": 92960 }, { - "epoch": 0.47, - "learning_rate": 0.00022964315804874602, - "loss": 0.0146, + "epoch": 0.24, + "learning_rate": 0.0002638512523944932, + "loss": 0.02, "step": 92970 }, { - "epoch": 0.47, - "learning_rate": 0.000229635590355732, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002638473641781218, + "loss": 0.0249, "step": 92980 }, { - "epoch": 0.47, - "learning_rate": 0.00022962802266271798, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.0002638434759617503, + "loss": 0.0195, "step": 92990 }, { - "epoch": 0.47, - "learning_rate": 0.000229620454969704, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.0002638395877453788, + "loss": 0.0226, "step": 93000 }, { - "epoch": 0.47, - "eval_cer": 0.9144867526372941, - "eval_loss": 0.0119341891258955, - "eval_runtime": 116.7754, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.24, + "eval_cer": 0.881806259456297, + "eval_loss": 0.016998477280139923, + "eval_runtime": 108.1066, + "eval_samples_per_second": 18.5, + "eval_steps_per_second": 4.625, "step": 93000 }, { - "epoch": 0.47, - "learning_rate": 0.00022961288727668997, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002638356995290074, + "loss": 0.0262, "step": 93010 }, { - "epoch": 0.47, - "learning_rate": 0.00022960531958367595, - "loss": 0.0176, + "epoch": 0.24, + "learning_rate": 0.0002638318113126359, + "loss": 0.0273, "step": 93020 }, { - "epoch": 0.47, - "learning_rate": 0.00022959775189066196, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002638279230962644, + "loss": 0.0274, "step": 93030 }, { - "epoch": 0.47, - "learning_rate": 0.00022959018419764794, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.000263824034879893, + "loss": 0.0271, "step": 93040 }, { - "epoch": 0.47, - "learning_rate": 0.00022958261650463392, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002638201466635215, + "loss": 0.022, "step": 93050 }, { - "epoch": 0.47, - "learning_rate": 0.00022957504881161993, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026381625844715007, + "loss": 0.021, "step": 93060 }, { - "epoch": 0.47, - "learning_rate": 0.0002295674811186059, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.0002638123702307786, + "loss": 0.0232, "step": 93070 }, { - "epoch": 0.47, - "learning_rate": 0.0002295599134255919, - "loss": 0.0144, + "epoch": 0.24, + "learning_rate": 0.0002638084820144071, + "loss": 0.0202, "step": 93080 }, { - "epoch": 0.47, - "learning_rate": 0.0002295523457325779, - "loss": 0.0169, + "epoch": 0.24, + "learning_rate": 0.0002638045937980356, + "loss": 0.021, "step": 93090 }, { - "epoch": 0.47, - "learning_rate": 0.00022954477803956388, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.0002638007055816642, + "loss": 0.0228, "step": 93100 }, { - "epoch": 0.47, - "learning_rate": 0.00022953721034654987, - "loss": 0.013, + "epoch": 0.24, + "learning_rate": 0.0002637968173652927, + "loss": 0.0204, "step": 93110 }, { - "epoch": 0.47, - "learning_rate": 0.00022952964265353587, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.00026379292914892127, + "loss": 0.0215, "step": 93120 }, { - "epoch": 0.47, - "learning_rate": 0.00022952207496052186, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002637890409325498, + "loss": 0.0249, "step": 93130 }, { - "epoch": 0.47, - "learning_rate": 0.00022951450726750784, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.00026378515271617835, + "loss": 0.0228, "step": 93140 }, { - "epoch": 0.47, - "learning_rate": 0.00022950693957449382, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026378126449980686, + "loss": 0.0274, "step": 93150 }, { - "epoch": 0.47, - "learning_rate": 0.00022949937188147983, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.0002637773762834354, + "loss": 0.0242, "step": 93160 }, { - "epoch": 0.47, - "learning_rate": 0.0002294918041884658, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026377348806706395, + "loss": 0.0232, "step": 93170 }, { - "epoch": 0.47, - "learning_rate": 0.0002294842364954518, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.00026376959985069246, + "loss": 0.0272, "step": 93180 }, { - "epoch": 0.47, - "learning_rate": 0.0002294766688024378, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.00026376571163432103, + "loss": 0.0205, "step": 93190 }, { - "epoch": 0.47, - "learning_rate": 0.00022946910110942378, - "loss": 0.0154, + "epoch": 0.24, + "learning_rate": 0.00026376182341794955, + "loss": 0.0225, "step": 93200 }, { - "epoch": 0.47, - "learning_rate": 0.00022946153341640976, - "loss": 0.0138, + "epoch": 0.24, + "learning_rate": 0.00026375793520157806, + "loss": 0.022, "step": 93210 }, { - "epoch": 0.47, - "learning_rate": 0.00022945396572339577, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026375404698520663, + "loss": 0.0236, "step": 93220 }, { - "epoch": 0.47, - "learning_rate": 0.00022944639803038175, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.00026375015876883514, + "loss": 0.0207, "step": 93230 }, { - "epoch": 0.47, - "learning_rate": 0.00022943883033736773, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026374627055246366, + "loss": 0.0234, "step": 93240 }, { - "epoch": 0.47, - "learning_rate": 0.00022943126264435374, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002637423823360922, + "loss": 0.0234, "step": 93250 }, { - "epoch": 0.47, - "learning_rate": 0.00022942369495133972, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026373849411972074, + "loss": 0.0224, "step": 93260 }, { - "epoch": 0.47, - "learning_rate": 0.0002294161272583257, - "loss": 0.02, + "epoch": 0.24, + "learning_rate": 0.0002637346059033493, + "loss": 0.0238, "step": 93270 }, { - "epoch": 0.47, - "learning_rate": 0.0002294085595653117, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.0002637307176869778, + "loss": 0.022, "step": 93280 }, { - "epoch": 0.47, - "learning_rate": 0.0002294009918722977, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026372682947060634, + "loss": 0.0223, "step": 93290 }, { - "epoch": 0.47, - "learning_rate": 0.00022939342417928368, - "loss": 0.0146, + "epoch": 0.24, + "learning_rate": 0.00026372294125423485, + "loss": 0.026, "step": 93300 }, { - "epoch": 0.47, - "learning_rate": 0.00022938585648626966, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.0002637190530378634, + "loss": 0.0222, "step": 93310 }, { - "epoch": 0.47, - "learning_rate": 0.00022937828879325567, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.000263715164821492, + "loss": 0.0229, "step": 93320 }, { - "epoch": 0.47, - "learning_rate": 0.00022937072110024165, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002637112766051205, + "loss": 0.02, "step": 93330 }, { - "epoch": 0.47, - "learning_rate": 0.00022936315340722763, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.000263707388388749, + "loss": 0.0199, "step": 93340 }, { - "epoch": 0.47, - "learning_rate": 0.00022935558571421364, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002637035001723776, + "loss": 0.0264, "step": 93350 }, { - "epoch": 0.47, - "learning_rate": 0.00022934801802119962, - "loss": 0.0145, + "epoch": 0.24, + "learning_rate": 0.0002636996119560061, + "loss": 0.0211, "step": 93360 }, { - "epoch": 0.47, - "learning_rate": 0.0002293404503281856, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.0002636957237396346, + "loss": 0.0294, "step": 93370 }, { - "epoch": 0.47, - "learning_rate": 0.0002293328826351716, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.0002636918355232632, + "loss": 0.0266, "step": 93380 }, { - "epoch": 0.47, - "learning_rate": 0.0002293253149421576, - "loss": 0.0172, + "epoch": 0.24, + "learning_rate": 0.0002636879473068917, + "loss": 0.0297, "step": 93390 }, { - "epoch": 0.47, - "learning_rate": 0.00022931774724914357, - "loss": 0.0138, + "epoch": 0.24, + "learning_rate": 0.00026368405909052027, + "loss": 0.026, "step": 93400 }, { - "epoch": 0.47, - "learning_rate": 0.00022931017955612958, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.0002636801708741488, + "loss": 0.0232, "step": 93410 }, { - "epoch": 0.47, - "learning_rate": 0.00022930261186311556, - "loss": 0.014, + "epoch": 0.24, + "learning_rate": 0.0002636762826577773, + "loss": 0.022, "step": 93420 }, { - "epoch": 0.47, - "learning_rate": 0.00022929504417010154, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026367239444140587, + "loss": 0.0227, "step": 93430 }, { - "epoch": 0.47, - "learning_rate": 0.00022928747647708755, - "loss": 0.0141, + "epoch": 0.24, + "learning_rate": 0.0002636685062250344, + "loss": 0.0208, "step": 93440 }, { - "epoch": 0.47, - "learning_rate": 0.00022927990878407353, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.0002636646180086629, + "loss": 0.0214, "step": 93450 }, { - "epoch": 0.47, - "learning_rate": 0.00022927234109105951, - "loss": 0.0208, + "epoch": 0.24, + "learning_rate": 0.00026366072979229147, + "loss": 0.0206, "step": 93460 }, { - "epoch": 0.47, - "learning_rate": 0.00022926477339804552, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026365684157592003, + "loss": 0.025, "step": 93470 }, { - "epoch": 0.47, - "learning_rate": 0.0002292572057050315, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026365295335954855, + "loss": 0.0234, "step": 93480 }, { - "epoch": 0.47, - "learning_rate": 0.00022924963801201749, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.00026364906514317706, + "loss": 0.0239, "step": 93490 }, { - "epoch": 0.47, - "learning_rate": 0.00022924207031900347, - "loss": 0.0197, + "epoch": 0.24, + "learning_rate": 0.0002636451769268056, + "loss": 0.0226, "step": 93500 }, { - "epoch": 0.47, - "learning_rate": 0.00022923450262598948, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.00026364128871043415, + "loss": 0.0287, "step": 93510 }, { - "epoch": 0.47, - "learning_rate": 0.00022922693493297546, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026363740049406266, + "loss": 0.022, "step": 93520 }, { - "epoch": 0.47, - "learning_rate": 0.00022921936723996144, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.00026363351227769123, + "loss": 0.0216, "step": 93530 }, { - "epoch": 0.47, - "learning_rate": 0.00022921179954694745, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026362962406131974, + "loss": 0.0222, "step": 93540 }, { - "epoch": 0.47, - "learning_rate": 0.00022920423185393343, - "loss": 0.0185, + "epoch": 0.24, + "learning_rate": 0.00026362573584494826, + "loss": 0.0232, "step": 93550 }, { - "epoch": 0.47, - "learning_rate": 0.0002291966641609194, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.00026362184762857683, + "loss": 0.0203, "step": 93560 }, { - "epoch": 0.47, - "learning_rate": 0.00022918909646790542, - "loss": 0.0161, + "epoch": 0.24, + "learning_rate": 0.00026361795941220534, + "loss": 0.0207, "step": 93570 }, { - "epoch": 0.47, - "learning_rate": 0.0002291815287748914, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.00026361407119583386, + "loss": 0.0263, "step": 93580 }, { - "epoch": 0.47, - "learning_rate": 0.00022917396108187738, - "loss": 0.016, + "epoch": 0.24, + "learning_rate": 0.0002636101829794624, + "loss": 0.028, "step": 93590 }, { - "epoch": 0.47, - "learning_rate": 0.0002291663933888634, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.00026360629476309094, + "loss": 0.0223, "step": 93600 }, { - "epoch": 0.47, - "learning_rate": 0.00022915882569584937, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.0002636024065467195, + "loss": 0.0196, "step": 93610 }, { - "epoch": 0.47, - "learning_rate": 0.00022915125800283535, - "loss": 0.014, + "epoch": 0.24, + "learning_rate": 0.000263598518330348, + "loss": 0.0227, "step": 93620 }, { - "epoch": 0.47, - "learning_rate": 0.00022914369030982136, - "loss": 0.0147, + "epoch": 0.24, + "learning_rate": 0.00026359463011397654, + "loss": 0.0236, "step": 93630 }, { - "epoch": 0.47, - "learning_rate": 0.00022913612261680732, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.0002635907418976051, + "loss": 0.0192, "step": 93640 }, { - "epoch": 0.47, - "learning_rate": 0.0002291285549237933, - "loss": 0.0168, + "epoch": 0.24, + "learning_rate": 0.0002635868536812336, + "loss": 0.0231, "step": 93650 }, { - "epoch": 0.47, - "learning_rate": 0.00022912098723077928, - "loss": 0.0145, + "epoch": 0.24, + "learning_rate": 0.00026358296546486214, + "loss": 0.0226, "step": 93660 }, { - "epoch": 0.47, - "learning_rate": 0.0002291134195377653, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002635790772484907, + "loss": 0.0187, "step": 93670 }, { - "epoch": 0.47, - "learning_rate": 0.00022910585184475127, - "loss": 0.0151, + "epoch": 0.24, + "learning_rate": 0.00026357518903211927, + "loss": 0.0239, "step": 93680 }, { - "epoch": 0.47, - "learning_rate": 0.00022909828415173725, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.0002635713008157478, + "loss": 0.0206, "step": 93690 }, { - "epoch": 0.47, - "learning_rate": 0.00022909071645872326, - "loss": 0.0286, + "epoch": 0.24, + "learning_rate": 0.0002635674125993763, + "loss": 0.0194, "step": 93700 }, { - "epoch": 0.47, - "learning_rate": 0.00022908314876570924, - "loss": 0.0202, + "epoch": 0.24, + "learning_rate": 0.0002635635243830048, + "loss": 0.0309, "step": 93710 }, { - "epoch": 0.47, - "learning_rate": 0.00022907558107269522, - "loss": 0.0162, + "epoch": 0.24, + "learning_rate": 0.0002635596361666334, + "loss": 0.0199, "step": 93720 }, { - "epoch": 0.47, - "learning_rate": 0.0002290680133796812, - "loss": 0.0167, + "epoch": 0.24, + "learning_rate": 0.0002635557479502619, + "loss": 0.0194, "step": 93730 }, { - "epoch": 0.47, - "learning_rate": 0.0002290604456866672, - "loss": 0.0191, + "epoch": 0.24, + "learning_rate": 0.00026355185973389047, + "loss": 0.0204, "step": 93740 }, { - "epoch": 0.47, - "learning_rate": 0.0002290528779936532, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.000263547971517519, + "loss": 0.023, "step": 93750 }, { - "epoch": 0.47, - "learning_rate": 0.00022904531030063917, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026354408330114755, + "loss": 0.0246, "step": 93760 }, { - "epoch": 0.47, - "learning_rate": 0.00022903774260762518, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.00026354019508477607, + "loss": 0.0218, "step": 93770 }, { - "epoch": 0.47, - "learning_rate": 0.00022903017491461116, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.0002635363068684046, + "loss": 0.0221, "step": 93780 }, { - "epoch": 0.47, - "learning_rate": 0.00022902260722159715, - "loss": 0.0206, + "epoch": 0.24, + "learning_rate": 0.0002635324186520331, + "loss": 0.0243, "step": 93790 }, { - "epoch": 0.47, - "learning_rate": 0.00022901503952858315, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.00026352853043566166, + "loss": 0.0224, "step": 93800 }, { - "epoch": 0.47, - "learning_rate": 0.00022900747183556914, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002635246422192902, + "loss": 0.0304, "step": 93810 }, { - "epoch": 0.47, - "learning_rate": 0.00022899990414255512, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026352075400291875, + "loss": 0.0194, "step": 93820 }, { - "epoch": 0.47, - "learning_rate": 0.00022899233644954113, - "loss": 0.018, + "epoch": 0.24, + "learning_rate": 0.00026351686578654726, + "loss": 0.0253, "step": 93830 }, { - "epoch": 0.47, - "learning_rate": 0.0002289847687565271, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.0002635129775701758, + "loss": 0.0189, "step": 93840 }, { - "epoch": 0.47, - "learning_rate": 0.0002289772010635131, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.00026350908935380434, + "loss": 0.0235, "step": 93850 }, { - "epoch": 0.47, - "learning_rate": 0.0002289696333704991, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026350520113743286, + "loss": 0.0208, "step": 93860 }, { - "epoch": 0.47, - "learning_rate": 0.00022896206567748508, - "loss": 0.0165, + "epoch": 0.24, + "learning_rate": 0.00026350131292106143, + "loss": 0.0219, "step": 93870 }, { - "epoch": 0.47, - "learning_rate": 0.00022895449798447106, - "loss": 0.0183, + "epoch": 0.24, + "learning_rate": 0.00026349742470468994, + "loss": 0.0197, "step": 93880 }, { - "epoch": 0.47, - "learning_rate": 0.00022894693029145704, - "loss": 0.013, + "epoch": 0.24, + "learning_rate": 0.0002634935364883185, + "loss": 0.0204, "step": 93890 }, { - "epoch": 0.47, - "learning_rate": 0.00022893936259844305, - "loss": 0.0163, + "epoch": 0.24, + "learning_rate": 0.000263489648271947, + "loss": 0.0216, "step": 93900 }, { - "epoch": 0.47, - "learning_rate": 0.00022893179490542903, - "loss": 0.0166, + "epoch": 0.24, + "learning_rate": 0.00026348576005557554, + "loss": 0.0215, "step": 93910 }, { - "epoch": 0.47, - "learning_rate": 0.000228924227212415, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.00026348187183920406, + "loss": 0.0267, "step": 93920 }, { - "epoch": 0.47, - "learning_rate": 0.00022891665951940102, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002634779836228326, + "loss": 0.0273, "step": 93930 }, { - "epoch": 0.47, - "learning_rate": 0.000228909091826387, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.00026347409540646114, + "loss": 0.0219, "step": 93940 }, { - "epoch": 0.47, - "learning_rate": 0.00022890152413337298, - "loss": 0.012, + "epoch": 0.24, + "learning_rate": 0.0002634702071900897, + "loss": 0.0194, "step": 93950 }, { - "epoch": 0.47, - "learning_rate": 0.000228893956440359, - "loss": 0.0129, + "epoch": 0.24, + "learning_rate": 0.0002634663189737182, + "loss": 0.0244, "step": 93960 }, { - "epoch": 0.47, - "learning_rate": 0.00022888638874734497, - "loss": 0.0165, + "epoch": 0.24, + "learning_rate": 0.0002634624307573468, + "loss": 0.0198, "step": 93970 }, { - "epoch": 0.47, - "learning_rate": 0.00022887882105433096, - "loss": 0.0173, + "epoch": 0.24, + "learning_rate": 0.0002634585425409753, + "loss": 0.0219, "step": 93980 }, { - "epoch": 0.47, - "learning_rate": 0.00022887125336131696, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.0002634546543246038, + "loss": 0.0236, "step": 93990 }, { - "epoch": 0.47, - "learning_rate": 0.00022886368566830295, - "loss": 0.0188, + "epoch": 0.24, + "learning_rate": 0.00026345076610823233, + "loss": 0.023, "step": 94000 }, { - "epoch": 0.47, - "eval_cer": 0.914481900656667, - "eval_loss": 0.011606461368501186, - "eval_runtime": 116.7314, - "eval_samples_per_second": 17.133, - "eval_steps_per_second": 4.283, + "epoch": 0.24, + "eval_cer": 0.8818440496535199, + "eval_loss": 0.016325943171977997, + "eval_runtime": 108.0327, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, "step": 94000 }, { - "epoch": 0.47, - "learning_rate": 0.00022885611797528893, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002634468778918609, + "loss": 0.0215, "step": 94010 }, { - "epoch": 0.47, - "learning_rate": 0.00022884855028227494, - "loss": 0.0155, + "epoch": 0.24, + "learning_rate": 0.00026344298967548947, + "loss": 0.0205, "step": 94020 }, { - "epoch": 0.47, - "learning_rate": 0.00022884098258926092, - "loss": 0.014, + "epoch": 0.24, + "learning_rate": 0.000263439101459118, + "loss": 0.0206, "step": 94030 }, { - "epoch": 0.47, - "learning_rate": 0.0002288334148962469, - "loss": 0.0193, + "epoch": 0.24, + "learning_rate": 0.0002634352132427465, + "loss": 0.0208, "step": 94040 }, { - "epoch": 0.47, - "learning_rate": 0.00022882584720323288, - "loss": 0.0132, + "epoch": 0.24, + "learning_rate": 0.000263431325026375, + "loss": 0.0246, "step": 94050 }, { - "epoch": 0.47, - "learning_rate": 0.0002288182795102189, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.0002634274368100036, + "loss": 0.021, "step": 94060 }, { - "epoch": 0.47, - "learning_rate": 0.00022881071181720487, - "loss": 0.0152, + "epoch": 0.24, + "learning_rate": 0.0002634235485936321, + "loss": 0.0289, "step": 94070 }, { - "epoch": 0.47, - "learning_rate": 0.00022880314412419085, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.00026341966037726067, + "loss": 0.0201, "step": 94080 }, { - "epoch": 0.47, - "learning_rate": 0.00022879557643117686, - "loss": 0.0151, + "epoch": 0.24, + "learning_rate": 0.0002634157721608892, + "loss": 0.0218, "step": 94090 }, { - "epoch": 0.47, - "learning_rate": 0.00022878800873816284, - "loss": 0.0186, + "epoch": 0.24, + "learning_rate": 0.00026341188394451775, + "loss": 0.0234, "step": 94100 }, { - "epoch": 0.47, - "learning_rate": 0.00022878044104514882, - "loss": 0.0133, + "epoch": 0.24, + "learning_rate": 0.00026340799572814626, + "loss": 0.0196, "step": 94110 }, { - "epoch": 0.47, - "learning_rate": 0.00022877287335213483, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002634041075117748, + "loss": 0.0222, "step": 94120 }, { - "epoch": 0.47, - "learning_rate": 0.0002287653056591208, - "loss": 0.0217, + "epoch": 0.24, + "learning_rate": 0.0002634002192954033, + "loss": 0.0242, "step": 94130 }, { - "epoch": 0.47, - "learning_rate": 0.0002287577379661068, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026339633107903186, + "loss": 0.024, "step": 94140 }, { - "epoch": 0.47, - "learning_rate": 0.0002287501702730928, - "loss": 0.0171, + "epoch": 0.24, + "learning_rate": 0.0002633924428626604, + "loss": 0.0206, "step": 94150 }, { - "epoch": 0.48, - "learning_rate": 0.00022874260258007878, - "loss": 0.0178, + "epoch": 0.24, + "learning_rate": 0.00026338855464628895, + "loss": 0.0227, "step": 94160 }, { - "epoch": 0.48, - "learning_rate": 0.00022873503488706477, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.00026338466642991746, + "loss": 0.0258, "step": 94170 }, { - "epoch": 0.48, - "learning_rate": 0.00022872746719405077, - "loss": 0.0225, + "epoch": 0.24, + "learning_rate": 0.00026338077821354603, + "loss": 0.0218, "step": 94180 }, { - "epoch": 0.48, - "learning_rate": 0.00022871989950103676, - "loss": 0.0164, + "epoch": 0.24, + "learning_rate": 0.00026337688999717454, + "loss": 0.0222, "step": 94190 }, { - "epoch": 0.48, - "learning_rate": 0.00022871233180802274, - "loss": 0.0153, + "epoch": 0.24, + "learning_rate": 0.00026337300178080306, + "loss": 0.0222, "step": 94200 }, { - "epoch": 0.48, - "learning_rate": 0.00022870476411500872, - "loss": 0.014, + "epoch": 0.24, + "learning_rate": 0.00026336911356443157, + "loss": 0.0246, "step": 94210 }, { - "epoch": 0.48, - "learning_rate": 0.00022869719642199473, - "loss": 0.0184, + "epoch": 0.24, + "learning_rate": 0.00026336522534806014, + "loss": 0.0252, "step": 94220 }, { - "epoch": 0.48, - "learning_rate": 0.0002286896287289807, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.0002633613371316887, + "loss": 0.0266, "step": 94230 }, { - "epoch": 0.48, - "learning_rate": 0.0002286820610359667, - "loss": 0.0145, + "epoch": 0.24, + "learning_rate": 0.0002633574489153172, + "loss": 0.0234, "step": 94240 }, { - "epoch": 0.48, - "learning_rate": 0.0002286744933429527, - "loss": 0.0138, + "epoch": 0.24, + "learning_rate": 0.00026335356069894574, + "loss": 0.0229, "step": 94250 }, { - "epoch": 0.48, - "learning_rate": 0.00022866692564993868, - "loss": 0.0158, + "epoch": 0.24, + "learning_rate": 0.0002633496724825743, + "loss": 0.0185, "step": 94260 }, { - "epoch": 0.48, - "learning_rate": 0.00022865935795692466, - "loss": 0.0149, + "epoch": 0.24, + "learning_rate": 0.0002633457842662028, + "loss": 0.0255, "step": 94270 }, { - "epoch": 0.48, - "learning_rate": 0.00022865179026391067, - "loss": 0.0147, + "epoch": 0.24, + "learning_rate": 0.00026334189604983134, + "loss": 0.0269, "step": 94280 }, { - "epoch": 0.48, - "learning_rate": 0.00022864422257089665, - "loss": 0.0195, + "epoch": 0.24, + "learning_rate": 0.0002633380078334599, + "loss": 0.0192, "step": 94290 }, { - "epoch": 0.48, - "learning_rate": 0.00022863665487788263, - "loss": 0.0234, + "epoch": 0.24, + "learning_rate": 0.0002633341196170884, + "loss": 0.0236, "step": 94300 }, { - "epoch": 0.48, - "learning_rate": 0.00022862908718486864, - "loss": 0.019, + "epoch": 0.24, + "learning_rate": 0.000263330231400717, + "loss": 0.0185, "step": 94310 }, { - "epoch": 0.48, - "learning_rate": 0.00022862151949185462, - "loss": 0.0175, + "epoch": 0.24, + "learning_rate": 0.0002633263431843455, + "loss": 0.0194, "step": 94320 }, { - "epoch": 0.48, - "learning_rate": 0.0002286139517988406, - "loss": 0.0148, + "epoch": 0.24, + "learning_rate": 0.000263322454967974, + "loss": 0.0258, "step": 94330 }, { - "epoch": 0.48, - "learning_rate": 0.0002286063841058266, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.00026331856675160253, + "loss": 0.0274, "step": 94340 }, { - "epoch": 0.48, - "learning_rate": 0.0002285988164128126, - "loss": 0.0187, + "epoch": 0.24, + "learning_rate": 0.0002633146785352311, + "loss": 0.0206, "step": 94350 }, { - "epoch": 0.48, - "learning_rate": 0.00022859124871979858, - "loss": 0.0143, + "epoch": 0.24, + "learning_rate": 0.00026331079031885967, + "loss": 0.0191, "step": 94360 }, { - "epoch": 0.48, - "learning_rate": 0.00022858368102678458, - "loss": 0.017, + "epoch": 0.24, + "learning_rate": 0.0002633069021024882, + "loss": 0.0232, "step": 94370 }, { - "epoch": 0.48, - "learning_rate": 0.00022857611333377057, - "loss": 0.0137, + "epoch": 0.24, + "learning_rate": 0.0002633030138861167, + "loss": 0.02, "step": 94380 }, { - "epoch": 0.48, - "learning_rate": 0.00022856854564075655, - "loss": 0.015, + "epoch": 0.24, + "learning_rate": 0.00026329912566974527, + "loss": 0.0191, "step": 94390 }, { - "epoch": 0.48, - "learning_rate": 0.00022856097794774253, - "loss": 0.0181, + "epoch": 0.24, + "learning_rate": 0.0002632952374533738, + "loss": 0.0211, "step": 94400 }, { - "epoch": 0.48, - "learning_rate": 0.00022855341025472854, - "loss": 0.0182, + "epoch": 0.24, + "learning_rate": 0.0002632913492370023, + "loss": 0.0249, "step": 94410 }, { - "epoch": 0.48, - "learning_rate": 0.00022854584256171452, - "loss": 0.0202, + "epoch": 0.24, + "learning_rate": 0.00026328746102063087, + "loss": 0.0226, "step": 94420 }, { - "epoch": 0.48, - "learning_rate": 0.0002285382748687005, - "loss": 0.0156, + "epoch": 0.24, + "learning_rate": 0.0002632835728042594, + "loss": 0.0212, "step": 94430 }, { - "epoch": 0.48, - "learning_rate": 0.0002285307071756865, - "loss": 0.0179, + "epoch": 0.24, + "learning_rate": 0.00026327968458788795, + "loss": 0.0227, "step": 94440 }, { - "epoch": 0.48, - "learning_rate": 0.0002285231394826725, - "loss": 0.0136, + "epoch": 0.24, + "learning_rate": 0.00026327579637151646, + "loss": 0.0257, "step": 94450 }, { - "epoch": 0.48, - "learning_rate": 0.00022851557178965847, - "loss": 0.0125, + "epoch": 0.24, + "learning_rate": 0.000263271908155145, + "loss": 0.0225, "step": 94460 }, { - "epoch": 0.48, - "learning_rate": 0.00022850800409664448, - "loss": 0.0137, + "epoch": 0.24, + "learning_rate": 0.00026326801993877355, + "loss": 0.0234, "step": 94470 }, { - "epoch": 0.48, - "learning_rate": 0.00022850043640363046, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026326413172240206, + "loss": 0.0265, "step": 94480 }, { - "epoch": 0.48, - "learning_rate": 0.00022849286871061644, - "loss": 0.0159, + "epoch": 0.24, + "learning_rate": 0.0002632602435060306, + "loss": 0.0265, "step": 94490 }, { - "epoch": 0.48, - "learning_rate": 0.00022848530101760245, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.00026325635528965914, + "loss": 0.0278, "step": 94500 }, { - "epoch": 0.48, - "learning_rate": 0.00022847773332458843, - "loss": 0.0142, + "epoch": 0.24, + "learning_rate": 0.0002632524670732877, + "loss": 0.0201, "step": 94510 }, { - "epoch": 0.48, - "learning_rate": 0.00022847016563157441, - "loss": 0.0151, + "epoch": 0.25, + "learning_rate": 0.00026324857885691623, + "loss": 0.0162, "step": 94520 }, { - "epoch": 0.48, - "learning_rate": 0.00022846259793856042, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.00026324469064054474, + "loss": 0.0243, "step": 94530 }, { - "epoch": 0.48, - "learning_rate": 0.0002284550302455464, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.00026324080242417326, + "loss": 0.0195, "step": 94540 }, { - "epoch": 0.48, - "learning_rate": 0.00022844746255253239, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026323691420780177, + "loss": 0.0202, "step": 94550 }, { - "epoch": 0.48, - "learning_rate": 0.00022843989485951837, - "loss": 0.0119, + "epoch": 0.25, + "learning_rate": 0.00026323302599143034, + "loss": 0.0293, "step": 94560 }, { - "epoch": 0.48, - "learning_rate": 0.00022843232716650438, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.0002632291377750589, + "loss": 0.0206, "step": 94570 }, { - "epoch": 0.48, - "learning_rate": 0.00022842475947349036, - "loss": 0.0196, + "epoch": 0.25, + "learning_rate": 0.0002632252495586874, + "loss": 0.023, "step": 94580 }, { - "epoch": 0.48, - "learning_rate": 0.00022841719178047634, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026322136134231594, + "loss": 0.022, "step": 94590 }, { - "epoch": 0.48, - "learning_rate": 0.00022840962408746235, - "loss": 0.0139, + "epoch": 0.25, + "learning_rate": 0.0002632174731259445, + "loss": 0.0211, "step": 94600 }, { - "epoch": 0.48, - "learning_rate": 0.00022840205639444833, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.000263213584909573, + "loss": 0.024, "step": 94610 }, { - "epoch": 0.48, - "learning_rate": 0.0002283944887014343, - "loss": 0.0126, + "epoch": 0.25, + "learning_rate": 0.00026320969669320154, + "loss": 0.0224, "step": 94620 }, { - "epoch": 0.48, - "learning_rate": 0.00022838692100842032, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002632058084768301, + "loss": 0.0222, "step": 94630 }, { - "epoch": 0.48, - "learning_rate": 0.0002283793533154063, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002632019202604586, + "loss": 0.0227, "step": 94640 }, { - "epoch": 0.48, - "learning_rate": 0.00022837178562239228, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002631980320440872, + "loss": 0.0218, "step": 94650 }, { - "epoch": 0.48, - "learning_rate": 0.0002283642179293783, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.0002631941438277157, + "loss": 0.0234, "step": 94660 }, { - "epoch": 0.48, - "learning_rate": 0.00022835665023636427, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002631902556113442, + "loss": 0.0164, "step": 94670 }, { - "epoch": 0.48, - "learning_rate": 0.00022834908254335025, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.0002631863673949728, + "loss": 0.0212, "step": 94680 }, { - "epoch": 0.48, - "learning_rate": 0.00022834151485033626, - "loss": 0.019, + "epoch": 0.25, + "learning_rate": 0.0002631824791786013, + "loss": 0.0219, "step": 94690 }, { - "epoch": 0.48, - "learning_rate": 0.00022833394715732224, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.0002631785909622298, + "loss": 0.0235, "step": 94700 }, { - "epoch": 0.48, - "learning_rate": 0.00022832637946430822, - "loss": 0.0194, + "epoch": 0.25, + "learning_rate": 0.0002631747027458584, + "loss": 0.0225, "step": 94710 }, { - "epoch": 0.48, - "learning_rate": 0.0002283188117712942, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026317081452948695, + "loss": 0.0271, "step": 94720 }, { - "epoch": 0.48, - "learning_rate": 0.00022831124407828021, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.00026316692631311547, + "loss": 0.0222, "step": 94730 }, { - "epoch": 0.48, - "learning_rate": 0.0002283036763852662, - "loss": 0.0141, + "epoch": 0.25, + "learning_rate": 0.000263163038096744, + "loss": 0.0277, "step": 94740 }, { - "epoch": 0.48, - "learning_rate": 0.00022829610869225218, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.0002631591498803725, + "loss": 0.018, "step": 94750 }, { - "epoch": 0.48, - "learning_rate": 0.00022828854099923819, - "loss": 0.0184, + "epoch": 0.25, + "learning_rate": 0.00026315526166400106, + "loss": 0.0245, "step": 94760 }, { - "epoch": 0.48, - "learning_rate": 0.00022828097330622417, - "loss": 0.0151, + "epoch": 0.25, + "learning_rate": 0.0002631513734476296, + "loss": 0.0267, "step": 94770 }, { - "epoch": 0.48, - "learning_rate": 0.00022827340561321015, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.00026314748523125815, + "loss": 0.0243, "step": 94780 }, { - "epoch": 0.48, - "learning_rate": 0.00022826583792019616, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.00026314359701488666, + "loss": 0.0243, "step": 94790 }, { - "epoch": 0.48, - "learning_rate": 0.00022825827022718214, - "loss": 0.0218, + "epoch": 0.25, + "learning_rate": 0.0002631397087985152, + "loss": 0.0244, "step": 94800 }, { - "epoch": 0.48, - "learning_rate": 0.00022825070253416812, - "loss": 0.0139, + "epoch": 0.25, + "learning_rate": 0.00026313582058214375, + "loss": 0.0194, "step": 94810 }, { - "epoch": 0.48, - "learning_rate": 0.00022824313484115413, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026313193236577226, + "loss": 0.023, "step": 94820 }, { - "epoch": 0.48, - "learning_rate": 0.0002282355671481401, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002631280441494008, + "loss": 0.0247, "step": 94830 }, { - "epoch": 0.48, - "learning_rate": 0.0002282279994551261, - "loss": 0.0205, + "epoch": 0.25, + "learning_rate": 0.00026312415593302934, + "loss": 0.0257, "step": 94840 }, { - "epoch": 0.48, - "learning_rate": 0.0002282204317621121, - "loss": 0.012, + "epoch": 0.25, + "learning_rate": 0.00026312026771665786, + "loss": 0.021, "step": 94850 }, { - "epoch": 0.48, - "learning_rate": 0.00022821286406909808, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.0002631163795002864, + "loss": 0.0169, "step": 94860 }, { - "epoch": 0.48, - "learning_rate": 0.00022820529637608406, - "loss": 0.0121, + "epoch": 0.25, + "learning_rate": 0.00026311249128391494, + "loss": 0.0242, "step": 94870 }, { - "epoch": 0.48, - "learning_rate": 0.00022819772868307007, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.00026310860306754346, + "loss": 0.0234, "step": 94880 }, { - "epoch": 0.48, - "learning_rate": 0.00022819016099005605, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.000263104714851172, + "loss": 0.0205, "step": 94890 }, { - "epoch": 0.48, - "learning_rate": 0.000228182593297042, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.00026310082663480054, + "loss": 0.0228, "step": 94900 }, { - "epoch": 0.48, - "learning_rate": 0.000228175025604028, - "loss": 0.0202, + "epoch": 0.25, + "learning_rate": 0.0002630969384184291, + "loss": 0.0248, "step": 94910 }, { - "epoch": 0.48, - "learning_rate": 0.000228167457911014, - "loss": 0.0141, + "epoch": 0.25, + "learning_rate": 0.0002630930502020576, + "loss": 0.0303, "step": 94920 }, { - "epoch": 0.48, - "learning_rate": 0.00022815989021799998, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002630891619856862, + "loss": 0.0204, "step": 94930 }, { - "epoch": 0.48, - "learning_rate": 0.00022815232252498596, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.0002630852737693147, + "loss": 0.019, "step": 94940 }, { - "epoch": 0.48, - "learning_rate": 0.00022814475483197194, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.0002630813855529432, + "loss": 0.0221, "step": 94950 }, { - "epoch": 0.48, - "learning_rate": 0.00022813718713895795, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.00026307749733657173, + "loss": 0.0193, "step": 94960 }, { - "epoch": 0.48, - "learning_rate": 0.00022812961944594393, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002630736091202003, + "loss": 0.0259, "step": 94970 }, { - "epoch": 0.48, - "learning_rate": 0.0002281220517529299, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.0002630697209038288, + "loss": 0.0214, "step": 94980 }, { - "epoch": 0.48, - "learning_rate": 0.00022811448405991592, - "loss": 0.0203, + "epoch": 0.25, + "learning_rate": 0.0002630658326874574, + "loss": 0.0231, "step": 94990 }, { - "epoch": 0.48, - "learning_rate": 0.0002281069163669019, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002630619444710859, + "loss": 0.0236, "step": 95000 }, { - "epoch": 0.48, - "eval_cer": 0.9144848118450433, - "eval_loss": 0.012143060564994812, - "eval_runtime": 116.8022, - "eval_samples_per_second": 17.123, - "eval_steps_per_second": 4.281, + "epoch": 0.25, + "eval_cer": 0.8818146572779021, + "eval_loss": 0.01712987571954727, + "eval_runtime": 108.1006, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, "step": 95000 }, { - "epoch": 0.48, - "learning_rate": 0.00022809934867388788, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.00026305805625471447, + "loss": 0.0222, "step": 95010 }, { - "epoch": 0.48, - "learning_rate": 0.0002280917809808739, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.000263054168038343, + "loss": 0.0312, "step": 95020 }, { - "epoch": 0.48, - "learning_rate": 0.00022808421328785987, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002630502798219715, + "loss": 0.0223, "step": 95030 }, { - "epoch": 0.48, - "learning_rate": 0.00022807664559484586, - "loss": 0.0143, + "epoch": 0.25, + "learning_rate": 0.0002630463916056, + "loss": 0.0236, "step": 95040 }, { - "epoch": 0.48, - "learning_rate": 0.00022806907790183186, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002630425033892286, + "loss": 0.0203, "step": 95050 }, { - "epoch": 0.48, - "learning_rate": 0.00022806151020881785, - "loss": 0.0133, + "epoch": 0.25, + "learning_rate": 0.00026303861517285715, + "loss": 0.0268, "step": 95060 }, { - "epoch": 0.48, - "learning_rate": 0.00022805394251580383, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.00026303472695648567, + "loss": 0.0258, "step": 95070 }, { - "epoch": 0.48, - "learning_rate": 0.00022804637482278984, - "loss": 0.0126, + "epoch": 0.25, + "learning_rate": 0.0002630308387401142, + "loss": 0.0242, "step": 95080 }, { - "epoch": 0.48, - "learning_rate": 0.00022803880712977582, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002630269505237427, + "loss": 0.0207, "step": 95090 }, { - "epoch": 0.48, - "learning_rate": 0.0002280312394367618, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.00026302306230737126, + "loss": 0.0302, "step": 95100 }, { - "epoch": 0.48, - "learning_rate": 0.00022802367174374778, - "loss": 0.0134, + "epoch": 0.25, + "learning_rate": 0.0002630191740909998, + "loss": 0.0394, "step": 95110 }, { - "epoch": 0.48, - "learning_rate": 0.0002280161040507338, - "loss": 0.0182, + "epoch": 0.25, + "learning_rate": 0.00026301528587462835, + "loss": 0.0264, "step": 95120 }, { - "epoch": 0.48, - "learning_rate": 0.00022800853635771977, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.00026301139765825686, + "loss": 0.0219, "step": 95130 }, { - "epoch": 0.48, - "learning_rate": 0.00022800096866470575, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.00026300750944188543, + "loss": 0.0278, "step": 95140 }, { - "epoch": 0.48, - "learning_rate": 0.00022799340097169176, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026300362122551394, + "loss": 0.0278, "step": 95150 }, { - "epoch": 0.48, - "learning_rate": 0.00022798583327867774, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.00026299973300914246, + "loss": 0.0267, "step": 95160 }, { - "epoch": 0.48, - "learning_rate": 0.00022797826558566372, - "loss": 0.0139, + "epoch": 0.25, + "learning_rate": 0.000262995844792771, + "loss": 0.0246, "step": 95170 }, { - "epoch": 0.48, - "learning_rate": 0.00022797069789264973, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.00026299195657639954, + "loss": 0.0247, "step": 95180 }, { - "epoch": 0.48, - "learning_rate": 0.0002279631301996357, - "loss": 0.018, + "epoch": 0.25, + "learning_rate": 0.00026298806836002806, + "loss": 0.024, "step": 95190 }, { - "epoch": 0.48, - "learning_rate": 0.0002279555625066217, - "loss": 0.0143, + "epoch": 0.25, + "learning_rate": 0.0002629841801436566, + "loss": 0.0246, "step": 95200 }, { - "epoch": 0.48, - "learning_rate": 0.0002279479948136077, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.00026298029192728514, + "loss": 0.0258, "step": 95210 }, { - "epoch": 0.48, - "learning_rate": 0.00022794042712059368, - "loss": 0.0145, + "epoch": 0.25, + "learning_rate": 0.0002629764037109137, + "loss": 0.0233, "step": 95220 }, { - "epoch": 0.48, - "learning_rate": 0.00022793285942757967, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002629725154945422, + "loss": 0.0232, "step": 95230 }, { - "epoch": 0.48, - "learning_rate": 0.00022792529173456567, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.00026296862727817074, + "loss": 0.0231, "step": 95240 }, { - "epoch": 0.48, - "learning_rate": 0.00022791772404155166, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.00026296473906179925, + "loss": 0.0219, "step": 95250 }, { - "epoch": 0.48, - "learning_rate": 0.00022791015634853764, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002629608508454278, + "loss": 0.0233, "step": 95260 }, { - "epoch": 0.48, - "learning_rate": 0.00022790258865552365, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002629569626290564, + "loss": 0.0215, "step": 95270 }, { - "epoch": 0.48, - "learning_rate": 0.00022789502096250963, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002629530744126849, + "loss": 0.024, "step": 95280 }, { - "epoch": 0.48, - "learning_rate": 0.0002278874532694956, - "loss": 0.0332, + "epoch": 0.25, + "learning_rate": 0.0002629491861963134, + "loss": 0.0246, "step": 95290 }, { - "epoch": 0.48, - "learning_rate": 0.0002278798855764816, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.00026294529797994193, + "loss": 0.0181, "step": 95300 }, { - "epoch": 0.48, - "learning_rate": 0.0002278723178834676, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.0002629414097635705, + "loss": 0.0273, "step": 95310 }, { - "epoch": 0.48, - "learning_rate": 0.00022786475019045358, - "loss": 0.0529, + "epoch": 0.25, + "learning_rate": 0.000262937521547199, + "loss": 0.03, "step": 95320 }, { - "epoch": 0.48, - "learning_rate": 0.00022785718249743956, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002629336333308276, + "loss": 0.0268, "step": 95330 }, { - "epoch": 0.48, - "learning_rate": 0.00022784961480442557, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.0002629297451144561, + "loss": 0.0232, "step": 95340 }, { - "epoch": 0.48, - "learning_rate": 0.00022784204711141155, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026292585689808467, + "loss": 0.02, "step": 95350 }, { - "epoch": 0.48, - "learning_rate": 0.00022783447941839753, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.0002629219686817132, + "loss": 0.0213, "step": 95360 }, { - "epoch": 0.48, - "learning_rate": 0.00022782691172538354, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002629180804653417, + "loss": 0.0252, "step": 95370 }, { - "epoch": 0.48, - "learning_rate": 0.00022781934403236952, + "epoch": 0.25, + "learning_rate": 0.0002629141922489702, "loss": 0.0187, "step": 95380 }, { - "epoch": 0.48, - "learning_rate": 0.0002278117763393555, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002629103040325988, + "loss": 0.0474, "step": 95390 }, { - "epoch": 0.48, - "learning_rate": 0.0002278042086463415, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002629064158162273, + "loss": 0.0239, "step": 95400 }, { - "epoch": 0.48, - "learning_rate": 0.0002277966409533275, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.00026290252759985586, + "loss": 0.0216, "step": 95410 }, { - "epoch": 0.48, - "learning_rate": 0.00022778907326031348, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.0002628986393834844, + "loss": 0.0224, "step": 95420 }, { - "epoch": 0.48, - "learning_rate": 0.00022778150556729948, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026289475116711295, + "loss": 0.0261, "step": 95430 }, { - "epoch": 0.48, - "learning_rate": 0.00022777393787428547, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.00026289086295074146, + "loss": 0.0242, "step": 95440 }, { - "epoch": 0.48, - "learning_rate": 0.00022776637018127145, - "loss": 0.018, + "epoch": 0.25, + "learning_rate": 0.00026288697473437, + "loss": 0.0195, "step": 95450 }, { - "epoch": 0.48, - "learning_rate": 0.00022775880248825743, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.00026288308651799855, + "loss": 0.0212, "step": 95460 }, { - "epoch": 0.48, - "learning_rate": 0.00022775123479524344, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.00026287919830162706, + "loss": 0.0232, "step": 95470 }, { - "epoch": 0.48, - "learning_rate": 0.00022774366710222942, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.00026287531008525563, + "loss": 0.023, "step": 95480 }, { - "epoch": 0.48, - "learning_rate": 0.0002277360994092154, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.00026287142186888414, + "loss": 0.021, "step": 95490 }, { - "epoch": 0.48, - "learning_rate": 0.0002277285317162014, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.00026286753365251266, + "loss": 0.024, "step": 95500 }, { - "epoch": 0.48, - "learning_rate": 0.0002277209640231874, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.0002628636454361412, + "loss": 0.0206, "step": 95510 }, { - "epoch": 0.48, - "learning_rate": 0.00022771339633017337, - "loss": 0.019, + "epoch": 0.25, + "learning_rate": 0.00026285975721976974, + "loss": 0.0242, "step": 95520 }, { - "epoch": 0.48, - "learning_rate": 0.00022770582863715938, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.00026285586900339826, + "loss": 0.0225, "step": 95530 }, { - "epoch": 0.48, - "learning_rate": 0.00022769826094414536, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002628519807870268, + "loss": 0.0296, "step": 95540 }, { - "epoch": 0.48, - "learning_rate": 0.00022769069325113134, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026284809257065534, + "loss": 0.0278, "step": 95550 }, { - "epoch": 0.48, - "learning_rate": 0.00022768312555811735, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.0002628442043542839, + "loss": 0.0302, "step": 95560 }, { - "epoch": 0.48, - "learning_rate": 0.00022767555786510333, - "loss": 0.0152, + "epoch": 0.25, + "learning_rate": 0.0002628403161379124, + "loss": 0.0253, "step": 95570 }, { - "epoch": 0.48, - "learning_rate": 0.00022766799017208931, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026283642792154094, + "loss": 0.0206, "step": 95580 }, { - "epoch": 0.48, - "learning_rate": 0.00022766042247907532, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.00026283253970516945, + "loss": 0.0221, "step": 95590 }, { - "epoch": 0.48, - "learning_rate": 0.0002276528547860613, - "loss": 0.0194, + "epoch": 0.25, + "learning_rate": 0.000262828651488798, + "loss": 0.0269, "step": 95600 }, { - "epoch": 0.48, - "learning_rate": 0.00022764528709304729, - "loss": 0.0181, + "epoch": 0.25, + "learning_rate": 0.0002628247632724266, + "loss": 0.0239, "step": 95610 }, { - "epoch": 0.48, - "learning_rate": 0.00022763771940003327, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.0002628208750560551, + "loss": 0.0263, "step": 95620 }, { - "epoch": 0.48, - "learning_rate": 0.00022763015170701928, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.0002628169868396836, + "loss": 0.0246, "step": 95630 }, { - "epoch": 0.48, - "learning_rate": 0.00022762258401400526, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.0002628130986233122, + "loss": 0.0213, "step": 95640 }, { - "epoch": 0.48, - "learning_rate": 0.00022761501632099124, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002628092104069407, + "loss": 0.0205, "step": 95650 }, { - "epoch": 0.48, - "learning_rate": 0.00022760744862797725, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.0002628053221905692, + "loss": 0.0243, "step": 95660 }, { - "epoch": 0.48, - "learning_rate": 0.00022759988093496323, - "loss": 0.0214, + "epoch": 0.25, + "learning_rate": 0.0002628014339741978, + "loss": 0.0259, "step": 95670 }, { - "epoch": 0.48, - "learning_rate": 0.0002275923132419492, - "loss": 0.0203, + "epoch": 0.25, + "learning_rate": 0.0002627975457578263, + "loss": 0.0225, "step": 95680 }, { - "epoch": 0.48, - "learning_rate": 0.00022758474554893522, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.00026279365754145487, + "loss": 0.0225, "step": 95690 }, { - "epoch": 0.48, - "learning_rate": 0.0002275771778559212, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002627897693250834, + "loss": 0.0246, "step": 95700 }, { - "epoch": 0.48, - "learning_rate": 0.00022756961016290718, - "loss": 0.0123, + "epoch": 0.25, + "learning_rate": 0.0002627858811087119, + "loss": 0.0295, "step": 95710 }, { - "epoch": 0.48, - "learning_rate": 0.0002275620424698932, - "loss": 0.0182, + "epoch": 0.25, + "learning_rate": 0.00026278199289234047, + "loss": 0.0247, "step": 95720 }, { - "epoch": 0.48, - "learning_rate": 0.00022755447477687917, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.000262778104675969, + "loss": 0.0198, "step": 95730 }, { - "epoch": 0.48, - "learning_rate": 0.00022754690708386515, - "loss": 0.0231, + "epoch": 0.25, + "learning_rate": 0.0002627742164595975, + "loss": 0.0252, "step": 95740 }, { - "epoch": 0.48, - "learning_rate": 0.00022753933939085116, - "loss": 0.0151, + "epoch": 0.25, + "learning_rate": 0.00026277032824322606, + "loss": 0.0224, "step": 95750 }, { - "epoch": 0.48, - "learning_rate": 0.00022753177169783714, - "loss": 0.018, + "epoch": 0.25, + "learning_rate": 0.00026276644002685463, + "loss": 0.0235, "step": 95760 }, { - "epoch": 0.48, - "learning_rate": 0.00022752420400482312, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.00026276255181048315, + "loss": 0.02, "step": 95770 }, { - "epoch": 0.48, - "learning_rate": 0.00022751663631180913, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.00026275866359411166, + "loss": 0.0227, "step": 95780 }, { - "epoch": 0.48, - "learning_rate": 0.00022750906861879511, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002627547753777402, + "loss": 0.0249, "step": 95790 }, { - "epoch": 0.48, - "learning_rate": 0.0002275015009257811, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002627508871613687, + "loss": 0.018, "step": 95800 }, { - "epoch": 0.48, - "learning_rate": 0.00022749393323276708, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.00026274699894499726, + "loss": 0.0222, "step": 95810 }, { - "epoch": 0.48, - "learning_rate": 0.00022748636553975309, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.00026274311072862583, + "loss": 0.0268, "step": 95820 }, { - "epoch": 0.48, - "learning_rate": 0.00022747879784673907, - "loss": 0.018, + "epoch": 0.25, + "learning_rate": 0.00026273922251225434, + "loss": 0.0263, "step": 95830 }, { - "epoch": 0.48, - "learning_rate": 0.00022747123015372505, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.00026273533429588286, + "loss": 0.0219, "step": 95840 }, { - "epoch": 0.48, - "learning_rate": 0.00022746366246071106, - "loss": 0.0138, + "epoch": 0.25, + "learning_rate": 0.0002627314460795114, + "loss": 0.0213, "step": 95850 }, { - "epoch": 0.48, - "learning_rate": 0.00022745609476769704, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.00026272755786313994, + "loss": 0.0186, "step": 95860 }, { - "epoch": 0.48, - "learning_rate": 0.00022744852707468302, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.00026272366964676845, + "loss": 0.0234, "step": 95870 }, { - "epoch": 0.48, - "learning_rate": 0.00022744095938166903, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.000262719781430397, + "loss": 0.0201, "step": 95880 }, { - "epoch": 0.48, - "learning_rate": 0.000227433391688655, - "loss": 0.0162, + "epoch": 0.25, + "learning_rate": 0.00026271589321402554, + "loss": 0.0196, "step": 95890 }, { - "epoch": 0.48, - "learning_rate": 0.000227425823995641, - "loss": 0.0163, + "epoch": 0.25, + "learning_rate": 0.0002627120049976541, + "loss": 0.0332, "step": 95900 }, { - "epoch": 0.48, - "learning_rate": 0.000227418256302627, - "loss": 0.0139, + "epoch": 0.25, + "learning_rate": 0.0002627081167812826, + "loss": 0.0205, "step": 95910 }, { - "epoch": 0.48, - "learning_rate": 0.00022741068860961298, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026270422856491114, + "loss": 0.0223, "step": 95920 }, { - "epoch": 0.48, - "learning_rate": 0.00022740312091659896, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.0002627003403485397, + "loss": 0.0253, "step": 95930 }, { - "epoch": 0.48, - "learning_rate": 0.00022739555322358497, - "loss": 0.0145, + "epoch": 0.25, + "learning_rate": 0.0002626964521321682, + "loss": 0.0275, "step": 95940 }, { - "epoch": 0.48, - "learning_rate": 0.00022738798553057095, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002626925639157968, + "loss": 0.0231, "step": 95950 }, { - "epoch": 0.48, - "learning_rate": 0.00022738041783755693, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002626886756994253, + "loss": 0.0235, "step": 95960 }, { - "epoch": 0.48, - "learning_rate": 0.00022737285014454292, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.00026268478748305387, + "loss": 0.0194, "step": 95970 }, { - "epoch": 0.48, - "learning_rate": 0.00022736528245152892, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002626808992666824, + "loss": 0.0291, "step": 95980 }, { - "epoch": 0.48, - "learning_rate": 0.0002273577147585149, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002626770110503109, + "loss": 0.0247, "step": 95990 }, { - "epoch": 0.48, - "learning_rate": 0.0002273501470655009, - "loss": 0.0244, + "epoch": 0.25, + "learning_rate": 0.0002626731228339394, + "loss": 0.0224, "step": 96000 }, { - "epoch": 0.48, - "eval_cer": 0.9144906342217957, - "eval_loss": 0.011497566476464272, - "eval_runtime": 116.7865, - "eval_samples_per_second": 17.125, - "eval_steps_per_second": 4.281, + "epoch": 0.25, + "eval_cer": 0.881751673615864, + "eval_loss": 0.017516400665044785, + "eval_runtime": 107.996, + "eval_samples_per_second": 18.519, + "eval_steps_per_second": 4.63, "step": 96000 }, { - "epoch": 0.48, - "learning_rate": 0.0002273425793724869, - "loss": 0.0185, + "epoch": 0.25, + "learning_rate": 0.000262669234617568, + "loss": 0.03, "step": 96010 }, { - "epoch": 0.48, - "learning_rate": 0.00022733501167947288, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002626653464011965, + "loss": 0.0249, "step": 96020 }, { - "epoch": 0.48, - "learning_rate": 0.00022732744398645886, - "loss": 0.0142, + "epoch": 0.25, + "learning_rate": 0.00026266145818482507, + "loss": 0.0214, "step": 96030 }, { - "epoch": 0.48, - "learning_rate": 0.00022731987629344487, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002626575699684536, + "loss": 0.0229, "step": 96040 }, { - "epoch": 0.48, - "learning_rate": 0.00022731230860043085, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.0002626536817520821, + "loss": 0.0199, "step": 96050 }, { - "epoch": 0.48, - "learning_rate": 0.00022730474090741683, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.00026264979353571066, + "loss": 0.0229, "step": 96060 }, { - "epoch": 0.48, - "learning_rate": 0.00022729717321440284, - "loss": 0.0204, + "epoch": 0.25, + "learning_rate": 0.0002626459053193392, + "loss": 0.0228, "step": 96070 }, { - "epoch": 0.48, - "learning_rate": 0.00022728960552138882, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002626420171029677, + "loss": 0.0202, "step": 96080 }, { - "epoch": 0.48, - "learning_rate": 0.0002272820378283748, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.00026263812888659626, + "loss": 0.0246, "step": 96090 }, { - "epoch": 0.48, - "learning_rate": 0.0002272744701353608, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.00026263424067022483, + "loss": 0.0272, "step": 96100 }, { - "epoch": 0.48, - "learning_rate": 0.0002272669024423468, - "loss": 0.0193, + "epoch": 0.25, + "learning_rate": 0.00026263035245385335, + "loss": 0.0252, "step": 96110 }, { - "epoch": 0.48, - "learning_rate": 0.00022725933474933277, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.00026262646423748186, + "loss": 0.0245, "step": 96120 }, { - "epoch": 0.48, - "learning_rate": 0.00022725176705631875, - "loss": 0.0213, + "epoch": 0.25, + "learning_rate": 0.0002626225760211104, + "loss": 0.0236, "step": 96130 }, { - "epoch": 0.49, - "learning_rate": 0.00022724419936330476, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.00026261868780473894, + "loss": 0.0206, "step": 96140 }, { - "epoch": 0.49, - "learning_rate": 0.00022723663167029074, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.00026261479958836746, + "loss": 0.0211, "step": 96150 }, { - "epoch": 0.49, - "learning_rate": 0.0002272290639772767, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.000262610911371996, + "loss": 0.019, "step": 96160 }, { - "epoch": 0.49, - "learning_rate": 0.0002272214962842627, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.00026260702315562454, + "loss": 0.0243, "step": 96170 }, { - "epoch": 0.49, - "learning_rate": 0.0002272139285912487, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002626031349392531, + "loss": 0.0239, "step": 96180 }, { - "epoch": 0.49, - "learning_rate": 0.00022720636089823467, - "loss": 0.0181, + "epoch": 0.25, + "learning_rate": 0.0002625992467228816, + "loss": 0.0226, "step": 96190 }, { - "epoch": 0.49, - "learning_rate": 0.00022719879320522065, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.00026259535850651014, + "loss": 0.0216, "step": 96200 }, { - "epoch": 0.49, - "learning_rate": 0.00022719122551220666, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.00026259147029013865, + "loss": 0.0244, "step": 96210 }, { - "epoch": 0.49, - "learning_rate": 0.00022718365781919264, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.0002625875820737672, + "loss": 0.0203, "step": 96220 }, { - "epoch": 0.49, - "learning_rate": 0.00022717609012617862, - "loss": 0.0201, + "epoch": 0.25, + "learning_rate": 0.00026258369385739574, + "loss": 0.0193, "step": 96230 }, { - "epoch": 0.49, - "learning_rate": 0.00022716852243316463, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.0002625798056410243, + "loss": 0.0216, "step": 96240 }, { - "epoch": 0.49, - "learning_rate": 0.0002271609547401506, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002625759174246528, + "loss": 0.0192, "step": 96250 }, { - "epoch": 0.49, - "learning_rate": 0.0002271533870471366, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002625720292082814, + "loss": 0.0254, "step": 96260 }, { - "epoch": 0.49, - "learning_rate": 0.0002271458193541226, - "loss": 0.0141, + "epoch": 0.25, + "learning_rate": 0.0002625681409919099, + "loss": 0.0176, "step": 96270 }, { - "epoch": 0.49, - "learning_rate": 0.00022713825166110858, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002625642527755384, + "loss": 0.0225, "step": 96280 }, { - "epoch": 0.49, - "learning_rate": 0.00022713068396809457, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026256036455916693, + "loss": 0.0221, "step": 96290 }, { - "epoch": 0.49, - "learning_rate": 0.00022712311627508057, - "loss": 0.013, + "epoch": 0.25, + "learning_rate": 0.0002625564763427955, + "loss": 0.0228, "step": 96300 }, { - "epoch": 0.49, - "learning_rate": 0.00022711554858206656, - "loss": 0.0132, + "epoch": 0.25, + "learning_rate": 0.00026255258812642407, + "loss": 0.0239, "step": 96310 }, { - "epoch": 0.49, - "learning_rate": 0.00022710798088905254, - "loss": 0.0177, + "epoch": 0.25, + "learning_rate": 0.0002625486999100526, + "loss": 0.0254, "step": 96320 }, { - "epoch": 0.49, - "learning_rate": 0.00022710041319603855, - "loss": 0.017, + "epoch": 0.25, + "learning_rate": 0.0002625448116936811, + "loss": 0.0238, "step": 96330 }, { - "epoch": 0.49, - "learning_rate": 0.00022709284550302453, - "loss": 0.0189, + "epoch": 0.25, + "learning_rate": 0.0002625409234773096, + "loss": 0.0202, "step": 96340 }, { - "epoch": 0.49, - "learning_rate": 0.0002270852778100105, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002625370352609382, + "loss": 0.0183, "step": 96350 }, { - "epoch": 0.49, - "learning_rate": 0.0002270777101169965, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.0002625331470445667, + "loss": 0.0207, "step": 96360 }, { - "epoch": 0.49, - "learning_rate": 0.0002270701424239825, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.00026252925882819527, + "loss": 0.0237, "step": 96370 }, { - "epoch": 0.49, - "learning_rate": 0.00022706257473096848, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002625253706118238, + "loss": 0.0236, "step": 96380 }, { - "epoch": 0.49, - "learning_rate": 0.00022705500703795446, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.00026252148239545235, + "loss": 0.0191, "step": 96390 }, { - "epoch": 0.49, - "learning_rate": 0.00022704743934494047, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026251759417908086, + "loss": 0.0277, "step": 96400 }, { - "epoch": 0.49, - "learning_rate": 0.00022703987165192645, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002625137059627094, + "loss": 0.019, "step": 96410 }, { - "epoch": 0.49, - "learning_rate": 0.00022703230395891243, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002625098177463379, + "loss": 0.0202, "step": 96420 }, { - "epoch": 0.49, - "learning_rate": 0.00022702473626589844, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026250592952996646, + "loss": 0.0288, "step": 96430 }, { - "epoch": 0.49, - "learning_rate": 0.00022701716857288442, - "loss": 0.0172, + "epoch": 0.25, + "learning_rate": 0.000262502041313595, + "loss": 0.0273, "step": 96440 }, { - "epoch": 0.49, - "learning_rate": 0.0002270096008798704, - "loss": 0.0163, + "epoch": 0.25, + "learning_rate": 0.00026249815309722354, + "loss": 0.0206, "step": 96450 }, { - "epoch": 0.49, - "learning_rate": 0.0002270020331868564, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.00026249426488085206, + "loss": 0.0216, "step": 96460 }, { - "epoch": 0.49, - "learning_rate": 0.0002269944654938424, - "loss": 0.0123, + "epoch": 0.25, + "learning_rate": 0.00026249037666448063, + "loss": 0.0235, "step": 96470 }, { - "epoch": 0.49, - "learning_rate": 0.00022698689780082838, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.00026248648844810914, + "loss": 0.0196, "step": 96480 }, { - "epoch": 0.49, - "learning_rate": 0.00022697933010781438, - "loss": 0.0138, + "epoch": 0.25, + "learning_rate": 0.00026248260023173766, + "loss": 0.0204, "step": 96490 }, { - "epoch": 0.49, - "learning_rate": 0.00022697176241480037, - "loss": 0.0142, + "epoch": 0.25, + "learning_rate": 0.0002624787120153662, + "loss": 0.0219, "step": 96500 }, { - "epoch": 0.49, - "learning_rate": 0.00022696419472178635, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.00026247482379899474, + "loss": 0.0186, "step": 96510 }, { - "epoch": 0.49, - "learning_rate": 0.00022695662702877233, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002624709355826233, + "loss": 0.0247, "step": 96520 }, { - "epoch": 0.49, - "learning_rate": 0.00022694905933575834, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002624670473662518, + "loss": 0.0307, "step": 96530 }, { - "epoch": 0.49, - "learning_rate": 0.00022694149164274432, - "loss": 0.0202, + "epoch": 0.25, + "learning_rate": 0.00026246315914988034, + "loss": 0.0238, "step": 96540 }, { - "epoch": 0.49, - "learning_rate": 0.0002269339239497303, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.00026245927093350885, + "loss": 0.0259, "step": 96550 }, { - "epoch": 0.49, - "learning_rate": 0.0002269263562567163, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002624553827171374, + "loss": 0.0231, "step": 96560 }, { - "epoch": 0.49, - "learning_rate": 0.0002269187885637023, - "loss": 0.0142, + "epoch": 0.25, + "learning_rate": 0.00026245149450076594, + "loss": 0.0279, "step": 96570 }, { - "epoch": 0.49, - "learning_rate": 0.00022691122087068827, - "loss": 0.0137, + "epoch": 0.25, + "learning_rate": 0.0002624476062843945, + "loss": 0.0199, "step": 96580 }, { - "epoch": 0.49, - "learning_rate": 0.00022690365317767428, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.000262443718068023, + "loss": 0.0186, "step": 96590 }, { - "epoch": 0.49, - "learning_rate": 0.00022689608548466026, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002624398298516516, + "loss": 0.0189, "step": 96600 }, { - "epoch": 0.49, - "learning_rate": 0.00022688851779164624, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002624359416352801, + "loss": 0.022, "step": 96610 }, { - "epoch": 0.49, - "learning_rate": 0.00022688095009863225, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002624320534189086, + "loss": 0.0252, "step": 96620 }, { - "epoch": 0.49, - "learning_rate": 0.00022687338240561823, - "loss": 0.0162, + "epoch": 0.25, + "learning_rate": 0.00026242816520253713, + "loss": 0.0194, "step": 96630 }, { - "epoch": 0.49, - "learning_rate": 0.00022686581471260421, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.0002624242769861657, + "loss": 0.0182, "step": 96640 }, { - "epoch": 0.49, - "learning_rate": 0.00022685824701959022, - "loss": 0.0116, + "epoch": 0.25, + "learning_rate": 0.00026242038876979427, + "loss": 0.0244, "step": 96650 }, { - "epoch": 0.49, - "learning_rate": 0.0002268506793265762, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.0002624165005534228, + "loss": 0.0255, "step": 96660 }, { - "epoch": 0.49, - "learning_rate": 0.00022684311163356219, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.0002624126123370513, + "loss": 0.0238, "step": 96670 }, { - "epoch": 0.49, - "learning_rate": 0.0002268355439405482, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026240872412067987, + "loss": 0.0243, "step": 96680 }, { - "epoch": 0.49, - "learning_rate": 0.00022682797624753418, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.0002624048359043084, + "loss": 0.0197, "step": 96690 }, { - "epoch": 0.49, - "learning_rate": 0.00022682040855452016, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002624009476879369, + "loss": 0.0253, "step": 96700 }, { - "epoch": 0.49, - "learning_rate": 0.00022681284086150614, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.00026239705947156546, + "loss": 0.0206, "step": 96710 }, { - "epoch": 0.49, - "learning_rate": 0.00022680527316849215, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.000262393171255194, + "loss": 0.0228, "step": 96720 }, { - "epoch": 0.49, - "learning_rate": 0.00022679770547547813, - "loss": 0.0143, + "epoch": 0.25, + "learning_rate": 0.00026238928303882255, + "loss": 0.0206, "step": 96730 }, { - "epoch": 0.49, - "learning_rate": 0.0002267901377824641, - "loss": 0.0199, + "epoch": 0.25, + "learning_rate": 0.00026238539482245106, + "loss": 0.0258, "step": 96740 }, { - "epoch": 0.49, - "learning_rate": 0.00022678257008945012, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002623815066060796, + "loss": 0.0245, "step": 96750 }, { - "epoch": 0.49, - "learning_rate": 0.0002267750023964361, - "loss": 0.0136, + "epoch": 0.25, + "learning_rate": 0.00026237761838970815, + "loss": 0.0176, "step": 96760 }, { - "epoch": 0.49, - "learning_rate": 0.00022676743470342208, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.00026237373017333666, + "loss": 0.0235, "step": 96770 }, { - "epoch": 0.49, - "learning_rate": 0.0002267598670104081, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.0002623698419569652, + "loss": 0.0234, "step": 96780 }, { - "epoch": 0.49, - "learning_rate": 0.00022675229931739407, - "loss": 0.0163, + "epoch": 0.25, + "learning_rate": 0.00026236595374059374, + "loss": 0.0259, "step": 96790 }, { - "epoch": 0.49, - "learning_rate": 0.00022674473162438005, - "loss": 0.0152, + "epoch": 0.25, + "learning_rate": 0.00026236206552422226, + "loss": 0.0218, "step": 96800 }, { - "epoch": 0.49, - "learning_rate": 0.00022673716393136606, - "loss": 0.0138, + "epoch": 0.25, + "learning_rate": 0.0002623581773078508, + "loss": 0.0227, "step": 96810 }, { - "epoch": 0.49, - "learning_rate": 0.00022672959623835204, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026235428909147934, + "loss": 0.0229, "step": 96820 }, { - "epoch": 0.49, - "learning_rate": 0.00022672202854533802, - "loss": 0.0184, + "epoch": 0.25, + "learning_rate": 0.00026235040087510786, + "loss": 0.025, "step": 96830 }, { - "epoch": 0.49, - "learning_rate": 0.00022671446085232403, - "loss": 0.0129, + "epoch": 0.25, + "learning_rate": 0.00026234651265873637, + "loss": 0.0188, "step": 96840 }, { - "epoch": 0.49, - "learning_rate": 0.00022670689315931001, - "loss": 0.0134, + "epoch": 0.25, + "learning_rate": 0.00026234262444236494, + "loss": 0.0253, "step": 96850 }, { - "epoch": 0.49, - "learning_rate": 0.000226699325466296, - "loss": 0.0167, + "epoch": 0.25, + "learning_rate": 0.0002623387362259935, + "loss": 0.0241, "step": 96860 }, { - "epoch": 0.49, - "learning_rate": 0.00022669175777328198, - "loss": 0.0128, + "epoch": 0.25, + "learning_rate": 0.000262334848009622, + "loss": 0.0215, "step": 96870 }, { - "epoch": 0.49, - "learning_rate": 0.00022668419008026799, - "loss": 0.0195, + "epoch": 0.25, + "learning_rate": 0.00026233095979325054, + "loss": 0.021, "step": 96880 }, { - "epoch": 0.49, - "learning_rate": 0.00022667662238725397, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002623270715768791, + "loss": 0.0251, "step": 96890 }, { - "epoch": 0.49, - "learning_rate": 0.00022666905469423995, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.0002623231833605076, + "loss": 0.0225, "step": 96900 }, { - "epoch": 0.49, - "learning_rate": 0.00022666148700122596, - "loss": 0.0137, + "epoch": 0.25, + "learning_rate": 0.00026231929514413613, + "loss": 0.0237, "step": 96910 }, { - "epoch": 0.49, - "learning_rate": 0.00022665391930821194, - "loss": 0.0152, + "epoch": 0.25, + "learning_rate": 0.0002623154069277647, + "loss": 0.0289, "step": 96920 }, { - "epoch": 0.49, - "learning_rate": 0.00022664635161519792, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.0002623115187113932, + "loss": 0.0258, "step": 96930 }, { - "epoch": 0.49, - "learning_rate": 0.00022663878392218393, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002623076304950218, + "loss": 0.0183, "step": 96940 }, { - "epoch": 0.49, - "learning_rate": 0.0002266312162291699, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002623037422786503, + "loss": 0.0241, "step": 96950 }, { - "epoch": 0.49, - "learning_rate": 0.0002266236485361559, - "loss": 0.0227, + "epoch": 0.25, + "learning_rate": 0.0002622998540622788, + "loss": 0.0189, "step": 96960 }, { - "epoch": 0.49, - "learning_rate": 0.0002266160808431419, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.0002622959658459074, + "loss": 0.0213, "step": 96970 }, { - "epoch": 0.49, - "learning_rate": 0.00022660851315012788, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.0002622920776295359, + "loss": 0.0244, "step": 96980 }, { - "epoch": 0.49, - "learning_rate": 0.00022660094545711386, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002622881894131644, + "loss": 0.024, "step": 96990 }, { - "epoch": 0.49, - "learning_rate": 0.00022659337776409987, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.000262284301196793, + "loss": 0.0202, "step": 97000 }, { - "epoch": 0.49, - "eval_cer": 0.9144644335264098, - "eval_loss": 0.011374830268323421, - "eval_runtime": 116.7311, - "eval_samples_per_second": 17.133, - "eval_steps_per_second": 4.283, + "epoch": 0.25, + "eval_cer": 0.8818160569148363, + "eval_loss": 0.016042526811361313, + "eval_runtime": 107.9667, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, "step": 97000 }, { - "epoch": 0.49, - "learning_rate": 0.00022658581007108585, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002622804129804215, + "loss": 0.0227, "step": 97010 }, { - "epoch": 0.49, - "learning_rate": 0.00022657824237807183, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.00026227652476405007, + "loss": 0.0175, "step": 97020 }, { - "epoch": 0.49, - "learning_rate": 0.00022657067468505782, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002622726365476786, + "loss": 0.0196, "step": 97030 }, { - "epoch": 0.49, - "learning_rate": 0.00022656310699204382, - "loss": 0.0217, + "epoch": 0.25, + "learning_rate": 0.0002622687483313071, + "loss": 0.0252, "step": 97040 }, { - "epoch": 0.49, - "learning_rate": 0.0002265555392990298, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.00026226486011493566, + "loss": 0.021, "step": 97050 }, { - "epoch": 0.49, - "learning_rate": 0.0002265479716060158, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002622609718985642, + "loss": 0.0247, "step": 97060 }, { - "epoch": 0.49, - "learning_rate": 0.0002265404039130018, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.00026225708368219275, + "loss": 0.0296, "step": 97070 }, { - "epoch": 0.49, - "learning_rate": 0.00022653283621998778, - "loss": 0.0138, + "epoch": 0.25, + "learning_rate": 0.00026225319546582126, + "loss": 0.0238, "step": 97080 }, { - "epoch": 0.49, - "learning_rate": 0.00022652526852697376, - "loss": 0.0137, + "epoch": 0.25, + "learning_rate": 0.0002622493072494498, + "loss": 0.0204, "step": 97090 }, { - "epoch": 0.49, - "learning_rate": 0.00022651770083395977, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.00026224541903307834, + "loss": 0.0246, "step": 97100 }, { - "epoch": 0.49, - "learning_rate": 0.00022651013314094575, - "loss": 0.0136, + "epoch": 0.25, + "learning_rate": 0.00026224153081670686, + "loss": 0.0229, "step": 97110 }, { - "epoch": 0.49, - "learning_rate": 0.00022650256544793173, - "loss": 0.0191, + "epoch": 0.25, + "learning_rate": 0.0002622376426003354, + "loss": 0.0236, "step": 97120 }, { - "epoch": 0.49, - "learning_rate": 0.00022649499775491774, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.00026223375438396394, + "loss": 0.021, "step": 97130 }, { - "epoch": 0.49, - "learning_rate": 0.00022648743006190372, - "loss": 0.0108, + "epoch": 0.25, + "learning_rate": 0.0002622298661675925, + "loss": 0.0214, "step": 97140 }, { - "epoch": 0.49, - "learning_rate": 0.0002264798623688897, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.000262225977951221, + "loss": 0.0232, "step": 97150 }, { - "epoch": 0.49, - "learning_rate": 0.0002264722946758757, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026222208973484954, + "loss": 0.0223, "step": 97160 }, { - "epoch": 0.49, - "learning_rate": 0.0002264647269828617, - "loss": 0.0145, + "epoch": 0.25, + "learning_rate": 0.00026221820151847805, + "loss": 0.0248, "step": 97170 }, { - "epoch": 0.49, - "learning_rate": 0.00022645715928984767, - "loss": 0.0152, + "epoch": 0.25, + "learning_rate": 0.0002622143133021066, + "loss": 0.0238, "step": 97180 }, { - "epoch": 0.49, - "learning_rate": 0.00022644959159683365, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026221042508573514, + "loss": 0.0227, "step": 97190 }, { - "epoch": 0.49, - "learning_rate": 0.00022644202390381966, - "loss": 0.0151, + "epoch": 0.25, + "learning_rate": 0.0002622065368693637, + "loss": 0.022, "step": 97200 }, { - "epoch": 0.49, - "learning_rate": 0.00022643445621080564, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.0002622026486529922, + "loss": 0.0239, "step": 97210 }, { - "epoch": 0.49, - "learning_rate": 0.00022642688851779163, - "loss": 0.0143, + "epoch": 0.25, + "learning_rate": 0.0002621987604366208, + "loss": 0.02, "step": 97220 }, { - "epoch": 0.49, - "learning_rate": 0.00022641932082477763, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.0002621948722202493, + "loss": 0.023, "step": 97230 }, { - "epoch": 0.49, - "learning_rate": 0.00022641175313176362, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002621909840038778, + "loss": 0.0185, "step": 97240 }, { - "epoch": 0.49, - "learning_rate": 0.0002264041854387496, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026218709578750633, + "loss": 0.0222, "step": 97250 }, { - "epoch": 0.49, - "learning_rate": 0.0002263966177457356, - "loss": 0.0162, + "epoch": 0.25, + "learning_rate": 0.0002621832075711349, + "loss": 0.022, "step": 97260 }, { - "epoch": 0.49, - "learning_rate": 0.0002263890500527216, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.0002621793193547634, + "loss": 0.0252, "step": 97270 }, { - "epoch": 0.49, - "learning_rate": 0.00022638148235970757, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.000262175431138392, + "loss": 0.027, "step": 97280 }, { - "epoch": 0.49, - "learning_rate": 0.00022637391466669358, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002621715429220205, + "loss": 0.0224, "step": 97290 }, { - "epoch": 0.49, - "learning_rate": 0.00022636634697367956, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.000262167654705649, + "loss": 0.0209, "step": 97300 }, { - "epoch": 0.49, - "learning_rate": 0.00022635877928066554, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.0002621637664892776, + "loss": 0.0219, "step": 97310 }, { - "epoch": 0.49, - "learning_rate": 0.00022635121158765155, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.0002621598782729061, + "loss": 0.0227, "step": 97320 }, { - "epoch": 0.49, - "learning_rate": 0.00022634364389463753, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.0002621559900565346, + "loss": 0.0263, "step": 97330 }, { - "epoch": 0.49, - "learning_rate": 0.0002263360762016235, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002621521018401632, + "loss": 0.0215, "step": 97340 }, { - "epoch": 0.49, - "learning_rate": 0.00022632850850860952, - "loss": 0.0205, + "epoch": 0.25, + "learning_rate": 0.00026214821362379175, + "loss": 0.0214, "step": 97350 }, { - "epoch": 0.49, - "learning_rate": 0.0002263209408155955, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.00026214432540742026, + "loss": 0.0172, "step": 97360 }, { - "epoch": 0.49, - "learning_rate": 0.00022631337312258148, - "loss": 0.0188, + "epoch": 0.25, + "learning_rate": 0.0002621404371910488, + "loss": 0.0268, "step": 97370 }, { - "epoch": 0.49, - "learning_rate": 0.00022630580542956746, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002621365489746773, + "loss": 0.0224, "step": 97380 }, { - "epoch": 0.49, - "learning_rate": 0.00022629823773655347, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026213266075830586, + "loss": 0.0195, "step": 97390 }, { - "epoch": 0.49, - "learning_rate": 0.00022629067004353945, - "loss": 0.0132, + "epoch": 0.25, + "learning_rate": 0.0002621287725419344, + "loss": 0.0219, "step": 97400 }, { - "epoch": 0.49, - "learning_rate": 0.0002262831023505254, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026212488432556295, + "loss": 0.02, "step": 97410 }, { - "epoch": 0.49, - "learning_rate": 0.0002262755346575114, - "loss": 0.0175, + "epoch": 0.25, + "learning_rate": 0.00026212099610919146, + "loss": 0.0233, "step": 97420 }, { - "epoch": 0.49, - "learning_rate": 0.0002262679669644974, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.00026211710789282003, + "loss": 0.0182, "step": 97430 }, { - "epoch": 0.49, - "learning_rate": 0.00022626039927148338, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026211321967644854, + "loss": 0.0235, "step": 97440 }, { - "epoch": 0.49, - "learning_rate": 0.00022625283157846936, - "loss": 0.0173, + "epoch": 0.25, + "learning_rate": 0.00026210933146007706, + "loss": 0.0277, "step": 97450 }, { - "epoch": 0.49, - "learning_rate": 0.00022624526388545537, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.00026210544324370557, + "loss": 0.0193, "step": 97460 }, { - "epoch": 0.49, - "learning_rate": 0.00022623769619244135, - "loss": 0.0131, + "epoch": 0.25, + "learning_rate": 0.00026210155502733414, + "loss": 0.0187, "step": 97470 }, { - "epoch": 0.49, - "learning_rate": 0.00022623012849942733, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.00026209766681096266, + "loss": 0.0199, "step": 97480 }, { - "epoch": 0.49, - "learning_rate": 0.00022622256080641334, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.0002620937785945912, + "loss": 0.0221, "step": 97490 }, { - "epoch": 0.49, - "learning_rate": 0.00022621499311339932, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.00026208989037821974, + "loss": 0.023, "step": 97500 }, { - "epoch": 0.49, - "learning_rate": 0.0002262074254203853, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.00026208600216184825, + "loss": 0.0252, "step": 97510 }, { - "epoch": 0.49, - "learning_rate": 0.0002261998577273713, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002620821139454768, + "loss": 0.0199, "step": 97520 }, { - "epoch": 0.49, - "learning_rate": 0.0002261922900343573, - "loss": 0.0162, + "epoch": 0.25, + "learning_rate": 0.00026207822572910534, + "loss": 0.0201, "step": 97530 }, { - "epoch": 0.49, - "learning_rate": 0.00022618472234134328, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.0002620743375127339, + "loss": 0.0221, "step": 97540 }, { - "epoch": 0.49, - "learning_rate": 0.00022617715464832928, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.0002620704492963624, + "loss": 0.0242, "step": 97550 }, { - "epoch": 0.49, - "learning_rate": 0.00022616958695531527, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.000262066561079991, + "loss": 0.0248, "step": 97560 }, { - "epoch": 0.49, - "learning_rate": 0.00022616201926230125, - "loss": 0.0186, + "epoch": 0.25, + "learning_rate": 0.0002620626728636195, + "loss": 0.0214, "step": 97570 }, { - "epoch": 0.49, - "learning_rate": 0.00022615445156928726, - "loss": 0.0147, + "epoch": 0.25, + "learning_rate": 0.000262058784647248, + "loss": 0.0246, "step": 97580 }, { - "epoch": 0.49, - "learning_rate": 0.00022614688387627324, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026205489643087653, + "loss": 0.0233, "step": 97590 }, { - "epoch": 0.49, - "learning_rate": 0.00022613931618325922, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002620510082145051, + "loss": 0.02, "step": 97600 }, { - "epoch": 0.49, - "learning_rate": 0.0002261317484902452, - "loss": 0.0112, + "epoch": 0.25, + "learning_rate": 0.0002620471199981336, + "loss": 0.021, "step": 97610 }, { - "epoch": 0.49, - "learning_rate": 0.0002261241807972312, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.0002620432317817622, + "loss": 0.0219, "step": 97620 }, { - "epoch": 0.49, - "learning_rate": 0.0002261166131042172, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002620393435653907, + "loss": 0.0237, "step": 97630 }, { - "epoch": 0.49, - "learning_rate": 0.00022610904541120317, - "loss": 0.0125, + "epoch": 0.25, + "learning_rate": 0.00026203545534901927, + "loss": 0.0237, "step": 97640 }, { - "epoch": 0.49, - "learning_rate": 0.00022610147771818918, - "loss": 0.0181, + "epoch": 0.25, + "learning_rate": 0.0002620315671326478, + "loss": 0.0202, "step": 97650 }, { - "epoch": 0.49, - "learning_rate": 0.00022609391002517516, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002620276789162763, + "loss": 0.0219, "step": 97660 }, { - "epoch": 0.49, - "learning_rate": 0.00022608634233216114, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.0002620237906999048, + "loss": 0.0214, "step": 97670 }, { - "epoch": 0.49, - "learning_rate": 0.00022607877463914715, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.0002620199024835334, + "loss": 0.0295, "step": 97680 }, { - "epoch": 0.49, - "learning_rate": 0.00022607120694613313, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026201601426716195, + "loss": 0.0185, "step": 97690 }, { - "epoch": 0.49, - "learning_rate": 0.00022606363925311911, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026201212605079046, + "loss": 0.0212, "step": 97700 }, { - "epoch": 0.49, - "learning_rate": 0.00022605607156010512, - "loss": 0.0154, + "epoch": 0.25, + "learning_rate": 0.000262008237834419, + "loss": 0.0268, "step": 97710 }, { - "epoch": 0.49, - "learning_rate": 0.0002260485038670911, - "loss": 0.0138, + "epoch": 0.25, + "learning_rate": 0.00026200434961804755, + "loss": 0.0236, "step": 97720 }, { - "epoch": 0.49, - "learning_rate": 0.00022604093617407709, - "loss": 0.0142, + "epoch": 0.25, + "learning_rate": 0.00026200046140167606, + "loss": 0.0239, "step": 97730 }, { - "epoch": 0.49, - "learning_rate": 0.0002260333684810631, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002619965731853046, + "loss": 0.0194, "step": 97740 }, { - "epoch": 0.49, - "learning_rate": 0.00022602580078804908, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026199268496893314, + "loss": 0.0236, "step": 97750 }, { - "epoch": 0.49, - "learning_rate": 0.00022601823309503506, - "loss": 0.0156, + "epoch": 0.25, + "learning_rate": 0.00026198879675256166, + "loss": 0.02, "step": 97760 }, { - "epoch": 0.49, - "learning_rate": 0.00022601066540202104, - "loss": 0.0197, + "epoch": 0.25, + "learning_rate": 0.00026198490853619023, + "loss": 0.0215, "step": 97770 }, { - "epoch": 0.49, - "learning_rate": 0.00022600309770900705, - "loss": 0.0141, + "epoch": 0.25, + "learning_rate": 0.00026198102031981874, + "loss": 0.0231, "step": 97780 }, { - "epoch": 0.49, - "learning_rate": 0.00022599553001599303, - "loss": 0.0131, + "epoch": 0.25, + "learning_rate": 0.00026197713210344726, + "loss": 0.0298, "step": 97790 }, { - "epoch": 0.49, - "learning_rate": 0.000225987962322979, - "loss": 0.0169, + "epoch": 0.25, + "learning_rate": 0.00026197324388707577, + "loss": 0.0227, "step": 97800 }, { - "epoch": 0.49, - "learning_rate": 0.00022598039462996502, - "loss": 0.0127, + "epoch": 0.25, + "learning_rate": 0.00026196935567070434, + "loss": 0.0215, "step": 97810 }, { - "epoch": 0.49, - "learning_rate": 0.000225972826936951, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.00026196546745433285, + "loss": 0.0186, "step": 97820 }, { - "epoch": 0.49, - "learning_rate": 0.00022596525924393698, - "loss": 0.0144, + "epoch": 0.25, + "learning_rate": 0.0002619615792379614, + "loss": 0.0246, "step": 97830 }, { - "epoch": 0.49, - "learning_rate": 0.000225957691550923, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.00026195769102158994, + "loss": 0.0229, "step": 97840 }, { - "epoch": 0.49, - "learning_rate": 0.00022595012385790897, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002619538028052185, + "loss": 0.0218, "step": 97850 }, { - "epoch": 0.49, - "learning_rate": 0.00022594255616489495, - "loss": 0.0182, + "epoch": 0.25, + "learning_rate": 0.000261949914588847, + "loss": 0.018, "step": 97860 }, { - "epoch": 0.49, - "learning_rate": 0.00022593498847188096, - "loss": 0.0152, + "epoch": 0.25, + "learning_rate": 0.00026194602637247554, + "loss": 0.0201, "step": 97870 }, { - "epoch": 0.49, - "learning_rate": 0.00022592742077886694, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.00026194213815610405, + "loss": 0.0216, "step": 97880 }, { - "epoch": 0.49, - "learning_rate": 0.00022591985308585292, - "loss": 0.0179, + "epoch": 0.25, + "learning_rate": 0.0002619382499397326, + "loss": 0.0217, "step": 97890 }, { - "epoch": 0.49, - "learning_rate": 0.00022591228539283893, - "loss": 0.0192, + "epoch": 0.25, + "learning_rate": 0.0002619343617233612, + "loss": 0.0193, "step": 97900 }, { - "epoch": 0.49, - "learning_rate": 0.00022590471769982491, - "loss": 0.0176, + "epoch": 0.25, + "learning_rate": 0.0002619304735069897, + "loss": 0.0183, "step": 97910 }, { - "epoch": 0.49, - "learning_rate": 0.0002258971500068109, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002619265852906182, + "loss": 0.0198, "step": 97920 }, { - "epoch": 0.49, - "learning_rate": 0.00022588958231379688, - "loss": 0.0187, + "epoch": 0.25, + "learning_rate": 0.0002619226970742468, + "loss": 0.0229, "step": 97930 }, { - "epoch": 0.49, - "learning_rate": 0.00022588201462078289, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002619188088578753, + "loss": 0.0204, "step": 97940 }, { - "epoch": 0.49, - "learning_rate": 0.00022587444692776887, - "loss": 0.02, + "epoch": 0.25, + "learning_rate": 0.0002619149206415038, + "loss": 0.0208, "step": 97950 }, { - "epoch": 0.49, - "learning_rate": 0.00022586687923475485, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.0002619110324251324, + "loss": 0.0247, "step": 97960 }, { - "epoch": 0.49, - "learning_rate": 0.00022585931154174086, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002619071442087609, + "loss": 0.0209, "step": 97970 }, { - "epoch": 0.49, - "learning_rate": 0.00022585174384872684, - "loss": 0.0226, + "epoch": 0.25, + "learning_rate": 0.00026190325599238947, + "loss": 0.0225, "step": 97980 }, { - "epoch": 0.49, - "learning_rate": 0.00022584417615571282, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.000261899367776018, + "loss": 0.0227, "step": 97990 }, { - "epoch": 0.49, - "learning_rate": 0.00022583660846269883, - "loss": 0.0241, + "epoch": 0.25, + "learning_rate": 0.0002618954795596465, + "loss": 0.0202, "step": 98000 }, { - "epoch": 0.49, - "eval_cer": 0.9144799598644162, - "eval_loss": 0.011652790941298008, - "eval_runtime": 116.7303, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.25, + "eval_cer": 0.8818538471120592, + "eval_loss": 0.016256479546427727, + "eval_runtime": 107.9645, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, "step": 98000 }, { - "epoch": 0.49, - "learning_rate": 0.0002258290407696848, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.000261891591343275, + "loss": 0.0266, "step": 98010 }, { - "epoch": 0.49, - "learning_rate": 0.0002258214730766708, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002618877031269036, + "loss": 0.0213, "step": 98020 }, { - "epoch": 0.49, - "learning_rate": 0.0002258139053836568, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.0002618838149105321, + "loss": 0.0209, "step": 98030 }, { - "epoch": 0.49, - "learning_rate": 0.00022580633769064278, - "loss": 0.0136, + "epoch": 0.25, + "learning_rate": 0.00026187992669416066, + "loss": 0.0241, "step": 98040 }, { - "epoch": 0.49, - "learning_rate": 0.00022579876999762876, - "loss": 0.016, + "epoch": 0.25, + "learning_rate": 0.0002618760384777892, + "loss": 0.0208, "step": 98050 }, { - "epoch": 0.49, - "learning_rate": 0.00022579120230461477, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026187215026141775, + "loss": 0.0212, "step": 98060 }, { - "epoch": 0.49, - "learning_rate": 0.00022578363461160075, - "loss": 0.0166, + "epoch": 0.25, + "learning_rate": 0.00026186826204504626, + "loss": 0.0241, "step": 98070 }, { - "epoch": 0.49, - "learning_rate": 0.00022577606691858673, - "loss": 0.0158, + "epoch": 0.25, + "learning_rate": 0.0002618643738286748, + "loss": 0.0228, "step": 98080 }, { - "epoch": 0.49, - "learning_rate": 0.00022576849922557272, - "loss": 0.0232, + "epoch": 0.25, + "learning_rate": 0.00026186048561230334, + "loss": 0.0236, "step": 98090 }, { - "epoch": 0.49, - "learning_rate": 0.00022576093153255872, - "loss": 0.0201, + "epoch": 0.25, + "learning_rate": 0.00026185659739593186, + "loss": 0.0243, "step": 98100 }, { - "epoch": 0.49, - "learning_rate": 0.0002257533638395447, - "loss": 0.0174, + "epoch": 0.25, + "learning_rate": 0.0002618527091795604, + "loss": 0.0225, "step": 98110 }, { - "epoch": 0.5, - "learning_rate": 0.0002257457961465307, - "loss": 0.0155, + "epoch": 0.25, + "learning_rate": 0.00026184882096318894, + "loss": 0.0208, "step": 98120 }, { - "epoch": 0.5, - "learning_rate": 0.0002257382284535167, - "loss": 0.0171, + "epoch": 0.25, + "learning_rate": 0.00026184493274681746, + "loss": 0.0218, "step": 98130 }, { - "epoch": 0.5, - "learning_rate": 0.00022573066076050268, - "loss": 0.0146, + "epoch": 0.25, + "learning_rate": 0.000261841044530446, + "loss": 0.0229, "step": 98140 }, { - "epoch": 0.5, - "learning_rate": 0.00022572309306748866, - "loss": 0.019, + "epoch": 0.25, + "learning_rate": 0.00026183715631407454, + "loss": 0.0221, "step": 98150 }, { - "epoch": 0.5, - "learning_rate": 0.00022571552537447467, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.00026183326809770305, + "loss": 0.0188, "step": 98160 }, { - "epoch": 0.5, - "learning_rate": 0.00022570795768146065, - "loss": 0.0203, + "epoch": 0.25, + "learning_rate": 0.0002618293798813316, + "loss": 0.0269, "step": 98170 }, { - "epoch": 0.5, - "learning_rate": 0.00022570038998844663, - "loss": 0.0153, + "epoch": 0.25, + "learning_rate": 0.00026182549166496014, + "loss": 0.021, "step": 98180 }, { - "epoch": 0.5, - "learning_rate": 0.00022569282229543264, - "loss": 0.0159, + "epoch": 0.25, + "learning_rate": 0.0002618216034485887, + "loss": 0.0239, "step": 98190 }, { - "epoch": 0.5, - "learning_rate": 0.00022568525460241862, - "loss": 0.0148, + "epoch": 0.25, + "learning_rate": 0.0002618177152322172, + "loss": 0.025, "step": 98200 }, { - "epoch": 0.5, - "learning_rate": 0.0002256776869094046, - "loss": 0.0161, + "epoch": 0.25, + "learning_rate": 0.00026181382701584573, + "loss": 0.0194, "step": 98210 }, { - "epoch": 0.5, - "learning_rate": 0.0002256701192163906, - "loss": 0.0164, + "epoch": 0.25, + "learning_rate": 0.0002618099387994743, + "loss": 0.0218, "step": 98220 }, { - "epoch": 0.5, - "learning_rate": 0.0002256625515233766, - "loss": 0.0165, + "epoch": 0.25, + "learning_rate": 0.0002618060505831028, + "loss": 0.0222, "step": 98230 }, { - "epoch": 0.5, - "learning_rate": 0.00022565498383036257, - "loss": 0.014, + "epoch": 0.25, + "learning_rate": 0.0002618021623667314, + "loss": 0.0166, "step": 98240 }, { - "epoch": 0.5, - "learning_rate": 0.00022564741613734858, - "loss": 0.0178, + "epoch": 0.25, + "learning_rate": 0.0002617982741503599, + "loss": 0.0207, "step": 98250 }, { - "epoch": 0.5, - "learning_rate": 0.00022563984844433456, - "loss": 0.0131, + "epoch": 0.25, + "learning_rate": 0.0002617943859339884, + "loss": 0.0205, "step": 98260 }, { - "epoch": 0.5, - "learning_rate": 0.00022563228075132055, - "loss": 0.0209, + "epoch": 0.25, + "learning_rate": 0.000261790497717617, + "loss": 0.0233, "step": 98270 }, { - "epoch": 0.5, - "learning_rate": 0.00022562471305830653, - "loss": 0.0115, + "epoch": 0.25, + "learning_rate": 0.0002617866095012455, + "loss": 0.0188, "step": 98280 }, { - "epoch": 0.5, - "learning_rate": 0.00022561714536529253, - "loss": 0.0183, + "epoch": 0.25, + "learning_rate": 0.000261782721284874, + "loss": 0.0242, "step": 98290 }, { - "epoch": 0.5, - "learning_rate": 0.00022560957767227852, - "loss": 0.0143, + "epoch": 0.25, + "learning_rate": 0.0002617788330685026, + "loss": 0.0202, "step": 98300 }, { - "epoch": 0.5, - "learning_rate": 0.0002256020099792645, - "loss": 0.015, + "epoch": 0.25, + "learning_rate": 0.0002617749448521311, + "loss": 0.0292, "step": 98310 }, { - "epoch": 0.5, - "learning_rate": 0.0002255944422862505, - "loss": 0.0122, + "epoch": 0.25, + "learning_rate": 0.00026177105663575967, + "loss": 0.0216, "step": 98320 }, { - "epoch": 0.5, - "learning_rate": 0.0002255868745932365, - "loss": 0.0149, + "epoch": 0.25, + "learning_rate": 0.0002617671684193882, + "loss": 0.0205, "step": 98330 }, { - "epoch": 0.5, - "learning_rate": 0.00022557930690022247, - "loss": 0.0157, + "epoch": 0.25, + "learning_rate": 0.0002617632802030167, + "loss": 0.024, "step": 98340 }, { - "epoch": 0.5, - "learning_rate": 0.00022557173920720848, - "loss": 0.0168, + "epoch": 0.25, + "learning_rate": 0.00026175939198664526, + "loss": 0.0222, "step": 98350 }, { - "epoch": 0.5, - "learning_rate": 0.00022556417151419446, - "loss": 0.0139, + "epoch": 0.25, + "learning_rate": 0.0002617555037702738, + "loss": 0.03, "step": 98360 }, { - "epoch": 0.5, - "learning_rate": 0.00022555660382118044, - "loss": 0.0133, + "epoch": 0.25, + "learning_rate": 0.0002617516155539023, + "loss": 0.0225, "step": 98370 }, { - "epoch": 0.5, - "learning_rate": 0.00022554903612816645, - "loss": 0.0243, + "epoch": 0.26, + "learning_rate": 0.00026174772733753086, + "loss": 0.028, "step": 98380 }, { - "epoch": 0.5, - "learning_rate": 0.00022554146843515243, - "loss": 0.0139, + "epoch": 0.26, + "learning_rate": 0.00026174383912115943, + "loss": 0.0211, "step": 98390 }, { - "epoch": 0.5, - "learning_rate": 0.0002255339007421384, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.00026173995090478794, + "loss": 0.027, "step": 98400 }, { - "epoch": 0.5, - "learning_rate": 0.00022552633304912442, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.00026173606268841646, + "loss": 0.022, "step": 98410 }, { - "epoch": 0.5, - "learning_rate": 0.0002255187653561104, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.000261732174472045, + "loss": 0.0218, "step": 98420 }, { - "epoch": 0.5, - "learning_rate": 0.00022551119766309638, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026172828625567354, + "loss": 0.0186, "step": 98430 }, { - "epoch": 0.5, - "learning_rate": 0.00022550362997008237, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026172439803930206, + "loss": 0.0247, "step": 98440 }, { - "epoch": 0.5, - "learning_rate": 0.00022549606227706837, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.0002617205098229306, + "loss": 0.0229, "step": 98450 }, { - "epoch": 0.5, - "learning_rate": 0.00022548849458405436, - "loss": 0.013, + "epoch": 0.26, + "learning_rate": 0.00026171662160655914, + "loss": 0.0177, "step": 98460 }, { - "epoch": 0.5, - "learning_rate": 0.00022548092689104034, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002617127333901877, + "loss": 0.0238, "step": 98470 }, { - "epoch": 0.5, - "learning_rate": 0.00022547335919802635, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.0002617088451738162, + "loss": 0.0207, "step": 98480 }, { - "epoch": 0.5, - "learning_rate": 0.00022546579150501233, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.00026170495695744474, + "loss": 0.0229, "step": 98490 }, { - "epoch": 0.5, - "learning_rate": 0.0002254582238119983, - "loss": 0.0276, + "epoch": 0.26, + "learning_rate": 0.00026170106874107325, + "loss": 0.0228, "step": 98500 }, { - "epoch": 0.5, - "learning_rate": 0.00022545065611898432, - "loss": 0.0217, + "epoch": 0.26, + "learning_rate": 0.0002616971805247018, + "loss": 0.0234, "step": 98510 }, { - "epoch": 0.5, - "learning_rate": 0.0002254430884259703, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.00026169329230833034, + "loss": 0.0276, "step": 98520 }, { - "epoch": 0.5, - "learning_rate": 0.00022543552073295628, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002616894040919589, + "loss": 0.0217, "step": 98530 }, { - "epoch": 0.5, - "learning_rate": 0.0002254279530399423, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.0002616855158755874, + "loss": 0.0235, "step": 98540 }, { - "epoch": 0.5, - "learning_rate": 0.00022542038534692827, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.00026168162765921593, + "loss": 0.0204, "step": 98550 }, { - "epoch": 0.5, - "learning_rate": 0.00022541281765391425, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.0002616777394428445, + "loss": 0.0252, "step": 98560 }, { - "epoch": 0.5, - "learning_rate": 0.00022540524996090026, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.000261673851226473, + "loss": 0.0271, "step": 98570 }, { - "epoch": 0.5, - "learning_rate": 0.00022539768226788624, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.00026166996301010153, + "loss": 0.0296, "step": 98580 }, { - "epoch": 0.5, - "learning_rate": 0.00022539011457487222, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.0002616660747937301, + "loss": 0.0246, "step": 98590 }, { - "epoch": 0.5, - "learning_rate": 0.0002253825468818582, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.00026166218657735867, + "loss": 0.0202, "step": 98600 }, { - "epoch": 0.5, - "learning_rate": 0.0002253749791888442, - "loss": 0.0187, + "epoch": 0.26, + "learning_rate": 0.0002616582983609872, + "loss": 0.0229, "step": 98610 }, { - "epoch": 0.5, - "learning_rate": 0.0002253674114958302, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.0002616544101446157, + "loss": 0.0245, "step": 98620 }, { - "epoch": 0.5, - "learning_rate": 0.00022535984380281618, - "loss": 0.0126, + "epoch": 0.26, + "learning_rate": 0.0002616505219282442, + "loss": 0.021, "step": 98630 }, { - "epoch": 0.5, - "learning_rate": 0.00022535227610980218, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002616466337118728, + "loss": 0.0212, "step": 98640 }, { - "epoch": 0.5, - "learning_rate": 0.00022534470841678817, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002616427454955013, + "loss": 0.0243, "step": 98650 }, { - "epoch": 0.5, - "learning_rate": 0.00022533714072377415, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.00026163885727912986, + "loss": 0.0236, "step": 98660 }, { - "epoch": 0.5, - "learning_rate": 0.0002253295730307601, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.0002616349690627584, + "loss": 0.0226, "step": 98670 }, { - "epoch": 0.5, - "learning_rate": 0.0002253220053377461, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.00026163108084638695, + "loss": 0.0222, "step": 98680 }, { - "epoch": 0.5, - "learning_rate": 0.0002253144376447321, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.00026162719263001546, + "loss": 0.0247, "step": 98690 }, { - "epoch": 0.5, - "learning_rate": 0.00022530686995171807, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.000261623304413644, + "loss": 0.0238, "step": 98700 }, { - "epoch": 0.5, - "learning_rate": 0.00022529930225870408, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002616194161972725, + "loss": 0.0241, "step": 98710 }, { - "epoch": 0.5, - "learning_rate": 0.00022529173456569006, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.00026161552798090106, + "loss": 0.0229, "step": 98720 }, { - "epoch": 0.5, - "learning_rate": 0.00022528416687267604, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.00026161163976452963, + "loss": 0.0178, "step": 98730 }, { - "epoch": 0.5, - "learning_rate": 0.00022527659917966205, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.00026160775154815814, + "loss": 0.0238, "step": 98740 }, { - "epoch": 0.5, - "learning_rate": 0.00022526903148664803, - "loss": 0.0203, + "epoch": 0.26, + "learning_rate": 0.00026160386333178666, + "loss": 0.019, "step": 98750 }, { - "epoch": 0.5, - "learning_rate": 0.00022526146379363402, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.00026159997511541517, + "loss": 0.022, "step": 98760 }, { - "epoch": 0.5, - "learning_rate": 0.00022525389610062002, - "loss": 0.0125, + "epoch": 0.26, + "learning_rate": 0.00026159608689904374, + "loss": 0.0239, "step": 98770 }, { - "epoch": 0.5, - "learning_rate": 0.000225246328407606, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026159219868267226, + "loss": 0.0189, "step": 98780 }, { - "epoch": 0.5, - "learning_rate": 0.000225238760714592, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002615883104663008, + "loss": 0.0236, "step": 98790 }, { - "epoch": 0.5, - "learning_rate": 0.000225231193021578, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026158442224992934, + "loss": 0.0194, "step": 98800 }, { - "epoch": 0.5, - "learning_rate": 0.00022522362532856398, - "loss": 0.0132, + "epoch": 0.26, + "learning_rate": 0.0002615805340335579, + "loss": 0.0263, "step": 98810 }, { - "epoch": 0.5, - "learning_rate": 0.00022521605763554996, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.0002615766458171864, + "loss": 0.0217, "step": 98820 }, { - "epoch": 0.5, - "learning_rate": 0.00022520848994253594, - "loss": 0.0187, + "epoch": 0.26, + "learning_rate": 0.00026157275760081494, + "loss": 0.0203, "step": 98830 }, { - "epoch": 0.5, - "learning_rate": 0.00022520092224952195, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026156886938444345, + "loss": 0.0248, "step": 98840 }, { - "epoch": 0.5, - "learning_rate": 0.00022519335455650793, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.000261564981168072, + "loss": 0.0175, "step": 98850 }, { - "epoch": 0.5, - "learning_rate": 0.0002251857868634939, - "loss": 0.0135, + "epoch": 0.26, + "learning_rate": 0.00026156109295170053, + "loss": 0.0217, "step": 98860 }, { - "epoch": 0.5, - "learning_rate": 0.00022517821917047992, - "loss": 0.0213, + "epoch": 0.26, + "learning_rate": 0.0002615572047353291, + "loss": 0.0209, "step": 98870 }, { - "epoch": 0.5, - "learning_rate": 0.0002251706514774659, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002615533165189576, + "loss": 0.0261, "step": 98880 }, { - "epoch": 0.5, - "learning_rate": 0.00022516308378445188, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002615494283025862, + "loss": 0.0221, "step": 98890 }, { - "epoch": 0.5, - "learning_rate": 0.0002251555160914379, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.0002615455400862147, + "loss": 0.0204, "step": 98900 }, { - "epoch": 0.5, - "learning_rate": 0.00022514794839842387, - "loss": 0.0125, + "epoch": 0.26, + "learning_rate": 0.0002615416518698432, + "loss": 0.0233, "step": 98910 }, { - "epoch": 0.5, - "learning_rate": 0.00022514038070540985, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.00026153776365347173, + "loss": 0.0231, "step": 98920 }, { - "epoch": 0.5, - "learning_rate": 0.00022513281301239586, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002615338754371003, + "loss": 0.0212, "step": 98930 }, { - "epoch": 0.5, - "learning_rate": 0.00022512524531938184, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.00026152998722072887, + "loss": 0.019, "step": 98940 }, { - "epoch": 0.5, - "learning_rate": 0.00022511767762636783, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002615260990043574, + "loss": 0.0218, "step": 98950 }, { - "epoch": 0.5, - "learning_rate": 0.00022511010993335383, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002615222107879859, + "loss": 0.0286, "step": 98960 }, { - "epoch": 0.5, - "learning_rate": 0.00022510254224033982, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.00026151832257161447, + "loss": 0.0237, "step": 98970 }, { - "epoch": 0.5, - "learning_rate": 0.0002250949745473258, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.000261514434355243, + "loss": 0.0218, "step": 98980 }, { - "epoch": 0.5, - "learning_rate": 0.00022508740685431178, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.0002615105461388715, + "loss": 0.0207, "step": 98990 }, { - "epoch": 0.5, - "learning_rate": 0.0002250798391612978, - "loss": 0.0132, + "epoch": 0.26, + "learning_rate": 0.00026150665792250006, + "loss": 0.0205, "step": 99000 }, { - "epoch": 0.5, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.011587457731366158, - "eval_runtime": 116.7415, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.26, + "eval_cer": 0.8817950623608236, + "eval_loss": 0.015839723870158195, + "eval_runtime": 108.0387, + "eval_samples_per_second": 18.512, + "eval_steps_per_second": 4.628, "step": 99000 }, { - "epoch": 0.5, - "learning_rate": 0.00022507227146828377, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002615027697061286, + "loss": 0.0234, "step": 99010 }, { - "epoch": 0.5, - "learning_rate": 0.00022506470377526975, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.00026149888148975715, + "loss": 0.0225, "step": 99020 }, { - "epoch": 0.5, - "learning_rate": 0.00022505713608225576, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.00026149499327338566, + "loss": 0.0271, "step": 99030 }, { - "epoch": 0.5, - "learning_rate": 0.00022504956838924174, - "loss": 0.0127, + "epoch": 0.26, + "learning_rate": 0.0002614911050570142, + "loss": 0.0229, "step": 99040 }, { - "epoch": 0.5, - "learning_rate": 0.00022504200069622772, - "loss": 0.0199, + "epoch": 0.26, + "learning_rate": 0.0002614872168406427, + "loss": 0.0305, "step": 99050 }, { - "epoch": 0.5, - "learning_rate": 0.00022503443300321373, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026148332862427126, + "loss": 0.0265, "step": 99060 }, { - "epoch": 0.5, - "learning_rate": 0.0002250268653101997, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002614794404078998, + "loss": 0.0224, "step": 99070 }, { - "epoch": 0.5, - "learning_rate": 0.0002250192976171857, - "loss": 0.0187, + "epoch": 0.26, + "learning_rate": 0.00026147555219152834, + "loss": 0.0176, "step": 99080 }, { - "epoch": 0.5, - "learning_rate": 0.0002250117299241717, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.00026147166397515686, + "loss": 0.0172, "step": 99090 }, { - "epoch": 0.5, - "learning_rate": 0.00022500416223115768, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.0002614677757587854, + "loss": 0.0232, "step": 99100 }, { - "epoch": 0.5, - "learning_rate": 0.00022499659453814366, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.00026146388754241394, + "loss": 0.0228, "step": 99110 }, { - "epoch": 0.5, - "learning_rate": 0.00022498902684512967, - "loss": 0.013, + "epoch": 0.26, + "learning_rate": 0.00026145999932604245, + "loss": 0.0266, "step": 99120 }, { - "epoch": 0.5, - "learning_rate": 0.00022498145915211565, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.000261456111109671, + "loss": 0.0196, "step": 99130 }, { - "epoch": 0.5, - "learning_rate": 0.00022497389145910164, - "loss": 0.0135, + "epoch": 0.26, + "learning_rate": 0.00026145222289329954, + "loss": 0.0225, "step": 99140 }, { - "epoch": 0.5, - "learning_rate": 0.00022496632376608764, - "loss": 0.0234, + "epoch": 0.26, + "learning_rate": 0.0002614483346769281, + "loss": 0.0243, "step": 99150 }, { - "epoch": 0.5, - "learning_rate": 0.00022495875607307363, - "loss": 0.013, + "epoch": 0.26, + "learning_rate": 0.0002614444464605566, + "loss": 0.0239, "step": 99160 }, { - "epoch": 0.5, - "learning_rate": 0.0002249511883800596, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.00026144055824418514, + "loss": 0.0237, "step": 99170 }, { - "epoch": 0.5, - "learning_rate": 0.0002249436206870456, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.0002614366700278137, + "loss": 0.0182, "step": 99180 }, { - "epoch": 0.5, - "learning_rate": 0.0002249360529940316, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.0002614327818114422, + "loss": 0.0192, "step": 99190 }, { - "epoch": 0.5, - "learning_rate": 0.00022492848530101758, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026142889359507073, + "loss": 0.0272, "step": 99200 }, { - "epoch": 0.5, - "learning_rate": 0.00022492091760800356, - "loss": 0.0122, + "epoch": 0.26, + "learning_rate": 0.0002614250053786993, + "loss": 0.0214, "step": 99210 }, { - "epoch": 0.5, - "learning_rate": 0.00022491334991498957, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.0002614211171623278, + "loss": 0.0237, "step": 99220 }, { - "epoch": 0.5, - "learning_rate": 0.00022490578222197555, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.0002614172289459564, + "loss": 0.0208, "step": 99230 }, { - "epoch": 0.5, - "learning_rate": 0.00022489821452896153, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002614133407295849, + "loss": 0.0245, "step": 99240 }, { - "epoch": 0.5, - "learning_rate": 0.00022489064683594754, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.0002614094525132134, + "loss": 0.0259, "step": 99250 }, { - "epoch": 0.5, - "learning_rate": 0.00022488307914293352, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026140556429684193, + "loss": 0.0242, "step": 99260 }, { - "epoch": 0.5, - "learning_rate": 0.0002248755114499195, - "loss": 0.0116, + "epoch": 0.26, + "learning_rate": 0.0002614016760804705, + "loss": 0.0194, "step": 99270 }, { - "epoch": 0.5, - "learning_rate": 0.0002248679437569055, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.00026139778786409907, + "loss": 0.0268, "step": 99280 }, { - "epoch": 0.5, - "learning_rate": 0.0002248603760638915, - "loss": 0.0368, + "epoch": 0.26, + "learning_rate": 0.0002613938996477276, + "loss": 0.0219, "step": 99290 }, { - "epoch": 0.5, - "learning_rate": 0.00022485280837087747, - "loss": 0.0209, + "epoch": 0.26, + "learning_rate": 0.0002613900114313561, + "loss": 0.0215, "step": 99300 }, { - "epoch": 0.5, - "learning_rate": 0.00022484524067786348, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.00026138612321498466, + "loss": 0.0217, "step": 99310 }, { - "epoch": 0.5, - "learning_rate": 0.00022483767298484946, - "loss": 0.019, + "epoch": 0.26, + "learning_rate": 0.0002613822349986132, + "loss": 0.0239, "step": 99320 }, { - "epoch": 0.5, - "learning_rate": 0.00022483010529183545, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002613783467822417, + "loss": 0.0217, "step": 99330 }, { - "epoch": 0.5, - "learning_rate": 0.00022482253759882143, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.00026137445856587026, + "loss": 0.0265, "step": 99340 }, { - "epoch": 0.5, - "learning_rate": 0.00022481496990580744, - "loss": 0.0215, + "epoch": 0.26, + "learning_rate": 0.0002613705703494988, + "loss": 0.0266, "step": 99350 }, { - "epoch": 0.5, - "learning_rate": 0.00022480740221279342, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026136668213312734, + "loss": 0.0191, "step": 99360 }, { - "epoch": 0.5, - "learning_rate": 0.0002247998345197794, - "loss": 0.0178, + "epoch": 0.26, + "learning_rate": 0.00026136279391675586, + "loss": 0.0228, "step": 99370 }, { - "epoch": 0.5, - "learning_rate": 0.0002247922668267654, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.0002613589057003844, + "loss": 0.0236, "step": 99380 }, { - "epoch": 0.5, - "learning_rate": 0.0002247846991337514, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026135501748401294, + "loss": 0.0258, "step": 99390 }, { - "epoch": 0.5, - "learning_rate": 0.00022477713144073737, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.00026135112926764146, + "loss": 0.0284, "step": 99400 }, { - "epoch": 0.5, - "learning_rate": 0.00022476956374772338, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.00026134724105126997, + "loss": 0.0198, "step": 99410 }, { - "epoch": 0.5, - "learning_rate": 0.00022476199605470936, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.00026134335283489854, + "loss": 0.0243, "step": 99420 }, { - "epoch": 0.5, - "learning_rate": 0.00022475442836169534, - "loss": 0.0247, + "epoch": 0.26, + "learning_rate": 0.0002613394646185271, + "loss": 0.024, "step": 99430 }, { - "epoch": 0.5, - "learning_rate": 0.00022474686066868135, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.0002613355764021556, + "loss": 0.0189, "step": 99440 }, { - "epoch": 0.5, - "learning_rate": 0.00022473929297566733, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.00026133168818578414, + "loss": 0.0216, "step": 99450 }, { - "epoch": 0.5, - "learning_rate": 0.0002247317252826533, - "loss": 0.0129, + "epoch": 0.26, + "learning_rate": 0.00026132779996941265, + "loss": 0.0211, "step": 99460 }, { - "epoch": 0.5, - "learning_rate": 0.00022472415758963932, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.0002613239117530412, + "loss": 0.0249, "step": 99470 }, { - "epoch": 0.5, - "learning_rate": 0.0002247165898966253, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.00026132002353666974, + "loss": 0.0242, "step": 99480 }, { - "epoch": 0.5, - "learning_rate": 0.00022470902220361128, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002613161353202983, + "loss": 0.0225, "step": 99490 }, { - "epoch": 0.5, - "learning_rate": 0.00022470145451059727, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002613122471039268, + "loss": 0.0191, "step": 99500 }, { - "epoch": 0.5, - "learning_rate": 0.00022469388681758327, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.00026130835888755533, + "loss": 0.0225, "step": 99510 }, { - "epoch": 0.5, - "learning_rate": 0.00022468631912456926, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.0002613044706711839, + "loss": 0.0226, "step": 99520 }, { - "epoch": 0.5, - "learning_rate": 0.00022467875143155524, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.0002613005824548124, + "loss": 0.0258, "step": 99530 }, { - "epoch": 0.5, - "learning_rate": 0.00022467118373854125, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026129669423844093, + "loss": 0.0223, "step": 99540 }, { - "epoch": 0.5, - "learning_rate": 0.00022466361604552723, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.0002612928060220695, + "loss": 0.0273, "step": 99550 }, { - "epoch": 0.5, - "learning_rate": 0.0002246560483525132, - "loss": 0.0177, + "epoch": 0.26, + "learning_rate": 0.000261288917805698, + "loss": 0.0221, "step": 99560 }, { - "epoch": 0.5, - "learning_rate": 0.00022464848065949922, - "loss": 0.0186, + "epoch": 0.26, + "learning_rate": 0.0002612850295893266, + "loss": 0.0271, "step": 99570 }, { - "epoch": 0.5, - "learning_rate": 0.0002246409129664852, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002612811413729551, + "loss": 0.021, "step": 99580 }, { - "epoch": 0.5, - "learning_rate": 0.00022463334527347118, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.0002612772531565836, + "loss": 0.0252, "step": 99590 }, { - "epoch": 0.5, - "learning_rate": 0.0002246257775804572, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002612733649402122, + "loss": 0.0385, "step": 99600 }, { - "epoch": 0.5, - "learning_rate": 0.00022461820988744317, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002612694767238407, + "loss": 0.0196, "step": 99610 }, { - "epoch": 0.5, - "learning_rate": 0.00022461064219442915, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002612655885074692, + "loss": 0.0225, "step": 99620 }, { - "epoch": 0.5, - "learning_rate": 0.00022460307450141516, - "loss": 0.024, + "epoch": 0.26, + "learning_rate": 0.0002612617002910978, + "loss": 0.0233, "step": 99630 }, { - "epoch": 0.5, - "learning_rate": 0.00022459550680840114, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026125781207472635, + "loss": 0.0218, "step": 99640 }, { - "epoch": 0.5, - "learning_rate": 0.00022458793911538712, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026125392385835486, + "loss": 0.0198, "step": 99650 }, { - "epoch": 0.5, - "learning_rate": 0.00022458037142237313, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.0002612500356419834, + "loss": 0.0203, "step": 99660 }, { - "epoch": 0.5, - "learning_rate": 0.0002245728037293591, - "loss": 0.0141, + "epoch": 0.26, + "learning_rate": 0.0002612461474256119, + "loss": 0.0211, "step": 99670 }, { - "epoch": 0.5, - "learning_rate": 0.0002245652360363451, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026124225920924046, + "loss": 0.0228, "step": 99680 }, { - "epoch": 0.5, - "learning_rate": 0.00022455766834333108, - "loss": 0.0183, + "epoch": 0.26, + "learning_rate": 0.000261238370992869, + "loss": 0.0217, "step": 99690 }, { - "epoch": 0.5, - "learning_rate": 0.00022455010065031708, - "loss": 0.0212, + "epoch": 0.26, + "learning_rate": 0.00026123448277649754, + "loss": 0.0228, "step": 99700 }, { - "epoch": 0.5, - "learning_rate": 0.00022454253295730307, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.00026123059456012606, + "loss": 0.0227, "step": 99710 }, { - "epoch": 0.5, - "learning_rate": 0.00022453496526428905, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.00026122670634375463, + "loss": 0.0241, "step": 99720 }, { - "epoch": 0.5, - "learning_rate": 0.00022452739757127506, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.00026122281812738314, + "loss": 0.0253, "step": 99730 }, { - "epoch": 0.5, - "learning_rate": 0.00022451982987826104, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026121892991101166, + "loss": 0.02, "step": 99740 }, { - "epoch": 0.5, - "learning_rate": 0.00022451226218524702, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026121504169464017, + "loss": 0.0224, "step": 99750 }, { - "epoch": 0.5, - "learning_rate": 0.00022450469449223303, - "loss": 0.0138, + "epoch": 0.26, + "learning_rate": 0.00026121115347826874, + "loss": 0.0276, "step": 99760 }, { - "epoch": 0.5, - "learning_rate": 0.000224497126799219, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.00026120726526189725, + "loss": 0.0225, "step": 99770 }, { - "epoch": 0.5, - "learning_rate": 0.000224489559106205, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002612033770455258, + "loss": 0.0234, "step": 99780 }, { - "epoch": 0.5, - "learning_rate": 0.000224481991413191, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.00026119948882915434, + "loss": 0.0194, "step": 99790 }, { - "epoch": 0.5, - "learning_rate": 0.00022447442372017698, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.00026119560061278285, + "loss": 0.021, "step": 99800 }, { - "epoch": 0.5, - "learning_rate": 0.00022446685602716296, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.0002611917123964114, + "loss": 0.0239, "step": 99810 }, { - "epoch": 0.5, - "learning_rate": 0.00022445928833414897, - "loss": 0.0141, + "epoch": 0.26, + "learning_rate": 0.00026118782418003994, + "loss": 0.0196, "step": 99820 }, { - "epoch": 0.5, - "learning_rate": 0.00022445172064113495, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.0002611839359636685, + "loss": 0.0227, "step": 99830 }, { - "epoch": 0.5, - "learning_rate": 0.00022444415294812093, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.000261180047747297, + "loss": 0.0228, "step": 99840 }, { - "epoch": 0.5, - "learning_rate": 0.00022443658525510691, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002611761595309256, + "loss": 0.0228, "step": 99850 }, { - "epoch": 0.5, - "learning_rate": 0.00022442901756209292, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.0002611722713145541, + "loss": 0.0219, "step": 99860 }, { - "epoch": 0.5, - "learning_rate": 0.0002244214498690789, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002611683830981826, + "loss": 0.0187, "step": 99870 }, { - "epoch": 0.5, - "learning_rate": 0.00022441388217606489, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026116449488181113, + "loss": 0.0194, "step": 99880 }, { - "epoch": 0.5, - "learning_rate": 0.0002244063144830509, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002611606066654397, + "loss": 0.0174, "step": 99890 }, { - "epoch": 0.5, - "learning_rate": 0.00022439874679003688, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.0002611567184490682, + "loss": 0.0234, "step": 99900 }, { - "epoch": 0.5, - "learning_rate": 0.00022439117909702286, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.0002611528302326968, + "loss": 0.0185, "step": 99910 }, { - "epoch": 0.5, - "learning_rate": 0.00022438361140400887, - "loss": 0.0163, + "epoch": 0.26, + "learning_rate": 0.0002611489420163253, + "loss": 0.0366, "step": 99920 }, { - "epoch": 0.5, - "learning_rate": 0.00022437604371099482, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026114505379995387, + "loss": 0.0209, "step": 99930 }, { - "epoch": 0.5, - "learning_rate": 0.0002243684760179808, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002611411655835824, + "loss": 0.0215, "step": 99940 }, { - "epoch": 0.5, - "learning_rate": 0.00022436090832496678, - "loss": 0.013, + "epoch": 0.26, + "learning_rate": 0.0002611372773672109, + "loss": 0.0184, "step": 99950 }, { - "epoch": 0.5, - "learning_rate": 0.0002243533406319528, - "loss": 0.0189, + "epoch": 0.26, + "learning_rate": 0.0002611333891508394, + "loss": 0.0215, "step": 99960 }, { - "epoch": 0.5, - "learning_rate": 0.00022434577293893877, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.000261129500934468, + "loss": 0.0276, "step": 99970 }, { - "epoch": 0.5, - "learning_rate": 0.00022433820524592475, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.00026112561271809655, + "loss": 0.0232, "step": 99980 }, { - "epoch": 0.5, - "learning_rate": 0.00022433063755291076, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026112172450172506, + "loss": 0.0189, "step": 99990 }, { - "epoch": 0.5, - "learning_rate": 0.00022432306985989674, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002611178362853536, + "loss": 0.0244, "step": 100000 }, { - "epoch": 0.5, - "eval_cer": 0.9145051901636767, - "eval_loss": 0.011643487960100174, - "eval_runtime": 116.6776, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.26, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.01607738994061947, + "eval_runtime": 108.1372, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 4.624, "step": 100000 }, { - "epoch": 0.5, - "learning_rate": 0.00022431550216688273, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.0002611139480689821, + "loss": 0.0241, "step": 100010 }, { - "epoch": 0.5, - "learning_rate": 0.00022430793447386873, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026111005985261066, + "loss": 0.0211, "step": 100020 }, { - "epoch": 0.5, - "learning_rate": 0.00022430036678085472, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.0002611061716362392, + "loss": 0.046, "step": 100030 }, { - "epoch": 0.5, - "learning_rate": 0.0002242927990878407, - "loss": 0.0213, + "epoch": 0.26, + "learning_rate": 0.00026110228341986774, + "loss": 0.0293, "step": 100040 }, { - "epoch": 0.5, - "learning_rate": 0.0002242852313948267, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.00026109839520349626, + "loss": 0.0233, "step": 100050 }, { - "epoch": 0.5, - "learning_rate": 0.0002242776637018127, - "loss": 0.0217, + "epoch": 0.26, + "learning_rate": 0.0002610945069871248, + "loss": 0.0241, "step": 100060 }, { - "epoch": 0.5, - "learning_rate": 0.00022427009600879867, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.00026109061877075334, + "loss": 0.0217, "step": 100070 }, { - "epoch": 0.5, - "learning_rate": 0.00022426252831578465, - "loss": 0.0185, + "epoch": 0.26, + "learning_rate": 0.00026108673055438186, + "loss": 0.0227, "step": 100080 }, { - "epoch": 0.5, - "learning_rate": 0.00022425496062277066, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026108284233801037, + "loss": 0.0247, "step": 100090 }, { - "epoch": 0.51, - "learning_rate": 0.00022424739292975664, - "loss": 0.0131, + "epoch": 0.26, + "learning_rate": 0.00026107895412163894, + "loss": 0.023, "step": 100100 }, { - "epoch": 0.51, - "learning_rate": 0.00022423982523674262, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.00026107506590526745, + "loss": 0.0218, "step": 100110 }, { - "epoch": 0.51, - "learning_rate": 0.00022423225754372863, - "loss": 0.0163, + "epoch": 0.26, + "learning_rate": 0.000261071177688896, + "loss": 0.0217, "step": 100120 }, { - "epoch": 0.51, - "learning_rate": 0.0002242246898507146, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.00026106728947252454, + "loss": 0.0204, "step": 100130 }, { - "epoch": 0.51, - "learning_rate": 0.0002242171221577006, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.0002610634012561531, + "loss": 0.0181, "step": 100140 }, { - "epoch": 0.51, - "learning_rate": 0.0002242095544646866, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.0002610595130397816, + "loss": 0.021, "step": 100150 }, { - "epoch": 0.51, - "learning_rate": 0.00022420198677167258, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026105562482341013, + "loss": 0.0241, "step": 100160 }, { - "epoch": 0.51, - "learning_rate": 0.00022419441907865856, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.00026105173660703865, + "loss": 0.0221, "step": 100170 }, { - "epoch": 0.51, - "learning_rate": 0.00022418685138564457, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002610478483906672, + "loss": 0.0231, "step": 100180 }, { - "epoch": 0.51, - "learning_rate": 0.00022417928369263055, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.0002610439601742958, + "loss": 0.0257, "step": 100190 }, { - "epoch": 0.51, - "learning_rate": 0.00022417171599961654, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.0002610400719579243, + "loss": 0.024, "step": 100200 }, { - "epoch": 0.51, - "learning_rate": 0.00022416414830660254, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002610361837415528, + "loss": 0.0207, "step": 100210 }, { - "epoch": 0.51, - "learning_rate": 0.00022415658061358853, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002610322955251814, + "loss": 0.0226, "step": 100220 }, { - "epoch": 0.51, - "learning_rate": 0.0002241490129205745, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002610284073088099, + "loss": 0.029, "step": 100230 }, { - "epoch": 0.51, - "learning_rate": 0.0002241414452275605, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002610245190924384, + "loss": 0.0264, "step": 100240 }, { - "epoch": 0.51, - "learning_rate": 0.0002241338775345465, - "loss": 0.0186, + "epoch": 0.26, + "learning_rate": 0.000261020630876067, + "loss": 0.0246, "step": 100250 }, { - "epoch": 0.51, - "learning_rate": 0.00022412630984153248, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.0002610167426596955, + "loss": 0.0245, "step": 100260 }, { - "epoch": 0.51, - "learning_rate": 0.00022411874214851846, - "loss": 0.0182, + "epoch": 0.26, + "learning_rate": 0.00026101285444332406, + "loss": 0.0193, "step": 100270 }, { - "epoch": 0.51, - "learning_rate": 0.00022411117445550447, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002610089662269526, + "loss": 0.0197, "step": 100280 }, { - "epoch": 0.51, - "learning_rate": 0.00022410360676249045, - "loss": 0.0149, + "epoch": 0.26, + "learning_rate": 0.0002610050780105811, + "loss": 0.0241, "step": 100290 }, { - "epoch": 0.51, - "learning_rate": 0.00022409603906947643, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002610011897942096, + "loss": 0.0238, "step": 100300 }, { - "epoch": 0.51, - "learning_rate": 0.00022408847137646244, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.0002609973015778382, + "loss": 0.0232, "step": 100310 }, { - "epoch": 0.51, - "learning_rate": 0.00022408090368344842, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.00026099341336146675, + "loss": 0.0185, "step": 100320 }, { - "epoch": 0.51, - "learning_rate": 0.0002240733359904344, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026098952514509526, + "loss": 0.0279, "step": 100330 }, { - "epoch": 0.51, - "learning_rate": 0.0002240657682974204, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002609856369287238, + "loss": 0.0223, "step": 100340 }, { - "epoch": 0.51, - "learning_rate": 0.0002240582006044064, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.00026098174871235234, + "loss": 0.0223, "step": 100350 }, { - "epoch": 0.51, - "learning_rate": 0.00022405063291139237, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.00026097786049598086, + "loss": 0.0231, "step": 100360 }, { - "epoch": 0.51, - "learning_rate": 0.00022404306521837838, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.00026097397227960937, + "loss": 0.0207, "step": 100370 }, { - "epoch": 0.51, - "learning_rate": 0.00022403549752536436, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026097008406323794, + "loss": 0.0213, "step": 100380 }, { - "epoch": 0.51, - "learning_rate": 0.00022402792983235035, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.00026096619584686646, + "loss": 0.0245, "step": 100390 }, { - "epoch": 0.51, - "learning_rate": 0.00022402036213933633, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.000260962307630495, + "loss": 0.0227, "step": 100400 }, { - "epoch": 0.51, - "learning_rate": 0.00022401279444632234, - "loss": 0.0224, + "epoch": 0.26, + "learning_rate": 0.00026095841941412354, + "loss": 0.0236, "step": 100410 }, { - "epoch": 0.51, - "learning_rate": 0.00022400522675330832, - "loss": 0.019, + "epoch": 0.26, + "learning_rate": 0.00026095453119775205, + "loss": 0.0216, "step": 100420 }, { - "epoch": 0.51, - "learning_rate": 0.0002239976590602943, - "loss": 0.0199, + "epoch": 0.26, + "learning_rate": 0.0002609506429813806, + "loss": 0.0227, "step": 100430 }, { - "epoch": 0.51, - "learning_rate": 0.0002239900913672803, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026094675476500914, + "loss": 0.027, "step": 100440 }, { - "epoch": 0.51, - "learning_rate": 0.0002239825236742663, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.00026094286654863765, + "loss": 0.0248, "step": 100450 }, { - "epoch": 0.51, - "learning_rate": 0.00022397495598125227, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.0002609389783322662, + "loss": 0.0228, "step": 100460 }, { - "epoch": 0.51, - "learning_rate": 0.00022396738828823828, - "loss": 0.0125, + "epoch": 0.26, + "learning_rate": 0.0002609350901158948, + "loss": 0.0181, "step": 100470 }, { - "epoch": 0.51, - "learning_rate": 0.00022395982059522426, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.0002609312018995233, + "loss": 0.0184, "step": 100480 }, { - "epoch": 0.51, - "learning_rate": 0.00022395225290221024, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002609273136831518, + "loss": 0.0245, "step": 100490 }, { - "epoch": 0.51, - "learning_rate": 0.00022394468520919625, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.00026092342546678033, + "loss": 0.0253, "step": 100500 }, { - "epoch": 0.51, - "learning_rate": 0.00022393711751618223, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026091953725040885, + "loss": 0.0218, "step": 100510 }, { - "epoch": 0.51, - "learning_rate": 0.0002239295498231682, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002609156490340374, + "loss": 0.0249, "step": 100520 }, { - "epoch": 0.51, - "learning_rate": 0.00022392198213015422, - "loss": 0.0196, + "epoch": 0.26, + "learning_rate": 0.000260911760817666, + "loss": 0.0237, "step": 100530 }, { - "epoch": 0.51, - "learning_rate": 0.0002239144144371402, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.0002609078726012945, + "loss": 0.0275, "step": 100540 }, { - "epoch": 0.51, - "learning_rate": 0.00022390684674412618, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.000260903984384923, + "loss": 0.0228, "step": 100550 }, { - "epoch": 0.51, - "learning_rate": 0.0002238992790511122, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.0002609000961685516, + "loss": 0.0279, "step": 100560 }, { - "epoch": 0.51, - "learning_rate": 0.00022389171135809817, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.0002608962079521801, + "loss": 0.0254, "step": 100570 }, { - "epoch": 0.51, - "learning_rate": 0.00022388414366508416, - "loss": 0.0132, + "epoch": 0.26, + "learning_rate": 0.0002608923197358086, + "loss": 0.0253, "step": 100580 }, { - "epoch": 0.51, - "learning_rate": 0.00022387657597207014, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002608884315194372, + "loss": 0.0215, "step": 100590 }, { - "epoch": 0.51, - "learning_rate": 0.00022386900827905615, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002608845433030657, + "loss": 0.024, "step": 100600 }, { - "epoch": 0.51, - "learning_rate": 0.00022386144058604213, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.00026088065508669426, + "loss": 0.0226, "step": 100610 }, { - "epoch": 0.51, - "learning_rate": 0.0002238538728930281, - "loss": 0.0119, + "epoch": 0.26, + "learning_rate": 0.0002608767668703228, + "loss": 0.0256, "step": 100620 }, { - "epoch": 0.51, - "learning_rate": 0.00022384630520001412, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.0002608728786539513, + "loss": 0.0261, "step": 100630 }, { - "epoch": 0.51, - "learning_rate": 0.0002238387375070001, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.00026086899043757986, + "loss": 0.0236, "step": 100640 }, { - "epoch": 0.51, - "learning_rate": 0.00022383116981398608, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.0002608651022212084, + "loss": 0.0191, "step": 100650 }, { - "epoch": 0.51, - "learning_rate": 0.0002238236021209721, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002608612140048369, + "loss": 0.0231, "step": 100660 }, { - "epoch": 0.51, - "learning_rate": 0.00022381603442795807, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.00026085732578846546, + "loss": 0.0195, "step": 100670 }, { - "epoch": 0.51, - "learning_rate": 0.00022380846673494405, - "loss": 0.0135, + "epoch": 0.26, + "learning_rate": 0.00026085343757209403, + "loss": 0.0232, "step": 100680 }, { - "epoch": 0.51, - "learning_rate": 0.00022380089904193006, - "loss": 0.0151, + "epoch": 0.26, + "learning_rate": 0.00026084954935572254, + "loss": 0.0223, "step": 100690 }, { - "epoch": 0.51, - "learning_rate": 0.00022379333134891604, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.00026084566113935106, + "loss": 0.0222, "step": 100700 }, { - "epoch": 0.51, - "learning_rate": 0.00022378576365590202, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.00026084177292297957, + "loss": 0.0238, "step": 100710 }, { - "epoch": 0.51, - "learning_rate": 0.00022377819596288803, - "loss": 0.0127, + "epoch": 0.26, + "learning_rate": 0.00026083788470660814, + "loss": 0.0177, "step": 100720 }, { - "epoch": 0.51, - "learning_rate": 0.000223770628269874, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026083399649023665, + "loss": 0.0284, "step": 100730 }, { - "epoch": 0.51, - "learning_rate": 0.00022376306057686, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.0002608301082738652, + "loss": 0.0255, "step": 100740 }, { - "epoch": 0.51, - "learning_rate": 0.00022375549288384598, - "loss": 0.0149, + "epoch": 0.26, + "learning_rate": 0.00026082622005749374, + "loss": 0.0242, "step": 100750 }, { - "epoch": 0.51, - "learning_rate": 0.00022374792519083198, - "loss": 0.0138, + "epoch": 0.26, + "learning_rate": 0.00026082233184112225, + "loss": 0.0192, "step": 100760 }, { - "epoch": 0.51, - "learning_rate": 0.00022374035749781797, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002608184436247508, + "loss": 0.0256, "step": 100770 }, { - "epoch": 0.51, - "learning_rate": 0.00022373278980480395, - "loss": 0.0126, + "epoch": 0.26, + "learning_rate": 0.00026081455540837934, + "loss": 0.0208, "step": 100780 }, { - "epoch": 0.51, - "learning_rate": 0.00022372522211178996, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.00026081066719200785, + "loss": 0.0274, "step": 100790 }, { - "epoch": 0.51, - "learning_rate": 0.00022371765441877594, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.0002608067789756364, + "loss": 0.0235, "step": 100800 }, { - "epoch": 0.51, - "learning_rate": 0.00022371008672576192, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.00026080289075926493, + "loss": 0.0306, "step": 100810 }, { - "epoch": 0.51, - "learning_rate": 0.00022370251903274793, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.0002607990025428935, + "loss": 0.0194, "step": 100820 }, { - "epoch": 0.51, - "learning_rate": 0.0002236949513397339, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.000260795114326522, + "loss": 0.0222, "step": 100830 }, { - "epoch": 0.51, - "learning_rate": 0.0002236873836467199, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.00026079122611015053, + "loss": 0.0261, "step": 100840 }, { - "epoch": 0.51, - "learning_rate": 0.0002236798159537059, - "loss": 0.0141, + "epoch": 0.26, + "learning_rate": 0.0002607873378937791, + "loss": 0.029, "step": 100850 }, { - "epoch": 0.51, - "learning_rate": 0.00022367224826069188, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.0002607834496774076, + "loss": 0.0205, "step": 100860 }, { - "epoch": 0.51, - "learning_rate": 0.00022366468056767786, - "loss": 0.0126, + "epoch": 0.26, + "learning_rate": 0.0002607795614610362, + "loss": 0.0206, "step": 100870 }, { - "epoch": 0.51, - "learning_rate": 0.00022365711287466387, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.0002607756732446647, + "loss": 0.0235, "step": 100880 }, { - "epoch": 0.51, - "learning_rate": 0.00022364954518164985, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026077178502829327, + "loss": 0.02, "step": 100890 }, { - "epoch": 0.51, - "learning_rate": 0.00022364197748863583, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002607678968119218, + "loss": 0.0231, "step": 100900 }, { - "epoch": 0.51, - "learning_rate": 0.00022363440979562181, - "loss": 0.0138, + "epoch": 0.26, + "learning_rate": 0.0002607640085955503, + "loss": 0.0265, "step": 100910 }, { - "epoch": 0.51, - "learning_rate": 0.00022362684210260782, - "loss": 0.013, + "epoch": 0.26, + "learning_rate": 0.0002607601203791788, + "loss": 0.0222, "step": 100920 }, { - "epoch": 0.51, - "learning_rate": 0.0002236192744095938, - "loss": 0.0135, + "epoch": 0.26, + "learning_rate": 0.0002607562321628074, + "loss": 0.0176, "step": 100930 }, { - "epoch": 0.51, - "learning_rate": 0.00022361170671657979, - "loss": 0.025, + "epoch": 0.26, + "learning_rate": 0.0002607523439464359, + "loss": 0.0242, "step": 100940 }, { - "epoch": 0.51, - "learning_rate": 0.0002236041390235658, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.00026074845573006446, + "loss": 0.0206, "step": 100950 }, { - "epoch": 0.51, - "learning_rate": 0.00022359657133055178, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.000260744567513693, + "loss": 0.0225, "step": 100960 }, { - "epoch": 0.51, - "learning_rate": 0.00022358900363753776, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.00026074067929732155, + "loss": 0.0296, "step": 100970 }, { - "epoch": 0.51, - "learning_rate": 0.00022358143594452377, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.00026073679108095006, + "loss": 0.0254, "step": 100980 }, { - "epoch": 0.51, - "learning_rate": 0.00022357386825150975, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002607329028645786, + "loss": 0.0212, "step": 100990 }, { - "epoch": 0.51, - "learning_rate": 0.00022356630055849573, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.0002607290146482071, + "loss": 0.0226, "step": 101000 }, { - "epoch": 0.51, - "eval_cer": 0.9145022789753005, - "eval_loss": 0.011683492921292782, - "eval_runtime": 116.7876, - "eval_samples_per_second": 17.125, - "eval_steps_per_second": 4.281, + "epoch": 0.26, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.01563679240643978, + "eval_runtime": 108.1764, + "eval_samples_per_second": 18.488, + "eval_steps_per_second": 4.622, "step": 101000 }, { - "epoch": 0.51, - "learning_rate": 0.00022355873286548174, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026072512643183566, + "loss": 0.0201, "step": 101010 }, { - "epoch": 0.51, - "learning_rate": 0.00022355116517246772, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002607212382154642, + "loss": 0.0201, "step": 101020 }, { - "epoch": 0.51, - "learning_rate": 0.0002235435974794537, - "loss": 0.0156, + "epoch": 0.26, + "learning_rate": 0.00026071734999909274, + "loss": 0.0254, "step": 101030 }, { - "epoch": 0.51, - "learning_rate": 0.0002235360297864397, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.00026071346178272126, + "loss": 0.0207, "step": 101040 }, { - "epoch": 0.51, - "learning_rate": 0.0002235284620934257, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.00026070957356634977, + "loss": 0.0215, "step": 101050 }, { - "epoch": 0.51, - "learning_rate": 0.00022352089440041167, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.00026070568534997834, + "loss": 0.0232, "step": 101060 }, { - "epoch": 0.51, - "learning_rate": 0.00022351332670739765, - "loss": 0.0113, + "epoch": 0.26, + "learning_rate": 0.00026070179713360685, + "loss": 0.0203, "step": 101070 }, { - "epoch": 0.51, - "learning_rate": 0.00022350575901438366, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002606979089172354, + "loss": 0.0196, "step": 101080 }, { - "epoch": 0.51, - "learning_rate": 0.00022349819132136964, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.00026069402070086394, + "loss": 0.0232, "step": 101090 }, { - "epoch": 0.51, - "learning_rate": 0.00022349062362835562, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002606901324844925, + "loss": 0.0243, "step": 101100 }, { - "epoch": 0.51, - "learning_rate": 0.00022348305593534163, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.000260686244268121, + "loss": 0.0192, "step": 101110 }, { - "epoch": 0.51, - "learning_rate": 0.00022347548824232761, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.00026068235605174953, + "loss": 0.0193, "step": 101120 }, { - "epoch": 0.51, - "learning_rate": 0.0002234679205493136, - "loss": 0.0164, + "epoch": 0.26, + "learning_rate": 0.00026067846783537805, + "loss": 0.0203, "step": 101130 }, { - "epoch": 0.51, - "learning_rate": 0.0002234603528562996, - "loss": 0.0149, + "epoch": 0.26, + "learning_rate": 0.0002606745796190066, + "loss": 0.0181, "step": 101140 }, { - "epoch": 0.51, - "learning_rate": 0.00022345278516328559, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.00026067069140263513, + "loss": 0.0202, "step": 101150 }, { - "epoch": 0.51, - "learning_rate": 0.00022344521747027157, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002606668031862637, + "loss": 0.024, "step": 101160 }, { - "epoch": 0.51, - "learning_rate": 0.00022343764977725758, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.0002606629149698922, + "loss": 0.0217, "step": 101170 }, { - "epoch": 0.51, - "learning_rate": 0.00022343008208424353, - "loss": 0.0172, + "epoch": 0.26, + "learning_rate": 0.0002606590267535208, + "loss": 0.0239, "step": 101180 }, { - "epoch": 0.51, - "learning_rate": 0.0002234225143912295, - "loss": 0.0138, + "epoch": 0.26, + "learning_rate": 0.0002606551385371493, + "loss": 0.0188, "step": 101190 }, { - "epoch": 0.51, - "learning_rate": 0.0002234149466982155, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002606512503207778, + "loss": 0.0195, "step": 101200 }, { - "epoch": 0.51, - "learning_rate": 0.0002234073790052015, - "loss": 0.0155, + "epoch": 0.26, + "learning_rate": 0.00026064736210440633, + "loss": 0.0211, "step": 101210 }, { - "epoch": 0.51, - "learning_rate": 0.00022339981131218748, - "loss": 0.0124, + "epoch": 0.26, + "learning_rate": 0.0002606434738880349, + "loss": 0.0213, "step": 101220 }, { - "epoch": 0.51, - "learning_rate": 0.00022339224361917346, - "loss": 0.0125, + "epoch": 0.26, + "learning_rate": 0.00026063958567166347, + "loss": 0.0299, "step": 101230 }, { - "epoch": 0.51, - "learning_rate": 0.00022338467592615947, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.000260635697455292, + "loss": 0.0198, "step": 101240 }, { - "epoch": 0.51, - "learning_rate": 0.00022337710823314545, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.0002606318092389205, + "loss": 0.0223, "step": 101250 }, { - "epoch": 0.51, - "learning_rate": 0.00022336954054013144, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.000260627921022549, + "loss": 0.0198, "step": 101260 }, { - "epoch": 0.51, - "learning_rate": 0.00022336197284711744, - "loss": 0.0157, + "epoch": 0.26, + "learning_rate": 0.0002606240328061776, + "loss": 0.0201, "step": 101270 }, { - "epoch": 0.51, - "learning_rate": 0.00022335440515410343, - "loss": 0.0123, + "epoch": 0.26, + "learning_rate": 0.0002606201445898061, + "loss": 0.0251, "step": 101280 }, { - "epoch": 0.51, - "learning_rate": 0.0002233468374610894, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.00026061625637343466, + "loss": 0.0141, "step": 101290 }, { - "epoch": 0.51, - "learning_rate": 0.0002233392697680754, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002606123681570632, + "loss": 0.0219, "step": 101300 }, { - "epoch": 0.51, - "learning_rate": 0.0002233317020750614, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.00026060847994069174, + "loss": 0.0223, "step": 101310 }, { - "epoch": 0.51, - "learning_rate": 0.00022332413438204738, - "loss": 0.0219, + "epoch": 0.26, + "learning_rate": 0.00026060459172432026, + "loss": 0.0216, "step": 101320 }, { - "epoch": 0.51, - "learning_rate": 0.00022331656668903336, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.0002606007035079488, + "loss": 0.0209, "step": 101330 }, { - "epoch": 0.51, - "learning_rate": 0.00022330899899601937, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002605968152915773, + "loss": 0.0244, "step": 101340 }, { - "epoch": 0.51, - "learning_rate": 0.00022330143130300535, - "loss": 0.0124, + "epoch": 0.26, + "learning_rate": 0.00026059292707520586, + "loss": 0.0212, "step": 101350 }, { - "epoch": 0.51, - "learning_rate": 0.00022329386360999133, - "loss": 0.0125, + "epoch": 0.26, + "learning_rate": 0.00026058903885883437, + "loss": 0.0246, "step": 101360 }, { - "epoch": 0.51, - "learning_rate": 0.00022328629591697734, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.00026058515064246294, + "loss": 0.02, "step": 101370 }, { - "epoch": 0.51, - "learning_rate": 0.00022327872822396332, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.00026058126242609145, + "loss": 0.0214, "step": 101380 }, { - "epoch": 0.51, - "learning_rate": 0.0002232711605309493, - "loss": 0.0207, + "epoch": 0.26, + "learning_rate": 0.00026057737420972, + "loss": 0.0216, "step": 101390 }, { - "epoch": 0.51, - "learning_rate": 0.0002232635928379353, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.00026057348599334854, + "loss": 0.0249, "step": 101400 }, { - "epoch": 0.51, - "learning_rate": 0.0002232560251449213, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.00026056959777697705, + "loss": 0.0288, "step": 101410 }, { - "epoch": 0.51, - "learning_rate": 0.00022324845745190727, - "loss": 0.0153, + "epoch": 0.26, + "learning_rate": 0.0002605657095606056, + "loss": 0.029, "step": 101420 }, { - "epoch": 0.51, - "learning_rate": 0.00022324088975889328, - "loss": 0.0181, + "epoch": 0.26, + "learning_rate": 0.00026056182134423414, + "loss": 0.021, "step": 101430 }, { - "epoch": 0.51, - "learning_rate": 0.00022323332206587926, - "loss": 0.0198, + "epoch": 0.26, + "learning_rate": 0.0002605579331278627, + "loss": 0.0176, "step": 101440 }, { - "epoch": 0.51, - "learning_rate": 0.00022322575437286525, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002605540449114912, + "loss": 0.0212, "step": 101450 }, { - "epoch": 0.51, - "learning_rate": 0.00022321818667985125, - "loss": 0.0171, + "epoch": 0.26, + "learning_rate": 0.00026055015669511973, + "loss": 0.019, "step": 101460 }, { - "epoch": 0.51, - "learning_rate": 0.00022321061898683724, - "loss": 0.0182, + "epoch": 0.26, + "learning_rate": 0.0002605462684787483, + "loss": 0.0265, "step": 101470 }, { - "epoch": 0.51, - "learning_rate": 0.00022320305129382322, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002605423802623768, + "loss": 0.0243, "step": 101480 }, { - "epoch": 0.51, - "learning_rate": 0.0002231954836008092, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.00026053849204600533, + "loss": 0.0266, "step": 101490 }, { - "epoch": 0.51, - "learning_rate": 0.0002231879159077952, - "loss": 0.0168, + "epoch": 0.26, + "learning_rate": 0.0002605346038296339, + "loss": 0.0262, "step": 101500 }, { - "epoch": 0.51, - "learning_rate": 0.0002231803482147812, - "loss": 0.0165, + "epoch": 0.26, + "learning_rate": 0.0002605307156132624, + "loss": 0.0278, "step": 101510 }, { - "epoch": 0.51, - "learning_rate": 0.00022317278052176717, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.000260526827396891, + "loss": 0.0215, "step": 101520 }, { - "epoch": 0.51, - "learning_rate": 0.00022316521282875318, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.0002605229391805195, + "loss": 0.024, "step": 101530 }, { - "epoch": 0.51, - "learning_rate": 0.00022315764513573916, - "loss": 0.0169, + "epoch": 0.26, + "learning_rate": 0.000260519050964148, + "loss": 0.0204, "step": 101540 }, { - "epoch": 0.51, - "learning_rate": 0.00022315007744272514, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002605151627477765, + "loss": 0.0228, "step": 101550 }, { - "epoch": 0.51, - "learning_rate": 0.00022314250974971115, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.0002605112745314051, + "loss": 0.0247, "step": 101560 }, { - "epoch": 0.51, - "learning_rate": 0.00022313494205669713, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.00026050738631503366, + "loss": 0.0179, "step": 101570 }, { - "epoch": 0.51, - "learning_rate": 0.0002231273743636831, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.0002605034980986622, + "loss": 0.0184, "step": 101580 }, { - "epoch": 0.51, - "learning_rate": 0.00022311980667066912, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.0002604996098822907, + "loss": 0.0192, "step": 101590 }, { - "epoch": 0.51, - "learning_rate": 0.0002231122389776551, - "loss": 0.0205, + "epoch": 0.26, + "learning_rate": 0.00026049572166591926, + "loss": 0.0194, "step": 101600 }, { - "epoch": 0.51, - "learning_rate": 0.00022310467128464108, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002604918334495478, + "loss": 0.0202, "step": 101610 }, { - "epoch": 0.51, - "learning_rate": 0.0002230971035916271, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.0002604879452331763, + "loss": 0.0197, "step": 101620 }, { - "epoch": 0.51, - "learning_rate": 0.00022308953589861307, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.00026048405701680486, + "loss": 0.0195, "step": 101630 }, { - "epoch": 0.51, - "learning_rate": 0.00022308196820559906, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002604801688004334, + "loss": 0.0209, "step": 101640 }, { - "epoch": 0.51, - "learning_rate": 0.00022307440051258504, - "loss": 0.018, + "epoch": 0.26, + "learning_rate": 0.00026047628058406194, + "loss": 0.0172, "step": 101650 }, { - "epoch": 0.51, - "learning_rate": 0.00022306683281957105, - "loss": 0.0131, + "epoch": 0.26, + "learning_rate": 0.00026047239236769046, + "loss": 0.0262, "step": 101660 }, { - "epoch": 0.51, - "learning_rate": 0.00022305926512655703, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.00026046850415131897, + "loss": 0.0229, "step": 101670 }, { - "epoch": 0.51, - "learning_rate": 0.000223051697433543, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.00026046461593494754, + "loss": 0.0266, "step": 101680 }, { - "epoch": 0.51, - "learning_rate": 0.00022304412974052902, - "loss": 0.0176, + "epoch": 0.26, + "learning_rate": 0.00026046072771857606, + "loss": 0.0252, "step": 101690 }, { - "epoch": 0.51, - "learning_rate": 0.000223036562047515, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026045683950220457, + "loss": 0.0202, "step": 101700 }, { - "epoch": 0.51, - "learning_rate": 0.00022302899435450098, - "loss": 0.0174, + "epoch": 0.26, + "learning_rate": 0.00026045295128583314, + "loss": 0.0222, "step": 101710 }, { - "epoch": 0.51, - "learning_rate": 0.000223021426661487, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.0002604490630694617, + "loss": 0.0185, "step": 101720 }, { - "epoch": 0.51, - "learning_rate": 0.00022301385896847297, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.0002604451748530902, + "loss": 0.0232, "step": 101730 }, { - "epoch": 0.51, - "learning_rate": 0.00022300629127545895, - "loss": 0.0193, + "epoch": 0.26, + "learning_rate": 0.00026044128663671874, + "loss": 0.0213, "step": 101740 }, { - "epoch": 0.51, - "learning_rate": 0.00022299872358244496, - "loss": 0.0144, + "epoch": 0.26, + "learning_rate": 0.00026043739842034725, + "loss": 0.023, "step": 101750 }, { - "epoch": 0.51, - "learning_rate": 0.00022299115588943094, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.00026043351020397577, + "loss": 0.0213, "step": 101760 }, { - "epoch": 0.51, - "learning_rate": 0.00022298358819641692, - "loss": 0.0147, + "epoch": 0.26, + "learning_rate": 0.00026042962198760433, + "loss": 0.0235, "step": 101770 }, { - "epoch": 0.51, - "learning_rate": 0.00022297602050340293, - "loss": 0.0142, + "epoch": 0.26, + "learning_rate": 0.0002604257337712329, + "loss": 0.0256, "step": 101780 }, { - "epoch": 0.51, - "learning_rate": 0.0002229684528103889, - "loss": 0.0119, + "epoch": 0.26, + "learning_rate": 0.0002604218455548614, + "loss": 0.0209, "step": 101790 }, { - "epoch": 0.51, - "learning_rate": 0.0002229608851173749, - "loss": 0.0143, + "epoch": 0.26, + "learning_rate": 0.00026041795733848993, + "loss": 0.0241, "step": 101800 }, { - "epoch": 0.51, - "learning_rate": 0.00022295331742436088, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.0002604140691221185, + "loss": 0.0203, "step": 101810 }, { - "epoch": 0.51, - "learning_rate": 0.00022294574973134688, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.000260410180905747, + "loss": 0.026, "step": 101820 }, { - "epoch": 0.51, - "learning_rate": 0.00022293818203833287, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.00026040629268937553, + "loss": 0.0194, "step": 101830 }, { - "epoch": 0.51, - "learning_rate": 0.00022293061434531885, - "loss": 0.0158, + "epoch": 0.26, + "learning_rate": 0.0002604024044730041, + "loss": 0.0298, "step": 101840 }, { - "epoch": 0.51, - "learning_rate": 0.00022292304665230486, - "loss": 0.0152, + "epoch": 0.26, + "learning_rate": 0.0002603985162566326, + "loss": 0.0223, "step": 101850 }, { - "epoch": 0.51, - "learning_rate": 0.00022291547895929084, - "loss": 0.0188, + "epoch": 0.26, + "learning_rate": 0.0002603946280402612, + "loss": 0.0252, "step": 101860 }, { - "epoch": 0.51, - "learning_rate": 0.00022290791126627682, - "loss": 0.0135, + "epoch": 0.26, + "learning_rate": 0.0002603907398238897, + "loss": 0.0211, "step": 101870 }, { - "epoch": 0.51, - "learning_rate": 0.00022290034357326283, - "loss": 0.0136, + "epoch": 0.26, + "learning_rate": 0.0002603868516075182, + "loss": 0.0221, "step": 101880 }, { - "epoch": 0.51, - "learning_rate": 0.0002228927758802488, - "loss": 0.0166, + "epoch": 0.26, + "learning_rate": 0.0002603829633911468, + "loss": 0.0239, "step": 101890 }, { - "epoch": 0.51, - "learning_rate": 0.0002228852081872348, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002603790751747753, + "loss": 0.0209, "step": 101900 }, { - "epoch": 0.51, - "learning_rate": 0.0002228776404942208, - "loss": 0.0161, + "epoch": 0.26, + "learning_rate": 0.00026037518695840386, + "loss": 0.0233, "step": 101910 }, { - "epoch": 0.51, - "learning_rate": 0.00022287007280120678, - "loss": 0.0154, + "epoch": 0.26, + "learning_rate": 0.0002603712987420324, + "loss": 0.0232, "step": 101920 }, { - "epoch": 0.51, - "learning_rate": 0.00022286250510819276, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.00026036741052566095, + "loss": 0.019, "step": 101930 }, { - "epoch": 0.51, - "learning_rate": 0.00022285493741517877, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.00026036352230928946, + "loss": 0.0206, "step": 101940 }, { - "epoch": 0.51, - "learning_rate": 0.00022284736972216475, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.000260359634092918, + "loss": 0.0181, "step": 101950 }, { - "epoch": 0.51, - "learning_rate": 0.00022283980202915073, - "loss": 0.0141, + "epoch": 0.26, + "learning_rate": 0.0002603557458765465, + "loss": 0.0232, "step": 101960 }, { - "epoch": 0.51, - "learning_rate": 0.00022283223433613671, - "loss": 0.0124, + "epoch": 0.26, + "learning_rate": 0.00026035185766017506, + "loss": 0.0202, "step": 101970 }, { - "epoch": 0.51, - "learning_rate": 0.00022282466664312272, - "loss": 0.0195, + "epoch": 0.26, + "learning_rate": 0.0002603479694438036, + "loss": 0.0261, "step": 101980 }, { - "epoch": 0.51, - "learning_rate": 0.0002228170989501087, - "loss": 0.0167, + "epoch": 0.26, + "learning_rate": 0.00026034408122743214, + "loss": 0.0205, "step": 101990 }, { - "epoch": 0.51, - "learning_rate": 0.00022280953125709469, - "loss": 0.0192, + "epoch": 0.26, + "learning_rate": 0.00026034019301106066, + "loss": 0.0178, "step": 102000 }, { - "epoch": 0.51, - "eval_cer": 0.9145119829365546, - "eval_loss": 0.01138813141733408, - "eval_runtime": 116.604, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.26, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.016096029430627823, + "eval_runtime": 108.1492, + "eval_samples_per_second": 18.493, + "eval_steps_per_second": 4.623, "step": 102000 }, { - "epoch": 0.51, - "learning_rate": 0.0002228019635640807, - "loss": 0.0137, + "epoch": 0.26, + "learning_rate": 0.00026033630479468917, + "loss": 0.0204, "step": 102010 }, { - "epoch": 0.51, - "learning_rate": 0.00022279439587106668, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.00026033241657831774, + "loss": 0.0265, "step": 102020 }, { - "epoch": 0.51, - "learning_rate": 0.00022278682817805266, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.00026032852836194625, + "loss": 0.0247, "step": 102030 }, { - "epoch": 0.51, - "learning_rate": 0.00022277926048503867, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.00026032464014557477, + "loss": 0.0232, "step": 102040 }, { - "epoch": 0.51, - "learning_rate": 0.00022277169279202465, - "loss": 0.0159, + "epoch": 0.26, + "learning_rate": 0.00026032075192920334, + "loss": 0.0182, "step": 102050 }, { - "epoch": 0.51, - "learning_rate": 0.00022276412509901063, - "loss": 0.0133, + "epoch": 0.26, + "learning_rate": 0.0002603168637128319, + "loss": 0.0215, "step": 102060 }, { - "epoch": 0.51, - "learning_rate": 0.00022275655740599664, - "loss": 0.0162, + "epoch": 0.26, + "learning_rate": 0.0002603129754964604, + "loss": 0.0235, "step": 102070 }, { - "epoch": 0.52, - "learning_rate": 0.00022274898971298262, - "loss": 0.0128, + "epoch": 0.26, + "learning_rate": 0.00026030908728008894, + "loss": 0.0246, "step": 102080 }, { - "epoch": 0.52, - "learning_rate": 0.0002227414220199686, - "loss": 0.0179, + "epoch": 0.26, + "learning_rate": 0.00026030519906371745, + "loss": 0.0203, "step": 102090 }, { - "epoch": 0.52, - "learning_rate": 0.0002227338543269546, - "loss": 0.015, + "epoch": 0.26, + "learning_rate": 0.000260301310847346, + "loss": 0.0218, "step": 102100 }, { - "epoch": 0.52, - "learning_rate": 0.0002227262866339406, - "loss": 0.0145, + "epoch": 0.26, + "learning_rate": 0.00026029742263097453, + "loss": 0.0203, "step": 102110 }, { - "epoch": 0.52, - "learning_rate": 0.00022271871894092657, - "loss": 0.0146, + "epoch": 0.26, + "learning_rate": 0.0002602935344146031, + "loss": 0.0229, "step": 102120 }, { - "epoch": 0.52, - "learning_rate": 0.00022271115124791258, - "loss": 0.0182, + "epoch": 0.26, + "learning_rate": 0.0002602896461982316, + "loss": 0.0193, "step": 102130 }, { - "epoch": 0.52, - "learning_rate": 0.00022270358355489856, - "loss": 0.0148, + "epoch": 0.26, + "learning_rate": 0.0002602857579818602, + "loss": 0.0247, "step": 102140 }, { - "epoch": 0.52, - "learning_rate": 0.00022269601586188454, - "loss": 0.0123, + "epoch": 0.26, + "learning_rate": 0.0002602818697654887, + "loss": 0.0252, "step": 102150 }, { - "epoch": 0.52, - "learning_rate": 0.00022268844816887052, - "loss": 0.0175, + "epoch": 0.26, + "learning_rate": 0.0002602779815491172, + "loss": 0.018, "step": 102160 }, { - "epoch": 0.52, - "learning_rate": 0.00022268088047585653, - "loss": 0.0134, + "epoch": 0.26, + "learning_rate": 0.00026027409333274573, + "loss": 0.0245, "step": 102170 }, { - "epoch": 0.52, - "learning_rate": 0.00022267331278284251, - "loss": 0.016, + "epoch": 0.26, + "learning_rate": 0.0002602702051163743, + "loss": 0.0187, "step": 102180 }, { - "epoch": 0.52, - "learning_rate": 0.0002226657450898285, - "loss": 0.014, + "epoch": 0.26, + "learning_rate": 0.0002602663169000028, + "loss": 0.0228, "step": 102190 }, { - "epoch": 0.52, - "learning_rate": 0.0002226581773968145, - "loss": 0.0111, + "epoch": 0.26, + "learning_rate": 0.0002602624286836314, + "loss": 0.0218, "step": 102200 }, { - "epoch": 0.52, - "learning_rate": 0.00022265060970380049, - "loss": 0.0173, + "epoch": 0.26, + "learning_rate": 0.0002602585404672599, + "loss": 0.023, "step": 102210 }, { - "epoch": 0.52, - "learning_rate": 0.00022264304201078647, - "loss": 0.017, + "epoch": 0.26, + "learning_rate": 0.0002602546522508884, + "loss": 0.023, "step": 102220 }, { - "epoch": 0.52, - "learning_rate": 0.00022263547431777248, - "loss": 0.0149, + "epoch": 0.26, + "learning_rate": 0.000260250764034517, + "loss": 0.0262, "step": 102230 }, { - "epoch": 0.52, - "learning_rate": 0.00022262790662475846, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002602468758181455, + "loss": 0.0173, "step": 102240 }, { - "epoch": 0.52, - "learning_rate": 0.00022262033893174444, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.000260242987601774, + "loss": 0.0263, "step": 102250 }, { - "epoch": 0.52, - "learning_rate": 0.00022261277123873045, - "loss": 0.0135, + "epoch": 0.27, + "learning_rate": 0.0002602390993854026, + "loss": 0.0231, "step": 102260 }, { - "epoch": 0.52, - "learning_rate": 0.00022260520354571643, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00026023521116903115, + "loss": 0.0287, "step": 102270 }, { - "epoch": 0.52, - "learning_rate": 0.0002225976358527024, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.00026023132295265966, + "loss": 0.0219, "step": 102280 }, { - "epoch": 0.52, - "learning_rate": 0.00022259006815968842, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.0002602274347362882, + "loss": 0.0237, "step": 102290 }, { - "epoch": 0.52, - "learning_rate": 0.0002225825004666744, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002602235465199167, + "loss": 0.0212, "step": 102300 }, { - "epoch": 0.52, - "learning_rate": 0.00022257493277366038, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.00026021965830354526, + "loss": 0.0219, "step": 102310 }, { - "epoch": 0.52, - "learning_rate": 0.00022256736508064636, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.00026021577008717377, + "loss": 0.0232, "step": 102320 }, { - "epoch": 0.52, - "learning_rate": 0.00022255979738763237, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.00026021188187080234, + "loss": 0.0262, "step": 102330 }, { - "epoch": 0.52, - "learning_rate": 0.00022255222969461835, - "loss": 0.0174, + "epoch": 0.27, + "learning_rate": 0.00026020799365443086, + "loss": 0.0234, "step": 102340 }, { - "epoch": 0.52, - "learning_rate": 0.00022254466200160433, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.0002602041054380594, + "loss": 0.0228, "step": 102350 }, { - "epoch": 0.52, - "learning_rate": 0.00022253709430859034, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.00026020021722168794, + "loss": 0.0192, "step": 102360 }, { - "epoch": 0.52, - "learning_rate": 0.00022252952661557632, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.00026019632900531645, + "loss": 0.0245, "step": 102370 }, { - "epoch": 0.52, - "learning_rate": 0.0002225219589225623, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.00026019244078894497, + "loss": 0.0228, "step": 102380 }, { - "epoch": 0.52, - "learning_rate": 0.00022251439122954831, - "loss": 0.0213, + "epoch": 0.27, + "learning_rate": 0.00026018855257257354, + "loss": 0.0248, "step": 102390 }, { - "epoch": 0.52, - "learning_rate": 0.0002225068235365343, - "loss": 0.0141, + "epoch": 0.27, + "learning_rate": 0.00026018466435620205, + "loss": 0.0218, "step": 102400 }, { - "epoch": 0.52, - "learning_rate": 0.00022249925584352028, - "loss": 0.0218, + "epoch": 0.27, + "learning_rate": 0.0002601807761398306, + "loss": 0.0213, "step": 102410 }, { - "epoch": 0.52, - "learning_rate": 0.00022249168815050629, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00026017688792345913, + "loss": 0.0205, "step": 102420 }, { - "epoch": 0.52, - "learning_rate": 0.00022248412045749227, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002601729997070877, + "loss": 0.0196, "step": 102430 }, { - "epoch": 0.52, - "learning_rate": 0.00022247655276447822, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.0002601691114907162, + "loss": 0.021, "step": 102440 }, { - "epoch": 0.52, - "learning_rate": 0.0002224689850714642, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.00026016522327434473, + "loss": 0.0212, "step": 102450 }, { - "epoch": 0.52, - "learning_rate": 0.0002224614173784502, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002601613350579733, + "loss": 0.024, "step": 102460 }, { - "epoch": 0.52, - "learning_rate": 0.0002224538496854362, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.0002601574468416018, + "loss": 0.0204, "step": 102470 }, { - "epoch": 0.52, - "learning_rate": 0.00022244628199242217, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002601535586252304, + "loss": 0.0252, "step": 102480 }, { - "epoch": 0.52, - "learning_rate": 0.00022243871429940818, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.0002601496704088589, + "loss": 0.0236, "step": 102490 }, { - "epoch": 0.52, - "learning_rate": 0.00022243114660639416, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002601457821924874, + "loss": 0.0225, "step": 102500 }, { - "epoch": 0.52, - "learning_rate": 0.00022242357891338015, - "loss": 0.0132, + "epoch": 0.27, + "learning_rate": 0.00026014189397611593, + "loss": 0.0265, "step": 102510 }, { - "epoch": 0.52, - "learning_rate": 0.00022241601122036615, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.0002601380057597445, + "loss": 0.0227, "step": 102520 }, { - "epoch": 0.52, - "learning_rate": 0.00022240844352735214, - "loss": 0.0139, + "epoch": 0.27, + "learning_rate": 0.000260134117543373, + "loss": 0.0204, "step": 102530 }, { - "epoch": 0.52, - "learning_rate": 0.00022240087583433812, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002601302293270016, + "loss": 0.0248, "step": 102540 }, { - "epoch": 0.52, - "learning_rate": 0.0002223933081413241, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.0002601263411106301, + "loss": 0.0226, "step": 102550 }, { - "epoch": 0.52, - "learning_rate": 0.0002223857404483101, - "loss": 0.0205, + "epoch": 0.27, + "learning_rate": 0.00026012245289425866, + "loss": 0.0213, "step": 102560 }, { - "epoch": 0.52, - "learning_rate": 0.0002223781727552961, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.0002601185646778872, + "loss": 0.0233, "step": 102570 }, { - "epoch": 0.52, - "learning_rate": 0.00022237060506228207, - "loss": 0.0136, + "epoch": 0.27, + "learning_rate": 0.0002601146764615157, + "loss": 0.0225, "step": 102580 }, { - "epoch": 0.52, - "learning_rate": 0.00022236303736926808, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002601107882451442, + "loss": 0.0209, "step": 102590 }, { - "epoch": 0.52, - "learning_rate": 0.00022235546967625406, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.0002601069000287728, + "loss": 0.0224, "step": 102600 }, { - "epoch": 0.52, - "learning_rate": 0.00022234790198324004, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00026010301181240134, + "loss": 0.0187, "step": 102610 }, { - "epoch": 0.52, - "learning_rate": 0.00022234033429022605, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00026009912359602986, + "loss": 0.0184, "step": 102620 }, { - "epoch": 0.52, - "learning_rate": 0.00022233276659721203, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.0002600952353796584, + "loss": 0.0252, "step": 102630 }, { - "epoch": 0.52, - "learning_rate": 0.000222325198904198, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.00026009134716328694, + "loss": 0.0234, "step": 102640 }, { - "epoch": 0.52, - "learning_rate": 0.00022231763121118402, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.00026008745894691546, + "loss": 0.0215, "step": 102650 }, { - "epoch": 0.52, - "learning_rate": 0.00022231006351817, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00026008357073054397, + "loss": 0.0236, "step": 102660 }, { - "epoch": 0.52, - "learning_rate": 0.00022230249582515598, - "loss": 0.0201, + "epoch": 0.27, + "learning_rate": 0.00026007968251417254, + "loss": 0.0207, "step": 102670 }, { - "epoch": 0.52, - "learning_rate": 0.000222294928132142, - "loss": 0.0174, + "epoch": 0.27, + "learning_rate": 0.00026007579429780105, + "loss": 0.0205, "step": 102680 }, { - "epoch": 0.52, - "learning_rate": 0.00022228736043912797, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002600719060814296, + "loss": 0.0192, "step": 102690 }, { - "epoch": 0.52, - "learning_rate": 0.00022227979274611396, - "loss": 0.0131, + "epoch": 0.27, + "learning_rate": 0.00026006801786505814, + "loss": 0.0207, "step": 102700 }, { - "epoch": 0.52, - "learning_rate": 0.00022227222505309994, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00026006412964868665, + "loss": 0.038, "step": 102710 }, { - "epoch": 0.52, - "learning_rate": 0.00022226465736008595, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.00026006024143231517, + "loss": 0.0287, "step": 102720 }, { - "epoch": 0.52, - "learning_rate": 0.00022225708966707193, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.00026005635321594374, + "loss": 0.0215, "step": 102730 }, { - "epoch": 0.52, - "learning_rate": 0.0002222495219740579, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.00026005246499957225, + "loss": 0.0255, "step": 102740 }, { - "epoch": 0.52, - "learning_rate": 0.00022224195428104392, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.0002600485767832008, + "loss": 0.0299, "step": 102750 }, { - "epoch": 0.52, - "learning_rate": 0.0002222343865880299, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.00026004468856682933, + "loss": 0.0219, "step": 102760 }, { - "epoch": 0.52, - "learning_rate": 0.00022222681889501588, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002600408003504579, + "loss": 0.0325, "step": 102770 }, { - "epoch": 0.52, - "learning_rate": 0.0002222192512020019, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.0002600369121340864, + "loss": 0.0274, "step": 102780 }, { - "epoch": 0.52, - "learning_rate": 0.00022221168350898787, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00026003302391771493, + "loss": 0.0242, "step": 102790 }, { - "epoch": 0.52, - "learning_rate": 0.00022220411581597385, - "loss": 0.0216, + "epoch": 0.27, + "learning_rate": 0.00026002913570134345, + "loss": 0.0253, "step": 102800 }, { - "epoch": 0.52, - "learning_rate": 0.00022219654812295986, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.000260025247484972, + "loss": 0.0203, "step": 102810 }, { - "epoch": 0.52, - "learning_rate": 0.00022218898042994584, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002600213592686006, + "loss": 0.023, "step": 102820 }, { - "epoch": 0.52, - "learning_rate": 0.00022218141273693182, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.0002600174710522291, + "loss": 0.0176, "step": 102830 }, { - "epoch": 0.52, - "learning_rate": 0.00022217384504391783, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.0002600135828358576, + "loss": 0.0224, "step": 102840 }, { - "epoch": 0.52, - "learning_rate": 0.0002221662773509038, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.0002600096946194862, + "loss": 0.0232, "step": 102850 }, { - "epoch": 0.52, - "learning_rate": 0.0002221587096578898, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002600058064031147, + "loss": 0.0216, "step": 102860 }, { - "epoch": 0.52, - "learning_rate": 0.00022215114196487578, - "loss": 0.0124, + "epoch": 0.27, + "learning_rate": 0.0002600019181867432, + "loss": 0.0218, "step": 102870 }, { - "epoch": 0.52, - "learning_rate": 0.00022214357427186178, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002599980299703718, + "loss": 0.0226, "step": 102880 }, { - "epoch": 0.52, - "learning_rate": 0.00022213600657884777, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.0002599941417540003, + "loss": 0.0242, "step": 102890 }, { - "epoch": 0.52, - "learning_rate": 0.00022212843888583375, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025999025353762886, + "loss": 0.023, "step": 102900 }, { - "epoch": 0.52, - "learning_rate": 0.00022212087119281976, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.0002599863653212574, + "loss": 0.0215, "step": 102910 }, { - "epoch": 0.52, - "learning_rate": 0.00022211330349980574, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.0002599824771048859, + "loss": 0.0189, "step": 102920 }, { - "epoch": 0.52, - "learning_rate": 0.00022210573580679172, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.00025997858888851446, + "loss": 0.0189, "step": 102930 }, { - "epoch": 0.52, - "learning_rate": 0.00022209816811377773, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.000259974700672143, + "loss": 0.0222, "step": 102940 }, { - "epoch": 0.52, - "learning_rate": 0.0002220906004207637, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002599708124557715, + "loss": 0.026, "step": 102950 }, { - "epoch": 0.52, - "learning_rate": 0.0002220830327277497, - "loss": 0.0121, + "epoch": 0.27, + "learning_rate": 0.00025996692423940006, + "loss": 0.0221, "step": 102960 }, { - "epoch": 0.52, - "learning_rate": 0.0002220754650347357, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025996303602302857, + "loss": 0.0236, "step": 102970 }, { - "epoch": 0.52, - "learning_rate": 0.00022206789734172168, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.00025995914780665714, + "loss": 0.0222, "step": 102980 }, { - "epoch": 0.52, - "learning_rate": 0.00022206032964870766, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.00025995525959028566, + "loss": 0.0254, "step": 102990 }, { - "epoch": 0.52, - "learning_rate": 0.00022205276195569367, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.00025995137137391417, + "loss": 0.0274, "step": 103000 }, { - "epoch": 0.52, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.011572513729333878, - "eval_runtime": 116.71, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.27, + "eval_cer": 0.8817922630869552, + "eval_loss": 0.01607452891767025, + "eval_runtime": 108.0632, + "eval_samples_per_second": 18.508, + "eval_steps_per_second": 4.627, "step": 103000 }, { - "epoch": 0.52, - "learning_rate": 0.00022204519426267965, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025994748315754274, + "loss": 0.0228, "step": 103010 }, { - "epoch": 0.52, - "learning_rate": 0.00022203762656966563, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.00025994359494117125, + "loss": 0.0228, "step": 103020 }, { - "epoch": 0.52, - "learning_rate": 0.00022203005887665164, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.0002599397067247998, + "loss": 0.0239, "step": 103030 }, { - "epoch": 0.52, - "learning_rate": 0.00022202249118363762, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025993581850842834, + "loss": 0.0223, "step": 103040 }, { - "epoch": 0.52, - "learning_rate": 0.0002220149234906236, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025993193029205685, + "loss": 0.0216, "step": 103050 }, { - "epoch": 0.52, - "learning_rate": 0.00022200735579760959, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.0002599280420756854, + "loss": 0.0254, "step": 103060 }, { - "epoch": 0.52, - "learning_rate": 0.0002219997881045956, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.00025992415385931393, + "loss": 0.0222, "step": 103070 }, { - "epoch": 0.52, - "learning_rate": 0.00022199222041158158, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.00025992026564294245, + "loss": 0.0226, "step": 103080 }, { - "epoch": 0.52, - "learning_rate": 0.00022198465271856756, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.000259916377426571, + "loss": 0.0283, "step": 103090 }, { - "epoch": 0.52, - "learning_rate": 0.00022197708502555357, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00025991248921019953, + "loss": 0.0223, "step": 103100 }, { - "epoch": 0.52, - "learning_rate": 0.00022196951733253955, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.0002599086009938281, + "loss": 0.0225, "step": 103110 }, { - "epoch": 0.52, - "learning_rate": 0.00022196194963952553, - "loss": 0.0132, + "epoch": 0.27, + "learning_rate": 0.0002599047127774566, + "loss": 0.0225, "step": 103120 }, { - "epoch": 0.52, - "learning_rate": 0.00022195438194651154, - "loss": 0.014, + "epoch": 0.27, + "learning_rate": 0.00025990082456108513, + "loss": 0.0256, "step": 103130 }, { - "epoch": 0.52, - "learning_rate": 0.00022194681425349752, - "loss": 0.0137, + "epoch": 0.27, + "learning_rate": 0.0002598969363447137, + "loss": 0.0211, "step": 103140 }, { - "epoch": 0.52, - "learning_rate": 0.0002219392465604835, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002598930481283422, + "loss": 0.0195, "step": 103150 }, { - "epoch": 0.52, - "learning_rate": 0.0002219316788674695, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002598891599119708, + "loss": 0.024, "step": 103160 }, { - "epoch": 0.52, - "learning_rate": 0.0002219241111744555, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.0002598852716955993, + "loss": 0.0273, "step": 103170 }, { - "epoch": 0.52, - "learning_rate": 0.00022191654348144147, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025988138347922787, + "loss": 0.0194, "step": 103180 }, { - "epoch": 0.52, - "learning_rate": 0.00022190897578842748, - "loss": 0.0135, + "epoch": 0.27, + "learning_rate": 0.0002598774952628564, + "loss": 0.025, "step": 103190 }, { - "epoch": 0.52, - "learning_rate": 0.00022190140809541346, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.0002598736070464849, + "loss": 0.0207, "step": 103200 }, { - "epoch": 0.52, - "learning_rate": 0.00022189384040239944, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.0002598697188301134, + "loss": 0.0245, "step": 103210 }, { - "epoch": 0.52, - "learning_rate": 0.00022188627270938542, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.000259865830613742, + "loss": 0.0213, "step": 103220 }, { - "epoch": 0.52, - "learning_rate": 0.00022187870501637143, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002598619423973705, + "loss": 0.0222, "step": 103230 }, { - "epoch": 0.52, - "learning_rate": 0.00022187113732335741, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.00025985805418099906, + "loss": 0.0201, "step": 103240 }, { - "epoch": 0.52, - "learning_rate": 0.0002218635696303434, - "loss": 0.0184, + "epoch": 0.27, + "learning_rate": 0.0002598541659646276, + "loss": 0.0252, "step": 103250 }, { - "epoch": 0.52, - "learning_rate": 0.0002218560019373294, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002598502777482561, + "loss": 0.0311, "step": 103260 }, { - "epoch": 0.52, - "learning_rate": 0.00022184843424431539, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.00025984638953188466, + "loss": 0.0249, "step": 103270 }, { - "epoch": 0.52, - "learning_rate": 0.00022184086655130137, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002598425013155132, + "loss": 0.0222, "step": 103280 }, { - "epoch": 0.52, - "learning_rate": 0.00022183329885828738, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002598386130991417, + "loss": 0.0226, "step": 103290 }, { - "epoch": 0.52, - "learning_rate": 0.00022182573116527336, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.00025983472488277026, + "loss": 0.0213, "step": 103300 }, { - "epoch": 0.52, - "learning_rate": 0.00022181816347225934, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.0002598308366663988, + "loss": 0.0233, "step": 103310 }, { - "epoch": 0.52, - "learning_rate": 0.00022181059577924535, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.00025982694845002734, + "loss": 0.023, "step": 103320 }, { - "epoch": 0.52, - "learning_rate": 0.00022180302808623133, - "loss": 0.0216, + "epoch": 0.27, + "learning_rate": 0.00025982306023365585, + "loss": 0.0206, "step": 103330 }, { - "epoch": 0.52, - "learning_rate": 0.0002217954603932173, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025981917201728437, + "loss": 0.0207, "step": 103340 }, { - "epoch": 0.52, - "learning_rate": 0.00022178789270020332, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00025981528380091294, + "loss": 0.0251, "step": 103350 }, { - "epoch": 0.52, - "learning_rate": 0.0002217803250071893, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025981139558454145, + "loss": 0.0238, "step": 103360 }, { - "epoch": 0.52, - "learning_rate": 0.00022177275731417528, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.00025980750736817, + "loss": 0.0199, "step": 103370 }, { - "epoch": 0.52, - "learning_rate": 0.00022176518962116126, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.00025980361915179854, + "loss": 0.0233, "step": 103380 }, { - "epoch": 0.52, - "learning_rate": 0.00022175762192814727, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002597997309354271, + "loss": 0.0244, "step": 103390 }, { - "epoch": 0.52, - "learning_rate": 0.00022175005423513325, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002597958427190556, + "loss": 0.0286, "step": 103400 }, { - "epoch": 0.52, - "learning_rate": 0.00022174248654211923, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.00025979195450268413, + "loss": 0.0271, "step": 103410 }, { - "epoch": 0.52, - "learning_rate": 0.00022173491884910524, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.00025978806628631265, + "loss": 0.0238, "step": 103420 }, { - "epoch": 0.52, - "learning_rate": 0.00022172735115609122, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.0002597841780699412, + "loss": 0.0216, "step": 103430 }, { - "epoch": 0.52, - "learning_rate": 0.0002217197834630772, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.00025978028985356973, + "loss": 0.0199, "step": 103440 }, { - "epoch": 0.52, - "learning_rate": 0.00022171221577006321, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.0002597764016371983, + "loss": 0.0258, "step": 103450 }, { - "epoch": 0.52, - "learning_rate": 0.0002217046480770492, - "loss": 0.03, + "epoch": 0.27, + "learning_rate": 0.0002597725134208268, + "loss": 0.0259, "step": 103460 }, { - "epoch": 0.52, - "learning_rate": 0.00022169708038403518, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025976862520445533, + "loss": 0.019, "step": 103470 }, { - "epoch": 0.52, - "learning_rate": 0.00022168951269102119, - "loss": 0.0197, + "epoch": 0.27, + "learning_rate": 0.0002597647369880839, + "loss": 0.0189, "step": 103480 }, { - "epoch": 0.52, - "learning_rate": 0.00022168194499800717, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.0002597608487717124, + "loss": 0.025, "step": 103490 }, { - "epoch": 0.52, - "learning_rate": 0.00022167437730499315, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.000259756960555341, + "loss": 0.0208, "step": 103500 }, { - "epoch": 0.52, - "learning_rate": 0.00022166680961197916, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.0002597530723389695, + "loss": 0.0244, "step": 103510 }, { - "epoch": 0.52, - "learning_rate": 0.00022165924191896514, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025974918412259806, + "loss": 0.0229, "step": 103520 }, { - "epoch": 0.52, - "learning_rate": 0.00022165167422595112, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.0002597452959062266, + "loss": 0.0199, "step": 103530 }, { - "epoch": 0.52, - "learning_rate": 0.00022164410653293713, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002597414076898551, + "loss": 0.0228, "step": 103540 }, { - "epoch": 0.52, - "learning_rate": 0.0002216365388399231, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002597375194734836, + "loss": 0.0211, "step": 103550 }, { - "epoch": 0.52, - "learning_rate": 0.0002216289711469091, - "loss": 0.0211, + "epoch": 0.27, + "learning_rate": 0.0002597336312571122, + "loss": 0.0234, "step": 103560 }, { - "epoch": 0.52, - "learning_rate": 0.00022162140345389507, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002597297430407407, + "loss": 0.025, "step": 103570 }, { - "epoch": 0.52, - "learning_rate": 0.00022161383576088108, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025972585482436926, + "loss": 0.0225, "step": 103580 }, { - "epoch": 0.52, - "learning_rate": 0.00022160626806786706, - "loss": 0.0139, + "epoch": 0.27, + "learning_rate": 0.0002597219666079978, + "loss": 0.0224, "step": 103590 }, { - "epoch": 0.52, - "learning_rate": 0.00022159870037485304, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.00025971807839162634, + "loss": 0.0223, "step": 103600 }, { - "epoch": 0.52, - "learning_rate": 0.00022159113268183905, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.00025971419017525486, + "loss": 0.0231, "step": 103610 }, { - "epoch": 0.52, - "learning_rate": 0.00022158356498882503, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.00025971030195888337, + "loss": 0.0224, "step": 103620 }, { - "epoch": 0.52, - "learning_rate": 0.00022157599729581102, - "loss": 0.02, + "epoch": 0.27, + "learning_rate": 0.0002597064137425119, + "loss": 0.0183, "step": 103630 }, { - "epoch": 0.52, - "learning_rate": 0.00022156842960279702, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025970252552614046, + "loss": 0.023, "step": 103640 }, { - "epoch": 0.52, - "learning_rate": 0.000221560861909783, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.000259698637309769, + "loss": 0.0193, "step": 103650 }, { - "epoch": 0.52, - "learning_rate": 0.000221553294216769, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.00025969474909339754, + "loss": 0.0231, "step": 103660 }, { - "epoch": 0.52, - "learning_rate": 0.000221545726523755, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.00025969086087702605, + "loss": 0.0204, "step": 103670 }, { - "epoch": 0.52, - "learning_rate": 0.00022153815883074098, - "loss": 0.0144, + "epoch": 0.27, + "learning_rate": 0.0002596869726606546, + "loss": 0.0194, "step": 103680 }, { - "epoch": 0.52, - "learning_rate": 0.00022153059113772696, - "loss": 0.0126, + "epoch": 0.27, + "learning_rate": 0.00025968308444428314, + "loss": 0.0245, "step": 103690 }, { - "epoch": 0.52, - "learning_rate": 0.0002215230234447129, + "epoch": 0.27, + "learning_rate": 0.00025967919622791165, "loss": 0.0229, "step": 103700 }, { - "epoch": 0.52, - "learning_rate": 0.00022151545575169892, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.0002596753080115402, + "loss": 0.0213, "step": 103710 }, { - "epoch": 0.52, - "learning_rate": 0.0002215078880586849, - "loss": 0.0139, + "epoch": 0.27, + "learning_rate": 0.00025967141979516873, + "loss": 0.0242, "step": 103720 }, { - "epoch": 0.52, - "learning_rate": 0.00022150032036567088, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002596675315787973, + "loss": 0.0221, "step": 103730 }, { - "epoch": 0.52, - "learning_rate": 0.0002214927526726569, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002596636433624258, + "loss": 0.0292, "step": 103740 }, { - "epoch": 0.52, - "learning_rate": 0.00022148518497964287, - "loss": 0.0144, + "epoch": 0.27, + "learning_rate": 0.00025965975514605433, + "loss": 0.0289, "step": 103750 }, { - "epoch": 0.52, - "learning_rate": 0.00022147761728662886, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025965586692968285, + "loss": 0.0242, "step": 103760 }, { - "epoch": 0.52, - "learning_rate": 0.00022147004959361484, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.0002596519787133114, + "loss": 0.0205, "step": 103770 }, { - "epoch": 0.52, - "learning_rate": 0.00022146248190060085, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.00025964809049693993, + "loss": 0.0193, "step": 103780 }, { - "epoch": 0.52, - "learning_rate": 0.00022145491420758683, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002596442022805685, + "loss": 0.0229, "step": 103790 }, { - "epoch": 0.52, - "learning_rate": 0.0002214473465145728, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.000259640314064197, + "loss": 0.0211, "step": 103800 }, { - "epoch": 0.52, - "learning_rate": 0.00022143977882155882, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002596364258478256, + "loss": 0.0227, "step": 103810 }, { - "epoch": 0.52, - "learning_rate": 0.0002214322111285448, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002596325376314541, + "loss": 0.0283, "step": 103820 }, { - "epoch": 0.52, - "learning_rate": 0.00022142464343553078, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.0002596286494150826, + "loss": 0.02, "step": 103830 }, { - "epoch": 0.52, - "learning_rate": 0.0002214170757425168, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002596247611987111, + "loss": 0.0248, "step": 103840 }, { - "epoch": 0.52, - "learning_rate": 0.00022140950804950277, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002596208729823397, + "loss": 0.022, "step": 103850 }, { - "epoch": 0.52, - "learning_rate": 0.00022140194035648875, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025961698476596826, + "loss": 0.026, "step": 103860 }, { - "epoch": 0.52, - "learning_rate": 0.00022139437266347476, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.0002596130965495968, + "loss": 0.0227, "step": 103870 }, { - "epoch": 0.52, - "learning_rate": 0.00022138680497046074, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002596092083332253, + "loss": 0.0201, "step": 103880 }, { - "epoch": 0.52, - "learning_rate": 0.00022137923727744672, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025960532011685386, + "loss": 0.0211, "step": 103890 }, { - "epoch": 0.52, - "learning_rate": 0.00022137166958443273, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002596014319004824, + "loss": 0.0245, "step": 103900 }, { - "epoch": 0.52, - "learning_rate": 0.0002213641018914187, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.0002595975436841109, + "loss": 0.0263, "step": 103910 }, { - "epoch": 0.52, - "learning_rate": 0.0002213565341984047, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.00025959365546773946, + "loss": 0.0287, "step": 103920 }, { - "epoch": 0.52, - "learning_rate": 0.0002213489665053907, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.000259589767251368, + "loss": 0.0211, "step": 103930 }, { - "epoch": 0.52, - "learning_rate": 0.00022134139881237668, - "loss": 0.0125, + "epoch": 0.27, + "learning_rate": 0.00025958587903499654, + "loss": 0.0261, "step": 103940 }, { - "epoch": 0.52, - "learning_rate": 0.00022133383111936267, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00025958199081862506, + "loss": 0.022, "step": 103950 }, { - "epoch": 0.52, - "learning_rate": 0.00022132626342634865, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025957810260225357, + "loss": 0.0207, "step": 103960 }, { - "epoch": 0.52, - "learning_rate": 0.00022131869573333466, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002595742143858821, + "loss": 0.0229, "step": 103970 }, { - "epoch": 0.52, - "learning_rate": 0.00022131112804032064, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025957032616951065, + "loss": 0.0238, "step": 103980 }, { - "epoch": 0.52, - "learning_rate": 0.00022130356034730662, - "loss": 0.0114, + "epoch": 0.27, + "learning_rate": 0.00025956643795313917, + "loss": 0.0224, "step": 103990 }, { - "epoch": 0.52, - "learning_rate": 0.00022129599265429263, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.00025956254973676774, + "loss": 0.0207, "step": 104000 }, { - "epoch": 0.52, - "eval_cer": 0.9145071309559275, - "eval_loss": 0.01152227446436882, - "eval_runtime": 116.6853, - "eval_samples_per_second": 17.14, - "eval_steps_per_second": 4.285, + "epoch": 0.27, + "eval_cer": 0.8818706427552693, + "eval_loss": 0.01605622097849846, + "eval_runtime": 108.0768, + "eval_samples_per_second": 18.505, + "eval_steps_per_second": 4.626, "step": 104000 }, { - "epoch": 0.52, - "learning_rate": 0.0002212884249612786, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00025955866152039625, + "loss": 0.0184, "step": 104010 }, { - "epoch": 0.52, - "learning_rate": 0.0002212808572682646, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.0002595547733040248, + "loss": 0.0211, "step": 104020 }, { - "epoch": 0.52, - "learning_rate": 0.0002212732895752506, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00025955088508765334, + "loss": 0.0221, "step": 104030 }, { - "epoch": 0.52, - "learning_rate": 0.00022126572188223658, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025954699687128185, + "loss": 0.0233, "step": 104040 }, { - "epoch": 0.52, - "learning_rate": 0.00022125815418922256, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002595431086549104, + "loss": 0.0246, "step": 104050 }, { - "epoch": 0.52, - "learning_rate": 0.00022125058649620857, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.00025953922043853893, + "loss": 0.0202, "step": 104060 }, { - "epoch": 0.53, - "learning_rate": 0.00022124301880319455, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002595353322221675, + "loss": 0.028, "step": 104070 }, { - "epoch": 0.53, - "learning_rate": 0.00022123545111018053, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.000259531444005796, + "loss": 0.0202, "step": 104080 }, { - "epoch": 0.53, - "learning_rate": 0.00022122788341716654, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.00025952755578942453, + "loss": 0.0262, "step": 104090 }, { - "epoch": 0.53, - "learning_rate": 0.00022122031572415252, - "loss": 0.0135, + "epoch": 0.27, + "learning_rate": 0.0002595236675730531, + "loss": 0.0242, "step": 104100 }, { - "epoch": 0.53, - "learning_rate": 0.0002212127480311385, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.0002595197793566816, + "loss": 0.0228, "step": 104110 }, { - "epoch": 0.53, - "learning_rate": 0.0002212051803381245, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00025951589114031013, + "loss": 0.0226, "step": 104120 }, { - "epoch": 0.53, - "learning_rate": 0.0002211976126451105, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.0002595120029239387, + "loss": 0.0183, "step": 104130 }, { - "epoch": 0.53, - "learning_rate": 0.00022119004495209648, - "loss": 0.0179, + "epoch": 0.27, + "learning_rate": 0.0002595081147075672, + "loss": 0.0297, "step": 104140 }, { - "epoch": 0.53, - "learning_rate": 0.00022118247725908246, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002595042264911958, + "loss": 0.0289, "step": 104150 }, { - "epoch": 0.53, - "learning_rate": 0.00022117490956606847, - "loss": 0.0132, + "epoch": 0.27, + "learning_rate": 0.0002595003382748243, + "loss": 0.0192, "step": 104160 }, { - "epoch": 0.53, - "learning_rate": 0.00022116734187305445, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002594964500584528, + "loss": 0.0206, "step": 104170 }, { - "epoch": 0.53, - "learning_rate": 0.00022115977418004043, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002594925618420814, + "loss": 0.0242, "step": 104180 }, { - "epoch": 0.53, - "learning_rate": 0.00022115220648702644, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002594886736257099, + "loss": 0.0188, "step": 104190 }, { - "epoch": 0.53, - "learning_rate": 0.00022114463879401242, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025948478540933846, + "loss": 0.0211, "step": 104200 }, { - "epoch": 0.53, - "learning_rate": 0.0002211370711009984, - "loss": 0.0234, + "epoch": 0.27, + "learning_rate": 0.000259480897192967, + "loss": 0.0196, "step": 104210 }, { - "epoch": 0.53, - "learning_rate": 0.0002211295034079844, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.0002594770089765955, + "loss": 0.0242, "step": 104220 }, { - "epoch": 0.53, - "learning_rate": 0.0002211219357149704, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.00025947312076022406, + "loss": 0.0237, "step": 104230 }, { - "epoch": 0.53, - "learning_rate": 0.00022111436802195637, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002594692325438526, + "loss": 0.0244, "step": 104240 }, { - "epoch": 0.53, - "learning_rate": 0.00022110680032894238, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.0002594653443274811, + "loss": 0.0178, "step": 104250 }, { - "epoch": 0.53, - "learning_rate": 0.00022109923263592836, - "loss": 0.0144, + "epoch": 0.27, + "learning_rate": 0.00025946145611110966, + "loss": 0.0218, "step": 104260 }, { - "epoch": 0.53, - "learning_rate": 0.00022109166494291434, - "loss": 0.0125, + "epoch": 0.27, + "learning_rate": 0.00025945756789473817, + "loss": 0.0218, "step": 104270 }, { - "epoch": 0.53, - "learning_rate": 0.00022108409724990033, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025945367967836674, + "loss": 0.0248, "step": 104280 }, { - "epoch": 0.53, - "learning_rate": 0.00022107652955688633, - "loss": 0.0124, + "epoch": 0.27, + "learning_rate": 0.00025944979146199526, + "loss": 0.0276, "step": 104290 }, { - "epoch": 0.53, - "learning_rate": 0.00022106896186387232, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.00025944590324562377, + "loss": 0.021, "step": 104300 }, { - "epoch": 0.53, - "learning_rate": 0.0002210613941708583, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025944201502925234, + "loss": 0.026, "step": 104310 }, { - "epoch": 0.53, - "learning_rate": 0.0002210538264778443, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.00025943812681288085, + "loss": 0.0212, "step": 104320 }, { - "epoch": 0.53, - "learning_rate": 0.0002210462587848303, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025943423859650937, + "loss": 0.022, "step": 104330 }, { - "epoch": 0.53, - "learning_rate": 0.00022103869109181627, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.00025943035038013794, + "loss": 0.0201, "step": 104340 }, { - "epoch": 0.53, - "learning_rate": 0.00022103112339880228, - "loss": 0.0202, + "epoch": 0.27, + "learning_rate": 0.0002594264621637665, + "loss": 0.0268, "step": 104350 }, { - "epoch": 0.53, - "learning_rate": 0.00022102355570578826, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.000259422573947395, + "loss": 0.0214, "step": 104360 }, { - "epoch": 0.53, - "learning_rate": 0.00022101598801277424, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.00025941868573102353, + "loss": 0.0221, "step": 104370 }, { - "epoch": 0.53, - "learning_rate": 0.00022100842031976025, - "loss": 0.0135, + "epoch": 0.27, + "learning_rate": 0.00025941479751465205, + "loss": 0.0212, "step": 104380 }, { - "epoch": 0.53, - "learning_rate": 0.00022100085262674623, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002594109092982806, + "loss": 0.0234, "step": 104390 }, { - "epoch": 0.53, - "learning_rate": 0.0002209932849337322, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.00025940702108190913, + "loss": 0.0228, "step": 104400 }, { - "epoch": 0.53, - "learning_rate": 0.00022098571724071822, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002594031328655377, + "loss": 0.021, "step": 104410 }, { - "epoch": 0.53, - "learning_rate": 0.0002209781495477042, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.0002593992446491662, + "loss": 0.0208, "step": 104420 }, { - "epoch": 0.53, - "learning_rate": 0.00022097058185469018, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002593953564327948, + "loss": 0.0237, "step": 104430 }, { - "epoch": 0.53, - "learning_rate": 0.0002209630141616762, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002593914682164233, + "loss": 0.0283, "step": 104440 }, { - "epoch": 0.53, - "learning_rate": 0.00022095544646866217, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.0002593875800000518, + "loss": 0.0163, "step": 104450 }, { - "epoch": 0.53, - "learning_rate": 0.00022094787877564815, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025938369178368033, + "loss": 0.0202, "step": 104460 }, { - "epoch": 0.53, - "learning_rate": 0.00022094031108263414, - "loss": 0.0214, + "epoch": 0.27, + "learning_rate": 0.0002593798035673089, + "loss": 0.0197, "step": 104470 }, { - "epoch": 0.53, - "learning_rate": 0.00022093274338962014, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002593759153509374, + "loss": 0.0176, "step": 104480 }, { - "epoch": 0.53, - "learning_rate": 0.00022092517569660613, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.000259372027134566, + "loss": 0.0226, "step": 104490 }, { - "epoch": 0.53, - "learning_rate": 0.0002209176080035921, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.0002593681389181945, + "loss": 0.019, "step": 104500 }, { - "epoch": 0.53, - "learning_rate": 0.00022091004031057812, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.000259364250701823, + "loss": 0.0245, "step": 104510 }, { - "epoch": 0.53, - "learning_rate": 0.0002209024726175641, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.0002593603624854516, + "loss": 0.0179, "step": 104520 }, { - "epoch": 0.53, - "learning_rate": 0.00022089490492455008, - "loss": 0.0137, + "epoch": 0.27, + "learning_rate": 0.0002593564742690801, + "loss": 0.0228, "step": 104530 }, { - "epoch": 0.53, - "learning_rate": 0.0002208873372315361, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.0002593525860527086, + "loss": 0.0245, "step": 104540 }, { - "epoch": 0.53, - "learning_rate": 0.00022087976953852207, - "loss": 0.0167, + "epoch": 0.27, + "learning_rate": 0.0002593486978363372, + "loss": 0.0224, "step": 104550 }, { - "epoch": 0.53, - "learning_rate": 0.00022087220184550805, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.00025934480961996574, + "loss": 0.018, "step": 104560 }, { - "epoch": 0.53, - "learning_rate": 0.00022086463415249406, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.00025934092140359426, + "loss": 0.0235, "step": 104570 }, { - "epoch": 0.53, - "learning_rate": 0.00022085706645948004, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.0002593370331872228, + "loss": 0.0226, "step": 104580 }, { - "epoch": 0.53, - "learning_rate": 0.00022084949876646602, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002593331449708513, + "loss": 0.0219, "step": 104590 }, { - "epoch": 0.53, - "learning_rate": 0.00022084193107345203, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025932925675447986, + "loss": 0.0183, "step": 104600 }, { - "epoch": 0.53, - "learning_rate": 0.000220834363380438, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.00025932536853810837, + "loss": 0.0246, "step": 104610 }, { - "epoch": 0.53, - "learning_rate": 0.000220826795687424, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.00025932148032173694, + "loss": 0.0213, "step": 104620 }, { - "epoch": 0.53, - "learning_rate": 0.00022081922799440997, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.00025931759210536545, + "loss": 0.022, "step": 104630 }, { - "epoch": 0.53, - "learning_rate": 0.00022081166030139598, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.000259313703888994, + "loss": 0.0248, "step": 104640 }, { - "epoch": 0.53, - "learning_rate": 0.00022080409260838196, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.00025930981567262254, + "loss": 0.0233, "step": 104650 }, { - "epoch": 0.53, - "learning_rate": 0.00022079652491536795, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.00025930592745625105, + "loss": 0.0218, "step": 104660 }, { - "epoch": 0.53, - "learning_rate": 0.00022078895722235395, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025930203923987957, + "loss": 0.0231, "step": 104670 }, { - "epoch": 0.53, - "learning_rate": 0.00022078138952933994, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00025929815102350814, + "loss": 0.0208, "step": 104680 }, { - "epoch": 0.53, - "learning_rate": 0.00022077382183632592, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.00025929426280713665, + "loss": 0.0179, "step": 104690 }, { - "epoch": 0.53, - "learning_rate": 0.00022076625414331193, - "loss": 0.0147, + "epoch": 0.27, + "learning_rate": 0.0002592903745907652, + "loss": 0.022, "step": 104700 }, { - "epoch": 0.53, - "learning_rate": 0.0002207586864502979, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.00025928648637439373, + "loss": 0.0231, "step": 104710 }, { - "epoch": 0.53, - "learning_rate": 0.0002207511187572839, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.00025928259815802225, + "loss": 0.0225, "step": 104720 }, { - "epoch": 0.53, - "learning_rate": 0.0002207435510642699, - "loss": 0.019, + "epoch": 0.27, + "learning_rate": 0.0002592787099416508, + "loss": 0.0278, "step": 104730 }, { - "epoch": 0.53, - "learning_rate": 0.00022073598337125588, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.00025927482172527933, + "loss": 0.0204, "step": 104740 }, { - "epoch": 0.53, - "learning_rate": 0.00022072841567824186, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002592709335089079, + "loss": 0.0194, "step": 104750 }, { - "epoch": 0.53, - "learning_rate": 0.00022072084798522787, - "loss": 0.0176, + "epoch": 0.27, + "learning_rate": 0.0002592670452925364, + "loss": 0.0254, "step": 104760 }, { - "epoch": 0.53, - "learning_rate": 0.00022071328029221385, - "loss": 0.012, + "epoch": 0.27, + "learning_rate": 0.000259263157076165, + "loss": 0.0322, "step": 104770 }, { - "epoch": 0.53, - "learning_rate": 0.00022070571259919983, - "loss": 0.013, + "epoch": 0.27, + "learning_rate": 0.0002592592688597935, + "loss": 0.0241, "step": 104780 }, { - "epoch": 0.53, - "learning_rate": 0.0002206981449061858, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.000259255380643422, + "loss": 0.02, "step": 104790 }, { - "epoch": 0.53, - "learning_rate": 0.00022069057721317182, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.0002592514924270505, + "loss": 0.0224, "step": 104800 }, { - "epoch": 0.53, - "learning_rate": 0.0002206830095201578, - "loss": 0.0211, + "epoch": 0.27, + "learning_rate": 0.0002592476042106791, + "loss": 0.025, "step": 104810 }, { - "epoch": 0.53, - "learning_rate": 0.00022067544182714378, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002592437159943076, + "loss": 0.025, "step": 104820 }, { - "epoch": 0.53, - "learning_rate": 0.0002206678741341298, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.0002592398277779362, + "loss": 0.0223, "step": 104830 }, { - "epoch": 0.53, - "learning_rate": 0.00022066030644111577, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.0002592359395615647, + "loss": 0.0234, "step": 104840 }, { - "epoch": 0.53, - "learning_rate": 0.00022065273874810176, - "loss": 0.0184, + "epoch": 0.27, + "learning_rate": 0.00025923205134519326, + "loss": 0.019, "step": 104850 }, { - "epoch": 0.53, - "learning_rate": 0.00022064517105508776, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.0002592281631288218, + "loss": 0.0263, "step": 104860 }, { - "epoch": 0.53, - "learning_rate": 0.00022063760336207375, - "loss": 0.0152, + "epoch": 0.27, + "learning_rate": 0.0002592242749124503, + "loss": 0.0286, "step": 104870 }, { - "epoch": 0.53, - "learning_rate": 0.00022063003566905973, - "loss": 0.0127, + "epoch": 0.27, + "learning_rate": 0.0002592203866960788, + "loss": 0.0264, "step": 104880 }, { - "epoch": 0.53, - "learning_rate": 0.00022062246797604574, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002592164984797074, + "loss": 0.0244, "step": 104890 }, { - "epoch": 0.53, - "learning_rate": 0.00022061490028303172, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.00025921261026333594, + "loss": 0.0249, "step": 104900 }, { - "epoch": 0.53, - "learning_rate": 0.0002206073325900177, - "loss": 0.0136, + "epoch": 0.27, + "learning_rate": 0.00025920872204696446, + "loss": 0.0239, "step": 104910 }, { - "epoch": 0.53, - "learning_rate": 0.0002205997648970037, - "loss": 0.0136, + "epoch": 0.27, + "learning_rate": 0.00025920483383059297, + "loss": 0.0215, "step": 104920 }, { - "epoch": 0.53, - "learning_rate": 0.0002205921972039897, - "loss": 0.0199, + "epoch": 0.27, + "learning_rate": 0.00025920094561422154, + "loss": 0.0195, "step": 104930 }, { - "epoch": 0.53, - "learning_rate": 0.00022058462951097567, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025919705739785006, + "loss": 0.0241, "step": 104940 }, { - "epoch": 0.53, - "learning_rate": 0.00022057706181796165, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.00025919316918147857, + "loss": 0.0228, "step": 104950 }, { - "epoch": 0.53, - "learning_rate": 0.00022056949412494763, - "loss": 0.0142, + "epoch": 0.27, + "learning_rate": 0.00025918928096510714, + "loss": 0.0248, "step": 104960 }, { - "epoch": 0.53, - "learning_rate": 0.00022056192643193361, - "loss": 0.013, + "epoch": 0.27, + "learning_rate": 0.00025918539274873565, + "loss": 0.0211, "step": 104970 }, { - "epoch": 0.53, - "learning_rate": 0.0002205543587389196, - "loss": 0.0197, + "epoch": 0.27, + "learning_rate": 0.0002591815045323642, + "loss": 0.0212, "step": 104980 }, { - "epoch": 0.53, - "learning_rate": 0.0002205467910459056, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.00025917761631599274, + "loss": 0.0263, "step": 104990 }, { - "epoch": 0.53, - "learning_rate": 0.00022053922335289159, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.00025917372809962125, + "loss": 0.029, "step": 105000 }, { - "epoch": 0.53, - "eval_cer": 0.9144848118450433, - "eval_loss": 0.011399283073842525, - "eval_runtime": 116.6482, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.286, + "epoch": 0.27, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.01607823558151722, + "eval_runtime": 108.0567, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, "step": 105000 }, { - "epoch": 0.53, - "learning_rate": 0.00022053165565987757, - "loss": 0.0184, + "epoch": 0.27, + "learning_rate": 0.00025916983988324977, + "loss": 0.0226, "step": 105010 }, { - "epoch": 0.53, - "learning_rate": 0.00022052408796686355, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025916595166687833, + "loss": 0.0231, "step": 105020 }, { - "epoch": 0.53, - "learning_rate": 0.00022051652027384956, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.00025916206345050685, + "loss": 0.0302, "step": 105030 }, { - "epoch": 0.53, - "learning_rate": 0.00022050895258083554, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.0002591581752341354, + "loss": 0.02, "step": 105040 }, { - "epoch": 0.53, - "learning_rate": 0.00022050138488782152, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.00025915428701776393, + "loss": 0.0235, "step": 105050 }, { - "epoch": 0.53, - "learning_rate": 0.00022049381719480753, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.0002591503988013925, + "loss": 0.0243, "step": 105060 }, { - "epoch": 0.53, - "learning_rate": 0.0002204862495017935, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.000259146510585021, + "loss": 0.0219, "step": 105070 }, { - "epoch": 0.53, - "learning_rate": 0.0002204786818087795, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.00025914262236864953, + "loss": 0.0244, "step": 105080 }, { - "epoch": 0.53, - "learning_rate": 0.0002204711141157655, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.00025913873415227804, + "loss": 0.0231, "step": 105090 }, { - "epoch": 0.53, - "learning_rate": 0.00022046354642275148, - "loss": 0.0233, + "epoch": 0.27, + "learning_rate": 0.0002591348459359066, + "loss": 0.0244, "step": 105100 }, { - "epoch": 0.53, - "learning_rate": 0.00022045597872973746, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002591309577195352, + "loss": 0.0199, "step": 105110 }, { - "epoch": 0.53, - "learning_rate": 0.00022044841103672347, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002591270695031637, + "loss": 0.0269, "step": 105120 }, { - "epoch": 0.53, - "learning_rate": 0.00022044084334370945, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002591231812867922, + "loss": 0.0225, "step": 105130 }, { - "epoch": 0.53, - "learning_rate": 0.00022043327565069543, - "loss": 0.0185, + "epoch": 0.27, + "learning_rate": 0.0002591192930704208, + "loss": 0.0226, "step": 105140 }, { - "epoch": 0.53, - "learning_rate": 0.00022042570795768144, - "loss": 0.0161, + "epoch": 0.27, + "learning_rate": 0.0002591154048540493, + "loss": 0.0216, "step": 105150 }, { - "epoch": 0.53, - "learning_rate": 0.00022041814026466742, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.0002591115166376778, + "loss": 0.0258, "step": 105160 }, { - "epoch": 0.53, - "learning_rate": 0.0002204105725716534, - "loss": 0.0132, + "epoch": 0.27, + "learning_rate": 0.0002591076284213064, + "loss": 0.0206, "step": 105170 }, { - "epoch": 0.53, - "learning_rate": 0.0002204030048786394, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.0002591037402049349, + "loss": 0.0167, "step": 105180 }, { - "epoch": 0.53, - "learning_rate": 0.0002203954371856254, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.00025909985198856346, + "loss": 0.0209, "step": 105190 }, { - "epoch": 0.53, - "learning_rate": 0.00022038786949261138, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.000259095963772192, + "loss": 0.0213, "step": 105200 }, { - "epoch": 0.53, - "learning_rate": 0.00022038030179959736, - "loss": 0.018, + "epoch": 0.27, + "learning_rate": 0.0002590920755558205, + "loss": 0.0249, "step": 105210 }, { - "epoch": 0.53, - "learning_rate": 0.00022037273410658337, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.000259088187339449, + "loss": 0.0194, "step": 105220 }, { - "epoch": 0.53, - "learning_rate": 0.00022036516641356935, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002590842991230776, + "loss": 0.021, "step": 105230 }, { - "epoch": 0.53, - "learning_rate": 0.00022035759872055533, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.00025908041090670614, + "loss": 0.0155, "step": 105240 }, { - "epoch": 0.53, - "learning_rate": 0.00022035003102754134, - "loss": 0.0138, + "epoch": 0.27, + "learning_rate": 0.00025907652269033466, + "loss": 0.0196, "step": 105250 }, { - "epoch": 0.53, - "learning_rate": 0.00022034246333452732, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025907263447396317, + "loss": 0.0219, "step": 105260 }, { - "epoch": 0.53, - "learning_rate": 0.0002203348956415133, - "loss": 0.0154, + "epoch": 0.27, + "learning_rate": 0.00025906874625759174, + "loss": 0.0184, "step": 105270 }, { - "epoch": 0.53, - "learning_rate": 0.0002203273279484993, - "loss": 0.0162, + "epoch": 0.27, + "learning_rate": 0.00025906485804122025, + "loss": 0.0233, "step": 105280 }, { - "epoch": 0.53, - "learning_rate": 0.0002203197602554853, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.00025906096982484877, + "loss": 0.027, "step": 105290 }, { - "epoch": 0.53, - "learning_rate": 0.00022031219256247127, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025905708160847734, + "loss": 0.0251, "step": 105300 }, { - "epoch": 0.53, - "learning_rate": 0.00022030462486945728, - "loss": 0.0169, + "epoch": 0.27, + "learning_rate": 0.00025905319339210585, + "loss": 0.0178, "step": 105310 }, { - "epoch": 0.53, - "learning_rate": 0.00022029705717644326, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002590493051757344, + "loss": 0.0208, "step": 105320 }, { - "epoch": 0.53, - "learning_rate": 0.00022028948948342924, - "loss": 0.017, + "epoch": 0.27, + "learning_rate": 0.00025904541695936294, + "loss": 0.0249, "step": 105330 }, { - "epoch": 0.53, - "learning_rate": 0.00022028192179041525, - "loss": 0.016, + "epoch": 0.27, + "learning_rate": 0.00025904152874299145, + "loss": 0.0219, "step": 105340 }, { - "epoch": 0.53, - "learning_rate": 0.00022027435409740123, - "loss": 0.0195, + "epoch": 0.27, + "learning_rate": 0.00025903764052662, + "loss": 0.0226, "step": 105350 }, { - "epoch": 0.53, - "learning_rate": 0.00022026678640438722, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.00025903375231024853, + "loss": 0.0244, "step": 105360 }, { - "epoch": 0.53, - "learning_rate": 0.0002202592187113732, - "loss": 0.0194, + "epoch": 0.27, + "learning_rate": 0.00025902986409387705, + "loss": 0.0237, "step": 105370 }, { - "epoch": 0.53, - "learning_rate": 0.0002202516510183592, - "loss": 0.0134, + "epoch": 0.27, + "learning_rate": 0.0002590259758775056, + "loss": 0.0231, "step": 105380 }, { - "epoch": 0.53, - "learning_rate": 0.0002202440833253452, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.0002590220876611342, + "loss": 0.0243, "step": 105390 }, { - "epoch": 0.53, - "learning_rate": 0.00022023651563233117, - "loss": 0.0136, + "epoch": 0.27, + "learning_rate": 0.0002590181994447627, + "loss": 0.0205, "step": 105400 }, { - "epoch": 0.53, - "learning_rate": 0.00022022894793931718, - "loss": 0.0141, + "epoch": 0.27, + "learning_rate": 0.0002590143112283912, + "loss": 0.023, "step": 105410 }, { - "epoch": 0.53, - "learning_rate": 0.00022022138024630316, - "loss": 0.0151, + "epoch": 0.27, + "learning_rate": 0.00025901042301201973, + "loss": 0.022, "step": 105420 }, { - "epoch": 0.53, - "learning_rate": 0.00022021381255328914, - "loss": 0.0143, + "epoch": 0.27, + "learning_rate": 0.0002590065347956483, + "loss": 0.0213, "step": 105430 }, { - "epoch": 0.53, - "learning_rate": 0.00022020624486027515, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.0002590026465792768, + "loss": 0.0218, "step": 105440 }, { - "epoch": 0.53, - "learning_rate": 0.00022019867716726113, - "loss": 0.0214, + "epoch": 0.27, + "learning_rate": 0.0002589987583629054, + "loss": 0.0167, "step": 105450 }, { - "epoch": 0.53, - "learning_rate": 0.0002201911094742471, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.0002589948701465339, + "loss": 0.0178, "step": 105460 }, { - "epoch": 0.53, - "learning_rate": 0.00022018354178123312, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.0002589909819301624, + "loss": 0.0212, "step": 105470 }, { - "epoch": 0.53, - "learning_rate": 0.0002201759740882191, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.000258987093713791, + "loss": 0.0242, "step": 105480 }, { - "epoch": 0.53, - "learning_rate": 0.00022016840639520508, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.0002589832054974195, + "loss": 0.0238, "step": 105490 }, { - "epoch": 0.53, - "learning_rate": 0.0002201608387021911, - "loss": 0.0131, + "epoch": 0.27, + "learning_rate": 0.000258979317281048, + "loss": 0.0201, "step": 105500 }, { - "epoch": 0.53, - "learning_rate": 0.00022015327100917707, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002589754290646766, + "loss": 0.0201, "step": 105510 }, { - "epoch": 0.53, - "learning_rate": 0.00022014570331616305, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002589715408483051, + "loss": 0.0261, "step": 105520 }, { - "epoch": 0.53, - "learning_rate": 0.00022013813562314904, - "loss": 0.0125, + "epoch": 0.27, + "learning_rate": 0.00025896765263193366, + "loss": 0.0201, "step": 105530 }, { - "epoch": 0.53, - "learning_rate": 0.00022013056793013504, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.0002589637644155622, + "loss": 0.02, "step": 105540 }, { - "epoch": 0.53, - "learning_rate": 0.00022012300023712103, - "loss": 0.0188, + "epoch": 0.27, + "learning_rate": 0.0002589598761991907, + "loss": 0.0218, "step": 105550 }, { - "epoch": 0.53, - "learning_rate": 0.000220115432544107, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025895598798281926, + "loss": 0.0228, "step": 105560 }, { - "epoch": 0.53, - "learning_rate": 0.00022010786485109302, - "loss": 0.0173, + "epoch": 0.27, + "learning_rate": 0.00025895209976644777, + "loss": 0.0232, "step": 105570 }, { - "epoch": 0.53, - "learning_rate": 0.000220100297158079, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002589482115500763, + "loss": 0.0205, "step": 105580 }, { - "epoch": 0.53, - "learning_rate": 0.00022009272946506498, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.00025894432333370486, + "loss": 0.0214, "step": 105590 }, { - "epoch": 0.53, - "learning_rate": 0.000220085161772051, - "loss": 0.0187, + "epoch": 0.27, + "learning_rate": 0.0002589404351173334, + "loss": 0.0217, "step": 105600 }, { - "epoch": 0.53, - "learning_rate": 0.00022007759407903697, - "loss": 0.0186, + "epoch": 0.27, + "learning_rate": 0.00025893654690096194, + "loss": 0.0203, "step": 105610 }, { - "epoch": 0.53, - "learning_rate": 0.00022007002638602295, - "loss": 0.0146, + "epoch": 0.27, + "learning_rate": 0.00025893265868459045, + "loss": 0.0192, "step": 105620 }, { - "epoch": 0.53, - "learning_rate": 0.00022006245869300896, - "loss": 0.0139, + "epoch": 0.27, + "learning_rate": 0.00025892877046821897, + "loss": 0.0302, "step": 105630 }, { - "epoch": 0.53, - "learning_rate": 0.00022005489099999494, - "loss": 0.0125, + "epoch": 0.27, + "learning_rate": 0.00025892488225184754, + "loss": 0.0219, "step": 105640 }, { - "epoch": 0.53, - "learning_rate": 0.00022004732330698092, - "loss": 0.0139, + "epoch": 0.27, + "learning_rate": 0.00025892099403547605, + "loss": 0.0284, "step": 105650 }, { - "epoch": 0.53, - "learning_rate": 0.00022003975561396693, - "loss": 0.0158, + "epoch": 0.27, + "learning_rate": 0.0002589171058191046, + "loss": 0.0227, "step": 105660 }, { - "epoch": 0.53, - "learning_rate": 0.0002200321879209529, - "loss": 0.0153, + "epoch": 0.27, + "learning_rate": 0.00025891321760273313, + "loss": 0.0287, "step": 105670 }, { - "epoch": 0.53, - "learning_rate": 0.0002200246202279389, - "loss": 0.0165, + "epoch": 0.27, + "learning_rate": 0.0002589093293863617, + "loss": 0.0239, "step": 105680 }, { - "epoch": 0.53, - "learning_rate": 0.00022001705253492487, - "loss": 0.0164, + "epoch": 0.27, + "learning_rate": 0.0002589054411699902, + "loss": 0.0215, "step": 105690 }, { - "epoch": 0.53, - "learning_rate": 0.00022000948484191088, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.00025890155295361873, + "loss": 0.0226, "step": 105700 }, { - "epoch": 0.53, - "learning_rate": 0.00022000191714889686, - "loss": 0.0166, + "epoch": 0.27, + "learning_rate": 0.00025889766473724725, + "loss": 0.0244, "step": 105710 }, { - "epoch": 0.53, - "learning_rate": 0.00021999434945588285, - "loss": 0.0141, + "epoch": 0.27, + "learning_rate": 0.0002588937765208758, + "loss": 0.024, "step": 105720 }, { - "epoch": 0.53, - "learning_rate": 0.00021998678176286885, - "loss": 0.0182, + "epoch": 0.27, + "learning_rate": 0.00025888988830450433, + "loss": 0.0263, "step": 105730 }, { - "epoch": 0.53, - "learning_rate": 0.00021997921406985484, - "loss": 0.0159, + "epoch": 0.27, + "learning_rate": 0.0002588860000881329, + "loss": 0.0243, "step": 105740 }, { - "epoch": 0.53, - "learning_rate": 0.00021997164637684082, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002588821118717614, + "loss": 0.0243, "step": 105750 }, { - "epoch": 0.53, - "learning_rate": 0.00021996407868382683, - "loss": 0.0137, + "epoch": 0.27, + "learning_rate": 0.00025887822365538993, + "loss": 0.0187, "step": 105760 }, { - "epoch": 0.53, - "learning_rate": 0.0002199565109908128, - "loss": 0.0157, + "epoch": 0.27, + "learning_rate": 0.0002588743354390185, + "loss": 0.0284, "step": 105770 }, { - "epoch": 0.53, - "learning_rate": 0.0002199489432977988, - "loss": 0.0184, + "epoch": 0.27, + "learning_rate": 0.000258870447222647, + "loss": 0.0211, "step": 105780 }, { - "epoch": 0.53, - "learning_rate": 0.0002199413756047848, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.0002588665590062756, + "loss": 0.0202, "step": 105790 }, { - "epoch": 0.53, - "learning_rate": 0.00021993380791177078, - "loss": 0.0133, + "epoch": 0.27, + "learning_rate": 0.0002588626707899041, + "loss": 0.0195, "step": 105800 }, { - "epoch": 0.53, - "learning_rate": 0.00021992624021875676, - "loss": 0.021, + "epoch": 0.27, + "learning_rate": 0.00025885878257353266, + "loss": 0.1621, "step": 105810 }, { - "epoch": 0.53, - "learning_rate": 0.00021991867252574277, - "loss": 0.0119, + "epoch": 0.27, + "learning_rate": 0.0002588548943571612, + "loss": 0.0283, "step": 105820 }, { - "epoch": 0.53, - "learning_rate": 0.00021991110483272875, - "loss": 0.013, + "epoch": 0.27, + "learning_rate": 0.0002588510061407897, + "loss": 0.0251, "step": 105830 }, { - "epoch": 0.53, - "learning_rate": 0.00021990353713971473, - "loss": 0.0163, + "epoch": 0.27, + "learning_rate": 0.0002588471179244182, + "loss": 0.027, "step": 105840 }, { - "epoch": 0.53, - "learning_rate": 0.0002198959694467007, - "loss": 0.0225, + "epoch": 0.27, + "learning_rate": 0.0002588432297080468, + "loss": 0.0229, "step": 105850 }, { - "epoch": 0.53, - "learning_rate": 0.00021988840175368672, - "loss": 0.0149, + "epoch": 0.27, + "learning_rate": 0.0002588393414916753, + "loss": 0.0342, "step": 105860 }, { - "epoch": 0.53, - "learning_rate": 0.0002198808340606727, - "loss": 0.0129, + "epoch": 0.27, + "learning_rate": 0.00025883545327530386, + "loss": 0.0246, "step": 105870 }, { - "epoch": 0.53, - "learning_rate": 0.00021987326636765868, - "loss": 0.0191, + "epoch": 0.27, + "learning_rate": 0.00025883156505893237, + "loss": 0.0222, "step": 105880 }, { - "epoch": 0.53, - "learning_rate": 0.0002198656986746447, - "loss": 0.0123, + "epoch": 0.27, + "learning_rate": 0.00025882767684256094, + "loss": 0.023, "step": 105890 }, { - "epoch": 0.53, - "learning_rate": 0.00021985813098163067, - "loss": 0.0126, + "epoch": 0.27, + "learning_rate": 0.00025882378862618946, + "loss": 0.0236, "step": 105900 }, { - "epoch": 0.53, - "learning_rate": 0.00021985056328861666, - "loss": 0.0144, + "epoch": 0.27, + "learning_rate": 0.00025881990040981797, + "loss": 0.0262, "step": 105910 }, { - "epoch": 0.53, - "learning_rate": 0.00021984299559560266, - "loss": 0.0123, + "epoch": 0.27, + "learning_rate": 0.0002588160121934465, + "loss": 0.0186, "step": 105920 }, { - "epoch": 0.53, - "learning_rate": 0.00021983542790258865, - "loss": 0.0156, + "epoch": 0.27, + "learning_rate": 0.00025881212397707505, + "loss": 0.025, "step": 105930 }, { - "epoch": 0.53, - "learning_rate": 0.00021982786020957463, - "loss": 0.0114, + "epoch": 0.27, + "learning_rate": 0.0002588082357607036, + "loss": 0.0226, "step": 105940 }, { - "epoch": 0.53, - "learning_rate": 0.00021982029251656064, - "loss": 0.015, + "epoch": 0.27, + "learning_rate": 0.00025880434754433214, + "loss": 0.0217, "step": 105950 }, { - "epoch": 0.53, - "learning_rate": 0.00021981272482354662, - "loss": 0.0171, + "epoch": 0.27, + "learning_rate": 0.00025880045932796065, + "loss": 0.02, "step": 105960 }, { - "epoch": 0.53, - "learning_rate": 0.0002198051571305326, - "loss": 0.0175, + "epoch": 0.27, + "learning_rate": 0.00025879657111158917, + "loss": 0.0279, "step": 105970 }, { - "epoch": 0.53, - "learning_rate": 0.0002197975894375186, - "loss": 0.0168, + "epoch": 0.27, + "learning_rate": 0.00025879268289521774, + "loss": 0.029, "step": 105980 }, { - "epoch": 0.53, - "learning_rate": 0.0002197900217445046, - "loss": 0.0145, + "epoch": 0.27, + "learning_rate": 0.00025878879467884625, + "loss": 0.0252, "step": 105990 }, { - "epoch": 0.53, - "learning_rate": 0.00021978245405149057, - "loss": 0.02, + "epoch": 0.27, + "learning_rate": 0.0002587849064624748, + "loss": 0.0186, "step": 106000 }, { - "epoch": 0.53, - "eval_cer": 0.9144886934295449, - "eval_loss": 0.01085778046399355, - "eval_runtime": 116.7271, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.27, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.016281619668006897, + "eval_runtime": 107.9063, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, "step": 106000 }, { - "epoch": 0.53, - "learning_rate": 0.00021977488635847658, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025878101824610333, + "loss": 0.0226, "step": 106010 }, { - "epoch": 0.53, - "learning_rate": 0.00021976731866546256, - "loss": 0.0119, + "epoch": 0.27, + "learning_rate": 0.0002587771300297319, + "loss": 0.0201, "step": 106020 }, { - "epoch": 0.53, - "learning_rate": 0.00021975975097244854, - "loss": 0.0178, + "epoch": 0.27, + "learning_rate": 0.0002587732418133604, + "loss": 0.0224, "step": 106030 }, { - "epoch": 0.53, - "learning_rate": 0.00021975218327943452, - "loss": 0.0181, + "epoch": 0.27, + "learning_rate": 0.00025876935359698893, + "loss": 0.0183, "step": 106040 }, { - "epoch": 0.54, - "learning_rate": 0.00021974461558642053, - "loss": 0.0155, + "epoch": 0.27, + "learning_rate": 0.00025876546538061745, + "loss": 0.0205, "step": 106050 }, { - "epoch": 0.54, - "learning_rate": 0.0002197370478934065, - "loss": 0.0122, + "epoch": 0.27, + "learning_rate": 0.000258761577164246, + "loss": 0.0176, "step": 106060 }, { - "epoch": 0.54, - "learning_rate": 0.0002197294802003925, - "loss": 0.0148, + "epoch": 0.27, + "learning_rate": 0.00025875768894787453, + "loss": 0.0208, "step": 106070 }, { - "epoch": 0.54, - "learning_rate": 0.0002197219125073785, - "loss": 0.0172, + "epoch": 0.27, + "learning_rate": 0.0002587538007315031, + "loss": 0.0234, "step": 106080 }, { - "epoch": 0.54, - "learning_rate": 0.00021971434481436448, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002587499125151316, + "loss": 0.0255, "step": 106090 }, { - "epoch": 0.54, - "learning_rate": 0.00021970677712135047, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002587460242987602, + "loss": 0.022, "step": 106100 }, { - "epoch": 0.54, - "learning_rate": 0.00021969920942833647, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.0002587421360823887, + "loss": 0.0204, "step": 106110 }, { - "epoch": 0.54, - "learning_rate": 0.00021969164173532246, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002587382478660172, + "loss": 0.0262, "step": 106120 }, { - "epoch": 0.54, - "learning_rate": 0.00021968407404230844, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002587343596496457, + "loss": 0.0248, "step": 106130 }, { - "epoch": 0.54, - "learning_rate": 0.00021967650634929445, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002587304714332743, + "loss": 0.0177, "step": 106140 }, { - "epoch": 0.54, - "learning_rate": 0.00021966893865628043, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025872658321690286, + "loss": 0.022, "step": 106150 }, { - "epoch": 0.54, - "learning_rate": 0.0002196613709632664, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.0002587226950005314, + "loss": 0.0208, "step": 106160 }, { - "epoch": 0.54, - "learning_rate": 0.00021965380327025242, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.0002587188067841599, + "loss": 0.0206, "step": 106170 }, { - "epoch": 0.54, - "learning_rate": 0.0002196462355772384, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025871491856778846, + "loss": 0.0228, "step": 106180 }, { - "epoch": 0.54, - "learning_rate": 0.00021963866788422438, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.000258711030351417, + "loss": 0.0223, "step": 106190 }, { - "epoch": 0.54, - "learning_rate": 0.00021963110019121036, - "loss": 0.0139, + "epoch": 0.28, + "learning_rate": 0.0002587071421350455, + "loss": 0.0208, "step": 106200 }, { - "epoch": 0.54, - "learning_rate": 0.00021962353249819634, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.00025870325391867406, + "loss": 0.0219, "step": 106210 }, { - "epoch": 0.54, - "learning_rate": 0.00021961596480518232, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025869936570230257, + "loss": 0.0294, "step": 106220 }, { - "epoch": 0.54, - "learning_rate": 0.0002196083971121683, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025869547748593114, + "loss": 0.0223, "step": 106230 }, { - "epoch": 0.54, - "learning_rate": 0.0002196008294191543, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025869158926955965, + "loss": 0.0202, "step": 106240 }, { - "epoch": 0.54, - "learning_rate": 0.0002195932617261403, - "loss": 0.0126, + "epoch": 0.28, + "learning_rate": 0.00025868770105318817, + "loss": 0.0192, "step": 106250 }, { - "epoch": 0.54, - "learning_rate": 0.00021958569403312628, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.0002586838128368167, + "loss": 0.0159, "step": 106260 }, { - "epoch": 0.54, - "learning_rate": 0.00021957812634011226, - "loss": 0.012, + "epoch": 0.28, + "learning_rate": 0.00025867992462044525, + "loss": 0.0194, "step": 106270 }, { - "epoch": 0.54, - "learning_rate": 0.00021957055864709827, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.00025867603640407377, + "loss": 0.0178, "step": 106280 }, { - "epoch": 0.54, - "learning_rate": 0.00021956299095408425, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.00025867214818770234, + "loss": 0.0219, "step": 106290 }, { - "epoch": 0.54, - "learning_rate": 0.00021955542326107023, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025866825997133085, + "loss": 0.0237, "step": 106300 }, { - "epoch": 0.54, - "learning_rate": 0.00021954785556805624, - "loss": 0.0129, + "epoch": 0.28, + "learning_rate": 0.0002586643717549594, + "loss": 0.0208, "step": 106310 }, { - "epoch": 0.54, - "learning_rate": 0.00021954028787504222, - "loss": 0.012, + "epoch": 0.28, + "learning_rate": 0.00025866048353858793, + "loss": 0.024, "step": 106320 }, { - "epoch": 0.54, - "learning_rate": 0.0002195327201820282, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.00025865659532221645, + "loss": 0.0222, "step": 106330 }, { - "epoch": 0.54, - "learning_rate": 0.0002195251524890142, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.000258652707105845, + "loss": 0.0211, "step": 106340 }, { - "epoch": 0.54, - "learning_rate": 0.0002195175847960002, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.00025864881888947353, + "loss": 0.0209, "step": 106350 }, { - "epoch": 0.54, - "learning_rate": 0.00021951001710298617, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.0002586449306731021, + "loss": 0.0204, "step": 106360 }, { - "epoch": 0.54, - "learning_rate": 0.00021950244940997218, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.0002586410424567306, + "loss": 0.0217, "step": 106370 }, { - "epoch": 0.54, - "learning_rate": 0.00021949488171695816, - "loss": 0.0124, + "epoch": 0.28, + "learning_rate": 0.00025863715424035913, + "loss": 0.0173, "step": 106380 }, { - "epoch": 0.54, - "learning_rate": 0.00021948731402394414, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.0002586332660239877, + "loss": 0.0237, "step": 106390 }, { - "epoch": 0.54, - "learning_rate": 0.00021947974633093015, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002586293778076162, + "loss": 0.0216, "step": 106400 }, { - "epoch": 0.54, - "learning_rate": 0.00021947217863791613, - "loss": 0.0129, + "epoch": 0.28, + "learning_rate": 0.00025862548959124473, + "loss": 0.0207, "step": 106410 }, { - "epoch": 0.54, - "learning_rate": 0.00021946461094490212, - "loss": 0.0194, + "epoch": 0.28, + "learning_rate": 0.0002586216013748733, + "loss": 0.0204, "step": 106420 }, { - "epoch": 0.54, - "learning_rate": 0.0002194570432518881, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.00025861771315850186, + "loss": 0.0215, "step": 106430 }, { - "epoch": 0.54, - "learning_rate": 0.0002194494755588741, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.0002586138249421304, + "loss": 0.0244, "step": 106440 }, { - "epoch": 0.54, - "learning_rate": 0.0002194419078658601, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.0002586099367257589, + "loss": 0.0232, "step": 106450 }, { - "epoch": 0.54, - "learning_rate": 0.00021943434017284607, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002586060485093874, + "loss": 0.0292, "step": 106460 }, { - "epoch": 0.54, - "learning_rate": 0.00021942677247983208, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002586021602930159, + "loss": 0.0233, "step": 106470 }, { - "epoch": 0.54, - "learning_rate": 0.00021941920478681806, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.0002585982720766445, + "loss": 0.0212, "step": 106480 }, { - "epoch": 0.54, - "learning_rate": 0.00021941163709380404, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025859438386027306, + "loss": 0.022, "step": 106490 }, { - "epoch": 0.54, - "learning_rate": 0.00021940406940079005, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.0002585904956439016, + "loss": 0.0221, "step": 106500 }, { - "epoch": 0.54, - "learning_rate": 0.00021939650170777603, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002585866074275301, + "loss": 0.023, "step": 106510 }, { - "epoch": 0.54, - "learning_rate": 0.000219388934014762, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.00025858271921115866, + "loss": 0.0239, "step": 106520 }, { - "epoch": 0.54, - "learning_rate": 0.00021938136632174802, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025857883099478717, + "loss": 0.0247, "step": 106530 }, { - "epoch": 0.54, - "learning_rate": 0.000219373798628734, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.0002585749427784157, + "loss": 0.0191, "step": 106540 }, { - "epoch": 0.54, - "learning_rate": 0.00021936623093571998, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.00025857105456204426, + "loss": 0.0249, "step": 106550 }, { - "epoch": 0.54, - "learning_rate": 0.000219358663242706, - "loss": 0.0263, + "epoch": 0.28, + "learning_rate": 0.00025856716634567277, + "loss": 0.0228, "step": 106560 }, { - "epoch": 0.54, - "learning_rate": 0.00021935109554969197, - "loss": 0.0191, + "epoch": 0.28, + "learning_rate": 0.00025856327812930134, + "loss": 0.022, "step": 106570 }, { - "epoch": 0.54, - "learning_rate": 0.00021934352785667795, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025855938991292985, + "loss": 0.0259, "step": 106580 }, { - "epoch": 0.54, - "learning_rate": 0.00021933596016366394, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025855550169655837, + "loss": 0.0219, "step": 106590 }, { - "epoch": 0.54, - "learning_rate": 0.00021932839247064994, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.00025855161348018694, + "loss": 0.0226, "step": 106600 }, { - "epoch": 0.54, - "learning_rate": 0.00021932082477763593, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.00025854772526381545, + "loss": 0.0292, "step": 106610 }, { - "epoch": 0.54, - "learning_rate": 0.0002193132570846219, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.00025854383704744397, + "loss": 0.0251, "step": 106620 }, { - "epoch": 0.54, - "learning_rate": 0.00021930568939160792, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025853994883107253, + "loss": 0.025, "step": 106630 }, { - "epoch": 0.54, - "learning_rate": 0.0002192981216985939, - "loss": 0.012, + "epoch": 0.28, + "learning_rate": 0.0002585360606147011, + "loss": 0.0238, "step": 106640 }, { - "epoch": 0.54, - "learning_rate": 0.00021929055400557988, - "loss": 0.0155, + "epoch": 0.28, + "learning_rate": 0.0002585321723983296, + "loss": 0.0234, "step": 106650 }, { - "epoch": 0.54, - "learning_rate": 0.0002192829863125659, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025852828418195813, + "loss": 0.0202, "step": 106660 }, { - "epoch": 0.54, - "learning_rate": 0.00021927541861955187, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025852439596558665, + "loss": 0.0269, "step": 106670 }, { - "epoch": 0.54, - "learning_rate": 0.00021926785092653785, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002585205077492152, + "loss": 0.023, "step": 106680 }, { - "epoch": 0.54, - "learning_rate": 0.00021926028323352386, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.00025851661953284373, + "loss": 0.022, "step": 106690 }, { - "epoch": 0.54, - "learning_rate": 0.00021925271554050984, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002585127313164723, + "loss": 0.0244, "step": 106700 }, { - "epoch": 0.54, - "learning_rate": 0.00021924514784749582, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002585088431001008, + "loss": 0.0223, "step": 106710 }, { - "epoch": 0.54, - "learning_rate": 0.00021923758015448183, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.00025850495488372933, + "loss": 0.0187, "step": 106720 }, { - "epoch": 0.54, - "learning_rate": 0.0002192300124614678, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.0002585010666673579, + "loss": 0.0182, "step": 106730 }, { - "epoch": 0.54, - "learning_rate": 0.0002192224447684538, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002584971784509864, + "loss": 0.0182, "step": 106740 }, { - "epoch": 0.54, - "learning_rate": 0.00021921487707543977, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.0002584932902346149, + "loss": 0.0187, "step": 106750 }, { - "epoch": 0.54, - "learning_rate": 0.00021920730938242578, - "loss": 0.0155, + "epoch": 0.28, + "learning_rate": 0.0002584894020182435, + "loss": 0.0228, "step": 106760 }, { - "epoch": 0.54, - "learning_rate": 0.00021919974168941176, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.000258485513801872, + "loss": 0.026, "step": 106770 }, { - "epoch": 0.54, - "learning_rate": 0.00021919217399639775, - "loss": 0.0216, + "epoch": 0.28, + "learning_rate": 0.0002584816255855006, + "loss": 0.0246, "step": 106780 }, { - "epoch": 0.54, - "learning_rate": 0.00021918460630338375, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002584777373691291, + "loss": 0.021, "step": 106790 }, { - "epoch": 0.54, - "learning_rate": 0.00021917703861036974, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.0002584738491527576, + "loss": 0.0238, "step": 106800 }, { - "epoch": 0.54, - "learning_rate": 0.00021916947091735572, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002584699609363862, + "loss": 0.0225, "step": 106810 }, { - "epoch": 0.54, - "learning_rate": 0.00021916190322434173, - "loss": 0.0186, + "epoch": 0.28, + "learning_rate": 0.0002584660727200147, + "loss": 0.0187, "step": 106820 }, { - "epoch": 0.54, - "learning_rate": 0.0002191543355313277, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.00025846218450364326, + "loss": 0.0206, "step": 106830 }, { - "epoch": 0.54, - "learning_rate": 0.0002191467678383137, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.0002584582962872718, + "loss": 0.0227, "step": 106840 }, { - "epoch": 0.54, - "learning_rate": 0.0002191392001452997, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025845440807090034, + "loss": 0.0179, "step": 106850 }, { - "epoch": 0.54, - "learning_rate": 0.00021913163245228568, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025845051985452886, + "loss": 0.0262, "step": 106860 }, { - "epoch": 0.54, - "learning_rate": 0.00021912406475927166, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025844663163815737, + "loss": 0.0178, "step": 106870 }, { - "epoch": 0.54, - "learning_rate": 0.00021911649706625767, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002584427434217859, + "loss": 0.0258, "step": 106880 }, { - "epoch": 0.54, - "learning_rate": 0.00021910892937324365, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025843885520541445, + "loss": 0.0245, "step": 106890 }, { - "epoch": 0.54, - "learning_rate": 0.00021910136168022963, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.00025843496698904297, + "loss": 0.0285, "step": 106900 }, { - "epoch": 0.54, - "learning_rate": 0.00021909379398721564, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025843107877267154, + "loss": 0.0283, "step": 106910 }, { - "epoch": 0.54, - "learning_rate": 0.00021908622629420162, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.00025842719055630005, + "loss": 0.0239, "step": 106920 }, { - "epoch": 0.54, - "learning_rate": 0.0002190786586011876, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.0002584233023399286, + "loss": 0.0235, "step": 106930 }, { - "epoch": 0.54, - "learning_rate": 0.00021907109090817358, - "loss": 0.011, + "epoch": 0.28, + "learning_rate": 0.00025841941412355714, + "loss": 0.0221, "step": 106940 }, { - "epoch": 0.54, - "learning_rate": 0.0002190635232151596, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.00025841552590718565, + "loss": 0.0223, "step": 106950 }, { - "epoch": 0.54, - "learning_rate": 0.00021905595552214557, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.00025841163769081417, + "loss": 0.0192, "step": 106960 }, { - "epoch": 0.54, - "learning_rate": 0.00021904838782913156, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025840774947444273, + "loss": 0.0261, "step": 106970 }, { - "epoch": 0.54, - "learning_rate": 0.00021904082013611756, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.0002584038612580713, + "loss": 0.0217, "step": 106980 }, { - "epoch": 0.54, - "learning_rate": 0.00021903325244310355, - "loss": 0.0132, + "epoch": 0.28, + "learning_rate": 0.0002583999730416998, + "loss": 0.02, "step": 106990 }, { - "epoch": 0.54, - "learning_rate": 0.00021902568475008953, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025839608482532833, + "loss": 0.0276, "step": 107000 }, { - "epoch": 0.54, - "eval_cer": 0.9144886934295449, - "eval_loss": 0.010931231081485748, - "eval_runtime": 116.6714, - "eval_samples_per_second": 17.142, - "eval_steps_per_second": 4.286, + "epoch": 0.28, + "eval_cer": 0.8818300532841781, + "eval_loss": 0.01527465507388115, + "eval_runtime": 108.0078, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 107000 }, { - "epoch": 0.54, - "learning_rate": 0.00021901811705707554, - "loss": 0.0139, + "epoch": 0.28, + "learning_rate": 0.00025839219660895685, + "loss": 0.0254, "step": 107010 }, { - "epoch": 0.54, - "learning_rate": 0.00021901054936406152, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002583883083925854, + "loss": 0.0237, "step": 107020 }, { - "epoch": 0.54, - "learning_rate": 0.0002190029816710475, - "loss": 0.0108, + "epoch": 0.28, + "learning_rate": 0.00025838442017621393, + "loss": 0.022, "step": 107030 }, { - "epoch": 0.54, - "learning_rate": 0.0002189954139780335, - "loss": 0.0194, + "epoch": 0.28, + "learning_rate": 0.0002583805319598425, + "loss": 0.0197, "step": 107040 }, { - "epoch": 0.54, - "learning_rate": 0.0002189878462850195, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.000258376643743471, + "loss": 0.0205, "step": 107050 }, { - "epoch": 0.54, - "learning_rate": 0.00021898027859200547, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.0002583727555270996, + "loss": 0.0228, "step": 107060 }, { - "epoch": 0.54, - "learning_rate": 0.00021897271089899148, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.0002583688673107281, + "loss": 0.0245, "step": 107070 }, { - "epoch": 0.54, - "learning_rate": 0.00021896514320597746, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002583649790943566, + "loss": 0.0182, "step": 107080 }, { - "epoch": 0.54, - "learning_rate": 0.00021895757551296344, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.0002583610908779851, + "loss": 0.0297, "step": 107090 }, { - "epoch": 0.54, - "learning_rate": 0.00021895000781994942, - "loss": 0.0282, + "epoch": 0.28, + "learning_rate": 0.0002583572026616137, + "loss": 0.0242, "step": 107100 }, { - "epoch": 0.54, - "learning_rate": 0.00021894244012693543, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002583533144452422, + "loss": 0.0244, "step": 107110 }, { - "epoch": 0.54, - "learning_rate": 0.0002189348724339214, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002583494262288708, + "loss": 0.0221, "step": 107120 }, { - "epoch": 0.54, - "learning_rate": 0.0002189273047409074, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.0002583455380124993, + "loss": 0.0231, "step": 107130 }, { - "epoch": 0.54, - "learning_rate": 0.0002189197370478934, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025834164979612786, + "loss": 0.0224, "step": 107140 }, { - "epoch": 0.54, - "learning_rate": 0.00021891216935487938, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.0002583377615797564, + "loss": 0.0194, "step": 107150 }, { - "epoch": 0.54, - "learning_rate": 0.00021890460166186537, - "loss": 0.0209, + "epoch": 0.28, + "learning_rate": 0.0002583338733633849, + "loss": 0.0175, "step": 107160 }, { - "epoch": 0.54, - "learning_rate": 0.00021889703396885137, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002583299851470134, + "loss": 0.0215, "step": 107170 }, { - "epoch": 0.54, - "learning_rate": 0.00021888946627583736, - "loss": 0.0118, + "epoch": 0.28, + "learning_rate": 0.00025832609693064197, + "loss": 0.0264, "step": 107180 }, { - "epoch": 0.54, - "learning_rate": 0.00021888189858282334, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.00025832220871427054, + "loss": 0.0214, "step": 107190 }, { - "epoch": 0.54, - "learning_rate": 0.00021887433088980935, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025831832049789906, + "loss": 0.022, "step": 107200 }, { - "epoch": 0.54, - "learning_rate": 0.00021886676319679533, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.00025831443228152757, + "loss": 0.0236, "step": 107210 }, { - "epoch": 0.54, - "learning_rate": 0.0002188591955037813, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.0002583105440651561, + "loss": 0.0234, "step": 107220 }, { - "epoch": 0.54, - "learning_rate": 0.00021885162781076732, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.00025830665584878465, + "loss": 0.0257, "step": 107230 }, { - "epoch": 0.54, - "learning_rate": 0.0002188440601177533, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.00025830276763241317, + "loss": 0.0184, "step": 107240 }, { - "epoch": 0.54, - "learning_rate": 0.00021883649242473928, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025829887941604174, + "loss": 0.0213, "step": 107250 }, { - "epoch": 0.54, - "learning_rate": 0.00021882892473172526, - "loss": 0.0155, + "epoch": 0.28, + "learning_rate": 0.00025829499119967025, + "loss": 0.0219, "step": 107260 }, { - "epoch": 0.54, - "learning_rate": 0.00021882135703871127, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.0002582911029832988, + "loss": 0.0222, "step": 107270 }, { - "epoch": 0.54, - "learning_rate": 0.00021881378934569725, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.00025828721476692733, + "loss": 0.0227, "step": 107280 }, { - "epoch": 0.54, - "learning_rate": 0.00021880622165268323, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025828332655055585, + "loss": 0.0175, "step": 107290 }, { - "epoch": 0.54, - "learning_rate": 0.00021879865395966924, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025827943833418436, + "loss": 0.0207, "step": 107300 }, { - "epoch": 0.54, - "learning_rate": 0.00021879108626665522, - "loss": 0.0117, + "epoch": 0.28, + "learning_rate": 0.00025827555011781293, + "loss": 0.023, "step": 107310 }, { - "epoch": 0.54, - "learning_rate": 0.0002187835185736412, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.00025827166190144145, + "loss": 0.0207, "step": 107320 }, { - "epoch": 0.54, - "learning_rate": 0.0002187759508806272, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.00025826777368507, + "loss": 0.0236, "step": 107330 }, { - "epoch": 0.54, - "learning_rate": 0.0002187683831876132, - "loss": 0.0203, + "epoch": 0.28, + "learning_rate": 0.00025826388546869853, + "loss": 0.0219, "step": 107340 }, { - "epoch": 0.54, - "learning_rate": 0.00021876081549459918, - "loss": 0.014, + "epoch": 0.28, + "learning_rate": 0.0002582599972523271, + "loss": 0.0228, "step": 107350 }, { - "epoch": 0.54, - "learning_rate": 0.00021875324780158518, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.0002582561090359556, + "loss": 0.0209, "step": 107360 }, { - "epoch": 0.54, - "learning_rate": 0.00021874568010857117, - "loss": 0.0205, + "epoch": 0.28, + "learning_rate": 0.00025825222081958413, + "loss": 0.0197, "step": 107370 }, { - "epoch": 0.54, - "learning_rate": 0.00021873811241555715, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002582483326032127, + "loss": 0.027, "step": 107380 }, { - "epoch": 0.54, - "learning_rate": 0.00021873054472254316, - "loss": 0.0134, + "epoch": 0.28, + "learning_rate": 0.0002582444443868412, + "loss": 0.0255, "step": 107390 }, { - "epoch": 0.54, - "learning_rate": 0.00021872297702952914, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002582405561704698, + "loss": 0.0193, "step": 107400 }, { - "epoch": 0.54, - "learning_rate": 0.00021871540933651512, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002582366679540983, + "loss": 0.0231, "step": 107410 }, { - "epoch": 0.54, - "learning_rate": 0.00021870784164350113, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002582327797377268, + "loss": 0.02, "step": 107420 }, { - "epoch": 0.54, - "learning_rate": 0.0002187002739504871, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002582288915213554, + "loss": 0.0211, "step": 107430 }, { - "epoch": 0.54, - "learning_rate": 0.0002186927062574731, - "loss": 0.0188, + "epoch": 0.28, + "learning_rate": 0.0002582250033049839, + "loss": 0.0234, "step": 107440 }, { - "epoch": 0.54, - "learning_rate": 0.00021868513856445907, - "loss": 0.0185, + "epoch": 0.28, + "learning_rate": 0.0002582211150886124, + "loss": 0.0261, "step": 107450 }, { - "epoch": 0.54, - "learning_rate": 0.00021867757087144508, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.000258217226872241, + "loss": 0.0282, "step": 107460 }, { - "epoch": 0.54, - "learning_rate": 0.00021867000317843103, - "loss": 0.0124, + "epoch": 0.28, + "learning_rate": 0.0002582133386558695, + "loss": 0.0224, "step": 107470 }, { - "epoch": 0.54, - "learning_rate": 0.00021866243548541702, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.00025820945043949806, + "loss": 0.0216, "step": 107480 }, { - "epoch": 0.54, - "learning_rate": 0.000218654867792403, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.0002582055622231266, + "loss": 0.0215, "step": 107490 }, { - "epoch": 0.54, - "learning_rate": 0.000218647300099389, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002582016740067551, + "loss": 0.0206, "step": 107500 }, { - "epoch": 0.54, - "learning_rate": 0.000218639732406375, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.0002581977857903836, + "loss": 0.018, "step": 107510 }, { - "epoch": 0.54, - "learning_rate": 0.00021863216471336097, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025819389757401217, + "loss": 0.0195, "step": 107520 }, { - "epoch": 0.54, - "learning_rate": 0.00021862459702034698, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.00025819000935764074, + "loss": 0.0236, "step": 107530 }, { - "epoch": 0.54, - "learning_rate": 0.00021861702932733296, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025818612114126925, + "loss": 0.0307, "step": 107540 }, { - "epoch": 0.54, - "learning_rate": 0.00021860946163431894, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025818223292489777, + "loss": 0.0197, "step": 107550 }, { - "epoch": 0.54, - "learning_rate": 0.00021860189394130495, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.00025817834470852634, + "loss": 0.0247, "step": 107560 }, { - "epoch": 0.54, - "learning_rate": 0.00021859432624829093, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.00025817445649215485, + "loss": 0.0217, "step": 107570 }, { - "epoch": 0.54, - "learning_rate": 0.0002185867585552769, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025817056827578337, + "loss": 0.0279, "step": 107580 }, { - "epoch": 0.54, - "learning_rate": 0.00021857919086226292, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025816668005941194, + "loss": 0.021, "step": 107590 }, { - "epoch": 0.54, - "learning_rate": 0.0002185716231692489, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.00025816279184304045, + "loss": 0.0283, "step": 107600 }, { - "epoch": 0.54, - "learning_rate": 0.00021856405547623488, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.000258158903626669, + "loss": 0.0193, "step": 107610 }, { - "epoch": 0.54, - "learning_rate": 0.0002185564877832209, - "loss": 0.0119, + "epoch": 0.28, + "learning_rate": 0.00025815501541029753, + "loss": 0.023, "step": 107620 }, { - "epoch": 0.54, - "learning_rate": 0.00021854892009020687, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025815112719392605, + "loss": 0.0198, "step": 107630 }, { - "epoch": 0.54, - "learning_rate": 0.00021854135239719285, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.0002581472389775546, + "loss": 0.0207, "step": 107640 }, { - "epoch": 0.54, - "learning_rate": 0.00021853378470417884, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025814335076118313, + "loss": 0.0219, "step": 107650 }, { - "epoch": 0.54, - "learning_rate": 0.00021852621701116484, - "loss": 0.0188, + "epoch": 0.28, + "learning_rate": 0.00025813946254481165, + "loss": 0.0187, "step": 107660 }, { - "epoch": 0.54, - "learning_rate": 0.00021851864931815083, - "loss": 0.0186, + "epoch": 0.28, + "learning_rate": 0.0002581355743284402, + "loss": 0.0238, "step": 107670 }, { - "epoch": 0.54, - "learning_rate": 0.0002185110816251368, - "loss": 0.0114, + "epoch": 0.28, + "learning_rate": 0.00025813168611206873, + "loss": 0.0191, "step": 107680 }, { - "epoch": 0.54, - "learning_rate": 0.00021850351393212282, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002581277978956973, + "loss": 0.0215, "step": 107690 }, { - "epoch": 0.54, - "learning_rate": 0.0002184959462391088, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.0002581239096793258, + "loss": 0.0268, "step": 107700 }, { - "epoch": 0.54, - "learning_rate": 0.00021848837854609478, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.0002581200214629543, + "loss": 0.0232, "step": 107710 }, { - "epoch": 0.54, - "learning_rate": 0.0002184808108530808, - "loss": 0.0178, + "epoch": 0.28, + "learning_rate": 0.00025811613324658284, + "loss": 0.0224, "step": 107720 }, { - "epoch": 0.54, - "learning_rate": 0.00021847324316006677, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002581122450302114, + "loss": 0.0255, "step": 107730 }, { - "epoch": 0.54, - "learning_rate": 0.00021846567546705275, - "loss": 0.0134, + "epoch": 0.28, + "learning_rate": 0.00025810835681384, + "loss": 0.0223, "step": 107740 }, { - "epoch": 0.54, - "learning_rate": 0.00021845810777403876, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002581044685974685, + "loss": 0.024, "step": 107750 }, { - "epoch": 0.54, - "learning_rate": 0.00021845054008102474, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.000258100580381097, + "loss": 0.0188, "step": 107760 }, { - "epoch": 0.54, - "learning_rate": 0.00021844297238801072, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.0002580966921647256, + "loss": 0.0217, "step": 107770 }, { - "epoch": 0.54, - "learning_rate": 0.00021843540469499673, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.0002580928039483541, + "loss": 0.0216, "step": 107780 }, { - "epoch": 0.54, - "learning_rate": 0.0002184278370019827, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002580889157319826, + "loss": 0.0179, "step": 107790 }, { - "epoch": 0.54, - "learning_rate": 0.0002184202693089687, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002580850275156112, + "loss": 0.0261, "step": 107800 }, { - "epoch": 0.54, - "learning_rate": 0.0002184127016159547, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002580811392992397, + "loss": 0.0266, "step": 107810 }, { - "epoch": 0.54, - "learning_rate": 0.00021840513392294068, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025807725108286826, + "loss": 0.0195, "step": 107820 }, { - "epoch": 0.54, - "learning_rate": 0.00021839756622992666, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025807336286649677, + "loss": 0.0209, "step": 107830 }, { - "epoch": 0.54, - "learning_rate": 0.00021838999853691265, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002580694746501253, + "loss": 0.026, "step": 107840 }, { - "epoch": 0.54, - "learning_rate": 0.00021838243084389865, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025806558643375386, + "loss": 0.0256, "step": 107850 }, { - "epoch": 0.54, - "learning_rate": 0.00021837486315088464, - "loss": 0.0123, + "epoch": 0.28, + "learning_rate": 0.00025806169821738237, + "loss": 0.0209, "step": 107860 }, { - "epoch": 0.54, - "learning_rate": 0.00021836729545787062, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.0002580578100010109, + "loss": 0.0206, "step": 107870 }, { - "epoch": 0.54, - "learning_rate": 0.00021835972776485663, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.00025805392178463945, + "loss": 0.0207, "step": 107880 }, { - "epoch": 0.54, - "learning_rate": 0.0002183521600718426, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.000258050033568268, + "loss": 0.0201, "step": 107890 }, { - "epoch": 0.54, - "learning_rate": 0.0002183445923788286, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025804614535189654, + "loss": 0.0208, "step": 107900 }, { - "epoch": 0.54, - "learning_rate": 0.0002183370246858146, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025804225713552505, + "loss": 0.0212, "step": 107910 }, { - "epoch": 0.54, - "learning_rate": 0.00021832945699280058, - "loss": 0.0183, + "epoch": 0.28, + "learning_rate": 0.00025803836891915357, + "loss": 0.0233, "step": 107920 }, { - "epoch": 0.54, - "learning_rate": 0.00021832188929978656, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.00025803448070278213, + "loss": 0.0252, "step": 107930 }, { - "epoch": 0.54, - "learning_rate": 0.00021831432160677257, - "loss": 0.0179, + "epoch": 0.28, + "learning_rate": 0.00025803059248641065, + "loss": 0.022, "step": 107940 }, { - "epoch": 0.54, - "learning_rate": 0.00021830675391375855, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002580267042700392, + "loss": 0.0214, "step": 107950 }, { - "epoch": 0.54, - "learning_rate": 0.00021829918622074453, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025802281605366773, + "loss": 0.0284, "step": 107960 }, { - "epoch": 0.54, - "learning_rate": 0.00021829161852773054, - "loss": 0.0139, + "epoch": 0.28, + "learning_rate": 0.00025801892783729625, + "loss": 0.0172, "step": 107970 }, { - "epoch": 0.54, - "learning_rate": 0.00021828405083471652, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.0002580150396209248, + "loss": 0.0183, "step": 107980 }, { - "epoch": 0.54, - "learning_rate": 0.0002182764831417025, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.00025801115140455333, + "loss": 0.0229, "step": 107990 }, { - "epoch": 0.54, - "learning_rate": 0.00021826891544868848, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025800726318818184, + "loss": 0.0215, "step": 108000 }, { - "epoch": 0.54, - "eval_cer": 0.9144886934295449, - "eval_loss": 0.011288284324109554, - "eval_runtime": 116.6804, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.28, + "eval_cer": 0.8817796663545476, + "eval_loss": 0.015666382387280464, + "eval_runtime": 108.1495, + "eval_samples_per_second": 18.493, + "eval_steps_per_second": 4.623, "step": 108000 }, { - "epoch": 0.54, - "learning_rate": 0.0002182613477556745, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.0002580033749718104, + "loss": 0.023, "step": 108010 }, { - "epoch": 0.54, - "learning_rate": 0.00021825378006266047, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.000257999486755439, + "loss": 0.0263, "step": 108020 }, { - "epoch": 0.55, - "learning_rate": 0.00021824621236964646, - "loss": 0.0117, + "epoch": 0.28, + "learning_rate": 0.0002579955985390675, + "loss": 0.0264, "step": 108030 }, { - "epoch": 0.55, - "learning_rate": 0.00021823864467663246, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.000257991710322696, + "loss": 0.0242, "step": 108040 }, { - "epoch": 0.55, - "learning_rate": 0.00021823107698361845, - "loss": 0.0155, + "epoch": 0.28, + "learning_rate": 0.0002579878221063245, + "loss": 0.0232, "step": 108050 }, { - "epoch": 0.55, - "learning_rate": 0.00021822350929060443, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.0002579839338899531, + "loss": 0.0198, "step": 108060 }, { - "epoch": 0.55, - "learning_rate": 0.00021821594159759044, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.0002579800456735816, + "loss": 0.0242, "step": 108070 }, { - "epoch": 0.55, - "learning_rate": 0.00021820837390457642, - "loss": 0.0119, + "epoch": 0.28, + "learning_rate": 0.0002579761574572102, + "loss": 0.0188, "step": 108080 }, { - "epoch": 0.55, - "learning_rate": 0.0002182008062115624, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002579722692408387, + "loss": 0.0236, "step": 108090 }, { - "epoch": 0.55, - "learning_rate": 0.0002181932385185484, - "loss": 0.0184, + "epoch": 0.28, + "learning_rate": 0.00025796838102446726, + "loss": 0.0189, "step": 108100 }, { - "epoch": 0.55, - "learning_rate": 0.0002181856708255344, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.0002579644928080958, + "loss": 0.0216, "step": 108110 }, { - "epoch": 0.55, - "learning_rate": 0.00021817810313252037, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.0002579606045917243, + "loss": 0.0237, "step": 108120 }, { - "epoch": 0.55, - "learning_rate": 0.00021817053543950638, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.0002579567163753528, + "loss": 0.0222, "step": 108130 }, { - "epoch": 0.55, - "learning_rate": 0.00021816296774649236, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002579528281589814, + "loss": 0.0203, "step": 108140 }, { - "epoch": 0.55, - "learning_rate": 0.00021815540005347834, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.0002579489399426099, + "loss": 0.0217, "step": 108150 }, { - "epoch": 0.55, - "learning_rate": 0.00021814783236046432, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.00025794505172623846, + "loss": 0.0234, "step": 108160 }, { - "epoch": 0.55, - "learning_rate": 0.00021814026466745033, - "loss": 0.0132, + "epoch": 0.28, + "learning_rate": 0.00025794116350986697, + "loss": 0.0203, "step": 108170 }, { - "epoch": 0.55, - "learning_rate": 0.0002181326969744363, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.0002579372752934955, + "loss": 0.0218, "step": 108180 }, { - "epoch": 0.55, - "learning_rate": 0.0002181251292814223, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.00025793338707712405, + "loss": 0.0195, "step": 108190 }, { - "epoch": 0.55, - "learning_rate": 0.0002181175615884083, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025792949886075257, + "loss": 0.0189, "step": 108200 }, { - "epoch": 0.55, - "learning_rate": 0.00021810999389539428, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002579256106443811, + "loss": 0.0199, "step": 108210 }, { - "epoch": 0.55, - "learning_rate": 0.00021810242620238027, - "loss": 0.0171, + "epoch": 0.28, + "learning_rate": 0.00025792172242800965, + "loss": 0.0198, "step": 108220 }, { - "epoch": 0.55, - "learning_rate": 0.00021809485850936627, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002579178342116382, + "loss": 0.0193, "step": 108230 }, { - "epoch": 0.55, - "learning_rate": 0.00021808729081635226, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025791394599526674, + "loss": 0.02, "step": 108240 }, { - "epoch": 0.55, - "learning_rate": 0.00021807972312333824, - "loss": 0.0192, + "epoch": 0.28, + "learning_rate": 0.00025791005777889525, + "loss": 0.0224, "step": 108250 }, { - "epoch": 0.55, - "learning_rate": 0.00021807215543032425, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.00025790616956252376, + "loss": 0.0213, "step": 108260 }, { - "epoch": 0.55, - "learning_rate": 0.00021806458773731023, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.00025790228134615233, + "loss": 0.0217, "step": 108270 }, { - "epoch": 0.55, - "learning_rate": 0.0002180570200442962, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.00025789839312978085, + "loss": 0.0221, "step": 108280 }, { - "epoch": 0.55, - "learning_rate": 0.00021804945235128222, - "loss": 0.0175, + "epoch": 0.28, + "learning_rate": 0.0002578945049134094, + "loss": 0.0254, "step": 108290 }, { - "epoch": 0.55, - "learning_rate": 0.0002180418846582682, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.00025789061669703793, + "loss": 0.0167, "step": 108300 }, { - "epoch": 0.55, - "learning_rate": 0.00021803431696525418, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002578867284806665, + "loss": 0.0195, "step": 108310 }, { - "epoch": 0.55, - "learning_rate": 0.0002180267492722402, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.000257882840264295, + "loss": 0.0226, "step": 108320 }, { - "epoch": 0.55, - "learning_rate": 0.00021801918157922617, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.00025787895204792353, + "loss": 0.0268, "step": 108330 }, { - "epoch": 0.55, - "learning_rate": 0.00021801161388621215, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025787506383155204, + "loss": 0.0205, "step": 108340 }, { - "epoch": 0.55, - "learning_rate": 0.00021800404619319813, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.0002578711756151806, + "loss": 0.0256, "step": 108350 }, { - "epoch": 0.55, - "learning_rate": 0.00021799647850018414, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002578672873988091, + "loss": 0.0284, "step": 108360 }, { - "epoch": 0.55, - "learning_rate": 0.00021798891080717012, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.0002578633991824377, + "loss": 0.0218, "step": 108370 }, { - "epoch": 0.55, - "learning_rate": 0.0002179813431141561, - "loss": 0.0173, + "epoch": 0.28, + "learning_rate": 0.0002578595109660662, + "loss": 0.0226, "step": 108380 }, { - "epoch": 0.55, - "learning_rate": 0.0002179737754211421, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.0002578556227496948, + "loss": 0.0244, "step": 108390 }, { - "epoch": 0.55, - "learning_rate": 0.0002179662077281281, - "loss": 0.0167, + "epoch": 0.28, + "learning_rate": 0.0002578517345333233, + "loss": 0.0202, "step": 108400 }, { - "epoch": 0.55, - "learning_rate": 0.00021795864003511408, - "loss": 0.0154, + "epoch": 0.28, + "learning_rate": 0.0002578478463169518, + "loss": 0.0227, "step": 108410 }, { - "epoch": 0.55, - "learning_rate": 0.00021795107234210008, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002578439581005804, + "loss": 0.0245, "step": 108420 }, { - "epoch": 0.55, - "learning_rate": 0.00021794350464908607, - "loss": 0.0185, + "epoch": 0.28, + "learning_rate": 0.0002578400698842089, + "loss": 0.0199, "step": 108430 }, { - "epoch": 0.55, - "learning_rate": 0.00021793593695607205, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.00025783618166783746, + "loss": 0.0197, "step": 108440 }, { - "epoch": 0.55, - "learning_rate": 0.00021792836926305806, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.000257832293451466, + "loss": 0.0235, "step": 108450 }, { - "epoch": 0.55, - "learning_rate": 0.00021792080157004404, - "loss": 0.016, + "epoch": 0.28, + "learning_rate": 0.0002578284052350945, + "loss": 0.0236, "step": 108460 }, { - "epoch": 0.55, - "learning_rate": 0.00021791323387703002, - "loss": 0.0127, + "epoch": 0.28, + "learning_rate": 0.000257824517018723, + "loss": 0.0243, "step": 108470 }, { - "epoch": 0.55, - "learning_rate": 0.00021790566618401603, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.00025782062880235157, + "loss": 0.0202, "step": 108480 }, { - "epoch": 0.55, - "learning_rate": 0.000217898098491002, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.0002578167405859801, + "loss": 0.0254, "step": 108490 }, { - "epoch": 0.55, - "learning_rate": 0.000217890530797988, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025781285236960866, + "loss": 0.0234, "step": 108500 }, { - "epoch": 0.55, - "learning_rate": 0.00021788296310497397, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.00025780896415323717, + "loss": 0.0199, "step": 108510 }, { - "epoch": 0.55, - "learning_rate": 0.00021787539541195998, - "loss": 0.0122, + "epoch": 0.28, + "learning_rate": 0.00025780507593686574, + "loss": 0.0249, "step": 108520 }, { - "epoch": 0.55, - "learning_rate": 0.00021786782771894596, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.00025780118772049425, + "loss": 0.0236, "step": 108530 }, { - "epoch": 0.55, - "learning_rate": 0.00021786026002593194, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025779729950412277, + "loss": 0.0274, "step": 108540 }, { - "epoch": 0.55, - "learning_rate": 0.00021785269233291795, - "loss": 0.0116, + "epoch": 0.28, + "learning_rate": 0.0002577934112877513, + "loss": 0.0202, "step": 108550 }, { - "epoch": 0.55, - "learning_rate": 0.00021784512463990393, - "loss": 0.0165, + "epoch": 0.28, + "learning_rate": 0.00025778952307137985, + "loss": 0.0241, "step": 108560 }, { - "epoch": 0.55, - "learning_rate": 0.00021783755694688991, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.0002577856348550084, + "loss": 0.0239, "step": 108570 }, { - "epoch": 0.55, - "learning_rate": 0.00021782998925387592, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.00025778174663863693, + "loss": 0.0218, "step": 108580 }, { - "epoch": 0.55, - "learning_rate": 0.0002178224215608619, - "loss": 0.0196, + "epoch": 0.28, + "learning_rate": 0.00025777785842226545, + "loss": 0.0177, "step": 108590 }, { - "epoch": 0.55, - "learning_rate": 0.00021781485386784789, - "loss": 0.012, + "epoch": 0.28, + "learning_rate": 0.000257773970205894, + "loss": 0.022, "step": 108600 }, { - "epoch": 0.55, - "learning_rate": 0.0002178072861748339, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.00025777008198952253, + "loss": 0.0217, "step": 108610 }, { - "epoch": 0.55, - "learning_rate": 0.00021779971848181988, - "loss": 0.0168, + "epoch": 0.28, + "learning_rate": 0.00025776619377315105, + "loss": 0.0259, "step": 108620 }, { - "epoch": 0.55, - "learning_rate": 0.00021779215078880586, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002577623055567796, + "loss": 0.0246, "step": 108630 }, { - "epoch": 0.55, - "learning_rate": 0.00021778458309579187, - "loss": 0.014, + "epoch": 0.28, + "learning_rate": 0.00025775841734040813, + "loss": 0.0237, "step": 108640 }, { - "epoch": 0.55, - "learning_rate": 0.00021777701540277785, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.0002577545291240367, + "loss": 0.0241, "step": 108650 }, { - "epoch": 0.55, - "learning_rate": 0.00021776944770976383, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002577506409076652, + "loss": 0.0229, "step": 108660 }, { - "epoch": 0.55, - "learning_rate": 0.0002177618800167498, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.00025774675269129373, + "loss": 0.0248, "step": 108670 }, { - "epoch": 0.55, - "learning_rate": 0.00021775431232373582, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025774286447492224, + "loss": 0.0264, "step": 108680 }, { - "epoch": 0.55, - "learning_rate": 0.0002177467446307218, - "loss": 0.0203, + "epoch": 0.28, + "learning_rate": 0.0002577389762585508, + "loss": 0.0248, "step": 108690 }, { - "epoch": 0.55, - "learning_rate": 0.00021773917693770778, - "loss": 0.02, + "epoch": 0.28, + "learning_rate": 0.0002577350880421793, + "loss": 0.0237, "step": 108700 }, { - "epoch": 0.55, - "learning_rate": 0.0002177316092446938, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002577311998258079, + "loss": 0.0256, "step": 108710 }, { - "epoch": 0.55, - "learning_rate": 0.00021772404155167977, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.0002577273116094364, + "loss": 0.0216, "step": 108720 }, { - "epoch": 0.55, - "learning_rate": 0.00021771647385866573, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.000257723423393065, + "loss": 0.0202, "step": 108730 }, { - "epoch": 0.55, - "learning_rate": 0.0002177089061656517, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.0002577195351766935, + "loss": 0.0274, "step": 108740 }, { - "epoch": 0.55, - "learning_rate": 0.00021770133847263772, - "loss": 0.0164, + "epoch": 0.28, + "learning_rate": 0.000257715646960322, + "loss": 0.0233, "step": 108750 }, { - "epoch": 0.55, - "learning_rate": 0.0002176937707796237, - "loss": 0.0166, + "epoch": 0.28, + "learning_rate": 0.0002577117587439505, + "loss": 0.0202, "step": 108760 }, { - "epoch": 0.55, - "learning_rate": 0.00021768620308660968, - "loss": 0.0131, + "epoch": 0.28, + "learning_rate": 0.0002577078705275791, + "loss": 0.021, "step": 108770 }, { - "epoch": 0.55, - "learning_rate": 0.0002176786353935957, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025770398231120766, + "loss": 0.0233, "step": 108780 }, { - "epoch": 0.55, - "learning_rate": 0.00021767106770058167, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002577000940948362, + "loss": 0.0219, "step": 108790 }, { - "epoch": 0.55, - "learning_rate": 0.00021766350000756765, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.0002576962058784647, + "loss": 0.019, "step": 108800 }, { - "epoch": 0.55, - "learning_rate": 0.00021765593231455366, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.00025769231766209326, + "loss": 0.0215, "step": 108810 }, { - "epoch": 0.55, - "learning_rate": 0.00021764836462153964, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.00025768842944572177, + "loss": 0.0254, "step": 108820 }, { - "epoch": 0.55, - "learning_rate": 0.00021764079692852562, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.0002576845412293503, + "loss": 0.0184, "step": 108830 }, { - "epoch": 0.55, - "learning_rate": 0.00021763322923551163, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.00025768065301297885, + "loss": 0.0195, "step": 108840 }, { - "epoch": 0.55, - "learning_rate": 0.0002176256615424976, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025767676479660737, + "loss": 0.0212, "step": 108850 }, { - "epoch": 0.55, - "learning_rate": 0.0002176180938494836, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.00025767287658023594, + "loss": 0.022, "step": 108860 }, { - "epoch": 0.55, - "learning_rate": 0.0002176105261564696, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025766898836386445, + "loss": 0.0202, "step": 108870 }, { - "epoch": 0.55, - "learning_rate": 0.00021760295846345558, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025766510014749297, + "loss": 0.0198, "step": 108880 }, { - "epoch": 0.55, - "learning_rate": 0.00021759539077044156, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025766121193112154, + "loss": 0.0236, "step": 108890 }, { - "epoch": 0.55, - "learning_rate": 0.00021758782307742755, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025765732371475005, + "loss": 0.0221, "step": 108900 }, { - "epoch": 0.55, - "learning_rate": 0.00021758025538441355, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025765343549837856, + "loss": 0.0211, "step": 108910 }, { - "epoch": 0.55, - "learning_rate": 0.00021757268769139954, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.00025764954728200713, + "loss": 0.0228, "step": 108920 }, { - "epoch": 0.55, - "learning_rate": 0.00021756511999838552, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025764565906563565, + "loss": 0.0187, "step": 108930 }, { - "epoch": 0.55, - "learning_rate": 0.00021755755230537153, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.0002576417708492642, + "loss": 0.0232, "step": 108940 }, { - "epoch": 0.55, - "learning_rate": 0.0002175499846123575, - "loss": 0.0129, + "epoch": 0.28, + "learning_rate": 0.00025763788263289273, + "loss": 0.0217, "step": 108950 }, { - "epoch": 0.55, - "learning_rate": 0.0002175424169193435, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.00025763399441652125, + "loss": 0.018, "step": 108960 }, { - "epoch": 0.55, - "learning_rate": 0.0002175348492263295, - "loss": 0.0119, + "epoch": 0.28, + "learning_rate": 0.0002576301062001498, + "loss": 0.0197, "step": 108970 }, { - "epoch": 0.55, - "learning_rate": 0.00021752728153331548, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025762621798377833, + "loss": 0.0196, "step": 108980 }, { - "epoch": 0.55, - "learning_rate": 0.00021751971384030146, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002576223297674069, + "loss": 0.0274, "step": 108990 }, { - "epoch": 0.55, - "learning_rate": 0.00021751214614728747, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002576184415510354, + "loss": 0.0261, "step": 109000 }, { - "epoch": 0.55, - "eval_cer": 0.9145003381830497, - "eval_loss": 0.011132709681987762, - "eval_runtime": 116.5842, - "eval_samples_per_second": 17.155, - "eval_steps_per_second": 4.289, + "epoch": 0.28, + "eval_cer": 0.8818188561887047, + "eval_loss": 0.015223901718854904, + "eval_runtime": 107.9791, + "eval_samples_per_second": 18.522, + "eval_steps_per_second": 4.631, "step": 109000 }, { - "epoch": 0.55, - "learning_rate": 0.00021750457845427345, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.0002576145533346639, + "loss": 0.0208, "step": 109010 }, { - "epoch": 0.55, - "learning_rate": 0.00021749701076125943, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002576106651182925, + "loss": 0.0222, "step": 109020 }, { - "epoch": 0.55, - "learning_rate": 0.00021748944306824544, - "loss": 0.0132, + "epoch": 0.28, + "learning_rate": 0.000257606776901921, + "loss": 0.0232, "step": 109030 }, { - "epoch": 0.55, - "learning_rate": 0.00021748187537523142, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.0002576028886855495, + "loss": 0.0207, "step": 109040 }, { - "epoch": 0.55, - "learning_rate": 0.0002174743076822174, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.0002575990004691781, + "loss": 0.0246, "step": 109050 }, { - "epoch": 0.55, - "learning_rate": 0.00021746673998920338, - "loss": 0.0134, + "epoch": 0.28, + "learning_rate": 0.0002575951122528066, + "loss": 0.0203, "step": 109060 }, { - "epoch": 0.55, - "learning_rate": 0.0002174591722961894, - "loss": 0.0126, + "epoch": 0.28, + "learning_rate": 0.0002575912240364352, + "loss": 0.0244, "step": 109070 }, { - "epoch": 0.55, - "learning_rate": 0.00021745160460317537, - "loss": 0.0146, - "step": 109080 + "epoch": 0.28, + "learning_rate": 0.0002575873358200637, + "loss": 0.0191, + "step": 109080 }, { - "epoch": 0.55, - "learning_rate": 0.00021744403691016136, - "loss": 0.013, + "epoch": 0.28, + "learning_rate": 0.0002575834476036922, + "loss": 0.0215, "step": 109090 }, { - "epoch": 0.55, - "learning_rate": 0.00021743646921714736, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.0002575795593873208, + "loss": 0.0185, "step": 109100 }, { - "epoch": 0.55, - "learning_rate": 0.00021742890152413335, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.0002575756711709493, + "loss": 0.0202, "step": 109110 }, { - "epoch": 0.55, - "learning_rate": 0.00021742133383111933, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025757178295457786, + "loss": 0.0197, "step": 109120 }, { - "epoch": 0.55, - "learning_rate": 0.00021741376613810534, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.00025756789473820637, + "loss": 0.0281, "step": 109130 }, { - "epoch": 0.55, - "learning_rate": 0.00021740619844509132, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.00025756400652183494, + "loss": 0.0189, "step": 109140 }, { - "epoch": 0.55, - "learning_rate": 0.0002173986307520773, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.00025756011830546346, + "loss": 0.0202, "step": 109150 }, { - "epoch": 0.55, - "learning_rate": 0.0002173910630590633, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.00025755623008909197, + "loss": 0.0213, "step": 109160 }, { - "epoch": 0.55, - "learning_rate": 0.0002173834953660493, - "loss": 0.0227, + "epoch": 0.28, + "learning_rate": 0.0002575523418727205, + "loss": 0.021, "step": 109170 }, { - "epoch": 0.55, - "learning_rate": 0.00021737592767303527, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.00025754845365634905, + "loss": 0.0239, "step": 109180 }, { - "epoch": 0.55, - "learning_rate": 0.00021736835998002128, - "loss": 0.0136, + "epoch": 0.28, + "learning_rate": 0.00025754456543997757, + "loss": 0.0215, "step": 109190 }, { - "epoch": 0.55, - "learning_rate": 0.00021736079228700726, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025754067722360614, + "loss": 0.0238, "step": 109200 }, { - "epoch": 0.55, - "learning_rate": 0.00021735322459399324, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025753678900723465, + "loss": 0.0175, "step": 109210 }, { - "epoch": 0.55, - "learning_rate": 0.00021734565690097925, - "loss": 0.0196, + "epoch": 0.28, + "learning_rate": 0.00025753290079086317, + "loss": 0.0167, "step": 109220 }, { - "epoch": 0.55, - "learning_rate": 0.00021733808920796523, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025752901257449173, + "loss": 0.0215, "step": 109230 }, { - "epoch": 0.55, - "learning_rate": 0.0002173305215149512, - "loss": 0.0141, + "epoch": 0.28, + "learning_rate": 0.00025752512435812025, + "loss": 0.0168, "step": 109240 }, { - "epoch": 0.55, - "learning_rate": 0.0002173229538219372, - "loss": 0.0138, + "epoch": 0.28, + "learning_rate": 0.00025752123614174876, + "loss": 0.0192, "step": 109250 }, { - "epoch": 0.55, - "learning_rate": 0.0002173153861289232, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025751734792537733, + "loss": 0.0218, "step": 109260 }, { - "epoch": 0.55, - "learning_rate": 0.00021730781843590918, - "loss": 0.0148, + "epoch": 0.28, + "learning_rate": 0.0002575134597090059, + "loss": 0.0212, "step": 109270 }, { - "epoch": 0.55, - "learning_rate": 0.00021730025074289517, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.0002575095714926344, + "loss": 0.0231, "step": 109280 }, { - "epoch": 0.55, - "learning_rate": 0.00021729268304988117, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.00025750568327626293, + "loss": 0.0226, "step": 109290 }, { - "epoch": 0.55, - "learning_rate": 0.00021728511535686716, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025750179505989144, + "loss": 0.0241, "step": 109300 }, { - "epoch": 0.55, - "learning_rate": 0.00021727754766385314, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025749790684352, + "loss": 0.0224, "step": 109310 }, { - "epoch": 0.55, - "learning_rate": 0.00021726997997083915, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.00025749401862714853, + "loss": 0.0214, "step": 109320 }, { - "epoch": 0.55, - "learning_rate": 0.00021726241227782513, - "loss": 0.0135, + "epoch": 0.28, + "learning_rate": 0.0002574901304107771, + "loss": 0.0227, "step": 109330 }, { - "epoch": 0.55, - "learning_rate": 0.0002172548445848111, - "loss": 0.0156, + "epoch": 0.28, + "learning_rate": 0.0002574862421944056, + "loss": 0.0185, "step": 109340 }, { - "epoch": 0.55, - "learning_rate": 0.00021724727689179712, - "loss": 0.0176, + "epoch": 0.28, + "learning_rate": 0.0002574823539780342, + "loss": 0.0197, "step": 109350 }, { - "epoch": 0.55, - "learning_rate": 0.0002172397091987831, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.0002574784657616627, + "loss": 0.0195, "step": 109360 }, { - "epoch": 0.55, - "learning_rate": 0.00021723214150576908, - "loss": 0.0128, + "epoch": 0.28, + "learning_rate": 0.0002574745775452912, + "loss": 0.0177, "step": 109370 }, { - "epoch": 0.55, - "learning_rate": 0.0002172245738127551, - "loss": 0.0181, + "epoch": 0.28, + "learning_rate": 0.0002574706893289197, + "loss": 0.0205, "step": 109380 }, { - "epoch": 0.55, - "learning_rate": 0.00021721700611974107, - "loss": 0.017, + "epoch": 0.28, + "learning_rate": 0.0002574668011125483, + "loss": 0.0208, "step": 109390 }, { - "epoch": 0.55, - "learning_rate": 0.00021720943842672705, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002574629128961768, + "loss": 0.0256, "step": 109400 }, { - "epoch": 0.55, - "learning_rate": 0.00021720187073371303, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.0002574590246798054, + "loss": 0.0169, "step": 109410 }, { - "epoch": 0.55, - "learning_rate": 0.00021719430304069904, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.0002574551364634339, + "loss": 0.0218, "step": 109420 }, { - "epoch": 0.55, - "learning_rate": 0.00021718673534768502, - "loss": 0.0212, + "epoch": 0.28, + "learning_rate": 0.0002574512482470624, + "loss": 0.0201, "step": 109430 }, { - "epoch": 0.55, - "learning_rate": 0.000217179167654671, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.000257447360030691, + "loss": 0.0205, "step": 109440 }, { - "epoch": 0.55, - "learning_rate": 0.000217171599961657, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002574434718143195, + "loss": 0.0203, "step": 109450 }, { - "epoch": 0.55, - "learning_rate": 0.000217164032268643, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.000257439583597948, + "loss": 0.0186, "step": 109460 }, { - "epoch": 0.55, - "learning_rate": 0.00021715646457562898, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.00025743569538157657, + "loss": 0.0241, "step": 109470 }, { - "epoch": 0.55, - "learning_rate": 0.00021714889688261498, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025743180716520514, + "loss": 0.0164, "step": 109480 }, { - "epoch": 0.55, - "learning_rate": 0.00021714132918960097, - "loss": 0.0137, + "epoch": 0.28, + "learning_rate": 0.00025742791894883365, + "loss": 0.019, "step": 109490 }, { - "epoch": 0.55, - "learning_rate": 0.00021713376149658695, + "epoch": 0.28, + "learning_rate": 0.00025742403073246217, "loss": 0.0174, "step": 109500 }, { - "epoch": 0.55, - "learning_rate": 0.00021712619380357296, - "loss": 0.0149, + "epoch": 0.28, + "learning_rate": 0.0002574201425160907, + "loss": 0.0209, "step": 109510 }, { - "epoch": 0.55, - "learning_rate": 0.00021711862611055894, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025741625429971925, + "loss": 0.0232, "step": 109520 }, { - "epoch": 0.55, - "learning_rate": 0.00021711105841754492, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025741236608334777, + "loss": 0.0191, "step": 109530 }, { - "epoch": 0.55, - "learning_rate": 0.00021710349072453093, - "loss": 0.0132, + "epoch": 0.28, + "learning_rate": 0.00025740847786697634, + "loss": 0.0218, "step": 109540 }, { - "epoch": 0.55, - "learning_rate": 0.0002170959230315169, - "loss": 0.0123, + "epoch": 0.28, + "learning_rate": 0.00025740458965060485, + "loss": 0.0238, "step": 109550 }, { - "epoch": 0.55, - "learning_rate": 0.0002170883553385029, - "loss": 0.0172, + "epoch": 0.28, + "learning_rate": 0.0002574007014342334, + "loss": 0.0251, "step": 109560 }, { - "epoch": 0.55, - "learning_rate": 0.00021708078764548887, - "loss": 0.0189, + "epoch": 0.28, + "learning_rate": 0.00025739681321786193, + "loss": 0.0235, "step": 109570 }, { - "epoch": 0.55, - "learning_rate": 0.00021707321995247488, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025739292500149045, + "loss": 0.0253, "step": 109580 }, { - "epoch": 0.55, - "learning_rate": 0.00021706565225946086, - "loss": 0.0143, + "epoch": 0.28, + "learning_rate": 0.00025738903678511896, + "loss": 0.0196, "step": 109590 }, { - "epoch": 0.55, - "learning_rate": 0.00021705808456644684, - "loss": 0.0121, + "epoch": 0.28, + "learning_rate": 0.00025738514856874753, + "loss": 0.0223, "step": 109600 }, { - "epoch": 0.55, - "learning_rate": 0.00021705051687343285, - "loss": 0.015, + "epoch": 0.28, + "learning_rate": 0.0002573812603523761, + "loss": 0.0206, "step": 109610 }, { - "epoch": 0.55, - "learning_rate": 0.00021704294918041883, - "loss": 0.0157, + "epoch": 0.28, + "learning_rate": 0.0002573773721360046, + "loss": 0.0238, "step": 109620 }, { - "epoch": 0.55, - "learning_rate": 0.00021703538148740481, - "loss": 0.0152, + "epoch": 0.28, + "learning_rate": 0.00025737348391963313, + "loss": 0.0256, "step": 109630 }, { - "epoch": 0.55, - "learning_rate": 0.00021702781379439082, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002573695957032617, + "loss": 0.0183, "step": 109640 }, { - "epoch": 0.55, - "learning_rate": 0.0002170202461013768, - "loss": 0.0134, + "epoch": 0.28, + "learning_rate": 0.0002573657074868902, + "loss": 0.0223, "step": 109650 }, { - "epoch": 0.55, - "learning_rate": 0.00021701267840836279, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.0002573618192705187, + "loss": 0.0202, "step": 109660 }, { - "epoch": 0.55, - "learning_rate": 0.0002170051107153488, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002573579310541473, + "loss": 0.0204, "step": 109670 }, { - "epoch": 0.55, - "learning_rate": 0.00021699754302233478, - "loss": 0.012, + "epoch": 0.28, + "learning_rate": 0.0002573540428377758, + "loss": 0.0226, "step": 109680 }, { - "epoch": 0.55, - "learning_rate": 0.00021698997532932076, - "loss": 0.0158, + "epoch": 0.28, + "learning_rate": 0.0002573501546214044, + "loss": 0.0218, "step": 109690 }, { - "epoch": 0.55, - "learning_rate": 0.00021698240763630677, - "loss": 0.0142, + "epoch": 0.28, + "learning_rate": 0.0002573462664050329, + "loss": 0.0223, "step": 109700 }, { - "epoch": 0.55, - "learning_rate": 0.00021697483994329275, - "loss": 0.0159, + "epoch": 0.28, + "learning_rate": 0.0002573423781886614, + "loss": 0.0228, "step": 109710 }, { - "epoch": 0.55, - "learning_rate": 0.00021696727225027873, - "loss": 0.0153, + "epoch": 0.28, + "learning_rate": 0.0002573384899722899, + "loss": 0.0213, "step": 109720 }, { - "epoch": 0.55, - "learning_rate": 0.0002169597045572647, - "loss": 0.0123, + "epoch": 0.28, + "learning_rate": 0.0002573346017559185, + "loss": 0.0266, "step": 109730 }, { - "epoch": 0.55, - "learning_rate": 0.00021695213686425072, - "loss": 0.0161, + "epoch": 0.28, + "learning_rate": 0.000257330713539547, + "loss": 0.0202, "step": 109740 }, { - "epoch": 0.55, - "learning_rate": 0.0002169445691712367, - "loss": 0.0119, + "epoch": 0.28, + "learning_rate": 0.0002573268253231756, + "loss": 0.0275, "step": 109750 }, { - "epoch": 0.55, - "learning_rate": 0.00021693700147822268, - "loss": 0.0182, + "epoch": 0.28, + "learning_rate": 0.0002573229371068041, + "loss": 0.025, "step": 109760 }, { - "epoch": 0.55, - "learning_rate": 0.0002169294337852087, - "loss": 0.019, + "epoch": 0.28, + "learning_rate": 0.00025731904889043266, + "loss": 0.0211, "step": 109770 }, { - "epoch": 0.55, - "learning_rate": 0.00021692186609219467, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.00025731516067406117, + "loss": 0.0222, "step": 109780 }, { - "epoch": 0.55, - "learning_rate": 0.00021691429839918065, - "loss": 0.0151, + "epoch": 0.28, + "learning_rate": 0.0002573112724576897, + "loss": 0.0186, "step": 109790 }, { - "epoch": 0.55, - "learning_rate": 0.00021690673070616666, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.0002573073842413182, + "loss": 0.0222, "step": 109800 }, { - "epoch": 0.55, - "learning_rate": 0.00021689916301315264, - "loss": 0.0112, + "epoch": 0.28, + "learning_rate": 0.00025730349602494677, + "loss": 0.0212, "step": 109810 }, { - "epoch": 0.55, - "learning_rate": 0.00021689159532013862, - "loss": 0.0145, + "epoch": 0.28, + "learning_rate": 0.00025729960780857534, + "loss": 0.0257, "step": 109820 }, { - "epoch": 0.55, - "learning_rate": 0.00021688402762712463, - "loss": 0.0114, + "epoch": 0.28, + "learning_rate": 0.00025729571959220385, + "loss": 0.0221, "step": 109830 }, { - "epoch": 0.55, - "learning_rate": 0.00021687645993411061, - "loss": 0.0134, + "epoch": 0.28, + "learning_rate": 0.00025729183137583237, + "loss": 0.0223, "step": 109840 }, { - "epoch": 0.55, - "learning_rate": 0.0002168688922410966, - "loss": 0.0146, + "epoch": 0.28, + "learning_rate": 0.00025728794315946094, + "loss": 0.0256, "step": 109850 }, { - "epoch": 0.55, - "learning_rate": 0.0002168613245480826, - "loss": 0.0147, + "epoch": 0.28, + "learning_rate": 0.00025728405494308945, + "loss": 0.0196, "step": 109860 }, { - "epoch": 0.55, - "learning_rate": 0.00021685375685506859, - "loss": 0.0115, + "epoch": 0.28, + "learning_rate": 0.00025728016672671797, + "loss": 0.0204, "step": 109870 }, { - "epoch": 0.55, - "learning_rate": 0.00021684618916205457, - "loss": 0.0162, + "epoch": 0.28, + "learning_rate": 0.00025727627851034653, + "loss": 0.0242, "step": 109880 }, { - "epoch": 0.55, - "learning_rate": 0.00021683862146904058, - "loss": 0.0133, + "epoch": 0.28, + "learning_rate": 0.00025727239029397505, + "loss": 0.0205, "step": 109890 }, { - "epoch": 0.55, - "learning_rate": 0.00021683105377602656, - "loss": 0.0174, + "epoch": 0.28, + "learning_rate": 0.0002572685020776036, + "loss": 0.0211, "step": 109900 }, { - "epoch": 0.55, - "learning_rate": 0.00021682348608301254, - "loss": 0.0163, + "epoch": 0.28, + "learning_rate": 0.00025726461386123213, + "loss": 0.0192, "step": 109910 }, { - "epoch": 0.55, - "learning_rate": 0.00021681591838999852, - "loss": 0.018, + "epoch": 0.28, + "learning_rate": 0.00025726072564486065, + "loss": 0.0177, "step": 109920 }, { - "epoch": 0.55, - "learning_rate": 0.00021680835069698453, - "loss": 0.0169, + "epoch": 0.28, + "learning_rate": 0.00025725683742848916, + "loss": 0.0231, "step": 109930 }, { - "epoch": 0.55, - "learning_rate": 0.0002168007830039705, - "loss": 0.0144, + "epoch": 0.28, + "learning_rate": 0.00025725294921211773, + "loss": 0.0218, "step": 109940 }, { - "epoch": 0.55, - "learning_rate": 0.0002167932153109565, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.00025724906099574624, + "loss": 0.0221, "step": 109950 }, { - "epoch": 0.55, - "learning_rate": 0.0002167856476179425, - "loss": 0.0112, + "epoch": 0.29, + "learning_rate": 0.0002572451727793748, + "loss": 0.0207, "step": 109960 }, { - "epoch": 0.55, - "learning_rate": 0.00021677807992492848, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.00025724128456300333, + "loss": 0.0224, "step": 109970 }, { - "epoch": 0.55, - "learning_rate": 0.00021677051223191444, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002572373963466319, + "loss": 0.0183, "step": 109980 }, { - "epoch": 0.55, - "learning_rate": 0.00021676294453890042, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002572335081302604, + "loss": 0.0168, "step": 109990 }, { - "epoch": 0.55, - "learning_rate": 0.00021675537684588643, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002572296199138889, + "loss": 0.0189, "step": 110000 }, { - "epoch": 0.55, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.010691503062844276, - "eval_runtime": 116.7007, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.284, + "epoch": 0.29, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.01513556856662035, + "eval_runtime": 108.099, + "eval_samples_per_second": 18.502, + "eval_steps_per_second": 4.625, "step": 110000 }, { - "epoch": 0.56, - "learning_rate": 0.0002167478091528724, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002572257316975175, + "loss": 0.0182, "step": 110010 }, { - "epoch": 0.56, - "learning_rate": 0.0002167402414598584, - "loss": 0.0209, + "epoch": 0.29, + "learning_rate": 0.000257221843481146, + "loss": 0.0203, "step": 110020 }, { - "epoch": 0.56, - "learning_rate": 0.0002167326737668444, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.0002572179552647746, + "loss": 0.0241, "step": 110030 }, { - "epoch": 0.56, - "learning_rate": 0.00021672510607383038, - "loss": 0.0184, + "epoch": 0.29, + "learning_rate": 0.0002572140670484031, + "loss": 0.0205, "step": 110040 }, { - "epoch": 0.56, - "learning_rate": 0.00021671753838081636, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002572101788320316, + "loss": 0.0173, "step": 110050 }, { - "epoch": 0.56, - "learning_rate": 0.00021670997068780237, - "loss": 0.0206, + "epoch": 0.29, + "learning_rate": 0.0002572062906156602, + "loss": 0.02, "step": 110060 }, { - "epoch": 0.56, - "learning_rate": 0.00021670240299478835, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.0002572024023992887, + "loss": 0.0204, "step": 110070 }, { - "epoch": 0.56, - "learning_rate": 0.00021669483530177433, - "loss": 0.0166, + "epoch": 0.29, + "learning_rate": 0.0002571985141829172, + "loss": 0.0193, "step": 110080 }, { - "epoch": 0.56, - "learning_rate": 0.00021668726760876034, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.0002571946259665458, + "loss": 0.0222, "step": 110090 }, { - "epoch": 0.56, - "learning_rate": 0.00021667969991574632, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.0002571907377501743, + "loss": 0.0211, "step": 110100 }, { - "epoch": 0.56, - "learning_rate": 0.0002166721322227323, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025718684953380286, + "loss": 0.022, "step": 110110 }, { - "epoch": 0.56, - "learning_rate": 0.00021666456452971829, - "loss": 0.0174, + "epoch": 0.29, + "learning_rate": 0.00025718296131743137, + "loss": 0.0216, "step": 110120 }, { - "epoch": 0.56, - "learning_rate": 0.0002166569968367043, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.0002571790731010599, + "loss": 0.0221, "step": 110130 }, { - "epoch": 0.56, - "learning_rate": 0.00021664942914369028, - "loss": 0.0202, + "epoch": 0.29, + "learning_rate": 0.00025717518488468845, + "loss": 0.0183, "step": 110140 }, { - "epoch": 0.56, - "learning_rate": 0.00021664186145067626, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025717129666831697, + "loss": 0.0219, "step": 110150 }, { - "epoch": 0.56, - "learning_rate": 0.00021663429375766227, - "loss": 0.0186, + "epoch": 0.29, + "learning_rate": 0.00025716740845194554, + "loss": 0.0193, "step": 110160 }, { - "epoch": 0.56, - "learning_rate": 0.00021662672606464825, - "loss": 0.0183, + "epoch": 0.29, + "learning_rate": 0.00025716352023557405, + "loss": 0.0228, "step": 110170 }, { - "epoch": 0.56, - "learning_rate": 0.00021661915837163423, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.00025715963201920257, + "loss": 0.0214, "step": 110180 }, { - "epoch": 0.56, - "learning_rate": 0.00021661159067862024, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.00025715574380283114, + "loss": 0.0222, "step": 110190 }, { - "epoch": 0.56, - "learning_rate": 0.00021660402298560622, - "loss": 0.0195, + "epoch": 0.29, + "learning_rate": 0.00025715185558645965, + "loss": 0.0171, "step": 110200 }, { - "epoch": 0.56, - "learning_rate": 0.0002165964552925922, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.00025714796737008816, + "loss": 0.0174, "step": 110210 }, { - "epoch": 0.56, - "learning_rate": 0.0002165888875995782, - "loss": 0.0144, + "epoch": 0.29, + "learning_rate": 0.00025714407915371673, + "loss": 0.0217, "step": 110220 }, { - "epoch": 0.56, - "learning_rate": 0.0002165813199065642, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025714019093734525, + "loss": 0.0259, "step": 110230 }, { - "epoch": 0.56, - "learning_rate": 0.00021657375221355017, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.0002571363027209738, + "loss": 0.0193, "step": 110240 }, { - "epoch": 0.56, - "learning_rate": 0.00021656618452053618, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025713241450460233, + "loss": 0.024, "step": 110250 }, { - "epoch": 0.56, - "learning_rate": 0.00021655861682752216, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025712852628823085, + "loss": 0.0211, "step": 110260 }, { - "epoch": 0.56, - "learning_rate": 0.00021655104913450814, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002571246380718594, + "loss": 0.022, "step": 110270 }, { - "epoch": 0.56, - "learning_rate": 0.00021654348144149415, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.00025712074985548793, + "loss": 0.0226, "step": 110280 }, { - "epoch": 0.56, - "learning_rate": 0.00021653591374848013, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.00025711686163911644, + "loss": 0.0248, "step": 110290 }, { - "epoch": 0.56, - "learning_rate": 0.00021652834605546611, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.000257112973422745, + "loss": 0.0216, "step": 110300 }, { - "epoch": 0.56, - "learning_rate": 0.0002165207783624521, - "loss": 0.021, + "epoch": 0.29, + "learning_rate": 0.0002571090852063736, + "loss": 0.0293, "step": 110310 }, { - "epoch": 0.56, - "learning_rate": 0.0002165132106694381, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.0002571051969900021, + "loss": 0.0251, "step": 110320 }, { - "epoch": 0.56, - "learning_rate": 0.00021650564297642409, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.0002571013087736306, + "loss": 0.0201, "step": 110330 }, { - "epoch": 0.56, - "learning_rate": 0.00021649807528341007, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.0002570974205572591, + "loss": 0.0238, "step": 110340 }, { - "epoch": 0.56, - "learning_rate": 0.00021649050759039608, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.0002570935323408877, + "loss": 0.0224, "step": 110350 }, { - "epoch": 0.56, - "learning_rate": 0.00021648293989738206, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002570896441245162, + "loss": 0.0234, "step": 110360 }, { - "epoch": 0.56, - "learning_rate": 0.00021647537220436804, - "loss": 0.0187, + "epoch": 0.29, + "learning_rate": 0.0002570857559081448, + "loss": 0.0218, "step": 110370 }, { - "epoch": 0.56, - "learning_rate": 0.00021646780451135405, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002570818676917733, + "loss": 0.0251, "step": 110380 }, { - "epoch": 0.56, - "learning_rate": 0.00021646023681834003, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.00025707797947540186, + "loss": 0.0265, "step": 110390 }, { - "epoch": 0.56, - "learning_rate": 0.000216452669125326, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.0002570740912590304, + "loss": 0.025, "step": 110400 }, { - "epoch": 0.56, - "learning_rate": 0.00021644510143231202, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.0002570702030426589, + "loss": 0.0197, "step": 110410 }, { - "epoch": 0.56, - "learning_rate": 0.000216437533739298, - "loss": 0.0112, + "epoch": 0.29, + "learning_rate": 0.0002570663148262874, + "loss": 0.0283, "step": 110420 }, { - "epoch": 0.56, - "learning_rate": 0.00021642996604628398, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.00025706242660991597, + "loss": 0.0254, "step": 110430 }, { - "epoch": 0.56, - "learning_rate": 0.00021642239835327, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.0002570585383935445, + "loss": 0.0272, "step": 110440 }, { - "epoch": 0.56, - "learning_rate": 0.00021641483066025597, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025705465017717306, + "loss": 0.0203, "step": 110450 }, { - "epoch": 0.56, - "learning_rate": 0.00021640726296724195, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025705076196080157, + "loss": 0.0258, "step": 110460 }, { - "epoch": 0.56, - "learning_rate": 0.00021639969527422793, - "loss": 0.0181, + "epoch": 0.29, + "learning_rate": 0.0002570468737444301, + "loss": 0.024, "step": 110470 }, { - "epoch": 0.56, - "learning_rate": 0.00021639212758121394, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.00025704298552805865, + "loss": 0.0201, "step": 110480 }, { - "epoch": 0.56, - "learning_rate": 0.00021638455988819992, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.00025703909731168717, + "loss": 0.0203, "step": 110490 }, { - "epoch": 0.56, - "learning_rate": 0.0002163769921951859, - "loss": 0.0187, + "epoch": 0.29, + "learning_rate": 0.0002570352090953157, + "loss": 0.0204, "step": 110500 }, { - "epoch": 0.56, - "learning_rate": 0.00021636942450217191, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.00025703132087894425, + "loss": 0.0207, "step": 110510 }, { - "epoch": 0.56, - "learning_rate": 0.0002163618568091579, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.0002570274326625728, + "loss": 0.0206, "step": 110520 }, { - "epoch": 0.56, - "learning_rate": 0.00021635428911614388, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025702354444620133, + "loss": 0.0223, "step": 110530 }, { - "epoch": 0.56, - "learning_rate": 0.00021634672142312989, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.00025701965622982985, + "loss": 0.0181, "step": 110540 }, { - "epoch": 0.56, - "learning_rate": 0.00021633915373011587, - "loss": 0.0117, + "epoch": 0.29, + "learning_rate": 0.00025701576801345836, + "loss": 0.0215, "step": 110550 }, { - "epoch": 0.56, - "learning_rate": 0.00021633158603710185, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.00025701187979708693, + "loss": 0.0214, "step": 110560 }, { - "epoch": 0.56, - "learning_rate": 0.00021632401834408786, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.00025700799158071545, + "loss": 0.0217, "step": 110570 }, { - "epoch": 0.56, - "learning_rate": 0.00021631645065107384, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.000257004103364344, + "loss": 0.0212, "step": 110580 }, { - "epoch": 0.56, - "learning_rate": 0.00021630888295805982, - "loss": 0.0235, + "epoch": 0.29, + "learning_rate": 0.00025700021514797253, + "loss": 0.0182, "step": 110590 }, { - "epoch": 0.56, - "learning_rate": 0.00021630131526504583, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.0002569963269316011, + "loss": 0.0223, "step": 110600 }, { - "epoch": 0.56, - "learning_rate": 0.0002162937475720318, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.0002569924387152296, + "loss": 0.0213, "step": 110610 }, { - "epoch": 0.56, - "learning_rate": 0.0002162861798790178, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025698855049885813, + "loss": 0.0233, "step": 110620 }, { - "epoch": 0.56, - "learning_rate": 0.00021627861218600377, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.00025698466228248664, + "loss": 0.0208, "step": 110630 }, { - "epoch": 0.56, - "learning_rate": 0.00021627104449298978, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.0002569807740661152, + "loss": 0.0198, "step": 110640 }, { - "epoch": 0.56, - "learning_rate": 0.00021626347679997576, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.0002569768858497437, + "loss": 0.0181, "step": 110650 }, { - "epoch": 0.56, - "learning_rate": 0.00021625590910696174, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.0002569729976333723, + "loss": 0.0178, "step": 110660 }, { - "epoch": 0.56, - "learning_rate": 0.00021624834141394775, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.0002569691094170008, + "loss": 0.0212, "step": 110670 }, { - "epoch": 0.56, - "learning_rate": 0.00021624077372093373, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.0002569652212006293, + "loss": 0.023, "step": 110680 }, { - "epoch": 0.56, - "learning_rate": 0.00021623320602791972, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.0002569613329842579, + "loss": 0.0227, "step": 110690 }, { - "epoch": 0.56, - "learning_rate": 0.00021622563833490572, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002569574447678864, + "loss": 0.0243, "step": 110700 }, { - "epoch": 0.56, - "learning_rate": 0.0002162180706418917, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.000256953556551515, + "loss": 0.0203, "step": 110710 }, { - "epoch": 0.56, - "learning_rate": 0.0002162105029488777, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002569496683351435, + "loss": 0.0212, "step": 110720 }, { - "epoch": 0.56, - "learning_rate": 0.0002162029352558637, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.00025694578011877206, + "loss": 0.0208, "step": 110730 }, { - "epoch": 0.56, - "learning_rate": 0.00021619536756284968, - "loss": 0.0123, + "epoch": 0.29, + "learning_rate": 0.0002569418919024006, + "loss": 0.0243, "step": 110740 }, { - "epoch": 0.56, - "learning_rate": 0.00021618779986983566, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002569380036860291, + "loss": 0.0183, "step": 110750 }, { - "epoch": 0.56, - "learning_rate": 0.00021618023217682167, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002569341154696576, + "loss": 0.0196, "step": 110760 }, { - "epoch": 0.56, - "learning_rate": 0.00021617266448380765, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.00025693022725328617, + "loss": 0.0196, "step": 110770 }, { - "epoch": 0.56, - "learning_rate": 0.00021616509679079363, - "loss": 0.0186, + "epoch": 0.29, + "learning_rate": 0.0002569263390369147, + "loss": 0.0209, "step": 110780 }, { - "epoch": 0.56, - "learning_rate": 0.00021615752909777964, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.00025692245082054325, + "loss": 0.0202, "step": 110790 }, { - "epoch": 0.56, - "learning_rate": 0.00021614996140476562, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025691856260417177, + "loss": 0.0227, "step": 110800 }, { - "epoch": 0.56, - "learning_rate": 0.0002161423937117516, - "loss": 0.0126, + "epoch": 0.29, + "learning_rate": 0.00025691467438780034, + "loss": 0.0204, "step": 110810 }, { - "epoch": 0.56, - "learning_rate": 0.00021613482601873758, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.00025691078617142885, + "loss": 0.0221, "step": 110820 }, { - "epoch": 0.56, - "learning_rate": 0.0002161272583257236, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.00025690689795505737, + "loss": 0.0219, "step": 110830 }, { - "epoch": 0.56, - "learning_rate": 0.00021611969063270957, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.0002569030097386859, + "loss": 0.028, "step": 110840 }, { - "epoch": 0.56, - "learning_rate": 0.00021611212293969555, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025689912152231445, + "loss": 0.0185, "step": 110850 }, { - "epoch": 0.56, - "learning_rate": 0.00021610455524668156, - "loss": 0.019, + "epoch": 0.29, + "learning_rate": 0.000256895233305943, + "loss": 0.0245, "step": 110860 }, { - "epoch": 0.56, - "learning_rate": 0.00021609698755366754, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.00025689134508957153, + "loss": 0.0203, "step": 110870 }, { - "epoch": 0.56, - "learning_rate": 0.00021608941986065353, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.00025688745687320005, + "loss": 0.0255, "step": 110880 }, { - "epoch": 0.56, - "learning_rate": 0.00021608185216763953, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002568835686568286, + "loss": 0.0221, "step": 110890 }, { - "epoch": 0.56, - "learning_rate": 0.00021607428447462552, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025687968044045713, + "loss": 0.0208, "step": 110900 }, { - "epoch": 0.56, - "learning_rate": 0.0002160667167816115, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025687579222408565, + "loss": 0.0195, "step": 110910 }, { - "epoch": 0.56, - "learning_rate": 0.0002160591490885975, - "loss": 0.0135, + "epoch": 0.29, + "learning_rate": 0.0002568719040077142, + "loss": 0.0185, "step": 110920 }, { - "epoch": 0.56, - "learning_rate": 0.0002160515813955835, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.00025686801579134273, + "loss": 0.0215, "step": 110930 }, { - "epoch": 0.56, - "learning_rate": 0.00021604401370256947, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.0002568641275749713, + "loss": 0.023, "step": 110940 }, { - "epoch": 0.56, - "learning_rate": 0.00021603644600955548, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002568602393585998, + "loss": 0.0179, "step": 110950 }, { - "epoch": 0.56, - "learning_rate": 0.00021602887831654146, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.0002568563511422283, + "loss": 0.0208, "step": 110960 }, { - "epoch": 0.56, - "learning_rate": 0.00021602131062352744, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.00025685246292585684, + "loss": 0.0222, "step": 110970 }, { - "epoch": 0.56, - "learning_rate": 0.00021601374293051342, - "loss": 0.0126, + "epoch": 0.29, + "learning_rate": 0.0002568485747094854, + "loss": 0.0232, "step": 110980 }, { - "epoch": 0.56, - "learning_rate": 0.00021600617523749943, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002568446864931139, + "loss": 0.0218, "step": 110990 }, { - "epoch": 0.56, - "learning_rate": 0.0002159986075444854, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.0002568407982767425, + "loss": 0.0216, "step": 111000 }, { - "epoch": 0.56, - "eval_cer": 0.914462492734159, - "eval_loss": 0.010961051099002361, - "eval_runtime": 116.7509, - "eval_samples_per_second": 17.13, - "eval_steps_per_second": 4.283, + "epoch": 0.29, + "eval_cer": 0.8817768670806793, + "eval_loss": 0.015027694404125214, + "eval_runtime": 107.3953, + "eval_samples_per_second": 18.623, + "eval_steps_per_second": 4.656, "step": 111000 }, { - "epoch": 0.56, - "learning_rate": 0.0002159910398514714, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.000256836910060371, + "loss": 0.0184, "step": 111010 }, { - "epoch": 0.56, - "learning_rate": 0.0002159834721584574, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.0002568330218439996, + "loss": 0.0263, "step": 111020 }, { - "epoch": 0.56, - "learning_rate": 0.00021597590446544338, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.0002568291336276281, + "loss": 0.0229, "step": 111030 }, { - "epoch": 0.56, - "learning_rate": 0.00021596833677242936, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.0002568252454112566, + "loss": 0.0244, "step": 111040 }, { - "epoch": 0.56, - "learning_rate": 0.00021596076907941537, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002568213571948851, + "loss": 0.0261, "step": 111050 }, { - "epoch": 0.56, - "learning_rate": 0.00021595320138640135, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002568174689785137, + "loss": 0.0261, "step": 111060 }, { - "epoch": 0.56, - "learning_rate": 0.00021594563369338734, - "loss": 0.011, + "epoch": 0.29, + "learning_rate": 0.00025681358076214226, + "loss": 0.0212, "step": 111070 }, { - "epoch": 0.56, - "learning_rate": 0.00021593806600037334, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025680969254577077, + "loss": 0.023, "step": 111080 }, { - "epoch": 0.56, - "learning_rate": 0.00021593049830735933, - "loss": 0.0135, + "epoch": 0.29, + "learning_rate": 0.0002568058043293993, + "loss": 0.0245, "step": 111090 }, { - "epoch": 0.56, - "learning_rate": 0.0002159229306143453, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.00025680191611302786, + "loss": 0.0261, "step": 111100 }, { - "epoch": 0.56, - "learning_rate": 0.00021591536292133132, - "loss": 0.0121, + "epoch": 0.29, + "learning_rate": 0.00025679802789665637, + "loss": 0.0242, "step": 111110 }, { - "epoch": 0.56, - "learning_rate": 0.0002159077952283173, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.0002567941396802849, + "loss": 0.0203, "step": 111120 }, { - "epoch": 0.56, - "learning_rate": 0.00021590022753530328, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.00025679025146391345, + "loss": 0.0209, "step": 111130 }, { - "epoch": 0.56, - "learning_rate": 0.00021589265984228926, - "loss": 0.0119, + "epoch": 0.29, + "learning_rate": 0.00025678636324754197, + "loss": 0.0235, "step": 111140 }, { - "epoch": 0.56, - "learning_rate": 0.00021588509214927527, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.00025678247503117054, + "loss": 0.0218, "step": 111150 }, { - "epoch": 0.56, - "learning_rate": 0.00021587752445626125, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.00025677858681479905, + "loss": 0.0181, "step": 111160 }, { - "epoch": 0.56, - "learning_rate": 0.00021586995676324723, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.00025677469859842757, + "loss": 0.0223, "step": 111170 }, { - "epoch": 0.56, - "learning_rate": 0.00021586238907023324, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.0002567708103820561, + "loss": 0.0178, "step": 111180 }, { - "epoch": 0.56, - "learning_rate": 0.00021585482137721922, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.00025676692216568465, + "loss": 0.0201, "step": 111190 }, { - "epoch": 0.56, - "learning_rate": 0.0002158472536842052, - "loss": 0.0184, + "epoch": 0.29, + "learning_rate": 0.0002567630339493132, + "loss": 0.0222, "step": 111200 }, { - "epoch": 0.56, - "learning_rate": 0.0002158396859911912, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025675914573294173, + "loss": 0.0233, "step": 111210 }, { - "epoch": 0.56, - "learning_rate": 0.0002158321182981772, - "loss": 0.0189, + "epoch": 0.29, + "learning_rate": 0.00025675525751657025, + "loss": 0.02, "step": 111220 }, { - "epoch": 0.56, - "learning_rate": 0.00021582455060516317, - "loss": 0.0204, + "epoch": 0.29, + "learning_rate": 0.0002567513693001988, + "loss": 0.0214, "step": 111230 }, { - "epoch": 0.56, - "learning_rate": 0.00021581698291214913, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.00025674748108382733, + "loss": 0.0224, "step": 111240 }, { - "epoch": 0.56, - "learning_rate": 0.00021580941521913514, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025674359286745584, + "loss": 0.02, "step": 111250 }, { - "epoch": 0.56, - "learning_rate": 0.00021580184752612112, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002567397046510844, + "loss": 0.0188, "step": 111260 }, { - "epoch": 0.56, - "learning_rate": 0.0002157942798331071, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.00025673581643471293, + "loss": 0.0176, "step": 111270 }, { - "epoch": 0.56, - "learning_rate": 0.0002157867121400931, - "loss": 0.0121, + "epoch": 0.29, + "learning_rate": 0.0002567319282183415, + "loss": 0.0215, "step": 111280 }, { - "epoch": 0.56, - "learning_rate": 0.0002157791444470791, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.00025672804000197, + "loss": 0.0214, "step": 111290 }, { - "epoch": 0.56, - "learning_rate": 0.00021577157675406507, - "loss": 0.0119, + "epoch": 0.29, + "learning_rate": 0.0002567241517855985, + "loss": 0.0276, "step": 111300 }, { - "epoch": 0.56, - "learning_rate": 0.00021576400906105108, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.0002567202635692271, + "loss": 0.0264, "step": 111310 }, { - "epoch": 0.56, - "learning_rate": 0.00021575644136803706, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.0002567163753528556, + "loss": 0.0247, "step": 111320 }, { - "epoch": 0.56, - "learning_rate": 0.00021574887367502304, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.0002567124871364841, + "loss": 0.0254, "step": 111330 }, { - "epoch": 0.56, - "learning_rate": 0.00021574130598200905, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.0002567085989201127, + "loss": 0.0247, "step": 111340 }, { - "epoch": 0.56, - "learning_rate": 0.00021573373828899503, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.00025670471070374126, + "loss": 0.0222, "step": 111350 }, { - "epoch": 0.56, - "learning_rate": 0.00021572617059598101, - "loss": 0.0144, + "epoch": 0.29, + "learning_rate": 0.0002567008224873698, + "loss": 0.0237, "step": 111360 }, { - "epoch": 0.56, - "learning_rate": 0.000215718602902967, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002566969342709983, + "loss": 0.0229, "step": 111370 }, { - "epoch": 0.56, - "learning_rate": 0.000215711035209953, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002566930460546268, + "loss": 0.0257, "step": 111380 }, { - "epoch": 0.56, - "learning_rate": 0.00021570346751693899, - "loss": 0.0174, + "epoch": 0.29, + "learning_rate": 0.0002566891578382554, + "loss": 0.0203, "step": 111390 }, { - "epoch": 0.56, - "learning_rate": 0.00021569589982392497, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.0002566852696218839, + "loss": 0.0259, "step": 111400 }, { - "epoch": 0.56, - "learning_rate": 0.00021568833213091098, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025668138140551246, + "loss": 0.0197, "step": 111410 }, { - "epoch": 0.56, - "learning_rate": 0.00021568076443789696, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025667749318914097, + "loss": 0.0206, "step": 111420 }, { - "epoch": 0.56, - "learning_rate": 0.00021567319674488294, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.0002566736049727695, + "loss": 0.0165, "step": 111430 }, { - "epoch": 0.56, - "learning_rate": 0.00021566562905186895, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.00025666971675639805, + "loss": 0.0222, "step": 111440 }, { - "epoch": 0.56, - "learning_rate": 0.00021565806135885493, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.00025666582854002657, + "loss": 0.0198, "step": 111450 }, { - "epoch": 0.56, - "learning_rate": 0.0002156504936658409, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.0002566619403236551, + "loss": 0.0193, "step": 111460 }, { - "epoch": 0.56, - "learning_rate": 0.00021564292597282692, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.00025665805210728365, + "loss": 0.0248, "step": 111470 }, { - "epoch": 0.56, - "learning_rate": 0.0002156353582798129, - "loss": 0.0124, + "epoch": 0.29, + "learning_rate": 0.00025665416389091217, + "loss": 0.0193, "step": 111480 }, { - "epoch": 0.56, - "learning_rate": 0.00021562779058679888, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.00025665027567454074, + "loss": 0.0249, "step": 111490 }, { - "epoch": 0.56, - "learning_rate": 0.0002156202228937849, - "loss": 0.0125, + "epoch": 0.29, + "learning_rate": 0.00025664638745816925, + "loss": 0.0228, "step": 111500 }, { - "epoch": 0.56, - "learning_rate": 0.00021561265520077087, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025664249924179776, + "loss": 0.0266, "step": 111510 }, { - "epoch": 0.56, - "learning_rate": 0.00021560508750775685, - "loss": 0.0203, + "epoch": 0.29, + "learning_rate": 0.00025663861102542633, + "loss": 0.0218, "step": 111520 }, { - "epoch": 0.56, - "learning_rate": 0.00021559751981474283, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.00025663472280905485, + "loss": 0.0217, "step": 111530 }, { - "epoch": 0.56, - "learning_rate": 0.00021558995212172884, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.00025663083459268336, + "loss": 0.0193, "step": 111540 }, { - "epoch": 0.56, - "learning_rate": 0.00021558238442871482, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025662694637631193, + "loss": 0.0245, "step": 111550 }, { - "epoch": 0.56, - "learning_rate": 0.0002155748167357008, - "loss": 0.0158, + "epoch": 0.29, + "learning_rate": 0.0002566230581599405, + "loss": 0.0206, "step": 111560 }, { - "epoch": 0.56, - "learning_rate": 0.00021556724904268681, - "loss": 0.0125, + "epoch": 0.29, + "learning_rate": 0.000256619169943569, + "loss": 0.0195, "step": 111570 }, { - "epoch": 0.56, - "learning_rate": 0.0002155596813496728, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025661528172719753, + "loss": 0.0179, "step": 111580 }, { - "epoch": 0.56, - "learning_rate": 0.00021555211365665878, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025661139351082604, + "loss": 0.019, "step": 111590 }, { - "epoch": 0.56, - "learning_rate": 0.00021554454596364479, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.0002566075052944546, + "loss": 0.0215, "step": 111600 }, { - "epoch": 0.56, - "learning_rate": 0.00021553697827063077, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.0002566036170780831, + "loss": 0.0229, "step": 111610 }, { - "epoch": 0.56, - "learning_rate": 0.00021552941057761675, - "loss": 0.0135, + "epoch": 0.29, + "learning_rate": 0.0002565997288617117, + "loss": 0.0212, "step": 111620 }, { - "epoch": 0.56, - "learning_rate": 0.00021552184288460276, - "loss": 0.0147, - "step": 111630 + "epoch": 0.29, + "learning_rate": 0.0002565958406453402, + "loss": 0.0206, + "step": 111630 }, { - "epoch": 0.56, - "learning_rate": 0.00021551427519158874, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.0002565919524289688, + "loss": 0.0237, "step": 111640 }, { - "epoch": 0.56, - "learning_rate": 0.00021550670749857472, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002565880642125973, + "loss": 0.0206, "step": 111650 }, { - "epoch": 0.56, - "learning_rate": 0.00021549913980556073, - "loss": 0.0135, + "epoch": 0.29, + "learning_rate": 0.0002565841759962258, + "loss": 0.0248, "step": 111660 }, { - "epoch": 0.56, - "learning_rate": 0.0002154915721125467, - "loss": 0.0114, + "epoch": 0.29, + "learning_rate": 0.0002565802877798543, + "loss": 0.0244, "step": 111670 }, { - "epoch": 0.56, - "learning_rate": 0.0002154840044195327, - "loss": 0.0199, + "epoch": 0.29, + "learning_rate": 0.0002565763995634829, + "loss": 0.0221, "step": 111680 }, { - "epoch": 0.56, - "learning_rate": 0.0002154764367265187, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.0002565725113471114, + "loss": 0.0193, "step": 111690 }, { - "epoch": 0.56, - "learning_rate": 0.00021546886903350468, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025656862313074, + "loss": 0.0303, "step": 111700 }, { - "epoch": 0.56, - "learning_rate": 0.00021546130134049066, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002565647349143685, + "loss": 0.0178, "step": 111710 }, { - "epoch": 0.56, - "learning_rate": 0.00021545373364747664, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.000256560846697997, + "loss": 0.0268, "step": 111720 }, { - "epoch": 0.56, - "learning_rate": 0.00021544616595446265, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.00025655695848162557, + "loss": 0.022, "step": 111730 }, { - "epoch": 0.56, - "learning_rate": 0.00021543859826144863, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002565530702652541, + "loss": 0.0282, "step": 111740 }, { - "epoch": 0.56, - "learning_rate": 0.00021543103056843462, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.00025654918204888266, + "loss": 0.0237, "step": 111750 }, { - "epoch": 0.56, - "learning_rate": 0.00021542346287542062, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.00025654529383251117, + "loss": 0.0197, "step": 111760 }, { - "epoch": 0.56, - "learning_rate": 0.0002154158951824066, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.00025654140561613974, + "loss": 0.0217, "step": 111770 }, { - "epoch": 0.56, - "learning_rate": 0.0002154083274893926, - "loss": 0.0135, + "epoch": 0.29, + "learning_rate": 0.00025653751739976825, + "loss": 0.0259, "step": 111780 }, { - "epoch": 0.56, - "learning_rate": 0.0002154007597963786, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.00025653362918339677, + "loss": 0.0278, "step": 111790 }, { - "epoch": 0.56, - "learning_rate": 0.00021539319210336458, - "loss": 0.0188, + "epoch": 0.29, + "learning_rate": 0.0002565297409670253, + "loss": 0.02, "step": 111800 }, { - "epoch": 0.56, - "learning_rate": 0.00021538562441035056, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.00025652585275065385, + "loss": 0.025, "step": 111810 }, { - "epoch": 0.56, - "learning_rate": 0.00021537805671733657, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.00025652196453428237, + "loss": 0.0207, "step": 111820 }, { - "epoch": 0.56, - "learning_rate": 0.00021537048902432255, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025651807631791093, + "loss": 0.0216, "step": 111830 }, { - "epoch": 0.56, - "learning_rate": 0.00021536292133130853, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025651418810153945, + "loss": 0.0175, "step": 111840 }, { - "epoch": 0.56, - "learning_rate": 0.00021535535363829454, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.000256510299885168, + "loss": 0.0194, "step": 111850 }, { - "epoch": 0.56, - "learning_rate": 0.00021534778594528052, - "loss": 0.0123, + "epoch": 0.29, + "learning_rate": 0.00025650641166879653, + "loss": 0.0175, "step": 111860 }, { - "epoch": 0.56, - "learning_rate": 0.0002153402182522665, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.00025650252345242505, + "loss": 0.0198, "step": 111870 }, { - "epoch": 0.56, - "learning_rate": 0.00021533265055925248, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025649863523605356, + "loss": 0.0211, "step": 111880 }, { - "epoch": 0.56, - "learning_rate": 0.0002153250828662385, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025649474701968213, + "loss": 0.0205, "step": 111890 }, { - "epoch": 0.56, - "learning_rate": 0.00021531751517322447, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.0002564908588033107, + "loss": 0.0208, "step": 111900 }, { - "epoch": 0.56, - "learning_rate": 0.00021530994748021045, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.0002564869705869392, + "loss": 0.0216, "step": 111910 }, { - "epoch": 0.56, - "learning_rate": 0.00021530237978719646, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025648308237056773, + "loss": 0.0177, "step": 111920 }, { - "epoch": 0.56, - "learning_rate": 0.00021529481209418244, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.00025647919415419624, + "loss": 0.0228, "step": 111930 }, { - "epoch": 0.56, - "learning_rate": 0.00021528724440116843, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.0002564753059378248, + "loss": 0.0206, "step": 111940 }, { - "epoch": 0.56, - "learning_rate": 0.00021527967670815443, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.0002564714177214533, + "loss": 0.0187, "step": 111950 }, { - "epoch": 0.56, - "learning_rate": 0.00021527210901514042, - "loss": 0.0118, + "epoch": 0.29, + "learning_rate": 0.0002564675295050819, + "loss": 0.0284, "step": 111960 }, { - "epoch": 0.56, - "learning_rate": 0.0002152645413221264, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.0002564636412887104, + "loss": 0.0221, "step": 111970 }, { - "epoch": 0.56, - "learning_rate": 0.0002152569736291124, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.000256459753072339, + "loss": 0.0197, "step": 111980 }, { - "epoch": 0.57, - "learning_rate": 0.0002152494059360984, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.0002564558648559675, + "loss": 0.0229, "step": 111990 }, { - "epoch": 0.57, - "learning_rate": 0.00021524183824308437, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.000256451976639596, + "loss": 0.0198, "step": 112000 }, { - "epoch": 0.57, - "eval_cer": 0.9144595815457828, - "eval_loss": 0.011023299768567085, - "eval_runtime": 116.6938, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.29, + "eval_cer": 0.8818104583670996, + "eval_loss": 0.014513031579554081, + "eval_runtime": 107.5973, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 112000 }, { - "epoch": 0.57, - "learning_rate": 0.00021523427055007038, - "loss": 0.0195, + "epoch": 0.29, + "learning_rate": 0.0002564480884232245, + "loss": 0.0193, "step": 112010 }, { - "epoch": 0.57, - "learning_rate": 0.00021522670285705636, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.0002564442002068531, + "loss": 0.0259, "step": 112020 }, { - "epoch": 0.57, - "learning_rate": 0.00021521913516404234, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.0002564403119904816, + "loss": 0.0191, "step": 112030 }, { - "epoch": 0.57, - "learning_rate": 0.00021521156747102832, - "loss": 0.0166, + "epoch": 0.29, + "learning_rate": 0.00025643642377411017, + "loss": 0.0239, "step": 112040 }, { - "epoch": 0.57, - "learning_rate": 0.00021520399977801433, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.0002564325355577387, + "loss": 0.0213, "step": 112050 }, { - "epoch": 0.57, - "learning_rate": 0.0002151964320850003, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.00025642864734136726, + "loss": 0.0212, "step": 112060 }, { - "epoch": 0.57, - "learning_rate": 0.0002151888643919863, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.00025642475912499577, + "loss": 0.023, "step": 112070 }, { - "epoch": 0.57, - "learning_rate": 0.0002151812966989723, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.0002564208709086243, + "loss": 0.018, "step": 112080 }, { - "epoch": 0.57, - "learning_rate": 0.00021517372900595828, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.0002564169826922528, + "loss": 0.022, "step": 112090 }, { - "epoch": 0.57, - "learning_rate": 0.00021516616131294426, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.00025641309447588137, + "loss": 0.0197, "step": 112100 }, { - "epoch": 0.57, - "learning_rate": 0.00021515859361993027, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025640920625950994, + "loss": 0.0261, "step": 112110 }, { - "epoch": 0.57, - "learning_rate": 0.00021515102592691625, - "loss": 0.0191, + "epoch": 0.29, + "learning_rate": 0.00025640531804313845, + "loss": 0.019, "step": 112120 }, { - "epoch": 0.57, - "learning_rate": 0.00021514345823390224, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025640142982676697, + "loss": 0.0225, "step": 112130 }, { - "epoch": 0.57, - "learning_rate": 0.00021513589054088824, - "loss": 0.0165, + "epoch": 0.29, + "learning_rate": 0.00025639754161039553, + "loss": 0.0282, "step": 112140 }, { - "epoch": 0.57, - "learning_rate": 0.00021512832284787423, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.00025639365339402405, + "loss": 0.0186, "step": 112150 }, { - "epoch": 0.57, - "learning_rate": 0.0002151207551548602, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025638976517765256, + "loss": 0.02, "step": 112160 }, { - "epoch": 0.57, - "learning_rate": 0.00021511318746184622, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.00025638587696128113, + "loss": 0.0325, "step": 112170 }, { - "epoch": 0.57, - "learning_rate": 0.0002151056197688322, - "loss": 0.0132, + "epoch": 0.29, + "learning_rate": 0.00025638198874490965, + "loss": 0.0204, "step": 112180 }, { - "epoch": 0.57, - "learning_rate": 0.00021509805207581818, - "loss": 0.0111, + "epoch": 0.29, + "learning_rate": 0.0002563781005285382, + "loss": 0.0177, "step": 112190 }, { - "epoch": 0.57, - "learning_rate": 0.0002150904843828042, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025637421231216673, + "loss": 0.0204, "step": 112200 }, { - "epoch": 0.57, - "learning_rate": 0.00021508291668979017, - "loss": 0.0165, + "epoch": 0.29, + "learning_rate": 0.00025637032409579525, + "loss": 0.0215, "step": 112210 }, { - "epoch": 0.57, - "learning_rate": 0.00021507534899677615, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.00025636643587942376, + "loss": 0.0195, "step": 112220 }, { - "epoch": 0.57, - "learning_rate": 0.00021506778130376213, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025636254766305233, + "loss": 0.0216, "step": 112230 }, { - "epoch": 0.57, - "learning_rate": 0.00021506021361074814, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025635865944668084, + "loss": 0.023, "step": 112240 }, { - "epoch": 0.57, - "learning_rate": 0.00021505264591773412, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.0002563547712303094, + "loss": 0.0198, "step": 112250 }, { - "epoch": 0.57, - "learning_rate": 0.0002150450782247201, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.0002563508830139379, + "loss": 0.0223, "step": 112260 }, { - "epoch": 0.57, - "learning_rate": 0.0002150375105317061, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.0002563469947975665, + "loss": 0.0184, "step": 112270 }, { - "epoch": 0.57, - "learning_rate": 0.0002150299428386921, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.000256343106581195, + "loss": 0.0204, "step": 112280 }, { - "epoch": 0.57, - "learning_rate": 0.00021502237514567807, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.0002563392183648235, + "loss": 0.0226, "step": 112290 }, { - "epoch": 0.57, - "learning_rate": 0.00021501480745266408, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.0002563353301484521, + "loss": 0.0317, "step": 112300 }, { - "epoch": 0.57, - "learning_rate": 0.00021500723975965006, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.0002563314419320806, + "loss": 0.0268, "step": 112310 }, { - "epoch": 0.57, - "learning_rate": 0.00021499967206663605, - "loss": 0.0123, + "epoch": 0.29, + "learning_rate": 0.0002563275537157092, + "loss": 0.0247, "step": 112320 }, { - "epoch": 0.57, - "learning_rate": 0.00021499210437362205, - "loss": 0.0195, + "epoch": 0.29, + "learning_rate": 0.0002563236654993377, + "loss": 0.0246, "step": 112330 }, { - "epoch": 0.57, - "learning_rate": 0.00021498453668060804, - "loss": 0.0159, + "epoch": 0.29, + "learning_rate": 0.0002563197772829662, + "loss": 0.0198, "step": 112340 }, { - "epoch": 0.57, - "learning_rate": 0.00021497696898759402, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002563158890665948, + "loss": 0.0226, "step": 112350 }, { - "epoch": 0.57, - "learning_rate": 0.00021496940129458003, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.0002563120008502233, + "loss": 0.0214, "step": 112360 }, { - "epoch": 0.57, - "learning_rate": 0.000214961833601566, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.0002563081126338518, + "loss": 0.0207, "step": 112370 }, { - "epoch": 0.57, - "learning_rate": 0.000214954265908552, - "loss": 0.0178, + "epoch": 0.29, + "learning_rate": 0.00025630422441748037, + "loss": 0.023, "step": 112380 }, { - "epoch": 0.57, - "learning_rate": 0.00021494669821553797, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.00025630033620110894, + "loss": 0.0205, "step": 112390 }, { - "epoch": 0.57, - "learning_rate": 0.00021493913052252398, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025629644798473745, + "loss": 0.0296, "step": 112400 }, { - "epoch": 0.57, - "learning_rate": 0.00021493156282950996, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.00025629255976836597, + "loss": 0.0195, "step": 112410 }, { - "epoch": 0.57, - "learning_rate": 0.00021492399513649594, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.0002562886715519945, + "loss": 0.0336, "step": 112420 }, { - "epoch": 0.57, - "learning_rate": 0.00021491642744348195, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.000256284783335623, + "loss": 0.0191, "step": 112430 }, { - "epoch": 0.57, - "learning_rate": 0.00021490885975046793, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025628089511925157, + "loss": 0.0231, "step": 112440 }, { - "epoch": 0.57, - "learning_rate": 0.0002149012920574539, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025627700690288014, + "loss": 0.0214, "step": 112450 }, { - "epoch": 0.57, - "learning_rate": 0.00021489372436443992, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.00025627311868650865, + "loss": 0.0366, "step": 112460 }, { - "epoch": 0.57, - "learning_rate": 0.0002148861566714259, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025626923047013717, + "loss": 0.0222, "step": 112470 }, { - "epoch": 0.57, - "learning_rate": 0.00021487858897841188, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.00025626534225376573, + "loss": 0.0205, "step": 112480 }, { - "epoch": 0.57, - "learning_rate": 0.0002148710212853979, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.00025626145403739425, + "loss": 0.021, "step": 112490 }, { - "epoch": 0.57, - "learning_rate": 0.00021486345359238385, - "loss": 0.0151, + "epoch": 0.29, + "learning_rate": 0.00025625756582102276, + "loss": 0.0244, "step": 112500 }, { - "epoch": 0.57, - "learning_rate": 0.00021485588589936983, - "loss": 0.0166, + "epoch": 0.29, + "learning_rate": 0.00025625367760465133, + "loss": 0.0211, "step": 112510 }, { - "epoch": 0.57, - "learning_rate": 0.0002148483182063558, - "loss": 0.0154, + "epoch": 0.29, + "learning_rate": 0.00025624978938827985, + "loss": 0.0202, "step": 112520 }, { - "epoch": 0.57, - "learning_rate": 0.00021484075051334182, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002562459011719084, + "loss": 0.0184, "step": 112530 }, { - "epoch": 0.57, - "learning_rate": 0.0002148331828203278, - "loss": 0.018, + "epoch": 0.29, + "learning_rate": 0.00025624201295553693, + "loss": 0.0196, "step": 112540 }, { - "epoch": 0.57, - "learning_rate": 0.00021482561512731378, - "loss": 0.0169, + "epoch": 0.29, + "learning_rate": 0.00025623812473916544, + "loss": 0.0208, "step": 112550 }, { - "epoch": 0.57, - "learning_rate": 0.0002148180474342998, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.000256234236522794, + "loss": 0.0204, "step": 112560 }, { - "epoch": 0.57, - "learning_rate": 0.00021481047974128577, - "loss": 0.0176, + "epoch": 0.29, + "learning_rate": 0.00025623034830642253, + "loss": 0.0196, "step": 112570 }, { - "epoch": 0.57, - "learning_rate": 0.00021480291204827175, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025622646009005104, + "loss": 0.0266, "step": 112580 }, { - "epoch": 0.57, - "learning_rate": 0.00021479534435525776, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.0002562225718736796, + "loss": 0.0209, "step": 112590 }, { - "epoch": 0.57, - "learning_rate": 0.00021478777666224374, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.0002562186836573082, + "loss": 0.0248, "step": 112600 }, { - "epoch": 0.57, - "learning_rate": 0.00021478020896922972, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.0002562147954409367, + "loss": 0.0199, "step": 112610 }, { - "epoch": 0.57, - "learning_rate": 0.0002147726412762157, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.0002562109072245652, + "loss": 0.0228, "step": 112620 }, { - "epoch": 0.57, - "learning_rate": 0.00021476507358320171, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.0002562070190081937, + "loss": 0.0294, "step": 112630 }, { - "epoch": 0.57, - "learning_rate": 0.0002147575058901877, - "loss": 0.0161, + "epoch": 0.29, + "learning_rate": 0.0002562031307918223, + "loss": 0.0217, "step": 112640 }, { - "epoch": 0.57, - "learning_rate": 0.00021474993819717368, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.0002561992425754508, + "loss": 0.0192, "step": 112650 }, { - "epoch": 0.57, - "learning_rate": 0.00021474237050415969, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002561953543590794, + "loss": 0.0228, "step": 112660 }, { - "epoch": 0.57, - "learning_rate": 0.00021473480281114567, - "loss": 0.0124, + "epoch": 0.29, + "learning_rate": 0.0002561914661427079, + "loss": 0.0229, "step": 112670 }, { - "epoch": 0.57, - "learning_rate": 0.00021472723511813165, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.0002561875779263364, + "loss": 0.0264, "step": 112680 }, { - "epoch": 0.57, - "learning_rate": 0.00021471966742511766, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025618368970996497, + "loss": 0.0239, "step": 112690 }, { - "epoch": 0.57, - "learning_rate": 0.00021471209973210364, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.0002561798014935935, + "loss": 0.0209, "step": 112700 }, { - "epoch": 0.57, - "learning_rate": 0.00021470453203908962, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.000256175913277222, + "loss": 0.023, "step": 112710 }, { - "epoch": 0.57, - "learning_rate": 0.00021469696434607563, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.00025617202506085057, + "loss": 0.0176, "step": 112720 }, { - "epoch": 0.57, - "learning_rate": 0.0002146893966530616, - "loss": 0.0144, + "epoch": 0.29, + "learning_rate": 0.0002561681368444791, + "loss": 0.0204, "step": 112730 }, { - "epoch": 0.57, - "learning_rate": 0.0002146818289600476, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.00025616424862810765, + "loss": 0.0192, "step": 112740 }, { - "epoch": 0.57, - "learning_rate": 0.0002146742612670336, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025616036041173617, + "loss": 0.0244, "step": 112750 }, { - "epoch": 0.57, - "learning_rate": 0.00021466669357401958, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.0002561564721953647, + "loss": 0.0233, "step": 112760 }, { - "epoch": 0.57, - "learning_rate": 0.00021465912588100556, - "loss": 0.0149, + "epoch": 0.29, + "learning_rate": 0.00025615258397899325, + "loss": 0.0216, "step": 112770 }, { - "epoch": 0.57, - "learning_rate": 0.00021465155818799154, - "loss": 0.0145, + "epoch": 0.29, + "learning_rate": 0.00025614869576262177, + "loss": 0.0232, "step": 112780 }, { - "epoch": 0.57, - "learning_rate": 0.00021464399049497755, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.00025614480754625033, + "loss": 0.0215, "step": 112790 }, { - "epoch": 0.57, - "learning_rate": 0.00021463642280196353, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.00025614091932987885, + "loss": 0.0228, "step": 112800 }, { - "epoch": 0.57, - "learning_rate": 0.00021462885510894952, - "loss": 0.0184, + "epoch": 0.29, + "learning_rate": 0.0002561370311135074, + "loss": 0.0231, "step": 112810 }, { - "epoch": 0.57, - "learning_rate": 0.00021462128741593552, - "loss": 0.0125, + "epoch": 0.29, + "learning_rate": 0.00025613314289713593, + "loss": 0.0226, "step": 112820 }, { - "epoch": 0.57, - "learning_rate": 0.0002146137197229215, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.00025612925468076445, + "loss": 0.0259, "step": 112830 }, { - "epoch": 0.57, - "learning_rate": 0.0002146061520299075, - "loss": 0.0189, + "epoch": 0.29, + "learning_rate": 0.00025612536646439296, + "loss": 0.0187, "step": 112840 }, { - "epoch": 0.57, - "learning_rate": 0.0002145985843368935, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.00025612147824802153, + "loss": 0.0247, "step": 112850 }, { - "epoch": 0.57, - "learning_rate": 0.00021459101664387948, - "loss": 0.0165, + "epoch": 0.29, + "learning_rate": 0.00025611759003165005, + "loss": 0.018, "step": 112860 }, { - "epoch": 0.57, - "learning_rate": 0.00021458344895086546, - "loss": 0.0146, + "epoch": 0.29, + "learning_rate": 0.0002561137018152786, + "loss": 0.0238, "step": 112870 }, { - "epoch": 0.57, - "learning_rate": 0.00021457588125785147, - "loss": 0.0148, + "epoch": 0.29, + "learning_rate": 0.00025610981359890713, + "loss": 0.0218, "step": 112880 }, { - "epoch": 0.57, - "learning_rate": 0.00021456831356483745, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.00025610592538253564, + "loss": 0.0219, "step": 112890 }, { - "epoch": 0.57, - "learning_rate": 0.00021456074587182343, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.0002561020371661642, + "loss": 0.0236, "step": 112900 }, { - "epoch": 0.57, - "learning_rate": 0.00021455317817880944, - "loss": 0.0157, + "epoch": 0.29, + "learning_rate": 0.0002560981489497927, + "loss": 0.0201, "step": 112910 }, { - "epoch": 0.57, - "learning_rate": 0.00021454561048579542, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025609426073342124, + "loss": 0.0227, "step": 112920 }, { - "epoch": 0.57, - "learning_rate": 0.0002145380427927814, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.0002560903725170498, + "loss": 0.0221, "step": 112930 }, { - "epoch": 0.57, - "learning_rate": 0.00021453047509976738, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.0002560864843006784, + "loss": 0.0248, "step": 112940 }, { - "epoch": 0.57, - "learning_rate": 0.0002145229074067534, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.0002560825960843069, + "loss": 0.0201, "step": 112950 }, { - "epoch": 0.57, - "learning_rate": 0.00021451533971373937, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002560787078679354, + "loss": 0.0302, "step": 112960 }, { - "epoch": 0.57, - "learning_rate": 0.00021450777202072535, - "loss": 0.0171, + "epoch": 0.29, + "learning_rate": 0.0002560748196515639, + "loss": 0.0223, "step": 112970 }, { - "epoch": 0.57, - "learning_rate": 0.00021450020432771136, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.0002560709314351925, + "loss": 0.0267, "step": 112980 }, { - "epoch": 0.57, - "learning_rate": 0.00021449263663469734, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.000256067043218821, + "loss": 0.0223, "step": 112990 }, { - "epoch": 0.57, - "learning_rate": 0.00021448506894168333, - "loss": 0.012, + "epoch": 0.29, + "learning_rate": 0.0002560631550024496, + "loss": 0.0195, "step": 113000 }, { - "epoch": 0.57, - "eval_cer": 0.9144906342217957, - "eval_loss": 0.01105137262493372, - "eval_runtime": 116.8218, - "eval_samples_per_second": 17.12, - "eval_steps_per_second": 4.28, + "epoch": 0.29, + "eval_cer": 0.881782465628416, + "eval_loss": 0.015686366707086563, + "eval_runtime": 107.7549, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, "step": 113000 }, { - "epoch": 0.57, - "learning_rate": 0.00021447750124866933, - "loss": 0.0144, + "epoch": 0.29, + "learning_rate": 0.0002560592667860781, + "loss": 0.018, "step": 113010 }, { - "epoch": 0.57, - "learning_rate": 0.00021446993355565532, - "loss": 0.0109, + "epoch": 0.29, + "learning_rate": 0.00025605537856970666, + "loss": 0.0211, "step": 113020 }, { - "epoch": 0.57, - "learning_rate": 0.0002144623658626413, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.00025605149035333517, + "loss": 0.0255, "step": 113030 }, { - "epoch": 0.57, - "learning_rate": 0.0002144547981696273, - "loss": 0.0138, + "epoch": 0.29, + "learning_rate": 0.0002560476021369637, + "loss": 0.0197, "step": 113040 }, { - "epoch": 0.57, - "learning_rate": 0.0002144472304766133, - "loss": 0.0126, + "epoch": 0.29, + "learning_rate": 0.0002560437139205922, + "loss": 0.0235, "step": 113050 }, { - "epoch": 0.57, - "learning_rate": 0.00021443966278359927, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.00025603982570422077, + "loss": 0.0211, "step": 113060 }, { - "epoch": 0.57, - "learning_rate": 0.00021443209509058528, - "loss": 0.0164, + "epoch": 0.29, + "learning_rate": 0.0002560359374878493, + "loss": 0.0195, "step": 113070 }, { - "epoch": 0.57, - "learning_rate": 0.00021442452739757126, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.00025603204927147785, + "loss": 0.0229, "step": 113080 }, { - "epoch": 0.57, - "learning_rate": 0.00021441695970455724, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025602816105510637, + "loss": 0.0226, "step": 113090 }, { - "epoch": 0.57, - "learning_rate": 0.00021440939201154325, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.00025602427283873494, + "loss": 0.0202, "step": 113100 }, { - "epoch": 0.57, - "learning_rate": 0.00021440182431852923, - "loss": 0.0133, + "epoch": 0.29, + "learning_rate": 0.00025602038462236345, + "loss": 0.0269, "step": 113110 }, { - "epoch": 0.57, - "learning_rate": 0.0002143942566255152, - "loss": 0.0129, + "epoch": 0.29, + "learning_rate": 0.00025601649640599196, + "loss": 0.025, "step": 113120 }, { - "epoch": 0.57, - "learning_rate": 0.0002143866889325012, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002560126081896205, + "loss": 0.0194, "step": 113130 }, { - "epoch": 0.57, - "learning_rate": 0.0002143791212394872, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.00025600871997324905, + "loss": 0.0276, "step": 113140 }, { - "epoch": 0.57, - "learning_rate": 0.00021437155354647318, - "loss": 0.015, + "epoch": 0.29, + "learning_rate": 0.0002560048317568776, + "loss": 0.0211, "step": 113150 }, { - "epoch": 0.57, - "learning_rate": 0.00021436398585345916, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.00025600094354050613, + "loss": 0.0219, "step": 113160 }, { - "epoch": 0.57, - "learning_rate": 0.00021435641816044517, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.00025599705532413465, + "loss": 0.0227, "step": 113170 }, { - "epoch": 0.57, - "learning_rate": 0.00021434885046743115, - "loss": 0.0121, + "epoch": 0.29, + "learning_rate": 0.00025599316710776316, + "loss": 0.0203, "step": 113180 }, { - "epoch": 0.57, - "learning_rate": 0.00021434128277441714, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.00025598927889139173, + "loss": 0.0216, "step": 113190 }, { - "epoch": 0.57, - "learning_rate": 0.00021433371508140314, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.00025598539067502024, + "loss": 0.0183, "step": 113200 }, { - "epoch": 0.57, - "learning_rate": 0.00021432614738838913, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002559815024586488, + "loss": 0.0243, "step": 113210 }, { - "epoch": 0.57, - "learning_rate": 0.0002143185796953751, - "loss": 0.0118, + "epoch": 0.29, + "learning_rate": 0.00025597761424227733, + "loss": 0.0169, "step": 113220 }, { - "epoch": 0.57, - "learning_rate": 0.00021431101200236112, - "loss": 0.0115, + "epoch": 0.29, + "learning_rate": 0.0002559737260259059, + "loss": 0.0185, "step": 113230 }, { - "epoch": 0.57, - "learning_rate": 0.0002143034443093471, - "loss": 0.0165, + "epoch": 0.29, + "learning_rate": 0.0002559698378095344, + "loss": 0.0218, "step": 113240 }, { - "epoch": 0.57, - "learning_rate": 0.00021429587661633308, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.0002559659495931629, + "loss": 0.0206, "step": 113250 }, { - "epoch": 0.57, - "learning_rate": 0.0002142883089233191, - "loss": 0.0122, + "epoch": 0.29, + "learning_rate": 0.00025596206137679144, + "loss": 0.0198, "step": 113260 }, { - "epoch": 0.57, - "learning_rate": 0.00021428074123030507, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.00025595817316042, + "loss": 0.0201, "step": 113270 }, { - "epoch": 0.57, - "learning_rate": 0.00021427317353729105, - "loss": 0.0123, + "epoch": 0.29, + "learning_rate": 0.0002559542849440485, + "loss": 0.0222, "step": 113280 }, { - "epoch": 0.57, - "learning_rate": 0.00021426560584427703, - "loss": 0.0125, + "epoch": 0.29, + "learning_rate": 0.0002559503967276771, + "loss": 0.02, "step": 113290 }, { - "epoch": 0.57, - "learning_rate": 0.00021425803815126304, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.0002559465085113056, + "loss": 0.0238, "step": 113300 }, { - "epoch": 0.57, - "learning_rate": 0.00021425047045824902, - "loss": 0.0155, + "epoch": 0.29, + "learning_rate": 0.0002559426202949342, + "loss": 0.0193, "step": 113310 }, { - "epoch": 0.57, - "learning_rate": 0.000214242902765235, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.0002559387320785627, + "loss": 0.0174, "step": 113320 }, { - "epoch": 0.57, - "learning_rate": 0.000214235335072221, - "loss": 0.0177, + "epoch": 0.29, + "learning_rate": 0.0002559348438621912, + "loss": 0.0216, "step": 113330 }, { - "epoch": 0.57, - "learning_rate": 0.000214227767379207, - "loss": 0.0179, + "epoch": 0.29, + "learning_rate": 0.00025593095564581977, + "loss": 0.0217, "step": 113340 }, { - "epoch": 0.57, - "learning_rate": 0.00021422019968619297, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.0002559270674294483, + "loss": 0.0231, "step": 113350 }, { - "epoch": 0.57, - "learning_rate": 0.00021421263199317898, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025592317921307686, + "loss": 0.0232, "step": 113360 }, { - "epoch": 0.57, - "learning_rate": 0.00021420506430016496, - "loss": 0.0126, + "epoch": 0.29, + "learning_rate": 0.00025591929099670537, + "loss": 0.0269, "step": 113370 }, { - "epoch": 0.57, - "learning_rate": 0.00021419749660715095, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.0002559154027803339, + "loss": 0.0205, "step": 113380 }, { - "epoch": 0.57, - "learning_rate": 0.00021418992891413695, - "loss": 0.0182, + "epoch": 0.29, + "learning_rate": 0.0002559115145639624, + "loss": 0.0204, "step": 113390 }, { - "epoch": 0.57, - "learning_rate": 0.00021418236122112294, - "loss": 0.0153, + "epoch": 0.29, + "learning_rate": 0.00025590762634759097, + "loss": 0.0214, "step": 113400 }, { - "epoch": 0.57, - "learning_rate": 0.00021417479352810892, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002559037381312195, + "loss": 0.0195, "step": 113410 }, { - "epoch": 0.57, - "learning_rate": 0.00021416722583509493, - "loss": 0.0167, + "epoch": 0.29, + "learning_rate": 0.00025589984991484805, + "loss": 0.0221, "step": 113420 }, { - "epoch": 0.57, - "learning_rate": 0.0002141596581420809, - "loss": 0.0156, + "epoch": 0.29, + "learning_rate": 0.00025589596169847657, + "loss": 0.0228, "step": 113430 }, { - "epoch": 0.57, - "learning_rate": 0.0002141520904490669, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.00025589207348210513, + "loss": 0.022, "step": 113440 }, { - "epoch": 0.57, - "learning_rate": 0.00021414452275605287, - "loss": 0.017, + "epoch": 0.29, + "learning_rate": 0.00025588818526573365, + "loss": 0.0197, "step": 113450 }, { - "epoch": 0.57, - "learning_rate": 0.00021413695506303888, - "loss": 0.0131, + "epoch": 0.29, + "learning_rate": 0.00025588429704936216, + "loss": 0.0226, "step": 113460 }, { - "epoch": 0.57, - "learning_rate": 0.00021412938737002486, - "loss": 0.0128, + "epoch": 0.29, + "learning_rate": 0.0002558804088329907, + "loss": 0.0212, "step": 113470 }, { - "epoch": 0.57, - "learning_rate": 0.00021412181967701084, - "loss": 0.0122, + "epoch": 0.29, + "learning_rate": 0.00025587652061661925, + "loss": 0.0322, "step": 113480 }, { - "epoch": 0.57, - "learning_rate": 0.00021411425198399685, - "loss": 0.0181, + "epoch": 0.29, + "learning_rate": 0.0002558726324002478, + "loss": 0.0199, "step": 113490 }, { - "epoch": 0.57, - "learning_rate": 0.00021410668429098283, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.00025586874418387633, + "loss": 0.0212, "step": 113500 }, { - "epoch": 0.57, - "learning_rate": 0.0002140991165979688, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.00025586485596750484, + "loss": 0.0203, "step": 113510 }, { - "epoch": 0.57, - "learning_rate": 0.00021409154890495482, - "loss": 0.0205, + "epoch": 0.29, + "learning_rate": 0.0002558609677511334, + "loss": 0.0266, "step": 113520 }, { - "epoch": 0.57, - "learning_rate": 0.0002140839812119408, - "loss": 0.0162, + "epoch": 0.29, + "learning_rate": 0.00025585707953476193, + "loss": 0.0209, "step": 113530 }, { - "epoch": 0.57, - "learning_rate": 0.00021407641351892678, - "loss": 0.0136, + "epoch": 0.29, + "learning_rate": 0.00025585319131839044, + "loss": 0.0232, "step": 113540 }, { - "epoch": 0.57, - "learning_rate": 0.0002140688458259128, - "loss": 0.0142, + "epoch": 0.29, + "learning_rate": 0.000255849303102019, + "loss": 0.0195, "step": 113550 }, { - "epoch": 0.57, - "learning_rate": 0.00021406127813289877, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.0002558454148856475, + "loss": 0.0258, "step": 113560 }, { - "epoch": 0.57, - "learning_rate": 0.00021405371043988476, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.0002558415266692761, + "loss": 0.0208, "step": 113570 }, { - "epoch": 0.57, - "learning_rate": 0.00021404614274687076, - "loss": 0.0134, + "epoch": 0.29, + "learning_rate": 0.0002558376384529046, + "loss": 0.0214, "step": 113580 }, { - "epoch": 0.57, - "learning_rate": 0.00021403857505385675, - "loss": 0.0112, + "epoch": 0.29, + "learning_rate": 0.0002558337502365331, + "loss": 0.0206, "step": 113590 }, { - "epoch": 0.57, - "learning_rate": 0.00021403100736084273, - "loss": 0.0147, + "epoch": 0.29, + "learning_rate": 0.0002558298620201617, + "loss": 0.0238, "step": 113600 }, { - "epoch": 0.57, - "learning_rate": 0.0002140234396678287, - "loss": 0.0163, + "epoch": 0.29, + "learning_rate": 0.0002558259738037902, + "loss": 0.0208, "step": 113610 }, { - "epoch": 0.57, - "learning_rate": 0.00021401587197481472, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.0002558220855874187, + "loss": 0.019, "step": 113620 }, { - "epoch": 0.57, - "learning_rate": 0.0002140083042818007, - "loss": 0.0175, + "epoch": 0.29, + "learning_rate": 0.0002558181973710473, + "loss": 0.0192, "step": 113630 }, { - "epoch": 0.57, - "learning_rate": 0.00021400073658878668, - "loss": 0.0173, + "epoch": 0.29, + "learning_rate": 0.0002558143091546758, + "loss": 0.0201, "step": 113640 }, { - "epoch": 0.57, - "learning_rate": 0.0002139931688957727, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.0002558104209383044, + "loss": 0.0194, "step": 113650 }, { - "epoch": 0.57, - "learning_rate": 0.00021398560120275867, - "loss": 0.013, + "epoch": 0.29, + "learning_rate": 0.0002558065327219329, + "loss": 0.0223, "step": 113660 }, { - "epoch": 0.57, - "learning_rate": 0.00021397803350974465, - "loss": 0.0123, + "epoch": 0.29, + "learning_rate": 0.0002558026445055614, + "loss": 0.0227, "step": 113670 }, { - "epoch": 0.57, - "learning_rate": 0.00021397046581673066, - "loss": 0.0183, + "epoch": 0.29, + "learning_rate": 0.0002557987562891899, + "loss": 0.0186, "step": 113680 }, { - "epoch": 0.57, - "learning_rate": 0.00021396289812371664, - "loss": 0.016, + "epoch": 0.29, + "learning_rate": 0.0002557948680728185, + "loss": 0.0192, "step": 113690 }, { - "epoch": 0.57, - "learning_rate": 0.00021395533043070262, - "loss": 0.0172, + "epoch": 0.29, + "learning_rate": 0.00025579097985644705, + "loss": 0.0265, "step": 113700 }, { - "epoch": 0.57, - "learning_rate": 0.00021394776273768863, - "loss": 0.0139, + "epoch": 0.29, + "learning_rate": 0.00025578709164007557, + "loss": 0.02, "step": 113710 }, { - "epoch": 0.57, - "learning_rate": 0.0002139401950446746, - "loss": 0.0141, + "epoch": 0.29, + "learning_rate": 0.0002557832034237041, + "loss": 0.0197, "step": 113720 }, { - "epoch": 0.57, - "learning_rate": 0.0002139326273516606, - "loss": 0.0152, + "epoch": 0.29, + "learning_rate": 0.00025577931520733265, + "loss": 0.0253, "step": 113730 }, { - "epoch": 0.57, - "learning_rate": 0.0002139250596586466, - "loss": 0.0127, + "epoch": 0.29, + "learning_rate": 0.00025577542699096117, + "loss": 0.02, "step": 113740 }, { - "epoch": 0.57, - "learning_rate": 0.00021391749196563256, - "loss": 0.0144, + "epoch": 0.29, + "learning_rate": 0.0002557715387745897, + "loss": 0.0237, "step": 113750 }, { - "epoch": 0.57, - "learning_rate": 0.00021390992427261854, - "loss": 0.0143, + "epoch": 0.29, + "learning_rate": 0.00025576765055821825, + "loss": 0.0243, "step": 113760 }, { - "epoch": 0.57, - "learning_rate": 0.00021390235657960452, - "loss": 0.0119, + "epoch": 0.29, + "learning_rate": 0.00025576376234184676, + "loss": 0.022, "step": 113770 }, { - "epoch": 0.57, - "learning_rate": 0.00021389478888659053, - "loss": 0.0137, + "epoch": 0.29, + "learning_rate": 0.00025575987412547533, + "loss": 0.0217, "step": 113780 }, { - "epoch": 0.57, - "learning_rate": 0.0002138872211935765, - "loss": 0.0168, + "epoch": 0.29, + "learning_rate": 0.00025575598590910385, + "loss": 0.0213, "step": 113790 }, { - "epoch": 0.57, - "learning_rate": 0.0002138796535005625, - "loss": 0.014, + "epoch": 0.29, + "learning_rate": 0.00025575209769273236, + "loss": 0.0167, "step": 113800 }, { - "epoch": 0.57, - "learning_rate": 0.0002138720858075485, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025574820947636093, + "loss": 0.0228, "step": 113810 }, { - "epoch": 0.57, - "learning_rate": 0.00021386451811453448, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025574432125998945, + "loss": 0.0182, "step": 113820 }, { - "epoch": 0.57, - "learning_rate": 0.00021385695042152046, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025574043304361796, + "loss": 0.0174, "step": 113830 }, { - "epoch": 0.57, - "learning_rate": 0.00021384938272850644, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.00025573654482724653, + "loss": 0.0182, "step": 113840 }, { - "epoch": 0.57, - "learning_rate": 0.00021384181503549245, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002557326566108751, + "loss": 0.0195, "step": 113850 }, { - "epoch": 0.57, - "learning_rate": 0.00021383424734247843, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.0002557287683945036, + "loss": 0.0219, "step": 113860 }, { - "epoch": 0.57, - "learning_rate": 0.00021382667964946442, - "loss": 0.0167, + "epoch": 0.3, + "learning_rate": 0.0002557248801781321, + "loss": 0.017, "step": 113870 }, { - "epoch": 0.57, - "learning_rate": 0.00021381911195645042, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.00025572099196176064, + "loss": 0.0233, "step": 113880 }, { - "epoch": 0.57, - "learning_rate": 0.0002138115442634364, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002557171037453892, + "loss": 0.0201, "step": 113890 }, { - "epoch": 0.57, - "learning_rate": 0.0002138039765704224, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002557132155290177, + "loss": 0.0208, "step": 113900 }, { - "epoch": 0.57, - "learning_rate": 0.0002137964088774084, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.0002557093273126463, + "loss": 0.0187, "step": 113910 }, { - "epoch": 0.57, - "learning_rate": 0.00021378884118439438, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002557054390962748, + "loss": 0.0216, "step": 113920 }, { - "epoch": 0.57, - "learning_rate": 0.00021378127349138036, - "loss": 0.0117, + "epoch": 0.3, + "learning_rate": 0.0002557015508799033, + "loss": 0.0215, "step": 113930 }, { - "epoch": 0.57, - "learning_rate": 0.00021377370579836637, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.0002556976626635319, + "loss": 0.0257, "step": 113940 }, { - "epoch": 0.57, - "learning_rate": 0.00021376613810535235, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.0002556937744471604, + "loss": 0.0241, "step": 113950 }, { - "epoch": 0.57, - "learning_rate": 0.00021375857041233833, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.0002556898862307889, + "loss": 0.0205, "step": 113960 }, { - "epoch": 0.57, - "learning_rate": 0.00021375100271932434, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.0002556859980144175, + "loss": 0.0199, "step": 113970 }, { - "epoch": 0.58, - "learning_rate": 0.00021374343502631032, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.00025568210979804606, + "loss": 0.0186, "step": 113980 }, { - "epoch": 0.58, - "learning_rate": 0.0002137358673332963, - "loss": 0.0198, + "epoch": 0.3, + "learning_rate": 0.00025567822158167457, + "loss": 0.0213, "step": 113990 }, { - "epoch": 0.58, - "learning_rate": 0.00021372829964028228, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.0002556743333653031, + "loss": 0.025, "step": 114000 }, { - "epoch": 0.58, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.010899759829044342, - "eval_runtime": 116.7433, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.3, + "eval_cer": 0.881782465628416, + "eval_loss": 0.015355234034359455, + "eval_runtime": 107.8728, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, "step": 114000 }, { - "epoch": 0.58, - "learning_rate": 0.0002137207319472683, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.0002556704451489316, + "loss": 0.0244, "step": 114010 }, { - "epoch": 0.58, - "learning_rate": 0.00021371316425425427, - "loss": 0.0174, + "epoch": 0.3, + "learning_rate": 0.00025566655693256017, + "loss": 0.0278, "step": 114020 }, { - "epoch": 0.58, - "learning_rate": 0.00021370559656124025, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.0002556626687161887, + "loss": 0.0215, "step": 114030 }, { - "epoch": 0.58, - "learning_rate": 0.00021369802886822626, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025565878049981725, + "loss": 0.0179, "step": 114040 }, { - "epoch": 0.58, - "learning_rate": 0.00021369046117521224, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.00025565489228344577, + "loss": 0.0199, "step": 114050 }, { - "epoch": 0.58, - "learning_rate": 0.00021368289348219823, - "loss": 0.0182, + "epoch": 0.3, + "learning_rate": 0.00025565100406707434, + "loss": 0.025, "step": 114060 }, { - "epoch": 0.58, - "learning_rate": 0.00021367532578918423, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025564711585070285, + "loss": 0.0258, "step": 114070 }, { - "epoch": 0.58, - "learning_rate": 0.00021366775809617022, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.00025564322763433137, + "loss": 0.0193, "step": 114080 }, { - "epoch": 0.58, - "learning_rate": 0.0002136601904031562, - "loss": 0.0182, + "epoch": 0.3, + "learning_rate": 0.0002556393394179599, + "loss": 0.0183, "step": 114090 }, { - "epoch": 0.58, - "learning_rate": 0.0002136526227101422, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025563545120158845, + "loss": 0.0202, "step": 114100 }, { - "epoch": 0.58, - "learning_rate": 0.0002136450550171282, - "loss": 0.019, + "epoch": 0.3, + "learning_rate": 0.00025563156298521696, + "loss": 0.0207, "step": 114110 }, { - "epoch": 0.58, - "learning_rate": 0.00021363748732411417, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025562767476884553, + "loss": 0.0218, "step": 114120 }, { - "epoch": 0.58, - "learning_rate": 0.00021362991963110018, - "loss": 0.0116, + "epoch": 0.3, + "learning_rate": 0.00025562378655247405, + "loss": 0.0231, "step": 114130 }, { - "epoch": 0.58, - "learning_rate": 0.00021362235193808616, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025561989833610256, + "loss": 0.0192, "step": 114140 }, { - "epoch": 0.58, - "learning_rate": 0.00021361478424507214, - "loss": 0.0135, + "epoch": 0.3, + "learning_rate": 0.00025561601011973113, + "loss": 0.0231, "step": 114150 }, { - "epoch": 0.58, - "learning_rate": 0.00021360721655205815, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025561212190335964, + "loss": 0.0217, "step": 114160 }, { - "epoch": 0.58, - "learning_rate": 0.00021359964885904413, - "loss": 0.015, - "step": 114170 + "epoch": 0.3, + "learning_rate": 0.00025560823368698816, + "loss": 0.0277, + "step": 114170 }, { - "epoch": 0.58, - "learning_rate": 0.0002135920811660301, - "loss": 0.0125, + "epoch": 0.3, + "learning_rate": 0.00025560434547061673, + "loss": 0.0228, "step": 114180 }, { - "epoch": 0.58, - "learning_rate": 0.0002135845134730161, - "loss": 0.0199, + "epoch": 0.3, + "learning_rate": 0.0002556004572542453, + "loss": 0.0203, "step": 114190 }, { - "epoch": 0.58, - "learning_rate": 0.0002135769457800021, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002555965690378738, + "loss": 0.0259, "step": 114200 }, { - "epoch": 0.58, - "learning_rate": 0.00021356937808698808, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002555926808215023, + "loss": 0.0199, "step": 114210 }, { - "epoch": 0.58, - "learning_rate": 0.00021356181039397406, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.00025558879260513084, + "loss": 0.0235, "step": 114220 }, { - "epoch": 0.58, - "learning_rate": 0.00021355424270096007, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002555849043887594, + "loss": 0.0211, "step": 114230 }, { - "epoch": 0.58, - "learning_rate": 0.00021354667500794605, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.0002555810161723879, + "loss": 0.0206, "step": 114240 }, { - "epoch": 0.58, - "learning_rate": 0.00021353910731493204, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.0002555771279560165, + "loss": 0.0187, "step": 114250 }, { - "epoch": 0.58, - "learning_rate": 0.00021353153962191804, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.000255573239739645, + "loss": 0.0203, "step": 114260 }, { - "epoch": 0.58, - "learning_rate": 0.00021352397192890403, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002555693515232736, + "loss": 0.0241, "step": 114270 }, { - "epoch": 0.58, - "learning_rate": 0.00021351640423589, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002555654633069021, + "loss": 0.0217, "step": 114280 }, { - "epoch": 0.58, - "learning_rate": 0.00021350883654287602, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002555615750905306, + "loss": 0.026, "step": 114290 }, { - "epoch": 0.58, - "learning_rate": 0.000213501268849862, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.0002555576868741591, + "loss": 0.0187, "step": 114300 }, { - "epoch": 0.58, - "learning_rate": 0.00021349370115684798, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002555537986577877, + "loss": 0.0185, "step": 114310 }, { - "epoch": 0.58, - "learning_rate": 0.000213486133463834, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002555499104414162, + "loss": 0.0251, "step": 114320 }, { - "epoch": 0.58, - "learning_rate": 0.00021347856577081997, - "loss": 0.0191, + "epoch": 0.3, + "learning_rate": 0.00025554602222504477, + "loss": 0.0204, "step": 114330 }, { - "epoch": 0.58, - "learning_rate": 0.00021347099807780595, - "loss": 0.0184, + "epoch": 0.3, + "learning_rate": 0.0002555421340086733, + "loss": 0.0209, "step": 114340 }, { - "epoch": 0.58, - "learning_rate": 0.00021346343038479193, - "loss": 0.018, + "epoch": 0.3, + "learning_rate": 0.00025553824579230185, + "loss": 0.0231, "step": 114350 }, { - "epoch": 0.58, - "learning_rate": 0.00021345586269177794, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025553435757593037, + "loss": 0.0213, "step": 114360 }, { - "epoch": 0.58, - "learning_rate": 0.00021344829499876392, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002555304693595589, + "loss": 0.0175, "step": 114370 }, { - "epoch": 0.58, - "learning_rate": 0.0002134407273057499, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025552658114318745, + "loss": 0.0267, "step": 114380 }, { - "epoch": 0.58, - "learning_rate": 0.0002134331596127359, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.00025552269292681597, + "loss": 0.0205, "step": 114390 }, { - "epoch": 0.58, - "learning_rate": 0.0002134255919197219, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025551880471044454, + "loss": 0.0195, "step": 114400 }, { - "epoch": 0.58, - "learning_rate": 0.00021341802422670787, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025551491649407305, + "loss": 0.02, "step": 114410 }, { - "epoch": 0.58, - "learning_rate": 0.00021341045653369388, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.00025551102827770156, + "loss": 0.0203, "step": 114420 }, { - "epoch": 0.58, - "learning_rate": 0.00021340288884067986, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002555071400613301, + "loss": 0.0238, "step": 114430 }, { - "epoch": 0.58, - "learning_rate": 0.00021339532114766585, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.00025550325184495865, + "loss": 0.0234, "step": 114440 }, { - "epoch": 0.58, - "learning_rate": 0.00021338775345465185, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.00025549936362858716, + "loss": 0.0232, "step": 114450 }, { - "epoch": 0.58, - "learning_rate": 0.00021338018576163784, - "loss": 0.0167, + "epoch": 0.3, + "learning_rate": 0.00025549547541221573, + "loss": 0.0203, "step": 114460 }, { - "epoch": 0.58, - "learning_rate": 0.00021337261806862382, - "loss": 0.0128, + "epoch": 0.3, + "learning_rate": 0.00025549158719584425, + "loss": 0.0215, "step": 114470 }, { - "epoch": 0.58, - "learning_rate": 0.00021336505037560983, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.0002554876989794728, + "loss": 0.0237, "step": 114480 }, { - "epoch": 0.58, - "learning_rate": 0.0002133574826825958, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025548381076310133, + "loss": 0.0181, "step": 114490 }, { - "epoch": 0.58, - "learning_rate": 0.0002133499149895818, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025547992254672984, + "loss": 0.0194, "step": 114500 }, { - "epoch": 0.58, - "learning_rate": 0.00021334234729656777, - "loss": 0.0123, + "epoch": 0.3, + "learning_rate": 0.00025547603433035836, + "loss": 0.0186, "step": 114510 }, { - "epoch": 0.58, - "learning_rate": 0.00021333477960355378, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.0002554721461139869, + "loss": 0.021, "step": 114520 }, { - "epoch": 0.58, - "learning_rate": 0.00021332721191053976, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.0002554682578976155, + "loss": 0.0206, "step": 114530 }, { - "epoch": 0.58, - "learning_rate": 0.00021331964421752574, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.000255464369681244, + "loss": 0.0186, "step": 114540 }, { - "epoch": 0.58, - "learning_rate": 0.00021331207652451175, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002554604814648725, + "loss": 0.0196, "step": 114550 }, { - "epoch": 0.58, - "learning_rate": 0.00021330450883149773, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002554565932485011, + "loss": 0.0195, "step": 114560 }, { - "epoch": 0.58, - "learning_rate": 0.0002132969411384837, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.0002554527050321296, + "loss": 0.0193, "step": 114570 }, { - "epoch": 0.58, - "learning_rate": 0.00021328937344546972, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.0002554488168157581, + "loss": 0.0156, "step": 114580 }, { - "epoch": 0.58, - "learning_rate": 0.0002132818057524557, - "loss": 0.0122, + "epoch": 0.3, + "learning_rate": 0.0002554449285993867, + "loss": 0.0186, "step": 114590 }, { - "epoch": 0.58, - "learning_rate": 0.00021327423805944168, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.0002554410403830152, + "loss": 0.0207, "step": 114600 }, { - "epoch": 0.58, - "learning_rate": 0.0002132666703664277, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.0002554371521666438, + "loss": 0.0213, "step": 114610 }, { - "epoch": 0.58, - "learning_rate": 0.00021325910267341367, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.0002554332639502723, + "loss": 0.022, "step": 114620 }, { - "epoch": 0.58, - "learning_rate": 0.00021325153498039966, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.0002554293757339008, + "loss": 0.0173, "step": 114630 }, { - "epoch": 0.58, - "learning_rate": 0.00021324396728738566, - "loss": 0.0113, + "epoch": 0.3, + "learning_rate": 0.0002554254875175293, + "loss": 0.021, "step": 114640 }, { - "epoch": 0.58, - "learning_rate": 0.00021323639959437165, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.0002554215993011579, + "loss": 0.0197, "step": 114650 }, { - "epoch": 0.58, - "learning_rate": 0.00021322883190135763, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.0002554177110847864, + "loss": 0.0207, "step": 114660 }, { - "epoch": 0.58, - "learning_rate": 0.00021322126420834364, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025541382286841497, + "loss": 0.0202, "step": 114670 }, { - "epoch": 0.58, - "learning_rate": 0.00021321369651532962, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002554099346520435, + "loss": 0.0195, "step": 114680 }, { - "epoch": 0.58, - "learning_rate": 0.0002132061288223156, - "loss": 0.0195, + "epoch": 0.3, + "learning_rate": 0.00025540604643567205, + "loss": 0.0218, "step": 114690 }, { - "epoch": 0.58, - "learning_rate": 0.00021319856112930158, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025540215821930057, + "loss": 0.04, "step": 114700 }, { - "epoch": 0.58, - "learning_rate": 0.0002131909934362876, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002553982700029291, + "loss": 0.0181, "step": 114710 }, { - "epoch": 0.58, - "learning_rate": 0.00021318342574327357, - "loss": 0.0176, + "epoch": 0.3, + "learning_rate": 0.0002553943817865576, + "loss": 0.0224, "step": 114720 }, { - "epoch": 0.58, - "learning_rate": 0.00021317585805025955, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025539049357018617, + "loss": 0.0232, "step": 114730 }, { - "epoch": 0.58, - "learning_rate": 0.00021316829035724556, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025538660535381473, + "loss": 0.0207, "step": 114740 }, { - "epoch": 0.58, - "learning_rate": 0.00021316072266423154, - "loss": 0.0113, + "epoch": 0.3, + "learning_rate": 0.00025538271713744325, + "loss": 0.0202, "step": 114750 }, { - "epoch": 0.58, - "learning_rate": 0.00021315315497121752, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025537882892107176, + "loss": 0.0271, "step": 114760 }, { - "epoch": 0.58, - "learning_rate": 0.00021314558727820353, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.00025537494070470033, + "loss": 0.0231, "step": 114770 }, { - "epoch": 0.58, - "learning_rate": 0.0002131380195851895, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.00025537105248832885, + "loss": 0.0199, "step": 114780 }, { - "epoch": 0.58, - "learning_rate": 0.0002131304518921755, - "loss": 0.0176, + "epoch": 0.3, + "learning_rate": 0.00025536716427195736, + "loss": 0.0193, "step": 114790 }, { - "epoch": 0.58, - "learning_rate": 0.0002131228841991615, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025536327605558593, + "loss": 0.0194, "step": 114800 }, { - "epoch": 0.58, - "learning_rate": 0.00021311531650614748, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025535938783921444, + "loss": 0.0207, "step": 114810 }, { - "epoch": 0.58, - "learning_rate": 0.00021310774881313347, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.000255355499622843, + "loss": 0.0233, "step": 114820 }, { - "epoch": 0.58, - "learning_rate": 0.00021310018112011947, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.00025535161140647153, + "loss": 0.0252, "step": 114830 }, { - "epoch": 0.58, - "learning_rate": 0.00021309261342710546, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.00025534772319010004, + "loss": 0.0262, "step": 114840 }, { - "epoch": 0.58, - "learning_rate": 0.00021308504573409144, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002553438349737286, + "loss": 0.0193, "step": 114850 }, { - "epoch": 0.58, - "learning_rate": 0.00021307747804107742, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002553399467573571, + "loss": 0.0226, "step": 114860 }, { - "epoch": 0.58, - "learning_rate": 0.00021306991034806343, - "loss": 0.0135, + "epoch": 0.3, + "learning_rate": 0.00025533605854098564, + "loss": 0.0194, "step": 114870 }, { - "epoch": 0.58, - "learning_rate": 0.0002130623426550494, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002553321703246142, + "loss": 0.0183, "step": 114880 }, { - "epoch": 0.58, - "learning_rate": 0.0002130547749620354, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002553282821082427, + "loss": 0.0174, "step": 114890 }, { - "epoch": 0.58, - "learning_rate": 0.0002130472072690214, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002553243938918713, + "loss": 0.0189, "step": 114900 }, { - "epoch": 0.58, - "learning_rate": 0.00021303963957600738, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.0002553205056754998, + "loss": 0.0272, "step": 114910 }, { - "epoch": 0.58, - "learning_rate": 0.00021303207188299336, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.0002553166174591283, + "loss": 0.02, "step": 114920 }, { - "epoch": 0.58, - "learning_rate": 0.00021302450418997937, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.0002553127292427569, + "loss": 0.0211, "step": 114930 }, { - "epoch": 0.58, - "learning_rate": 0.00021301693649696535, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.0002553088410263854, + "loss": 0.0223, "step": 114940 }, { - "epoch": 0.58, - "learning_rate": 0.00021300936880395133, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.000255304952810014, + "loss": 0.0208, "step": 114950 }, { - "epoch": 0.58, - "learning_rate": 0.00021300180111093734, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.0002553010645936425, + "loss": 0.0195, "step": 114960 }, { - "epoch": 0.58, - "learning_rate": 0.00021299423341792332, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.000255297176377271, + "loss": 0.0182, "step": 114970 }, { - "epoch": 0.58, - "learning_rate": 0.0002129866657249093, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.00025529328816089957, + "loss": 0.026, "step": 114980 }, { - "epoch": 0.58, - "learning_rate": 0.0002129790980318953, - "loss": 0.0122, + "epoch": 0.3, + "learning_rate": 0.0002552893999445281, + "loss": 0.0227, "step": 114990 }, { - "epoch": 0.58, - "learning_rate": 0.0002129715303388813, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002552855117281566, + "loss": 0.0228, "step": 115000 }, { - "epoch": 0.58, - "eval_cer": 0.914481900656667, - "eval_loss": 0.010673732496798038, - "eval_runtime": 116.7514, - "eval_samples_per_second": 17.13, - "eval_steps_per_second": 4.283, + "epoch": 0.3, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.015144613571465015, + "eval_runtime": 107.6259, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 115000 }, { - "epoch": 0.58, - "learning_rate": 0.00021296396264586725, - "loss": 0.0189, + "epoch": 0.3, + "learning_rate": 0.00025528162351178517, + "loss": 0.022, "step": 115010 }, { - "epoch": 0.58, - "learning_rate": 0.00021295639495285323, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.0002552777352954137, + "loss": 0.0163, "step": 115020 }, { - "epoch": 0.58, - "learning_rate": 0.00021294882725983924, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.00025527384707904225, + "loss": 0.0192, "step": 115030 }, { - "epoch": 0.58, - "learning_rate": 0.00021294125956682522, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025526995886267077, + "loss": 0.0187, "step": 115040 }, { - "epoch": 0.58, - "learning_rate": 0.0002129336918738112, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.0002552660706462993, + "loss": 0.0206, "step": 115050 }, { - "epoch": 0.58, - "learning_rate": 0.0002129261241807972, - "loss": 0.0175, + "epoch": 0.3, + "learning_rate": 0.00025526218242992785, + "loss": 0.021, "step": 115060 }, { - "epoch": 0.58, - "learning_rate": 0.0002129185564877832, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.00025525829421355636, + "loss": 0.0214, "step": 115070 }, { - "epoch": 0.58, - "learning_rate": 0.00021291098879476917, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025525440599718493, + "loss": 0.0222, "step": 115080 }, { - "epoch": 0.58, - "learning_rate": 0.00021290342110175515, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.00025525051778081345, + "loss": 0.0186, "step": 115090 }, { - "epoch": 0.58, - "learning_rate": 0.00021289585340874116, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.000255246629564442, + "loss": 0.0262, "step": 115100 }, { - "epoch": 0.58, - "learning_rate": 0.00021288828571572714, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.00025524274134807053, + "loss": 0.0235, "step": 115110 }, { - "epoch": 0.58, - "learning_rate": 0.00021288071802271313, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025523885313169905, + "loss": 0.0195, "step": 115120 }, { - "epoch": 0.58, - "learning_rate": 0.00021287315032969913, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025523496491532756, + "loss": 0.0191, "step": 115130 }, { - "epoch": 0.58, - "learning_rate": 0.00021286558263668512, - "loss": 0.0165, + "epoch": 0.3, + "learning_rate": 0.00025523107669895613, + "loss": 0.0203, "step": 115140 }, { - "epoch": 0.58, - "learning_rate": 0.0002128580149436711, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.00025522718848258464, + "loss": 0.018, "step": 115150 }, { - "epoch": 0.58, - "learning_rate": 0.0002128504472506571, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.0002552233002662132, + "loss": 0.0212, "step": 115160 }, { - "epoch": 0.58, - "learning_rate": 0.0002128428795576431, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002552194120498417, + "loss": 0.0229, "step": 115170 }, { - "epoch": 0.58, - "learning_rate": 0.00021283531186462907, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025521552383347024, + "loss": 0.019, "step": 115180 }, { - "epoch": 0.58, - "learning_rate": 0.00021282774417161508, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.0002552116356170988, + "loss": 0.018, "step": 115190 }, { - "epoch": 0.58, - "learning_rate": 0.00021282017647860106, - "loss": 0.0125, + "epoch": 0.3, + "learning_rate": 0.0002552077474007273, + "loss": 0.0253, "step": 115200 }, { - "epoch": 0.58, - "learning_rate": 0.00021281260878558704, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025520385918435584, + "loss": 0.0282, "step": 115210 }, { - "epoch": 0.58, - "learning_rate": 0.00021280504109257305, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002551999709679844, + "loss": 0.019, "step": 115220 }, { - "epoch": 0.58, - "learning_rate": 0.00021279747339955903, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.000255196082751613, + "loss": 0.0257, "step": 115230 }, { - "epoch": 0.58, - "learning_rate": 0.000212789905706545, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.0002551921945352415, + "loss": 0.0339, "step": 115240 }, { - "epoch": 0.58, - "learning_rate": 0.000212782338013531, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.00025518830631887, + "loss": 0.0211, "step": 115250 }, { - "epoch": 0.58, - "learning_rate": 0.000212774770320517, - "loss": 0.0167, + "epoch": 0.3, + "learning_rate": 0.0002551844181024985, + "loss": 0.0225, "step": 115260 }, { - "epoch": 0.58, - "learning_rate": 0.00021276720262750298, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002551805298861271, + "loss": 0.0246, "step": 115270 }, { - "epoch": 0.58, - "learning_rate": 0.00021275963493448896, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002551766416697556, + "loss": 0.0216, "step": 115280 }, { - "epoch": 0.58, - "learning_rate": 0.00021275206724147497, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.00025517275345338417, + "loss": 0.0232, "step": 115290 }, { - "epoch": 0.58, - "learning_rate": 0.00021274449954846095, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.0002551688652370127, + "loss": 0.0202, "step": 115300 }, { - "epoch": 0.58, - "learning_rate": 0.00021273693185544694, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.00025516497702064126, + "loss": 0.0195, "step": 115310 }, { - "epoch": 0.58, - "learning_rate": 0.00021272936416243294, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.00025516108880426977, + "loss": 0.0257, "step": 115320 }, { - "epoch": 0.58, - "learning_rate": 0.00021272179646941893, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.0002551572005878983, + "loss": 0.0199, "step": 115330 }, { - "epoch": 0.58, - "learning_rate": 0.0002127142287764049, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002551533123715268, + "loss": 0.0216, "step": 115340 }, { - "epoch": 0.58, - "learning_rate": 0.00021270666108339092, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025514942415515537, + "loss": 0.0211, "step": 115350 }, { - "epoch": 0.58, - "learning_rate": 0.0002126990933903769, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.0002551455359387839, + "loss": 0.0184, "step": 115360 }, { - "epoch": 0.58, - "learning_rate": 0.00021269152569736288, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025514164772241245, + "loss": 0.0212, "step": 115370 }, { - "epoch": 0.58, - "learning_rate": 0.0002126839580043489, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025513775950604097, + "loss": 0.0153, "step": 115380 }, { - "epoch": 0.58, - "learning_rate": 0.00021267639031133487, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002551338712896695, + "loss": 0.0221, "step": 115390 }, { - "epoch": 0.58, - "learning_rate": 0.00021266882261832085, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025512998307329805, + "loss": 0.0267, "step": 115400 }, { - "epoch": 0.58, - "learning_rate": 0.00021266125492530683, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.00025512609485692656, + "loss": 0.0244, "step": 115410 }, { - "epoch": 0.58, - "learning_rate": 0.00021265368723229284, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002551222066405551, + "loss": 0.0245, "step": 115420 }, { - "epoch": 0.58, - "learning_rate": 0.00021264611953927882, - "loss": 0.0134, + "epoch": 0.3, + "learning_rate": 0.00025511831842418365, + "loss": 0.0227, "step": 115430 }, { - "epoch": 0.58, - "learning_rate": 0.0002126385518462648, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.0002551144302078122, + "loss": 0.0183, "step": 115440 }, { - "epoch": 0.58, - "learning_rate": 0.0002126309841532508, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.00025511054199144073, + "loss": 0.0203, "step": 115450 }, { - "epoch": 0.58, - "learning_rate": 0.0002126234164602368, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025510665377506924, + "loss": 0.0214, "step": 115460 }, { - "epoch": 0.58, - "learning_rate": 0.00021261584876722277, + "epoch": 0.3, + "learning_rate": 0.00025510276555869776, "loss": 0.0212, "step": 115470 }, { - "epoch": 0.58, - "learning_rate": 0.00021260828107420878, - "loss": 0.0134, + "epoch": 0.3, + "learning_rate": 0.00025509887734232633, + "loss": 0.0207, "step": 115480 }, { - "epoch": 0.58, - "learning_rate": 0.00021260071338119476, - "loss": 0.0186, + "epoch": 0.3, + "learning_rate": 0.00025509498912595484, + "loss": 0.0247, "step": 115490 }, { - "epoch": 0.58, - "learning_rate": 0.00021259314568818075, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002550911009095834, + "loss": 0.0275, "step": 115500 }, { - "epoch": 0.58, - "learning_rate": 0.00021258557799516675, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.0002550872126932119, + "loss": 0.0182, "step": 115510 }, { - "epoch": 0.58, - "learning_rate": 0.00021257801030215274, - "loss": 0.0182, + "epoch": 0.3, + "learning_rate": 0.0002550833244768405, + "loss": 0.0294, "step": 115520 }, { - "epoch": 0.58, - "learning_rate": 0.00021257044260913872, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.000255079436260469, + "loss": 0.0199, "step": 115530 }, { - "epoch": 0.58, - "learning_rate": 0.00021256287491612473, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002550755480440975, + "loss": 0.0167, "step": 115540 }, { - "epoch": 0.58, - "learning_rate": 0.0002125553072231107, - "loss": 0.0121, + "epoch": 0.3, + "learning_rate": 0.00025507165982772604, + "loss": 0.022, "step": 115550 }, { - "epoch": 0.58, - "learning_rate": 0.0002125477395300967, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.0002550677716113546, + "loss": 0.024, "step": 115560 }, { - "epoch": 0.58, - "learning_rate": 0.0002125401718370827, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.0002550638833949832, + "loss": 0.0184, "step": 115570 }, { - "epoch": 0.58, - "learning_rate": 0.00021253260414406868, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.0002550599951786117, + "loss": 0.0216, "step": 115580 }, { - "epoch": 0.58, - "learning_rate": 0.00021252503645105466, - "loss": 0.0125, + "epoch": 0.3, + "learning_rate": 0.0002550561069622402, + "loss": 0.0188, "step": 115590 }, { - "epoch": 0.58, - "learning_rate": 0.00021251746875804064, - "loss": 0.0122, + "epoch": 0.3, + "learning_rate": 0.0002550522187458688, + "loss": 0.0237, "step": 115600 }, { - "epoch": 0.58, - "learning_rate": 0.00021250990106502665, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.0002550483305294973, + "loss": 0.025, "step": 115610 }, { - "epoch": 0.58, - "learning_rate": 0.00021250233337201263, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.0002550444423131258, + "loss": 0.0268, "step": 115620 }, { - "epoch": 0.58, - "learning_rate": 0.00021249476567899861, - "loss": 0.0134, + "epoch": 0.3, + "learning_rate": 0.00025504055409675437, + "loss": 0.0286, "step": 115630 }, { - "epoch": 0.58, - "learning_rate": 0.00021248719798598462, - "loss": 0.0141, + "epoch": 0.3, + "learning_rate": 0.0002550366658803829, + "loss": 0.0239, "step": 115640 }, { - "epoch": 0.58, - "learning_rate": 0.0002124796302929706, - "loss": 0.0159, + "epoch": 0.3, + "learning_rate": 0.00025503277766401145, + "loss": 0.0213, "step": 115650 }, { - "epoch": 0.58, - "learning_rate": 0.00021247206259995659, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025502888944763997, + "loss": 0.0227, "step": 115660 }, { - "epoch": 0.58, - "learning_rate": 0.0002124644949069426, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002550250012312685, + "loss": 0.0234, "step": 115670 }, { - "epoch": 0.58, - "learning_rate": 0.00021245692721392858, - "loss": 0.0172, + "epoch": 0.3, + "learning_rate": 0.000255021113014897, + "loss": 0.0248, "step": 115680 }, { - "epoch": 0.58, - "learning_rate": 0.00021244935952091456, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.00025501722479852557, + "loss": 0.0198, "step": 115690 }, { - "epoch": 0.58, - "learning_rate": 0.00021244179182790056, - "loss": 0.0121, + "epoch": 0.3, + "learning_rate": 0.0002550133365821541, + "loss": 0.0175, "step": 115700 }, { - "epoch": 0.58, - "learning_rate": 0.00021243422413488655, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025500944836578265, + "loss": 0.0212, "step": 115710 }, { - "epoch": 0.58, - "learning_rate": 0.00021242665644187253, - "loss": 0.0119, + "epoch": 0.3, + "learning_rate": 0.00025500556014941116, + "loss": 0.0252, "step": 115720 }, { - "epoch": 0.58, - "learning_rate": 0.00021241908874885854, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025500167193303973, + "loss": 0.0208, "step": 115730 }, { - "epoch": 0.58, - "learning_rate": 0.00021241152105584452, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.00025499778371666825, + "loss": 0.0196, "step": 115740 }, { - "epoch": 0.58, - "learning_rate": 0.0002124039533628305, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025499389550029676, + "loss": 0.0213, "step": 115750 }, { - "epoch": 0.58, - "learning_rate": 0.00021239638566981648, - "loss": 0.012, + "epoch": 0.3, + "learning_rate": 0.0002549900072839253, + "loss": 0.0201, "step": 115760 }, { - "epoch": 0.58, - "learning_rate": 0.0002123888179768025, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025498611906755385, + "loss": 0.0186, "step": 115770 }, { - "epoch": 0.58, - "learning_rate": 0.00021238125028378847, - "loss": 0.0127, + "epoch": 0.3, + "learning_rate": 0.0002549822308511824, + "loss": 0.023, "step": 115780 }, { - "epoch": 0.58, - "learning_rate": 0.00021237368259077445, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025497834263481093, + "loss": 0.021, "step": 115790 }, { - "epoch": 0.58, - "learning_rate": 0.00021236611489776046, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025497445441843944, + "loss": 0.0283, "step": 115800 }, { - "epoch": 0.58, - "learning_rate": 0.00021235854720474644, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.000254970566202068, + "loss": 0.0212, "step": 115810 }, { - "epoch": 0.58, - "learning_rate": 0.00021235097951173242, - "loss": 0.0127, + "epoch": 0.3, + "learning_rate": 0.0002549666779856965, + "loss": 0.0266, "step": 115820 }, { - "epoch": 0.58, - "learning_rate": 0.00021234341181871843, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.00025496278976932504, + "loss": 0.0206, "step": 115830 }, { - "epoch": 0.58, - "learning_rate": 0.00021233584412570441, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002549589015529536, + "loss": 0.0193, "step": 115840 }, { - "epoch": 0.58, - "learning_rate": 0.0002123282764326904, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002549550133365821, + "loss": 0.0229, "step": 115850 }, { - "epoch": 0.58, - "learning_rate": 0.0002123207087396764, - "loss": 0.0158, + "epoch": 0.3, + "learning_rate": 0.0002549511251202107, + "loss": 0.0203, "step": 115860 }, { - "epoch": 0.58, - "learning_rate": 0.00021231314104666239, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002549472369038392, + "loss": 0.0216, "step": 115870 }, { - "epoch": 0.58, - "learning_rate": 0.00021230557335364837, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002549433486874677, + "loss": 0.0194, "step": 115880 }, { - "epoch": 0.58, - "learning_rate": 0.00021229800566063438, - "loss": 0.0112, + "epoch": 0.3, + "learning_rate": 0.00025493946047109624, + "loss": 0.0246, "step": 115890 }, { - "epoch": 0.58, - "learning_rate": 0.00021229043796762036, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002549355722547248, + "loss": 0.0267, "step": 115900 }, { - "epoch": 0.58, - "learning_rate": 0.00021228287027460634, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002549316840383533, + "loss": 0.021, "step": 115910 }, { - "epoch": 0.58, - "learning_rate": 0.00021227530258159232, - "loss": 0.0189, + "epoch": 0.3, + "learning_rate": 0.0002549277958219819, + "loss": 0.0204, "step": 115920 }, { - "epoch": 0.58, - "learning_rate": 0.00021226773488857833, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002549239076056104, + "loss": 0.0262, "step": 115930 }, { - "epoch": 0.58, - "learning_rate": 0.0002122601671955643, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.00025492001938923897, + "loss": 0.0229, "step": 115940 }, { - "epoch": 0.58, - "learning_rate": 0.0002122525995025503, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002549161311728675, + "loss": 0.0204, "step": 115950 }, { - "epoch": 0.59, - "learning_rate": 0.0002122450318095363, - "loss": 0.0187, + "epoch": 0.3, + "learning_rate": 0.000254912242956496, + "loss": 0.0202, "step": 115960 }, { - "epoch": 0.59, - "learning_rate": 0.00021223746411652228, - "loss": 0.021, + "epoch": 0.3, + "learning_rate": 0.00025490835474012457, + "loss": 0.0223, "step": 115970 }, { - "epoch": 0.59, - "learning_rate": 0.00021222989642350826, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002549044665237531, + "loss": 0.0209, "step": 115980 }, { - "epoch": 0.59, - "learning_rate": 0.00021222232873049427, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.00025490057830738165, + "loss": 0.0197, "step": 115990 }, { - "epoch": 0.59, - "learning_rate": 0.00021221476103748025, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025489669009101017, + "loss": 0.0192, "step": 116000 }, { - "epoch": 0.59, - "eval_cer": 0.9144634631302844, - "eval_loss": 0.01081350538879633, - "eval_runtime": 116.7675, - "eval_samples_per_second": 17.128, - "eval_steps_per_second": 4.282, + "epoch": 0.3, + "eval_cer": 0.8818174565517705, + "eval_loss": 0.01587188057601452, + "eval_runtime": 107.3455, + "eval_samples_per_second": 18.631, + "eval_steps_per_second": 4.658, "step": 116000 }, { - "epoch": 0.59, - "learning_rate": 0.00021220719334446623, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002548928018746387, + "loss": 0.0173, "step": 116010 }, { - "epoch": 0.59, - "learning_rate": 0.00021219962565145224, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025488891365826725, + "loss": 0.0195, "step": 116020 }, { - "epoch": 0.59, - "learning_rate": 0.00021219205795843822, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025488502544189577, + "loss": 0.0254, "step": 116030 }, { - "epoch": 0.59, - "learning_rate": 0.0002121844902654242, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002548811372255243, + "loss": 0.0293, "step": 116040 }, { - "epoch": 0.59, - "learning_rate": 0.00021217692257241021, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.00025487724900915285, + "loss": 0.0287, "step": 116050 }, { - "epoch": 0.59, - "learning_rate": 0.0002121693548793962, - "loss": 0.024, + "epoch": 0.3, + "learning_rate": 0.00025487336079278136, + "loss": 0.0235, "step": 116060 }, { - "epoch": 0.59, - "learning_rate": 0.00021216178718638218, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025486947257640993, + "loss": 0.0197, "step": 116070 }, { - "epoch": 0.59, - "learning_rate": 0.00021215421949336819, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025486558436003845, + "loss": 0.0195, "step": 116080 }, { - "epoch": 0.59, - "learning_rate": 0.00021214665180035417, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025486169614366696, + "loss": 0.0204, "step": 116090 }, { - "epoch": 0.59, - "learning_rate": 0.00021213908410734015, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025485780792729553, + "loss": 0.0207, "step": 116100 }, { - "epoch": 0.59, - "learning_rate": 0.00021213151641432613, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025485391971092404, + "loss": 0.0156, "step": 116110 }, { - "epoch": 0.59, - "learning_rate": 0.00021212394872131214, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.0002548500314945526, + "loss": 0.0231, "step": 116120 }, { - "epoch": 0.59, - "learning_rate": 0.00021211638102829812, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.00025484614327818113, + "loss": 0.0221, "step": 116130 }, { - "epoch": 0.59, - "learning_rate": 0.0002121088133352841, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025484225506180964, + "loss": 0.0162, "step": 116140 }, { - "epoch": 0.59, - "learning_rate": 0.0002121012456422701, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.0002548383668454382, + "loss": 0.0211, "step": 116150 }, { - "epoch": 0.59, - "learning_rate": 0.0002120936779492561, - "loss": 0.0127, + "epoch": 0.3, + "learning_rate": 0.0002548344786290667, + "loss": 0.0206, "step": 116160 }, { - "epoch": 0.59, - "learning_rate": 0.00021208611025624207, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025483059041269524, + "loss": 0.0179, "step": 116170 }, { - "epoch": 0.59, - "learning_rate": 0.00021207854256322808, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.0002548267021963238, + "loss": 0.0178, "step": 116180 }, { - "epoch": 0.59, - "learning_rate": 0.00021207097487021406, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.0002548228139799523, + "loss": 0.0238, "step": 116190 }, { - "epoch": 0.59, - "learning_rate": 0.00021206340717720004, - "loss": 0.0145, + "epoch": 0.3, + "learning_rate": 0.0002548189257635809, + "loss": 0.0222, "step": 116200 }, { - "epoch": 0.59, - "learning_rate": 0.00021205583948418605, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.0002548150375472094, + "loss": 0.018, "step": 116210 }, { - "epoch": 0.59, - "learning_rate": 0.00021204827179117203, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.0002548111493308379, + "loss": 0.0243, "step": 116220 }, { - "epoch": 0.59, - "learning_rate": 0.00021204070409815802, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.0002548072611144665, + "loss": 0.0186, "step": 116230 }, { - "epoch": 0.59, - "learning_rate": 0.00021203313640514402, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.000254803372898095, + "loss": 0.0178, "step": 116240 }, { - "epoch": 0.59, - "learning_rate": 0.00021202556871213, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.0002547994846817235, + "loss": 0.025, "step": 116250 }, { - "epoch": 0.59, - "learning_rate": 0.000212018001019116, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002547955964653521, + "loss": 0.0211, "step": 116260 }, { - "epoch": 0.59, - "learning_rate": 0.00021201043332610194, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025479170824898066, + "loss": 0.0183, "step": 116270 }, { - "epoch": 0.59, - "learning_rate": 0.00021200286563308795, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.00025478782003260917, + "loss": 0.0219, "step": 116280 }, { - "epoch": 0.59, - "learning_rate": 0.00021199529794007393, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002547839318162377, + "loss": 0.0191, "step": 116290 }, { - "epoch": 0.59, - "learning_rate": 0.0002119877302470599, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002547800435998662, + "loss": 0.0219, "step": 116300 }, { - "epoch": 0.59, - "learning_rate": 0.0002119801625540459, - "loss": 0.0122, + "epoch": 0.3, + "learning_rate": 0.00025477615538349477, + "loss": 0.024, "step": 116310 }, { - "epoch": 0.59, - "learning_rate": 0.0002119725948610319, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002547722671671233, + "loss": 0.0217, "step": 116320 }, { - "epoch": 0.59, - "learning_rate": 0.00021196502716801788, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025476837895075185, + "loss": 0.0228, "step": 116330 }, { - "epoch": 0.59, - "learning_rate": 0.00021195745947500387, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.00025476449073438037, + "loss": 0.0164, "step": 116340 }, { - "epoch": 0.59, - "learning_rate": 0.00021194989178198987, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.00025476060251800894, + "loss": 0.0224, "step": 116350 }, { - "epoch": 0.59, - "learning_rate": 0.00021194232408897586, - "loss": 0.0161, + "epoch": 0.3, + "learning_rate": 0.00025475671430163745, + "loss": 0.0201, "step": 116360 }, { - "epoch": 0.59, - "learning_rate": 0.00021193475639596184, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025475282608526596, + "loss": 0.0243, "step": 116370 }, { - "epoch": 0.59, - "learning_rate": 0.00021192718870294785, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002547489378688945, + "loss": 0.0305, "step": 116380 }, { - "epoch": 0.59, - "learning_rate": 0.00021191962100993383, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.00025474504965252305, + "loss": 0.0223, "step": 116390 }, { - "epoch": 0.59, - "learning_rate": 0.0002119120533169198, - "loss": 0.0126, + "epoch": 0.3, + "learning_rate": 0.00025474116143615156, + "loss": 0.0229, "step": 116400 }, { - "epoch": 0.59, - "learning_rate": 0.00021190448562390582, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.00025473727321978013, + "loss": 0.0213, "step": 116410 }, { - "epoch": 0.59, - "learning_rate": 0.0002118969179308918, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025473338500340865, + "loss": 0.0213, "step": 116420 }, { - "epoch": 0.59, - "learning_rate": 0.00021188935023787778, - "loss": 0.0128, + "epoch": 0.3, + "learning_rate": 0.00025472949678703716, + "loss": 0.0185, "step": 116430 }, { - "epoch": 0.59, - "learning_rate": 0.0002118817825448638, - "loss": 0.0144, + "epoch": 0.3, + "learning_rate": 0.00025472560857066573, + "loss": 0.0238, "step": 116440 }, { - "epoch": 0.59, - "learning_rate": 0.00021187421485184977, - "loss": 0.0169, + "epoch": 0.3, + "learning_rate": 0.00025472172035429424, + "loss": 0.0227, "step": 116450 }, { - "epoch": 0.59, - "learning_rate": 0.00021186664715883575, - "loss": 0.0134, + "epoch": 0.3, + "learning_rate": 0.00025471783213792276, + "loss": 0.0221, "step": 116460 }, { - "epoch": 0.59, - "learning_rate": 0.00021185907946582176, - "loss": 0.0123, + "epoch": 0.3, + "learning_rate": 0.0002547139439215513, + "loss": 0.0186, "step": 116470 }, { - "epoch": 0.59, - "learning_rate": 0.00021185151177280774, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002547100557051799, + "loss": 0.0214, "step": 116480 }, { - "epoch": 0.59, - "learning_rate": 0.00021184394407979372, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002547061674888084, + "loss": 0.0214, "step": 116490 }, { - "epoch": 0.59, - "learning_rate": 0.0002118363763867797, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002547022792724369, + "loss": 0.0194, "step": 116500 }, { - "epoch": 0.59, - "learning_rate": 0.0002118288086937657, - "loss": 0.015, + "epoch": 0.3, + "learning_rate": 0.00025469839105606544, + "loss": 0.0203, "step": 116510 }, { - "epoch": 0.59, - "learning_rate": 0.0002118212410007517, - "loss": 0.0177, + "epoch": 0.3, + "learning_rate": 0.000254694502839694, + "loss": 0.0224, "step": 116520 }, { - "epoch": 0.59, - "learning_rate": 0.00021181367330773768, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.0002546906146233225, + "loss": 0.0245, "step": 116530 }, { - "epoch": 0.59, - "learning_rate": 0.00021180610561472368, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.0002546867264069511, + "loss": 0.0227, "step": 116540 }, { - "epoch": 0.59, - "learning_rate": 0.00021179853792170967, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002546828381905796, + "loss": 0.0244, "step": 116550 }, { - "epoch": 0.59, - "learning_rate": 0.00021179097022869565, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.0002546789499742082, + "loss": 0.0213, "step": 116560 }, { - "epoch": 0.59, - "learning_rate": 0.00021178340253568166, - "loss": 0.0141, + "epoch": 0.3, + "learning_rate": 0.0002546750617578367, + "loss": 0.0196, "step": 116570 }, { - "epoch": 0.59, - "learning_rate": 0.00021177583484266764, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002546711735414652, + "loss": 0.0202, "step": 116580 }, { - "epoch": 0.59, - "learning_rate": 0.00021176826714965362, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002546672853250937, + "loss": 0.02, "step": 116590 }, { - "epoch": 0.59, - "learning_rate": 0.00021176069945663963, - "loss": 0.0142, + "epoch": 0.3, + "learning_rate": 0.0002546633971087223, + "loss": 0.0189, "step": 116600 }, { - "epoch": 0.59, - "learning_rate": 0.0002117531317636256, - "loss": 0.0128, + "epoch": 0.3, + "learning_rate": 0.0002546595088923508, + "loss": 0.0183, "step": 116610 }, { - "epoch": 0.59, - "learning_rate": 0.0002117455640706116, - "loss": 0.0121, + "epoch": 0.3, + "learning_rate": 0.00025465562067597937, + "loss": 0.0207, "step": 116620 }, { - "epoch": 0.59, - "learning_rate": 0.0002117379963775976, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.0002546517324596079, + "loss": 0.0189, "step": 116630 }, { - "epoch": 0.59, - "learning_rate": 0.00021173042868458358, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002546478442432364, + "loss": 0.0219, "step": 116640 }, { - "epoch": 0.59, - "learning_rate": 0.00021172286099156956, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.00025464395602686497, + "loss": 0.0228, "step": 116650 }, { - "epoch": 0.59, - "learning_rate": 0.00021171529329855554, - "loss": 0.0128, + "epoch": 0.3, + "learning_rate": 0.0002546400678104935, + "loss": 0.0261, "step": 116660 }, { - "epoch": 0.59, - "learning_rate": 0.00021170772560554155, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.00025463617959412205, + "loss": 0.021, "step": 116670 }, { - "epoch": 0.59, - "learning_rate": 0.00021170015791252753, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.00025463229137775057, + "loss": 0.0192, "step": 116680 }, { - "epoch": 0.59, - "learning_rate": 0.00021169259021951351, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025462840316137913, + "loss": 0.0216, "step": 116690 }, { - "epoch": 0.59, - "learning_rate": 0.00021168502252649952, - "loss": 0.012, + "epoch": 0.3, + "learning_rate": 0.00025462451494500765, + "loss": 0.0198, "step": 116700 }, { - "epoch": 0.59, - "learning_rate": 0.0002116774548334855, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.00025462062672863616, + "loss": 0.0197, "step": 116710 }, { - "epoch": 0.59, - "learning_rate": 0.00021166988714047149, - "loss": 0.0139, - "step": 116720 + "epoch": 0.3, + "learning_rate": 0.0002546167385122647, + "loss": 0.0247, + "step": 116720 }, { - "epoch": 0.59, - "learning_rate": 0.0002116623194474575, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.00025461285029589325, + "loss": 0.022, "step": 116730 }, { - "epoch": 0.59, - "learning_rate": 0.00021165475175444348, - "loss": 0.0128, + "epoch": 0.3, + "learning_rate": 0.00025460896207952176, + "loss": 0.0283, "step": 116740 }, { - "epoch": 0.59, - "learning_rate": 0.00021164718406142946, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.00025460507386315033, + "loss": 0.0268, "step": 116750 }, { - "epoch": 0.59, - "learning_rate": 0.00021163961636841547, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025460118564677884, + "loss": 0.0178, "step": 116760 }, { - "epoch": 0.59, - "learning_rate": 0.00021163204867540145, - "loss": 0.0214, + "epoch": 0.3, + "learning_rate": 0.0002545972974304074, + "loss": 0.0195, "step": 116770 }, { - "epoch": 0.59, - "learning_rate": 0.00021162448098238743, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.00025459340921403593, + "loss": 0.0205, "step": 116780 }, { - "epoch": 0.59, - "learning_rate": 0.00021161691328937344, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025458952099766444, + "loss": 0.0243, "step": 116790 }, { - "epoch": 0.59, - "learning_rate": 0.00021160934559635942, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.00025458563278129296, + "loss": 0.02, "step": 116800 }, { - "epoch": 0.59, - "learning_rate": 0.0002116017779033454, - "loss": 0.0171, + "epoch": 0.3, + "learning_rate": 0.0002545817445649215, + "loss": 0.0239, "step": 116810 }, { - "epoch": 0.59, - "learning_rate": 0.00021159421021033138, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.0002545778563485501, + "loss": 0.0248, "step": 116820 }, { - "epoch": 0.59, - "learning_rate": 0.0002115866425173174, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.0002545739681321786, + "loss": 0.023, "step": 116830 }, { - "epoch": 0.59, - "learning_rate": 0.00021157907482430337, - "loss": 0.0132, + "epoch": 0.3, + "learning_rate": 0.0002545700799158071, + "loss": 0.0212, "step": 116840 }, { - "epoch": 0.59, - "learning_rate": 0.00021157150713128935, - "loss": 0.0106, + "epoch": 0.3, + "learning_rate": 0.0002545661916994357, + "loss": 0.0209, "step": 116850 }, { - "epoch": 0.59, - "learning_rate": 0.00021156393943827536, - "loss": 0.014, + "epoch": 0.3, + "learning_rate": 0.0002545623034830642, + "loss": 0.0228, "step": 116860 }, { - "epoch": 0.59, - "learning_rate": 0.00021155637174526134, - "loss": 0.0123, + "epoch": 0.3, + "learning_rate": 0.0002545584152666927, + "loss": 0.0211, "step": 116870 }, { - "epoch": 0.59, - "learning_rate": 0.00021154880405224732, - "loss": 0.0143, + "epoch": 0.3, + "learning_rate": 0.0002545545270503213, + "loss": 0.0278, "step": 116880 }, { - "epoch": 0.59, - "learning_rate": 0.00021154123635923333, - "loss": 0.0156, + "epoch": 0.3, + "learning_rate": 0.0002545506388339498, + "loss": 0.0188, "step": 116890 }, { - "epoch": 0.59, - "learning_rate": 0.00021153366866621931, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002545467506175784, + "loss": 0.0211, "step": 116900 }, { - "epoch": 0.59, - "learning_rate": 0.0002115261009732053, - "loss": 0.0118, + "epoch": 0.3, + "learning_rate": 0.0002545428624012069, + "loss": 0.0238, "step": 116910 }, { - "epoch": 0.59, - "learning_rate": 0.0002115185332801913, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.0002545389741848354, + "loss": 0.0189, "step": 116920 }, { - "epoch": 0.59, - "learning_rate": 0.00021151096558717729, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002545350859684639, + "loss": 0.0178, "step": 116930 }, { - "epoch": 0.59, - "learning_rate": 0.00021150339789416327, - "loss": 0.0103, + "epoch": 0.3, + "learning_rate": 0.0002545311977520925, + "loss": 0.02, "step": 116940 }, { - "epoch": 0.59, - "learning_rate": 0.00021149583020114928, - "loss": 0.0173, + "epoch": 0.3, + "learning_rate": 0.000254527309535721, + "loss": 0.0202, "step": 116950 }, { - "epoch": 0.59, - "learning_rate": 0.00021148826250813526, - "loss": 0.0185, + "epoch": 0.3, + "learning_rate": 0.00025452342131934957, + "loss": 0.018, "step": 116960 }, { - "epoch": 0.59, - "learning_rate": 0.00021148069481512124, - "loss": 0.0136, + "epoch": 0.3, + "learning_rate": 0.0002545195331029781, + "loss": 0.0244, "step": 116970 }, { - "epoch": 0.59, - "learning_rate": 0.00021147312712210725, - "loss": 0.017, + "epoch": 0.3, + "learning_rate": 0.00025451564488660665, + "loss": 0.0263, "step": 116980 }, { - "epoch": 0.59, - "learning_rate": 0.00021146555942909323, - "loss": 0.0213, + "epoch": 0.3, + "learning_rate": 0.00025451175667023517, + "loss": 0.0231, "step": 116990 }, { - "epoch": 0.59, - "learning_rate": 0.0002114579917360792, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002545078684538637, + "loss": 0.0218, "step": 117000 }, { - "epoch": 0.59, - "eval_cer": 0.9145207165016832, - "eval_loss": 0.01061397697776556, - "eval_runtime": 116.746, - "eval_samples_per_second": 17.131, - "eval_steps_per_second": 4.283, + "epoch": 0.3, + "eval_cer": 0.8818328525580464, + "eval_loss": 0.015921663492918015, + "eval_runtime": 107.4591, + "eval_samples_per_second": 18.612, + "eval_steps_per_second": 4.653, "step": 117000 }, { - "epoch": 0.59, - "learning_rate": 0.0002114504240430652, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.0002545039802374922, + "loss": 0.028, "step": 117010 }, { - "epoch": 0.59, - "learning_rate": 0.0002114428563500512, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025450009202112076, + "loss": 0.0212, "step": 117020 }, { - "epoch": 0.59, - "learning_rate": 0.00021143528865703718, - "loss": 0.0135, + "epoch": 0.3, + "learning_rate": 0.00025449620380474933, + "loss": 0.023, "step": 117030 }, { - "epoch": 0.59, - "learning_rate": 0.00021142772096402316, - "loss": 0.0175, + "epoch": 0.3, + "learning_rate": 0.00025449231558837785, + "loss": 0.0256, "step": 117040 }, { - "epoch": 0.59, - "learning_rate": 0.00021142015327100917, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.00025448842737200636, + "loss": 0.0259, "step": 117050 }, { - "epoch": 0.59, - "learning_rate": 0.00021141258557799515, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.00025448453915563493, + "loss": 0.0243, "step": 117060 }, { - "epoch": 0.59, - "learning_rate": 0.00021140501788498113, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025448065093926345, + "loss": 0.0193, "step": 117070 }, { - "epoch": 0.59, - "learning_rate": 0.00021139745019196714, - "loss": 0.0141, + "epoch": 0.3, + "learning_rate": 0.00025447676272289196, + "loss": 0.0229, "step": 117080 }, { - "epoch": 0.59, - "learning_rate": 0.00021138988249895312, - "loss": 0.0133, + "epoch": 0.3, + "learning_rate": 0.00025447287450652053, + "loss": 0.0233, "step": 117090 }, { - "epoch": 0.59, - "learning_rate": 0.0002113823148059391, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.00025446898629014904, + "loss": 0.0187, "step": 117100 }, { - "epoch": 0.59, - "learning_rate": 0.00021137474711292511, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002544650980737776, + "loss": 0.0268, "step": 117110 }, { - "epoch": 0.59, - "learning_rate": 0.0002113671794199111, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.0002544612098574061, + "loss": 0.0267, "step": 117120 }, { - "epoch": 0.59, - "learning_rate": 0.00021135961172689708, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025445732164103464, + "loss": 0.0208, "step": 117130 }, { - "epoch": 0.59, - "learning_rate": 0.00021135204403388309, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.00025445343342466316, + "loss": 0.0315, "step": 117140 }, { - "epoch": 0.59, - "learning_rate": 0.00021134447634086907, - "loss": 0.0135, + "epoch": 0.3, + "learning_rate": 0.0002544495452082917, + "loss": 0.0196, "step": 117150 }, { - "epoch": 0.59, - "learning_rate": 0.00021133690864785505, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.0002544456569919203, + "loss": 0.0302, "step": 117160 }, { - "epoch": 0.59, - "learning_rate": 0.00021132934095484103, - "loss": 0.0162, + "epoch": 0.3, + "learning_rate": 0.0002544417687755488, + "loss": 0.021, "step": 117170 }, { - "epoch": 0.59, - "learning_rate": 0.00021132177326182704, - "loss": 0.0168, + "epoch": 0.3, + "learning_rate": 0.0002544378805591773, + "loss": 0.022, "step": 117180 }, { - "epoch": 0.59, - "learning_rate": 0.00021131420556881302, - "loss": 0.0176, + "epoch": 0.3, + "learning_rate": 0.0002544339923428059, + "loss": 0.0208, "step": 117190 }, { - "epoch": 0.59, - "learning_rate": 0.000211306637875799, - "loss": 0.0166, + "epoch": 0.3, + "learning_rate": 0.0002544301041264344, + "loss": 0.0187, "step": 117200 }, { - "epoch": 0.59, - "learning_rate": 0.000211299070182785, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.0002544262159100629, + "loss": 0.0224, "step": 117210 }, { - "epoch": 0.59, - "learning_rate": 0.000211291502489771, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002544223276936915, + "loss": 0.0218, "step": 117220 }, { - "epoch": 0.59, - "learning_rate": 0.00021128393479675697, - "loss": 0.0152, + "epoch": 0.3, + "learning_rate": 0.00025441843947732, + "loss": 0.0214, "step": 117230 }, { - "epoch": 0.59, - "learning_rate": 0.00021127636710374298, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.00025441455126094857, + "loss": 0.0171, "step": 117240 }, { - "epoch": 0.59, - "learning_rate": 0.00021126879941072896, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.0002544106630445771, + "loss": 0.0236, "step": 117250 }, { - "epoch": 0.59, - "learning_rate": 0.00021126123171771494, - "loss": 0.0137, + "epoch": 0.3, + "learning_rate": 0.0002544067748282056, + "loss": 0.0218, "step": 117260 }, { - "epoch": 0.59, - "learning_rate": 0.00021125366402470095, - "loss": 0.013, + "epoch": 0.3, + "learning_rate": 0.00025440288661183417, + "loss": 0.0273, "step": 117270 }, { - "epoch": 0.59, - "learning_rate": 0.00021124609633168693, - "loss": 0.0134, + "epoch": 0.3, + "learning_rate": 0.0002543989983954627, + "loss": 0.0197, "step": 117280 }, { - "epoch": 0.59, - "learning_rate": 0.00021123852863867292, - "loss": 0.0115, + "epoch": 0.3, + "learning_rate": 0.0002543951101790912, + "loss": 0.0227, "step": 117290 }, { - "epoch": 0.59, - "learning_rate": 0.00021123096094565892, - "loss": 0.0174, + "epoch": 0.3, + "learning_rate": 0.00025439122196271977, + "loss": 0.0224, "step": 117300 }, { - "epoch": 0.59, - "learning_rate": 0.0002112233932526449, - "loss": 0.0155, + "epoch": 0.3, + "learning_rate": 0.00025438733374634834, + "loss": 0.0215, "step": 117310 }, { - "epoch": 0.59, - "learning_rate": 0.0002112158255596309, - "loss": 0.0114, + "epoch": 0.3, + "learning_rate": 0.00025438344552997685, + "loss": 0.0262, "step": 117320 }, { - "epoch": 0.59, - "learning_rate": 0.00021120825786661687, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.00025437955731360537, + "loss": 0.0221, "step": 117330 }, { - "epoch": 0.59, - "learning_rate": 0.00021120069017360288, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.0002543756690972339, + "loss": 0.0211, "step": 117340 }, { - "epoch": 0.59, - "learning_rate": 0.00021119312248058886, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.00025437178088086245, + "loss": 0.018, "step": 117350 }, { - "epoch": 0.59, - "learning_rate": 0.00021118555478757484, - "loss": 0.0113, + "epoch": 0.3, + "learning_rate": 0.00025436789266449096, + "loss": 0.0231, "step": 117360 }, { - "epoch": 0.59, - "learning_rate": 0.00021117798709456085, - "loss": 0.0131, + "epoch": 0.3, + "learning_rate": 0.00025436400444811953, + "loss": 0.0187, "step": 117370 }, { - "epoch": 0.59, - "learning_rate": 0.00021117041940154683, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.00025436011623174805, + "loss": 0.019, "step": 117380 }, { - "epoch": 0.59, - "learning_rate": 0.0002111628517085328, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.00025435622801537656, + "loss": 0.0188, "step": 117390 }, { - "epoch": 0.59, - "learning_rate": 0.00021115528401551882, - "loss": 0.0163, + "epoch": 0.3, + "learning_rate": 0.00025435233979900513, + "loss": 0.0216, "step": 117400 }, { - "epoch": 0.59, - "learning_rate": 0.0002111477163225048, - "loss": 0.016, + "epoch": 0.3, + "learning_rate": 0.00025434845158263364, + "loss": 0.0248, "step": 117410 }, { - "epoch": 0.59, - "learning_rate": 0.00021114014862949078, - "loss": 0.018, + "epoch": 0.3, + "learning_rate": 0.00025434456336626216, + "loss": 0.0224, "step": 117420 }, { - "epoch": 0.59, - "learning_rate": 0.0002111325809364768, - "loss": 0.0146, + "epoch": 0.3, + "learning_rate": 0.00025434067514989073, + "loss": 0.0303, "step": 117430 }, { - "epoch": 0.59, - "learning_rate": 0.00021112501324346277, - "loss": 0.0153, + "epoch": 0.3, + "learning_rate": 0.00025433678693351924, + "loss": 0.0186, "step": 117440 }, { - "epoch": 0.59, - "learning_rate": 0.00021111744555044875, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.0002543328987171478, + "loss": 0.0206, "step": 117450 }, { - "epoch": 0.59, - "learning_rate": 0.00021110987785743476, - "loss": 0.0149, + "epoch": 0.3, + "learning_rate": 0.0002543290105007763, + "loss": 0.0188, "step": 117460 }, { - "epoch": 0.59, - "learning_rate": 0.00021110231016442074, - "loss": 0.0228, + "epoch": 0.3, + "learning_rate": 0.00025432512228440484, + "loss": 0.0189, "step": 117470 }, { - "epoch": 0.59, - "learning_rate": 0.00021109474247140673, - "loss": 0.0154, + "epoch": 0.3, + "learning_rate": 0.0002543212340680334, + "loss": 0.0211, "step": 117480 }, { - "epoch": 0.59, - "learning_rate": 0.0002110871747783927, - "loss": 0.0123, + "epoch": 0.3, + "learning_rate": 0.0002543173458516619, + "loss": 0.0202, "step": 117490 }, { - "epoch": 0.59, - "learning_rate": 0.00021107960708537872, - "loss": 0.0124, + "epoch": 0.3, + "learning_rate": 0.00025431345763529044, + "loss": 0.0207, "step": 117500 }, { - "epoch": 0.59, - "learning_rate": 0.0002110720393923647, - "loss": 0.0125, + "epoch": 0.3, + "learning_rate": 0.000254309569418919, + "loss": 0.018, "step": 117510 }, { - "epoch": 0.59, - "learning_rate": 0.00021106447169935065, - "loss": 0.0151, + "epoch": 0.3, + "learning_rate": 0.0002543056812025476, + "loss": 0.0247, "step": 117520 }, { - "epoch": 0.59, - "learning_rate": 0.00021105690400633666, - "loss": 0.0168, + "epoch": 0.3, + "learning_rate": 0.0002543017929861761, + "loss": 0.025, "step": 117530 }, { - "epoch": 0.59, - "learning_rate": 0.00021104933631332264, - "loss": 0.0157, + "epoch": 0.3, + "learning_rate": 0.0002542979047698046, + "loss": 0.0197, "step": 117540 }, { - "epoch": 0.59, - "learning_rate": 0.00021104176862030862, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.0002542940165534331, + "loss": 0.0258, "step": 117550 }, { - "epoch": 0.59, - "learning_rate": 0.0002110342009272946, - "loss": 0.0121, + "epoch": 0.3, + "learning_rate": 0.0002542901283370617, + "loss": 0.0203, "step": 117560 }, { - "epoch": 0.59, - "learning_rate": 0.0002110266332342806, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002542862401206902, + "loss": 0.0233, "step": 117570 }, { - "epoch": 0.59, - "learning_rate": 0.0002110190655412666, - "loss": 0.0167, + "epoch": 0.3, + "learning_rate": 0.00025428235190431877, + "loss": 0.0198, "step": 117580 }, { - "epoch": 0.59, - "learning_rate": 0.00021101149784825258, - "loss": 0.0138, + "epoch": 0.3, + "learning_rate": 0.0002542784636879473, + "loss": 0.0202, "step": 117590 }, { - "epoch": 0.59, - "learning_rate": 0.00021100393015523858, - "loss": 0.0147, + "epoch": 0.3, + "learning_rate": 0.00025427457547157585, + "loss": 0.0177, "step": 117600 }, { - "epoch": 0.59, - "learning_rate": 0.00021099636246222457, - "loss": 0.0164, + "epoch": 0.3, + "learning_rate": 0.00025427068725520437, + "loss": 0.0217, "step": 117610 }, { - "epoch": 0.59, - "learning_rate": 0.00021098879476921055, - "loss": 0.0148, + "epoch": 0.3, + "learning_rate": 0.0002542667990388329, + "loss": 0.0155, "step": 117620 }, { - "epoch": 0.59, - "learning_rate": 0.00021098122707619656, - "loss": 0.0139, + "epoch": 0.3, + "learning_rate": 0.0002542629108224614, + "loss": 0.021, "step": 117630 }, { - "epoch": 0.59, - "learning_rate": 0.00021097365938318254, - "loss": 0.0129, + "epoch": 0.3, + "learning_rate": 0.00025425902260608997, + "loss": 0.043, "step": 117640 }, { - "epoch": 0.59, - "learning_rate": 0.00021096609169016852, - "loss": 0.0179, + "epoch": 0.3, + "learning_rate": 0.0002542551343897185, + "loss": 0.0243, "step": 117650 }, { - "epoch": 0.59, - "learning_rate": 0.00021095852399715453, - "loss": 0.0141, + "epoch": 0.3, + "learning_rate": 0.00025425124617334705, + "loss": 0.0247, "step": 117660 }, { - "epoch": 0.59, - "learning_rate": 0.0002109509563041405, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.00025424735795697556, + "loss": 0.0206, "step": 117670 }, { - "epoch": 0.59, - "learning_rate": 0.0002109433886111265, - "loss": 0.0187, + "epoch": 0.31, + "learning_rate": 0.0002542434697406041, + "loss": 0.0204, "step": 117680 }, { - "epoch": 0.59, - "learning_rate": 0.0002109358209181125, - "loss": 0.012, + "epoch": 0.31, + "learning_rate": 0.00025423958152423265, + "loss": 0.0211, "step": 117690 }, { - "epoch": 0.59, - "learning_rate": 0.00021092825322509848, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025423569330786116, + "loss": 0.0222, "step": 117700 }, { - "epoch": 0.59, - "learning_rate": 0.00021092068553208446, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025423180509148973, + "loss": 0.0199, "step": 117710 }, { - "epoch": 0.59, - "learning_rate": 0.00021091311783907044, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.00025422791687511825, + "loss": 0.0241, "step": 117720 }, { - "epoch": 0.59, - "learning_rate": 0.00021090555014605645, - "loss": 0.0204, + "epoch": 0.31, + "learning_rate": 0.0002542240286587468, + "loss": 0.0281, "step": 117730 }, { - "epoch": 0.59, - "learning_rate": 0.00021089798245304243, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.00025422014044237533, + "loss": 0.0241, "step": 117740 }, { - "epoch": 0.59, - "learning_rate": 0.00021089041476002841, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.00025421625222600384, + "loss": 0.0257, "step": 117750 }, { - "epoch": 0.59, - "learning_rate": 0.00021088284706701442, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025421236400963236, + "loss": 0.0217, "step": 117760 }, { - "epoch": 0.59, - "learning_rate": 0.0002108752793740004, - "loss": 0.0114, + "epoch": 0.31, + "learning_rate": 0.0002542084757932609, + "loss": 0.0205, "step": 117770 }, { - "epoch": 0.59, - "learning_rate": 0.00021086771168098639, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025420458757688944, + "loss": 0.0203, "step": 117780 }, { - "epoch": 0.59, - "learning_rate": 0.0002108601439879724, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.000254200699360518, + "loss": 0.0186, "step": 117790 }, { - "epoch": 0.59, - "learning_rate": 0.00021085257629495838, - "loss": 0.0261, + "epoch": 0.31, + "learning_rate": 0.0002541968111441465, + "loss": 0.0244, "step": 117800 }, { - "epoch": 0.59, - "learning_rate": 0.00021084500860194436, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.0002541929229277751, + "loss": 0.0226, "step": 117810 }, { - "epoch": 0.59, - "learning_rate": 0.00021083744090893037, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.0002541890347114036, + "loss": 0.0232, "step": 117820 }, { - "epoch": 0.59, - "learning_rate": 0.00021082987321591635, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002541851464950321, + "loss": 0.0186, "step": 117830 }, { - "epoch": 0.59, - "learning_rate": 0.00021082230552290233, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.00025418125827866064, + "loss": 0.0266, "step": 117840 }, { - "epoch": 0.59, - "learning_rate": 0.00021081473782988834, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.0002541773700622892, + "loss": 0.0207, "step": 117850 }, { - "epoch": 0.59, - "learning_rate": 0.00021080717013687432, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.0002541734818459178, + "loss": 0.0221, "step": 117860 }, { - "epoch": 0.59, - "learning_rate": 0.0002107996024438603, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.0002541695936295463, + "loss": 0.0163, "step": 117870 }, { - "epoch": 0.59, - "learning_rate": 0.00021079203475084628, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002541657054131748, + "loss": 0.0258, "step": 117880 }, { - "epoch": 0.59, - "learning_rate": 0.0002107844670578323, - "loss": 0.0208, + "epoch": 0.31, + "learning_rate": 0.0002541618171968033, + "loss": 0.0186, "step": 117890 }, { - "epoch": 0.59, - "learning_rate": 0.00021077689936481827, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.0002541579289804319, + "loss": 0.023, "step": 117900 }, { - "epoch": 0.59, - "learning_rate": 0.00021076933167180425, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002541540407640604, + "loss": 0.0194, "step": 117910 }, { - "epoch": 0.59, - "learning_rate": 0.00021076176397879026, - "loss": 0.0122, + "epoch": 0.31, + "learning_rate": 0.00025415015254768897, + "loss": 0.0269, "step": 117920 }, { - "epoch": 0.59, - "learning_rate": 0.00021075419628577624, - "loss": 0.0154, + "epoch": 0.31, + "learning_rate": 0.0002541462643313175, + "loss": 0.0249, "step": 117930 }, { - "epoch": 0.6, - "learning_rate": 0.00021074662859276222, - "loss": 0.0141, + "epoch": 0.31, + "learning_rate": 0.00025414237611494605, + "loss": 0.0177, "step": 117940 }, { - "epoch": 0.6, - "learning_rate": 0.00021073906089974823, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025413848789857457, + "loss": 0.0282, "step": 117950 }, { - "epoch": 0.6, - "learning_rate": 0.00021073149320673421, - "loss": 0.0141, + "epoch": 0.31, + "learning_rate": 0.0002541345996822031, + "loss": 0.0198, "step": 117960 }, { - "epoch": 0.6, - "learning_rate": 0.0002107239255137202, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.0002541307114658316, + "loss": 0.0197, "step": 117970 }, { - "epoch": 0.6, - "learning_rate": 0.0002107163578207062, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.00025412682324946017, + "loss": 0.0248, "step": 117980 }, { - "epoch": 0.6, - "learning_rate": 0.00021070879012769219, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.0002541229350330887, + "loss": 0.0281, "step": 117990 }, { - "epoch": 0.6, - "learning_rate": 0.00021070122243467817, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025411904681671725, + "loss": 0.0184, "step": 118000 }, { - "epoch": 0.6, - "eval_cer": 0.9144702559031622, - "eval_loss": 0.011005792766809464, - "eval_runtime": 116.812, - "eval_samples_per_second": 17.122, - "eval_steps_per_second": 4.28, + "epoch": 0.31, + "eval_cer": 0.8817810659914818, + "eval_loss": 0.014615286141633987, + "eval_runtime": 107.2768, + "eval_samples_per_second": 18.643, + "eval_steps_per_second": 4.661, "step": 118000 }, { - "epoch": 0.6, - "learning_rate": 0.00021069365474166418, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025411515860034576, + "loss": 0.0351, "step": 118010 }, { - "epoch": 0.6, - "learning_rate": 0.00021068608704865016, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.00025411127038397433, + "loss": 0.0185, "step": 118020 }, { - "epoch": 0.6, - "learning_rate": 0.00021067851935563614, - "loss": 0.0176, + "epoch": 0.31, + "learning_rate": 0.00025410738216760285, + "loss": 0.0203, "step": 118030 }, { - "epoch": 0.6, - "learning_rate": 0.00021067095166262215, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025410349395123136, + "loss": 0.0176, "step": 118040 }, { - "epoch": 0.6, - "learning_rate": 0.00021066338396960813, - "loss": 0.0209, + "epoch": 0.31, + "learning_rate": 0.0002540996057348599, + "loss": 0.021, "step": 118050 }, { - "epoch": 0.6, - "learning_rate": 0.0002106558162765941, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.00025409571751848844, + "loss": 0.0182, "step": 118060 }, { - "epoch": 0.6, - "learning_rate": 0.0002106482485835801, - "loss": 0.0283, + "epoch": 0.31, + "learning_rate": 0.000254091829302117, + "loss": 0.0255, "step": 118070 }, { - "epoch": 0.6, - "learning_rate": 0.0002106406808905661, - "loss": 0.0113, + "epoch": 0.31, + "learning_rate": 0.00025408794108574553, + "loss": 0.0211, "step": 118080 }, { - "epoch": 0.6, - "learning_rate": 0.00021063311319755208, - "loss": 0.0216, + "epoch": 0.31, + "learning_rate": 0.00025408405286937404, + "loss": 0.0226, "step": 118090 }, { - "epoch": 0.6, - "learning_rate": 0.00021062554550453806, - "loss": 0.0129, + "epoch": 0.31, + "learning_rate": 0.00025408016465300256, + "loss": 0.018, "step": 118100 }, { - "epoch": 0.6, - "learning_rate": 0.00021061797781152407, - "loss": 0.0196, + "epoch": 0.31, + "learning_rate": 0.0002540762764366311, + "loss": 0.0234, "step": 118110 }, { - "epoch": 0.6, - "learning_rate": 0.00021061041011851005, - "loss": 0.0197, + "epoch": 0.31, + "learning_rate": 0.00025407238822025964, + "loss": 0.0198, "step": 118120 }, { - "epoch": 0.6, - "learning_rate": 0.00021060284242549603, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.0002540685000038882, + "loss": 0.0257, "step": 118130 }, { - "epoch": 0.6, - "learning_rate": 0.00021059527473248204, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002540646117875167, + "loss": 0.018, "step": 118140 }, { - "epoch": 0.6, - "learning_rate": 0.00021058770703946802, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.0002540607235711453, + "loss": 0.0205, "step": 118150 }, { - "epoch": 0.6, - "learning_rate": 0.000210580139346454, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.0002540568353547738, + "loss": 0.0227, "step": 118160 }, { - "epoch": 0.6, - "learning_rate": 0.00021057257165344001, - "loss": 0.0123, + "epoch": 0.31, + "learning_rate": 0.0002540529471384023, + "loss": 0.0208, "step": 118170 }, { - "epoch": 0.6, - "learning_rate": 0.000210565003960426, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025404905892203084, + "loss": 0.0199, "step": 118180 }, { - "epoch": 0.6, - "learning_rate": 0.00021055743626741198, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002540451707056594, + "loss": 0.0237, "step": 118190 }, { - "epoch": 0.6, - "learning_rate": 0.00021054986857439799, - "loss": 0.0126, + "epoch": 0.31, + "learning_rate": 0.0002540412824892879, + "loss": 0.023, "step": 118200 }, { - "epoch": 0.6, - "learning_rate": 0.00021054230088138397, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002540373942729165, + "loss": 0.0218, "step": 118210 }, { - "epoch": 0.6, - "learning_rate": 0.00021053473318836995, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.000254033506056545, + "loss": 0.0221, "step": 118220 }, { - "epoch": 0.6, - "learning_rate": 0.00021052716549535593, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.00025402961784017357, + "loss": 0.0237, "step": 118230 }, { - "epoch": 0.6, - "learning_rate": 0.00021051959780234194, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.0002540257296238021, + "loss": 0.0222, "step": 118240 }, { - "epoch": 0.6, - "learning_rate": 0.00021051203010932792, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002540218414074306, + "loss": 0.0172, "step": 118250 }, { - "epoch": 0.6, - "learning_rate": 0.0002105044624163139, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.00025401795319105917, + "loss": 0.0208, "step": 118260 }, { - "epoch": 0.6, - "learning_rate": 0.0002104968947232999, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.0002540140649746877, + "loss": 0.0176, "step": 118270 }, { - "epoch": 0.6, - "learning_rate": 0.0002104893270302859, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.00025401017675831625, + "loss": 0.0218, "step": 118280 }, { - "epoch": 0.6, - "learning_rate": 0.00021048175933727187, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.00025400628854194477, + "loss": 0.0168, "step": 118290 }, { - "epoch": 0.6, - "learning_rate": 0.00021047419164425788, - "loss": 0.0122, + "epoch": 0.31, + "learning_rate": 0.0002540024003255733, + "loss": 0.0242, "step": 118300 }, { - "epoch": 0.6, - "learning_rate": 0.00021046662395124386, - "loss": 0.0108, + "epoch": 0.31, + "learning_rate": 0.00025399851210920185, + "loss": 0.0189, "step": 118310 }, { - "epoch": 0.6, - "learning_rate": 0.00021045905625822984, - "loss": 0.0183, + "epoch": 0.31, + "learning_rate": 0.00025399462389283036, + "loss": 0.0214, "step": 118320 }, { - "epoch": 0.6, - "learning_rate": 0.00021045148856521585, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.0002539907356764589, + "loss": 0.0241, "step": 118330 }, { - "epoch": 0.6, - "learning_rate": 0.00021044392087220183, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.00025398684746008745, + "loss": 0.0176, "step": 118340 }, { - "epoch": 0.6, - "learning_rate": 0.00021043635317918782, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.00025398295924371596, + "loss": 0.0227, "step": 118350 }, { - "epoch": 0.6, - "learning_rate": 0.00021042878548617382, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025397907102734453, + "loss": 0.0192, "step": 118360 }, { - "epoch": 0.6, - "learning_rate": 0.0002104212177931598, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.00025397518281097305, + "loss": 0.02, "step": 118370 }, { - "epoch": 0.6, - "learning_rate": 0.0002104136501001458, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.00025397129459460156, + "loss": 0.0205, "step": 118380 }, { - "epoch": 0.6, - "learning_rate": 0.00021040608240713177, - "loss": 0.0197, + "epoch": 0.31, + "learning_rate": 0.0002539674063782301, + "loss": 0.0226, "step": 118390 }, { - "epoch": 0.6, - "learning_rate": 0.00021039851471411778, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.00025396351816185864, + "loss": 0.0194, "step": 118400 }, { - "epoch": 0.6, - "learning_rate": 0.00021039094702110376, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002539596299454872, + "loss": 0.0232, "step": 118410 }, { - "epoch": 0.6, - "learning_rate": 0.00021038337932808974, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002539557417291157, + "loss": 0.0188, "step": 118420 }, { - "epoch": 0.6, - "learning_rate": 0.00021037581163507575, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025395185351274424, + "loss": 0.0221, "step": 118430 }, { - "epoch": 0.6, - "learning_rate": 0.00021036824394206173, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.0002539479652963728, + "loss": 0.0273, "step": 118440 }, { - "epoch": 0.6, - "learning_rate": 0.0002103606762490477, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.0002539440770800013, + "loss": 0.0191, "step": 118450 }, { - "epoch": 0.6, - "learning_rate": 0.00021035310855603372, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025394018886362984, + "loss": 0.0211, "step": 118460 }, { - "epoch": 0.6, - "learning_rate": 0.0002103455408630197, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002539363006472584, + "loss": 0.023, "step": 118470 }, { - "epoch": 0.6, - "learning_rate": 0.00021033797317000568, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.0002539324124308869, + "loss": 0.0215, "step": 118480 }, { - "epoch": 0.6, - "learning_rate": 0.0002103304054769917, - "loss": 0.0129, + "epoch": 0.31, + "learning_rate": 0.0002539285242145155, + "loss": 0.0231, "step": 118490 }, { - "epoch": 0.6, - "learning_rate": 0.00021032283778397767, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.000253924635998144, + "loss": 0.0247, "step": 118500 }, { - "epoch": 0.6, - "learning_rate": 0.00021031527009096365, - "loss": 0.0148, + "epoch": 0.31, + "learning_rate": 0.0002539207477817725, + "loss": 0.0252, "step": 118510 }, { - "epoch": 0.6, - "learning_rate": 0.00021030770239794966, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002539168595654011, + "loss": 0.0252, "step": 118520 }, { - "epoch": 0.6, - "learning_rate": 0.00021030013470493564, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002539129713490296, + "loss": 0.0214, "step": 118530 }, { - "epoch": 0.6, - "learning_rate": 0.00021029256701192163, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.0002539090831326581, + "loss": 0.0218, "step": 118540 }, { - "epoch": 0.6, - "learning_rate": 0.00021028499931890763, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002539051949162867, + "loss": 0.0194, "step": 118550 }, { - "epoch": 0.6, - "learning_rate": 0.00021027743162589362, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.00025390130669991525, + "loss": 0.02, "step": 118560 }, { - "epoch": 0.6, - "learning_rate": 0.0002102698639328796, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025389741848354377, + "loss": 0.024, "step": 118570 }, { - "epoch": 0.6, - "learning_rate": 0.00021026229623986558, - "loss": 0.0133, + "epoch": 0.31, + "learning_rate": 0.0002538935302671723, + "loss": 0.0187, "step": 118580 }, { - "epoch": 0.6, - "learning_rate": 0.0002102547285468516, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.0002538896420508008, + "loss": 0.0226, "step": 118590 }, { - "epoch": 0.6, - "learning_rate": 0.00021024716085383757, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002538857538344293, + "loss": 0.0191, "step": 118600 }, { - "epoch": 0.6, - "learning_rate": 0.00021023959316082355, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.0002538818656180579, + "loss": 0.026, "step": 118610 }, { - "epoch": 0.6, - "learning_rate": 0.00021023202546780956, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025387797740168645, + "loss": 0.0223, "step": 118620 }, { - "epoch": 0.6, - "learning_rate": 0.00021022445777479554, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025387408918531497, + "loss": 0.0209, "step": 118630 }, { - "epoch": 0.6, - "learning_rate": 0.00021021689008178152, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002538702009689435, + "loss": 0.0221, "step": 118640 }, { - "epoch": 0.6, - "learning_rate": 0.00021020932238876753, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025386631275257205, + "loss": 0.0205, "step": 118650 }, { - "epoch": 0.6, - "learning_rate": 0.0002102017546957535, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025386242453620056, + "loss": 0.0199, "step": 118660 }, { - "epoch": 0.6, - "learning_rate": 0.0002101941870027395, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.0002538585363198291, + "loss": 0.0172, "step": 118670 }, { - "epoch": 0.6, - "learning_rate": 0.0002101866193097255, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.00025385464810345765, + "loss": 0.0188, "step": 118680 }, { - "epoch": 0.6, - "learning_rate": 0.00021017905161671148, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025385075988708616, + "loss": 0.0229, "step": 118690 }, { - "epoch": 0.6, - "learning_rate": 0.00021017148392369746, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.00025384687167071473, + "loss": 0.0167, "step": 118700 }, { - "epoch": 0.6, - "learning_rate": 0.00021016391623068347, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025384298345434324, + "loss": 0.019, "step": 118710 }, { - "epoch": 0.6, - "learning_rate": 0.00021015634853766945, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025383909523797176, + "loss": 0.0179, "step": 118720 }, { - "epoch": 0.6, - "learning_rate": 0.00021014878084465544, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.00025383520702160033, + "loss": 0.0163, "step": 118730 }, { - "epoch": 0.6, - "learning_rate": 0.00021014121315164142, - "loss": 0.0123, + "epoch": 0.31, + "learning_rate": 0.00025383131880522884, + "loss": 0.0211, "step": 118740 }, { - "epoch": 0.6, - "learning_rate": 0.00021013364545862743, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.0002538274305888574, + "loss": 0.0199, "step": 118750 }, { - "epoch": 0.6, - "learning_rate": 0.0002101260777656134, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.0002538235423724859, + "loss": 0.0213, "step": 118760 }, { - "epoch": 0.6, - "learning_rate": 0.0002101185100725994, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.0002538196541561145, + "loss": 0.0189, "step": 118770 }, { - "epoch": 0.6, - "learning_rate": 0.00021011094237958534, - "loss": 0.0118, + "epoch": 0.31, + "learning_rate": 0.000253815765939743, + "loss": 0.016, "step": 118780 }, { - "epoch": 0.6, - "learning_rate": 0.00021010337468657135, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002538118777233715, + "loss": 0.0246, "step": 118790 }, { - "epoch": 0.6, - "learning_rate": 0.00021009580699355733, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.00025380798950700004, + "loss": 0.0209, "step": 118800 }, { - "epoch": 0.6, - "learning_rate": 0.00021008823930054331, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002538041012906286, + "loss": 0.0209, "step": 118810 }, { - "epoch": 0.6, - "learning_rate": 0.00021008067160752932, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.0002538002130742571, + "loss": 0.0254, "step": 118820 }, { - "epoch": 0.6, - "learning_rate": 0.0002100731039145153, - "loss": 0.0172, + "epoch": 0.31, + "learning_rate": 0.0002537963248578857, + "loss": 0.0237, "step": 118830 }, { - "epoch": 0.6, - "learning_rate": 0.00021006553622150129, - "loss": 0.0176, + "epoch": 0.31, + "learning_rate": 0.0002537924366415142, + "loss": 0.0206, "step": 118840 }, { - "epoch": 0.6, - "learning_rate": 0.0002100579685284873, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002537885484251427, + "loss": 0.023, "step": 118850 }, { - "epoch": 0.6, - "learning_rate": 0.00021005040083547328, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002537846602087713, + "loss": 0.0228, "step": 118860 }, { - "epoch": 0.6, - "learning_rate": 0.00021004283314245926, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.0002537807719923998, + "loss": 0.0221, "step": 118870 }, { - "epoch": 0.6, - "learning_rate": 0.00021003526544944527, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.0002537768837760283, + "loss": 0.0232, "step": 118880 }, { - "epoch": 0.6, - "learning_rate": 0.00021002769775643125, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.0002537729955596569, + "loss": 0.022, "step": 118890 }, { - "epoch": 0.6, - "learning_rate": 0.00021002013006341723, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025376910734328545, + "loss": 0.0168, "step": 118900 }, { - "epoch": 0.6, - "learning_rate": 0.00021001256237040324, - "loss": 0.0106, + "epoch": 0.31, + "learning_rate": 0.00025376521912691397, + "loss": 0.0212, "step": 118910 }, { - "epoch": 0.6, - "learning_rate": 0.00021000499467738922, - "loss": 0.0191, + "epoch": 0.31, + "learning_rate": 0.0002537613309105425, + "loss": 0.0207, "step": 118920 }, { - "epoch": 0.6, - "learning_rate": 0.0002099974269843752, - "loss": 0.0199, + "epoch": 0.31, + "learning_rate": 0.000253757442694171, + "loss": 0.0229, "step": 118930 }, { - "epoch": 0.6, - "learning_rate": 0.0002099898592913612, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.00025375355447779957, + "loss": 0.0207, "step": 118940 }, { - "epoch": 0.6, - "learning_rate": 0.0002099822915983472, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.0002537496662614281, + "loss": 0.0226, "step": 118950 }, { - "epoch": 0.6, - "learning_rate": 0.00020997472390533317, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.00025374577804505665, + "loss": 0.0188, "step": 118960 }, { - "epoch": 0.6, - "learning_rate": 0.00020996715621231915, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025374188982868516, + "loss": 0.0273, "step": 118970 }, { - "epoch": 0.6, - "learning_rate": 0.00020995958851930516, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025373800161231373, + "loss": 0.018, "step": 118980 }, { - "epoch": 0.6, - "learning_rate": 0.00020995202082629114, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.00025373411339594225, + "loss": 0.0232, "step": 118990 }, { - "epoch": 0.6, - "learning_rate": 0.00020994445313327712, - "loss": 0.0123, + "epoch": 0.31, + "learning_rate": 0.00025373022517957076, + "loss": 0.0183, "step": 119000 }, { - "epoch": 0.6, - "eval_cer": 0.9144935454101719, - "eval_loss": 0.010422189719974995, - "eval_runtime": 116.7072, - "eval_samples_per_second": 17.137, - "eval_steps_per_second": 4.284, + "epoch": 0.31, + "eval_cer": 0.8817894638130869, + "eval_loss": 0.01590069569647312, + "eval_runtime": 107.3244, + "eval_samples_per_second": 18.635, + "eval_steps_per_second": 4.659, "step": 119000 }, { - "epoch": 0.6, - "learning_rate": 0.00020993688544026313, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.0002537263369631993, + "loss": 0.0201, "step": 119010 }, { - "epoch": 0.6, - "learning_rate": 0.00020992931774724911, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.00025372244874682784, + "loss": 0.0195, "step": 119020 }, { - "epoch": 0.6, - "learning_rate": 0.0002099217500542351, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025371856053045636, + "loss": 0.0243, "step": 119030 }, { - "epoch": 0.6, - "learning_rate": 0.0002099141823612211, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025371467231408493, + "loss": 0.0203, "step": 119040 }, { - "epoch": 0.6, - "learning_rate": 0.00020990661466820709, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.00025371078409771344, + "loss": 0.0212, "step": 119050 }, { - "epoch": 0.6, - "learning_rate": 0.00020989904697519307, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.000253706895881342, + "loss": 0.021, "step": 119060 }, { - "epoch": 0.6, - "learning_rate": 0.00020989147928217908, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002537030076649705, + "loss": 0.0214, "step": 119070 }, { - "epoch": 0.6, - "learning_rate": 0.00020988391158916506, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.00025369911944859904, + "loss": 0.0175, "step": 119080 }, { - "epoch": 0.6, - "learning_rate": 0.00020987634389615104, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.00025369523123222756, + "loss": 0.0196, "step": 119090 }, { - "epoch": 0.6, - "learning_rate": 0.00020986877620313705, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002536913430158561, + "loss": 0.025, "step": 119100 }, { - "epoch": 0.6, - "learning_rate": 0.00020986120851012303, - "loss": 0.012, + "epoch": 0.31, + "learning_rate": 0.0002536874547994847, + "loss": 0.0209, "step": 119110 }, { - "epoch": 0.6, - "learning_rate": 0.000209853640817109, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002536835665831132, + "loss": 0.0221, "step": 119120 }, { - "epoch": 0.6, - "learning_rate": 0.000209846073124095, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.0002536796783667417, + "loss": 0.0219, "step": 119130 }, { - "epoch": 0.6, - "learning_rate": 0.000209838505431081, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.00025367579015037024, + "loss": 0.0196, "step": 119140 }, { - "epoch": 0.6, - "learning_rate": 0.00020983093773806698, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002536719019339988, + "loss": 0.0194, "step": 119150 }, { - "epoch": 0.6, - "learning_rate": 0.00020982337004505296, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.0002536680137176273, + "loss": 0.0205, "step": 119160 }, { - "epoch": 0.6, - "learning_rate": 0.00020981580235203897, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.0002536641255012559, + "loss": 0.0215, "step": 119170 }, { - "epoch": 0.6, - "learning_rate": 0.00020980823465902495, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002536602372848844, + "loss": 0.0177, "step": 119180 }, { - "epoch": 0.6, - "learning_rate": 0.00020980066696601093, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.00025365634906851297, + "loss": 0.0243, "step": 119190 }, { - "epoch": 0.6, - "learning_rate": 0.00020979309927299694, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.0002536524608521415, + "loss": 0.0204, "step": 119200 }, { - "epoch": 0.6, - "learning_rate": 0.00020978553157998292, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.00025364857263577, + "loss": 0.0201, "step": 119210 }, { - "epoch": 0.6, - "learning_rate": 0.0002097779638869689, - "loss": 0.0161, + "epoch": 0.31, + "learning_rate": 0.0002536446844193985, + "loss": 0.0267, "step": 119220 }, { - "epoch": 0.6, - "learning_rate": 0.00020977039619395491, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.0002536407962030271, + "loss": 0.026, "step": 119230 }, { - "epoch": 0.6, - "learning_rate": 0.0002097628285009409, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002536369079866556, + "loss": 0.0255, "step": 119240 }, { - "epoch": 0.6, - "learning_rate": 0.00020975526080792688, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.00025363301977028417, + "loss": 0.0215, "step": 119250 }, { - "epoch": 0.6, - "learning_rate": 0.00020974769311491289, - "loss": 0.0141, - "step": 119260 + "epoch": 0.31, + "learning_rate": 0.0002536291315539127, + "loss": 0.0256, + "step": 119260 }, { - "epoch": 0.6, - "learning_rate": 0.00020974012542189887, - "loss": 0.0148, + "epoch": 0.31, + "learning_rate": 0.00025362524333754125, + "loss": 0.0251, "step": 119270 }, { - "epoch": 0.6, - "learning_rate": 0.00020973255772888485, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.00025362135512116976, + "loss": 0.0196, "step": 119280 }, { - "epoch": 0.6, - "learning_rate": 0.00020972499003587083, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.0002536174669047983, + "loss": 0.019, "step": 119290 }, { - "epoch": 0.6, - "learning_rate": 0.00020971742234285684, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025361357868842685, + "loss": 0.0174, "step": 119300 }, { - "epoch": 0.6, - "learning_rate": 0.00020970985464984282, - "loss": 0.0168, + "epoch": 0.31, + "learning_rate": 0.00025360969047205536, + "loss": 0.023, "step": 119310 }, { - "epoch": 0.6, - "learning_rate": 0.0002097022869568288, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.00025360580225568393, + "loss": 0.0217, "step": 119320 }, { - "epoch": 0.6, - "learning_rate": 0.0002096947192638148, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.00025360191403931245, + "loss": 0.0207, "step": 119330 }, { - "epoch": 0.6, - "learning_rate": 0.0002096871515708008, - "loss": 0.0113, + "epoch": 0.31, + "learning_rate": 0.00025359802582294096, + "loss": 0.0217, "step": 119340 }, { - "epoch": 0.6, - "learning_rate": 0.00020967958387778677, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.0002535941376065695, + "loss": 0.0228, "step": 119350 }, { - "epoch": 0.6, - "learning_rate": 0.00020967201618477278, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025359024939019804, + "loss": 0.0221, "step": 119360 }, { - "epoch": 0.6, - "learning_rate": 0.00020966444849175876, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.00025358636117382656, + "loss": 0.019, "step": 119370 }, { - "epoch": 0.6, - "learning_rate": 0.00020965688079874474, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002535824729574551, + "loss": 0.0182, "step": 119380 }, { - "epoch": 0.6, - "learning_rate": 0.00020964931310573075, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.00025357858474108364, + "loss": 0.0196, "step": 119390 }, { - "epoch": 0.6, - "learning_rate": 0.00020964174541271673, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002535746965247122, + "loss": 0.0273, "step": 119400 }, { - "epoch": 0.6, - "learning_rate": 0.00020963417771970272, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002535708083083407, + "loss": 0.0263, "step": 119410 }, { - "epoch": 0.6, - "learning_rate": 0.00020962661002668872, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025356692009196924, + "loss": 0.0232, "step": 119420 }, { - "epoch": 0.6, - "learning_rate": 0.0002096190423336747, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025356303187559775, + "loss": 0.0197, "step": 119430 }, { - "epoch": 0.6, - "learning_rate": 0.0002096114746406607, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.0002535591436592263, + "loss": 0.0188, "step": 119440 }, { - "epoch": 0.6, - "learning_rate": 0.0002096039069476467, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002535552554428549, + "loss": 0.0196, "step": 119450 }, { - "epoch": 0.6, - "learning_rate": 0.00020959633925463268, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.0002535513672264834, + "loss": 0.0199, "step": 119460 }, { - "epoch": 0.6, - "learning_rate": 0.00020958877156161866, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002535474790101119, + "loss": 0.029, "step": 119470 }, { - "epoch": 0.6, - "learning_rate": 0.00020958120386860464, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.0002535435907937405, + "loss": 0.0221, "step": 119480 }, { - "epoch": 0.6, - "learning_rate": 0.00020957363617559065, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.000253539702577369, + "loss": 0.0217, "step": 119490 }, { - "epoch": 0.6, - "learning_rate": 0.00020956606848257663, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.0002535358143609975, + "loss": 0.0198, "step": 119500 }, { - "epoch": 0.6, - "learning_rate": 0.0002095585007895626, - "loss": 0.0122, + "epoch": 0.31, + "learning_rate": 0.0002535319261446261, + "loss": 0.0203, "step": 119510 }, { - "epoch": 0.6, - "learning_rate": 0.00020955093309654862, - "loss": 0.011, + "epoch": 0.31, + "learning_rate": 0.0002535280379282546, + "loss": 0.0198, "step": 119520 }, { - "epoch": 0.6, - "learning_rate": 0.0002095433654035346, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025352414971188317, + "loss": 0.0197, "step": 119530 }, { - "epoch": 0.6, - "learning_rate": 0.00020953579771052058, - "loss": 0.0115, + "epoch": 0.31, + "learning_rate": 0.0002535202614955117, + "loss": 0.0214, "step": 119540 }, { - "epoch": 0.6, - "learning_rate": 0.0002095282300175066, - "loss": 0.0141, + "epoch": 0.31, + "learning_rate": 0.0002535163732791402, + "loss": 0.02, "step": 119550 }, { - "epoch": 0.6, - "learning_rate": 0.00020952066232449257, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.00025351248506276877, + "loss": 0.0213, "step": 119560 }, { - "epoch": 0.6, - "learning_rate": 0.00020951309463147855, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002535085968463973, + "loss": 0.0279, "step": 119570 }, { - "epoch": 0.6, - "learning_rate": 0.00020950552693846456, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002535047086300258, + "loss": 0.0245, "step": 119580 }, { - "epoch": 0.6, - "learning_rate": 0.00020949795924545054, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025350082041365437, + "loss": 0.0212, "step": 119590 }, { - "epoch": 0.6, - "learning_rate": 0.00020949039155243653, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.0002534969321972829, + "loss": 0.0231, "step": 119600 }, { - "epoch": 0.6, - "learning_rate": 0.00020948282385942253, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.00025349304398091145, + "loss": 0.0271, "step": 119610 }, { - "epoch": 0.6, - "learning_rate": 0.00020947525616640852, - "loss": 0.0117, + "epoch": 0.31, + "learning_rate": 0.00025348915576453996, + "loss": 0.0231, "step": 119620 }, { - "epoch": 0.6, - "learning_rate": 0.0002094676884733945, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002534852675481685, + "loss": 0.0225, "step": 119630 }, { - "epoch": 0.6, - "learning_rate": 0.00020946012078038048, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.000253481379331797, + "loss": 0.0233, "step": 119640 }, { - "epoch": 0.6, - "learning_rate": 0.0002094525530873665, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025347749111542556, + "loss": 0.0263, "step": 119650 }, { - "epoch": 0.6, - "learning_rate": 0.00020944498539435247, - "loss": 0.0191, + "epoch": 0.31, + "learning_rate": 0.00025347360289905413, + "loss": 0.0222, "step": 119660 }, { - "epoch": 0.6, - "learning_rate": 0.00020943741770133845, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.00025346971468268264, + "loss": 0.0228, "step": 119670 }, { - "epoch": 0.6, - "learning_rate": 0.00020942985000832446, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.00025346582646631116, + "loss": 0.0186, "step": 119680 }, { - "epoch": 0.6, - "learning_rate": 0.00020942228231531044, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.00025346193824993973, + "loss": 0.0223, "step": 119690 }, { - "epoch": 0.6, - "learning_rate": 0.00020941471462229642, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.00025345805003356824, + "loss": 0.0225, "step": 119700 }, { - "epoch": 0.6, - "learning_rate": 0.00020940714692928243, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.00025345416181719676, + "loss": 0.0237, "step": 119710 }, { - "epoch": 0.6, - "learning_rate": 0.0002093995792362684, - "loss": 0.021, + "epoch": 0.31, + "learning_rate": 0.0002534502736008253, + "loss": 0.022, "step": 119720 }, { - "epoch": 0.6, - "learning_rate": 0.0002093920115432544, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025344638538445384, + "loss": 0.0168, "step": 119730 }, { - "epoch": 0.6, - "learning_rate": 0.0002093844438502404, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.0002534424971680824, + "loss": 0.0217, "step": 119740 }, { - "epoch": 0.6, - "learning_rate": 0.00020937687615722638, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002534386089517109, + "loss": 0.0207, "step": 119750 }, { - "epoch": 0.6, - "learning_rate": 0.00020936930846421236, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.00025343472073533944, + "loss": 0.0375, "step": 119760 }, { - "epoch": 0.6, - "learning_rate": 0.00020936174077119837, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.000253430832518968, + "loss": 0.025, "step": 119770 }, { - "epoch": 0.6, - "learning_rate": 0.00020935417307818435, - "loss": 0.0162, + "epoch": 0.31, + "learning_rate": 0.0002534269443025965, + "loss": 0.0153, "step": 119780 }, { - "epoch": 0.6, - "learning_rate": 0.00020934660538517034, - "loss": 0.0112, + "epoch": 0.31, + "learning_rate": 0.00025342305608622504, + "loss": 0.0274, "step": 119790 }, { - "epoch": 0.6, - "learning_rate": 0.00020933903769215632, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002534191678698536, + "loss": 0.0189, "step": 119800 }, { - "epoch": 0.6, - "learning_rate": 0.00020933146999914233, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.0002534152796534822, + "loss": 0.0216, "step": 119810 }, { - "epoch": 0.6, - "learning_rate": 0.0002093239023061283, - "loss": 0.0204, + "epoch": 0.31, + "learning_rate": 0.0002534113914371107, + "loss": 0.0214, "step": 119820 }, { - "epoch": 0.6, - "learning_rate": 0.0002093163346131143, - "loss": 0.0165, + "epoch": 0.31, + "learning_rate": 0.0002534075032207392, + "loss": 0.0193, "step": 119830 }, { - "epoch": 0.6, - "learning_rate": 0.0002093087669201003, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002534036150043677, + "loss": 0.0212, "step": 119840 }, { - "epoch": 0.6, - "learning_rate": 0.00020930119922708628, - "loss": 0.0148, + "epoch": 0.31, + "learning_rate": 0.0002533997267879963, + "loss": 0.0262, "step": 119850 }, { - "epoch": 0.6, - "learning_rate": 0.00020929363153407226, - "loss": 0.0122, + "epoch": 0.31, + "learning_rate": 0.0002533958385716248, + "loss": 0.0227, "step": 119860 }, { - "epoch": 0.6, - "learning_rate": 0.00020928606384105827, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.00025339195035525337, + "loss": 0.0193, "step": 119870 }, { - "epoch": 0.6, - "learning_rate": 0.00020927849614804425, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002533880621388819, + "loss": 0.0178, "step": 119880 }, { - "epoch": 0.6, - "learning_rate": 0.00020927092845503023, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002533841739225104, + "loss": 0.0253, "step": 119890 }, { - "epoch": 0.6, - "learning_rate": 0.00020926336076201624, - "loss": 0.0159, + "epoch": 0.31, + "learning_rate": 0.00025338028570613897, + "loss": 0.0181, "step": 119900 }, { - "epoch": 0.6, - "learning_rate": 0.00020925579306900222, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002533763974897675, + "loss": 0.0215, "step": 119910 }, { - "epoch": 0.61, - "learning_rate": 0.0002092482253759882, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.000253372509273396, + "loss": 0.0196, "step": 119920 }, { - "epoch": 0.61, - "learning_rate": 0.0002092406576829742, - "loss": 0.0276, + "epoch": 0.31, + "learning_rate": 0.00025336862105702456, + "loss": 0.0246, "step": 119930 }, { - "epoch": 0.61, - "learning_rate": 0.0002092330899899602, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002533647328406531, + "loss": 0.0221, "step": 119940 }, { - "epoch": 0.61, - "learning_rate": 0.00020922552229694617, - "loss": 0.019, + "epoch": 0.31, + "learning_rate": 0.00025336084462428165, + "loss": 0.0208, "step": 119950 }, { - "epoch": 0.61, - "learning_rate": 0.00020921795460393218, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025335695640791016, + "loss": 0.0248, "step": 119960 }, { - "epoch": 0.61, - "learning_rate": 0.00020921038691091816, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.0002533530681915387, + "loss": 0.028, "step": 119970 }, { - "epoch": 0.61, - "learning_rate": 0.00020920281921790415, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.00025334917997516725, + "loss": 0.0217, "step": 119980 }, { - "epoch": 0.61, - "learning_rate": 0.00020919525152489013, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.00025334529175879576, + "loss": 0.0274, "step": 119990 }, { - "epoch": 0.61, - "learning_rate": 0.00020918768383187614, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025334140354242433, + "loss": 0.0192, "step": 120000 }, { - "epoch": 0.61, - "eval_cer": 0.9144925750140465, - "eval_loss": 0.0107016796246171, - "eval_runtime": 116.8152, - "eval_samples_per_second": 17.121, - "eval_steps_per_second": 4.28, + "epoch": 0.31, + "eval_cer": 0.8818244547364413, + "eval_loss": 0.015779657289385796, + "eval_runtime": 107.2547, + "eval_samples_per_second": 18.647, + "eval_steps_per_second": 4.662, "step": 120000 }, { - "epoch": 0.61, - "learning_rate": 0.00020918011613886212, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.00025333751532605284, + "loss": 0.0188, "step": 120010 }, { - "epoch": 0.61, - "learning_rate": 0.0002091725484458481, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002533336271096814, + "loss": 0.0222, "step": 120020 }, { - "epoch": 0.61, - "learning_rate": 0.0002091649807528341, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002533297388933099, + "loss": 0.0204, "step": 120030 }, { - "epoch": 0.61, - "learning_rate": 0.00020915741305982006, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.00025332585067693844, + "loss": 0.0215, "step": 120040 }, { - "epoch": 0.61, - "learning_rate": 0.00020914984536680604, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.00025332196246056696, + "loss": 0.0209, "step": 120050 }, { - "epoch": 0.61, - "learning_rate": 0.00020914227767379202, - "loss": 0.0129, + "epoch": 0.31, + "learning_rate": 0.0002533180742441955, + "loss": 0.023, "step": 120060 }, { - "epoch": 0.61, - "learning_rate": 0.00020913470998077803, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.00025331418602782404, + "loss": 0.0249, "step": 120070 }, { - "epoch": 0.61, - "learning_rate": 0.00020912714228776401, - "loss": 0.0199, + "epoch": 0.31, + "learning_rate": 0.0002533102978114526, + "loss": 0.0184, "step": 120080 }, { - "epoch": 0.61, - "learning_rate": 0.00020911957459475, - "loss": 0.0168, + "epoch": 0.31, + "learning_rate": 0.0002533064095950811, + "loss": 0.0216, "step": 120090 }, { - "epoch": 0.61, - "learning_rate": 0.000209112006901736, - "loss": 0.0181, + "epoch": 0.31, + "learning_rate": 0.00025330252137870964, + "loss": 0.021, "step": 120100 }, { - "epoch": 0.61, - "learning_rate": 0.00020910443920872199, - "loss": 0.0154, + "epoch": 0.31, + "learning_rate": 0.0002532986331623382, + "loss": 0.0233, "step": 120110 }, { - "epoch": 0.61, - "learning_rate": 0.00020909687151570797, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.0002532947449459667, + "loss": 0.0195, "step": 120120 }, { - "epoch": 0.61, - "learning_rate": 0.00020908930382269398, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.00025329085672959523, + "loss": 0.021, "step": 120130 }, { - "epoch": 0.61, - "learning_rate": 0.00020908173612967996, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.0002532869685132238, + "loss": 0.0314, "step": 120140 }, { - "epoch": 0.61, - "learning_rate": 0.00020907416843666594, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.00025328308029685237, + "loss": 0.0195, "step": 120150 }, { - "epoch": 0.61, - "learning_rate": 0.00020906660074365195, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.0002532791920804809, + "loss": 0.0249, "step": 120160 }, { - "epoch": 0.61, - "learning_rate": 0.00020905903305063793, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.0002532753038641094, + "loss": 0.025, "step": 120170 }, { - "epoch": 0.61, - "learning_rate": 0.0002090514653576239, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.0002532714156477379, + "loss": 0.0184, "step": 120180 }, { - "epoch": 0.61, - "learning_rate": 0.0002090438976646099, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002532675274313665, + "loss": 0.0183, "step": 120190 }, { - "epoch": 0.61, - "learning_rate": 0.0002090363299715959, - "loss": 0.0133, + "epoch": 0.31, + "learning_rate": 0.000253263639214995, + "loss": 0.0205, "step": 120200 }, { - "epoch": 0.61, - "learning_rate": 0.00020902876227858188, - "loss": 0.0129, + "epoch": 0.31, + "learning_rate": 0.00025325975099862357, + "loss": 0.023, "step": 120210 }, { - "epoch": 0.61, - "learning_rate": 0.00020902119458556786, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002532558627822521, + "loss": 0.0265, "step": 120220 }, { - "epoch": 0.61, - "learning_rate": 0.00020901362689255387, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025325197456588065, + "loss": 0.0284, "step": 120230 }, { - "epoch": 0.61, - "learning_rate": 0.00020900605919953985, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025324808634950917, + "loss": 0.0227, "step": 120240 }, { - "epoch": 0.61, - "learning_rate": 0.00020899849150652583, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.0002532441981331377, + "loss": 0.0238, "step": 120250 }, { - "epoch": 0.61, - "learning_rate": 0.00020899092381351184, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.0002532403099167662, + "loss": 0.0244, "step": 120260 }, { - "epoch": 0.61, - "learning_rate": 0.00020898335612049782, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.00025323642170039476, + "loss": 0.0201, "step": 120270 }, { - "epoch": 0.61, - "learning_rate": 0.0002089757884274838, - "loss": 0.0173, + "epoch": 0.31, + "learning_rate": 0.0002532325334840233, + "loss": 0.0197, "step": 120280 }, { - "epoch": 0.61, - "learning_rate": 0.00020896822073446981, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.00025322864526765185, + "loss": 0.0228, "step": 120290 }, { - "epoch": 0.61, - "learning_rate": 0.0002089606530414558, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025322475705128036, + "loss": 0.0239, "step": 120300 }, { - "epoch": 0.61, - "learning_rate": 0.00020895308534844178, - "loss": 0.0184, + "epoch": 0.31, + "learning_rate": 0.00025322086883490893, + "loss": 0.0221, "step": 120310 }, { - "epoch": 0.61, - "learning_rate": 0.00020894551765542779, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025321698061853744, + "loss": 0.0221, "step": 120320 }, { - "epoch": 0.61, - "learning_rate": 0.00020893794996241377, - "loss": 0.0196, + "epoch": 0.31, + "learning_rate": 0.00025321309240216596, + "loss": 0.0271, "step": 120330 }, { - "epoch": 0.61, - "learning_rate": 0.00020893038226939975, - "loss": 0.0188, + "epoch": 0.31, + "learning_rate": 0.0002532092041857945, + "loss": 0.0165, "step": 120340 }, { - "epoch": 0.61, - "learning_rate": 0.00020892281457638576, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025320531596942304, + "loss": 0.0212, "step": 120350 }, { - "epoch": 0.61, - "learning_rate": 0.00020891524688337174, - "loss": 0.0193, + "epoch": 0.31, + "learning_rate": 0.0002532014277530516, + "loss": 0.0216, "step": 120360 }, { - "epoch": 0.61, - "learning_rate": 0.00020890767919035772, - "loss": 0.0121, + "epoch": 0.31, + "learning_rate": 0.0002531975395366801, + "loss": 0.0253, "step": 120370 }, { - "epoch": 0.61, - "learning_rate": 0.0002089001114973437, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.00025319365132030864, + "loss": 0.0224, "step": 120380 }, { - "epoch": 0.61, - "learning_rate": 0.0002088925438043297, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025318976310393715, + "loss": 0.0218, "step": 120390 }, { - "epoch": 0.61, - "learning_rate": 0.0002088849761113157, - "loss": 0.0119, + "epoch": 0.31, + "learning_rate": 0.0002531858748875657, + "loss": 0.0203, "step": 120400 }, { - "epoch": 0.61, - "learning_rate": 0.00020887740841830167, - "loss": 0.0116, + "epoch": 0.31, + "learning_rate": 0.00025318198667119424, + "loss": 0.0248, "step": 120410 }, { - "epoch": 0.61, - "learning_rate": 0.00020886984072528768, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002531780984548228, + "loss": 0.0233, "step": 120420 }, { - "epoch": 0.61, - "learning_rate": 0.00020886227303227366, - "loss": 0.0198, + "epoch": 0.31, + "learning_rate": 0.0002531742102384513, + "loss": 0.0258, "step": 120430 }, { - "epoch": 0.61, - "learning_rate": 0.00020885470533925964, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002531703220220799, + "loss": 0.0204, "step": 120440 }, { - "epoch": 0.61, - "learning_rate": 0.00020884713764624565, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002531664338057084, + "loss": 0.0221, "step": 120450 }, { - "epoch": 0.61, - "learning_rate": 0.00020883956995323163, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.0002531625455893369, + "loss": 0.0202, "step": 120460 }, { - "epoch": 0.61, - "learning_rate": 0.00020883200226021762, - "loss": 0.0122, + "epoch": 0.31, + "learning_rate": 0.00025315865737296543, + "loss": 0.0231, "step": 120470 }, { - "epoch": 0.61, - "learning_rate": 0.00020882443456720362, - "loss": 0.0163, + "epoch": 0.31, + "learning_rate": 0.000253154769156594, + "loss": 0.019, "step": 120480 }, { - "epoch": 0.61, - "learning_rate": 0.0002088168668741896, - "loss": 0.0124, + "epoch": 0.31, + "learning_rate": 0.00025315088094022257, + "loss": 0.0284, "step": 120490 }, { - "epoch": 0.61, - "learning_rate": 0.0002088092991811756, - "loss": 0.0133, + "epoch": 0.31, + "learning_rate": 0.0002531469927238511, + "loss": 0.021, "step": 120500 }, { - "epoch": 0.61, - "learning_rate": 0.0002088017314881616, - "loss": 0.0107, + "epoch": 0.31, + "learning_rate": 0.0002531431045074796, + "loss": 0.0211, "step": 120510 }, { - "epoch": 0.61, - "learning_rate": 0.00020879416379514758, - "loss": 0.0141, + "epoch": 0.31, + "learning_rate": 0.00025313921629110817, + "loss": 0.02, "step": 120520 }, { - "epoch": 0.61, - "learning_rate": 0.00020878659610213356, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002531353280747367, + "loss": 0.0216, "step": 120530 }, { - "epoch": 0.61, - "learning_rate": 0.00020877902840911954, - "loss": 0.0169, + "epoch": 0.31, + "learning_rate": 0.0002531314398583652, + "loss": 0.02, "step": 120540 }, { - "epoch": 0.61, - "learning_rate": 0.00020877146071610555, - "loss": 0.016, + "epoch": 0.31, + "learning_rate": 0.00025312755164199377, + "loss": 0.0221, "step": 120550 }, { - "epoch": 0.61, - "learning_rate": 0.00020876389302309153, - "loss": 0.0174, + "epoch": 0.31, + "learning_rate": 0.0002531236634256223, + "loss": 0.0222, "step": 120560 }, { - "epoch": 0.61, - "learning_rate": 0.0002087563253300775, - "loss": 0.0186, + "epoch": 0.31, + "learning_rate": 0.00025311977520925085, + "loss": 0.0253, "step": 120570 }, { - "epoch": 0.61, - "learning_rate": 0.00020874875763706352, - "loss": 0.0281, + "epoch": 0.31, + "learning_rate": 0.00025311588699287936, + "loss": 0.0226, "step": 120580 }, { - "epoch": 0.61, - "learning_rate": 0.0002087411899440495, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002531119987765079, + "loss": 0.0218, "step": 120590 }, { - "epoch": 0.61, - "learning_rate": 0.00020873362225103548, - "loss": 0.0112, + "epoch": 0.31, + "learning_rate": 0.0002531081105601364, + "loss": 0.0267, "step": 120600 }, { - "epoch": 0.61, - "learning_rate": 0.0002087260545580215, - "loss": 0.018, + "epoch": 0.31, + "learning_rate": 0.00025310422234376496, + "loss": 0.0252, "step": 120610 }, { - "epoch": 0.61, - "learning_rate": 0.00020871848686500747, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002531003341273935, + "loss": 0.0192, "step": 120620 }, { - "epoch": 0.61, - "learning_rate": 0.00020871091917199345, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.00025309644591102205, + "loss": 0.0202, "step": 120630 }, { - "epoch": 0.61, - "learning_rate": 0.00020870335147897946, - "loss": 0.0145, + "epoch": 0.31, + "learning_rate": 0.00025309255769465056, + "loss": 0.0211, "step": 120640 }, { - "epoch": 0.61, - "learning_rate": 0.00020869578378596544, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.00025308866947827913, + "loss": 0.0169, "step": 120650 }, { - "epoch": 0.61, - "learning_rate": 0.00020868821609295143, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.00025308478126190764, + "loss": 0.0209, "step": 120660 }, { - "epoch": 0.61, - "learning_rate": 0.00020868064839993743, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025308089304553616, + "loss": 0.0205, "step": 120670 }, { - "epoch": 0.61, - "learning_rate": 0.00020867308070692342, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025307700482916467, + "loss": 0.0186, "step": 120680 }, { - "epoch": 0.61, - "learning_rate": 0.0002086655130139094, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.00025307311661279324, + "loss": 0.0213, "step": 120690 }, { - "epoch": 0.61, - "learning_rate": 0.00020865794532089538, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002530692283964218, + "loss": 0.0186, "step": 120700 }, { - "epoch": 0.61, - "learning_rate": 0.0002086503776278814, - "loss": 0.0199, + "epoch": 0.31, + "learning_rate": 0.0002530653401800503, + "loss": 0.022, "step": 120710 }, { - "epoch": 0.61, - "learning_rate": 0.00020864280993486737, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025306145196367884, + "loss": 0.0214, "step": 120720 }, { - "epoch": 0.61, - "learning_rate": 0.00020863524224185335, - "loss": 0.0137, + "epoch": 0.31, + "learning_rate": 0.0002530575637473074, + "loss": 0.018, "step": 120730 }, { - "epoch": 0.61, - "learning_rate": 0.00020862767454883936, - "loss": 0.0138, + "epoch": 0.31, + "learning_rate": 0.0002530536755309359, + "loss": 0.0217, "step": 120740 }, { - "epoch": 0.61, - "learning_rate": 0.00020862010685582534, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025304978731456444, + "loss": 0.0224, "step": 120750 }, { - "epoch": 0.61, - "learning_rate": 0.00020861253916281132, - "loss": 0.0144, + "epoch": 0.31, + "learning_rate": 0.000253045899098193, + "loss": 0.0227, "step": 120760 }, { - "epoch": 0.61, - "learning_rate": 0.00020860497146979733, - "loss": 0.0176, + "epoch": 0.31, + "learning_rate": 0.0002530420108818215, + "loss": 0.026, "step": 120770 }, { - "epoch": 0.61, - "learning_rate": 0.0002085974037767833, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.0002530381226654501, + "loss": 0.02, "step": 120780 }, { - "epoch": 0.61, - "learning_rate": 0.0002085898360837693, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002530342344490786, + "loss": 0.0237, "step": 120790 }, { - "epoch": 0.61, - "learning_rate": 0.0002085822683907553, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002530303462327071, + "loss": 0.0217, "step": 120800 }, { - "epoch": 0.61, - "learning_rate": 0.00020857470069774128, - "loss": 0.0111, + "epoch": 0.31, + "learning_rate": 0.0002530264580163357, + "loss": 0.022, "step": 120810 }, { - "epoch": 0.61, - "learning_rate": 0.00020856713300472726, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002530225697999642, + "loss": 0.0209, "step": 120820 }, { - "epoch": 0.61, - "learning_rate": 0.00020855956531171327, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002530186815835927, + "loss": 0.0259, "step": 120830 }, { - "epoch": 0.61, - "learning_rate": 0.00020855199761869925, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.0002530147933672213, + "loss": 0.0202, "step": 120840 }, { - "epoch": 0.61, - "learning_rate": 0.00020854442992568524, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.0002530109051508498, + "loss": 0.0181, "step": 120850 }, { - "epoch": 0.61, - "learning_rate": 0.00020853686223267124, - "loss": 0.0151, + "epoch": 0.31, + "learning_rate": 0.00025300701693447837, + "loss": 0.0178, "step": 120860 }, { - "epoch": 0.61, - "learning_rate": 0.00020852929453965723, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.0002530031287181069, + "loss": 0.0198, "step": 120870 }, { - "epoch": 0.61, - "learning_rate": 0.0002085217268466432, - "loss": 0.0119, + "epoch": 0.31, + "learning_rate": 0.0002529992405017354, + "loss": 0.0252, "step": 120880 }, { - "epoch": 0.61, - "learning_rate": 0.0002085141591536292, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.00025299535228536397, + "loss": 0.0201, "step": 120890 }, { - "epoch": 0.61, - "learning_rate": 0.0002085065914606152, - "loss": 0.017, + "epoch": 0.31, + "learning_rate": 0.0002529914640689925, + "loss": 0.018, "step": 120900 }, { - "epoch": 0.61, - "learning_rate": 0.00020849902376760118, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.00025298757585262105, + "loss": 0.0197, "step": 120910 }, { - "epoch": 0.61, - "learning_rate": 0.00020849145607458716, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.00025298368763624956, + "loss": 0.0238, "step": 120920 }, { - "epoch": 0.61, - "learning_rate": 0.00020848388838157317, - "loss": 0.0156, + "epoch": 0.31, + "learning_rate": 0.0002529797994198781, + "loss": 0.0183, "step": 120930 }, { - "epoch": 0.61, - "learning_rate": 0.00020847632068855915, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025297591120350665, + "loss": 0.0201, "step": 120940 }, { - "epoch": 0.61, - "learning_rate": 0.00020846875299554513, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025297202298713516, + "loss": 0.0222, "step": 120950 }, { - "epoch": 0.61, - "learning_rate": 0.00020846118530253114, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.0002529681347707637, + "loss": 0.0182, "step": 120960 }, { - "epoch": 0.61, - "learning_rate": 0.00020845361760951712, - "loss": 0.0167, + "epoch": 0.31, + "learning_rate": 0.00025296424655439224, + "loss": 0.0213, "step": 120970 }, { - "epoch": 0.61, - "learning_rate": 0.0002084460499165031, - "loss": 0.0149, + "epoch": 0.31, + "learning_rate": 0.00025296035833802076, + "loss": 0.0224, "step": 120980 }, { - "epoch": 0.61, - "learning_rate": 0.0002084384822234891, - "loss": 0.0136, + "epoch": 0.31, + "learning_rate": 0.00025295647012164933, + "loss": 0.0173, "step": 120990 }, { - "epoch": 0.61, - "learning_rate": 0.0002084309145304751, - "loss": 0.0164, + "epoch": 0.31, + "learning_rate": 0.00025295258190527784, + "loss": 0.0219, "step": 121000 }, { - "epoch": 0.61, - "eval_cer": 0.9144799598644162, - "eval_loss": 0.010320211760699749, - "eval_runtime": 116.7947, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.31, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.015187835320830345, + "eval_runtime": 107.3871, + "eval_samples_per_second": 18.624, + "eval_steps_per_second": 4.656, "step": 121000 }, { - "epoch": 0.61, - "learning_rate": 0.00020842334683746107, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.00025294869368890636, + "loss": 0.0245, "step": 121010 }, { - "epoch": 0.61, - "learning_rate": 0.00020841577914444708, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.0002529448054725349, + "loss": 0.0248, "step": 121020 }, { - "epoch": 0.61, - "learning_rate": 0.00020840821145143306, - "loss": 0.0111, + "epoch": 0.31, + "learning_rate": 0.00025294091725616344, + "loss": 0.0209, "step": 121030 }, { - "epoch": 0.61, - "learning_rate": 0.00020840064375841905, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.000252937029039792, + "loss": 0.0217, "step": 121040 }, { - "epoch": 0.61, - "learning_rate": 0.00020839307606540503, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002529331408234205, + "loss": 0.0222, "step": 121050 }, { - "epoch": 0.61, - "learning_rate": 0.00020838550837239104, - "loss": 0.0125, + "epoch": 0.31, + "learning_rate": 0.0002529292526070491, + "loss": 0.0213, "step": 121060 }, { - "epoch": 0.61, - "learning_rate": 0.00020837794067937702, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002529253643906776, + "loss": 0.0208, "step": 121070 }, { - "epoch": 0.61, - "learning_rate": 0.000208370372986363, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002529214761743061, + "loss": 0.0194, "step": 121080 }, { - "epoch": 0.61, - "learning_rate": 0.000208362805293349, - "loss": 0.015, + "epoch": 0.31, + "learning_rate": 0.00025291758795793464, + "loss": 0.0206, "step": 121090 }, { - "epoch": 0.61, - "learning_rate": 0.000208355237600335, - "loss": 0.0185, + "epoch": 0.31, + "learning_rate": 0.0002529136997415632, + "loss": 0.0216, "step": 121100 }, { - "epoch": 0.61, - "learning_rate": 0.00020834766990732097, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002529098115251917, + "loss": 0.0208, "step": 121110 }, { - "epoch": 0.61, - "learning_rate": 0.00020834010221430698, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002529059233088203, + "loss": 0.0183, "step": 121120 }, { - "epoch": 0.61, - "learning_rate": 0.00020833253452129296, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002529020350924488, + "loss": 0.0198, "step": 121130 }, { - "epoch": 0.61, - "learning_rate": 0.00020832496682827894, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.0002528981468760773, + "loss": 0.0227, "step": 121140 }, { - "epoch": 0.61, - "learning_rate": 0.00020831739913526495, - "loss": 0.0155, + "epoch": 0.31, + "learning_rate": 0.0002528942586597059, + "loss": 0.0174, "step": 121150 }, { - "epoch": 0.61, - "learning_rate": 0.00020830983144225093, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.0002528903704433344, + "loss": 0.0201, "step": 121160 }, { - "epoch": 0.61, - "learning_rate": 0.0002083022637492369, - "loss": 0.0139, + "epoch": 0.31, + "learning_rate": 0.0002528864822269629, + "loss": 0.0207, "step": 121170 }, { - "epoch": 0.61, - "learning_rate": 0.00020829469605622292, - "loss": 0.0123, + "epoch": 0.31, + "learning_rate": 0.0002528825940105915, + "loss": 0.0196, "step": 121180 }, { - "epoch": 0.61, - "learning_rate": 0.0002082871283632089, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.00025287870579422005, + "loss": 0.0244, "step": 121190 }, { - "epoch": 0.61, - "learning_rate": 0.00020827956067019488, - "loss": 0.0135, + "epoch": 0.31, + "learning_rate": 0.00025287481757784857, + "loss": 0.0205, "step": 121200 }, { - "epoch": 0.61, - "learning_rate": 0.00020827199297718087, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.0002528709293614771, + "loss": 0.0209, "step": 121210 }, { - "epoch": 0.61, - "learning_rate": 0.00020826442528416687, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002528670411451056, + "loss": 0.021, "step": 121220 }, { - "epoch": 0.61, - "learning_rate": 0.00020825685759115286, - "loss": 0.0178, + "epoch": 0.31, + "learning_rate": 0.00025286315292873416, + "loss": 0.0207, "step": 121230 }, { - "epoch": 0.61, - "learning_rate": 0.00020824928989813884, - "loss": 0.013, + "epoch": 0.31, + "learning_rate": 0.0002528592647123627, + "loss": 0.0232, "step": 121240 }, { - "epoch": 0.61, - "learning_rate": 0.00020824172220512485, - "loss": 0.012, + "epoch": 0.31, + "learning_rate": 0.00025285537649599125, + "loss": 0.0245, "step": 121250 }, { - "epoch": 0.61, - "learning_rate": 0.00020823415451211083, - "loss": 0.0182, + "epoch": 0.31, + "learning_rate": 0.00025285148827961976, + "loss": 0.0224, "step": 121260 }, { - "epoch": 0.61, - "learning_rate": 0.0002082265868190968, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025284760006324833, + "loss": 0.0206, "step": 121270 }, { - "epoch": 0.61, - "learning_rate": 0.00020821901912608282, - "loss": 0.0131, + "epoch": 0.31, + "learning_rate": 0.00025284371184687685, + "loss": 0.0188, "step": 121280 }, { - "epoch": 0.61, - "learning_rate": 0.00020821145143306877, - "loss": 0.0132, + "epoch": 0.31, + "learning_rate": 0.00025283982363050536, + "loss": 0.0211, "step": 121290 }, { - "epoch": 0.61, - "learning_rate": 0.00020820388374005475, - "loss": 0.0175, + "epoch": 0.31, + "learning_rate": 0.0002528359354141339, + "loss": 0.0218, "step": 121300 }, { - "epoch": 0.61, - "learning_rate": 0.00020819631604704073, - "loss": 0.014, + "epoch": 0.31, + "learning_rate": 0.00025283204719776244, + "loss": 0.0212, "step": 121310 }, { - "epoch": 0.61, - "learning_rate": 0.00020818874835402674, - "loss": 0.0147, + "epoch": 0.31, + "learning_rate": 0.00025282815898139096, + "loss": 0.0267, "step": 121320 }, { - "epoch": 0.61, - "learning_rate": 0.00020818118066101272, - "loss": 0.0177, + "epoch": 0.31, + "learning_rate": 0.0002528242707650195, + "loss": 0.0202, "step": 121330 }, { - "epoch": 0.61, - "learning_rate": 0.0002081736129679987, - "loss": 0.0204, + "epoch": 0.31, + "learning_rate": 0.00025282038254864804, + "loss": 0.0201, "step": 121340 }, { - "epoch": 0.61, - "learning_rate": 0.00020816604527498471, - "loss": 0.0134, + "epoch": 0.31, + "learning_rate": 0.00025281649433227656, + "loss": 0.0165, "step": 121350 }, { - "epoch": 0.61, - "learning_rate": 0.0002081584775819707, - "loss": 0.0176, + "epoch": 0.31, + "learning_rate": 0.0002528126061159051, + "loss": 0.0182, "step": 121360 }, { - "epoch": 0.61, - "learning_rate": 0.00020815090988895668, - "loss": 0.0171, + "epoch": 0.31, + "learning_rate": 0.00025280871789953364, + "loss": 0.0164, "step": 121370 }, { - "epoch": 0.61, - "learning_rate": 0.00020814334219594269, - "loss": 0.0166, + "epoch": 0.31, + "learning_rate": 0.00025280482968316215, + "loss": 0.0263, "step": 121380 }, { - "epoch": 0.61, - "learning_rate": 0.00020813577450292867, - "loss": 0.0158, + "epoch": 0.31, + "learning_rate": 0.0002528009414667907, + "loss": 0.0191, "step": 121390 }, { - "epoch": 0.61, - "learning_rate": 0.00020812820680991465, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.0002527970532504193, + "loss": 0.018, "step": 121400 }, { - "epoch": 0.61, - "learning_rate": 0.00020812063911690066, - "loss": 0.0157, + "epoch": 0.31, + "learning_rate": 0.0002527931650340478, + "loss": 0.0179, "step": 121410 }, { - "epoch": 0.61, - "learning_rate": 0.00020811307142388664, - "loss": 0.0127, + "epoch": 0.31, + "learning_rate": 0.0002527892768176763, + "loss": 0.0237, "step": 121420 }, { - "epoch": 0.61, - "learning_rate": 0.00020810550373087262, - "loss": 0.0142, + "epoch": 0.31, + "learning_rate": 0.00025278538860130483, + "loss": 0.0168, "step": 121430 }, { - "epoch": 0.61, - "learning_rate": 0.0002080979360378586, - "loss": 0.0117, + "epoch": 0.31, + "learning_rate": 0.0002527815003849334, + "loss": 0.0226, "step": 121440 }, { - "epoch": 0.61, - "learning_rate": 0.0002080903683448446, - "loss": 0.0126, + "epoch": 0.31, + "learning_rate": 0.0002527776121685619, + "loss": 0.0178, "step": 121450 }, { - "epoch": 0.61, - "learning_rate": 0.0002080828006518306, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.0002527737239521905, + "loss": 0.0236, "step": 121460 }, { - "epoch": 0.61, - "learning_rate": 0.00020807523295881657, - "loss": 0.0128, + "epoch": 0.31, + "learning_rate": 0.000252769835735819, + "loss": 0.0255, "step": 121470 }, { - "epoch": 0.61, - "learning_rate": 0.00020806766526580258, - "loss": 0.0146, + "epoch": 0.31, + "learning_rate": 0.00025276594751944757, + "loss": 0.0256, "step": 121480 }, { - "epoch": 0.61, - "learning_rate": 0.00020806009757278856, - "loss": 0.0152, + "epoch": 0.31, + "learning_rate": 0.0002527620593030761, + "loss": 0.0208, "step": 121490 }, { - "epoch": 0.61, - "learning_rate": 0.00020805252987977455, - "loss": 0.0143, + "epoch": 0.31, + "learning_rate": 0.0002527581710867046, + "loss": 0.0197, "step": 121500 }, { - "epoch": 0.61, - "learning_rate": 0.00020804496218676055, - "loss": 0.0154, + "epoch": 0.31, + "learning_rate": 0.0002527542828703331, + "loss": 0.0202, "step": 121510 }, { - "epoch": 0.61, - "learning_rate": 0.00020803739449374654, - "loss": 0.0153, + "epoch": 0.31, + "learning_rate": 0.0002527503946539617, + "loss": 0.0247, "step": 121520 }, { - "epoch": 0.61, - "learning_rate": 0.00020802982680073252, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002527465064375902, + "loss": 0.0168, "step": 121530 }, { - "epoch": 0.61, - "learning_rate": 0.00020802225910771853, - "loss": 0.0113, + "epoch": 0.32, + "learning_rate": 0.00025274261822121877, + "loss": 0.0154, "step": 121540 }, { - "epoch": 0.61, - "learning_rate": 0.0002080146914147045, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.0002527387300048473, + "loss": 0.0227, "step": 121550 }, { - "epoch": 0.61, - "learning_rate": 0.0002080071237216905, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.00025273484178847585, + "loss": 0.0195, "step": 121560 }, { - "epoch": 0.61, - "learning_rate": 0.0002079995560286765, - "loss": 0.0168, + "epoch": 0.32, + "learning_rate": 0.00025273095357210436, + "loss": 0.0211, "step": 121570 }, { - "epoch": 0.61, - "learning_rate": 0.00020799198833566248, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.0002527270653557329, + "loss": 0.0187, "step": 121580 }, { - "epoch": 0.61, - "learning_rate": 0.00020798442064264846, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025272317713936145, + "loss": 0.0191, "step": 121590 }, { - "epoch": 0.61, - "learning_rate": 0.00020797685294963444, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.00025271928892298996, + "loss": 0.0189, "step": 121600 }, { - "epoch": 0.61, - "learning_rate": 0.00020796928525662045, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025271540070661853, + "loss": 0.0172, "step": 121610 }, { - "epoch": 0.61, - "learning_rate": 0.00020796171756360643, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025271151249024704, + "loss": 0.0167, "step": 121620 }, { - "epoch": 0.61, - "learning_rate": 0.0002079541498705924, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.00025270762427387556, + "loss": 0.027, "step": 121630 }, { - "epoch": 0.61, - "learning_rate": 0.00020794658217757842, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.0002527037360575041, + "loss": 0.0156, "step": 121640 }, { - "epoch": 0.61, - "learning_rate": 0.0002079390144845644, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.00025269984784113264, + "loss": 0.0225, "step": 121650 }, { - "epoch": 0.61, - "learning_rate": 0.00020793144679155038, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025269595962476116, + "loss": 0.0206, "step": 121660 }, { - "epoch": 0.61, - "learning_rate": 0.0002079238790985364, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.0002526920714083897, + "loss": 0.0227, "step": 121670 }, { - "epoch": 0.61, - "learning_rate": 0.00020791631140552237, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.00025268818319201824, + "loss": 0.0271, "step": 121680 }, { - "epoch": 0.61, - "learning_rate": 0.00020790874371250836, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002526842949756468, + "loss": 0.0195, "step": 121690 }, { - "epoch": 0.61, - "learning_rate": 0.00020790117601949436, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.0002526804067592753, + "loss": 0.0181, "step": 121700 }, { - "epoch": 0.61, - "learning_rate": 0.00020789360832648035, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.00025267651854290384, + "loss": 0.0248, "step": 121710 }, { - "epoch": 0.61, - "learning_rate": 0.00020788604063346633, - "loss": 0.012, + "epoch": 0.32, + "learning_rate": 0.00025267263032653235, + "loss": 0.0211, "step": 121720 }, { - "epoch": 0.61, - "learning_rate": 0.00020787847294045234, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.0002526687421101609, + "loss": 0.0165, "step": 121730 }, { - "epoch": 0.61, - "learning_rate": 0.00020787090524743832, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002526648538937895, + "loss": 0.0188, "step": 121740 }, { - "epoch": 0.61, - "learning_rate": 0.0002078633375544243, - "loss": 0.0109, + "epoch": 0.32, + "learning_rate": 0.000252660965677418, + "loss": 0.0176, "step": 121750 }, { - "epoch": 0.61, - "learning_rate": 0.00020785576986141028, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.0002526570774610465, + "loss": 0.0165, "step": 121760 }, { - "epoch": 0.61, - "learning_rate": 0.0002078482021683963, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.0002526531892446751, + "loss": 0.0231, "step": 121770 }, { - "epoch": 0.61, - "learning_rate": 0.00020784063447538227, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.0002526493010283036, + "loss": 0.0189, "step": 121780 }, { - "epoch": 0.61, - "learning_rate": 0.00020783306678236825, - "loss": 0.012, + "epoch": 0.32, + "learning_rate": 0.0002526454128119321, + "loss": 0.0177, "step": 121790 }, { - "epoch": 0.61, - "learning_rate": 0.00020782549908935426, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002526415245955607, + "loss": 0.0243, "step": 121800 }, { - "epoch": 0.61, - "learning_rate": 0.00020781793139634024, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002526376363791892, + "loss": 0.0218, "step": 121810 }, { - "epoch": 0.61, - "learning_rate": 0.00020781036370332622, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.00025263374816281777, + "loss": 0.022, "step": 121820 }, { - "epoch": 0.61, - "learning_rate": 0.00020780279601031223, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.0002526298599464463, + "loss": 0.0189, "step": 121830 }, { - "epoch": 0.61, - "learning_rate": 0.0002077952283172982, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.0002526259717300748, + "loss": 0.0157, "step": 121840 }, { - "epoch": 0.61, - "learning_rate": 0.0002077876606242842, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.0002526220835137033, + "loss": 0.0208, "step": 121850 }, { - "epoch": 0.61, - "learning_rate": 0.0002077800929312702, - "loss": 0.0112, + "epoch": 0.32, + "learning_rate": 0.0002526181952973319, + "loss": 0.0236, "step": 121860 }, { - "epoch": 0.61, - "learning_rate": 0.00020777252523825618, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002526143070809604, + "loss": 0.0174, "step": 121870 }, { - "epoch": 0.61, - "learning_rate": 0.00020776495754524217, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.00025261041886458896, + "loss": 0.0222, "step": 121880 }, { - "epoch": 0.61, - "learning_rate": 0.00020775738985222817, - "loss": 0.0188, + "epoch": 0.32, + "learning_rate": 0.0002526065306482175, + "loss": 0.0222, "step": 121890 }, { - "epoch": 0.61, - "learning_rate": 0.00020774982215921416, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025260264243184605, + "loss": 0.0183, "step": 121900 }, { - "epoch": 0.62, - "learning_rate": 0.00020774225446620014, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025259875421547456, + "loss": 0.0179, "step": 121910 }, { - "epoch": 0.62, - "learning_rate": 0.00020773468677318615, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002525948659991031, + "loss": 0.0251, "step": 121920 }, { - "epoch": 0.62, - "learning_rate": 0.00020772711908017213, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002525909777827316, + "loss": 0.0172, "step": 121930 }, { - "epoch": 0.62, - "learning_rate": 0.0002077195513871581, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.00025258708956636016, + "loss": 0.0188, "step": 121940 }, { - "epoch": 0.62, - "learning_rate": 0.0002077119836941441, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025258320134998873, + "loss": 0.0169, "step": 121950 }, { - "epoch": 0.62, - "learning_rate": 0.0002077044160011301, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025257931313361724, + "loss": 0.0192, "step": 121960 }, { - "epoch": 0.62, - "learning_rate": 0.00020769684830811608, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.00025257542491724576, + "loss": 0.019, "step": 121970 }, { - "epoch": 0.62, - "learning_rate": 0.00020768928061510206, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.0002525715367008743, + "loss": 0.0195, "step": 121980 }, { - "epoch": 0.62, - "learning_rate": 0.00020768171292208807, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025256764848450284, + "loss": 0.0207, "step": 121990 }, { - "epoch": 0.62, - "learning_rate": 0.00020767414522907405, - "loss": 0.0116, + "epoch": 0.32, + "learning_rate": 0.00025256376026813136, + "loss": 0.022, "step": 122000 }, { - "epoch": 0.62, - "eval_cer": 0.9145071309559275, - "eval_loss": 0.010251490399241447, - "eval_runtime": 116.7533, - "eval_samples_per_second": 17.13, - "eval_steps_per_second": 4.283, + "epoch": 0.32, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.014596437104046345, + "eval_runtime": 107.3326, + "eval_samples_per_second": 18.634, + "eval_steps_per_second": 4.658, "step": 122000 }, { - "epoch": 0.62, - "learning_rate": 0.00020766657753606003, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.0002525598720517599, + "loss": 0.0222, "step": 122010 }, { - "epoch": 0.62, - "learning_rate": 0.00020765900984304604, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.00025255598383538844, + "loss": 0.021, "step": 122020 }, { - "epoch": 0.62, - "learning_rate": 0.00020765144215003202, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.000252552095619017, + "loss": 0.0211, "step": 122030 }, { - "epoch": 0.62, - "learning_rate": 0.000207643874457018, - "loss": 0.0144, + "epoch": 0.32, + "learning_rate": 0.0002525482074026455, + "loss": 0.0231, "step": 122040 }, { - "epoch": 0.62, - "learning_rate": 0.000207636306764004, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025254431918627404, + "loss": 0.025, "step": 122050 }, { - "epoch": 0.62, - "learning_rate": 0.00020762873907099, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002525404309699026, + "loss": 0.0221, "step": 122060 }, { - "epoch": 0.62, - "learning_rate": 0.00020762117137797598, - "loss": 0.0123, + "epoch": 0.32, + "learning_rate": 0.0002525365427535311, + "loss": 0.0211, "step": 122070 }, { - "epoch": 0.62, - "learning_rate": 0.00020761360368496198, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002525326545371597, + "loss": 0.0206, "step": 122080 }, { - "epoch": 0.62, - "learning_rate": 0.00020760603599194797, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002525287663207882, + "loss": 0.0259, "step": 122090 }, { - "epoch": 0.62, - "learning_rate": 0.00020759846829893395, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.0002525248781044167, + "loss": 0.0188, "step": 122100 }, { - "epoch": 0.62, - "learning_rate": 0.00020759090060591993, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.0002525209898880453, + "loss": 0.0224, "step": 122110 }, { - "epoch": 0.62, - "learning_rate": 0.00020758333291290594, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002525171016716738, + "loss": 0.0218, "step": 122120 }, { - "epoch": 0.62, - "learning_rate": 0.00020757576521989192, - "loss": 0.0123, + "epoch": 0.32, + "learning_rate": 0.0002525132134553023, + "loss": 0.0206, "step": 122130 }, { - "epoch": 0.62, - "learning_rate": 0.0002075681975268779, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.0002525093252389309, + "loss": 0.028, "step": 122140 }, { - "epoch": 0.62, - "learning_rate": 0.0002075606298338639, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.0002525054370225594, + "loss": 0.0221, "step": 122150 }, { - "epoch": 0.62, - "learning_rate": 0.0002075530621408499, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.00025250154880618797, + "loss": 0.0199, "step": 122160 }, { - "epoch": 0.62, - "learning_rate": 0.00020754549444783587, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002524976605898165, + "loss": 0.0213, "step": 122170 }, { - "epoch": 0.62, - "learning_rate": 0.00020753792675482188, - "loss": 0.0187, + "epoch": 0.32, + "learning_rate": 0.000252493772373445, + "loss": 0.0235, "step": 122180 }, { - "epoch": 0.62, - "learning_rate": 0.00020753035906180786, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025248988415707357, + "loss": 0.0197, "step": 122190 }, { - "epoch": 0.62, - "learning_rate": 0.00020752279136879384, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.0002524859959407021, + "loss": 0.0199, "step": 122200 }, { - "epoch": 0.62, - "learning_rate": 0.00020751522367577985, - "loss": 0.0169, + "epoch": 0.32, + "learning_rate": 0.0002524821077243306, + "loss": 0.0241, "step": 122210 }, { - "epoch": 0.62, - "learning_rate": 0.00020750765598276583, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.00025247821950795916, + "loss": 0.0236, "step": 122220 }, { - "epoch": 0.62, - "learning_rate": 0.00020750008828975181, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.00025247433129158773, + "loss": 0.021, "step": 122230 }, { - "epoch": 0.62, - "learning_rate": 0.00020749252059673782, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025247044307521625, + "loss": 0.0214, "step": 122240 }, { - "epoch": 0.62, - "learning_rate": 0.0002074849529037238, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.00025246655485884476, + "loss": 0.0242, "step": 122250 }, { - "epoch": 0.62, - "learning_rate": 0.00020747738521070979, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.0002524626666424733, + "loss": 0.0202, "step": 122260 }, { - "epoch": 0.62, - "learning_rate": 0.00020746981751769577, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.00025245877842610184, + "loss": 0.0181, "step": 122270 }, { - "epoch": 0.62, - "learning_rate": 0.00020746224982468178, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.00025245489020973036, + "loss": 0.0225, "step": 122280 }, { - "epoch": 0.62, - "learning_rate": 0.00020745468213166776, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.00025245100199335893, + "loss": 0.0226, "step": 122290 }, { - "epoch": 0.62, - "learning_rate": 0.00020744711443865374, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.00025244711377698744, + "loss": 0.0238, "step": 122300 }, { - "epoch": 0.62, - "learning_rate": 0.00020743954674563975, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.000252443225560616, + "loss": 0.0197, "step": 122310 }, { - "epoch": 0.62, - "learning_rate": 0.00020743197905262573, - "loss": 0.0123, + "epoch": 0.32, + "learning_rate": 0.0002524393373442445, + "loss": 0.0215, "step": 122320 }, { - "epoch": 0.62, - "learning_rate": 0.0002074244113596117, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.00025243544912787304, + "loss": 0.0239, "step": 122330 }, { - "epoch": 0.62, - "learning_rate": 0.00020741684366659772, - "loss": 0.011, + "epoch": 0.32, + "learning_rate": 0.00025243156091150155, + "loss": 0.0213, "step": 122340 }, { - "epoch": 0.62, - "learning_rate": 0.0002074092759735837, - "loss": 0.012, + "epoch": 0.32, + "learning_rate": 0.0002524276726951301, + "loss": 0.0194, "step": 122350 }, { - "epoch": 0.62, - "learning_rate": 0.00020740170828056968, - "loss": 0.0123, + "epoch": 0.32, + "learning_rate": 0.00025242378447875864, + "loss": 0.0188, "step": 122360 }, { - "epoch": 0.62, - "learning_rate": 0.0002073941405875557, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.0002524198962623872, + "loss": 0.0185, "step": 122370 }, { - "epoch": 0.62, - "learning_rate": 0.00020738657289454167, - "loss": 0.0435, + "epoch": 0.32, + "learning_rate": 0.0002524160080460157, + "loss": 0.0214, "step": 122380 }, { - "epoch": 0.62, - "learning_rate": 0.00020737900520152765, - "loss": 0.0144, + "epoch": 0.32, + "learning_rate": 0.00025241211982964424, + "loss": 0.0222, "step": 122390 }, { - "epoch": 0.62, - "learning_rate": 0.00020737143750851366, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.0002524082316132728, + "loss": 0.0225, "step": 122400 }, { - "epoch": 0.62, - "learning_rate": 0.00020736386981549964, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002524043433969013, + "loss": 0.02, "step": 122410 }, { - "epoch": 0.62, - "learning_rate": 0.00020735630212248562, - "loss": 0.0156, + "epoch": 0.32, + "learning_rate": 0.00025240045518052983, + "loss": 0.0207, "step": 122420 }, { - "epoch": 0.62, - "learning_rate": 0.00020734873442947163, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.0002523965669641584, + "loss": 0.0228, "step": 122430 }, { - "epoch": 0.62, - "learning_rate": 0.00020734116673645761, - "loss": 0.0168, + "epoch": 0.32, + "learning_rate": 0.00025239267874778697, + "loss": 0.0216, "step": 122440 }, { - "epoch": 0.62, - "learning_rate": 0.0002073335990434436, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.0002523887905314155, + "loss": 0.0292, "step": 122450 }, { - "epoch": 0.62, - "learning_rate": 0.00020732603135042958, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.000252384902315044, + "loss": 0.0216, "step": 122460 }, { - "epoch": 0.62, - "learning_rate": 0.00020731846365741559, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002523810140986725, + "loss": 0.0214, "step": 122470 }, { - "epoch": 0.62, - "learning_rate": 0.00020731089596440157, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002523771258823011, + "loss": 0.0217, "step": 122480 }, { - "epoch": 0.62, - "learning_rate": 0.00020730332827138755, - "loss": 0.0142, + "epoch": 0.32, + "learning_rate": 0.0002523732376659296, + "loss": 0.0212, "step": 122490 }, { - "epoch": 0.62, - "learning_rate": 0.00020729576057837356, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.00025236934944955817, + "loss": 0.0199, "step": 122500 }, { - "epoch": 0.62, - "learning_rate": 0.00020728819288535954, - "loss": 0.0119, + "epoch": 0.32, + "learning_rate": 0.0002523654612331867, + "loss": 0.0219, "step": 122510 }, { - "epoch": 0.62, - "learning_rate": 0.00020728062519234552, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.00025236157301681525, + "loss": 0.0232, "step": 122520 }, { - "epoch": 0.62, - "learning_rate": 0.00020727305749933153, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025235768480044376, + "loss": 0.0243, "step": 122530 }, { - "epoch": 0.62, - "learning_rate": 0.0002072654898063175, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.0002523537965840723, + "loss": 0.0204, "step": 122540 }, { - "epoch": 0.62, - "learning_rate": 0.00020725792211330346, - "loss": 0.0196, + "epoch": 0.32, + "learning_rate": 0.0002523499083677008, + "loss": 0.0185, "step": 122550 }, { - "epoch": 0.62, - "learning_rate": 0.00020725035442028945, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025234602015132936, + "loss": 0.0233, "step": 122560 }, { - "epoch": 0.62, - "learning_rate": 0.00020724278672727545, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002523421319349579, + "loss": 0.0249, "step": 122570 }, { - "epoch": 0.62, - "learning_rate": 0.00020723521903426144, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025233824371858645, + "loss": 0.0151, "step": 122580 }, { - "epoch": 0.62, - "learning_rate": 0.00020722765134124742, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.00025233435550221496, + "loss": 0.0225, "step": 122590 }, { - "epoch": 0.62, - "learning_rate": 0.00020722008364823343, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002523304672858435, + "loss": 0.0215, "step": 122600 }, { - "epoch": 0.62, - "learning_rate": 0.0002072125159552194, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025232657906947204, + "loss": 0.0184, "step": 122610 }, { - "epoch": 0.62, - "learning_rate": 0.0002072049482622054, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025232269085310056, + "loss": 0.0186, "step": 122620 }, { - "epoch": 0.62, - "learning_rate": 0.0002071973805691914, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002523188026367291, + "loss": 0.0216, "step": 122630 }, { - "epoch": 0.62, - "learning_rate": 0.00020718981287617738, - "loss": 0.0117, + "epoch": 0.32, + "learning_rate": 0.00025231491442035764, + "loss": 0.0255, "step": 122640 }, { - "epoch": 0.62, - "learning_rate": 0.00020718224518316336, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002523110262039862, + "loss": 0.0215, "step": 122650 }, { - "epoch": 0.62, - "learning_rate": 0.00020717467749014934, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002523071379876147, + "loss": 0.0246, "step": 122660 }, { - "epoch": 0.62, - "learning_rate": 0.00020716710979713535, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025230324977124324, + "loss": 0.025, "step": 122670 }, { - "epoch": 0.62, - "learning_rate": 0.00020715954210412133, - "loss": 0.0175, + "epoch": 0.32, + "learning_rate": 0.00025229936155487175, + "loss": 0.0224, "step": 122680 }, { - "epoch": 0.62, - "learning_rate": 0.0002071519744111073, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.0002522954733385003, + "loss": 0.0175, "step": 122690 }, { - "epoch": 0.62, - "learning_rate": 0.00020714440671809332, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025229158512212884, + "loss": 0.0198, "step": 122700 }, { - "epoch": 0.62, - "learning_rate": 0.0002071368390250793, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.0002522876969057574, + "loss": 0.0201, "step": 122710 }, { - "epoch": 0.62, - "learning_rate": 0.00020712927133206528, - "loss": 0.018, + "epoch": 0.32, + "learning_rate": 0.0002522838086893859, + "loss": 0.0172, "step": 122720 }, { - "epoch": 0.62, - "learning_rate": 0.0002071217036390513, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002522799204730145, + "loss": 0.0209, "step": 122730 }, { - "epoch": 0.62, - "learning_rate": 0.00020711413594603727, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.000252276032256643, + "loss": 0.0203, "step": 122740 }, { - "epoch": 0.62, - "learning_rate": 0.00020710656825302326, - "loss": 0.0204, + "epoch": 0.32, + "learning_rate": 0.0002522721440402715, + "loss": 0.0225, "step": 122750 }, { - "epoch": 0.62, - "learning_rate": 0.00020709900056000926, - "loss": 0.0187, + "epoch": 0.32, + "learning_rate": 0.00025226825582390003, + "loss": 0.023, "step": 122760 }, { - "epoch": 0.62, - "learning_rate": 0.00020709143286699525, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002522643676075286, + "loss": 0.0218, "step": 122770 }, { - "epoch": 0.62, - "learning_rate": 0.00020708386517398123, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025226047939115717, + "loss": 0.0203, "step": 122780 }, { - "epoch": 0.62, - "learning_rate": 0.00020707629748096724, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002522565911747857, + "loss": 0.0195, "step": 122790 }, { - "epoch": 0.62, - "learning_rate": 0.00020706872978795322, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.0002522527029584142, + "loss": 0.018, "step": 122800 }, { - "epoch": 0.62, - "learning_rate": 0.0002070611620949392, - "loss": 0.0142, + "epoch": 0.32, + "learning_rate": 0.00025224881474204277, + "loss": 0.0222, "step": 122810 }, { - "epoch": 0.62, - "learning_rate": 0.0002070535944019252, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002522449265256713, + "loss": 0.0215, "step": 122820 }, { - "epoch": 0.62, - "learning_rate": 0.0002070460267089112, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002522410383092998, + "loss": 0.0203, "step": 122830 }, { - "epoch": 0.62, - "learning_rate": 0.00020703845901589717, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.00025223715009292837, + "loss": 0.0382, "step": 122840 }, { - "epoch": 0.62, - "learning_rate": 0.00020703089132288315, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002522332618765569, + "loss": 0.021, "step": 122850 }, { - "epoch": 0.62, - "learning_rate": 0.00020702332362986916, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025222937366018545, + "loss": 0.0275, "step": 122860 }, { - "epoch": 0.62, - "learning_rate": 0.00020701575593685514, - "loss": 0.0124, + "epoch": 0.32, + "learning_rate": 0.00025222548544381396, + "loss": 0.0171, "step": 122870 }, { - "epoch": 0.62, - "learning_rate": 0.00020700818824384112, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002522215972274425, + "loss": 0.0314, "step": 122880 }, { - "epoch": 0.62, - "learning_rate": 0.00020700062055082713, - "loss": 0.0104, + "epoch": 0.32, + "learning_rate": 0.000252217709011071, + "loss": 0.0213, "step": 122890 }, { - "epoch": 0.62, - "learning_rate": 0.0002069930528578131, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.00025221382079469956, + "loss": 0.0243, "step": 122900 }, { - "epoch": 0.62, - "learning_rate": 0.0002069854851647991, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.0002522099325783281, + "loss": 0.0176, "step": 122910 }, { - "epoch": 0.62, - "learning_rate": 0.0002069779174717851, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.00025220604436195664, + "loss": 0.0387, "step": 122920 }, { - "epoch": 0.62, - "learning_rate": 0.00020697034977877108, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.00025220215614558516, + "loss": 0.038, "step": 122930 }, { - "epoch": 0.62, - "learning_rate": 0.00020696278208575707, - "loss": 0.0142, + "epoch": 0.32, + "learning_rate": 0.00025219826792921373, + "loss": 0.0198, "step": 122940 }, { - "epoch": 0.62, - "learning_rate": 0.00020695521439274307, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025219437971284224, + "loss": 0.0229, "step": 122950 }, { - "epoch": 0.62, - "learning_rate": 0.00020694764669972906, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.00025219049149647076, + "loss": 0.0242, "step": 122960 }, { - "epoch": 0.62, - "learning_rate": 0.00020694007900671504, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.00025218660328009927, + "loss": 0.0191, "step": 122970 }, { - "epoch": 0.62, - "learning_rate": 0.00020693251131370105, - "loss": 0.0159, + "epoch": 0.32, + "learning_rate": 0.00025218271506372784, + "loss": 0.025, "step": 122980 }, { - "epoch": 0.62, - "learning_rate": 0.00020692494362068703, - "loss": 0.0124, + "epoch": 0.32, + "learning_rate": 0.0002521788268473564, + "loss": 0.0173, "step": 122990 }, { - "epoch": 0.62, - "learning_rate": 0.000206917375927673, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.0002521749386309849, + "loss": 0.0186, "step": 123000 }, { - "epoch": 0.62, - "eval_cer": 0.9144566703574066, - "eval_loss": 0.010365525260567665, - "eval_runtime": 116.8218, - "eval_samples_per_second": 17.12, - "eval_steps_per_second": 4.28, + "epoch": 0.32, + "eval_cer": 0.8817936627238894, + "eval_loss": 0.014675342477858067, + "eval_runtime": 107.4618, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, "step": 123000 }, { - "epoch": 0.62, - "learning_rate": 0.000206909808234659, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.00025217105041461344, + "loss": 0.0247, "step": 123010 }, { - "epoch": 0.62, - "learning_rate": 0.000206902240541645, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.000252167162198242, + "loss": 0.025, "step": 123020 }, { - "epoch": 0.62, - "learning_rate": 0.00020689467284863098, - "loss": 0.0168, + "epoch": 0.32, + "learning_rate": 0.0002521632739818705, + "loss": 0.0311, "step": 123030 }, { - "epoch": 0.62, - "learning_rate": 0.00020688710515561696, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.00025215938576549904, + "loss": 0.0247, "step": 123040 }, { - "epoch": 0.62, - "learning_rate": 0.00020687953746260297, - "loss": 0.0169, + "epoch": 0.32, + "learning_rate": 0.0002521554975491276, + "loss": 0.022, "step": 123050 }, { - "epoch": 0.62, - "learning_rate": 0.00020687196976958895, - "loss": 0.0119, + "epoch": 0.32, + "learning_rate": 0.0002521516093327561, + "loss": 0.0219, "step": 123060 }, { - "epoch": 0.62, - "learning_rate": 0.00020686440207657493, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002521477211163847, + "loss": 0.0271, "step": 123070 }, { - "epoch": 0.62, - "learning_rate": 0.00020685683438356094, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.0002521438329000132, + "loss": 0.0209, "step": 123080 }, { - "epoch": 0.62, - "learning_rate": 0.00020684926669054692, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002521399446836417, + "loss": 0.0216, "step": 123090 }, { - "epoch": 0.62, - "learning_rate": 0.0002068416989975329, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.00025213605646727023, + "loss": 0.019, "step": 123100 }, { - "epoch": 0.62, - "learning_rate": 0.0002068341313045189, - "loss": 0.0182, + "epoch": 0.32, + "learning_rate": 0.0002521321682508988, + "loss": 0.0241, "step": 123110 }, { - "epoch": 0.62, - "learning_rate": 0.0002068265636115049, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.0002521282800345273, + "loss": 0.0206, "step": 123120 }, { - "epoch": 0.62, - "learning_rate": 0.00020681899591849088, - "loss": 0.0186, + "epoch": 0.32, + "learning_rate": 0.0002521243918181559, + "loss": 0.0212, "step": 123130 }, { - "epoch": 0.62, - "learning_rate": 0.00020681142822547688, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.0002521205036017844, + "loss": 0.0256, "step": 123140 }, { - "epoch": 0.62, - "learning_rate": 0.00020680386053246287, - "loss": 0.0183, + "epoch": 0.32, + "learning_rate": 0.00025211661538541297, + "loss": 0.0208, "step": 123150 }, { - "epoch": 0.62, - "learning_rate": 0.00020679629283944885, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002521127271690415, + "loss": 0.0233, "step": 123160 }, { - "epoch": 0.62, - "learning_rate": 0.00020678872514643483, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025210883895267, + "loss": 0.0223, "step": 123170 }, { - "epoch": 0.62, - "learning_rate": 0.00020678115745342084, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.00025210495073629856, + "loss": 0.0203, "step": 123180 }, { - "epoch": 0.62, - "learning_rate": 0.00020677358976040682, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002521010625199271, + "loss": 0.0176, "step": 123190 }, { - "epoch": 0.62, - "learning_rate": 0.0002067660220673928, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.00025209717430355565, + "loss": 0.0208, "step": 123200 }, { - "epoch": 0.62, - "learning_rate": 0.0002067584543743788, - "loss": 0.0189, + "epoch": 0.32, + "learning_rate": 0.00025209328608718416, + "loss": 0.0216, "step": 123210 }, { - "epoch": 0.62, - "learning_rate": 0.0002067508866813648, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.0002520893978708127, + "loss": 0.0249, "step": 123220 }, { - "epoch": 0.62, - "learning_rate": 0.00020674331898835077, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.00025208550965444125, + "loss": 0.0181, "step": 123230 }, { - "epoch": 0.62, - "learning_rate": 0.00020673575129533678, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025208162143806976, + "loss": 0.0198, "step": 123240 }, { - "epoch": 0.62, - "learning_rate": 0.00020672818360232276, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002520777332216983, + "loss": 0.0192, "step": 123250 }, { - "epoch": 0.62, - "learning_rate": 0.00020672061590930874, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025207384500532684, + "loss": 0.023, "step": 123260 }, { - "epoch": 0.62, - "learning_rate": 0.00020671304821629475, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.0002520699567889554, + "loss": 0.0213, "step": 123270 }, { - "epoch": 0.62, - "learning_rate": 0.00020670548052328073, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.0002520660685725839, + "loss": 0.0185, "step": 123280 }, { - "epoch": 0.62, - "learning_rate": 0.00020669791283026671, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025206218035621244, + "loss": 0.0276, "step": 123290 }, { - "epoch": 0.62, - "learning_rate": 0.00020669034513725272, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025205829213984096, + "loss": 0.0242, "step": 123300 }, { - "epoch": 0.62, - "learning_rate": 0.0002066827774442387, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.00025205440392346947, + "loss": 0.0188, "step": 123310 }, { - "epoch": 0.62, - "learning_rate": 0.00020667520975122469, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025205051570709804, + "loss": 0.0214, "step": 123320 }, { - "epoch": 0.62, - "learning_rate": 0.0002066676420582107, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.0002520466274907266, + "loss": 0.0244, "step": 123330 }, { - "epoch": 0.62, - "learning_rate": 0.00020666007436519668, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.0002520427392743551, + "loss": 0.0188, "step": 123340 }, { - "epoch": 0.62, - "learning_rate": 0.00020665250667218266, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.00025203885105798364, + "loss": 0.0222, "step": 123350 }, { - "epoch": 0.62, - "learning_rate": 0.00020664493897916864, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002520349628416122, + "loss": 0.0228, "step": 123360 }, { - "epoch": 0.62, - "learning_rate": 0.00020663737128615465, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002520310746252407, + "loss": 0.0228, "step": 123370 }, { - "epoch": 0.62, - "learning_rate": 0.00020662980359314063, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.00025202718640886923, + "loss": 0.0202, "step": 123380 }, { - "epoch": 0.62, - "learning_rate": 0.0002066222359001266, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.0002520232981924978, + "loss": 0.025, "step": 123390 }, { - "epoch": 0.62, - "learning_rate": 0.00020661466820711262, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.0002520194099761263, + "loss": 0.0188, "step": 123400 }, { - "epoch": 0.62, - "learning_rate": 0.0002066071005140986, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002520155217597549, + "loss": 0.0209, "step": 123410 }, { - "epoch": 0.62, - "learning_rate": 0.00020659953282108458, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.0002520116335433834, + "loss": 0.0214, "step": 123420 }, { - "epoch": 0.62, - "learning_rate": 0.0002065919651280706, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.0002520077453270119, + "loss": 0.0203, "step": 123430 }, { - "epoch": 0.62, - "learning_rate": 0.00020658439743505657, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002520038571106405, + "loss": 0.0194, "step": 123440 }, { - "epoch": 0.62, - "learning_rate": 0.00020657682974204255, - "loss": 0.011, + "epoch": 0.32, + "learning_rate": 0.000251999968894269, + "loss": 0.0243, "step": 123450 }, { - "epoch": 0.62, - "learning_rate": 0.00020656926204902856, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002519960806778975, + "loss": 0.0217, "step": 123460 }, { - "epoch": 0.62, - "learning_rate": 0.00020656169435601454, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.0002519921924615261, + "loss": 0.0196, "step": 123470 }, { - "epoch": 0.62, - "learning_rate": 0.00020655412666300052, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025198830424515465, + "loss": 0.017, "step": 123480 }, { - "epoch": 0.62, - "learning_rate": 0.00020654655896998653, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.00025198441602878317, + "loss": 0.0212, "step": 123490 }, { - "epoch": 0.62, - "learning_rate": 0.00020653899127697251, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002519805278124117, + "loss": 0.0238, "step": 123500 }, { - "epoch": 0.62, - "learning_rate": 0.0002065314235839585, - "loss": 0.0124, + "epoch": 0.32, + "learning_rate": 0.0002519766395960402, + "loss": 0.0215, "step": 123510 }, { - "epoch": 0.62, - "learning_rate": 0.00020652385589094448, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.00025197275137966876, + "loss": 0.023, "step": 123520 }, { - "epoch": 0.62, - "learning_rate": 0.00020651628819793049, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002519688631632973, + "loss": 0.0194, "step": 123530 }, { - "epoch": 0.62, - "learning_rate": 0.00020650872050491647, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025196497494692585, + "loss": 0.0211, "step": 123540 }, { - "epoch": 0.62, - "learning_rate": 0.00020650115281190245, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.00025196108673055436, + "loss": 0.0182, "step": 123550 }, { - "epoch": 0.62, - "learning_rate": 0.00020649358511888846, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002519571985141829, + "loss": 0.0201, "step": 123560 }, { - "epoch": 0.62, - "learning_rate": 0.00020648601742587444, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.00025195331029781144, + "loss": 0.0198, "step": 123570 }, { - "epoch": 0.62, - "learning_rate": 0.00020647844973286042, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.00025194942208143996, + "loss": 0.0202, "step": 123580 }, { - "epoch": 0.62, - "learning_rate": 0.00020647088203984643, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.0002519455338650685, + "loss": 0.022, "step": 123590 }, { - "epoch": 0.62, - "learning_rate": 0.0002064633143468324, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.00025194164564869704, + "loss": 0.0167, "step": 123600 }, { - "epoch": 0.62, - "learning_rate": 0.0002064557466538184, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.00025193775743232556, + "loss": 0.0187, "step": 123610 }, { - "epoch": 0.62, - "learning_rate": 0.0002064481789608044, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002519338692159541, + "loss": 0.0217, "step": 123620 }, { - "epoch": 0.62, - "learning_rate": 0.00020644061126779038, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025192998099958264, + "loss": 0.0202, "step": 123630 }, { - "epoch": 0.62, - "learning_rate": 0.00020643304357477636, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.00025192609278321115, + "loss": 0.0227, "step": 123640 }, { - "epoch": 0.62, - "learning_rate": 0.00020642547588176237, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002519222045668397, + "loss": 0.0162, "step": 123650 }, { - "epoch": 0.62, - "learning_rate": 0.00020641790818874835, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.00025191831635046824, + "loss": 0.0172, "step": 123660 }, { - "epoch": 0.62, - "learning_rate": 0.00020641034049573433, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002519144281340968, + "loss": 0.0285, "step": 123670 }, { - "epoch": 0.62, - "learning_rate": 0.00020640277280272032, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002519105399177253, + "loss": 0.022, "step": 123680 }, { - "epoch": 0.62, - "learning_rate": 0.00020639520510970632, - "loss": 0.0123, + "epoch": 0.32, + "learning_rate": 0.0002519066517013539, + "loss": 0.0183, "step": 123690 }, { - "epoch": 0.62, - "learning_rate": 0.0002063876374166923, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.0002519027634849824, + "loss": 0.0222, "step": 123700 }, { - "epoch": 0.62, - "learning_rate": 0.0002063800697236783, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.0002518988752686109, + "loss": 0.021, "step": 123710 }, { - "epoch": 0.62, - "learning_rate": 0.0002063725020306643, - "loss": 0.0119, + "epoch": 0.32, + "learning_rate": 0.00025189498705223943, + "loss": 0.018, "step": 123720 }, { - "epoch": 0.62, - "learning_rate": 0.00020636493433765028, - "loss": 0.015, + "epoch": 0.32, + "learning_rate": 0.000251891098835868, + "loss": 0.0232, "step": 123730 }, { - "epoch": 0.62, - "learning_rate": 0.00020635736664463626, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.0002518872106194965, + "loss": 0.0166, "step": 123740 }, { - "epoch": 0.62, - "learning_rate": 0.00020634979895162227, - "loss": 0.0183, + "epoch": 0.32, + "learning_rate": 0.0002518833224031251, + "loss": 0.0203, "step": 123750 }, { - "epoch": 0.62, - "learning_rate": 0.00020634223125860825, - "loss": 0.0192, + "epoch": 0.32, + "learning_rate": 0.0002518794341867536, + "loss": 0.0287, "step": 123760 }, { - "epoch": 0.62, - "learning_rate": 0.00020633466356559423, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.00025187554597038217, + "loss": 0.0179, "step": 123770 }, { - "epoch": 0.62, - "learning_rate": 0.00020632709587258024, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002518716577540107, + "loss": 0.0211, "step": 123780 }, { - "epoch": 0.62, - "learning_rate": 0.00020631952817956622, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002518677695376392, + "loss": 0.018, "step": 123790 }, { - "epoch": 0.62, - "learning_rate": 0.0002063119604865522, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002518638813212677, + "loss": 0.0184, "step": 123800 }, { - "epoch": 0.62, - "learning_rate": 0.00020630439279353816, - "loss": 0.0111, + "epoch": 0.32, + "learning_rate": 0.0002518599931048963, + "loss": 0.028, "step": 123810 }, { - "epoch": 0.62, - "learning_rate": 0.00020629682510052416, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.00025185610488852485, + "loss": 0.0213, "step": 123820 }, { - "epoch": 0.62, - "learning_rate": 0.00020628925740751015, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.00025185221667215336, + "loss": 0.0255, "step": 123830 }, { - "epoch": 0.62, - "learning_rate": 0.00020628168971449613, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.0002518483284557819, + "loss": 0.0208, "step": 123840 }, { - "epoch": 0.62, - "learning_rate": 0.00020627412202148214, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.0002518444402394104, + "loss": 0.0195, "step": 123850 }, { - "epoch": 0.62, - "learning_rate": 0.00020626655432846812, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025184055202303896, + "loss": 0.0225, "step": 123860 }, { - "epoch": 0.62, - "learning_rate": 0.0002062589866354541, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002518366638066675, + "loss": 0.0196, "step": 123870 }, { - "epoch": 0.62, - "learning_rate": 0.0002062514189424401, - "loss": 0.0114, + "epoch": 0.32, + "learning_rate": 0.00025183277559029605, + "loss": 0.0244, "step": 123880 }, { - "epoch": 0.63, - "learning_rate": 0.0002062438512494261, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.00025182888737392456, + "loss": 0.0204, "step": 123890 }, { - "epoch": 0.63, - "learning_rate": 0.00020623628355641207, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025182499915755313, + "loss": 0.0255, "step": 123900 }, { - "epoch": 0.63, - "learning_rate": 0.00020622871586339805, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.00025182111094118164, + "loss": 0.0199, "step": 123910 }, { - "epoch": 0.63, - "learning_rate": 0.00020622114817038406, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.00025181722272481016, + "loss": 0.0199, "step": 123920 }, { - "epoch": 0.63, - "learning_rate": 0.00020621358047737004, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.00025181333450843867, + "loss": 0.0196, "step": 123930 }, { - "epoch": 0.63, - "learning_rate": 0.00020620601278435602, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.00025180944629206724, + "loss": 0.0216, "step": 123940 }, { - "epoch": 0.63, - "learning_rate": 0.00020619844509134203, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025180555807569576, + "loss": 0.0196, "step": 123950 }, { - "epoch": 0.63, - "learning_rate": 0.000206190877398328, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002518016698593243, + "loss": 0.0168, "step": 123960 }, { - "epoch": 0.63, - "learning_rate": 0.000206183309705314, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.00025179778164295284, + "loss": 0.0189, "step": 123970 }, { - "epoch": 0.63, - "learning_rate": 0.0002061757420123, - "loss": 0.0101, + "epoch": 0.32, + "learning_rate": 0.0002517938934265814, + "loss": 0.0192, "step": 123980 }, { - "epoch": 0.63, - "learning_rate": 0.00020616817431928598, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002517900052102099, + "loss": 0.0225, "step": 123990 }, { - "epoch": 0.63, - "learning_rate": 0.00020616060662627197, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025178611699383844, + "loss": 0.0202, "step": 124000 }, { - "epoch": 0.63, - "eval_cer": 0.9144877230334195, - "eval_loss": 0.010582580231130123, - "eval_runtime": 116.7375, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.32, + "eval_cer": 0.8818104583670996, + "eval_loss": 0.014676877297461033, + "eval_runtime": 107.4759, + "eval_samples_per_second": 18.609, + "eval_steps_per_second": 4.652, "step": 124000 }, { - "epoch": 0.63, - "learning_rate": 0.00020615303893325797, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025178222877746695, + "loss": 0.0221, "step": 124010 }, { - "epoch": 0.63, - "learning_rate": 0.00020614547124024396, - "loss": 0.0124, + "epoch": 0.32, + "learning_rate": 0.0002517783405610955, + "loss": 0.0261, "step": 124020 }, { - "epoch": 0.63, - "learning_rate": 0.00020613790354722994, - "loss": 0.0161, + "epoch": 0.32, + "learning_rate": 0.0002517744523447241, + "loss": 0.0192, "step": 124030 }, { - "epoch": 0.63, - "learning_rate": 0.00020613033585421595, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.0002517705641283526, + "loss": 0.0195, "step": 124040 }, { - "epoch": 0.63, - "learning_rate": 0.00020612276816120193, - "loss": 0.0119, + "epoch": 0.32, + "learning_rate": 0.0002517666759119811, + "loss": 0.0262, "step": 124050 }, { - "epoch": 0.63, - "learning_rate": 0.0002061152004681879, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025176278769560963, + "loss": 0.0215, "step": 124060 }, { - "epoch": 0.63, - "learning_rate": 0.0002061076327751739, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.0002517588994792382, + "loss": 0.0199, "step": 124070 }, { - "epoch": 0.63, - "learning_rate": 0.0002061000650821599, - "loss": 0.0137, + "epoch": 0.32, + "learning_rate": 0.0002517550112628667, + "loss": 0.0188, "step": 124080 }, { - "epoch": 0.63, - "learning_rate": 0.00020609249738914588, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.0002517511230464953, + "loss": 0.02, "step": 124090 }, { - "epoch": 0.63, - "learning_rate": 0.00020608492969613186, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.0002517472348301238, + "loss": 0.0207, "step": 124100 }, { - "epoch": 0.63, - "learning_rate": 0.00020607736200311787, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025174334661375237, + "loss": 0.0262, "step": 124110 }, { - "epoch": 0.63, - "learning_rate": 0.00020606979431010385, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.0002517394583973809, + "loss": 0.0236, "step": 124120 }, { - "epoch": 0.63, - "learning_rate": 0.00020606222661708983, - "loss": 0.0169, + "epoch": 0.32, + "learning_rate": 0.0002517355701810094, + "loss": 0.0206, "step": 124130 }, { - "epoch": 0.63, - "learning_rate": 0.00020605465892407584, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.0002517316819646379, + "loss": 0.0224, "step": 124140 }, { - "epoch": 0.63, - "learning_rate": 0.00020604709123106182, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002517277937482665, + "loss": 0.0224, "step": 124150 }, { - "epoch": 0.63, - "learning_rate": 0.0002060395235380478, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.000251723905531895, + "loss": 0.0225, "step": 124160 }, { - "epoch": 0.63, - "learning_rate": 0.0002060319558450338, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.00025172001731552356, + "loss": 0.0191, "step": 124170 }, { - "epoch": 0.63, - "learning_rate": 0.0002060243881520198, - "loss": 0.0148, + "epoch": 0.32, + "learning_rate": 0.0002517161290991521, + "loss": 0.0218, "step": 124180 }, { - "epoch": 0.63, - "learning_rate": 0.00020601682045900578, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025171224088278065, + "loss": 0.0212, "step": 124190 }, { - "epoch": 0.63, - "learning_rate": 0.00020600925276599178, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.00025170835266640916, + "loss": 0.0253, "step": 124200 }, { - "epoch": 0.63, - "learning_rate": 0.00020600168507297777, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002517044644500377, + "loss": 0.0269, "step": 124210 }, { - "epoch": 0.63, - "learning_rate": 0.00020599411737996375, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.00025170057623366624, + "loss": 0.0265, "step": 124220 }, { - "epoch": 0.63, - "learning_rate": 0.00020598654968694976, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.00025169668801729476, + "loss": 0.0196, "step": 124230 }, { - "epoch": 0.63, - "learning_rate": 0.00020597898199393574, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025169279980092333, + "loss": 0.0232, "step": 124240 }, { - "epoch": 0.63, - "learning_rate": 0.00020597141430092172, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.00025168891158455184, + "loss": 0.0222, "step": 124250 }, { - "epoch": 0.63, - "learning_rate": 0.0002059638466079077, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.00025168502336818036, + "loss": 0.0178, "step": 124260 }, { - "epoch": 0.63, - "learning_rate": 0.0002059562789148937, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002516811351518089, + "loss": 0.0208, "step": 124270 }, { - "epoch": 0.63, - "learning_rate": 0.0002059487112218797, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025167724693543744, + "loss": 0.0233, "step": 124280 }, { - "epoch": 0.63, - "learning_rate": 0.00020594114352886567, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.00025167335871906595, + "loss": 0.016, "step": 124290 }, { - "epoch": 0.63, - "learning_rate": 0.00020593357583585168, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002516694705026945, + "loss": 0.0219, "step": 124300 }, { - "epoch": 0.63, - "learning_rate": 0.00020592600814283766, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.00025166558228632304, + "loss": 0.0211, "step": 124310 }, { - "epoch": 0.63, - "learning_rate": 0.00020591844044982364, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002516616940699516, + "loss": 0.0177, "step": 124320 }, { - "epoch": 0.63, - "learning_rate": 0.00020591087275680965, - "loss": 0.0158, + "epoch": 0.32, + "learning_rate": 0.0002516578058535801, + "loss": 0.023, "step": 124330 }, { - "epoch": 0.63, - "learning_rate": 0.00020590330506379563, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025165391763720864, + "loss": 0.0228, "step": 124340 }, { - "epoch": 0.63, - "learning_rate": 0.00020589573737078161, - "loss": 0.0133, - "step": 124350 + "epoch": 0.32, + "learning_rate": 0.00025165002942083715, + "loss": 0.0186, + "step": 124350 }, { - "epoch": 0.63, - "learning_rate": 0.00020588816967776762, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.0002516461412044657, + "loss": 0.0283, "step": 124360 }, { - "epoch": 0.63, - "learning_rate": 0.0002058806019847536, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.0002516422529880943, + "loss": 0.0212, "step": 124370 }, { - "epoch": 0.63, - "learning_rate": 0.00020587303429173959, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002516383647717228, + "loss": 0.0202, "step": 124380 }, { - "epoch": 0.63, - "learning_rate": 0.0002058654665987256, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002516344765553513, + "loss": 0.0259, "step": 124390 }, { - "epoch": 0.63, - "learning_rate": 0.00020585789890571158, - "loss": 0.0272, + "epoch": 0.32, + "learning_rate": 0.0002516305883389799, + "loss": 0.0225, "step": 124400 }, { - "epoch": 0.63, - "learning_rate": 0.00020585033121269756, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002516267001226084, + "loss": 0.0201, "step": 124410 }, { - "epoch": 0.63, - "learning_rate": 0.00020584276351968354, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.0002516228119062369, + "loss": 0.0157, "step": 124420 }, { - "epoch": 0.63, - "learning_rate": 0.00020583519582666955, - "loss": 0.0132, + "epoch": 0.32, + "learning_rate": 0.0002516189236898655, + "loss": 0.0159, "step": 124430 }, { - "epoch": 0.63, - "learning_rate": 0.00020582762813365553, - "loss": 0.0104, + "epoch": 0.32, + "learning_rate": 0.000251615035473494, + "loss": 0.0193, "step": 124440 }, { - "epoch": 0.63, - "learning_rate": 0.0002058200604406415, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025161114725712257, + "loss": 0.0249, "step": 124450 }, { - "epoch": 0.63, - "learning_rate": 0.00020581249274762752, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002516072590407511, + "loss": 0.019, "step": 124460 }, { - "epoch": 0.63, - "learning_rate": 0.0002058049250546135, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.0002516033708243796, + "loss": 0.024, "step": 124470 }, { - "epoch": 0.63, - "learning_rate": 0.00020579735736159948, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.00025159948260800816, + "loss": 0.0227, "step": 124480 }, { - "epoch": 0.63, - "learning_rate": 0.0002057897896685855, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.0002515955943916367, + "loss": 0.0208, "step": 124490 }, { - "epoch": 0.63, - "learning_rate": 0.00020578222197557147, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.0002515917061752652, + "loss": 0.0205, "step": 124500 }, { - "epoch": 0.63, - "learning_rate": 0.00020577465428255745, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.00025158781795889376, + "loss": 0.022, "step": 124510 }, { - "epoch": 0.63, - "learning_rate": 0.00020576708658954346, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.00025158392974252233, + "loss": 0.0238, "step": 124520 }, { - "epoch": 0.63, - "learning_rate": 0.00020575951889652944, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.00025158004152615085, + "loss": 0.0198, "step": 124530 }, { - "epoch": 0.63, - "learning_rate": 0.00020575195120351542, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025157615330977936, + "loss": 0.0205, "step": 124540 }, { - "epoch": 0.63, - "learning_rate": 0.00020574438351050143, - "loss": 0.017, + "epoch": 0.32, + "learning_rate": 0.0002515722650934079, + "loss": 0.0181, "step": 124550 }, { - "epoch": 0.63, - "learning_rate": 0.00020573681581748741, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002515683768770364, + "loss": 0.0204, "step": 124560 }, { - "epoch": 0.63, - "learning_rate": 0.0002057292481244734, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.00025156448866066496, + "loss": 0.0172, "step": 124570 }, { - "epoch": 0.63, - "learning_rate": 0.00020572168043145938, - "loss": 0.014, + "epoch": 0.32, + "learning_rate": 0.0002515606004442935, + "loss": 0.0179, "step": 124580 }, { - "epoch": 0.63, - "learning_rate": 0.00020571411273844539, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.00025155671222792204, + "loss": 0.0209, "step": 124590 }, { - "epoch": 0.63, - "learning_rate": 0.00020570654504543137, - "loss": 0.0144, + "epoch": 0.32, + "learning_rate": 0.00025155282401155056, + "loss": 0.0255, "step": 124600 }, { - "epoch": 0.63, - "learning_rate": 0.00020569897735241735, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.0002515489357951791, + "loss": 0.0176, "step": 124610 }, { - "epoch": 0.63, - "learning_rate": 0.00020569140965940336, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.00025154504757880764, + "loss": 0.019, "step": 124620 }, { - "epoch": 0.63, - "learning_rate": 0.00020568384196638934, - "loss": 0.0174, + "epoch": 0.32, + "learning_rate": 0.00025154115936243615, + "loss": 0.0169, "step": 124630 }, { - "epoch": 0.63, - "learning_rate": 0.00020567627427337532, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002515372711460647, + "loss": 0.0262, "step": 124640 }, { - "epoch": 0.63, - "learning_rate": 0.00020566870658036133, - "loss": 0.0133, + "epoch": 0.32, + "learning_rate": 0.00025153338292969324, + "loss": 0.0184, "step": 124650 }, { - "epoch": 0.63, - "learning_rate": 0.0002056611388873473, - "loss": 0.0157, + "epoch": 0.32, + "learning_rate": 0.0002515294947133218, + "loss": 0.0194, "step": 124660 }, { - "epoch": 0.63, - "learning_rate": 0.0002056535711943333, - "loss": 0.0131, + "epoch": 0.32, + "learning_rate": 0.0002515256064969503, + "loss": 0.0214, "step": 124670 }, { - "epoch": 0.63, - "learning_rate": 0.0002056460035013193, - "loss": 0.0143, + "epoch": 0.32, + "learning_rate": 0.00025152171828057883, + "loss": 0.0153, "step": 124680 }, { - "epoch": 0.63, - "learning_rate": 0.00020563843580830528, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.0002515178300642074, + "loss": 0.0226, "step": 124690 }, { - "epoch": 0.63, - "learning_rate": 0.00020563086811529126, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.0002515139418478359, + "loss": 0.0199, "step": 124700 }, { - "epoch": 0.63, - "learning_rate": 0.00020562330042227727, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025151005363146443, + "loss": 0.0219, "step": 124710 }, { - "epoch": 0.63, - "learning_rate": 0.00020561573272926325, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.000251506165415093, + "loss": 0.0261, "step": 124720 }, { - "epoch": 0.63, - "learning_rate": 0.00020560816503624923, - "loss": 0.0147, + "epoch": 0.32, + "learning_rate": 0.00025150227719872157, + "loss": 0.022, "step": 124730 }, { - "epoch": 0.63, - "learning_rate": 0.00020560059734323524, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.0002514983889823501, + "loss": 0.0253, "step": 124740 }, { - "epoch": 0.63, - "learning_rate": 0.00020559302965022122, - "loss": 0.0116, + "epoch": 0.32, + "learning_rate": 0.0002514945007659786, + "loss": 0.0252, "step": 124750 }, { - "epoch": 0.63, - "learning_rate": 0.0002055854619572072, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002514906125496071, + "loss": 0.018, "step": 124760 }, { - "epoch": 0.63, - "learning_rate": 0.0002055778942641932, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.0002514867243332357, + "loss": 0.0213, "step": 124770 }, { - "epoch": 0.63, - "learning_rate": 0.0002055703265711792, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002514828361168642, + "loss": 0.0212, "step": 124780 }, { - "epoch": 0.63, - "learning_rate": 0.00020556275887816518, - "loss": 0.0167, + "epoch": 0.32, + "learning_rate": 0.00025147894790049276, + "loss": 0.018, "step": 124790 }, { - "epoch": 0.63, - "learning_rate": 0.00020555519118515116, - "loss": 0.0149, + "epoch": 0.32, + "learning_rate": 0.0002514750596841213, + "loss": 0.0188, "step": 124800 }, { - "epoch": 0.63, - "learning_rate": 0.00020554762349213717, - "loss": 0.0176, + "epoch": 0.32, + "learning_rate": 0.0002514711714677498, + "loss": 0.0222, "step": 124810 }, { - "epoch": 0.63, - "learning_rate": 0.00020554005579912315, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.00025146728325137836, + "loss": 0.0192, "step": 124820 }, { - "epoch": 0.63, - "learning_rate": 0.00020553248810610913, - "loss": 0.0127, + "epoch": 0.32, + "learning_rate": 0.0002514633950350069, + "loss": 0.0219, "step": 124830 }, { - "epoch": 0.63, - "learning_rate": 0.00020552492041309514, - "loss": 0.0134, + "epoch": 0.32, + "learning_rate": 0.0002514595068186354, + "loss": 0.0234, "step": 124840 }, { - "epoch": 0.63, - "learning_rate": 0.00020551735272008112, - "loss": 0.0144, + "epoch": 0.32, + "learning_rate": 0.00025145561860226396, + "loss": 0.0169, "step": 124850 }, { - "epoch": 0.63, - "learning_rate": 0.0002055097850270671, - "loss": 0.0129, + "epoch": 0.32, + "learning_rate": 0.00025145173038589253, + "loss": 0.021, "step": 124860 }, { - "epoch": 0.63, - "learning_rate": 0.0002055022173340531, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.00025144784216952104, + "loss": 0.0215, "step": 124870 }, { - "epoch": 0.63, - "learning_rate": 0.0002054946496410391, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025144395395314956, + "loss": 0.0225, "step": 124880 }, { - "epoch": 0.63, - "learning_rate": 0.00020548708194802507, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.0002514400657367781, + "loss": 0.0195, "step": 124890 }, { - "epoch": 0.63, - "learning_rate": 0.00020547951425501108, - "loss": 0.0141, + "epoch": 0.32, + "learning_rate": 0.00025143617752040664, + "loss": 0.0213, "step": 124900 }, { - "epoch": 0.63, - "learning_rate": 0.00020547194656199706, - "loss": 0.0107, + "epoch": 0.32, + "learning_rate": 0.00025143228930403516, + "loss": 0.0206, "step": 124910 }, { - "epoch": 0.63, - "learning_rate": 0.00020546437886898304, - "loss": 0.0128, + "epoch": 0.32, + "learning_rate": 0.0002514284010876637, + "loss": 0.0211, "step": 124920 }, { - "epoch": 0.63, - "learning_rate": 0.00020545681117596903, - "loss": 0.0165, + "epoch": 0.32, + "learning_rate": 0.00025142451287129224, + "loss": 0.0205, "step": 124930 }, { - "epoch": 0.63, - "learning_rate": 0.00020544924348295503, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002514206246549208, + "loss": 0.026, "step": 124940 }, { - "epoch": 0.63, - "learning_rate": 0.00020544167578994102, - "loss": 0.0172, + "epoch": 0.32, + "learning_rate": 0.0002514167364385493, + "loss": 0.062, "step": 124950 }, { - "epoch": 0.63, - "learning_rate": 0.000205434108096927, - "loss": 0.0126, + "epoch": 0.32, + "learning_rate": 0.00025141284822217784, + "loss": 0.0207, "step": 124960 }, { - "epoch": 0.63, - "learning_rate": 0.000205426540403913, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.00025140896000580635, + "loss": 0.0191, "step": 124970 }, { - "epoch": 0.63, - "learning_rate": 0.000205418972710899, - "loss": 0.0107, + "epoch": 0.32, + "learning_rate": 0.0002514050717894349, + "loss": 0.0331, "step": 124980 }, { - "epoch": 0.63, - "learning_rate": 0.00020541140501788497, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.00025140118357306344, + "loss": 0.0186, "step": 124990 }, { - "epoch": 0.63, - "learning_rate": 0.00020540383732487098, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.000251397295356692, + "loss": 0.0224, "step": 125000 }, { - "epoch": 0.63, - "eval_cer": 0.9144945158062973, - "eval_loss": 0.010605525225400925, - "eval_runtime": 116.7031, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.284, + "epoch": 0.32, + "eval_cer": 0.8818118580040337, + "eval_loss": 0.01477042119950056, + "eval_runtime": 107.7289, + "eval_samples_per_second": 18.565, + "eval_steps_per_second": 4.641, "step": 125000 }, { - "epoch": 0.63, - "learning_rate": 0.00020539626963185696, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002513934071403205, + "loss": 0.0177, "step": 125010 }, { - "epoch": 0.63, - "learning_rate": 0.00020538870193884294, - "loss": 0.0101, + "epoch": 0.32, + "learning_rate": 0.0002513895189239491, + "loss": 0.0228, "step": 125020 }, { - "epoch": 0.63, - "learning_rate": 0.00020538113424582895, - "loss": 0.0155, + "epoch": 0.32, + "learning_rate": 0.0002513856307075776, + "loss": 0.02, "step": 125030 }, { - "epoch": 0.63, - "learning_rate": 0.00020537356655281493, - "loss": 0.0162, + "epoch": 0.32, + "learning_rate": 0.0002513817424912061, + "loss": 0.0206, "step": 125040 }, { - "epoch": 0.63, - "learning_rate": 0.0002053659988598009, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.00025137785427483463, + "loss": 0.0192, "step": 125050 }, { - "epoch": 0.63, - "learning_rate": 0.00020535843116678692, - "loss": 0.013, + "epoch": 0.32, + "learning_rate": 0.0002513739660584632, + "loss": 0.0262, "step": 125060 }, { - "epoch": 0.63, - "learning_rate": 0.00020535086347377287, - "loss": 0.0175, + "epoch": 0.32, + "learning_rate": 0.00025137007784209177, + "loss": 0.0206, "step": 125070 }, { - "epoch": 0.63, - "learning_rate": 0.00020534329578075886, - "loss": 0.0138, + "epoch": 0.32, + "learning_rate": 0.0002513661896257203, + "loss": 0.022, "step": 125080 }, { - "epoch": 0.63, - "learning_rate": 0.00020533572808774484, - "loss": 0.0142, + "epoch": 0.32, + "learning_rate": 0.0002513623014093488, + "loss": 0.0263, "step": 125090 }, { - "epoch": 0.63, - "learning_rate": 0.00020532816039473085, - "loss": 0.0121, + "epoch": 0.32, + "learning_rate": 0.0002513584131929773, + "loss": 0.0224, "step": 125100 }, { - "epoch": 0.63, - "learning_rate": 0.00020532059270171683, - "loss": 0.0125, + "epoch": 0.32, + "learning_rate": 0.0002513545249766059, + "loss": 0.023, "step": 125110 }, { - "epoch": 0.63, - "learning_rate": 0.0002053130250087028, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.0002513506367602344, + "loss": 0.018, "step": 125120 }, { - "epoch": 0.63, - "learning_rate": 0.00020530545731568882, - "loss": 0.0145, + "epoch": 0.32, + "learning_rate": 0.00025134674854386296, + "loss": 0.0184, "step": 125130 }, { - "epoch": 0.63, - "learning_rate": 0.0002052978896226748, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.0002513428603274915, + "loss": 0.0243, "step": 125140 }, { - "epoch": 0.63, - "learning_rate": 0.00020529032192966078, - "loss": 0.0107, + "epoch": 0.32, + "learning_rate": 0.00025133897211112005, + "loss": 0.0185, "step": 125150 }, { - "epoch": 0.63, - "learning_rate": 0.00020528275423664676, - "loss": 0.0136, + "epoch": 0.32, + "learning_rate": 0.00025133508389474856, + "loss": 0.0221, "step": 125160 }, { - "epoch": 0.63, - "learning_rate": 0.00020527518654363277, - "loss": 0.0103, + "epoch": 0.32, + "learning_rate": 0.0002513311956783771, + "loss": 0.0222, "step": 125170 }, { - "epoch": 0.63, - "learning_rate": 0.00020526761885061875, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.0002513273074620056, + "loss": 0.0198, "step": 125180 }, { - "epoch": 0.63, - "learning_rate": 0.00020526005115760473, - "loss": 0.0118, + "epoch": 0.32, + "learning_rate": 0.00025132341924563416, + "loss": 0.0197, "step": 125190 }, { - "epoch": 0.63, - "learning_rate": 0.00020525248346459074, - "loss": 0.0113, + "epoch": 0.32, + "learning_rate": 0.0002513195310292627, + "loss": 0.018, "step": 125200 }, { - "epoch": 0.63, - "learning_rate": 0.00020524491577157672, - "loss": 0.0166, + "epoch": 0.32, + "learning_rate": 0.00025131564281289124, + "loss": 0.0199, "step": 125210 }, { - "epoch": 0.63, - "learning_rate": 0.0002052373480785627, - "loss": 0.0146, + "epoch": 0.32, + "learning_rate": 0.00025131175459651976, + "loss": 0.0224, "step": 125220 }, { - "epoch": 0.63, - "learning_rate": 0.0002052297803855487, - "loss": 0.016, + "epoch": 0.32, + "learning_rate": 0.0002513078663801483, + "loss": 0.0217, "step": 125230 }, { - "epoch": 0.63, - "learning_rate": 0.0002052222126925347, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.00025130397816377684, + "loss": 0.0217, "step": 125240 }, { - "epoch": 0.63, - "learning_rate": 0.00020521464499952068, - "loss": 0.0163, + "epoch": 0.32, + "learning_rate": 0.00025130008994740536, + "loss": 0.0231, "step": 125250 }, { - "epoch": 0.63, - "learning_rate": 0.00020520707730650668, - "loss": 0.0192, + "epoch": 0.32, + "learning_rate": 0.0002512962017310339, + "loss": 0.027, "step": 125260 }, { - "epoch": 0.63, - "learning_rate": 0.00020519950961349267, - "loss": 0.0153, + "epoch": 0.32, + "learning_rate": 0.00025129231351466244, + "loss": 0.0207, "step": 125270 }, { - "epoch": 0.63, - "learning_rate": 0.00020519194192047865, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.000251288425298291, + "loss": 0.0191, "step": 125280 }, { - "epoch": 0.63, - "learning_rate": 0.00020518437422746466, - "loss": 0.0154, + "epoch": 0.32, + "learning_rate": 0.0002512845370819195, + "loss": 0.0158, "step": 125290 }, { - "epoch": 0.63, - "learning_rate": 0.00020517680653445064, - "loss": 0.0135, + "epoch": 0.32, + "learning_rate": 0.00025128064886554804, + "loss": 0.0265, "step": 125300 }, { - "epoch": 0.63, - "learning_rate": 0.00020516923884143662, - "loss": 0.0164, + "epoch": 0.32, + "learning_rate": 0.00025127676064917655, + "loss": 0.0198, "step": 125310 }, { - "epoch": 0.63, - "learning_rate": 0.0002051616711484226, - "loss": 0.0139, + "epoch": 0.32, + "learning_rate": 0.0002512728724328051, + "loss": 0.0228, "step": 125320 }, { - "epoch": 0.63, - "learning_rate": 0.0002051541034554086, - "loss": 0.0178, + "epoch": 0.32, + "learning_rate": 0.00025126898421643363, + "loss": 0.0218, "step": 125330 }, { - "epoch": 0.63, - "learning_rate": 0.0002051465357623946, - "loss": 0.0122, + "epoch": 0.32, + "learning_rate": 0.0002512650960000622, + "loss": 0.0233, "step": 125340 }, { - "epoch": 0.63, - "learning_rate": 0.00020513896806938057, - "loss": 0.0152, + "epoch": 0.32, + "learning_rate": 0.0002512612077836907, + "loss": 0.024, "step": 125350 }, { - "epoch": 0.63, - "learning_rate": 0.00020513140037636658, - "loss": 0.0173, + "epoch": 0.32, + "learning_rate": 0.0002512573195673193, + "loss": 0.021, "step": 125360 }, { - "epoch": 0.63, - "learning_rate": 0.00020512383268335256, - "loss": 0.0151, + "epoch": 0.32, + "learning_rate": 0.0002512534313509478, + "loss": 0.0163, "step": 125370 }, { - "epoch": 0.63, - "learning_rate": 0.00020511626499033854, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.0002512495431345763, + "loss": 0.0362, "step": 125380 }, { - "epoch": 0.63, - "learning_rate": 0.00020510869729732455, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00025124565491820483, + "loss": 0.0203, "step": 125390 }, { - "epoch": 0.63, - "learning_rate": 0.00020510112960431053, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.0002512417667018334, + "loss": 0.0207, "step": 125400 }, { - "epoch": 0.63, - "learning_rate": 0.00020509356191129651, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025123787848546197, + "loss": 0.0197, "step": 125410 }, { - "epoch": 0.63, - "learning_rate": 0.00020508599421828252, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.0002512339902690905, + "loss": 0.0175, "step": 125420 }, { - "epoch": 0.63, - "learning_rate": 0.0002050784265252685, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.000251230102052719, + "loss": 0.0215, "step": 125430 }, { - "epoch": 0.63, - "learning_rate": 0.00020507085883225449, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025122621383634756, + "loss": 0.0242, "step": 125440 }, { - "epoch": 0.63, - "learning_rate": 0.0002050632911392405, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002512223256199761, + "loss": 0.023, "step": 125450 }, { - "epoch": 0.63, - "learning_rate": 0.00020505572344622648, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.0002512184374036046, + "loss": 0.0194, "step": 125460 }, { - "epoch": 0.63, - "learning_rate": 0.00020504815575321246, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025121454918723316, + "loss": 0.0221, "step": 125470 }, { - "epoch": 0.63, - "learning_rate": 0.00020504058806019844, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002512106609708617, + "loss": 0.0176, "step": 125480 }, { - "epoch": 0.63, - "learning_rate": 0.00020503302036718445, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.00025120677275449025, + "loss": 0.0173, "step": 125490 }, { - "epoch": 0.63, - "learning_rate": 0.00020502545267417043, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025120288453811876, + "loss": 0.022, "step": 125500 }, { - "epoch": 0.63, - "learning_rate": 0.0002050178849811564, - "loss": 0.0153, + "epoch": 0.33, + "learning_rate": 0.0002511989963217473, + "loss": 0.0197, "step": 125510 }, { - "epoch": 0.63, - "learning_rate": 0.00020501031728814242, - "loss": 0.0153, + "epoch": 0.33, + "learning_rate": 0.00025119510810537584, + "loss": 0.0199, "step": 125520 }, { - "epoch": 0.63, - "learning_rate": 0.0002050027495951284, - "loss": 0.012, + "epoch": 0.33, + "learning_rate": 0.00025119121988900436, + "loss": 0.0187, "step": 125530 }, { - "epoch": 0.63, - "learning_rate": 0.00020499518190211438, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025118733167263287, + "loss": 0.0189, "step": 125540 }, { - "epoch": 0.63, - "learning_rate": 0.0002049876142091004, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.00025118344345626144, + "loss": 0.0175, "step": 125550 }, { - "epoch": 0.63, - "learning_rate": 0.00020498004651608637, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.00025117955523988996, + "loss": 0.0202, "step": 125560 }, { - "epoch": 0.63, - "learning_rate": 0.00020497247882307235, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.0002511756670235185, + "loss": 0.0197, "step": 125570 }, { - "epoch": 0.63, - "learning_rate": 0.00020496491113005836, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.00025117177880714704, + "loss": 0.026, "step": 125580 }, { - "epoch": 0.63, - "learning_rate": 0.00020495734343704434, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00025116789059077555, + "loss": 0.031, "step": 125590 }, { - "epoch": 0.63, - "learning_rate": 0.00020494977574403032, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.00025116400237440407, + "loss": 0.022, "step": 125600 }, { - "epoch": 0.63, - "learning_rate": 0.00020494220805101633, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025116011415803264, + "loss": 0.0219, "step": 125610 }, { - "epoch": 0.63, - "learning_rate": 0.00020493464035800231, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002511562259416612, + "loss": 0.0194, "step": 125620 }, { - "epoch": 0.63, - "learning_rate": 0.0002049270726649883, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002511523377252897, + "loss": 0.0225, "step": 125630 }, { - "epoch": 0.63, - "learning_rate": 0.00020491950497197428, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.00025114844950891823, + "loss": 0.0212, "step": 125640 }, { - "epoch": 0.63, - "learning_rate": 0.00020491193727896029, - "loss": 0.0103, + "epoch": 0.33, + "learning_rate": 0.0002511445612925468, + "loss": 0.0187, "step": 125650 }, { - "epoch": 0.63, - "learning_rate": 0.00020490436958594627, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.0002511406730761753, + "loss": 0.0243, "step": 125660 }, { - "epoch": 0.63, - "learning_rate": 0.00020489680189293225, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00025113678485980383, + "loss": 0.0213, "step": 125670 }, { - "epoch": 0.63, - "learning_rate": 0.00020488923419991826, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.0002511328966434324, + "loss": 0.0213, "step": 125680 }, { - "epoch": 0.63, - "learning_rate": 0.00020488166650690424, - "loss": 0.0188, + "epoch": 0.33, + "learning_rate": 0.0002511290084270609, + "loss": 0.0262, "step": 125690 }, { - "epoch": 0.63, - "learning_rate": 0.00020487409881389022, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.0002511251202106895, + "loss": 0.0268, "step": 125700 }, { - "epoch": 0.63, - "learning_rate": 0.00020486653112087623, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.000251121231994318, + "loss": 0.0237, "step": 125710 }, { - "epoch": 0.63, - "learning_rate": 0.0002048589634278622, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.0002511173437779465, + "loss": 0.0179, "step": 125720 }, { - "epoch": 0.63, - "learning_rate": 0.0002048513957348482, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.0002511134555615751, + "loss": 0.0195, "step": 125730 }, { - "epoch": 0.63, - "learning_rate": 0.0002048438280418342, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002511095673452036, + "loss": 0.0244, "step": 125740 }, { - "epoch": 0.63, - "learning_rate": 0.00020483626034882018, - "loss": 0.019, + "epoch": 0.33, + "learning_rate": 0.0002511056791288321, + "loss": 0.0196, "step": 125750 }, { - "epoch": 0.63, - "learning_rate": 0.00020482869265580616, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.0002511017909124607, + "loss": 0.0235, "step": 125760 }, { - "epoch": 0.63, - "learning_rate": 0.00020482112496279217, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00025109790269608925, + "loss": 0.0243, "step": 125770 }, { - "epoch": 0.63, - "learning_rate": 0.00020481355726977815, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.00025109401447971776, + "loss": 0.0258, "step": 125780 }, { - "epoch": 0.63, - "learning_rate": 0.00020480598957676413, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002510901262633463, + "loss": 0.0314, "step": 125790 }, { - "epoch": 0.63, - "learning_rate": 0.00020479842188375014, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.0002510862380469748, + "loss": 0.0227, "step": 125800 }, { - "epoch": 0.63, - "learning_rate": 0.00020479085419073612, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.00025108234983060336, + "loss": 0.0201, "step": 125810 }, { - "epoch": 0.63, - "learning_rate": 0.0002047832864977221, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.0002510784616142319, + "loss": 0.0186, "step": 125820 }, { - "epoch": 0.63, - "learning_rate": 0.0002047757188047081, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.00025107457339786044, + "loss": 0.0297, "step": 125830 }, { - "epoch": 0.63, - "learning_rate": 0.0002047681511116941, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.00025107068518148896, + "loss": 0.0212, "step": 125840 }, { - "epoch": 0.63, - "learning_rate": 0.00020476058341868008, - "loss": 0.0178, + "epoch": 0.33, + "learning_rate": 0.0002510667969651175, + "loss": 0.0173, "step": 125850 }, { - "epoch": 0.63, - "learning_rate": 0.00020475301572566606, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.00025106290874874604, + "loss": 0.0261, "step": 125860 }, { - "epoch": 0.64, - "learning_rate": 0.00020474544803265207, - "loss": 0.017, + "epoch": 0.33, + "learning_rate": 0.00025105902053237456, + "loss": 0.0222, "step": 125870 }, { - "epoch": 0.64, - "learning_rate": 0.00020473788033963805, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00025105513231600307, + "loss": 0.0188, "step": 125880 }, { - "epoch": 0.64, - "learning_rate": 0.00020473031264662403, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025105124409963164, + "loss": 0.0213, "step": 125890 }, { - "epoch": 0.64, - "learning_rate": 0.00020472274495361004, - "loss": 0.0113, + "epoch": 0.33, + "learning_rate": 0.00025104735588326015, + "loss": 0.0249, "step": 125900 }, { - "epoch": 0.64, - "learning_rate": 0.00020471517726059602, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002510434676668887, + "loss": 0.0184, "step": 125910 }, { - "epoch": 0.64, - "learning_rate": 0.000204707609567582, - "loss": 0.0166, + "epoch": 0.33, + "learning_rate": 0.00025103957945051724, + "loss": 0.0184, "step": 125920 }, { - "epoch": 0.64, - "learning_rate": 0.000204700041874568, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025103569123414575, + "loss": 0.0236, "step": 125930 }, { - "epoch": 0.64, - "learning_rate": 0.000204692474181554, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.0002510318030177743, + "loss": 0.02, "step": 125940 }, { - "epoch": 0.64, - "learning_rate": 0.00020468490648853997, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00025102791480140284, + "loss": 0.0239, "step": 125950 }, { - "epoch": 0.64, - "learning_rate": 0.00020467733879552598, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.0002510240265850314, + "loss": 0.0223, "step": 125960 }, { - "epoch": 0.64, - "learning_rate": 0.00020466977110251196, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002510201383686599, + "loss": 0.0183, "step": 125970 }, { - "epoch": 0.64, - "learning_rate": 0.00020466220340949794, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002510162501522885, + "loss": 0.0225, "step": 125980 }, { - "epoch": 0.64, - "learning_rate": 0.00020465463571648393, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.000251012361935917, + "loss": 0.0206, "step": 125990 }, { - "epoch": 0.64, - "learning_rate": 0.00020464706802346993, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002510084737195455, + "loss": 0.0194, "step": 126000 }, { - "epoch": 0.64, - "eval_cer": 0.9145129533326799, - "eval_loss": 0.010170434601604939, - "eval_runtime": 116.6449, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.287, + "epoch": 0.33, + "eval_cer": 0.8818146572779021, + "eval_loss": 0.014803457073867321, + "eval_runtime": 107.7105, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, "step": 126000 }, { - "epoch": 0.64, - "learning_rate": 0.00020463950033045592, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025100458550317403, + "loss": 0.0184, "step": 126010 }, { - "epoch": 0.64, - "learning_rate": 0.0002046319326374419, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.0002510006972868026, + "loss": 0.0157, "step": 126020 }, { - "epoch": 0.64, - "learning_rate": 0.0002046243649444279, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.0002509968090704311, + "loss": 0.0205, "step": 126030 }, { - "epoch": 0.64, - "learning_rate": 0.0002046167972514139, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.0002509929208540597, + "loss": 0.0212, "step": 126040 }, { - "epoch": 0.64, - "learning_rate": 0.00020460922955839987, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.0002509890326376882, + "loss": 0.017, "step": 126050 }, { - "epoch": 0.64, - "learning_rate": 0.00020460166186538588, - "loss": 0.0184, + "epoch": 0.33, + "learning_rate": 0.0002509851444213167, + "loss": 0.0213, "step": 126060 }, { - "epoch": 0.64, - "learning_rate": 0.00020459409417237186, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.0002509812562049453, + "loss": 0.0203, "step": 126070 }, { - "epoch": 0.64, - "learning_rate": 0.00020458652647935784, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.0002509773679885738, + "loss": 0.0206, "step": 126080 }, { - "epoch": 0.64, - "learning_rate": 0.00020457895878634385, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002509734797722023, + "loss": 0.0189, "step": 126090 }, { - "epoch": 0.64, - "learning_rate": 0.00020457139109332983, - "loss": 0.0206, + "epoch": 0.33, + "learning_rate": 0.0002509695915558309, + "loss": 0.0177, "step": 126100 }, { - "epoch": 0.64, - "learning_rate": 0.0002045638234003158, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025096570333945945, + "loss": 0.0171, "step": 126110 }, { - "epoch": 0.64, - "learning_rate": 0.00020455625570730182, - "loss": 0.0186, + "epoch": 0.33, + "learning_rate": 0.00025096181512308796, + "loss": 0.0227, "step": 126120 }, { - "epoch": 0.64, - "learning_rate": 0.0002045486880142878, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.0002509579269067165, + "loss": 0.0209, "step": 126130 }, { - "epoch": 0.64, - "learning_rate": 0.00020454112032127378, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.000250954038690345, + "loss": 0.0257, "step": 126140 }, { - "epoch": 0.64, - "learning_rate": 0.00020453355262825976, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.00025095015047397356, + "loss": 0.0224, "step": 126150 }, { - "epoch": 0.64, - "learning_rate": 0.00020452598493524577, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002509462622576021, + "loss": 0.0165, "step": 126160 }, { - "epoch": 0.64, - "learning_rate": 0.00020451841724223175, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.00025094237404123064, + "loss": 0.0174, "step": 126170 }, { - "epoch": 0.64, - "learning_rate": 0.00020451084954921774, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.00025093848582485916, + "loss": 0.0176, "step": 126180 }, { - "epoch": 0.64, - "learning_rate": 0.00020450328185620374, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.0002509345976084877, + "loss": 0.0258, "step": 126190 }, { - "epoch": 0.64, - "learning_rate": 0.00020449571416318973, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.00025093070939211624, + "loss": 0.0216, "step": 126200 }, { - "epoch": 0.64, - "learning_rate": 0.0002044881464701757, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.00025092682117574476, + "loss": 0.0257, "step": 126210 }, { - "epoch": 0.64, - "learning_rate": 0.00020448057877716172, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.00025092293295937327, + "loss": 0.0194, "step": 126220 }, { - "epoch": 0.64, - "learning_rate": 0.0002044730110841477, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025091904474300184, + "loss": 0.0168, "step": 126230 }, { - "epoch": 0.64, - "learning_rate": 0.00020446544339113368, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025091515652663035, + "loss": 0.0249, "step": 126240 }, { - "epoch": 0.64, - "learning_rate": 0.0002044578756981197, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.0002509112683102589, + "loss": 0.0213, "step": 126250 }, { - "epoch": 0.64, - "learning_rate": 0.00020445030800510567, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00025090738009388744, + "loss": 0.0203, "step": 126260 }, { - "epoch": 0.64, - "learning_rate": 0.00020444274031209165, - "loss": 0.0187, + "epoch": 0.33, + "learning_rate": 0.000250903491877516, + "loss": 0.0185, "step": 126270 }, { - "epoch": 0.64, - "learning_rate": 0.00020443517261907766, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002508996036611445, + "loss": 0.0283, "step": 126280 }, { - "epoch": 0.64, - "learning_rate": 0.00020442760492606364, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.00025089571544477303, + "loss": 0.0175, "step": 126290 }, { - "epoch": 0.64, - "learning_rate": 0.00020442003723304962, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.00025089182722840155, + "loss": 0.0197, "step": 126300 }, { - "epoch": 0.64, - "learning_rate": 0.00020441246954003563, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002508879390120301, + "loss": 0.0209, "step": 126310 }, { - "epoch": 0.64, - "learning_rate": 0.00020440490184702158, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.0002508840507956587, + "loss": 0.021, "step": 126320 }, { - "epoch": 0.64, - "learning_rate": 0.00020439733415400757, - "loss": 0.0179, + "epoch": 0.33, + "learning_rate": 0.0002508801625792872, + "loss": 0.0175, "step": 126330 }, { - "epoch": 0.64, - "learning_rate": 0.00020438976646099355, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.0002508762743629157, + "loss": 0.0187, "step": 126340 }, { - "epoch": 0.64, - "learning_rate": 0.00020438219876797956, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025087238614654423, + "loss": 0.0225, "step": 126350 }, { - "epoch": 0.64, - "learning_rate": 0.00020437463107496554, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002508684979301728, + "loss": 0.0188, "step": 126360 }, { - "epoch": 0.64, - "learning_rate": 0.00020436706338195152, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002508646097138013, + "loss": 0.0289, "step": 126370 }, { - "epoch": 0.64, - "learning_rate": 0.0002043594956889375, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002508607214974299, + "loss": 0.0224, "step": 126380 }, { - "epoch": 0.64, - "learning_rate": 0.0002043519279959235, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002508568332810584, + "loss": 0.0216, "step": 126390 }, { - "epoch": 0.64, - "learning_rate": 0.0002043443603029095, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025085294506468697, + "loss": 0.0187, "step": 126400 }, { - "epoch": 0.64, - "learning_rate": 0.00020433679260989547, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.0002508490568483155, + "loss": 0.0218, "step": 126410 }, { - "epoch": 0.64, - "learning_rate": 0.00020432922491688148, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.000250845168631944, + "loss": 0.0185, "step": 126420 }, { - "epoch": 0.64, - "learning_rate": 0.00020432165722386746, - "loss": 0.0115, + "epoch": 0.33, + "learning_rate": 0.0002508412804155725, + "loss": 0.0188, "step": 126430 }, { - "epoch": 0.64, - "learning_rate": 0.00020431408953085344, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.0002508373921992011, + "loss": 0.0202, "step": 126440 }, { - "epoch": 0.64, - "learning_rate": 0.00020430652183783945, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.00025083350398282965, + "loss": 0.0198, "step": 126450 }, { - "epoch": 0.64, - "learning_rate": 0.00020429895414482543, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.00025082961576645816, + "loss": 0.0237, "step": 126460 }, { - "epoch": 0.64, - "learning_rate": 0.00020429138645181141, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.0002508257275500867, + "loss": 0.0255, "step": 126470 }, { - "epoch": 0.64, - "learning_rate": 0.00020428381875879742, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025082183933371524, + "loss": 0.0248, "step": 126480 }, { - "epoch": 0.64, - "learning_rate": 0.0002042762510657834, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.00025081795111734376, + "loss": 0.0199, "step": 126490 }, { - "epoch": 0.64, - "learning_rate": 0.00020426868337276939, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002508140629009723, + "loss": 0.02, "step": 126500 }, { - "epoch": 0.64, - "learning_rate": 0.0002042611156797554, - "loss": 0.0168, + "epoch": 0.33, + "learning_rate": 0.00025081017468460084, + "loss": 0.0212, "step": 126510 }, { - "epoch": 0.64, - "learning_rate": 0.00020425354798674138, - "loss": 0.0119, + "epoch": 0.33, + "learning_rate": 0.00025080628646822936, + "loss": 0.0201, "step": 126520 }, { - "epoch": 0.64, - "learning_rate": 0.00020424598029372736, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002508023982518579, + "loss": 0.0226, "step": 126530 }, { - "epoch": 0.64, - "learning_rate": 0.00020423841260071334, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.00025079851003548644, + "loss": 0.0191, "step": 126540 }, { - "epoch": 0.64, - "learning_rate": 0.00020423084490769935, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.00025079462181911495, + "loss": 0.0225, "step": 126550 }, { - "epoch": 0.64, - "learning_rate": 0.00020422327721468533, - "loss": 0.0168, + "epoch": 0.33, + "learning_rate": 0.00025079073360274347, + "loss": 0.0228, "step": 126560 }, { - "epoch": 0.64, - "learning_rate": 0.0002042157095216713, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00025078684538637204, + "loss": 0.0221, "step": 126570 }, { - "epoch": 0.64, - "learning_rate": 0.00020420814182865732, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.00025078295717000055, + "loss": 0.0206, "step": 126580 }, { - "epoch": 0.64, - "learning_rate": 0.0002042005741356433, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002507790689536291, + "loss": 0.0202, "step": 126590 }, { - "epoch": 0.64, - "learning_rate": 0.00020419300644262928, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025077518073725764, + "loss": 0.0227, "step": 126600 }, { - "epoch": 0.64, - "learning_rate": 0.0002041854387496153, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.0002507712925208862, + "loss": 0.0213, "step": 126610 }, { - "epoch": 0.64, - "learning_rate": 0.00020417787105660127, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002507674043045147, + "loss": 0.0212, "step": 126620 }, { - "epoch": 0.64, - "learning_rate": 0.00020417030336358725, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.00025076351608814323, + "loss": 0.021, "step": 126630 }, { - "epoch": 0.64, - "learning_rate": 0.00020416273567057326, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00025075962787177175, + "loss": 0.0206, "step": 126640 }, { - "epoch": 0.64, - "learning_rate": 0.00020415516797755924, - "loss": 0.0119, + "epoch": 0.33, + "learning_rate": 0.0002507557396554003, + "loss": 0.0207, "step": 126650 }, { - "epoch": 0.64, - "learning_rate": 0.00020414760028454522, - "loss": 0.0109, + "epoch": 0.33, + "learning_rate": 0.0002507518514390289, + "loss": 0.0216, "step": 126660 }, { - "epoch": 0.64, - "learning_rate": 0.00020414003259153123, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002507479632226574, + "loss": 0.0213, "step": 126670 }, { - "epoch": 0.64, - "learning_rate": 0.00020413246489851721, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.0002507440750062859, + "loss": 0.0198, "step": 126680 }, { - "epoch": 0.64, - "learning_rate": 0.0002041248972055032, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002507401867899145, + "loss": 0.0192, "step": 126690 }, { - "epoch": 0.64, - "learning_rate": 0.0002041173295124892, - "loss": 0.0172, + "epoch": 0.33, + "learning_rate": 0.000250736298573543, + "loss": 0.0165, "step": 126700 }, { - "epoch": 0.64, - "learning_rate": 0.00020410976181947519, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.0002507324103571715, + "loss": 0.0185, "step": 126710 }, { - "epoch": 0.64, - "learning_rate": 0.00020410219412646117, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002507285221408001, + "loss": 0.0172, "step": 126720 }, { - "epoch": 0.64, - "learning_rate": 0.00020409462643344715, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002507246339244286, + "loss": 0.0198, "step": 126730 }, { - "epoch": 0.64, - "learning_rate": 0.00020408705874043316, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.00025072074570805716, + "loss": 0.0219, "step": 126740 }, { - "epoch": 0.64, - "learning_rate": 0.00020407949104741914, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.0002507168574916857, + "loss": 0.0182, "step": 126750 }, { - "epoch": 0.64, - "learning_rate": 0.00020407192335440512, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002507129692753142, + "loss": 0.0192, "step": 126760 }, { - "epoch": 0.64, - "learning_rate": 0.00020406435566139113, - "loss": 0.0166, + "epoch": 0.33, + "learning_rate": 0.00025070908105894276, + "loss": 0.0221, "step": 126770 }, { - "epoch": 0.64, - "learning_rate": 0.0002040567879683771, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002507051928425713, + "loss": 0.0184, "step": 126780 }, { - "epoch": 0.64, - "learning_rate": 0.0002040492202753631, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002507013046261998, + "loss": 0.0216, "step": 126790 }, { - "epoch": 0.64, - "learning_rate": 0.0002040416525823491, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.00025069741640982836, + "loss": 0.0191, "step": 126800 }, { - "epoch": 0.64, - "learning_rate": 0.00020403408488933508, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002506935281934569, + "loss": 0.0183, "step": 126810 }, { - "epoch": 0.64, - "learning_rate": 0.00020402651719632106, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025068963997708544, + "loss": 0.0201, "step": 126820 }, { - "epoch": 0.64, - "learning_rate": 0.00020401894950330707, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025068575176071396, + "loss": 0.0204, "step": 126830 }, { - "epoch": 0.64, - "learning_rate": 0.00020401138181029305, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025068186354434247, + "loss": 0.019, "step": 126840 }, { - "epoch": 0.64, - "learning_rate": 0.00020400381411727903, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025067797532797104, + "loss": 0.0197, "step": 126850 }, { - "epoch": 0.64, - "learning_rate": 0.00020399624642426504, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025067408711159956, + "loss": 0.0196, "step": 126860 }, { - "epoch": 0.64, - "learning_rate": 0.00020398867873125102, - "loss": 0.0111, + "epoch": 0.33, + "learning_rate": 0.0002506701988952281, + "loss": 0.0257, "step": 126870 }, { - "epoch": 0.64, - "learning_rate": 0.000203981111038237, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.00025066631067885664, + "loss": 0.0209, "step": 126880 }, { - "epoch": 0.64, - "learning_rate": 0.000203973543345223, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025066242246248515, + "loss": 0.0198, "step": 126890 }, { - "epoch": 0.64, - "learning_rate": 0.000203965975652209, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.0002506585342461137, + "loss": 0.0192, "step": 126900 }, { - "epoch": 0.64, - "learning_rate": 0.00020395840795919498, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.00025065464602974224, + "loss": 0.0201, "step": 126910 }, { - "epoch": 0.64, - "learning_rate": 0.00020395084026618096, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.00025065075781337075, + "loss": 0.0198, "step": 126920 }, { - "epoch": 0.64, - "learning_rate": 0.00020394327257316697, - "loss": 0.0108, + "epoch": 0.33, + "learning_rate": 0.0002506468695969993, + "loss": 0.0202, "step": 126930 }, { - "epoch": 0.64, - "learning_rate": 0.00020393570488015295, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.00025064298138062783, + "loss": 0.0201, "step": 126940 }, { - "epoch": 0.64, - "learning_rate": 0.00020392813718713893, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.0002506390931642564, + "loss": 0.0191, "step": 126950 }, { - "epoch": 0.64, - "learning_rate": 0.00020392056949412494, - "loss": 0.019, + "epoch": 0.33, + "learning_rate": 0.0002506352049478849, + "loss": 0.0179, "step": 126960 }, { - "epoch": 0.64, - "learning_rate": 0.00020391300180111092, - "loss": 0.0196, + "epoch": 0.33, + "learning_rate": 0.00025063131673151343, + "loss": 0.0231, "step": 126970 }, { - "epoch": 0.64, - "learning_rate": 0.0002039054341080969, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.000250627428515142, + "loss": 0.0216, "step": 126980 }, { - "epoch": 0.64, - "learning_rate": 0.0002038978664150829, - "loss": 0.012, + "epoch": 0.33, + "learning_rate": 0.0002506235402987705, + "loss": 0.0217, "step": 126990 }, { - "epoch": 0.64, - "learning_rate": 0.0002038902987220689, - "loss": 0.0183, + "epoch": 0.33, + "learning_rate": 0.0002506196520823991, + "loss": 0.025, "step": 127000 }, { - "epoch": 0.64, - "eval_cer": 0.9145129533326799, - "eval_loss": 0.010238048620522022, - "eval_runtime": 116.573, - "eval_samples_per_second": 17.157, - "eval_steps_per_second": 4.289, + "epoch": 0.33, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.014219284057617188, + "eval_runtime": 107.5382, + "eval_samples_per_second": 18.598, + "eval_steps_per_second": 4.65, "step": 127000 }, { - "epoch": 0.64, - "learning_rate": 0.00020388273102905487, - "loss": 0.0118, + "epoch": 0.33, + "learning_rate": 0.0002506157638660276, + "loss": 0.0177, "step": 127010 }, { - "epoch": 0.64, - "learning_rate": 0.00020387516333604088, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.00025061187564965617, + "loss": 0.0191, "step": 127020 }, { - "epoch": 0.64, - "learning_rate": 0.00020386759564302686, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002506079874332847, + "loss": 0.0191, "step": 127030 }, { - "epoch": 0.64, - "learning_rate": 0.00020386002795001284, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002506040992169132, + "loss": 0.0264, "step": 127040 }, { - "epoch": 0.64, - "learning_rate": 0.00020385246025699883, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002506002110005417, + "loss": 0.0173, "step": 127050 }, { - "epoch": 0.64, - "learning_rate": 0.00020384489256398483, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.0002505963227841703, + "loss": 0.0218, "step": 127060 }, { - "epoch": 0.64, - "learning_rate": 0.00020383732487097082, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.0002505924345677988, + "loss": 0.0217, "step": 127070 }, { - "epoch": 0.64, - "learning_rate": 0.0002038297571779568, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.00025058854635142736, + "loss": 0.0215, "step": 127080 }, { - "epoch": 0.64, - "learning_rate": 0.0002038221894849428, - "loss": 0.0158, + "epoch": 0.33, + "learning_rate": 0.0002505846581350559, + "loss": 0.0159, "step": 127090 }, { - "epoch": 0.64, - "learning_rate": 0.0002038146217919288, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.0002505807699186844, + "loss": 0.0215, "step": 127100 }, { - "epoch": 0.64, - "learning_rate": 0.00020380705409891477, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.00025057688170231296, + "loss": 0.017, "step": 127110 }, { - "epoch": 0.64, - "learning_rate": 0.00020379948640590078, - "loss": 0.0113, + "epoch": 0.33, + "learning_rate": 0.0002505729934859415, + "loss": 0.02, "step": 127120 }, { - "epoch": 0.64, - "learning_rate": 0.00020379191871288676, - "loss": 0.0169, + "epoch": 0.33, + "learning_rate": 0.00025056910526957, + "loss": 0.0178, "step": 127130 }, { - "epoch": 0.64, - "learning_rate": 0.00020378435101987274, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025056521705319856, + "loss": 0.0167, "step": 127140 }, { - "epoch": 0.64, - "learning_rate": 0.00020377678332685875, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.00025056132883682713, + "loss": 0.025, "step": 127150 }, { - "epoch": 0.64, - "learning_rate": 0.00020376921563384473, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00025055744062045564, + "loss": 0.0197, "step": 127160 }, { - "epoch": 0.64, - "learning_rate": 0.0002037616479408307, - "loss": 0.0113, + "epoch": 0.33, + "learning_rate": 0.00025055355240408416, + "loss": 0.0211, "step": 127170 }, { - "epoch": 0.64, - "learning_rate": 0.00020375408024781672, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00025054966418771267, + "loss": 0.022, "step": 127180 }, { - "epoch": 0.64, - "learning_rate": 0.0002037465125548027, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025054577597134124, + "loss": 0.025, "step": 127190 }, { - "epoch": 0.64, - "learning_rate": 0.00020373894486178868, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.00025054188775496975, + "loss": 0.0424, "step": 127200 }, { - "epoch": 0.64, - "learning_rate": 0.0002037313771687747, - "loss": 0.0143, + "epoch": 0.33, + "learning_rate": 0.0002505379995385983, + "loss": 0.0212, "step": 127210 }, { - "epoch": 0.64, - "learning_rate": 0.00020372380947576067, - "loss": 0.0108, + "epoch": 0.33, + "learning_rate": 0.00025053411132222684, + "loss": 0.0181, "step": 127220 }, { - "epoch": 0.64, - "learning_rate": 0.00020371624178274665, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002505302231058554, + "loss": 0.0205, "step": 127230 }, { - "epoch": 0.64, - "learning_rate": 0.00020370867408973264, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.0002505263348894839, + "loss": 0.0221, "step": 127240 }, { - "epoch": 0.64, - "learning_rate": 0.00020370110639671864, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.00025052244667311244, + "loss": 0.0223, "step": 127250 }, { - "epoch": 0.64, - "learning_rate": 0.00020369353870370463, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025051855845674095, + "loss": 0.0235, "step": 127260 }, { - "epoch": 0.64, - "learning_rate": 0.0002036859710106906, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.0002505146702403695, + "loss": 0.0272, "step": 127270 }, { - "epoch": 0.64, - "learning_rate": 0.00020367840331767662, - "loss": 0.0186, + "epoch": 0.33, + "learning_rate": 0.00025051078202399803, + "loss": 0.0237, "step": 127280 }, { - "epoch": 0.64, - "learning_rate": 0.0002036708356246626, - "loss": 0.012, + "epoch": 0.33, + "learning_rate": 0.0002505068938076266, + "loss": 0.0257, "step": 127290 }, { - "epoch": 0.64, - "learning_rate": 0.00020366326793164858, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.0002505030055912551, + "loss": 0.019, "step": 127300 }, { - "epoch": 0.64, - "learning_rate": 0.0002036557002386346, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025049911737488363, + "loss": 0.021, "step": 127310 }, { - "epoch": 0.64, - "learning_rate": 0.00020364813254562057, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.0002504952291585122, + "loss": 0.0188, "step": 127320 }, { - "epoch": 0.64, - "learning_rate": 0.00020364056485260655, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.0002504913409421407, + "loss": 0.0188, "step": 127330 }, { - "epoch": 0.64, - "learning_rate": 0.00020363299715959256, - "loss": 0.0158, + "epoch": 0.33, + "learning_rate": 0.00025048745272576923, + "loss": 0.021, "step": 127340 }, { - "epoch": 0.64, - "learning_rate": 0.00020362542946657854, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.0002504835645093978, + "loss": 0.0234, "step": 127350 }, { - "epoch": 0.64, - "learning_rate": 0.00020361786177356452, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025047967629302637, + "loss": 0.0212, "step": 127360 }, { - "epoch": 0.64, - "learning_rate": 0.00020361029408055053, - "loss": 0.0118, + "epoch": 0.33, + "learning_rate": 0.0002504757880766549, + "loss": 0.0178, "step": 127370 }, { - "epoch": 0.64, - "learning_rate": 0.0002036027263875365, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.0002504718998602834, + "loss": 0.0211, "step": 127380 }, { - "epoch": 0.64, - "learning_rate": 0.0002035951586945225, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002504680116439119, + "loss": 0.0168, "step": 127390 }, { - "epoch": 0.64, - "learning_rate": 0.00020358759100150848, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002504641234275405, + "loss": 0.0211, "step": 127400 }, { - "epoch": 0.64, - "learning_rate": 0.00020358002330849448, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.000250460235211169, + "loss": 0.0196, "step": 127410 }, { - "epoch": 0.64, - "learning_rate": 0.00020357245561548047, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.00025045634699479756, + "loss": 0.0209, "step": 127420 }, { - "epoch": 0.64, - "learning_rate": 0.00020356488792246645, - "loss": 0.0091, + "epoch": 0.33, + "learning_rate": 0.0002504524587784261, + "loss": 0.0173, "step": 127430 }, { - "epoch": 0.64, - "learning_rate": 0.00020355732022945246, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.00025044857056205465, + "loss": 0.0191, "step": 127440 }, { - "epoch": 0.64, - "learning_rate": 0.00020354975253643844, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.00025044468234568316, + "loss": 0.0209, "step": 127450 }, { - "epoch": 0.64, - "learning_rate": 0.00020354218484342442, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.0002504407941293117, + "loss": 0.0201, "step": 127460 }, { - "epoch": 0.64, - "learning_rate": 0.00020353461715041043, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002504369059129402, + "loss": 0.0207, "step": 127470 }, { - "epoch": 0.64, - "learning_rate": 0.0002035270494573964, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025043301769656876, + "loss": 0.018, "step": 127480 }, { - "epoch": 0.64, - "learning_rate": 0.0002035194817643824, - "loss": 0.016, + "epoch": 0.33, + "learning_rate": 0.00025042912948019727, + "loss": 0.0221, "step": 127490 }, { - "epoch": 0.64, - "learning_rate": 0.0002035119140713684, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.00025042524126382584, + "loss": 0.0213, "step": 127500 }, { - "epoch": 0.64, - "learning_rate": 0.00020350434637835438, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00025042135304745436, + "loss": 0.0197, "step": 127510 }, { - "epoch": 0.64, - "learning_rate": 0.00020349677868534036, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.0002504174648310829, + "loss": 0.0195, "step": 127520 }, { - "epoch": 0.64, - "learning_rate": 0.00020348921099232637, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025041357661471144, + "loss": 0.0204, "step": 127530 }, { - "epoch": 0.64, - "learning_rate": 0.00020348164329931235, - "loss": 0.0107, + "epoch": 0.33, + "learning_rate": 0.00025040968839833995, + "loss": 0.0199, "step": 127540 }, { - "epoch": 0.64, - "learning_rate": 0.00020347407560629833, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002504058001819685, + "loss": 0.0184, "step": 127550 }, { - "epoch": 0.64, - "learning_rate": 0.00020346650791328431, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.00025040191196559704, + "loss": 0.0242, "step": 127560 }, { - "epoch": 0.64, - "learning_rate": 0.00020345894022027032, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.0002503980237492256, + "loss": 0.0169, "step": 127570 }, { - "epoch": 0.64, - "learning_rate": 0.00020345137252725628, - "loss": 0.0171, + "epoch": 0.33, + "learning_rate": 0.0002503941355328541, + "loss": 0.0169, "step": 127580 }, { - "epoch": 0.64, - "learning_rate": 0.00020344380483424226, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.00025039024731648263, + "loss": 0.0254, "step": 127590 }, { - "epoch": 0.64, - "learning_rate": 0.00020343623714122827, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00025038635910011115, + "loss": 0.0198, "step": 127600 }, { - "epoch": 0.64, - "learning_rate": 0.00020342866944821425, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002503824708837397, + "loss": 0.0172, "step": 127610 }, { - "epoch": 0.64, - "learning_rate": 0.00020342110175520023, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.00025037858266736823, + "loss": 0.0194, "step": 127620 }, { - "epoch": 0.64, - "learning_rate": 0.0002034135340621862, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.0002503746944509968, + "loss": 0.0216, "step": 127630 }, { - "epoch": 0.64, - "learning_rate": 0.00020340596636917222, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002503708062346253, + "loss": 0.019, "step": 127640 }, { - "epoch": 0.64, - "learning_rate": 0.0002033983986761582, - "loss": 0.0109, + "epoch": 0.33, + "learning_rate": 0.0002503669180182539, + "loss": 0.0207, "step": 127650 }, { - "epoch": 0.64, - "learning_rate": 0.00020339083098314418, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.0002503630298018824, + "loss": 0.0209, "step": 127660 }, { - "epoch": 0.64, - "learning_rate": 0.0002033832632901302, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.0002503591415855109, + "loss": 0.0203, "step": 127670 }, { - "epoch": 0.64, - "learning_rate": 0.00020337569559711617, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.00025035525336913943, + "loss": 0.0189, "step": 127680 }, { - "epoch": 0.64, - "learning_rate": 0.00020336812790410215, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.000250351365152768, + "loss": 0.0206, "step": 127690 }, { - "epoch": 0.64, - "learning_rate": 0.00020336056021108816, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00025034747693639657, + "loss": 0.0172, "step": 127700 }, { - "epoch": 0.64, - "learning_rate": 0.00020335299251807414, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002503435887200251, + "loss": 0.0189, "step": 127710 }, { - "epoch": 0.64, - "learning_rate": 0.00020334542482506013, - "loss": 0.0164, + "epoch": 0.33, + "learning_rate": 0.0002503397005036536, + "loss": 0.0234, "step": 127720 }, { - "epoch": 0.64, - "learning_rate": 0.00020333785713204613, - "loss": 0.0194, + "epoch": 0.33, + "learning_rate": 0.00025033581228728216, + "loss": 0.0295, "step": 127730 }, { - "epoch": 0.64, - "learning_rate": 0.00020333028943903212, - "loss": 0.0193, + "epoch": 0.33, + "learning_rate": 0.0002503319240709107, + "loss": 0.0194, "step": 127740 }, { - "epoch": 0.64, - "learning_rate": 0.0002033227217460181, - "loss": 0.0237, + "epoch": 0.33, + "learning_rate": 0.0002503280358545392, + "loss": 0.0182, "step": 127750 }, { - "epoch": 0.64, - "learning_rate": 0.0002033151540530041, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.00025032414763816776, + "loss": 0.0185, "step": 127760 }, { - "epoch": 0.64, - "learning_rate": 0.0002033075863599901, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002503202594217963, + "loss": 0.0203, "step": 127770 }, { - "epoch": 0.64, - "learning_rate": 0.00020330001866697607, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00025031637120542484, + "loss": 0.0155, "step": 127780 }, { - "epoch": 0.64, - "learning_rate": 0.00020329245097396205, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025031248298905336, + "loss": 0.0207, "step": 127790 }, { - "epoch": 0.64, - "learning_rate": 0.00020328488328094806, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002503085947726819, + "loss": 0.0215, "step": 127800 }, { - "epoch": 0.64, - "learning_rate": 0.00020327731558793404, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.0002503047065563104, + "loss": 0.0191, "step": 127810 }, { - "epoch": 0.64, - "learning_rate": 0.00020326974789492002, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.00025030081833993896, + "loss": 0.0204, "step": 127820 }, { - "epoch": 0.64, - "learning_rate": 0.00020326218020190603, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025029693012356747, + "loss": 0.0221, "step": 127830 }, { - "epoch": 0.64, - "learning_rate": 0.000203254612508892, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.00025029304190719604, + "loss": 0.0219, "step": 127840 }, { - "epoch": 0.65, - "learning_rate": 0.000203247044815878, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.00025028915369082455, + "loss": 0.0199, "step": 127850 }, { - "epoch": 0.65, - "learning_rate": 0.000203239477122864, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002502852654744531, + "loss": 0.0245, "step": 127860 }, { - "epoch": 0.65, - "learning_rate": 0.00020323190942984998, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.00025028137725808164, + "loss": 0.0193, "step": 127870 }, { - "epoch": 0.65, - "learning_rate": 0.00020322434173683596, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.00025027748904171015, + "loss": 0.0216, "step": 127880 }, { - "epoch": 0.65, - "learning_rate": 0.00020321677404382197, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.00025027360082533867, + "loss": 0.0226, "step": 127890 }, { - "epoch": 0.65, - "learning_rate": 0.00020320920635080795, - "loss": 0.0119, + "epoch": 0.33, + "learning_rate": 0.00025026971260896724, + "loss": 0.0233, "step": 127900 }, { - "epoch": 0.65, - "learning_rate": 0.00020320163865779394, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002502658243925958, + "loss": 0.0191, "step": 127910 }, { - "epoch": 0.65, - "learning_rate": 0.00020319407096477994, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002502619361762243, + "loss": 0.0189, "step": 127920 }, { - "epoch": 0.65, - "learning_rate": 0.00020318650327176593, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.00025025804795985283, + "loss": 0.0217, "step": 127930 }, { - "epoch": 0.65, - "learning_rate": 0.0002031789355787519, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.0002502541597434814, + "loss": 0.0197, "step": 127940 }, { - "epoch": 0.65, - "learning_rate": 0.0002031713678857379, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.0002502502715271099, + "loss": 0.0201, "step": 127950 }, { - "epoch": 0.65, - "learning_rate": 0.0002031638001927239, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00025024638331073843, + "loss": 0.0249, "step": 127960 }, { - "epoch": 0.65, - "learning_rate": 0.00020315623249970988, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.000250242495094367, + "loss": 0.0215, "step": 127970 }, { - "epoch": 0.65, - "learning_rate": 0.00020314866480669586, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.0002502386068779955, + "loss": 0.0176, "step": 127980 }, { - "epoch": 0.65, - "learning_rate": 0.00020314109711368187, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.0002502347186616241, + "loss": 0.0257, "step": 127990 }, { - "epoch": 0.65, - "learning_rate": 0.00020313352942066785, - "loss": 0.0139, + "epoch": 0.33, + "learning_rate": 0.0002502308304452526, + "loss": 0.0264, "step": 128000 }, { - "epoch": 0.65, - "eval_cer": 0.914481900656667, - "eval_loss": 0.01020896527916193, - "eval_runtime": 116.605, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.33, + "eval_cer": 0.8818188561887047, + "eval_loss": 0.014465493150055408, + "eval_runtime": 107.6927, + "eval_samples_per_second": 18.571, + "eval_steps_per_second": 4.643, "step": 128000 }, { - "epoch": 0.65, - "learning_rate": 0.00020312596172765383, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002502269422288811, + "loss": 0.0197, "step": 128010 }, { - "epoch": 0.65, - "learning_rate": 0.00020311839403463984, - "loss": 0.0158, + "epoch": 0.33, + "learning_rate": 0.0002502230540125097, + "loss": 0.0175, "step": 128020 }, { - "epoch": 0.65, - "learning_rate": 0.00020311082634162582, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002502191657961382, + "loss": 0.0189, "step": 128030 }, { - "epoch": 0.65, - "learning_rate": 0.0002031032586486118, + "epoch": 0.33, + "learning_rate": 0.00025021527757976676, "loss": 0.0171, "step": 128040 }, { - "epoch": 0.65, - "learning_rate": 0.0002030956909555978, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.0002502113893633953, + "loss": 0.0202, "step": 128050 }, { - "epoch": 0.65, - "learning_rate": 0.0002030881232625838, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002502075011470238, + "loss": 0.0208, "step": 128060 }, { - "epoch": 0.65, - "learning_rate": 0.00020308055556956977, - "loss": 0.0196, + "epoch": 0.33, + "learning_rate": 0.00025020361293065236, + "loss": 0.0198, "step": 128070 }, { - "epoch": 0.65, - "learning_rate": 0.00020307298787655578, - "loss": 0.0173, + "epoch": 0.33, + "learning_rate": 0.0002501997247142809, + "loss": 0.0223, "step": 128080 }, { - "epoch": 0.65, - "learning_rate": 0.00020306542018354176, - "loss": 0.018, + "epoch": 0.33, + "learning_rate": 0.0002501958364979094, + "loss": 0.0223, "step": 128090 }, { - "epoch": 0.65, - "learning_rate": 0.00020305785249052775, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.00025019194828153796, + "loss": 0.02, "step": 128100 }, { - "epoch": 0.65, - "learning_rate": 0.00020305028479751375, - "loss": 0.0195, + "epoch": 0.33, + "learning_rate": 0.0002501880600651665, + "loss": 0.0143, "step": 128110 }, { - "epoch": 0.65, - "learning_rate": 0.00020304271710449974, - "loss": 0.0158, + "epoch": 0.33, + "learning_rate": 0.00025018417184879504, + "loss": 0.0262, "step": 128120 }, { - "epoch": 0.65, - "learning_rate": 0.00020303514941148572, - "loss": 0.0177, + "epoch": 0.33, + "learning_rate": 0.00025018028363242356, + "loss": 0.0189, "step": 128130 }, { - "epoch": 0.65, - "learning_rate": 0.0002030275817184717, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.00025017639541605207, + "loss": 0.0191, "step": 128140 }, { - "epoch": 0.65, - "learning_rate": 0.0002030200140254577, - "loss": 0.0167, + "epoch": 0.33, + "learning_rate": 0.00025017250719968064, + "loss": 0.0209, "step": 128150 }, { - "epoch": 0.65, - "learning_rate": 0.0002030124463324437, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025016861898330916, + "loss": 0.0221, "step": 128160 }, { - "epoch": 0.65, - "learning_rate": 0.00020300487863942967, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.00025016473076693767, + "loss": 0.0179, "step": 128170 }, { - "epoch": 0.65, - "learning_rate": 0.00020299731094641568, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.00025016084255056624, + "loss": 0.0213, "step": 128180 }, { - "epoch": 0.65, - "learning_rate": 0.00020298974325340166, - "loss": 0.013, + "epoch": 0.33, + "learning_rate": 0.0002501569543341948, + "loss": 0.0218, "step": 128190 }, { - "epoch": 0.65, - "learning_rate": 0.00020298217556038764, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002501530661178233, + "loss": 0.0248, "step": 128200 }, { - "epoch": 0.65, - "learning_rate": 0.00020297460786737365, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.00025014917790145184, + "loss": 0.0224, "step": 128210 }, { - "epoch": 0.65, - "learning_rate": 0.00020296704017435963, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025014528968508035, + "loss": 0.0183, "step": 128220 }, { - "epoch": 0.65, - "learning_rate": 0.0002029594724813456, - "loss": 0.0138, + "epoch": 0.33, + "learning_rate": 0.0002501414014687089, + "loss": 0.0208, "step": 128230 }, { - "epoch": 0.65, - "learning_rate": 0.00020295190478833162, - "loss": 0.014, + "epoch": 0.33, + "learning_rate": 0.00025013751325233743, + "loss": 0.0207, "step": 128240 }, { - "epoch": 0.65, - "learning_rate": 0.0002029443370953176, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.000250133625035966, + "loss": 0.0201, "step": 128250 }, { - "epoch": 0.65, - "learning_rate": 0.00020293676940230358, - "loss": 0.0154, + "epoch": 0.33, + "learning_rate": 0.0002501297368195945, + "loss": 0.0189, "step": 128260 }, { - "epoch": 0.65, - "learning_rate": 0.0002029292017092896, - "loss": 0.0186, + "epoch": 0.33, + "learning_rate": 0.0002501258486032231, + "loss": 0.0241, "step": 128270 }, { - "epoch": 0.65, - "learning_rate": 0.00020292163401627557, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002501219603868516, + "loss": 0.0173, "step": 128280 }, { - "epoch": 0.65, - "learning_rate": 0.00020291406632326156, - "loss": 0.0123, + "epoch": 0.33, + "learning_rate": 0.0002501180721704801, + "loss": 0.0243, "step": 128290 }, { - "epoch": 0.65, - "learning_rate": 0.00020290649863024754, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.00025011418395410863, + "loss": 0.0201, "step": 128300 }, { - "epoch": 0.65, - "learning_rate": 0.00020289893093723355, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.0002501102957377372, + "loss": 0.0202, "step": 128310 }, { - "epoch": 0.65, - "learning_rate": 0.00020289136324421953, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.0002501064075213657, + "loss": 0.0185, "step": 128320 }, { - "epoch": 0.65, - "learning_rate": 0.0002028837955512055, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002501025193049943, + "loss": 0.0246, "step": 128330 }, { - "epoch": 0.65, - "learning_rate": 0.00020287622785819152, - "loss": 0.0156, + "epoch": 0.33, + "learning_rate": 0.0002500986310886228, + "loss": 0.0218, "step": 128340 }, { - "epoch": 0.65, - "learning_rate": 0.0002028686601651775, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.0002500947428722513, + "loss": 0.0248, "step": 128350 }, { - "epoch": 0.65, - "learning_rate": 0.00020286109247216348, - "loss": 0.0191, + "epoch": 0.33, + "learning_rate": 0.0002500908546558799, + "loss": 0.0222, "step": 128360 }, { - "epoch": 0.65, - "learning_rate": 0.0002028535247791495, - "loss": 0.0147, + "epoch": 0.33, + "learning_rate": 0.0002500869664395084, + "loss": 0.0159, "step": 128370 }, { - "epoch": 0.65, - "learning_rate": 0.00020284595708613547, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002500830782231369, + "loss": 0.0207, "step": 128380 }, { - "epoch": 0.65, - "learning_rate": 0.00020283838939312145, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002500791900067655, + "loss": 0.0187, "step": 128390 }, { - "epoch": 0.65, - "learning_rate": 0.00020283082170010746, - "loss": 0.0162, + "epoch": 0.33, + "learning_rate": 0.00025007530179039405, + "loss": 0.0243, "step": 128400 }, { - "epoch": 0.65, - "learning_rate": 0.00020282325400709344, - "loss": 0.01, + "epoch": 0.33, + "learning_rate": 0.00025007141357402256, + "loss": 0.0262, "step": 128410 }, { - "epoch": 0.65, - "learning_rate": 0.00020281568631407942, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.0002500675253576511, + "loss": 0.0252, "step": 128420 }, { - "epoch": 0.65, - "learning_rate": 0.00020280811862106543, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.0002500636371412796, + "loss": 0.022, "step": 128430 }, { - "epoch": 0.65, - "learning_rate": 0.0002028005509280514, - "loss": 0.0132, + "epoch": 0.33, + "learning_rate": 0.00025005974892490816, + "loss": 0.0202, "step": 128440 }, { - "epoch": 0.65, - "learning_rate": 0.0002027929832350374, - "loss": 0.0175, + "epoch": 0.33, + "learning_rate": 0.0002500558607085367, + "loss": 0.0201, "step": 128450 }, { - "epoch": 0.65, - "learning_rate": 0.00020278541554202338, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.00025005197249216524, + "loss": 0.024, "step": 128460 }, { - "epoch": 0.65, - "learning_rate": 0.00020277784784900938, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025004808427579376, + "loss": 0.0218, "step": 128470 }, { - "epoch": 0.65, - "learning_rate": 0.00020277028015599537, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002500441960594223, + "loss": 0.0173, "step": 128480 }, { - "epoch": 0.65, - "learning_rate": 0.00020276271246298135, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025004030784305084, + "loss": 0.0176, "step": 128490 }, { - "epoch": 0.65, - "learning_rate": 0.00020275514476996736, - "loss": 0.0153, + "epoch": 0.33, + "learning_rate": 0.00025003641962667935, + "loss": 0.0137, "step": 128500 }, { - "epoch": 0.65, - "learning_rate": 0.00020274757707695334, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.00025003253141030787, + "loss": 0.0233, "step": 128510 }, { - "epoch": 0.65, - "learning_rate": 0.00020274000938393932, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00025002864319393644, + "loss": 0.0206, "step": 128520 }, { - "epoch": 0.65, - "learning_rate": 0.00020273244169092533, - "loss": 0.0214, + "epoch": 0.33, + "learning_rate": 0.00025002475497756495, + "loss": 0.0226, "step": 128530 }, { - "epoch": 0.65, - "learning_rate": 0.0002027248739979113, - "loss": 0.0165, + "epoch": 0.33, + "learning_rate": 0.0002500208667611935, + "loss": 0.0214, "step": 128540 }, { - "epoch": 0.65, - "learning_rate": 0.0002027173063048973, - "loss": 0.0131, + "epoch": 0.33, + "learning_rate": 0.00025001697854482204, + "loss": 0.0179, "step": 128550 }, { - "epoch": 0.65, - "learning_rate": 0.0002027097386118833, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.00025001309032845055, + "loss": 0.0236, "step": 128560 }, { - "epoch": 0.65, - "learning_rate": 0.00020270217091886928, - "loss": 0.0182, + "epoch": 0.33, + "learning_rate": 0.0002500092021120791, + "loss": 0.0265, "step": 128570 }, { - "epoch": 0.65, - "learning_rate": 0.00020269460322585526, - "loss": 0.0145, + "epoch": 0.33, + "learning_rate": 0.00025000531389570763, + "loss": 0.0375, "step": 128580 }, { - "epoch": 0.65, - "learning_rate": 0.00020268703553284127, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002500014256793362, + "loss": 0.0272, "step": 128590 }, { - "epoch": 0.65, - "learning_rate": 0.00020267946783982725, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002499975374629647, + "loss": 0.0224, "step": 128600 }, { - "epoch": 0.65, - "learning_rate": 0.00020267190014681323, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.0002499936492465933, + "loss": 0.1259, "step": 128610 }, { - "epoch": 0.65, - "learning_rate": 0.00020266433245379924, - "loss": 0.0161, + "epoch": 0.33, + "learning_rate": 0.0002499897610302218, + "loss": 0.079, "step": 128620 }, { - "epoch": 0.65, - "learning_rate": 0.00020265676476078522, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002499858728138503, + "loss": 0.0776, "step": 128630 }, { - "epoch": 0.65, - "learning_rate": 0.0002026491970677712, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00024998198459747883, + "loss": 0.0215, "step": 128640 }, { - "epoch": 0.65, - "learning_rate": 0.00020264162937475719, - "loss": 0.0121, + "epoch": 0.33, + "learning_rate": 0.0002499780963811074, + "loss": 0.0355, "step": 128650 }, { - "epoch": 0.65, - "learning_rate": 0.0002026340616817432, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002499742081647359, + "loss": 0.0206, "step": 128660 }, { - "epoch": 0.65, - "learning_rate": 0.00020262649398872918, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.0002499703199483645, + "loss": 0.0219, "step": 128670 }, { - "epoch": 0.65, - "learning_rate": 0.00020261892629571516, - "loss": 0.0126, + "epoch": 0.33, + "learning_rate": 0.000249966431731993, + "loss": 0.0319, "step": 128680 }, { - "epoch": 0.65, - "learning_rate": 0.00020261135860270117, - "loss": 0.0142, + "epoch": 0.33, + "learning_rate": 0.00024996254351562156, + "loss": 0.0222, "step": 128690 }, { - "epoch": 0.65, - "learning_rate": 0.00020260379090968715, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.0002499586552992501, + "loss": 0.0281, "step": 128700 }, { - "epoch": 0.65, - "learning_rate": 0.00020259622321667313, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002499547670828786, + "loss": 0.0226, "step": 128710 }, { - "epoch": 0.65, - "learning_rate": 0.00020258865552365914, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.0002499508788665071, + "loss": 0.0225, "step": 128720 }, { - "epoch": 0.65, - "learning_rate": 0.00020258108783064512, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002499469906501357, + "loss": 0.0233, "step": 128730 }, { - "epoch": 0.65, - "learning_rate": 0.0002025735201376311, - "loss": 0.0125, + "epoch": 0.33, + "learning_rate": 0.00024994310243376425, + "loss": 0.0173, "step": 128740 }, { - "epoch": 0.65, - "learning_rate": 0.0002025659524446171, - "loss": 0.0118, + "epoch": 0.33, + "learning_rate": 0.00024993921421739276, + "loss": 0.0192, "step": 128750 }, { - "epoch": 0.65, - "learning_rate": 0.0002025583847516031, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.0002499353260010213, + "loss": 0.0218, "step": 128760 }, { - "epoch": 0.65, - "learning_rate": 0.00020255081705858907, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002499314377846498, + "loss": 0.0216, "step": 128770 }, { - "epoch": 0.65, - "learning_rate": 0.00020254324936557508, - "loss": 0.0152, + "epoch": 0.33, + "learning_rate": 0.00024992754956827836, + "loss": 0.0174, "step": 128780 }, { - "epoch": 0.65, - "learning_rate": 0.00020253568167256106, - "loss": 0.0172, + "epoch": 0.33, + "learning_rate": 0.00024992366135190687, + "loss": 0.0178, "step": 128790 }, { - "epoch": 0.65, - "learning_rate": 0.00020252811397954704, - "loss": 0.0157, + "epoch": 0.33, + "learning_rate": 0.00024991977313553544, + "loss": 0.0205, "step": 128800 }, { - "epoch": 0.65, - "learning_rate": 0.00020252054628653302, - "loss": 0.0136, + "epoch": 0.33, + "learning_rate": 0.00024991588491916396, + "loss": 0.0251, "step": 128810 }, { - "epoch": 0.65, - "learning_rate": 0.00020251297859351903, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002499119967027925, + "loss": 0.0253, "step": 128820 }, { - "epoch": 0.65, - "learning_rate": 0.00020250541090050501, - "loss": 0.0151, + "epoch": 0.33, + "learning_rate": 0.00024990810848642104, + "loss": 0.0201, "step": 128830 }, { - "epoch": 0.65, - "learning_rate": 0.00020249784320749097, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.00024990422027004955, + "loss": 0.0284, "step": 128840 }, { - "epoch": 0.65, - "learning_rate": 0.00020249027551447695, - "loss": 0.0118, + "epoch": 0.33, + "learning_rate": 0.00024990033205367807, + "loss": 0.0311, "step": 128850 }, { - "epoch": 0.65, - "learning_rate": 0.00020248270782146296, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.00024989644383730664, + "loss": 0.022, "step": 128860 }, { - "epoch": 0.65, - "learning_rate": 0.00020247514012844894, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.00024989255562093515, + "loss": 0.0217, "step": 128870 }, { - "epoch": 0.65, - "learning_rate": 0.00020246757243543492, - "loss": 0.015, + "epoch": 0.33, + "learning_rate": 0.0002498886674045637, + "loss": 0.0201, "step": 128880 }, { - "epoch": 0.65, - "learning_rate": 0.00020246000474242093, - "loss": 0.0144, + "epoch": 0.33, + "learning_rate": 0.00024988477918819223, + "loss": 0.0184, "step": 128890 }, { - "epoch": 0.65, - "learning_rate": 0.0002024524370494069, - "loss": 0.016, + "epoch": 0.33, + "learning_rate": 0.0002498808909718208, + "loss": 0.0221, "step": 128900 }, { - "epoch": 0.65, - "learning_rate": 0.0002024448693563929, - "loss": 0.0163, + "epoch": 0.33, + "learning_rate": 0.0002498770027554493, + "loss": 0.0244, "step": 128910 }, { - "epoch": 0.65, - "learning_rate": 0.0002024373016633789, - "loss": 0.0116, + "epoch": 0.33, + "learning_rate": 0.00024987311453907783, + "loss": 0.021, "step": 128920 }, { - "epoch": 0.65, - "learning_rate": 0.00020242973397036488, - "loss": 0.0106, + "epoch": 0.33, + "learning_rate": 0.00024986922632270635, + "loss": 0.0218, "step": 128930 }, { - "epoch": 0.65, - "learning_rate": 0.00020242216627735086, - "loss": 0.0153, + "epoch": 0.33, + "learning_rate": 0.0002498653381063349, + "loss": 0.0191, "step": 128940 }, { - "epoch": 0.65, - "learning_rate": 0.00020241459858433687, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.0002498614498899635, + "loss": 0.0182, "step": 128950 }, { - "epoch": 0.65, - "learning_rate": 0.00020240703089132285, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.000249857561673592, + "loss": 0.0191, "step": 128960 }, { - "epoch": 0.65, - "learning_rate": 0.00020239946319830884, - "loss": 0.0117, + "epoch": 0.33, + "learning_rate": 0.0002498536734572205, + "loss": 0.0186, "step": 128970 }, { - "epoch": 0.65, - "learning_rate": 0.00020239189550529484, - "loss": 0.0112, + "epoch": 0.33, + "learning_rate": 0.0002498497852408491, + "loss": 0.0176, "step": 128980 }, { - "epoch": 0.65, - "learning_rate": 0.00020238432781228083, - "loss": 0.0128, + "epoch": 0.33, + "learning_rate": 0.0002498458970244776, + "loss": 0.0174, "step": 128990 }, { - "epoch": 0.65, - "learning_rate": 0.0002023767601192668, - "loss": 0.0141, + "epoch": 0.33, + "learning_rate": 0.0002498420088081061, + "loss": 0.0213, "step": 129000 }, { - "epoch": 0.65, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.009670346975326538, - "eval_runtime": 116.6611, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.33, + "eval_cer": 0.8818006609085604, + "eval_loss": 0.014310148544609547, + "eval_runtime": 107.6549, + "eval_samples_per_second": 18.578, + "eval_steps_per_second": 4.644, "step": 129000 }, { - "epoch": 0.65, - "learning_rate": 0.00020236919242625282, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.0002498381205917347, + "loss": 0.0241, "step": 129010 }, { - "epoch": 0.65, - "learning_rate": 0.0002023616247332388, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.0002498342323753632, + "loss": 0.0188, "step": 129020 }, { - "epoch": 0.65, - "learning_rate": 0.00020235405704022478, - "loss": 0.0115, + "epoch": 0.33, + "learning_rate": 0.00024983034415899176, + "loss": 0.0225, "step": 129030 }, { - "epoch": 0.65, - "learning_rate": 0.00020234648934721076, - "loss": 0.0146, + "epoch": 0.33, + "learning_rate": 0.0002498264559426203, + "loss": 0.0198, "step": 129040 }, { - "epoch": 0.65, - "learning_rate": 0.00020233892165419677, - "loss": 0.0119, + "epoch": 0.33, + "learning_rate": 0.0002498225677262488, + "loss": 0.0195, "step": 129050 }, { - "epoch": 0.65, - "learning_rate": 0.00020233135396118275, - "loss": 0.0129, + "epoch": 0.33, + "learning_rate": 0.0002498186795098773, + "loss": 0.0177, "step": 129060 }, { - "epoch": 0.65, - "learning_rate": 0.00020232378626816873, - "loss": 0.0137, + "epoch": 0.33, + "learning_rate": 0.0002498147912935059, + "loss": 0.0186, "step": 129070 }, { - "epoch": 0.65, - "learning_rate": 0.00020231621857515474, - "loss": 0.0115, + "epoch": 0.33, + "learning_rate": 0.0002498109030771344, + "loss": 0.0202, "step": 129080 }, { - "epoch": 0.65, - "learning_rate": 0.00020230865088214072, - "loss": 0.0122, + "epoch": 0.33, + "learning_rate": 0.00024980701486076296, + "loss": 0.0189, "step": 129090 }, { - "epoch": 0.65, - "learning_rate": 0.0002023010831891267, - "loss": 0.0133, + "epoch": 0.33, + "learning_rate": 0.0002498031266443915, + "loss": 0.0154, "step": 129100 }, { - "epoch": 0.65, - "learning_rate": 0.0002022935154961127, - "loss": 0.0194, + "epoch": 0.33, + "learning_rate": 0.00024979923842802004, + "loss": 0.0221, "step": 129110 }, { - "epoch": 0.65, - "learning_rate": 0.0002022859478030987, - "loss": 0.0124, + "epoch": 0.33, + "learning_rate": 0.00024979535021164856, + "loss": 0.021, "step": 129120 }, { - "epoch": 0.65, - "learning_rate": 0.00020227838011008467, - "loss": 0.0149, + "epoch": 0.33, + "learning_rate": 0.00024979146199527707, + "loss": 0.0163, "step": 129130 }, { - "epoch": 0.65, - "learning_rate": 0.00020227081241707068, - "loss": 0.0134, + "epoch": 0.33, + "learning_rate": 0.00024978757377890564, + "loss": 0.0226, "step": 129140 }, { - "epoch": 0.65, - "learning_rate": 0.00020226324472405666, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00024978368556253415, + "loss": 0.0169, "step": 129150 }, { - "epoch": 0.65, - "learning_rate": 0.00020225567703104265, - "loss": 0.0111, + "epoch": 0.33, + "learning_rate": 0.0002497797973461627, + "loss": 0.0202, "step": 129160 }, { - "epoch": 0.65, - "learning_rate": 0.00020224810933802865, - "loss": 0.0187, + "epoch": 0.33, + "learning_rate": 0.00024977590912979124, + "loss": 0.0197, "step": 129170 }, { - "epoch": 0.65, - "learning_rate": 0.00020224054164501464, - "loss": 0.0127, + "epoch": 0.33, + "learning_rate": 0.00024977202091341975, + "loss": 0.0182, "step": 129180 }, { - "epoch": 0.65, - "learning_rate": 0.00020223297395200062, - "loss": 0.0135, + "epoch": 0.33, + "learning_rate": 0.0002497681326970483, + "loss": 0.0222, "step": 129190 }, { - "epoch": 0.65, - "learning_rate": 0.0002022254062589866, - "loss": 0.0155, + "epoch": 0.33, + "learning_rate": 0.00024976424448067684, + "loss": 0.019, "step": 129200 }, { - "epoch": 0.65, - "learning_rate": 0.0002022178385659726, - "loss": 0.0159, + "epoch": 0.33, + "learning_rate": 0.00024976035626430535, + "loss": 0.0198, "step": 129210 }, { - "epoch": 0.65, - "learning_rate": 0.0002022102708729586, - "loss": 0.0148, + "epoch": 0.33, + "learning_rate": 0.0002497564680479339, + "loss": 0.0168, "step": 129220 }, { - "epoch": 0.65, - "learning_rate": 0.00020220270317994457, - "loss": 0.0113, + "epoch": 0.33, + "learning_rate": 0.0002497525798315625, + "loss": 0.0194, "step": 129230 }, { - "epoch": 0.65, - "learning_rate": 0.00020219513548693058, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.000249748691615191, + "loss": 0.0175, "step": 129240 }, { - "epoch": 0.65, - "learning_rate": 0.00020218756779391656, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002497448033988195, + "loss": 0.0208, "step": 129250 }, { - "epoch": 0.65, - "learning_rate": 0.00020218000010090254, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.00024974091518244803, + "loss": 0.0208, "step": 129260 }, { - "epoch": 0.65, - "learning_rate": 0.00020217243240788855, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024973702696607655, + "loss": 0.0189, "step": 129270 }, { - "epoch": 0.65, - "learning_rate": 0.00020216486471487453, - "loss": 0.0101, + "epoch": 0.34, + "learning_rate": 0.0002497331387497051, + "loss": 0.0232, "step": 129280 }, { - "epoch": 0.65, - "learning_rate": 0.0002021572970218605, - "loss": 0.0203, + "epoch": 0.34, + "learning_rate": 0.0002497292505333337, + "loss": 0.0241, "step": 129290 }, { - "epoch": 0.65, - "learning_rate": 0.00020214972932884652, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.0002497253623169622, + "loss": 0.0191, "step": 129300 }, { - "epoch": 0.65, - "learning_rate": 0.0002021421616358325, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002497214741005907, + "loss": 0.0222, "step": 129310 }, { - "epoch": 0.65, - "learning_rate": 0.00020213459394281848, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.0002497175858842193, + "loss": 0.0175, "step": 129320 }, { - "epoch": 0.65, - "learning_rate": 0.0002021270262498045, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002497136976678478, + "loss": 0.0217, "step": 129330 }, { - "epoch": 0.65, - "learning_rate": 0.00020211945855679047, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002497098094514763, + "loss": 0.0167, "step": 129340 }, { - "epoch": 0.65, - "learning_rate": 0.00020211189086377646, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002497059212351049, + "loss": 0.0196, "step": 129350 }, { - "epoch": 0.65, - "learning_rate": 0.00020210432317076244, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002497020330187334, + "loss": 0.0204, "step": 129360 }, { - "epoch": 0.65, - "learning_rate": 0.00020209675547774845, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.00024969814480236196, + "loss": 0.0202, "step": 129370 }, { - "epoch": 0.65, - "learning_rate": 0.00020208918778473443, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002496942565859905, + "loss": 0.0174, "step": 129380 }, { - "epoch": 0.65, - "learning_rate": 0.0002020816200917204, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.000249690368369619, + "loss": 0.02, "step": 129390 }, { - "epoch": 0.65, - "learning_rate": 0.00020207405239870642, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024968648015324756, + "loss": 0.021, "step": 129400 }, { - "epoch": 0.65, - "learning_rate": 0.0002020664847056924, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002496825919368761, + "loss": 0.0193, "step": 129410 }, { - "epoch": 0.65, - "learning_rate": 0.00020205891701267838, - "loss": 0.0123, + "epoch": 0.34, + "learning_rate": 0.0002496787037205046, + "loss": 0.0191, "step": 129420 }, { - "epoch": 0.65, - "learning_rate": 0.0002020513493196644, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.00024967481550413316, + "loss": 0.0247, "step": 129430 }, { - "epoch": 0.65, - "learning_rate": 0.00020204378162665037, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002496709272877617, + "loss": 0.0211, "step": 129440 }, { - "epoch": 0.65, - "learning_rate": 0.00020203621393363635, - "loss": 0.0182, - "step": 129450 + "epoch": 0.34, + "learning_rate": 0.00024966703907139024, + "loss": 0.0227, + "step": 129450 }, { - "epoch": 0.65, - "learning_rate": 0.00020202864624062236, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.00024966315085501876, + "loss": 0.0194, "step": 129460 }, { - "epoch": 0.65, - "learning_rate": 0.00020202107854760834, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024965926263864727, + "loss": 0.0244, "step": 129470 }, { - "epoch": 0.65, - "learning_rate": 0.00020201351085459432, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.00024965537442227584, + "loss": 0.0218, "step": 129480 }, { - "epoch": 0.65, - "learning_rate": 0.00020200594316158033, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.00024965148620590435, + "loss": 0.0207, "step": 129490 }, { - "epoch": 0.65, - "learning_rate": 0.0002019983754685663, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.0002496475979895329, + "loss": 0.024, "step": 129500 }, { - "epoch": 0.65, - "learning_rate": 0.0002019908077755523, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024964370977316144, + "loss": 0.0211, "step": 129510 }, { - "epoch": 0.65, - "learning_rate": 0.00020198324008253828, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.00024963982155678995, + "loss": 0.0178, "step": 129520 }, { - "epoch": 0.65, - "learning_rate": 0.00020197567238952428, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002496359333404185, + "loss": 0.0166, "step": 129530 }, { - "epoch": 0.65, - "learning_rate": 0.00020196810469651027, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024963204512404703, + "loss": 0.0151, "step": 129540 }, { - "epoch": 0.65, - "learning_rate": 0.00020196053700349625, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024962815690767555, + "loss": 0.0205, "step": 129550 }, { - "epoch": 0.65, - "learning_rate": 0.00020195296931048226, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002496242686913041, + "loss": 0.0232, "step": 129560 }, { - "epoch": 0.65, - "learning_rate": 0.00020194540161746824, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024962038047493263, + "loss": 0.0232, "step": 129570 }, { - "epoch": 0.65, - "learning_rate": 0.00020193783392445422, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.0002496164922585612, + "loss": 0.0257, "step": 129580 }, { - "epoch": 0.65, - "learning_rate": 0.00020193026623144023, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002496126040421897, + "loss": 0.017, "step": 129590 }, { - "epoch": 0.65, - "learning_rate": 0.0002019226985384262, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024960871582581823, + "loss": 0.0211, "step": 129600 }, { - "epoch": 0.65, - "learning_rate": 0.0002019151308454122, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.0002496048276094468, + "loss": 0.0203, "step": 129610 }, { - "epoch": 0.65, - "learning_rate": 0.0002019075631523982, - "loss": 0.0119, + "epoch": 0.34, + "learning_rate": 0.0002496009393930753, + "loss": 0.02, "step": 129620 }, { - "epoch": 0.65, - "learning_rate": 0.00020189999545938418, - "loss": 0.0114, + "epoch": 0.34, + "learning_rate": 0.0002495970511767039, + "loss": 0.0193, "step": 129630 }, { - "epoch": 0.65, - "learning_rate": 0.00020189242776637016, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.0002495931629603324, + "loss": 0.0181, "step": 129640 }, { - "epoch": 0.65, - "learning_rate": 0.00020188486007335617, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.00024958927474396097, + "loss": 0.0218, "step": 129650 }, { - "epoch": 0.65, - "learning_rate": 0.00020187729238034215, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.0002495853865275895, + "loss": 0.0191, "step": 129660 }, { - "epoch": 0.65, - "learning_rate": 0.00020186972468732813, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.000249581498311218, + "loss": 0.0202, "step": 129670 }, { - "epoch": 0.65, - "learning_rate": 0.00020186215699431414, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002495776100948465, + "loss": 0.016, "step": 129680 }, { - "epoch": 0.65, - "learning_rate": 0.00020185458930130012, - "loss": 0.0105, + "epoch": 0.34, + "learning_rate": 0.0002495737218784751, + "loss": 0.028, "step": 129690 }, { - "epoch": 0.65, - "learning_rate": 0.0002018470216082861, - "loss": 0.0118, + "epoch": 0.34, + "learning_rate": 0.0002495698336621036, + "loss": 0.0181, "step": 129700 }, { - "epoch": 0.65, - "learning_rate": 0.00020183945391527209, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.00024956594544573216, + "loss": 0.0199, "step": 129710 }, { - "epoch": 0.65, - "learning_rate": 0.0002018318862222581, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002495620572293607, + "loss": 0.0192, "step": 129720 }, { - "epoch": 0.65, - "learning_rate": 0.00020182431852924408, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.00024955816901298924, + "loss": 0.0247, "step": 129730 }, { - "epoch": 0.65, - "learning_rate": 0.00020181675083623006, - "loss": 0.0102, + "epoch": 0.34, + "learning_rate": 0.00024955428079661776, + "loss": 0.021, "step": 129740 }, { - "epoch": 0.65, - "learning_rate": 0.00020180918314321607, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.0002495503925802463, + "loss": 0.0299, "step": 129750 }, { - "epoch": 0.65, - "learning_rate": 0.00020180161545020205, - "loss": 0.0114, + "epoch": 0.34, + "learning_rate": 0.0002495465043638748, + "loss": 0.0207, "step": 129760 }, { - "epoch": 0.65, - "learning_rate": 0.00020179404775718803, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024954261614750336, + "loss": 0.0235, "step": 129770 }, { - "epoch": 0.65, - "learning_rate": 0.00020178648006417404, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002495387279311319, + "loss": 0.0247, "step": 129780 }, { - "epoch": 0.65, - "learning_rate": 0.00020177891237116002, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024953483971476044, + "loss": 0.0201, "step": 129790 }, { - "epoch": 0.65, - "learning_rate": 0.000201771344678146, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.00024953095149838895, + "loss": 0.022, "step": 129800 }, { - "epoch": 0.65, - "learning_rate": 0.000201763776985132, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.00024952706328201747, + "loss": 0.0166, "step": 129810 }, { - "epoch": 0.65, - "learning_rate": 0.000201756209292118, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024952317506564604, + "loss": 0.0178, "step": 129820 }, { - "epoch": 0.66, - "learning_rate": 0.00020174864159910397, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.00024951928684927455, + "loss": 0.0193, "step": 129830 }, { - "epoch": 0.66, - "learning_rate": 0.00020174107390608998, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.0002495153986329031, + "loss": 0.0194, "step": 129840 }, { - "epoch": 0.66, - "learning_rate": 0.00020173350621307596, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024951151041653164, + "loss": 0.0228, "step": 129850 }, { - "epoch": 0.66, - "learning_rate": 0.00020172593852006194, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002495076222001602, + "loss": 0.0194, "step": 129860 }, { - "epoch": 0.66, - "learning_rate": 0.00020171837082704792, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002495037339837887, + "loss": 0.02, "step": 129870 }, { - "epoch": 0.66, - "learning_rate": 0.00020171080313403393, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024949984576741723, + "loss": 0.0243, "step": 129880 }, { - "epoch": 0.66, - "learning_rate": 0.00020170323544101991, - "loss": 0.0127, + "epoch": 0.34, + "learning_rate": 0.00024949595755104575, + "loss": 0.0251, "step": 129890 }, { - "epoch": 0.66, - "learning_rate": 0.0002016956677480059, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.0002494920693346743, + "loss": 0.0214, "step": 129900 }, { - "epoch": 0.66, - "learning_rate": 0.0002016881000549919, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024948818111830283, + "loss": 0.0245, "step": 129910 }, { - "epoch": 0.66, - "learning_rate": 0.00020168053236197789, - "loss": 0.0127, + "epoch": 0.34, + "learning_rate": 0.0002494842929019314, + "loss": 0.0192, "step": 129920 }, { - "epoch": 0.66, - "learning_rate": 0.00020167296466896387, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.0002494804046855599, + "loss": 0.0215, "step": 129930 }, { - "epoch": 0.66, - "learning_rate": 0.00020166539697594988, - "loss": 0.0163, + "epoch": 0.34, + "learning_rate": 0.0002494765164691885, + "loss": 0.0212, "step": 129940 }, { - "epoch": 0.66, - "learning_rate": 0.00020165782928293586, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.000249472628252817, + "loss": 0.0188, "step": 129950 }, { - "epoch": 0.66, - "learning_rate": 0.00020165026158992184, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.0002494687400364455, + "loss": 0.0179, "step": 129960 }, { - "epoch": 0.66, - "learning_rate": 0.00020164269389690785, - "loss": 0.0164, + "epoch": 0.34, + "learning_rate": 0.000249464851820074, + "loss": 0.0188, "step": 129970 }, { - "epoch": 0.66, - "learning_rate": 0.00020163512620389383, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.0002494609636037026, + "loss": 0.0214, "step": 129980 }, { - "epoch": 0.66, - "learning_rate": 0.0002016275585108798, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024945707538733116, + "loss": 0.0201, "step": 129990 }, { - "epoch": 0.66, - "learning_rate": 0.00020161999081786582, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.0002494531871709597, + "loss": 0.0232, "step": 130000 }, { - "epoch": 0.66, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.009702015668153763, - "eval_runtime": 116.6027, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.34, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.014468919485807419, + "eval_runtime": 107.45, + "eval_samples_per_second": 18.613, + "eval_steps_per_second": 4.653, "step": 130000 }, { - "epoch": 0.66, - "learning_rate": 0.0002016124231248518, - "loss": 0.0188, + "epoch": 0.34, + "learning_rate": 0.0002494492989545882, + "loss": 0.0175, "step": 130010 }, { - "epoch": 0.66, - "learning_rate": 0.00020160485543183778, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.0002494454107382167, + "loss": 0.0188, "step": 130020 }, { - "epoch": 0.66, - "learning_rate": 0.00020159728773882376, - "loss": 0.0123, + "epoch": 0.34, + "learning_rate": 0.0002494415225218453, + "loss": 0.0199, "step": 130030 }, { - "epoch": 0.66, - "learning_rate": 0.00020158972004580977, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.0002494376343054738, + "loss": 0.0191, "step": 130040 }, { - "epoch": 0.66, - "learning_rate": 0.00020158215235279575, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024943374608910236, + "loss": 0.0191, "step": 130050 }, { - "epoch": 0.66, - "learning_rate": 0.00020157458465978173, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.0002494298578727309, + "loss": 0.0204, "step": 130060 }, { - "epoch": 0.66, - "learning_rate": 0.00020156701696676774, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024942596965635944, + "loss": 0.0189, "step": 130070 }, { - "epoch": 0.66, - "learning_rate": 0.00020155944927375372, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024942208143998796, + "loss": 0.0179, "step": 130080 }, { - "epoch": 0.66, - "learning_rate": 0.00020155188158073968, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.00024941819322361647, + "loss": 0.0202, "step": 130090 }, { - "epoch": 0.66, - "learning_rate": 0.00020154431388772566, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.000249414305007245, + "loss": 0.0166, "step": 130100 }, { - "epoch": 0.66, - "learning_rate": 0.00020153674619471167, - "loss": 0.0168, + "epoch": 0.34, + "learning_rate": 0.00024941041679087356, + "loss": 0.0184, "step": 130110 }, { - "epoch": 0.66, - "learning_rate": 0.00020152917850169765, - "loss": 0.0158, + "epoch": 0.34, + "learning_rate": 0.00024940652857450207, + "loss": 0.0193, "step": 130120 }, { - "epoch": 0.66, - "learning_rate": 0.00020152161080868363, - "loss": 0.0163, + "epoch": 0.34, + "learning_rate": 0.00024940264035813064, + "loss": 0.0198, "step": 130130 }, { - "epoch": 0.66, - "learning_rate": 0.00020151404311566964, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.00024939875214175915, + "loss": 0.0192, "step": 130140 }, { - "epoch": 0.66, - "learning_rate": 0.00020150647542265562, - "loss": 0.0121, + "epoch": 0.34, + "learning_rate": 0.0002493948639253877, + "loss": 0.0172, "step": 130150 }, { - "epoch": 0.66, - "learning_rate": 0.0002014989077296416, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.00024939097570901624, + "loss": 0.0215, "step": 130160 }, { - "epoch": 0.66, - "learning_rate": 0.0002014913400366276, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.00024938708749264475, + "loss": 0.0212, "step": 130170 }, { - "epoch": 0.66, - "learning_rate": 0.0002014837723436136, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.0002493831992762733, + "loss": 0.0207, "step": 130180 }, { - "epoch": 0.66, - "learning_rate": 0.00020147620465059957, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.00024937931105990183, + "loss": 0.018, "step": 130190 }, { - "epoch": 0.66, - "learning_rate": 0.00020146863695758558, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002493754228435304, + "loss": 0.0207, "step": 130200 }, { - "epoch": 0.66, - "learning_rate": 0.00020146106926457156, - "loss": 0.0201, + "epoch": 0.34, + "learning_rate": 0.0002493715346271589, + "loss": 0.0171, "step": 130210 }, { - "epoch": 0.66, - "learning_rate": 0.00020145350157155755, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024936764641078743, + "loss": 0.0253, "step": 130220 }, { - "epoch": 0.66, - "learning_rate": 0.00020144593387854355, - "loss": 0.0121, + "epoch": 0.34, + "learning_rate": 0.000249363758194416, + "loss": 0.0208, "step": 130230 }, { - "epoch": 0.66, - "learning_rate": 0.00020143836618552954, - "loss": 0.0109, + "epoch": 0.34, + "learning_rate": 0.0002493598699780445, + "loss": 0.0219, "step": 130240 }, { - "epoch": 0.66, - "learning_rate": 0.00020143079849251552, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024935598176167303, + "loss": 0.0166, "step": 130250 }, { - "epoch": 0.66, - "learning_rate": 0.0002014232307995015, - "loss": 0.0118, + "epoch": 0.34, + "learning_rate": 0.0002493520935453016, + "loss": 0.0195, "step": 130260 }, { - "epoch": 0.66, - "learning_rate": 0.0002014156631064875, - "loss": 0.0164, + "epoch": 0.34, + "learning_rate": 0.0002493482053289301, + "loss": 0.0231, "step": 130270 }, { - "epoch": 0.66, - "learning_rate": 0.0002014080954134735, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.0002493443171125587, + "loss": 0.0214, "step": 130280 }, { - "epoch": 0.66, - "learning_rate": 0.00020140052772045947, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002493404288961872, + "loss": 0.0206, "step": 130290 }, { - "epoch": 0.66, - "learning_rate": 0.00020139296002744548, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002493365406798157, + "loss": 0.0252, "step": 130300 }, { - "epoch": 0.66, - "learning_rate": 0.00020138539233443146, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002493326524634442, + "loss": 0.015, "step": 130310 }, { - "epoch": 0.66, - "learning_rate": 0.00020137782464141744, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.0002493287642470728, + "loss": 0.0154, "step": 130320 }, { - "epoch": 0.66, - "learning_rate": 0.00020137025694840345, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024932487603070136, + "loss": 0.0199, "step": 130330 }, { - "epoch": 0.66, - "learning_rate": 0.00020136268925538943, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.0002493209878143299, + "loss": 0.0218, "step": 130340 }, { - "epoch": 0.66, - "learning_rate": 0.0002013551215623754, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.0002493170995979584, + "loss": 0.0351, "step": 130350 }, { - "epoch": 0.66, - "learning_rate": 0.00020134755386936142, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024931321138158696, + "loss": 0.0207, "step": 130360 }, { - "epoch": 0.66, - "learning_rate": 0.0002013399861763474, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.0002493093231652155, + "loss": 0.0218, "step": 130370 }, { - "epoch": 0.66, - "learning_rate": 0.00020133241848333338, - "loss": 0.0123, + "epoch": 0.34, + "learning_rate": 0.000249305434948844, + "loss": 0.1019, "step": 130380 }, { - "epoch": 0.66, - "learning_rate": 0.0002013248507903194, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.00024930154673247256, + "loss": 0.0271, "step": 130390 }, { - "epoch": 0.66, - "learning_rate": 0.00020131728309730537, - "loss": 0.018, + "epoch": 0.34, + "learning_rate": 0.0002492976585161011, + "loss": 0.0184, "step": 130400 }, { - "epoch": 0.66, - "learning_rate": 0.00020130971540429136, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.00024929377029972964, + "loss": 0.021, "step": 130410 }, { - "epoch": 0.66, - "learning_rate": 0.00020130214771127734, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024928988208335816, + "loss": 0.0239, "step": 130420 }, { - "epoch": 0.66, - "learning_rate": 0.00020129458001826335, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024928599386698667, + "loss": 0.0193, "step": 130430 }, { - "epoch": 0.66, - "learning_rate": 0.00020128701232524933, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.00024928210565061524, + "loss": 0.0252, "step": 130440 }, { - "epoch": 0.66, - "learning_rate": 0.0002012794446322353, - "loss": 0.0171, + "epoch": 0.34, + "learning_rate": 0.00024927821743424375, + "loss": 0.0154, "step": 130450 }, { - "epoch": 0.66, - "learning_rate": 0.00020127187693922132, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024927432921787227, + "loss": 0.0199, "step": 130460 }, { - "epoch": 0.66, - "learning_rate": 0.0002012643092462073, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.00024927044100150084, + "loss": 0.0221, "step": 130470 }, { - "epoch": 0.66, - "learning_rate": 0.00020125674155319328, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002492665527851294, + "loss": 0.0141, "step": 130480 }, { - "epoch": 0.66, - "learning_rate": 0.0002012491738601793, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.0002492626645687579, + "loss": 0.0172, "step": 130490 }, { - "epoch": 0.66, - "learning_rate": 0.00020124160616716527, - "loss": 0.0121, + "epoch": 0.34, + "learning_rate": 0.00024925877635238644, + "loss": 0.0235, "step": 130500 }, { - "epoch": 0.66, - "learning_rate": 0.00020123403847415125, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.00024925488813601495, + "loss": 0.0228, "step": 130510 }, { - "epoch": 0.66, - "learning_rate": 0.00020122647078113726, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024925099991964346, + "loss": 0.0239, "step": 130520 }, { - "epoch": 0.66, - "learning_rate": 0.00020121890308812324, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.00024924711170327203, + "loss": 0.0213, "step": 130530 }, { - "epoch": 0.66, - "learning_rate": 0.00020121133539510922, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.0002492432234869006, + "loss": 0.0235, "step": 130540 }, { - "epoch": 0.66, - "learning_rate": 0.00020120376770209523, - "loss": 0.0113, + "epoch": 0.34, + "learning_rate": 0.0002492393352705291, + "loss": 0.0214, "step": 130550 }, { - "epoch": 0.66, - "learning_rate": 0.0002011962000090812, - "loss": 0.0197, + "epoch": 0.34, + "learning_rate": 0.00024923544705415763, + "loss": 0.0186, "step": 130560 }, { - "epoch": 0.66, - "learning_rate": 0.0002011886323160672, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002492315588377862, + "loss": 0.018, "step": 130570 }, { - "epoch": 0.66, - "learning_rate": 0.0002011810646230532, - "loss": 0.0151, + "epoch": 0.34, + "learning_rate": 0.0002492276706214147, + "loss": 0.0197, "step": 130580 }, { - "epoch": 0.66, - "learning_rate": 0.00020117349693003918, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.00024922378240504323, + "loss": 0.0252, "step": 130590 }, { - "epoch": 0.66, - "learning_rate": 0.00020116592923702517, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002492198941886718, + "loss": 0.0204, "step": 130600 }, { - "epoch": 0.66, - "learning_rate": 0.00020115836154401115, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002492160059723003, + "loss": 0.0194, "step": 130610 }, { - "epoch": 0.66, - "learning_rate": 0.00020115079385099716, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.0002492121177559289, + "loss": 0.0211, "step": 130620 }, { - "epoch": 0.66, - "learning_rate": 0.00020114322615798314, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002492082295395574, + "loss": 0.0193, "step": 130630 }, { - "epoch": 0.66, - "learning_rate": 0.00020113565846496912, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.0002492043413231859, + "loss": 0.0243, "step": 130640 }, { - "epoch": 0.66, - "learning_rate": 0.00020112809077195513, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002492004531068145, + "loss": 0.0162, "step": 130650 }, { - "epoch": 0.66, - "learning_rate": 0.0002011205230789411, - "loss": 0.0109, + "epoch": 0.34, + "learning_rate": 0.000249196564890443, + "loss": 0.0184, "step": 130660 }, { - "epoch": 0.66, - "learning_rate": 0.0002011129553859271, - "loss": 0.016, + "epoch": 0.34, + "learning_rate": 0.0002491926766740715, + "loss": 0.0253, "step": 130670 }, { - "epoch": 0.66, - "learning_rate": 0.0002011053876929131, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.0002491887884577001, + "loss": 0.0179, "step": 130680 }, { - "epoch": 0.66, - "learning_rate": 0.00020109781999989908, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.00024918490024132864, + "loss": 0.0198, "step": 130690 }, { - "epoch": 0.66, - "learning_rate": 0.00020109025230688506, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.00024918101202495716, + "loss": 0.0197, "step": 130700 }, { - "epoch": 0.66, - "learning_rate": 0.00020108268461387107, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002491771238085857, + "loss": 0.0204, "step": 130710 }, { - "epoch": 0.66, - "learning_rate": 0.00020107511692085705, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.0002491732355922142, + "loss": 0.0152, "step": 130720 }, { - "epoch": 0.66, - "learning_rate": 0.00020106754922784303, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.00024916934737584276, + "loss": 0.0218, "step": 130730 }, { - "epoch": 0.66, - "learning_rate": 0.00020105998153482904, - "loss": 0.0123, + "epoch": 0.34, + "learning_rate": 0.00024916545915947127, + "loss": 0.021, "step": 130740 }, { - "epoch": 0.66, - "learning_rate": 0.00020105241384181502, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.00024916157094309984, + "loss": 0.0208, "step": 130750 }, { - "epoch": 0.66, - "learning_rate": 0.000201044846148801, - "loss": 0.0175, + "epoch": 0.34, + "learning_rate": 0.00024915768272672836, + "loss": 0.0204, "step": 130760 }, { - "epoch": 0.66, - "learning_rate": 0.00020103727845578699, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024915379451035687, + "loss": 0.0194, "step": 130770 }, { - "epoch": 0.66, - "learning_rate": 0.000201029710762773, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.00024914990629398544, + "loss": 0.0173, "step": 130780 }, { - "epoch": 0.66, - "learning_rate": 0.00020102214306975898, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.00024914601807761395, + "loss": 0.019, "step": 130790 }, { - "epoch": 0.66, - "learning_rate": 0.00020101457537674496, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.00024914212986124247, + "loss": 0.0222, "step": 130800 }, { - "epoch": 0.66, - "learning_rate": 0.00020100700768373097, - "loss": 0.0121, + "epoch": 0.34, + "learning_rate": 0.00024913824164487104, + "loss": 0.0227, "step": 130810 }, { - "epoch": 0.66, - "learning_rate": 0.00020099943999071695, - "loss": 0.0189, + "epoch": 0.34, + "learning_rate": 0.0002491343534284996, + "loss": 0.0239, "step": 130820 }, { - "epoch": 0.66, - "learning_rate": 0.00020099187229770293, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002491304652121281, + "loss": 0.0196, "step": 130830 }, { - "epoch": 0.66, - "learning_rate": 0.00020098430460468894, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024912657699575663, + "loss": 0.0236, "step": 130840 }, { - "epoch": 0.66, - "learning_rate": 0.00020097673691167492, - "loss": 0.0127, + "epoch": 0.34, + "learning_rate": 0.00024912268877938515, + "loss": 0.0241, "step": 130850 }, { - "epoch": 0.66, - "learning_rate": 0.0002009691692186609, - "loss": 0.0109, + "epoch": 0.34, + "learning_rate": 0.0002491188005630137, + "loss": 0.0294, "step": 130860 }, { - "epoch": 0.66, - "learning_rate": 0.0002009616015256469, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.00024911491234664223, + "loss": 0.0326, "step": 130870 }, { - "epoch": 0.66, - "learning_rate": 0.0002009540338326329, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002491110241302708, + "loss": 0.0183, "step": 130880 }, { - "epoch": 0.66, - "learning_rate": 0.00020094646613961887, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.0002491071359138993, + "loss": 0.0181, "step": 130890 }, { - "epoch": 0.66, - "learning_rate": 0.00020093889844660488, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.0002491032476975279, + "loss": 0.0191, "step": 130900 }, { - "epoch": 0.66, - "learning_rate": 0.00020093133075359086, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.0002490993594811564, + "loss": 0.0243, "step": 130910 }, { - "epoch": 0.66, - "learning_rate": 0.00020092376306057684, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.0002490954712647849, + "loss": 0.0197, "step": 130920 }, { - "epoch": 0.66, - "learning_rate": 0.00020091619536756282, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.00024909158304841343, + "loss": 0.0186, "step": 130930 }, { - "epoch": 0.66, - "learning_rate": 0.00020090862767454883, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.000249087694832042, + "loss": 0.02, "step": 130940 }, { - "epoch": 0.66, - "learning_rate": 0.00020090105998153481, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002490838066156705, + "loss": 0.0225, "step": 130950 }, { - "epoch": 0.66, - "learning_rate": 0.0002008934922885208, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002490799183992991, + "loss": 0.0232, "step": 130960 }, { - "epoch": 0.66, - "learning_rate": 0.0002008859245955068, - "loss": 0.0184, + "epoch": 0.34, + "learning_rate": 0.0002490760301829276, + "loss": 0.0251, "step": 130970 }, { - "epoch": 0.66, - "learning_rate": 0.00020087835690249279, - "loss": 0.0131, + "epoch": 0.34, + "learning_rate": 0.00024907214196655616, + "loss": 0.0156, "step": 130980 }, { - "epoch": 0.66, - "learning_rate": 0.00020087078920947877, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.0002490682537501847, + "loss": 0.023, "step": 130990 }, { - "epoch": 0.66, - "learning_rate": 0.00020086322151646478, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.0002490643655338132, + "loss": 0.0232, "step": 131000 }, { - "epoch": 0.66, - "eval_cer": 0.9145090717481783, - "eval_loss": 0.009523593820631504, - "eval_runtime": 116.9784, - "eval_samples_per_second": 17.097, - "eval_steps_per_second": 4.274, + "epoch": 0.34, + "eval_cer": 0.8818034601824287, + "eval_loss": 0.014057641848921776, + "eval_runtime": 107.6812, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, "step": 131000 }, { - "epoch": 0.66, - "learning_rate": 0.00020085565382345076, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002490604773174417, + "loss": 0.0197, "step": 131010 }, { - "epoch": 0.66, - "learning_rate": 0.00020084808613043674, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.0002490565891010703, + "loss": 0.0217, "step": 131020 }, { - "epoch": 0.66, - "learning_rate": 0.00020084051843742275, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.00024905270088469884, + "loss": 0.023, "step": 131030 }, { - "epoch": 0.66, - "learning_rate": 0.00020083295074440873, - "loss": 0.0114, + "epoch": 0.34, + "learning_rate": 0.00024904881266832736, + "loss": 0.0172, "step": 131040 }, { - "epoch": 0.66, - "learning_rate": 0.0002008253830513947, - "loss": 0.0119, + "epoch": 0.34, + "learning_rate": 0.00024904492445195587, + "loss": 0.0207, "step": 131050 }, { - "epoch": 0.66, - "learning_rate": 0.00020081781535838072, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.0002490410362355844, + "loss": 0.0194, "step": 131060 }, { - "epoch": 0.66, - "learning_rate": 0.0002008102476653667, - "loss": 0.0111, + "epoch": 0.34, + "learning_rate": 0.00024903714801921296, + "loss": 0.022, "step": 131070 }, { - "epoch": 0.66, - "learning_rate": 0.00020080267997235268, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.00024903325980284147, + "loss": 0.0248, "step": 131080 }, { - "epoch": 0.66, - "learning_rate": 0.0002007951122793387, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024902937158647004, + "loss": 0.0176, "step": 131090 }, { - "epoch": 0.66, - "learning_rate": 0.00020078754458632467, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024902548337009855, + "loss": 0.0179, "step": 131100 }, { - "epoch": 0.66, - "learning_rate": 0.00020077997689331065, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002490215951537271, + "loss": 0.0191, "step": 131110 }, { - "epoch": 0.66, - "learning_rate": 0.00020077240920029663, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024901770693735564, + "loss": 0.0238, "step": 131120 }, { - "epoch": 0.66, - "learning_rate": 0.00020076484150728264, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024901381872098415, + "loss": 0.0221, "step": 131130 }, { - "epoch": 0.66, - "learning_rate": 0.00020075727381426862, - "loss": 0.0147, + "epoch": 0.34, + "learning_rate": 0.00024900993050461267, + "loss": 0.0194, "step": 131140 }, { - "epoch": 0.66, - "learning_rate": 0.0002007497061212546, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024900604228824124, + "loss": 0.0202, "step": 131150 }, { - "epoch": 0.66, - "learning_rate": 0.00020074213842824061, - "loss": 0.0187, + "epoch": 0.34, + "learning_rate": 0.00024900215407186975, + "loss": 0.0243, "step": 131160 }, { - "epoch": 0.66, - "learning_rate": 0.0002007345707352266, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002489982658554983, + "loss": 0.0246, "step": 131170 }, { - "epoch": 0.66, - "learning_rate": 0.00020072700304221258, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.00024899437763912683, + "loss": 0.0236, "step": 131180 }, { - "epoch": 0.66, - "learning_rate": 0.00020071943534919859, - "loss": 0.0176, + "epoch": 0.34, + "learning_rate": 0.0002489904894227554, + "loss": 0.0231, "step": 131190 }, { - "epoch": 0.66, - "learning_rate": 0.00020071186765618457, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002489866012063839, + "loss": 0.0265, "step": 131200 }, { - "epoch": 0.66, - "learning_rate": 0.00020070429996317055, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.00024898271299001243, + "loss": 0.0243, "step": 131210 }, { - "epoch": 0.66, - "learning_rate": 0.00020069673227015656, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.000248978824773641, + "loss": 0.0198, "step": 131220 }, { - "epoch": 0.66, - "learning_rate": 0.00020068916457714254, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002489749365572695, + "loss": 0.02, "step": 131230 }, { - "epoch": 0.66, - "learning_rate": 0.00020068159688412852, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.0002489710483408981, + "loss": 0.0212, "step": 131240 }, { - "epoch": 0.66, - "learning_rate": 0.00020067402919111453, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002489671601245266, + "loss": 0.0206, "step": 131250 }, { - "epoch": 0.66, - "learning_rate": 0.0002006664614981005, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002489632719081551, + "loss": 0.0242, "step": 131260 }, { - "epoch": 0.66, - "learning_rate": 0.0002006588938050865, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.0002489593836917836, + "loss": 0.0182, "step": 131270 }, { - "epoch": 0.66, - "learning_rate": 0.00020065132611207247, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002489554954754122, + "loss": 0.021, "step": 131280 }, { - "epoch": 0.66, - "learning_rate": 0.00020064375841905848, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002489516072590407, + "loss": 0.0202, "step": 131290 }, { - "epoch": 0.66, - "learning_rate": 0.00020063619072604446, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002489477190426693, + "loss": 0.0171, "step": 131300 }, { - "epoch": 0.66, - "learning_rate": 0.00020062862303303044, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.0002489438308262978, + "loss": 0.0244, "step": 131310 }, { - "epoch": 0.66, - "learning_rate": 0.00020062105534001645, - "loss": 0.0113, + "epoch": 0.34, + "learning_rate": 0.00024893994260992636, + "loss": 0.0236, "step": 131320 }, { - "epoch": 0.66, - "learning_rate": 0.00020061348764700243, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002489360543935549, + "loss": 0.0174, "step": 131330 }, { - "epoch": 0.66, - "learning_rate": 0.00020060591995398842, - "loss": 0.0164, + "epoch": 0.34, + "learning_rate": 0.0002489321661771834, + "loss": 0.021, "step": 131340 }, { - "epoch": 0.66, - "learning_rate": 0.00020059835226097437, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002489282779608119, + "loss": 0.0309, "step": 131350 }, { - "epoch": 0.66, - "learning_rate": 0.00020059078456796038, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002489243897444405, + "loss": 0.0274, "step": 131360 }, { - "epoch": 0.66, - "learning_rate": 0.00020058321687494636, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.00024892050152806904, + "loss": 0.0248, "step": 131370 }, { - "epoch": 0.66, - "learning_rate": 0.00020057564918193234, - "loss": 0.0184, + "epoch": 0.34, + "learning_rate": 0.00024891661331169756, + "loss": 0.0181, "step": 131380 }, { - "epoch": 0.66, - "learning_rate": 0.00020056808148891835, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.00024891272509532607, + "loss": 0.0198, "step": 131390 }, { - "epoch": 0.66, - "learning_rate": 0.00020056051379590433, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.00024890883687895464, + "loss": 0.018, "step": 131400 }, { - "epoch": 0.66, - "learning_rate": 0.0002005529461028903, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.00024890494866258316, + "loss": 0.0204, "step": 131410 }, { - "epoch": 0.66, - "learning_rate": 0.00020054537840987632, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024890106044621167, + "loss": 0.0238, "step": 131420 }, { - "epoch": 0.66, - "learning_rate": 0.0002005378107168623, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024889717222984024, + "loss": 0.0193, "step": 131430 }, { - "epoch": 0.66, - "learning_rate": 0.00020053024302384828, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.00024889328401346875, + "loss": 0.0192, "step": 131440 }, { - "epoch": 0.66, - "learning_rate": 0.0002005226753308343, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.0002488893957970973, + "loss": 0.0235, "step": 131450 }, { - "epoch": 0.66, - "learning_rate": 0.00020051510763782027, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024888550758072584, + "loss": 0.0193, "step": 131460 }, { - "epoch": 0.66, - "learning_rate": 0.00020050753994480626, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024888161936435435, + "loss": 0.0233, "step": 131470 }, { - "epoch": 0.66, - "learning_rate": 0.00020049997225179226, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002488777311479829, + "loss": 0.0183, "step": 131480 }, { - "epoch": 0.66, - "learning_rate": 0.00020049240455877825, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.00024887384293161143, + "loss": 0.0217, "step": 131490 }, { - "epoch": 0.66, - "learning_rate": 0.00020048483686576423, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.00024886995471523995, + "loss": 0.0279, "step": 131500 }, { - "epoch": 0.66, - "learning_rate": 0.0002004772691727502, - "loss": 0.0174, + "epoch": 0.34, + "learning_rate": 0.0002488660664988685, + "loss": 0.0225, "step": 131510 }, { - "epoch": 0.66, - "learning_rate": 0.00020046970147973622, - "loss": 0.0156, + "epoch": 0.34, + "learning_rate": 0.00024886217828249703, + "loss": 0.0184, "step": 131520 }, { - "epoch": 0.66, - "learning_rate": 0.0002004621337867222, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002488582900661256, + "loss": 0.022, "step": 131530 }, { - "epoch": 0.66, - "learning_rate": 0.00020045456609370818, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002488544018497541, + "loss": 0.0161, "step": 131540 }, { - "epoch": 0.66, - "learning_rate": 0.0002004469984006942, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.00024885051363338263, + "loss": 0.0215, "step": 131550 }, { - "epoch": 0.66, - "learning_rate": 0.00020043943070768017, - "loss": 0.0114, + "epoch": 0.34, + "learning_rate": 0.00024884662541701114, + "loss": 0.0188, "step": 131560 }, { - "epoch": 0.66, - "learning_rate": 0.00020043186301466615, - "loss": 0.01, + "epoch": 0.34, + "learning_rate": 0.0002488427372006397, + "loss": 0.0204, "step": 131570 }, { - "epoch": 0.66, - "learning_rate": 0.00020042429532165216, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.0002488388489842683, + "loss": 0.0186, "step": 131580 }, { - "epoch": 0.66, - "learning_rate": 0.00020041672762863814, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.0002488349607678968, + "loss": 0.0233, "step": 131590 }, { - "epoch": 0.66, - "learning_rate": 0.00020040915993562412, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.0002488310725515253, + "loss": 0.0213, "step": 131600 }, { - "epoch": 0.66, - "learning_rate": 0.00020040159224261013, - "loss": 0.0111, + "epoch": 0.34, + "learning_rate": 0.0002488271843351539, + "loss": 0.0195, "step": 131610 }, { - "epoch": 0.66, - "learning_rate": 0.0002003940245495961, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.0002488232961187824, + "loss": 0.0191, "step": 131620 }, { - "epoch": 0.66, - "learning_rate": 0.0002003864568565821, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002488194079024109, + "loss": 0.021, "step": 131630 }, { - "epoch": 0.66, - "learning_rate": 0.0002003788891635681, - "loss": 0.0105, + "epoch": 0.34, + "learning_rate": 0.0002488155196860395, + "loss": 0.0206, "step": 131640 }, { - "epoch": 0.66, - "learning_rate": 0.00020037132147055408, - "loss": 0.0123, + "epoch": 0.34, + "learning_rate": 0.000248811631469668, + "loss": 0.0297, "step": 131650 }, { - "epoch": 0.66, - "learning_rate": 0.00020036375377754007, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024880774325329656, + "loss": 0.0209, "step": 131660 }, { - "epoch": 0.66, - "learning_rate": 0.00020035618608452605, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002488038550369251, + "loss": 0.0245, "step": 131670 }, { - "epoch": 0.66, - "learning_rate": 0.00020034861839151206, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.0002487999668205536, + "loss": 0.0215, "step": 131680 }, { - "epoch": 0.66, - "learning_rate": 0.00020034105069849804, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024879607860418216, + "loss": 0.0237, "step": 131690 }, { - "epoch": 0.66, - "learning_rate": 0.00020033348300548402, - "loss": 0.0121, + "epoch": 0.34, + "learning_rate": 0.00024879219038781067, + "loss": 0.0248, "step": 131700 }, { - "epoch": 0.66, - "learning_rate": 0.00020032591531247003, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.0002487883021714392, + "loss": 0.0216, "step": 131710 }, { - "epoch": 0.66, - "learning_rate": 0.000200318347619456, - "loss": 0.0125, + "epoch": 0.34, + "learning_rate": 0.00024878441395506776, + "loss": 0.0255, "step": 131720 }, { - "epoch": 0.66, - "learning_rate": 0.000200310779926442, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002487805257386963, + "loss": 0.0177, "step": 131730 }, { - "epoch": 0.66, - "learning_rate": 0.000200303212233428, - "loss": 0.0193, + "epoch": 0.34, + "learning_rate": 0.00024877663752232484, + "loss": 0.0201, "step": 131740 }, { - "epoch": 0.66, - "learning_rate": 0.00020029564454041398, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024877274930595335, + "loss": 0.0216, "step": 131750 }, { - "epoch": 0.66, - "learning_rate": 0.00020028807684739996, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.00024876886108958187, + "loss": 0.0192, "step": 131760 }, { - "epoch": 0.66, - "learning_rate": 0.00020028050915438597, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.00024876497287321044, + "loss": 0.0173, "step": 131770 }, { - "epoch": 0.66, - "learning_rate": 0.00020027294146137195, - "loss": 0.0099, + "epoch": 0.34, + "learning_rate": 0.00024876108465683895, + "loss": 0.0177, "step": 131780 }, { - "epoch": 0.66, - "learning_rate": 0.00020026537376835793, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002487571964404675, + "loss": 0.0171, "step": 131790 }, { - "epoch": 0.66, - "learning_rate": 0.00020025780607534394, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024875330822409603, + "loss": 0.0196, "step": 131800 }, { - "epoch": 0.66, - "learning_rate": 0.00020025023838232992, - "loss": 0.0179, + "epoch": 0.34, + "learning_rate": 0.00024874942000772455, + "loss": 0.02, "step": 131810 }, { - "epoch": 0.67, - "learning_rate": 0.0002002426706893159, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002487455317913531, + "loss": 0.0203, "step": 131820 }, { - "epoch": 0.67, - "learning_rate": 0.00020023510299630189, - "loss": 0.0191, + "epoch": 0.34, + "learning_rate": 0.00024874164357498163, + "loss": 0.0204, "step": 131830 }, { - "epoch": 0.67, - "learning_rate": 0.0002002275353032879, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.00024873775535861015, + "loss": 0.0201, "step": 131840 }, { - "epoch": 0.67, - "learning_rate": 0.00020021996761027388, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.0002487338671422387, + "loss": 0.0176, "step": 131850 }, { - "epoch": 0.67, - "learning_rate": 0.00020021239991725986, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.00024872997892586723, + "loss": 0.0216, "step": 131860 }, { - "epoch": 0.67, - "learning_rate": 0.00020020483222424587, - "loss": 0.0146, + "epoch": 0.34, + "learning_rate": 0.0002487260907094958, + "loss": 0.0163, "step": 131870 }, { - "epoch": 0.67, - "learning_rate": 0.00020019726453123185, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.0002487222024931243, + "loss": 0.0173, "step": 131880 }, { - "epoch": 0.67, - "learning_rate": 0.00020018969683821783, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.00024871831427675283, + "loss": 0.025, "step": 131890 }, { - "epoch": 0.67, - "learning_rate": 0.00020018212914520384, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002487144260603814, + "loss": 0.0205, "step": 131900 }, { - "epoch": 0.67, - "learning_rate": 0.00020017456145218982, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.0002487105378440099, + "loss": 0.021, "step": 131910 }, { - "epoch": 0.67, - "learning_rate": 0.0002001669937591758, - "loss": 0.013, + "epoch": 0.34, + "learning_rate": 0.0002487066496276385, + "loss": 0.0164, "step": 131920 }, { - "epoch": 0.67, - "learning_rate": 0.0002001594260661618, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.000248702761411267, + "loss": 0.0203, "step": 131930 }, { - "epoch": 0.67, - "learning_rate": 0.0002001518583731478, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024869887319489556, + "loss": 0.0201, "step": 131940 }, { - "epoch": 0.67, - "learning_rate": 0.00020014429068013377, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002486949849785241, + "loss": 0.0176, "step": 131950 }, { - "epoch": 0.67, - "learning_rate": 0.00020013672298711978, - "loss": 0.0124, + "epoch": 0.34, + "learning_rate": 0.0002486910967621526, + "loss": 0.0203, "step": 131960 }, { - "epoch": 0.67, - "learning_rate": 0.00020012915529410576, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002486872085457811, + "loss": 0.0196, "step": 131970 }, { - "epoch": 0.67, - "learning_rate": 0.00020012158760109174, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.0002486833203294097, + "loss": 0.0183, "step": 131980 }, { - "epoch": 0.67, - "learning_rate": 0.00020011401990807775, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002486794321130382, + "loss": 0.0199, "step": 131990 }, { - "epoch": 0.67, - "learning_rate": 0.00020010645221506373, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.00024867554389666676, + "loss": 0.0186, "step": 132000 }, { - "epoch": 0.67, - "eval_cer": 0.9144430848116509, - "eval_loss": 0.009661003015935421, - "eval_runtime": 116.7282, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.34, + "eval_cer": 0.8818034601824287, + "eval_loss": 0.014384100213646889, + "eval_runtime": 107.6844, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, "step": 132000 }, { - "epoch": 0.67, - "learning_rate": 0.00020009888452204971, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.0002486716556802953, + "loss": 0.0219, "step": 132010 }, { - "epoch": 0.67, - "learning_rate": 0.0002000913168290357, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.0002486677674639238, + "loss": 0.0215, "step": 132020 }, { - "epoch": 0.67, - "learning_rate": 0.0002000837491360217, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.00024866387924755236, + "loss": 0.014, "step": 132030 }, { - "epoch": 0.67, - "learning_rate": 0.00020007618144300769, - "loss": 0.0115, + "epoch": 0.34, + "learning_rate": 0.00024865999103118087, + "loss": 0.0201, "step": 132040 }, { - "epoch": 0.67, - "learning_rate": 0.00020006861374999367, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.0002486561028148094, + "loss": 0.0265, "step": 132050 }, { - "epoch": 0.67, - "learning_rate": 0.00020006104605697968, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.00024865221459843795, + "loss": 0.0225, "step": 132060 }, { - "epoch": 0.67, - "learning_rate": 0.00020005347836396566, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.0002486483263820665, + "loss": 0.0199, "step": 132070 }, { - "epoch": 0.67, - "learning_rate": 0.00020004591067095164, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024864443816569504, + "loss": 0.0173, "step": 132080 }, { - "epoch": 0.67, - "learning_rate": 0.00020003834297793765, + "epoch": 0.34, + "learning_rate": 0.00024864054994932355, "loss": 0.0195, "step": 132090 }, { - "epoch": 0.67, - "learning_rate": 0.00020003077528492363, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024863666173295207, + "loss": 0.0237, "step": 132100 }, { - "epoch": 0.67, - "learning_rate": 0.0002000232075919096, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.00024863277351658064, + "loss": 0.0182, "step": 132110 }, { - "epoch": 0.67, - "learning_rate": 0.00020001563989889562, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.00024862888530020915, + "loss": 0.0182, "step": 132120 }, { - "epoch": 0.67, - "learning_rate": 0.0002000080722058816, - "loss": 0.0092, + "epoch": 0.34, + "learning_rate": 0.0002486249970838377, + "loss": 0.0155, "step": 132130 }, { - "epoch": 0.67, - "learning_rate": 0.00020000050451286758, - "loss": 0.0113, + "epoch": 0.34, + "learning_rate": 0.00024862110886746623, + "loss": 0.0221, "step": 132140 }, { - "epoch": 0.67, - "learning_rate": 0.0001999929368198536, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.0002486172206510948, + "loss": 0.0224, "step": 132150 }, { - "epoch": 0.67, - "learning_rate": 0.00019998536912683957, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002486133324347233, + "loss": 0.0163, "step": 132160 }, { - "epoch": 0.67, - "learning_rate": 0.00019997780143382555, - "loss": 0.0112, + "epoch": 0.34, + "learning_rate": 0.00024860944421835183, + "loss": 0.0236, "step": 132170 }, { - "epoch": 0.67, - "learning_rate": 0.00019997023374081153, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.00024860555600198035, + "loss": 0.0199, "step": 132180 }, { - "epoch": 0.67, - "learning_rate": 0.00019996266604779754, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002486016677856089, + "loss": 0.0201, "step": 132190 }, { - "epoch": 0.67, - "learning_rate": 0.00019995509835478352, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024859777956923743, + "loss": 0.0166, "step": 132200 }, { - "epoch": 0.67, - "learning_rate": 0.0001999475306617695, - "loss": 0.0152, + "epoch": 0.34, + "learning_rate": 0.000248593891352866, + "loss": 0.0163, "step": 132210 }, { - "epoch": 0.67, - "learning_rate": 0.00019993996296875551, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.0002485900031364945, + "loss": 0.021, "step": 132220 }, { - "epoch": 0.67, - "learning_rate": 0.0001999323952757415, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.0002485861149201231, + "loss": 0.0202, "step": 132230 }, { - "epoch": 0.67, - "learning_rate": 0.00019992482758272748, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002485822267037516, + "loss": 0.0176, "step": 132240 }, { - "epoch": 0.67, - "learning_rate": 0.00019991725988971349, - "loss": 0.0118, + "epoch": 0.34, + "learning_rate": 0.0002485783384873801, + "loss": 0.0223, "step": 132250 }, { - "epoch": 0.67, - "learning_rate": 0.00019990969219669947, - "loss": 0.0154, + "epoch": 0.34, + "learning_rate": 0.0002485744502710086, + "loss": 0.0225, "step": 132260 }, { - "epoch": 0.67, - "learning_rate": 0.00019990212450368545, - "loss": 0.0166, + "epoch": 0.34, + "learning_rate": 0.0002485705620546372, + "loss": 0.0205, "step": 132270 }, { - "epoch": 0.67, - "learning_rate": 0.00019989455681067146, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024856667383826576, + "loss": 0.0192, "step": 132280 }, { - "epoch": 0.67, - "learning_rate": 0.00019988698911765744, - "loss": 0.011, + "epoch": 0.34, + "learning_rate": 0.0002485627856218943, + "loss": 0.0194, "step": 132290 }, { - "epoch": 0.67, - "learning_rate": 0.00019987942142464342, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.0002485588974055228, + "loss": 0.0192, "step": 132300 }, { - "epoch": 0.67, - "learning_rate": 0.00019987185373162943, - "loss": 0.015, + "epoch": 0.34, + "learning_rate": 0.0002485550091891513, + "loss": 0.0182, "step": 132310 }, { - "epoch": 0.67, - "learning_rate": 0.0001998642860386154, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.0002485511209727799, + "loss": 0.0224, "step": 132320 }, { - "epoch": 0.67, - "learning_rate": 0.0001998567183456014, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002485472327564084, + "loss": 0.02, "step": 132330 }, { - "epoch": 0.67, - "learning_rate": 0.00019984915065258737, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.00024854334454003696, + "loss": 0.0202, "step": 132340 }, { - "epoch": 0.67, - "learning_rate": 0.00019984158295957338, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024853945632366547, + "loss": 0.0181, "step": 132350 }, { - "epoch": 0.67, - "learning_rate": 0.00019983401526655936, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.00024853556810729404, + "loss": 0.0209, "step": 132360 }, { - "epoch": 0.67, - "learning_rate": 0.00019982644757354534, - "loss": 0.0192, + "epoch": 0.34, + "learning_rate": 0.00024853167989092256, + "loss": 0.0193, "step": 132370 }, { - "epoch": 0.67, - "learning_rate": 0.00019981887988053135, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.00024852779167455107, + "loss": 0.02, "step": 132380 }, { - "epoch": 0.67, - "learning_rate": 0.00019981131218751733, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.0002485239034581796, + "loss": 0.0223, "step": 132390 }, { - "epoch": 0.67, - "learning_rate": 0.00019980374449450332, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.00024852001524180815, + "loss": 0.0206, "step": 132400 }, { - "epoch": 0.67, - "learning_rate": 0.00019979617680148932, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002485161270254367, + "loss": 0.0152, "step": 132410 }, { - "epoch": 0.67, - "learning_rate": 0.0001997886091084753, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.00024851223880906524, + "loss": 0.0231, "step": 132420 }, { - "epoch": 0.67, - "learning_rate": 0.0001997810414154613, - "loss": 0.0144, + "epoch": 0.34, + "learning_rate": 0.00024850835059269375, + "loss": 0.0174, "step": 132430 }, { - "epoch": 0.67, - "learning_rate": 0.0001997734737224473, - "loss": 0.0115, + "epoch": 0.34, + "learning_rate": 0.0002485044623763223, + "loss": 0.0193, "step": 132440 }, { - "epoch": 0.67, - "learning_rate": 0.00019976590602943328, - "loss": 0.0166, + "epoch": 0.34, + "learning_rate": 0.00024850057415995083, + "loss": 0.0246, "step": 132450 }, { - "epoch": 0.67, - "learning_rate": 0.00019975833833641926, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024849668594357935, + "loss": 0.0179, "step": 132460 }, { - "epoch": 0.67, - "learning_rate": 0.00019975077064340527, - "loss": 0.0301, + "epoch": 0.34, + "learning_rate": 0.0002484927977272079, + "loss": 0.0207, "step": 132470 }, { - "epoch": 0.67, - "learning_rate": 0.00019974320295039125, - "loss": 0.0163, + "epoch": 0.34, + "learning_rate": 0.00024848890951083643, + "loss": 0.0174, "step": 132480 }, { - "epoch": 0.67, - "learning_rate": 0.00019973563525737723, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.000248485021294465, + "loss": 0.0222, "step": 132490 }, { - "epoch": 0.67, - "learning_rate": 0.00019972806756436324, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002484811330780935, + "loss": 0.0167, "step": 132500 }, { - "epoch": 0.67, - "learning_rate": 0.00019972049987134922, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.00024847724486172203, + "loss": 0.0165, "step": 132510 }, { - "epoch": 0.67, - "learning_rate": 0.0001997129321783352, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.00024847335664535054, + "loss": 0.0196, "step": 132520 }, { - "epoch": 0.67, - "learning_rate": 0.00019970536448532118, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.0002484694684289791, + "loss": 0.0184, "step": 132530 }, { - "epoch": 0.67, - "learning_rate": 0.0001996977967923072, - "loss": 0.0157, + "epoch": 0.34, + "learning_rate": 0.00024846558021260763, + "loss": 0.0199, "step": 132540 }, { - "epoch": 0.67, - "learning_rate": 0.00019969022909929317, - "loss": 0.0149, + "epoch": 0.34, + "learning_rate": 0.0002484616919962362, + "loss": 0.0226, "step": 132550 }, { - "epoch": 0.67, - "learning_rate": 0.00019968266140627915, - "loss": 0.0137, + "epoch": 0.34, + "learning_rate": 0.0002484578037798647, + "loss": 0.0185, "step": 132560 }, { - "epoch": 0.67, - "learning_rate": 0.00019967509371326516, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.0002484539155634933, + "loss": 0.0163, "step": 132570 }, { - "epoch": 0.67, - "learning_rate": 0.00019966752602025114, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002484500273471218, + "loss": 0.0295, "step": 132580 }, { - "epoch": 0.67, - "learning_rate": 0.00019965995832723713, - "loss": 0.0176, + "epoch": 0.34, + "learning_rate": 0.0002484461391307503, + "loss": 0.0218, "step": 132590 }, { - "epoch": 0.67, - "learning_rate": 0.00019965239063422313, - "loss": 0.0151, + "epoch": 0.34, + "learning_rate": 0.0002484422509143788, + "loss": 0.0221, "step": 132600 }, { - "epoch": 0.67, - "learning_rate": 0.0001996448229412091, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002484383626980074, + "loss": 0.0211, "step": 132610 }, { - "epoch": 0.67, - "learning_rate": 0.00019963725524819507, - "loss": 0.025, + "epoch": 0.34, + "learning_rate": 0.00024843447448163596, + "loss": 0.0205, "step": 132620 }, { - "epoch": 0.67, - "learning_rate": 0.00019962968755518105, - "loss": 0.0155, + "epoch": 0.34, + "learning_rate": 0.0002484305862652645, + "loss": 0.0191, "step": 132630 }, { - "epoch": 0.67, - "learning_rate": 0.00019962211986216706, - "loss": 0.0168, + "epoch": 0.34, + "learning_rate": 0.000248426698048893, + "loss": 0.0255, "step": 132640 }, { - "epoch": 0.67, - "learning_rate": 0.00019961455216915304, - "loss": 0.0151, + "epoch": 0.34, + "learning_rate": 0.00024842280983252156, + "loss": 0.0191, "step": 132650 }, { - "epoch": 0.67, - "learning_rate": 0.00019960698447613902, - "loss": 0.0133, + "epoch": 0.34, + "learning_rate": 0.0002484189216161501, + "loss": 0.0225, "step": 132660 }, { - "epoch": 0.67, - "learning_rate": 0.00019959941678312503, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.0002484150333997786, + "loss": 0.0192, "step": 132670 }, { - "epoch": 0.67, - "learning_rate": 0.000199591849090111, - "loss": 0.0165, + "epoch": 0.34, + "learning_rate": 0.00024841114518340716, + "loss": 0.0208, "step": 132680 }, { - "epoch": 0.67, - "learning_rate": 0.000199584281397097, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.00024840725696703567, + "loss": 0.0172, "step": 132690 }, { - "epoch": 0.67, - "learning_rate": 0.000199576713704083, - "loss": 0.011, + "epoch": 0.34, + "learning_rate": 0.00024840336875066424, + "loss": 0.0233, "step": 132700 }, { - "epoch": 0.67, - "learning_rate": 0.00019956914601106898, - "loss": 0.0129, + "epoch": 0.34, + "learning_rate": 0.00024839948053429275, + "loss": 0.0197, "step": 132710 }, { - "epoch": 0.67, - "learning_rate": 0.00019956157831805497, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.00024839559231792127, + "loss": 0.0177, "step": 132720 }, { - "epoch": 0.67, - "learning_rate": 0.00019955401062504095, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.00024839170410154984, + "loss": 0.0217, "step": 132730 }, { - "epoch": 0.67, - "learning_rate": 0.00019954644293202696, - "loss": 0.012, + "epoch": 0.34, + "learning_rate": 0.00024838781588517835, + "loss": 0.0263, "step": 132740 }, { - "epoch": 0.67, - "learning_rate": 0.00019953887523901294, - "loss": 0.0143, + "epoch": 0.34, + "learning_rate": 0.00024838392766880687, + "loss": 0.0199, "step": 132750 }, { - "epoch": 0.67, - "learning_rate": 0.00019953130754599892, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.00024838003945243544, + "loss": 0.024, "step": 132760 }, { - "epoch": 0.67, - "learning_rate": 0.00019952373985298493, - "loss": 0.0135, + "epoch": 0.34, + "learning_rate": 0.00024837615123606395, + "loss": 0.0186, "step": 132770 }, { - "epoch": 0.67, - "learning_rate": 0.0001995161721599709, - "loss": 0.0138, + "epoch": 0.34, + "learning_rate": 0.0002483722630196925, + "loss": 0.0164, "step": 132780 }, { - "epoch": 0.67, - "learning_rate": 0.0001995086044669569, - "loss": 0.0139, + "epoch": 0.34, + "learning_rate": 0.00024836837480332103, + "loss": 0.0183, "step": 132790 }, { - "epoch": 0.67, - "learning_rate": 0.0001995010367739429, - "loss": 0.0161, + "epoch": 0.34, + "learning_rate": 0.00024836448658694955, + "loss": 0.0205, "step": 132800 }, { - "epoch": 0.67, - "learning_rate": 0.00019949346908092888, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.0002483605983705781, + "loss": 0.0255, "step": 132810 }, { - "epoch": 0.67, - "learning_rate": 0.00019948590138791486, - "loss": 0.0119, + "epoch": 0.34, + "learning_rate": 0.00024835671015420663, + "loss": 0.0201, "step": 132820 }, { - "epoch": 0.67, - "learning_rate": 0.00019947833369490087, - "loss": 0.017, + "epoch": 0.34, + "learning_rate": 0.0002483528219378352, + "loss": 0.0171, "step": 132830 }, { - "epoch": 0.67, - "learning_rate": 0.00019947076600188685, - "loss": 0.0116, + "epoch": 0.34, + "learning_rate": 0.0002483489337214637, + "loss": 0.0185, "step": 132840 }, { - "epoch": 0.67, - "learning_rate": 0.00019946319830887283, - "loss": 0.0134, + "epoch": 0.34, + "learning_rate": 0.00024834504550509223, + "loss": 0.0183, "step": 132850 }, { - "epoch": 0.67, - "learning_rate": 0.00019945563061585884, - "loss": 0.0169, + "epoch": 0.34, + "learning_rate": 0.0002483411572887208, + "loss": 0.021, "step": 132860 }, { - "epoch": 0.67, - "learning_rate": 0.00019944806292284482, - "loss": 0.0109, + "epoch": 0.34, + "learning_rate": 0.0002483372690723493, + "loss": 0.0272, "step": 132870 }, { - "epoch": 0.67, - "learning_rate": 0.0001994404952298308, - "loss": 0.0142, + "epoch": 0.34, + "learning_rate": 0.0002483333808559778, + "loss": 0.0232, "step": 132880 }, { - "epoch": 0.67, - "learning_rate": 0.0001994329275368168, - "loss": 0.0132, + "epoch": 0.34, + "learning_rate": 0.0002483294926396064, + "loss": 0.0209, "step": 132890 }, { - "epoch": 0.67, - "learning_rate": 0.0001994253598438028, - "loss": 0.0153, + "epoch": 0.34, + "learning_rate": 0.0002483256044232349, + "loss": 0.0192, "step": 132900 }, { - "epoch": 0.67, - "learning_rate": 0.00019941779215078878, - "loss": 0.0141, + "epoch": 0.34, + "learning_rate": 0.0002483217162068635, + "loss": 0.0187, "step": 132910 }, { - "epoch": 0.67, - "learning_rate": 0.00019941022445777476, - "loss": 0.0148, + "epoch": 0.34, + "learning_rate": 0.000248317827990492, + "loss": 0.0169, "step": 132920 }, { - "epoch": 0.67, - "learning_rate": 0.00019940265676476077, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.0002483139397741205, + "loss": 0.0193, "step": 132930 }, { - "epoch": 0.67, - "learning_rate": 0.00019939508907174675, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.0002483100515577491, + "loss": 0.0233, "step": 132940 }, { - "epoch": 0.67, - "learning_rate": 0.00019938752137873273, - "loss": 0.0159, + "epoch": 0.34, + "learning_rate": 0.0002483061633413776, + "loss": 0.023, "step": 132950 }, { - "epoch": 0.67, - "learning_rate": 0.00019937995368571874, - "loss": 0.0128, + "epoch": 0.34, + "learning_rate": 0.00024830227512500616, + "loss": 0.02, "step": 132960 }, { - "epoch": 0.67, - "learning_rate": 0.00019937238599270472, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.0002482983869086347, + "loss": 0.0231, "step": 132970 }, { - "epoch": 0.67, - "learning_rate": 0.0001993648182996907, - "loss": 0.0122, + "epoch": 0.34, + "learning_rate": 0.00024829449869226324, + "loss": 0.0239, "step": 132980 }, { - "epoch": 0.67, - "learning_rate": 0.0001993572506066767, - "loss": 0.0117, + "epoch": 0.34, + "learning_rate": 0.00024829061047589176, + "loss": 0.0284, "step": 132990 }, { - "epoch": 0.67, - "learning_rate": 0.0001993496829136627, - "loss": 0.0126, + "epoch": 0.34, + "learning_rate": 0.00024828672225952027, + "loss": 0.0241, "step": 133000 }, { - "epoch": 0.67, - "eval_cer": 0.9144964565985481, - "eval_loss": 0.009822376072406769, - "eval_runtime": 116.6404, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.34, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.013718601316213608, + "eval_runtime": 107.4626, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, "step": 133000 }, { - "epoch": 0.67, - "learning_rate": 0.00019934211522064867, - "loss": 0.0111, + "epoch": 0.34, + "learning_rate": 0.0002482828340431488, + "loss": 0.0189, "step": 133010 }, { - "epoch": 0.67, - "learning_rate": 0.00019933454752763468, - "loss": 0.0119, + "epoch": 0.34, + "learning_rate": 0.00024827894582677736, + "loss": 0.0176, "step": 133020 }, { - "epoch": 0.67, - "learning_rate": 0.00019932697983462066, - "loss": 0.0162, + "epoch": 0.34, + "learning_rate": 0.00024827505761040587, + "loss": 0.0176, "step": 133030 }, { - "epoch": 0.67, - "learning_rate": 0.00019931941214160664, - "loss": 0.0136, + "epoch": 0.34, + "learning_rate": 0.00024827116939403444, + "loss": 0.0172, "step": 133040 }, { - "epoch": 0.67, - "learning_rate": 0.00019931184444859265, - "loss": 0.0115, + "epoch": 0.34, + "learning_rate": 0.00024826728117766295, + "loss": 0.0291, "step": 133050 }, { - "epoch": 0.67, - "learning_rate": 0.00019930427675557863, - "loss": 0.0158, + "epoch": 0.34, + "learning_rate": 0.00024826339296129147, + "loss": 0.02, "step": 133060 }, { - "epoch": 0.67, - "learning_rate": 0.00019929670906256462, - "loss": 0.014, + "epoch": 0.34, + "learning_rate": 0.00024825950474492004, + "loss": 0.0188, "step": 133070 }, { - "epoch": 0.67, - "learning_rate": 0.0001992891413695506, - "loss": 0.0145, + "epoch": 0.34, + "learning_rate": 0.00024825561652854855, + "loss": 0.0192, "step": 133080 }, { - "epoch": 0.67, - "learning_rate": 0.0001992815736765366, - "loss": 0.0151, + "epoch": 0.34, + "learning_rate": 0.00024825172831217707, + "loss": 0.0204, "step": 133090 }, { - "epoch": 0.67, - "learning_rate": 0.00019927400598352259, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.00024824784009580563, + "loss": 0.0207, "step": 133100 }, { - "epoch": 0.67, - "learning_rate": 0.00019926643829050857, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.0002482439518794342, + "loss": 0.0218, "step": 133110 }, { - "epoch": 0.67, - "learning_rate": 0.00019925887059749458, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.0002482400636630627, + "loss": 0.0222, "step": 133120 }, { - "epoch": 0.67, - "learning_rate": 0.00019925130290448056, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.00024823617544669123, + "loss": 0.0202, "step": 133130 }, { - "epoch": 0.67, - "learning_rate": 0.00019924373521146654, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.00024823228723031975, + "loss": 0.0239, "step": 133140 }, { - "epoch": 0.67, - "learning_rate": 0.00019923616751845255, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.0002482283990139483, + "loss": 0.0236, "step": 133150 }, { - "epoch": 0.67, - "learning_rate": 0.00019922859982543853, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024822451079757683, + "loss": 0.0206, "step": 133160 }, { - "epoch": 0.67, - "learning_rate": 0.0001992210321324245, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.0002482206225812054, + "loss": 0.0239, "step": 133170 }, { - "epoch": 0.67, - "learning_rate": 0.00019921346443941052, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.0002482167343648339, + "loss": 0.0222, "step": 133180 }, { - "epoch": 0.67, - "learning_rate": 0.0001992058967463965, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002482128461484625, + "loss": 0.0209, "step": 133190 }, { - "epoch": 0.67, - "learning_rate": 0.00019919832905338248, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.000248208957932091, + "loss": 0.0202, "step": 133200 }, { - "epoch": 0.67, - "learning_rate": 0.0001991907613603685, - "loss": 0.012, + "epoch": 0.35, + "learning_rate": 0.0002482050697157195, + "loss": 0.0233, "step": 133210 }, { - "epoch": 0.67, - "learning_rate": 0.00019918319366735447, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.000248201181499348, + "loss": 0.0335, "step": 133220 }, { - "epoch": 0.67, - "learning_rate": 0.00019917562597434045, - "loss": 0.0119, + "epoch": 0.35, + "learning_rate": 0.0002481972932829766, + "loss": 0.0234, "step": 133230 }, { - "epoch": 0.67, - "learning_rate": 0.00019916805828132644, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.0002481934050666051, + "loss": 0.0199, "step": 133240 }, { - "epoch": 0.67, - "learning_rate": 0.00019916049058831244, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.0002481895168502337, + "loss": 0.0229, "step": 133250 }, { - "epoch": 0.67, - "learning_rate": 0.00019915292289529843, - "loss": 0.016, + "epoch": 0.35, + "learning_rate": 0.0002481856286338622, + "loss": 0.0246, "step": 133260 }, { - "epoch": 0.67, - "learning_rate": 0.0001991453552022844, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.0002481817404174907, + "loss": 0.0192, "step": 133270 }, { - "epoch": 0.67, - "learning_rate": 0.00019913778750927042, - "loss": 0.017, + "epoch": 0.35, + "learning_rate": 0.0002481778522011193, + "loss": 0.0238, "step": 133280 }, { - "epoch": 0.67, - "learning_rate": 0.0001991302198162564, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002481739639847478, + "loss": 0.0188, "step": 133290 }, { - "epoch": 0.67, - "learning_rate": 0.00019912265212324238, - "loss": 0.0113, + "epoch": 0.35, + "learning_rate": 0.0002481700757683763, + "loss": 0.0198, "step": 133300 }, { - "epoch": 0.67, - "learning_rate": 0.0001991150844302284, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002481661875520049, + "loss": 0.0197, "step": 133310 }, { - "epoch": 0.67, - "learning_rate": 0.00019910751673721437, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.00024816229933563344, + "loss": 0.0181, "step": 133320 }, { - "epoch": 0.67, - "learning_rate": 0.00019909994904420035, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024815841111926196, + "loss": 0.02, "step": 133330 }, { - "epoch": 0.67, - "learning_rate": 0.00019909238135118636, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.00024815452290289047, + "loss": 0.0222, "step": 133340 }, { - "epoch": 0.67, - "learning_rate": 0.00019908481365817234, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.000248150634686519, + "loss": 0.0215, "step": 133350 }, { - "epoch": 0.67, - "learning_rate": 0.00019907724596515832, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.00024814674647014755, + "loss": 0.019, "step": 133360 }, { - "epoch": 0.67, - "learning_rate": 0.00019906967827214433, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024814285825377607, + "loss": 0.0203, "step": 133370 }, { - "epoch": 0.67, - "learning_rate": 0.0001990621105791303, - "loss": 0.0222, + "epoch": 0.35, + "learning_rate": 0.00024813897003740464, + "loss": 0.0188, "step": 133380 }, { - "epoch": 0.67, - "learning_rate": 0.0001990545428861163, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.00024813508182103315, + "loss": 0.0169, "step": 133390 }, { - "epoch": 0.67, - "learning_rate": 0.00019904697519310227, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002481311936046617, + "loss": 0.0201, "step": 133400 }, { - "epoch": 0.67, - "learning_rate": 0.00019903940750008828, - "loss": 0.0174, + "epoch": 0.35, + "learning_rate": 0.00024812730538829024, + "loss": 0.0274, "step": 133410 }, { - "epoch": 0.67, - "learning_rate": 0.00019903183980707426, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.00024812341717191875, + "loss": 0.0221, "step": 133420 }, { - "epoch": 0.67, - "learning_rate": 0.00019902427211406025, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024811952895554726, + "loss": 0.0216, "step": 133430 }, { - "epoch": 0.67, - "learning_rate": 0.00019901670442104625, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.00024811564073917583, + "loss": 0.0192, "step": 133440 }, { - "epoch": 0.67, - "learning_rate": 0.00019900913672803224, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024811175252280435, + "loss": 0.0176, "step": 133450 }, { - "epoch": 0.67, - "learning_rate": 0.00019900156903501822, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002481078643064329, + "loss": 0.0193, "step": 133460 }, { - "epoch": 0.67, - "learning_rate": 0.00019899400134200423, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.00024810397609006143, + "loss": 0.0204, "step": 133470 }, { - "epoch": 0.67, - "learning_rate": 0.0001989864336489902, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.00024810008787369, + "loss": 0.0206, "step": 133480 }, { - "epoch": 0.67, - "learning_rate": 0.0001989788659559762, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002480961996573185, + "loss": 0.025, "step": 133490 }, { - "epoch": 0.67, - "learning_rate": 0.0001989712982629622, - "loss": 0.0167, + "epoch": 0.35, + "learning_rate": 0.00024809231144094703, + "loss": 0.018, "step": 133500 }, { - "epoch": 0.67, - "learning_rate": 0.00019896373056994818, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002480884232245756, + "loss": 0.0194, "step": 133510 }, { - "epoch": 0.67, - "learning_rate": 0.00019895616287693416, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.0002480845350082041, + "loss": 0.0168, "step": 133520 }, { - "epoch": 0.67, - "learning_rate": 0.00019894859518392017, - "loss": 0.0181, + "epoch": 0.35, + "learning_rate": 0.0002480806467918327, + "loss": 0.0211, "step": 133530 }, { - "epoch": 0.67, - "learning_rate": 0.00019894102749090615, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002480767585754612, + "loss": 0.02, "step": 133540 }, { - "epoch": 0.67, - "learning_rate": 0.00019893345979789213, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.0002480728703590897, + "loss": 0.0183, "step": 133550 }, { - "epoch": 0.67, - "learning_rate": 0.00019892589210487814, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.0002480689821427182, + "loss": 0.0205, "step": 133560 }, { - "epoch": 0.67, - "learning_rate": 0.00019891832441186412, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.0002480650939263468, + "loss": 0.0154, "step": 133570 }, { - "epoch": 0.67, - "learning_rate": 0.0001989107567188501, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002480612057099753, + "loss": 0.0229, "step": 133580 }, { - "epoch": 0.67, - "learning_rate": 0.00019890318902583608, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.0002480573174936039, + "loss": 0.0167, "step": 133590 }, { - "epoch": 0.67, - "learning_rate": 0.0001988956213328221, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.0002480534292772324, + "loss": 0.0184, "step": 133600 }, { - "epoch": 0.67, - "learning_rate": 0.00019888805363980807, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.00024804954106086096, + "loss": 0.018, "step": 133610 }, { - "epoch": 0.67, - "learning_rate": 0.00019888048594679406, - "loss": 0.0156, + "epoch": 0.35, + "learning_rate": 0.0002480456528444895, + "loss": 0.018, "step": 133620 }, { - "epoch": 0.67, - "learning_rate": 0.00019887291825378006, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.000248041764628118, + "loss": 0.0242, "step": 133630 }, { - "epoch": 0.67, - "learning_rate": 0.00019886535056076605, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002480378764117465, + "loss": 0.0195, "step": 133640 }, { - "epoch": 0.67, - "learning_rate": 0.00019885778286775203, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024803398819537507, + "loss": 0.0196, "step": 133650 }, { - "epoch": 0.67, - "learning_rate": 0.00019885021517473804, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.00024803009997900364, + "loss": 0.0199, "step": 133660 }, { - "epoch": 0.67, - "learning_rate": 0.00019884264748172402, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024802621176263216, + "loss": 0.0195, "step": 133670 }, { - "epoch": 0.67, - "learning_rate": 0.00019883507978871, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.00024802232354626067, + "loss": 0.0233, "step": 133680 }, { - "epoch": 0.67, - "learning_rate": 0.000198827512095696, - "loss": 0.017, + "epoch": 0.35, + "learning_rate": 0.00024801843532988924, + "loss": 0.0257, "step": 133690 }, { - "epoch": 0.67, - "learning_rate": 0.000198819944402682, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024801454711351775, + "loss": 0.0197, "step": 133700 }, { - "epoch": 0.67, - "learning_rate": 0.00019881237670966797, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024801065889714627, + "loss": 0.0213, "step": 133710 }, { - "epoch": 0.67, - "learning_rate": 0.00019880480901665398, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024800677068077484, + "loss": 0.0207, "step": 133720 }, { - "epoch": 0.67, - "learning_rate": 0.00019879724132363996, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024800288246440335, + "loss": 0.0271, "step": 133730 }, { - "epoch": 0.67, - "learning_rate": 0.00019878967363062594, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.0002479989942480319, + "loss": 0.0203, "step": 133740 }, { - "epoch": 0.67, - "learning_rate": 0.00019878210593761192, - "loss": 0.0173, + "epoch": 0.35, + "learning_rate": 0.00024799510603166043, + "loss": 0.0204, "step": 133750 }, { - "epoch": 0.67, - "learning_rate": 0.00019877453824459793, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.00024799121781528895, + "loss": 0.0198, "step": 133760 }, { - "epoch": 0.67, - "learning_rate": 0.0001987669705515839, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024798732959891746, + "loss": 0.0179, "step": 133770 }, { - "epoch": 0.67, - "learning_rate": 0.0001987594028585699, - "loss": 0.0199, + "epoch": 0.35, + "learning_rate": 0.00024798344138254603, + "loss": 0.0252, "step": 133780 }, { - "epoch": 0.67, - "learning_rate": 0.0001987518351655559, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024797955316617455, + "loss": 0.0194, "step": 133790 }, { - "epoch": 0.68, - "learning_rate": 0.00019874426747254188, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002479756649498031, + "loss": 0.0185, "step": 133800 }, { - "epoch": 0.68, - "learning_rate": 0.00019873669977952787, - "loss": 0.0168, + "epoch": 0.35, + "learning_rate": 0.00024797177673343163, + "loss": 0.0207, "step": 133810 }, { - "epoch": 0.68, - "learning_rate": 0.00019872913208651387, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.0002479678885170602, + "loss": 0.0258, "step": 133820 }, { - "epoch": 0.68, - "learning_rate": 0.00019872156439349986, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002479640003006887, + "loss": 0.0333, "step": 133830 }, { - "epoch": 0.68, - "learning_rate": 0.00019871399670048584, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.00024796011208431723, + "loss": 0.0189, "step": 133840 }, { - "epoch": 0.68, - "learning_rate": 0.00019870642900747185, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.00024795622386794574, + "loss": 0.0186, "step": 133850 }, { - "epoch": 0.68, - "learning_rate": 0.0001986988613144578, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002479523356515743, + "loss": 0.0225, "step": 133860 }, { - "epoch": 0.68, - "learning_rate": 0.00019869129362144378, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002479484474352029, + "loss": 0.096, "step": 133870 }, { - "epoch": 0.68, - "learning_rate": 0.00019868372592842976, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.0002479445592188314, + "loss": 0.0277, "step": 133880 }, { - "epoch": 0.68, - "learning_rate": 0.00019867615823541577, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002479406710024599, + "loss": 0.0213, "step": 133890 }, { - "epoch": 0.68, - "learning_rate": 0.00019866859054240175, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.0002479367827860885, + "loss": 0.0272, "step": 133900 }, { - "epoch": 0.68, - "learning_rate": 0.00019866102284938773, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.000247932894569717, + "loss": 0.024, "step": 133910 }, { - "epoch": 0.68, - "learning_rate": 0.00019865345515637374, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002479290063533455, + "loss": 0.0212, "step": 133920 }, { - "epoch": 0.68, - "learning_rate": 0.00019864588746335972, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002479251181369741, + "loss": 0.02, "step": 133930 }, { - "epoch": 0.68, - "learning_rate": 0.0001986383197703457, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002479212299206026, + "loss": 0.0205, "step": 133940 }, { - "epoch": 0.68, - "learning_rate": 0.00019863075207733171, - "loss": 0.0327, + "epoch": 0.35, + "learning_rate": 0.00024791734170423116, + "loss": 0.0214, "step": 133950 }, { - "epoch": 0.68, - "learning_rate": 0.0001986231843843177, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002479134534878597, + "loss": 0.018, "step": 133960 }, { - "epoch": 0.68, - "learning_rate": 0.00019861561669130368, - "loss": 0.0166, + "epoch": 0.35, + "learning_rate": 0.0002479095652714882, + "loss": 0.0302, "step": 133970 }, { - "epoch": 0.68, - "learning_rate": 0.00019860804899828966, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.0002479056770551167, + "loss": 0.0189, "step": 133980 }, { - "epoch": 0.68, - "learning_rate": 0.00019860048130527567, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.00024790178883874527, + "loss": 0.0169, "step": 133990 }, { - "epoch": 0.68, - "learning_rate": 0.00019859291361226165, - "loss": 0.0116, + "epoch": 0.35, + "learning_rate": 0.00024789790062237384, + "loss": 0.0197, "step": 134000 }, { - "epoch": 0.68, - "eval_cer": 0.9144634631302844, - "eval_loss": 0.009661918506026268, - "eval_runtime": 116.6673, - "eval_samples_per_second": 17.143, - "eval_steps_per_second": 4.286, + "epoch": 0.35, + "eval_cer": 0.8817558725266665, + "eval_loss": 0.014305938966572285, + "eval_runtime": 107.3575, + "eval_samples_per_second": 18.629, + "eval_steps_per_second": 4.657, "step": 134000 }, { - "epoch": 0.68, - "learning_rate": 0.00019858534591924763, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.00024789401240600235, + "loss": 0.0234, "step": 134010 }, { - "epoch": 0.68, - "learning_rate": 0.00019857777822623364, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.00024789012418963087, + "loss": 0.0222, "step": 134020 }, { - "epoch": 0.68, - "learning_rate": 0.00019857021053321962, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.00024788623597325944, + "loss": 0.0188, "step": 134030 }, { - "epoch": 0.68, - "learning_rate": 0.0001985626428402056, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024788234775688795, + "loss": 0.0258, "step": 134040 }, { - "epoch": 0.68, - "learning_rate": 0.0001985550751471916, - "loss": 0.0279, + "epoch": 0.35, + "learning_rate": 0.00024787845954051647, + "loss": 0.0175, "step": 134050 }, { - "epoch": 0.68, - "learning_rate": 0.0001985475074541776, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.00024787457132414504, + "loss": 0.0185, "step": 134060 }, { - "epoch": 0.68, - "learning_rate": 0.00019853993976116357, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024787068310777355, + "loss": 0.0167, "step": 134070 }, { - "epoch": 0.68, - "learning_rate": 0.00019853237206814958, - "loss": 0.0199, + "epoch": 0.35, + "learning_rate": 0.0002478667948914021, + "loss": 0.0151, "step": 134080 }, { - "epoch": 0.68, - "learning_rate": 0.00019852480437513556, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024786290667503063, + "loss": 0.0213, "step": 134090 }, { - "epoch": 0.68, - "learning_rate": 0.00019851723668212154, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.00024785901845865915, + "loss": 0.0181, "step": 134100 }, { - "epoch": 0.68, - "learning_rate": 0.00019850966898910755, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002478551302422877, + "loss": 0.0192, "step": 134110 }, { - "epoch": 0.68, - "learning_rate": 0.00019850210129609353, + "epoch": 0.35, + "learning_rate": 0.00024785124202591623, "loss": 0.0191, "step": 134120 }, { - "epoch": 0.68, - "learning_rate": 0.00019849453360307952, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.00024784735380954475, + "loss": 0.0223, "step": 134130 }, { - "epoch": 0.68, - "learning_rate": 0.0001984869659100655, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.0002478434655931733, + "loss": 0.0249, "step": 134140 }, { - "epoch": 0.68, - "learning_rate": 0.0001984793982170515, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002478395773768019, + "loss": 0.0263, "step": 134150 }, { - "epoch": 0.68, - "learning_rate": 0.0001984718305240375, - "loss": 0.0197, + "epoch": 0.35, + "learning_rate": 0.0002478356891604304, + "loss": 0.0172, "step": 134160 }, { - "epoch": 0.68, - "learning_rate": 0.00019846426283102347, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002478318009440589, + "loss": 0.0192, "step": 134170 }, { - "epoch": 0.68, - "learning_rate": 0.00019845669513800948, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002478279127276874, + "loss": 0.021, "step": 134180 }, { - "epoch": 0.68, - "learning_rate": 0.00019844912744499546, - "loss": 0.0188, + "epoch": 0.35, + "learning_rate": 0.000247824024511316, + "loss": 0.0197, "step": 134190 }, { - "epoch": 0.68, - "learning_rate": 0.00019844155975198144, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002478201362949445, + "loss": 0.0251, "step": 134200 }, { - "epoch": 0.68, - "learning_rate": 0.00019843399205896745, - "loss": 0.0116, + "epoch": 0.35, + "learning_rate": 0.0002478162480785731, + "loss": 0.0189, "step": 134210 }, { - "epoch": 0.68, - "learning_rate": 0.00019842642436595343, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.0002478123598622016, + "loss": 0.0208, "step": 134220 }, { - "epoch": 0.68, - "learning_rate": 0.0001984188566729394, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.0002478084716458301, + "loss": 0.0239, "step": 134230 }, { - "epoch": 0.68, - "learning_rate": 0.00019841128897992542, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002478045834294587, + "loss": 0.0206, "step": 134240 }, { - "epoch": 0.68, - "learning_rate": 0.0001984037212869114, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.0002478006952130872, + "loss": 0.0227, "step": 134250 }, { - "epoch": 0.68, - "learning_rate": 0.00019839615359389738, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002477968069967157, + "loss": 0.0201, "step": 134260 }, { - "epoch": 0.68, - "learning_rate": 0.0001983885859008834, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.0002477929187803443, + "loss": 0.0173, "step": 134270 }, { - "epoch": 0.68, - "learning_rate": 0.00019838101820786937, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.0002477890305639728, + "loss": 0.0236, "step": 134280 }, { - "epoch": 0.68, - "learning_rate": 0.00019837345051485535, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024778514234760136, + "loss": 0.0223, "step": 134290 }, { - "epoch": 0.68, - "learning_rate": 0.00019836588282184134, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.00024778125413122987, + "loss": 0.0169, "step": 134300 }, { - "epoch": 0.68, - "learning_rate": 0.00019835831512882734, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.0002477773659148584, + "loss": 0.0148, "step": 134310 }, { - "epoch": 0.68, - "learning_rate": 0.00019835074743581333, - "loss": 0.016, + "epoch": 0.35, + "learning_rate": 0.00024777347769848696, + "loss": 0.019, "step": 134320 }, { - "epoch": 0.68, - "learning_rate": 0.0001983431797427993, - "loss": 0.0169, + "epoch": 0.35, + "learning_rate": 0.00024776958948211547, + "loss": 0.021, "step": 134330 }, { - "epoch": 0.68, - "learning_rate": 0.00019833561204978532, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.000247765701265744, + "loss": 0.0199, "step": 134340 }, { - "epoch": 0.68, - "learning_rate": 0.0001983280443567713, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024776181304937255, + "loss": 0.0196, "step": 134350 }, { - "epoch": 0.68, - "learning_rate": 0.00019832047666375728, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002477579248330011, + "loss": 0.0189, "step": 134360 }, { - "epoch": 0.68, - "learning_rate": 0.0001983129089707433, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.00024775403661662964, + "loss": 0.0212, "step": 134370 }, { - "epoch": 0.68, - "learning_rate": 0.00019830534127772927, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.00024775014840025815, + "loss": 0.0212, "step": 134380 }, { - "epoch": 0.68, - "learning_rate": 0.00019829777358471525, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.00024774626018388667, + "loss": 0.0153, "step": 134390 }, { - "epoch": 0.68, - "learning_rate": 0.00019829020589170126, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.00024774237196751523, + "loss": 0.019, "step": 134400 }, { - "epoch": 0.68, - "learning_rate": 0.00019828263819868724, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.00024773848375114375, + "loss": 0.0214, "step": 134410 }, { - "epoch": 0.68, - "learning_rate": 0.00019827507050567322, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.0002477345955347723, + "loss": 0.0176, "step": 134420 }, { - "epoch": 0.68, - "learning_rate": 0.00019826750281265923, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.00024773070731840083, + "loss": 0.0231, "step": 134430 }, { - "epoch": 0.68, - "learning_rate": 0.0001982599351196452, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.0002477268191020294, + "loss": 0.0193, "step": 134440 }, { - "epoch": 0.68, - "learning_rate": 0.0001982523674266312, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.0002477229308856579, + "loss": 0.0196, "step": 134450 }, { - "epoch": 0.68, - "learning_rate": 0.0001982447997336172, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.00024771904266928643, + "loss": 0.0195, "step": 134460 }, { - "epoch": 0.68, - "learning_rate": 0.00019823723204060318, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.00024771515445291494, + "loss": 0.0208, "step": 134470 }, { - "epoch": 0.68, - "learning_rate": 0.00019822966434758916, - "loss": 0.0139, + "epoch": 0.35, + "learning_rate": 0.0002477112662365435, + "loss": 0.0219, "step": 134480 }, { - "epoch": 0.68, - "learning_rate": 0.00019822209665457515, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.00024770737802017203, + "loss": 0.0233, "step": 134490 }, { - "epoch": 0.68, - "learning_rate": 0.00019821452896156115, - "loss": 0.0156, + "epoch": 0.35, + "learning_rate": 0.0002477034898038006, + "loss": 0.023, "step": 134500 }, { - "epoch": 0.68, - "learning_rate": 0.00019820696126854714, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.0002476996015874291, + "loss": 0.0276, "step": 134510 }, { - "epoch": 0.68, - "learning_rate": 0.00019819939357553312, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.0002476957133710576, + "loss": 0.019, "step": 134520 }, { - "epoch": 0.68, - "learning_rate": 0.00019819182588251913, - "loss": 0.0165, + "epoch": 0.35, + "learning_rate": 0.0002476918251546862, + "loss": 0.0204, "step": 134530 }, { - "epoch": 0.68, - "learning_rate": 0.0001981842581895051, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.0002476879369383147, + "loss": 0.0204, "step": 134540 }, { - "epoch": 0.68, - "learning_rate": 0.0001981766904964911, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002476840487219433, + "loss": 0.0237, "step": 134550 }, { - "epoch": 0.68, - "learning_rate": 0.0001981691228034771, - "loss": 0.0169, + "epoch": 0.35, + "learning_rate": 0.0002476801605055718, + "loss": 0.0187, "step": 134560 }, { - "epoch": 0.68, - "learning_rate": 0.00019816155511046308, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024767627228920036, + "loss": 0.0149, "step": 134570 }, { - "epoch": 0.68, - "learning_rate": 0.00019815398741744906, - "loss": 0.0189, + "epoch": 0.35, + "learning_rate": 0.0002476723840728289, + "loss": 0.0172, "step": 134580 }, { - "epoch": 0.68, - "learning_rate": 0.00019814641972443507, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002476684958564574, + "loss": 0.022, "step": 134590 }, { - "epoch": 0.68, - "learning_rate": 0.00019813885203142105, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.0002476646076400859, + "loss": 0.0168, "step": 134600 }, { - "epoch": 0.68, - "learning_rate": 0.00019813128433840703, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002476607194237145, + "loss": 0.0272, "step": 134610 }, { - "epoch": 0.68, - "learning_rate": 0.00019812371664539304, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.000247656831207343, + "loss": 0.0198, "step": 134620 }, { - "epoch": 0.68, - "learning_rate": 0.00019811614895237902, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.00024765294299097156, + "loss": 0.0221, "step": 134630 }, { - "epoch": 0.68, - "learning_rate": 0.000198108581259365, - "loss": 0.0166, + "epoch": 0.35, + "learning_rate": 0.00024764905477460007, + "loss": 0.0182, "step": 134640 }, { - "epoch": 0.68, - "learning_rate": 0.00019810101356635098, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.00024764516655822864, + "loss": 0.0162, "step": 134650 }, { - "epoch": 0.68, - "learning_rate": 0.000198093445873337, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.00024764127834185715, + "loss": 0.0194, "step": 134660 }, { - "epoch": 0.68, - "learning_rate": 0.00019808587818032297, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024763739012548567, + "loss": 0.0161, "step": 134670 }, { - "epoch": 0.68, - "learning_rate": 0.00019807831048730896, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.0002476335019091142, + "loss": 0.0225, "step": 134680 }, { - "epoch": 0.68, - "learning_rate": 0.00019807074279429496, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024762961369274275, + "loss": 0.0176, "step": 134690 }, { - "epoch": 0.68, - "learning_rate": 0.00019806317510128095, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.0002476257254763713, + "loss": 0.0228, "step": 134700 }, { - "epoch": 0.68, - "learning_rate": 0.00019805560740826693, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.00024762183725999984, + "loss": 0.0216, "step": 134710 }, { - "epoch": 0.68, - "learning_rate": 0.00019804803971525294, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.00024761794904362835, + "loss": 0.0204, "step": 134720 }, { - "epoch": 0.68, - "learning_rate": 0.00019804047202223892, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024761406082725686, + "loss": 0.0236, "step": 134730 }, { - "epoch": 0.68, - "learning_rate": 0.0001980329043292249, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.00024761017261088543, + "loss": 0.0191, "step": 134740 }, { - "epoch": 0.68, - "learning_rate": 0.0001980253366362109, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.00024760628439451395, + "loss": 0.0188, "step": 134750 }, { - "epoch": 0.68, - "learning_rate": 0.0001980177689431969, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002476023961781425, + "loss": 0.0197, "step": 134760 }, { - "epoch": 0.68, - "learning_rate": 0.00019801020125018287, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024759850796177103, + "loss": 0.0197, "step": 134770 }, { - "epoch": 0.68, - "learning_rate": 0.00019800263355716888, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.0002475946197453996, + "loss": 0.0255, "step": 134780 }, { - "epoch": 0.68, - "learning_rate": 0.00019799506586415486, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.0002475907315290281, + "loss": 0.0158, "step": 134790 }, { - "epoch": 0.68, - "learning_rate": 0.00019798749817114084, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.00024758684331265663, + "loss": 0.02, "step": 134800 }, { - "epoch": 0.68, - "learning_rate": 0.00019797993047812682, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024758295509628514, + "loss": 0.0279, "step": 134810 }, { - "epoch": 0.68, - "learning_rate": 0.00019797236278511283, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.0002475790668799137, + "loss": 0.0248, "step": 134820 }, { - "epoch": 0.68, - "learning_rate": 0.0001979647950920988, - "loss": 0.0155, + "epoch": 0.35, + "learning_rate": 0.0002475751786635422, + "loss": 0.0192, "step": 134830 }, { - "epoch": 0.68, - "learning_rate": 0.0001979572273990848, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002475712904471708, + "loss": 0.0161, "step": 134840 }, { - "epoch": 0.68, - "learning_rate": 0.0001979496597060708, - "loss": 0.0176, + "epoch": 0.35, + "learning_rate": 0.0002475674022307993, + "loss": 0.0209, "step": 134850 }, { - "epoch": 0.68, - "learning_rate": 0.00019794209201305678, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.0002475635140144279, + "loss": 0.0199, "step": 134860 }, { - "epoch": 0.68, - "learning_rate": 0.00019793452432004277, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.0002475596257980564, + "loss": 0.0196, "step": 134870 }, { - "epoch": 0.68, - "learning_rate": 0.00019792695662702877, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002475557375816849, + "loss": 0.0227, "step": 134880 }, { - "epoch": 0.68, - "learning_rate": 0.00019791938893401476, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002475518493653134, + "loss": 0.0169, "step": 134890 }, { - "epoch": 0.68, - "learning_rate": 0.00019791182124100074, - "loss": 0.0109, + "epoch": 0.35, + "learning_rate": 0.000247547961148942, + "loss": 0.0208, "step": 134900 }, { - "epoch": 0.68, - "learning_rate": 0.00019790425354798675, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.00024754407293257056, + "loss": 0.0254, "step": 134910 }, { - "epoch": 0.68, - "learning_rate": 0.00019789668585497273, - "loss": 0.0203, + "epoch": 0.35, + "learning_rate": 0.0002475401847161991, + "loss": 0.0204, "step": 134920 }, { - "epoch": 0.68, - "learning_rate": 0.0001978891181619587, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.0002475362964998276, + "loss": 0.0184, "step": 134930 }, { - "epoch": 0.68, - "learning_rate": 0.00019788155046894472, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.00024753240828345616, + "loss": 0.0191, "step": 134940 }, { - "epoch": 0.68, - "learning_rate": 0.0001978739827759307, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.00024752852006708467, + "loss": 0.0216, "step": 134950 }, { - "epoch": 0.68, - "learning_rate": 0.00019786641508291668, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.0002475246318507132, + "loss": 0.0157, "step": 134960 }, { - "epoch": 0.68, - "learning_rate": 0.0001978588473899027, - "loss": 0.0152, + "epoch": 0.35, + "learning_rate": 0.00024752074363434176, + "loss": 0.019, "step": 134970 }, { - "epoch": 0.68, - "learning_rate": 0.00019785127969688867, - "loss": 0.0125, + "epoch": 0.35, + "learning_rate": 0.00024751685541797027, + "loss": 0.0192, "step": 134980 }, { - "epoch": 0.68, - "learning_rate": 0.00019784371200387465, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024751296720159884, + "loss": 0.0192, "step": 134990 }, { - "epoch": 0.68, - "learning_rate": 0.00019783614431086063, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.00024750907898522735, + "loss": 0.0196, "step": 135000 }, { - "epoch": 0.68, - "eval_cer": 0.9144663743186606, - "eval_loss": 0.00933473464101553, - "eval_runtime": 116.6822, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.35, + "eval_cer": 0.8818258543733756, + "eval_loss": 0.014533363282680511, + "eval_runtime": 107.3258, + "eval_samples_per_second": 18.635, + "eval_steps_per_second": 4.659, "step": 135000 }, { - "epoch": 0.68, - "learning_rate": 0.00019782857661784664, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024750519076885587, + "loss": 0.0254, "step": 135010 }, { - "epoch": 0.68, - "learning_rate": 0.00019782100892483262, - "loss": 0.0107, + "epoch": 0.35, + "learning_rate": 0.0002475013025524844, + "loss": 0.019, "step": 135020 }, { - "epoch": 0.68, - "learning_rate": 0.0001978134412318186, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.00024749741433611295, + "loss": 0.0226, "step": 135030 }, { - "epoch": 0.68, - "learning_rate": 0.0001978058735388046, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024749352611974147, + "loss": 0.0187, "step": 135040 }, { - "epoch": 0.68, - "learning_rate": 0.0001977983058457906, + "epoch": 0.35, + "learning_rate": 0.00024748963790337003, "loss": 0.019, "step": 135050 }, { - "epoch": 0.68, - "learning_rate": 0.00019779073815277658, - "loss": 0.0179, + "epoch": 0.35, + "learning_rate": 0.00024748574968699855, + "loss": 0.0212, "step": 135060 }, { - "epoch": 0.68, - "learning_rate": 0.00019778317045976258, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002474818614706271, + "loss": 0.0222, "step": 135070 }, { - "epoch": 0.68, - "learning_rate": 0.00019777560276674857, - "loss": 0.0168, + "epoch": 0.35, + "learning_rate": 0.00024747797325425563, + "loss": 0.0229, "step": 135080 }, { - "epoch": 0.68, - "learning_rate": 0.00019776803507373455, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024747408503788415, + "loss": 0.0265, "step": 135090 }, { - "epoch": 0.68, - "learning_rate": 0.00019776046738072056, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.0002474701968215127, + "loss": 0.0213, "step": 135100 }, { - "epoch": 0.68, - "learning_rate": 0.00019775289968770654, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.00024746630860514123, + "loss": 0.0177, "step": 135110 }, { - "epoch": 0.68, - "learning_rate": 0.0001977453319946925, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002474624203887698, + "loss": 0.0261, "step": 135120 }, { - "epoch": 0.68, - "learning_rate": 0.00019773776430167847, - "loss": 0.0116, + "epoch": 0.35, + "learning_rate": 0.0002474585321723983, + "loss": 0.0226, "step": 135130 }, { - "epoch": 0.68, - "learning_rate": 0.00019773019660866448, - "loss": 0.0169, + "epoch": 0.35, + "learning_rate": 0.00024745464395602683, + "loss": 0.0196, "step": 135140 }, { - "epoch": 0.68, - "learning_rate": 0.00019772262891565046, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.0002474507557396554, + "loss": 0.0213, "step": 135150 }, { - "epoch": 0.68, - "learning_rate": 0.00019771506122263644, - "loss": 0.0118, + "epoch": 0.35, + "learning_rate": 0.0002474468675232839, + "loss": 0.0192, "step": 135160 }, { - "epoch": 0.68, - "learning_rate": 0.00019770749352962245, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002474429793069124, + "loss": 0.0301, "step": 135170 }, { - "epoch": 0.68, - "learning_rate": 0.00019769992583660843, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.000247439091090541, + "loss": 0.0226, "step": 135180 }, { - "epoch": 0.68, - "learning_rate": 0.00019769235814359442, - "loss": 0.0119, + "epoch": 0.35, + "learning_rate": 0.0002474352028741695, + "loss": 0.0235, "step": 135190 }, { - "epoch": 0.68, - "learning_rate": 0.0001976847904505804, - "loss": 0.0158, + "epoch": 0.35, + "learning_rate": 0.0002474313146577981, + "loss": 0.0198, "step": 135200 }, { - "epoch": 0.68, - "learning_rate": 0.0001976772227575664, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.0002474274264414266, + "loss": 0.0214, "step": 135210 }, { - "epoch": 0.68, - "learning_rate": 0.0001976696550645524, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002474235382250551, + "loss": 0.0174, "step": 135220 }, { - "epoch": 0.68, - "learning_rate": 0.00019766208737153837, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.0002474196500086836, + "loss": 0.02, "step": 135230 }, { - "epoch": 0.68, - "learning_rate": 0.00019765451967852438, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.0002474157617923122, + "loss": 0.0181, "step": 135240 }, { - "epoch": 0.68, - "learning_rate": 0.00019764695198551036, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.00024741187357594076, + "loss": 0.018, "step": 135250 }, { - "epoch": 0.68, - "learning_rate": 0.00019763938429249634, - "loss": 0.0205, + "epoch": 0.35, + "learning_rate": 0.0002474079853595693, + "loss": 0.0198, "step": 135260 }, { - "epoch": 0.68, - "learning_rate": 0.00019763181659948235, - "loss": 0.011, + "epoch": 0.35, + "learning_rate": 0.0002474040971431978, + "loss": 0.0225, "step": 135270 }, { - "epoch": 0.68, - "learning_rate": 0.00019762424890646833, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024740020892682636, + "loss": 0.0236, "step": 135280 }, { - "epoch": 0.68, - "learning_rate": 0.0001976166812134543, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.00024739632071045487, + "loss": 0.0175, "step": 135290 }, { - "epoch": 0.68, - "learning_rate": 0.00019760911352044032, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002473924324940834, + "loss": 0.0161, "step": 135300 }, { - "epoch": 0.68, - "learning_rate": 0.0001976015458274263, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.00024738854427771195, + "loss": 0.0263, "step": 135310 }, { - "epoch": 0.68, - "learning_rate": 0.00019759397813441228, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.00024738465606134047, + "loss": 0.0182, "step": 135320 }, { - "epoch": 0.68, - "learning_rate": 0.0001975864104413983, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024738076784496904, + "loss": 0.0192, "step": 135330 }, { - "epoch": 0.68, - "learning_rate": 0.00019757884274838427, - "loss": 0.0113, + "epoch": 0.35, + "learning_rate": 0.00024737687962859755, + "loss": 0.0229, "step": 135340 }, { - "epoch": 0.68, - "learning_rate": 0.00019757127505537025, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024737299141222607, + "loss": 0.0315, "step": 135350 }, { - "epoch": 0.68, - "learning_rate": 0.00019756370736235626, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.00024736910319585464, + "loss": 0.0268, "step": 135360 }, { - "epoch": 0.68, - "learning_rate": 0.00019755613966934224, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024736521497948315, + "loss": 0.0181, "step": 135370 }, { - "epoch": 0.68, - "learning_rate": 0.00019754857197632823, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024736132676311166, + "loss": 0.0164, "step": 135380 }, { - "epoch": 0.68, - "learning_rate": 0.0001975410042833142, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024735743854674023, + "loss": 0.0188, "step": 135390 }, { - "epoch": 0.68, - "learning_rate": 0.00019753343659030022, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.0002473535503303688, + "loss": 0.0198, "step": 135400 }, { - "epoch": 0.68, - "learning_rate": 0.0001975258688972862, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002473496621139973, + "loss": 0.0185, "step": 135410 }, { - "epoch": 0.68, - "learning_rate": 0.00019751830120427218, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.00024734577389762583, + "loss": 0.0196, "step": 135420 }, { - "epoch": 0.68, - "learning_rate": 0.0001975107335112582, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024734188568125435, + "loss": 0.02, "step": 135430 }, { - "epoch": 0.68, - "learning_rate": 0.00019750316581824417, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002473379974648829, + "loss": 0.0183, "step": 135440 }, { - "epoch": 0.68, - "learning_rate": 0.00019749559812523015, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024733410924851143, + "loss": 0.0273, "step": 135450 }, { - "epoch": 0.68, - "learning_rate": 0.00019748803043221616, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.00024733022103214, + "loss": 0.0256, "step": 135460 }, { - "epoch": 0.68, - "learning_rate": 0.00019748046273920214, - "loss": 0.0108, + "epoch": 0.35, + "learning_rate": 0.0002473263328157685, + "loss": 0.0197, "step": 135470 }, { - "epoch": 0.68, - "learning_rate": 0.00019747289504618812, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.000247322444599397, + "loss": 0.0219, "step": 135480 }, { - "epoch": 0.68, - "learning_rate": 0.00019746532735317413, - "loss": 0.0164, + "epoch": 0.35, + "learning_rate": 0.0002473185563830256, + "loss": 0.0232, "step": 135490 }, { - "epoch": 0.68, - "learning_rate": 0.0001974577596601601, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.0002473146681666541, + "loss": 0.0209, "step": 135500 }, { - "epoch": 0.68, - "learning_rate": 0.0001974501919671461, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002473107799502826, + "loss": 0.0222, "step": 135510 }, { - "epoch": 0.68, - "learning_rate": 0.0001974426242741321, - "loss": 0.0177, + "epoch": 0.35, + "learning_rate": 0.0002473068917339112, + "loss": 0.0227, "step": 135520 }, { - "epoch": 0.68, - "learning_rate": 0.00019743505658111808, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.0002473030035175397, + "loss": 0.0164, "step": 135530 }, { - "epoch": 0.68, - "learning_rate": 0.00019742748888810406, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002472991153011683, + "loss": 0.0259, "step": 135540 }, { - "epoch": 0.68, - "learning_rate": 0.00019741992119509005, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002472952270847968, + "loss": 0.0186, "step": 135550 }, { - "epoch": 0.68, - "learning_rate": 0.00019741235350207605, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002472913388684253, + "loss": 0.0185, "step": 135560 }, { - "epoch": 0.68, - "learning_rate": 0.00019740478580906204, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002472874506520539, + "loss": 0.0191, "step": 135570 }, { - "epoch": 0.68, - "learning_rate": 0.00019739721811604802, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.0002472835624356824, + "loss": 0.0192, "step": 135580 }, { - "epoch": 0.68, - "learning_rate": 0.00019738965042303403, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.0002472796742193109, + "loss": 0.0209, "step": 135590 }, { - "epoch": 0.68, - "learning_rate": 0.00019738208273002, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024727578600293947, + "loss": 0.0162, "step": 135600 }, { - "epoch": 0.68, - "learning_rate": 0.000197374515037006, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.00024727189778656804, + "loss": 0.0182, "step": 135610 }, { - "epoch": 0.68, - "learning_rate": 0.000197366947343992, - "loss": 0.0145, + "epoch": 0.35, + "learning_rate": 0.00024726800957019656, + "loss": 0.0189, "step": 135620 }, { - "epoch": 0.68, - "learning_rate": 0.00019735937965097798, - "loss": 0.0105, + "epoch": 0.35, + "learning_rate": 0.00024726412135382507, + "loss": 0.027, "step": 135630 }, { - "epoch": 0.68, - "learning_rate": 0.00019735181195796396, - "loss": 0.0102, + "epoch": 0.35, + "learning_rate": 0.0002472602331374536, + "loss": 0.0158, "step": 135640 }, { - "epoch": 0.68, - "learning_rate": 0.00019734424426494997, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.00024725634492108215, + "loss": 0.0216, "step": 135650 }, { - "epoch": 0.68, - "learning_rate": 0.00019733667657193595, - "loss": 0.0098, + "epoch": 0.35, + "learning_rate": 0.00024725245670471067, + "loss": 0.0161, "step": 135660 }, { - "epoch": 0.68, - "learning_rate": 0.00019732910887892193, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.00024724856848833924, + "loss": 0.023, "step": 135670 }, { - "epoch": 0.68, - "learning_rate": 0.00019732154118590794, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.00024724468027196775, + "loss": 0.0194, "step": 135680 }, { - "epoch": 0.68, - "learning_rate": 0.00019731397349289392, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.0002472407920555963, + "loss": 0.0152, "step": 135690 }, { - "epoch": 0.68, - "learning_rate": 0.0001973064057998799, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024723690383922483, + "loss": 0.0186, "step": 135700 }, { - "epoch": 0.68, - "learning_rate": 0.00019729883810686588, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.00024723301562285335, + "loss": 0.0247, "step": 135710 }, { - "epoch": 0.68, - "learning_rate": 0.0001972912704138519, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024722912740648186, + "loss": 0.0223, "step": 135720 }, { - "epoch": 0.68, - "learning_rate": 0.00019728370272083787, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024722523919011043, + "loss": 0.018, "step": 135730 }, { - "epoch": 0.68, - "learning_rate": 0.00019727613502782386, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.000247221350973739, + "loss": 0.019, "step": 135740 }, { - "epoch": 0.68, - "learning_rate": 0.00019726856733480986, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002472174627573675, + "loss": 0.0253, "step": 135750 }, { - "epoch": 0.68, - "learning_rate": 0.00019726099964179585, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024721357454099603, + "loss": 0.0202, "step": 135760 }, { - "epoch": 0.68, - "learning_rate": 0.00019725343194878183, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.00024720968632462454, + "loss": 0.0213, "step": 135770 }, { - "epoch": 0.69, - "learning_rate": 0.00019724586425576784, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.0002472057981082531, + "loss": 0.0212, "step": 135780 }, { - "epoch": 0.69, - "learning_rate": 0.00019723829656275382, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.00024720190989188163, + "loss": 0.0192, "step": 135790 }, { - "epoch": 0.69, - "learning_rate": 0.0001972307288697398, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002471980216755102, + "loss": 0.0169, "step": 135800 }, { - "epoch": 0.69, - "learning_rate": 0.0001972231611767258, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.0002471941334591387, + "loss": 0.0173, "step": 135810 }, { - "epoch": 0.69, - "learning_rate": 0.0001972155934837118, - "loss": 0.0104, + "epoch": 0.35, + "learning_rate": 0.0002471902452427673, + "loss": 0.0198, "step": 135820 }, { - "epoch": 0.69, - "learning_rate": 0.00019720802579069777, - "loss": 0.0129, + "epoch": 0.35, + "learning_rate": 0.0002471863570263958, + "loss": 0.0205, "step": 135830 }, { - "epoch": 0.69, - "learning_rate": 0.00019720045809768378, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.0002471824688100243, + "loss": 0.024, "step": 135840 }, { - "epoch": 0.69, - "learning_rate": 0.00019719289040466976, - "loss": 0.0154, + "epoch": 0.35, + "learning_rate": 0.0002471785805936528, + "loss": 0.0199, "step": 135850 }, { - "epoch": 0.69, - "learning_rate": 0.00019718532271165574, - "loss": 0.0106, + "epoch": 0.35, + "learning_rate": 0.0002471746923772814, + "loss": 0.0264, "step": 135860 }, { - "epoch": 0.69, - "learning_rate": 0.00019717775501864175, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002471708041609099, + "loss": 0.0166, "step": 135870 }, { - "epoch": 0.69, - "learning_rate": 0.00019717018732562773, - "loss": 0.0121, + "epoch": 0.35, + "learning_rate": 0.0002471669159445385, + "loss": 0.0195, "step": 135880 }, { - "epoch": 0.69, - "learning_rate": 0.0001971626196326137, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.000247163027728167, + "loss": 0.0234, "step": 135890 }, { - "epoch": 0.69, - "learning_rate": 0.0001971550519395997, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024715913951179556, + "loss": 0.0211, "step": 135900 }, { - "epoch": 0.69, - "learning_rate": 0.0001971474842465857, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002471552512954241, + "loss": 0.0157, "step": 135910 }, { - "epoch": 0.69, - "learning_rate": 0.00019713991655357168, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.0002471513630790526, + "loss": 0.0195, "step": 135920 }, { - "epoch": 0.69, - "learning_rate": 0.00019713234886055767, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002471474748626811, + "loss": 0.022, "step": 135930 }, { - "epoch": 0.69, - "learning_rate": 0.00019712478116754367, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024714358664630967, + "loss": 0.0199, "step": 135940 }, { - "epoch": 0.69, - "learning_rate": 0.00019711721347452966, - "loss": 0.0143, + "epoch": 0.35, + "learning_rate": 0.00024713969842993824, + "loss": 0.0205, "step": 135950 }, { - "epoch": 0.69, - "learning_rate": 0.00019710964578151564, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.00024713581021356675, + "loss": 0.0183, "step": 135960 }, { - "epoch": 0.69, - "learning_rate": 0.00019710207808850165, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.00024713192199719527, + "loss": 0.0178, "step": 135970 }, { - "epoch": 0.69, - "learning_rate": 0.00019709451039548763, - "loss": 0.0162, + "epoch": 0.35, + "learning_rate": 0.0002471280337808238, + "loss": 0.0184, "step": 135980 }, { - "epoch": 0.69, - "learning_rate": 0.0001970869427024736, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.00024712414556445235, + "loss": 0.0195, "step": 135990 }, { - "epoch": 0.69, - "learning_rate": 0.00019707937500945962, - "loss": 0.0106, + "epoch": 0.35, + "learning_rate": 0.00024712025734808087, + "loss": 0.0224, "step": 136000 }, { - "epoch": 0.69, - "eval_cer": 0.9144586111496574, - "eval_loss": 0.009702920913696289, - "eval_runtime": 116.6777, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.35, + "eval_cer": 0.8818034601824287, + "eval_loss": 0.013970781117677689, + "eval_runtime": 107.2477, + "eval_samples_per_second": 18.648, + "eval_steps_per_second": 4.662, "step": 136000 }, { - "epoch": 0.69, - "learning_rate": 0.0001970718073164456, - "loss": 0.0132, + "epoch": 0.35, + "learning_rate": 0.00024711636913170944, + "loss": 0.0188, "step": 136010 }, { - "epoch": 0.69, - "learning_rate": 0.00019706423962343158, - "loss": 0.011, + "epoch": 0.35, + "learning_rate": 0.00024711248091533795, + "loss": 0.021, "step": 136020 }, { - "epoch": 0.69, - "learning_rate": 0.0001970566719304176, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.0002471085926989665, + "loss": 0.0186, "step": 136030 }, { - "epoch": 0.69, - "learning_rate": 0.00019704910423740357, - "loss": 0.017, + "epoch": 0.35, + "learning_rate": 0.00024710470448259503, + "loss": 0.0191, "step": 136040 }, { - "epoch": 0.69, - "learning_rate": 0.00019704153654438955, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024710081626622355, + "loss": 0.0254, "step": 136050 }, { - "epoch": 0.69, - "learning_rate": 0.00019703396885137553, - "loss": 0.0156, + "epoch": 0.35, + "learning_rate": 0.00024709692804985206, + "loss": 0.0232, "step": 136060 }, { - "epoch": 0.69, - "learning_rate": 0.00019702640115836154, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.00024709303983348063, + "loss": 0.0216, "step": 136070 }, { - "epoch": 0.69, - "learning_rate": 0.00019701883346534752, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024708915161710915, + "loss": 0.0212, "step": 136080 }, { - "epoch": 0.69, - "learning_rate": 0.0001970112657723335, - "loss": 0.0161, + "epoch": 0.35, + "learning_rate": 0.0002470852634007377, + "loss": 0.0164, "step": 136090 }, { - "epoch": 0.69, - "learning_rate": 0.0001970036980793195, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024708137518436623, + "loss": 0.0183, "step": 136100 }, { - "epoch": 0.69, - "learning_rate": 0.0001969961303863055, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470774869679948, + "loss": 0.0187, "step": 136110 }, { - "epoch": 0.69, - "learning_rate": 0.00019698856269329148, - "loss": 0.0146, + "epoch": 0.35, + "learning_rate": 0.0002470735987516233, + "loss": 0.0187, "step": 136120 }, { - "epoch": 0.69, - "learning_rate": 0.00019698099500027748, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470697105352518, + "loss": 0.0157, "step": 136130 }, { - "epoch": 0.69, - "learning_rate": 0.00019697342730726347, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470658223188804, + "loss": 0.0174, "step": 136140 }, { - "epoch": 0.69, - "learning_rate": 0.00019696585961424945, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.0002470619341025089, + "loss": 0.0138, "step": 136150 }, { - "epoch": 0.69, - "learning_rate": 0.00019695829192123546, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470580458861375, + "loss": 0.0188, "step": 136160 }, { - "epoch": 0.69, - "learning_rate": 0.00019695072422822144, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.000247054157669766, + "loss": 0.0201, "step": 136170 }, { - "epoch": 0.69, - "learning_rate": 0.00019694315653520742, - "loss": 0.0131, + "epoch": 0.35, + "learning_rate": 0.0002470502694533945, + "loss": 0.017, "step": 136180 }, { - "epoch": 0.69, - "learning_rate": 0.00019693558884219343, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002470463812370231, + "loss": 0.0185, "step": 136190 }, { - "epoch": 0.69, - "learning_rate": 0.0001969280211491794, - "loss": 0.0163, + "epoch": 0.35, + "learning_rate": 0.0002470424930206516, + "loss": 0.0238, "step": 136200 }, { - "epoch": 0.69, - "learning_rate": 0.0001969204534561654, - "loss": 0.0133, + "epoch": 0.35, + "learning_rate": 0.0002470386048042801, + "loss": 0.0228, "step": 136210 }, { - "epoch": 0.69, - "learning_rate": 0.00019691288576315137, - "loss": 0.0157, + "epoch": 0.35, + "learning_rate": 0.0002470347165879087, + "loss": 0.0263, "step": 136220 }, { - "epoch": 0.69, - "learning_rate": 0.00019690531807013738, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002470308283715372, + "loss": 0.0205, "step": 136230 }, { - "epoch": 0.69, - "learning_rate": 0.00019689775037712336, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024702694015516576, + "loss": 0.0233, "step": 136240 }, { - "epoch": 0.69, - "learning_rate": 0.00019689018268410934, - "loss": 0.0109, + "epoch": 0.35, + "learning_rate": 0.00024702305193879427, + "loss": 0.018, "step": 136250 }, { - "epoch": 0.69, - "learning_rate": 0.00019688261499109535, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002470191637224228, + "loss": 0.0175, "step": 136260 }, { - "epoch": 0.69, - "learning_rate": 0.00019687504729808133, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.0002470152755060513, + "loss": 0.0227, "step": 136270 }, { - "epoch": 0.69, - "learning_rate": 0.00019686747960506731, - "loss": 0.0179, + "epoch": 0.35, + "learning_rate": 0.00024701138728967987, + "loss": 0.0217, "step": 136280 }, { - "epoch": 0.69, - "learning_rate": 0.00019685991191205332, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.00024700749907330844, + "loss": 0.0188, "step": 136290 }, { - "epoch": 0.69, - "learning_rate": 0.0001968523442190393, - "loss": 0.0116, + "epoch": 0.35, + "learning_rate": 0.00024700361085693695, + "loss": 0.0199, "step": 136300 }, { - "epoch": 0.69, - "learning_rate": 0.00019684477652602529, - "loss": 0.0128, + "epoch": 0.35, + "learning_rate": 0.00024699972264056547, + "loss": 0.0264, "step": 136310 }, { - "epoch": 0.69, - "learning_rate": 0.0001968372088330113, - "loss": 0.0176, + "epoch": 0.35, + "learning_rate": 0.00024699583442419404, + "loss": 0.0186, "step": 136320 }, { - "epoch": 0.69, - "learning_rate": 0.00019682964113999728, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.00024699194620782255, + "loss": 0.0209, "step": 136330 }, { - "epoch": 0.69, - "learning_rate": 0.00019682207344698326, - "loss": 0.0114, + "epoch": 0.35, + "learning_rate": 0.00024698805799145107, + "loss": 0.0217, "step": 136340 }, { - "epoch": 0.69, - "learning_rate": 0.00019681450575396927, - "loss": 0.014, + "epoch": 0.35, + "learning_rate": 0.00024698416977507963, + "loss": 0.0215, "step": 136350 }, { - "epoch": 0.69, - "learning_rate": 0.00019680693806095525, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.00024698028155870815, + "loss": 0.0181, "step": 136360 }, { - "epoch": 0.69, - "learning_rate": 0.00019679937036794123, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002469763933423367, + "loss": 0.0204, "step": 136370 }, { - "epoch": 0.69, - "learning_rate": 0.00019679180267492718, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.00024697250512596523, + "loss": 0.0192, "step": 136380 }, { - "epoch": 0.69, - "learning_rate": 0.0001967842349819132, - "loss": 0.011, + "epoch": 0.35, + "learning_rate": 0.00024696861690959375, + "loss": 0.0202, "step": 136390 }, { - "epoch": 0.69, - "learning_rate": 0.00019677666728889917, - "loss": 0.0117, + "epoch": 0.35, + "learning_rate": 0.0002469647286932223, + "loss": 0.0198, "step": 136400 }, { - "epoch": 0.69, - "learning_rate": 0.00019676909959588515, - "loss": 0.0144, + "epoch": 0.35, + "learning_rate": 0.00024696084047685083, + "loss": 0.021, "step": 136410 }, { - "epoch": 0.69, - "learning_rate": 0.00019676153190287116, - "loss": 0.0189, + "epoch": 0.35, + "learning_rate": 0.00024695695226047934, + "loss": 0.0192, "step": 136420 }, { - "epoch": 0.69, - "learning_rate": 0.00019675396420985714, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002469530640441079, + "loss": 0.02, "step": 136430 }, { - "epoch": 0.69, - "learning_rate": 0.00019674639651684313, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002469491758277365, + "loss": 0.0186, "step": 136440 }, { - "epoch": 0.69, - "learning_rate": 0.0001967388288238291, - "loss": 0.0118, + "epoch": 0.35, + "learning_rate": 0.000246945287611365, + "loss": 0.0255, "step": 136450 }, { - "epoch": 0.69, - "learning_rate": 0.00019673126113081512, - "loss": 0.0119, + "epoch": 0.35, + "learning_rate": 0.0002469413993949935, + "loss": 0.0192, "step": 136460 }, { - "epoch": 0.69, - "learning_rate": 0.0001967236934378011, - "loss": 0.0147, + "epoch": 0.35, + "learning_rate": 0.000246937511178622, + "loss": 0.0191, "step": 136470 }, { - "epoch": 0.69, - "learning_rate": 0.00019671612574478708, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.00024693362296225054, + "loss": 0.0182, "step": 136480 }, { - "epoch": 0.69, - "learning_rate": 0.0001967085580517731, - "loss": 0.012, + "epoch": 0.35, + "learning_rate": 0.0002469297347458791, + "loss": 0.0209, "step": 136490 }, { - "epoch": 0.69, - "learning_rate": 0.00019670099035875907, - "loss": 0.0116, + "epoch": 0.35, + "learning_rate": 0.0002469258465295077, + "loss": 0.0217, "step": 136500 }, { - "epoch": 0.69, - "learning_rate": 0.00019669342266574505, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.0002469219583131362, + "loss": 0.022, "step": 136510 }, { - "epoch": 0.69, - "learning_rate": 0.00019668585497273106, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.0002469180700967647, + "loss": 0.021, "step": 136520 }, { - "epoch": 0.69, - "learning_rate": 0.00019667828727971704, - "loss": 0.0134, + "epoch": 0.35, + "learning_rate": 0.0002469141818803933, + "loss": 0.0167, "step": 136530 }, { - "epoch": 0.69, - "learning_rate": 0.00019667071958670302, - "loss": 0.0137, + "epoch": 0.35, + "learning_rate": 0.0002469102936640218, + "loss": 0.0191, "step": 136540 }, { - "epoch": 0.69, - "learning_rate": 0.00019666315189368903, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.0002469064054476503, + "loss": 0.021, "step": 136550 }, { - "epoch": 0.69, - "learning_rate": 0.000196655584200675, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.0002469025172312789, + "loss": 0.022, "step": 136560 }, { - "epoch": 0.69, - "learning_rate": 0.000196648016507661, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002468986290149074, + "loss": 0.0214, "step": 136570 }, { - "epoch": 0.69, - "learning_rate": 0.000196640448814647, - "loss": 0.0112, + "epoch": 0.35, + "learning_rate": 0.00024689474079853596, + "loss": 0.0209, "step": 136580 }, { - "epoch": 0.69, - "learning_rate": 0.00019663288112163298, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.00024689085258216447, + "loss": 0.0171, "step": 136590 }, { - "epoch": 0.69, - "learning_rate": 0.00019662531342861896, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.000246886964365793, + "loss": 0.0187, "step": 136600 }, { - "epoch": 0.69, - "learning_rate": 0.00019661774573560495, - "loss": 0.0127, + "epoch": 0.35, + "learning_rate": 0.00024688307614942155, + "loss": 0.0168, "step": 136610 }, { - "epoch": 0.69, - "learning_rate": 0.00019661017804259095, - "loss": 0.01, + "epoch": 0.35, + "learning_rate": 0.00024687918793305007, + "loss": 0.0266, "step": 136620 }, { - "epoch": 0.69, - "learning_rate": 0.00019660261034957694, - "loss": 0.0118, + "epoch": 0.35, + "learning_rate": 0.0002468752997166786, + "loss": 0.0191, "step": 136630 }, { - "epoch": 0.69, - "learning_rate": 0.00019659504265656292, - "loss": 0.0179, + "epoch": 0.35, + "learning_rate": 0.00024687141150030715, + "loss": 0.0212, "step": 136640 }, { - "epoch": 0.69, - "learning_rate": 0.00019658747496354893, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.0002468675232839357, + "loss": 0.0217, "step": 136650 }, { - "epoch": 0.69, - "learning_rate": 0.0001965799072705349, - "loss": 0.0122, + "epoch": 0.35, + "learning_rate": 0.00024686363506756424, + "loss": 0.0259, "step": 136660 }, { - "epoch": 0.69, - "learning_rate": 0.0001965723395775209, - "loss": 0.0123, + "epoch": 0.35, + "learning_rate": 0.00024685974685119275, + "loss": 0.0219, "step": 136670 }, { - "epoch": 0.69, - "learning_rate": 0.0001965647718845069, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.00024685585863482126, + "loss": 0.0205, "step": 136680 }, { - "epoch": 0.69, - "learning_rate": 0.00019655720419149288, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.00024685197041844983, + "loss": 0.0196, "step": 136690 }, { - "epoch": 0.69, - "learning_rate": 0.00019654963649847886, - "loss": 0.0124, + "epoch": 0.35, + "learning_rate": 0.00024684808220207835, + "loss": 0.019, "step": 136700 }, { - "epoch": 0.69, - "learning_rate": 0.00019654206880546487, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.0002468441939857069, + "loss": 0.0249, "step": 136710 }, { - "epoch": 0.69, - "learning_rate": 0.00019653450111245085, - "loss": 0.0141, + "epoch": 0.35, + "learning_rate": 0.00024684030576933543, + "loss": 0.0221, "step": 136720 }, { - "epoch": 0.69, - "learning_rate": 0.00019652693341943683, - "loss": 0.0182, + "epoch": 0.35, + "learning_rate": 0.00024683641755296395, + "loss": 0.0183, "step": 136730 }, { - "epoch": 0.69, - "learning_rate": 0.00019651936572642284, - "loss": 0.0153, + "epoch": 0.35, + "learning_rate": 0.0002468325293365925, + "loss": 0.0235, "step": 136740 }, { - "epoch": 0.69, - "learning_rate": 0.00019651179803340882, - "loss": 0.0119, + "epoch": 0.35, + "learning_rate": 0.00024682864112022103, + "loss": 0.0176, "step": 136750 }, { - "epoch": 0.69, - "learning_rate": 0.0001965042303403948, - "loss": 0.0148, + "epoch": 0.35, + "learning_rate": 0.00024682475290384954, + "loss": 0.0196, "step": 136760 }, { - "epoch": 0.69, - "learning_rate": 0.0001964966626473808, - "loss": 0.0092, + "epoch": 0.35, + "learning_rate": 0.0002468208646874781, + "loss": 0.023, "step": 136770 }, { - "epoch": 0.69, - "learning_rate": 0.0001964890949543668, - "loss": 0.0151, + "epoch": 0.35, + "learning_rate": 0.0002468169764711066, + "loss": 0.0164, "step": 136780 }, { - "epoch": 0.69, - "learning_rate": 0.00019648152726135277, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.0002468130882547352, + "loss": 0.0252, "step": 136790 }, { - "epoch": 0.69, - "learning_rate": 0.00019647395956833876, - "loss": 0.0186, + "epoch": 0.35, + "learning_rate": 0.0002468092000383637, + "loss": 0.0229, "step": 136800 }, { - "epoch": 0.69, - "learning_rate": 0.00019646639187532476, - "loss": 0.015, + "epoch": 0.35, + "learning_rate": 0.0002468053118219922, + "loss": 0.0198, "step": 136810 }, { - "epoch": 0.69, - "learning_rate": 0.00019645882418231075, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002468014236056208, + "loss": 0.0225, "step": 136820 }, { - "epoch": 0.69, - "learning_rate": 0.00019645125648929673, - "loss": 0.013, + "epoch": 0.35, + "learning_rate": 0.0002467975353892493, + "loss": 0.0171, "step": 136830 }, { - "epoch": 0.69, - "learning_rate": 0.00019644368879628274, - "loss": 0.0142, + "epoch": 0.35, + "learning_rate": 0.0002467936471728779, + "loss": 0.0171, "step": 136840 }, { - "epoch": 0.69, - "learning_rate": 0.00019643612110326872, - "loss": 0.0135, + "epoch": 0.35, + "learning_rate": 0.0002467897589565064, + "loss": 0.0238, "step": 136850 }, { - "epoch": 0.69, - "learning_rate": 0.0001964285534102547, - "loss": 0.0171, + "epoch": 0.35, + "learning_rate": 0.00024678587074013496, + "loss": 0.0194, "step": 136860 }, { - "epoch": 0.69, - "learning_rate": 0.0001964209857172407, - "loss": 0.0136, + "epoch": 0.35, + "learning_rate": 0.0002467819825237635, + "loss": 0.0233, "step": 136870 }, { - "epoch": 0.69, - "learning_rate": 0.0001964134180242267, - "loss": 0.0126, + "epoch": 0.35, + "learning_rate": 0.000246778094307392, + "loss": 0.0209, "step": 136880 }, { - "epoch": 0.69, - "learning_rate": 0.00019640585033121267, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.0002467742060910205, + "loss": 0.0178, "step": 136890 }, { - "epoch": 0.69, - "learning_rate": 0.00019639828263819868, - "loss": 0.0149, + "epoch": 0.35, + "learning_rate": 0.00024677031787464907, + "loss": 0.0235, "step": 136900 }, { - "epoch": 0.69, - "learning_rate": 0.00019639071494518466, - "loss": 0.0183, + "epoch": 0.35, + "learning_rate": 0.0002467664296582776, + "loss": 0.0217, "step": 136910 }, { - "epoch": 0.69, - "learning_rate": 0.00019638314725217064, - "loss": 0.0138, + "epoch": 0.35, + "learning_rate": 0.00024676254144190616, + "loss": 0.0262, "step": 136920 }, { - "epoch": 0.69, - "learning_rate": 0.00019637557955915665, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024675865322553467, + "loss": 0.0199, "step": 136930 }, { - "epoch": 0.69, - "learning_rate": 0.00019636801186614263, - "loss": 0.0111, + "epoch": 0.35, + "learning_rate": 0.00024675476500916324, + "loss": 0.017, "step": 136940 }, { - "epoch": 0.69, - "learning_rate": 0.0001963604441731286, - "loss": 0.0159, + "epoch": 0.35, + "learning_rate": 0.00024675087679279175, + "loss": 0.0197, "step": 136950 }, { - "epoch": 0.69, - "learning_rate": 0.0001963528764801146, - "loss": 0.0109, + "epoch": 0.36, + "learning_rate": 0.00024674698857642027, + "loss": 0.0187, "step": 136960 }, { - "epoch": 0.69, - "learning_rate": 0.0001963453087871006, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.0002467431003600488, + "loss": 0.0239, "step": 136970 }, { - "epoch": 0.69, - "learning_rate": 0.00019633774109408658, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.00024673921214367735, + "loss": 0.025, "step": 136980 }, { - "epoch": 0.69, - "learning_rate": 0.00019633017340107257, - "loss": 0.011, + "epoch": 0.36, + "learning_rate": 0.0002467353239273059, + "loss": 0.0183, "step": 136990 }, { - "epoch": 0.69, - "learning_rate": 0.00019632260570805857, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024673143571093443, + "loss": 0.0171, "step": 137000 }, { - "epoch": 0.69, - "eval_cer": 0.914462492734159, - "eval_loss": 0.009697197005152702, - "eval_runtime": 116.8588, - "eval_samples_per_second": 17.115, - "eval_steps_per_second": 4.279, + "epoch": 0.36, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.014788404107093811, + "eval_runtime": 107.1104, + "eval_samples_per_second": 18.672, + "eval_steps_per_second": 4.668, "step": 137000 }, { - "epoch": 0.69, - "learning_rate": 0.00019631503801504456, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024672754749456295, + "loss": 0.0182, "step": 137010 }, { - "epoch": 0.69, - "learning_rate": 0.00019630747032203054, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024672365927819146, + "loss": 0.0249, "step": 137020 }, { - "epoch": 0.69, - "learning_rate": 0.00019629990262901655, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024671977106182003, + "loss": 0.0182, "step": 137030 }, { - "epoch": 0.69, - "learning_rate": 0.00019629233493600253, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024671588284544855, + "loss": 0.0198, "step": 137040 }, { - "epoch": 0.69, - "learning_rate": 0.0001962847672429885, - "loss": 0.0112, + "epoch": 0.36, + "learning_rate": 0.0002467119946290771, + "loss": 0.019, "step": 137050 }, { - "epoch": 0.69, - "learning_rate": 0.00019627719954997452, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024670810641270563, + "loss": 0.0227, "step": 137060 }, { - "epoch": 0.69, - "learning_rate": 0.0001962696318569605, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.0002467042181963342, + "loss": 0.0217, "step": 137070 }, { - "epoch": 0.69, - "learning_rate": 0.00019626206416394648, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002467003299799627, + "loss": 0.0237, "step": 137080 }, { - "epoch": 0.69, - "learning_rate": 0.0001962544964709325, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024669644176359123, + "loss": 0.0211, "step": 137090 }, { - "epoch": 0.69, - "learning_rate": 0.00019624692877791847, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024669255354721974, + "loss": 0.0221, "step": 137100 }, { - "epoch": 0.69, - "learning_rate": 0.00019623936108490445, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.0002466886653308483, + "loss": 0.0206, "step": 137110 }, { - "epoch": 0.69, - "learning_rate": 0.00019623179339189043, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002466847771144768, + "loss": 0.0215, "step": 137120 }, { - "epoch": 0.69, - "learning_rate": 0.00019622422569887644, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002466808888981054, + "loss": 0.0209, "step": 137130 }, { - "epoch": 0.69, - "learning_rate": 0.00019621665800586242, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.0002466770006817339, + "loss": 0.0268, "step": 137140 }, { - "epoch": 0.69, - "learning_rate": 0.0001962090903128484, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002466731124653625, + "loss": 0.0247, "step": 137150 }, { - "epoch": 0.69, - "learning_rate": 0.0001962015226198344, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.000246669224248991, + "loss": 0.02, "step": 137160 }, { - "epoch": 0.69, - "learning_rate": 0.0001961939549268204, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002466653360326195, + "loss": 0.0155, "step": 137170 }, { - "epoch": 0.69, - "learning_rate": 0.00019618638723380638, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.000246661447816248, + "loss": 0.0213, "step": 137180 }, { - "epoch": 0.69, - "learning_rate": 0.00019617881954079238, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.0002466575595998766, + "loss": 0.0186, "step": 137190 }, { - "epoch": 0.69, - "learning_rate": 0.00019617125184777837, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.00024665367138350516, + "loss": 0.0199, "step": 137200 }, { - "epoch": 0.69, - "learning_rate": 0.00019616368415476435, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.00024664978316713367, + "loss": 0.0165, "step": 137210 }, { - "epoch": 0.69, - "learning_rate": 0.00019615611646175036, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.0002466458949507622, + "loss": 0.0223, "step": 137220 }, { - "epoch": 0.69, - "learning_rate": 0.00019614854876873634, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.0002466420067343907, + "loss": 0.0173, "step": 137230 }, { - "epoch": 0.69, - "learning_rate": 0.00019614098107572232, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024663811851801927, + "loss": 0.022, "step": 137240 }, { - "epoch": 0.69, - "learning_rate": 0.00019613341338270833, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.0002466342303016478, + "loss": 0.0213, "step": 137250 }, { - "epoch": 0.69, - "learning_rate": 0.0001961258456896943, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.00024663034208527635, + "loss": 0.0254, "step": 137260 }, { - "epoch": 0.69, - "learning_rate": 0.0001961182779966803, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024662645386890487, + "loss": 0.0207, "step": 137270 }, { - "epoch": 0.69, - "learning_rate": 0.00019611071030366627, - "loss": 0.0175, + "epoch": 0.36, + "learning_rate": 0.00024662256565253344, + "loss": 0.022, "step": 137280 }, { - "epoch": 0.69, - "learning_rate": 0.00019610314261065228, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.00024661867743616195, + "loss": 0.0177, "step": 137290 }, { - "epoch": 0.69, - "learning_rate": 0.00019609557491763826, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.00024661478921979047, + "loss": 0.0208, "step": 137300 }, { - "epoch": 0.69, - "learning_rate": 0.00019608800722462424, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.000246610901003419, + "loss": 0.02, "step": 137310 }, { - "epoch": 0.69, - "learning_rate": 0.00019608043953161025, - "loss": 0.0112, + "epoch": 0.36, + "learning_rate": 0.00024660701278704755, + "loss": 0.0202, "step": 137320 }, { - "epoch": 0.69, - "learning_rate": 0.00019607287183859623, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.0002466031245706761, + "loss": 0.0242, "step": 137330 }, { - "epoch": 0.69, - "learning_rate": 0.00019606530414558221, - "loss": 0.0155, + "epoch": 0.36, + "learning_rate": 0.00024659923635430463, + "loss": 0.0181, "step": 137340 }, { - "epoch": 0.69, - "learning_rate": 0.00019605773645256822, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024659534813793315, + "loss": 0.0177, "step": 137350 }, { - "epoch": 0.69, - "learning_rate": 0.0001960501687595542, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002465914599215617, + "loss": 0.0194, "step": 137360 }, { - "epoch": 0.69, - "learning_rate": 0.00019604260106654019, - "loss": 0.011, + "epoch": 0.36, + "learning_rate": 0.00024658757170519023, + "loss": 0.0221, "step": 137370 }, { - "epoch": 0.69, - "learning_rate": 0.0001960350333735262, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024658368348881875, + "loss": 0.0188, "step": 137380 }, { - "epoch": 0.69, - "learning_rate": 0.00019602746568051218, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002465797952724473, + "loss": 0.0175, "step": 137390 }, { - "epoch": 0.69, - "learning_rate": 0.00019601989798749816, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024657590705607583, + "loss": 0.016, "step": 137400 }, { - "epoch": 0.69, - "learning_rate": 0.00019601233029448417, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.0002465720188397044, + "loss": 0.0196, "step": 137410 }, { - "epoch": 0.69, - "learning_rate": 0.00019600476260147015, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.0002465681306233329, + "loss": 0.0167, "step": 137420 }, { - "epoch": 0.69, - "learning_rate": 0.00019599719490845613, - "loss": 0.0148, + "epoch": 0.36, + "learning_rate": 0.0002465642424069614, + "loss": 0.0236, "step": 137430 }, { - "epoch": 0.69, - "learning_rate": 0.00019598962721544214, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.00024656035419059, + "loss": 0.0182, "step": 137440 }, { - "epoch": 0.69, - "learning_rate": 0.00019598205952242812, - "loss": 0.0148, + "epoch": 0.36, + "learning_rate": 0.0002465564659742185, + "loss": 0.0177, "step": 137450 }, { - "epoch": 0.69, - "learning_rate": 0.0001959744918294141, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.000246552577757847, + "loss": 0.0224, "step": 137460 }, { - "epoch": 0.69, - "learning_rate": 0.00019596692413640008, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002465486895414756, + "loss": 0.0223, "step": 137470 }, { - "epoch": 0.69, - "learning_rate": 0.0001959593564433861, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002465448013251041, + "loss": 0.0168, "step": 137480 }, { - "epoch": 0.69, - "learning_rate": 0.00019595178875037207, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.0002465409131087327, + "loss": 0.0205, "step": 137490 }, { - "epoch": 0.69, - "learning_rate": 0.00019594422105735805, - "loss": 0.0161, + "epoch": 0.36, + "learning_rate": 0.0002465370248923612, + "loss": 0.0188, "step": 137500 }, { - "epoch": 0.69, - "learning_rate": 0.00019593665336434406, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.0002465331366759897, + "loss": 0.0169, "step": 137510 }, { - "epoch": 0.69, - "learning_rate": 0.00019592908567133004, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002465292484596182, + "loss": 0.0165, "step": 137520 }, { - "epoch": 0.69, - "learning_rate": 0.00019592151797831602, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.0002465253602432468, + "loss": 0.0172, "step": 137530 }, { - "epoch": 0.69, - "learning_rate": 0.00019591395028530203, - "loss": 0.0099, + "epoch": 0.36, + "learning_rate": 0.00024652147202687536, + "loss": 0.0214, "step": 137540 }, { - "epoch": 0.69, - "learning_rate": 0.00019590638259228801, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.00024651758381050387, + "loss": 0.0186, "step": 137550 }, { - "epoch": 0.69, - "learning_rate": 0.000195898814899274, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.0002465136955941324, + "loss": 0.0241, "step": 137560 }, { - "epoch": 0.69, - "learning_rate": 0.00019589124720626, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024650980737776095, + "loss": 0.0189, "step": 137570 }, { - "epoch": 0.69, - "learning_rate": 0.00019588367951324599, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024650591916138947, + "loss": 0.0223, "step": 137580 }, { - "epoch": 0.69, - "learning_rate": 0.00019587611182023197, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.000246502030945018, + "loss": 0.0218, "step": 137590 }, { - "epoch": 0.69, - "learning_rate": 0.00019586854412721798, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.00024649814272864655, + "loss": 0.0206, "step": 137600 }, { - "epoch": 0.69, - "learning_rate": 0.00019586097643420396, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024649425451227507, + "loss": 0.0172, "step": 137610 }, { - "epoch": 0.69, - "learning_rate": 0.00019585340874118994, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.00024649036629590364, + "loss": 0.0308, "step": 137620 }, { - "epoch": 0.69, - "learning_rate": 0.0001958458410481759, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024648647807953215, + "loss": 0.0273, "step": 137630 }, { - "epoch": 0.69, - "learning_rate": 0.0001958382733551619, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.00024648258986316067, + "loss": 0.0213, "step": 137640 }, { - "epoch": 0.69, - "learning_rate": 0.00019583070566214788, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.00024647870164678923, + "loss": 0.0264, "step": 137650 }, { - "epoch": 0.69, - "learning_rate": 0.00019582313796913386, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.00024647481343041775, + "loss": 0.017, "step": 137660 }, { - "epoch": 0.69, - "learning_rate": 0.00019581557027611985, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.00024647092521404626, + "loss": 0.0193, "step": 137670 }, { - "epoch": 0.69, - "learning_rate": 0.00019580800258310585, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.00024646703699767483, + "loss": 0.0182, "step": 137680 }, { - "epoch": 0.69, - "learning_rate": 0.00019580043489009184, - "loss": 0.0167, + "epoch": 0.36, + "learning_rate": 0.0002464631487813034, + "loss": 0.02, "step": 137690 }, { - "epoch": 0.69, - "learning_rate": 0.00019579286719707782, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.0002464592605649319, + "loss": 0.0187, "step": 137700 }, { - "epoch": 0.69, - "learning_rate": 0.00019578529950406383, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024645537234856043, + "loss": 0.0213, "step": 137710 }, { - "epoch": 0.69, - "learning_rate": 0.0001957777318110498, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024645148413218894, + "loss": 0.0213, "step": 137720 }, { - "epoch": 0.69, - "learning_rate": 0.0001957701641180358, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002464475959158175, + "loss": 0.0195, "step": 137730 }, { - "epoch": 0.69, - "learning_rate": 0.0001957625964250218, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.00024644370769944603, + "loss": 0.0218, "step": 137740 }, { - "epoch": 0.69, - "learning_rate": 0.00019575502873200778, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.0002464398194830746, + "loss": 0.0196, "step": 137750 }, { - "epoch": 0.7, - "learning_rate": 0.00019574746103899376, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002464359312667031, + "loss": 0.0201, "step": 137760 }, { - "epoch": 0.7, - "learning_rate": 0.00019573989334597977, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002464320430503316, + "loss": 0.0206, "step": 137770 }, { - "epoch": 0.7, - "learning_rate": 0.00019573232565296575, - "loss": 0.0156, + "epoch": 0.36, + "learning_rate": 0.0002464281548339602, + "loss": 0.0198, "step": 137780 }, { - "epoch": 0.7, - "learning_rate": 0.00019572475795995173, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.0002464242666175887, + "loss": 0.0235, "step": 137790 }, { - "epoch": 0.7, - "learning_rate": 0.00019571719026693774, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002464203784012172, + "loss": 0.0202, "step": 137800 }, { - "epoch": 0.7, - "learning_rate": 0.00019570962257392372, - "loss": 0.0113, + "epoch": 0.36, + "learning_rate": 0.0002464164901848458, + "loss": 0.0227, "step": 137810 }, { - "epoch": 0.7, - "learning_rate": 0.0001957020548809097, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.0002464126019684743, + "loss": 0.021, "step": 137820 }, { - "epoch": 0.7, - "learning_rate": 0.0001956944871878957, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002464087137521029, + "loss": 0.0181, "step": 137830 }, { - "epoch": 0.7, - "learning_rate": 0.0001956869194948817, - "loss": 0.0109, + "epoch": 0.36, + "learning_rate": 0.0002464048255357314, + "loss": 0.016, "step": 137840 }, { - "epoch": 0.7, - "learning_rate": 0.00019567935180186767, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002464009373193599, + "loss": 0.0288, "step": 137850 }, { - "epoch": 0.7, - "learning_rate": 0.00019567178410885366, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.00024639704910298847, + "loss": 0.0218, "step": 137860 }, { - "epoch": 0.7, - "learning_rate": 0.00019566421641583966, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.000246393160886617, + "loss": 0.0156, "step": 137870 }, { - "epoch": 0.7, - "learning_rate": 0.00019565664872282565, - "loss": 0.0167, + "epoch": 0.36, + "learning_rate": 0.00024638927267024556, + "loss": 0.0209, "step": 137880 }, { - "epoch": 0.7, - "learning_rate": 0.00019564908102981163, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.00024638538445387407, + "loss": 0.0216, "step": 137890 }, { - "epoch": 0.7, - "learning_rate": 0.00019564151333679764, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024638149623750264, + "loss": 0.0212, "step": 137900 }, { - "epoch": 0.7, - "learning_rate": 0.00019563394564378362, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024637760802113115, + "loss": 0.0215, "step": 137910 }, { - "epoch": 0.7, - "learning_rate": 0.0001956263779507696, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024637371980475967, + "loss": 0.0198, "step": 137920 }, { - "epoch": 0.7, - "learning_rate": 0.0001956188102577556, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.0002463698315883882, + "loss": 0.0178, "step": 137930 }, { - "epoch": 0.7, - "learning_rate": 0.0001956112425647416, - "loss": 0.0113, + "epoch": 0.36, + "learning_rate": 0.00024636594337201675, + "loss": 0.021, "step": 137940 }, { - "epoch": 0.7, - "learning_rate": 0.00019560367487172757, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.00024636205515564527, + "loss": 0.017, "step": 137950 }, { - "epoch": 0.7, - "learning_rate": 0.00019559610717871358, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.00024635816693927383, + "loss": 0.0229, "step": 137960 }, { - "epoch": 0.7, - "learning_rate": 0.00019558853948569956, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024635427872290235, + "loss": 0.0217, "step": 137970 }, { - "epoch": 0.7, - "learning_rate": 0.00019558097179268554, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.00024635039050653086, + "loss": 0.0227, "step": 137980 }, { - "epoch": 0.7, - "learning_rate": 0.00019557340409967155, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024634650229015943, + "loss": 0.0214, "step": 137990 }, { - "epoch": 0.7, - "learning_rate": 0.00019556583640665753, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.00024634261407378795, + "loss": 0.0189, "step": 138000 }, { - "epoch": 0.7, - "eval_cer": 0.9144770486760401, - "eval_loss": 0.009700953029096127, - "eval_runtime": 116.67, - "eval_samples_per_second": 17.142, - "eval_steps_per_second": 4.286, + "epoch": 0.36, + "eval_cer": 0.8817936627238894, + "eval_loss": 0.014577467925846577, + "eval_runtime": 107.3326, + "eval_samples_per_second": 18.634, + "eval_steps_per_second": 4.658, "step": 138000 }, { - "epoch": 0.7, - "learning_rate": 0.0001955582687136435, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024633872585741646, + "loss": 0.0155, "step": 138010 }, { - "epoch": 0.7, - "learning_rate": 0.0001955507010206295, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024633483764104503, + "loss": 0.0157, "step": 138020 }, { - "epoch": 0.7, - "learning_rate": 0.0001955431333276155, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.0002463309494246736, + "loss": 0.0175, "step": 138030 }, { - "epoch": 0.7, - "learning_rate": 0.00019553556563460148, - "loss": 0.0182, + "epoch": 0.36, + "learning_rate": 0.0002463270612083021, + "loss": 0.0184, "step": 138040 }, { - "epoch": 0.7, - "learning_rate": 0.00019552799794158747, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024632317299193063, + "loss": 0.0183, "step": 138050 }, { - "epoch": 0.7, - "learning_rate": 0.00019552043024857347, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024631928477555914, + "loss": 0.024, "step": 138060 }, { - "epoch": 0.7, - "learning_rate": 0.00019551286255555946, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002463153965591877, + "loss": 0.0215, "step": 138070 }, { - "epoch": 0.7, - "learning_rate": 0.00019550529486254544, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002463115083428162, + "loss": 0.0188, "step": 138080 }, { - "epoch": 0.7, - "learning_rate": 0.00019549772716953145, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.0002463076201264448, + "loss": 0.0207, "step": 138090 }, { - "epoch": 0.7, - "learning_rate": 0.00019549015947651743, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.0002463037319100733, + "loss": 0.0168, "step": 138100 }, { - "epoch": 0.7, - "learning_rate": 0.0001954825917835034, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002462998436937019, + "loss": 0.0191, "step": 138110 }, { - "epoch": 0.7, - "learning_rate": 0.00019547502409048942, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002462959554773304, + "loss": 0.0234, "step": 138120 }, { - "epoch": 0.7, - "learning_rate": 0.0001954674563974754, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.0002462920672609589, + "loss": 0.0177, "step": 138130 }, { - "epoch": 0.7, - "learning_rate": 0.00019545988870446138, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002462881790445874, + "loss": 0.0203, "step": 138140 }, { - "epoch": 0.7, - "learning_rate": 0.0001954523210114474, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.000246284290828216, + "loss": 0.0191, "step": 138150 }, { - "epoch": 0.7, - "learning_rate": 0.00019544475331843337, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002462804026118445, + "loss": 0.0174, "step": 138160 }, { - "epoch": 0.7, - "learning_rate": 0.00019543718562541935, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.0002462765143954731, + "loss": 0.0203, "step": 138170 }, { - "epoch": 0.7, - "learning_rate": 0.00019542961793240533, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002462726261791016, + "loss": 0.0222, "step": 138180 }, { - "epoch": 0.7, - "learning_rate": 0.00019542205023939134, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024626873796273016, + "loss": 0.0224, "step": 138190 }, { - "epoch": 0.7, - "learning_rate": 0.00019541448254637732, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024626484974635867, + "loss": 0.0207, "step": 138200 }, { - "epoch": 0.7, - "learning_rate": 0.0001954069148533633, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002462609615299872, + "loss": 0.0205, "step": 138210 }, { - "epoch": 0.7, - "learning_rate": 0.0001953993471603493, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002462570733136157, + "loss": 0.023, "step": 138220 }, { - "epoch": 0.7, - "learning_rate": 0.0001953917794673353, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024625318509724427, + "loss": 0.0208, "step": 138230 }, { - "epoch": 0.7, - "learning_rate": 0.00019538421177432128, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024624929688087284, + "loss": 0.0171, "step": 138240 }, { - "epoch": 0.7, - "learning_rate": 0.00019537664408130728, + "epoch": 0.36, + "learning_rate": 0.00024624540866450135, "loss": 0.0177, "step": 138250 }, { - "epoch": 0.7, - "learning_rate": 0.00019536907638829327, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.00024624152044812987, + "loss": 0.0193, "step": 138260 }, { - "epoch": 0.7, - "learning_rate": 0.00019536150869527925, - "loss": 0.0106, + "epoch": 0.36, + "learning_rate": 0.0002462376322317584, + "loss": 0.021, "step": 138270 }, { - "epoch": 0.7, - "learning_rate": 0.00019535394100226526, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.00024623374401538695, + "loss": 0.0188, "step": 138280 }, { - "epoch": 0.7, - "learning_rate": 0.00019534637330925124, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024622985579901546, + "loss": 0.018, "step": 138290 }, { - "epoch": 0.7, - "learning_rate": 0.00019533880561623722, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.00024622596758264403, + "loss": 0.0179, "step": 138300 }, { - "epoch": 0.7, - "learning_rate": 0.00019533123792322323, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.00024622207936627255, + "loss": 0.0161, "step": 138310 }, { - "epoch": 0.7, - "learning_rate": 0.0001953236702302092, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.0002462181911499011, + "loss": 0.0168, "step": 138320 }, { - "epoch": 0.7, - "learning_rate": 0.0001953161025371952, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024621430293352963, + "loss": 0.0221, "step": 138330 }, { - "epoch": 0.7, - "learning_rate": 0.0001953085348441812, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024621041471715815, + "loss": 0.0214, "step": 138340 }, { - "epoch": 0.7, - "learning_rate": 0.00019530096715116718, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024620652650078666, + "loss": 0.0206, "step": 138350 }, { - "epoch": 0.7, - "learning_rate": 0.00019529339945815316, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.00024620263828441523, + "loss": 0.0243, "step": 138360 }, { - "epoch": 0.7, - "learning_rate": 0.00019528583176513914, - "loss": 0.0105, + "epoch": 0.36, + "learning_rate": 0.00024619875006804374, + "loss": 0.02, "step": 138370 }, { - "epoch": 0.7, - "learning_rate": 0.00019527826407212515, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.0002461948618516723, + "loss": 0.0298, "step": 138380 }, { - "epoch": 0.7, - "learning_rate": 0.00019527069637911113, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.00024619097363530083, + "loss": 0.0176, "step": 138390 }, { - "epoch": 0.7, - "learning_rate": 0.00019526312868609711, - "loss": 0.0154, + "epoch": 0.36, + "learning_rate": 0.0002461870854189294, + "loss": 0.023, "step": 138400 }, { - "epoch": 0.7, - "learning_rate": 0.00019525556099308312, - "loss": 0.0113, + "epoch": 0.36, + "learning_rate": 0.0002461831972025579, + "loss": 0.0194, "step": 138410 }, { - "epoch": 0.7, - "learning_rate": 0.0001952479933000691, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002461793089861864, + "loss": 0.0203, "step": 138420 }, { - "epoch": 0.7, - "learning_rate": 0.00019524042560705509, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.000246175420769815, + "loss": 0.022, "step": 138430 }, { - "epoch": 0.7, - "learning_rate": 0.0001952328579140411, - "loss": 0.0094, + "epoch": 0.36, + "learning_rate": 0.0002461715325534435, + "loss": 0.0217, "step": 138440 }, { - "epoch": 0.7, - "learning_rate": 0.00019522529022102708, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002461676443370721, + "loss": 0.031, "step": 138450 }, { - "epoch": 0.7, - "learning_rate": 0.00019521772252801306, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.0002461637561207006, + "loss": 0.0164, "step": 138460 }, { - "epoch": 0.7, - "learning_rate": 0.00019521015483499907, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.0002461598679043291, + "loss": 0.0178, "step": 138470 }, { - "epoch": 0.7, - "learning_rate": 0.00019520258714198505, - "loss": 0.0146, + "epoch": 0.36, + "learning_rate": 0.0002461559796879576, + "loss": 0.0205, "step": 138480 }, { - "epoch": 0.7, - "learning_rate": 0.00019519501944897103, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002461520914715862, + "loss": 0.0215, "step": 138490 }, { - "epoch": 0.7, - "learning_rate": 0.00019518745175595704, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002461482032552147, + "loss": 0.0215, "step": 138500 }, { - "epoch": 0.7, - "learning_rate": 0.00019517988406294302, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024614431503884327, + "loss": 0.0217, "step": 138510 }, { - "epoch": 0.7, - "learning_rate": 0.000195172316369929, - "loss": 0.011, + "epoch": 0.36, + "learning_rate": 0.0002461404268224718, + "loss": 0.0188, "step": 138520 }, { - "epoch": 0.7, - "learning_rate": 0.00019516474867691498, - "loss": 0.0153, + "epoch": 0.36, + "learning_rate": 0.00024613653860610036, + "loss": 0.019, "step": 138530 }, { - "epoch": 0.7, - "learning_rate": 0.000195157180983901, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.00024613265038972887, + "loss": 0.0221, "step": 138540 }, { - "epoch": 0.7, - "learning_rate": 0.00019514961329088697, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.0002461287621733574, + "loss": 0.0185, "step": 138550 }, { - "epoch": 0.7, - "learning_rate": 0.00019514204559787295, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002461248739569859, + "loss": 0.0198, "step": 138560 }, { - "epoch": 0.7, - "learning_rate": 0.00019513447790485896, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024612098574061447, + "loss": 0.0182, "step": 138570 }, { - "epoch": 0.7, - "learning_rate": 0.00019512691021184494, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.00024611709752424304, + "loss": 0.0183, "step": 138580 }, { - "epoch": 0.7, - "learning_rate": 0.00019511934251883092, - "loss": 0.0183, + "epoch": 0.36, + "learning_rate": 0.00024611320930787155, + "loss": 0.0171, "step": 138590 }, { - "epoch": 0.7, - "learning_rate": 0.00019511177482581693, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.00024610932109150007, + "loss": 0.0191, "step": 138600 }, { - "epoch": 0.7, - "learning_rate": 0.00019510420713280291, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.00024610543287512863, + "loss": 0.0189, "step": 138610 }, { - "epoch": 0.7, - "learning_rate": 0.0001950966394397889, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024610154465875715, + "loss": 0.023, "step": 138620 }, { - "epoch": 0.7, - "learning_rate": 0.0001950890717467749, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.00024609765644238566, + "loss": 0.0185, "step": 138630 }, { - "epoch": 0.7, - "learning_rate": 0.00019508150405376089, - "loss": 0.0172, + "epoch": 0.36, + "learning_rate": 0.00024609376822601423, + "loss": 0.0194, "step": 138640 }, { - "epoch": 0.7, - "learning_rate": 0.00019507393636074687, - "loss": 0.018, + "epoch": 0.36, + "learning_rate": 0.00024608988000964275, + "loss": 0.0241, "step": 138650 }, { - "epoch": 0.7, - "learning_rate": 0.00019506636866773288, - "loss": 0.0112, + "epoch": 0.36, + "learning_rate": 0.0002460859917932713, + "loss": 0.0221, "step": 138660 }, { - "epoch": 0.7, - "learning_rate": 0.00019505880097471886, - "loss": 0.0169, + "epoch": 0.36, + "learning_rate": 0.00024608210357689983, + "loss": 0.018, "step": 138670 }, { - "epoch": 0.7, - "learning_rate": 0.00019505123328170484, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.00024607821536052834, + "loss": 0.028, "step": 138680 }, { - "epoch": 0.7, - "learning_rate": 0.00019504366558869082, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002460743271441569, + "loss": 0.0193, "step": 138690 }, { - "epoch": 0.7, - "learning_rate": 0.00019503609789567683, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.00024607043892778543, + "loss": 0.0266, "step": 138700 }, { - "epoch": 0.7, - "learning_rate": 0.0001950285302026628, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024606655071141394, + "loss": 0.0242, "step": 138710 }, { - "epoch": 0.7, - "learning_rate": 0.0001950209625096488, - "loss": 0.0104, + "epoch": 0.36, + "learning_rate": 0.0002460626624950425, + "loss": 0.0157, "step": 138720 }, { - "epoch": 0.7, - "learning_rate": 0.0001950133948166348, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.000246058774278671, + "loss": 0.0176, "step": 138730 }, { - "epoch": 0.7, - "learning_rate": 0.00019500582712362078, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002460548860622996, + "loss": 0.0213, "step": 138740 }, { - "epoch": 0.7, - "learning_rate": 0.00019499825943060676, - "loss": 0.0109, + "epoch": 0.36, + "learning_rate": 0.0002460509978459281, + "loss": 0.0162, "step": 138750 }, { - "epoch": 0.7, - "learning_rate": 0.00019499069173759277, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.0002460471096295566, + "loss": 0.0228, "step": 138760 }, { - "epoch": 0.7, - "learning_rate": 0.00019498312404457875, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.00024604322141318514, + "loss": 0.0207, "step": 138770 }, { - "epoch": 0.7, - "learning_rate": 0.00019497555635156473, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002460393331968137, + "loss": 0.0213, "step": 138780 }, { - "epoch": 0.7, - "learning_rate": 0.00019496798865855074, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.0002460354449804423, + "loss": 0.02, "step": 138790 }, { - "epoch": 0.7, - "learning_rate": 0.00019496042096553672, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.0002460315567640708, + "loss": 0.0229, "step": 138800 }, { - "epoch": 0.7, - "learning_rate": 0.0001949528532725227, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002460276685476993, + "loss": 0.0216, "step": 138810 }, { - "epoch": 0.7, - "learning_rate": 0.00019494528557950871, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002460237803313279, + "loss": 0.0185, "step": 138820 }, { - "epoch": 0.7, - "learning_rate": 0.0001949377178864947, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002460198921149564, + "loss": 0.0204, "step": 138830 }, { - "epoch": 0.7, - "learning_rate": 0.00019493015019348068, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002460160038985849, + "loss": 0.0205, "step": 138840 }, { - "epoch": 0.7, - "learning_rate": 0.00019492258250046669, - "loss": 0.0177, + "epoch": 0.36, + "learning_rate": 0.00024601211568221347, + "loss": 0.0166, "step": 138850 }, { - "epoch": 0.7, - "learning_rate": 0.00019491501480745267, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.000246008227465842, + "loss": 0.0198, "step": 138860 }, { - "epoch": 0.7, - "learning_rate": 0.00019490744711443865, - "loss": 0.0197, + "epoch": 0.36, + "learning_rate": 0.00024600433924947055, + "loss": 0.0206, "step": 138870 }, { - "epoch": 0.7, - "learning_rate": 0.00019489987942142463, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.00024600045103309907, + "loss": 0.0175, "step": 138880 }, { - "epoch": 0.7, - "learning_rate": 0.0001948923117284106, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002459965628167276, + "loss": 0.0219, "step": 138890 }, { - "epoch": 0.7, - "learning_rate": 0.0001948847440353966, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024599267460035615, + "loss": 0.018, "step": 138900 }, { - "epoch": 0.7, - "learning_rate": 0.00019487717634238258, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.00024598878638398467, + "loss": 0.0213, "step": 138910 }, { - "epoch": 0.7, - "learning_rate": 0.00019486960864936856, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024598489816761324, + "loss": 0.0194, "step": 138920 }, { - "epoch": 0.7, - "learning_rate": 0.00019486204095635457, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024598100995124175, + "loss": 0.0229, "step": 138930 }, { - "epoch": 0.7, - "learning_rate": 0.00019485447326334055, - "loss": 0.0102, + "epoch": 0.36, + "learning_rate": 0.00024597712173487026, + "loss": 0.0224, "step": 138940 }, { - "epoch": 0.7, - "learning_rate": 0.00019484690557032653, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024597323351849883, + "loss": 0.0201, "step": 138950 }, { - "epoch": 0.7, - "learning_rate": 0.00019483933787731254, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.00024596934530212735, + "loss": 0.0205, "step": 138960 }, { - "epoch": 0.7, - "learning_rate": 0.00019483177018429852, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.00024596545708575586, + "loss": 0.0233, "step": 138970 }, { - "epoch": 0.7, - "learning_rate": 0.0001948242024912845, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024596156886938443, + "loss": 0.0196, "step": 138980 }, { - "epoch": 0.7, - "learning_rate": 0.0001948166347982705, - "loss": 0.0174, + "epoch": 0.36, + "learning_rate": 0.00024595768065301295, + "loss": 0.022, "step": 138990 }, { - "epoch": 0.7, - "learning_rate": 0.0001948090671052565, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002459537924366415, + "loss": 0.026, "step": 139000 }, { - "epoch": 0.7, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.009447253309190273, - "eval_runtime": 116.7733, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.36, + "eval_cer": 0.8817642703482717, + "eval_loss": 0.013596959412097931, + "eval_runtime": 107.3644, + "eval_samples_per_second": 18.628, + "eval_steps_per_second": 4.657, "step": 139000 }, { - "epoch": 0.7, - "learning_rate": 0.00019480149941224247, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024594990422027003, + "loss": 0.017, "step": 139010 }, { - "epoch": 0.7, - "learning_rate": 0.00019479393171922848, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024594601600389854, + "loss": 0.0219, "step": 139020 }, { - "epoch": 0.7, - "learning_rate": 0.00019478636402621446, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002459421277875271, + "loss": 0.0151, "step": 139030 }, { - "epoch": 0.7, - "learning_rate": 0.00019477879633320044, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.0002459382395711556, + "loss": 0.0265, "step": 139040 }, { - "epoch": 0.7, - "learning_rate": 0.00019477122864018645, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024593435135478414, + "loss": 0.0203, "step": 139050 }, { - "epoch": 0.7, - "learning_rate": 0.00019476366094717243, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002459304631384127, + "loss": 0.0248, "step": 139060 }, { - "epoch": 0.7, - "learning_rate": 0.00019475609325415841, - "loss": 0.0104, + "epoch": 0.36, + "learning_rate": 0.0002459265749220413, + "loss": 0.0183, "step": 139070 }, { - "epoch": 0.7, - "learning_rate": 0.0001947485255611444, - "loss": 0.0156, + "epoch": 0.36, + "learning_rate": 0.0002459226867056698, + "loss": 0.0164, "step": 139080 }, { - "epoch": 0.7, - "learning_rate": 0.0001947409578681304, - "loss": 0.0188, + "epoch": 0.36, + "learning_rate": 0.0002459187984892983, + "loss": 0.0196, "step": 139090 }, { - "epoch": 0.7, - "learning_rate": 0.00019473339017511639, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.0002459149102729268, + "loss": 0.0211, "step": 139100 }, { - "epoch": 0.7, - "learning_rate": 0.00019472582248210237, - "loss": 0.0193, + "epoch": 0.36, + "learning_rate": 0.0002459110220565554, + "loss": 0.0167, "step": 139110 }, { - "epoch": 0.7, - "learning_rate": 0.00019471825478908838, - "loss": 0.0167, + "epoch": 0.36, + "learning_rate": 0.0002459071338401839, + "loss": 0.0239, "step": 139120 }, { - "epoch": 0.7, - "learning_rate": 0.00019471068709607436, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002459032456238125, + "loss": 0.0185, "step": 139130 }, { - "epoch": 0.7, - "learning_rate": 0.00019470311940306034, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.000245899357407441, + "loss": 0.0204, "step": 139140 }, { - "epoch": 0.7, - "learning_rate": 0.00019469555171004635, - "loss": 0.0144, + "epoch": 0.36, + "learning_rate": 0.00024589546919106956, + "loss": 0.0242, "step": 139150 }, { - "epoch": 0.7, - "learning_rate": 0.00019468798401703233, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.00024589158097469807, + "loss": 0.0273, "step": 139160 }, { - "epoch": 0.7, - "learning_rate": 0.0001946804163240183, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.0002458876927583266, + "loss": 0.0193, "step": 139170 }, { - "epoch": 0.7, - "learning_rate": 0.00019467284863100432, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002458838045419551, + "loss": 0.021, "step": 139180 }, { - "epoch": 0.7, - "learning_rate": 0.0001946652809379903, - "loss": 0.0188, + "epoch": 0.36, + "learning_rate": 0.00024587991632558367, + "loss": 0.0202, "step": 139190 }, { - "epoch": 0.7, - "learning_rate": 0.00019465771324497628, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002458760281092122, + "loss": 0.0179, "step": 139200 }, { - "epoch": 0.7, - "learning_rate": 0.0001946501455519623, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024587213989284075, + "loss": 0.0233, "step": 139210 }, { - "epoch": 0.7, - "learning_rate": 0.00019464257785894827, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024586825167646927, + "loss": 0.0301, "step": 139220 }, { - "epoch": 0.7, - "learning_rate": 0.00019463501016593425, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002458643634600978, + "loss": 0.0205, "step": 139230 }, { - "epoch": 0.7, - "learning_rate": 0.00019462744247292026, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.00024586047524372635, + "loss": 0.0237, "step": 139240 }, { - "epoch": 0.7, - "learning_rate": 0.00019461987477990624, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.00024585658702735487, + "loss": 0.0197, "step": 139250 }, { - "epoch": 0.7, - "learning_rate": 0.00019461230708689222, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002458526988109834, + "loss": 0.0218, "step": 139260 }, { - "epoch": 0.7, - "learning_rate": 0.0001946047393938782, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.00024584881059461195, + "loss": 0.0204, "step": 139270 }, { - "epoch": 0.7, - "learning_rate": 0.00019459717170086421, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002458449223782405, + "loss": 0.0206, "step": 139280 }, { - "epoch": 0.7, - "learning_rate": 0.0001945896040078502, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.00024584103416186903, + "loss": 0.0246, "step": 139290 }, { - "epoch": 0.7, - "learning_rate": 0.00019458203631483618, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.00024583714594549755, + "loss": 0.0168, "step": 139300 }, { - "epoch": 0.7, - "learning_rate": 0.00019457446862182219, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.00024583325772912606, + "loss": 0.0215, "step": 139310 }, { - "epoch": 0.7, - "learning_rate": 0.00019456690092880817, - "loss": 0.0106, + "epoch": 0.36, + "learning_rate": 0.00024582936951275463, + "loss": 0.0187, "step": 139320 }, { - "epoch": 0.7, - "learning_rate": 0.00019455933323579415, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024582548129638314, + "loss": 0.0196, "step": 139330 }, { - "epoch": 0.7, - "learning_rate": 0.00019455176554278016, - "loss": 0.0112, + "epoch": 0.36, + "learning_rate": 0.0002458215930800117, + "loss": 0.0218, "step": 139340 }, { - "epoch": 0.7, - "learning_rate": 0.00019454419784976614, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024581770486364023, + "loss": 0.0234, "step": 139350 }, { - "epoch": 0.7, - "learning_rate": 0.00019453663015675212, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.0002458138166472688, + "loss": 0.017, "step": 139360 }, { - "epoch": 0.7, - "learning_rate": 0.00019452906246373813, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.0002458099284308973, + "loss": 0.0214, "step": 139370 }, { - "epoch": 0.7, - "learning_rate": 0.0001945214947707241, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.0002458060402145258, + "loss": 0.0184, "step": 139380 }, { - "epoch": 0.7, - "learning_rate": 0.0001945139270777101, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024580215199815434, + "loss": 0.016, "step": 139390 }, { - "epoch": 0.7, - "learning_rate": 0.0001945063593846961, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002457982637817829, + "loss": 0.0262, "step": 139400 }, { - "epoch": 0.7, - "learning_rate": 0.00019449879169168208, - "loss": 0.016, + "epoch": 0.36, + "learning_rate": 0.0002457943755654114, + "loss": 0.0203, "step": 139410 }, { - "epoch": 0.7, - "learning_rate": 0.00019449122399866806, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024579048734904, + "loss": 0.0191, "step": 139420 }, { - "epoch": 0.7, - "learning_rate": 0.00019448365630565404, - "loss": 0.0158, + "epoch": 0.36, + "learning_rate": 0.0002457865991326685, + "loss": 0.0213, "step": 139430 }, { - "epoch": 0.7, - "learning_rate": 0.00019447608861264005, - "loss": 0.0159, + "epoch": 0.36, + "learning_rate": 0.000245782710916297, + "loss": 0.0208, "step": 139440 }, { - "epoch": 0.7, - "learning_rate": 0.00019446852091962603, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002457788226999256, + "loss": 0.0186, "step": 139450 }, { - "epoch": 0.7, - "learning_rate": 0.00019446095322661202, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.0002457749344835541, + "loss": 0.0195, "step": 139460 }, { - "epoch": 0.7, - "learning_rate": 0.00019445338553359802, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.0002457710462671827, + "loss": 0.0201, "step": 139470 }, { - "epoch": 0.7, - "learning_rate": 0.000194445817840584, - "loss": 0.0168, + "epoch": 0.36, + "learning_rate": 0.0002457671580508112, + "loss": 0.0204, "step": 139480 }, { - "epoch": 0.7, - "learning_rate": 0.00019443825014757, - "loss": 0.0159, + "epoch": 0.36, + "learning_rate": 0.00024576326983443976, + "loss": 0.019, "step": 139490 }, { - "epoch": 0.7, - "learning_rate": 0.000194430682454556, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.00024575938161806827, + "loss": 0.0231, "step": 139500 }, { - "epoch": 0.7, - "learning_rate": 0.00019442311476154198, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.0002457554934016968, + "loss": 0.0213, "step": 139510 }, { - "epoch": 0.7, - "learning_rate": 0.00019441554706852796, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.0002457516051853253, + "loss": 0.027, "step": 139520 }, { - "epoch": 0.7, - "learning_rate": 0.00019440797937551397, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.00024574771696895387, + "loss": 0.0179, "step": 139530 }, { - "epoch": 0.7, - "learning_rate": 0.00019440041168249995, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.0002457438287525824, + "loss": 0.0165, "step": 139540 }, { - "epoch": 0.7, - "learning_rate": 0.00019439284398948593, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.00024573994053621095, + "loss": 0.0219, "step": 139550 }, { - "epoch": 0.7, - "learning_rate": 0.00019438527629647194, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.00024573605231983947, + "loss": 0.0288, "step": 139560 }, { - "epoch": 0.7, - "learning_rate": 0.00019437770860345792, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.00024573216410346804, + "loss": 0.0222, "step": 139570 }, { - "epoch": 0.7, - "learning_rate": 0.0001943701409104439, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.00024572827588709655, + "loss": 0.0198, "step": 139580 }, { - "epoch": 0.7, - "learning_rate": 0.00019436257321742988, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.00024572438767072506, + "loss": 0.027, "step": 139590 }, { - "epoch": 0.7, - "learning_rate": 0.0001943550055244159, - "loss": 0.0157, + "epoch": 0.36, + "learning_rate": 0.0002457204994543536, + "loss": 0.0204, "step": 139600 }, { - "epoch": 0.7, - "learning_rate": 0.00019434743783140187, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024571661123798215, + "loss": 0.0223, "step": 139610 }, { - "epoch": 0.7, - "learning_rate": 0.00019433987013838785, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.0002457127230216107, + "loss": 0.0211, "step": 139620 }, { - "epoch": 0.7, - "learning_rate": 0.00019433230244537386, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.00024570883480523923, + "loss": 0.0189, "step": 139630 }, { - "epoch": 0.7, - "learning_rate": 0.00019432473475235984, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024570494658886775, + "loss": 0.024, "step": 139640 }, { - "epoch": 0.7, - "learning_rate": 0.00019431716705934583, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002457010583724963, + "loss": 0.0231, "step": 139650 }, { - "epoch": 0.7, - "learning_rate": 0.00019430959936633183, - "loss": 0.0118, - "step": 139660 + "epoch": 0.36, + "learning_rate": 0.00024569717015612483, + "loss": 0.0195, + "step": 139660 }, { - "epoch": 0.7, - "learning_rate": 0.00019430203167331782, - "loss": 0.0101, + "epoch": 0.36, + "learning_rate": 0.00024569328193975334, + "loss": 0.0296, "step": 139670 }, { - "epoch": 0.7, - "learning_rate": 0.0001942944639803038, - "loss": 0.0125, + "epoch": 0.36, + "learning_rate": 0.0002456893937233819, + "loss": 0.018, "step": 139680 }, { - "epoch": 0.7, - "learning_rate": 0.0001942868962872898, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.0002456855055070104, + "loss": 0.0211, "step": 139690 }, { - "epoch": 0.7, - "learning_rate": 0.0001942793285942758, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.000245681617290639, + "loss": 0.0206, "step": 139700 }, { - "epoch": 0.7, - "learning_rate": 0.00019427176090126177, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002456777290742675, + "loss": 0.0192, "step": 139710 }, { - "epoch": 0.7, - "learning_rate": 0.00019426419320824778, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.000245673840857896, + "loss": 0.0212, "step": 139720 }, { - "epoch": 0.7, - "learning_rate": 0.00019425662551523376, - "loss": 0.0163, + "epoch": 0.36, + "learning_rate": 0.00024566995264152454, + "loss": 0.0192, "step": 139730 }, { - "epoch": 0.71, - "learning_rate": 0.00019424905782221974, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.0002456660644251531, + "loss": 0.0259, "step": 139740 }, { - "epoch": 0.71, - "learning_rate": 0.00019424149012920575, - "loss": 0.0147, + "epoch": 0.36, + "learning_rate": 0.0002456621762087816, + "loss": 0.0363, "step": 139750 }, { - "epoch": 0.71, - "learning_rate": 0.00019423392243619173, - "loss": 0.0118, + "epoch": 0.36, + "learning_rate": 0.0002456582879924102, + "loss": 0.0213, "step": 139760 }, { - "epoch": 0.71, - "learning_rate": 0.0001942263547431777, - "loss": 0.017, + "epoch": 0.36, + "learning_rate": 0.0002456543997760387, + "loss": 0.018, "step": 139770 }, { - "epoch": 0.71, - "learning_rate": 0.0001942187870501637, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002456505115596673, + "loss": 0.0209, "step": 139780 }, { - "epoch": 0.71, - "learning_rate": 0.0001942112193571497, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.0002456466233432958, + "loss": 0.021, "step": 139790 }, { - "epoch": 0.71, - "learning_rate": 0.00019420365166413568, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.0002456427351269243, + "loss": 0.0205, "step": 139800 }, { - "epoch": 0.71, - "learning_rate": 0.00019419608397112166, - "loss": 0.0132, + "epoch": 0.36, + "learning_rate": 0.0002456388469105528, + "loss": 0.0195, "step": 139810 }, { - "epoch": 0.71, - "learning_rate": 0.00019418851627810767, - "loss": 0.0099, + "epoch": 0.36, + "learning_rate": 0.0002456349586941814, + "loss": 0.0216, "step": 139820 }, { - "epoch": 0.71, - "learning_rate": 0.00019418094858509365, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.00024563107047780996, + "loss": 0.0244, "step": 139830 }, { - "epoch": 0.71, - "learning_rate": 0.00019417338089207964, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024562718226143847, + "loss": 0.0234, "step": 139840 }, { - "epoch": 0.71, - "learning_rate": 0.00019416581319906564, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.000245623294045067, + "loss": 0.0223, "step": 139850 }, { - "epoch": 0.71, - "learning_rate": 0.00019415824550605163, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024561940582869555, + "loss": 0.0237, "step": 139860 }, { - "epoch": 0.71, - "learning_rate": 0.0001941506778130376, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024561551761232407, + "loss": 0.0231, "step": 139870 }, { - "epoch": 0.71, - "learning_rate": 0.00019414311012002362, - "loss": 0.0105, + "epoch": 0.36, + "learning_rate": 0.0002456116293959526, + "loss": 0.0214, "step": 139880 }, { - "epoch": 0.71, - "learning_rate": 0.0001941355424270096, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.00024560774117958115, + "loss": 0.0239, "step": 139890 }, { - "epoch": 0.71, - "learning_rate": 0.00019412797473399558, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.00024560385296320967, + "loss": 0.0211, "step": 139900 }, { - "epoch": 0.71, - "learning_rate": 0.0001941204070409816, - "loss": 0.0176, + "epoch": 0.36, + "learning_rate": 0.00024559996474683823, + "loss": 0.018, "step": 139910 }, { - "epoch": 0.71, - "learning_rate": 0.00019411283934796757, - "loss": 0.0124, + "epoch": 0.36, + "learning_rate": 0.00024559607653046675, + "loss": 0.0256, "step": 139920 }, { - "epoch": 0.71, - "learning_rate": 0.00019410527165495355, - "loss": 0.0143, + "epoch": 0.36, + "learning_rate": 0.00024559218831409526, + "loss": 0.0214, "step": 139930 }, { - "epoch": 0.71, - "learning_rate": 0.00019409770396193953, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.0002455883000977238, + "loss": 0.0214, "step": 139940 }, { - "epoch": 0.71, - "learning_rate": 0.00019409013626892554, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.00024558441188135235, + "loss": 0.0225, "step": 139950 }, { - "epoch": 0.71, - "learning_rate": 0.00019408256857591152, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.00024558052366498086, + "loss": 0.0226, "step": 139960 }, { - "epoch": 0.71, - "learning_rate": 0.0001940750008828975, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.00024557663544860943, + "loss": 0.0175, "step": 139970 }, { - "epoch": 0.71, - "learning_rate": 0.0001940674331898835, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024557274723223794, + "loss": 0.0215, "step": 139980 }, { - "epoch": 0.71, - "learning_rate": 0.0001940598654968695, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.0002455688590158665, + "loss": 0.0247, "step": 139990 }, { - "epoch": 0.71, - "learning_rate": 0.00019405229780385547, - "loss": 0.0152, + "epoch": 0.36, + "learning_rate": 0.00024556497079949503, + "loss": 0.016, "step": 140000 }, { - "epoch": 0.71, - "eval_cer": 0.9144741374876638, - "eval_loss": 0.009188586845993996, - "eval_runtime": 116.7594, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.36, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.013859533704817295, + "eval_runtime": 107.2731, + "eval_samples_per_second": 18.644, + "eval_steps_per_second": 4.661, "step": 140000 }, { - "epoch": 0.71, - "learning_rate": 0.00019404473011084148, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.00024556108258312354, + "loss": 0.0173, "step": 140010 }, { - "epoch": 0.71, - "learning_rate": 0.00019403716241782746, - "loss": 0.0123, + "epoch": 0.36, + "learning_rate": 0.0002455571943667521, + "loss": 0.0205, "step": 140020 }, { - "epoch": 0.71, - "learning_rate": 0.00019402959472481345, - "loss": 0.0155, + "epoch": 0.36, + "learning_rate": 0.0002455533061503806, + "loss": 0.0218, "step": 140030 }, { - "epoch": 0.71, - "learning_rate": 0.00019402202703179945, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002455494179340092, + "loss": 0.018, "step": 140040 }, { - "epoch": 0.71, - "learning_rate": 0.00019401445933878544, - "loss": 0.0173, + "epoch": 0.36, + "learning_rate": 0.0002455455297176377, + "loss": 0.0199, "step": 140050 }, { - "epoch": 0.71, - "learning_rate": 0.00019400689164577142, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002455416415012662, + "loss": 0.0196, "step": 140060 }, { - "epoch": 0.71, - "learning_rate": 0.00019399932395275743, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.0002455377532848948, + "loss": 0.0162, "step": 140070 }, { - "epoch": 0.71, - "learning_rate": 0.0001939917562597434, - "loss": 0.0169, + "epoch": 0.36, + "learning_rate": 0.0002455338650685233, + "loss": 0.0223, "step": 140080 }, { - "epoch": 0.71, - "learning_rate": 0.0001939841885667294, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002455299768521518, + "loss": 0.0172, "step": 140090 }, { - "epoch": 0.71, - "learning_rate": 0.00019397662087371537, - "loss": 0.0138, + "epoch": 0.36, + "learning_rate": 0.0002455260886357804, + "loss": 0.0185, "step": 140100 }, { - "epoch": 0.71, - "learning_rate": 0.00019396905318070138, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.00024552220041940896, + "loss": 0.018, "step": 140110 }, { - "epoch": 0.71, - "learning_rate": 0.00019396148548768736, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.0002455183122030375, + "loss": 0.019, "step": 140120 }, { - "epoch": 0.71, - "learning_rate": 0.00019395391779467334, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.000245514423986666, + "loss": 0.0161, "step": 140130 }, { - "epoch": 0.71, - "learning_rate": 0.00019394635010165935, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002455105357702945, + "loss": 0.0226, "step": 140140 }, { - "epoch": 0.71, - "learning_rate": 0.0001939387824086453, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024550664755392307, + "loss": 0.0178, "step": 140150 }, { - "epoch": 0.71, - "learning_rate": 0.00019393121471563129, - "loss": 0.0104, + "epoch": 0.36, + "learning_rate": 0.0002455027593375516, + "loss": 0.0188, "step": 140160 }, { - "epoch": 0.71, - "learning_rate": 0.00019392364702261727, - "loss": 0.0169, + "epoch": 0.36, + "learning_rate": 0.00024549887112118015, + "loss": 0.0174, "step": 140170 }, { - "epoch": 0.71, - "learning_rate": 0.00019391607932960328, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024549498290480867, + "loss": 0.0196, "step": 140180 }, { - "epoch": 0.71, - "learning_rate": 0.00019390851163658926, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.0002454910946884372, + "loss": 0.0207, "step": 140190 }, { - "epoch": 0.71, - "learning_rate": 0.00019390094394357524, - "loss": 0.011, + "epoch": 0.36, + "learning_rate": 0.00024548720647206575, + "loss": 0.0201, "step": 140200 }, { - "epoch": 0.71, - "learning_rate": 0.00019389337625056125, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024548331825569427, + "loss": 0.0195, "step": 140210 }, { - "epoch": 0.71, - "learning_rate": 0.00019388580855754723, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.0002454794300393228, + "loss": 0.0189, "step": 140220 }, { - "epoch": 0.71, - "learning_rate": 0.0001938782408645332, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024547554182295135, + "loss": 0.0199, "step": 140230 }, { - "epoch": 0.71, - "learning_rate": 0.00019387067317151922, - "loss": 0.0191, + "epoch": 0.36, + "learning_rate": 0.00024547165360657986, + "loss": 0.0207, "step": 140240 }, { - "epoch": 0.71, - "learning_rate": 0.0001938631054785052, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.00024546776539020843, + "loss": 0.0187, "step": 140250 }, { - "epoch": 0.71, - "learning_rate": 0.00019385553778549118, - "loss": 0.0164, + "epoch": 0.36, + "learning_rate": 0.00024546387717383695, + "loss": 0.0181, "step": 140260 }, { - "epoch": 0.71, - "learning_rate": 0.0001938479700924772, - "loss": 0.0151, + "epoch": 0.36, + "learning_rate": 0.00024545998895746546, + "loss": 0.0164, "step": 140270 }, { - "epoch": 0.71, - "learning_rate": 0.00019384040239946317, - "loss": 0.0122, + "epoch": 0.36, + "learning_rate": 0.00024545610074109403, + "loss": 0.0199, "step": 140280 }, { - "epoch": 0.71, - "learning_rate": 0.00019383283470644915, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.00024545221252472255, + "loss": 0.0232, "step": 140290 }, { - "epoch": 0.71, - "learning_rate": 0.00019382526701343516, - "loss": 0.0121, + "epoch": 0.36, + "learning_rate": 0.00024544832430835106, + "loss": 0.0234, "step": 140300 }, { - "epoch": 0.71, - "learning_rate": 0.00019381769932042114, - "loss": 0.012, + "epoch": 0.36, + "learning_rate": 0.00024544443609197963, + "loss": 0.0203, "step": 140310 }, { - "epoch": 0.71, - "learning_rate": 0.00019381013162740712, - "loss": 0.0141, + "epoch": 0.36, + "learning_rate": 0.0002454405478756082, + "loss": 0.0219, "step": 140320 }, { - "epoch": 0.71, - "learning_rate": 0.0001938025639343931, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002454366596592367, + "loss": 0.0212, "step": 140330 }, { - "epoch": 0.71, - "learning_rate": 0.00019379499624137911, - "loss": 0.0094, + "epoch": 0.36, + "learning_rate": 0.0002454327714428652, + "loss": 0.0219, "step": 140340 }, { - "epoch": 0.71, - "learning_rate": 0.0001937874285483651, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024542888322649374, + "loss": 0.0204, "step": 140350 }, { - "epoch": 0.71, - "learning_rate": 0.00019377986085535108, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.0002454249950101223, + "loss": 0.0142, "step": 140360 }, { - "epoch": 0.71, - "learning_rate": 0.00019377229316233709, - "loss": 0.0177, + "epoch": 0.36, + "learning_rate": 0.0002454211067937508, + "loss": 0.0163, "step": 140370 }, { - "epoch": 0.71, - "learning_rate": 0.00019376472546932307, - "loss": 0.0164, + "epoch": 0.36, + "learning_rate": 0.0002454172185773794, + "loss": 0.0213, "step": 140380 }, { - "epoch": 0.71, - "learning_rate": 0.00019375715777630905, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002454133303610079, + "loss": 0.018, "step": 140390 }, { - "epoch": 0.71, - "learning_rate": 0.00019374959008329506, - "loss": 0.0131, + "epoch": 0.36, + "learning_rate": 0.0002454094421446365, + "loss": 0.022, "step": 140400 }, { - "epoch": 0.71, - "learning_rate": 0.00019374202239028104, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.000245405553928265, + "loss": 0.021, "step": 140410 }, { - "epoch": 0.71, - "learning_rate": 0.00019373445469726702, - "loss": 0.0133, + "epoch": 0.36, + "learning_rate": 0.0002454016657118935, + "loss": 0.015, "step": 140420 }, { - "epoch": 0.71, - "learning_rate": 0.00019372688700425303, - "loss": 0.014, + "epoch": 0.36, + "learning_rate": 0.000245397777495522, + "loss": 0.0184, "step": 140430 }, { - "epoch": 0.71, - "learning_rate": 0.000193719319311239, - "loss": 0.013, + "epoch": 0.36, + "learning_rate": 0.0002453938892791506, + "loss": 0.0213, "step": 140440 }, { - "epoch": 0.71, - "learning_rate": 0.000193711751618225, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.0002453900010627791, + "loss": 0.016, "step": 140450 }, { - "epoch": 0.71, - "learning_rate": 0.000193704183925211, - "loss": 0.0134, + "epoch": 0.36, + "learning_rate": 0.00024538611284640767, + "loss": 0.0191, "step": 140460 }, { - "epoch": 0.71, - "learning_rate": 0.00019369661623219698, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002453822246300362, + "loss": 0.0165, "step": 140470 }, { - "epoch": 0.71, - "learning_rate": 0.00019368904853918296, - "loss": 0.0159, + "epoch": 0.36, + "learning_rate": 0.0002453783364136647, + "loss": 0.0198, "step": 140480 }, { - "epoch": 0.71, - "learning_rate": 0.00019368148084616894, - "loss": 0.0162, + "epoch": 0.36, + "learning_rate": 0.00024537444819729327, + "loss": 0.0172, "step": 140490 }, { - "epoch": 0.71, - "learning_rate": 0.00019367391315315495, - "loss": 0.0142, + "epoch": 0.36, + "learning_rate": 0.0002453705599809218, + "loss": 0.0207, "step": 140500 }, { - "epoch": 0.71, - "learning_rate": 0.00019366634546014093, - "loss": 0.0115, + "epoch": 0.36, + "learning_rate": 0.00024536667176455035, + "loss": 0.0188, "step": 140510 }, { - "epoch": 0.71, - "learning_rate": 0.00019365877776712692, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024536278354817887, + "loss": 0.02, "step": 140520 }, { - "epoch": 0.71, - "learning_rate": 0.00019365121007411292, - "loss": 0.0145, + "epoch": 0.36, + "learning_rate": 0.00024535889533180744, + "loss": 0.0195, "step": 140530 }, { - "epoch": 0.71, - "learning_rate": 0.0001936436423810989, - "loss": 0.0166, + "epoch": 0.36, + "learning_rate": 0.00024535500711543595, + "loss": 0.0181, "step": 140540 }, { - "epoch": 0.71, - "learning_rate": 0.0001936360746880849, - "loss": 0.0129, + "epoch": 0.36, + "learning_rate": 0.00024535111889906447, + "loss": 0.0151, "step": 140550 }, { - "epoch": 0.71, - "learning_rate": 0.0001936285069950709, - "loss": 0.0117, + "epoch": 0.36, + "learning_rate": 0.000245347230682693, + "loss": 0.0159, "step": 140560 }, { - "epoch": 0.71, - "learning_rate": 0.00019362093930205688, - "loss": 0.0149, + "epoch": 0.36, + "learning_rate": 0.00024534334246632155, + "loss": 0.0195, "step": 140570 }, { - "epoch": 0.71, - "learning_rate": 0.00019361337160904286, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024533945424995006, + "loss": 0.0189, "step": 140580 }, { - "epoch": 0.71, - "learning_rate": 0.00019360580391602887, - "loss": 0.0128, + "epoch": 0.36, + "learning_rate": 0.00024533556603357863, + "loss": 0.0239, "step": 140590 }, { - "epoch": 0.71, - "learning_rate": 0.00019359823622301485, - "loss": 0.0126, + "epoch": 0.36, + "learning_rate": 0.00024533167781720715, + "loss": 0.0194, "step": 140600 }, { - "epoch": 0.71, - "learning_rate": 0.00019359066853000083, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002453277896008357, + "loss": 0.0218, "step": 140610 }, { - "epoch": 0.71, - "learning_rate": 0.00019358310083698684, - "loss": 0.0111, + "epoch": 0.36, + "learning_rate": 0.00024532390138446423, + "loss": 0.0195, "step": 140620 }, { - "epoch": 0.71, - "learning_rate": 0.00019357553314397282, - "loss": 0.0137, + "epoch": 0.36, + "learning_rate": 0.00024532001316809274, + "loss": 0.0216, "step": 140630 }, { - "epoch": 0.71, - "learning_rate": 0.0001935679654509588, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.00024531612495172126, + "loss": 0.0172, "step": 140640 }, { - "epoch": 0.71, - "learning_rate": 0.0001935603977579448, - "loss": 0.0156, + "epoch": 0.36, + "learning_rate": 0.00024531223673534983, + "loss": 0.0194, "step": 140650 }, { - "epoch": 0.71, - "learning_rate": 0.0001935528300649308, - "loss": 0.0108, + "epoch": 0.36, + "learning_rate": 0.0002453083485189784, + "loss": 0.0193, "step": 140660 }, { - "epoch": 0.71, - "learning_rate": 0.00019354526237191677, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002453044603026069, + "loss": 0.0199, "step": 140670 }, { - "epoch": 0.71, - "learning_rate": 0.00019353769467890275, - "loss": 0.0103, + "epoch": 0.36, + "learning_rate": 0.0002453005720862354, + "loss": 0.0194, "step": 140680 }, { - "epoch": 0.71, - "learning_rate": 0.00019353012698588876, - "loss": 0.0114, + "epoch": 0.36, + "learning_rate": 0.00024529668386986394, + "loss": 0.0172, "step": 140690 }, { - "epoch": 0.71, - "learning_rate": 0.00019352255929287474, - "loss": 0.0127, + "epoch": 0.36, + "learning_rate": 0.0002452927956534925, + "loss": 0.0183, "step": 140700 }, { - "epoch": 0.71, - "learning_rate": 0.00019351499159986073, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.000245288907437121, + "loss": 0.022, "step": 140710 }, { - "epoch": 0.71, - "learning_rate": 0.00019350742390684673, - "loss": 0.015, + "epoch": 0.36, + "learning_rate": 0.0002452850192207496, + "loss": 0.0168, "step": 140720 }, { - "epoch": 0.71, - "learning_rate": 0.00019349985621383272, - "loss": 0.0135, + "epoch": 0.36, + "learning_rate": 0.0002452811310043781, + "loss": 0.0171, "step": 140730 }, { - "epoch": 0.71, - "learning_rate": 0.0001934922885208187, - "loss": 0.0119, + "epoch": 0.36, + "learning_rate": 0.0002452772427880067, + "loss": 0.0241, "step": 140740 }, { - "epoch": 0.71, - "learning_rate": 0.0001934847208278047, - "loss": 0.0116, + "epoch": 0.36, + "learning_rate": 0.0002452733545716352, + "loss": 0.0196, "step": 140750 }, { - "epoch": 0.71, - "learning_rate": 0.0001934771531347907, - "loss": 0.0139, + "epoch": 0.36, + "learning_rate": 0.0002452694663552637, + "loss": 0.0224, "step": 140760 }, { - "epoch": 0.71, - "learning_rate": 0.00019346958544177667, - "loss": 0.0136, + "epoch": 0.36, + "learning_rate": 0.0002452655781388922, + "loss": 0.0205, "step": 140770 }, { - "epoch": 0.71, - "learning_rate": 0.00019346201774876268, - "loss": 0.011, + "epoch": 0.36, + "learning_rate": 0.0002452616899225208, + "loss": 0.0209, "step": 140780 }, { - "epoch": 0.71, - "learning_rate": 0.00019345445005574866, - "loss": 0.0107, + "epoch": 0.36, + "learning_rate": 0.0002452578017061493, + "loss": 0.0185, "step": 140790 }, { - "epoch": 0.71, - "learning_rate": 0.00019344688236273464, - "loss": 0.0098, + "epoch": 0.36, + "learning_rate": 0.00024525391348977787, + "loss": 0.0212, "step": 140800 }, { - "epoch": 0.71, - "learning_rate": 0.00019343931466972065, - "loss": 0.0113, + "epoch": 0.36, + "learning_rate": 0.0002452500252734064, + "loss": 0.02, "step": 140810 }, { - "epoch": 0.71, - "learning_rate": 0.00019343174697670663, - "loss": 0.0161, + "epoch": 0.37, + "learning_rate": 0.00024524613705703495, + "loss": 0.0236, "step": 140820 }, { - "epoch": 0.71, - "learning_rate": 0.0001934241792836926, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.00024524224884066347, + "loss": 0.0196, "step": 140830 }, { - "epoch": 0.71, - "learning_rate": 0.0001934166115906786, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.000245238360624292, + "loss": 0.0249, "step": 140840 }, { - "epoch": 0.71, - "learning_rate": 0.0001934090438976646, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002452344724079205, + "loss": 0.0203, "step": 140850 }, { - "epoch": 0.71, - "learning_rate": 0.00019340147620465058, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024523058419154907, + "loss": 0.0232, "step": 140860 }, { - "epoch": 0.71, - "learning_rate": 0.00019339390851163656, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024522669597517764, + "loss": 0.0229, "step": 140870 }, { - "epoch": 0.71, - "learning_rate": 0.00019338634081862257, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024522280775880615, + "loss": 0.024, "step": 140880 }, { - "epoch": 0.71, - "learning_rate": 0.00019337877312560855, - "loss": 0.0095, + "epoch": 0.37, + "learning_rate": 0.00024521891954243466, + "loss": 0.0189, "step": 140890 }, { - "epoch": 0.71, - "learning_rate": 0.00019337120543259454, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024521503132606323, + "loss": 0.0198, "step": 140900 }, { - "epoch": 0.71, - "learning_rate": 0.00019336363773958054, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024521114310969175, + "loss": 0.0157, "step": 140910 }, { - "epoch": 0.71, - "learning_rate": 0.00019335607004656653, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.00024520725489332026, + "loss": 0.0219, "step": 140920 }, { - "epoch": 0.71, - "learning_rate": 0.0001933485023535525, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024520336667694883, + "loss": 0.0207, "step": 140930 }, { - "epoch": 0.71, - "learning_rate": 0.00019334093466053852, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024519947846057735, + "loss": 0.0223, "step": 140940 }, { - "epoch": 0.71, - "learning_rate": 0.0001933333669675245, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.0002451955902442059, + "loss": 0.0213, "step": 140950 }, { - "epoch": 0.71, - "learning_rate": 0.00019332579927451048, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024519170202783443, + "loss": 0.0233, "step": 140960 }, { - "epoch": 0.71, - "learning_rate": 0.0001933182315814965, - "loss": 0.0111, + "epoch": 0.37, + "learning_rate": 0.00024518781381146294, + "loss": 0.0178, "step": 140970 }, { - "epoch": 0.71, - "learning_rate": 0.00019331066388848247, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.00024518392559509146, + "loss": 0.0178, "step": 140980 }, { - "epoch": 0.71, - "learning_rate": 0.00019330309619546845, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024518003737872, + "loss": 0.0191, "step": 140990 }, { - "epoch": 0.71, - "learning_rate": 0.00019329552850245443, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024517614916234854, + "loss": 0.021, "step": 141000 }, { - "epoch": 0.71, - "eval_cer": 0.9144789894682909, - "eval_loss": 0.009155085310339928, - "eval_runtime": 116.8383, - "eval_samples_per_second": 17.118, - "eval_steps_per_second": 4.279, + "epoch": 0.37, + "eval_cer": 0.881751673615864, + "eval_loss": 0.013707040809094906, + "eval_runtime": 107.3675, + "eval_samples_per_second": 18.628, + "eval_steps_per_second": 4.657, "step": 141000 }, { - "epoch": 0.71, - "learning_rate": 0.00019328796080944044, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002451722609459771, + "loss": 0.02, "step": 141010 }, { - "epoch": 0.71, - "learning_rate": 0.00019328039311642642, - "loss": 0.0152, + "epoch": 0.37, + "learning_rate": 0.0002451683727296056, + "loss": 0.025, "step": 141020 }, { - "epoch": 0.71, - "learning_rate": 0.0001932728254234124, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.0002451644845132342, + "loss": 0.0184, "step": 141030 }, { - "epoch": 0.71, - "learning_rate": 0.0001932652577303984, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.0002451605962968627, + "loss": 0.0201, "step": 141040 }, { - "epoch": 0.71, - "learning_rate": 0.0001932576900373844, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.0002451567080804912, + "loss": 0.0246, "step": 141050 }, { - "epoch": 0.71, - "learning_rate": 0.00019325012234437037, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.0002451528198641198, + "loss": 0.0242, "step": 141060 }, { - "epoch": 0.71, - "learning_rate": 0.00019324255465135638, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002451489316477483, + "loss": 0.0196, "step": 141070 }, { - "epoch": 0.71, - "learning_rate": 0.00019323498695834236, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.0002451450434313769, + "loss": 0.0184, "step": 141080 }, { - "epoch": 0.71, - "learning_rate": 0.00019322741926532835, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.0002451411552150054, + "loss": 0.0204, "step": 141090 }, { - "epoch": 0.71, - "learning_rate": 0.00019321985157231435, - "loss": 0.0108, + "epoch": 0.37, + "learning_rate": 0.0002451372669986339, + "loss": 0.0174, "step": 141100 }, { - "epoch": 0.71, - "learning_rate": 0.00019321228387930034, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024513337878226247, + "loss": 0.0163, "step": 141110 }, { - "epoch": 0.71, - "learning_rate": 0.00019320471618628632, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.000245129490565891, + "loss": 0.025, "step": 141120 }, { - "epoch": 0.71, - "learning_rate": 0.00019319714849327233, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002451256023495195, + "loss": 0.0191, "step": 141130 }, { - "epoch": 0.71, - "learning_rate": 0.0001931895808002583, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.00024512171413314807, + "loss": 0.022, "step": 141140 }, { - "epoch": 0.71, - "learning_rate": 0.0001931820131072443, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.0002451178259167766, + "loss": 0.0183, "step": 141150 }, { - "epoch": 0.71, - "learning_rate": 0.00019317444541423027, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.00024511393770040515, + "loss": 0.0149, "step": 141160 }, { - "epoch": 0.71, - "learning_rate": 0.00019316687772121628, - "loss": 0.0108, + "epoch": 0.37, + "learning_rate": 0.00024511004948403367, + "loss": 0.0181, "step": 141170 }, { - "epoch": 0.71, - "learning_rate": 0.00019315931002820226, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.0002451061612676622, + "loss": 0.0156, "step": 141180 }, { - "epoch": 0.71, - "learning_rate": 0.00019315174233518824, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.0002451022730512907, + "loss": 0.0168, "step": 141190 }, { - "epoch": 0.71, - "learning_rate": 0.00019314417464217425, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024509838483491927, + "loss": 0.0202, "step": 141200 }, { - "epoch": 0.71, - "learning_rate": 0.00019313660694916023, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.00024509449661854783, + "loss": 0.0188, "step": 141210 }, { - "epoch": 0.71, - "learning_rate": 0.0001931290392561462, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024509060840217635, + "loss": 0.0246, "step": 141220 }, { - "epoch": 0.71, - "learning_rate": 0.00019312147156313222, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024508672018580486, + "loss": 0.0237, "step": 141230 }, { - "epoch": 0.71, - "learning_rate": 0.0001931139038701182, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024508283196943343, + "loss": 0.0199, "step": 141240 }, { - "epoch": 0.71, - "learning_rate": 0.00019310633617710418, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024507894375306195, + "loss": 0.0233, "step": 141250 }, { - "epoch": 0.71, - "learning_rate": 0.0001930987684840902, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024507505553669046, + "loss": 0.0236, "step": 141260 }, { - "epoch": 0.71, - "learning_rate": 0.00019309120079107617, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024507116732031903, + "loss": 0.0192, "step": 141270 }, { - "epoch": 0.71, - "learning_rate": 0.00019308363309806216, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024506727910394754, + "loss": 0.0238, "step": 141280 }, { - "epoch": 0.71, - "learning_rate": 0.00019307606540504816, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002450633908875761, + "loss": 0.0228, "step": 141290 }, { - "epoch": 0.71, - "learning_rate": 0.00019306849771203415, - "loss": 0.0113, + "epoch": 0.37, + "learning_rate": 0.00024505950267120463, + "loss": 0.016, "step": 141300 }, { - "epoch": 0.71, - "learning_rate": 0.00019306093001902013, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024505561445483314, + "loss": 0.0178, "step": 141310 }, { - "epoch": 0.71, - "learning_rate": 0.00019305336232600614, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.0002450517262384617, + "loss": 0.0259, "step": 141320 }, { - "epoch": 0.71, - "learning_rate": 0.00019304579463299212, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.0002450478380220902, + "loss": 0.0133, "step": 141330 }, { - "epoch": 0.71, - "learning_rate": 0.0001930382269399781, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024504394980571874, + "loss": 0.0183, "step": 141340 }, { - "epoch": 0.71, - "learning_rate": 0.00019303065924696408, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002450400615893473, + "loss": 0.0212, "step": 141350 }, { - "epoch": 0.71, - "learning_rate": 0.0001930230915539501, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.0002450361733729759, + "loss": 0.0233, "step": 141360 }, { - "epoch": 0.71, - "learning_rate": 0.00019301552386093607, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.0002450322851566044, + "loss": 0.0202, "step": 141370 }, { - "epoch": 0.71, - "learning_rate": 0.00019300795616792205, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.0002450283969402329, + "loss": 0.017, "step": 141380 }, { - "epoch": 0.71, - "learning_rate": 0.00019300038847490806, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.0002450245087238614, + "loss": 0.0219, "step": 141390 }, { - "epoch": 0.71, - "learning_rate": 0.00019299282078189401, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024502062050749, + "loss": 0.02, "step": 141400 }, { - "epoch": 0.71, - "learning_rate": 0.00019298525308888, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.0002450167322911185, + "loss": 0.0224, "step": 141410 }, { - "epoch": 0.71, - "learning_rate": 0.00019297768539586598, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.0002450128440747471, + "loss": 0.0216, "step": 141420 }, { - "epoch": 0.71, - "learning_rate": 0.00019297011770285199, - "loss": 0.0157, + "epoch": 0.37, + "learning_rate": 0.0002450089558583756, + "loss": 0.0209, "step": 141430 }, { - "epoch": 0.71, - "learning_rate": 0.00019296255000983797, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.0002450050676420041, + "loss": 0.0211, "step": 141440 }, { - "epoch": 0.71, - "learning_rate": 0.00019295498231682395, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024500117942563267, + "loss": 0.0181, "step": 141450 }, { - "epoch": 0.71, - "learning_rate": 0.00019294741462380996, - "loss": 0.0173, + "epoch": 0.37, + "learning_rate": 0.0002449972912092612, + "loss": 0.0188, "step": 141460 }, { - "epoch": 0.71, - "learning_rate": 0.00019293984693079594, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.0002449934029928897, + "loss": 0.0206, "step": 141470 }, { - "epoch": 0.71, - "learning_rate": 0.00019293227923778192, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024498951477651827, + "loss": 0.0213, "step": 141480 }, { - "epoch": 0.71, - "learning_rate": 0.00019292471154476793, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002449856265601468, + "loss": 0.02, "step": 141490 }, { - "epoch": 0.71, - "learning_rate": 0.0001929171438517539, - "loss": 0.0169, + "epoch": 0.37, + "learning_rate": 0.00024498173834377535, + "loss": 0.0202, "step": 141500 }, { - "epoch": 0.71, - "learning_rate": 0.0001929095761587399, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024497785012740387, + "loss": 0.019, "step": 141510 }, { - "epoch": 0.71, - "learning_rate": 0.0001929020084657259, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.0002449739619110324, + "loss": 0.0163, "step": 141520 }, { - "epoch": 0.71, - "learning_rate": 0.00019289444077271188, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024497007369466095, + "loss": 0.0186, "step": 141530 }, { - "epoch": 0.71, - "learning_rate": 0.00019288687307969786, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024496618547828946, + "loss": 0.0173, "step": 141540 }, { - "epoch": 0.71, - "learning_rate": 0.00019287930538668384, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.000244962297261918, + "loss": 0.0164, "step": 141550 }, { - "epoch": 0.71, - "learning_rate": 0.00019287173769366985, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024495840904554655, + "loss": 0.0176, "step": 141560 }, { - "epoch": 0.71, - "learning_rate": 0.00019286417000065583, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.0002449545208291751, + "loss": 0.0175, "step": 141570 }, { - "epoch": 0.71, - "learning_rate": 0.00019285660230764182, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024495063261280363, + "loss": 0.0247, "step": 141580 }, { - "epoch": 0.71, - "learning_rate": 0.00019284903461462782, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.00024494674439643215, + "loss": 0.017, "step": 141590 }, { - "epoch": 0.71, - "learning_rate": 0.0001928414669216138, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.00024494285618006066, + "loss": 0.0213, "step": 141600 }, { - "epoch": 0.71, - "learning_rate": 0.0001928338992285998, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024493896796368923, + "loss": 0.0205, "step": 141610 }, { - "epoch": 0.71, - "learning_rate": 0.0001928263315355858, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024493507974731774, + "loss": 0.0171, "step": 141620 }, { - "epoch": 0.71, - "learning_rate": 0.00019281876384257178, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.0002449311915309463, + "loss": 0.0189, "step": 141630 }, { - "epoch": 0.71, - "learning_rate": 0.00019281119614955776, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002449273033145748, + "loss": 0.0221, "step": 141640 }, { - "epoch": 0.71, - "learning_rate": 0.00019280362845654377, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.0002449234150982034, + "loss": 0.0195, "step": 141650 }, { - "epoch": 0.71, - "learning_rate": 0.00019279606076352975, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002449195268818319, + "loss": 0.0194, "step": 141660 }, { - "epoch": 0.71, - "learning_rate": 0.00019278849307051573, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.0002449156386654604, + "loss": 0.0206, "step": 141670 }, { - "epoch": 0.71, - "learning_rate": 0.00019278092537750174, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024491175044908894, + "loss": 0.0195, "step": 141680 }, { - "epoch": 0.71, - "learning_rate": 0.00019277335768448772, - "loss": 0.0108, + "epoch": 0.37, + "learning_rate": 0.0002449078622327175, + "loss": 0.0246, "step": 141690 }, { - "epoch": 0.71, - "learning_rate": 0.0001927657899914737, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.0002449039740163461, + "loss": 0.0185, "step": 141700 }, { - "epoch": 0.71, - "learning_rate": 0.0001927582222984597, - "loss": 0.0109, + "epoch": 0.37, + "learning_rate": 0.0002449000857999746, + "loss": 0.0226, "step": 141710 }, { - "epoch": 0.71, - "learning_rate": 0.0001927506546054457, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.0002448961975836031, + "loss": 0.021, "step": 141720 }, { - "epoch": 0.72, - "learning_rate": 0.00019274308691243167, - "loss": 0.0158, + "epoch": 0.37, + "learning_rate": 0.0002448923093672316, + "loss": 0.018, "step": 141730 }, { - "epoch": 0.72, - "learning_rate": 0.00019273551921941765, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.0002448884211508602, + "loss": 0.0163, "step": 141740 }, { - "epoch": 0.72, - "learning_rate": 0.00019272795152640366, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.0002448845329344887, + "loss": 0.0166, "step": 141750 }, { - "epoch": 0.72, - "learning_rate": 0.00019272038383338964, - "loss": 0.0113, + "epoch": 0.37, + "learning_rate": 0.00024488064471811727, + "loss": 0.0202, "step": 141760 }, { - "epoch": 0.72, - "learning_rate": 0.00019271281614037563, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.0002448767565017458, + "loss": 0.0168, "step": 141770 }, { - "epoch": 0.72, - "learning_rate": 0.00019270524844736163, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024487286828537436, + "loss": 0.0332, "step": 141780 }, { - "epoch": 0.72, - "learning_rate": 0.00019269768075434762, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024486898006900287, + "loss": 0.0185, "step": 141790 }, { - "epoch": 0.72, - "learning_rate": 0.0001926901130613336, - "loss": 0.0109, + "epoch": 0.37, + "learning_rate": 0.0002448650918526314, + "loss": 0.0211, "step": 141800 }, { - "epoch": 0.72, - "learning_rate": 0.0001926825453683196, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.0002448612036362599, + "loss": 0.0179, "step": 141810 }, { - "epoch": 0.72, - "learning_rate": 0.0001926749776753056, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024485731541988847, + "loss": 0.0176, "step": 141820 }, { - "epoch": 0.72, - "learning_rate": 0.00019266740998229157, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.000244853427203517, + "loss": 0.0204, "step": 141830 }, { - "epoch": 0.72, - "learning_rate": 0.00019265984228927758, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.00024484953898714555, + "loss": 0.0216, "step": 141840 }, { - "epoch": 0.72, - "learning_rate": 0.00019265227459626356, - "loss": 0.0221, + "epoch": 0.37, + "learning_rate": 0.00024484565077077407, + "loss": 0.0211, "step": 141850 }, { - "epoch": 0.72, - "learning_rate": 0.00019264470690324954, - "loss": 0.0091, + "epoch": 0.37, + "learning_rate": 0.00024484176255440263, + "loss": 0.0224, "step": 141860 }, { - "epoch": 0.72, - "learning_rate": 0.00019263713921023555, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024483787433803115, + "loss": 0.0162, "step": 141870 }, { - "epoch": 0.72, - "learning_rate": 0.00019262957151722153, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024483398612165966, + "loss": 0.0216, "step": 141880 }, { - "epoch": 0.72, - "learning_rate": 0.0001926220038242075, - "loss": 0.0193, + "epoch": 0.37, + "learning_rate": 0.0002448300979052882, + "loss": 0.0207, "step": 141890 }, { - "epoch": 0.72, - "learning_rate": 0.0001926144361311935, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024482620968891675, + "loss": 0.0189, "step": 141900 }, { - "epoch": 0.72, - "learning_rate": 0.0001926068684381795, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.0002448223214725453, + "loss": 0.0212, "step": 141910 }, { - "epoch": 0.72, - "learning_rate": 0.00019259930074516548, - "loss": 0.0165, + "epoch": 0.37, + "learning_rate": 0.00024481843325617383, + "loss": 0.0225, "step": 141920 }, { - "epoch": 0.72, - "learning_rate": 0.00019259173305215146, - "loss": 0.0159, + "epoch": 0.37, + "learning_rate": 0.00024481454503980234, + "loss": 0.0201, "step": 141930 }, { - "epoch": 0.72, - "learning_rate": 0.00019258416535913747, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024481065682343086, + "loss": 0.0171, "step": 141940 }, { - "epoch": 0.72, - "learning_rate": 0.00019257659766612345, - "loss": 0.0166, + "epoch": 0.37, + "learning_rate": 0.00024480676860705943, + "loss": 0.0159, "step": 141950 }, { - "epoch": 0.72, - "learning_rate": 0.00019256902997310944, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024480288039068794, + "loss": 0.0184, "step": 141960 }, { - "epoch": 0.72, - "learning_rate": 0.00019256146228009544, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.0002447989921743165, + "loss": 0.0179, "step": 141970 }, { - "epoch": 0.72, - "learning_rate": 0.00019255389458708143, + "epoch": 0.37, + "learning_rate": 0.000244795103957945, "loss": 0.0146, "step": 141980 }, { - "epoch": 0.72, - "learning_rate": 0.0001925463268940674, - "loss": 0.015, + "epoch": 0.37, + "learning_rate": 0.0002447912157415736, + "loss": 0.0225, "step": 141990 }, { - "epoch": 0.72, - "learning_rate": 0.00019253875920105342, - "loss": 0.0109, + "epoch": 0.37, + "learning_rate": 0.0002447873275252021, + "loss": 0.0215, "step": 142000 }, { - "epoch": 0.72, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.009451182559132576, - "eval_runtime": 116.6955, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.37, + "eval_cer": 0.8817838652653501, + "eval_loss": 0.013540214858949184, + "eval_runtime": 107.2038, + "eval_samples_per_second": 18.656, + "eval_steps_per_second": 4.664, "step": 142000 }, { - "epoch": 0.72, - "learning_rate": 0.0001925311915080394, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.0002447834393088306, + "loss": 0.0176, "step": 142010 }, { - "epoch": 0.72, - "learning_rate": 0.00019252362381502538, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024477955109245914, + "loss": 0.0222, "step": 142020 }, { - "epoch": 0.72, - "learning_rate": 0.0001925160561220114, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.0002447756628760877, + "loss": 0.023, "step": 142030 }, { - "epoch": 0.72, - "learning_rate": 0.00019250848842899737, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.0002447717746597162, + "loss": 0.0215, "step": 142040 }, { - "epoch": 0.72, - "learning_rate": 0.00019250092073598335, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.0002447678864433448, + "loss": 0.0245, "step": 142050 }, { - "epoch": 0.72, - "learning_rate": 0.00019249335304296933, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.0002447639982269733, + "loss": 0.0216, "step": 142060 }, { - "epoch": 0.72, - "learning_rate": 0.00019248578534995534, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.0002447601100106019, + "loss": 0.019, "step": 142070 }, { - "epoch": 0.72, - "learning_rate": 0.00019247821765694132, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.0002447562217942304, + "loss": 0.0218, "step": 142080 }, { - "epoch": 0.72, - "learning_rate": 0.0001924706499639273, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.0002447523335778589, + "loss": 0.032, "step": 142090 }, { - "epoch": 0.72, - "learning_rate": 0.0001924630822709133, - "loss": 0.0106, + "epoch": 0.37, + "learning_rate": 0.00024474844536148747, + "loss": 0.0201, "step": 142100 }, { - "epoch": 0.72, - "learning_rate": 0.0001924555145778993, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.000244744557145116, + "loss": 0.017, "step": 142110 }, { - "epoch": 0.72, - "learning_rate": 0.00019244794688488527, - "loss": 0.0152, + "epoch": 0.37, + "learning_rate": 0.00024474066892874455, + "loss": 0.0207, "step": 142120 }, { - "epoch": 0.72, - "learning_rate": 0.00019244037919187128, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024473678071237307, + "loss": 0.0204, "step": 142130 }, { - "epoch": 0.72, - "learning_rate": 0.00019243281149885726, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.0002447328924960016, + "loss": 0.0184, "step": 142140 }, { - "epoch": 0.72, - "learning_rate": 0.00019242524380584325, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024472900427963015, + "loss": 0.0174, "step": 142150 }, { - "epoch": 0.72, - "learning_rate": 0.00019241767611282925, - "loss": 0.0171, + "epoch": 0.37, + "learning_rate": 0.00024472511606325867, + "loss": 0.0207, "step": 142160 }, { - "epoch": 0.72, - "learning_rate": 0.00019241010841981524, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.0002447212278468872, + "loss": 0.0221, "step": 142170 }, { - "epoch": 0.72, - "learning_rate": 0.00019240254072680122, - "loss": 0.0184, + "epoch": 0.37, + "learning_rate": 0.00024471733963051575, + "loss": 0.0201, "step": 142180 }, { - "epoch": 0.72, - "learning_rate": 0.00019239497303378723, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.00024471345141414426, + "loss": 0.0194, "step": 142190 }, { - "epoch": 0.72, - "learning_rate": 0.0001923874053407732, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024470956319777283, + "loss": 0.0194, "step": 142200 }, { - "epoch": 0.72, - "learning_rate": 0.0001923798376477592, + "epoch": 0.37, + "learning_rate": 0.00024470567498140135, "loss": 0.018, "step": 142210 }, { - "epoch": 0.72, - "learning_rate": 0.0001923722699547452, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024470178676502986, + "loss": 0.0162, "step": 142220 }, { - "epoch": 0.72, - "learning_rate": 0.00019236470226173118, - "loss": 0.0103, + "epoch": 0.37, + "learning_rate": 0.0002446978985486584, + "loss": 0.019, "step": 142230 }, { - "epoch": 0.72, - "learning_rate": 0.00019235713456871716, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.00024469401033228695, + "loss": 0.0166, "step": 142240 }, { - "epoch": 0.72, - "learning_rate": 0.00019234956687570314, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.0002446901221159155, + "loss": 0.0193, "step": 142250 }, { - "epoch": 0.72, - "learning_rate": 0.00019234199918268915, - "loss": 0.0158, + "epoch": 0.37, + "learning_rate": 0.00024468623389954403, + "loss": 0.0223, "step": 142260 }, { - "epoch": 0.72, - "learning_rate": 0.00019233443148967513, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024468234568317254, + "loss": 0.0235, "step": 142270 }, { - "epoch": 0.72, - "learning_rate": 0.0001923268637966611, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.0002446784574668011, + "loss": 0.0162, "step": 142280 }, { - "epoch": 0.72, - "learning_rate": 0.00019231929610364712, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.0002446745692504296, + "loss": 0.0191, "step": 142290 }, { - "epoch": 0.72, - "learning_rate": 0.0001923117284106331, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024467068103405814, + "loss": 0.0178, "step": 142300 }, { - "epoch": 0.72, - "learning_rate": 0.00019230416071761908, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002446667928176867, + "loss": 0.0229, "step": 142310 }, { - "epoch": 0.72, - "learning_rate": 0.0001922965930246051, - "loss": 0.0179, + "epoch": 0.37, + "learning_rate": 0.0002446629046013152, + "loss": 0.0271, "step": 142320 }, { - "epoch": 0.72, - "learning_rate": 0.00019228902533159107, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002446590163849438, + "loss": 0.0199, "step": 142330 }, { - "epoch": 0.72, - "learning_rate": 0.00019228145763857706, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.0002446551281685723, + "loss": 0.018, "step": 142340 }, { - "epoch": 0.72, - "learning_rate": 0.00019227388994556306, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.0002446512399522008, + "loss": 0.0187, "step": 142350 }, { - "epoch": 0.72, - "learning_rate": 0.00019226632225254905, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.0002446473517358294, + "loss": 0.0159, "step": 142360 }, { - "epoch": 0.72, - "learning_rate": 0.00019225875455953503, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.0002446434635194579, + "loss": 0.0195, "step": 142370 }, { - "epoch": 0.72, - "learning_rate": 0.00019225118686652104, - "loss": 0.0181, + "epoch": 0.37, + "learning_rate": 0.0002446395753030864, + "loss": 0.0175, "step": 142380 }, { - "epoch": 0.72, - "learning_rate": 0.00019224361917350702, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.000244635687086715, + "loss": 0.0208, "step": 142390 }, { - "epoch": 0.72, - "learning_rate": 0.000192236051480493, - "loss": 0.0149, + "epoch": 0.37, + "learning_rate": 0.00024463179887034356, + "loss": 0.0201, "step": 142400 }, { - "epoch": 0.72, - "learning_rate": 0.00019222848378747898, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.00024462791065397207, + "loss": 0.0211, "step": 142410 }, { - "epoch": 0.72, - "learning_rate": 0.000192220916094465, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002446240224376006, + "loss": 0.0238, "step": 142420 }, { - "epoch": 0.72, - "learning_rate": 0.00019221334840145097, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.0002446201342212291, + "loss": 0.0168, "step": 142430 }, { - "epoch": 0.72, - "learning_rate": 0.00019220578070843695, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.0002446162460048576, + "loss": 0.017, "step": 142440 }, { - "epoch": 0.72, - "learning_rate": 0.00019219821301542296, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.0002446123577884862, + "loss": 0.0254, "step": 142450 }, { - "epoch": 0.72, - "learning_rate": 0.00019219064532240894, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024460846957211475, + "loss": 0.0216, "step": 142460 }, { - "epoch": 0.72, - "learning_rate": 0.00019218307762939492, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024460458135574327, + "loss": 0.0221, "step": 142470 }, { - "epoch": 0.72, - "learning_rate": 0.00019217550993638093, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002446006931393718, + "loss": 0.0156, "step": 142480 }, { - "epoch": 0.72, - "learning_rate": 0.0001921679422433669, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024459680492300035, + "loss": 0.0212, "step": 142490 }, { - "epoch": 0.72, - "learning_rate": 0.0001921603745503529, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024459291670662887, + "loss": 0.023, "step": 142500 }, { - "epoch": 0.72, - "learning_rate": 0.0001921528068573389, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.0002445890284902574, + "loss": 0.0181, "step": 142510 }, { - "epoch": 0.72, - "learning_rate": 0.00019214523916432488, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024458514027388595, + "loss": 0.0197, "step": 142520 }, { - "epoch": 0.72, - "learning_rate": 0.00019213767147131087, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024458125205751446, + "loss": 0.0222, "step": 142530 }, { - "epoch": 0.72, - "learning_rate": 0.00019213010377829687, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.00024457736384114303, + "loss": 0.0186, "step": 142540 }, { - "epoch": 0.72, - "learning_rate": 0.00019212253608528286, - "loss": 0.0103, + "epoch": 0.37, + "learning_rate": 0.00024457347562477155, + "loss": 0.0189, "step": 142550 }, { - "epoch": 0.72, - "learning_rate": 0.00019211496839226884, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.00024456958740840006, + "loss": 0.0155, "step": 142560 }, { - "epoch": 0.72, - "learning_rate": 0.00019210740069925482, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024456569919202863, + "loss": 0.0171, "step": 142570 }, { - "epoch": 0.72, - "learning_rate": 0.00019209983300624083, - "loss": 0.0091, + "epoch": 0.37, + "learning_rate": 0.00024456181097565714, + "loss": 0.018, "step": 142580 }, { - "epoch": 0.72, - "learning_rate": 0.0001920922653132268, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024455792275928566, + "loss": 0.0173, "step": 142590 }, { - "epoch": 0.72, - "learning_rate": 0.0001920846976202128, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.00024455403454291423, + "loss": 0.0222, "step": 142600 }, { - "epoch": 0.72, - "learning_rate": 0.0001920771299271988, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.0002445501463265428, + "loss": 0.0174, "step": 142610 }, { - "epoch": 0.72, - "learning_rate": 0.00019206956223418478, - "loss": 0.01, + "epoch": 0.37, + "learning_rate": 0.0002445462581101713, + "loss": 0.0191, "step": 142620 }, { - "epoch": 0.72, - "learning_rate": 0.00019206199454117076, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.0002445423698937998, + "loss": 0.0218, "step": 142630 }, { - "epoch": 0.72, - "learning_rate": 0.00019205442684815677, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024453848167742834, + "loss": 0.0175, "step": 142640 }, { - "epoch": 0.72, - "learning_rate": 0.00019204685915514275, - "loss": 0.0164, + "epoch": 0.37, + "learning_rate": 0.0002445345934610569, + "loss": 0.0141, "step": 142650 }, { - "epoch": 0.72, - "learning_rate": 0.0001920392914621287, - "loss": 0.0102, + "epoch": 0.37, + "learning_rate": 0.0002445307052446854, + "loss": 0.0215, "step": 142660 }, { - "epoch": 0.72, - "learning_rate": 0.0001920317237691147, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.000244526817028314, + "loss": 0.0164, "step": 142670 }, { - "epoch": 0.72, - "learning_rate": 0.0001920241560761007, - "loss": 0.0115, + "epoch": 0.37, + "learning_rate": 0.0002445229288119425, + "loss": 0.0214, "step": 142680 }, { - "epoch": 0.72, - "learning_rate": 0.00019201658838308668, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.000244519040595571, + "loss": 0.0234, "step": 142690 }, { - "epoch": 0.72, - "learning_rate": 0.00019200902069007266, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.0002445151523791996, + "loss": 0.018, "step": 142700 }, { - "epoch": 0.72, - "learning_rate": 0.00019200145299705867, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.0002445112641628281, + "loss": 0.021, "step": 142710 }, { - "epoch": 0.72, - "learning_rate": 0.00019199388530404465, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.0002445073759464566, + "loss": 0.0208, "step": 142720 }, { - "epoch": 0.72, - "learning_rate": 0.00019198631761103063, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.0002445034877300852, + "loss": 0.0196, "step": 142730 }, { - "epoch": 0.72, - "learning_rate": 0.00019197874991801664, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.0002444995995137137, + "loss": 0.0202, "step": 142740 }, { - "epoch": 0.72, - "learning_rate": 0.00019197118222500262, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024449571129734227, + "loss": 0.0189, "step": 142750 }, { - "epoch": 0.72, - "learning_rate": 0.0001919636145319886, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.0002444918230809708, + "loss": 0.0154, "step": 142760 }, { - "epoch": 0.72, - "learning_rate": 0.0001919560468389746, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.0002444879348645993, + "loss": 0.0178, "step": 142770 }, { - "epoch": 0.72, - "learning_rate": 0.0001919484791459606, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024448404664822787, + "loss": 0.0212, "step": 142780 }, { - "epoch": 0.72, - "learning_rate": 0.00019194091145294657, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002444801584318564, + "loss": 0.0165, "step": 142790 }, { - "epoch": 0.72, - "learning_rate": 0.00019193334375993255, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024447627021548495, + "loss": 0.0165, "step": 142800 }, { - "epoch": 0.72, - "learning_rate": 0.00019192577606691856, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024447238199911347, + "loss": 0.0182, "step": 142810 }, { - "epoch": 0.72, - "learning_rate": 0.00019191820837390454, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.00024446849378274204, + "loss": 0.0183, "step": 142820 }, { - "epoch": 0.72, - "learning_rate": 0.00019191064068089053, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024446460556637055, + "loss": 0.0215, "step": 142830 }, { - "epoch": 0.72, - "learning_rate": 0.00019190307298787653, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024446071734999906, + "loss": 0.0193, "step": 142840 }, { - "epoch": 0.72, - "learning_rate": 0.00019189550529486252, - "loss": 0.0115, + "epoch": 0.37, + "learning_rate": 0.0002444568291336276, + "loss": 0.0188, "step": 142850 }, { - "epoch": 0.72, - "learning_rate": 0.0001918879376018485, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024445294091725615, + "loss": 0.0179, "step": 142860 }, { - "epoch": 0.72, - "learning_rate": 0.0001918803699088345, - "loss": 0.0101, + "epoch": 0.37, + "learning_rate": 0.00024444905270088466, + "loss": 0.0195, "step": 142870 }, { - "epoch": 0.72, - "learning_rate": 0.0001918728022158205, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024444516448451323, + "loss": 0.0235, "step": 142880 }, { - "epoch": 0.72, - "learning_rate": 0.00019186523452280647, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024444127626814175, + "loss": 0.0147, "step": 142890 }, { - "epoch": 0.72, - "learning_rate": 0.00019185766682979248, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.0002444373880517703, + "loss": 0.019, "step": 142900 }, { - "epoch": 0.72, - "learning_rate": 0.00019185009913677846, - "loss": 0.0171, + "epoch": 0.37, + "learning_rate": 0.00024443349983539883, + "loss": 0.0204, "step": 142910 }, { - "epoch": 0.72, - "learning_rate": 0.00019184253144376444, - "loss": 0.0109, + "epoch": 0.37, + "learning_rate": 0.00024442961161902734, + "loss": 0.0167, "step": 142920 }, { - "epoch": 0.72, - "learning_rate": 0.00019183496375075045, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024442572340265586, + "loss": 0.0155, "step": 142930 }, { - "epoch": 0.72, - "learning_rate": 0.00019182739605773643, - "loss": 0.0149, + "epoch": 0.37, + "learning_rate": 0.0002444218351862844, + "loss": 0.0229, "step": 142940 }, { - "epoch": 0.72, - "learning_rate": 0.0001918198283647224, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.000244417946969913, + "loss": 0.0182, "step": 142950 }, { - "epoch": 0.72, - "learning_rate": 0.0001918122606717084, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.0002444140587535415, + "loss": 0.0203, "step": 142960 }, { - "epoch": 0.72, - "learning_rate": 0.0001918046929786944, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024441017053717, + "loss": 0.0189, "step": 142970 }, { - "epoch": 0.72, - "learning_rate": 0.00019179712528568038, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024440628232079854, + "loss": 0.0207, "step": 142980 }, { - "epoch": 0.72, - "learning_rate": 0.00019178955759266636, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.0002444023941044271, + "loss": 0.0215, "step": 142990 }, { - "epoch": 0.72, - "learning_rate": 0.00019178198989965237, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.0002443985058880556, + "loss": 0.022, "step": 143000 }, { - "epoch": 0.72, - "eval_cer": 0.9144770486760401, - "eval_loss": 0.00942008476704359, - "eval_runtime": 116.7292, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.37, + "eval_cer": 0.8818286536472439, + "eval_loss": 0.013993228785693645, + "eval_runtime": 107.6329, + "eval_samples_per_second": 18.582, + "eval_steps_per_second": 4.645, "step": 143000 }, { - "epoch": 0.72, - "learning_rate": 0.00019177442220663835, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.0002443946176716842, + "loss": 0.0182, "step": 143010 }, { - "epoch": 0.72, - "learning_rate": 0.00019176685451362434, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.0002443907294553127, + "loss": 0.0179, "step": 143020 }, { - "epoch": 0.72, - "learning_rate": 0.00019175928682061034, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.0002443868412389413, + "loss": 0.0181, "step": 143030 }, { - "epoch": 0.72, - "learning_rate": 0.00019175171912759633, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002443829530225698, + "loss": 0.016, "step": 143040 }, { - "epoch": 0.72, - "learning_rate": 0.0001917441514345823, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.0002443790648061983, + "loss": 0.0215, "step": 143050 }, { - "epoch": 0.72, - "learning_rate": 0.00019173658374156832, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.0002443751765898268, + "loss": 0.0219, "step": 143060 }, { - "epoch": 0.72, - "learning_rate": 0.0001917290160485543, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.0002443712883734554, + "loss": 0.0195, "step": 143070 }, { - "epoch": 0.72, - "learning_rate": 0.00019172144835554028, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.0002443674001570839, + "loss": 0.0209, "step": 143080 }, { - "epoch": 0.72, - "learning_rate": 0.0001917138806625263, - "loss": 0.0156, + "epoch": 0.37, + "learning_rate": 0.00024436351194071247, + "loss": 0.0194, "step": 143090 }, { - "epoch": 0.72, - "learning_rate": 0.00019170631296951227, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.000244359623724341, + "loss": 0.0202, "step": 143100 }, { - "epoch": 0.72, - "learning_rate": 0.00019169874527649825, - "loss": 0.0142, + "epoch": 0.37, + "learning_rate": 0.00024435573550796955, + "loss": 0.017, "step": 143110 }, { - "epoch": 0.72, - "learning_rate": 0.00019169117758348426, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024435184729159807, + "loss": 0.0219, "step": 143120 }, { - "epoch": 0.72, - "learning_rate": 0.00019168360989047024, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.0002443479590752266, + "loss": 0.0197, "step": 143130 }, { - "epoch": 0.72, - "learning_rate": 0.00019167604219745622, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002443440708588551, + "loss": 0.0221, "step": 143140 }, { - "epoch": 0.72, - "learning_rate": 0.0001916684745044422, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024434018264248367, + "loss": 0.0189, "step": 143150 }, { - "epoch": 0.72, - "learning_rate": 0.0001916609068114282, - "loss": 0.0154, + "epoch": 0.37, + "learning_rate": 0.00024433629442611223, + "loss": 0.0175, "step": 143160 }, { - "epoch": 0.72, - "learning_rate": 0.0001916533391184142, - "loss": 0.0101, + "epoch": 0.37, + "learning_rate": 0.00024433240620974075, + "loss": 0.0202, "step": 143170 }, { - "epoch": 0.72, - "learning_rate": 0.00019164577142540017, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.00024432851799336926, + "loss": 0.0215, "step": 143180 }, { - "epoch": 0.72, - "learning_rate": 0.00019163820373238618, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.0002443246297769978, + "loss": 0.0135, "step": 143190 }, { - "epoch": 0.72, - "learning_rate": 0.00019163063603937216, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.00024432074156062635, + "loss": 0.015, "step": 143200 }, { - "epoch": 0.72, - "learning_rate": 0.00019162306834635815, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.00024431685334425486, + "loss": 0.0231, "step": 143210 }, { - "epoch": 0.72, - "learning_rate": 0.00019161550065334415, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.00024431296512788343, + "loss": 0.0198, "step": 143220 }, { - "epoch": 0.72, - "learning_rate": 0.00019160793296033014, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024430907691151194, + "loss": 0.0205, "step": 143230 }, { - "epoch": 0.72, - "learning_rate": 0.00019160036526731612, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.0002443051886951405, + "loss": 0.0251, "step": 143240 }, { - "epoch": 0.72, - "learning_rate": 0.00019159279757430213, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024430130047876903, + "loss": 0.0202, "step": 143250 }, { - "epoch": 0.72, - "learning_rate": 0.0001915852298812881, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.00024429741226239754, + "loss": 0.0211, "step": 143260 }, { - "epoch": 0.72, - "learning_rate": 0.0001915776621882741, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024429352404602606, + "loss": 0.0174, "step": 143270 }, { - "epoch": 0.72, - "learning_rate": 0.0001915700944952601, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.0002442896358296546, + "loss": 0.0176, "step": 143280 }, { - "epoch": 0.72, - "learning_rate": 0.00019156252680224608, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.0002442857476132832, + "loss": 0.0179, "step": 143290 }, { - "epoch": 0.72, - "learning_rate": 0.00019155495910923206, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.0002442818593969117, + "loss": 0.0205, "step": 143300 }, { - "epoch": 0.72, - "learning_rate": 0.00019154739141621804, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.0002442779711805402, + "loss": 0.0203, "step": 143310 }, { - "epoch": 0.72, - "learning_rate": 0.00019153982372320405, - "loss": 0.0184, + "epoch": 0.37, + "learning_rate": 0.0002442740829641688, + "loss": 0.0263, "step": 143320 }, { - "epoch": 0.72, - "learning_rate": 0.00019153225603019003, - "loss": 0.013, + "epoch": 0.37, + "learning_rate": 0.0002442701947477973, + "loss": 0.0184, "step": 143330 }, { - "epoch": 0.72, - "learning_rate": 0.000191524688337176, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.0002442663065314258, + "loss": 0.0194, "step": 143340 }, { - "epoch": 0.72, - "learning_rate": 0.00019151712064416202, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.0002442624183150544, + "loss": 0.0178, "step": 143350 }, { - "epoch": 0.72, - "learning_rate": 0.000191509552951148, - "loss": 0.0104, + "epoch": 0.37, + "learning_rate": 0.0002442585300986829, + "loss": 0.022, "step": 143360 }, { - "epoch": 0.72, - "learning_rate": 0.00019150198525813398, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024425464188231147, + "loss": 0.0241, "step": 143370 }, { - "epoch": 0.72, - "learning_rate": 0.00019149441756512, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024425075366594, + "loss": 0.0201, "step": 143380 }, { - "epoch": 0.72, - "learning_rate": 0.00019148684987210597, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.0002442468654495685, + "loss": 0.0185, "step": 143390 }, { - "epoch": 0.72, - "learning_rate": 0.00019147928217909196, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024424297723319707, + "loss": 0.0227, "step": 143400 }, { - "epoch": 0.72, - "learning_rate": 0.00019147171448607796, - "loss": 0.0101, + "epoch": 0.37, + "learning_rate": 0.0002442390890168256, + "loss": 0.0223, "step": 143410 }, { - "epoch": 0.72, - "learning_rate": 0.00019146414679306395, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.0002442352008004541, + "loss": 0.0191, "step": 143420 }, { - "epoch": 0.72, - "learning_rate": 0.00019145657910004993, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024423131258408267, + "loss": 0.02, "step": 143430 }, { - "epoch": 0.72, - "learning_rate": 0.00019144901140703594, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.0002442274243677112, + "loss": 0.0191, "step": 143440 }, { - "epoch": 0.72, - "learning_rate": 0.00019144144371402192, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024422353615133975, + "loss": 0.0204, "step": 143450 }, { - "epoch": 0.72, - "learning_rate": 0.0001914338760210079, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024421964793496827, + "loss": 0.021, "step": 143460 }, { - "epoch": 0.72, - "learning_rate": 0.00019142630832799388, - "loss": 0.0151, + "epoch": 0.37, + "learning_rate": 0.0002442157597185968, + "loss": 0.0237, "step": 143470 }, { - "epoch": 0.72, - "learning_rate": 0.0001914187406349799, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.0002442118715022253, + "loss": 0.0191, "step": 143480 }, { - "epoch": 0.72, - "learning_rate": 0.00019141117294196587, - "loss": 0.0106, + "epoch": 0.37, + "learning_rate": 0.00024420798328585386, + "loss": 0.0193, "step": 143490 }, { - "epoch": 0.72, - "learning_rate": 0.00019140360524895185, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024420409506948243, + "loss": 0.0185, "step": 143500 }, { - "epoch": 0.72, - "learning_rate": 0.00019139603755593786, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024420020685311095, + "loss": 0.0221, "step": 143510 }, { - "epoch": 0.72, - "learning_rate": 0.00019138846986292384, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.00024419631863673946, + "loss": 0.0192, "step": 143520 }, { - "epoch": 0.72, - "learning_rate": 0.00019138090216990982, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024419243042036803, + "loss": 0.0181, "step": 143530 }, { - "epoch": 0.72, - "learning_rate": 0.00019137333447689583, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.00024418854220399655, + "loss": 0.0172, "step": 143540 }, { - "epoch": 0.72, - "learning_rate": 0.0001913657667838818, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.00024418465398762506, + "loss": 0.0165, "step": 143550 }, { - "epoch": 0.72, - "learning_rate": 0.0001913581990908678, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024418076577125363, + "loss": 0.0211, "step": 143560 }, { - "epoch": 0.72, - "learning_rate": 0.0001913506313978538, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024417687755488214, + "loss": 0.0184, "step": 143570 }, { - "epoch": 0.72, - "learning_rate": 0.00019134306370483978, - "loss": 0.0104, + "epoch": 0.37, + "learning_rate": 0.0002441729893385107, + "loss": 0.0184, "step": 143580 }, { - "epoch": 0.72, - "learning_rate": 0.00019133549601182577, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002441691011221392, + "loss": 0.0224, "step": 143590 }, { - "epoch": 0.72, - "learning_rate": 0.00019132792831881177, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.00024416521290576774, + "loss": 0.0267, "step": 143600 }, { - "epoch": 0.72, - "learning_rate": 0.00019132036062579776, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.0002441613246893963, + "loss": 0.0242, "step": 143610 }, { - "epoch": 0.72, - "learning_rate": 0.00019131279293278374, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.0002441574364730248, + "loss": 0.0209, "step": 143620 }, { - "epoch": 0.72, - "learning_rate": 0.00019130522523976975, - "loss": 0.0189, + "epoch": 0.37, + "learning_rate": 0.00024415354825665334, + "loss": 0.0208, "step": 143630 }, { - "epoch": 0.72, - "learning_rate": 0.00019129765754675573, - "loss": 0.0178, + "epoch": 0.37, + "learning_rate": 0.0002441496600402819, + "loss": 0.0217, "step": 143640 }, { - "epoch": 0.72, - "learning_rate": 0.0001912900898537417, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.0002441457718239105, + "loss": 0.0259, "step": 143650 }, { - "epoch": 0.72, - "learning_rate": 0.0001912825221607277, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.000244141883607539, + "loss": 0.0221, "step": 143660 }, { - "epoch": 0.72, - "learning_rate": 0.0001912749544677137, - "loss": 0.0155, + "epoch": 0.37, + "learning_rate": 0.0002441379953911675, + "loss": 0.0188, "step": 143670 }, { - "epoch": 0.72, - "learning_rate": 0.00019126738677469968, - "loss": 0.0131, + "epoch": 0.37, + "learning_rate": 0.00024413410717479605, + "loss": 0.0222, "step": 143680 }, { - "epoch": 0.72, - "learning_rate": 0.00019125981908168566, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024413021895842456, + "loss": 0.02, "step": 143690 }, { - "epoch": 0.72, - "learning_rate": 0.00019125225138867167, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024412633074205313, + "loss": 0.0203, "step": 143700 }, { - "epoch": 0.73, - "learning_rate": 0.00019124468369565765, - "loss": 0.0117, + "epoch": 0.37, + "learning_rate": 0.00024412244252568164, + "loss": 0.0195, "step": 143710 }, { - "epoch": 0.73, - "learning_rate": 0.00019123711600264363, - "loss": 0.0148, + "epoch": 0.37, + "learning_rate": 0.00024411855430931019, + "loss": 0.0168, "step": 143720 }, { - "epoch": 0.73, - "learning_rate": 0.00019122954830962964, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.0002441146660929387, + "loss": 0.0219, "step": 143730 }, { - "epoch": 0.73, - "learning_rate": 0.00019122198061661562, - "loss": 0.0124, + "epoch": 0.37, + "learning_rate": 0.00024411077787656727, + "loss": 0.0179, "step": 143740 }, { - "epoch": 0.73, - "learning_rate": 0.0001912144129236016, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024410688966019578, + "loss": 0.0181, "step": 143750 }, { - "epoch": 0.73, - "learning_rate": 0.0001912068452305876, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.00024410300144382433, + "loss": 0.0172, "step": 143760 }, { - "epoch": 0.73, - "learning_rate": 0.0001911992775375736, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024409911322745284, + "loss": 0.0186, "step": 143770 }, { - "epoch": 0.73, - "learning_rate": 0.00019119170984455958, - "loss": 0.0149, + "epoch": 0.37, + "learning_rate": 0.0002440952250110814, + "loss": 0.0234, "step": 143780 }, { - "epoch": 0.73, - "learning_rate": 0.00019118414215154558, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.00024409133679470992, + "loss": 0.0172, "step": 143790 }, { - "epoch": 0.73, - "learning_rate": 0.00019117657445853157, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024408744857833847, + "loss": 0.0196, "step": 143800 }, { - "epoch": 0.73, - "learning_rate": 0.00019116900676551755, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024408356036196698, + "loss": 0.0217, "step": 143810 }, { - "epoch": 0.73, - "learning_rate": 0.00019116143907250353, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.00024407967214559555, + "loss": 0.0192, "step": 143820 }, { - "epoch": 0.73, - "learning_rate": 0.00019115387137948954, - "loss": 0.0146, + "epoch": 0.37, + "learning_rate": 0.0002440757839292241, + "loss": 0.0252, "step": 143830 }, { - "epoch": 0.73, - "learning_rate": 0.00019114630368647552, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.0002440718957128526, + "loss": 0.0214, "step": 143840 }, { - "epoch": 0.73, - "learning_rate": 0.0001911387359934615, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.00024406800749648115, + "loss": 0.0249, "step": 143850 }, { - "epoch": 0.73, - "learning_rate": 0.0001911311683004475, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.0002440641192801097, + "loss": 0.0182, "step": 143860 }, { - "epoch": 0.73, - "learning_rate": 0.0001911236006074335, - "loss": 0.0139, + "epoch": 0.37, + "learning_rate": 0.00024406023106373823, + "loss": 0.0203, "step": 143870 }, { - "epoch": 0.73, - "learning_rate": 0.00019111603291441947, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024405634284736674, + "loss": 0.0259, "step": 143880 }, { - "epoch": 0.73, - "learning_rate": 0.00019110846522140548, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024405245463099529, + "loss": 0.02, "step": 143890 }, { - "epoch": 0.73, - "learning_rate": 0.00019110089752839146, - "loss": 0.0126, + "epoch": 0.37, + "learning_rate": 0.00024404856641462383, + "loss": 0.0193, "step": 143900 }, { - "epoch": 0.73, - "learning_rate": 0.00019109332983537744, - "loss": 0.0127, + "epoch": 0.37, + "learning_rate": 0.00024404467819825237, + "loss": 0.0215, "step": 143910 }, { - "epoch": 0.73, - "learning_rate": 0.0001910857621423634, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024404078998188088, + "loss": 0.0187, "step": 143920 }, { - "epoch": 0.73, - "learning_rate": 0.0001910781944493494, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.00024403690176550943, + "loss": 0.02, "step": 143930 }, { - "epoch": 0.73, - "learning_rate": 0.0001910706267563354, - "loss": 0.0108, + "epoch": 0.37, + "learning_rate": 0.00024403301354913794, + "loss": 0.0228, "step": 143940 }, { - "epoch": 0.73, - "learning_rate": 0.00019106305906332137, - "loss": 0.0166, + "epoch": 0.37, + "learning_rate": 0.0002440291253327665, + "loss": 0.0226, "step": 143950 }, { - "epoch": 0.73, - "learning_rate": 0.00019105549137030738, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024402523711639502, + "loss": 0.0178, "step": 143960 }, { - "epoch": 0.73, - "learning_rate": 0.00019104792367729336, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.00024402134890002356, + "loss": 0.0185, "step": 143970 }, { - "epoch": 0.73, - "learning_rate": 0.00019104035598427934, - "loss": 0.0134, + "epoch": 0.37, + "learning_rate": 0.00024401746068365208, + "loss": 0.0209, "step": 143980 }, { - "epoch": 0.73, - "learning_rate": 0.00019103278829126535, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.00024401357246728065, + "loss": 0.0218, "step": 143990 }, { - "epoch": 0.73, - "learning_rate": 0.00019102522059825133, - "loss": 0.0111, + "epoch": 0.37, + "learning_rate": 0.0002440096842509092, + "loss": 0.0212, "step": 144000 }, { - "epoch": 0.73, - "eval_cer": 0.914481900656667, - "eval_loss": 0.009388601407408714, - "eval_runtime": 116.6959, - "eval_samples_per_second": 17.139, - "eval_steps_per_second": 4.285, + "epoch": 0.37, + "eval_cer": 0.881806259456297, + "eval_loss": 0.014057588763535023, + "eval_runtime": 107.315, + "eval_samples_per_second": 18.637, + "eval_steps_per_second": 4.659, "step": 144000 }, { - "epoch": 0.73, - "learning_rate": 0.0001910176529052373, - "loss": 0.01, + "epoch": 0.37, + "learning_rate": 0.0002440057960345377, + "loss": 0.023, "step": 144010 }, { - "epoch": 0.73, - "learning_rate": 0.00019101008521222332, - "loss": 0.0112, + "epoch": 0.37, + "learning_rate": 0.00024400190781816622, + "loss": 0.0212, "step": 144020 }, { - "epoch": 0.73, - "learning_rate": 0.0001910025175192093, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.0002439980196017948, + "loss": 0.0209, "step": 144030 }, { - "epoch": 0.73, - "learning_rate": 0.00019099494982619528, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024399413138542333, + "loss": 0.0195, "step": 144040 }, { - "epoch": 0.73, - "learning_rate": 0.00019098738213318126, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024399024316905184, + "loss": 0.0245, "step": 144050 }, { - "epoch": 0.73, - "learning_rate": 0.00019097981444016727, - "loss": 0.0136, + "epoch": 0.37, + "learning_rate": 0.00024398635495268039, + "loss": 0.0192, "step": 144060 }, { - "epoch": 0.73, - "learning_rate": 0.00019097224674715325, - "loss": 0.011, + "epoch": 0.37, + "learning_rate": 0.00024398246673630893, + "loss": 0.022, "step": 144070 }, { - "epoch": 0.73, - "learning_rate": 0.00019096467905413924, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024397857851993747, + "loss": 0.0249, "step": 144080 }, { - "epoch": 0.73, - "learning_rate": 0.00019095711136112524, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.00024397469030356598, + "loss": 0.0198, "step": 144090 }, { - "epoch": 0.73, - "learning_rate": 0.00019094954366811123, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024397080208719452, + "loss": 0.0166, "step": 144100 }, { - "epoch": 0.73, - "learning_rate": 0.0001909419759750972, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024396691387082307, + "loss": 0.0193, "step": 144110 }, { - "epoch": 0.73, - "learning_rate": 0.00019093440828208322, - "loss": 0.0133, + "epoch": 0.37, + "learning_rate": 0.0002439630256544516, + "loss": 0.0195, "step": 144120 }, { - "epoch": 0.73, - "learning_rate": 0.0001909268405890692, - "loss": 0.0107, + "epoch": 0.37, + "learning_rate": 0.00024395913743808012, + "loss": 0.0189, "step": 144130 }, { - "epoch": 0.73, - "learning_rate": 0.00019091927289605518, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024395524922170866, + "loss": 0.0237, "step": 144140 }, { - "epoch": 0.73, - "learning_rate": 0.0001909117052030412, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024395136100533718, + "loss": 0.0182, "step": 144150 }, { - "epoch": 0.73, - "learning_rate": 0.00019090413751002717, - "loss": 0.0115, + "epoch": 0.37, + "learning_rate": 0.00024394747278896575, + "loss": 0.0198, "step": 144160 }, { - "epoch": 0.73, - "learning_rate": 0.00019089656981701315, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024394358457259426, + "loss": 0.0202, "step": 144170 }, { - "epoch": 0.73, - "learning_rate": 0.00019088900212399916, - "loss": 0.0101, + "epoch": 0.37, + "learning_rate": 0.0002439396963562228, + "loss": 0.0228, "step": 144180 }, { - "epoch": 0.73, - "learning_rate": 0.00019088143443098514, - "loss": 0.016, + "epoch": 0.37, + "learning_rate": 0.00024393580813985132, + "loss": 0.0233, "step": 144190 }, { - "epoch": 0.73, - "learning_rate": 0.00019087386673797112, - "loss": 0.0162, + "epoch": 0.37, + "learning_rate": 0.0002439319199234799, + "loss": 0.0174, "step": 144200 }, { - "epoch": 0.73, - "learning_rate": 0.0001908662990449571, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024392803170710843, + "loss": 0.0219, "step": 144210 }, { - "epoch": 0.73, - "learning_rate": 0.0001908587313519431, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.00024392414349073694, + "loss": 0.0176, "step": 144220 }, { - "epoch": 0.73, - "learning_rate": 0.0001908511636589291, - "loss": 0.0149, + "epoch": 0.37, + "learning_rate": 0.00024392025527436548, + "loss": 0.0165, "step": 144230 }, { - "epoch": 0.73, - "learning_rate": 0.00019084359596591507, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.00024391636705799403, + "loss": 0.0217, "step": 144240 }, { - "epoch": 0.73, - "learning_rate": 0.00019083602827290108, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024391247884162257, + "loss": 0.0149, "step": 144250 }, { - "epoch": 0.73, - "learning_rate": 0.00019082846057988706, - "loss": 0.0098, + "epoch": 0.37, + "learning_rate": 0.00024390859062525108, + "loss": 0.0286, "step": 144260 }, { - "epoch": 0.73, - "learning_rate": 0.00019082089288687305, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.00024390470240887962, + "loss": 0.0187, "step": 144270 }, { - "epoch": 0.73, - "learning_rate": 0.00019081332519385905, - "loss": 0.0129, + "epoch": 0.37, + "learning_rate": 0.00024390081419250817, + "loss": 0.0224, "step": 144280 }, { - "epoch": 0.73, - "learning_rate": 0.00019080575750084504, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.0002438969259761367, + "loss": 0.0183, "step": 144290 }, { - "epoch": 0.73, - "learning_rate": 0.00019079818980783102, - "loss": 0.012, + "epoch": 0.37, + "learning_rate": 0.00024389303775976522, + "loss": 0.0224, "step": 144300 }, { - "epoch": 0.73, - "learning_rate": 0.00019079062211481703, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024388914954339376, + "loss": 0.0328, "step": 144310 }, { - "epoch": 0.73, - "learning_rate": 0.000190783054421803, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024388526132702233, + "loss": 0.0206, "step": 144320 }, { - "epoch": 0.73, - "learning_rate": 0.000190775486728789, - "loss": 0.0153, + "epoch": 0.37, + "learning_rate": 0.00024388137311065085, + "loss": 0.0226, "step": 144330 }, { - "epoch": 0.73, - "learning_rate": 0.000190767919035775, - "loss": 0.014, + "epoch": 0.37, + "learning_rate": 0.00024387748489427936, + "loss": 0.026, "step": 144340 }, { - "epoch": 0.73, - "learning_rate": 0.00019076035134276098, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.0002438735966779079, + "loss": 0.0238, "step": 144350 }, { - "epoch": 0.73, - "learning_rate": 0.00019075278364974696, - "loss": 0.0138, + "epoch": 0.37, + "learning_rate": 0.00024386970846153647, + "loss": 0.0215, "step": 144360 }, { - "epoch": 0.73, - "learning_rate": 0.00019074521595673294, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.00024386582024516499, + "loss": 0.0233, "step": 144370 }, { - "epoch": 0.73, - "learning_rate": 0.00019073764826371895, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.00024386193202879353, + "loss": 0.0296, "step": 144380 }, { - "epoch": 0.73, - "learning_rate": 0.00019073008057070493, - "loss": 0.0144, + "epoch": 0.37, + "learning_rate": 0.00024385804381242204, + "loss": 0.021, "step": 144390 }, { - "epoch": 0.73, - "learning_rate": 0.0001907225128776909, - "loss": 0.0141, + "epoch": 0.37, + "learning_rate": 0.00024385415559605058, + "loss": 0.0208, "step": 144400 }, { - "epoch": 0.73, - "learning_rate": 0.00019071494518467692, - "loss": 0.0119, + "epoch": 0.37, + "learning_rate": 0.00024385026737967913, + "loss": 0.0181, "step": 144410 }, { - "epoch": 0.73, - "learning_rate": 0.0001907073774916629, - "loss": 0.0145, + "epoch": 0.37, + "learning_rate": 0.00024384637916330767, + "loss": 0.0185, "step": 144420 }, { - "epoch": 0.73, - "learning_rate": 0.00019069980979864888, - "loss": 0.0189, + "epoch": 0.37, + "learning_rate": 0.00024384249094693618, + "loss": 0.0194, "step": 144430 }, { - "epoch": 0.73, - "learning_rate": 0.0001906922421056349, - "loss": 0.0111, + "epoch": 0.37, + "learning_rate": 0.00024383860273056472, + "loss": 0.0224, "step": 144440 }, { - "epoch": 0.73, - "learning_rate": 0.00019068467441262087, - "loss": 0.0135, + "epoch": 0.37, + "learning_rate": 0.00024383471451419326, + "loss": 0.0197, "step": 144450 }, { - "epoch": 0.73, - "learning_rate": 0.00019067710671960686, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.0002438308262978218, + "loss": 0.0154, "step": 144460 }, { - "epoch": 0.73, - "learning_rate": 0.00019066953902659286, - "loss": 0.0092, + "epoch": 0.37, + "learning_rate": 0.00024382693808145032, + "loss": 0.0212, "step": 144470 }, { - "epoch": 0.73, - "learning_rate": 0.00019066197133357885, - "loss": 0.0114, + "epoch": 0.37, + "learning_rate": 0.00024382304986507886, + "loss": 0.0207, "step": 144480 }, { - "epoch": 0.73, - "learning_rate": 0.00019065440364056483, - "loss": 0.0122, + "epoch": 0.37, + "learning_rate": 0.0002438191616487074, + "loss": 0.0236, "step": 144490 }, { - "epoch": 0.73, - "learning_rate": 0.00019064683594755084, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024381527343233595, + "loss": 0.0192, "step": 144500 }, { - "epoch": 0.73, - "learning_rate": 0.00019063926825453682, - "loss": 0.0137, + "epoch": 0.37, + "learning_rate": 0.00024381138521596446, + "loss": 0.0185, "step": 144510 }, { - "epoch": 0.73, - "learning_rate": 0.0001906317005615228, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.000243807496999593, + "loss": 0.015, "step": 144520 }, { - "epoch": 0.73, - "learning_rate": 0.0001906241328685088, - "loss": 0.0152, + "epoch": 0.37, + "learning_rate": 0.00024380360878322157, + "loss": 0.0194, "step": 144530 }, { - "epoch": 0.73, - "learning_rate": 0.0001906165651754948, - "loss": 0.0183, + "epoch": 0.37, + "learning_rate": 0.00024379972056685009, + "loss": 0.0217, "step": 144540 }, { - "epoch": 0.73, - "learning_rate": 0.00019060899748248077, - "loss": 0.0167, + "epoch": 0.37, + "learning_rate": 0.00024379583235047863, + "loss": 0.0211, "step": 144550 }, { - "epoch": 0.73, - "learning_rate": 0.00019060142978946675, - "loss": 0.0118, + "epoch": 0.37, + "learning_rate": 0.00024379194413410714, + "loss": 0.022, "step": 144560 }, { - "epoch": 0.73, - "learning_rate": 0.00019059386209645276, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.0002437880559177357, + "loss": 0.0211, "step": 144570 }, { - "epoch": 0.73, - "learning_rate": 0.00019058629440343874, - "loss": 0.0116, + "epoch": 0.37, + "learning_rate": 0.00024378416770136422, + "loss": 0.0248, "step": 144580 }, { - "epoch": 0.73, - "learning_rate": 0.00019057872671042472, - "loss": 0.0121, + "epoch": 0.37, + "learning_rate": 0.00024378027948499277, + "loss": 0.019, "step": 144590 }, { - "epoch": 0.73, - "learning_rate": 0.00019057115901741073, - "loss": 0.0132, + "epoch": 0.37, + "learning_rate": 0.00024377639126862128, + "loss": 0.0181, "step": 144600 }, { - "epoch": 0.73, - "learning_rate": 0.0001905635913243967, - "loss": 0.0143, + "epoch": 0.37, + "learning_rate": 0.00024377250305224985, + "loss": 0.0239, "step": 144610 }, { - "epoch": 0.73, - "learning_rate": 0.0001905560236313827, - "loss": 0.0125, + "epoch": 0.37, + "learning_rate": 0.00024376861483587836, + "loss": 0.0198, "step": 144620 }, { - "epoch": 0.73, - "learning_rate": 0.0001905484559383687, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.0002437647266195069, + "loss": 0.0288, "step": 144630 }, { - "epoch": 0.73, - "learning_rate": 0.00019054088824535468, - "loss": 0.0128, + "epoch": 0.37, + "learning_rate": 0.00024376083840313542, + "loss": 0.0218, "step": 144640 }, { - "epoch": 0.73, - "learning_rate": 0.00019053332055234067, - "loss": 0.0147, + "epoch": 0.37, + "learning_rate": 0.00024375695018676396, + "loss": 0.019, "step": 144650 }, { - "epoch": 0.73, - "learning_rate": 0.00019052575285932667, - "loss": 0.0123, + "epoch": 0.37, + "learning_rate": 0.0002437530619703925, + "loss": 0.0176, "step": 144660 }, { - "epoch": 0.73, - "learning_rate": 0.00019051818516631266, - "loss": 0.0182, + "epoch": 0.38, + "learning_rate": 0.00024374917375402105, + "loss": 0.0231, "step": 144670 }, { - "epoch": 0.73, - "learning_rate": 0.00019051061747329864, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024374528553764956, + "loss": 0.0169, "step": 144680 }, { - "epoch": 0.73, - "learning_rate": 0.00019050304978028465, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.0002437413973212781, + "loss": 0.0212, "step": 144690 }, { - "epoch": 0.73, - "learning_rate": 0.00019049548208727063, - "loss": 0.0149, + "epoch": 0.38, + "learning_rate": 0.00024373750910490667, + "loss": 0.0247, "step": 144700 }, { - "epoch": 0.73, - "learning_rate": 0.0001904879143942566, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024373362088853518, + "loss": 0.0245, "step": 144710 }, { - "epoch": 0.73, - "learning_rate": 0.0001904803467012426, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024372973267216373, + "loss": 0.0174, "step": 144720 }, { - "epoch": 0.73, - "learning_rate": 0.0001904727790082286, - "loss": 0.0174, + "epoch": 0.38, + "learning_rate": 0.00024372584445579224, + "loss": 0.0208, "step": 144730 }, { - "epoch": 0.73, - "learning_rate": 0.00019046521131521458, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.0002437219562394208, + "loss": 0.0191, "step": 144740 }, { - "epoch": 0.73, - "learning_rate": 0.00019045764362220056, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024371806802304932, + "loss": 0.0173, "step": 144750 }, { - "epoch": 0.73, - "learning_rate": 0.00019045007592918657, - "loss": 0.0161, - "step": 144760 + "epoch": 0.38, + "learning_rate": 0.00024371417980667787, + "loss": 0.0211, + "step": 144760 }, { - "epoch": 0.73, - "learning_rate": 0.00019044250823617255, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024371029159030638, + "loss": 0.0189, "step": 144770 }, { - "epoch": 0.73, - "learning_rate": 0.00019043494054315853, - "loss": 0.0159, + "epoch": 0.38, + "learning_rate": 0.00024370640337393495, + "loss": 0.0184, "step": 144780 }, { - "epoch": 0.73, - "learning_rate": 0.00019042737285014454, - "loss": 0.0115, + "epoch": 0.38, + "learning_rate": 0.00024370251515756346, + "loss": 0.0195, "step": 144790 }, { - "epoch": 0.73, - "learning_rate": 0.00019041980515713052, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.000243698626941192, + "loss": 0.0243, "step": 144800 }, { - "epoch": 0.73, - "learning_rate": 0.0001904122374641165, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024369473872482052, + "loss": 0.0192, "step": 144810 }, { - "epoch": 0.73, - "learning_rate": 0.00019040466977110251, - "loss": 0.0158, + "epoch": 0.38, + "learning_rate": 0.0002436908505084491, + "loss": 0.0244, "step": 144820 }, { - "epoch": 0.73, - "learning_rate": 0.0001903971020780885, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.0002436869622920776, + "loss": 0.0197, "step": 144830 }, { - "epoch": 0.73, - "learning_rate": 0.00019038953438507448, - "loss": 0.0149, + "epoch": 0.38, + "learning_rate": 0.00024368307407570614, + "loss": 0.0257, "step": 144840 }, { - "epoch": 0.73, - "learning_rate": 0.00019038196669206049, - "loss": 0.0154, + "epoch": 0.38, + "learning_rate": 0.00024367918585933466, + "loss": 0.017, "step": 144850 }, { - "epoch": 0.73, - "learning_rate": 0.00019037439899904647, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024367529764296323, + "loss": 0.0299, "step": 144860 }, { - "epoch": 0.73, - "learning_rate": 0.00019036683130603245, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024367140942659177, + "loss": 0.0194, "step": 144870 }, { - "epoch": 0.73, - "learning_rate": 0.00019035926361301843, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024366752121022028, + "loss": 0.0217, "step": 144880 }, { - "epoch": 0.73, - "learning_rate": 0.00019035169592000444, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002436636329938488, + "loss": 0.0205, "step": 144890 }, { - "epoch": 0.73, - "learning_rate": 0.00019034412822699042, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024365974477747734, + "loss": 0.0273, "step": 144900 }, { - "epoch": 0.73, - "learning_rate": 0.0001903365605339764, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.0002436558565611059, + "loss": 0.0214, "step": 144910 }, { - "epoch": 0.73, - "learning_rate": 0.0001903289928409624, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.00024365196834473442, + "loss": 0.0197, "step": 144920 }, { - "epoch": 0.73, - "learning_rate": 0.0001903214251479484, - "loss": 0.0157, + "epoch": 0.38, + "learning_rate": 0.00024364808012836297, + "loss": 0.0215, "step": 144930 }, { - "epoch": 0.73, - "learning_rate": 0.00019031385745493437, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.00024364419191199148, + "loss": 0.0182, "step": 144940 }, { - "epoch": 0.73, - "learning_rate": 0.00019030628976192038, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024364030369562005, + "loss": 0.0226, "step": 144950 }, { - "epoch": 0.73, - "learning_rate": 0.00019029872206890636, - "loss": 0.0115, + "epoch": 0.38, + "learning_rate": 0.00024363641547924856, + "loss": 0.0177, "step": 144960 }, { - "epoch": 0.73, - "learning_rate": 0.00019029115437589234, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.0002436325272628771, + "loss": 0.0187, "step": 144970 }, { - "epoch": 0.73, - "learning_rate": 0.00019028358668287835, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.00024362863904650562, + "loss": 0.0195, "step": 144980 }, { - "epoch": 0.73, - "learning_rate": 0.00019027601898986433, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.0002436247508301342, + "loss": 0.0241, "step": 144990 }, { - "epoch": 0.73, - "learning_rate": 0.00019026845129685032, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002436208626137627, + "loss": 0.019, "step": 145000 }, { - "epoch": 0.73, - "eval_cer": 0.9144566703574066, - "eval_loss": 0.00918771605938673, - "eval_runtime": 116.6602, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.38, + "eval_cer": 0.881751673615864, + "eval_loss": 0.013631855137646198, + "eval_runtime": 107.3251, + "eval_samples_per_second": 18.635, + "eval_steps_per_second": 4.659, "step": 145000 }, { - "epoch": 0.73, - "learning_rate": 0.00019026088360383632, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024361697439739124, + "loss": 0.0184, "step": 145010 }, { - "epoch": 0.73, - "learning_rate": 0.0001902533159108223, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024361308618101976, + "loss": 0.0243, "step": 145020 }, { - "epoch": 0.73, - "learning_rate": 0.0001902457482178083, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024360919796464833, + "loss": 0.022, "step": 145030 }, { - "epoch": 0.73, - "learning_rate": 0.00019023818052479427, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024360530974827687, + "loss": 0.0166, "step": 145040 }, { - "epoch": 0.73, - "learning_rate": 0.00019023061283178028, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.00024360142153190538, + "loss": 0.0215, "step": 145050 }, { - "epoch": 0.73, - "learning_rate": 0.00019022304513876626, - "loss": 0.0146, + "epoch": 0.38, + "learning_rate": 0.0002435975333155339, + "loss": 0.0185, "step": 145060 }, { - "epoch": 0.73, - "learning_rate": 0.00019021547744575224, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024359364509916247, + "loss": 0.0275, "step": 145070 }, { - "epoch": 0.73, - "learning_rate": 0.00019020790975273825, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.000243589756882791, + "loss": 0.0207, "step": 145080 }, { - "epoch": 0.73, - "learning_rate": 0.00019020034205972423, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024358586866641952, + "loss": 0.0248, "step": 145090 }, { - "epoch": 0.73, - "learning_rate": 0.0001901927743667102, - "loss": 0.0154, + "epoch": 0.38, + "learning_rate": 0.00024358198045004806, + "loss": 0.0264, "step": 145100 }, { - "epoch": 0.73, - "learning_rate": 0.00019018520667369622, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.0002435780922336766, + "loss": 0.0247, "step": 145110 }, { - "epoch": 0.73, - "learning_rate": 0.0001901776389806822, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.00024357420401730515, + "loss": 0.0189, "step": 145120 }, { - "epoch": 0.73, - "learning_rate": 0.00019017007128766818, - "loss": 0.0099, + "epoch": 0.38, + "learning_rate": 0.00024357031580093366, + "loss": 0.0253, "step": 145130 }, { - "epoch": 0.73, - "learning_rate": 0.0001901625035946542, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.0002435664275845622, + "loss": 0.0188, "step": 145140 }, { - "epoch": 0.73, - "learning_rate": 0.00019015493590164017, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024356253936819072, + "loss": 0.0186, "step": 145150 }, { - "epoch": 0.73, - "learning_rate": 0.00019014736820862615, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.0002435586511518193, + "loss": 0.0215, "step": 145160 }, { - "epoch": 0.73, - "learning_rate": 0.00019013980051561216, - "loss": 0.0083, + "epoch": 0.38, + "learning_rate": 0.0002435547629354478, + "loss": 0.0196, "step": 145170 }, { - "epoch": 0.73, - "learning_rate": 0.00019013223282259812, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.00024355087471907634, + "loss": 0.0212, "step": 145180 }, { - "epoch": 0.73, - "learning_rate": 0.0001901246651295841, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024354698650270486, + "loss": 0.0189, "step": 145190 }, { - "epoch": 0.73, - "learning_rate": 0.00019011709743657008, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024354309828633343, + "loss": 0.0186, "step": 145200 }, { - "epoch": 0.73, - "learning_rate": 0.0001901095297435561, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024353921006996194, + "loss": 0.0184, "step": 145210 }, { - "epoch": 0.73, - "learning_rate": 0.00019010196205054207, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024353532185359048, + "loss": 0.0231, "step": 145220 }, { - "epoch": 0.73, - "learning_rate": 0.00019009439435752805, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.000243531433637219, + "loss": 0.0197, "step": 145230 }, { - "epoch": 0.73, - "learning_rate": 0.00019008682666451406, - "loss": 0.0104, + "epoch": 0.38, + "learning_rate": 0.00024352754542084757, + "loss": 0.019, "step": 145240 }, { - "epoch": 0.73, - "learning_rate": 0.00019007925897150004, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.0002435236572044761, + "loss": 0.0169, "step": 145250 }, { - "epoch": 0.73, - "learning_rate": 0.00019007169127848602, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024351976898810462, + "loss": 0.015, "step": 145260 }, { - "epoch": 0.73, - "learning_rate": 0.000190064123585472, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024351588077173316, + "loss": 0.0223, "step": 145270 }, { - "epoch": 0.73, - "learning_rate": 0.000190056555892458, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.0002435119925553617, + "loss": 0.0172, "step": 145280 }, { - "epoch": 0.73, - "learning_rate": 0.000190048988199444, - "loss": 0.0148, + "epoch": 0.38, + "learning_rate": 0.00024350810433899025, + "loss": 0.0421, "step": 145290 }, { - "epoch": 0.73, - "learning_rate": 0.00019004142050642998, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.00024350421612261876, + "loss": 0.0221, "step": 145300 }, { - "epoch": 0.73, - "learning_rate": 0.00019003385281341598, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.0002435003279062473, + "loss": 0.0297, "step": 145310 }, { - "epoch": 0.73, - "learning_rate": 0.00019002628512040197, - "loss": 0.0093, + "epoch": 0.38, + "learning_rate": 0.00024349643968987585, + "loss": 0.0212, "step": 145320 }, { - "epoch": 0.73, - "learning_rate": 0.00019001871742738795, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.0002434925514735044, + "loss": 0.03, "step": 145330 }, { - "epoch": 0.73, - "learning_rate": 0.00019001114973437396, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.0002434886632571329, + "loss": 0.0266, "step": 145340 }, { - "epoch": 0.73, - "learning_rate": 0.00019000358204135994, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024348477504076144, + "loss": 0.0174, "step": 145350 }, { - "epoch": 0.73, - "learning_rate": 0.00018999601434834592, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024348088682438998, + "loss": 0.0342, "step": 145360 }, { - "epoch": 0.73, - "learning_rate": 0.00018998844665533193, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024347699860801853, + "loss": 0.0269, "step": 145370 }, { - "epoch": 0.73, - "learning_rate": 0.0001899808789623179, - "loss": 0.0155, + "epoch": 0.38, + "learning_rate": 0.00024347311039164704, + "loss": 0.0198, "step": 145380 }, { - "epoch": 0.73, - "learning_rate": 0.0001899733112693039, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024346922217527558, + "loss": 0.02, "step": 145390 }, { - "epoch": 0.73, - "learning_rate": 0.0001899657435762899, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.0002434653339589041, + "loss": 0.0163, "step": 145400 }, { - "epoch": 0.73, - "learning_rate": 0.00018995817588327588, - "loss": 0.0098, + "epoch": 0.38, + "learning_rate": 0.00024346144574253267, + "loss": 0.0172, "step": 145410 }, { - "epoch": 0.73, - "learning_rate": 0.00018995060819026186, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.0002434575575261612, + "loss": 0.0207, "step": 145420 }, { - "epoch": 0.73, - "learning_rate": 0.00018994304049724784, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024345366930978972, + "loss": 0.0201, "step": 145430 }, { - "epoch": 0.73, - "learning_rate": 0.00018993547280423385, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024344978109341826, + "loss": 0.0256, "step": 145440 }, { - "epoch": 0.73, - "learning_rate": 0.00018992790511121983, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.0002434458928770468, + "loss": 0.0194, "step": 145450 }, { - "epoch": 0.73, - "learning_rate": 0.00018992033741820581, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024344200466067535, + "loss": 0.0187, "step": 145460 }, { - "epoch": 0.73, - "learning_rate": 0.00018991276972519182, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024343811644430386, + "loss": 0.0209, "step": 145470 }, { - "epoch": 0.73, - "learning_rate": 0.0001899052020321778, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.0002434342282279324, + "loss": 0.0183, "step": 145480 }, { - "epoch": 0.73, - "learning_rate": 0.00018989763433916379, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024343034001156094, + "loss": 0.0179, "step": 145490 }, { - "epoch": 0.73, - "learning_rate": 0.0001898900666461498, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024342645179518949, + "loss": 0.0206, "step": 145500 }, { - "epoch": 0.73, - "learning_rate": 0.00018988249895313578, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.000243422563578818, + "loss": 0.0194, "step": 145510 }, { - "epoch": 0.73, - "learning_rate": 0.00018987493126012176, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024341867536244654, + "loss": 0.0194, "step": 145520 }, { - "epoch": 0.73, - "learning_rate": 0.00018986736356710777, - "loss": 0.0169, + "epoch": 0.38, + "learning_rate": 0.00024341478714607508, + "loss": 0.0269, "step": 145530 }, { - "epoch": 0.73, - "learning_rate": 0.00018985979587409375, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024341089892970363, + "loss": 0.0195, "step": 145540 }, { - "epoch": 0.73, - "learning_rate": 0.00018985222818107973, - "loss": 0.0183, + "epoch": 0.38, + "learning_rate": 0.00024340701071333214, + "loss": 0.0213, "step": 145550 }, { - "epoch": 0.73, - "learning_rate": 0.00018984466048806574, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024340312249696068, + "loss": 0.0207, "step": 145560 }, { - "epoch": 0.73, - "learning_rate": 0.00018983709279505172, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024339923428058925, + "loss": 0.02, "step": 145570 }, { - "epoch": 0.73, - "learning_rate": 0.0001898295251020377, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024339534606421777, + "loss": 0.0216, "step": 145580 }, { - "epoch": 0.73, - "learning_rate": 0.0001898219574090237, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.0002433914578478463, + "loss": 0.0268, "step": 145590 }, { - "epoch": 0.73, - "learning_rate": 0.0001898143897160097, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024338756963147482, + "loss": 0.0235, "step": 145600 }, { - "epoch": 0.73, - "learning_rate": 0.00018980682202299567, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.0002433836814151034, + "loss": 0.0168, "step": 145610 }, { - "epoch": 0.73, - "learning_rate": 0.00018979925432998165, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.0002433797931987319, + "loss": 0.0216, "step": 145620 }, { - "epoch": 0.73, - "learning_rate": 0.00018979168663696766, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024337590498236045, + "loss": 0.0179, "step": 145630 }, { - "epoch": 0.73, - "learning_rate": 0.00018978411894395364, - "loss": 0.0169, + "epoch": 0.38, + "learning_rate": 0.00024337201676598896, + "loss": 0.0167, "step": 145640 }, { - "epoch": 0.73, - "learning_rate": 0.00018977655125093962, - "loss": 0.0104, + "epoch": 0.38, + "learning_rate": 0.0002433681285496175, + "loss": 0.0202, "step": 145650 }, { - "epoch": 0.73, - "learning_rate": 0.00018976898355792563, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024336424033324604, + "loss": 0.0205, "step": 145660 }, { - "epoch": 0.73, - "learning_rate": 0.00018976141586491161, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024336035211687459, + "loss": 0.019, "step": 145670 }, { - "epoch": 0.73, - "learning_rate": 0.0001897538481718976, - "loss": 0.0149, + "epoch": 0.38, + "learning_rate": 0.0002433564639005031, + "loss": 0.0192, "step": 145680 }, { - "epoch": 0.74, - "learning_rate": 0.0001897462804788836, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024335257568413164, + "loss": 0.0148, "step": 145690 }, { - "epoch": 0.74, - "learning_rate": 0.00018973871278586959, - "loss": 0.0147, + "epoch": 0.38, + "learning_rate": 0.00024334868746776018, + "loss": 0.0165, "step": 145700 }, { - "epoch": 0.74, - "learning_rate": 0.00018973114509285557, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024334479925138873, + "loss": 0.0164, "step": 145710 }, { - "epoch": 0.74, - "learning_rate": 0.00018972357739984158, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024334091103501724, + "loss": 0.0201, "step": 145720 }, { - "epoch": 0.74, - "learning_rate": 0.00018971600970682756, - "loss": 0.0156, + "epoch": 0.38, + "learning_rate": 0.00024333702281864578, + "loss": 0.0184, "step": 145730 }, { - "epoch": 0.74, - "learning_rate": 0.00018970844201381354, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024333313460227435, + "loss": 0.0222, "step": 145740 }, { - "epoch": 0.74, - "learning_rate": 0.00018970087432079955, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024332924638590286, + "loss": 0.02, "step": 145750 }, { - "epoch": 0.74, - "learning_rate": 0.00018969330662778553, - "loss": 0.0172, + "epoch": 0.38, + "learning_rate": 0.00024332535816953138, + "loss": 0.0213, "step": 145760 }, { - "epoch": 0.74, - "learning_rate": 0.0001896857389347715, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024332146995315992, + "loss": 0.0229, "step": 145770 }, { - "epoch": 0.74, - "learning_rate": 0.0001896781712417575, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.0002433175817367885, + "loss": 0.024, "step": 145780 }, { - "epoch": 0.74, - "learning_rate": 0.0001896706035487435, - "loss": 0.0107, + "epoch": 0.38, + "learning_rate": 0.000243313693520417, + "loss": 0.0219, "step": 145790 }, { - "epoch": 0.74, - "learning_rate": 0.00018966303585572948, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024330980530404555, + "loss": 0.0213, "step": 145800 }, { - "epoch": 0.74, - "learning_rate": 0.00018965546816271546, - "loss": 0.0175, + "epoch": 0.38, + "learning_rate": 0.00024330591708767406, + "loss": 0.0253, "step": 145810 }, { - "epoch": 0.74, - "learning_rate": 0.00018964790046970147, - "loss": 0.0105, + "epoch": 0.38, + "learning_rate": 0.00024330202887130263, + "loss": 0.0199, "step": 145820 }, { - "epoch": 0.74, - "learning_rate": 0.00018964033277668745, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024329814065493114, + "loss": 0.0198, "step": 145830 }, { - "epoch": 0.74, - "learning_rate": 0.00018963276508367343, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024329425243855969, + "loss": 0.0156, "step": 145840 }, { - "epoch": 0.74, - "learning_rate": 0.00018962519739065944, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.0002432903642221882, + "loss": 0.0218, "step": 145850 }, { - "epoch": 0.74, - "learning_rate": 0.00018961762969764542, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024328647600581677, + "loss": 0.018, "step": 145860 }, { - "epoch": 0.74, - "learning_rate": 0.0001896100620046314, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024328258778944528, + "loss": 0.0215, "step": 145870 }, { - "epoch": 0.74, - "learning_rate": 0.00018960249431161741, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024327869957307382, + "loss": 0.0181, "step": 145880 }, { - "epoch": 0.74, - "learning_rate": 0.0001895949266186034, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024327481135670234, + "loss": 0.0169, "step": 145890 }, { - "epoch": 0.74, - "learning_rate": 0.00018958735892558938, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024327092314033088, + "loss": 0.0169, "step": 145900 }, { - "epoch": 0.74, - "learning_rate": 0.00018957979123257539, - "loss": 0.0146, + "epoch": 0.38, + "learning_rate": 0.00024326703492395945, + "loss": 0.0192, "step": 145910 }, { - "epoch": 0.74, - "learning_rate": 0.00018957222353956137, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024326314670758796, + "loss": 0.0229, "step": 145920 }, { - "epoch": 0.74, - "learning_rate": 0.00018956465584654735, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024325925849121648, + "loss": 0.0207, "step": 145930 }, { - "epoch": 0.74, - "learning_rate": 0.00018955708815353333, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024325537027484502, + "loss": 0.0191, "step": 145940 }, { - "epoch": 0.74, - "learning_rate": 0.00018954952046051934, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.0002432514820584736, + "loss": 0.0205, "step": 145950 }, { - "epoch": 0.74, - "learning_rate": 0.00018954195276750532, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.0002432475938421021, + "loss": 0.0161, "step": 145960 }, { - "epoch": 0.74, - "learning_rate": 0.0001895343850744913, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.00024324370562573065, + "loss": 0.0197, "step": 145970 }, { - "epoch": 0.74, - "learning_rate": 0.0001895268173814773, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024323981740935916, + "loss": 0.0213, "step": 145980 }, { - "epoch": 0.74, - "learning_rate": 0.0001895192496884633, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024323592919298773, + "loss": 0.0208, "step": 145990 }, { - "epoch": 0.74, - "learning_rate": 0.00018951168199544927, - "loss": 0.0157, + "epoch": 0.38, + "learning_rate": 0.00024323204097661624, + "loss": 0.0181, "step": 146000 }, { - "epoch": 0.74, - "eval_cer": 0.9144770486760401, - "eval_loss": 0.009305712766945362, - "eval_runtime": 116.6484, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.286, + "epoch": 0.38, + "eval_cer": 0.8817628707113375, + "eval_loss": 0.013447397388517857, + "eval_runtime": 107.4268, + "eval_samples_per_second": 18.617, + "eval_steps_per_second": 4.654, "step": 146000 }, { - "epoch": 0.74, - "learning_rate": 0.00018950411430243528, - "loss": 0.0103, + "epoch": 0.38, + "learning_rate": 0.00024322815276024478, + "loss": 0.0197, "step": 146010 }, { - "epoch": 0.74, - "learning_rate": 0.00018949654660942126, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.0002432242645438733, + "loss": 0.0184, "step": 146020 }, { - "epoch": 0.74, - "learning_rate": 0.00018948897891640724, - "loss": 0.01, + "epoch": 0.38, + "learning_rate": 0.00024322037632750187, + "loss": 0.0296, "step": 146030 }, { - "epoch": 0.74, - "learning_rate": 0.00018948141122339325, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024321648811113038, + "loss": 0.0268, "step": 146040 }, { - "epoch": 0.74, - "learning_rate": 0.00018947384353037923, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024321259989475892, + "loss": 0.0156, "step": 146050 }, { - "epoch": 0.74, - "learning_rate": 0.00018946627583736522, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024320871167838744, + "loss": 0.0191, "step": 146060 }, { - "epoch": 0.74, - "learning_rate": 0.00018945870814435122, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.000243204823462016, + "loss": 0.0186, "step": 146070 }, { - "epoch": 0.74, - "learning_rate": 0.0001894511404513372, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024320093524564452, + "loss": 0.0205, "step": 146080 }, { - "epoch": 0.74, - "learning_rate": 0.0001894435727583232, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024319704702927306, + "loss": 0.0219, "step": 146090 }, { - "epoch": 0.74, - "learning_rate": 0.0001894360050653092, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024319315881290158, + "loss": 0.0225, "step": 146100 }, { - "epoch": 0.74, - "learning_rate": 0.00018942843737229518, - "loss": 0.0104, + "epoch": 0.38, + "learning_rate": 0.00024318927059653015, + "loss": 0.0206, "step": 146110 }, { - "epoch": 0.74, - "learning_rate": 0.00018942086967928116, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.0002431853823801587, + "loss": 0.0415, "step": 146120 }, { - "epoch": 0.74, - "learning_rate": 0.00018941330198626714, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.0002431814941637872, + "loss": 0.0226, "step": 146130 }, { - "epoch": 0.74, - "learning_rate": 0.00018940573429325315, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024317760594741574, + "loss": 0.022, "step": 146140 }, { - "epoch": 0.74, - "learning_rate": 0.00018939816660023913, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024317371773104426, + "loss": 0.021, "step": 146150 }, { - "epoch": 0.74, - "learning_rate": 0.0001893905989072251, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024316982951467283, + "loss": 0.0163, "step": 146160 }, { - "epoch": 0.74, - "learning_rate": 0.00018938303121421112, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024316594129830134, + "loss": 0.0177, "step": 146170 }, { - "epoch": 0.74, - "learning_rate": 0.0001893754635211971, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024316205308192988, + "loss": 0.0206, "step": 146180 }, { - "epoch": 0.74, - "learning_rate": 0.00018936789582818308, - "loss": 0.0154, + "epoch": 0.38, + "learning_rate": 0.0002431581648655584, + "loss": 0.0218, "step": 146190 }, { - "epoch": 0.74, - "learning_rate": 0.0001893603281351691, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024315427664918697, + "loss": 0.0216, "step": 146200 }, { - "epoch": 0.74, - "learning_rate": 0.00018935276044215507, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024315038843281548, + "loss": 0.0207, "step": 146210 }, { - "epoch": 0.74, - "learning_rate": 0.00018934519274914105, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024314650021644402, + "loss": 0.0203, "step": 146220 }, { - "epoch": 0.74, - "learning_rate": 0.00018933762505612706, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024314261200007254, + "loss": 0.0177, "step": 146230 }, { - "epoch": 0.74, - "learning_rate": 0.00018933005736311304, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.0002431387237837011, + "loss": 0.0155, "step": 146240 }, { - "epoch": 0.74, - "learning_rate": 0.00018932248967009903, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024313483556732962, + "loss": 0.0193, "step": 146250 }, { - "epoch": 0.74, - "learning_rate": 0.00018931492197708503, - "loss": 0.0094, + "epoch": 0.38, + "learning_rate": 0.00024313094735095816, + "loss": 0.0347, "step": 146260 }, { - "epoch": 0.74, - "learning_rate": 0.00018930735428407102, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024312705913458668, + "loss": 0.021, "step": 146270 }, { - "epoch": 0.74, - "learning_rate": 0.000189299786591057, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.00024312317091821525, + "loss": 0.02, "step": 146280 }, { - "epoch": 0.74, - "learning_rate": 0.00018929221889804298, - "loss": 0.0165, + "epoch": 0.38, + "learning_rate": 0.0002431192827018438, + "loss": 0.0198, "step": 146290 }, { - "epoch": 0.74, - "learning_rate": 0.000189284651205029, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.0002431153944854723, + "loss": 0.0171, "step": 146300 }, { - "epoch": 0.74, - "learning_rate": 0.00018927708351201497, - "loss": 0.0185, + "epoch": 0.38, + "learning_rate": 0.00024311150626910084, + "loss": 0.019, "step": 146310 }, { - "epoch": 0.74, - "learning_rate": 0.00018926951581900095, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024310761805272939, + "loss": 0.0218, "step": 146320 }, { - "epoch": 0.74, - "learning_rate": 0.00018926194812598696, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024310372983635793, + "loss": 0.0185, "step": 146330 }, { - "epoch": 0.74, - "learning_rate": 0.00018925438043297294, - "loss": 0.01, + "epoch": 0.38, + "learning_rate": 0.00024309984161998644, + "loss": 0.0225, "step": 146340 }, { - "epoch": 0.74, - "learning_rate": 0.00018924681273995892, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024309595340361498, + "loss": 0.018, "step": 146350 }, { - "epoch": 0.74, - "learning_rate": 0.00018923924504694493, - "loss": 0.0106, + "epoch": 0.38, + "learning_rate": 0.00024309206518724353, + "loss": 0.0207, "step": 146360 }, { - "epoch": 0.74, - "learning_rate": 0.0001892316773539309, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024308817697087207, + "loss": 0.0185, "step": 146370 }, { - "epoch": 0.74, - "learning_rate": 0.0001892241096609169, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024308428875450058, + "loss": 0.0187, "step": 146380 }, { - "epoch": 0.74, - "learning_rate": 0.0001892165419679029, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024308040053812912, + "loss": 0.0184, "step": 146390 }, { - "epoch": 0.74, - "learning_rate": 0.00018920897427488888, - "loss": 0.015, + "epoch": 0.38, + "learning_rate": 0.00024307651232175764, + "loss": 0.0155, "step": 146400 }, { - "epoch": 0.74, - "learning_rate": 0.00018920140658187486, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.0002430726241053862, + "loss": 0.0215, "step": 146410 }, { - "epoch": 0.74, - "learning_rate": 0.00018919383888886087, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024306873588901472, + "loss": 0.0262, "step": 146420 }, { - "epoch": 0.74, - "learning_rate": 0.00018918627119584683, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.00024306484767264326, + "loss": 0.0223, "step": 146430 }, { - "epoch": 0.74, - "learning_rate": 0.0001891787035028328, - "loss": 0.0099, + "epoch": 0.38, + "learning_rate": 0.00024306095945627178, + "loss": 0.0216, "step": 146440 }, { - "epoch": 0.74, - "learning_rate": 0.0001891711358098188, - "loss": 0.0089, + "epoch": 0.38, + "learning_rate": 0.00024305707123990035, + "loss": 0.0185, "step": 146450 }, { - "epoch": 0.74, - "learning_rate": 0.0001891635681168048, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.0002430531830235289, + "loss": 0.0186, "step": 146460 }, { - "epoch": 0.74, - "learning_rate": 0.00018915600042379078, - "loss": 0.0104, + "epoch": 0.38, + "learning_rate": 0.0002430492948071574, + "loss": 0.0198, "step": 146470 }, { - "epoch": 0.74, - "learning_rate": 0.00018914843273077676, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024304540659078592, + "loss": 0.0189, "step": 146480 }, { - "epoch": 0.74, - "learning_rate": 0.00018914086503776277, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024304151837441449, + "loss": 0.0186, "step": 146490 }, { - "epoch": 0.74, - "learning_rate": 0.00018913329734474875, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024303763015804303, + "loss": 0.0213, "step": 146500 }, { - "epoch": 0.74, - "learning_rate": 0.00018912572965173473, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.00024303374194167154, + "loss": 0.0164, "step": 146510 }, { - "epoch": 0.74, - "learning_rate": 0.00018911816195872071, - "loss": 0.0107, + "epoch": 0.38, + "learning_rate": 0.00024302985372530008, + "loss": 0.017, "step": 146520 }, { - "epoch": 0.74, - "learning_rate": 0.00018911059426570672, - "loss": 0.0107, + "epoch": 0.38, + "learning_rate": 0.00024302596550892862, + "loss": 0.0216, "step": 146530 }, { - "epoch": 0.74, - "learning_rate": 0.0001891030265726927, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024302207729255717, + "loss": 0.0189, "step": 146540 }, { - "epoch": 0.74, - "learning_rate": 0.00018909545887967869, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024301818907618568, + "loss": 0.0205, "step": 146550 }, { - "epoch": 0.74, - "learning_rate": 0.0001890878911866647, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024301430085981422, + "loss": 0.0169, "step": 146560 }, { - "epoch": 0.74, - "learning_rate": 0.00018908032349365068, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024301041264344276, + "loss": 0.0188, "step": 146570 }, { - "epoch": 0.74, - "learning_rate": 0.00018907275580063666, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.0002430065244270713, + "loss": 0.0178, "step": 146580 }, { - "epoch": 0.74, - "learning_rate": 0.00018906518810762267, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024300263621069982, + "loss": 0.019, "step": 146590 }, { - "epoch": 0.74, - "learning_rate": 0.00018905762041460865, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024299874799432836, + "loss": 0.0183, "step": 146600 }, { - "epoch": 0.74, - "learning_rate": 0.00018905005272159463, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024299485977795693, + "loss": 0.0206, "step": 146610 }, { - "epoch": 0.74, - "learning_rate": 0.00018904248502858064, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024299097156158545, + "loss": 0.0173, "step": 146620 }, { - "epoch": 0.74, - "learning_rate": 0.00018903491733556662, - "loss": 0.0158, + "epoch": 0.38, + "learning_rate": 0.00024298708334521396, + "loss": 0.0171, "step": 146630 }, { - "epoch": 0.74, - "learning_rate": 0.0001890273496425526, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.0002429831951288425, + "loss": 0.0196, "step": 146640 }, { - "epoch": 0.74, - "learning_rate": 0.0001890197819495386, - "loss": 0.0097, + "epoch": 0.38, + "learning_rate": 0.00024297930691247102, + "loss": 0.0186, "step": 146650 }, { - "epoch": 0.74, - "learning_rate": 0.0001890122142565246, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.00024297541869609958, + "loss": 0.0232, "step": 146660 }, { - "epoch": 0.74, - "learning_rate": 0.00018900464656351057, - "loss": 0.0094, + "epoch": 0.38, + "learning_rate": 0.00024297153047972813, + "loss": 0.0239, "step": 146670 }, { - "epoch": 0.74, - "learning_rate": 0.00018899707887049655, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024296764226335664, + "loss": 0.0182, "step": 146680 }, { - "epoch": 0.74, - "learning_rate": 0.00018898951117748256, - "loss": 0.015, + "epoch": 0.38, + "learning_rate": 0.00024296375404698518, + "loss": 0.0298, "step": 146690 }, { - "epoch": 0.74, - "learning_rate": 0.00018898194348446854, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024295986583061372, + "loss": 0.0183, "step": 146700 }, { - "epoch": 0.74, - "learning_rate": 0.00018897437579145452, - "loss": 0.0152, + "epoch": 0.38, + "learning_rate": 0.00024295597761424227, + "loss": 0.0175, "step": 146710 }, { - "epoch": 0.74, - "learning_rate": 0.00018896680809844053, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024295208939787078, + "loss": 0.025, "step": 146720 }, { - "epoch": 0.74, - "learning_rate": 0.00018895924040542651, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024294820118149932, + "loss": 0.0187, "step": 146730 }, { - "epoch": 0.74, - "learning_rate": 0.0001889516727124125, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.00024294431296512786, + "loss": 0.0251, "step": 146740 }, { - "epoch": 0.74, - "learning_rate": 0.0001889441050193985, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.0002429404247487564, + "loss": 0.0278, "step": 146750 }, { - "epoch": 0.74, - "learning_rate": 0.00018893653732638449, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024293653653238492, + "loss": 0.023, "step": 146760 }, { - "epoch": 0.74, - "learning_rate": 0.00018892896963337047, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024293264831601346, + "loss": 0.018, "step": 146770 }, { - "epoch": 0.74, - "learning_rate": 0.00018892140194035648, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.00024292876009964203, + "loss": 0.0179, "step": 146780 }, { - "epoch": 0.74, - "learning_rate": 0.00018891383424734246, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024292487188327054, + "loss": 0.0224, "step": 146790 }, { - "epoch": 0.74, - "learning_rate": 0.00018890626655432844, - "loss": 0.0107, + "epoch": 0.38, + "learning_rate": 0.00024292098366689906, + "loss": 0.0198, "step": 146800 }, { - "epoch": 0.74, - "learning_rate": 0.00018889869886131445, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.0002429170954505276, + "loss": 0.0178, "step": 146810 }, { - "epoch": 0.74, - "learning_rate": 0.00018889113116830043, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024291320723415617, + "loss": 0.0212, "step": 146820 }, { - "epoch": 0.74, - "learning_rate": 0.0001888835634752864, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024290931901778468, + "loss": 0.0179, "step": 146830 }, { - "epoch": 0.74, - "learning_rate": 0.0001888759957822724, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.00024290543080141323, + "loss": 0.0164, "step": 146840 }, { - "epoch": 0.74, - "learning_rate": 0.0001888684280892584, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024290154258504174, + "loss": 0.0181, "step": 146850 }, { - "epoch": 0.74, - "learning_rate": 0.00018886086039624438, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002428976543686703, + "loss": 0.0171, "step": 146860 }, { - "epoch": 0.74, - "learning_rate": 0.00018885329270323036, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024289376615229882, + "loss": 0.0169, "step": 146870 }, { - "epoch": 0.74, - "learning_rate": 0.00018884572501021637, - "loss": 0.0156, + "epoch": 0.38, + "learning_rate": 0.00024288987793592737, + "loss": 0.0197, "step": 146880 }, { - "epoch": 0.74, - "learning_rate": 0.00018883815731720235, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024288598971955588, + "loss": 0.0194, "step": 146890 }, { - "epoch": 0.74, - "learning_rate": 0.00018883058962418833, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.00024288210150318442, + "loss": 0.017, "step": 146900 }, { - "epoch": 0.74, - "learning_rate": 0.00018882302193117434, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024287821328681296, + "loss": 0.0176, "step": 146910 }, { - "epoch": 0.74, - "learning_rate": 0.00018881545423816032, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.0002428743250704415, + "loss": 0.016, "step": 146920 }, { - "epoch": 0.74, - "learning_rate": 0.0001888078865451463, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024287043685407002, + "loss": 0.0171, "step": 146930 }, { - "epoch": 0.74, - "learning_rate": 0.00018880031885213231, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024286654863769856, + "loss": 0.0226, "step": 146940 }, { - "epoch": 0.74, - "learning_rate": 0.0001887927511591183, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.0002428626604213271, + "loss": 0.021, "step": 146950 }, { - "epoch": 0.74, - "learning_rate": 0.00018878518346610428, - "loss": 0.0141, + "epoch": 0.38, + "learning_rate": 0.00024285877220495564, + "loss": 0.0215, "step": 146960 }, { - "epoch": 0.74, - "learning_rate": 0.00018877761577309029, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024285488398858416, + "loss": 0.0211, "step": 146970 }, { - "epoch": 0.74, - "learning_rate": 0.00018877004808007627, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.0002428509957722127, + "loss": 0.0181, "step": 146980 }, { - "epoch": 0.74, - "learning_rate": 0.00018876248038706225, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024284710755584127, + "loss": 0.0173, "step": 146990 }, { - "epoch": 0.74, - "learning_rate": 0.00018875491269404826, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024284321933946978, + "loss": 0.0228, "step": 147000 }, { - "epoch": 0.74, - "eval_cer": 0.914457640753532, - "eval_loss": 0.009390231221914291, - "eval_runtime": 115.7292, - "eval_samples_per_second": 17.282, - "eval_steps_per_second": 4.32, + "epoch": 0.38, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.013879619538784027, + "eval_runtime": 107.3335, + "eval_samples_per_second": 18.634, + "eval_steps_per_second": 4.658, "step": 147000 }, { - "epoch": 0.74, - "learning_rate": 0.00018874734500103424, - "loss": 0.0168, + "epoch": 0.38, + "learning_rate": 0.00024283933112309833, + "loss": 0.0175, "step": 147010 }, { - "epoch": 0.74, - "learning_rate": 0.00018873977730802022, - "loss": 0.0153, + "epoch": 0.38, + "learning_rate": 0.00024283544290672684, + "loss": 0.0203, "step": 147020 }, { - "epoch": 0.74, - "learning_rate": 0.0001887322096150062, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.0002428315546903554, + "loss": 0.0163, "step": 147030 }, { - "epoch": 0.74, - "learning_rate": 0.0001887246419219922, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024282766647398392, + "loss": 0.0183, "step": 147040 }, { - "epoch": 0.74, - "learning_rate": 0.0001887170742289782, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024282377825761246, + "loss": 0.0199, "step": 147050 }, { - "epoch": 0.74, - "learning_rate": 0.00018870950653596417, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024281989004124098, + "loss": 0.0171, "step": 147060 }, { - "epoch": 0.74, - "learning_rate": 0.00018870193884295018, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024281600182486955, + "loss": 0.0255, "step": 147070 }, { - "epoch": 0.74, - "learning_rate": 0.00018869437114993616, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024281211360849806, + "loss": 0.0162, "step": 147080 }, { - "epoch": 0.74, - "learning_rate": 0.00018868680345692214, - "loss": 0.0148, + "epoch": 0.38, + "learning_rate": 0.0002428082253921266, + "loss": 0.0153, "step": 147090 }, { - "epoch": 0.74, - "learning_rate": 0.00018867923576390815, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024280433717575512, + "loss": 0.0172, "step": 147100 }, { - "epoch": 0.74, - "learning_rate": 0.00018867166807089413, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002428004489593837, + "loss": 0.0194, "step": 147110 }, { - "epoch": 0.74, - "learning_rate": 0.00018866410037788012, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.0002427965607430122, + "loss": 0.0189, "step": 147120 }, { - "epoch": 0.74, - "learning_rate": 0.00018865653268486612, - "loss": 0.0127, + "epoch": 0.38, + "learning_rate": 0.00024279267252664074, + "loss": 0.0208, "step": 147130 }, { - "epoch": 0.74, - "learning_rate": 0.0001886489649918521, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.00024278878431026926, + "loss": 0.0163, "step": 147140 }, { - "epoch": 0.74, - "learning_rate": 0.0001886413972988381, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.0002427848960938978, + "loss": 0.0222, "step": 147150 }, { - "epoch": 0.74, - "learning_rate": 0.0001886338296058241, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024278100787752637, + "loss": 0.0192, "step": 147160 }, { - "epoch": 0.74, - "learning_rate": 0.00018862626191281008, - "loss": 0.0187, + "epoch": 0.38, + "learning_rate": 0.00024277711966115488, + "loss": 0.0219, "step": 147170 }, { - "epoch": 0.74, - "learning_rate": 0.00018861869421979606, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024277323144478342, + "loss": 0.0223, "step": 147180 }, { - "epoch": 0.74, - "learning_rate": 0.00018861112652678204, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024276934322841194, + "loss": 0.0221, "step": 147190 }, { - "epoch": 0.74, - "learning_rate": 0.00018860355883376805, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.0002427654550120405, + "loss": 0.0149, "step": 147200 }, { - "epoch": 0.74, - "learning_rate": 0.00018859599114075403, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024276156679566902, + "loss": 0.0185, "step": 147210 }, { - "epoch": 0.74, - "learning_rate": 0.00018858842344774, - "loss": 0.0144, + "epoch": 0.38, + "learning_rate": 0.00024275767857929756, + "loss": 0.0203, "step": 147220 }, { - "epoch": 0.74, - "learning_rate": 0.00018858085575472602, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024275379036292608, + "loss": 0.021, "step": 147230 }, { - "epoch": 0.74, - "learning_rate": 0.000188573288061712, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024274990214655465, + "loss": 0.022, "step": 147240 }, { - "epoch": 0.74, - "learning_rate": 0.00018856572036869798, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.00024274601393018316, + "loss": 0.0204, "step": 147250 }, { - "epoch": 0.74, - "learning_rate": 0.000188558152675684, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.0002427421257138117, + "loss": 0.0228, "step": 147260 }, { - "epoch": 0.74, - "learning_rate": 0.00018855058498266997, - "loss": 0.0156, + "epoch": 0.38, + "learning_rate": 0.00024273823749744022, + "loss": 0.0194, "step": 147270 }, { - "epoch": 0.74, - "learning_rate": 0.00018854301728965595, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.0002427343492810688, + "loss": 0.0245, "step": 147280 }, { - "epoch": 0.74, - "learning_rate": 0.00018853544959664196, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002427304610646973, + "loss": 0.0195, "step": 147290 }, { - "epoch": 0.74, - "learning_rate": 0.00018852788190362794, - "loss": 0.0152, - "step": 147300 + "epoch": 0.38, + "learning_rate": 0.00024272657284832584, + "loss": 0.0183, + "step": 147300 }, { - "epoch": 0.74, - "learning_rate": 0.00018852031421061393, - "loss": 0.0135, + "epoch": 0.38, + "learning_rate": 0.00024272268463195436, + "loss": 0.0229, "step": 147310 }, { - "epoch": 0.74, - "learning_rate": 0.00018851274651759993, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.00024271879641558293, + "loss": 0.0195, "step": 147320 }, { - "epoch": 0.74, - "learning_rate": 0.00018850517882458592, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024271490819921147, + "loss": 0.0189, "step": 147330 }, { - "epoch": 0.74, - "learning_rate": 0.0001884976111315719, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024271101998283998, + "loss": 0.0139, "step": 147340 }, { - "epoch": 0.74, - "learning_rate": 0.00018849004343855788, - "loss": 0.0097, + "epoch": 0.38, + "learning_rate": 0.0002427071317664685, + "loss": 0.0235, "step": 147350 }, { - "epoch": 0.74, - "learning_rate": 0.0001884824757455439, - "loss": 0.0157, + "epoch": 0.38, + "learning_rate": 0.00024270324355009707, + "loss": 0.0226, "step": 147360 }, { - "epoch": 0.74, - "learning_rate": 0.00018847490805252987, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.0002426993553337256, + "loss": 0.0192, "step": 147370 }, { - "epoch": 0.74, - "learning_rate": 0.00018846734035951585, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024269546711735412, + "loss": 0.0169, "step": 147380 }, { - "epoch": 0.74, - "learning_rate": 0.00018845977266650186, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024269157890098266, + "loss": 0.0218, "step": 147390 }, { - "epoch": 0.74, - "learning_rate": 0.00018845220497348784, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024268769068461118, + "loss": 0.0174, "step": 147400 }, { - "epoch": 0.74, - "learning_rate": 0.00018844463728047382, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024268380246823975, + "loss": 0.0222, "step": 147410 }, { - "epoch": 0.74, - "learning_rate": 0.00018843706958745983, - "loss": 0.0169, + "epoch": 0.38, + "learning_rate": 0.00024267991425186826, + "loss": 0.0237, "step": 147420 }, { - "epoch": 0.74, - "learning_rate": 0.0001884295018944458, - "loss": 0.0117, + "epoch": 0.38, + "learning_rate": 0.0002426760260354968, + "loss": 0.0199, "step": 147430 }, { - "epoch": 0.74, - "learning_rate": 0.0001884219342014318, - "loss": 0.0177, + "epoch": 0.38, + "learning_rate": 0.00024267213781912532, + "loss": 0.0204, "step": 147440 }, { - "epoch": 0.74, - "learning_rate": 0.0001884143665084178, - "loss": 0.0168, + "epoch": 0.38, + "learning_rate": 0.00024266824960275389, + "loss": 0.0205, "step": 147450 }, { - "epoch": 0.74, - "learning_rate": 0.00018840679881540378, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002426643613863824, + "loss": 0.0197, "step": 147460 }, { - "epoch": 0.74, - "learning_rate": 0.00018839923112238976, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024266047317001094, + "loss": 0.0168, "step": 147470 }, { - "epoch": 0.74, - "learning_rate": 0.00018839166342937577, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024265658495363946, + "loss": 0.0196, "step": 147480 }, { - "epoch": 0.74, - "learning_rate": 0.00018838409573636175, - "loss": 0.0148, + "epoch": 0.38, + "learning_rate": 0.00024265269673726803, + "loss": 0.0188, "step": 147490 }, { - "epoch": 0.74, - "learning_rate": 0.00018837652804334774, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.00024264880852089657, + "loss": 0.016, "step": 147500 }, { - "epoch": 0.74, - "learning_rate": 0.00018836896035033374, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024264492030452508, + "loss": 0.0176, "step": 147510 }, { - "epoch": 0.74, - "learning_rate": 0.00018836139265731973, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.0002426410320881536, + "loss": 0.0207, "step": 147520 }, { - "epoch": 0.74, - "learning_rate": 0.0001883538249643057, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024263714387178216, + "loss": 0.019, "step": 147530 }, { - "epoch": 0.74, - "learning_rate": 0.0001883462572712917, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.0002426332556554107, + "loss": 0.0171, "step": 147540 }, { - "epoch": 0.74, - "learning_rate": 0.0001883386895782777, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024262936743903922, + "loss": 0.0197, "step": 147550 }, { - "epoch": 0.74, - "learning_rate": 0.00018833112188526368, - "loss": 0.0161, + "epoch": 0.38, + "learning_rate": 0.00024262547922266776, + "loss": 0.0219, "step": 147560 }, { - "epoch": 0.74, - "learning_rate": 0.00018832355419224966, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.0002426215910062963, + "loss": 0.0235, "step": 147570 }, { - "epoch": 0.74, - "learning_rate": 0.00018831598649923567, - "loss": 0.0163, + "epoch": 0.38, + "learning_rate": 0.00024261770278992485, + "loss": 0.0182, "step": 147580 }, { - "epoch": 0.74, - "learning_rate": 0.00018830841880622165, - "loss": 0.0165, + "epoch": 0.38, + "learning_rate": 0.00024261381457355336, + "loss": 0.0196, "step": 147590 }, { - "epoch": 0.74, - "learning_rate": 0.00018830085111320763, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.0002426099263571819, + "loss": 0.0189, "step": 147600 }, { - "epoch": 0.74, - "learning_rate": 0.00018829328342019364, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.00024260603814081044, + "loss": 0.0192, "step": 147610 }, { - "epoch": 0.74, - "learning_rate": 0.00018828571572717962, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024260214992443899, + "loss": 0.0171, "step": 147620 }, { - "epoch": 0.74, - "learning_rate": 0.0001882781480341656, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.0002425982617080675, + "loss": 0.0167, "step": 147630 }, { - "epoch": 0.74, - "learning_rate": 0.0001882705803411516, - "loss": 0.014, + "epoch": 0.38, + "learning_rate": 0.00024259437349169604, + "loss": 0.0154, "step": 147640 }, { - "epoch": 0.74, - "learning_rate": 0.0001882630126481376, - "loss": 0.0203, + "epoch": 0.38, + "learning_rate": 0.00024259048527532456, + "loss": 0.0214, "step": 147650 }, { - "epoch": 0.74, - "learning_rate": 0.00018825544495512357, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024258659705895312, + "loss": 0.0229, "step": 147660 }, { - "epoch": 0.75, - "learning_rate": 0.00018824787726210958, - "loss": 0.0102, + "epoch": 0.38, + "learning_rate": 0.00024258270884258164, + "loss": 0.0196, "step": 147670 }, { - "epoch": 0.75, - "learning_rate": 0.00018824030956909556, - "loss": 0.0194, + "epoch": 0.38, + "learning_rate": 0.00024257882062621018, + "loss": 0.0181, "step": 147680 }, { - "epoch": 0.75, - "learning_rate": 0.00018823274187608152, - "loss": 0.0132, + "epoch": 0.38, + "learning_rate": 0.0002425749324098387, + "loss": 0.018, "step": 147690 }, { - "epoch": 0.75, - "learning_rate": 0.0001882251741830675, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024257104419346726, + "loss": 0.0187, "step": 147700 }, { - "epoch": 0.75, - "learning_rate": 0.0001882176064900535, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.0002425671559770958, + "loss": 0.0196, "step": 147710 }, { - "epoch": 0.75, - "learning_rate": 0.0001882100387970395, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024256326776072432, + "loss": 0.0192, "step": 147720 }, { - "epoch": 0.75, - "learning_rate": 0.00018820247110402547, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024255937954435286, + "loss": 0.016, "step": 147730 }, { - "epoch": 0.75, - "learning_rate": 0.00018819490341101145, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.0002425554913279814, + "loss": 0.0184, "step": 147740 }, { - "epoch": 0.75, - "learning_rate": 0.00018818733571799746, - "loss": 0.0118, + "epoch": 0.38, + "learning_rate": 0.00024255160311160995, + "loss": 0.0241, "step": 147750 }, { - "epoch": 0.75, - "learning_rate": 0.00018817976802498344, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024254771489523846, + "loss": 0.0151, "step": 147760 }, { - "epoch": 0.75, - "learning_rate": 0.00018817220033196942, - "loss": 0.0151, + "epoch": 0.38, + "learning_rate": 0.000242543826678867, + "loss": 0.0191, "step": 147770 }, { - "epoch": 0.75, - "learning_rate": 0.00018816463263895543, - "loss": 0.0143, + "epoch": 0.38, + "learning_rate": 0.00024253993846249554, + "loss": 0.0155, "step": 147780 }, { - "epoch": 0.75, - "learning_rate": 0.00018815706494594141, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024253605024612408, + "loss": 0.0166, "step": 147790 }, { - "epoch": 0.75, - "learning_rate": 0.0001881494972529274, - "loss": 0.0103, + "epoch": 0.38, + "learning_rate": 0.0002425321620297526, + "loss": 0.0171, "step": 147800 }, { - "epoch": 0.75, - "learning_rate": 0.0001881419295599134, - "loss": 0.0167, + "epoch": 0.38, + "learning_rate": 0.00024252827381338114, + "loss": 0.0203, "step": 147810 }, { - "epoch": 0.75, - "learning_rate": 0.00018813436186689939, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024252438559700968, + "loss": 0.0194, "step": 147820 }, { - "epoch": 0.75, - "learning_rate": 0.00018812679417388537, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.00024252049738063822, + "loss": 0.0197, "step": 147830 }, { - "epoch": 0.75, - "learning_rate": 0.00018811922648087138, - "loss": 0.0152, + "epoch": 0.38, + "learning_rate": 0.00024251660916426674, + "loss": 0.0192, "step": 147840 }, { - "epoch": 0.75, - "learning_rate": 0.00018811165878785736, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024251272094789528, + "loss": 0.0207, "step": 147850 }, { - "epoch": 0.75, - "learning_rate": 0.00018810409109484334, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024250883273152385, + "loss": 0.0198, "step": 147860 }, { - "epoch": 0.75, - "learning_rate": 0.00018809652340182935, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024250494451515236, + "loss": 0.0177, "step": 147870 }, { - "epoch": 0.75, - "learning_rate": 0.00018808895570881533, - "loss": 0.0126, + "epoch": 0.38, + "learning_rate": 0.0002425010562987809, + "loss": 0.0227, "step": 147880 }, { - "epoch": 0.75, - "learning_rate": 0.0001880813880158013, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024249716808240942, + "loss": 0.0198, "step": 147890 }, { - "epoch": 0.75, - "learning_rate": 0.00018807382032278732, - "loss": 0.0108, + "epoch": 0.38, + "learning_rate": 0.00024249327986603796, + "loss": 0.0229, "step": 147900 }, { - "epoch": 0.75, - "learning_rate": 0.0001880662526297733, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002424893916496665, + "loss": 0.0161, "step": 147910 }, { - "epoch": 0.75, - "learning_rate": 0.00018805868493675928, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024248550343329504, + "loss": 0.0201, "step": 147920 }, { - "epoch": 0.75, - "learning_rate": 0.00018805111724374526, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024248161521692356, + "loss": 0.024, "step": 147930 }, { - "epoch": 0.75, - "learning_rate": 0.00018804354955073127, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.0002424777270005521, + "loss": 0.0166, "step": 147940 }, { - "epoch": 0.75, - "learning_rate": 0.00018803598185771725, - "loss": 0.0095, + "epoch": 0.38, + "learning_rate": 0.00024247383878418064, + "loss": 0.0185, "step": 147950 }, { - "epoch": 0.75, - "learning_rate": 0.00018802841416470323, - "loss": 0.0169, + "epoch": 0.38, + "learning_rate": 0.00024246995056780918, + "loss": 0.0204, "step": 147960 }, { - "epoch": 0.75, - "learning_rate": 0.00018802084647168924, - "loss": 0.0119, + "epoch": 0.38, + "learning_rate": 0.0002424660623514377, + "loss": 0.0138, "step": 147970 }, { - "epoch": 0.75, - "learning_rate": 0.00018801327877867522, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024246217413506624, + "loss": 0.0176, "step": 147980 }, { - "epoch": 0.75, - "learning_rate": 0.0001880057110856612, - "loss": 0.0152, + "epoch": 0.38, + "learning_rate": 0.00024245828591869478, + "loss": 0.0167, "step": 147990 }, { - "epoch": 0.75, - "learning_rate": 0.00018799814339264721, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.00024245439770232332, + "loss": 0.0176, "step": 148000 }, { - "epoch": 0.75, - "eval_cer": 0.9144741374876638, - "eval_loss": 0.009097721427679062, - "eval_runtime": 116.6762, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.38, + "eval_cer": 0.881782465628416, + "eval_loss": 0.013744070194661617, + "eval_runtime": 107.4219, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.655, "step": 148000 }, { - "epoch": 0.75, - "learning_rate": 0.0001879905756996332, - "loss": 0.016, + "epoch": 0.38, + "learning_rate": 0.00024245050948595184, + "loss": 0.0171, "step": 148010 }, { - "epoch": 0.75, - "learning_rate": 0.00018798300800661918, - "loss": 0.0138, + "epoch": 0.38, + "learning_rate": 0.00024244662126958038, + "loss": 0.0143, "step": 148020 }, { - "epoch": 0.75, - "learning_rate": 0.00018797544031360519, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024244273305320895, + "loss": 0.0181, "step": 148030 }, { - "epoch": 0.75, - "learning_rate": 0.00018796787262059117, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024243884483683746, + "loss": 0.0167, "step": 148040 }, { - "epoch": 0.75, - "learning_rate": 0.00018796030492757715, - "loss": 0.0167, + "epoch": 0.38, + "learning_rate": 0.000242434956620466, + "loss": 0.0174, "step": 148050 }, { - "epoch": 0.75, - "learning_rate": 0.00018795273723456316, - "loss": 0.0175, + "epoch": 0.38, + "learning_rate": 0.00024243106840409452, + "loss": 0.0236, "step": 148060 }, { - "epoch": 0.75, - "learning_rate": 0.00018794516954154914, - "loss": 0.0136, + "epoch": 0.38, + "learning_rate": 0.0002424271801877231, + "loss": 0.0184, "step": 148070 }, { - "epoch": 0.75, - "learning_rate": 0.00018793760184853512, - "loss": 0.0129, + "epoch": 0.38, + "learning_rate": 0.0002424232919713516, + "loss": 0.0193, "step": 148080 }, { - "epoch": 0.75, - "learning_rate": 0.0001879300341555211, - "loss": 0.0146, + "epoch": 0.38, + "learning_rate": 0.00024241940375498014, + "loss": 0.0216, "step": 148090 }, { - "epoch": 0.75, - "learning_rate": 0.0001879224664625071, - "loss": 0.0162, + "epoch": 0.38, + "learning_rate": 0.00024241551553860866, + "loss": 0.021, "step": 148100 }, { - "epoch": 0.75, - "learning_rate": 0.0001879148987694931, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024241162732223723, + "loss": 0.0228, "step": 148110 }, { - "epoch": 0.75, - "learning_rate": 0.00018790733107647907, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024240773910586574, + "loss": 0.0188, "step": 148120 }, { - "epoch": 0.75, - "learning_rate": 0.00018789976338346508, - "loss": 0.0124, + "epoch": 0.38, + "learning_rate": 0.00024240385088949428, + "loss": 0.0199, "step": 148130 }, { - "epoch": 0.75, - "learning_rate": 0.00018789219569045106, - "loss": 0.0112, + "epoch": 0.38, + "learning_rate": 0.0002423999626731228, + "loss": 0.0226, "step": 148140 }, { - "epoch": 0.75, - "learning_rate": 0.00018788462799743704, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024239607445675134, + "loss": 0.0202, "step": 148150 }, { - "epoch": 0.75, - "learning_rate": 0.00018787706030442305, - "loss": 0.0113, + "epoch": 0.38, + "learning_rate": 0.00024239218624037988, + "loss": 0.0192, "step": 148160 }, { - "epoch": 0.75, - "learning_rate": 0.00018786949261140903, - "loss": 0.0106, + "epoch": 0.38, + "learning_rate": 0.00024238829802400842, + "loss": 0.0168, "step": 148170 }, { - "epoch": 0.75, - "learning_rate": 0.00018786192491839502, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.00024238440980763694, + "loss": 0.019, "step": 148180 }, { - "epoch": 0.75, - "learning_rate": 0.00018785435722538102, - "loss": 0.013, + "epoch": 0.38, + "learning_rate": 0.00024238052159126548, + "loss": 0.0228, "step": 148190 }, { - "epoch": 0.75, - "learning_rate": 0.000187846789532367, - "loss": 0.0164, + "epoch": 0.38, + "learning_rate": 0.00024237663337489405, + "loss": 0.0206, "step": 148200 }, { - "epoch": 0.75, - "learning_rate": 0.000187839221839353, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.00024237274515852256, + "loss": 0.0192, "step": 148210 }, { - "epoch": 0.75, - "learning_rate": 0.000187831654146339, - "loss": 0.017, + "epoch": 0.38, + "learning_rate": 0.00024236885694215108, + "loss": 0.0248, "step": 148220 }, { - "epoch": 0.75, - "learning_rate": 0.00018782408645332498, - "loss": 0.015, + "epoch": 0.38, + "learning_rate": 0.00024236496872577962, + "loss": 0.025, "step": 148230 }, { - "epoch": 0.75, - "learning_rate": 0.00018781651876031096, - "loss": 0.0115, + "epoch": 0.38, + "learning_rate": 0.0002423610805094082, + "loss": 0.0178, "step": 148240 }, { - "epoch": 0.75, - "learning_rate": 0.00018780895106729694, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.0002423571922930367, + "loss": 0.0205, "step": 148250 }, { - "epoch": 0.75, - "learning_rate": 0.00018780138337428295, - "loss": 0.0139, + "epoch": 0.38, + "learning_rate": 0.00024235330407666524, + "loss": 0.0227, "step": 148260 }, { - "epoch": 0.75, - "learning_rate": 0.00018779381568126893, - "loss": 0.0115, + "epoch": 0.38, + "learning_rate": 0.00024234941586029376, + "loss": 0.0205, "step": 148270 }, { - "epoch": 0.75, - "learning_rate": 0.0001877862479882549, - "loss": 0.0128, + "epoch": 0.38, + "learning_rate": 0.00024234552764392233, + "loss": 0.0186, "step": 148280 }, { - "epoch": 0.75, - "learning_rate": 0.00018777868029524092, - "loss": 0.0121, + "epoch": 0.38, + "learning_rate": 0.00024234163942755084, + "loss": 0.0214, "step": 148290 }, { - "epoch": 0.75, - "learning_rate": 0.0001877711126022269, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024233775121117938, + "loss": 0.0202, "step": 148300 }, { - "epoch": 0.75, - "learning_rate": 0.00018776354490921288, - "loss": 0.0091, + "epoch": 0.38, + "learning_rate": 0.0002423338629948079, + "loss": 0.0185, "step": 148310 }, { - "epoch": 0.75, - "learning_rate": 0.0001877559772161989, - "loss": 0.0105, + "epoch": 0.38, + "learning_rate": 0.00024232997477843647, + "loss": 0.0241, "step": 148320 }, { - "epoch": 0.75, - "learning_rate": 0.00018774840952318487, - "loss": 0.0131, + "epoch": 0.38, + "learning_rate": 0.00024232608656206498, + "loss": 0.0224, "step": 148330 }, { - "epoch": 0.75, - "learning_rate": 0.00018774084183017085, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.00024232219834569352, + "loss": 0.0219, "step": 148340 }, { - "epoch": 0.75, - "learning_rate": 0.00018773327413715686, - "loss": 0.0142, + "epoch": 0.38, + "learning_rate": 0.00024231831012932204, + "loss": 0.0234, "step": 148350 }, { - "epoch": 0.75, - "learning_rate": 0.00018772570644414284, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.0002423144219129506, + "loss": 0.023, "step": 148360 }, { - "epoch": 0.75, - "learning_rate": 0.00018771813875112883, - "loss": 0.0122, + "epoch": 0.38, + "learning_rate": 0.00024231053369657915, + "loss": 0.0174, "step": 148370 }, { - "epoch": 0.75, - "learning_rate": 0.00018771057105811483, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.00024230664548020766, + "loss": 0.0254, "step": 148380 }, { - "epoch": 0.75, - "learning_rate": 0.00018770300336510082, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024230275726383618, + "loss": 0.0168, "step": 148390 }, { - "epoch": 0.75, - "learning_rate": 0.0001876954356720868, - "loss": 0.0158, + "epoch": 0.38, + "learning_rate": 0.00024229886904746472, + "loss": 0.0212, "step": 148400 }, { - "epoch": 0.75, - "learning_rate": 0.0001876878679790728, - "loss": 0.0137, + "epoch": 0.38, + "learning_rate": 0.0002422949808310933, + "loss": 0.023, "step": 148410 }, { - "epoch": 0.75, - "learning_rate": 0.0001876803002860588, - "loss": 0.0114, + "epoch": 0.38, + "learning_rate": 0.0002422910926147218, + "loss": 0.02, "step": 148420 }, { - "epoch": 0.75, - "learning_rate": 0.00018767273259304477, - "loss": 0.0125, + "epoch": 0.38, + "learning_rate": 0.00024228720439835034, + "loss": 0.0161, "step": 148430 }, { - "epoch": 0.75, - "learning_rate": 0.00018766516490003075, - "loss": 0.0134, + "epoch": 0.38, + "learning_rate": 0.00024228331618197886, + "loss": 0.0205, "step": 148440 }, { - "epoch": 0.75, - "learning_rate": 0.00018765759720701676, - "loss": 0.0123, + "epoch": 0.38, + "learning_rate": 0.00024227942796560743, + "loss": 0.0217, "step": 148450 }, { - "epoch": 0.75, - "learning_rate": 0.00018765002951400274, - "loss": 0.0112, + "epoch": 0.38, + "learning_rate": 0.00024227553974923594, + "loss": 0.0225, "step": 148460 }, { - "epoch": 0.75, - "learning_rate": 0.00018764246182098872, - "loss": 0.0111, + "epoch": 0.38, + "learning_rate": 0.00024227165153286448, + "loss": 0.0183, "step": 148470 }, { - "epoch": 0.75, - "learning_rate": 0.00018763489412797473, - "loss": 0.012, + "epoch": 0.38, + "learning_rate": 0.000242267763316493, + "loss": 0.0182, "step": 148480 }, { - "epoch": 0.75, - "learning_rate": 0.0001876273264349607, - "loss": 0.0116, + "epoch": 0.38, + "learning_rate": 0.00024226387510012157, + "loss": 0.0218, "step": 148490 }, { - "epoch": 0.75, - "learning_rate": 0.0001876197587419467, - "loss": 0.0145, + "epoch": 0.38, + "learning_rate": 0.00024225998688375008, + "loss": 0.0204, "step": 148500 }, { - "epoch": 0.75, - "learning_rate": 0.0001876121910489327, - "loss": 0.0133, + "epoch": 0.38, + "learning_rate": 0.00024225609866737862, + "loss": 0.019, "step": 148510 }, { - "epoch": 0.75, - "learning_rate": 0.00018760462335591868, - "loss": 0.011, + "epoch": 0.38, + "learning_rate": 0.00024225221045100714, + "loss": 0.0203, "step": 148520 }, { - "epoch": 0.75, - "learning_rate": 0.00018759705566290466, - "loss": 0.0161, + "epoch": 0.39, + "learning_rate": 0.0002422483222346357, + "loss": 0.0201, "step": 148530 }, { - "epoch": 0.75, - "learning_rate": 0.00018758948796989067, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024224443401826422, + "loss": 0.0154, "step": 148540 }, { - "epoch": 0.75, - "learning_rate": 0.00018758192027687665, - "loss": 0.0102, + "epoch": 0.39, + "learning_rate": 0.00024224054580189276, + "loss": 0.0182, "step": 148550 }, { - "epoch": 0.75, - "learning_rate": 0.00018757435258386264, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024223665758552128, + "loss": 0.022, "step": 148560 }, { - "epoch": 0.75, - "learning_rate": 0.00018756678489084864, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024223276936914984, + "loss": 0.0198, "step": 148570 }, { - "epoch": 0.75, - "learning_rate": 0.00018755921719783463, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024222888115277839, + "loss": 0.0213, "step": 148580 }, { - "epoch": 0.75, - "learning_rate": 0.0001875516495048206, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.0002422249929364069, + "loss": 0.0234, "step": 148590 }, { - "epoch": 0.75, - "learning_rate": 0.0001875440818118066, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024222110472003544, + "loss": 0.0174, "step": 148600 }, { - "epoch": 0.75, - "learning_rate": 0.0001875365141187926, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024221721650366398, + "loss": 0.018, "step": 148610 }, { - "epoch": 0.75, - "learning_rate": 0.00018752894642577858, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024221332828729253, + "loss": 0.0184, "step": 148620 }, { - "epoch": 0.75, - "learning_rate": 0.00018752137873276456, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024220944007092104, + "loss": 0.0233, "step": 148630 }, { - "epoch": 0.75, - "learning_rate": 0.00018751381103975057, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024220555185454958, + "loss": 0.0187, "step": 148640 }, { - "epoch": 0.75, - "learning_rate": 0.00018750624334673655, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002422016636381781, + "loss": 0.0177, "step": 148650 }, { - "epoch": 0.75, - "learning_rate": 0.00018749867565372253, - "loss": 0.0177, + "epoch": 0.39, + "learning_rate": 0.00024219777542180667, + "loss": 0.02, "step": 148660 }, { - "epoch": 0.75, - "learning_rate": 0.00018749110796070854, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024219388720543518, + "loss": 0.0184, "step": 148670 }, { - "epoch": 0.75, - "learning_rate": 0.00018748354026769452, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.00024218999898906372, + "loss": 0.0229, "step": 148680 }, { - "epoch": 0.75, - "learning_rate": 0.0001874759725746805, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024218611077269224, + "loss": 0.0194, "step": 148690 }, { - "epoch": 0.75, - "learning_rate": 0.0001874684048816665, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.0002421822225563208, + "loss": 0.0246, "step": 148700 }, { - "epoch": 0.75, - "learning_rate": 0.0001874608371886525, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024217833433994932, + "loss": 0.0209, "step": 148710 }, { - "epoch": 0.75, - "learning_rate": 0.00018745326949563847, - "loss": 0.0102, + "epoch": 0.39, + "learning_rate": 0.00024217444612357786, + "loss": 0.019, "step": 148720 }, { - "epoch": 0.75, - "learning_rate": 0.00018744570180262448, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.00024217055790720638, + "loss": 0.0242, "step": 148730 }, { - "epoch": 0.75, - "learning_rate": 0.00018743813410961046, - "loss": 0.0094, + "epoch": 0.39, + "learning_rate": 0.00024216666969083494, + "loss": 0.0198, "step": 148740 }, { - "epoch": 0.75, - "learning_rate": 0.00018743056641659645, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024216278147446349, + "loss": 0.0239, "step": 148750 }, { - "epoch": 0.75, - "learning_rate": 0.00018742299872358243, - "loss": 0.011, + "epoch": 0.39, + "learning_rate": 0.000242158893258092, + "loss": 0.0196, "step": 148760 }, { - "epoch": 0.75, - "learning_rate": 0.00018741543103056844, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024215500504172054, + "loss": 0.0171, "step": 148770 }, { - "epoch": 0.75, - "learning_rate": 0.00018740786333755442, - "loss": 0.0189, + "epoch": 0.39, + "learning_rate": 0.00024215111682534908, + "loss": 0.0198, "step": 148780 }, { - "epoch": 0.75, - "learning_rate": 0.0001874002956445404, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.00024214722860897763, + "loss": 0.0196, "step": 148790 }, { - "epoch": 0.75, - "learning_rate": 0.0001873927279515264, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024214334039260614, + "loss": 0.0163, "step": 148800 }, { - "epoch": 0.75, - "learning_rate": 0.0001873851602585124, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024213945217623468, + "loss": 0.0217, "step": 148810 }, { - "epoch": 0.75, - "learning_rate": 0.00018737759256549837, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024213556395986322, + "loss": 0.0201, "step": 148820 }, { - "epoch": 0.75, - "learning_rate": 0.00018737002487248438, - "loss": 0.0098, + "epoch": 0.39, + "learning_rate": 0.00024213167574349176, + "loss": 0.0173, "step": 148830 }, { - "epoch": 0.75, - "learning_rate": 0.00018736245717947036, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024212778752712028, + "loss": 0.0146, "step": 148840 }, { - "epoch": 0.75, - "learning_rate": 0.00018735488948645634, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024212389931074882, + "loss": 0.0231, "step": 148850 }, { - "epoch": 0.75, - "learning_rate": 0.00018734732179344235, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024212001109437736, + "loss": 0.0252, "step": 148860 }, { - "epoch": 0.75, - "learning_rate": 0.00018733975410042833, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.0002421161228780059, + "loss": 0.0196, "step": 148870 }, { - "epoch": 0.75, - "learning_rate": 0.0001873321864074143, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024211223466163442, + "loss": 0.0187, "step": 148880 }, { - "epoch": 0.75, - "learning_rate": 0.00018732461871440032, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024210834644526296, + "loss": 0.0165, "step": 148890 }, { - "epoch": 0.75, - "learning_rate": 0.0001873170510213863, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024210445822889147, + "loss": 0.0169, "step": 148900 }, { - "epoch": 0.75, - "learning_rate": 0.00018730948332837228, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024210057001252004, + "loss": 0.0169, "step": 148910 }, { - "epoch": 0.75, - "learning_rate": 0.00018730191563535827, - "loss": 0.0228, + "epoch": 0.39, + "learning_rate": 0.00024209668179614859, + "loss": 0.0189, "step": 148920 }, { - "epoch": 0.75, - "learning_rate": 0.00018729434794234427, - "loss": 0.0132, + "epoch": 0.39, + "learning_rate": 0.0002420927935797771, + "loss": 0.0217, "step": 148930 }, { - "epoch": 0.75, - "learning_rate": 0.00018728678024933026, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024208890536340561, + "loss": 0.0185, "step": 148940 }, { - "epoch": 0.75, - "learning_rate": 0.0001872792125563162, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024208501714703418, + "loss": 0.0166, "step": 148950 }, { - "epoch": 0.75, - "learning_rate": 0.00018727164486330222, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024208112893066272, + "loss": 0.0183, "step": 148960 }, { - "epoch": 0.75, - "learning_rate": 0.0001872640771702882, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024207724071429124, + "loss": 0.0195, "step": 148970 }, { - "epoch": 0.75, - "learning_rate": 0.00018725650947727418, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024207335249791978, + "loss": 0.0149, "step": 148980 }, { - "epoch": 0.75, - "learning_rate": 0.00018724894178426016, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024206946428154832, + "loss": 0.0185, "step": 148990 }, { - "epoch": 0.75, - "learning_rate": 0.00018724137409124617, - "loss": 0.019, + "epoch": 0.39, + "learning_rate": 0.00024206557606517686, + "loss": 0.0198, "step": 149000 }, { - "epoch": 0.75, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.009037774056196213, - "eval_runtime": 116.6835, - "eval_samples_per_second": 17.14, - "eval_steps_per_second": 4.285, + "epoch": 0.39, + "eval_cer": 0.8817642703482717, + "eval_loss": 0.013767913915216923, + "eval_runtime": 107.1271, + "eval_samples_per_second": 18.669, + "eval_steps_per_second": 4.667, "step": 149000 }, { - "epoch": 0.75, - "learning_rate": 0.00018723380639823215, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024206168784880538, + "loss": 0.0155, "step": 149010 }, { - "epoch": 0.75, - "learning_rate": 0.00018722623870521813, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024205779963243392, + "loss": 0.0183, "step": 149020 }, { - "epoch": 0.75, - "learning_rate": 0.00018721867101220414, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024205391141606246, + "loss": 0.0186, "step": 149030 }, { - "epoch": 0.75, - "learning_rate": 0.00018721110331919012, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.000242050023199691, + "loss": 0.0151, "step": 149040 }, { - "epoch": 0.75, - "learning_rate": 0.0001872035356261761, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.00024204613498331952, + "loss": 0.0163, "step": 149050 }, { - "epoch": 0.75, - "learning_rate": 0.00018719596793316211, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024204224676694806, + "loss": 0.025, "step": 149060 }, { - "epoch": 0.75, - "learning_rate": 0.0001871884002401481, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.00024203835855057663, + "loss": 0.0172, "step": 149070 }, { - "epoch": 0.75, - "learning_rate": 0.00018718083254713408, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.00024203447033420514, + "loss": 0.0188, "step": 149080 }, { - "epoch": 0.75, - "learning_rate": 0.00018717326485412009, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.00024203058211783368, + "loss": 0.0281, "step": 149090 }, { - "epoch": 0.75, - "learning_rate": 0.00018716569716110607, - "loss": 0.0153, + "epoch": 0.39, + "learning_rate": 0.0002420266939014622, + "loss": 0.0243, "step": 149100 }, { - "epoch": 0.75, - "learning_rate": 0.00018715812946809205, - "loss": 0.0154, + "epoch": 0.39, + "learning_rate": 0.00024202280568509077, + "loss": 0.0232, "step": 149110 }, { - "epoch": 0.75, - "learning_rate": 0.00018715056177507806, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024201891746871928, + "loss": 0.017, "step": 149120 }, { - "epoch": 0.75, - "learning_rate": 0.00018714299408206404, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024201502925234782, + "loss": 0.0256, "step": 149130 }, { - "epoch": 0.75, - "learning_rate": 0.00018713542638905002, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024201114103597634, + "loss": 0.0198, "step": 149140 }, { - "epoch": 0.75, - "learning_rate": 0.000187127858696036, - "loss": 0.0185, + "epoch": 0.39, + "learning_rate": 0.00024200725281960488, + "loss": 0.0237, "step": 149150 }, { - "epoch": 0.75, - "learning_rate": 0.000187120291003022, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024200336460323342, + "loss": 0.0184, "step": 149160 }, { - "epoch": 0.75, - "learning_rate": 0.000187112723310008, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024199947638686196, + "loss": 0.0187, "step": 149170 }, { - "epoch": 0.75, - "learning_rate": 0.00018710515561699397, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024199558817049048, + "loss": 0.0193, "step": 149180 }, { - "epoch": 0.75, - "learning_rate": 0.00018709758792397998, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024199169995411902, + "loss": 0.017, "step": 149190 }, { - "epoch": 0.75, - "learning_rate": 0.00018709002023096596, - "loss": 0.0101, + "epoch": 0.39, + "learning_rate": 0.00024198781173774756, + "loss": 0.0265, "step": 149200 }, { - "epoch": 0.75, - "learning_rate": 0.00018708245253795194, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.0002419839235213761, + "loss": 0.022, "step": 149210 }, { - "epoch": 0.75, - "learning_rate": 0.00018707488484493795, - "loss": 0.0132, + "epoch": 0.39, + "learning_rate": 0.00024198003530500462, + "loss": 0.0174, "step": 149220 }, { - "epoch": 0.75, - "learning_rate": 0.00018706731715192393, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.00024197614708863316, + "loss": 0.016, "step": 149230 }, { - "epoch": 0.75, - "learning_rate": 0.00018705974945890992, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024197225887226173, + "loss": 0.0184, "step": 149240 }, { - "epoch": 0.75, - "learning_rate": 0.00018705218176589592, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.00024196837065589024, + "loss": 0.0168, "step": 149250 }, { - "epoch": 0.75, - "learning_rate": 0.0001870446140728819, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024196448243951876, + "loss": 0.0184, "step": 149260 }, { - "epoch": 0.75, - "learning_rate": 0.0001870370463798679, - "loss": 0.011, + "epoch": 0.39, + "learning_rate": 0.0002419605942231473, + "loss": 0.0174, "step": 149270 }, { - "epoch": 0.75, - "learning_rate": 0.0001870294786868539, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024195670600677587, + "loss": 0.0175, "step": 149280 }, { - "epoch": 0.75, - "learning_rate": 0.00018702191099383988, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024195281779040438, + "loss": 0.0159, "step": 149290 }, { - "epoch": 0.75, - "learning_rate": 0.00018701434330082586, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024194892957403292, + "loss": 0.0197, "step": 149300 }, { - "epoch": 0.75, - "learning_rate": 0.00018700677560781184, - "loss": 0.0155, + "epoch": 0.39, + "learning_rate": 0.00024194504135766144, + "loss": 0.0186, "step": 149310 }, { - "epoch": 0.75, - "learning_rate": 0.00018699920791479785, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024194115314129, + "loss": 0.0207, "step": 149320 }, { - "epoch": 0.75, - "learning_rate": 0.00018699164022178383, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024193726492491852, + "loss": 0.0241, "step": 149330 }, { - "epoch": 0.75, - "learning_rate": 0.0001869840725287698, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024193337670854706, + "loss": 0.0191, "step": 149340 }, { - "epoch": 0.75, - "learning_rate": 0.00018697650483575582, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.00024192948849217558, + "loss": 0.017, "step": 149350 }, { - "epoch": 0.75, - "learning_rate": 0.0001869689371427418, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024192560027580415, + "loss": 0.0164, "step": 149360 }, { - "epoch": 0.75, - "learning_rate": 0.00018696136944972778, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024192171205943266, + "loss": 0.02, "step": 149370 }, { - "epoch": 0.75, - "learning_rate": 0.0001869538017567138, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.0002419178238430612, + "loss": 0.0229, "step": 149380 }, { - "epoch": 0.75, - "learning_rate": 0.00018694623406369977, - "loss": 0.0155, + "epoch": 0.39, + "learning_rate": 0.00024191393562668972, + "loss": 0.0206, "step": 149390 }, { - "epoch": 0.75, - "learning_rate": 0.00018693866637068575, - "loss": 0.0161, + "epoch": 0.39, + "learning_rate": 0.00024191004741031826, + "loss": 0.0176, "step": 149400 }, { - "epoch": 0.75, - "learning_rate": 0.00018693109867767176, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.0002419061591939468, + "loss": 0.0216, "step": 149410 }, { - "epoch": 0.75, - "learning_rate": 0.00018692353098465774, - "loss": 0.0132, + "epoch": 0.39, + "learning_rate": 0.00024190227097757534, + "loss": 0.0219, "step": 149420 }, { - "epoch": 0.75, - "learning_rate": 0.00018691596329164373, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024189838276120386, + "loss": 0.0126, "step": 149430 }, { - "epoch": 0.75, - "learning_rate": 0.00018690839559862973, - "loss": 0.018, + "epoch": 0.39, + "learning_rate": 0.0002418944945448324, + "loss": 0.0185, "step": 149440 }, { - "epoch": 0.75, - "learning_rate": 0.00018690082790561572, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.00024189060632846097, + "loss": 0.0169, "step": 149450 }, { - "epoch": 0.75, - "learning_rate": 0.0001868932602126017, - "loss": 0.0142, + "epoch": 0.39, + "learning_rate": 0.00024188671811208948, + "loss": 0.0228, "step": 149460 }, { - "epoch": 0.75, - "learning_rate": 0.0001868856925195877, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024188282989571802, + "loss": 0.0179, "step": 149470 }, { - "epoch": 0.75, - "learning_rate": 0.0001868781248265737, - "loss": 0.0095, + "epoch": 0.39, + "learning_rate": 0.00024187894167934654, + "loss": 0.0179, "step": 149480 }, { - "epoch": 0.75, - "learning_rate": 0.00018687055713355967, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.0002418750534629751, + "loss": 0.0213, "step": 149490 }, { - "epoch": 0.75, - "learning_rate": 0.00018686298944054565, - "loss": 0.0162, + "epoch": 0.39, + "learning_rate": 0.00024187116524660362, + "loss": 0.0188, "step": 149500 }, { - "epoch": 0.75, - "learning_rate": 0.00018685542174753166, - "loss": 0.0174, + "epoch": 0.39, + "learning_rate": 0.00024186727703023216, + "loss": 0.0229, "step": 149510 }, { - "epoch": 0.75, - "learning_rate": 0.00018684785405451764, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024186338881386068, + "loss": 0.018, "step": 149520 }, { - "epoch": 0.75, - "learning_rate": 0.00018684028636150362, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024185950059748925, + "loss": 0.0181, "step": 149530 }, { - "epoch": 0.75, - "learning_rate": 0.00018683271866848963, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024185561238111776, + "loss": 0.024, "step": 149540 }, { - "epoch": 0.75, - "learning_rate": 0.0001868251509754756, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.0002418517241647463, + "loss": 0.0189, "step": 149550 }, { - "epoch": 0.75, - "learning_rate": 0.0001868175832824616, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024184783594837482, + "loss": 0.0158, "step": 149560 }, { - "epoch": 0.75, - "learning_rate": 0.0001868100155894476, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.00024184394773200339, + "loss": 0.0213, "step": 149570 }, { - "epoch": 0.75, - "learning_rate": 0.00018680244789643358, - "loss": 0.0095, + "epoch": 0.39, + "learning_rate": 0.0002418400595156319, + "loss": 0.017, "step": 149580 }, { - "epoch": 0.75, - "learning_rate": 0.00018679488020341956, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024183617129926044, + "loss": 0.0161, "step": 149590 }, { - "epoch": 0.75, - "learning_rate": 0.00018678731251040557, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024183228308288896, + "loss": 0.0158, "step": 149600 }, { - "epoch": 0.75, - "learning_rate": 0.00018677974481739155, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.0002418283948665175, + "loss": 0.0202, "step": 149610 }, { - "epoch": 0.75, - "learning_rate": 0.00018677217712437754, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024182450665014607, + "loss": 0.0202, "step": 149620 }, { - "epoch": 0.75, - "learning_rate": 0.00018676460943136354, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024182061843377458, + "loss": 0.0172, "step": 149630 }, { - "epoch": 0.75, - "learning_rate": 0.00018675704173834953, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024181673021740312, + "loss": 0.0196, "step": 149640 }, { - "epoch": 0.76, - "learning_rate": 0.0001867494740453355, - "loss": 0.0172, + "epoch": 0.39, + "learning_rate": 0.00024181284200103164, + "loss": 0.0196, "step": 149650 }, { - "epoch": 0.76, - "learning_rate": 0.0001867419063523215, - "loss": 0.0099, + "epoch": 0.39, + "learning_rate": 0.0002418089537846602, + "loss": 0.018, "step": 149660 }, { - "epoch": 0.76, - "learning_rate": 0.0001867343386593075, - "loss": 0.0109, + "epoch": 0.39, + "learning_rate": 0.00024180506556828872, + "loss": 0.0191, "step": 149670 }, { - "epoch": 0.76, - "learning_rate": 0.00018672677096629348, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024180117735191726, + "loss": 0.0201, "step": 149680 }, { - "epoch": 0.76, - "learning_rate": 0.00018671920327327946, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024179728913554578, + "loss": 0.0196, "step": 149690 }, { - "epoch": 0.76, - "learning_rate": 0.00018671163558026547, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024179340091917435, + "loss": 0.0182, "step": 149700 }, { - "epoch": 0.76, - "learning_rate": 0.00018670406788725145, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.00024178951270280286, + "loss": 0.0198, "step": 149710 }, { - "epoch": 0.76, - "learning_rate": 0.00018669650019423743, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.0002417856244864314, + "loss": 0.017, "step": 149720 }, { - "epoch": 0.76, - "learning_rate": 0.00018668893250122344, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024178173627005992, + "loss": 0.0162, "step": 149730 }, { - "epoch": 0.76, - "learning_rate": 0.00018668136480820942, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024177784805368848, + "loss": 0.0191, "step": 149740 }, { - "epoch": 0.76, - "learning_rate": 0.0001866737971151954, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.000241773959837317, + "loss": 0.0194, "step": 149750 }, { - "epoch": 0.76, - "learning_rate": 0.0001866662294221814, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024177007162094554, + "loss": 0.0212, "step": 149760 }, { - "epoch": 0.76, - "learning_rate": 0.0001866586617291674, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024176618340457406, + "loss": 0.0174, "step": 149770 }, { - "epoch": 0.76, - "learning_rate": 0.00018665109403615337, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024176229518820262, + "loss": 0.0209, "step": 149780 }, { - "epoch": 0.76, - "learning_rate": 0.00018664352634313938, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024175840697183117, + "loss": 0.0157, "step": 149790 }, { - "epoch": 0.76, - "learning_rate": 0.00018663595865012536, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024175451875545968, + "loss": 0.0183, "step": 149800 }, { - "epoch": 0.76, - "learning_rate": 0.00018662839095711135, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.0002417506305390882, + "loss": 0.0174, "step": 149810 }, { - "epoch": 0.76, - "learning_rate": 0.00018662082326409733, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024174674232271676, + "loss": 0.019, "step": 149820 }, { - "epoch": 0.76, - "learning_rate": 0.00018661325557108334, - "loss": 0.0165, + "epoch": 0.39, + "learning_rate": 0.0002417428541063453, + "loss": 0.0222, "step": 149830 }, { - "epoch": 0.76, - "learning_rate": 0.00018660568787806932, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024173896588997382, + "loss": 0.0179, "step": 149840 }, { - "epoch": 0.76, - "learning_rate": 0.0001865981201850553, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024173507767360236, + "loss": 0.0152, "step": 149850 }, { - "epoch": 0.76, - "learning_rate": 0.0001865905524920413, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024173118945723088, + "loss": 0.0192, "step": 149860 }, { - "epoch": 0.76, - "learning_rate": 0.0001865829847990273, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024172730124085944, + "loss": 0.0188, "step": 149870 }, { - "epoch": 0.76, - "learning_rate": 0.00018657541710601327, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.00024172341302448796, + "loss": 0.0205, "step": 149880 }, { - "epoch": 0.76, - "learning_rate": 0.00018656784941299928, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.0002417195248081165, + "loss": 0.0219, "step": 149890 }, { - "epoch": 0.76, - "learning_rate": 0.00018656028171998526, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024171563659174502, + "loss": 0.0183, "step": 149900 }, { - "epoch": 0.76, - "learning_rate": 0.00018655271402697124, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024171174837537358, + "loss": 0.0199, "step": 149910 }, { - "epoch": 0.76, - "learning_rate": 0.00018654514633395725, - "loss": 0.0161, + "epoch": 0.39, + "learning_rate": 0.0002417078601590021, + "loss": 0.0219, "step": 149920 }, { - "epoch": 0.76, - "learning_rate": 0.00018653757864094323, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024170397194263064, + "loss": 0.0151, "step": 149930 }, { - "epoch": 0.76, - "learning_rate": 0.0001865300109479292, + "epoch": 0.39, + "learning_rate": 0.00024170008372625915, "loss": 0.0218, "step": 149940 }, { - "epoch": 0.76, - "learning_rate": 0.00018652244325491522, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024169619550988772, + "loss": 0.0186, "step": 149950 }, { - "epoch": 0.76, - "learning_rate": 0.0001865148755619012, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024169230729351627, + "loss": 0.0194, "step": 149960 }, { - "epoch": 0.76, - "learning_rate": 0.00018650730786888718, - "loss": 0.0104, + "epoch": 0.39, + "learning_rate": 0.00024168841907714478, + "loss": 0.0216, "step": 149970 }, { - "epoch": 0.76, - "learning_rate": 0.0001864997401758732, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002416845308607733, + "loss": 0.0188, "step": 149980 }, { - "epoch": 0.76, - "learning_rate": 0.00018649217248285917, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024168064264440186, + "loss": 0.025, "step": 149990 }, { - "epoch": 0.76, - "learning_rate": 0.00018648460478984516, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.0002416767544280304, + "loss": 0.0238, "step": 150000 }, { - "epoch": 0.76, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.008926572278141975, - "eval_runtime": 116.0551, - "eval_samples_per_second": 17.233, - "eval_steps_per_second": 4.308, + "epoch": 0.39, + "eval_cer": 0.8817754674437451, + "eval_loss": 0.013502559624612331, + "eval_runtime": 107.4245, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.654, "step": 150000 }, { - "epoch": 0.76, - "learning_rate": 0.00018647703709683114, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024167286621165892, + "loss": 0.0176, "step": 150010 }, { - "epoch": 0.76, - "learning_rate": 0.00018646946940381715, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024166897799528746, + "loss": 0.0341, "step": 150020 }, { - "epoch": 0.76, - "learning_rate": 0.00018646190171080313, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.000241665089778916, + "loss": 0.0205, "step": 150030 }, { - "epoch": 0.76, - "learning_rate": 0.0001864543340177891, - "loss": 0.0109, + "epoch": 0.39, + "learning_rate": 0.00024166120156254454, + "loss": 0.0226, "step": 150040 }, { - "epoch": 0.76, - "learning_rate": 0.00018644676632477512, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.00024165731334617306, + "loss": 0.0161, "step": 150050 }, { - "epoch": 0.76, - "learning_rate": 0.0001864391986317611, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.0002416534251298016, + "loss": 0.0308, "step": 150060 }, { - "epoch": 0.76, - "learning_rate": 0.00018643163093874708, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.00024164953691343014, + "loss": 0.0184, "step": 150070 }, { - "epoch": 0.76, - "learning_rate": 0.0001864240632457331, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.00024164564869705868, + "loss": 0.0197, "step": 150080 }, { - "epoch": 0.76, - "learning_rate": 0.00018641649555271907, - "loss": 0.0102, + "epoch": 0.39, + "learning_rate": 0.0002416417604806872, + "loss": 0.0215, "step": 150090 }, { - "epoch": 0.76, - "learning_rate": 0.00018640892785970505, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024163787226431574, + "loss": 0.0169, "step": 150100 }, { - "epoch": 0.76, - "learning_rate": 0.00018640136016669106, - "loss": 0.0132, + "epoch": 0.39, + "learning_rate": 0.00024163398404794425, + "loss": 0.0251, "step": 150110 }, { - "epoch": 0.76, - "learning_rate": 0.00018639379247367704, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024163009583157282, + "loss": 0.0158, "step": 150120 }, { - "epoch": 0.76, - "learning_rate": 0.00018638622478066302, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024162620761520134, + "loss": 0.0179, "step": 150130 }, { - "epoch": 0.76, - "learning_rate": 0.00018637865708764903, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024162231939882988, + "loss": 0.0196, "step": 150140 }, { - "epoch": 0.76, - "learning_rate": 0.000186371089394635, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.0002416184311824584, + "loss": 0.0172, "step": 150150 }, { - "epoch": 0.76, - "learning_rate": 0.000186363521701621, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024161454296608696, + "loss": 0.0204, "step": 150160 }, { - "epoch": 0.76, - "learning_rate": 0.00018635595400860698, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.0002416106547497155, + "loss": 0.0239, "step": 150170 }, { - "epoch": 0.76, - "learning_rate": 0.00018634838631559298, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024160676653334402, + "loss": 0.0191, "step": 150180 }, { - "epoch": 0.76, - "learning_rate": 0.00018634081862257897, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.00024160287831697256, + "loss": 0.0205, "step": 150190 }, { - "epoch": 0.76, - "learning_rate": 0.00018633325092956492, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.0002415989901006011, + "loss": 0.0229, "step": 150200 }, { - "epoch": 0.76, - "learning_rate": 0.0001863256832365509, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024159510188422964, + "loss": 0.0258, "step": 150210 }, { - "epoch": 0.76, - "learning_rate": 0.0001863181155435369, - "loss": 0.0157, + "epoch": 0.39, + "learning_rate": 0.00024159121366785816, + "loss": 0.019, "step": 150220 }, { - "epoch": 0.76, - "learning_rate": 0.0001863105478505229, - "loss": 0.0153, + "epoch": 0.39, + "learning_rate": 0.0002415873254514867, + "loss": 0.0192, "step": 150230 }, { - "epoch": 0.76, - "learning_rate": 0.00018630298015750887, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024158343723511524, + "loss": 0.0186, "step": 150240 }, { - "epoch": 0.76, - "learning_rate": 0.00018629541246449488, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024157954901874378, + "loss": 0.0193, "step": 150250 }, { - "epoch": 0.76, - "learning_rate": 0.00018628784477148086, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.0002415756608023723, + "loss": 0.0212, "step": 150260 }, { - "epoch": 0.76, - "learning_rate": 0.00018628027707846684, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024157177258600084, + "loss": 0.0183, "step": 150270 }, { - "epoch": 0.76, - "learning_rate": 0.00018627270938545285, - "loss": 0.0164, + "epoch": 0.39, + "learning_rate": 0.0002415678843696294, + "loss": 0.0208, "step": 150280 }, { - "epoch": 0.76, - "learning_rate": 0.00018626514169243883, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024156399615325792, + "loss": 0.0169, "step": 150290 }, { - "epoch": 0.76, - "learning_rate": 0.00018625757399942482, - "loss": 0.0094, + "epoch": 0.39, + "learning_rate": 0.00024156010793688644, + "loss": 0.0193, "step": 150300 }, { - "epoch": 0.76, - "learning_rate": 0.00018625000630641082, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024155621972051498, + "loss": 0.017, "step": 150310 }, { - "epoch": 0.76, - "learning_rate": 0.0001862424386133968, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024155233150414355, + "loss": 0.0218, "step": 150320 }, { - "epoch": 0.76, - "learning_rate": 0.0001862348709203828, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024154844328777206, + "loss": 0.0178, "step": 150330 }, { - "epoch": 0.76, - "learning_rate": 0.0001862273032273688, - "loss": 0.0137, + "epoch": 0.39, + "learning_rate": 0.0002415445550714006, + "loss": 0.0217, "step": 150340 }, { - "epoch": 0.76, - "learning_rate": 0.00018621973553435478, - "loss": 0.0163, + "epoch": 0.39, + "learning_rate": 0.00024154066685502912, + "loss": 0.0173, "step": 150350 }, { - "epoch": 0.76, - "learning_rate": 0.00018621216784134076, - "loss": 0.0098, + "epoch": 0.39, + "learning_rate": 0.00024153677863865766, + "loss": 0.0231, "step": 150360 }, { - "epoch": 0.76, - "learning_rate": 0.00018620460014832677, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002415328904222862, + "loss": 0.0197, "step": 150370 }, { - "epoch": 0.76, - "learning_rate": 0.00018619703245531275, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024152900220591474, + "loss": 0.0168, "step": 150380 }, { - "epoch": 0.76, - "learning_rate": 0.00018618946476229873, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.00024152511398954326, + "loss": 0.0149, "step": 150390 }, { - "epoch": 0.76, - "learning_rate": 0.0001861818970692847, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.0002415212257731718, + "loss": 0.0185, "step": 150400 }, { - "epoch": 0.76, - "learning_rate": 0.00018617432937627072, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024151733755680034, + "loss": 0.016, "step": 150410 }, { - "epoch": 0.76, - "learning_rate": 0.0001861667616832567, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024151344934042888, + "loss": 0.0174, "step": 150420 }, { - "epoch": 0.76, - "learning_rate": 0.00018615919399024268, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.0002415095611240574, + "loss": 0.0171, "step": 150430 }, { - "epoch": 0.76, - "learning_rate": 0.0001861516262972287, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024150567290768594, + "loss": 0.0186, "step": 150440 }, { - "epoch": 0.76, - "learning_rate": 0.00018614405860421467, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024150178469131448, + "loss": 0.0182, "step": 150450 }, { - "epoch": 0.76, - "learning_rate": 0.00018613649091120066, - "loss": 0.0167, + "epoch": 0.39, + "learning_rate": 0.00024149789647494302, + "loss": 0.0171, "step": 150460 }, { - "epoch": 0.76, - "learning_rate": 0.00018612892321818666, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024149400825857154, + "loss": 0.0251, "step": 150470 }, { - "epoch": 0.76, - "learning_rate": 0.00018612135552517264, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024149012004220008, + "loss": 0.0246, "step": 150480 }, { - "epoch": 0.76, - "learning_rate": 0.00018611378783215863, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024148623182582865, + "loss": 0.0232, "step": 150490 }, { - "epoch": 0.76, - "learning_rate": 0.00018610622013914463, - "loss": 0.0169, + "epoch": 0.39, + "learning_rate": 0.00024148234360945716, + "loss": 0.0227, "step": 150500 }, { - "epoch": 0.76, - "learning_rate": 0.00018609865244613062, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002414784553930857, + "loss": 0.0206, "step": 150510 }, { - "epoch": 0.76, - "learning_rate": 0.0001860910847531166, - "loss": 0.0155, + "epoch": 0.39, + "learning_rate": 0.00024147456717671422, + "loss": 0.0205, "step": 150520 }, { - "epoch": 0.76, - "learning_rate": 0.0001860835170601026, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024147067896034279, + "loss": 0.0249, "step": 150530 }, { - "epoch": 0.76, - "learning_rate": 0.0001860759493670886, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.0002414667907439713, + "loss": 0.0168, "step": 150540 }, { - "epoch": 0.76, - "learning_rate": 0.00018606838167407457, - "loss": 0.0092, + "epoch": 0.39, + "learning_rate": 0.00024146290252759984, + "loss": 0.0191, "step": 150550 }, { - "epoch": 0.76, - "learning_rate": 0.00018606081398106055, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024145901431122836, + "loss": 0.0232, "step": 150560 }, { - "epoch": 0.76, - "learning_rate": 0.00018605324628804656, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024145512609485693, + "loss": 0.0203, "step": 150570 }, { - "epoch": 0.76, - "learning_rate": 0.00018604567859503254, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024145123787848544, + "loss": 0.015, "step": 150580 }, { - "epoch": 0.76, - "learning_rate": 0.00018603811090201852, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024144734966211398, + "loss": 0.0203, "step": 150590 }, { - "epoch": 0.76, - "learning_rate": 0.00018603054320900453, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.0002414434614457425, + "loss": 0.0185, "step": 150600 }, { - "epoch": 0.76, - "learning_rate": 0.0001860229755159905, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024143957322937104, + "loss": 0.019, "step": 150610 }, { - "epoch": 0.76, - "learning_rate": 0.0001860154078229765, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024143568501299958, + "loss": 0.0172, "step": 150620 }, { - "epoch": 0.76, - "learning_rate": 0.0001860078401299625, - "loss": 0.0148, + "epoch": 0.39, + "learning_rate": 0.00024143179679662812, + "loss": 0.0178, "step": 150630 }, { - "epoch": 0.76, - "learning_rate": 0.00018600027243694848, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024142790858025664, + "loss": 0.0204, "step": 150640 }, { - "epoch": 0.76, - "learning_rate": 0.00018599270474393447, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024142402036388518, + "loss": 0.0188, "step": 150650 }, { - "epoch": 0.76, - "learning_rate": 0.00018598513705092047, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.00024142013214751375, + "loss": 0.0201, "step": 150660 }, { - "epoch": 0.76, - "learning_rate": 0.00018597756935790646, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024141624393114226, + "loss": 0.0197, "step": 150670 }, { - "epoch": 0.76, - "learning_rate": 0.00018597000166489244, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.0002414123557147708, + "loss": 0.0191, "step": 150680 }, { - "epoch": 0.76, - "learning_rate": 0.00018596243397187845, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.00024140846749839932, + "loss": 0.0203, "step": 150690 }, { - "epoch": 0.76, - "learning_rate": 0.00018595486627886443, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024140457928202789, + "loss": 0.0189, "step": 150700 }, { - "epoch": 0.76, - "learning_rate": 0.0001859472985858504, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.0002414006910656564, + "loss": 0.0179, "step": 150710 }, { - "epoch": 0.76, - "learning_rate": 0.0001859397308928364, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024139680284928494, + "loss": 0.0175, "step": 150720 }, { - "epoch": 0.76, - "learning_rate": 0.0001859321631998224, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024139291463291346, + "loss": 0.019, "step": 150730 }, { - "epoch": 0.76, - "learning_rate": 0.00018592459550680838, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.00024138902641654202, + "loss": 0.0149, "step": 150740 }, { - "epoch": 0.76, - "learning_rate": 0.00018591702781379436, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024138513820017054, + "loss": 0.0164, "step": 150750 }, { - "epoch": 0.76, - "learning_rate": 0.00018590946012078037, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.00024138124998379908, + "loss": 0.019, "step": 150760 }, { - "epoch": 0.76, - "learning_rate": 0.00018590189242776635, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.0002413773617674276, + "loss": 0.0216, "step": 150770 }, { - "epoch": 0.76, - "learning_rate": 0.00018589432473475233, - "loss": 0.0138, + "epoch": 0.39, + "learning_rate": 0.00024137347355105616, + "loss": 0.0212, "step": 150780 }, { - "epoch": 0.76, - "learning_rate": 0.00018588675704173834, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024136958533468468, + "loss": 0.0181, "step": 150790 }, { - "epoch": 0.76, - "learning_rate": 0.00018587918934872432, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024136569711831322, + "loss": 0.0241, "step": 150800 }, { - "epoch": 0.76, - "learning_rate": 0.0001858716216557103, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024136180890194174, + "loss": 0.0173, "step": 150810 }, { - "epoch": 0.76, - "learning_rate": 0.0001858640539626963, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.0002413579206855703, + "loss": 0.0216, "step": 150820 }, { - "epoch": 0.76, - "learning_rate": 0.0001858564862696823, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.00024135403246919885, + "loss": 0.017, "step": 150830 }, { - "epoch": 0.76, - "learning_rate": 0.00018584891857666828, - "loss": 0.0104, + "epoch": 0.39, + "learning_rate": 0.00024135014425282736, + "loss": 0.029, "step": 150840 }, { - "epoch": 0.76, - "learning_rate": 0.00018584135088365428, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024134625603645587, + "loss": 0.0181, "step": 150850 }, { - "epoch": 0.76, - "learning_rate": 0.00018583378319064027, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024134236782008442, + "loss": 0.0198, "step": 150860 }, { - "epoch": 0.76, - "learning_rate": 0.00018582621549762625, - "loss": 0.0142, + "epoch": 0.39, + "learning_rate": 0.00024133847960371298, + "loss": 0.0212, "step": 150870 }, { - "epoch": 0.76, - "learning_rate": 0.00018581864780461226, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.0002413345913873415, + "loss": 0.0168, "step": 150880 }, { - "epoch": 0.76, - "learning_rate": 0.00018581108011159824, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024133070317097004, + "loss": 0.0203, "step": 150890 }, { - "epoch": 0.76, - "learning_rate": 0.00018580351241858422, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024132681495459856, + "loss": 0.0181, "step": 150900 }, { - "epoch": 0.76, - "learning_rate": 0.0001857959447255702, - "loss": 0.0147, + "epoch": 0.39, + "learning_rate": 0.00024132292673822712, + "loss": 0.0174, "step": 150910 }, { - "epoch": 0.76, - "learning_rate": 0.0001857883770325562, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024131903852185564, + "loss": 0.0264, "step": 150920 }, { - "epoch": 0.76, - "learning_rate": 0.0001857808093395422, - "loss": 0.0158, + "epoch": 0.39, + "learning_rate": 0.00024131515030548418, + "loss": 0.0209, "step": 150930 }, { - "epoch": 0.76, - "learning_rate": 0.00018577324164652817, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.0002413112620891127, + "loss": 0.0198, "step": 150940 }, { - "epoch": 0.76, - "learning_rate": 0.00018576567395351418, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024130737387274126, + "loss": 0.0142, "step": 150950 }, { - "epoch": 0.76, - "learning_rate": 0.00018575810626050016, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024130348565636978, + "loss": 0.0176, "step": 150960 }, { - "epoch": 0.76, - "learning_rate": 0.00018575053856748614, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024129959743999832, + "loss": 0.0168, "step": 150970 }, { - "epoch": 0.76, - "learning_rate": 0.00018574297087447215, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024129570922362683, + "loss": 0.0203, "step": 150980 }, { - "epoch": 0.76, - "learning_rate": 0.00018573540318145813, - "loss": 0.0116, + "epoch": 0.39, + "learning_rate": 0.0002412918210072554, + "loss": 0.0202, "step": 150990 }, { - "epoch": 0.76, - "learning_rate": 0.00018572783548844411, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024128793279088392, + "loss": 0.0206, "step": 151000 }, { - "epoch": 0.76, - "eval_cer": 0.9144760782799146, - "eval_loss": 0.00918071623891592, - "eval_runtime": 116.7205, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.39, + "eval_cer": 0.8817768670806793, + "eval_loss": 0.013644468039274216, + "eval_runtime": 107.4348, + "eval_samples_per_second": 18.616, + "eval_steps_per_second": 4.654, "step": 151000 }, { - "epoch": 0.76, - "learning_rate": 0.00018572026779543012, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024128404457451246, + "loss": 0.0214, "step": 151010 }, { - "epoch": 0.76, - "learning_rate": 0.0001857127001024161, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024128015635814097, + "loss": 0.0141, "step": 151020 }, { - "epoch": 0.76, - "learning_rate": 0.00018570513240940209, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024127626814176954, + "loss": 0.0167, "step": 151030 }, { - "epoch": 0.76, - "learning_rate": 0.0001856975647163881, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024127237992539808, + "loss": 0.0133, "step": 151040 }, { - "epoch": 0.76, - "learning_rate": 0.00018568999702337408, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.0002412684917090266, + "loss": 0.0183, "step": 151050 }, { - "epoch": 0.76, - "learning_rate": 0.00018568242933036006, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024126460349265514, + "loss": 0.0167, "step": 151060 }, { - "epoch": 0.76, - "learning_rate": 0.00018567486163734604, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024126071527628368, + "loss": 0.0179, "step": 151070 }, { - "epoch": 0.76, - "learning_rate": 0.00018566729394433205, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024125682705991222, + "loss": 0.0189, "step": 151080 }, { - "epoch": 0.76, - "learning_rate": 0.00018565972625131803, - "loss": 0.015, + "epoch": 0.39, + "learning_rate": 0.00024125293884354074, + "loss": 0.0177, "step": 151090 }, { - "epoch": 0.76, - "learning_rate": 0.000185652158558304, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.00024124905062716928, + "loss": 0.0192, "step": 151100 }, { - "epoch": 0.76, - "learning_rate": 0.00018564459086529002, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.0002412451624107978, + "loss": 0.0243, "step": 151110 }, { - "epoch": 0.76, - "learning_rate": 0.000185637023172276, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.00024124127419442636, + "loss": 0.0169, "step": 151120 }, { - "epoch": 0.76, - "learning_rate": 0.00018562945547926198, - "loss": 0.013, + "epoch": 0.39, + "learning_rate": 0.00024123738597805488, + "loss": 0.0246, "step": 151130 }, { - "epoch": 0.76, - "learning_rate": 0.000185621887786248, - "loss": 0.0111, + "epoch": 0.39, + "learning_rate": 0.00024123349776168342, + "loss": 0.0186, "step": 151140 }, { - "epoch": 0.76, - "learning_rate": 0.00018561432009323397, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024122960954531193, + "loss": 0.0216, "step": 151150 }, { - "epoch": 0.76, - "learning_rate": 0.00018560675240021995, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.0002412257213289405, + "loss": 0.0183, "step": 151160 }, { - "epoch": 0.76, - "learning_rate": 0.00018559918470720596, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.00024122183311256902, + "loss": 0.0175, "step": 151170 }, { - "epoch": 0.76, - "learning_rate": 0.00018559161701419194, - "loss": 0.0111, + "epoch": 0.39, + "learning_rate": 0.00024121794489619756, + "loss": 0.018, "step": 151180 }, { - "epoch": 0.76, - "learning_rate": 0.00018558404932117792, - "loss": 0.0192, + "epoch": 0.39, + "learning_rate": 0.00024121405667982607, + "loss": 0.02, "step": 151190 }, { - "epoch": 0.76, - "learning_rate": 0.00018557648162816393, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024121016846345464, + "loss": 0.0177, "step": 151200 }, { - "epoch": 0.76, - "learning_rate": 0.00018556891393514991, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024120628024708318, + "loss": 0.0233, "step": 151210 }, { - "epoch": 0.76, - "learning_rate": 0.0001855613462421359, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.0002412023920307117, + "loss": 0.0175, "step": 151220 }, { - "epoch": 0.76, - "learning_rate": 0.00018555377854912188, - "loss": 0.0104, + "epoch": 0.39, + "learning_rate": 0.00024119850381434024, + "loss": 0.0192, "step": 151230 }, { - "epoch": 0.76, - "learning_rate": 0.00018554621085610789, - "loss": 0.0143, + "epoch": 0.39, + "learning_rate": 0.00024119461559796878, + "loss": 0.0196, "step": 151240 }, { - "epoch": 0.76, - "learning_rate": 0.00018553864316309387, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024119072738159732, + "loss": 0.0199, "step": 151250 }, { - "epoch": 0.76, - "learning_rate": 0.00018553107547007985, - "loss": 0.0103, + "epoch": 0.39, + "learning_rate": 0.00024118683916522584, + "loss": 0.0207, "step": 151260 }, { - "epoch": 0.76, - "learning_rate": 0.00018552350777706586, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024118295094885438, + "loss": 0.0209, "step": 151270 }, { - "epoch": 0.76, - "learning_rate": 0.00018551594008405184, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.00024117906273248292, + "loss": 0.0185, "step": 151280 }, { - "epoch": 0.76, - "learning_rate": 0.00018550837239103782, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024117517451611146, + "loss": 0.0189, "step": 151290 }, { - "epoch": 0.76, - "learning_rate": 0.00018550080469802383, - "loss": 0.0121, + "epoch": 0.39, + "learning_rate": 0.00024117128629973998, + "loss": 0.0156, "step": 151300 }, { - "epoch": 0.76, - "learning_rate": 0.0001854932370050098, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024116739808336852, + "loss": 0.016, "step": 151310 }, { - "epoch": 0.76, - "learning_rate": 0.0001854856693119958, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.00024116350986699706, + "loss": 0.019, "step": 151320 }, { - "epoch": 0.76, - "learning_rate": 0.0001854781016189818, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.0002411596216506256, + "loss": 0.0172, "step": 151330 }, { - "epoch": 0.76, - "learning_rate": 0.00018547053392596778, - "loss": 0.0086, + "epoch": 0.39, + "learning_rate": 0.00024115573343425412, + "loss": 0.0229, "step": 151340 }, { - "epoch": 0.76, - "learning_rate": 0.00018546296623295376, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024115184521788266, + "loss": 0.0242, "step": 151350 }, { - "epoch": 0.76, - "learning_rate": 0.00018545539853993977, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024114795700151117, + "loss": 0.0291, "step": 151360 }, { - "epoch": 0.76, - "learning_rate": 0.00018544783084692575, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.00024114406878513974, + "loss": 0.0241, "step": 151370 }, { - "epoch": 0.76, - "learning_rate": 0.00018544026315391173, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024114018056876828, + "loss": 0.0215, "step": 151380 }, { - "epoch": 0.76, - "learning_rate": 0.00018543269546089774, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.0002411362923523968, + "loss": 0.0178, "step": 151390 }, { - "epoch": 0.76, - "learning_rate": 0.00018542512776788372, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002411324041360253, + "loss": 0.018, "step": 151400 }, { - "epoch": 0.76, - "learning_rate": 0.0001854175600748697, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.00024112851591965388, + "loss": 0.0203, "step": 151410 }, { - "epoch": 0.76, - "learning_rate": 0.0001854099923818557, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.00024112462770328242, + "loss": 0.0197, "step": 151420 }, { - "epoch": 0.76, - "learning_rate": 0.0001854024246888417, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024112073948691094, + "loss": 0.0217, "step": 151430 }, { - "epoch": 0.76, - "learning_rate": 0.00018539485699582768, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024111685127053948, + "loss": 0.0219, "step": 151440 }, { - "epoch": 0.76, - "learning_rate": 0.00018538728930281366, - "loss": 0.0111, + "epoch": 0.39, + "learning_rate": 0.00024111296305416802, + "loss": 0.0179, "step": 151450 }, { - "epoch": 0.76, - "learning_rate": 0.0001853797216097996, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.00024110907483779656, + "loss": 0.0168, "step": 151460 }, { - "epoch": 0.76, - "learning_rate": 0.00018537215391678562, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024110518662142508, + "loss": 0.0168, "step": 151470 }, { - "epoch": 0.76, - "learning_rate": 0.0001853645862237716, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024110129840505362, + "loss": 0.0189, "step": 151480 }, { - "epoch": 0.76, - "learning_rate": 0.00018535701853075758, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024109741018868216, + "loss": 0.022, "step": 151490 }, { - "epoch": 0.76, - "learning_rate": 0.0001853494508377436, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.0002410935219723107, + "loss": 0.0195, "step": 151500 }, { - "epoch": 0.76, - "learning_rate": 0.00018534188314472957, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024108963375593922, + "loss": 0.02, "step": 151510 }, { - "epoch": 0.76, - "learning_rate": 0.00018533431545171556, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024108574553956776, + "loss": 0.0189, "step": 151520 }, { - "epoch": 0.76, - "learning_rate": 0.00018532674775870156, - "loss": 0.0142, + "epoch": 0.39, + "learning_rate": 0.00024108185732319633, + "loss": 0.0182, "step": 151530 }, { - "epoch": 0.76, - "learning_rate": 0.00018531918006568755, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024107796910682484, + "loss": 0.0229, "step": 151540 }, { - "epoch": 0.76, - "learning_rate": 0.00018531161237267353, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024107408089045338, + "loss": 0.0214, "step": 151550 }, { - "epoch": 0.76, - "learning_rate": 0.00018530404467965954, - "loss": 0.0178, + "epoch": 0.39, + "learning_rate": 0.0002410701926740819, + "loss": 0.0196, "step": 151560 }, { - "epoch": 0.76, - "learning_rate": 0.00018529647698664552, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024106630445771047, + "loss": 0.0223, "step": 151570 }, { - "epoch": 0.76, - "learning_rate": 0.0001852889092936315, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024106241624133898, + "loss": 0.0199, "step": 151580 }, { - "epoch": 0.76, - "learning_rate": 0.0001852813416006175, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024105852802496752, + "loss": 0.0212, "step": 151590 }, { - "epoch": 0.76, - "learning_rate": 0.0001852737739076035, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024105463980859604, + "loss": 0.021, "step": 151600 }, { - "epoch": 0.76, - "learning_rate": 0.00018526620621458947, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024105075159222458, + "loss": 0.0213, "step": 151610 }, { - "epoch": 0.76, - "learning_rate": 0.00018525863852157545, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024104686337585312, + "loss": 0.0202, "step": 151620 }, { - "epoch": 0.76, - "learning_rate": 0.00018525107082856146, - "loss": 0.0166, + "epoch": 0.39, + "learning_rate": 0.00024104297515948166, + "loss": 0.0192, "step": 151630 }, { - "epoch": 0.77, - "learning_rate": 0.00018524350313554744, - "loss": 0.0127, + "epoch": 0.39, + "learning_rate": 0.00024103908694311018, + "loss": 0.0154, "step": 151640 }, { - "epoch": 0.77, - "learning_rate": 0.00018523593544253342, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024103519872673872, + "loss": 0.0175, "step": 151650 }, { - "epoch": 0.77, - "learning_rate": 0.00018522836774951943, - "loss": 0.0187, + "epoch": 0.39, + "learning_rate": 0.00024103131051036726, + "loss": 0.0204, "step": 151660 }, { - "epoch": 0.77, - "learning_rate": 0.0001852208000565054, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.0002410274222939958, + "loss": 0.0178, "step": 151670 }, { - "epoch": 0.77, - "learning_rate": 0.0001852132323634914, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024102353407762432, + "loss": 0.0204, "step": 151680 }, { - "epoch": 0.77, - "learning_rate": 0.0001852056646704774, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024101964586125286, + "loss": 0.0238, "step": 151690 }, { - "epoch": 0.77, - "learning_rate": 0.00018519809697746338, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024101575764488143, + "loss": 0.023, "step": 151700 }, { - "epoch": 0.77, - "learning_rate": 0.00018519052928444937, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024101186942850994, + "loss": 0.0191, "step": 151710 }, { - "epoch": 0.77, - "learning_rate": 0.00018518296159143537, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024100798121213845, + "loss": 0.0182, "step": 151720 }, { - "epoch": 0.77, - "learning_rate": 0.00018517539389842136, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.000241004092995767, + "loss": 0.0195, "step": 151730 }, { - "epoch": 0.77, - "learning_rate": 0.00018516782620540734, - "loss": 0.0099, + "epoch": 0.39, + "learning_rate": 0.00024100020477939557, + "loss": 0.022, "step": 151740 }, { - "epoch": 0.77, - "learning_rate": 0.00018516025851239335, - "loss": 0.0105, + "epoch": 0.39, + "learning_rate": 0.00024099631656302408, + "loss": 0.021, "step": 151750 }, { - "epoch": 0.77, - "learning_rate": 0.00018515269081937933, - "loss": 0.0139, + "epoch": 0.39, + "learning_rate": 0.00024099242834665262, + "loss": 0.0201, "step": 151760 }, { - "epoch": 0.77, - "learning_rate": 0.0001851451231263653, - "loss": 0.0109, + "epoch": 0.39, + "learning_rate": 0.00024098854013028114, + "loss": 0.0205, "step": 151770 }, { - "epoch": 0.77, - "learning_rate": 0.00018513755543335132, - "loss": 0.0135, + "epoch": 0.39, + "learning_rate": 0.0002409846519139097, + "loss": 0.0146, "step": 151780 }, { - "epoch": 0.77, - "learning_rate": 0.0001851299877403373, - "loss": 0.0145, + "epoch": 0.39, + "learning_rate": 0.00024098076369753822, + "loss": 0.0214, "step": 151790 }, { - "epoch": 0.77, - "learning_rate": 0.00018512242004732328, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024097687548116676, + "loss": 0.0181, "step": 151800 }, { - "epoch": 0.77, - "learning_rate": 0.00018511485235430926, - "loss": 0.018, + "epoch": 0.39, + "learning_rate": 0.00024097298726479528, + "loss": 0.021, "step": 151810 }, { - "epoch": 0.77, - "learning_rate": 0.00018510728466129527, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024096909904842384, + "loss": 0.0163, "step": 151820 }, { - "epoch": 0.77, - "learning_rate": 0.00018509971696828125, - "loss": 0.0104, + "epoch": 0.39, + "learning_rate": 0.00024096521083205236, + "loss": 0.0233, "step": 151830 }, { - "epoch": 0.77, - "learning_rate": 0.00018509214927526723, - "loss": 0.0141, + "epoch": 0.39, + "learning_rate": 0.0002409613226156809, + "loss": 0.0209, "step": 151840 }, { - "epoch": 0.77, - "learning_rate": 0.00018508458158225324, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024095743439930941, + "loss": 0.0198, "step": 151850 }, { - "epoch": 0.77, - "learning_rate": 0.00018507701388923922, - "loss": 0.0154, + "epoch": 0.39, + "learning_rate": 0.00024095354618293796, + "loss": 0.0184, "step": 151860 }, { - "epoch": 0.77, - "learning_rate": 0.0001850694461962252, - "loss": 0.0109, + "epoch": 0.39, + "learning_rate": 0.00024094965796656653, + "loss": 0.0179, "step": 151870 }, { - "epoch": 0.77, - "learning_rate": 0.0001850618785032112, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024094576975019504, + "loss": 0.0202, "step": 151880 }, { - "epoch": 0.77, - "learning_rate": 0.0001850543108101972, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024094188153382355, + "loss": 0.0237, "step": 151890 }, { - "epoch": 0.77, - "learning_rate": 0.00018504674311718318, - "loss": 0.0095, + "epoch": 0.39, + "learning_rate": 0.0002409379933174521, + "loss": 0.0259, "step": 151900 }, { - "epoch": 0.77, - "learning_rate": 0.00018503917542416918, - "loss": 0.0151, + "epoch": 0.39, + "learning_rate": 0.00024093410510108066, + "loss": 0.0211, "step": 151910 }, { - "epoch": 0.77, - "learning_rate": 0.00018503160773115517, - "loss": 0.0112, + "epoch": 0.39, + "learning_rate": 0.00024093021688470918, + "loss": 0.0242, "step": 151920 }, { - "epoch": 0.77, - "learning_rate": 0.00018502404003814115, - "loss": 0.0126, + "epoch": 0.39, + "learning_rate": 0.00024092632866833772, + "loss": 0.0167, "step": 151930 }, { - "epoch": 0.77, - "learning_rate": 0.00018501647234512716, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024092244045196624, + "loss": 0.0157, "step": 151940 }, { - "epoch": 0.77, - "learning_rate": 0.00018500890465211314, - "loss": 0.0118, + "epoch": 0.39, + "learning_rate": 0.0002409185522355948, + "loss": 0.0192, "step": 151950 }, { - "epoch": 0.77, - "learning_rate": 0.00018500133695909912, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024091466401922332, + "loss": 0.0178, "step": 151960 }, { - "epoch": 0.77, - "learning_rate": 0.0001849937692660851, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024091077580285186, + "loss": 0.0163, "step": 151970 }, { - "epoch": 0.77, - "learning_rate": 0.0001849862015730711, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.00024090688758648037, + "loss": 0.0229, "step": 151980 }, { - "epoch": 0.77, - "learning_rate": 0.0001849786338800571, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024090299937010894, + "loss": 0.0192, "step": 151990 }, { - "epoch": 0.77, - "learning_rate": 0.00018497106618704307, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024089911115373746, + "loss": 0.0169, "step": 152000 }, { - "epoch": 0.77, - "eval_cer": 0.914467344714786, - "eval_loss": 0.00894253607839346, - "eval_runtime": 116.687, - "eval_samples_per_second": 17.14, - "eval_steps_per_second": 4.285, + "epoch": 0.39, + "eval_cer": 0.8817950623608236, + "eval_loss": 0.013452214188873768, + "eval_runtime": 107.3551, + "eval_samples_per_second": 18.63, + "eval_steps_per_second": 4.657, "step": 152000 }, { - "epoch": 0.77, - "learning_rate": 0.00018496349849402908, - "loss": 0.0124, + "epoch": 0.39, + "learning_rate": 0.000240895222937366, + "loss": 0.0205, "step": 152010 }, { - "epoch": 0.77, - "learning_rate": 0.00018495593080101506, - "loss": 0.0146, + "epoch": 0.39, + "learning_rate": 0.00024089133472099451, + "loss": 0.0222, "step": 152020 }, { - "epoch": 0.77, - "learning_rate": 0.00018494836310800104, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.00024088744650462308, + "loss": 0.0189, "step": 152030 }, { - "epoch": 0.77, - "learning_rate": 0.00018494079541498705, - "loss": 0.014, + "epoch": 0.39, + "learning_rate": 0.0002408835582882516, + "loss": 0.0212, "step": 152040 }, { - "epoch": 0.77, - "learning_rate": 0.00018493322772197303, - "loss": 0.0096, + "epoch": 0.39, + "learning_rate": 0.00024087967007188014, + "loss": 0.0227, "step": 152050 }, { - "epoch": 0.77, - "learning_rate": 0.00018492566002895901, - "loss": 0.0149, + "epoch": 0.39, + "learning_rate": 0.00024087578185550865, + "loss": 0.0204, "step": 152060 }, { - "epoch": 0.77, - "learning_rate": 0.00018491809233594502, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.00024087189363913722, + "loss": 0.0189, "step": 152070 }, { - "epoch": 0.77, - "learning_rate": 0.000184910524642931, - "loss": 0.0122, + "epoch": 0.39, + "learning_rate": 0.00024086800542276576, + "loss": 0.018, "step": 152080 }, { - "epoch": 0.77, - "learning_rate": 0.00018490295694991699, - "loss": 0.0115, + "epoch": 0.39, + "learning_rate": 0.00024086411720639428, + "loss": 0.0217, "step": 152090 }, { - "epoch": 0.77, - "learning_rate": 0.000184895389256903, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.00024086022899002282, + "loss": 0.0205, "step": 152100 }, { - "epoch": 0.77, - "learning_rate": 0.00018488782156388898, - "loss": 0.0134, + "epoch": 0.39, + "learning_rate": 0.00024085634077365133, + "loss": 0.0212, "step": 152110 }, { - "epoch": 0.77, - "learning_rate": 0.00018488025387087496, - "loss": 0.0129, + "epoch": 0.39, + "learning_rate": 0.0002408524525572799, + "loss": 0.0205, "step": 152120 }, { - "epoch": 0.77, - "learning_rate": 0.00018487268617786094, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.00024084856434090842, + "loss": 0.0284, "step": 152130 }, { - "epoch": 0.77, - "learning_rate": 0.00018486511848484695, - "loss": 0.0098, + "epoch": 0.39, + "learning_rate": 0.00024084467612453696, + "loss": 0.0207, "step": 152140 }, { - "epoch": 0.77, - "learning_rate": 0.00018485755079183293, - "loss": 0.0128, + "epoch": 0.39, + "learning_rate": 0.00024084078790816547, + "loss": 0.0164, "step": 152150 }, { - "epoch": 0.77, - "learning_rate": 0.0001848499830988189, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.00024083689969179404, + "loss": 0.0189, "step": 152160 }, { - "epoch": 0.77, - "learning_rate": 0.00018484241540580492, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024083301147542256, + "loss": 0.0172, "step": 152170 }, { - "epoch": 0.77, - "learning_rate": 0.0001848348477127909, - "loss": 0.0114, + "epoch": 0.39, + "learning_rate": 0.0002408291232590511, + "loss": 0.0194, "step": 152180 }, { - "epoch": 0.77, - "learning_rate": 0.00018482728001977688, - "loss": 0.0113, + "epoch": 0.39, + "learning_rate": 0.00024082523504267961, + "loss": 0.0237, "step": 152190 }, { - "epoch": 0.77, - "learning_rate": 0.0001848197123267629, - "loss": 0.0161, + "epoch": 0.39, + "learning_rate": 0.00024082134682630818, + "loss": 0.0167, "step": 152200 }, { - "epoch": 0.77, - "learning_rate": 0.00018481214463374887, - "loss": 0.0161, + "epoch": 0.39, + "learning_rate": 0.0002408174586099367, + "loss": 0.0203, "step": 152210 }, { - "epoch": 0.77, - "learning_rate": 0.00018480457694073485, - "loss": 0.0136, + "epoch": 0.39, + "learning_rate": 0.00024081357039356524, + "loss": 0.0267, "step": 152220 }, { - "epoch": 0.77, - "learning_rate": 0.00018479700924772086, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024080968217719375, + "loss": 0.0219, "step": 152230 }, { - "epoch": 0.77, - "learning_rate": 0.00018478944155470684, - "loss": 0.0123, + "epoch": 0.39, + "learning_rate": 0.00024080579396082232, + "loss": 0.0188, "step": 152240 }, { - "epoch": 0.77, - "learning_rate": 0.00018478187386169282, - "loss": 0.0108, + "epoch": 0.39, + "learning_rate": 0.00024080190574445086, + "loss": 0.0183, "step": 152250 }, { - "epoch": 0.77, - "learning_rate": 0.00018477430616867883, - "loss": 0.0125, + "epoch": 0.39, + "learning_rate": 0.00024079801752807938, + "loss": 0.0217, "step": 152260 }, { - "epoch": 0.77, - "learning_rate": 0.00018476673847566481, - "loss": 0.012, + "epoch": 0.39, + "learning_rate": 0.00024079412931170792, + "loss": 0.0181, "step": 152270 }, { - "epoch": 0.77, - "learning_rate": 0.0001847591707826508, - "loss": 0.0111, + "epoch": 0.39, + "learning_rate": 0.00024079024109533646, + "loss": 0.0265, "step": 152280 }, { - "epoch": 0.77, - "learning_rate": 0.0001847516030896368, - "loss": 0.0152, + "epoch": 0.39, + "learning_rate": 0.000240786352878965, + "loss": 0.0199, "step": 152290 }, { - "epoch": 0.77, - "learning_rate": 0.00018474403539662279, - "loss": 0.0117, + "epoch": 0.39, + "learning_rate": 0.00024078246466259352, + "loss": 0.0238, "step": 152300 }, { - "epoch": 0.77, - "learning_rate": 0.00018473646770360877, - "loss": 0.0133, + "epoch": 0.39, + "learning_rate": 0.00024077857644622206, + "loss": 0.0163, "step": 152310 }, { - "epoch": 0.77, - "learning_rate": 0.00018472890001059475, - "loss": 0.0144, + "epoch": 0.39, + "learning_rate": 0.0002407746882298506, + "loss": 0.0183, "step": 152320 }, { - "epoch": 0.77, - "learning_rate": 0.00018472133231758076, - "loss": 0.0119, + "epoch": 0.39, + "learning_rate": 0.00024077080001347914, + "loss": 0.0213, "step": 152330 }, { - "epoch": 0.77, - "learning_rate": 0.00018471376462456674, - "loss": 0.0142, + "epoch": 0.39, + "learning_rate": 0.00024076691179710766, + "loss": 0.0185, "step": 152340 }, { - "epoch": 0.77, - "learning_rate": 0.00018470619693155272, - "loss": 0.0156, + "epoch": 0.39, + "learning_rate": 0.0002407630235807362, + "loss": 0.0202, "step": 152350 }, { - "epoch": 0.77, - "learning_rate": 0.00018469862923853873, - "loss": 0.0131, + "epoch": 0.39, + "learning_rate": 0.0002407591353643647, + "loss": 0.0177, "step": 152360 }, { - "epoch": 0.77, - "learning_rate": 0.0001846910615455247, - "loss": 0.0107, + "epoch": 0.39, + "learning_rate": 0.00024075524714799328, + "loss": 0.0156, "step": 152370 }, { - "epoch": 0.77, - "learning_rate": 0.0001846834938525107, - "loss": 0.0103, + "epoch": 0.39, + "learning_rate": 0.0002407513589316218, + "loss": 0.0207, "step": 152380 }, { - "epoch": 0.77, - "learning_rate": 0.0001846759261594967, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.00024074747071525034, + "loss": 0.0191, "step": 152390 }, { - "epoch": 0.77, - "learning_rate": 0.00018466835846648268, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024074358249887885, + "loss": 0.0239, "step": 152400 }, { - "epoch": 0.77, - "learning_rate": 0.00018466079077346866, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.00024073969428250742, + "loss": 0.0164, "step": 152410 }, { - "epoch": 0.77, - "learning_rate": 0.00018465322308045467, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00024073580606613596, + "loss": 0.0174, "step": 152420 }, { - "epoch": 0.77, - "learning_rate": 0.00018464565538744065, - "loss": 0.0164, + "epoch": 0.4, + "learning_rate": 0.00024073191784976448, + "loss": 0.0159, "step": 152430 }, { - "epoch": 0.77, - "learning_rate": 0.00018463808769442663, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.000240728029633393, + "loss": 0.018, "step": 152440 }, { - "epoch": 0.77, - "learning_rate": 0.00018463052000141264, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00024072414141702156, + "loss": 0.019, "step": 152450 }, { - "epoch": 0.77, - "learning_rate": 0.00018462295230839862, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.0002407202532006501, + "loss": 0.0291, "step": 152460 }, { - "epoch": 0.77, - "learning_rate": 0.0001846153846153846, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.00024071636498427862, + "loss": 0.0212, "step": 152470 }, { - "epoch": 0.77, - "learning_rate": 0.0001846078169223706, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00024071247676790716, + "loss": 0.021, "step": 152480 }, { - "epoch": 0.77, - "learning_rate": 0.0001846002492293566, - "loss": 0.0225, + "epoch": 0.4, + "learning_rate": 0.0002407085885515357, + "loss": 0.0197, "step": 152490 }, { - "epoch": 0.77, - "learning_rate": 0.00018459268153634258, - "loss": 0.0156, + "epoch": 0.4, + "learning_rate": 0.00024070470033516424, + "loss": 0.0184, "step": 152500 }, { - "epoch": 0.77, - "learning_rate": 0.00018458511384332856, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00024070081211879276, + "loss": 0.0204, "step": 152510 }, { - "epoch": 0.77, - "learning_rate": 0.00018457754615031457, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.0002406969239024213, + "loss": 0.0153, "step": 152520 }, { - "epoch": 0.77, - "learning_rate": 0.00018456997845730055, - "loss": 0.0178, + "epoch": 0.4, + "learning_rate": 0.00024069303568604984, + "loss": 0.0184, "step": 152530 }, { - "epoch": 0.77, - "learning_rate": 0.00018456241076428653, - "loss": 0.0088, + "epoch": 0.4, + "learning_rate": 0.00024068914746967838, + "loss": 0.019, "step": 152540 }, { - "epoch": 0.77, - "learning_rate": 0.00018455484307127254, - "loss": 0.0104, + "epoch": 0.4, + "learning_rate": 0.0002406852592533069, + "loss": 0.0198, "step": 152550 }, { - "epoch": 0.77, - "learning_rate": 0.00018454727537825852, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00024068137103693544, + "loss": 0.0248, "step": 152560 }, { - "epoch": 0.77, - "learning_rate": 0.0001845397076852445, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.000240677482820564, + "loss": 0.0158, "step": 152570 }, { - "epoch": 0.77, - "learning_rate": 0.0001845321399922305, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024067359460419252, + "loss": 0.0207, "step": 152580 }, { - "epoch": 0.77, - "learning_rate": 0.0001845245722992165, - "loss": 0.0107, + "epoch": 0.4, + "learning_rate": 0.00024066970638782104, + "loss": 0.0186, "step": 152590 }, { - "epoch": 0.77, - "learning_rate": 0.00018451700460620247, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024066581817144958, + "loss": 0.0234, "step": 152600 }, { - "epoch": 0.77, - "learning_rate": 0.00018450943691318848, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.0002406619299550781, + "loss": 0.0202, "step": 152610 }, { - "epoch": 0.77, - "learning_rate": 0.00018450186922017446, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00024065804173870666, + "loss": 0.0223, "step": 152620 }, { - "epoch": 0.77, - "learning_rate": 0.00018449430152716044, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.0002406541535223352, + "loss": 0.0205, "step": 152630 }, { - "epoch": 0.77, - "learning_rate": 0.00018448673383414643, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00024065026530596372, + "loss": 0.0279, "step": 152640 }, { - "epoch": 0.77, - "learning_rate": 0.00018447916614113243, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00024064637708959226, + "loss": 0.0212, "step": 152650 }, { - "epoch": 0.77, - "learning_rate": 0.00018447159844811842, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.0002406424888732208, + "loss": 0.0202, "step": 152660 }, { - "epoch": 0.77, - "learning_rate": 0.0001844640307551044, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00024063860065684934, + "loss": 0.0184, "step": 152670 }, { - "epoch": 0.77, - "learning_rate": 0.0001844564630620904, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024063471244047786, + "loss": 0.0209, "step": 152680 }, { - "epoch": 0.77, - "learning_rate": 0.0001844488953690764, - "loss": 0.0152, + "epoch": 0.4, + "learning_rate": 0.0002406308242241064, + "loss": 0.0185, "step": 152690 }, { - "epoch": 0.77, - "learning_rate": 0.00018444132767606237, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00024062693600773494, + "loss": 0.0199, "step": 152700 }, { - "epoch": 0.77, - "learning_rate": 0.00018443375998304838, - "loss": 0.01, + "epoch": 0.4, + "learning_rate": 0.00024062304779136348, + "loss": 0.0249, "step": 152710 }, { - "epoch": 0.77, - "learning_rate": 0.00018442619229003433, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.000240619159574992, + "loss": 0.0193, "step": 152720 }, { - "epoch": 0.77, - "learning_rate": 0.0001844186245970203, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00024061527135862054, + "loss": 0.0219, "step": 152730 }, { - "epoch": 0.77, - "learning_rate": 0.0001844110569040063, - "loss": 0.0171, + "epoch": 0.4, + "learning_rate": 0.0002406113831422491, + "loss": 0.0218, "step": 152740 }, { - "epoch": 0.77, - "learning_rate": 0.0001844034892109923, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00024060749492587762, + "loss": 0.0188, "step": 152750 }, { - "epoch": 0.77, - "learning_rate": 0.00018439592151797828, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00024060360670950613, + "loss": 0.0164, "step": 152760 }, { - "epoch": 0.77, - "learning_rate": 0.00018438835382496427, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00024059971849313468, + "loss": 0.0167, "step": 152770 }, { - "epoch": 0.77, - "learning_rate": 0.00018438078613195027, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00024059583027676325, + "loss": 0.018, "step": 152780 }, { - "epoch": 0.77, - "learning_rate": 0.00018437321843893626, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024059194206039176, + "loss": 0.021, "step": 152790 }, { - "epoch": 0.77, - "learning_rate": 0.00018436565074592224, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.0002405880538440203, + "loss": 0.0228, "step": 152800 }, { - "epoch": 0.77, - "learning_rate": 0.00018435808305290825, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024058416562764882, + "loss": 0.019, "step": 152810 }, { - "epoch": 0.77, - "learning_rate": 0.00018435051535989423, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00024058027741127738, + "loss": 0.0181, "step": 152820 }, { - "epoch": 0.77, - "learning_rate": 0.0001843429476668802, - "loss": 0.0105, + "epoch": 0.4, + "learning_rate": 0.0002405763891949059, + "loss": 0.0261, "step": 152830 }, { - "epoch": 0.77, - "learning_rate": 0.00018433537997386622, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.00024057250097853444, + "loss": 0.0174, "step": 152840 }, { - "epoch": 0.77, - "learning_rate": 0.0001843278122808522, - "loss": 0.0186, + "epoch": 0.4, + "learning_rate": 0.00024056861276216296, + "loss": 0.0172, "step": 152850 }, { - "epoch": 0.77, - "learning_rate": 0.00018432024458783818, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.0002405647245457915, + "loss": 0.0236, "step": 152860 }, { - "epoch": 0.77, - "learning_rate": 0.00018431267689482416, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00024056083632942004, + "loss": 0.0173, "step": 152870 }, { - "epoch": 0.77, - "learning_rate": 0.00018430510920181017, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024055694811304858, + "loss": 0.0189, "step": 152880 }, { - "epoch": 0.77, - "learning_rate": 0.00018429754150879615, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.0002405530598966771, + "loss": 0.0164, "step": 152890 }, { - "epoch": 0.77, - "learning_rate": 0.00018428997381578213, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00024054917168030564, + "loss": 0.0164, "step": 152900 }, { - "epoch": 0.77, - "learning_rate": 0.00018428240612276814, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00024054528346393418, + "loss": 0.0195, "step": 152910 }, { - "epoch": 0.77, - "learning_rate": 0.00018427483842975412, - "loss": 0.0119, + "epoch": 0.4, + "learning_rate": 0.00024054139524756272, + "loss": 0.0188, "step": 152920 }, { - "epoch": 0.77, - "learning_rate": 0.0001842672707367401, - "loss": 0.0155, + "epoch": 0.4, + "learning_rate": 0.00024053750703119123, + "loss": 0.0208, "step": 152930 }, { - "epoch": 0.77, - "learning_rate": 0.0001842597030437261, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00024053361881481978, + "loss": 0.0192, "step": 152940 }, { - "epoch": 0.77, - "learning_rate": 0.0001842521353507121, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024052973059844834, + "loss": 0.0201, "step": 152950 }, { - "epoch": 0.77, - "learning_rate": 0.00018424456765769808, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024052584238207686, + "loss": 0.0238, "step": 152960 }, { - "epoch": 0.77, - "learning_rate": 0.00018423699996468408, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.0002405219541657054, + "loss": 0.0199, "step": 152970 }, { - "epoch": 0.77, - "learning_rate": 0.00018422943227167007, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00024051806594933392, + "loss": 0.0242, "step": 152980 }, { - "epoch": 0.77, - "learning_rate": 0.00018422186457865605, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024051417773296248, + "loss": 0.0164, "step": 152990 }, { - "epoch": 0.77, - "learning_rate": 0.00018421429688564206, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.000240510289516591, + "loss": 0.0165, "step": 153000 }, { - "epoch": 0.77, - "eval_cer": 0.9144702559031622, - "eval_loss": 0.008783689700067043, - "eval_runtime": 116.6617, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.4, + "eval_cer": 0.881782465628416, + "eval_loss": 0.013410561718046665, + "eval_runtime": 107.4393, + "eval_samples_per_second": 18.615, + "eval_steps_per_second": 4.654, "step": 153000 }, { - "epoch": 0.77, - "learning_rate": 0.00018420672919262804, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00024050640130021954, + "loss": 0.0188, "step": 153010 }, { - "epoch": 0.77, - "learning_rate": 0.00018419916149961402, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.00024050251308384805, + "loss": 0.0178, "step": 153020 }, { - "epoch": 0.77, - "learning_rate": 0.0001841915938066, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024049862486747662, + "loss": 0.0191, "step": 153030 }, { - "epoch": 0.77, - "learning_rate": 0.000184184026113586, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00024049473665110514, + "loss": 0.0207, "step": 153040 }, { - "epoch": 0.77, - "learning_rate": 0.000184176458420572, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00024049084843473368, + "loss": 0.0182, "step": 153050 }, { - "epoch": 0.77, - "learning_rate": 0.00018416889072755797, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.0002404869602183622, + "loss": 0.0223, "step": 153060 }, { - "epoch": 0.77, - "learning_rate": 0.00018416132303454398, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024048307200199076, + "loss": 0.0171, "step": 153070 }, { - "epoch": 0.77, - "learning_rate": 0.00018415375534152996, - "loss": 0.0151, + "epoch": 0.4, + "learning_rate": 0.00024047918378561928, + "loss": 0.0201, "step": 153080 }, { - "epoch": 0.77, - "learning_rate": 0.00018414618764851594, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024047529556924782, + "loss": 0.0197, "step": 153090 }, { - "epoch": 0.77, - "learning_rate": 0.00018413861995550195, - "loss": 0.0153, + "epoch": 0.4, + "learning_rate": 0.00024047140735287633, + "loss": 0.0207, "step": 153100 }, { - "epoch": 0.77, - "learning_rate": 0.00018413105226248793, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024046751913650488, + "loss": 0.0221, "step": 153110 }, { - "epoch": 0.77, - "learning_rate": 0.00018412348456947391, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00024046363092013344, + "loss": 0.0176, "step": 153120 }, { - "epoch": 0.77, - "learning_rate": 0.00018411591687645992, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00024045974270376196, + "loss": 0.0261, "step": 153130 }, { - "epoch": 0.77, - "learning_rate": 0.0001841083491834459, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.0002404558544873905, + "loss": 0.019, "step": 153140 }, { - "epoch": 0.77, - "learning_rate": 0.00018410078149043189, - "loss": 0.0183, + "epoch": 0.4, + "learning_rate": 0.00024045196627101901, + "loss": 0.0173, "step": 153150 }, { - "epoch": 0.77, - "learning_rate": 0.0001840932137974179, - "loss": 0.0155, + "epoch": 0.4, + "learning_rate": 0.00024044807805464758, + "loss": 0.0199, "step": 153160 }, { - "epoch": 0.77, - "learning_rate": 0.00018408564610440388, - "loss": 0.016, + "epoch": 0.4, + "learning_rate": 0.0002404441898382761, + "loss": 0.0196, "step": 153170 }, { - "epoch": 0.77, - "learning_rate": 0.00018407807841138986, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024044030162190464, + "loss": 0.016, "step": 153180 }, { - "epoch": 0.77, - "learning_rate": 0.00018407051071837584, - "loss": 0.0181, + "epoch": 0.4, + "learning_rate": 0.00024043641340553315, + "loss": 0.0148, "step": 153190 }, { - "epoch": 0.77, - "learning_rate": 0.00018406294302536185, - "loss": 0.0173, + "epoch": 0.4, + "learning_rate": 0.00024043252518916172, + "loss": 0.0197, "step": 153200 }, { - "epoch": 0.77, - "learning_rate": 0.00018405537533234783, - "loss": 0.018, + "epoch": 0.4, + "learning_rate": 0.00024042863697279024, + "loss": 0.0213, "step": 153210 }, { - "epoch": 0.77, - "learning_rate": 0.0001840478076393338, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00024042474875641878, + "loss": 0.0198, "step": 153220 }, { - "epoch": 0.77, - "learning_rate": 0.00018404023994631982, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.0002404208605400473, + "loss": 0.0205, "step": 153230 }, { - "epoch": 0.77, - "learning_rate": 0.0001840326722533058, - "loss": 0.015, + "epoch": 0.4, + "learning_rate": 0.00024041697232367586, + "loss": 0.0238, "step": 153240 }, { - "epoch": 0.77, - "learning_rate": 0.00018402510456029178, - "loss": 0.0151, + "epoch": 0.4, + "learning_rate": 0.00024041308410730438, + "loss": 0.0233, "step": 153250 }, { - "epoch": 0.77, - "learning_rate": 0.0001840175368672778, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024040919589093292, + "loss": 0.0198, "step": 153260 }, { - "epoch": 0.77, - "learning_rate": 0.00018400996917426377, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00024040530767456143, + "loss": 0.0196, "step": 153270 }, { - "epoch": 0.77, - "learning_rate": 0.00018400240148124975, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.00024040141945819, + "loss": 0.0206, "step": 153280 }, { - "epoch": 0.77, - "learning_rate": 0.00018399483378823576, - "loss": 0.0156, + "epoch": 0.4, + "learning_rate": 0.00024039753124181854, + "loss": 0.0193, "step": 153290 }, { - "epoch": 0.77, - "learning_rate": 0.00018398726609522174, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00024039364302544706, + "loss": 0.0203, "step": 153300 }, { - "epoch": 0.77, - "learning_rate": 0.00018397969840220772, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024038975480907557, + "loss": 0.0212, "step": 153310 }, { - "epoch": 0.77, - "learning_rate": 0.00018397213070919373, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024038586659270414, + "loss": 0.0184, "step": 153320 }, { - "epoch": 0.77, - "learning_rate": 0.00018396456301617971, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00024038197837633268, + "loss": 0.0194, "step": 153330 }, { - "epoch": 0.77, - "learning_rate": 0.0001839569953231657, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.0002403780901599612, + "loss": 0.016, "step": 153340 }, { - "epoch": 0.77, - "learning_rate": 0.0001839494276301517, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00024037420194358974, + "loss": 0.0182, "step": 153350 }, { - "epoch": 0.77, - "learning_rate": 0.00018394185993713769, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.00024037031372721825, + "loss": 0.0208, "step": 153360 }, { - "epoch": 0.77, - "learning_rate": 0.00018393429224412367, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00024036642551084682, + "loss": 0.0207, "step": 153370 }, { - "epoch": 0.77, - "learning_rate": 0.00018392672455110965, - "loss": 0.0106, + "epoch": 0.4, + "learning_rate": 0.00024036253729447534, + "loss": 0.0435, "step": 153380 }, { - "epoch": 0.77, - "learning_rate": 0.00018391915685809566, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00024035864907810388, + "loss": 0.0195, "step": 153390 }, { - "epoch": 0.77, - "learning_rate": 0.00018391158916508164, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.0002403547608617324, + "loss": 0.0639, "step": 153400 }, { - "epoch": 0.77, - "learning_rate": 0.00018390402147206762, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024035087264536096, + "loss": 0.0275, "step": 153410 }, { - "epoch": 0.77, - "learning_rate": 0.00018389645377905363, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024034698442898948, + "loss": 0.0176, "step": 153420 }, { - "epoch": 0.77, - "learning_rate": 0.0001838888860860396, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00024034309621261802, + "loss": 0.0191, "step": 153430 }, { - "epoch": 0.77, - "learning_rate": 0.0001838813183930256, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00024033920799624653, + "loss": 0.0187, "step": 153440 }, { - "epoch": 0.77, - "learning_rate": 0.0001838737507000116, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.0002403353197798751, + "loss": 0.0221, "step": 153450 }, { - "epoch": 0.77, - "learning_rate": 0.00018386618300699758, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00024033143156350364, + "loss": 0.0181, "step": 153460 }, { - "epoch": 0.77, - "learning_rate": 0.00018385861531398356, - "loss": 0.0088, + "epoch": 0.4, + "learning_rate": 0.00024032754334713216, + "loss": 0.02, "step": 153470 }, { - "epoch": 0.77, - "learning_rate": 0.00018385104762096957, - "loss": 0.0178, + "epoch": 0.4, + "learning_rate": 0.00024032365513076067, + "loss": 0.0193, "step": 153480 }, { - "epoch": 0.77, - "learning_rate": 0.00018384347992795555, - "loss": 0.017, + "epoch": 0.4, + "learning_rate": 0.00024031976691438924, + "loss": 0.0174, "step": 153490 }, { - "epoch": 0.77, - "learning_rate": 0.00018383591223494153, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00024031587869801778, + "loss": 0.0208, "step": 153500 }, { - "epoch": 0.77, - "learning_rate": 0.00018382834454192754, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.0002403119904816463, + "loss": 0.0218, "step": 153510 }, { - "epoch": 0.77, - "learning_rate": 0.00018382077684891352, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024030810226527484, + "loss": 0.0221, "step": 153520 }, { - "epoch": 0.77, - "learning_rate": 0.0001838132091558995, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00024030421404890338, + "loss": 0.0238, "step": 153530 }, { - "epoch": 0.77, - "learning_rate": 0.0001838056414628855, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00024030032583253192, + "loss": 0.0215, "step": 153540 }, { - "epoch": 0.77, - "learning_rate": 0.0001837980737698715, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024029643761616044, + "loss": 0.0229, "step": 153550 }, { - "epoch": 0.77, - "learning_rate": 0.00018379050607685748, - "loss": 0.0107, + "epoch": 0.4, + "learning_rate": 0.00024029254939978898, + "loss": 0.0206, "step": 153560 }, { - "epoch": 0.77, - "learning_rate": 0.00018378293838384346, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.00024028866118341752, + "loss": 0.0204, "step": 153570 }, { - "epoch": 0.77, - "learning_rate": 0.00018377537069082947, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024028477296704606, + "loss": 0.0187, "step": 153580 }, { - "epoch": 0.77, - "learning_rate": 0.00018376780299781545, - "loss": 0.0098, + "epoch": 0.4, + "learning_rate": 0.00024028088475067458, + "loss": 0.0206, "step": 153590 }, { - "epoch": 0.77, - "learning_rate": 0.00018376023530480143, - "loss": 0.0156, + "epoch": 0.4, + "learning_rate": 0.00024027699653430312, + "loss": 0.0372, "step": 153600 }, { - "epoch": 0.77, - "learning_rate": 0.00018375266761178744, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00024027310831793163, + "loss": 0.0185, "step": 153610 }, { - "epoch": 0.78, - "learning_rate": 0.00018374509991877342, - "loss": 0.0095, + "epoch": 0.4, + "learning_rate": 0.0002402692201015602, + "loss": 0.0205, "step": 153620 }, { - "epoch": 0.78, - "learning_rate": 0.0001837375322257594, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.00024026533188518872, + "loss": 0.0197, "step": 153630 }, { - "epoch": 0.78, - "learning_rate": 0.0001837299645327454, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024026144366881726, + "loss": 0.0178, "step": 153640 }, { - "epoch": 0.78, - "learning_rate": 0.0001837223968397314, - "loss": 0.0146, + "epoch": 0.4, + "learning_rate": 0.00024025755545244577, + "loss": 0.0201, "step": 153650 }, { - "epoch": 0.78, - "learning_rate": 0.00018371482914671737, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00024025366723607434, + "loss": 0.0194, "step": 153660 }, { - "epoch": 0.78, - "learning_rate": 0.00018370726145370338, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00024024977901970288, + "loss": 0.0182, "step": 153670 }, { - "epoch": 0.78, - "learning_rate": 0.00018369969376068936, - "loss": 0.0119, + "epoch": 0.4, + "learning_rate": 0.0002402458908033314, + "loss": 0.0262, "step": 153680 }, { - "epoch": 0.78, - "learning_rate": 0.00018369212606767534, - "loss": 0.0089, + "epoch": 0.4, + "learning_rate": 0.00024024200258695994, + "loss": 0.0213, "step": 153690 }, { - "epoch": 0.78, - "learning_rate": 0.00018368455837466133, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024023811437058848, + "loss": 0.019, "step": 153700 }, { - "epoch": 0.78, - "learning_rate": 0.00018367699068164733, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.00024023422615421702, + "loss": 0.019, "step": 153710 }, { - "epoch": 0.78, - "learning_rate": 0.00018366942298863332, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00024023033793784554, + "loss": 0.0234, "step": 153720 }, { - "epoch": 0.78, - "learning_rate": 0.0001836618552956193, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00024022644972147408, + "loss": 0.02, "step": 153730 }, { - "epoch": 0.78, - "learning_rate": 0.0001836542876026053, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024022256150510262, + "loss": 0.0206, "step": 153740 }, { - "epoch": 0.78, - "learning_rate": 0.0001836467199095913, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00024021867328873116, + "loss": 0.0197, "step": 153750 }, { - "epoch": 0.78, - "learning_rate": 0.00018363915221657727, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00024021478507235968, + "loss": 0.0168, "step": 153760 }, { - "epoch": 0.78, - "learning_rate": 0.00018363158452356328, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024021089685598822, + "loss": 0.0201, "step": 153770 }, { - "epoch": 0.78, - "learning_rate": 0.00018362401683054926, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00024020700863961676, + "loss": 0.0204, "step": 153780 }, { - "epoch": 0.78, - "learning_rate": 0.00018361644913753524, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.0002402031204232453, + "loss": 0.015, "step": 153790 }, { - "epoch": 0.78, - "learning_rate": 0.00018360888144452125, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00024019923220687381, + "loss": 0.0151, "step": 153800 }, { - "epoch": 0.78, - "learning_rate": 0.00018360131375150723, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00024019534399050236, + "loss": 0.0208, "step": 153810 }, { - "epoch": 0.78, - "learning_rate": 0.0001835937460584932, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.00024019145577413092, + "loss": 0.0139, "step": 153820 }, { - "epoch": 0.78, - "learning_rate": 0.00018358617836547922, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00024018756755775944, + "loss": 0.0166, "step": 153830 }, { - "epoch": 0.78, - "learning_rate": 0.0001835786106724652, - "loss": 0.0104, + "epoch": 0.4, + "learning_rate": 0.00024018367934138798, + "loss": 0.023, "step": 153840 }, { - "epoch": 0.78, - "learning_rate": 0.00018357104297945118, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.0002401797911250165, + "loss": 0.0191, "step": 153850 }, { - "epoch": 0.78, - "learning_rate": 0.0001835634752864372, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00024017590290864504, + "loss": 0.0244, "step": 153860 }, { - "epoch": 0.78, - "learning_rate": 0.00018355590759342317, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00024017201469227358, + "loss": 0.0241, "step": 153870 }, { - "epoch": 0.78, - "learning_rate": 0.00018354833990040915, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00024016812647590212, + "loss": 0.0162, "step": 153880 }, { - "epoch": 0.78, - "learning_rate": 0.00018354077220739514, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00024016423825953063, + "loss": 0.0162, "step": 153890 }, { - "epoch": 0.78, - "learning_rate": 0.00018353320451438114, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024016035004315918, + "loss": 0.0184, "step": 153900 }, { - "epoch": 0.78, - "learning_rate": 0.00018352563682136713, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00024015646182678772, + "loss": 0.0183, "step": 153910 }, { - "epoch": 0.78, - "learning_rate": 0.0001835180691283531, - "loss": 0.01, + "epoch": 0.4, + "learning_rate": 0.00024015257361041626, + "loss": 0.0175, "step": 153920 }, { - "epoch": 0.78, - "learning_rate": 0.00018351050143533912, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00024014868539404477, + "loss": 0.017, "step": 153930 }, { - "epoch": 0.78, - "learning_rate": 0.0001835029337423251, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024014479717767332, + "loss": 0.02, "step": 153940 }, { - "epoch": 0.78, - "learning_rate": 0.00018349536604931108, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024014090896130186, + "loss": 0.0201, "step": 153950 }, { - "epoch": 0.78, - "learning_rate": 0.0001834877983562971, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.0002401370207449304, + "loss": 0.0263, "step": 153960 }, { - "epoch": 0.78, - "learning_rate": 0.00018348023066328304, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00024013313252855891, + "loss": 0.0175, "step": 153970 }, { - "epoch": 0.78, - "learning_rate": 0.00018347266297026902, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00024012924431218746, + "loss": 0.0172, "step": 153980 }, { - "epoch": 0.78, - "learning_rate": 0.000183465095277255, - "loss": 0.0096, + "epoch": 0.4, + "learning_rate": 0.00024012535609581602, + "loss": 0.0157, "step": 153990 }, { - "epoch": 0.78, - "learning_rate": 0.000183457527584241, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00024012146787944454, + "loss": 0.0188, "step": 154000 }, { - "epoch": 0.78, - "eval_cer": 0.9144789894682909, - "eval_loss": 0.008818663656711578, - "eval_runtime": 116.7061, - "eval_samples_per_second": 17.137, - "eval_steps_per_second": 4.284, + "epoch": 0.4, + "eval_cer": 0.881782465628416, + "eval_loss": 0.013507870957255363, + "eval_runtime": 107.4654, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, "step": 154000 }, { - "epoch": 0.78, - "learning_rate": 0.000183449959891227, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024011757966307308, + "loss": 0.0161, "step": 154010 }, { - "epoch": 0.78, - "learning_rate": 0.00018344239219821298, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.0002401136914467016, + "loss": 0.0192, "step": 154020 }, { - "epoch": 0.78, - "learning_rate": 0.00018343482450519898, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00024010980323033016, + "loss": 0.028, "step": 154030 }, { - "epoch": 0.78, - "learning_rate": 0.00018342725681218497, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024010591501395868, + "loss": 0.0159, "step": 154040 }, { - "epoch": 0.78, - "learning_rate": 0.00018341968911917095, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00024010202679758722, + "loss": 0.0208, "step": 154050 }, { - "epoch": 0.78, - "learning_rate": 0.00018341212142615696, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00024009813858121573, + "loss": 0.0195, "step": 154060 }, { - "epoch": 0.78, - "learning_rate": 0.00018340455373314294, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.0002400942503648443, + "loss": 0.0249, "step": 154070 }, { - "epoch": 0.78, - "learning_rate": 0.00018339698604012892, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00024009036214847282, + "loss": 0.018, "step": 154080 }, { - "epoch": 0.78, - "learning_rate": 0.0001833894183471149, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00024008647393210136, + "loss": 0.0182, "step": 154090 }, { - "epoch": 0.78, - "learning_rate": 0.0001833818506541009, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.00024008258571572987, + "loss": 0.0196, "step": 154100 }, { - "epoch": 0.78, - "learning_rate": 0.0001833742829610869, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00024007869749935842, + "loss": 0.0205, "step": 154110 }, { - "epoch": 0.78, - "learning_rate": 0.00018336671526807287, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00024007480928298696, + "loss": 0.0203, "step": 154120 }, { - "epoch": 0.78, - "learning_rate": 0.00018335914757505888, - "loss": 0.0153, + "epoch": 0.4, + "learning_rate": 0.0002400709210666155, + "loss": 0.0191, "step": 154130 }, { - "epoch": 0.78, - "learning_rate": 0.00018335157988204486, - "loss": 0.0163, + "epoch": 0.4, + "learning_rate": 0.000240067032850244, + "loss": 0.0156, "step": 154140 }, { - "epoch": 0.78, - "learning_rate": 0.00018334401218903084, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00024006314463387255, + "loss": 0.0186, "step": 154150 }, { - "epoch": 0.78, - "learning_rate": 0.00018333644449601685, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00024005925641750112, + "loss": 0.0222, "step": 154160 }, { - "epoch": 0.78, - "learning_rate": 0.00018332887680300283, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00024005536820112964, + "loss": 0.0201, "step": 154170 }, { - "epoch": 0.78, - "learning_rate": 0.00018332130910998881, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00024005147998475815, + "loss": 0.0195, "step": 154180 }, { - "epoch": 0.78, - "learning_rate": 0.00018331374141697482, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.0002400475917683867, + "loss": 0.0205, "step": 154190 }, { - "epoch": 0.78, - "learning_rate": 0.0001833061737239608, - "loss": 0.0103, + "epoch": 0.4, + "learning_rate": 0.00024004370355201526, + "loss": 0.0156, "step": 154200 }, { - "epoch": 0.78, - "learning_rate": 0.00018329860603094679, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024003981533564378, + "loss": 0.0213, "step": 154210 }, { - "epoch": 0.78, - "learning_rate": 0.0001832910383379328, - "loss": 0.0098, + "epoch": 0.4, + "learning_rate": 0.00024003592711927232, + "loss": 0.0216, "step": 154220 }, { - "epoch": 0.78, - "learning_rate": 0.00018328347064491878, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00024003203890290083, + "loss": 0.0215, "step": 154230 }, { - "epoch": 0.78, - "learning_rate": 0.00018327590295190476, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.0002400281506865294, + "loss": 0.0162, "step": 154240 }, { - "epoch": 0.78, - "learning_rate": 0.00018326833525889077, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00024002426247015792, + "loss": 0.0188, "step": 154250 }, { - "epoch": 0.78, - "learning_rate": 0.00018326076756587675, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00024002037425378646, + "loss": 0.0197, "step": 154260 }, { - "epoch": 0.78, - "learning_rate": 0.00018325319987286273, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00024001648603741497, + "loss": 0.0243, "step": 154270 }, { - "epoch": 0.78, - "learning_rate": 0.0001832456321798487, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00024001259782104354, + "loss": 0.0184, "step": 154280 }, { - "epoch": 0.78, - "learning_rate": 0.00018323806448683472, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00024000870960467206, + "loss": 0.0182, "step": 154290 }, { - "epoch": 0.78, - "learning_rate": 0.0001832304967938207, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.0002400048213883006, + "loss": 0.0213, "step": 154300 }, { - "epoch": 0.78, - "learning_rate": 0.00018322292910080668, - "loss": 0.0166, + "epoch": 0.4, + "learning_rate": 0.0002400009331719291, + "loss": 0.0192, "step": 154310 }, { - "epoch": 0.78, - "learning_rate": 0.0001832153614077927, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00023999704495555768, + "loss": 0.0196, "step": 154320 }, { - "epoch": 0.78, - "learning_rate": 0.00018320779371477867, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00023999315673918622, + "loss": 0.0177, "step": 154330 }, { - "epoch": 0.78, - "learning_rate": 0.00018320022602176465, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00023998926852281474, + "loss": 0.02, "step": 154340 }, { - "epoch": 0.78, - "learning_rate": 0.00018319265832875066, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00023998538030644325, + "loss": 0.019, "step": 154350 }, { - "epoch": 0.78, - "learning_rate": 0.00018318509063573664, - "loss": 0.0096, + "epoch": 0.4, + "learning_rate": 0.0002399814920900718, + "loss": 0.0291, "step": 154360 }, { - "epoch": 0.78, - "learning_rate": 0.00018317752294272262, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023997760387370036, + "loss": 0.0213, "step": 154370 }, { - "epoch": 0.78, - "learning_rate": 0.00018316995524970863, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00023997371565732888, + "loss": 0.0187, "step": 154380 }, { - "epoch": 0.78, - "learning_rate": 0.00018316238755669461, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00023996982744095742, + "loss": 0.0168, "step": 154390 }, { - "epoch": 0.78, - "learning_rate": 0.0001831548198636806, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023996593922458593, + "loss": 0.0206, "step": 154400 }, { - "epoch": 0.78, - "learning_rate": 0.0001831472521706666, - "loss": 0.0094, + "epoch": 0.4, + "learning_rate": 0.0002399620510082145, + "loss": 0.0189, "step": 154410 }, { - "epoch": 0.78, - "learning_rate": 0.00018313968447765259, - "loss": 0.0119, + "epoch": 0.4, + "learning_rate": 0.00023995816279184302, + "loss": 0.0188, "step": 154420 }, { - "epoch": 0.78, - "learning_rate": 0.00018313211678463857, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023995427457547156, + "loss": 0.0177, "step": 154430 }, { - "epoch": 0.78, - "learning_rate": 0.00018312454909162455, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00023995038635910007, + "loss": 0.0221, "step": 154440 }, { - "epoch": 0.78, - "learning_rate": 0.00018311698139861056, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00023994649814272864, + "loss": 0.0184, "step": 154450 }, { - "epoch": 0.78, - "learning_rate": 0.00018310941370559654, - "loss": 0.0107, + "epoch": 0.4, + "learning_rate": 0.00023994260992635716, + "loss": 0.0169, "step": 154460 }, { - "epoch": 0.78, - "learning_rate": 0.00018310184601258252, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.0002399387217099857, + "loss": 0.0225, "step": 154470 }, { - "epoch": 0.78, - "learning_rate": 0.00018309427831956853, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.0002399348334936142, + "loss": 0.018, "step": 154480 }, { - "epoch": 0.78, - "learning_rate": 0.0001830867106265545, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.00023993094527724278, + "loss": 0.0175, "step": 154490 }, { - "epoch": 0.78, - "learning_rate": 0.0001830791429335405, - "loss": 0.0103, + "epoch": 0.4, + "learning_rate": 0.0002399270570608713, + "loss": 0.018, "step": 154500 }, { - "epoch": 0.78, - "learning_rate": 0.0001830715752405265, - "loss": 0.0175, + "epoch": 0.4, + "learning_rate": 0.00023992316884449984, + "loss": 0.0172, "step": 154510 }, { - "epoch": 0.78, - "learning_rate": 0.00018306400754751248, - "loss": 0.0152, + "epoch": 0.4, + "learning_rate": 0.00023991928062812835, + "loss": 0.0216, "step": 154520 }, { - "epoch": 0.78, - "learning_rate": 0.00018305643985449846, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00023991539241175692, + "loss": 0.0176, "step": 154530 }, { - "epoch": 0.78, - "learning_rate": 0.00018304887216148447, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023991150419538546, + "loss": 0.0216, "step": 154540 }, { - "epoch": 0.78, - "learning_rate": 0.00018304130446847045, - "loss": 0.0145, + "epoch": 0.4, + "learning_rate": 0.00023990761597901398, + "loss": 0.0204, "step": 154550 }, { - "epoch": 0.78, - "learning_rate": 0.00018303373677545643, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00023990372776264252, + "loss": 0.0187, "step": 154560 }, { - "epoch": 0.78, - "learning_rate": 0.00018302616908244244, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023989983954627106, + "loss": 0.0179, "step": 154570 }, { - "epoch": 0.78, - "learning_rate": 0.00018301860138942842, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.0002398959513298996, + "loss": 0.0192, "step": 154580 }, { - "epoch": 0.78, - "learning_rate": 0.0001830110336964144, - "loss": 0.0105, + "epoch": 0.4, + "learning_rate": 0.00023989206311352812, + "loss": 0.0168, "step": 154590 }, { - "epoch": 0.78, - "learning_rate": 0.0001830034660034004, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00023988817489715666, + "loss": 0.0163, "step": 154600 }, { - "epoch": 0.78, - "learning_rate": 0.0001829958983103864, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023988428668078517, + "loss": 0.0194, "step": 154610 }, { - "epoch": 0.78, - "learning_rate": 0.00018298833061737238, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00023988039846441374, + "loss": 0.016, "step": 154620 }, { - "epoch": 0.78, - "learning_rate": 0.00018298076292435836, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023987651024804226, + "loss": 0.0188, "step": 154630 }, { - "epoch": 0.78, - "learning_rate": 0.00018297319523134437, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.0002398726220316708, + "loss": 0.0145, "step": 154640 }, { - "epoch": 0.78, - "learning_rate": 0.00018296562753833035, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.0002398687338152993, + "loss": 0.0206, "step": 154650 }, { - "epoch": 0.78, - "learning_rate": 0.00018295805984531633, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023986484559892788, + "loss": 0.0242, "step": 154660 }, { - "epoch": 0.78, - "learning_rate": 0.00018295049215230234, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.0002398609573825564, + "loss": 0.0242, "step": 154670 }, { - "epoch": 0.78, - "learning_rate": 0.00018294292445928832, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023985706916618494, + "loss": 0.0187, "step": 154680 }, { - "epoch": 0.78, - "learning_rate": 0.0001829353567662743, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00023985318094981345, + "loss": 0.0158, "step": 154690 }, { - "epoch": 0.78, - "learning_rate": 0.0001829277890732603, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023984929273344202, + "loss": 0.0173, "step": 154700 }, { - "epoch": 0.78, - "learning_rate": 0.0001829202213802463, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00023984540451707056, + "loss": 0.0183, "step": 154710 }, { - "epoch": 0.78, - "learning_rate": 0.00018291265368723227, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023984151630069908, + "loss": 0.0207, "step": 154720 }, { - "epoch": 0.78, - "learning_rate": 0.00018290508599421828, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00023983762808432762, + "loss": 0.0167, "step": 154730 }, { - "epoch": 0.78, - "learning_rate": 0.00018289751830120426, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00023983373986795616, + "loss": 0.016, "step": 154740 }, { - "epoch": 0.78, - "learning_rate": 0.00018288995060819024, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.0002398298516515847, + "loss": 0.0175, "step": 154750 }, { - "epoch": 0.78, - "learning_rate": 0.00018288238291517625, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00023982596343521322, + "loss": 0.018, "step": 154760 }, { - "epoch": 0.78, - "learning_rate": 0.00018287481522216223, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.00023982207521884176, + "loss": 0.0179, "step": 154770 }, { - "epoch": 0.78, - "learning_rate": 0.00018286724752914822, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.0002398181870024703, + "loss": 0.0197, "step": 154780 }, { - "epoch": 0.78, - "learning_rate": 0.0001828596798361342, - "loss": 0.0159, + "epoch": 0.4, + "learning_rate": 0.00023981429878609884, + "loss": 0.0184, "step": 154790 }, { - "epoch": 0.78, - "learning_rate": 0.0001828521121431202, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023981041056972735, + "loss": 0.0186, "step": 154800 }, { - "epoch": 0.78, - "learning_rate": 0.0001828445444501062, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.0002398065223533559, + "loss": 0.0181, "step": 154810 }, { - "epoch": 0.78, - "learning_rate": 0.00018283697675709217, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.0002398026341369844, + "loss": 0.02, "step": 154820 }, { - "epoch": 0.78, - "learning_rate": 0.00018282940906407818, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023979874592061298, + "loss": 0.0162, "step": 154830 }, { - "epoch": 0.78, - "learning_rate": 0.00018282184137106416, - "loss": 0.0113, + "epoch": 0.4, + "learning_rate": 0.0002397948577042415, + "loss": 0.0206, "step": 154840 }, { - "epoch": 0.78, - "learning_rate": 0.00018281427367805014, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023979096948787004, + "loss": 0.0187, "step": 154850 }, { - "epoch": 0.78, - "learning_rate": 0.00018280670598503615, - "loss": 0.0141, + "epoch": 0.4, + "learning_rate": 0.00023978708127149855, + "loss": 0.0191, "step": 154860 }, { - "epoch": 0.78, - "learning_rate": 0.00018279913829202213, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00023978319305512712, + "loss": 0.0179, "step": 154870 }, { - "epoch": 0.78, - "learning_rate": 0.0001827915705990081, - "loss": 0.0107, + "epoch": 0.4, + "learning_rate": 0.00023977930483875566, + "loss": 0.0167, "step": 154880 }, { - "epoch": 0.78, - "learning_rate": 0.00018278400290599412, - "loss": 0.0158, + "epoch": 0.4, + "learning_rate": 0.00023977541662238418, + "loss": 0.0198, "step": 154890 }, { - "epoch": 0.78, - "learning_rate": 0.0001827764352129801, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.0002397715284060127, + "loss": 0.0165, "step": 154900 }, { - "epoch": 0.78, - "learning_rate": 0.00018276886751996608, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023976764018964126, + "loss": 0.0211, "step": 154910 }, { - "epoch": 0.78, - "learning_rate": 0.0001827612998269521, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.0002397637519732698, + "loss": 0.0191, "step": 154920 }, { - "epoch": 0.78, - "learning_rate": 0.00018275373213393807, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00023975986375689831, + "loss": 0.0166, "step": 154930 }, { - "epoch": 0.78, - "learning_rate": 0.00018274616444092405, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00023975597554052686, + "loss": 0.0177, "step": 154940 }, { - "epoch": 0.78, - "learning_rate": 0.00018273859674791004, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.0002397520873241554, + "loss": 0.0177, "step": 154950 }, { - "epoch": 0.78, - "learning_rate": 0.00018273102905489604, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023974819910778394, + "loss": 0.0171, "step": 154960 }, { - "epoch": 0.78, - "learning_rate": 0.00018272346136188203, - "loss": 0.0162, + "epoch": 0.4, + "learning_rate": 0.00023974431089141245, + "loss": 0.0249, "step": 154970 }, { - "epoch": 0.78, - "learning_rate": 0.000182715893668868, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.000239740422675041, + "loss": 0.0234, "step": 154980 }, { - "epoch": 0.78, - "learning_rate": 0.00018270832597585402, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00023973653445866954, + "loss": 0.0175, "step": 154990 }, { - "epoch": 0.78, - "learning_rate": 0.00018270075828284, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023973264624229808, + "loss": 0.0185, "step": 155000 }, { - "epoch": 0.78, - "eval_cer": 0.9144731670915385, - "eval_loss": 0.009108257479965687, - "eval_runtime": 116.7273, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.4, + "eval_cer": 0.8818146572779021, + "eval_loss": 0.013523012399673462, + "eval_runtime": 108.0058, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.629, "step": 155000 }, { - "epoch": 0.78, - "learning_rate": 0.00018269319058982598, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.0002397287580259266, + "loss": 0.0183, "step": 155010 }, { - "epoch": 0.78, - "learning_rate": 0.000182685622896812, - "loss": 0.0206, + "epoch": 0.4, + "learning_rate": 0.00023972486980955514, + "loss": 0.0213, "step": 155020 }, { - "epoch": 0.78, - "learning_rate": 0.00018267805520379797, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.0002397209815931837, + "loss": 0.0215, "step": 155030 }, { - "epoch": 0.78, - "learning_rate": 0.00018267048751078395, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00023971709337681222, + "loss": 0.0207, "step": 155040 }, { - "epoch": 0.78, - "learning_rate": 0.00018266291981776996, - "loss": 0.0166, + "epoch": 0.4, + "learning_rate": 0.00023971320516044073, + "loss": 0.0167, "step": 155050 }, { - "epoch": 0.78, - "learning_rate": 0.00018265535212475594, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023970931694406927, + "loss": 0.0144, "step": 155060 }, { - "epoch": 0.78, - "learning_rate": 0.00018264778443174192, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.0002397054287276978, + "loss": 0.0368, "step": 155070 }, { - "epoch": 0.78, - "learning_rate": 0.00018264021673872793, - "loss": 0.0103, + "epoch": 0.4, + "learning_rate": 0.00023970154051132636, + "loss": 0.0214, "step": 155080 }, { - "epoch": 0.78, - "learning_rate": 0.0001826326490457139, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.0002396976522949549, + "loss": 0.0182, "step": 155090 }, { - "epoch": 0.78, - "learning_rate": 0.0001826250813526999, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00023969376407858341, + "loss": 0.0177, "step": 155100 }, { - "epoch": 0.78, - "learning_rate": 0.00018261751365968587, - "loss": 0.0111, + "epoch": 0.4, + "learning_rate": 0.00023968987586221196, + "loss": 0.021, "step": 155110 }, { - "epoch": 0.78, - "learning_rate": 0.00018260994596667188, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.0002396859876458405, + "loss": 0.021, "step": 155120 }, { - "epoch": 0.78, - "learning_rate": 0.00018260237827365786, - "loss": 0.0121, + "epoch": 0.4, + "learning_rate": 0.00023968209942946904, + "loss": 0.0173, "step": 155130 }, { - "epoch": 0.78, - "learning_rate": 0.00018259481058064385, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023967821121309755, + "loss": 0.0214, "step": 155140 }, { - "epoch": 0.78, - "learning_rate": 0.00018258724288762985, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.0002396743229967261, + "loss": 0.0217, "step": 155150 }, { - "epoch": 0.78, - "learning_rate": 0.00018257967519461584, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00023967043478035464, + "loss": 0.0186, "step": 155160 }, { - "epoch": 0.78, - "learning_rate": 0.00018257210750160182, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023966654656398318, + "loss": 0.0176, "step": 155170 }, { - "epoch": 0.78, - "learning_rate": 0.00018256453980858783, - "loss": 0.0182, + "epoch": 0.4, + "learning_rate": 0.0002396626583476117, + "loss": 0.0191, "step": 155180 }, { - "epoch": 0.78, - "learning_rate": 0.0001825569721155738, - "loss": 0.0164, + "epoch": 0.4, + "learning_rate": 0.00023965877013124023, + "loss": 0.0183, "step": 155190 }, { - "epoch": 0.78, - "learning_rate": 0.0001825494044225598, - "loss": 0.017, + "epoch": 0.4, + "learning_rate": 0.0002396548819148688, + "loss": 0.0165, "step": 155200 }, { - "epoch": 0.78, - "learning_rate": 0.0001825418367295458, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023965099369849732, + "loss": 0.0181, "step": 155210 }, { - "epoch": 0.78, - "learning_rate": 0.00018253426903653178, - "loss": 0.015, + "epoch": 0.4, + "learning_rate": 0.00023964710548212583, + "loss": 0.0229, "step": 155220 }, { - "epoch": 0.78, - "learning_rate": 0.00018252670134351773, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023964321726575437, + "loss": 0.0224, "step": 155230 }, { - "epoch": 0.78, - "learning_rate": 0.00018251913365050371, - "loss": 0.0164, + "epoch": 0.4, + "learning_rate": 0.00023963932904938294, + "loss": 0.0214, "step": 155240 }, { - "epoch": 0.78, - "learning_rate": 0.00018251156595748972, - "loss": 0.0184, + "epoch": 0.4, + "learning_rate": 0.00023963544083301146, + "loss": 0.0202, "step": 155250 }, { - "epoch": 0.78, - "learning_rate": 0.0001825039982644757, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00023963155261664, + "loss": 0.0224, "step": 155260 }, { - "epoch": 0.78, - "learning_rate": 0.00018249643057146169, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023962766440026851, + "loss": 0.0201, "step": 155270 }, { - "epoch": 0.78, - "learning_rate": 0.0001824888628784477, - "loss": 0.0101, + "epoch": 0.4, + "learning_rate": 0.00023962377618389708, + "loss": 0.0203, "step": 155280 }, { - "epoch": 0.78, - "learning_rate": 0.00018248129518543368, - "loss": 0.0154, + "epoch": 0.4, + "learning_rate": 0.0002396198879675256, + "loss": 0.0198, "step": 155290 }, { - "epoch": 0.78, - "learning_rate": 0.00018247372749241966, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.00023961599975115414, + "loss": 0.0162, "step": 155300 }, { - "epoch": 0.78, - "learning_rate": 0.00018246615979940567, - "loss": 0.0109, + "epoch": 0.4, + "learning_rate": 0.00023961211153478265, + "loss": 0.0192, "step": 155310 }, { - "epoch": 0.78, - "learning_rate": 0.00018245859210639165, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.0002396082233184112, + "loss": 0.022, "step": 155320 }, { - "epoch": 0.78, - "learning_rate": 0.00018245102441337763, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00023960433510203974, + "loss": 0.0201, "step": 155330 }, { - "epoch": 0.78, - "learning_rate": 0.0001824434567203636, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00023960044688566828, + "loss": 0.0169, "step": 155340 }, { - "epoch": 0.78, - "learning_rate": 0.00018243588902734962, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.0002395965586692968, + "loss": 0.0224, "step": 155350 }, { - "epoch": 0.78, - "learning_rate": 0.0001824283213343356, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00023959267045292533, + "loss": 0.0215, "step": 155360 }, { - "epoch": 0.78, - "learning_rate": 0.00018242075364132158, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00023958878223655388, + "loss": 0.02, "step": 155370 }, { - "epoch": 0.78, - "learning_rate": 0.0001824131859483076, - "loss": 0.0131, + "epoch": 0.4, + "learning_rate": 0.00023958489402018242, + "loss": 0.0197, "step": 155380 }, { - "epoch": 0.78, - "learning_rate": 0.00018240561825529357, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00023958100580381093, + "loss": 0.0166, "step": 155390 }, { - "epoch": 0.78, - "learning_rate": 0.00018239805056227955, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023957711758743947, + "loss": 0.0229, "step": 155400 }, { - "epoch": 0.78, - "learning_rate": 0.00018239048286926556, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023957322937106804, + "loss": 0.021, "step": 155410 }, { - "epoch": 0.78, - "learning_rate": 0.00018238291517625154, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023956934115469656, + "loss": 0.0202, "step": 155420 }, { - "epoch": 0.78, - "learning_rate": 0.00018237534748323752, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.0002395654529383251, + "loss": 0.0176, "step": 155430 }, { - "epoch": 0.78, - "learning_rate": 0.00018236777979022353, - "loss": 0.0105, + "epoch": 0.4, + "learning_rate": 0.0002395615647219536, + "loss": 0.0203, "step": 155440 }, { - "epoch": 0.78, - "learning_rate": 0.00018236021209720951, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023955767650558218, + "loss": 0.0265, "step": 155450 }, { - "epoch": 0.78, - "learning_rate": 0.0001823526444041955, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.0002395537882892107, + "loss": 0.0187, "step": 155460 }, { - "epoch": 0.78, - "learning_rate": 0.0001823450767111815, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00023954990007283924, + "loss": 0.0186, "step": 155470 }, { - "epoch": 0.78, - "learning_rate": 0.00018233750901816749, - "loss": 0.0088, + "epoch": 0.4, + "learning_rate": 0.00023954601185646775, + "loss": 0.0186, "step": 155480 }, { - "epoch": 0.78, - "learning_rate": 0.00018232994132515347, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023954212364009632, + "loss": 0.017, "step": 155490 }, { - "epoch": 0.78, - "learning_rate": 0.00018232237363213945, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00023953823542372484, + "loss": 0.0225, "step": 155500 }, { - "epoch": 0.78, - "learning_rate": 0.00018231480593912546, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023953434720735338, + "loss": 0.0174, "step": 155510 }, { - "epoch": 0.78, - "learning_rate": 0.00018230723824611144, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.0002395304589909819, + "loss": 0.0179, "step": 155520 }, { - "epoch": 0.78, - "learning_rate": 0.00018229967055309742, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00023952657077461046, + "loss": 0.0195, "step": 155530 }, { - "epoch": 0.78, - "learning_rate": 0.00018229210286008343, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00023952268255823898, + "loss": 0.0181, "step": 155540 }, { - "epoch": 0.78, - "learning_rate": 0.0001822845351670694, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023951879434186752, + "loss": 0.018, "step": 155550 }, { - "epoch": 0.78, - "learning_rate": 0.0001822769674740554, - "loss": 0.0147, + "epoch": 0.4, + "learning_rate": 0.00023951490612549603, + "loss": 0.0175, "step": 155560 }, { - "epoch": 0.78, - "learning_rate": 0.0001822693997810414, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023951101790912457, + "loss": 0.0238, "step": 155570 }, { - "epoch": 0.78, - "learning_rate": 0.00018226183208802738, - "loss": 0.0108, + "epoch": 0.4, + "learning_rate": 0.00023950712969275314, + "loss": 0.0156, "step": 155580 }, { - "epoch": 0.78, - "learning_rate": 0.00018225426439501336, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00023950324147638166, + "loss": 0.0188, "step": 155590 }, { - "epoch": 0.79, - "learning_rate": 0.00018224669670199937, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.0002394993532600102, + "loss": 0.0184, "step": 155600 }, { - "epoch": 0.79, - "learning_rate": 0.00018223912900898535, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.0002394954650436387, + "loss": 0.0165, "step": 155610 }, { - "epoch": 0.79, - "learning_rate": 0.00018223156131597133, - "loss": 0.0132, + "epoch": 0.4, + "learning_rate": 0.00023949157682726728, + "loss": 0.02, "step": 155620 }, { - "epoch": 0.79, - "learning_rate": 0.00018222399362295734, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.0002394876886108958, + "loss": 0.015, "step": 155630 }, { - "epoch": 0.79, - "learning_rate": 0.00018221642592994332, - "loss": 0.0174, + "epoch": 0.4, + "learning_rate": 0.00023948380039452434, + "loss": 0.0192, "step": 155640 }, { - "epoch": 0.79, - "learning_rate": 0.0001822088582369293, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023947991217815285, + "loss": 0.0141, "step": 155650 }, { - "epoch": 0.79, - "learning_rate": 0.00018220129054391531, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023947602396178142, + "loss": 0.0228, "step": 155660 }, { - "epoch": 0.79, - "learning_rate": 0.0001821937228509013, - "loss": 0.0115, + "epoch": 0.4, + "learning_rate": 0.00023947213574540994, + "loss": 0.0184, "step": 155670 }, { - "epoch": 0.79, - "learning_rate": 0.00018218615515788728, - "loss": 0.0114, + "epoch": 0.4, + "learning_rate": 0.00023946824752903848, + "loss": 0.0205, "step": 155680 }, { - "epoch": 0.79, - "learning_rate": 0.00018217858746487326, - "loss": 0.0108, + "epoch": 0.4, + "learning_rate": 0.000239464359312667, + "loss": 0.0222, "step": 155690 }, { - "epoch": 0.79, - "learning_rate": 0.00018217101977185927, - "loss": 0.0118, + "epoch": 0.4, + "learning_rate": 0.00023946047109629556, + "loss": 0.0187, "step": 155700 }, { - "epoch": 0.79, - "learning_rate": 0.00018216345207884525, - "loss": 0.0119, + "epoch": 0.4, + "learning_rate": 0.00023945658287992407, + "loss": 0.0206, "step": 155710 }, { - "epoch": 0.79, - "learning_rate": 0.00018215588438583123, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.00023945269466355262, + "loss": 0.0185, "step": 155720 }, { - "epoch": 0.79, - "learning_rate": 0.00018214831669281724, - "loss": 0.0102, + "epoch": 0.4, + "learning_rate": 0.00023944880644718113, + "loss": 0.0178, "step": 155730 }, { - "epoch": 0.79, - "learning_rate": 0.00018214074899980322, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.0002394449182308097, + "loss": 0.0179, "step": 155740 }, { - "epoch": 0.79, - "learning_rate": 0.0001821331813067892, - "loss": 0.0142, + "epoch": 0.4, + "learning_rate": 0.00023944103001443824, + "loss": 0.0149, "step": 155750 }, { - "epoch": 0.79, - "learning_rate": 0.0001821256136137752, - "loss": 0.0108, + "epoch": 0.4, + "learning_rate": 0.00023943714179806676, + "loss": 0.0183, "step": 155760 }, { - "epoch": 0.79, - "learning_rate": 0.0001821180459207612, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023943325358169527, + "loss": 0.0168, "step": 155770 }, { - "epoch": 0.79, - "learning_rate": 0.00018211047822774717, - "loss": 0.0161, + "epoch": 0.4, + "learning_rate": 0.00023942936536532384, + "loss": 0.0191, "step": 155780 }, { - "epoch": 0.79, - "learning_rate": 0.00018210291053473318, - "loss": 0.0138, + "epoch": 0.4, + "learning_rate": 0.00023942547714895238, + "loss": 0.0176, "step": 155790 }, { - "epoch": 0.79, - "learning_rate": 0.00018209534284171916, - "loss": 0.011, + "epoch": 0.4, + "learning_rate": 0.0002394215889325809, + "loss": 0.0214, "step": 155800 }, { - "epoch": 0.79, - "learning_rate": 0.00018208777514870514, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.00023941770071620944, + "loss": 0.022, "step": 155810 }, { - "epoch": 0.79, - "learning_rate": 0.00018208020745569115, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023941381249983795, + "loss": 0.0261, "step": 155820 }, { - "epoch": 0.79, - "learning_rate": 0.00018207263976267713, - "loss": 0.0126, + "epoch": 0.4, + "learning_rate": 0.00023940992428346652, + "loss": 0.0239, "step": 155830 }, { - "epoch": 0.79, - "learning_rate": 0.00018206507206966312, - "loss": 0.0143, + "epoch": 0.4, + "learning_rate": 0.00023940603606709503, + "loss": 0.0182, "step": 155840 }, { - "epoch": 0.79, - "learning_rate": 0.0001820575043766491, - "loss": 0.0099, + "epoch": 0.4, + "learning_rate": 0.00023940214785072358, + "loss": 0.0191, "step": 155850 }, { - "epoch": 0.79, - "learning_rate": 0.0001820499366836351, - "loss": 0.0129, + "epoch": 0.4, + "learning_rate": 0.0002393982596343521, + "loss": 0.0212, "step": 155860 }, { - "epoch": 0.79, - "learning_rate": 0.0001820423689906211, - "loss": 0.0159, + "epoch": 0.4, + "learning_rate": 0.00023939437141798066, + "loss": 0.018, "step": 155870 }, { - "epoch": 0.79, - "learning_rate": 0.00018203480129760707, - "loss": 0.0127, + "epoch": 0.4, + "learning_rate": 0.00023939048320160917, + "loss": 0.019, "step": 155880 }, { - "epoch": 0.79, - "learning_rate": 0.00018202723360459308, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00023938659498523772, + "loss": 0.0239, "step": 155890 }, { - "epoch": 0.79, - "learning_rate": 0.00018201966591157906, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023938270676886623, + "loss": 0.0233, "step": 155900 }, { - "epoch": 0.79, - "learning_rate": 0.00018201209821856504, - "loss": 0.0155, + "epoch": 0.4, + "learning_rate": 0.0002393788185524948, + "loss": 0.0176, "step": 155910 }, { - "epoch": 0.79, - "learning_rate": 0.00018200453052555105, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00023937493033612334, + "loss": 0.0239, "step": 155920 }, { - "epoch": 0.79, - "learning_rate": 0.00018199696283253703, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00023937104211975186, + "loss": 0.0206, "step": 155930 }, { - "epoch": 0.79, - "learning_rate": 0.000181989395139523, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023936715390338037, + "loss": 0.0213, "step": 155940 }, { - "epoch": 0.79, - "learning_rate": 0.00018198182744650902, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00023936326568700894, + "loss": 0.0252, "step": 155950 }, { - "epoch": 0.79, - "learning_rate": 0.000181974259753495, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023935937747063748, + "loss": 0.0237, "step": 155960 }, { - "epoch": 0.79, - "learning_rate": 0.00018196669206048098, - "loss": 0.0139, + "epoch": 0.4, + "learning_rate": 0.000239355489254266, + "loss": 0.0173, "step": 155970 }, { - "epoch": 0.79, - "learning_rate": 0.000181959124367467, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023935160103789454, + "loss": 0.0203, "step": 155980 }, { - "epoch": 0.79, - "learning_rate": 0.00018195155667445297, - "loss": 0.01, + "epoch": 0.4, + "learning_rate": 0.00023934771282152308, + "loss": 0.021, "step": 155990 }, { - "epoch": 0.79, - "learning_rate": 0.00018194398898143895, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023934382460515162, + "loss": 0.0229, "step": 156000 }, { - "epoch": 0.79, - "eval_cer": 0.9144838414489178, - "eval_loss": 0.00919434055685997, - "eval_runtime": 116.631, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.4, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.012980636209249496, + "eval_runtime": 108.1448, + "eval_samples_per_second": 18.494, + "eval_steps_per_second": 4.623, "step": 156000 }, { - "epoch": 0.79, - "learning_rate": 0.00018193642128842494, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00023933993638878013, + "loss": 0.0183, "step": 156010 }, { - "epoch": 0.79, - "learning_rate": 0.00018192885359541094, - "loss": 0.0135, + "epoch": 0.4, + "learning_rate": 0.00023933604817240868, + "loss": 0.0206, "step": 156020 }, { - "epoch": 0.79, - "learning_rate": 0.00018192128590239693, - "loss": 0.0128, + "epoch": 0.4, + "learning_rate": 0.00023933215995603722, + "loss": 0.0172, "step": 156030 }, { - "epoch": 0.79, - "learning_rate": 0.0001819137182093829, - "loss": 0.0144, + "epoch": 0.4, + "learning_rate": 0.00023932827173966576, + "loss": 0.0202, "step": 156040 }, { - "epoch": 0.79, - "learning_rate": 0.00018190615051636892, - "loss": 0.0157, + "epoch": 0.4, + "learning_rate": 0.00023932438352329427, + "loss": 0.0173, "step": 156050 }, { - "epoch": 0.79, - "learning_rate": 0.0001818985828233549, - "loss": 0.0149, + "epoch": 0.4, + "learning_rate": 0.00023932049530692282, + "loss": 0.0174, "step": 156060 }, { - "epoch": 0.79, - "learning_rate": 0.00018189101513034088, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.00023931660709055133, + "loss": 0.0168, "step": 156070 }, { - "epoch": 0.79, - "learning_rate": 0.0001818834474373269, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.0002393127188741799, + "loss": 0.0176, "step": 156080 }, { - "epoch": 0.79, - "learning_rate": 0.00018187587974431287, - "loss": 0.0116, + "epoch": 0.4, + "learning_rate": 0.0002393088306578084, + "loss": 0.0172, "step": 156090 }, { - "epoch": 0.79, - "learning_rate": 0.00018186831205129885, - "loss": 0.014, + "epoch": 0.4, + "learning_rate": 0.00023930494244143695, + "loss": 0.0344, "step": 156100 }, { - "epoch": 0.79, - "learning_rate": 0.00018186074435828486, - "loss": 0.0123, + "epoch": 0.4, + "learning_rate": 0.00023930105422506547, + "loss": 0.0204, "step": 156110 }, { - "epoch": 0.79, - "learning_rate": 0.00018185317666527084, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023929716600869404, + "loss": 0.0174, "step": 156120 }, { - "epoch": 0.79, - "learning_rate": 0.00018184560897225682, - "loss": 0.0124, + "epoch": 0.4, + "learning_rate": 0.00023929327779232258, + "loss": 0.0237, "step": 156130 }, { - "epoch": 0.79, - "learning_rate": 0.00018183804127924283, - "loss": 0.0112, + "epoch": 0.4, + "learning_rate": 0.0002392893895759511, + "loss": 0.0183, "step": 156140 }, { - "epoch": 0.79, - "learning_rate": 0.0001818304735862288, - "loss": 0.012, + "epoch": 0.4, + "learning_rate": 0.00023928550135957964, + "loss": 0.0171, "step": 156150 }, { - "epoch": 0.79, - "learning_rate": 0.0001818229058932148, - "loss": 0.0125, + "epoch": 0.4, + "learning_rate": 0.00023928161314320818, + "loss": 0.0204, "step": 156160 }, { - "epoch": 0.79, - "learning_rate": 0.0001818153382002008, - "loss": 0.013, + "epoch": 0.4, + "learning_rate": 0.00023927772492683672, + "loss": 0.0189, "step": 156170 }, { - "epoch": 0.79, - "learning_rate": 0.00018180777050718678, - "loss": 0.0136, + "epoch": 0.4, + "learning_rate": 0.00023927383671046523, + "loss": 0.018, "step": 156180 }, { - "epoch": 0.79, - "learning_rate": 0.00018180020281417276, - "loss": 0.0117, + "epoch": 0.4, + "learning_rate": 0.00023926994849409378, + "loss": 0.0188, "step": 156190 }, { - "epoch": 0.79, - "learning_rate": 0.00018179263512115875, - "loss": 0.0137, + "epoch": 0.4, + "learning_rate": 0.00023926606027772232, + "loss": 0.0179, "step": 156200 }, { - "epoch": 0.79, - "learning_rate": 0.00018178506742814475, - "loss": 0.0122, + "epoch": 0.4, + "learning_rate": 0.00023926217206135086, + "loss": 0.0204, "step": 156210 }, { - "epoch": 0.79, - "learning_rate": 0.00018177749973513074, - "loss": 0.0134, + "epoch": 0.4, + "learning_rate": 0.00023925828384497937, + "loss": 0.016, "step": 156220 }, { - "epoch": 0.79, - "learning_rate": 0.00018176993204211672, - "loss": 0.0133, + "epoch": 0.4, + "learning_rate": 0.00023925439562860791, + "loss": 0.0231, "step": 156230 }, { - "epoch": 0.79, - "learning_rate": 0.00018176236434910273, - "loss": 0.0091, + "epoch": 0.4, + "learning_rate": 0.00023925050741223646, + "loss": 0.0208, "step": 156240 }, { - "epoch": 0.79, - "learning_rate": 0.0001817547966560887, - "loss": 0.0171, + "epoch": 0.41, + "learning_rate": 0.000239246619195865, + "loss": 0.0187, "step": 156250 }, { - "epoch": 0.79, - "learning_rate": 0.0001817472289630747, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.0002392427309794935, + "loss": 0.0188, "step": 156260 }, { - "epoch": 0.79, - "learning_rate": 0.0001817396612700607, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023923884276312205, + "loss": 0.0182, "step": 156270 }, { - "epoch": 0.79, - "learning_rate": 0.00018173209357704668, - "loss": 0.0103, + "epoch": 0.41, + "learning_rate": 0.00023923495454675062, + "loss": 0.016, "step": 156280 }, { - "epoch": 0.79, - "learning_rate": 0.00018172452588403266, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023923106633037914, + "loss": 0.0178, "step": 156290 }, { - "epoch": 0.79, - "learning_rate": 0.00018171695819101867, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023922717811400768, + "loss": 0.0213, "step": 156300 }, { - "epoch": 0.79, - "learning_rate": 0.00018170939049800465, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.0002392232898976362, + "loss": 0.017, "step": 156310 }, { - "epoch": 0.79, - "learning_rate": 0.00018170182280499063, - "loss": 0.0106, + "epoch": 0.41, + "learning_rate": 0.00023921940168126474, + "loss": 0.0172, "step": 156320 }, { - "epoch": 0.79, - "learning_rate": 0.00018169425511197664, - "loss": 0.0093, + "epoch": 0.41, + "learning_rate": 0.00023921551346489328, + "loss": 0.0204, "step": 156330 }, { - "epoch": 0.79, - "learning_rate": 0.00018168668741896262, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023921162524852182, + "loss": 0.022, "step": 156340 }, { - "epoch": 0.79, - "learning_rate": 0.0001816791197259486, - "loss": 0.0085, + "epoch": 0.41, + "learning_rate": 0.00023920773703215033, + "loss": 0.0146, "step": 156350 }, { - "epoch": 0.79, - "learning_rate": 0.00018167155203293459, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023920384881577887, + "loss": 0.0179, "step": 156360 }, { - "epoch": 0.79, - "learning_rate": 0.0001816639843399206, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023919996059940742, + "loss": 0.0221, "step": 156370 }, { - "epoch": 0.79, - "learning_rate": 0.00018165641664690657, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023919607238303596, + "loss": 0.0237, "step": 156380 }, { - "epoch": 0.79, - "learning_rate": 0.00018164884895389256, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023919218416666447, + "loss": 0.0208, "step": 156390 }, { - "epoch": 0.79, - "learning_rate": 0.00018164128126087856, - "loss": 0.01, + "epoch": 0.41, + "learning_rate": 0.00023918829595029301, + "loss": 0.0185, "step": 156400 }, { - "epoch": 0.79, - "learning_rate": 0.00018163371356786455, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023918440773392156, + "loss": 0.0183, "step": 156410 }, { - "epoch": 0.79, - "learning_rate": 0.00018162614587485053, - "loss": 0.0155, + "epoch": 0.41, + "learning_rate": 0.0002391805195175501, + "loss": 0.0202, "step": 156420 }, { - "epoch": 0.79, - "learning_rate": 0.00018161857818183654, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.0002391766313011786, + "loss": 0.0159, "step": 156430 }, { - "epoch": 0.79, - "learning_rate": 0.00018161101048882252, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023917274308480715, + "loss": 0.0161, "step": 156440 }, { - "epoch": 0.79, - "learning_rate": 0.0001816034427958085, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023916885486843572, + "loss": 0.0226, "step": 156450 }, { - "epoch": 0.79, - "learning_rate": 0.0001815958751027945, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023916496665206424, + "loss": 0.0211, "step": 156460 }, { - "epoch": 0.79, - "learning_rate": 0.0001815883074097805, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023916107843569278, + "loss": 0.0181, "step": 156470 }, { - "epoch": 0.79, - "learning_rate": 0.00018158073971676647, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.0002391571902193213, + "loss": 0.0193, "step": 156480 }, { - "epoch": 0.79, - "learning_rate": 0.00018157317202375243, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023915330200294986, + "loss": 0.0152, "step": 156490 }, { - "epoch": 0.79, - "learning_rate": 0.00018156560433073843, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023914941378657838, + "loss": 0.0191, "step": 156500 }, { - "epoch": 0.79, - "learning_rate": 0.00018155803663772442, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023914552557020692, + "loss": 0.0196, "step": 156510 }, { - "epoch": 0.79, - "learning_rate": 0.0001815504689447104, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023914163735383543, + "loss": 0.0212, "step": 156520 }, { - "epoch": 0.79, - "learning_rate": 0.0001815429012516964, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.000239137749137464, + "loss": 0.016, "step": 156530 }, { - "epoch": 0.79, - "learning_rate": 0.0001815353335586824, - "loss": 0.0195, + "epoch": 0.41, + "learning_rate": 0.00023913386092109252, + "loss": 0.0192, "step": 156540 }, { - "epoch": 0.79, - "learning_rate": 0.00018152776586566837, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023912997270472106, + "loss": 0.0242, "step": 156550 }, { - "epoch": 0.79, - "learning_rate": 0.00018152019817265438, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023912608448834957, + "loss": 0.02, "step": 156560 }, { - "epoch": 0.79, - "learning_rate": 0.00018151263047964036, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.0002391221962719781, + "loss": 0.0193, "step": 156570 }, { - "epoch": 0.79, - "learning_rate": 0.00018150506278662634, - "loss": 0.0114, + "epoch": 0.41, + "learning_rate": 0.00023911830805560666, + "loss": 0.0185, "step": 156580 }, { - "epoch": 0.79, - "learning_rate": 0.00018149749509361232, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.0002391144198392352, + "loss": 0.0234, "step": 156590 }, { - "epoch": 0.79, - "learning_rate": 0.00018148992740059833, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002391105316228637, + "loss": 0.019, "step": 156600 }, { - "epoch": 0.79, - "learning_rate": 0.0001814823597075843, - "loss": 0.0273, + "epoch": 0.41, + "learning_rate": 0.00023910664340649225, + "loss": 0.021, "step": 156610 }, { - "epoch": 0.79, - "learning_rate": 0.0001814747920145703, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023910275519012082, + "loss": 0.0209, "step": 156620 }, { - "epoch": 0.79, - "learning_rate": 0.0001814672243215563, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.00023909886697374934, + "loss": 0.025, "step": 156630 }, { - "epoch": 0.79, - "learning_rate": 0.00018145965662854228, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023909497875737785, + "loss": 0.0263, "step": 156640 }, { - "epoch": 0.79, - "learning_rate": 0.00018145208893552826, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.0002390910905410064, + "loss": 0.0198, "step": 156650 }, { - "epoch": 0.79, - "learning_rate": 0.00018144452124251427, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023908720232463496, + "loss": 0.0239, "step": 156660 }, { - "epoch": 0.79, - "learning_rate": 0.00018143695354950025, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023908331410826348, + "loss": 0.0206, "step": 156670 }, { - "epoch": 0.79, - "learning_rate": 0.00018142938585648624, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023907942589189202, + "loss": 0.0163, "step": 156680 }, { - "epoch": 0.79, - "learning_rate": 0.00018142181816347224, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023907553767552053, + "loss": 0.0221, "step": 156690 }, { - "epoch": 0.79, - "learning_rate": 0.00018141425047045823, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.0002390716494591491, + "loss": 0.0209, "step": 156700 }, { - "epoch": 0.79, - "learning_rate": 0.0001814066827774442, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023906776124277762, + "loss": 0.0182, "step": 156710 }, { - "epoch": 0.79, - "learning_rate": 0.00018139911508443022, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023906387302640616, + "loss": 0.0154, "step": 156720 }, { - "epoch": 0.79, - "learning_rate": 0.0001813915473914162, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023905998481003467, + "loss": 0.0194, "step": 156730 }, { - "epoch": 0.79, - "learning_rate": 0.00018138397969840218, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023905609659366324, + "loss": 0.0212, "step": 156740 }, { - "epoch": 0.79, - "learning_rate": 0.00018137641200538816, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023905220837729175, + "loss": 0.0174, "step": 156750 }, { - "epoch": 0.79, - "learning_rate": 0.00018136884431237417, - "loss": 0.0091, + "epoch": 0.41, + "learning_rate": 0.0002390483201609203, + "loss": 0.0159, "step": 156760 }, { - "epoch": 0.79, - "learning_rate": 0.00018136127661936015, - "loss": 0.0101, + "epoch": 0.41, + "learning_rate": 0.0002390444319445488, + "loss": 0.0171, "step": 156770 }, { - "epoch": 0.79, - "learning_rate": 0.00018135370892634613, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023904054372817738, + "loss": 0.0176, "step": 156780 }, { - "epoch": 0.79, - "learning_rate": 0.00018134614123333214, - "loss": 0.0159, + "epoch": 0.41, + "learning_rate": 0.00023903665551180592, + "loss": 0.0203, "step": 156790 }, { - "epoch": 0.79, - "learning_rate": 0.00018133857354031812, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023903276729543444, + "loss": 0.02, "step": 156800 }, { - "epoch": 0.79, - "learning_rate": 0.0001813310058473041, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023902887907906295, + "loss": 0.0177, "step": 156810 }, { - "epoch": 0.79, - "learning_rate": 0.0001813234381542901, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.0002390249908626915, + "loss": 0.0205, "step": 156820 }, { - "epoch": 0.79, - "learning_rate": 0.0001813158704612761, - "loss": 0.0155, + "epoch": 0.41, + "learning_rate": 0.00023902110264632006, + "loss": 0.0183, "step": 156830 }, { - "epoch": 0.79, - "learning_rate": 0.00018130830276826207, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023901721442994857, + "loss": 0.018, "step": 156840 }, { - "epoch": 0.79, - "learning_rate": 0.00018130073507524808, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.00023901332621357712, + "loss": 0.0218, "step": 156850 }, { - "epoch": 0.79, - "learning_rate": 0.00018129316738223406, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023900943799720563, + "loss": 0.0224, "step": 156860 }, { - "epoch": 0.79, - "learning_rate": 0.00018128559968922005, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.0002390055497808342, + "loss": 0.0215, "step": 156870 }, { - "epoch": 0.79, - "learning_rate": 0.00018127803199620605, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023900166156446271, + "loss": 0.0195, "step": 156880 }, { - "epoch": 0.79, - "learning_rate": 0.00018127046430319204, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023899777334809126, + "loss": 0.0167, "step": 156890 }, { - "epoch": 0.79, - "learning_rate": 0.00018126289661017802, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023899388513171977, + "loss": 0.0191, "step": 156900 }, { - "epoch": 0.79, - "learning_rate": 0.000181255328917164, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023898999691534834, + "loss": 0.0187, "step": 156910 }, { - "epoch": 0.79, - "learning_rate": 0.00018124776122415, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023898610869897685, + "loss": 0.0182, "step": 156920 }, { - "epoch": 0.79, - "learning_rate": 0.000181240193531136, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002389822204826054, + "loss": 0.0212, "step": 156930 }, { - "epoch": 0.79, - "learning_rate": 0.00018123262583812197, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002389783322662339, + "loss": 0.0185, "step": 156940 }, { - "epoch": 0.79, - "learning_rate": 0.00018122505814510798, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023897444404986248, + "loss": 0.0167, "step": 156950 }, { - "epoch": 0.79, - "learning_rate": 0.00018121749045209396, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.000238970555833491, + "loss": 0.0215, "step": 156960 }, { - "epoch": 0.79, - "learning_rate": 0.00018120992275907994, - "loss": 0.0112, + "epoch": 0.41, + "learning_rate": 0.00023896666761711953, + "loss": 0.0166, "step": 156970 }, { - "epoch": 0.79, - "learning_rate": 0.00018120235506606595, - "loss": 0.0101, + "epoch": 0.41, + "learning_rate": 0.00023896277940074805, + "loss": 0.02, "step": 156980 }, { - "epoch": 0.79, - "learning_rate": 0.00018119478737305193, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023895889118437662, + "loss": 0.0134, "step": 156990 }, { - "epoch": 0.79, - "learning_rate": 0.0001811872196800379, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023895500296800516, + "loss": 0.0189, "step": 157000 }, { - "epoch": 0.79, - "eval_cer": 0.9144983973907989, - "eval_loss": 0.009071653708815575, - "eval_runtime": 116.5721, - "eval_samples_per_second": 17.157, - "eval_steps_per_second": 4.289, + "epoch": 0.41, + "eval_cer": 0.8817852649022844, + "eval_loss": 0.013182581402361393, + "eval_runtime": 108.1899, + "eval_samples_per_second": 18.486, + "eval_steps_per_second": 4.622, "step": 157000 }, { - "epoch": 0.79, - "learning_rate": 0.00018117965198702392, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023895111475163367, + "loss": 0.0227, "step": 157010 }, { - "epoch": 0.79, - "learning_rate": 0.0001811720842940099, - "loss": 0.0134, + "epoch": 0.41, + "learning_rate": 0.00023894722653526222, + "loss": 0.0176, "step": 157020 }, { - "epoch": 0.79, - "learning_rate": 0.00018116451660099588, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023894333831889076, + "loss": 0.0164, "step": 157030 }, { - "epoch": 0.79, - "learning_rate": 0.0001811569489079819, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.0002389394501025193, + "loss": 0.0157, "step": 157040 }, { - "epoch": 0.79, - "learning_rate": 0.00018114938121496787, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023893556188614781, + "loss": 0.0199, "step": 157050 }, { - "epoch": 0.79, - "learning_rate": 0.00018114181352195386, - "loss": 0.0166, + "epoch": 0.41, + "learning_rate": 0.00023893167366977636, + "loss": 0.0196, "step": 157060 }, { - "epoch": 0.79, - "learning_rate": 0.00018113424582893984, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023892778545340487, + "loss": 0.0202, "step": 157070 }, { - "epoch": 0.79, - "learning_rate": 0.00018112667813592585, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023892389723703344, + "loss": 0.0184, "step": 157080 }, { - "epoch": 0.79, - "learning_rate": 0.00018111911044291183, - "loss": 0.019, + "epoch": 0.41, + "learning_rate": 0.00023892000902066195, + "loss": 0.0199, "step": 157090 }, { - "epoch": 0.79, - "learning_rate": 0.0001811115427498978, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.0002389161208042905, + "loss": 0.0177, "step": 157100 }, { - "epoch": 0.79, - "learning_rate": 0.00018110397505688382, - "loss": 0.0156, + "epoch": 0.41, + "learning_rate": 0.000238912232587919, + "loss": 0.0224, "step": 157110 }, { - "epoch": 0.79, - "learning_rate": 0.0001810964073638698, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023890834437154758, + "loss": 0.0189, "step": 157120 }, { - "epoch": 0.79, - "learning_rate": 0.00018108883967085578, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.0002389044561551761, + "loss": 0.0179, "step": 157130 }, { - "epoch": 0.79, - "learning_rate": 0.0001810812719778418, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023890056793880463, + "loss": 0.0224, "step": 157140 }, { - "epoch": 0.79, - "learning_rate": 0.00018107370428482777, - "loss": 0.0151, + "epoch": 0.41, + "learning_rate": 0.00023889667972243315, + "loss": 0.0179, "step": 157150 }, { - "epoch": 0.79, - "learning_rate": 0.00018106613659181375, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023889279150606172, + "loss": 0.0199, "step": 157160 }, { - "epoch": 0.79, - "learning_rate": 0.00018105856889879976, - "loss": 0.0154, + "epoch": 0.41, + "learning_rate": 0.00023888890328969026, + "loss": 0.0191, "step": 157170 }, { - "epoch": 0.79, - "learning_rate": 0.00018105100120578574, - "loss": 0.0146, + "epoch": 0.41, + "learning_rate": 0.00023888501507331877, + "loss": 0.0176, "step": 157180 }, { - "epoch": 0.79, - "learning_rate": 0.00018104343351277172, - "loss": 0.0104, + "epoch": 0.41, + "learning_rate": 0.00023888112685694732, + "loss": 0.0238, "step": 157190 }, { - "epoch": 0.79, - "learning_rate": 0.00018103586581975773, - "loss": 0.0094, + "epoch": 0.41, + "learning_rate": 0.00023887723864057586, + "loss": 0.0169, "step": 157200 }, { - "epoch": 0.79, - "learning_rate": 0.0001810282981267437, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.0002388733504242044, + "loss": 0.0201, "step": 157210 }, { - "epoch": 0.79, - "learning_rate": 0.0001810207304337297, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.0002388694622078329, + "loss": 0.0174, "step": 157220 }, { - "epoch": 0.79, - "learning_rate": 0.0001810131627407157, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023886557399146145, + "loss": 0.0202, "step": 157230 }, { - "epoch": 0.79, - "learning_rate": 0.00018100559504770168, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023886168577509, + "loss": 0.0172, "step": 157240 }, { - "epoch": 0.79, - "learning_rate": 0.00018099802735468767, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023885779755871854, + "loss": 0.0188, "step": 157250 }, { - "epoch": 0.79, - "learning_rate": 0.00018099045966167365, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023885390934234705, + "loss": 0.0184, "step": 157260 }, { - "epoch": 0.79, - "learning_rate": 0.00018098289196865966, - "loss": 0.0152, + "epoch": 0.41, + "learning_rate": 0.0002388500211259756, + "loss": 0.0183, "step": 157270 }, { - "epoch": 0.79, - "learning_rate": 0.00018097532427564564, - "loss": 0.0164, + "epoch": 0.41, + "learning_rate": 0.00023884613290960414, + "loss": 0.0225, "step": 157280 }, { - "epoch": 0.79, - "learning_rate": 0.00018096775658263162, - "loss": 0.0145, + "epoch": 0.41, + "learning_rate": 0.00023884224469323268, + "loss": 0.018, "step": 157290 }, { - "epoch": 0.79, - "learning_rate": 0.00018096018888961763, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.0002388383564768612, + "loss": 0.0205, "step": 157300 }, { - "epoch": 0.79, - "learning_rate": 0.0001809526211966036, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023883446826048973, + "loss": 0.021, "step": 157310 }, { - "epoch": 0.79, - "learning_rate": 0.0001809450535035896, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023883058004411825, + "loss": 0.0163, "step": 157320 }, { - "epoch": 0.79, - "learning_rate": 0.0001809374858105756, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.00023882669182774682, + "loss": 0.0182, "step": 157330 }, { - "epoch": 0.79, - "learning_rate": 0.00018092991811756158, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023882280361137536, + "loss": 0.0161, "step": 157340 }, { - "epoch": 0.79, - "learning_rate": 0.00018092235042454756, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023881891539500387, + "loss": 0.0206, "step": 157350 }, { - "epoch": 0.79, - "learning_rate": 0.00018091478273153357, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002388150271786324, + "loss": 0.0166, "step": 157360 }, { - "epoch": 0.79, - "learning_rate": 0.00018090721503851955, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023881113896226096, + "loss": 0.0212, "step": 157370 }, { - "epoch": 0.79, - "learning_rate": 0.00018089964734550553, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002388072507458895, + "loss": 0.0132, "step": 157380 }, { - "epoch": 0.79, - "learning_rate": 0.00018089207965249154, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.000238803362529518, + "loss": 0.0197, "step": 157390 }, { - "epoch": 0.79, - "learning_rate": 0.00018088451195947752, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023879947431314655, + "loss": 0.0178, "step": 157400 }, { - "epoch": 0.79, - "learning_rate": 0.0001808769442664635, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.0002387955860967751, + "loss": 0.0192, "step": 157410 }, { - "epoch": 0.79, - "learning_rate": 0.00018086937657344949, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023879169788040364, + "loss": 0.018, "step": 157420 }, { - "epoch": 0.79, - "learning_rate": 0.0001808618088804355, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023878780966403215, + "loss": 0.0172, "step": 157430 }, { - "epoch": 0.79, - "learning_rate": 0.00018085424118742148, - "loss": 0.0085, + "epoch": 0.41, + "learning_rate": 0.0002387839214476607, + "loss": 0.0158, "step": 157440 }, { - "epoch": 0.79, - "learning_rate": 0.00018084667349440746, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023878003323128924, + "loss": 0.0231, "step": 157450 }, { - "epoch": 0.79, - "learning_rate": 0.00018083910580139347, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023877614501491778, + "loss": 0.0205, "step": 157460 }, { - "epoch": 0.79, - "learning_rate": 0.00018083153810837945, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.0002387722567985463, + "loss": 0.0174, "step": 157470 }, { - "epoch": 0.79, - "learning_rate": 0.00018082397041536543, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023876836858217483, + "loss": 0.0153, "step": 157480 }, { - "epoch": 0.79, - "learning_rate": 0.00018081640272235144, - "loss": 0.0103, - "step": 157490 + "epoch": 0.41, + "learning_rate": 0.0002387644803658034, + "loss": 0.0176, + "step": 157490 }, { - "epoch": 0.79, - "learning_rate": 0.00018080883502933742, - "loss": 0.0204, + "epoch": 0.41, + "learning_rate": 0.00023876059214943192, + "loss": 0.0184, "step": 157500 }, { - "epoch": 0.79, - "learning_rate": 0.0001808012673363234, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023875670393306046, + "loss": 0.0207, "step": 157510 }, { - "epoch": 0.79, - "learning_rate": 0.0001807936996433094, - "loss": 0.0155, + "epoch": 0.41, + "learning_rate": 0.00023875281571668897, + "loss": 0.0201, "step": 157520 }, { - "epoch": 0.79, - "learning_rate": 0.0001807861319502954, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.00023874892750031754, + "loss": 0.0188, "step": 157530 }, { - "epoch": 0.79, - "learning_rate": 0.00018077856425728137, - "loss": 0.0102, + "epoch": 0.41, + "learning_rate": 0.00023874503928394606, + "loss": 0.0216, "step": 157540 }, { - "epoch": 0.79, - "learning_rate": 0.00018077099656426738, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002387411510675746, + "loss": 0.02, "step": 157550 }, { - "epoch": 0.79, - "learning_rate": 0.00018076342887125336, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.0002387372628512031, + "loss": 0.0213, "step": 157560 }, { - "epoch": 0.79, - "learning_rate": 0.00018075586117823934, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.00023873337463483165, + "loss": 0.0187, "step": 157570 }, { - "epoch": 0.8, - "learning_rate": 0.00018074829348522532, - "loss": 0.0114, + "epoch": 0.41, + "learning_rate": 0.0002387294864184602, + "loss": 0.0194, "step": 157580 }, { - "epoch": 0.8, - "learning_rate": 0.00018074072579221133, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023872559820208874, + "loss": 0.0166, "step": 157590 }, { - "epoch": 0.8, - "learning_rate": 0.00018073315809919731, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023872170998571725, + "loss": 0.0144, "step": 157600 }, { - "epoch": 0.8, - "learning_rate": 0.0001807255904061833, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002387178217693458, + "loss": 0.0174, "step": 157610 }, { - "epoch": 0.8, - "learning_rate": 0.0001807180227131693, - "loss": 0.0169, + "epoch": 0.41, + "learning_rate": 0.00023871393355297433, + "loss": 0.0212, "step": 157620 }, { - "epoch": 0.8, - "learning_rate": 0.00018071045502015529, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023871004533660288, + "loss": 0.0164, "step": 157630 }, { - "epoch": 0.8, - "learning_rate": 0.00018070288732714127, - "loss": 0.0102, + "epoch": 0.41, + "learning_rate": 0.0002387061571202314, + "loss": 0.0162, "step": 157640 }, { - "epoch": 0.8, - "learning_rate": 0.00018069531963412728, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023870226890385993, + "loss": 0.0216, "step": 157650 }, { - "epoch": 0.8, - "learning_rate": 0.00018068775194111326, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.0002386983806874885, + "loss": 0.022, "step": 157660 }, { - "epoch": 0.8, - "learning_rate": 0.00018068018424809924, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.00023869449247111702, + "loss": 0.0192, "step": 157670 }, { - "epoch": 0.8, - "learning_rate": 0.00018067261655508525, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.00023869060425474553, + "loss": 0.0206, "step": 157680 }, { - "epoch": 0.8, - "learning_rate": 0.00018066504886207123, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023868671603837407, + "loss": 0.0154, "step": 157690 }, { - "epoch": 0.8, - "learning_rate": 0.0001806574811690572, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023868282782200264, + "loss": 0.0189, "step": 157700 }, { - "epoch": 0.8, - "learning_rate": 0.00018064991347604322, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023867893960563116, + "loss": 0.0197, "step": 157710 }, { - "epoch": 0.8, - "learning_rate": 0.0001806423457830292, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.0002386750513892597, + "loss": 0.0236, "step": 157720 }, { - "epoch": 0.8, - "learning_rate": 0.00018063477809001518, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002386711631728882, + "loss": 0.0222, "step": 157730 }, { - "epoch": 0.8, - "learning_rate": 0.00018062721039700114, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.00023866727495651678, + "loss": 0.0198, "step": 157740 }, { - "epoch": 0.8, - "learning_rate": 0.00018061964270398714, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002386633867401453, + "loss": 0.017, "step": 157750 }, { - "epoch": 0.8, - "learning_rate": 0.00018061207501097313, - "loss": 0.0114, + "epoch": 0.41, + "learning_rate": 0.00023865949852377384, + "loss": 0.0186, "step": 157760 }, { - "epoch": 0.8, - "learning_rate": 0.0001806045073179591, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023865561030740235, + "loss": 0.0165, "step": 157770 }, { - "epoch": 0.8, - "learning_rate": 0.00018059693962494512, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023865172209103092, + "loss": 0.0185, "step": 157780 }, { - "epoch": 0.8, - "learning_rate": 0.0001805893719319311, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023864783387465943, + "loss": 0.0183, "step": 157790 }, { - "epoch": 0.8, - "learning_rate": 0.00018058180423891708, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023864394565828798, + "loss": 0.0207, "step": 157800 }, { - "epoch": 0.8, - "learning_rate": 0.00018057423654590306, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.0002386400574419165, + "loss": 0.0185, "step": 157810 }, { - "epoch": 0.8, - "learning_rate": 0.00018056666885288907, - "loss": 0.0151, + "epoch": 0.41, + "learning_rate": 0.00023863616922554503, + "loss": 0.0201, "step": 157820 }, { - "epoch": 0.8, - "learning_rate": 0.00018055910115987505, - "loss": 0.0102, + "epoch": 0.41, + "learning_rate": 0.00023863228100917357, + "loss": 0.0191, "step": 157830 }, { - "epoch": 0.8, - "learning_rate": 0.00018055153346686103, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023862839279280212, + "loss": 0.0209, "step": 157840 }, { - "epoch": 0.8, - "learning_rate": 0.00018054396577384704, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023862450457643063, + "loss": 0.0208, "step": 157850 }, { - "epoch": 0.8, - "learning_rate": 0.00018053639808083302, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023862061636005917, + "loss": 0.0238, "step": 157860 }, { - "epoch": 0.8, - "learning_rate": 0.000180528830387819, - "loss": 0.0152, + "epoch": 0.41, + "learning_rate": 0.00023861672814368774, + "loss": 0.0196, "step": 157870 }, { - "epoch": 0.8, - "learning_rate": 0.000180521262694805, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023861283992731625, + "loss": 0.0176, "step": 157880 }, { - "epoch": 0.8, - "learning_rate": 0.000180513695001791, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.0002386089517109448, + "loss": 0.0159, "step": 157890 }, { - "epoch": 0.8, - "learning_rate": 0.00018050612730877697, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.0002386050634945733, + "loss": 0.0198, "step": 157900 }, { - "epoch": 0.8, - "learning_rate": 0.00018049855961576298, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023860117527820188, + "loss": 0.0195, "step": 157910 }, { - "epoch": 0.8, - "learning_rate": 0.00018049099192274896, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.0002385972870618304, + "loss": 0.0178, "step": 157920 }, { - "epoch": 0.8, - "learning_rate": 0.00018048342422973495, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.00023859339884545894, + "loss": 0.021, "step": 157930 }, { - "epoch": 0.8, - "learning_rate": 0.00018047585653672095, - "loss": 0.0112, + "epoch": 0.41, + "learning_rate": 0.00023858951062908745, + "loss": 0.018, "step": 157940 }, { - "epoch": 0.8, - "learning_rate": 0.00018046828884370694, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023858562241271602, + "loss": 0.0194, "step": 157950 }, { - "epoch": 0.8, - "learning_rate": 0.00018046072115069292, - "loss": 0.01, + "epoch": 0.41, + "learning_rate": 0.00023858173419634453, + "loss": 0.0243, "step": 157960 }, { - "epoch": 0.8, - "learning_rate": 0.0001804531534576789, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023857784597997308, + "loss": 0.0199, "step": 157970 }, { - "epoch": 0.8, - "learning_rate": 0.0001804455857646649, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.0002385739577636016, + "loss": 0.0198, "step": 157980 }, { - "epoch": 0.8, - "learning_rate": 0.0001804380180716509, - "loss": 0.0087, + "epoch": 0.41, + "learning_rate": 0.00023857006954723016, + "loss": 0.0185, "step": 157990 }, { - "epoch": 0.8, - "learning_rate": 0.00018043045037863687, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023856618133085867, + "loss": 0.0172, "step": 158000 }, { - "epoch": 0.8, - "eval_cer": 0.914447936792278, - "eval_loss": 0.008715854957699776, - "eval_runtime": 116.7633, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.41, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.012989984825253487, + "eval_runtime": 107.5587, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 158000 }, { - "epoch": 0.8, - "learning_rate": 0.00018042288268562288, - "loss": 0.0173, + "epoch": 0.41, + "learning_rate": 0.00023856229311448721, + "loss": 0.0186, "step": 158010 }, { - "epoch": 0.8, - "learning_rate": 0.00018041531499260886, - "loss": 0.0147, + "epoch": 0.41, + "learning_rate": 0.00023855840489811573, + "loss": 0.0204, "step": 158020 }, { - "epoch": 0.8, - "learning_rate": 0.00018040774729959484, - "loss": 0.0137, + "epoch": 0.41, + "learning_rate": 0.0002385545166817443, + "loss": 0.0228, "step": 158030 }, { - "epoch": 0.8, - "learning_rate": 0.00018040017960658085, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023855062846537284, + "loss": 0.0206, "step": 158040 }, { - "epoch": 0.8, - "learning_rate": 0.00018039261191356683, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023854674024900135, + "loss": 0.0199, "step": 158050 }, { - "epoch": 0.8, - "learning_rate": 0.0001803850442205528, - "loss": 0.0181, + "epoch": 0.41, + "learning_rate": 0.0002385428520326299, + "loss": 0.018, "step": 158060 }, { - "epoch": 0.8, - "learning_rate": 0.00018037747652753882, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.0002385389638162584, + "loss": 0.0179, "step": 158070 }, { - "epoch": 0.8, - "learning_rate": 0.0001803699088345248, - "loss": 0.0106, + "epoch": 0.41, + "learning_rate": 0.00023853507559988698, + "loss": 0.0219, "step": 158080 }, { - "epoch": 0.8, - "learning_rate": 0.00018036234114151078, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.0002385311873835155, + "loss": 0.0166, "step": 158090 }, { - "epoch": 0.8, - "learning_rate": 0.0001803547734484968, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023852729916714404, + "loss": 0.023, "step": 158100 }, { - "epoch": 0.8, - "learning_rate": 0.00018034720575548277, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023852341095077255, + "loss": 0.0187, "step": 158110 }, { - "epoch": 0.8, - "learning_rate": 0.00018033963806246876, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023851952273440112, + "loss": 0.0212, "step": 158120 }, { - "epoch": 0.8, - "learning_rate": 0.00018033207036945476, - "loss": 0.0159, + "epoch": 0.41, + "learning_rate": 0.00023851563451802963, + "loss": 0.0173, "step": 158130 }, { - "epoch": 0.8, - "learning_rate": 0.00018032450267644075, - "loss": 0.0092, + "epoch": 0.41, + "learning_rate": 0.00023851174630165817, + "loss": 0.0174, "step": 158140 }, { - "epoch": 0.8, - "learning_rate": 0.00018031693498342673, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.0002385078580852867, + "loss": 0.0189, "step": 158150 }, { - "epoch": 0.8, - "learning_rate": 0.0001803093672904127, - "loss": 0.0155, + "epoch": 0.41, + "learning_rate": 0.00023850396986891526, + "loss": 0.0247, "step": 158160 }, { - "epoch": 0.8, - "learning_rate": 0.00018030179959739872, - "loss": 0.0114, + "epoch": 0.41, + "learning_rate": 0.00023850008165254377, + "loss": 0.0192, "step": 158170 }, { - "epoch": 0.8, - "learning_rate": 0.0001802942319043847, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023849619343617231, + "loss": 0.0169, "step": 158180 }, { - "epoch": 0.8, - "learning_rate": 0.00018028666421137068, - "loss": 0.0101, + "epoch": 0.41, + "learning_rate": 0.00023849230521980083, + "loss": 0.018, "step": 158190 }, { - "epoch": 0.8, - "learning_rate": 0.0001802790965183567, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.0002384884170034294, + "loss": 0.0185, "step": 158200 }, { - "epoch": 0.8, - "learning_rate": 0.00018027152882534267, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.00023848452878705794, + "loss": 0.0306, "step": 158210 }, { - "epoch": 0.8, - "learning_rate": 0.00018026396113232865, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023848064057068645, + "loss": 0.0165, "step": 158220 }, { - "epoch": 0.8, - "learning_rate": 0.00018025639343931466, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023847675235431497, + "loss": 0.0181, "step": 158230 }, { - "epoch": 0.8, - "learning_rate": 0.00018024882574630064, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023847286413794354, + "loss": 0.0169, "step": 158240 }, { - "epoch": 0.8, - "learning_rate": 0.00018024125805328662, - "loss": 0.0151, + "epoch": 0.41, + "learning_rate": 0.00023846897592157208, + "loss": 0.0166, "step": 158250 }, { - "epoch": 0.8, - "learning_rate": 0.00018023369036027263, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.0002384650877052006, + "loss": 0.0196, "step": 158260 }, { - "epoch": 0.8, - "learning_rate": 0.0001802261226672586, - "loss": 0.0101, + "epoch": 0.41, + "learning_rate": 0.00023846119948882913, + "loss": 0.018, "step": 158270 }, { - "epoch": 0.8, - "learning_rate": 0.0001802185549742446, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023845731127245768, + "loss": 0.0188, "step": 158280 }, { - "epoch": 0.8, - "learning_rate": 0.0001802109872812306, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023845342305608622, + "loss": 0.0201, "step": 158290 }, { - "epoch": 0.8, - "learning_rate": 0.00018020341958821658, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.00023844953483971473, + "loss": 0.019, "step": 158300 }, { - "epoch": 0.8, - "learning_rate": 0.00018019585189520257, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023844564662334327, + "loss": 0.0227, "step": 158310 }, { - "epoch": 0.8, - "learning_rate": 0.00018018828420218855, - "loss": 0.0156, + "epoch": 0.41, + "learning_rate": 0.0002384417584069718, + "loss": 0.0196, "step": 158320 }, { - "epoch": 0.8, - "learning_rate": 0.00018018071650917456, - "loss": 0.018, + "epoch": 0.41, + "learning_rate": 0.00023843787019060036, + "loss": 0.0229, "step": 158330 }, { - "epoch": 0.8, - "learning_rate": 0.00018017314881616054, - "loss": 0.0102, + "epoch": 0.41, + "learning_rate": 0.00023843398197422887, + "loss": 0.022, "step": 158340 }, { - "epoch": 0.8, - "learning_rate": 0.00018016558112314652, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023843009375785741, + "loss": 0.0216, "step": 158350 }, { - "epoch": 0.8, - "learning_rate": 0.00018015801343013253, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023842620554148593, + "loss": 0.0202, "step": 158360 }, { - "epoch": 0.8, - "learning_rate": 0.0001801504457371185, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002384223173251145, + "loss": 0.0154, "step": 158370 }, { - "epoch": 0.8, - "learning_rate": 0.0001801428780441045, - "loss": 0.0158, + "epoch": 0.41, + "learning_rate": 0.00023841842910874304, + "loss": 0.0174, "step": 158380 }, { - "epoch": 0.8, - "learning_rate": 0.0001801353103510905, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023841454089237155, + "loss": 0.0209, "step": 158390 }, { - "epoch": 0.8, - "learning_rate": 0.00018012774265807648, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023841065267600007, + "loss": 0.0197, "step": 158400 }, { - "epoch": 0.8, - "learning_rate": 0.00018012017496506246, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023840676445962864, + "loss": 0.0192, "step": 158410 }, { - "epoch": 0.8, - "learning_rate": 0.00018011260727204847, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023840287624325718, + "loss": 0.0189, "step": 158420 }, { - "epoch": 0.8, - "learning_rate": 0.00018010503957903445, - "loss": 0.0126, + "epoch": 0.41, + "learning_rate": 0.0002383989880268857, + "loss": 0.0226, "step": 158430 }, { - "epoch": 0.8, - "learning_rate": 0.00018009747188602043, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023839509981051423, + "loss": 0.0188, "step": 158440 }, { - "epoch": 0.8, - "learning_rate": 0.00018008990419300644, - "loss": 0.0099, + "epoch": 0.41, + "learning_rate": 0.00023839121159414278, + "loss": 0.0215, "step": 158450 }, { - "epoch": 0.8, - "learning_rate": 0.00018008233649999242, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023838732337777132, + "loss": 0.0241, "step": 158460 }, { - "epoch": 0.8, - "learning_rate": 0.0001800747688069784, - "loss": 0.0148, + "epoch": 0.41, + "learning_rate": 0.00023838343516139983, + "loss": 0.0193, "step": 158470 }, { - "epoch": 0.8, - "learning_rate": 0.00018006720111396439, - "loss": 0.0158, + "epoch": 0.41, + "learning_rate": 0.00023837954694502837, + "loss": 0.02, "step": 158480 }, { - "epoch": 0.8, - "learning_rate": 0.0001800596334209504, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023837565872865692, + "loss": 0.0174, "step": 158490 }, { - "epoch": 0.8, - "learning_rate": 0.00018005206572793638, - "loss": 0.0093, + "epoch": 0.41, + "learning_rate": 0.00023837177051228546, + "loss": 0.0202, "step": 158500 }, { - "epoch": 0.8, - "learning_rate": 0.00018004449803492236, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023836788229591397, + "loss": 0.0269, "step": 158510 }, { - "epoch": 0.8, - "learning_rate": 0.00018003693034190837, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.0002383639940795425, + "loss": 0.0192, "step": 158520 }, { - "epoch": 0.8, - "learning_rate": 0.00018002936264889435, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023836010586317108, + "loss": 0.0182, "step": 158530 }, { - "epoch": 0.8, - "learning_rate": 0.00018002179495588033, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.0002383562176467996, + "loss": 0.0193, "step": 158540 }, { - "epoch": 0.8, - "learning_rate": 0.00018001422726286634, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.0002383523294304281, + "loss": 0.0182, "step": 158550 }, { - "epoch": 0.8, - "learning_rate": 0.00018000665956985232, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023834844121405665, + "loss": 0.0175, "step": 158560 }, { - "epoch": 0.8, - "learning_rate": 0.0001799990918768383, - "loss": 0.0103, + "epoch": 0.41, + "learning_rate": 0.00023834455299768517, + "loss": 0.0236, "step": 158570 }, { - "epoch": 0.8, - "learning_rate": 0.0001799915241838243, - "loss": 0.0095, + "epoch": 0.41, + "learning_rate": 0.00023834066478131374, + "loss": 0.0223, "step": 158580 }, { - "epoch": 0.8, - "learning_rate": 0.0001799839564908103, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023833677656494228, + "loss": 0.0136, "step": 158590 }, { - "epoch": 0.8, - "learning_rate": 0.00017997638879779627, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.0002383328883485708, + "loss": 0.0177, "step": 158600 }, { - "epoch": 0.8, - "learning_rate": 0.00017996882110478228, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023832900013219933, + "loss": 0.017, "step": 158610 }, { - "epoch": 0.8, - "learning_rate": 0.00017996125341176826, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.00023832511191582788, + "loss": 0.0189, "step": 158620 }, { - "epoch": 0.8, - "learning_rate": 0.00017995368571875424, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.00023832122369945642, + "loss": 0.0231, "step": 158630 }, { - "epoch": 0.8, - "learning_rate": 0.00017994611802574025, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023831733548308493, + "loss": 0.02, "step": 158640 }, { - "epoch": 0.8, - "learning_rate": 0.00017993855033272623, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023831344726671347, + "loss": 0.0169, "step": 158650 }, { - "epoch": 0.8, - "learning_rate": 0.00017993098263971221, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023830955905034201, + "loss": 0.017, "step": 158660 }, { - "epoch": 0.8, - "learning_rate": 0.0001799234149466982, - "loss": 0.0101, + "epoch": 0.41, + "learning_rate": 0.00023830567083397056, + "loss": 0.0187, "step": 158670 }, { - "epoch": 0.8, - "learning_rate": 0.0001799158472536842, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023830178261759907, + "loss": 0.0184, "step": 158680 }, { - "epoch": 0.8, - "learning_rate": 0.00017990827956067019, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002382978944012276, + "loss": 0.0189, "step": 158690 }, { - "epoch": 0.8, - "learning_rate": 0.00017990071186765617, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023829400618485618, + "loss": 0.0228, "step": 158700 }, { - "epoch": 0.8, - "learning_rate": 0.00017989314417464218, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.0002382901179684847, + "loss": 0.0247, "step": 158710 }, { - "epoch": 0.8, - "learning_rate": 0.00017988557648162816, - "loss": 0.0103, + "epoch": 0.41, + "learning_rate": 0.0002382862297521132, + "loss": 0.0171, "step": 158720 }, { - "epoch": 0.8, - "learning_rate": 0.00017987800878861414, - "loss": 0.0103, + "epoch": 0.41, + "learning_rate": 0.00023828234153574175, + "loss": 0.0226, "step": 158730 }, { - "epoch": 0.8, - "learning_rate": 0.00017987044109560015, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023827845331937032, + "loss": 0.0164, "step": 158740 }, { - "epoch": 0.8, - "learning_rate": 0.00017986287340258613, - "loss": 0.0149, + "epoch": 0.41, + "learning_rate": 0.00023827456510299884, + "loss": 0.0216, "step": 158750 }, { - "epoch": 0.8, - "learning_rate": 0.0001798553057095721, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.00023827067688662738, + "loss": 0.0167, "step": 158760 }, { - "epoch": 0.8, - "learning_rate": 0.00017984773801655812, - "loss": 0.0097, + "epoch": 0.41, + "learning_rate": 0.0002382667886702559, + "loss": 0.0178, "step": 158770 }, { - "epoch": 0.8, - "learning_rate": 0.0001798401703235441, - "loss": 0.0136, + "epoch": 0.41, + "learning_rate": 0.00023826290045388446, + "loss": 0.0188, "step": 158780 }, { - "epoch": 0.8, - "learning_rate": 0.00017983260263053008, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023825901223751297, + "loss": 0.021, "step": 158790 }, { - "epoch": 0.8, - "learning_rate": 0.0001798250349375161, - "loss": 0.0104, + "epoch": 0.41, + "learning_rate": 0.00023825512402114152, + "loss": 0.0195, "step": 158800 }, { - "epoch": 0.8, - "learning_rate": 0.00017981746724450207, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023825123580477003, + "loss": 0.0191, "step": 158810 }, { - "epoch": 0.8, - "learning_rate": 0.00017980989955148805, - "loss": 0.0171, + "epoch": 0.41, + "learning_rate": 0.00023824734758839857, + "loss": 0.0184, "step": 158820 }, { - "epoch": 0.8, - "learning_rate": 0.00017980233185847403, - "loss": 0.0094, + "epoch": 0.41, + "learning_rate": 0.00023824345937202711, + "loss": 0.0227, "step": 158830 }, { - "epoch": 0.8, - "learning_rate": 0.00017979476416546004, - "loss": 0.0098, + "epoch": 0.41, + "learning_rate": 0.00023823957115565566, + "loss": 0.02, "step": 158840 }, { - "epoch": 0.8, - "learning_rate": 0.00017978719647244602, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023823568293928417, + "loss": 0.0152, "step": 158850 }, { - "epoch": 0.8, - "learning_rate": 0.000179779628779432, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002382317947229127, + "loss": 0.0198, "step": 158860 }, { - "epoch": 0.8, - "learning_rate": 0.00017977206108641801, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023822790650654125, + "loss": 0.0194, "step": 158870 }, { - "epoch": 0.8, - "learning_rate": 0.000179764493393404, - "loss": 0.0169, + "epoch": 0.41, + "learning_rate": 0.0002382240182901698, + "loss": 0.0194, "step": 158880 }, { - "epoch": 0.8, - "learning_rate": 0.00017975692570038998, - "loss": 0.0093, + "epoch": 0.41, + "learning_rate": 0.0002382201300737983, + "loss": 0.0231, "step": 158890 }, { - "epoch": 0.8, - "learning_rate": 0.00017974935800737599, - "loss": 0.0186, + "epoch": 0.41, + "learning_rate": 0.00023821624185742685, + "loss": 0.0195, "step": 158900 }, { - "epoch": 0.8, - "learning_rate": 0.00017974179031436197, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.00023821235364105542, + "loss": 0.0188, "step": 158910 }, { - "epoch": 0.8, - "learning_rate": 0.00017973422262134795, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023820846542468393, + "loss": 0.0182, "step": 158920 }, { - "epoch": 0.8, - "learning_rate": 0.00017972665492833396, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023820457720831248, + "loss": 0.0182, "step": 158930 }, { - "epoch": 0.8, - "learning_rate": 0.00017971908723531994, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.000238200688991941, + "loss": 0.018, "step": 158940 }, { - "epoch": 0.8, - "learning_rate": 0.00017971151954230592, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023819680077556956, + "loss": 0.0177, "step": 158950 }, { - "epoch": 0.8, - "learning_rate": 0.00017970395184929193, - "loss": 0.0098, + "epoch": 0.41, + "learning_rate": 0.00023819291255919807, + "loss": 0.0155, "step": 158960 }, { - "epoch": 0.8, - "learning_rate": 0.0001796963841562779, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023818902434282662, + "loss": 0.0174, "step": 158970 }, { - "epoch": 0.8, - "learning_rate": 0.0001796888164632639, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023818513612645513, + "loss": 0.018, "step": 158980 }, { - "epoch": 0.8, - "learning_rate": 0.00017968124877024987, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002381812479100837, + "loss": 0.0165, "step": 158990 }, { - "epoch": 0.8, - "learning_rate": 0.00017967368107723585, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.0002381773596937122, + "loss": 0.0168, "step": 159000 }, { - "epoch": 0.8, - "eval_cer": 0.9144945158062973, - "eval_loss": 0.00861455500125885, - "eval_runtime": 116.6046, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.41, + "eval_cer": 0.8817796663545476, + "eval_loss": 0.013127253390848637, + "eval_runtime": 107.1652, + "eval_samples_per_second": 18.663, + "eval_steps_per_second": 4.666, "step": 159000 }, { - "epoch": 0.8, - "learning_rate": 0.00017966611338422184, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023817347147734076, + "loss": 0.0213, "step": 159010 }, { - "epoch": 0.8, - "learning_rate": 0.00017965854569120782, - "loss": 0.0118, + "epoch": 0.41, + "learning_rate": 0.00023816958326096927, + "loss": 0.0207, "step": 159020 }, { - "epoch": 0.8, - "learning_rate": 0.00017965097799819383, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023816569504459784, + "loss": 0.0185, "step": 159030 }, { - "epoch": 0.8, - "learning_rate": 0.0001796434103051798, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023816180682822635, + "loss": 0.02, "step": 159040 }, { - "epoch": 0.8, - "learning_rate": 0.0001796358426121658, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.0002381579186118549, + "loss": 0.0171, "step": 159050 }, { - "epoch": 0.8, - "learning_rate": 0.00017962827491915177, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.0002381540303954834, + "loss": 0.0232, "step": 159060 }, { - "epoch": 0.8, - "learning_rate": 0.00017962070722613778, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023815014217911195, + "loss": 0.0184, "step": 159070 }, { - "epoch": 0.8, - "learning_rate": 0.00017961313953312376, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023814625396274052, + "loss": 0.0252, "step": 159080 }, { - "epoch": 0.8, - "learning_rate": 0.00017960557184010974, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.00023814236574636903, + "loss": 0.0235, "step": 159090 }, { - "epoch": 0.8, - "learning_rate": 0.00017959800414709575, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023813847752999758, + "loss": 0.0163, "step": 159100 }, { - "epoch": 0.8, - "learning_rate": 0.00017959043645408173, - "loss": 0.0098, + "epoch": 0.41, + "learning_rate": 0.0002381345893136261, + "loss": 0.0183, "step": 159110 }, { - "epoch": 0.8, - "learning_rate": 0.0001795828687610677, - "loss": 0.0104, + "epoch": 0.41, + "learning_rate": 0.00023813070109725466, + "loss": 0.0173, "step": 159120 }, { - "epoch": 0.8, - "learning_rate": 0.00017957530106805372, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023812681288088317, + "loss": 0.0184, "step": 159130 }, { - "epoch": 0.8, - "learning_rate": 0.0001795677333750397, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023812292466451172, + "loss": 0.0185, "step": 159140 }, { - "epoch": 0.8, - "learning_rate": 0.00017956016568202568, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023811903644814023, + "loss": 0.0217, "step": 159150 }, { - "epoch": 0.8, - "learning_rate": 0.0001795525979890117, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.0002381151482317688, + "loss": 0.0158, "step": 159160 }, { - "epoch": 0.8, - "learning_rate": 0.00017954503029599767, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.0002381112600153973, + "loss": 0.0208, "step": 159170 }, { - "epoch": 0.8, - "learning_rate": 0.00017953746260298366, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.00023810737179902585, + "loss": 0.0368, "step": 159180 }, { - "epoch": 0.8, - "learning_rate": 0.00017952989490996966, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023810348358265437, + "loss": 0.0206, "step": 159190 }, { - "epoch": 0.8, - "learning_rate": 0.00017952232721695565, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.00023809959536628294, + "loss": 0.0174, "step": 159200 }, { - "epoch": 0.8, - "learning_rate": 0.00017951475952394163, - "loss": 0.0191, + "epoch": 0.41, + "learning_rate": 0.00023809570714991145, + "loss": 0.0176, "step": 159210 }, { - "epoch": 0.8, - "learning_rate": 0.0001795071918309276, - "loss": 0.0091, + "epoch": 0.41, + "learning_rate": 0.00023809181893354, + "loss": 0.0194, "step": 159220 }, { - "epoch": 0.8, - "learning_rate": 0.00017949962413791362, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002380879307171685, + "loss": 0.024, "step": 159230 }, { - "epoch": 0.8, - "learning_rate": 0.0001794920564448996, - "loss": 0.0126, + "epoch": 0.41, + "learning_rate": 0.00023808404250079708, + "loss": 0.0173, "step": 159240 }, { - "epoch": 0.8, - "learning_rate": 0.00017948448875188558, - "loss": 0.012, + "epoch": 0.41, + "learning_rate": 0.00023808015428442562, + "loss": 0.0232, "step": 159250 }, { - "epoch": 0.8, - "learning_rate": 0.0001794769210588716, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.00023807626606805413, + "loss": 0.0241, "step": 159260 }, { - "epoch": 0.8, - "learning_rate": 0.00017946935336585757, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.00023807237785168265, + "loss": 0.0184, "step": 159270 }, { - "epoch": 0.8, - "learning_rate": 0.00017946178567284355, - "loss": 0.0193, + "epoch": 0.41, + "learning_rate": 0.00023806848963531122, + "loss": 0.0199, "step": 159280 }, { - "epoch": 0.8, - "learning_rate": 0.00017945421797982956, - "loss": 0.0141, + "epoch": 0.41, + "learning_rate": 0.00023806460141893976, + "loss": 0.0239, "step": 159290 }, { - "epoch": 0.8, - "learning_rate": 0.00017944665028681554, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023806071320256827, + "loss": 0.0284, "step": 159300 }, { - "epoch": 0.8, - "learning_rate": 0.00017943908259380152, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023805682498619681, + "loss": 0.0208, "step": 159310 }, { - "epoch": 0.8, - "learning_rate": 0.00017943151490078753, - "loss": 0.0114, + "epoch": 0.41, + "learning_rate": 0.00023805293676982533, + "loss": 0.0183, "step": 159320 }, { - "epoch": 0.8, - "learning_rate": 0.0001794239472077735, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.0002380490485534539, + "loss": 0.0159, "step": 159330 }, { - "epoch": 0.8, - "learning_rate": 0.0001794163795147595, - "loss": 0.02, + "epoch": 0.41, + "learning_rate": 0.0002380451603370824, + "loss": 0.0157, "step": 159340 }, { - "epoch": 0.8, - "learning_rate": 0.0001794088118217455, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023804127212071095, + "loss": 0.018, "step": 159350 }, { - "epoch": 0.8, - "learning_rate": 0.00017940124412873148, - "loss": 0.0158, + "epoch": 0.41, + "learning_rate": 0.00023803738390433947, + "loss": 0.0186, "step": 159360 }, { - "epoch": 0.8, - "learning_rate": 0.00017939367643571747, - "loss": 0.0125, + "epoch": 0.41, + "learning_rate": 0.00023803349568796804, + "loss": 0.0165, "step": 159370 }, { - "epoch": 0.8, - "learning_rate": 0.00017938610874270345, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023802960747159655, + "loss": 0.0152, "step": 159380 }, { - "epoch": 0.8, - "learning_rate": 0.00017937854104968946, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.0002380257192552251, + "loss": 0.0148, "step": 159390 }, { - "epoch": 0.8, - "learning_rate": 0.00017937097335667544, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.0002380218310388536, + "loss": 0.0193, "step": 159400 }, { - "epoch": 0.8, - "learning_rate": 0.00017936340566366142, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023801794282248218, + "loss": 0.0163, "step": 159410 }, { - "epoch": 0.8, - "learning_rate": 0.00017935583797064743, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.0002380140546061107, + "loss": 0.0199, "step": 159420 }, { - "epoch": 0.8, - "learning_rate": 0.0001793482702776334, - "loss": 0.014, + "epoch": 0.41, + "learning_rate": 0.00023801016638973923, + "loss": 0.015, "step": 159430 }, { - "epoch": 0.8, - "learning_rate": 0.0001793407025846194, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.00023800627817336775, + "loss": 0.0207, "step": 159440 }, { - "epoch": 0.8, - "learning_rate": 0.0001793331348916054, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.00023800238995699632, + "loss": 0.014, "step": 159450 }, { - "epoch": 0.8, - "learning_rate": 0.00017932556719859138, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023799850174062486, + "loss": 0.0194, "step": 159460 }, { - "epoch": 0.8, - "learning_rate": 0.00017931799950557736, - "loss": 0.0112, + "epoch": 0.41, + "learning_rate": 0.00023799461352425337, + "loss": 0.0143, "step": 159470 }, { - "epoch": 0.8, - "learning_rate": 0.00017931043181256337, - "loss": 0.0158, + "epoch": 0.41, + "learning_rate": 0.00023799072530788191, + "loss": 0.0255, "step": 159480 }, { - "epoch": 0.8, - "learning_rate": 0.00017930286411954935, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023798683709151046, + "loss": 0.016, "step": 159490 }, { - "epoch": 0.8, - "learning_rate": 0.00017929529642653533, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.000237982948875139, + "loss": 0.0207, "step": 159500 }, { - "epoch": 0.8, - "learning_rate": 0.00017928772873352134, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.0002379790606587675, + "loss": 0.0186, "step": 159510 }, { - "epoch": 0.8, - "learning_rate": 0.00017928016104050732, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023797517244239605, + "loss": 0.0204, "step": 159520 }, { - "epoch": 0.8, - "learning_rate": 0.0001792725933474933, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.0002379712842260246, + "loss": 0.0184, "step": 159530 }, { - "epoch": 0.8, - "learning_rate": 0.0001792650256544793, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.00023796739600965314, + "loss": 0.0167, "step": 159540 }, { - "epoch": 0.8, - "learning_rate": 0.0001792574579614653, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023796350779328165, + "loss": 0.0207, "step": 159550 }, { - "epoch": 0.8, - "learning_rate": 0.00017924989026845128, - "loss": 0.0139, + "epoch": 0.41, + "learning_rate": 0.0002379596195769102, + "loss": 0.022, "step": 159560 }, { - "epoch": 0.81, - "learning_rate": 0.00017924232257543726, - "loss": 0.011, + "epoch": 0.41, + "learning_rate": 0.0002379557313605387, + "loss": 0.0195, "step": 159570 }, { - "epoch": 0.81, - "learning_rate": 0.00017923475488242327, - "loss": 0.0143, + "epoch": 0.41, + "learning_rate": 0.00023795184314416728, + "loss": 0.019, "step": 159580 }, { - "epoch": 0.81, - "learning_rate": 0.00017922718718940925, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.0002379479549277958, + "loss": 0.0175, "step": 159590 }, { - "epoch": 0.81, - "learning_rate": 0.00017921961949639523, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.00023794406671142433, + "loss": 0.0236, "step": 159600 }, { - "epoch": 0.81, - "learning_rate": 0.00017921205180338124, - "loss": 0.0119, + "epoch": 0.41, + "learning_rate": 0.00023794017849505285, + "loss": 0.016, "step": 159610 }, { - "epoch": 0.81, - "learning_rate": 0.00017920448411036722, - "loss": 0.0187, + "epoch": 0.41, + "learning_rate": 0.00023793629027868142, + "loss": 0.0188, "step": 159620 }, { - "epoch": 0.81, - "learning_rate": 0.0001791969164173532, - "loss": 0.0142, + "epoch": 0.41, + "learning_rate": 0.00023793240206230996, + "loss": 0.0188, "step": 159630 }, { - "epoch": 0.81, - "learning_rate": 0.0001791893487243392, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023792851384593847, + "loss": 0.0165, "step": 159640 }, { - "epoch": 0.81, - "learning_rate": 0.0001791817810313252, - "loss": 0.015, + "epoch": 0.41, + "learning_rate": 0.000237924625629567, + "loss": 0.0147, "step": 159650 }, { - "epoch": 0.81, - "learning_rate": 0.00017917421333831117, - "loss": 0.0122, + "epoch": 0.41, + "learning_rate": 0.00023792073741319556, + "loss": 0.019, "step": 159660 }, { - "epoch": 0.81, - "learning_rate": 0.00017916664564529718, - "loss": 0.0115, + "epoch": 0.41, + "learning_rate": 0.0002379168491968241, + "loss": 0.0177, "step": 159670 }, { - "epoch": 0.81, - "learning_rate": 0.00017915907795228316, - "loss": 0.0106, + "epoch": 0.41, + "learning_rate": 0.0002379129609804526, + "loss": 0.0175, "step": 159680 }, { - "epoch": 0.81, - "learning_rate": 0.00017915151025926914, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023790907276408115, + "loss": 0.0189, "step": 159690 }, { - "epoch": 0.81, - "learning_rate": 0.00017914394256625515, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002379051845477097, + "loss": 0.0188, "step": 159700 }, { - "epoch": 0.81, - "learning_rate": 0.00017913637487324113, - "loss": 0.0161, + "epoch": 0.41, + "learning_rate": 0.00023790129633133824, + "loss": 0.0216, "step": 159710 }, { - "epoch": 0.81, - "learning_rate": 0.00017912880718022711, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023789740811496675, + "loss": 0.0199, "step": 159720 }, { - "epoch": 0.81, - "learning_rate": 0.0001791212394872131, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.0002378935198985953, + "loss": 0.0175, "step": 159730 }, { - "epoch": 0.81, - "learning_rate": 0.0001791136717941991, - "loss": 0.0097, + "epoch": 0.41, + "learning_rate": 0.00023788963168222383, + "loss": 0.0207, "step": 159740 }, { - "epoch": 0.81, - "learning_rate": 0.00017910610410118509, - "loss": 0.0126, + "epoch": 0.41, + "learning_rate": 0.00023788574346585238, + "loss": 0.0189, "step": 159750 }, { - "epoch": 0.81, - "learning_rate": 0.00017909853640817107, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.0002378818552494809, + "loss": 0.0194, "step": 159760 }, { - "epoch": 0.81, - "learning_rate": 0.00017909096871515708, - "loss": 0.0107, + "epoch": 0.41, + "learning_rate": 0.00023787796703310943, + "loss": 0.0208, "step": 159770 }, { - "epoch": 0.81, - "learning_rate": 0.00017908340102214306, - "loss": 0.0111, + "epoch": 0.41, + "learning_rate": 0.000237874078816738, + "loss": 0.0177, "step": 159780 }, { - "epoch": 0.81, - "learning_rate": 0.00017907583332912904, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023787019060036651, + "loss": 0.0162, "step": 159790 }, { - "epoch": 0.81, - "learning_rate": 0.00017906826563611505, - "loss": 0.0123, + "epoch": 0.41, + "learning_rate": 0.00023786630238399506, + "loss": 0.021, "step": 159800 }, { - "epoch": 0.81, - "learning_rate": 0.00017906069794310103, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023786241416762357, + "loss": 0.0159, "step": 159810 }, { - "epoch": 0.81, - "learning_rate": 0.000179053130250087, - "loss": 0.0127, + "epoch": 0.41, + "learning_rate": 0.00023785852595125209, + "loss": 0.0189, "step": 159820 }, { - "epoch": 0.81, - "learning_rate": 0.00017904556255707302, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023785463773488065, + "loss": 0.0165, "step": 159830 }, { - "epoch": 0.81, - "learning_rate": 0.000179037994864059, - "loss": 0.0153, + "epoch": 0.41, + "learning_rate": 0.0002378507495185092, + "loss": 0.0214, "step": 159840 }, { - "epoch": 0.81, - "learning_rate": 0.00017903042717104498, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.0002378468613021377, + "loss": 0.0307, "step": 159850 }, { - "epoch": 0.81, - "learning_rate": 0.000179022859478031, - "loss": 0.0116, + "epoch": 0.41, + "learning_rate": 0.00023784297308576625, + "loss": 0.0163, "step": 159860 }, { - "epoch": 0.81, - "learning_rate": 0.00017901529178501697, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002378390848693948, + "loss": 0.02, "step": 159870 }, { - "epoch": 0.81, - "learning_rate": 0.00017900772409200295, - "loss": 0.0109, + "epoch": 0.41, + "learning_rate": 0.00023783519665302334, + "loss": 0.0188, "step": 159880 }, { - "epoch": 0.81, - "learning_rate": 0.00017900015639898893, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023783130843665185, + "loss": 0.0199, "step": 159890 }, { - "epoch": 0.81, - "learning_rate": 0.00017899258870597494, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.0002378274202202804, + "loss": 0.0213, "step": 159900 }, { - "epoch": 0.81, - "learning_rate": 0.00017898502101296092, - "loss": 0.0131, + "epoch": 0.41, + "learning_rate": 0.00023782353200390893, + "loss": 0.0202, "step": 159910 }, { - "epoch": 0.81, - "learning_rate": 0.0001789774533199469, - "loss": 0.0113, + "epoch": 0.41, + "learning_rate": 0.00023781964378753747, + "loss": 0.016, "step": 159920 }, { - "epoch": 0.81, - "learning_rate": 0.00017896988562693291, - "loss": 0.0105, + "epoch": 0.41, + "learning_rate": 0.000237815755571166, + "loss": 0.0176, "step": 159930 }, { - "epoch": 0.81, - "learning_rate": 0.0001789623179339189, - "loss": 0.0135, + "epoch": 0.41, + "learning_rate": 0.00023781186735479453, + "loss": 0.0165, "step": 159940 }, { - "epoch": 0.81, - "learning_rate": 0.00017895475024090488, - "loss": 0.0128, + "epoch": 0.41, + "learning_rate": 0.0002378079791384231, + "loss": 0.0203, "step": 159950 }, { - "epoch": 0.81, - "learning_rate": 0.00017894718254789089, - "loss": 0.0129, + "epoch": 0.41, + "learning_rate": 0.00023780409092205161, + "loss": 0.022, "step": 159960 }, { - "epoch": 0.81, - "learning_rate": 0.00017893961485487687, - "loss": 0.0184, + "epoch": 0.41, + "learning_rate": 0.00023780020270568016, + "loss": 0.022, "step": 159970 }, { - "epoch": 0.81, - "learning_rate": 0.00017893204716186285, - "loss": 0.0144, + "epoch": 0.41, + "learning_rate": 0.00023779631448930867, + "loss": 0.0208, "step": 159980 }, { - "epoch": 0.81, - "learning_rate": 0.00017892447946884886, - "loss": 0.0096, + "epoch": 0.41, + "learning_rate": 0.00023779242627293724, + "loss": 0.0165, "step": 159990 }, { - "epoch": 0.81, - "learning_rate": 0.00017891691177583484, - "loss": 0.0133, + "epoch": 0.41, + "learning_rate": 0.00023778853805656575, + "loss": 0.017, "step": 160000 }, { - "epoch": 0.81, - "eval_cer": 0.9144867526372941, - "eval_loss": 0.008828338235616684, - "eval_runtime": 116.6369, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.41, + "eval_cer": 0.881806259456297, + "eval_loss": 0.013189446181058884, + "eval_runtime": 107.4253, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.654, "step": 160000 }, { - "epoch": 0.81, - "learning_rate": 0.00017890934408282082, - "loss": 0.0108, + "epoch": 0.41, + "learning_rate": 0.0002377846498401943, + "loss": 0.0176, "step": 160010 }, { - "epoch": 0.81, - "learning_rate": 0.00017890177638980683, - "loss": 0.013, + "epoch": 0.41, + "learning_rate": 0.0002377807616238228, + "loss": 0.0175, "step": 160020 }, { - "epoch": 0.81, - "learning_rate": 0.0001788942086967928, - "loss": 0.0134, - "step": 160030 + "epoch": 0.41, + "learning_rate": 0.00023777687340745135, + "loss": 0.0178, + "step": 160030 }, { - "epoch": 0.81, - "learning_rate": 0.0001788866410037788, - "loss": 0.0124, + "epoch": 0.41, + "learning_rate": 0.0002377729851910799, + "loss": 0.0178, "step": 160040 }, { - "epoch": 0.81, - "learning_rate": 0.0001788790733107648, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023776909697470843, + "loss": 0.02, "step": 160050 }, { - "epoch": 0.81, - "learning_rate": 0.00017887150561775078, - "loss": 0.0132, + "epoch": 0.41, + "learning_rate": 0.00023776520875833695, + "loss": 0.0147, "step": 160060 }, { - "epoch": 0.81, - "learning_rate": 0.00017886393792473676, - "loss": 0.0121, + "epoch": 0.41, + "learning_rate": 0.0002377613205419655, + "loss": 0.0188, "step": 160070 }, { - "epoch": 0.81, - "learning_rate": 0.00017885637023172274, - "loss": 0.0138, + "epoch": 0.41, + "learning_rate": 0.00023775743232559403, + "loss": 0.0152, "step": 160080 }, { - "epoch": 0.81, - "learning_rate": 0.00017884880253870875, - "loss": 0.0117, + "epoch": 0.41, + "learning_rate": 0.00023775354410922257, + "loss": 0.0218, "step": 160090 }, { - "epoch": 0.81, - "learning_rate": 0.00017884123484569473, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.0002377496558928511, + "loss": 0.0195, "step": 160100 }, { - "epoch": 0.81, - "learning_rate": 0.00017883366715268072, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023774576767647963, + "loss": 0.0199, "step": 160110 }, { - "epoch": 0.81, - "learning_rate": 0.00017882609945966672, - "loss": 0.0142, + "epoch": 0.42, + "learning_rate": 0.0002377418794601082, + "loss": 0.0197, "step": 160120 }, { - "epoch": 0.81, - "learning_rate": 0.0001788185317666527, - "loss": 0.0164, + "epoch": 0.42, + "learning_rate": 0.00023773799124373671, + "loss": 0.0208, "step": 160130 }, { - "epoch": 0.81, - "learning_rate": 0.0001788109640736387, - "loss": 0.0105, + "epoch": 0.42, + "learning_rate": 0.00023773410302736523, + "loss": 0.0144, "step": 160140 }, { - "epoch": 0.81, - "learning_rate": 0.0001788033963806247, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.00023773021481099377, + "loss": 0.0171, "step": 160150 }, { - "epoch": 0.81, - "learning_rate": 0.00017879582868761068, - "loss": 0.0183, + "epoch": 0.42, + "learning_rate": 0.00023772632659462234, + "loss": 0.018, "step": 160160 }, { - "epoch": 0.81, - "learning_rate": 0.00017878826099459666, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023772243837825085, + "loss": 0.0189, "step": 160170 }, { - "epoch": 0.81, - "learning_rate": 0.00017878069330158267, - "loss": 0.0155, + "epoch": 0.42, + "learning_rate": 0.0002377185501618794, + "loss": 0.0174, "step": 160180 }, { - "epoch": 0.81, - "learning_rate": 0.00017877312560856865, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.0002377146619455079, + "loss": 0.0198, "step": 160190 }, { - "epoch": 0.81, - "learning_rate": 0.00017876555791555463, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023771077372913648, + "loss": 0.0163, "step": 160200 }, { - "epoch": 0.81, - "learning_rate": 0.00017875799022254064, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.000237706885512765, + "loss": 0.0218, "step": 160210 }, { - "epoch": 0.81, - "learning_rate": 0.00017875042252952662, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.00023770299729639353, + "loss": 0.0192, "step": 160220 }, { - "epoch": 0.81, - "learning_rate": 0.0001787428548365126, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.00023769910908002205, + "loss": 0.0209, "step": 160230 }, { - "epoch": 0.81, - "learning_rate": 0.00017873528714349858, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023769522086365062, + "loss": 0.0149, "step": 160240 }, { - "epoch": 0.81, - "learning_rate": 0.0001787277194504846, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023769133264727913, + "loss": 0.0207, "step": 160250 }, { - "epoch": 0.81, - "learning_rate": 0.00017872015175747055, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023768744443090767, + "loss": 0.0225, "step": 160260 }, { - "epoch": 0.81, - "learning_rate": 0.00017871258406445653, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002376835562145362, + "loss": 0.0258, "step": 160270 }, { - "epoch": 0.81, - "learning_rate": 0.0001787050163714425, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023767966799816473, + "loss": 0.0187, "step": 160280 }, { - "epoch": 0.81, - "learning_rate": 0.00017869744867842852, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.0002376757797817933, + "loss": 0.0256, "step": 160290 }, { - "epoch": 0.81, - "learning_rate": 0.0001786898809854145, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.0002376718915654218, + "loss": 0.0189, "step": 160300 }, { - "epoch": 0.81, - "learning_rate": 0.00017868231329240048, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023766800334905033, + "loss": 0.0207, "step": 160310 }, { - "epoch": 0.81, - "learning_rate": 0.0001786747455993865, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023766411513267887, + "loss": 0.0201, "step": 160320 }, { - "epoch": 0.81, - "learning_rate": 0.00017866717790637247, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023766022691630744, + "loss": 0.0185, "step": 160330 }, { - "epoch": 0.81, - "learning_rate": 0.00017865961021335845, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023765633869993595, + "loss": 0.0217, "step": 160340 }, { - "epoch": 0.81, - "learning_rate": 0.00017865204252034446, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.0002376524504835645, + "loss": 0.018, "step": 160350 }, { - "epoch": 0.81, - "learning_rate": 0.00017864447482733044, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.000237648562267193, + "loss": 0.016, "step": 160360 }, { - "epoch": 0.81, - "learning_rate": 0.00017863690713431642, - "loss": 0.0097, + "epoch": 0.42, + "learning_rate": 0.00023764467405082158, + "loss": 0.0187, "step": 160370 }, { - "epoch": 0.81, - "learning_rate": 0.00017862933944130243, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.0002376407858344501, + "loss": 0.0174, "step": 160380 }, { - "epoch": 0.81, - "learning_rate": 0.0001786217717482884, - "loss": 0.0092, + "epoch": 0.42, + "learning_rate": 0.00023763689761807863, + "loss": 0.0204, "step": 160390 }, { - "epoch": 0.81, - "learning_rate": 0.0001786142040552744, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.00023763300940170715, + "loss": 0.0157, "step": 160400 }, { - "epoch": 0.81, - "learning_rate": 0.0001786066363622604, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.00023762912118533572, + "loss": 0.0213, "step": 160410 }, { - "epoch": 0.81, - "learning_rate": 0.00017859906866924638, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023762523296896423, + "loss": 0.0181, "step": 160420 }, { - "epoch": 0.81, - "learning_rate": 0.00017859150097623237, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023762134475259277, + "loss": 0.0188, "step": 160430 }, { - "epoch": 0.81, - "learning_rate": 0.00017858393328321837, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.0002376174565362213, + "loss": 0.022, "step": 160440 }, { - "epoch": 0.81, - "learning_rate": 0.00017857636559020436, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.00023761356831984986, + "loss": 0.0247, "step": 160450 }, { - "epoch": 0.81, - "learning_rate": 0.00017856879789719034, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023760968010347837, + "loss": 0.0172, "step": 160460 }, { - "epoch": 0.81, - "learning_rate": 0.00017856123020417632, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.0002376057918871069, + "loss": 0.0201, "step": 160470 }, { - "epoch": 0.81, - "learning_rate": 0.00017855366251116233, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023760190367073543, + "loss": 0.0208, "step": 160480 }, { - "epoch": 0.81, - "learning_rate": 0.0001785460948181483, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.000237598015454364, + "loss": 0.018, "step": 160490 }, { - "epoch": 0.81, - "learning_rate": 0.0001785385271251343, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023759412723799254, + "loss": 0.0157, "step": 160500 }, { - "epoch": 0.81, - "learning_rate": 0.0001785309594321203, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023759023902162105, + "loss": 0.0192, "step": 160510 }, { - "epoch": 0.81, - "learning_rate": 0.00017852339173910628, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.0002375863508052496, + "loss": 0.0133, "step": 160520 }, { - "epoch": 0.81, - "learning_rate": 0.00017851582404609226, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002375824625888781, + "loss": 0.0205, "step": 160530 }, { - "epoch": 0.81, - "learning_rate": 0.00017850825635307827, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023757857437250668, + "loss": 0.0187, "step": 160540 }, { - "epoch": 0.81, - "learning_rate": 0.00017850068866006425, - "loss": 0.0095, + "epoch": 0.42, + "learning_rate": 0.0002375746861561352, + "loss": 0.0231, "step": 160550 }, { - "epoch": 0.81, - "learning_rate": 0.00017849312096705023, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023757079793976373, + "loss": 0.0209, "step": 160560 }, { - "epoch": 0.81, - "learning_rate": 0.00017848555327403624, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023756690972339225, + "loss": 0.023, "step": 160570 }, { - "epoch": 0.81, - "learning_rate": 0.00017847798558102222, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023756302150702082, + "loss": 0.0212, "step": 160580 }, { - "epoch": 0.81, - "learning_rate": 0.0001784704178880082, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023755913329064933, + "loss": 0.016, "step": 160590 }, { - "epoch": 0.81, - "learning_rate": 0.0001784628501949942, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023755524507427787, + "loss": 0.0211, "step": 160600 }, { - "epoch": 0.81, - "learning_rate": 0.0001784552825019802, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.0002375513568579064, + "loss": 0.0203, "step": 160610 }, { - "epoch": 0.81, - "learning_rate": 0.00017844771480896618, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023754746864153496, + "loss": 0.0207, "step": 160620 }, { - "epoch": 0.81, - "learning_rate": 0.00017844014711595216, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023754358042516347, + "loss": 0.019, "step": 160630 }, { - "epoch": 0.81, - "learning_rate": 0.00017843257942293817, - "loss": 0.01, + "epoch": 0.42, + "learning_rate": 0.000237539692208792, + "loss": 0.0187, "step": 160640 }, { - "epoch": 0.81, - "learning_rate": 0.00017842501172992415, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023753580399242053, + "loss": 0.0198, "step": 160650 }, { - "epoch": 0.81, - "learning_rate": 0.00017841744403691013, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.0002375319157760491, + "loss": 0.0197, "step": 160660 }, { - "epoch": 0.81, - "learning_rate": 0.00017840987634389614, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023752802755967764, + "loss": 0.0168, "step": 160670 }, { - "epoch": 0.81, - "learning_rate": 0.00017840230865088212, - "loss": 0.01, + "epoch": 0.42, + "learning_rate": 0.00023752413934330615, + "loss": 0.0175, "step": 160680 }, { - "epoch": 0.81, - "learning_rate": 0.0001783947409578681, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.0002375202511269347, + "loss": 0.0192, "step": 160690 }, { - "epoch": 0.81, - "learning_rate": 0.0001783871732648541, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.00023751636291056323, + "loss": 0.0214, "step": 160700 }, { - "epoch": 0.81, - "learning_rate": 0.0001783796055718401, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023751247469419178, + "loss": 0.0183, "step": 160710 }, { - "epoch": 0.81, - "learning_rate": 0.00017837203787882607, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.0002375085864778203, + "loss": 0.0175, "step": 160720 }, { - "epoch": 0.81, - "learning_rate": 0.00017836447018581208, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023750469826144883, + "loss": 0.0207, "step": 160730 }, { - "epoch": 0.81, - "learning_rate": 0.00017835690249279806, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023750081004507737, + "loss": 0.0172, "step": 160740 }, { - "epoch": 0.81, - "learning_rate": 0.00017834933479978404, - "loss": 0.0095, + "epoch": 0.42, + "learning_rate": 0.00023749692182870592, + "loss": 0.018, "step": 160750 }, { - "epoch": 0.81, - "learning_rate": 0.00017834176710677005, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023749303361233443, + "loss": 0.0172, "step": 160760 }, { - "epoch": 0.81, - "learning_rate": 0.00017833419941375603, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023748914539596297, + "loss": 0.0187, "step": 160770 }, { - "epoch": 0.81, - "learning_rate": 0.00017832663172074201, - "loss": 0.0089, + "epoch": 0.42, + "learning_rate": 0.0002374852571795915, + "loss": 0.0224, "step": 160780 }, { - "epoch": 0.81, - "learning_rate": 0.000178319064027728, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023748136896322006, + "loss": 0.0221, "step": 160790 }, { - "epoch": 0.81, - "learning_rate": 0.000178311496334714, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023747748074684857, + "loss": 0.0215, "step": 160800 }, { - "epoch": 0.81, - "learning_rate": 0.00017830392864169999, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.0002374735925304771, + "loss": 0.0192, "step": 160810 }, { - "epoch": 0.81, - "learning_rate": 0.00017829636094868597, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023746970431410563, + "loss": 0.0178, "step": 160820 }, { - "epoch": 0.81, - "learning_rate": 0.00017828879325567198, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.0002374658160977342, + "loss": 0.016, "step": 160830 }, { - "epoch": 0.81, - "learning_rate": 0.00017828122556265796, - "loss": 0.0167, + "epoch": 0.42, + "learning_rate": 0.00023746192788136274, + "loss": 0.0209, "step": 160840 }, { - "epoch": 0.81, - "learning_rate": 0.00017827365786964394, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023745803966499125, + "loss": 0.0224, "step": 160850 }, { - "epoch": 0.81, - "learning_rate": 0.00017826609017662995, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023745415144861977, + "loss": 0.0175, "step": 160860 }, { - "epoch": 0.81, - "learning_rate": 0.00017825852248361593, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023745026323224833, + "loss": 0.0165, "step": 160870 }, { - "epoch": 0.81, - "learning_rate": 0.0001782509547906019, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023744637501587688, + "loss": 0.0204, "step": 160880 }, { - "epoch": 0.81, - "learning_rate": 0.00017824338709758792, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.0002374424867995054, + "loss": 0.017, "step": 160890 }, { - "epoch": 0.81, - "learning_rate": 0.0001782358194045739, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023743859858313393, + "loss": 0.0281, "step": 160900 }, { - "epoch": 0.81, - "learning_rate": 0.00017822825171155988, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.00023743471036676247, + "loss": 0.0252, "step": 160910 }, { - "epoch": 0.81, - "learning_rate": 0.0001782206840185459, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023743082215039102, + "loss": 0.0156, "step": 160920 }, { - "epoch": 0.81, - "learning_rate": 0.00017821311632553187, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.00023742693393401953, + "loss": 0.0192, "step": 160930 }, { - "epoch": 0.81, - "learning_rate": 0.00017820554863251785, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023742304571764807, + "loss": 0.0176, "step": 160940 }, { - "epoch": 0.81, - "learning_rate": 0.00017819798093950383, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.0002374191575012766, + "loss": 0.0188, "step": 160950 }, { - "epoch": 0.81, - "learning_rate": 0.00017819041324648984, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023741526928490515, + "loss": 0.0222, "step": 160960 }, { - "epoch": 0.81, - "learning_rate": 0.00017818284555347582, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023741138106853367, + "loss": 0.0193, "step": 160970 }, { - "epoch": 0.81, - "learning_rate": 0.0001781752778604618, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002374074928521622, + "loss": 0.016, "step": 160980 }, { - "epoch": 0.81, - "learning_rate": 0.00017816771016744781, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023740360463579078, + "loss": 0.0219, "step": 160990 }, { - "epoch": 0.81, - "learning_rate": 0.0001781601424744338, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002373997164194193, + "loss": 0.018, "step": 161000 }, { - "epoch": 0.81, - "eval_cer": 0.9144789894682909, - "eval_loss": 0.008487106300890446, - "eval_runtime": 116.5295, - "eval_samples_per_second": 17.163, - "eval_steps_per_second": 4.291, + "epoch": 0.42, + "eval_cer": 0.88176706962214, + "eval_loss": 0.012851111590862274, + "eval_runtime": 107.3307, + "eval_samples_per_second": 18.634, + "eval_steps_per_second": 4.658, "step": 161000 }, { - "epoch": 0.81, - "learning_rate": 0.00017815257478141978, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002373958282030478, + "loss": 0.0159, "step": 161010 }, { - "epoch": 0.81, - "learning_rate": 0.00017814500708840579, - "loss": 0.0154, + "epoch": 0.42, + "learning_rate": 0.00023739193998667635, + "loss": 0.0141, "step": 161020 }, { - "epoch": 0.81, - "learning_rate": 0.00017813743939539177, - "loss": 0.0145, + "epoch": 0.42, + "learning_rate": 0.00023738805177030486, + "loss": 0.0187, "step": 161030 }, { - "epoch": 0.81, - "learning_rate": 0.00017812987170237775, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023738416355393343, + "loss": 0.0198, "step": 161040 }, { - "epoch": 0.81, - "learning_rate": 0.00017812230400936376, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023738027533756198, + "loss": 0.0185, "step": 161050 }, { - "epoch": 0.81, - "learning_rate": 0.00017811473631634974, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.0002373763871211905, + "loss": 0.0158, "step": 161060 }, { - "epoch": 0.81, - "learning_rate": 0.00017810716862333572, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023737249890481903, + "loss": 0.0188, "step": 161070 }, { - "epoch": 0.81, - "learning_rate": 0.00017809960093032173, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023736861068844757, + "loss": 0.022, "step": 161080 }, { - "epoch": 0.81, - "learning_rate": 0.0001780920332373077, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023736472247207611, + "loss": 0.0219, "step": 161090 }, { - "epoch": 0.81, - "learning_rate": 0.0001780844655442937, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023736083425570463, + "loss": 0.0175, "step": 161100 }, { - "epoch": 0.81, - "learning_rate": 0.0001780768978512797, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023735694603933317, + "loss": 0.0195, "step": 161110 }, { - "epoch": 0.81, - "learning_rate": 0.00017806933015826568, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.0002373530578229617, + "loss": 0.0182, "step": 161120 }, { - "epoch": 0.81, - "learning_rate": 0.00017806176246525166, - "loss": 0.0091, + "epoch": 0.42, + "learning_rate": 0.00023734916960659025, + "loss": 0.0212, "step": 161130 }, { - "epoch": 0.81, - "learning_rate": 0.00017805419477223764, - "loss": 0.0154, + "epoch": 0.42, + "learning_rate": 0.00023734528139021877, + "loss": 0.0173, "step": 161140 }, { - "epoch": 0.81, - "learning_rate": 0.00017804662707922365, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.0002373413931738473, + "loss": 0.0182, "step": 161150 }, { - "epoch": 0.81, - "learning_rate": 0.00017803905938620963, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023733750495747588, + "loss": 0.0187, "step": 161160 }, { - "epoch": 0.81, - "learning_rate": 0.00017803149169319562, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.0002373336167411044, + "loss": 0.0186, "step": 161170 }, { - "epoch": 0.81, - "learning_rate": 0.00017802392400018162, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.0002373297285247329, + "loss": 0.0163, "step": 161180 }, { - "epoch": 0.81, - "learning_rate": 0.0001780163563071676, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023732584030836145, + "loss": 0.0195, "step": 161190 }, { - "epoch": 0.81, - "learning_rate": 0.0001780087886141536, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023732195209199002, + "loss": 0.0171, "step": 161200 }, { - "epoch": 0.81, - "learning_rate": 0.0001780012209211396, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023731806387561853, + "loss": 0.0153, "step": 161210 }, { - "epoch": 0.81, - "learning_rate": 0.00017799365322812558, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023731417565924707, + "loss": 0.0153, "step": 161220 }, { - "epoch": 0.81, - "learning_rate": 0.00017798608553511156, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.0002373102874428756, + "loss": 0.0149, "step": 161230 }, { - "epoch": 0.81, - "learning_rate": 0.00017797851784209757, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023730639922650416, + "loss": 0.0158, "step": 161240 }, { - "epoch": 0.81, - "learning_rate": 0.00017797095014908355, - "loss": 0.0143, + "epoch": 0.42, + "learning_rate": 0.00023730251101013267, + "loss": 0.0179, "step": 161250 }, { - "epoch": 0.81, - "learning_rate": 0.00017796338245606953, - "loss": 0.0134, + "epoch": 0.42, + "learning_rate": 0.00023729862279376121, + "loss": 0.0216, "step": 161260 }, { - "epoch": 0.81, - "learning_rate": 0.00017795581476305554, - "loss": 0.0098, + "epoch": 0.42, + "learning_rate": 0.00023729473457738973, + "loss": 0.0198, "step": 161270 }, { - "epoch": 0.81, - "learning_rate": 0.00017794824707004152, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023729084636101827, + "loss": 0.0159, "step": 161280 }, { - "epoch": 0.81, - "learning_rate": 0.0001779406793770275, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.0002372869581446468, + "loss": 0.0299, "step": 161290 }, { - "epoch": 0.81, - "learning_rate": 0.00017793311168401348, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023728306992827535, + "loss": 0.0184, "step": 161300 }, { - "epoch": 0.81, - "learning_rate": 0.0001779255439909995, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023727918171190387, + "loss": 0.0135, "step": 161310 }, { - "epoch": 0.81, - "learning_rate": 0.00017791797629798547, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.0002372752934955324, + "loss": 0.0184, "step": 161320 }, { - "epoch": 0.81, - "learning_rate": 0.00017791040860497145, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023727140527916095, + "loss": 0.0224, "step": 161330 }, { - "epoch": 0.81, - "learning_rate": 0.00017790284091195746, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002372675170627895, + "loss": 0.0215, "step": 161340 }, { - "epoch": 0.81, - "learning_rate": 0.00017789527321894344, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.000237263628846418, + "loss": 0.0195, "step": 161350 }, { - "epoch": 0.81, - "learning_rate": 0.00017788770552592943, - "loss": 0.0149, + "epoch": 0.42, + "learning_rate": 0.00023725974063004655, + "loss": 0.0169, "step": 161360 }, { - "epoch": 0.81, - "learning_rate": 0.00017788013783291543, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023725585241367512, + "loss": 0.0191, "step": 161370 }, { - "epoch": 0.81, - "learning_rate": 0.00017787257013990142, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023725196419730363, + "loss": 0.0158, "step": 161380 }, { - "epoch": 0.81, - "learning_rate": 0.0001778650024468874, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023724807598093217, + "loss": 0.0187, "step": 161390 }, { - "epoch": 0.81, - "learning_rate": 0.0001778574347538734, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002372441877645607, + "loss": 0.0202, "step": 161400 }, { - "epoch": 0.81, - "learning_rate": 0.0001778498670608594, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023724029954818926, + "loss": 0.0181, "step": 161410 }, { - "epoch": 0.81, - "learning_rate": 0.00017784229936784537, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023723641133181777, + "loss": 0.0175, "step": 161420 }, { - "epoch": 0.81, - "learning_rate": 0.00017783473167483138, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023723252311544631, + "loss": 0.0194, "step": 161430 }, { - "epoch": 0.81, - "learning_rate": 0.00017782716398181736, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023722863489907483, + "loss": 0.0191, "step": 161440 }, { - "epoch": 0.81, - "learning_rate": 0.00017781959628880334, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.0002372247466827034, + "loss": 0.0178, "step": 161450 }, { - "epoch": 0.81, - "learning_rate": 0.00017781202859578932, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.0002372208584663319, + "loss": 0.0167, "step": 161460 }, { - "epoch": 0.81, - "learning_rate": 0.00017780446090277533, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023721697024996045, + "loss": 0.0245, "step": 161470 }, { - "epoch": 0.81, - "learning_rate": 0.0001777968932097613, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023721308203358897, + "loss": 0.0216, "step": 161480 }, { - "epoch": 0.81, - "learning_rate": 0.0001777893255167473, - "loss": 0.0158, + "epoch": 0.42, + "learning_rate": 0.00023720919381721754, + "loss": 0.0184, "step": 161490 }, { - "epoch": 0.81, - "learning_rate": 0.0001777817578237333, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023720530560084605, + "loss": 0.0152, "step": 161500 }, { - "epoch": 0.81, - "learning_rate": 0.00017777419013071926, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.0002372014173844746, + "loss": 0.0213, "step": 161510 }, { - "epoch": 0.81, - "learning_rate": 0.00017776662243770524, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.0002371975291681031, + "loss": 0.0183, "step": 161520 }, { - "epoch": 0.81, - "learning_rate": 0.00017775905474469122, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023719364095173165, + "loss": 0.0214, "step": 161530 }, { - "epoch": 0.81, - "learning_rate": 0.00017775148705167723, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023718975273536022, + "loss": 0.028, "step": 161540 }, { - "epoch": 0.82, - "learning_rate": 0.0001777439193586632, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023718586451898873, + "loss": 0.0254, "step": 161550 }, { - "epoch": 0.82, - "learning_rate": 0.0001777363516656492, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023718197630261727, + "loss": 0.0172, "step": 161560 }, { - "epoch": 0.82, - "learning_rate": 0.0001777287839726352, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.0002371780880862458, + "loss": 0.018, "step": 161570 }, { - "epoch": 0.82, - "learning_rate": 0.00017772121627962118, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023717419986987436, + "loss": 0.0191, "step": 161580 }, { - "epoch": 0.82, - "learning_rate": 0.00017771364858660716, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023717031165350287, + "loss": 0.016, "step": 161590 }, { - "epoch": 0.82, - "learning_rate": 0.00017770608089359317, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.0002371664234371314, + "loss": 0.0216, "step": 161600 }, { - "epoch": 0.82, - "learning_rate": 0.00017769851320057915, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023716253522075993, + "loss": 0.0156, "step": 161610 }, { - "epoch": 0.82, - "learning_rate": 0.00017769094550756513, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.0002371586470043885, + "loss": 0.0167, "step": 161620 }, { - "epoch": 0.82, - "learning_rate": 0.00017768337781455114, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.000237154758788017, + "loss": 0.0165, "step": 161630 }, { - "epoch": 0.82, - "learning_rate": 0.00017767581012153712, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023715087057164555, + "loss": 0.0159, "step": 161640 }, { - "epoch": 0.82, - "learning_rate": 0.0001776682424285231, - "loss": 0.0155, + "epoch": 0.42, + "learning_rate": 0.00023714698235527407, + "loss": 0.0187, "step": 161650 }, { - "epoch": 0.82, - "learning_rate": 0.0001776606747355091, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023714309413890264, + "loss": 0.0221, "step": 161660 }, { - "epoch": 0.82, - "learning_rate": 0.0001776531070424951, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023713920592253115, + "loss": 0.0185, "step": 161670 }, { - "epoch": 0.82, - "learning_rate": 0.00017764553934948108, - "loss": 0.0149, + "epoch": 0.42, + "learning_rate": 0.0002371353177061597, + "loss": 0.0169, "step": 161680 }, { - "epoch": 0.82, - "learning_rate": 0.00017763797165646706, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.0002371314294897882, + "loss": 0.0158, "step": 161690 }, { - "epoch": 0.82, - "learning_rate": 0.00017763040396345307, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023712754127341678, + "loss": 0.0186, "step": 161700 }, { - "epoch": 0.82, - "learning_rate": 0.00017762283627043905, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023712365305704532, + "loss": 0.0223, "step": 161710 }, { - "epoch": 0.82, - "learning_rate": 0.00017761526857742503, - "loss": 0.0096, + "epoch": 0.42, + "learning_rate": 0.00023711976484067383, + "loss": 0.0191, "step": 161720 }, { - "epoch": 0.82, - "learning_rate": 0.00017760770088441104, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.00023711587662430235, + "loss": 0.0189, "step": 161730 }, { - "epoch": 0.82, - "learning_rate": 0.00017760013319139702, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023711198840793091, + "loss": 0.0231, "step": 161740 }, { - "epoch": 0.82, - "learning_rate": 0.000177592565498383, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023710810019155946, + "loss": 0.0202, "step": 161750 }, { - "epoch": 0.82, - "learning_rate": 0.000177584997805369, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023710421197518797, + "loss": 0.0228, "step": 161760 }, { - "epoch": 0.82, - "learning_rate": 0.000177577430112355, - "loss": 0.0101, + "epoch": 0.42, + "learning_rate": 0.0002371003237588165, + "loss": 0.0185, "step": 161770 }, { - "epoch": 0.82, - "learning_rate": 0.00017756986241934097, - "loss": 0.0228, + "epoch": 0.42, + "learning_rate": 0.00023709643554244503, + "loss": 0.0195, "step": 161780 }, { - "epoch": 0.82, - "learning_rate": 0.00017756229472632698, - "loss": 0.0153, + "epoch": 0.42, + "learning_rate": 0.0002370925473260736, + "loss": 0.0187, "step": 161790 }, { - "epoch": 0.82, - "learning_rate": 0.00017755472703331296, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.0002370886591097021, + "loss": 0.0198, "step": 161800 }, { - "epoch": 0.82, - "learning_rate": 0.00017754715934029894, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023708477089333065, + "loss": 0.0281, "step": 161810 }, { - "epoch": 0.82, - "learning_rate": 0.00017753959164728495, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023708088267695917, + "loss": 0.0216, "step": 161820 }, { - "epoch": 0.82, - "learning_rate": 0.00017753202395427093, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023707699446058774, + "loss": 0.0167, "step": 161830 }, { - "epoch": 0.82, - "learning_rate": 0.00017752445626125691, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023707310624421625, + "loss": 0.0207, "step": 161840 }, { - "epoch": 0.82, - "learning_rate": 0.0001775168885682429, - "loss": 0.0099, + "epoch": 0.42, + "learning_rate": 0.0002370692180278448, + "loss": 0.0279, "step": 161850 }, { - "epoch": 0.82, - "learning_rate": 0.0001775093208752289, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.0002370653298114733, + "loss": 0.0206, "step": 161860 }, { - "epoch": 0.82, - "learning_rate": 0.00017750175318221489, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023706144159510187, + "loss": 0.0228, "step": 161870 }, { - "epoch": 0.82, - "learning_rate": 0.00017749418548920087, - "loss": 0.0105, + "epoch": 0.42, + "learning_rate": 0.0002370575533787304, + "loss": 0.0157, "step": 161880 }, { - "epoch": 0.82, - "learning_rate": 0.00017748661779618688, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023705366516235893, + "loss": 0.0196, "step": 161890 }, { - "epoch": 0.82, - "learning_rate": 0.00017747905010317286, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023704977694598745, + "loss": 0.0189, "step": 161900 }, { - "epoch": 0.82, - "learning_rate": 0.00017747148241015884, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023704588872961601, + "loss": 0.0206, "step": 161910 }, { - "epoch": 0.82, - "learning_rate": 0.00017746391471714485, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023704200051324456, + "loss": 0.0183, "step": 161920 }, { - "epoch": 0.82, - "learning_rate": 0.00017745634702413083, - "loss": 0.0188, + "epoch": 0.42, + "learning_rate": 0.00023703811229687307, + "loss": 0.0137, "step": 161930 }, { - "epoch": 0.82, - "learning_rate": 0.0001774487793311168, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002370342240805016, + "loss": 0.0182, "step": 161940 }, { - "epoch": 0.82, - "learning_rate": 0.00017744121163810282, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023703033586413015, + "loss": 0.0163, "step": 161950 }, { - "epoch": 0.82, - "learning_rate": 0.0001774336439450888, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.0002370264476477587, + "loss": 0.0159, "step": 161960 }, { - "epoch": 0.82, - "learning_rate": 0.00017742607625207478, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.0002370225594313872, + "loss": 0.0199, "step": 161970 }, { - "epoch": 0.82, - "learning_rate": 0.0001774185085590608, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023701867121501575, + "loss": 0.0157, "step": 161980 }, { - "epoch": 0.82, - "learning_rate": 0.00017741094086604677, - "loss": 0.0088, + "epoch": 0.42, + "learning_rate": 0.0002370147829986443, + "loss": 0.0251, "step": 161990 }, { - "epoch": 0.82, - "learning_rate": 0.00017740337317303275, - "loss": 0.0211, + "epoch": 0.42, + "learning_rate": 0.00023701089478227283, + "loss": 0.0198, "step": 162000 }, { - "epoch": 0.82, - "eval_cer": 0.9144663743186606, - "eval_loss": 0.008896621875464916, - "eval_runtime": 115.9502, - "eval_samples_per_second": 17.249, - "eval_steps_per_second": 4.312, + "epoch": 0.42, + "eval_cer": 0.8817796663545476, + "eval_loss": 0.012595619075000286, + "eval_runtime": 107.3974, + "eval_samples_per_second": 18.622, + "eval_steps_per_second": 4.656, "step": 162000 }, { - "epoch": 0.82, - "learning_rate": 0.00017739580548001876, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023700700656590135, + "loss": 0.0167, "step": 162010 }, { - "epoch": 0.82, - "learning_rate": 0.00017738823778700474, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.0002370031183495299, + "loss": 0.0218, "step": 162020 }, { - "epoch": 0.82, - "learning_rate": 0.00017738067009399072, - "loss": 0.0148, + "epoch": 0.42, + "learning_rate": 0.0002369992301331584, + "loss": 0.0321, "step": 162030 }, { - "epoch": 0.82, - "learning_rate": 0.0001773731024009767, - "loss": 0.0181, + "epoch": 0.42, + "learning_rate": 0.00023699534191678697, + "loss": 0.0219, "step": 162040 }, { - "epoch": 0.82, - "learning_rate": 0.00017736553470796271, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.0002369914537004155, + "loss": 0.0177, "step": 162050 }, { - "epoch": 0.82, - "learning_rate": 0.0001773579670149487, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023698756548404403, + "loss": 0.0219, "step": 162060 }, { - "epoch": 0.82, - "learning_rate": 0.00017735039932193468, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023698367726767254, + "loss": 0.0203, "step": 162070 }, { - "epoch": 0.82, - "learning_rate": 0.00017734283162892069, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.0002369797890513011, + "loss": 0.0198, "step": 162080 }, { - "epoch": 0.82, - "learning_rate": 0.00017733526393590667, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023697590083492966, + "loss": 0.0263, "step": 162090 }, { - "epoch": 0.82, - "learning_rate": 0.00017732769624289265, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023697201261855817, + "loss": 0.0153, "step": 162100 }, { - "epoch": 0.82, - "learning_rate": 0.00017732012854987866, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.0002369681244021867, + "loss": 0.013, "step": 162110 }, { - "epoch": 0.82, - "learning_rate": 0.00017731256085686464, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023696423618581525, + "loss": 0.0223, "step": 162120 }, { - "epoch": 0.82, - "learning_rate": 0.00017730499316385062, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002369603479694438, + "loss": 0.0169, "step": 162130 }, { - "epoch": 0.82, - "learning_rate": 0.00017729742547083663, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002369564597530723, + "loss": 0.0222, "step": 162140 }, { - "epoch": 0.82, - "learning_rate": 0.0001772898577778226, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023695257153670085, + "loss": 0.0173, "step": 162150 }, { - "epoch": 0.82, - "learning_rate": 0.0001772822900848086, - "loss": 0.0096, + "epoch": 0.42, + "learning_rate": 0.0002369486833203294, + "loss": 0.0154, "step": 162160 }, { - "epoch": 0.82, - "learning_rate": 0.0001772747223917946, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023694479510395793, + "loss": 0.0193, "step": 162170 }, { - "epoch": 0.82, - "learning_rate": 0.00017726715469878058, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023694090688758645, + "loss": 0.0164, "step": 162180 }, { - "epoch": 0.82, - "learning_rate": 0.00017725958700576656, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.000236937018671215, + "loss": 0.0175, "step": 162190 }, { - "epoch": 0.82, - "learning_rate": 0.00017725201931275255, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023693313045484353, + "loss": 0.0189, "step": 162200 }, { - "epoch": 0.82, - "learning_rate": 0.00017724445161973855, - "loss": 0.0093, + "epoch": 0.42, + "learning_rate": 0.00023692924223847207, + "loss": 0.0223, "step": 162210 }, { - "epoch": 0.82, - "learning_rate": 0.00017723688392672454, - "loss": 0.0157, + "epoch": 0.42, + "learning_rate": 0.0002369253540221006, + "loss": 0.0197, "step": 162220 }, { - "epoch": 0.82, - "learning_rate": 0.00017722931623371052, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023692146580572913, + "loss": 0.0223, "step": 162230 }, { - "epoch": 0.82, - "learning_rate": 0.00017722174854069653, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.0002369175775893577, + "loss": 0.018, "step": 162240 }, { - "epoch": 0.82, - "learning_rate": 0.0001772141808476825, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.0002369136893729862, + "loss": 0.018, "step": 162250 }, { - "epoch": 0.82, - "learning_rate": 0.0001772066131546685, - "loss": 0.0154, + "epoch": 0.42, + "learning_rate": 0.00023690980115661475, + "loss": 0.0183, "step": 162260 }, { - "epoch": 0.82, - "learning_rate": 0.0001771990454616545, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023690591294024327, + "loss": 0.023, "step": 162270 }, { - "epoch": 0.82, - "learning_rate": 0.00017719147776864048, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.0002369020247238718, + "loss": 0.0161, "step": 162280 }, { - "epoch": 0.82, - "learning_rate": 0.00017718391007562646, - "loss": 0.0093, + "epoch": 0.42, + "learning_rate": 0.00023689813650750035, + "loss": 0.0163, "step": 162290 }, { - "epoch": 0.82, - "learning_rate": 0.00017717634238261247, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.0002368942482911289, + "loss": 0.0289, "step": 162300 }, { - "epoch": 0.82, - "learning_rate": 0.00017716877468959845, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.0002368903600747574, + "loss": 0.0202, "step": 162310 }, { - "epoch": 0.82, - "learning_rate": 0.00017716120699658443, - "loss": 0.0105, + "epoch": 0.42, + "learning_rate": 0.00023688647185838595, + "loss": 0.0181, "step": 162320 }, { - "epoch": 0.82, - "learning_rate": 0.00017715363930357044, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.0002368825836420145, + "loss": 0.0181, "step": 162330 }, { - "epoch": 0.82, - "learning_rate": 0.00017714607161055642, - "loss": 0.0177, + "epoch": 0.42, + "learning_rate": 0.00023687869542564303, + "loss": 0.0193, "step": 162340 }, { - "epoch": 0.82, - "learning_rate": 0.0001771385039175424, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023687480720927155, + "loss": 0.0175, "step": 162350 }, { - "epoch": 0.82, - "learning_rate": 0.00017713093622452838, - "loss": 0.0197, + "epoch": 0.42, + "learning_rate": 0.0002368709189929001, + "loss": 0.0187, "step": 162360 }, { - "epoch": 0.82, - "learning_rate": 0.0001771233685315144, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023686703077652863, + "loss": 0.0156, "step": 162370 }, { - "epoch": 0.82, - "learning_rate": 0.00017711580083850037, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.00023686314256015717, + "loss": 0.018, "step": 162380 }, { - "epoch": 0.82, - "learning_rate": 0.00017710823314548636, - "loss": 0.0105, + "epoch": 0.42, + "learning_rate": 0.0002368592543437857, + "loss": 0.017, "step": 162390 }, { - "epoch": 0.82, - "learning_rate": 0.00017710066545247236, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023685536612741423, + "loss": 0.0183, "step": 162400 }, { - "epoch": 0.82, - "learning_rate": 0.00017709309775945835, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002368514779110428, + "loss": 0.0217, "step": 162410 }, { - "epoch": 0.82, - "learning_rate": 0.00017708553006644433, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.0002368475896946713, + "loss": 0.0199, "step": 162420 }, { - "epoch": 0.82, - "learning_rate": 0.00017707796237343034, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023684370147829985, + "loss": 0.0227, "step": 162430 }, { - "epoch": 0.82, - "learning_rate": 0.00017707039468041632, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023683981326192837, + "loss": 0.0173, "step": 162440 }, { - "epoch": 0.82, - "learning_rate": 0.0001770628269874023, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023683592504555694, + "loss": 0.0197, "step": 162450 }, { - "epoch": 0.82, - "learning_rate": 0.0001770552592943883, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.00023683203682918545, + "loss": 0.022, "step": 162460 }, { - "epoch": 0.82, - "learning_rate": 0.0001770476916013743, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.000236828148612814, + "loss": 0.0161, "step": 162470 }, { - "epoch": 0.82, - "learning_rate": 0.00017704012390836027, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.0002368242603964425, + "loss": 0.0236, "step": 162480 }, { - "epoch": 0.82, - "learning_rate": 0.00017703255621534628, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.00023682037218007108, + "loss": 0.0208, "step": 162490 }, { - "epoch": 0.82, - "learning_rate": 0.00017702498852233226, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.0002368164839636996, + "loss": 0.0205, "step": 162500 }, { - "epoch": 0.82, - "learning_rate": 0.00017701742082931824, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023681259574732813, + "loss": 0.0173, "step": 162510 }, { - "epoch": 0.82, - "learning_rate": 0.00017700985313630425, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023680870753095665, + "loss": 0.0154, "step": 162520 }, { - "epoch": 0.82, - "learning_rate": 0.00017700228544329023, - "loss": 0.0142, + "epoch": 0.42, + "learning_rate": 0.0002368048193145852, + "loss": 0.0197, "step": 162530 }, { - "epoch": 0.82, - "learning_rate": 0.0001769947177502762, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023680093109821373, + "loss": 0.0185, "step": 162540 }, { - "epoch": 0.82, - "learning_rate": 0.0001769871500572622, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023679704288184227, + "loss": 0.0145, "step": 162550 }, { - "epoch": 0.82, - "learning_rate": 0.0001769795823642482, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.0002367931546654708, + "loss": 0.0218, "step": 162560 }, { - "epoch": 0.82, - "learning_rate": 0.00017697201467123418, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023678926644909933, + "loss": 0.0184, "step": 162570 }, { - "epoch": 0.82, - "learning_rate": 0.00017696444697822017, - "loss": 0.015, + "epoch": 0.42, + "learning_rate": 0.0002367853782327279, + "loss": 0.0169, "step": 162580 }, { - "epoch": 0.82, - "learning_rate": 0.00017695687928520617, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.0002367814900163564, + "loss": 0.0229, "step": 162590 }, { - "epoch": 0.82, - "learning_rate": 0.00017694931159219216, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.00023677760179998493, + "loss": 0.0197, "step": 162600 }, { - "epoch": 0.82, - "learning_rate": 0.00017694174389917814, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023677371358361347, + "loss": 0.023, "step": 162610 }, { - "epoch": 0.82, - "learning_rate": 0.00017693417620616415, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.00023676982536724204, + "loss": 0.0209, "step": 162620 }, { - "epoch": 0.82, - "learning_rate": 0.00017692660851315013, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023676593715087055, + "loss": 0.0219, "step": 162630 }, { - "epoch": 0.82, - "learning_rate": 0.0001769190408201361, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.0002367620489344991, + "loss": 0.0191, "step": 162640 }, { - "epoch": 0.82, - "learning_rate": 0.00017691147312712212, - "loss": 0.0154, + "epoch": 0.42, + "learning_rate": 0.0002367581607181276, + "loss": 0.0207, "step": 162650 }, { - "epoch": 0.82, - "learning_rate": 0.0001769039054341081, - "loss": 0.0169, + "epoch": 0.42, + "learning_rate": 0.00023675427250175618, + "loss": 0.0212, "step": 162660 }, { - "epoch": 0.82, - "learning_rate": 0.00017689633774109408, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002367503842853847, + "loss": 0.0187, "step": 162670 }, { - "epoch": 0.82, - "learning_rate": 0.0001768887700480801, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023674649606901323, + "loss": 0.0247, "step": 162680 }, { - "epoch": 0.82, - "learning_rate": 0.00017688120235506607, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.00023674260785264175, + "loss": 0.0175, "step": 162690 }, { - "epoch": 0.82, - "learning_rate": 0.00017687363466205205, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023673871963627032, + "loss": 0.0207, "step": 162700 }, { - "epoch": 0.82, - "learning_rate": 0.00017686606696903803, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023673483141989883, + "loss": 0.0182, "step": 162710 }, { - "epoch": 0.82, - "learning_rate": 0.00017685849927602404, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023673094320352737, + "loss": 0.0179, "step": 162720 }, { - "epoch": 0.82, - "learning_rate": 0.00017685093158301002, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023672705498715589, + "loss": 0.0163, "step": 162730 }, { - "epoch": 0.82, - "learning_rate": 0.000176843363889996, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.00023672316677078445, + "loss": 0.0194, "step": 162740 }, { - "epoch": 0.82, - "learning_rate": 0.000176835796196982, - "loss": 0.0099, + "epoch": 0.42, + "learning_rate": 0.000236719278554413, + "loss": 0.0165, "step": 162750 }, { - "epoch": 0.82, - "learning_rate": 0.000176828228503968, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.0002367153903380415, + "loss": 0.021, "step": 162760 }, { - "epoch": 0.82, - "learning_rate": 0.00017682066081095395, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.00023671150212167003, + "loss": 0.0177, "step": 162770 }, { - "epoch": 0.82, - "learning_rate": 0.00017681309311793993, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023670761390529857, + "loss": 0.017, "step": 162780 }, { - "epoch": 0.82, - "learning_rate": 0.00017680552542492594, - "loss": 0.0145, + "epoch": 0.42, + "learning_rate": 0.00023670372568892714, + "loss": 0.0203, "step": 162790 }, { - "epoch": 0.82, - "learning_rate": 0.00017679795773191192, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023669983747255565, + "loss": 0.0228, "step": 162800 }, { - "epoch": 0.82, - "learning_rate": 0.0001767903900388979, - "loss": 0.0152, + "epoch": 0.42, + "learning_rate": 0.0002366959492561842, + "loss": 0.0177, "step": 162810 }, { - "epoch": 0.82, - "learning_rate": 0.0001767828223458839, - "loss": 0.0176, + "epoch": 0.42, + "learning_rate": 0.0002366920610398127, + "loss": 0.0179, "step": 162820 }, { - "epoch": 0.82, - "learning_rate": 0.0001767752546528699, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023668817282344128, + "loss": 0.0198, "step": 162830 }, { - "epoch": 0.82, - "learning_rate": 0.00017676768695985587, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.0002366842846070698, + "loss": 0.022, "step": 162840 }, { - "epoch": 0.82, - "learning_rate": 0.00017676011926684188, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023668039639069833, + "loss": 0.0181, "step": 162850 }, { - "epoch": 0.82, - "learning_rate": 0.00017675255157382786, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023667650817432685, + "loss": 0.0171, "step": 162860 }, { - "epoch": 0.82, - "learning_rate": 0.00017674498388081384, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.00023667261995795541, + "loss": 0.0181, "step": 162870 }, { - "epoch": 0.82, - "learning_rate": 0.00017673741618779985, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023666873174158393, + "loss": 0.0295, "step": 162880 }, { - "epoch": 0.82, - "learning_rate": 0.00017672984849478583, - "loss": 0.0173, + "epoch": 0.42, + "learning_rate": 0.00023666484352521247, + "loss": 0.0184, "step": 162890 }, { - "epoch": 0.82, - "learning_rate": 0.00017672228080177182, - "loss": 0.0135, + "epoch": 0.42, + "learning_rate": 0.00023666095530884099, + "loss": 0.0212, "step": 162900 }, { - "epoch": 0.82, - "learning_rate": 0.00017671471310875782, - "loss": 0.0136, + "epoch": 0.42, + "learning_rate": 0.00023665706709246955, + "loss": 0.0166, "step": 162910 }, { - "epoch": 0.82, - "learning_rate": 0.0001767071454157438, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023665317887609807, + "loss": 0.0225, "step": 162920 }, { - "epoch": 0.82, - "learning_rate": 0.0001766995777227298, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.0002366492906597266, + "loss": 0.0189, "step": 162930 }, { - "epoch": 0.82, - "learning_rate": 0.00017669201002971577, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023664540244335513, + "loss": 0.0202, "step": 162940 }, { - "epoch": 0.82, - "learning_rate": 0.00017668444233670178, - "loss": 0.0155, + "epoch": 0.42, + "learning_rate": 0.0002366415142269837, + "loss": 0.0198, "step": 162950 }, { - "epoch": 0.82, - "learning_rate": 0.00017667687464368776, - "loss": 0.0123, + "epoch": 0.42, + "learning_rate": 0.00023663762601061224, + "loss": 0.016, "step": 162960 }, { - "epoch": 0.82, - "learning_rate": 0.00017666930695067374, - "loss": 0.0093, + "epoch": 0.42, + "learning_rate": 0.00023663373779424075, + "loss": 0.0164, "step": 162970 }, { - "epoch": 0.82, - "learning_rate": 0.00017666173925765975, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.0002366298495778693, + "loss": 0.0193, "step": 162980 }, { - "epoch": 0.82, - "learning_rate": 0.00017665417156464573, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.00023662596136149783, + "loss": 0.023, "step": 162990 }, { - "epoch": 0.82, - "learning_rate": 0.0001766466038716317, - "loss": 0.0087, + "epoch": 0.42, + "learning_rate": 0.00023662207314512637, + "loss": 0.0169, "step": 163000 }, { - "epoch": 0.82, - "eval_cer": 0.9144401736232748, - "eval_loss": 0.00887399259954691, - "eval_runtime": 116.6416, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.42, + "eval_cer": 0.8817838652653501, + "eval_loss": 0.01325357798486948, + "eval_runtime": 107.3603, + "eval_samples_per_second": 18.629, + "eval_steps_per_second": 4.657, "step": 163000 }, { - "epoch": 0.82, - "learning_rate": 0.00017663903617861772, - "loss": 0.0108, + "epoch": 0.42, + "learning_rate": 0.0002366181849287549, + "loss": 0.0191, "step": 163010 }, { - "epoch": 0.82, - "learning_rate": 0.0001766314684856037, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023661429671238343, + "loss": 0.0161, "step": 163020 }, { - "epoch": 0.82, - "learning_rate": 0.00017662390079258968, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023661040849601195, + "loss": 0.0211, "step": 163030 }, { - "epoch": 0.82, - "learning_rate": 0.0001766163330995757, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.00023660652027964051, + "loss": 0.0191, "step": 163040 }, { - "epoch": 0.82, - "learning_rate": 0.00017660876540656167, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.00023660263206326903, + "loss": 0.017, "step": 163050 }, { - "epoch": 0.82, - "learning_rate": 0.00017660119771354765, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023659874384689757, + "loss": 0.0187, "step": 163060 }, { - "epoch": 0.82, - "learning_rate": 0.00017659363002053366, - "loss": 0.0137, + "epoch": 0.42, + "learning_rate": 0.00023659485563052609, + "loss": 0.0173, "step": 163070 }, { - "epoch": 0.82, - "learning_rate": 0.00017658606232751964, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023659096741415465, + "loss": 0.0223, "step": 163080 }, { - "epoch": 0.82, - "learning_rate": 0.00017657849463450563, - "loss": 0.0148, + "epoch": 0.42, + "learning_rate": 0.00023658707919778317, + "loss": 0.0185, "step": 163090 }, { - "epoch": 0.82, - "learning_rate": 0.0001765709269414916, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.0002365831909814117, + "loss": 0.0164, "step": 163100 }, { - "epoch": 0.82, - "learning_rate": 0.00017656335924847762, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.00023657930276504022, + "loss": 0.0178, "step": 163110 }, { - "epoch": 0.82, - "learning_rate": 0.0001765557915554636, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.0002365754145486688, + "loss": 0.0162, "step": 163120 }, { - "epoch": 0.82, - "learning_rate": 0.00017654822386244958, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.00023657152633229733, + "loss": 0.0199, "step": 163130 }, { - "epoch": 0.82, - "learning_rate": 0.0001765406561694356, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023656763811592585, + "loss": 0.0185, "step": 163140 }, { - "epoch": 0.82, - "learning_rate": 0.00017653308847642157, - "loss": 0.0127, + "epoch": 0.42, + "learning_rate": 0.0002365637498995544, + "loss": 0.0191, "step": 163150 }, { - "epoch": 0.82, - "learning_rate": 0.00017652552078340755, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023655986168318293, + "loss": 0.0176, "step": 163160 }, { - "epoch": 0.82, - "learning_rate": 0.00017651795309039356, - "loss": 0.014, + "epoch": 0.42, + "learning_rate": 0.00023655597346681147, + "loss": 0.021, "step": 163170 }, { - "epoch": 0.82, - "learning_rate": 0.00017651038539737954, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023655208525044, + "loss": 0.0187, "step": 163180 }, { - "epoch": 0.82, - "learning_rate": 0.00017650281770436552, - "loss": 0.0139, + "epoch": 0.42, + "learning_rate": 0.00023654819703406853, + "loss": 0.02, "step": 163190 }, { - "epoch": 0.82, - "learning_rate": 0.00017649525001135153, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.00023654430881769707, + "loss": 0.0199, "step": 163200 }, { - "epoch": 0.82, - "learning_rate": 0.0001764876823183375, - "loss": 0.0113, + "epoch": 0.42, + "learning_rate": 0.00023654042060132561, + "loss": 0.0216, "step": 163210 }, { - "epoch": 0.82, - "learning_rate": 0.0001764801146253235, - "loss": 0.0175, + "epoch": 0.42, + "learning_rate": 0.00023653653238495413, + "loss": 0.0217, "step": 163220 }, { - "epoch": 0.82, - "learning_rate": 0.0001764725469323095, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.00023653264416858267, + "loss": 0.0178, "step": 163230 }, { - "epoch": 0.82, - "learning_rate": 0.00017646497923929548, - "loss": 0.0146, + "epoch": 0.42, + "learning_rate": 0.0002365287559522112, + "loss": 0.0177, "step": 163240 }, { - "epoch": 0.82, - "learning_rate": 0.00017645741154628146, - "loss": 0.0101, + "epoch": 0.42, + "learning_rate": 0.00023652486773583975, + "loss": 0.0188, "step": 163250 }, { - "epoch": 0.82, - "learning_rate": 0.00017644984385326745, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023652097951946827, + "loss": 0.015, "step": 163260 }, { - "epoch": 0.82, - "learning_rate": 0.00017644227616025345, - "loss": 0.0115, + "epoch": 0.42, + "learning_rate": 0.0002365170913030968, + "loss": 0.0195, "step": 163270 }, { - "epoch": 0.82, - "learning_rate": 0.00017643470846723944, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023651320308672532, + "loss": 0.018, "step": 163280 }, { - "epoch": 0.82, - "learning_rate": 0.00017642714077422542, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.0002365093148703539, + "loss": 0.0173, "step": 163290 }, { - "epoch": 0.82, - "learning_rate": 0.00017641957308121143, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.00023650542665398243, + "loss": 0.0207, "step": 163300 }, { - "epoch": 0.82, - "learning_rate": 0.0001764120053881974, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023650153843761095, + "loss": 0.018, "step": 163310 }, { - "epoch": 0.82, - "learning_rate": 0.0001764044376951834, - "loss": 0.0151, + "epoch": 0.42, + "learning_rate": 0.00023649765022123946, + "loss": 0.0202, "step": 163320 }, { - "epoch": 0.82, - "learning_rate": 0.0001763968700021694, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.00023649376200486803, + "loss": 0.0223, "step": 163330 }, { - "epoch": 0.82, - "learning_rate": 0.00017638930230915538, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023648987378849657, + "loss": 0.0199, "step": 163340 }, { - "epoch": 0.82, - "learning_rate": 0.00017638173461614136, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.0002364859855721251, + "loss": 0.0181, "step": 163350 }, { - "epoch": 0.82, - "learning_rate": 0.00017637416692312737, - "loss": 0.0176, + "epoch": 0.42, + "learning_rate": 0.00023648209735575363, + "loss": 0.0219, "step": 163360 }, { - "epoch": 0.82, - "learning_rate": 0.00017636659923011335, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023647820913938217, + "loss": 0.0181, "step": 163370 }, { - "epoch": 0.82, - "learning_rate": 0.00017635903153709933, - "loss": 0.0107, + "epoch": 0.42, + "learning_rate": 0.0002364743209230107, + "loss": 0.0191, "step": 163380 }, { - "epoch": 0.82, - "learning_rate": 0.00017635146384408534, - "loss": 0.0144, + "epoch": 0.42, + "learning_rate": 0.00023647043270663923, + "loss": 0.0176, "step": 163390 }, { - "epoch": 0.82, - "learning_rate": 0.00017634389615107132, - "loss": 0.0103, + "epoch": 0.42, + "learning_rate": 0.00023646654449026777, + "loss": 0.0225, "step": 163400 }, { - "epoch": 0.82, - "learning_rate": 0.0001763363284580573, - "loss": 0.0186, + "epoch": 0.42, + "learning_rate": 0.0002364626562738963, + "loss": 0.0244, "step": 163410 }, { - "epoch": 0.82, - "learning_rate": 0.0001763287607650433, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023645876805752485, + "loss": 0.0147, "step": 163420 }, { - "epoch": 0.82, - "learning_rate": 0.0001763211930720293, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023645487984115337, + "loss": 0.0217, "step": 163430 }, { - "epoch": 0.82, - "learning_rate": 0.00017631362537901527, - "loss": 0.0124, + "epoch": 0.42, + "learning_rate": 0.0002364509916247819, + "loss": 0.0198, "step": 163440 }, { - "epoch": 0.82, - "learning_rate": 0.00017630605768600126, - "loss": 0.0119, + "epoch": 0.42, + "learning_rate": 0.00023644710340841048, + "loss": 0.0204, "step": 163450 }, { - "epoch": 0.82, - "learning_rate": 0.00017629848999298726, - "loss": 0.0149, + "epoch": 0.42, + "learning_rate": 0.000236443215192039, + "loss": 0.0188, "step": 163460 }, { - "epoch": 0.82, - "learning_rate": 0.00017629092229997325, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.0002364393269756675, + "loss": 0.0245, "step": 163470 }, { - "epoch": 0.82, - "learning_rate": 0.00017628335460695923, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023643543875929605, + "loss": 0.0248, "step": 163480 }, { - "epoch": 0.82, - "learning_rate": 0.00017627578691394524, - "loss": 0.011, + "epoch": 0.42, + "learning_rate": 0.00023643155054292462, + "loss": 0.0224, "step": 163490 }, { - "epoch": 0.82, - "learning_rate": 0.00017626821922093122, - "loss": 0.0104, + "epoch": 0.42, + "learning_rate": 0.00023642766232655313, + "loss": 0.0174, "step": 163500 }, { - "epoch": 0.82, - "learning_rate": 0.0001762606515279172, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023642377411018167, + "loss": 0.0202, "step": 163510 }, { - "epoch": 0.82, - "learning_rate": 0.0001762530838349032, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.0002364198858938102, + "loss": 0.0213, "step": 163520 }, { - "epoch": 0.83, - "learning_rate": 0.0001762455161418892, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.00023641599767743873, + "loss": 0.0194, "step": 163530 }, { - "epoch": 0.83, - "learning_rate": 0.00017623794844887517, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.00023641210946106727, + "loss": 0.0191, "step": 163540 }, { - "epoch": 0.83, - "learning_rate": 0.00017623038075586118, - "loss": 0.0114, + "epoch": 0.42, + "learning_rate": 0.0002364082212446958, + "loss": 0.0247, "step": 163550 }, { - "epoch": 0.83, - "learning_rate": 0.00017622281306284716, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023640433302832433, + "loss": 0.0207, "step": 163560 }, { - "epoch": 0.83, - "learning_rate": 0.00017621524536983314, - "loss": 0.0081, + "epoch": 0.42, + "learning_rate": 0.00023640044481195287, + "loss": 0.0187, "step": 163570 }, { - "epoch": 0.83, - "learning_rate": 0.00017620767767681915, - "loss": 0.0116, + "epoch": 0.42, + "learning_rate": 0.0002363965565955814, + "loss": 0.02, "step": 163580 }, { - "epoch": 0.83, - "learning_rate": 0.00017620010998380513, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023639266837920995, + "loss": 0.0221, "step": 163590 }, { - "epoch": 0.83, - "learning_rate": 0.0001761925422907911, - "loss": 0.0126, + "epoch": 0.42, + "learning_rate": 0.00023638878016283847, + "loss": 0.0211, "step": 163600 }, { - "epoch": 0.83, - "learning_rate": 0.0001761849745977771, - "loss": 0.0111, + "epoch": 0.42, + "learning_rate": 0.000236384891946467, + "loss": 0.0171, "step": 163610 }, { - "epoch": 0.83, - "learning_rate": 0.0001761774069047631, - "loss": 0.0096, + "epoch": 0.42, + "learning_rate": 0.00023638100373009558, + "loss": 0.032, "step": 163620 }, { - "epoch": 0.83, - "learning_rate": 0.00017616983921174908, - "loss": 0.01, + "epoch": 0.42, + "learning_rate": 0.0002363771155137241, + "loss": 0.0301, "step": 163630 }, { - "epoch": 0.83, - "learning_rate": 0.00017616227151873507, - "loss": 0.0098, + "epoch": 0.42, + "learning_rate": 0.0002363732272973526, + "loss": 0.0198, "step": 163640 }, { - "epoch": 0.83, - "learning_rate": 0.00017615470382572107, - "loss": 0.0147, + "epoch": 0.42, + "learning_rate": 0.00023636933908098115, + "loss": 0.014, "step": 163650 }, { - "epoch": 0.83, - "learning_rate": 0.00017614713613270706, - "loss": 0.0122, + "epoch": 0.42, + "learning_rate": 0.00023636545086460972, + "loss": 0.0197, "step": 163660 }, { - "epoch": 0.83, - "learning_rate": 0.00017613956843969304, - "loss": 0.0112, + "epoch": 0.42, + "learning_rate": 0.00023636156264823823, + "loss": 0.0213, "step": 163670 }, { - "epoch": 0.83, - "learning_rate": 0.00017613200074667905, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023635767443186677, + "loss": 0.0198, "step": 163680 }, { - "epoch": 0.83, - "learning_rate": 0.00017612443305366503, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.0002363537862154953, + "loss": 0.0191, "step": 163690 }, { - "epoch": 0.83, - "learning_rate": 0.000176116865360651, - "loss": 0.013, + "epoch": 0.42, + "learning_rate": 0.00023634989799912386, + "loss": 0.0169, "step": 163700 }, { - "epoch": 0.83, - "learning_rate": 0.00017610929766763702, - "loss": 0.0121, + "epoch": 0.42, + "learning_rate": 0.00023634600978275237, + "loss": 0.0214, "step": 163710 }, { - "epoch": 0.83, - "learning_rate": 0.000176101729974623, - "loss": 0.0133, + "epoch": 0.42, + "learning_rate": 0.0002363421215663809, + "loss": 0.0211, "step": 163720 }, { - "epoch": 0.83, - "learning_rate": 0.00017609416228160898, - "loss": 0.0118, + "epoch": 0.42, + "learning_rate": 0.00023633823335000943, + "loss": 0.018, "step": 163730 }, { - "epoch": 0.83, - "learning_rate": 0.000176086594588595, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.000236334345133638, + "loss": 0.0208, "step": 163740 }, { - "epoch": 0.83, - "learning_rate": 0.00017607902689558097, - "loss": 0.0129, + "epoch": 0.42, + "learning_rate": 0.0002363304569172665, + "loss": 0.0175, "step": 163750 }, { - "epoch": 0.83, - "learning_rate": 0.00017607145920256695, - "loss": 0.012, + "epoch": 0.42, + "learning_rate": 0.00023632656870089505, + "loss": 0.0211, "step": 163760 }, { - "epoch": 0.83, - "learning_rate": 0.00017606389150955293, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023632268048452357, + "loss": 0.0181, "step": 163770 }, { - "epoch": 0.83, - "learning_rate": 0.00017605632381653894, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.0002363187922681521, + "loss": 0.0223, "step": 163780 }, { - "epoch": 0.83, - "learning_rate": 0.00017604875612352492, - "loss": 0.0206, + "epoch": 0.42, + "learning_rate": 0.00023631490405178065, + "loss": 0.0177, "step": 163790 }, { - "epoch": 0.83, - "learning_rate": 0.0001760411884305109, - "loss": 0.0131, + "epoch": 0.42, + "learning_rate": 0.0002363110158354092, + "loss": 0.0194, "step": 163800 }, { - "epoch": 0.83, - "learning_rate": 0.0001760336207374969, - "loss": 0.0162, + "epoch": 0.42, + "learning_rate": 0.0002363071276190377, + "loss": 0.0203, "step": 163810 }, { - "epoch": 0.83, - "learning_rate": 0.0001760260530444829, - "loss": 0.0125, + "epoch": 0.42, + "learning_rate": 0.00023630323940266625, + "loss": 0.0139, "step": 163820 }, { - "epoch": 0.83, - "learning_rate": 0.00017601848535146888, - "loss": 0.0117, + "epoch": 0.42, + "learning_rate": 0.00023629935118629482, + "loss": 0.0236, "step": 163830 }, { - "epoch": 0.83, - "learning_rate": 0.00017601091765845488, - "loss": 0.0132, + "epoch": 0.42, + "learning_rate": 0.00023629546296992333, + "loss": 0.02, "step": 163840 }, { - "epoch": 0.83, - "learning_rate": 0.00017600334996544087, - "loss": 0.0109, + "epoch": 0.42, + "learning_rate": 0.00023629157475355187, + "loss": 0.0163, "step": 163850 }, { - "epoch": 0.83, - "learning_rate": 0.00017599578227242685, - "loss": 0.0156, + "epoch": 0.42, + "learning_rate": 0.0002362876865371804, + "loss": 0.0183, "step": 163860 }, { - "epoch": 0.83, - "learning_rate": 0.00017598821457941286, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023628379832080896, + "loss": 0.0223, "step": 163870 }, { - "epoch": 0.83, - "learning_rate": 0.00017598064688639884, - "loss": 0.0145, + "epoch": 0.42, + "learning_rate": 0.00023627991010443747, + "loss": 0.0246, "step": 163880 }, { - "epoch": 0.83, - "learning_rate": 0.00017597307919338482, - "loss": 0.0128, + "epoch": 0.42, + "learning_rate": 0.000236276021888066, + "loss": 0.0154, "step": 163890 }, { - "epoch": 0.83, - "learning_rate": 0.00017596551150037083, - "loss": 0.0138, + "epoch": 0.42, + "learning_rate": 0.00023627213367169453, + "loss": 0.0198, "step": 163900 }, { - "epoch": 0.83, - "learning_rate": 0.0001759579438073568, - "loss": 0.0102, + "epoch": 0.42, + "learning_rate": 0.0002362682454553231, + "loss": 0.0202, "step": 163910 }, { - "epoch": 0.83, - "learning_rate": 0.0001759503761143428, - "loss": 0.016, + "epoch": 0.42, + "learning_rate": 0.0002362643572389516, + "loss": 0.0222, "step": 163920 }, { - "epoch": 0.83, - "learning_rate": 0.0001759428084213288, - "loss": 0.016, + "epoch": 0.42, + "learning_rate": 0.00023626046902258015, + "loss": 0.0203, "step": 163930 }, { - "epoch": 0.83, - "learning_rate": 0.00017593524072831478, - "loss": 0.0106, + "epoch": 0.42, + "learning_rate": 0.00023625658080620867, + "loss": 0.0202, "step": 163940 }, { - "epoch": 0.83, - "learning_rate": 0.00017592767303530076, - "loss": 0.0141, + "epoch": 0.42, + "learning_rate": 0.00023625269258983723, + "loss": 0.0308, "step": 163950 }, { - "epoch": 0.83, - "learning_rate": 0.00017592010534228674, - "loss": 0.0091, + "epoch": 0.43, + "learning_rate": 0.00023624880437346575, + "loss": 0.0221, "step": 163960 }, { - "epoch": 0.83, - "learning_rate": 0.00017591253764927275, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.0002362449161570943, + "loss": 0.0198, "step": 163970 }, { - "epoch": 0.83, - "learning_rate": 0.00017590496995625873, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.0002362410279407228, + "loss": 0.02, "step": 163980 }, { - "epoch": 0.83, - "learning_rate": 0.00017589740226324471, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.00023623713972435137, + "loss": 0.0207, "step": 163990 }, { - "epoch": 0.83, - "learning_rate": 0.00017588983457023072, - "loss": 0.0148, + "epoch": 0.43, + "learning_rate": 0.00023623325150797992, + "loss": 0.0232, "step": 164000 }, { - "epoch": 0.83, - "eval_cer": 0.914481900656667, - "eval_loss": 0.009098981507122517, - "eval_runtime": 116.6318, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.43, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.012865516357123852, + "eval_runtime": 107.376, + "eval_samples_per_second": 18.626, + "eval_steps_per_second": 4.657, "step": 164000 }, { - "epoch": 0.83, - "learning_rate": 0.0001758822668772167, - "loss": 0.0169, + "epoch": 0.43, + "learning_rate": 0.00023622936329160843, + "loss": 0.0242, "step": 164010 }, { - "epoch": 0.83, - "learning_rate": 0.00017587469918420269, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.00023622547507523697, + "loss": 0.0177, "step": 164020 }, { - "epoch": 0.83, - "learning_rate": 0.00017586713149118864, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023622158685886549, + "loss": 0.0212, "step": 164030 }, { - "epoch": 0.83, - "learning_rate": 0.00017585956379817465, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023621769864249405, + "loss": 0.0168, "step": 164040 }, { - "epoch": 0.83, - "learning_rate": 0.00017585199610516063, - "loss": 0.0092, + "epoch": 0.43, + "learning_rate": 0.00023621381042612257, + "loss": 0.0172, "step": 164050 }, { - "epoch": 0.83, - "learning_rate": 0.0001758444284121466, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.0002362099222097511, + "loss": 0.0189, "step": 164060 }, { - "epoch": 0.83, - "learning_rate": 0.00017583686071913262, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023620603399337963, + "loss": 0.0159, "step": 164070 }, { - "epoch": 0.83, - "learning_rate": 0.0001758292930261186, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.0002362021457770082, + "loss": 0.017, "step": 164080 }, { - "epoch": 0.83, - "learning_rate": 0.00017582172533310458, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002361982575606367, + "loss": 0.0186, "step": 164090 }, { - "epoch": 0.83, - "learning_rate": 0.0001758141576400906, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023619436934426525, + "loss": 0.0181, "step": 164100 }, { - "epoch": 0.83, - "learning_rate": 0.00017580658994707657, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023619048112789376, + "loss": 0.0147, "step": 164110 }, { - "epoch": 0.83, - "learning_rate": 0.00017579902225406255, - "loss": 0.0085, + "epoch": 0.43, + "learning_rate": 0.00023618659291152233, + "loss": 0.0163, "step": 164120 }, { - "epoch": 0.83, - "learning_rate": 0.00017579145456104856, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023618270469515085, + "loss": 0.0173, "step": 164130 }, { - "epoch": 0.83, - "learning_rate": 0.00017578388686803454, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.0002361788164787794, + "loss": 0.0176, "step": 164140 }, { - "epoch": 0.83, - "learning_rate": 0.00017577631917502053, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002361749282624079, + "loss": 0.0204, "step": 164150 }, { - "epoch": 0.83, - "learning_rate": 0.0001757687514820065, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.00023617104004603647, + "loss": 0.0195, "step": 164160 }, { - "epoch": 0.83, - "learning_rate": 0.00017576118378899252, - "loss": 0.0162, + "epoch": 0.43, + "learning_rate": 0.00023616715182966501, + "loss": 0.0208, "step": 164170 }, { - "epoch": 0.83, - "learning_rate": 0.0001757536160959785, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023616326361329353, + "loss": 0.02, "step": 164180 }, { - "epoch": 0.83, - "learning_rate": 0.00017574604840296448, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023615937539692204, + "loss": 0.0198, "step": 164190 }, { - "epoch": 0.83, - "learning_rate": 0.0001757384807099505, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.0002361554871805506, + "loss": 0.0178, "step": 164200 }, { - "epoch": 0.83, - "learning_rate": 0.00017573091301693647, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023615159896417915, + "loss": 0.0147, "step": 164210 }, { - "epoch": 0.83, - "learning_rate": 0.00017572334532392245, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023614771074780767, + "loss": 0.0185, "step": 164220 }, { - "epoch": 0.83, - "learning_rate": 0.00017571577763090846, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002361438225314362, + "loss": 0.0192, "step": 164230 }, { - "epoch": 0.83, - "learning_rate": 0.00017570820993789444, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023613993431506475, + "loss": 0.0231, "step": 164240 }, { - "epoch": 0.83, - "learning_rate": 0.00017570064224488042, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.0002361360460986933, + "loss": 0.0197, "step": 164250 }, { - "epoch": 0.83, - "learning_rate": 0.00017569307455186643, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.0002361321578823218, + "loss": 0.0159, "step": 164260 }, { - "epoch": 0.83, - "learning_rate": 0.0001756855068588524, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.00023612826966595035, + "loss": 0.0188, "step": 164270 }, { - "epoch": 0.83, - "learning_rate": 0.0001756779391658384, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023612438144957886, + "loss": 0.0216, "step": 164280 }, { - "epoch": 0.83, - "learning_rate": 0.0001756703714728244, - "loss": 0.0101, + "epoch": 0.43, + "learning_rate": 0.00023612049323320743, + "loss": 0.0205, "step": 164290 }, { - "epoch": 0.83, - "learning_rate": 0.00017566280377981038, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.00023611660501683595, + "loss": 0.0206, "step": 164300 }, { - "epoch": 0.83, - "learning_rate": 0.00017565523608679636, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.0002361127168004645, + "loss": 0.016, "step": 164310 }, { - "epoch": 0.83, - "learning_rate": 0.00017564766839378237, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.000236108828584093, + "loss": 0.0152, "step": 164320 }, { - "epoch": 0.83, - "learning_rate": 0.00017564010070076835, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023610494036772157, + "loss": 0.0216, "step": 164330 }, { - "epoch": 0.83, - "learning_rate": 0.00017563253300775434, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023610105215135011, + "loss": 0.0196, "step": 164340 }, { - "epoch": 0.83, - "learning_rate": 0.00017562496531474032, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.00023609716393497863, + "loss": 0.0174, "step": 164350 }, { - "epoch": 0.83, - "learning_rate": 0.00017561739762172633, - "loss": 0.0148, + "epoch": 0.43, + "learning_rate": 0.00023609327571860714, + "loss": 0.0198, "step": 164360 }, { - "epoch": 0.83, - "learning_rate": 0.0001756098299287123, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002360893875022357, + "loss": 0.0209, "step": 164370 }, { - "epoch": 0.83, - "learning_rate": 0.0001756022622356983, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023608549928586425, + "loss": 0.0196, "step": 164380 }, { - "epoch": 0.83, - "learning_rate": 0.0001755946945426843, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023608161106949277, + "loss": 0.0195, "step": 164390 }, { - "epoch": 0.83, - "learning_rate": 0.00017558712684967028, - "loss": 0.0101, + "epoch": 0.43, + "learning_rate": 0.0002360777228531213, + "loss": 0.0191, "step": 164400 }, { - "epoch": 0.83, - "learning_rate": 0.00017557955915665626, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023607383463674985, + "loss": 0.0145, "step": 164410 }, { - "epoch": 0.83, - "learning_rate": 0.00017557199146364227, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002360699464203784, + "loss": 0.0182, "step": 164420 }, { - "epoch": 0.83, - "learning_rate": 0.00017556442377062825, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.0002360660582040069, + "loss": 0.0206, "step": 164430 }, { - "epoch": 0.83, - "learning_rate": 0.00017555685607761423, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023606216998763545, + "loss": 0.0152, "step": 164440 }, { - "epoch": 0.83, - "learning_rate": 0.00017554928838460024, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.000236058281771264, + "loss": 0.0185, "step": 164450 }, { - "epoch": 0.83, - "learning_rate": 0.00017554172069158622, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023605439355489253, + "loss": 0.019, "step": 164460 }, { - "epoch": 0.83, - "learning_rate": 0.0001755341529985722, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023605050533852105, + "loss": 0.0172, "step": 164470 }, { - "epoch": 0.83, - "learning_rate": 0.0001755265853055582, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.0002360466171221496, + "loss": 0.0165, "step": 164480 }, { - "epoch": 0.83, - "learning_rate": 0.0001755190176125442, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023604272890577816, + "loss": 0.0197, "step": 164490 }, { - "epoch": 0.83, - "learning_rate": 0.00017551144991953017, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023603884068940667, + "loss": 0.0176, "step": 164500 }, { - "epoch": 0.83, - "learning_rate": 0.00017550388222651616, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.0002360349524730352, + "loss": 0.0171, "step": 164510 }, { - "epoch": 0.83, - "learning_rate": 0.00017549631453350216, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023603106425666373, + "loss": 0.0199, "step": 164520 }, { - "epoch": 0.83, - "learning_rate": 0.00017548874684048815, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023602717604029224, + "loss": 0.0158, "step": 164530 }, { - "epoch": 0.83, - "learning_rate": 0.00017548117914747413, - "loss": 0.0083, + "epoch": 0.43, + "learning_rate": 0.0002360232878239208, + "loss": 0.0179, "step": 164540 }, { - "epoch": 0.83, - "learning_rate": 0.00017547361145446014, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023601939960754935, + "loss": 0.0195, "step": 164550 }, { - "epoch": 0.83, - "learning_rate": 0.00017546604376144612, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023601551139117787, + "loss": 0.0164, "step": 164560 }, { - "epoch": 0.83, - "learning_rate": 0.0001754584760684321, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002360116231748064, + "loss": 0.0142, "step": 164570 }, { - "epoch": 0.83, - "learning_rate": 0.0001754509083754181, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023600773495843495, + "loss": 0.0159, "step": 164580 }, { - "epoch": 0.83, - "learning_rate": 0.0001754433406824041, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.0002360038467420635, + "loss": 0.0182, "step": 164590 }, { - "epoch": 0.83, - "learning_rate": 0.00017543577298939007, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.000235999958525692, + "loss": 0.0196, "step": 164600 }, { - "epoch": 0.83, - "learning_rate": 0.00017542820529637608, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.00023599607030932055, + "loss": 0.0216, "step": 164610 }, { - "epoch": 0.83, - "learning_rate": 0.00017542063760336206, - "loss": 0.016, + "epoch": 0.43, + "learning_rate": 0.0002359921820929491, + "loss": 0.0217, "step": 164620 }, { - "epoch": 0.83, - "learning_rate": 0.00017541306991034804, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.00023598829387657763, + "loss": 0.0224, "step": 164630 }, { - "epoch": 0.83, - "learning_rate": 0.00017540550221733405, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023598440566020615, + "loss": 0.0166, "step": 164640 }, { - "epoch": 0.83, - "learning_rate": 0.00017539793452432003, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002359805174438347, + "loss": 0.0206, "step": 164650 }, { - "epoch": 0.83, - "learning_rate": 0.000175390366831306, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023597662922746323, + "loss": 0.0191, "step": 164660 }, { - "epoch": 0.83, - "learning_rate": 0.000175382799138292, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.00023597274101109177, + "loss": 0.0213, "step": 164670 }, { - "epoch": 0.83, - "learning_rate": 0.000175375231445278, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.00023596885279472029, + "loss": 0.0157, "step": 164680 }, { - "epoch": 0.83, - "learning_rate": 0.00017536766375226398, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023596496457834883, + "loss": 0.0219, "step": 164690 }, { - "epoch": 0.83, - "learning_rate": 0.00017536009605924997, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.0002359610763619774, + "loss": 0.0183, "step": 164700 }, { - "epoch": 0.83, - "learning_rate": 0.00017535252836623597, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.0002359571881456059, + "loss": 0.0186, "step": 164710 }, { - "epoch": 0.83, - "learning_rate": 0.00017534496067322196, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.00023595329992923445, + "loss": 0.027, "step": 164720 }, { - "epoch": 0.83, - "learning_rate": 0.00017533739298020794, - "loss": 0.0095, + "epoch": 0.43, + "learning_rate": 0.00023594941171286297, + "loss": 0.02, "step": 164730 }, { - "epoch": 0.83, - "learning_rate": 0.00017532982528719395, - "loss": 0.0147, + "epoch": 0.43, + "learning_rate": 0.00023594552349649154, + "loss": 0.0167, "step": 164740 }, { - "epoch": 0.83, - "learning_rate": 0.00017532225759417993, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023594163528012005, + "loss": 0.017, "step": 164750 }, { - "epoch": 0.83, - "learning_rate": 0.0001753146899011659, - "loss": 0.0159, + "epoch": 0.43, + "learning_rate": 0.0002359377470637486, + "loss": 0.0214, "step": 164760 }, { - "epoch": 0.83, - "learning_rate": 0.00017530712220815192, - "loss": 0.016, + "epoch": 0.43, + "learning_rate": 0.0002359338588473771, + "loss": 0.0223, "step": 164770 }, { - "epoch": 0.83, - "learning_rate": 0.0001752995545151379, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023592997063100565, + "loss": 0.0245, "step": 164780 }, { - "epoch": 0.83, - "learning_rate": 0.00017529198682212388, - "loss": 0.0161, + "epoch": 0.43, + "learning_rate": 0.0002359260824146342, + "loss": 0.0188, "step": 164790 }, { - "epoch": 0.83, - "learning_rate": 0.0001752844191291099, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023592219419826273, + "loss": 0.0228, "step": 164800 }, { - "epoch": 0.83, - "learning_rate": 0.00017527685143609587, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023591830598189125, + "loss": 0.018, "step": 164810 }, { - "epoch": 0.83, - "learning_rate": 0.00017526928374308185, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.0002359144177655198, + "loss": 0.0189, "step": 164820 }, { - "epoch": 0.83, - "learning_rate": 0.00017526171605006783, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023591052954914833, + "loss": 0.0187, "step": 164830 }, { - "epoch": 0.83, - "learning_rate": 0.00017525414835705384, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023590664133277687, + "loss": 0.0205, "step": 164840 }, { - "epoch": 0.83, - "learning_rate": 0.00017524658066403982, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023590275311640539, + "loss": 0.0218, "step": 164850 }, { - "epoch": 0.83, - "learning_rate": 0.0001752390129710258, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023589886490003393, + "loss": 0.0211, "step": 164860 }, { - "epoch": 0.83, - "learning_rate": 0.0001752314452780118, - "loss": 0.0146, + "epoch": 0.43, + "learning_rate": 0.0002358949766836625, + "loss": 0.0211, "step": 164870 }, { - "epoch": 0.83, - "learning_rate": 0.0001752238775849978, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.000235891088467291, + "loss": 0.0174, "step": 164880 }, { - "epoch": 0.83, - "learning_rate": 0.00017521630989198378, - "loss": 0.0146, + "epoch": 0.43, + "learning_rate": 0.00023588720025091955, + "loss": 0.0201, "step": 164890 }, { - "epoch": 0.83, - "learning_rate": 0.00017520874219896978, - "loss": 0.0109, + "epoch": 0.43, + "learning_rate": 0.00023588331203454807, + "loss": 0.0188, "step": 164900 }, { - "epoch": 0.83, - "learning_rate": 0.00017520117450595577, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.00023587942381817664, + "loss": 0.0188, "step": 164910 }, { - "epoch": 0.83, - "learning_rate": 0.00017519360681294175, - "loss": 0.0135, + "epoch": 0.43, + "learning_rate": 0.00023587553560180515, + "loss": 0.0241, "step": 164920 }, { - "epoch": 0.83, - "learning_rate": 0.00017518603911992776, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.0002358716473854337, + "loss": 0.0192, "step": 164930 }, { - "epoch": 0.83, - "learning_rate": 0.00017517847142691374, - "loss": 0.0097, + "epoch": 0.43, + "learning_rate": 0.0002358677591690622, + "loss": 0.024, "step": 164940 }, { - "epoch": 0.83, - "learning_rate": 0.00017517090373389972, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023586387095269077, + "loss": 0.0158, "step": 164950 }, { - "epoch": 0.83, - "learning_rate": 0.00017516333604088573, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.0002358599827363193, + "loss": 0.0174, "step": 164960 }, { - "epoch": 0.83, - "learning_rate": 0.0001751557683478717, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023585609451994783, + "loss": 0.0197, "step": 164970 }, { - "epoch": 0.83, - "learning_rate": 0.0001751482006548577, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.00023585220630357635, + "loss": 0.0201, "step": 164980 }, { - "epoch": 0.83, - "learning_rate": 0.0001751406329618437, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023584831808720491, + "loss": 0.0168, "step": 164990 }, { - "epoch": 0.83, - "learning_rate": 0.00017513306526882968, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023584442987083343, + "loss": 0.0178, "step": 165000 }, { - "epoch": 0.83, - "eval_cer": 0.9144586111496574, - "eval_loss": 0.008332598023116589, - "eval_runtime": 116.7175, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.43, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.013063205406069756, + "eval_runtime": 107.4075, + "eval_samples_per_second": 18.621, + "eval_steps_per_second": 4.655, "step": 165000 }, { - "epoch": 0.83, - "learning_rate": 0.00017512549757581566, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.00023584054165446197, + "loss": 0.0151, "step": 165010 }, { - "epoch": 0.83, - "learning_rate": 0.00017511792988280164, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023583665343809048, + "loss": 0.0214, "step": 165020 }, { - "epoch": 0.83, - "learning_rate": 0.00017511036218978765, - "loss": 0.0104, + "epoch": 0.43, + "learning_rate": 0.00023583276522171903, + "loss": 0.0214, "step": 165030 }, { - "epoch": 0.83, - "learning_rate": 0.00017510279449677363, - "loss": 0.0161, + "epoch": 0.43, + "learning_rate": 0.0002358288770053476, + "loss": 0.018, "step": 165040 }, { - "epoch": 0.83, - "learning_rate": 0.00017509522680375961, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.0002358249887889761, + "loss": 0.0195, "step": 165050 }, { - "epoch": 0.83, - "learning_rate": 0.00017508765911074562, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023582110057260462, + "loss": 0.02, "step": 165060 }, { - "epoch": 0.83, - "learning_rate": 0.0001750800914177316, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023581721235623317, + "loss": 0.0251, "step": 165070 }, { - "epoch": 0.83, - "learning_rate": 0.00017507252372471759, - "loss": 0.0106, + "epoch": 0.43, + "learning_rate": 0.00023581332413986173, + "loss": 0.019, "step": 165080 }, { - "epoch": 0.83, - "learning_rate": 0.0001750649560317036, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023580943592349025, + "loss": 0.0247, "step": 165090 }, { - "epoch": 0.83, - "learning_rate": 0.00017505738833868958, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.0002358055477071188, + "loss": 0.0161, "step": 165100 }, { - "epoch": 0.83, - "learning_rate": 0.00017504982064567556, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.0002358016594907473, + "loss": 0.0223, "step": 165110 }, { - "epoch": 0.83, - "learning_rate": 0.00017504225295266157, - "loss": 0.0129, - "step": 165120 + "epoch": 0.43, + "learning_rate": 0.00023579777127437587, + "loss": 0.0181, + "step": 165120 }, { - "epoch": 0.83, - "learning_rate": 0.00017503468525964755, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.0002357938830580044, + "loss": 0.0173, "step": 165130 }, { - "epoch": 0.83, - "learning_rate": 0.00017502711756663353, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023578999484163293, + "loss": 0.0205, "step": 165140 }, { - "epoch": 0.83, - "learning_rate": 0.00017501954987361954, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023578610662526144, + "loss": 0.0191, "step": 165150 }, { - "epoch": 0.83, - "learning_rate": 0.00017501198218060552, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023578221840889, + "loss": 0.016, "step": 165160 }, { - "epoch": 0.83, - "learning_rate": 0.0001750044144875915, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023577833019251853, + "loss": 0.0187, "step": 165170 }, { - "epoch": 0.83, - "learning_rate": 0.00017499684679457748, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.00023577444197614707, + "loss": 0.0209, "step": 165180 }, { - "epoch": 0.83, - "learning_rate": 0.0001749892791015635, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023577055375977558, + "loss": 0.0234, "step": 165190 }, { - "epoch": 0.83, - "learning_rate": 0.00017498171140854947, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023576666554340415, + "loss": 0.0176, "step": 165200 }, { - "epoch": 0.83, - "learning_rate": 0.00017497414371553545, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002357627773270327, + "loss": 0.0174, "step": 165210 }, { - "epoch": 0.83, - "learning_rate": 0.00017496657602252146, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.0002357588891106612, + "loss": 0.0178, "step": 165220 }, { - "epoch": 0.83, - "learning_rate": 0.00017495900832950744, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023575500089428972, + "loss": 0.0185, "step": 165230 }, { - "epoch": 0.83, - "learning_rate": 0.00017495144063649342, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023575111267791827, + "loss": 0.0173, "step": 165240 }, { - "epoch": 0.83, - "learning_rate": 0.00017494387294347943, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.00023574722446154683, + "loss": 0.0176, "step": 165250 }, { - "epoch": 0.83, - "learning_rate": 0.00017493630525046541, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023574333624517535, + "loss": 0.0193, "step": 165260 }, { - "epoch": 0.83, - "learning_rate": 0.0001749287375574514, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.0002357394480288039, + "loss": 0.0219, "step": 165270 }, { - "epoch": 0.83, - "learning_rate": 0.0001749211698644374, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.0002357355598124324, + "loss": 0.02, "step": 165280 }, { - "epoch": 0.83, - "learning_rate": 0.00017491360217142336, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023573167159606097, + "loss": 0.0199, "step": 165290 }, { - "epoch": 0.83, - "learning_rate": 0.00017490603447840934, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.0002357277833796895, + "loss": 0.0185, "step": 165300 }, { - "epoch": 0.83, - "learning_rate": 0.00017489846678539532, - "loss": 0.0081, + "epoch": 0.43, + "learning_rate": 0.00023572389516331803, + "loss": 0.0228, "step": 165310 }, { - "epoch": 0.83, - "learning_rate": 0.00017489089909238133, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023572000694694654, + "loss": 0.0217, "step": 165320 }, { - "epoch": 0.83, - "learning_rate": 0.0001748833313993673, - "loss": 0.0095, + "epoch": 0.43, + "learning_rate": 0.0002357161187305751, + "loss": 0.0228, "step": 165330 }, { - "epoch": 0.83, - "learning_rate": 0.0001748757637063533, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.00023571223051420363, + "loss": 0.0172, "step": 165340 }, { - "epoch": 0.83, - "learning_rate": 0.0001748681960133393, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023570834229783217, + "loss": 0.0168, "step": 165350 }, { - "epoch": 0.83, - "learning_rate": 0.00017486062832032528, - "loss": 0.0095, + "epoch": 0.43, + "learning_rate": 0.00023570445408146068, + "loss": 0.0174, "step": 165360 }, { - "epoch": 0.83, - "learning_rate": 0.00017485306062731126, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.00023570056586508925, + "loss": 0.0258, "step": 165370 }, { - "epoch": 0.83, - "learning_rate": 0.00017484549293429727, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023569667764871777, + "loss": 0.0146, "step": 165380 }, { - "epoch": 0.83, - "learning_rate": 0.00017483792524128325, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.0002356927894323463, + "loss": 0.0167, "step": 165390 }, { - "epoch": 0.83, - "learning_rate": 0.00017483035754826924, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023568890121597482, + "loss": 0.0177, "step": 165400 }, { - "epoch": 0.83, - "learning_rate": 0.00017482278985525522, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002356850129996034, + "loss": 0.0147, "step": 165410 }, { - "epoch": 0.83, - "learning_rate": 0.00017481522216224123, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.00023568112478323193, + "loss": 0.0166, "step": 165420 }, { - "epoch": 0.83, - "learning_rate": 0.0001748076544692272, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.00023567723656686045, + "loss": 0.0205, "step": 165430 }, { - "epoch": 0.83, - "learning_rate": 0.0001748000867762132, - "loss": 0.0156, + "epoch": 0.43, + "learning_rate": 0.000235673348350489, + "loss": 0.0204, "step": 165440 }, { - "epoch": 0.83, - "learning_rate": 0.0001747925190831992, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023566946013411753, + "loss": 0.0186, "step": 165450 }, { - "epoch": 0.83, - "learning_rate": 0.00017478495139018518, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023566557191774607, + "loss": 0.0138, "step": 165460 }, { - "epoch": 0.83, - "learning_rate": 0.00017477738369717116, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002356616837013746, + "loss": 0.015, "step": 165470 }, { - "epoch": 0.83, - "learning_rate": 0.00017476981600415717, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023565779548500313, + "loss": 0.0178, "step": 165480 }, { - "epoch": 0.83, - "learning_rate": 0.00017476224831114315, - "loss": 0.0091, + "epoch": 0.43, + "learning_rate": 0.00023565390726863164, + "loss": 0.0237, "step": 165490 }, { - "epoch": 0.83, - "learning_rate": 0.00017475468061812913, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.0002356500190522602, + "loss": 0.0173, "step": 165500 }, { - "epoch": 0.84, - "learning_rate": 0.00017474711292511514, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023564613083588873, + "loss": 0.0191, "step": 165510 }, { - "epoch": 0.84, - "learning_rate": 0.00017473954523210112, - "loss": 0.0131, + "epoch": 0.43, + "learning_rate": 0.00023564224261951727, + "loss": 0.0223, "step": 165520 }, { - "epoch": 0.84, - "learning_rate": 0.0001747319775390871, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023563835440314578, + "loss": 0.0236, "step": 165530 }, { - "epoch": 0.84, - "learning_rate": 0.0001747244098460731, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.00023563446618677435, + "loss": 0.0214, "step": 165540 }, { - "epoch": 0.84, - "learning_rate": 0.0001747168421530591, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023563057797040287, + "loss": 0.0201, "step": 165550 }, { - "epoch": 0.84, - "learning_rate": 0.00017470927446004507, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002356266897540314, + "loss": 0.0189, "step": 165560 }, { - "epoch": 0.84, - "learning_rate": 0.00017470170676703106, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023562280153765992, + "loss": 0.0194, "step": 165570 }, { - "epoch": 0.84, - "learning_rate": 0.00017469413907401706, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.0002356189133212885, + "loss": 0.0153, "step": 165580 }, { - "epoch": 0.84, - "learning_rate": 0.00017468657138100305, - "loss": 0.0184, + "epoch": 0.43, + "learning_rate": 0.00023561502510491703, + "loss": 0.0171, "step": 165590 }, { - "epoch": 0.84, - "learning_rate": 0.00017467900368798903, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023561113688854555, + "loss": 0.0172, "step": 165600 }, { - "epoch": 0.84, - "learning_rate": 0.00017467143599497504, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.0002356072486721741, + "loss": 0.0217, "step": 165610 }, { - "epoch": 0.84, - "learning_rate": 0.00017466386830196102, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023560336045580263, + "loss": 0.0167, "step": 165620 }, { - "epoch": 0.84, - "learning_rate": 0.000174656300608947, - "loss": 0.0095, + "epoch": 0.43, + "learning_rate": 0.00023559947223943117, + "loss": 0.015, "step": 165630 }, { - "epoch": 0.84, - "learning_rate": 0.000174648732915933, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.0002355955840230597, + "loss": 0.0194, "step": 165640 }, { - "epoch": 0.84, - "learning_rate": 0.000174641165222919, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023559169580668823, + "loss": 0.0203, "step": 165650 }, { - "epoch": 0.84, - "learning_rate": 0.00017463359752990497, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.00023558780759031677, + "loss": 0.0207, "step": 165660 }, { - "epoch": 0.84, - "learning_rate": 0.00017462602983689098, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.0002355839193739453, + "loss": 0.0175, "step": 165670 }, { - "epoch": 0.84, - "learning_rate": 0.00017461846214387696, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.00023558003115757383, + "loss": 0.021, "step": 165680 }, { - "epoch": 0.84, - "learning_rate": 0.00017461089445086294, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023557614294120237, + "loss": 0.0191, "step": 165690 }, { - "epoch": 0.84, - "learning_rate": 0.00017460332675784895, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.0002355722547248309, + "loss": 0.02, "step": 165700 }, { - "epoch": 0.84, - "learning_rate": 0.00017459575906483493, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023556836650845945, + "loss": 0.0192, "step": 165710 }, { - "epoch": 0.84, - "learning_rate": 0.0001745881913718209, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.00023556447829208797, + "loss": 0.0195, "step": 165720 }, { - "epoch": 0.84, - "learning_rate": 0.0001745806236788069, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002355605900757165, + "loss": 0.0201, "step": 165730 }, { - "epoch": 0.84, - "learning_rate": 0.0001745730559857929, - "loss": 0.0161, + "epoch": 0.43, + "learning_rate": 0.00023555670185934502, + "loss": 0.0187, "step": 165740 }, { - "epoch": 0.84, - "learning_rate": 0.00017456548829277888, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.0002355528136429736, + "loss": 0.0194, "step": 165750 }, { - "epoch": 0.84, - "learning_rate": 0.00017455792059976487, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023554892542660213, + "loss": 0.021, "step": 165760 }, { - "epoch": 0.84, - "learning_rate": 0.00017455035290675087, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023554503721023065, + "loss": 0.0194, "step": 165770 }, { - "epoch": 0.84, - "learning_rate": 0.00017454278521373686, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.00023554114899385916, + "loss": 0.0143, "step": 165780 }, { - "epoch": 0.84, - "learning_rate": 0.00017453521752072284, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.00023553726077748773, + "loss": 0.0205, "step": 165790 }, { - "epoch": 0.84, - "learning_rate": 0.00017452764982770885, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023553337256111627, + "loss": 0.0194, "step": 165800 }, { - "epoch": 0.84, - "learning_rate": 0.00017452008213469483, - "loss": 0.0095, + "epoch": 0.43, + "learning_rate": 0.00023552948434474479, + "loss": 0.0189, "step": 165810 }, { - "epoch": 0.84, - "learning_rate": 0.0001745125144416808, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023552559612837333, + "loss": 0.0227, "step": 165820 }, { - "epoch": 0.84, - "learning_rate": 0.00017450494674866682, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023552170791200187, + "loss": 0.02, "step": 165830 }, { - "epoch": 0.84, - "learning_rate": 0.0001744973790556528, - "loss": 0.0088, + "epoch": 0.43, + "learning_rate": 0.0002355178196956304, + "loss": 0.0151, "step": 165840 }, { - "epoch": 0.84, - "learning_rate": 0.00017448981136263878, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.00023551393147925893, + "loss": 0.0193, "step": 165850 }, { - "epoch": 0.84, - "learning_rate": 0.0001744822436696248, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023551004326288747, + "loss": 0.0189, "step": 165860 }, { - "epoch": 0.84, - "learning_rate": 0.00017447467597661077, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.000235506155046516, + "loss": 0.0204, "step": 165870 }, { - "epoch": 0.84, - "learning_rate": 0.00017446710828359675, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023550226683014455, + "loss": 0.0178, "step": 165880 }, { - "epoch": 0.84, - "learning_rate": 0.00017445954059058276, - "loss": 0.0148, + "epoch": 0.43, + "learning_rate": 0.00023549837861377307, + "loss": 0.0166, "step": 165890 }, { - "epoch": 0.84, - "learning_rate": 0.00017445197289756874, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.0002354944903974016, + "loss": 0.0166, "step": 165900 }, { - "epoch": 0.84, - "learning_rate": 0.00017444440520455472, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023549060218103018, + "loss": 0.0185, "step": 165910 }, { - "epoch": 0.84, - "learning_rate": 0.0001744368375115407, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.0002354867139646587, + "loss": 0.0174, "step": 165920 }, { - "epoch": 0.84, - "learning_rate": 0.0001744292698185267, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023548282574828723, + "loss": 0.0181, "step": 165930 }, { - "epoch": 0.84, - "learning_rate": 0.0001744217021255127, - "loss": 0.0098, + "epoch": 0.43, + "learning_rate": 0.00023547893753191575, + "loss": 0.0222, "step": 165940 }, { - "epoch": 0.84, - "learning_rate": 0.00017441413443249868, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023547504931554431, + "loss": 0.019, "step": 165950 }, { - "epoch": 0.84, - "learning_rate": 0.00017440656673948468, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.00023547116109917283, + "loss": 0.0192, "step": 165960 }, { - "epoch": 0.84, - "learning_rate": 0.00017439899904647067, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023546727288280137, + "loss": 0.02, "step": 165970 }, { - "epoch": 0.84, - "learning_rate": 0.00017439143135345665, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.00023546338466642989, + "loss": 0.0243, "step": 165980 }, { - "epoch": 0.84, - "learning_rate": 0.00017438386366044266, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023545949645005843, + "loss": 0.0174, "step": 165990 }, { - "epoch": 0.84, - "learning_rate": 0.00017437629596742864, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023545560823368697, + "loss": 0.0213, "step": 166000 }, { - "epoch": 0.84, - "eval_cer": 0.9144508479806542, - "eval_loss": 0.008648986928164959, - "eval_runtime": 116.5926, - "eval_samples_per_second": 17.154, - "eval_steps_per_second": 4.288, + "epoch": 0.43, + "eval_cer": 0.8817446754311932, + "eval_loss": 0.012856963090598583, + "eval_runtime": 107.8453, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, "step": 166000 }, { - "epoch": 0.84, - "learning_rate": 0.00017436872827441462, - "loss": 0.0157, + "epoch": 0.43, + "learning_rate": 0.0002354517200173155, + "loss": 0.0203, "step": 166010 }, { - "epoch": 0.84, - "learning_rate": 0.00017436116058140063, - "loss": 0.0134, + "epoch": 0.43, + "learning_rate": 0.00023544783180094403, + "loss": 0.0207, "step": 166020 }, { - "epoch": 0.84, - "learning_rate": 0.0001743535928883866, - "loss": 0.0149, + "epoch": 0.43, + "learning_rate": 0.00023544394358457257, + "loss": 0.0172, "step": 166030 }, { - "epoch": 0.84, - "learning_rate": 0.0001743460251953726, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.0002354400553682011, + "loss": 0.0168, "step": 166040 }, { - "epoch": 0.84, - "learning_rate": 0.0001743384575023586, - "loss": 0.0075, + "epoch": 0.43, + "learning_rate": 0.00023543616715182965, + "loss": 0.0186, "step": 166050 }, { - "epoch": 0.84, - "learning_rate": 0.00017433088980934458, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023543227893545816, + "loss": 0.0168, "step": 166060 }, { - "epoch": 0.84, - "learning_rate": 0.00017432332211633056, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.0002354283907190867, + "loss": 0.0195, "step": 166070 }, { - "epoch": 0.84, - "learning_rate": 0.00017431575442331654, - "loss": 0.0146, + "epoch": 0.43, + "learning_rate": 0.00023542450250271527, + "loss": 0.0168, "step": 166080 }, { - "epoch": 0.84, - "learning_rate": 0.00017430818673030255, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.0002354206142863438, + "loss": 0.0193, "step": 166090 }, { - "epoch": 0.84, - "learning_rate": 0.00017430061903728853, - "loss": 0.0151, + "epoch": 0.43, + "learning_rate": 0.0002354167260699723, + "loss": 0.0205, "step": 166100 }, { - "epoch": 0.84, - "learning_rate": 0.00017429305134427451, - "loss": 0.0094, + "epoch": 0.43, + "learning_rate": 0.00023541283785360085, + "loss": 0.0181, "step": 166110 }, { - "epoch": 0.84, - "learning_rate": 0.00017428548365126052, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023540894963722941, + "loss": 0.0176, "step": 166120 }, { - "epoch": 0.84, - "learning_rate": 0.0001742779159582465, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.00023540506142085793, + "loss": 0.0183, "step": 166130 }, { - "epoch": 0.84, - "learning_rate": 0.00017427034826523249, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.00023540117320448647, + "loss": 0.0207, "step": 166140 }, { - "epoch": 0.84, - "learning_rate": 0.0001742627805722185, - "loss": 0.0154, + "epoch": 0.43, + "learning_rate": 0.00023539728498811499, + "loss": 0.0202, "step": 166150 }, { - "epoch": 0.84, - "learning_rate": 0.00017425521287920448, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023539339677174355, + "loss": 0.0177, "step": 166160 }, { - "epoch": 0.84, - "learning_rate": 0.00017424764518619046, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023538950855537207, + "loss": 0.0202, "step": 166170 }, { - "epoch": 0.84, - "learning_rate": 0.00017424007749317647, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.0002353856203390006, + "loss": 0.0221, "step": 166180 }, { - "epoch": 0.84, - "learning_rate": 0.00017423250980016245, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023538173212262912, + "loss": 0.019, "step": 166190 }, { - "epoch": 0.84, - "learning_rate": 0.00017422494210714843, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002353778439062577, + "loss": 0.0145, "step": 166200 }, { - "epoch": 0.84, - "learning_rate": 0.00017421737441413444, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.0002353739556898862, + "loss": 0.0186, "step": 166210 }, { - "epoch": 0.84, - "learning_rate": 0.00017420980672112042, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023537006747351475, + "loss": 0.0208, "step": 166220 }, { - "epoch": 0.84, - "learning_rate": 0.0001742022390281064, - "loss": 0.0094, + "epoch": 0.43, + "learning_rate": 0.00023536617925714326, + "loss": 0.0167, "step": 166230 }, { - "epoch": 0.84, - "learning_rate": 0.00017419467133509238, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.0002353622910407718, + "loss": 0.0217, "step": 166240 }, { - "epoch": 0.84, - "learning_rate": 0.0001741871036420784, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023535840282440035, + "loss": 0.018, "step": 166250 }, { - "epoch": 0.84, - "learning_rate": 0.00017417953594906437, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.0002353545146080289, + "loss": 0.0183, "step": 166260 }, { - "epoch": 0.84, - "learning_rate": 0.00017417196825605035, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.0002353506263916574, + "loss": 0.021, "step": 166270 }, { - "epoch": 0.84, - "learning_rate": 0.00017416440056303636, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023534673817528595, + "loss": 0.021, "step": 166280 }, { - "epoch": 0.84, - "learning_rate": 0.00017415683287002234, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023534284995891451, + "loss": 0.0223, "step": 166290 }, { - "epoch": 0.84, - "learning_rate": 0.00017414926517700832, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023533896174254303, + "loss": 0.016, "step": 166300 }, { - "epoch": 0.84, - "learning_rate": 0.00017414169748399433, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023533507352617157, + "loss": 0.023, "step": 166310 }, { - "epoch": 0.84, - "learning_rate": 0.00017413412979098031, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023533118530980008, + "loss": 0.0202, "step": 166320 }, { - "epoch": 0.84, - "learning_rate": 0.0001741265620979663, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.00023532729709342865, + "loss": 0.0243, "step": 166330 }, { - "epoch": 0.84, - "learning_rate": 0.0001741189944049523, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023532340887705717, + "loss": 0.021, "step": 166340 }, { - "epoch": 0.84, - "learning_rate": 0.00017411142671193829, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.0002353195206606857, + "loss": 0.0187, "step": 166350 }, { - "epoch": 0.84, - "learning_rate": 0.00017410385901892427, - "loss": 0.0143, + "epoch": 0.43, + "learning_rate": 0.00023531563244431422, + "loss": 0.0183, "step": 166360 }, { - "epoch": 0.84, - "learning_rate": 0.00017409629132591028, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.0002353117442279428, + "loss": 0.0194, "step": 166370 }, { - "epoch": 0.84, - "learning_rate": 0.00017408872363289626, - "loss": 0.0116, + "epoch": 0.43, + "learning_rate": 0.0002353078560115713, + "loss": 0.0169, "step": 166380 }, { - "epoch": 0.84, - "learning_rate": 0.00017408115593988224, - "loss": 0.0101, + "epoch": 0.43, + "learning_rate": 0.00023530396779519985, + "loss": 0.0204, "step": 166390 }, { - "epoch": 0.84, - "learning_rate": 0.00017407358824686825, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023530007957882836, + "loss": 0.0155, "step": 166400 }, { - "epoch": 0.84, - "learning_rate": 0.00017406602055385423, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.00023529619136245693, + "loss": 0.0207, "step": 166410 }, { - "epoch": 0.84, - "learning_rate": 0.0001740584528608402, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023529230314608545, + "loss": 0.0175, "step": 166420 }, { - "epoch": 0.84, - "learning_rate": 0.0001740508851678262, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.000235288414929714, + "loss": 0.0144, "step": 166430 }, { - "epoch": 0.84, - "learning_rate": 0.0001740433174748122, - "loss": 0.0097, + "epoch": 0.43, + "learning_rate": 0.0002352845267133425, + "loss": 0.0174, "step": 166440 }, { - "epoch": 0.84, - "learning_rate": 0.00017403574978179818, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023528063849697107, + "loss": 0.0189, "step": 166450 }, { - "epoch": 0.84, - "learning_rate": 0.00017402818208878416, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.0002352767502805996, + "loss": 0.0158, "step": 166460 }, { - "epoch": 0.84, - "learning_rate": 0.00017402061439577017, - "loss": 0.0106, + "epoch": 0.43, + "learning_rate": 0.00023527286206422813, + "loss": 0.0222, "step": 166470 }, { - "epoch": 0.84, - "learning_rate": 0.00017401304670275615, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.00023526897384785667, + "loss": 0.0178, "step": 166480 }, { - "epoch": 0.84, - "learning_rate": 0.00017400547900974213, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023526508563148518, + "loss": 0.0158, "step": 166490 }, { - "epoch": 0.84, - "learning_rate": 0.00017399791131672814, - "loss": 0.0156, + "epoch": 0.43, + "learning_rate": 0.00023526119741511375, + "loss": 0.016, "step": 166500 }, { - "epoch": 0.84, - "learning_rate": 0.00017399034362371412, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023525730919874227, + "loss": 0.021, "step": 166510 }, { - "epoch": 0.84, - "learning_rate": 0.0001739827759307001, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.0002352534209823708, + "loss": 0.0175, "step": 166520 }, { - "epoch": 0.84, - "learning_rate": 0.00017397520823768611, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023524953276599932, + "loss": 0.0175, "step": 166530 }, { - "epoch": 0.84, - "learning_rate": 0.00017396764054467207, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.0002352456445496279, + "loss": 0.0188, "step": 166540 }, { - "epoch": 0.84, - "learning_rate": 0.00017396007285165805, - "loss": 0.0133, + "epoch": 0.43, + "learning_rate": 0.0002352417563332564, + "loss": 0.0161, "step": 166550 }, { - "epoch": 0.84, - "learning_rate": 0.00017395250515864403, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023523786811688495, + "loss": 0.0197, "step": 166560 }, { - "epoch": 0.84, - "learning_rate": 0.00017394493746563004, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023523397990051346, + "loss": 0.0221, "step": 166570 }, { - "epoch": 0.84, - "learning_rate": 0.00017393736977261602, - "loss": 0.0163, + "epoch": 0.43, + "learning_rate": 0.00023523009168414203, + "loss": 0.0185, "step": 166580 }, { - "epoch": 0.84, - "learning_rate": 0.000173929802079602, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023522620346777055, + "loss": 0.0177, "step": 166590 }, { - "epoch": 0.84, - "learning_rate": 0.000173922234386588, - "loss": 0.0157, + "epoch": 0.43, + "learning_rate": 0.0002352223152513991, + "loss": 0.0145, "step": 166600 }, { - "epoch": 0.84, - "learning_rate": 0.000173914666693574, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.0002352184270350276, + "loss": 0.0219, "step": 166610 }, { - "epoch": 0.84, - "learning_rate": 0.00017390709900055997, - "loss": 0.016, + "epoch": 0.43, + "learning_rate": 0.00023521453881865617, + "loss": 0.0244, "step": 166620 }, { - "epoch": 0.84, - "learning_rate": 0.00017389953130754596, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002352106506022847, + "loss": 0.0174, "step": 166630 }, { - "epoch": 0.84, - "learning_rate": 0.00017389196361453196, - "loss": 0.0125, + "epoch": 0.43, + "learning_rate": 0.00023520676238591323, + "loss": 0.0184, "step": 166640 }, { - "epoch": 0.84, - "learning_rate": 0.00017388439592151795, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023520287416954174, + "loss": 0.019, "step": 166650 }, { - "epoch": 0.84, - "learning_rate": 0.00017387682822850393, - "loss": 0.0106, + "epoch": 0.43, + "learning_rate": 0.0002351989859531703, + "loss": 0.0248, "step": 166660 }, { - "epoch": 0.84, - "learning_rate": 0.00017386926053548994, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023519509773679885, + "loss": 0.0202, "step": 166670 }, { - "epoch": 0.84, - "learning_rate": 0.00017386169284247592, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023519120952042737, + "loss": 0.0193, "step": 166680 }, { - "epoch": 0.84, - "learning_rate": 0.0001738541251494619, - "loss": 0.0081, + "epoch": 0.43, + "learning_rate": 0.0002351873213040559, + "loss": 0.0175, "step": 166690 }, { - "epoch": 0.84, - "learning_rate": 0.0001738465574564479, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023518343308768445, + "loss": 0.0185, "step": 166700 }, { - "epoch": 0.84, - "learning_rate": 0.0001738389897634339, - "loss": 0.0149, + "epoch": 0.43, + "learning_rate": 0.000235179544871313, + "loss": 0.0206, "step": 166710 }, { - "epoch": 0.84, - "learning_rate": 0.00017383142207041987, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002351756566549415, + "loss": 0.0219, "step": 166720 }, { - "epoch": 0.84, - "learning_rate": 0.00017382385437740588, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.00023517176843857005, + "loss": 0.0228, "step": 166730 }, { - "epoch": 0.84, - "learning_rate": 0.00017381628668439186, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.00023516788022219856, + "loss": 0.0198, "step": 166740 }, { - "epoch": 0.84, - "learning_rate": 0.00017380871899137784, - "loss": 0.0131, + "epoch": 0.43, + "learning_rate": 0.00023516399200582713, + "loss": 0.0181, "step": 166750 }, { - "epoch": 0.84, - "learning_rate": 0.00017380115129836385, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023516010378945565, + "loss": 0.0204, "step": 166760 }, { - "epoch": 0.84, - "learning_rate": 0.00017379358360534983, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.0002351562155730842, + "loss": 0.0183, "step": 166770 }, { - "epoch": 0.84, - "learning_rate": 0.0001737860159123358, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.0002351523273567127, + "loss": 0.0188, "step": 166780 }, { - "epoch": 0.84, - "learning_rate": 0.00017377844821932182, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023514843914034127, + "loss": 0.0202, "step": 166790 }, { - "epoch": 0.84, - "learning_rate": 0.0001737708805263078, - "loss": 0.0098, + "epoch": 0.43, + "learning_rate": 0.0002351445509239698, + "loss": 0.0162, "step": 166800 }, { - "epoch": 0.84, - "learning_rate": 0.00017376331283329378, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.00023514066270759833, + "loss": 0.0157, "step": 166810 }, { - "epoch": 0.84, - "learning_rate": 0.00017375574514027977, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023513677449122684, + "loss": 0.0139, "step": 166820 }, { - "epoch": 0.84, - "learning_rate": 0.00017374817744726577, - "loss": 0.0106, + "epoch": 0.43, + "learning_rate": 0.0002351328862748554, + "loss": 0.0174, "step": 166830 }, { - "epoch": 0.84, - "learning_rate": 0.00017374060975425176, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023512899805848395, + "loss": 0.0224, "step": 166840 }, { - "epoch": 0.84, - "learning_rate": 0.00017373304206123774, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.00023512510984211247, + "loss": 0.0176, "step": 166850 }, { - "epoch": 0.84, - "learning_rate": 0.00017372547436822375, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.000235121221625741, + "loss": 0.0199, "step": 166860 }, { - "epoch": 0.84, - "learning_rate": 0.00017371790667520973, - "loss": 0.0139, + "epoch": 0.43, + "learning_rate": 0.00023511733340936955, + "loss": 0.0158, "step": 166870 }, { - "epoch": 0.84, - "learning_rate": 0.0001737103389821957, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002351134451929981, + "loss": 0.0181, "step": 166880 }, { - "epoch": 0.84, - "learning_rate": 0.00017370277128918172, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.0002351095569766266, + "loss": 0.0226, "step": 166890 }, { - "epoch": 0.84, - "learning_rate": 0.0001736952035961677, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023510566876025515, + "loss": 0.0175, "step": 166900 }, { - "epoch": 0.84, - "learning_rate": 0.00017368763590315368, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.0002351017805438837, + "loss": 0.021, "step": 166910 }, { - "epoch": 0.84, - "learning_rate": 0.0001736800682101397, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023509789232751223, + "loss": 0.0185, "step": 166920 }, { - "epoch": 0.84, - "learning_rate": 0.00017367250051712567, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023509400411114074, + "loss": 0.0173, "step": 166930 }, { - "epoch": 0.84, - "learning_rate": 0.00017366493282411165, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.0002350901158947693, + "loss": 0.0199, "step": 166940 }, { - "epoch": 0.84, - "learning_rate": 0.00017365736513109766, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023508622767839786, + "loss": 0.0185, "step": 166950 }, { - "epoch": 0.84, - "learning_rate": 0.00017364979743808364, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.00023508233946202637, + "loss": 0.0168, "step": 166960 }, { - "epoch": 0.84, - "learning_rate": 0.00017364222974506962, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.00023507845124565488, + "loss": 0.0202, "step": 166970 }, { - "epoch": 0.84, - "learning_rate": 0.0001736346620520556, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023507456302928343, + "loss": 0.0175, "step": 166980 }, { - "epoch": 0.84, - "learning_rate": 0.0001736270943590416, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023507067481291194, + "loss": 0.0194, "step": 166990 }, { - "epoch": 0.84, - "learning_rate": 0.0001736195266660276, - "loss": 0.0144, + "epoch": 0.43, + "learning_rate": 0.0002350667865965405, + "loss": 0.018, "step": 167000 }, { - "epoch": 0.84, - "eval_cer": 0.9144906342217957, - "eval_loss": 0.008696102537214756, - "eval_runtime": 116.717, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.43, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.012466521002352238, + "eval_runtime": 107.3379, + "eval_samples_per_second": 18.633, + "eval_steps_per_second": 4.658, "step": 167000 }, { - "epoch": 0.84, - "learning_rate": 0.00017361195897301358, - "loss": 0.0094, + "epoch": 0.43, + "learning_rate": 0.00023506289838016905, + "loss": 0.0156, "step": 167010 }, { - "epoch": 0.84, - "learning_rate": 0.00017360439127999958, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023505901016379757, + "loss": 0.0195, "step": 167020 }, { - "epoch": 0.84, - "learning_rate": 0.00017359682358698557, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.0002350551219474261, + "loss": 0.0149, "step": 167030 }, { - "epoch": 0.84, - "learning_rate": 0.00017358925589397155, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023505123373105465, + "loss": 0.0177, "step": 167040 }, { - "epoch": 0.84, - "learning_rate": 0.00017358168820095756, - "loss": 0.0132, + "epoch": 0.43, + "learning_rate": 0.0002350473455146832, + "loss": 0.0217, "step": 167050 }, { - "epoch": 0.84, - "learning_rate": 0.00017357412050794354, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.0002350434572983117, + "loss": 0.0217, "step": 167060 }, { - "epoch": 0.84, - "learning_rate": 0.00017356655281492952, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023503956908194025, + "loss": 0.0146, "step": 167070 }, { - "epoch": 0.84, - "learning_rate": 0.00017355898512191553, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.0002350356808655688, + "loss": 0.0151, "step": 167080 }, { - "epoch": 0.84, - "learning_rate": 0.0001735514174289015, - "loss": 0.01, + "epoch": 0.43, + "learning_rate": 0.00023503179264919733, + "loss": 0.0157, "step": 167090 }, { - "epoch": 0.84, - "learning_rate": 0.0001735438497358875, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023502790443282584, + "loss": 0.0196, "step": 167100 }, { - "epoch": 0.84, - "learning_rate": 0.0001735362820428735, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.00023502401621645439, + "loss": 0.0191, "step": 167110 }, { - "epoch": 0.84, - "learning_rate": 0.00017352871434985948, - "loss": 0.0097, + "epoch": 0.43, + "learning_rate": 0.00023502012800008295, + "loss": 0.0181, "step": 167120 }, { - "epoch": 0.84, - "learning_rate": 0.00017352114665684546, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023501623978371147, + "loss": 0.018, "step": 167130 }, { - "epoch": 0.84, - "learning_rate": 0.00017351357896383144, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023501235156733998, + "loss": 0.0175, "step": 167140 }, { - "epoch": 0.84, - "learning_rate": 0.00017350601127081745, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023500846335096853, + "loss": 0.0197, "step": 167150 }, { - "epoch": 0.84, - "learning_rate": 0.00017349844357780343, - "loss": 0.0128, + "epoch": 0.43, + "learning_rate": 0.0002350045751345971, + "loss": 0.0229, "step": 167160 }, { - "epoch": 0.84, - "learning_rate": 0.00017349087588478941, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002350006869182256, + "loss": 0.0199, "step": 167170 }, { - "epoch": 0.84, - "learning_rate": 0.00017348330819177542, - "loss": 0.0113, + "epoch": 0.43, + "learning_rate": 0.00023499679870185415, + "loss": 0.016, "step": 167180 }, { - "epoch": 0.84, - "learning_rate": 0.0001734757404987614, - "loss": 0.0109, + "epoch": 0.43, + "learning_rate": 0.00023499291048548266, + "loss": 0.0165, "step": 167190 }, { - "epoch": 0.84, - "learning_rate": 0.00017346817280574739, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023498902226911123, + "loss": 0.0178, "step": 167200 }, { - "epoch": 0.84, - "learning_rate": 0.0001734606051127334, - "loss": 0.0099, + "epoch": 0.43, + "learning_rate": 0.00023498513405273975, + "loss": 0.0208, "step": 167210 }, { - "epoch": 0.84, - "learning_rate": 0.00017345303741971938, - "loss": 0.0107, + "epoch": 0.43, + "learning_rate": 0.0002349812458363683, + "loss": 0.0187, "step": 167220 }, { - "epoch": 0.84, - "learning_rate": 0.00017344546972670536, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002349773576199968, + "loss": 0.0175, "step": 167230 }, { - "epoch": 0.84, - "learning_rate": 0.00017343790203369137, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023497346940362535, + "loss": 0.0169, "step": 167240 }, { - "epoch": 0.84, - "learning_rate": 0.00017343033434067735, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002349695811872539, + "loss": 0.0151, "step": 167250 }, { - "epoch": 0.84, - "learning_rate": 0.00017342276664766333, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.00023496569297088243, + "loss": 0.0179, "step": 167260 }, { - "epoch": 0.84, - "learning_rate": 0.00017341519895464934, - "loss": 0.0112, + "epoch": 0.43, + "learning_rate": 0.00023496180475451094, + "loss": 0.0202, "step": 167270 }, { - "epoch": 0.84, - "learning_rate": 0.00017340763126163532, - "loss": 0.0117, + "epoch": 0.43, + "learning_rate": 0.00023495791653813949, + "loss": 0.0199, "step": 167280 }, { - "epoch": 0.84, - "learning_rate": 0.0001734000635686213, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023495402832176803, + "loss": 0.0146, "step": 167290 }, { - "epoch": 0.84, - "learning_rate": 0.0001733924958756073, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023495014010539657, + "loss": 0.0184, "step": 167300 }, { - "epoch": 0.84, - "learning_rate": 0.0001733849281825933, - "loss": 0.0111, + "epoch": 0.43, + "learning_rate": 0.00023494625188902508, + "loss": 0.0203, "step": 167310 }, { - "epoch": 0.84, - "learning_rate": 0.00017337736048957927, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023494236367265362, + "loss": 0.0162, "step": 167320 }, { - "epoch": 0.84, - "learning_rate": 0.00017336979279656525, - "loss": 0.0086, + "epoch": 0.43, + "learning_rate": 0.0002349384754562822, + "loss": 0.0152, "step": 167330 }, { - "epoch": 0.84, - "learning_rate": 0.00017336222510355126, - "loss": 0.0151, + "epoch": 0.43, + "learning_rate": 0.0002349345872399107, + "loss": 0.0218, "step": 167340 }, { - "epoch": 0.84, - "learning_rate": 0.00017335465741053724, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.00023493069902353925, + "loss": 0.0172, "step": 167350 }, { - "epoch": 0.84, - "learning_rate": 0.00017334708971752322, - "loss": 0.0109, + "epoch": 0.43, + "learning_rate": 0.00023492681080716776, + "loss": 0.0216, "step": 167360 }, { - "epoch": 0.84, - "learning_rate": 0.00017333952202450923, - "loss": 0.0148, + "epoch": 0.43, + "learning_rate": 0.00023492292259079633, + "loss": 0.0203, "step": 167370 }, { - "epoch": 0.84, - "learning_rate": 0.00017333195433149521, - "loss": 0.013, + "epoch": 0.43, + "learning_rate": 0.00023491903437442485, + "loss": 0.0159, "step": 167380 }, { - "epoch": 0.84, - "learning_rate": 0.0001733243866384812, - "loss": 0.0121, + "epoch": 0.43, + "learning_rate": 0.0002349151461580534, + "loss": 0.0406, "step": 167390 }, { - "epoch": 0.84, - "learning_rate": 0.0001733168189454672, - "loss": 0.0105, + "epoch": 0.43, + "learning_rate": 0.0002349112579416819, + "loss": 0.0167, "step": 167400 }, { - "epoch": 0.84, - "learning_rate": 0.00017330925125245319, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.00023490736972531047, + "loss": 0.0235, "step": 167410 }, { - "epoch": 0.84, - "learning_rate": 0.00017330168355943917, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.000234903481508939, + "loss": 0.0204, "step": 167420 }, { - "epoch": 0.84, - "learning_rate": 0.00017329411586642518, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023489959329256753, + "loss": 0.0216, "step": 167430 }, { - "epoch": 0.84, - "learning_rate": 0.00017328654817341116, - "loss": 0.0103, + "epoch": 0.43, + "learning_rate": 0.00023489570507619604, + "loss": 0.0165, "step": 167440 }, { - "epoch": 0.84, - "learning_rate": 0.00017327898048039714, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.0002348918168598246, + "loss": 0.02, "step": 167450 }, { - "epoch": 0.84, - "learning_rate": 0.00017327141278738315, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023488792864345313, + "loss": 0.0201, "step": 167460 }, { - "epoch": 0.84, - "learning_rate": 0.00017326384509436913, - "loss": 0.0096, + "epoch": 0.43, + "learning_rate": 0.00023488404042708167, + "loss": 0.0163, "step": 167470 }, { - "epoch": 0.84, - "learning_rate": 0.0001732562774013551, - "loss": 0.0141, + "epoch": 0.43, + "learning_rate": 0.00023488015221071018, + "loss": 0.0182, "step": 167480 }, { - "epoch": 0.85, - "learning_rate": 0.0001732487097083411, - "loss": 0.0153, + "epoch": 0.43, + "learning_rate": 0.00023487626399433872, + "loss": 0.0203, "step": 167490 }, { - "epoch": 0.85, - "learning_rate": 0.0001732411420153271, - "loss": 0.0126, + "epoch": 0.43, + "learning_rate": 0.0002348723757779673, + "loss": 0.0232, "step": 167500 }, { - "epoch": 0.85, - "learning_rate": 0.00017323357432231308, - "loss": 0.0137, + "epoch": 0.43, + "learning_rate": 0.0002348684875615958, + "loss": 0.0168, "step": 167510 }, { - "epoch": 0.85, - "learning_rate": 0.00017322600662929906, - "loss": 0.015, + "epoch": 0.43, + "learning_rate": 0.00023486459934522435, + "loss": 0.0191, "step": 167520 }, { - "epoch": 0.85, - "learning_rate": 0.00017321843893628507, - "loss": 0.0118, + "epoch": 0.43, + "learning_rate": 0.00023486071112885286, + "loss": 0.0204, "step": 167530 }, { - "epoch": 0.85, - "learning_rate": 0.00017321087124327105, - "loss": 0.0108, + "epoch": 0.43, + "learning_rate": 0.00023485682291248143, + "loss": 0.0194, "step": 167540 }, { - "epoch": 0.85, - "learning_rate": 0.00017320330355025703, - "loss": 0.0101, + "epoch": 0.43, + "learning_rate": 0.00023485293469610995, + "loss": 0.0185, "step": 167550 }, { - "epoch": 0.85, - "learning_rate": 0.00017319573585724304, - "loss": 0.0102, + "epoch": 0.43, + "learning_rate": 0.0002348490464797385, + "loss": 0.0213, "step": 167560 }, { - "epoch": 0.85, - "learning_rate": 0.00017318816816422902, - "loss": 0.0129, + "epoch": 0.43, + "learning_rate": 0.000234845158263367, + "loss": 0.0211, "step": 167570 }, { - "epoch": 0.85, - "learning_rate": 0.000173180600471215, - "loss": 0.0145, + "epoch": 0.43, + "learning_rate": 0.00023484127004699557, + "loss": 0.0163, "step": 167580 }, { - "epoch": 0.85, - "learning_rate": 0.00017317303277820101, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023483738183062409, + "loss": 0.019, "step": 167590 }, { - "epoch": 0.85, - "learning_rate": 0.000173165465085187, - "loss": 0.0163, + "epoch": 0.43, + "learning_rate": 0.00023483349361425263, + "loss": 0.0172, "step": 167600 }, { - "epoch": 0.85, - "learning_rate": 0.00017315789739217298, - "loss": 0.0091, + "epoch": 0.43, + "learning_rate": 0.00023482960539788114, + "loss": 0.0181, "step": 167610 }, { - "epoch": 0.85, - "learning_rate": 0.00017315032969915899, - "loss": 0.0127, + "epoch": 0.43, + "learning_rate": 0.0002348257171815097, + "loss": 0.0198, "step": 167620 }, { - "epoch": 0.85, - "learning_rate": 0.00017314276200614497, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.00023482182896513823, + "loss": 0.0219, "step": 167630 }, { - "epoch": 0.85, - "learning_rate": 0.00017313519431313095, - "loss": 0.0142, + "epoch": 0.43, + "learning_rate": 0.00023481794074876677, + "loss": 0.0195, "step": 167640 }, { - "epoch": 0.85, - "learning_rate": 0.00017312762662011693, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023481405253239528, + "loss": 0.0179, "step": 167650 }, { - "epoch": 0.85, - "learning_rate": 0.00017312005892710294, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.00023481016431602385, + "loss": 0.0186, "step": 167660 }, { - "epoch": 0.85, - "learning_rate": 0.00017311249123408892, - "loss": 0.0138, + "epoch": 0.43, + "learning_rate": 0.0002348062760996524, + "loss": 0.0187, "step": 167670 }, { - "epoch": 0.85, - "learning_rate": 0.0001731049235410749, - "loss": 0.014, + "epoch": 0.43, + "learning_rate": 0.0002348023878832809, + "loss": 0.0152, "step": 167680 }, { - "epoch": 0.85, - "learning_rate": 0.0001730973558480609, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023479849966690942, + "loss": 0.0175, "step": 167690 }, { - "epoch": 0.85, - "learning_rate": 0.0001730897881550469, - "loss": 0.0123, + "epoch": 0.43, + "learning_rate": 0.000234794611450538, + "loss": 0.0208, "step": 167700 }, { - "epoch": 0.85, - "learning_rate": 0.00017308222046203287, - "loss": 0.0152, + "epoch": 0.43, + "learning_rate": 0.00023479072323416653, + "loss": 0.0173, "step": 167710 }, { - "epoch": 0.85, - "learning_rate": 0.00017307465276901888, - "loss": 0.0124, + "epoch": 0.43, + "learning_rate": 0.00023478683501779505, + "loss": 0.0174, "step": 167720 }, { - "epoch": 0.85, - "learning_rate": 0.00017306708507600486, - "loss": 0.0114, + "epoch": 0.43, + "learning_rate": 0.0002347829468014236, + "loss": 0.0188, "step": 167730 }, { - "epoch": 0.85, - "learning_rate": 0.00017305951738299084, - "loss": 0.0119, + "epoch": 0.43, + "learning_rate": 0.0002347790585850521, + "loss": 0.0153, "step": 167740 }, { - "epoch": 0.85, - "learning_rate": 0.00017305194968997685, - "loss": 0.0122, + "epoch": 0.43, + "learning_rate": 0.00023477517036868067, + "loss": 0.0168, "step": 167750 }, { - "epoch": 0.85, - "learning_rate": 0.00017304438199696283, - "loss": 0.0202, + "epoch": 0.43, + "learning_rate": 0.00023477128215230919, + "loss": 0.0162, "step": 167760 }, { - "epoch": 0.85, - "learning_rate": 0.00017303681430394882, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023476739393593773, + "loss": 0.0169, "step": 167770 }, { - "epoch": 0.85, - "learning_rate": 0.00017302924661093482, - "loss": 0.0115, + "epoch": 0.43, + "learning_rate": 0.00023476350571956624, + "loss": 0.0188, "step": 167780 }, { - "epoch": 0.85, - "learning_rate": 0.0001730216789179208, - "loss": 0.011, + "epoch": 0.43, + "learning_rate": 0.0002347596175031948, + "loss": 0.0285, "step": 167790 }, { - "epoch": 0.85, - "learning_rate": 0.00017301411122490676, - "loss": 0.0136, + "epoch": 0.43, + "learning_rate": 0.00023475572928682333, + "loss": 0.0203, "step": 167800 }, { - "epoch": 0.85, - "learning_rate": 0.00017300654353189274, - "loss": 0.012, + "epoch": 0.43, + "learning_rate": 0.00023475184107045187, + "loss": 0.0143, "step": 167810 }, { - "epoch": 0.85, - "learning_rate": 0.00017299897583887875, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023474795285408038, + "loss": 0.0195, "step": 167820 }, { - "epoch": 0.85, - "learning_rate": 0.00017299140814586473, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023474406463770895, + "loss": 0.0175, "step": 167830 }, { - "epoch": 0.85, - "learning_rate": 0.00017298384045285071, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023474017642133746, + "loss": 0.0228, "step": 167840 }, { - "epoch": 0.85, - "learning_rate": 0.00017297627275983672, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.000234736288204966, + "loss": 0.0219, "step": 167850 }, { - "epoch": 0.85, - "learning_rate": 0.0001729687050668227, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023473239998859452, + "loss": 0.0163, "step": 167860 }, { - "epoch": 0.85, - "learning_rate": 0.00017296113737380869, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.0002347285117722231, + "loss": 0.0189, "step": 167870 }, { - "epoch": 0.85, - "learning_rate": 0.00017295356968079467, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023472462355585163, + "loss": 0.0163, "step": 167880 }, { - "epoch": 0.85, - "learning_rate": 0.00017294600198778067, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023472073533948015, + "loss": 0.0164, "step": 167890 }, { - "epoch": 0.85, - "learning_rate": 0.00017293843429476666, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.0002347168471231087, + "loss": 0.0205, "step": 167900 }, { - "epoch": 0.85, - "learning_rate": 0.00017293086660175264, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023471295890673723, + "loss": 0.0203, "step": 167910 }, { - "epoch": 0.85, - "learning_rate": 0.00017292329890873865, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023470907069036577, + "loss": 0.02, "step": 167920 }, { - "epoch": 0.85, - "learning_rate": 0.00017291573121572463, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023470518247399429, + "loss": 0.0196, "step": 167930 }, { - "epoch": 0.85, - "learning_rate": 0.0001729081635227106, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023470129425762283, + "loss": 0.0192, "step": 167940 }, { - "epoch": 0.85, - "learning_rate": 0.00017290059582969662, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023469740604125137, + "loss": 0.0167, "step": 167950 }, { - "epoch": 0.85, - "learning_rate": 0.0001728930281366826, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.0002346935178248799, + "loss": 0.0205, "step": 167960 }, { - "epoch": 0.85, - "learning_rate": 0.00017288546044366858, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023468962960850842, + "loss": 0.0177, "step": 167970 }, { - "epoch": 0.85, - "learning_rate": 0.0001728778927506546, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023468574139213697, + "loss": 0.0223, "step": 167980 }, { - "epoch": 0.85, - "learning_rate": 0.00017287032505764057, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023468185317576548, + "loss": 0.0186, "step": 167990 }, { - "epoch": 0.85, - "learning_rate": 0.00017286275736462655, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023467796495939405, + "loss": 0.0226, "step": 168000 }, { - "epoch": 0.85, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.008770990185439587, - "eval_runtime": 116.7217, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.44, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.012735070660710335, + "eval_runtime": 108.0118, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 168000 }, { - "epoch": 0.85, - "learning_rate": 0.00017285518967161256, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023467407674302256, + "loss": 0.0206, "step": 168010 }, { - "epoch": 0.85, - "learning_rate": 0.00017284762197859854, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.0002346701885266511, + "loss": 0.0255, "step": 168020 }, { - "epoch": 0.85, - "learning_rate": 0.00017284005428558452, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023466630031027962, + "loss": 0.0213, "step": 168030 }, { - "epoch": 0.85, - "learning_rate": 0.0001728324865925705, - "loss": 0.0086, + "epoch": 0.44, + "learning_rate": 0.0002346624120939082, + "loss": 0.021, "step": 168040 }, { - "epoch": 0.85, - "learning_rate": 0.00017282491889955651, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023465852387753673, + "loss": 0.0168, "step": 168050 }, { - "epoch": 0.85, - "learning_rate": 0.0001728173512065425, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023465463566116525, + "loss": 0.0206, "step": 168060 }, { - "epoch": 0.85, - "learning_rate": 0.00017280978351352848, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.0002346507474447938, + "loss": 0.0258, "step": 168070 }, { - "epoch": 0.85, - "learning_rate": 0.00017280221582051449, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023464685922842233, + "loss": 0.0183, "step": 168080 }, { - "epoch": 0.85, - "learning_rate": 0.00017279464812750047, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023464297101205087, + "loss": 0.0211, "step": 168090 }, { - "epoch": 0.85, - "learning_rate": 0.00017278708043448645, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023463908279567938, + "loss": 0.0181, "step": 168100 }, { - "epoch": 0.85, - "learning_rate": 0.00017277951274147246, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023463519457930793, + "loss": 0.0167, "step": 168110 }, { - "epoch": 0.85, - "learning_rate": 0.00017277194504845844, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023463130636293647, + "loss": 0.0176, "step": 168120 }, { - "epoch": 0.85, - "learning_rate": 0.00017276437735544442, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.000234627418146565, + "loss": 0.0184, "step": 168130 }, { - "epoch": 0.85, - "learning_rate": 0.00017275680966243043, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023462352993019352, + "loss": 0.0184, "step": 168140 }, { - "epoch": 0.85, - "learning_rate": 0.0001727492419694164, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023461964171382207, + "loss": 0.0173, "step": 168150 }, { - "epoch": 0.85, - "learning_rate": 0.0001727416742764024, - "loss": 0.0154, + "epoch": 0.44, + "learning_rate": 0.0002346157534974506, + "loss": 0.0201, "step": 168160 }, { - "epoch": 0.85, - "learning_rate": 0.0001727341065833884, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023461186528107915, + "loss": 0.0165, "step": 168170 }, { - "epoch": 0.85, - "learning_rate": 0.00017272653889037438, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023460797706470766, + "loss": 0.0196, "step": 168180 }, { - "epoch": 0.85, - "learning_rate": 0.00017271897119736036, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.0002346040888483362, + "loss": 0.0156, "step": 168190 }, { - "epoch": 0.85, - "learning_rate": 0.00017271140350434637, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023460020063196477, + "loss": 0.0314, "step": 168200 }, { - "epoch": 0.85, - "learning_rate": 0.00017270383581133235, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.0002345963124155933, + "loss": 0.0201, "step": 168210 }, { - "epoch": 0.85, - "learning_rate": 0.00017269626811831833, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023459242419922183, + "loss": 0.0186, "step": 168220 }, { - "epoch": 0.85, - "learning_rate": 0.00017268870042530432, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023458853598285034, + "loss": 0.0179, "step": 168230 }, { - "epoch": 0.85, - "learning_rate": 0.00017268113273229032, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023458464776647886, + "loss": 0.0204, "step": 168240 }, { - "epoch": 0.85, - "learning_rate": 0.0001726735650392763, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.00023458075955010743, + "loss": 0.0164, "step": 168250 }, { - "epoch": 0.85, - "learning_rate": 0.0001726659973462623, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.00023457687133373597, + "loss": 0.0212, "step": 168260 }, { - "epoch": 0.85, - "learning_rate": 0.0001726584296532483, - "loss": 0.0155, + "epoch": 0.44, + "learning_rate": 0.00023457298311736448, + "loss": 0.0148, "step": 168270 }, { - "epoch": 0.85, - "learning_rate": 0.00017265086196023428, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023456909490099303, + "loss": 0.0153, "step": 168280 }, { - "epoch": 0.85, - "learning_rate": 0.00017264329426722026, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023456520668462157, + "loss": 0.0176, "step": 168290 }, { - "epoch": 0.85, - "learning_rate": 0.00017263572657420627, - "loss": 0.0151, + "epoch": 0.44, + "learning_rate": 0.0002345613184682501, + "loss": 0.0172, "step": 168300 }, { - "epoch": 0.85, - "learning_rate": 0.00017262815888119225, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023455743025187862, + "loss": 0.0193, "step": 168310 }, { - "epoch": 0.85, - "learning_rate": 0.00017262059118817823, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023455354203550717, + "loss": 0.0137, "step": 168320 }, { - "epoch": 0.85, - "learning_rate": 0.00017261302349516424, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.0002345496538191357, + "loss": 0.0208, "step": 168330 }, { - "epoch": 0.85, - "learning_rate": 0.00017260545580215022, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023454576560276425, + "loss": 0.0176, "step": 168340 }, { - "epoch": 0.85, - "learning_rate": 0.0001725978881091362, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023454187738639276, + "loss": 0.0226, "step": 168350 }, { - "epoch": 0.85, - "learning_rate": 0.0001725903204161222, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.0002345379891700213, + "loss": 0.0159, "step": 168360 }, { - "epoch": 0.85, - "learning_rate": 0.0001725827527231082, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023453410095364987, + "loss": 0.0186, "step": 168370 }, { - "epoch": 0.85, - "learning_rate": 0.00017257518503009417, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.0002345302127372784, + "loss": 0.0267, "step": 168380 }, { - "epoch": 0.85, - "learning_rate": 0.00017256761733708015, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023452632452090693, + "loss": 0.0174, "step": 168390 }, { - "epoch": 0.85, - "learning_rate": 0.00017256004964406616, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023452243630453544, + "loss": 0.0216, "step": 168400 }, { - "epoch": 0.85, - "learning_rate": 0.00017255248195105214, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.000234518548088164, + "loss": 0.0219, "step": 168410 }, { - "epoch": 0.85, - "learning_rate": 0.00017254491425803813, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023451465987179253, + "loss": 0.0184, "step": 168420 }, { - "epoch": 0.85, - "learning_rate": 0.00017253734656502413, - "loss": 0.0099, + "epoch": 0.44, + "learning_rate": 0.00023451077165542107, + "loss": 0.0245, "step": 168430 }, { - "epoch": 0.85, - "learning_rate": 0.00017252977887201012, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023450688343904958, + "loss": 0.0203, "step": 168440 }, { - "epoch": 0.85, - "learning_rate": 0.0001725222111789961, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023450299522267815, + "loss": 0.0194, "step": 168450 }, { - "epoch": 0.85, - "learning_rate": 0.0001725146434859821, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023449910700630667, + "loss": 0.0187, "step": 168460 }, { - "epoch": 0.85, - "learning_rate": 0.0001725070757929681, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.0002344952187899352, + "loss": 0.0209, "step": 168470 }, { - "epoch": 0.85, - "learning_rate": 0.00017249950809995407, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023449133057356372, + "loss": 0.0175, "step": 168480 }, { - "epoch": 0.85, - "learning_rate": 0.00017249194040694008, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023448744235719226, + "loss": 0.0179, "step": 168490 }, { - "epoch": 0.85, - "learning_rate": 0.00017248437271392606, - "loss": 0.0097, + "epoch": 0.44, + "learning_rate": 0.0002344835541408208, + "loss": 0.0212, "step": 168500 }, { - "epoch": 0.85, - "learning_rate": 0.00017247680502091204, - "loss": 0.0095, + "epoch": 0.44, + "learning_rate": 0.00023447966592444935, + "loss": 0.018, "step": 168510 }, { - "epoch": 0.85, - "learning_rate": 0.00017246923732789805, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.00023447577770807786, + "loss": 0.0165, "step": 168520 }, { - "epoch": 0.85, - "learning_rate": 0.00017246166963488403, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.0002344718894917064, + "loss": 0.019, "step": 168530 }, { - "epoch": 0.85, - "learning_rate": 0.00017245410194187, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.00023446800127533497, + "loss": 0.0205, "step": 168540 }, { - "epoch": 0.85, - "learning_rate": 0.000172446534248856, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.0002344641130589635, + "loss": 0.0181, "step": 168550 }, { - "epoch": 0.85, - "learning_rate": 0.000172438966555842, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.000234460224842592, + "loss": 0.019, "step": 168560 }, { - "epoch": 0.85, - "learning_rate": 0.00017243139886282798, - "loss": 0.0102, + "epoch": 0.44, + "learning_rate": 0.00023445633662622054, + "loss": 0.0241, "step": 168570 }, { - "epoch": 0.85, - "learning_rate": 0.00017242383116981396, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.0002344524484098491, + "loss": 0.0182, "step": 168580 }, { - "epoch": 0.85, - "learning_rate": 0.00017241626347679997, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023444856019347763, + "loss": 0.0198, "step": 168590 }, { - "epoch": 0.85, - "learning_rate": 0.00017240869578378595, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023444467197710617, + "loss": 0.0218, "step": 168600 }, { - "epoch": 0.85, - "learning_rate": 0.00017240112809077194, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023444078376073468, + "loss": 0.0165, "step": 168610 }, { - "epoch": 0.85, - "learning_rate": 0.00017239356039775794, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023443689554436325, + "loss": 0.0184, "step": 168620 }, { - "epoch": 0.85, - "learning_rate": 0.00017238599270474393, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023443300732799177, + "loss": 0.0172, "step": 168630 }, { - "epoch": 0.85, - "learning_rate": 0.0001723784250117299, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.0002344291191116203, + "loss": 0.0146, "step": 168640 }, { - "epoch": 0.85, - "learning_rate": 0.00017237085731871592, - "loss": 0.0151, + "epoch": 0.44, + "learning_rate": 0.00023442523089524882, + "loss": 0.0166, "step": 168650 }, { - "epoch": 0.85, - "learning_rate": 0.0001723632896257019, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.0002344213426788774, + "loss": 0.0249, "step": 168660 }, { - "epoch": 0.85, - "learning_rate": 0.00017235572193268788, - "loss": 0.017, + "epoch": 0.44, + "learning_rate": 0.0002344174544625059, + "loss": 0.0162, "step": 168670 }, { - "epoch": 0.85, - "learning_rate": 0.0001723481542396739, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023441356624613445, + "loss": 0.0189, "step": 168680 }, { - "epoch": 0.85, - "learning_rate": 0.00017234058654665987, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023440967802976296, + "loss": 0.0193, "step": 168690 }, { - "epoch": 0.85, - "learning_rate": 0.00017233301885364585, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023440578981339153, + "loss": 0.0209, "step": 168700 }, { - "epoch": 0.85, - "learning_rate": 0.00017232545116063183, - "loss": 0.0087, + "epoch": 0.44, + "learning_rate": 0.00023440190159702007, + "loss": 0.0192, "step": 168710 }, { - "epoch": 0.85, - "learning_rate": 0.00017231788346761784, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.0002343980133806486, + "loss": 0.0184, "step": 168720 }, { - "epoch": 0.85, - "learning_rate": 0.00017231031577460382, - "loss": 0.0153, + "epoch": 0.44, + "learning_rate": 0.0002343941251642771, + "loss": 0.0216, "step": 168730 }, { - "epoch": 0.85, - "learning_rate": 0.0001723027480815898, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023439023694790564, + "loss": 0.0212, "step": 168740 }, { - "epoch": 0.85, - "learning_rate": 0.0001722951803885758, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002343863487315342, + "loss": 0.0165, "step": 168750 }, { - "epoch": 0.85, - "learning_rate": 0.0001722876126955618, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023438246051516273, + "loss": 0.018, "step": 168760 }, { - "epoch": 0.85, - "learning_rate": 0.00017228004500254777, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023437857229879127, + "loss": 0.0173, "step": 168770 }, { - "epoch": 0.85, - "learning_rate": 0.00017227247730953378, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023437468408241978, + "loss": 0.0207, "step": 168780 }, { - "epoch": 0.85, - "learning_rate": 0.00017226490961651976, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023437079586604835, + "loss": 0.0215, "step": 168790 }, { - "epoch": 0.85, - "learning_rate": 0.00017225734192350575, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023436690764967687, + "loss": 0.0201, "step": 168800 }, { - "epoch": 0.85, - "learning_rate": 0.00017224977423049175, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.0002343630194333054, + "loss": 0.0187, "step": 168810 }, { - "epoch": 0.85, - "learning_rate": 0.00017224220653747774, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023435913121693392, + "loss": 0.0181, "step": 168820 }, { - "epoch": 0.85, - "learning_rate": 0.00017223463884446372, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.0002343552430005625, + "loss": 0.0197, "step": 168830 }, { - "epoch": 0.85, - "learning_rate": 0.00017222707115144973, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.000234351354784191, + "loss": 0.021, "step": 168840 }, { - "epoch": 0.85, - "learning_rate": 0.0001722195034584357, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.00023434746656781955, + "loss": 0.0182, "step": 168850 }, { - "epoch": 0.85, - "learning_rate": 0.0001722119357654217, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023434357835144806, + "loss": 0.0238, "step": 168860 }, { - "epoch": 0.85, - "learning_rate": 0.0001722043680724077, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.00023433969013507663, + "loss": 0.021, "step": 168870 }, { - "epoch": 0.85, - "learning_rate": 0.00017219680037939368, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023433580191870514, + "loss": 0.0163, "step": 168880 }, { - "epoch": 0.85, - "learning_rate": 0.00017218923268637966, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023433191370233369, + "loss": 0.0128, "step": 168890 }, { - "epoch": 0.85, - "learning_rate": 0.00017218166499336564, - "loss": 0.0154, + "epoch": 0.44, + "learning_rate": 0.0002343280254859622, + "loss": 0.0204, "step": 168900 }, { - "epoch": 0.85, - "learning_rate": 0.00017217409730035165, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.00023432413726959077, + "loss": 0.0208, "step": 168910 }, { - "epoch": 0.85, - "learning_rate": 0.00017216652960733763, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.0002343202490532193, + "loss": 0.0195, "step": 168920 }, { - "epoch": 0.85, - "learning_rate": 0.0001721589619143236, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023431636083684783, + "loss": 0.0181, "step": 168930 }, { - "epoch": 0.85, - "learning_rate": 0.00017215139422130962, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.00023431247262047637, + "loss": 0.02, "step": 168940 }, { - "epoch": 0.85, - "learning_rate": 0.0001721438265282956, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.0002343085844041049, + "loss": 0.0192, "step": 168950 }, { - "epoch": 0.85, - "learning_rate": 0.00017213625883528158, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023430469618773345, + "loss": 0.0191, "step": 168960 }, { - "epoch": 0.85, - "learning_rate": 0.0001721286911422676, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023430080797136197, + "loss": 0.0175, "step": 168970 }, { - "epoch": 0.85, - "learning_rate": 0.00017212112344925357, - "loss": 0.0089, + "epoch": 0.44, + "learning_rate": 0.0002342969197549905, + "loss": 0.0195, "step": 168980 }, { - "epoch": 0.85, - "learning_rate": 0.00017211355575623956, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023429303153861902, + "loss": 0.0192, "step": 168990 }, { - "epoch": 0.85, - "learning_rate": 0.00017210598806322556, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.0002342891433222476, + "loss": 0.0192, "step": 169000 }, { - "epoch": 0.85, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.008490633219480515, - "eval_runtime": 116.745, - "eval_samples_per_second": 17.131, - "eval_steps_per_second": 4.283, + "epoch": 0.44, + "eval_cer": 0.88176706962214, + "eval_loss": 0.012475664727389812, + "eval_runtime": 107.3738, + "eval_samples_per_second": 18.627, + "eval_steps_per_second": 4.657, "step": 169000 }, { - "epoch": 0.85, - "learning_rate": 0.00017209842037021155, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.0002342852551058761, + "loss": 0.022, "step": 169010 }, { - "epoch": 0.85, - "learning_rate": 0.00017209085267719753, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023428136688950465, + "loss": 0.014, "step": 169020 }, { - "epoch": 0.85, - "learning_rate": 0.00017208328498418354, - "loss": 0.017, + "epoch": 0.44, + "learning_rate": 0.00023427747867313316, + "loss": 0.0267, "step": 169030 }, { - "epoch": 0.85, - "learning_rate": 0.00017207571729116952, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023427359045676173, + "loss": 0.0186, "step": 169040 }, { - "epoch": 0.85, - "learning_rate": 0.0001720681495981555, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023426970224039024, + "loss": 0.0232, "step": 169050 }, { - "epoch": 0.85, - "learning_rate": 0.00017206058190514145, - "loss": 0.0148, + "epoch": 0.44, + "learning_rate": 0.00023426581402401879, + "loss": 0.0162, "step": 169060 }, { - "epoch": 0.85, - "learning_rate": 0.00017205301421212746, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.0002342619258076473, + "loss": 0.0181, "step": 169070 }, { - "epoch": 0.85, - "learning_rate": 0.00017204544651911344, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023425803759127587, + "loss": 0.0147, "step": 169080 }, { - "epoch": 0.85, - "learning_rate": 0.00017203787882609942, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.0002342541493749044, + "loss": 0.02, "step": 169090 }, { - "epoch": 0.85, - "learning_rate": 0.00017203031113308543, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023425026115853293, + "loss": 0.0189, "step": 169100 }, { - "epoch": 0.85, - "learning_rate": 0.00017202274344007141, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023424637294216147, + "loss": 0.0212, "step": 169110 }, { - "epoch": 0.85, - "learning_rate": 0.0001720151757470574, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023424248472579, + "loss": 0.0184, "step": 169120 }, { - "epoch": 0.85, - "learning_rate": 0.00017200760805404338, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023423859650941855, + "loss": 0.0178, "step": 169130 }, { - "epoch": 0.85, - "learning_rate": 0.00017200004036102939, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023423470829304706, + "loss": 0.0161, "step": 169140 }, { - "epoch": 0.85, - "learning_rate": 0.00017199247266801537, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.0002342308200766756, + "loss": 0.0158, "step": 169150 }, { - "epoch": 0.85, - "learning_rate": 0.00017198490497500135, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023422693186030415, + "loss": 0.0187, "step": 169160 }, { - "epoch": 0.85, - "learning_rate": 0.00017197733728198736, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.0002342230436439327, + "loss": 0.0195, "step": 169170 }, { - "epoch": 0.85, - "learning_rate": 0.00017196976958897334, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.0002342191554275612, + "loss": 0.0163, "step": 169180 }, { - "epoch": 0.85, - "learning_rate": 0.00017196220189595932, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023421526721118975, + "loss": 0.0216, "step": 169190 }, { - "epoch": 0.85, - "learning_rate": 0.00017195463420294533, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.0002342113789948183, + "loss": 0.0173, "step": 169200 }, { - "epoch": 0.85, - "learning_rate": 0.0001719470665099313, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023420749077844683, + "loss": 0.0158, "step": 169210 }, { - "epoch": 0.85, - "learning_rate": 0.0001719394988169173, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023420360256207534, + "loss": 0.0177, "step": 169220 }, { - "epoch": 0.85, - "learning_rate": 0.0001719319311239033, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.00023419971434570389, + "loss": 0.0196, "step": 169230 }, { - "epoch": 0.85, - "learning_rate": 0.00017192436343088928, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.0002341958261293324, + "loss": 0.0208, "step": 169240 }, { - "epoch": 0.85, - "learning_rate": 0.00017191679573787526, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023419193791296097, + "loss": 0.0206, "step": 169250 }, { - "epoch": 0.85, - "learning_rate": 0.00017190922804486127, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002341880496965895, + "loss": 0.0187, "step": 169260 }, { - "epoch": 0.85, - "learning_rate": 0.00017190166035184725, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023418416148021802, + "loss": 0.0161, "step": 169270 }, { - "epoch": 0.85, - "learning_rate": 0.00017189409265883323, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023418027326384654, + "loss": 0.0201, "step": 169280 }, { - "epoch": 0.85, - "learning_rate": 0.00017188652496581922, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.0002341763850474751, + "loss": 0.0129, "step": 169290 }, { - "epoch": 0.85, - "learning_rate": 0.00017187895727280522, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.00023417249683110365, + "loss": 0.0171, "step": 169300 }, { - "epoch": 0.85, - "learning_rate": 0.0001718713895797912, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023416860861473216, + "loss": 0.02, "step": 169310 }, { - "epoch": 0.85, - "learning_rate": 0.0001718638218867772, - "loss": 0.0193, + "epoch": 0.44, + "learning_rate": 0.0002341647203983607, + "loss": 0.0167, "step": 169320 }, { - "epoch": 0.85, - "learning_rate": 0.0001718562541937632, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023416083218198925, + "loss": 0.02, "step": 169330 }, { - "epoch": 0.85, - "learning_rate": 0.00017184868650074918, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002341569439656178, + "loss": 0.0173, "step": 169340 }, { - "epoch": 0.85, - "learning_rate": 0.00017184111880773516, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.0002341530557492463, + "loss": 0.0182, "step": 169350 }, { - "epoch": 0.85, - "learning_rate": 0.00017183355111472117, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023414916753287485, + "loss": 0.0185, "step": 169360 }, { - "epoch": 0.85, - "learning_rate": 0.00017182598342170715, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.0002341452793165034, + "loss": 0.0225, "step": 169370 }, { - "epoch": 0.85, - "learning_rate": 0.00017181841572869313, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023414139110013193, + "loss": 0.0192, "step": 169380 }, { - "epoch": 0.85, - "learning_rate": 0.00017181084803567914, - "loss": 0.013, + "epoch": 0.44, + "learning_rate": 0.00023413750288376044, + "loss": 0.0207, "step": 169390 }, { - "epoch": 0.85, - "learning_rate": 0.00017180328034266512, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023413361466738898, + "loss": 0.0221, "step": 169400 }, { - "epoch": 0.85, - "learning_rate": 0.0001717957126496511, - "loss": 0.015, + "epoch": 0.44, + "learning_rate": 0.00023412972645101755, + "loss": 0.0207, "step": 169410 }, { - "epoch": 0.85, - "learning_rate": 0.0001717881449566371, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023412583823464607, + "loss": 0.0184, "step": 169420 }, { - "epoch": 0.85, - "learning_rate": 0.0001717805772636231, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023412195001827458, + "loss": 0.0158, "step": 169430 }, { - "epoch": 0.85, - "learning_rate": 0.00017177300957060907, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.00023411806180190312, + "loss": 0.0194, "step": 169440 }, { - "epoch": 0.85, - "learning_rate": 0.00017176544187759505, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.0002341141735855317, + "loss": 0.0155, "step": 169450 }, { - "epoch": 0.85, - "learning_rate": 0.00017175787418458106, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.0002341102853691602, + "loss": 0.0202, "step": 169460 }, { - "epoch": 0.85, - "learning_rate": 0.00017175030649156704, - "loss": 0.014, + "epoch": 0.44, + "learning_rate": 0.00023410639715278875, + "loss": 0.0193, "step": 169470 }, { - "epoch": 0.86, - "learning_rate": 0.00017174273879855303, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023410250893641726, + "loss": 0.0196, "step": 169480 }, { - "epoch": 0.86, - "learning_rate": 0.00017173517110553903, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002340986207200458, + "loss": 0.0282, "step": 169490 }, { - "epoch": 0.86, - "learning_rate": 0.00017172760341252502, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023409473250367435, + "loss": 0.0189, "step": 169500 }, { - "epoch": 0.86, - "learning_rate": 0.000171720035719511, - "loss": 0.0091, + "epoch": 0.44, + "learning_rate": 0.0002340908442873029, + "loss": 0.0204, "step": 169510 }, { - "epoch": 0.86, - "learning_rate": 0.000171712468026497, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.0002340869560709314, + "loss": 0.0203, "step": 169520 }, { - "epoch": 0.86, - "learning_rate": 0.000171704900333483, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023408306785455994, + "loss": 0.0203, "step": 169530 }, { - "epoch": 0.86, - "learning_rate": 0.00017169733264046897, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023407917963818849, + "loss": 0.0157, "step": 169540 }, { - "epoch": 0.86, - "learning_rate": 0.00017168976494745498, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023407529142181703, + "loss": 0.0179, "step": 169550 }, { - "epoch": 0.86, - "learning_rate": 0.00017168219725444096, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023407140320544554, + "loss": 0.0159, "step": 169560 }, { - "epoch": 0.86, - "learning_rate": 0.00017167462956142694, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023406751498907408, + "loss": 0.0187, "step": 169570 }, { - "epoch": 0.86, - "learning_rate": 0.00017166706186841295, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023406362677270265, + "loss": 0.0203, "step": 169580 }, { - "epoch": 0.86, - "learning_rate": 0.00017165949417539893, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023405973855633117, + "loss": 0.0162, "step": 169590 }, { - "epoch": 0.86, - "learning_rate": 0.0001716519264823849, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.00023405585033995968, + "loss": 0.0168, "step": 169600 }, { - "epoch": 0.86, - "learning_rate": 0.0001716443587893709, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023405196212358822, + "loss": 0.0181, "step": 169610 }, { - "epoch": 0.86, - "learning_rate": 0.0001716367910963569, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.0002340480739072168, + "loss": 0.023, "step": 169620 }, { - "epoch": 0.86, - "learning_rate": 0.00017162922340334288, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.0002340441856908453, + "loss": 0.0201, "step": 169630 }, { - "epoch": 0.86, - "learning_rate": 0.00017162165571032886, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023404029747447385, + "loss": 0.0167, "step": 169640 }, { - "epoch": 0.86, - "learning_rate": 0.00017161408801731487, - "loss": 0.0088, + "epoch": 0.44, + "learning_rate": 0.00023403640925810236, + "loss": 0.02, "step": 169650 }, { - "epoch": 0.86, - "learning_rate": 0.00017160652032430085, - "loss": 0.0099, + "epoch": 0.44, + "learning_rate": 0.00023403252104173093, + "loss": 0.0183, "step": 169660 }, { - "epoch": 0.86, - "learning_rate": 0.00017159895263128684, - "loss": 0.0094, + "epoch": 0.44, + "learning_rate": 0.00023402863282535945, + "loss": 0.0184, "step": 169670 }, { - "epoch": 0.86, - "learning_rate": 0.00017159138493827284, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.000234024744608988, + "loss": 0.0148, "step": 169680 }, { - "epoch": 0.86, - "learning_rate": 0.00017158381724525883, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.0002340208563926165, + "loss": 0.0166, "step": 169690 }, { - "epoch": 0.86, - "learning_rate": 0.0001715762495522448, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.00023401696817624507, + "loss": 0.0152, "step": 169700 }, { - "epoch": 0.86, - "learning_rate": 0.00017156868185923082, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023401307995987359, + "loss": 0.0147, "step": 169710 }, { - "epoch": 0.86, - "learning_rate": 0.0001715611141662168, - "loss": 0.0096, + "epoch": 0.44, + "learning_rate": 0.00023400919174350213, + "loss": 0.0174, "step": 169720 }, { - "epoch": 0.86, - "learning_rate": 0.00017155354647320278, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.00023400530352713064, + "loss": 0.016, "step": 169730 }, { - "epoch": 0.86, - "learning_rate": 0.0001715459787801888, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.00023400141531075918, + "loss": 0.0174, "step": 169740 }, { - "epoch": 0.86, - "learning_rate": 0.00017153841108717477, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023399752709438772, + "loss": 0.019, "step": 169750 }, { - "epoch": 0.86, - "learning_rate": 0.00017153084339416075, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023399363887801627, + "loss": 0.0173, "step": 169760 }, { - "epoch": 0.86, - "learning_rate": 0.00017152327570114676, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023398975066164478, + "loss": 0.0212, "step": 169770 }, { - "epoch": 0.86, - "learning_rate": 0.00017151570800813274, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023398586244527332, + "loss": 0.0175, "step": 169780 }, { - "epoch": 0.86, - "learning_rate": 0.00017150814031511872, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.0002339819742289019, + "loss": 0.0227, "step": 169790 }, { - "epoch": 0.86, - "learning_rate": 0.0001715005726221047, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.0002339780860125304, + "loss": 0.019, "step": 169800 }, { - "epoch": 0.86, - "learning_rate": 0.0001714930049290907, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023397419779615895, + "loss": 0.017, "step": 169810 }, { - "epoch": 0.86, - "learning_rate": 0.0001714854372360767, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023397030957978746, + "loss": 0.0182, "step": 169820 }, { - "epoch": 0.86, - "learning_rate": 0.00017147786954306267, - "loss": 0.0097, + "epoch": 0.44, + "learning_rate": 0.00023396642136341603, + "loss": 0.0214, "step": 169830 }, { - "epoch": 0.86, - "learning_rate": 0.00017147030185004868, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023396253314704455, + "loss": 0.0194, "step": 169840 }, { - "epoch": 0.86, - "learning_rate": 0.00017146273415703466, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.0002339586449306731, + "loss": 0.0211, "step": 169850 }, { - "epoch": 0.86, - "learning_rate": 0.00017145516646402065, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.0002339547567143016, + "loss": 0.0182, "step": 169860 }, { - "epoch": 0.86, - "learning_rate": 0.00017144759877100665, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023395086849793017, + "loss": 0.0221, "step": 169870 }, { - "epoch": 0.86, - "learning_rate": 0.00017144003107799264, - "loss": 0.0147, + "epoch": 0.44, + "learning_rate": 0.00023394698028155868, + "loss": 0.0209, "step": 169880 }, { - "epoch": 0.86, - "learning_rate": 0.00017143246338497862, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023394309206518723, + "loss": 0.0178, "step": 169890 }, { - "epoch": 0.86, - "learning_rate": 0.00017142489569196463, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023393920384881574, + "loss": 0.0232, "step": 169900 }, { - "epoch": 0.86, - "learning_rate": 0.0001714173279989506, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002339353156324443, + "loss": 0.0169, "step": 169910 }, { - "epoch": 0.86, - "learning_rate": 0.0001714097603059366, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023393142741607282, + "loss": 0.0169, "step": 169920 }, { - "epoch": 0.86, - "learning_rate": 0.0001714021926129226, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023392753919970137, + "loss": 0.0188, "step": 169930 }, { - "epoch": 0.86, - "learning_rate": 0.00017139462491990858, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023392365098332988, + "loss": 0.0168, "step": 169940 }, { - "epoch": 0.86, - "learning_rate": 0.00017138705722689456, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023391976276695845, + "loss": 0.0165, "step": 169950 }, { - "epoch": 0.86, - "learning_rate": 0.00017137948953388054, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.000233915874550587, + "loss": 0.0146, "step": 169960 }, { - "epoch": 0.86, - "learning_rate": 0.00017137192184086655, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.0002339119863342155, + "loss": 0.017, "step": 169970 }, { - "epoch": 0.86, - "learning_rate": 0.00017136435414785253, - "loss": 0.0093, + "epoch": 0.44, + "learning_rate": 0.00023390809811784405, + "loss": 0.0311, "step": 169980 }, { - "epoch": 0.86, - "learning_rate": 0.0001713567864548385, - "loss": 0.0162, + "epoch": 0.44, + "learning_rate": 0.00023390420990147256, + "loss": 0.0195, "step": 169990 }, { - "epoch": 0.86, - "learning_rate": 0.00017134921876182452, - "loss": 0.015, + "epoch": 0.44, + "learning_rate": 0.00023390032168510113, + "loss": 0.0191, "step": 170000 }, { - "epoch": 0.86, - "eval_cer": 0.9144799598644162, - "eval_loss": 0.00878238771110773, - "eval_runtime": 116.6286, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.44, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.01211427990347147, + "eval_runtime": 107.8438, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, "step": 170000 }, { - "epoch": 0.86, - "learning_rate": 0.0001713416510688105, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023389643346872964, + "loss": 0.0174, "step": 170010 }, { - "epoch": 0.86, - "learning_rate": 0.00017133408337579648, - "loss": 0.0136, + "epoch": 0.44, + "learning_rate": 0.0002338925452523582, + "loss": 0.0151, "step": 170020 }, { - "epoch": 0.86, - "learning_rate": 0.0001713265156827825, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.0002338886570359867, + "loss": 0.0167, "step": 170030 }, { - "epoch": 0.86, - "learning_rate": 0.00017131894798976847, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023388476881961527, + "loss": 0.0189, "step": 170040 }, { - "epoch": 0.86, - "learning_rate": 0.00017131138029675446, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.00023388088060324378, + "loss": 0.0237, "step": 170050 }, { - "epoch": 0.86, - "learning_rate": 0.00017130381260374046, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.00023387699238687233, + "loss": 0.0173, "step": 170060 }, { - "epoch": 0.86, - "learning_rate": 0.00017129624491072645, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023387310417050084, + "loss": 0.0172, "step": 170070 }, { - "epoch": 0.86, - "learning_rate": 0.00017128867721771243, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.0002338692159541294, + "loss": 0.016, "step": 170080 }, { - "epoch": 0.86, - "learning_rate": 0.00017128110952469844, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023386532773775792, + "loss": 0.0175, "step": 170090 }, { - "epoch": 0.86, - "learning_rate": 0.00017127354183168442, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023386143952138647, + "loss": 0.0199, "step": 170100 }, { - "epoch": 0.86, - "learning_rate": 0.0001712659741386704, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023385755130501498, + "loss": 0.0167, "step": 170110 }, { - "epoch": 0.86, - "learning_rate": 0.00017125840644565638, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023385366308864355, + "loss": 0.0184, "step": 170120 }, { - "epoch": 0.86, - "learning_rate": 0.0001712508387526424, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.0002338497748722721, + "loss": 0.0154, "step": 170130 }, { - "epoch": 0.86, - "learning_rate": 0.00017124327105962837, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.0002338458866559006, + "loss": 0.0207, "step": 170140 }, { - "epoch": 0.86, - "learning_rate": 0.00017123570336661435, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023384199843952912, + "loss": 0.0185, "step": 170150 }, { - "epoch": 0.86, - "learning_rate": 0.00017122813567360036, - "loss": 0.0099, + "epoch": 0.44, + "learning_rate": 0.0002338381102231577, + "loss": 0.018, "step": 170160 }, { - "epoch": 0.86, - "learning_rate": 0.00017122056798058634, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023383422200678623, + "loss": 0.0164, "step": 170170 }, { - "epoch": 0.86, - "learning_rate": 0.00017121300028757232, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.00023383033379041474, + "loss": 0.0177, "step": 170180 }, { - "epoch": 0.86, - "learning_rate": 0.00017120543259455833, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023382644557404329, + "loss": 0.0172, "step": 170190 }, { - "epoch": 0.86, - "learning_rate": 0.0001711978649015443, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023382255735767183, + "loss": 0.0185, "step": 170200 }, { - "epoch": 0.86, - "learning_rate": 0.0001711902972085303, - "loss": 0.011, - "step": 170210 + "epoch": 0.44, + "learning_rate": 0.00023381866914130037, + "loss": 0.0146, + "step": 170210 }, { - "epoch": 0.86, - "learning_rate": 0.0001711827295155163, - "loss": 0.0158, + "epoch": 0.44, + "learning_rate": 0.00023381478092492888, + "loss": 0.0182, "step": 170220 }, { - "epoch": 0.86, - "learning_rate": 0.00017117516182250228, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023381089270855743, + "loss": 0.0141, "step": 170230 }, { - "epoch": 0.86, - "learning_rate": 0.00017116759412948827, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023380700449218594, + "loss": 0.0144, "step": 170240 }, { - "epoch": 0.86, - "learning_rate": 0.00017116002643647427, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.0002338031162758145, + "loss": 0.0196, "step": 170250 }, { - "epoch": 0.86, - "learning_rate": 0.00017115245874346026, - "loss": 0.0271, + "epoch": 0.44, + "learning_rate": 0.00023379922805944302, + "loss": 0.0168, "step": 170260 }, { - "epoch": 0.86, - "learning_rate": 0.00017114489105044624, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.00023379533984307156, + "loss": 0.0169, "step": 170270 }, { - "epoch": 0.86, - "learning_rate": 0.00017113732335743225, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023379145162670008, + "loss": 0.0179, "step": 170280 }, { - "epoch": 0.86, - "learning_rate": 0.00017112975566441823, - "loss": 0.0123, + "epoch": 0.44, + "learning_rate": 0.00023378756341032865, + "loss": 0.0182, "step": 170290 }, { - "epoch": 0.86, - "learning_rate": 0.0001711221879714042, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.00023378367519395716, + "loss": 0.0171, "step": 170300 }, { - "epoch": 0.86, - "learning_rate": 0.00017111462027839016, - "loss": 0.0148, + "epoch": 0.44, + "learning_rate": 0.0002337797869775857, + "loss": 0.0175, "step": 170310 }, { - "epoch": 0.86, - "learning_rate": 0.00017110705258537617, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023377589876121422, + "loss": 0.0202, "step": 170320 }, { - "epoch": 0.86, - "learning_rate": 0.00017109948489236215, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.0002337720105448428, + "loss": 0.0165, "step": 170330 }, { - "epoch": 0.86, - "learning_rate": 0.00017109191719934813, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023376812232847133, + "loss": 0.0155, "step": 170340 }, { - "epoch": 0.86, - "learning_rate": 0.00017108434950633412, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.00023376423411209984, + "loss": 0.0217, "step": 170350 }, { - "epoch": 0.86, - "learning_rate": 0.00017107678181332012, - "loss": 0.0173, + "epoch": 0.44, + "learning_rate": 0.00023376034589572839, + "loss": 0.018, "step": 170360 }, { - "epoch": 0.86, - "learning_rate": 0.0001710692141203061, - "loss": 0.015, + "epoch": 0.44, + "learning_rate": 0.00023375645767935693, + "loss": 0.016, "step": 170370 }, { - "epoch": 0.86, - "learning_rate": 0.0001710616464272921, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023375256946298547, + "loss": 0.016, "step": 170380 }, { - "epoch": 0.86, - "learning_rate": 0.0001710540787342781, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023374868124661398, + "loss": 0.0164, "step": 170390 }, { - "epoch": 0.86, - "learning_rate": 0.00017104651104126408, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023374479303024252, + "loss": 0.0213, "step": 170400 }, { - "epoch": 0.86, - "learning_rate": 0.00017103894334825006, - "loss": 0.023, + "epoch": 0.44, + "learning_rate": 0.00023374090481387107, + "loss": 0.0196, "step": 170410 }, { - "epoch": 0.86, - "learning_rate": 0.00017103137565523607, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.0002337370165974996, + "loss": 0.0149, "step": 170420 }, { - "epoch": 0.86, - "learning_rate": 0.00017102380796222205, - "loss": 0.0142, + "epoch": 0.44, + "learning_rate": 0.00023373312838112812, + "loss": 0.0172, "step": 170430 }, { - "epoch": 0.86, - "learning_rate": 0.00017101624026920803, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023372924016475666, + "loss": 0.023, "step": 170440 }, { - "epoch": 0.86, - "learning_rate": 0.00017100867257619404, - "loss": 0.0095, + "epoch": 0.44, + "learning_rate": 0.00023372535194838518, + "loss": 0.0173, "step": 170450 }, { - "epoch": 0.86, - "learning_rate": 0.00017100110488318002, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023372146373201375, + "loss": 0.0164, "step": 170460 }, { - "epoch": 0.86, - "learning_rate": 0.000170993537190166, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023371757551564226, + "loss": 0.0203, "step": 170470 }, { - "epoch": 0.86, - "learning_rate": 0.000170985969497152, - "loss": 0.0096, + "epoch": 0.44, + "learning_rate": 0.0002337136872992708, + "loss": 0.016, "step": 170480 }, { - "epoch": 0.86, - "learning_rate": 0.000170978401804138, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023370979908289932, + "loss": 0.0178, "step": 170490 }, { - "epoch": 0.86, - "learning_rate": 0.00017097083411112397, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.0002337059108665279, + "loss": 0.016, "step": 170500 }, { - "epoch": 0.86, - "learning_rate": 0.00017096326641810995, - "loss": 0.0102, + "epoch": 0.44, + "learning_rate": 0.00023370202265015643, + "loss": 0.0178, "step": 170510 }, { - "epoch": 0.86, - "learning_rate": 0.00017095569872509596, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.00023369813443378494, + "loss": 0.0127, "step": 170520 }, { - "epoch": 0.86, - "learning_rate": 0.00017094813103208194, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023369424621741348, + "loss": 0.0203, "step": 170530 }, { - "epoch": 0.86, - "learning_rate": 0.00017094056333906793, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.00023369035800104203, + "loss": 0.0152, "step": 170540 }, { - "epoch": 0.86, - "learning_rate": 0.00017093299564605393, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023368646978467057, + "loss": 0.0173, "step": 170550 }, { - "epoch": 0.86, - "learning_rate": 0.00017092542795303992, - "loss": 0.0126, + "epoch": 0.44, + "learning_rate": 0.00023368258156829908, + "loss": 0.0164, "step": 170560 }, { - "epoch": 0.86, - "learning_rate": 0.0001709178602600259, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023367869335192762, + "loss": 0.0188, "step": 170570 }, { - "epoch": 0.86, - "learning_rate": 0.0001709102925670119, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023367480513555617, + "loss": 0.0243, "step": 170580 }, { - "epoch": 0.86, - "learning_rate": 0.0001709027248739979, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002336709169191847, + "loss": 0.015, "step": 170590 }, { - "epoch": 0.86, - "learning_rate": 0.00017089515718098387, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023366702870281322, + "loss": 0.0187, "step": 170600 }, { - "epoch": 0.86, - "learning_rate": 0.00017088758948796988, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023366314048644176, + "loss": 0.0203, "step": 170610 }, { - "epoch": 0.86, - "learning_rate": 0.00017088002179495586, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002336592522700703, + "loss": 0.0165, "step": 170620 }, { - "epoch": 0.86, - "learning_rate": 0.00017087245410194184, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023365536405369885, + "loss": 0.0216, "step": 170630 }, { - "epoch": 0.86, - "learning_rate": 0.00017086488640892785, - "loss": 0.0117, + "epoch": 0.44, + "learning_rate": 0.00023365147583732736, + "loss": 0.0196, "step": 170640 }, { - "epoch": 0.86, - "learning_rate": 0.00017085731871591383, - "loss": 0.0138, + "epoch": 0.44, + "learning_rate": 0.0002336475876209559, + "loss": 0.0161, "step": 170650 }, { - "epoch": 0.86, - "learning_rate": 0.0001708497510228998, - "loss": 0.0104, + "epoch": 0.44, + "learning_rate": 0.00023364369940458447, + "loss": 0.0215, "step": 170660 }, { - "epoch": 0.86, - "learning_rate": 0.00017084218332988582, - "loss": 0.0165, + "epoch": 0.44, + "learning_rate": 0.00023363981118821299, + "loss": 0.0151, "step": 170670 }, { - "epoch": 0.86, - "learning_rate": 0.0001708346156368718, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.00023363592297184153, + "loss": 0.0158, "step": 170680 }, { - "epoch": 0.86, - "learning_rate": 0.00017082704794385778, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023363203475547004, + "loss": 0.0197, "step": 170690 }, { - "epoch": 0.86, - "learning_rate": 0.00017081948025084376, - "loss": 0.0125, + "epoch": 0.44, + "learning_rate": 0.00023362814653909858, + "loss": 0.0171, "step": 170700 }, { - "epoch": 0.86, - "learning_rate": 0.00017081191255782977, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023362425832272713, + "loss": 0.0188, "step": 170710 }, { - "epoch": 0.86, - "learning_rate": 0.00017080434486481575, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023362037010635567, + "loss": 0.0202, "step": 170720 }, { - "epoch": 0.86, - "learning_rate": 0.00017079677717180174, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023361648188998418, + "loss": 0.0228, "step": 170730 }, { - "epoch": 0.86, - "learning_rate": 0.00017078920947878774, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023361259367361272, + "loss": 0.0191, "step": 170740 }, { - "epoch": 0.86, - "learning_rate": 0.00017078164178577373, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023360870545724127, + "loss": 0.0186, "step": 170750 }, { - "epoch": 0.86, - "learning_rate": 0.0001707740740927597, - "loss": 0.0148, + "epoch": 0.44, + "learning_rate": 0.0002336048172408698, + "loss": 0.0246, "step": 170760 }, { - "epoch": 0.86, - "learning_rate": 0.00017076650639974572, - "loss": 0.0139, + "epoch": 0.44, + "learning_rate": 0.00023360092902449832, + "loss": 0.0233, "step": 170770 }, { - "epoch": 0.86, - "learning_rate": 0.0001707589387067317, - "loss": 0.0155, + "epoch": 0.44, + "learning_rate": 0.00023359704080812686, + "loss": 0.0202, "step": 170780 }, { - "epoch": 0.86, - "learning_rate": 0.00017075137101371768, - "loss": 0.0094, + "epoch": 0.44, + "learning_rate": 0.0002335931525917554, + "loss": 0.0181, "step": 170790 }, { - "epoch": 0.86, - "learning_rate": 0.0001707438033207037, - "loss": 0.0137, + "epoch": 0.44, + "learning_rate": 0.00023358926437538395, + "loss": 0.0171, "step": 170800 }, { - "epoch": 0.86, - "learning_rate": 0.00017073623562768967, - "loss": 0.0097, + "epoch": 0.44, + "learning_rate": 0.00023358537615901246, + "loss": 0.0248, "step": 170810 }, { - "epoch": 0.86, - "learning_rate": 0.00017072866793467565, - "loss": 0.0095, + "epoch": 0.44, + "learning_rate": 0.000233581487942641, + "loss": 0.0182, "step": 170820 }, { - "epoch": 0.86, - "learning_rate": 0.00017072110024166166, - "loss": 0.0162, + "epoch": 0.44, + "learning_rate": 0.00023357759972626957, + "loss": 0.0139, "step": 170830 }, { - "epoch": 0.86, - "learning_rate": 0.00017071353254864764, - "loss": 0.0122, + "epoch": 0.44, + "learning_rate": 0.00023357371150989809, + "loss": 0.0191, "step": 170840 }, { - "epoch": 0.86, - "learning_rate": 0.00017070596485563362, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023356982329352663, + "loss": 0.0144, "step": 170850 }, { - "epoch": 0.86, - "learning_rate": 0.0001706983971626196, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023356593507715514, + "loss": 0.0172, "step": 170860 }, { - "epoch": 0.86, - "learning_rate": 0.0001706908294696056, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002335620468607837, + "loss": 0.0173, "step": 170870 }, { - "epoch": 0.86, - "learning_rate": 0.0001706832617765916, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023355815864441223, + "loss": 0.0141, "step": 170880 }, { - "epoch": 0.86, - "learning_rate": 0.00017067569408357757, - "loss": 0.0102, + "epoch": 0.44, + "learning_rate": 0.00023355427042804077, + "loss": 0.0195, "step": 170890 }, { - "epoch": 0.86, - "learning_rate": 0.00017066812639056358, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.00023355038221166928, + "loss": 0.0196, "step": 170900 }, { - "epoch": 0.86, - "learning_rate": 0.00017066055869754956, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023354649399529785, + "loss": 0.0181, "step": 170910 }, { - "epoch": 0.86, - "learning_rate": 0.00017065299100453555, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023354260577892636, + "loss": 0.0169, "step": 170920 }, { - "epoch": 0.86, - "learning_rate": 0.00017064542331152155, - "loss": 0.0141, + "epoch": 0.44, + "learning_rate": 0.0002335387175625549, + "loss": 0.0175, "step": 170930 }, { - "epoch": 0.86, - "learning_rate": 0.00017063785561850754, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023353482934618342, + "loss": 0.0145, "step": 170940 }, { - "epoch": 0.86, - "learning_rate": 0.00017063028792549352, - "loss": 0.0227, + "epoch": 0.44, + "learning_rate": 0.00023353094112981196, + "loss": 0.0165, "step": 170950 }, { - "epoch": 0.86, - "learning_rate": 0.00017062272023247953, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.0002335270529134405, + "loss": 0.0284, "step": 170960 }, { - "epoch": 0.86, - "learning_rate": 0.0001706151525394655, - "loss": 0.0113, + "epoch": 0.44, + "learning_rate": 0.00023352316469706905, + "loss": 0.0172, "step": 170970 }, { - "epoch": 0.86, - "learning_rate": 0.0001706075848464515, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.00023351927648069756, + "loss": 0.0187, "step": 170980 }, { - "epoch": 0.86, - "learning_rate": 0.0001706000171534375, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.0002335153882643261, + "loss": 0.017, "step": 170990 }, { - "epoch": 0.86, - "learning_rate": 0.00017059244946042348, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.00023351150004795467, + "loss": 0.026, "step": 171000 }, { - "epoch": 0.86, - "eval_cer": 0.914508101352053, - "eval_loss": 0.008454186841845512, - "eval_runtime": 116.644, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.287, + "epoch": 0.44, + "eval_cer": 0.8818006609085604, + "eval_loss": 0.01254571508616209, + "eval_runtime": 108.0306, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, "step": 171000 }, { - "epoch": 0.86, - "learning_rate": 0.00017058488176740946, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023350761183158319, + "loss": 0.0176, "step": 171010 }, { - "epoch": 0.86, - "learning_rate": 0.00017057731407439544, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.0002335037236152117, + "loss": 0.0204, "step": 171020 }, { - "epoch": 0.86, - "learning_rate": 0.00017056974638138145, - "loss": 0.0135, + "epoch": 0.44, + "learning_rate": 0.00023349983539884024, + "loss": 0.0178, "step": 171030 }, { - "epoch": 0.86, - "learning_rate": 0.00017056217868836743, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.0002334959471824688, + "loss": 0.0205, "step": 171040 }, { - "epoch": 0.86, - "learning_rate": 0.0001705546109953534, - "loss": 0.0095, + "epoch": 0.44, + "learning_rate": 0.00023349205896609732, + "loss": 0.0237, "step": 171050 }, { - "epoch": 0.86, - "learning_rate": 0.00017054704330233942, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023348817074972587, + "loss": 0.0196, "step": 171060 }, { - "epoch": 0.86, - "learning_rate": 0.0001705394756093254, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.00023348428253335438, + "loss": 0.0188, "step": 171070 }, { - "epoch": 0.86, - "learning_rate": 0.00017053190791631138, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.00023348039431698295, + "loss": 0.0146, "step": 171080 }, { - "epoch": 0.86, - "learning_rate": 0.0001705243402232974, - "loss": 0.0097, + "epoch": 0.44, + "learning_rate": 0.00023347650610061146, + "loss": 0.0247, "step": 171090 }, { - "epoch": 0.86, - "learning_rate": 0.00017051677253028337, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023347261788424, + "loss": 0.0167, "step": 171100 }, { - "epoch": 0.86, - "learning_rate": 0.00017050920483726936, - "loss": 0.0133, + "epoch": 0.44, + "learning_rate": 0.00023346872966786852, + "loss": 0.018, "step": 171110 }, { - "epoch": 0.86, - "learning_rate": 0.00017050163714425536, - "loss": 0.0121, + "epoch": 0.44, + "learning_rate": 0.0002334648414514971, + "loss": 0.0149, "step": 171120 }, { - "epoch": 0.86, - "learning_rate": 0.00017049406945124135, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.0002334609532351256, + "loss": 0.018, "step": 171130 }, { - "epoch": 0.86, - "learning_rate": 0.00017048650175822733, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023345706501875415, + "loss": 0.0203, "step": 171140 }, { - "epoch": 0.86, - "learning_rate": 0.00017047893406521334, - "loss": 0.0097, + "epoch": 0.44, + "learning_rate": 0.00023345317680238266, + "loss": 0.0205, "step": 171150 }, { - "epoch": 0.86, - "learning_rate": 0.00017047136637219932, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023344928858601123, + "loss": 0.0176, "step": 171160 }, { - "epoch": 0.86, - "learning_rate": 0.0001704637986791853, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.00023344540036963977, + "loss": 0.0144, "step": 171170 }, { - "epoch": 0.86, - "learning_rate": 0.0001704562309861713, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023344151215326828, + "loss": 0.0222, "step": 171180 }, { - "epoch": 0.86, - "learning_rate": 0.0001704486632931573, - "loss": 0.0127, + "epoch": 0.44, + "learning_rate": 0.0002334376239368968, + "loss": 0.0179, "step": 171190 }, { - "epoch": 0.86, - "learning_rate": 0.00017044109560014327, - "loss": 0.0152, + "epoch": 0.44, + "learning_rate": 0.00023343373572052534, + "loss": 0.024, "step": 171200 }, { - "epoch": 0.86, - "learning_rate": 0.00017043352790712925, - "loss": 0.0144, + "epoch": 0.44, + "learning_rate": 0.0002334298475041539, + "loss": 0.0185, "step": 171210 }, { - "epoch": 0.86, - "learning_rate": 0.00017042596021411526, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.00023342595928778242, + "loss": 0.0163, "step": 171220 }, { - "epoch": 0.86, - "learning_rate": 0.00017041839252110124, - "loss": 0.0093, + "epoch": 0.44, + "learning_rate": 0.00023342207107141097, + "loss": 0.0166, "step": 171230 }, { - "epoch": 0.86, - "learning_rate": 0.00017041082482808722, - "loss": 0.0102, + "epoch": 0.44, + "learning_rate": 0.00023341818285503948, + "loss": 0.0162, "step": 171240 }, { - "epoch": 0.86, - "learning_rate": 0.00017040325713507323, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023341429463866805, + "loss": 0.0183, "step": 171250 }, { - "epoch": 0.86, - "learning_rate": 0.0001703956894420592, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023341040642229656, + "loss": 0.0174, "step": 171260 }, { - "epoch": 0.86, - "learning_rate": 0.0001703881217490452, - "loss": 0.0092, + "epoch": 0.44, + "learning_rate": 0.0002334065182059251, + "loss": 0.0166, "step": 171270 }, { - "epoch": 0.86, - "learning_rate": 0.0001703805540560312, - "loss": 0.0085, + "epoch": 0.44, + "learning_rate": 0.00023340262998955362, + "loss": 0.0172, "step": 171280 }, { - "epoch": 0.86, - "learning_rate": 0.00017037298636301718, - "loss": 0.0103, + "epoch": 0.44, + "learning_rate": 0.0002333987417731822, + "loss": 0.0289, "step": 171290 }, { - "epoch": 0.86, - "learning_rate": 0.00017036541867000317, - "loss": 0.0119, + "epoch": 0.44, + "learning_rate": 0.0002333948535568107, + "loss": 0.0197, "step": 171300 }, { - "epoch": 0.86, - "learning_rate": 0.00017035785097698917, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023339096534043924, + "loss": 0.0199, "step": 171310 }, { - "epoch": 0.86, - "learning_rate": 0.00017035028328397516, - "loss": 0.0106, + "epoch": 0.44, + "learning_rate": 0.00023338707712406776, + "loss": 0.0169, "step": 171320 }, { - "epoch": 0.86, - "learning_rate": 0.00017034271559096114, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.00023338318890769633, + "loss": 0.0207, "step": 171330 }, { - "epoch": 0.86, - "learning_rate": 0.00017033514789794715, - "loss": 0.009, + "epoch": 0.44, + "learning_rate": 0.00023337930069132484, + "loss": 0.0185, "step": 171340 }, { - "epoch": 0.86, - "learning_rate": 0.00017032758020493313, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023337541247495338, + "loss": 0.0221, "step": 171350 }, { - "epoch": 0.86, - "learning_rate": 0.0001703200125119191, - "loss": 0.0101, + "epoch": 0.44, + "learning_rate": 0.0002333715242585819, + "loss": 0.0223, "step": 171360 }, { - "epoch": 0.86, - "learning_rate": 0.0001703124448189051, - "loss": 0.0129, + "epoch": 0.44, + "learning_rate": 0.00023336763604221047, + "loss": 0.0229, "step": 171370 }, { - "epoch": 0.86, - "learning_rate": 0.0001703048771258911, - "loss": 0.0114, + "epoch": 0.44, + "learning_rate": 0.000233363747825839, + "loss": 0.0209, "step": 171380 }, { - "epoch": 0.86, - "learning_rate": 0.00017029730943287708, - "loss": 0.0128, + "epoch": 0.44, + "learning_rate": 0.00023335985960946752, + "loss": 0.023, "step": 171390 }, { - "epoch": 0.86, - "learning_rate": 0.00017028974173986306, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023335597139309607, + "loss": 0.0182, "step": 171400 }, { - "epoch": 0.86, - "learning_rate": 0.00017028217404684907, - "loss": 0.0086, + "epoch": 0.44, + "learning_rate": 0.0002333520831767246, + "loss": 0.0183, "step": 171410 }, { - "epoch": 0.86, - "learning_rate": 0.00017027460635383505, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023334819496035315, + "loss": 0.0161, "step": 171420 }, { - "epoch": 0.86, - "learning_rate": 0.00017026703866082103, - "loss": 0.012, + "epoch": 0.44, + "learning_rate": 0.00023334430674398166, + "loss": 0.0153, "step": 171430 }, { - "epoch": 0.86, - "learning_rate": 0.00017025947096780704, - "loss": 0.0109, + "epoch": 0.44, + "learning_rate": 0.0002333404185276102, + "loss": 0.0218, "step": 171440 }, { - "epoch": 0.86, - "learning_rate": 0.00017025190327479302, - "loss": 0.0098, + "epoch": 0.44, + "learning_rate": 0.00023333653031123872, + "loss": 0.0181, "step": 171450 }, { - "epoch": 0.87, - "learning_rate": 0.000170244335581779, - "loss": 0.0105, + "epoch": 0.44, + "learning_rate": 0.0002333326420948673, + "loss": 0.0193, "step": 171460 }, { - "epoch": 0.87, - "learning_rate": 0.000170236767888765, - "loss": 0.0107, + "epoch": 0.44, + "learning_rate": 0.0002333287538784958, + "loss": 0.0195, "step": 171470 }, { - "epoch": 0.87, - "learning_rate": 0.000170229200195751, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023332486566212434, + "loss": 0.0167, "step": 171480 }, { - "epoch": 0.87, - "learning_rate": 0.00017022163250273698, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.00023332097744575286, + "loss": 0.0185, "step": 171490 }, { - "epoch": 0.87, - "learning_rate": 0.00017021406480972298, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023331708922938143, + "loss": 0.0195, "step": 171500 }, { - "epoch": 0.87, - "learning_rate": 0.00017020649711670897, - "loss": 0.0115, + "epoch": 0.44, + "learning_rate": 0.00023331320101300994, + "loss": 0.018, "step": 171510 }, { - "epoch": 0.87, - "learning_rate": 0.00017019892942369495, - "loss": 0.01, + "epoch": 0.44, + "learning_rate": 0.00023330931279663848, + "loss": 0.0159, "step": 171520 }, { - "epoch": 0.87, - "learning_rate": 0.00017019136173068093, - "loss": 0.0124, + "epoch": 0.44, + "learning_rate": 0.000233305424580267, + "loss": 0.0195, "step": 171530 }, { - "epoch": 0.87, - "learning_rate": 0.00017018379403766694, - "loss": 0.0118, + "epoch": 0.44, + "learning_rate": 0.00023330153636389557, + "loss": 0.0143, "step": 171540 }, { - "epoch": 0.87, - "learning_rate": 0.00017017622634465292, - "loss": 0.0116, + "epoch": 0.44, + "learning_rate": 0.0002332976481475241, + "loss": 0.0152, "step": 171550 }, { - "epoch": 0.87, - "learning_rate": 0.0001701686586516389, - "loss": 0.0131, + "epoch": 0.44, + "learning_rate": 0.00023329375993115262, + "loss": 0.014, "step": 171560 }, { - "epoch": 0.87, - "learning_rate": 0.00017016109095862488, - "loss": 0.0154, + "epoch": 0.44, + "learning_rate": 0.00023328987171478116, + "loss": 0.0214, "step": 171570 }, { - "epoch": 0.87, - "learning_rate": 0.00017015352326561086, - "loss": 0.0102, + "epoch": 0.44, + "learning_rate": 0.0002332859834984097, + "loss": 0.017, "step": 171580 }, { - "epoch": 0.87, - "learning_rate": 0.00017014595557259684, - "loss": 0.011, + "epoch": 0.44, + "learning_rate": 0.00023328209528203825, + "loss": 0.0199, "step": 171590 }, { - "epoch": 0.87, - "learning_rate": 0.00017013838787958283, - "loss": 0.0132, + "epoch": 0.44, + "learning_rate": 0.00023327820706566676, + "loss": 0.0138, "step": 171600 }, { - "epoch": 0.87, - "learning_rate": 0.00017013082018656883, - "loss": 0.0096, + "epoch": 0.44, + "learning_rate": 0.0002332743188492953, + "loss": 0.0182, "step": 171610 }, { - "epoch": 0.87, - "learning_rate": 0.00017012325249355482, - "loss": 0.0092, + "epoch": 0.44, + "learning_rate": 0.00023327043063292385, + "loss": 0.0169, "step": 171620 }, { - "epoch": 0.87, - "learning_rate": 0.0001701156848005408, - "loss": 0.017, + "epoch": 0.44, + "learning_rate": 0.0002332665424165524, + "loss": 0.0187, "step": 171630 }, { - "epoch": 0.87, - "learning_rate": 0.0001701081171075268, - "loss": 0.0112, + "epoch": 0.44, + "learning_rate": 0.0002332626542001809, + "loss": 0.0198, "step": 171640 }, { - "epoch": 0.87, - "learning_rate": 0.0001701005494145128, - "loss": 0.0108, + "epoch": 0.44, + "learning_rate": 0.00023325876598380944, + "loss": 0.0174, "step": 171650 }, { - "epoch": 0.87, - "learning_rate": 0.00017009298172149877, - "loss": 0.0099, + "epoch": 0.44, + "learning_rate": 0.00023325487776743799, + "loss": 0.0166, "step": 171660 }, { - "epoch": 0.87, - "learning_rate": 0.00017008541402848478, - "loss": 0.0111, + "epoch": 0.44, + "learning_rate": 0.00023325098955106653, + "loss": 0.0188, "step": 171670 }, { - "epoch": 0.87, - "learning_rate": 0.00017007784633547076, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023324710133469504, + "loss": 0.0259, "step": 171680 }, { - "epoch": 0.87, - "learning_rate": 0.00017007027864245674, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.00023324321311832358, + "loss": 0.0181, "step": 171690 }, { - "epoch": 0.87, - "learning_rate": 0.00017006271094944275, - "loss": 0.0088, + "epoch": 0.45, + "learning_rate": 0.0002332393249019521, + "loss": 0.0199, "step": 171700 }, { - "epoch": 0.87, - "learning_rate": 0.00017005514325642873, - "loss": 0.0282, + "epoch": 0.45, + "learning_rate": 0.00023323543668558067, + "loss": 0.018, "step": 171710 }, { - "epoch": 0.87, - "learning_rate": 0.0001700475755634147, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002332315484692092, + "loss": 0.0171, "step": 171720 }, { - "epoch": 0.87, - "learning_rate": 0.00017004000787040072, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023322766025283772, + "loss": 0.0203, "step": 171730 }, { - "epoch": 0.87, - "learning_rate": 0.0001700324401773867, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023322377203646624, + "loss": 0.0241, "step": 171740 }, { - "epoch": 0.87, - "learning_rate": 0.00017002487248437268, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.0002332198838200948, + "loss": 0.0197, "step": 171750 }, { - "epoch": 0.87, - "learning_rate": 0.00017001730479135866, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023321599560372335, + "loss": 0.0187, "step": 171760 }, { - "epoch": 0.87, - "learning_rate": 0.00017000973709834467, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023321210738735186, + "loss": 0.0182, "step": 171770 }, { - "epoch": 0.87, - "learning_rate": 0.00017000216940533065, - "loss": 0.0092, + "epoch": 0.45, + "learning_rate": 0.0002332082191709804, + "loss": 0.0185, "step": 171780 }, { - "epoch": 0.87, - "learning_rate": 0.00016999460171231664, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023320433095460895, + "loss": 0.0159, "step": 171790 }, { - "epoch": 0.87, - "learning_rate": 0.00016998703401930264, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.0002332004427382375, + "loss": 0.0182, "step": 171800 }, { - "epoch": 0.87, - "learning_rate": 0.00016997946632628863, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.000233196554521866, + "loss": 0.0174, "step": 171810 }, { - "epoch": 0.87, - "learning_rate": 0.0001699718986332746, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023319266630549454, + "loss": 0.0169, "step": 171820 }, { - "epoch": 0.87, - "learning_rate": 0.00016996433094026062, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023318877808912308, + "loss": 0.0164, "step": 171830 }, { - "epoch": 0.87, - "learning_rate": 0.0001699567632472466, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.00023318488987275163, + "loss": 0.0165, "step": 171840 }, { - "epoch": 0.87, - "learning_rate": 0.00016994919555423258, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023318100165638014, + "loss": 0.0163, "step": 171850 }, { - "epoch": 0.87, - "learning_rate": 0.0001699416278612186, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023317711344000868, + "loss": 0.021, "step": 171860 }, { - "epoch": 0.87, - "learning_rate": 0.00016993406016820457, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023317322522363725, + "loss": 0.0171, "step": 171870 }, { - "epoch": 0.87, - "learning_rate": 0.00016992649247519055, - "loss": 0.009, + "epoch": 0.45, + "learning_rate": 0.00023316933700726577, + "loss": 0.0175, "step": 171880 }, { - "epoch": 0.87, - "learning_rate": 0.00016991892478217656, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.00023316544879089428, + "loss": 0.0202, "step": 171890 }, { - "epoch": 0.87, - "learning_rate": 0.00016991135708916254, - "loss": 0.009, + "epoch": 0.45, + "learning_rate": 0.00023316156057452282, + "loss": 0.0198, "step": 171900 }, { - "epoch": 0.87, - "learning_rate": 0.00016990378939614852, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.0002331576723581514, + "loss": 0.0214, "step": 171910 }, { - "epoch": 0.87, - "learning_rate": 0.0001698962217031345, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.0002331537841417799, + "loss": 0.0177, "step": 171920 }, { - "epoch": 0.87, - "learning_rate": 0.0001698886540101205, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023314989592540845, + "loss": 0.0156, "step": 171930 }, { - "epoch": 0.87, - "learning_rate": 0.0001698810863171065, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.00023314600770903696, + "loss": 0.0187, "step": 171940 }, { - "epoch": 0.87, - "learning_rate": 0.00016987351862409247, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.0002331421194926655, + "loss": 0.0184, "step": 171950 }, { - "epoch": 0.87, - "learning_rate": 0.00016986595093107848, - "loss": 0.0097, + "epoch": 0.45, + "learning_rate": 0.00023313823127629404, + "loss": 0.0213, "step": 171960 }, { - "epoch": 0.87, - "learning_rate": 0.00016985838323806446, - "loss": 0.016, + "epoch": 0.45, + "learning_rate": 0.00023313434305992259, + "loss": 0.0183, "step": 171970 }, { - "epoch": 0.87, - "learning_rate": 0.00016985081554505045, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.0002331304548435511, + "loss": 0.0243, "step": 171980 }, { - "epoch": 0.87, - "learning_rate": 0.00016984324785203645, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023312656662717964, + "loss": 0.0199, "step": 171990 }, { - "epoch": 0.87, - "learning_rate": 0.00016983568015902244, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.00023312267841080818, + "loss": 0.0185, "step": 172000 }, { - "epoch": 0.87, - "eval_cer": 0.9145003381830497, - "eval_loss": 0.00847652181982994, - "eval_runtime": 116.6974, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.285, + "epoch": 0.45, + "eval_cer": 0.881782465628416, + "eval_loss": 0.012556556612253189, + "eval_runtime": 107.2056, + "eval_samples_per_second": 18.656, + "eval_steps_per_second": 4.664, "step": 172000 }, { - "epoch": 0.87, - "learning_rate": 0.00016982811246600842, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023311879019443673, + "loss": 0.0217, "step": 172010 }, { - "epoch": 0.87, - "learning_rate": 0.00016982054477299443, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023311490197806524, + "loss": 0.0176, "step": 172020 }, { - "epoch": 0.87, - "learning_rate": 0.0001698129770799804, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023311101376169378, + "loss": 0.0182, "step": 172030 }, { - "epoch": 0.87, - "learning_rate": 0.0001698054093869664, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023310712554532235, + "loss": 0.0225, "step": 172040 }, { - "epoch": 0.87, - "learning_rate": 0.0001697978416939524, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.00023310323732895087, + "loss": 0.0164, "step": 172050 }, { - "epoch": 0.87, - "learning_rate": 0.00016979027400093838, - "loss": 0.0138, + "epoch": 0.45, + "learning_rate": 0.00023309934911257938, + "loss": 0.0172, "step": 172060 }, { - "epoch": 0.87, - "learning_rate": 0.00016978270630792436, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.00023309546089620792, + "loss": 0.0199, "step": 172070 }, { - "epoch": 0.87, - "learning_rate": 0.00016977513861491037, - "loss": 0.0152, + "epoch": 0.45, + "learning_rate": 0.0002330915726798365, + "loss": 0.021, "step": 172080 }, { - "epoch": 0.87, - "learning_rate": 0.00016976757092189635, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.000233087684463465, + "loss": 0.0174, "step": 172090 }, { - "epoch": 0.87, - "learning_rate": 0.00016976000322888233, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023308379624709355, + "loss": 0.0191, "step": 172100 }, { - "epoch": 0.87, - "learning_rate": 0.0001697524355358683, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023307990803072206, + "loss": 0.0152, "step": 172110 }, { - "epoch": 0.87, - "learning_rate": 0.00016974486784285432, - "loss": 0.0077, + "epoch": 0.45, + "learning_rate": 0.00023307601981435063, + "loss": 0.0177, "step": 172120 }, { - "epoch": 0.87, - "learning_rate": 0.0001697373001498403, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.00023307213159797914, + "loss": 0.0183, "step": 172130 }, { - "epoch": 0.87, - "learning_rate": 0.00016972973245682628, - "loss": 0.0153, + "epoch": 0.45, + "learning_rate": 0.00023306824338160769, + "loss": 0.0203, "step": 172140 }, { - "epoch": 0.87, - "learning_rate": 0.0001697221647638123, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.0002330643551652362, + "loss": 0.0175, "step": 172150 }, { - "epoch": 0.87, - "learning_rate": 0.00016971459707079827, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023306046694886477, + "loss": 0.0183, "step": 172160 }, { - "epoch": 0.87, - "learning_rate": 0.00016970702937778426, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.00023305657873249328, + "loss": 0.0215, "step": 172170 }, { - "epoch": 0.87, - "learning_rate": 0.00016969946168477026, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023305269051612183, + "loss": 0.0185, "step": 172180 }, { - "epoch": 0.87, - "learning_rate": 0.00016969189399175625, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023304880229975034, + "loss": 0.0155, "step": 172190 }, { - "epoch": 0.87, - "learning_rate": 0.00016968432629874223, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023304491408337888, + "loss": 0.0203, "step": 172200 }, { - "epoch": 0.87, - "learning_rate": 0.00016967675860572824, - "loss": 0.0098, + "epoch": 0.45, + "learning_rate": 0.00023304102586700742, + "loss": 0.0216, "step": 172210 }, { - "epoch": 0.87, - "learning_rate": 0.00016966919091271422, - "loss": 0.0096, + "epoch": 0.45, + "learning_rate": 0.00023303713765063596, + "loss": 0.0205, "step": 172220 }, { - "epoch": 0.87, - "learning_rate": 0.0001696616232197002, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023303324943426448, + "loss": 0.0165, "step": 172230 }, { - "epoch": 0.87, - "learning_rate": 0.0001696540555266862, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023302936121789302, + "loss": 0.0181, "step": 172240 }, { - "epoch": 0.87, - "learning_rate": 0.0001696464878336722, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.0002330254730015216, + "loss": 0.0171, "step": 172250 }, { - "epoch": 0.87, - "learning_rate": 0.00016963892014065817, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.0002330215847851501, + "loss": 0.0163, "step": 172260 }, { - "epoch": 0.87, - "learning_rate": 0.00016963135244764415, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023301769656877865, + "loss": 0.0189, "step": 172270 }, { - "epoch": 0.87, - "learning_rate": 0.00016962378475463016, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023301380835240716, + "loss": 0.019, "step": 172280 }, { - "epoch": 0.87, - "learning_rate": 0.00016961621706161614, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023300992013603573, + "loss": 0.0148, "step": 172290 }, { - "epoch": 0.87, - "learning_rate": 0.00016960864936860212, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023300603191966424, + "loss": 0.0196, "step": 172300 }, { - "epoch": 0.87, - "learning_rate": 0.00016960108167558813, - "loss": 0.0157, + "epoch": 0.45, + "learning_rate": 0.00023300214370329279, + "loss": 0.0196, "step": 172310 }, { - "epoch": 0.87, - "learning_rate": 0.0001695935139825741, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.0002329982554869213, + "loss": 0.0189, "step": 172320 }, { - "epoch": 0.87, - "learning_rate": 0.0001695859462895601, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023299436727054987, + "loss": 0.0174, "step": 172330 }, { - "epoch": 0.87, - "learning_rate": 0.0001695783785965461, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023299047905417838, + "loss": 0.0191, "step": 172340 }, { - "epoch": 0.87, - "learning_rate": 0.00016957081090353208, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023298659083780692, + "loss": 0.0222, "step": 172350 }, { - "epoch": 0.87, - "learning_rate": 0.00016956324321051807, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023298270262143544, + "loss": 0.0213, "step": 172360 }, { - "epoch": 0.87, - "learning_rate": 0.00016955567551750407, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.000232978814405064, + "loss": 0.0175, "step": 172370 }, { - "epoch": 0.87, - "learning_rate": 0.00016954810782449006, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023297492618869252, + "loss": 0.0186, "step": 172380 }, { - "epoch": 0.87, - "learning_rate": 0.00016954054013147604, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023297103797232106, + "loss": 0.0182, "step": 172390 }, { - "epoch": 0.87, - "learning_rate": 0.00016953297243846205, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023296714975594958, + "loss": 0.0208, "step": 172400 }, { - "epoch": 0.87, - "learning_rate": 0.00016952540474544803, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023296326153957815, + "loss": 0.02, "step": 172410 }, { - "epoch": 0.87, - "learning_rate": 0.000169517837052434, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.0002329593733232067, + "loss": 0.0149, "step": 172420 }, { - "epoch": 0.87, - "learning_rate": 0.00016951026935942, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.0002329554851068352, + "loss": 0.0174, "step": 172430 }, { - "epoch": 0.87, - "learning_rate": 0.000169502701666406, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023295159689046374, + "loss": 0.0218, "step": 172440 }, { - "epoch": 0.87, - "learning_rate": 0.00016949513397339198, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023294770867409226, + "loss": 0.0181, "step": 172450 }, { - "epoch": 0.87, - "learning_rate": 0.00016948756628037796, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023294382045772083, + "loss": 0.0166, "step": 172460 }, { - "epoch": 0.87, - "learning_rate": 0.00016947999858736397, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023293993224134934, + "loss": 0.0174, "step": 172470 }, { - "epoch": 0.87, - "learning_rate": 0.00016947243089434995, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023293604402497788, + "loss": 0.0167, "step": 172480 }, { - "epoch": 0.87, - "learning_rate": 0.00016946486320133593, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.0002329321558086064, + "loss": 0.0162, "step": 172490 }, { - "epoch": 0.87, - "learning_rate": 0.00016945729550832194, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023292826759223497, + "loss": 0.0159, "step": 172500 }, { - "epoch": 0.87, - "learning_rate": 0.00016944972781530792, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023292437937586348, + "loss": 0.0159, "step": 172510 }, { - "epoch": 0.87, - "learning_rate": 0.0001694421601222939, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023292049115949202, + "loss": 0.0188, "step": 172520 }, { - "epoch": 0.87, - "learning_rate": 0.0001694345924292799, - "loss": 0.0178, + "epoch": 0.45, + "learning_rate": 0.00023291660294312054, + "loss": 0.0213, "step": 172530 }, { - "epoch": 0.87, - "learning_rate": 0.0001694270247362659, - "loss": 0.0161, + "epoch": 0.45, + "learning_rate": 0.0002329127147267491, + "loss": 0.018, "step": 172540 }, { - "epoch": 0.87, - "learning_rate": 0.00016941945704325188, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023290882651037762, + "loss": 0.0167, "step": 172550 }, { - "epoch": 0.87, - "learning_rate": 0.00016941188935023788, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023290493829400616, + "loss": 0.0201, "step": 172560 }, { - "epoch": 0.87, - "learning_rate": 0.00016940432165722387, - "loss": 0.0096, + "epoch": 0.45, + "learning_rate": 0.00023290105007763468, + "loss": 0.0186, "step": 172570 }, { - "epoch": 0.87, - "learning_rate": 0.00016939675396420985, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023289716186126325, + "loss": 0.0165, "step": 172580 }, { - "epoch": 0.87, - "learning_rate": 0.00016938918627119583, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.0002328932736448918, + "loss": 0.021, "step": 172590 }, { - "epoch": 0.87, - "learning_rate": 0.00016938161857818184, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002328893854285203, + "loss": 0.0157, "step": 172600 }, { - "epoch": 0.87, - "learning_rate": 0.00016937405088516782, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023288549721214882, + "loss": 0.0164, "step": 172610 }, { - "epoch": 0.87, - "learning_rate": 0.0001693664831921538, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023288160899577739, + "loss": 0.0198, "step": 172620 }, { - "epoch": 0.87, - "learning_rate": 0.0001693589154991398, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023287772077940593, + "loss": 0.0312, "step": 172630 }, { - "epoch": 0.87, - "learning_rate": 0.0001693513478061258, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023287383256303444, + "loss": 0.017, "step": 172640 }, { - "epoch": 0.87, - "learning_rate": 0.00016934378011311177, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023286994434666298, + "loss": 0.0199, "step": 172650 }, { - "epoch": 0.87, - "learning_rate": 0.00016933621242009778, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023286605613029153, + "loss": 0.0209, "step": 172660 }, { - "epoch": 0.87, - "learning_rate": 0.00016932864472708376, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023286216791392007, + "loss": 0.0205, "step": 172670 }, { - "epoch": 0.87, - "learning_rate": 0.00016932107703406974, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023285827969754858, + "loss": 0.0233, "step": 172680 }, { - "epoch": 0.87, - "learning_rate": 0.00016931350934105575, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023285439148117712, + "loss": 0.0148, "step": 172690 }, { - "epoch": 0.87, - "learning_rate": 0.00016930594164804173, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023285050326480564, + "loss": 0.02, "step": 172700 }, { - "epoch": 0.87, - "learning_rate": 0.00016929837395502771, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.0002328466150484342, + "loss": 0.019, "step": 172710 }, { - "epoch": 0.87, - "learning_rate": 0.00016929080626201372, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023284272683206272, + "loss": 0.0178, "step": 172720 }, { - "epoch": 0.87, - "learning_rate": 0.0001692832385689997, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023283883861569126, + "loss": 0.0187, "step": 172730 }, { - "epoch": 0.87, - "learning_rate": 0.00016927567087598569, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.00023283495039931978, + "loss": 0.017, "step": 172740 }, { - "epoch": 0.87, - "learning_rate": 0.0001692681031829717, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023283106218294835, + "loss": 0.0281, "step": 172750 }, { - "epoch": 0.87, - "learning_rate": 0.00016926053548995768, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.0002328271739665769, + "loss": 0.0165, "step": 172760 }, { - "epoch": 0.87, - "learning_rate": 0.00016925296779694366, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.0002328232857502054, + "loss": 0.0168, "step": 172770 }, { - "epoch": 0.87, - "learning_rate": 0.00016924540010392964, - "loss": 0.0091, + "epoch": 0.45, + "learning_rate": 0.00023281939753383392, + "loss": 0.0176, "step": 172780 }, { - "epoch": 0.87, - "learning_rate": 0.00016923783241091565, - "loss": 0.0085, + "epoch": 0.45, + "learning_rate": 0.00023281550931746249, + "loss": 0.0187, "step": 172790 }, { - "epoch": 0.87, - "learning_rate": 0.00016923026471790163, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023281162110109103, + "loss": 0.0162, "step": 172800 }, { - "epoch": 0.87, - "learning_rate": 0.0001692226970248876, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023280773288471954, + "loss": 0.018, "step": 172810 }, { - "epoch": 0.87, - "learning_rate": 0.00016921512933187362, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023280384466834808, + "loss": 0.0198, "step": 172820 }, { - "epoch": 0.87, - "learning_rate": 0.00016920756163885957, - "loss": 0.0095, + "epoch": 0.45, + "learning_rate": 0.00023279995645197662, + "loss": 0.0167, "step": 172830 }, { - "epoch": 0.87, - "learning_rate": 0.00016919999394584555, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023279606823560517, + "loss": 0.0204, "step": 172840 }, { - "epoch": 0.87, - "learning_rate": 0.00016919242625283154, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023279218001923368, + "loss": 0.0231, "step": 172850 }, { - "epoch": 0.87, - "learning_rate": 0.00016918485855981754, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.00023278829180286222, + "loss": 0.0175, "step": 172860 }, { - "epoch": 0.87, - "learning_rate": 0.00016917729086680353, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023278440358649076, + "loss": 0.0185, "step": 172870 }, { - "epoch": 0.87, - "learning_rate": 0.0001691697231737895, - "loss": 0.0164, + "epoch": 0.45, + "learning_rate": 0.0002327805153701193, + "loss": 0.0189, "step": 172880 }, { - "epoch": 0.87, - "learning_rate": 0.00016916215548077552, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023277662715374782, + "loss": 0.0204, "step": 172890 }, { - "epoch": 0.87, - "learning_rate": 0.0001691545877877615, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023277273893737636, + "loss": 0.0194, "step": 172900 }, { - "epoch": 0.87, - "learning_rate": 0.00016914702009474748, - "loss": 0.014, + "epoch": 0.45, + "learning_rate": 0.00023276885072100493, + "loss": 0.0232, "step": 172910 }, { - "epoch": 0.87, - "learning_rate": 0.0001691394524017335, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023276496250463345, + "loss": 0.0182, "step": 172920 }, { - "epoch": 0.87, - "learning_rate": 0.00016913188470871947, - "loss": 0.0157, + "epoch": 0.45, + "learning_rate": 0.00023276107428826196, + "loss": 0.0191, "step": 172930 }, { - "epoch": 0.87, - "learning_rate": 0.00016912431701570545, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002327571860718905, + "loss": 0.019, "step": 172940 }, { - "epoch": 0.87, - "learning_rate": 0.00016911674932269146, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023275329785551902, + "loss": 0.0198, "step": 172950 }, { - "epoch": 0.87, - "learning_rate": 0.00016910918162967744, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023274940963914758, + "loss": 0.0182, "step": 172960 }, { - "epoch": 0.87, - "learning_rate": 0.00016910161393666342, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023274552142277613, + "loss": 0.0166, "step": 172970 }, { - "epoch": 0.87, - "learning_rate": 0.00016909404624364943, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023274163320640464, + "loss": 0.019, "step": 172980 }, { - "epoch": 0.87, - "learning_rate": 0.0001690864785506354, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023273774499003318, + "loss": 0.0215, "step": 172990 }, { - "epoch": 0.87, - "learning_rate": 0.0001690789108576214, - "loss": 0.0146, + "epoch": 0.45, + "learning_rate": 0.00023273385677366172, + "loss": 0.0188, "step": 173000 }, { - "epoch": 0.87, - "eval_cer": 0.9145003381830497, - "eval_loss": 0.008254943415522575, - "eval_runtime": 116.8302, - "eval_samples_per_second": 17.119, - "eval_steps_per_second": 4.28, + "epoch": 0.45, + "eval_cer": 0.8818034601824287, + "eval_loss": 0.012683995999395847, + "eval_runtime": 108.0649, + "eval_samples_per_second": 18.507, + "eval_steps_per_second": 4.627, "step": 173000 }, { - "epoch": 0.87, - "learning_rate": 0.00016907134316460737, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023272996855729027, + "loss": 0.0206, "step": 173010 }, { - "epoch": 0.87, - "learning_rate": 0.00016906377547159338, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023272608034091878, + "loss": 0.0142, "step": 173020 }, { - "epoch": 0.87, - "learning_rate": 0.00016905620777857936, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023272219212454732, + "loss": 0.0215, "step": 173030 }, { - "epoch": 0.87, - "learning_rate": 0.00016904864008556535, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023271830390817586, + "loss": 0.0168, "step": 173040 }, { - "epoch": 0.87, - "learning_rate": 0.00016904107239255135, - "loss": 0.0095, + "epoch": 0.45, + "learning_rate": 0.0002327144156918044, + "loss": 0.0201, "step": 173050 }, { - "epoch": 0.87, - "learning_rate": 0.00016903350469953734, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023271052747543292, + "loss": 0.019, "step": 173060 }, { - "epoch": 0.87, - "learning_rate": 0.00016902593700652332, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023270663925906146, + "loss": 0.0171, "step": 173070 }, { - "epoch": 0.87, - "learning_rate": 0.00016901836931350933, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023270275104269, + "loss": 0.0198, "step": 173080 }, { - "epoch": 0.87, - "learning_rate": 0.0001690108016204953, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023269886282631854, + "loss": 0.018, "step": 173090 }, { - "epoch": 0.87, - "learning_rate": 0.0001690032339274813, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023269497460994706, + "loss": 0.0503, "step": 173100 }, { - "epoch": 0.87, - "learning_rate": 0.0001689956662344673, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.0002326910863935756, + "loss": 0.0203, "step": 173110 }, { - "epoch": 0.87, - "learning_rate": 0.00016898809854145328, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023268719817720417, + "loss": 0.0205, "step": 173120 }, { - "epoch": 0.87, - "learning_rate": 0.00016898053084843926, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023268330996083268, + "loss": 0.0172, "step": 173130 }, { - "epoch": 0.87, - "learning_rate": 0.00016897296315542527, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023267942174446123, + "loss": 0.0181, "step": 173140 }, { - "epoch": 0.87, - "learning_rate": 0.00016896539546241125, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023267553352808974, + "loss": 0.0167, "step": 173150 }, { - "epoch": 0.87, - "learning_rate": 0.00016895782776939723, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.0002326716453117183, + "loss": 0.0181, "step": 173160 }, { - "epoch": 0.87, - "learning_rate": 0.0001689502600763832, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023266775709534682, + "loss": 0.0169, "step": 173170 }, { - "epoch": 0.87, - "learning_rate": 0.00016894269238336922, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023266386887897537, + "loss": 0.019, "step": 173180 }, { - "epoch": 0.87, - "learning_rate": 0.0001689351246903552, - "loss": 0.0149, + "epoch": 0.45, + "learning_rate": 0.00023265998066260388, + "loss": 0.0198, "step": 173190 }, { - "epoch": 0.87, - "learning_rate": 0.00016892755699734118, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023265609244623242, + "loss": 0.0179, "step": 173200 }, { - "epoch": 0.87, - "learning_rate": 0.0001689199893043272, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023265220422986096, + "loss": 0.0185, "step": 173210 }, { - "epoch": 0.87, - "learning_rate": 0.00016891242161131317, - "loss": 0.0092, + "epoch": 0.45, + "learning_rate": 0.0002326483160134895, + "loss": 0.0216, "step": 173220 }, { - "epoch": 0.87, - "learning_rate": 0.00016890485391829916, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023264442779711802, + "loss": 0.0185, "step": 173230 }, { - "epoch": 0.87, - "learning_rate": 0.00016889728622528516, - "loss": 0.0091, + "epoch": 0.45, + "learning_rate": 0.00023264053958074656, + "loss": 0.0161, "step": 173240 }, { - "epoch": 0.87, - "learning_rate": 0.00016888971853227115, - "loss": 0.0133, + "epoch": 0.45, + "learning_rate": 0.0002326366513643751, + "loss": 0.0188, "step": 173250 }, { - "epoch": 0.87, - "learning_rate": 0.00016888215083925713, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023263276314800364, + "loss": 0.0205, "step": 173260 }, { - "epoch": 0.87, - "learning_rate": 0.00016887458314624314, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023262887493163216, + "loss": 0.0172, "step": 173270 }, { - "epoch": 0.87, - "learning_rate": 0.00016886701545322912, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002326249867152607, + "loss": 0.014, "step": 173280 }, { - "epoch": 0.87, - "learning_rate": 0.0001688594477602151, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023262109849888927, + "loss": 0.0181, "step": 173290 }, { - "epoch": 0.87, - "learning_rate": 0.0001688518800672011, - "loss": 0.0155, + "epoch": 0.45, + "learning_rate": 0.00023261721028251778, + "loss": 0.0177, "step": 173300 }, { - "epoch": 0.87, - "learning_rate": 0.0001688443123741871, - "loss": 0.0156, + "epoch": 0.45, + "learning_rate": 0.00023261332206614633, + "loss": 0.0165, "step": 173310 }, { - "epoch": 0.87, - "learning_rate": 0.00016883674468117307, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023260943384977484, + "loss": 0.0182, "step": 173320 }, { - "epoch": 0.87, - "learning_rate": 0.00016882917698815905, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.0002326055456334034, + "loss": 0.0162, "step": 173330 }, { - "epoch": 0.87, - "learning_rate": 0.00016882160929514506, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.00023260165741703192, + "loss": 0.0194, "step": 173340 }, { - "epoch": 0.87, - "learning_rate": 0.00016881404160213104, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023259776920066046, + "loss": 0.0171, "step": 173350 }, { - "epoch": 0.87, - "learning_rate": 0.00016880647390911702, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023259388098428898, + "loss": 0.0191, "step": 173360 }, { - "epoch": 0.87, - "learning_rate": 0.00016879890621610303, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023258999276791755, + "loss": 0.0188, "step": 173370 }, { - "epoch": 0.87, - "learning_rate": 0.000168791338523089, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023258610455154606, + "loss": 0.0165, "step": 173380 }, { - "epoch": 0.87, - "learning_rate": 0.000168783770830075, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002325822163351746, + "loss": 0.0176, "step": 173390 }, { - "epoch": 0.87, - "learning_rate": 0.000168776203137061, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.00023257832811880312, + "loss": 0.0171, "step": 173400 }, { - "epoch": 0.87, - "learning_rate": 0.00016876863544404698, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002325744399024317, + "loss": 0.0211, "step": 173410 }, { - "epoch": 0.87, - "learning_rate": 0.00016876106775103297, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.0002325705516860602, + "loss": 0.0199, "step": 173420 }, { - "epoch": 0.87, - "learning_rate": 0.00016875350005801897, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023256666346968874, + "loss": 0.0156, "step": 173430 }, { - "epoch": 0.88, - "learning_rate": 0.00016874593236500496, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023256277525331726, + "loss": 0.0203, "step": 173440 }, { - "epoch": 0.88, - "learning_rate": 0.00016873836467199094, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.0002325588870369458, + "loss": 0.0208, "step": 173450 }, { - "epoch": 0.88, - "learning_rate": 0.00016873079697897695, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.00023255499882057437, + "loss": 0.0227, "step": 173460 }, { - "epoch": 0.88, - "learning_rate": 0.00016872322928596293, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023255111060420288, + "loss": 0.0188, "step": 173470 }, { - "epoch": 0.88, - "learning_rate": 0.0001687156615929489, + "epoch": 0.45, + "learning_rate": 0.0002325472223878314, "loss": 0.0134, "step": 173480 }, { - "epoch": 0.88, - "learning_rate": 0.0001687080938999349, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023254333417145994, + "loss": 0.016, "step": 173490 }, { - "epoch": 0.88, - "learning_rate": 0.0001687005262069209, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.0002325394459550885, + "loss": 0.016, "step": 173500 }, { - "epoch": 0.88, - "learning_rate": 0.00016869295851390688, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023253555773871702, + "loss": 0.0186, "step": 173510 }, { - "epoch": 0.88, - "learning_rate": 0.00016868539082089286, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.00023253166952234556, + "loss": 0.0208, "step": 173520 }, { - "epoch": 0.88, - "learning_rate": 0.00016867782312787887, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023252778130597408, + "loss": 0.0171, "step": 173530 }, { - "epoch": 0.88, - "learning_rate": 0.00016867025543486485, - "loss": 0.0152, + "epoch": 0.45, + "learning_rate": 0.00023252389308960265, + "loss": 0.0172, "step": 173540 }, { - "epoch": 0.88, - "learning_rate": 0.00016866268774185083, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023252000487323116, + "loss": 0.0198, "step": 173550 }, { - "epoch": 0.88, - "learning_rate": 0.00016865512004883684, - "loss": 0.0091, + "epoch": 0.45, + "learning_rate": 0.0002325161166568597, + "loss": 0.0193, "step": 173560 }, { - "epoch": 0.88, - "learning_rate": 0.00016864755235582282, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023251222844048822, + "loss": 0.0227, "step": 173570 }, { - "epoch": 0.88, - "learning_rate": 0.0001686399846628088, - "loss": 0.0158, + "epoch": 0.45, + "learning_rate": 0.0002325083402241168, + "loss": 0.017, "step": 173580 }, { - "epoch": 0.88, - "learning_rate": 0.0001686324169697948, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.0002325044520077453, + "loss": 0.0239, "step": 173590 }, { - "epoch": 0.88, - "learning_rate": 0.0001686248492767808, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023250056379137384, + "loss": 0.0177, "step": 173600 }, { - "epoch": 0.88, - "learning_rate": 0.00016861728158376678, - "loss": 0.0092, + "epoch": 0.45, + "learning_rate": 0.00023249667557500236, + "loss": 0.0245, "step": 173610 }, { - "epoch": 0.88, - "learning_rate": 0.00016860971389075278, - "loss": 0.0101, + "epoch": 0.45, + "learning_rate": 0.00023249278735863093, + "loss": 0.0166, "step": 173620 }, { - "epoch": 0.88, - "learning_rate": 0.00016860214619773877, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023248889914225947, + "loss": 0.0201, "step": 173630 }, { - "epoch": 0.88, - "learning_rate": 0.00016859457850472475, - "loss": 0.0092, + "epoch": 0.45, + "learning_rate": 0.00023248501092588798, + "loss": 0.0167, "step": 173640 }, { - "epoch": 0.88, - "learning_rate": 0.00016858701081171076, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.0002324811227095165, + "loss": 0.016, "step": 173650 }, { - "epoch": 0.88, - "learning_rate": 0.00016857944311869674, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023247723449314507, + "loss": 0.0185, "step": 173660 }, { - "epoch": 0.88, - "learning_rate": 0.00016857187542568272, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.0002324733462767736, + "loss": 0.018, "step": 173670 }, { - "epoch": 0.88, - "learning_rate": 0.0001685643077326687, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023246945806040212, + "loss": 0.018, "step": 173680 }, { - "epoch": 0.88, - "learning_rate": 0.0001685567400396547, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023246556984403066, + "loss": 0.0172, "step": 173690 }, { - "epoch": 0.88, - "learning_rate": 0.0001685491723466407, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023246168162765918, + "loss": 0.0192, "step": 173700 }, { - "epoch": 0.88, - "learning_rate": 0.00016854160465362667, - "loss": 0.0143, + "epoch": 0.45, + "learning_rate": 0.00023245779341128775, + "loss": 0.022, "step": 173710 }, { - "epoch": 0.88, - "learning_rate": 0.00016853403696061268, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023245390519491626, + "loss": 0.0183, "step": 173720 }, { - "epoch": 0.88, - "learning_rate": 0.00016852646926759866, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.0002324500169785448, + "loss": 0.0176, "step": 173730 }, { - "epoch": 0.88, - "learning_rate": 0.00016851890157458464, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023244612876217332, + "loss": 0.0163, "step": 173740 }, { - "epoch": 0.88, - "learning_rate": 0.00016851133388157065, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023244224054580189, + "loss": 0.0171, "step": 173750 }, { - "epoch": 0.88, - "learning_rate": 0.00016850376618855663, - "loss": 0.0101, + "epoch": 0.45, + "learning_rate": 0.0002324383523294304, + "loss": 0.0154, "step": 173760 }, { - "epoch": 0.88, - "learning_rate": 0.00016849619849554261, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023243446411305894, + "loss": 0.0194, "step": 173770 }, { - "epoch": 0.88, - "learning_rate": 0.00016848863080252862, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023243057589668746, + "loss": 0.0172, "step": 173780 }, { - "epoch": 0.88, - "learning_rate": 0.0001684810631095146, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023242668768031603, + "loss": 0.0186, "step": 173790 }, { - "epoch": 0.88, - "learning_rate": 0.00016847349541650059, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023242279946394454, + "loss": 0.017, "step": 173800 }, { - "epoch": 0.88, - "learning_rate": 0.0001684659277234866, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023241891124757308, + "loss": 0.0189, "step": 173810 }, { - "epoch": 0.88, - "learning_rate": 0.00016845836003047258, - "loss": 0.0084, + "epoch": 0.45, + "learning_rate": 0.0002324150230312016, + "loss": 0.0149, "step": 173820 }, { - "epoch": 0.88, - "learning_rate": 0.00016845079233745856, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023241113481483017, + "loss": 0.0181, "step": 173830 }, { - "epoch": 0.88, - "learning_rate": 0.00016844322464444454, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.0002324072465984587, + "loss": 0.0245, "step": 173840 }, { - "epoch": 0.88, - "learning_rate": 0.00016843565695143055, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023240335838208722, + "loss": 0.0163, "step": 173850 }, { - "epoch": 0.88, - "learning_rate": 0.00016842808925841653, - "loss": 0.0147, + "epoch": 0.45, + "learning_rate": 0.00023239947016571576, + "loss": 0.0176, "step": 173860 }, { - "epoch": 0.88, - "learning_rate": 0.0001684205215654025, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.0002323955819493443, + "loss": 0.0196, "step": 173870 }, { - "epoch": 0.88, - "learning_rate": 0.00016841295387238852, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023239169373297285, + "loss": 0.0186, "step": 173880 }, { - "epoch": 0.88, - "learning_rate": 0.0001684053861793745, - "loss": 0.0166, + "epoch": 0.45, + "learning_rate": 0.00023238780551660136, + "loss": 0.0161, "step": 173890 }, { - "epoch": 0.88, - "learning_rate": 0.00016839781848636048, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.0002323839173002299, + "loss": 0.0188, "step": 173900 }, { - "epoch": 0.88, - "learning_rate": 0.0001683902507933465, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.00023238002908385844, + "loss": 0.0216, "step": 173910 }, { - "epoch": 0.88, - "learning_rate": 0.00016838268310033247, - "loss": 0.0101, + "epoch": 0.45, + "learning_rate": 0.00023237614086748699, + "loss": 0.0148, "step": 173920 }, { - "epoch": 0.88, - "learning_rate": 0.00016837511540731845, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.0002323722526511155, + "loss": 0.019, "step": 173930 }, { - "epoch": 0.88, - "learning_rate": 0.00016836754771430446, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023236836443474404, + "loss": 0.021, "step": 173940 }, { - "epoch": 0.88, - "learning_rate": 0.00016835998002129044, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023236447621837256, + "loss": 0.0169, "step": 173950 }, { - "epoch": 0.88, - "learning_rate": 0.00016835241232827643, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023236058800200113, + "loss": 0.0119, "step": 173960 }, { - "epoch": 0.88, - "learning_rate": 0.00016834484463526243, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023235669978562964, + "loss": 0.0181, "step": 173970 }, { - "epoch": 0.88, - "learning_rate": 0.00016833727694224842, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023235281156925818, + "loss": 0.0174, "step": 173980 }, { - "epoch": 0.88, - "learning_rate": 0.0001683297092492344, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.0002323489233528867, + "loss": 0.0195, "step": 173990 }, { - "epoch": 0.88, - "learning_rate": 0.00016832214155622038, - "loss": 0.0158, + "epoch": 0.45, + "learning_rate": 0.00023234503513651526, + "loss": 0.0179, "step": 174000 }, { - "epoch": 0.88, - "eval_cer": 0.9144935454101719, - "eval_loss": 0.008368046954274178, - "eval_runtime": 116.7718, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.45, + "eval_cer": 0.8817922630869552, + "eval_loss": 0.012246196158230305, + "eval_runtime": 108.0303, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, "step": 174000 }, { - "epoch": 0.88, - "learning_rate": 0.0001683145738632064, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.0002323411469201438, + "loss": 0.0174, "step": 174010 }, { - "epoch": 0.88, - "learning_rate": 0.00016830700617019237, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023233725870377232, + "loss": 0.0171, "step": 174020 }, { - "epoch": 0.88, - "learning_rate": 0.00016829943847717835, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023233337048740086, + "loss": 0.016, "step": 174030 }, { - "epoch": 0.88, - "learning_rate": 0.00016829187078416436, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.0002323294822710294, + "loss": 0.0179, "step": 174040 }, { - "epoch": 0.88, - "learning_rate": 0.00016828430309115034, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023232559405465795, + "loss": 0.0215, "step": 174050 }, { - "epoch": 0.88, - "learning_rate": 0.00016827673539813632, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023232170583828646, + "loss": 0.0227, "step": 174060 }, { - "epoch": 0.88, - "learning_rate": 0.00016826916770512233, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.000232317817621915, + "loss": 0.0187, "step": 174070 }, { - "epoch": 0.88, - "learning_rate": 0.00016826160001210828, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023231392940554354, + "loss": 0.0179, "step": 174080 }, { - "epoch": 0.88, - "learning_rate": 0.00016825403231909427, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023231004118917209, + "loss": 0.0169, "step": 174090 }, { - "epoch": 0.88, - "learning_rate": 0.00016824646462608025, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.0002323061529728006, + "loss": 0.0211, "step": 174100 }, { - "epoch": 0.88, - "learning_rate": 0.00016823889693306626, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023230226475642914, + "loss": 0.0183, "step": 174110 }, { - "epoch": 0.88, - "learning_rate": 0.00016823132924005224, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023229837654005768, + "loss": 0.0167, "step": 174120 }, { - "epoch": 0.88, - "learning_rate": 0.00016822376154703822, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023229448832368622, + "loss": 0.0233, "step": 174130 }, { - "epoch": 0.88, - "learning_rate": 0.00016821619385402423, - "loss": 0.0132, + "epoch": 0.45, + "learning_rate": 0.00023229060010731474, + "loss": 0.0187, "step": 174140 }, { - "epoch": 0.88, - "learning_rate": 0.0001682086261610102, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023228671189094328, + "loss": 0.0199, "step": 174150 }, { - "epoch": 0.88, - "learning_rate": 0.0001682010584679962, - "loss": 0.016, + "epoch": 0.45, + "learning_rate": 0.00023228282367457185, + "loss": 0.0201, "step": 174160 }, { - "epoch": 0.88, - "learning_rate": 0.0001681934907749822, - "loss": 0.0159, + "epoch": 0.45, + "learning_rate": 0.00023227893545820036, + "loss": 0.0183, "step": 174170 }, { - "epoch": 0.88, - "learning_rate": 0.00016818592308196818, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.0002322750472418289, + "loss": 0.0211, "step": 174180 }, { - "epoch": 0.88, - "learning_rate": 0.00016817835538895416, - "loss": 0.0096, + "epoch": 0.45, + "learning_rate": 0.00023227115902545742, + "loss": 0.0209, "step": 174190 }, { - "epoch": 0.88, - "learning_rate": 0.00016817078769594017, - "loss": 0.0148, + "epoch": 0.45, + "learning_rate": 0.00023226727080908593, + "loss": 0.0183, "step": 174200 }, { - "epoch": 0.88, - "learning_rate": 0.00016816322000292615, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.0002322633825927145, + "loss": 0.016, "step": 174210 }, { - "epoch": 0.88, - "learning_rate": 0.00016815565230991213, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023225949437634305, + "loss": 0.0218, "step": 174220 }, { - "epoch": 0.88, - "learning_rate": 0.00016814808461689811, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023225560615997156, + "loss": 0.0185, "step": 174230 }, { - "epoch": 0.88, - "learning_rate": 0.00016814051692388412, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.0002322517179436001, + "loss": 0.02, "step": 174240 }, { - "epoch": 0.88, - "learning_rate": 0.0001681329492308701, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023224782972722864, + "loss": 0.0144, "step": 174250 }, { - "epoch": 0.88, - "learning_rate": 0.00016812538153785609, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023224394151085718, + "loss": 0.0167, "step": 174260 }, { - "epoch": 0.88, - "learning_rate": 0.0001681178138448421, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.0002322400532944857, + "loss": 0.0176, "step": 174270 }, { - "epoch": 0.88, - "learning_rate": 0.00016811024615182808, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023223616507811424, + "loss": 0.0179, "step": 174280 }, { - "epoch": 0.88, - "learning_rate": 0.00016810267845881406, - "loss": 0.0113, + "epoch": 0.45, + "learning_rate": 0.00023223227686174278, + "loss": 0.0166, "step": 174290 }, { - "epoch": 0.88, - "learning_rate": 0.00016809511076580007, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023222838864537132, + "loss": 0.0161, "step": 174300 }, { - "epoch": 0.88, - "learning_rate": 0.00016808754307278605, - "loss": 0.0091, + "epoch": 0.45, + "learning_rate": 0.00023222450042899984, + "loss": 0.0183, "step": 174310 }, { - "epoch": 0.88, - "learning_rate": 0.00016807997537977203, - "loss": 0.0122, + "epoch": 0.45, + "learning_rate": 0.00023222061221262838, + "loss": 0.0227, "step": 174320 }, { - "epoch": 0.88, - "learning_rate": 0.00016807240768675804, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.00023221672399625695, + "loss": 0.0145, "step": 174330 }, { - "epoch": 0.88, - "learning_rate": 0.00016806483999374402, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023221283577988546, + "loss": 0.0182, "step": 174340 }, { - "epoch": 0.88, - "learning_rate": 0.00016805727230073, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.000232208947563514, + "loss": 0.0165, "step": 174350 }, { - "epoch": 0.88, - "learning_rate": 0.000168049704607716, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023220505934714252, + "loss": 0.0182, "step": 174360 }, { - "epoch": 0.88, - "learning_rate": 0.000168042136914702, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.0002322011711307711, + "loss": 0.0192, "step": 174370 }, { - "epoch": 0.88, - "learning_rate": 0.00016803456922168797, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.0002321972829143996, + "loss": 0.0174, "step": 174380 }, { - "epoch": 0.88, - "learning_rate": 0.00016802700152867395, - "loss": 0.0171, + "epoch": 0.45, + "learning_rate": 0.00023219339469802814, + "loss": 0.0188, "step": 174390 }, { - "epoch": 0.88, - "learning_rate": 0.00016801943383565996, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023218950648165666, + "loss": 0.0166, "step": 174400 }, { - "epoch": 0.88, - "learning_rate": 0.00016801186614264594, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023218561826528523, + "loss": 0.0156, "step": 174410 }, { - "epoch": 0.88, - "learning_rate": 0.00016800429844963192, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023218173004891374, + "loss": 0.018, "step": 174420 }, { - "epoch": 0.88, - "learning_rate": 0.00016799673075661793, - "loss": 0.0132, + "epoch": 0.45, + "learning_rate": 0.00023217784183254228, + "loss": 0.0165, "step": 174430 }, { - "epoch": 0.88, - "learning_rate": 0.00016798916306360391, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.0002321739536161708, + "loss": 0.0189, "step": 174440 }, { - "epoch": 0.88, - "learning_rate": 0.0001679815953705899, - "loss": 0.0106, + "epoch": 0.45, + "learning_rate": 0.00023217006539979934, + "loss": 0.0147, "step": 174450 }, { - "epoch": 0.88, - "learning_rate": 0.0001679740276775759, - "loss": 0.0155, + "epoch": 0.45, + "learning_rate": 0.00023216617718342788, + "loss": 0.0177, "step": 174460 }, { - "epoch": 0.88, - "learning_rate": 0.00016796645998456189, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023216228896705642, + "loss": 0.0144, "step": 174470 }, { - "epoch": 0.88, - "learning_rate": 0.00016795889229154787, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023215840075068494, + "loss": 0.0149, "step": 174480 }, { - "epoch": 0.88, - "learning_rate": 0.00016795132459853388, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023215451253431348, + "loss": 0.0183, "step": 174490 }, { - "epoch": 0.88, - "learning_rate": 0.00016794375690551986, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023215062431794205, + "loss": 0.0206, "step": 174500 }, { - "epoch": 0.88, - "learning_rate": 0.00016793618921250584, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.00023214673610157056, + "loss": 0.0188, "step": 174510 }, { - "epoch": 0.88, - "learning_rate": 0.00016792862151949185, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023214284788519908, + "loss": 0.0176, "step": 174520 }, { - "epoch": 0.88, - "learning_rate": 0.00016792105382647783, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023213895966882762, + "loss": 0.0243, "step": 174530 }, { - "epoch": 0.88, - "learning_rate": 0.0001679134861334638, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.0002321350714524562, + "loss": 0.0175, "step": 174540 }, { - "epoch": 0.88, - "learning_rate": 0.00016790591844044982, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002321311832360847, + "loss": 0.0183, "step": 174550 }, { - "epoch": 0.88, - "learning_rate": 0.0001678983507474358, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023212729501971324, + "loss": 0.0169, "step": 174560 }, { - "epoch": 0.88, - "learning_rate": 0.00016789078305442178, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023212340680334176, + "loss": 0.0205, "step": 174570 }, { - "epoch": 0.88, - "learning_rate": 0.00016788321536140776, - "loss": 0.0129, + "epoch": 0.45, + "learning_rate": 0.00023211951858697033, + "loss": 0.0156, "step": 174580 }, { - "epoch": 0.88, - "learning_rate": 0.00016787564766839377, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023211563037059884, + "loss": 0.0149, "step": 174590 }, { - "epoch": 0.88, - "learning_rate": 0.00016786807997537975, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023211174215422738, + "loss": 0.0162, "step": 174600 }, { - "epoch": 0.88, - "learning_rate": 0.00016786051228236573, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.0002321078539378559, + "loss": 0.027, "step": 174610 }, { - "epoch": 0.88, - "learning_rate": 0.00016785294458935174, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023210396572148447, + "loss": 0.0198, "step": 174620 }, { - "epoch": 0.88, - "learning_rate": 0.00016784537689633772, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023210007750511298, + "loss": 0.0172, "step": 174630 }, { - "epoch": 0.88, - "learning_rate": 0.0001678378092033237, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023209618928874152, + "loss": 0.0188, "step": 174640 }, { - "epoch": 0.88, - "learning_rate": 0.00016783024151030971, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023209230107237004, + "loss": 0.0186, "step": 174650 }, { - "epoch": 0.88, - "learning_rate": 0.0001678226738172957, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.0002320884128559986, + "loss": 0.0164, "step": 174660 }, { - "epoch": 0.88, - "learning_rate": 0.00016781510612428168, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023208452463962712, + "loss": 0.0193, "step": 174670 }, { - "epoch": 0.88, - "learning_rate": 0.00016780753843126769, - "loss": 0.0111, + "epoch": 0.45, + "learning_rate": 0.00023208063642325566, + "loss": 0.0174, "step": 174680 }, { - "epoch": 0.88, - "learning_rate": 0.00016779997073825367, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023207674820688418, + "loss": 0.0166, "step": 174690 }, { - "epoch": 0.88, - "learning_rate": 0.00016779240304523965, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023207285999051272, + "loss": 0.0176, "step": 174700 }, { - "epoch": 0.88, - "learning_rate": 0.00016778483535222566, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.0002320689717741413, + "loss": 0.0182, "step": 174710 }, { - "epoch": 0.88, - "learning_rate": 0.00016777726765921164, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.0002320650835577698, + "loss": 0.0176, "step": 174720 }, { - "epoch": 0.88, - "learning_rate": 0.00016776969996619762, - "loss": 0.0146, + "epoch": 0.45, + "learning_rate": 0.00023206119534139834, + "loss": 0.0187, "step": 174730 }, { - "epoch": 0.88, - "learning_rate": 0.0001677621322731836, - "loss": 0.0094, + "epoch": 0.45, + "learning_rate": 0.00023205730712502686, + "loss": 0.0256, "step": 174740 }, { - "epoch": 0.88, - "learning_rate": 0.0001677545645801696, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.00023205341890865543, + "loss": 0.0181, "step": 174750 }, { - "epoch": 0.88, - "learning_rate": 0.0001677469968871556, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023204953069228394, + "loss": 0.0141, "step": 174760 }, { - "epoch": 0.88, - "learning_rate": 0.00016773942919414157, - "loss": 0.0125, + "epoch": 0.45, + "learning_rate": 0.00023204564247591248, + "loss": 0.0171, "step": 174770 }, { - "epoch": 0.88, - "learning_rate": 0.00016773186150112758, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.000232041754259541, + "loss": 0.0195, "step": 174780 }, { - "epoch": 0.88, - "learning_rate": 0.00016772429380811356, - "loss": 0.0144, + "epoch": 0.45, + "learning_rate": 0.00023203786604316957, + "loss": 0.017, "step": 174790 }, { - "epoch": 0.88, - "learning_rate": 0.00016771672611509954, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.00023203397782679808, + "loss": 0.0199, "step": 174800 }, { - "epoch": 0.88, - "learning_rate": 0.00016770915842208555, - "loss": 0.0101, + "epoch": 0.45, + "learning_rate": 0.00023203008961042662, + "loss": 0.0208, "step": 174810 }, { - "epoch": 0.88, - "learning_rate": 0.00016770159072907153, - "loss": 0.0094, + "epoch": 0.45, + "learning_rate": 0.00023202620139405514, + "loss": 0.0183, "step": 174820 }, { - "epoch": 0.88, - "learning_rate": 0.00016769402303605752, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.0002320223131776837, + "loss": 0.0206, "step": 174830 }, { - "epoch": 0.88, - "learning_rate": 0.00016768645534304352, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023201842496131222, + "loss": 0.0192, "step": 174840 }, { - "epoch": 0.88, - "learning_rate": 0.0001676788876500295, - "loss": 0.012, + "epoch": 0.45, + "learning_rate": 0.00023201453674494076, + "loss": 0.0178, "step": 174850 }, { - "epoch": 0.88, - "learning_rate": 0.0001676713199570155, - "loss": 0.0097, + "epoch": 0.45, + "learning_rate": 0.00023201064852856928, + "loss": 0.0174, "step": 174860 }, { - "epoch": 0.88, - "learning_rate": 0.0001676637522640015, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023200676031219785, + "loss": 0.018, "step": 174870 }, { - "epoch": 0.88, - "learning_rate": 0.00016765618457098748, - "loss": 0.0154, + "epoch": 0.45, + "learning_rate": 0.0002320028720958264, + "loss": 0.0158, "step": 174880 }, { - "epoch": 0.88, - "learning_rate": 0.00016764861687797346, - "loss": 0.0117, + "epoch": 0.45, + "learning_rate": 0.0002319989838794549, + "loss": 0.0164, "step": 174890 }, { - "epoch": 0.88, - "learning_rate": 0.00016764104918495944, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.00023199509566308344, + "loss": 0.0203, "step": 174900 }, { - "epoch": 0.88, - "learning_rate": 0.00016763348149194545, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023199120744671198, + "loss": 0.0195, "step": 174910 }, { - "epoch": 0.88, - "learning_rate": 0.00016762591379893143, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023198731923034053, + "loss": 0.0212, "step": 174920 }, { - "epoch": 0.88, - "learning_rate": 0.0001676183461059174, - "loss": 0.0157, + "epoch": 0.45, + "learning_rate": 0.00023198343101396904, + "loss": 0.0156, "step": 174930 }, { - "epoch": 0.88, - "learning_rate": 0.00016761077841290342, - "loss": 0.0141, + "epoch": 0.45, + "learning_rate": 0.00023197954279759758, + "loss": 0.0142, "step": 174940 }, { - "epoch": 0.88, - "learning_rate": 0.0001676032107198894, - "loss": 0.0148, + "epoch": 0.45, + "learning_rate": 0.0002319756545812261, + "loss": 0.0186, "step": 174950 }, { - "epoch": 0.88, - "learning_rate": 0.00016759564302687538, - "loss": 0.0887, + "epoch": 0.45, + "learning_rate": 0.00023197176636485467, + "loss": 0.0185, "step": 174960 }, { - "epoch": 0.88, - "learning_rate": 0.0001675880753338614, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023196787814848318, + "loss": 0.0166, "step": 174970 }, { - "epoch": 0.88, - "learning_rate": 0.00016758050764084737, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023196398993211172, + "loss": 0.0162, "step": 174980 }, { - "epoch": 0.88, - "learning_rate": 0.00016757293994783335, - "loss": 0.0149, + "epoch": 0.45, + "learning_rate": 0.00023196010171574024, + "loss": 0.018, "step": 174990 }, { - "epoch": 0.88, - "learning_rate": 0.00016756537225481936, - "loss": 0.0152, + "epoch": 0.45, + "learning_rate": 0.0002319562134993688, + "loss": 0.019, "step": 175000 }, { - "epoch": 0.88, - "eval_cer": 0.9144993677869243, - "eval_loss": 0.008513858541846275, - "eval_runtime": 116.6209, - "eval_samples_per_second": 17.15, - "eval_steps_per_second": 4.287, + "epoch": 0.45, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.012664512731134892, + "eval_runtime": 107.9478, + "eval_samples_per_second": 18.527, + "eval_steps_per_second": 4.632, "step": 175000 }, { - "epoch": 0.88, - "learning_rate": 0.00016755780456180534, - "loss": 0.011, + "epoch": 0.45, + "learning_rate": 0.00023195232528299732, + "loss": 0.0157, "step": 175010 }, { - "epoch": 0.88, - "learning_rate": 0.00016755023686879133, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023194843706662586, + "loss": 0.0172, "step": 175020 }, { - "epoch": 0.88, - "learning_rate": 0.00016754266917577733, - "loss": 0.0094, + "epoch": 0.45, + "learning_rate": 0.00023194454885025438, + "loss": 0.0217, "step": 175030 }, { - "epoch": 0.88, - "learning_rate": 0.00016753510148276332, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023194066063388294, + "loss": 0.0169, "step": 175040 }, { - "epoch": 0.88, - "learning_rate": 0.0001675275337897493, - "loss": 0.0135, + "epoch": 0.45, + "learning_rate": 0.00023193677241751149, + "loss": 0.0177, "step": 175050 }, { - "epoch": 0.88, - "learning_rate": 0.0001675199660967353, - "loss": 0.0105, + "epoch": 0.45, + "learning_rate": 0.00023193288420114, + "loss": 0.0178, "step": 175060 }, { - "epoch": 0.88, - "learning_rate": 0.0001675123984037213, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023192899598476852, + "loss": 0.0228, "step": 175070 }, { - "epoch": 0.88, - "learning_rate": 0.00016750483071070727, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023192510776839708, + "loss": 0.0175, "step": 175080 }, { - "epoch": 0.88, - "learning_rate": 0.00016749726301769325, - "loss": 0.0088, + "epoch": 0.45, + "learning_rate": 0.00023192121955202563, + "loss": 0.0186, "step": 175090 }, { - "epoch": 0.88, - "learning_rate": 0.00016748969532467926, - "loss": 0.013, + "epoch": 0.45, + "learning_rate": 0.00023191733133565414, + "loss": 0.0205, "step": 175100 }, { - "epoch": 0.88, - "learning_rate": 0.00016748212763166524, - "loss": 0.0099, + "epoch": 0.45, + "learning_rate": 0.00023191344311928268, + "loss": 0.0218, "step": 175110 }, { - "epoch": 0.88, - "learning_rate": 0.00016747455993865122, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023190955490291122, + "loss": 0.0162, "step": 175120 }, { - "epoch": 0.88, - "learning_rate": 0.00016746699224563723, - "loss": 0.0136, + "epoch": 0.45, + "learning_rate": 0.00023190566668653977, + "loss": 0.02, "step": 175130 }, { - "epoch": 0.88, - "learning_rate": 0.0001674594245526232, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023190177847016828, + "loss": 0.0217, "step": 175140 }, { - "epoch": 0.88, - "learning_rate": 0.0001674518568596092, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023189789025379682, + "loss": 0.0161, "step": 175150 }, { - "epoch": 0.88, - "learning_rate": 0.0001674442891665952, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023189400203742536, + "loss": 0.0178, "step": 175160 }, { - "epoch": 0.88, - "learning_rate": 0.00016743672147358118, - "loss": 0.0118, + "epoch": 0.45, + "learning_rate": 0.0002318901138210539, + "loss": 0.021, "step": 175170 }, { - "epoch": 0.88, - "learning_rate": 0.00016742915378056716, - "loss": 0.0116, + "epoch": 0.45, + "learning_rate": 0.00023188622560468242, + "loss": 0.0231, "step": 175180 }, { - "epoch": 0.88, - "learning_rate": 0.00016742158608755317, - "loss": 0.0102, + "epoch": 0.45, + "learning_rate": 0.00023188233738831096, + "loss": 0.017, "step": 175190 }, { - "epoch": 0.88, - "learning_rate": 0.00016741401839453915, - "loss": 0.0098, + "epoch": 0.45, + "learning_rate": 0.00023187844917193948, + "loss": 0.0187, "step": 175200 }, { - "epoch": 0.88, - "learning_rate": 0.00016740645070152514, - "loss": 0.0161, + "epoch": 0.45, + "learning_rate": 0.00023187456095556804, + "loss": 0.0165, "step": 175210 }, { - "epoch": 0.88, - "learning_rate": 0.00016739888300851114, - "loss": 0.0142, + "epoch": 0.45, + "learning_rate": 0.00023187067273919659, + "loss": 0.0158, "step": 175220 }, { - "epoch": 0.88, - "learning_rate": 0.00016739131531549713, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.0002318667845228251, + "loss": 0.0172, "step": 175230 }, { - "epoch": 0.88, - "learning_rate": 0.0001673837476224831, - "loss": 0.0101, + "epoch": 0.45, + "learning_rate": 0.00023186289630645361, + "loss": 0.0166, "step": 175240 }, { - "epoch": 0.88, - "learning_rate": 0.0001673761799294691, - "loss": 0.0103, + "epoch": 0.45, + "learning_rate": 0.00023185900809008218, + "loss": 0.0196, "step": 175250 }, { - "epoch": 0.88, - "learning_rate": 0.0001673686122364551, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.00023185511987371073, + "loss": 0.0217, "step": 175260 }, { - "epoch": 0.88, - "learning_rate": 0.00016736104454344108, - "loss": 0.0131, + "epoch": 0.45, + "learning_rate": 0.00023185123165733924, + "loss": 0.0163, "step": 175270 }, { - "epoch": 0.88, - "learning_rate": 0.00016735347685042706, - "loss": 0.0109, + "epoch": 0.45, + "learning_rate": 0.00023184734344096778, + "loss": 0.0219, "step": 175280 }, { - "epoch": 0.88, - "learning_rate": 0.00016734590915741307, - "loss": 0.0166, + "epoch": 0.45, + "learning_rate": 0.00023184345522459632, + "loss": 0.0164, "step": 175290 }, { - "epoch": 0.88, - "learning_rate": 0.00016733834146439905, - "loss": 0.0112, + "epoch": 0.45, + "learning_rate": 0.00023183956700822486, + "loss": 0.0207, "step": 175300 }, { - "epoch": 0.88, - "learning_rate": 0.00016733077377138503, - "loss": 0.0108, + "epoch": 0.45, + "learning_rate": 0.00023183567879185338, + "loss": 0.0198, "step": 175310 }, { - "epoch": 0.88, - "learning_rate": 0.00016732320607837104, - "loss": 0.0121, + "epoch": 0.45, + "learning_rate": 0.00023183179057548192, + "loss": 0.0166, "step": 175320 }, { - "epoch": 0.88, - "learning_rate": 0.00016731563838535702, - "loss": 0.0146, + "epoch": 0.45, + "learning_rate": 0.00023182790235911046, + "loss": 0.017, "step": 175330 }, { - "epoch": 0.88, - "learning_rate": 0.00016730807069234298, - "loss": 0.0115, + "epoch": 0.45, + "learning_rate": 0.000231824014142739, + "loss": 0.0186, "step": 175340 }, { - "epoch": 0.88, - "learning_rate": 0.00016730050299932896, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023182012592636752, + "loss": 0.0207, "step": 175350 }, { - "epoch": 0.88, - "learning_rate": 0.00016729293530631497, - "loss": 0.0127, + "epoch": 0.45, + "learning_rate": 0.00023181623770999606, + "loss": 0.0203, "step": 175360 }, { - "epoch": 0.88, - "learning_rate": 0.00016728536761330095, - "loss": 0.0126, + "epoch": 0.45, + "learning_rate": 0.00023181234949362463, + "loss": 0.0154, "step": 175370 }, { - "epoch": 0.88, - "learning_rate": 0.00016727779992028693, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023180846127725314, + "loss": 0.0182, "step": 175380 }, { - "epoch": 0.88, - "learning_rate": 0.00016727023222727294, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023180457306088166, + "loss": 0.0222, "step": 175390 }, { - "epoch": 0.88, - "learning_rate": 0.00016726266453425892, - "loss": 0.0139, + "epoch": 0.45, + "learning_rate": 0.0002318006848445102, + "loss": 0.0174, "step": 175400 }, { - "epoch": 0.88, - "learning_rate": 0.0001672550968412449, - "loss": 0.0119, + "epoch": 0.45, + "learning_rate": 0.00023179679662813877, + "loss": 0.0163, "step": 175410 }, { - "epoch": 0.89, - "learning_rate": 0.0001672475291482309, - "loss": 0.0114, + "epoch": 0.45, + "learning_rate": 0.00023179290841176728, + "loss": 0.0158, "step": 175420 }, { - "epoch": 0.89, - "learning_rate": 0.0001672399614552169, - "loss": 0.0104, + "epoch": 0.45, + "learning_rate": 0.00023178902019539582, + "loss": 0.0187, "step": 175430 }, { - "epoch": 0.89, - "learning_rate": 0.00016723239376220287, - "loss": 0.0096, + "epoch": 0.45, + "learning_rate": 0.00023178513197902434, + "loss": 0.0243, "step": 175440 }, { - "epoch": 0.89, - "learning_rate": 0.00016722482606918888, - "loss": 0.0138, + "epoch": 0.45, + "learning_rate": 0.00023178124376265288, + "loss": 0.0211, "step": 175450 }, { - "epoch": 0.89, - "learning_rate": 0.00016721725837617486, - "loss": 0.0134, + "epoch": 0.45, + "learning_rate": 0.00023177735554628142, + "loss": 0.0296, "step": 175460 }, { - "epoch": 0.89, - "learning_rate": 0.00016720969068316084, - "loss": 0.01, + "epoch": 0.45, + "learning_rate": 0.00023177346732990996, + "loss": 0.0217, "step": 175470 }, { - "epoch": 0.89, - "learning_rate": 0.00016720212299014682, - "loss": 0.0178, + "epoch": 0.45, + "learning_rate": 0.00023176957911353848, + "loss": 0.0162, "step": 175480 }, { - "epoch": 0.89, - "learning_rate": 0.00016719455529713283, - "loss": 0.0152, + "epoch": 0.45, + "learning_rate": 0.00023176569089716702, + "loss": 0.0186, "step": 175490 }, { - "epoch": 0.89, - "learning_rate": 0.00016718698760411881, - "loss": 0.0124, + "epoch": 0.45, + "learning_rate": 0.00023176180268079556, + "loss": 0.0185, "step": 175500 }, { - "epoch": 0.89, - "learning_rate": 0.0001671794199111048, - "loss": 0.0128, + "epoch": 0.45, + "learning_rate": 0.0002317579144644241, + "loss": 0.0192, "step": 175510 }, { - "epoch": 0.89, - "learning_rate": 0.0001671718522180908, - "loss": 0.0107, + "epoch": 0.45, + "learning_rate": 0.00023175402624805262, + "loss": 0.0166, "step": 175520 }, { - "epoch": 0.89, - "learning_rate": 0.00016716428452507679, - "loss": 0.0123, + "epoch": 0.45, + "learning_rate": 0.00023175013803168116, + "loss": 0.0171, "step": 175530 }, { - "epoch": 0.89, - "learning_rate": 0.00016715671683206277, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023174624981530973, + "loss": 0.019, "step": 175540 }, { - "epoch": 0.89, - "learning_rate": 0.00016714914913904878, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023174236159893824, + "loss": 0.0172, "step": 175550 }, { - "epoch": 0.89, - "learning_rate": 0.00016714158144603476, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.00023173847338256676, + "loss": 0.0183, "step": 175560 }, { - "epoch": 0.89, - "learning_rate": 0.00016713401375302074, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.0002317345851661953, + "loss": 0.0166, "step": 175570 }, { - "epoch": 0.89, - "learning_rate": 0.00016712644606000675, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023173069694982387, + "loss": 0.0222, "step": 175580 }, { - "epoch": 0.89, - "learning_rate": 0.00016711887836699273, - "loss": 0.0092, + "epoch": 0.46, + "learning_rate": 0.00023172680873345238, + "loss": 0.017, "step": 175590 }, { - "epoch": 0.89, - "learning_rate": 0.0001671113106739787, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023172292051708092, + "loss": 0.0174, "step": 175600 }, { - "epoch": 0.89, - "learning_rate": 0.00016710374298096472, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023171903230070944, + "loss": 0.0212, "step": 175610 }, { - "epoch": 0.89, - "learning_rate": 0.0001670961752879507, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.000231715144084338, + "loss": 0.0177, "step": 175620 }, { - "epoch": 0.89, - "learning_rate": 0.00016708860759493668, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023171125586796652, + "loss": 0.0184, "step": 175630 }, { - "epoch": 0.89, - "learning_rate": 0.00016708103990192266, - "loss": 0.015, + "epoch": 0.46, + "learning_rate": 0.00023170736765159506, + "loss": 0.0172, "step": 175640 }, { - "epoch": 0.89, - "learning_rate": 0.00016707347220890867, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023170347943522358, + "loss": 0.0194, "step": 175650 }, { - "epoch": 0.89, - "learning_rate": 0.00016706590451589465, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023169959121885212, + "loss": 0.0154, "step": 175660 }, { - "epoch": 0.89, - "learning_rate": 0.00016705833682288063, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023169570300248066, + "loss": 0.0185, "step": 175670 }, { - "epoch": 0.89, - "learning_rate": 0.00016705076912986664, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002316918147861092, + "loss": 0.0214, "step": 175680 }, { - "epoch": 0.89, - "learning_rate": 0.00016704320143685262, - "loss": 0.0092, + "epoch": 0.46, + "learning_rate": 0.00023168792656973772, + "loss": 0.0171, "step": 175690 }, { - "epoch": 0.89, - "learning_rate": 0.0001670356337438386, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023168403835336626, + "loss": 0.0196, "step": 175700 }, { - "epoch": 0.89, - "learning_rate": 0.00016702806605082461, - "loss": 0.0163, + "epoch": 0.46, + "learning_rate": 0.0002316801501369948, + "loss": 0.02, "step": 175710 }, { - "epoch": 0.89, - "learning_rate": 0.0001670204983578106, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023167626192062334, + "loss": 0.0192, "step": 175720 }, { - "epoch": 0.89, - "learning_rate": 0.00016701293066479658, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023167237370425186, + "loss": 0.0163, "step": 175730 }, { - "epoch": 0.89, - "learning_rate": 0.00016700536297178259, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002316684854878804, + "loss": 0.0194, "step": 175740 }, { - "epoch": 0.89, - "learning_rate": 0.00016699779527876857, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023166459727150897, + "loss": 0.0192, "step": 175750 }, { - "epoch": 0.89, - "learning_rate": 0.00016699022758575455, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023166070905513748, + "loss": 0.0186, "step": 175760 }, { - "epoch": 0.89, - "learning_rate": 0.00016698265989274056, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023165682083876602, + "loss": 0.0174, "step": 175770 }, { - "epoch": 0.89, - "learning_rate": 0.00016697509219972654, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.00023165293262239454, + "loss": 0.0218, "step": 175780 }, { - "epoch": 0.89, - "learning_rate": 0.00016696752450671252, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.0002316490444060231, + "loss": 0.0169, "step": 175790 }, { - "epoch": 0.89, - "learning_rate": 0.0001669599568136985, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023164515618965162, + "loss": 0.0201, "step": 175800 }, { - "epoch": 0.89, - "learning_rate": 0.0001669523891206845, - "loss": 0.0215, + "epoch": 0.46, + "learning_rate": 0.00023164126797328016, + "loss": 0.0226, "step": 175810 }, { - "epoch": 0.89, - "learning_rate": 0.0001669448214276705, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.00023163737975690868, + "loss": 0.0259, "step": 175820 }, { - "epoch": 0.89, - "learning_rate": 0.00016693725373465647, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023163349154053725, + "loss": 0.019, "step": 175830 }, { - "epoch": 0.89, - "learning_rate": 0.00016692968604164248, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023162960332416576, + "loss": 0.023, "step": 175840 }, { - "epoch": 0.89, - "learning_rate": 0.00016692211834862846, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002316257151077943, + "loss": 0.0178, "step": 175850 }, { - "epoch": 0.89, - "learning_rate": 0.00016691455065561444, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023162182689142282, + "loss": 0.0238, "step": 175860 }, { - "epoch": 0.89, - "learning_rate": 0.00016690698296260045, - "loss": 0.0157, + "epoch": 0.46, + "learning_rate": 0.00023161793867505139, + "loss": 0.0181, "step": 175870 }, { - "epoch": 0.89, - "learning_rate": 0.00016689941526958643, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.0002316140504586799, + "loss": 0.0177, "step": 175880 }, { - "epoch": 0.89, - "learning_rate": 0.00016689184757657242, - "loss": 0.0156, + "epoch": 0.46, + "learning_rate": 0.00023161016224230844, + "loss": 0.0169, "step": 175890 }, { - "epoch": 0.89, - "learning_rate": 0.00016688427988355842, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023160627402593696, + "loss": 0.0159, "step": 175900 }, { - "epoch": 0.89, - "learning_rate": 0.0001668767121905444, - "loss": 0.0163, + "epoch": 0.46, + "learning_rate": 0.0002316023858095655, + "loss": 0.0234, "step": 175910 }, { - "epoch": 0.89, - "learning_rate": 0.0001668691444975304, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023159849759319407, + "loss": 0.023, "step": 175920 }, { - "epoch": 0.89, - "learning_rate": 0.0001668615768045164, - "loss": 0.0168, + "epoch": 0.46, + "learning_rate": 0.00023159460937682258, + "loss": 0.0238, "step": 175930 }, { - "epoch": 0.89, - "learning_rate": 0.00016685400911150238, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023159072116045112, + "loss": 0.016, "step": 175940 }, { - "epoch": 0.89, - "learning_rate": 0.00016684644141848836, - "loss": 0.0127, + "epoch": 0.46, + "learning_rate": 0.00023158683294407964, + "loss": 0.0185, "step": 175950 }, { - "epoch": 0.89, - "learning_rate": 0.00016683887372547437, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.0002315829447277082, + "loss": 0.0174, "step": 175960 }, { - "epoch": 0.89, - "learning_rate": 0.00016683130603246035, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023157905651133672, + "loss": 0.016, "step": 175970 }, { - "epoch": 0.89, - "learning_rate": 0.00016682373833944633, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023157516829496526, + "loss": 0.0187, "step": 175980 }, { - "epoch": 0.89, - "learning_rate": 0.0001668161706464323, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023157128007859378, + "loss": 0.0173, "step": 175990 }, { - "epoch": 0.89, - "learning_rate": 0.00016680860295341832, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023156739186222235, + "loss": 0.0156, "step": 176000 }, { - "epoch": 0.89, - "eval_cer": 0.9145032493714259, - "eval_loss": 0.008152415975928307, - "eval_runtime": 116.6203, - "eval_samples_per_second": 17.15, - "eval_steps_per_second": 4.287, + "epoch": 0.46, + "eval_cer": 0.8817838652653501, + "eval_loss": 0.012811483815312386, + "eval_runtime": 107.6031, + "eval_samples_per_second": 18.587, + "eval_steps_per_second": 4.647, "step": 176000 }, { - "epoch": 0.89, - "learning_rate": 0.0001668010352604043, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023156350364585086, + "loss": 0.0194, "step": 176010 }, { - "epoch": 0.89, - "learning_rate": 0.00016679346756739028, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.0002315596154294794, + "loss": 0.0152, "step": 176020 }, { - "epoch": 0.89, - "learning_rate": 0.0001667858998743763, - "loss": 0.0097, + "epoch": 0.46, + "learning_rate": 0.00023155572721310792, + "loss": 0.0193, "step": 176030 }, { - "epoch": 0.89, - "learning_rate": 0.00016677833218136227, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023155183899673648, + "loss": 0.0154, "step": 176040 }, { - "epoch": 0.89, - "learning_rate": 0.00016677076448834825, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.000231547950780365, + "loss": 0.0254, "step": 176050 }, { - "epoch": 0.89, - "learning_rate": 0.00016676319679533426, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023154406256399354, + "loss": 0.0169, "step": 176060 }, { - "epoch": 0.89, - "learning_rate": 0.00016675562910232024, - "loss": 0.0097, + "epoch": 0.46, + "learning_rate": 0.00023154017434762206, + "loss": 0.021, "step": 176070 }, { - "epoch": 0.89, - "learning_rate": 0.00016674806140930623, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023153628613125062, + "loss": 0.0196, "step": 176080 }, { - "epoch": 0.89, - "learning_rate": 0.00016674049371629223, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023153239791487917, + "loss": 0.0208, "step": 176090 }, { - "epoch": 0.89, - "learning_rate": 0.00016673292602327822, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023152850969850768, + "loss": 0.0189, "step": 176100 }, { - "epoch": 0.89, - "learning_rate": 0.0001667253583302642, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.0002315246214821362, + "loss": 0.0183, "step": 176110 }, { - "epoch": 0.89, - "learning_rate": 0.0001667177906372502, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023152073326576476, + "loss": 0.0167, "step": 176120 }, { - "epoch": 0.89, - "learning_rate": 0.0001667102229442362, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.0002315168450493933, + "loss": 0.0156, "step": 176130 }, { - "epoch": 0.89, - "learning_rate": 0.00016670265525122217, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023151295683302182, + "loss": 0.0215, "step": 176140 }, { - "epoch": 0.89, - "learning_rate": 0.00016669508755820815, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.00023150906861665036, + "loss": 0.0168, "step": 176150 }, { - "epoch": 0.89, - "learning_rate": 0.00016668751986519416, - "loss": 0.0087, + "epoch": 0.46, + "learning_rate": 0.00023150518040027888, + "loss": 0.0204, "step": 176160 }, { - "epoch": 0.89, - "learning_rate": 0.00016667995217218014, - "loss": 0.0136, + "epoch": 0.46, + "learning_rate": 0.00023150129218390744, + "loss": 0.0204, "step": 176170 }, { - "epoch": 0.89, - "learning_rate": 0.00016667238447916612, - "loss": 0.0155, + "epoch": 0.46, + "learning_rate": 0.00023149740396753596, + "loss": 0.0213, "step": 176180 }, { - "epoch": 0.89, - "learning_rate": 0.00016666481678615213, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.0002314935157511645, + "loss": 0.0187, "step": 176190 }, { - "epoch": 0.89, - "learning_rate": 0.0001666572490931381, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023148962753479302, + "loss": 0.0197, "step": 176200 }, { - "epoch": 0.89, - "learning_rate": 0.0001666496814001241, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023148573931842158, + "loss": 0.0181, "step": 176210 }, { - "epoch": 0.89, - "learning_rate": 0.0001666421137071101, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.0002314818511020501, + "loss": 0.0183, "step": 176220 }, { - "epoch": 0.89, - "learning_rate": 0.00016663454601409608, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023147796288567864, + "loss": 0.0245, "step": 176230 }, { - "epoch": 0.89, - "learning_rate": 0.00016662697832108206, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023147407466930715, + "loss": 0.0196, "step": 176240 }, { - "epoch": 0.89, - "learning_rate": 0.00016661941062806807, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023147018645293572, + "loss": 0.0165, "step": 176250 }, { - "epoch": 0.89, - "learning_rate": 0.00016661184293505405, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023146629823656424, + "loss": 0.018, "step": 176260 }, { - "epoch": 0.89, - "learning_rate": 0.00016660427524204004, - "loss": 0.009, + "epoch": 0.46, + "learning_rate": 0.00023146241002019278, + "loss": 0.0158, "step": 176270 }, { - "epoch": 0.89, - "learning_rate": 0.00016659670754902604, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.0002314585218038213, + "loss": 0.0176, "step": 176280 }, { - "epoch": 0.89, - "learning_rate": 0.00016658913985601203, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023145463358744986, + "loss": 0.0213, "step": 176290 }, { - "epoch": 0.89, - "learning_rate": 0.000166581572162998, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.0002314507453710784, + "loss": 0.0163, "step": 176300 }, { - "epoch": 0.89, - "learning_rate": 0.000166574004469984, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.00023144685715470692, + "loss": 0.0215, "step": 176310 }, { - "epoch": 0.89, - "learning_rate": 0.00016656643677697, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023144296893833546, + "loss": 0.0158, "step": 176320 }, { - "epoch": 0.89, - "learning_rate": 0.00016655886908395598, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.000231439080721964, + "loss": 0.0163, "step": 176330 }, { - "epoch": 0.89, - "learning_rate": 0.00016655130139094196, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023143519250559254, + "loss": 0.0168, "step": 176340 }, { - "epoch": 0.89, - "learning_rate": 0.00016654373369792797, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023143130428922106, + "loss": 0.0158, "step": 176350 }, { - "epoch": 0.89, - "learning_rate": 0.00016653616600491395, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002314274160728496, + "loss": 0.0174, "step": 176360 }, { - "epoch": 0.89, - "learning_rate": 0.00016652859831189993, - "loss": 0.0152, + "epoch": 0.46, + "learning_rate": 0.00023142352785647814, + "loss": 0.0162, "step": 176370 }, { - "epoch": 0.89, - "learning_rate": 0.00016652103061888594, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023141963964010668, + "loss": 0.0206, "step": 176380 }, { - "epoch": 0.89, - "learning_rate": 0.00016651346292587192, - "loss": 0.0129, + "epoch": 0.46, + "learning_rate": 0.0002314157514237352, + "loss": 0.0201, "step": 176390 }, { - "epoch": 0.89, - "learning_rate": 0.0001665058952328579, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023141186320736374, + "loss": 0.0167, "step": 176400 }, { - "epoch": 0.89, - "learning_rate": 0.0001664983275398439, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023140797499099225, + "loss": 0.0149, "step": 176410 }, { - "epoch": 0.89, - "learning_rate": 0.0001664907598468299, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.00023140408677462082, + "loss": 0.0186, "step": 176420 }, { - "epoch": 0.89, - "learning_rate": 0.00016648319215381587, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023140019855824934, + "loss": 0.0184, "step": 176430 }, { - "epoch": 0.89, - "learning_rate": 0.00016647562446080188, - "loss": 0.0093, + "epoch": 0.46, + "learning_rate": 0.00023139631034187788, + "loss": 0.0187, "step": 176440 }, { - "epoch": 0.89, - "learning_rate": 0.00016646805676778786, - "loss": 0.0127, + "epoch": 0.46, + "learning_rate": 0.0002313924221255064, + "loss": 0.019, "step": 176450 }, { - "epoch": 0.89, - "learning_rate": 0.00016646048907477385, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023138853390913496, + "loss": 0.0169, "step": 176460 }, { - "epoch": 0.89, - "learning_rate": 0.00016645292138175983, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.0002313846456927635, + "loss": 0.0177, "step": 176470 }, { - "epoch": 0.89, - "learning_rate": 0.00016644535368874584, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023138075747639202, + "loss": 0.0149, "step": 176480 }, { - "epoch": 0.89, - "learning_rate": 0.00016643778599573182, - "loss": 0.0145, + "epoch": 0.46, + "learning_rate": 0.00023137686926002056, + "loss": 0.0204, "step": 176490 }, { - "epoch": 0.89, - "learning_rate": 0.0001664302183027178, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.0002313729810436491, + "loss": 0.0144, "step": 176500 }, { - "epoch": 0.89, - "learning_rate": 0.0001664226506097038, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023136909282727764, + "loss": 0.0195, "step": 176510 }, { - "epoch": 0.89, - "learning_rate": 0.0001664150829166898, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023136520461090616, + "loss": 0.0251, "step": 176520 }, { - "epoch": 0.89, - "learning_rate": 0.00016640751522367577, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002313613163945347, + "loss": 0.0276, "step": 176530 }, { - "epoch": 0.89, - "learning_rate": 0.00016639994753066178, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023135742817816324, + "loss": 0.014, "step": 176540 }, { - "epoch": 0.89, - "learning_rate": 0.00016639237983764776, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023135353996179178, + "loss": 0.0192, "step": 176550 }, { - "epoch": 0.89, - "learning_rate": 0.00016638481214463374, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.0002313496517454203, + "loss": 0.0204, "step": 176560 }, { - "epoch": 0.89, - "learning_rate": 0.00016637724445161975, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023134576352904884, + "loss": 0.0233, "step": 176570 }, { - "epoch": 0.89, - "learning_rate": 0.00016636967675860573, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023134187531267738, + "loss": 0.0176, "step": 176580 }, { - "epoch": 0.89, - "learning_rate": 0.0001663621090655917, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.00023133798709630592, + "loss": 0.0288, "step": 176590 }, { - "epoch": 0.89, - "learning_rate": 0.00016635454137257767, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023133409887993444, + "loss": 0.0176, "step": 176600 }, { - "epoch": 0.89, - "learning_rate": 0.00016634697367956368, - "loss": 0.014, + "epoch": 0.46, + "learning_rate": 0.00023133021066356298, + "loss": 0.0155, "step": 176610 }, { - "epoch": 0.89, - "learning_rate": 0.00016633940598654966, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023132632244719155, + "loss": 0.0169, "step": 176620 }, { - "epoch": 0.89, - "learning_rate": 0.00016633183829353564, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023132243423082006, + "loss": 0.0171, "step": 176630 }, { - "epoch": 0.89, - "learning_rate": 0.00016632427060052165, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.0002313185460144486, + "loss": 0.0153, "step": 176640 }, { - "epoch": 0.89, - "learning_rate": 0.00016631670290750763, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023131465779807712, + "loss": 0.0169, "step": 176650 }, { - "epoch": 0.89, - "learning_rate": 0.0001663091352144936, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023131076958170563, + "loss": 0.0208, "step": 176660 }, { - "epoch": 0.89, - "learning_rate": 0.00016630156752147962, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.0002313068813653342, + "loss": 0.0256, "step": 176670 }, { - "epoch": 0.89, - "learning_rate": 0.0001662939998284656, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023130299314896274, + "loss": 0.0194, "step": 176680 }, { - "epoch": 0.89, - "learning_rate": 0.00016628643213545158, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023129910493259126, + "loss": 0.0176, "step": 176690 }, { - "epoch": 0.89, - "learning_rate": 0.00016627886444243756, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.0002312952167162198, + "loss": 0.0181, "step": 176700 }, { - "epoch": 0.89, - "learning_rate": 0.00016627129674942357, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023129132849984834, + "loss": 0.0137, "step": 176710 }, { - "epoch": 0.89, - "learning_rate": 0.00016626372905640955, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023128744028347688, + "loss": 0.0165, "step": 176720 }, { - "epoch": 0.89, - "learning_rate": 0.00016625616136339553, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.0002312835520671054, + "loss": 0.0145, "step": 176730 }, { - "epoch": 0.89, - "learning_rate": 0.00016624859367038154, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023127966385073394, + "loss": 0.0159, "step": 176740 }, { - "epoch": 0.89, - "learning_rate": 0.00016624102597736752, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023127577563436248, + "loss": 0.0171, "step": 176750 }, { - "epoch": 0.89, - "learning_rate": 0.0001662334582843535, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.00023127188741799102, + "loss": 0.0172, "step": 176760 }, { - "epoch": 0.89, - "learning_rate": 0.00016622589059133951, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023126799920161954, + "loss": 0.0161, "step": 176770 }, { - "epoch": 0.89, - "learning_rate": 0.0001662183228983255, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023126411098524808, + "loss": 0.0193, "step": 176780 }, { - "epoch": 0.89, - "learning_rate": 0.00016621075520531148, - "loss": 0.0092, + "epoch": 0.46, + "learning_rate": 0.00023126022276887665, + "loss": 0.0193, "step": 176790 }, { - "epoch": 0.89, - "learning_rate": 0.00016620318751229749, - "loss": 0.0084, + "epoch": 0.46, + "learning_rate": 0.00023125633455250516, + "loss": 0.0201, "step": 176800 }, { - "epoch": 0.89, - "learning_rate": 0.00016619561981928347, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.0002312524463361337, + "loss": 0.021, "step": 176810 }, { - "epoch": 0.89, - "learning_rate": 0.00016618805212626945, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023124855811976222, + "loss": 0.0152, "step": 176820 }, { - "epoch": 0.89, - "learning_rate": 0.00016618048443325546, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023124466990339079, + "loss": 0.0168, "step": 176830 }, { - "epoch": 0.89, - "learning_rate": 0.00016617291674024144, - "loss": 0.0094, + "epoch": 0.46, + "learning_rate": 0.0002312407816870193, + "loss": 0.0207, "step": 176840 }, { - "epoch": 0.89, - "learning_rate": 0.00016616534904722742, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023123689347064784, + "loss": 0.0151, "step": 176850 }, { - "epoch": 0.89, - "learning_rate": 0.00016615778135421343, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023123300525427636, + "loss": 0.0174, "step": 176860 }, { - "epoch": 0.89, - "learning_rate": 0.0001661502136611994, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023122911703790493, + "loss": 0.0206, "step": 176870 }, { - "epoch": 0.89, - "learning_rate": 0.0001661426459681854, - "loss": 0.0097, + "epoch": 0.46, + "learning_rate": 0.00023122522882153344, + "loss": 0.0305, "step": 176880 }, { - "epoch": 0.89, - "learning_rate": 0.00016613507827517137, - "loss": 0.0148, + "epoch": 0.46, + "learning_rate": 0.00023122134060516198, + "loss": 0.0193, "step": 176890 }, { - "epoch": 0.89, - "learning_rate": 0.00016612751058215738, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.0002312174523887905, + "loss": 0.0227, "step": 176900 }, { - "epoch": 0.89, - "learning_rate": 0.00016611994288914336, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023121356417241904, + "loss": 0.0175, "step": 176910 }, { - "epoch": 0.89, - "learning_rate": 0.00016611237519612934, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023120967595604758, + "loss": 0.0167, "step": 176920 }, { - "epoch": 0.89, - "learning_rate": 0.00016610480750311535, - "loss": 0.0088, + "epoch": 0.46, + "learning_rate": 0.00023120578773967612, + "loss": 0.0246, "step": 176930 }, { - "epoch": 0.89, - "learning_rate": 0.00016609723981010133, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023120189952330464, + "loss": 0.0182, "step": 176940 }, { - "epoch": 0.89, - "learning_rate": 0.00016608967211708732, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.00023119801130693318, + "loss": 0.0146, "step": 176950 }, { - "epoch": 0.89, - "learning_rate": 0.00016608210442407332, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023119412309056175, + "loss": 0.019, "step": 176960 }, { - "epoch": 0.89, - "learning_rate": 0.0001660745367310593, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023119023487419026, + "loss": 0.0165, "step": 176970 }, { - "epoch": 0.89, - "learning_rate": 0.0001660669690380453, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023118634665781878, + "loss": 0.0148, "step": 176980 }, { - "epoch": 0.89, - "learning_rate": 0.0001660594013450313, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023118245844144732, + "loss": 0.018, "step": 176990 }, { - "epoch": 0.89, - "learning_rate": 0.00016605183365201728, - "loss": 0.0093, + "epoch": 0.46, + "learning_rate": 0.00023117857022507589, + "loss": 0.0189, "step": 177000 }, { - "epoch": 0.89, - "eval_cer": 0.9144896638256703, - "eval_loss": 0.00848294422030449, - "eval_runtime": 116.4993, - "eval_samples_per_second": 17.167, - "eval_steps_per_second": 4.292, + "epoch": 0.46, + "eval_cer": 0.8818174565517705, + "eval_loss": 0.012291929684579372, + "eval_runtime": 107.4295, + "eval_samples_per_second": 18.617, + "eval_steps_per_second": 4.654, "step": 177000 }, { - "epoch": 0.89, - "learning_rate": 0.00016604426595900326, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.0002311746820087044, + "loss": 0.0188, "step": 177010 }, { - "epoch": 0.89, - "learning_rate": 0.00016603669826598927, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.00023117079379233294, + "loss": 0.019, "step": 177020 }, { - "epoch": 0.89, - "learning_rate": 0.00016602913057297525, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023116690557596146, + "loss": 0.0171, "step": 177030 }, { - "epoch": 0.89, - "learning_rate": 0.00016602156287996123, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023116301735959003, + "loss": 0.016, "step": 177040 }, { - "epoch": 0.89, - "learning_rate": 0.0001660139951869472, - "loss": 0.0125, + "epoch": 0.46, + "learning_rate": 0.00023115912914321854, + "loss": 0.0188, "step": 177050 }, { - "epoch": 0.89, - "learning_rate": 0.00016600642749393322, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023115524092684708, + "loss": 0.0175, "step": 177060 }, { - "epoch": 0.89, - "learning_rate": 0.0001659988598009192, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.0002311513527104756, + "loss": 0.0175, "step": 177070 }, { - "epoch": 0.89, - "learning_rate": 0.00016599129210790518, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023114746449410416, + "loss": 0.0163, "step": 177080 }, { - "epoch": 0.89, - "learning_rate": 0.0001659837244148912, - "loss": 0.018, + "epoch": 0.46, + "learning_rate": 0.00023114357627773268, + "loss": 0.0168, "step": 177090 }, { - "epoch": 0.89, - "learning_rate": 0.00016597615672187717, - "loss": 0.0149, + "epoch": 0.46, + "learning_rate": 0.00023113968806136122, + "loss": 0.0147, "step": 177100 }, { - "epoch": 0.89, - "learning_rate": 0.00016596858902886315, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023113579984498974, + "loss": 0.0208, "step": 177110 }, { - "epoch": 0.89, - "learning_rate": 0.00016596102133584916, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.0002311319116286183, + "loss": 0.0163, "step": 177120 }, { - "epoch": 0.89, - "learning_rate": 0.00016595345364283514, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023112802341224682, + "loss": 0.0193, "step": 177130 }, { - "epoch": 0.89, - "learning_rate": 0.00016594588594982113, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023112413519587536, + "loss": 0.0142, "step": 177140 }, { - "epoch": 0.89, - "learning_rate": 0.00016593831825680713, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023112024697950387, + "loss": 0.0232, "step": 177150 }, { - "epoch": 0.89, - "learning_rate": 0.00016593075056379312, - "loss": 0.0133, + "epoch": 0.46, + "learning_rate": 0.00023111635876313242, + "loss": 0.0194, "step": 177160 }, { - "epoch": 0.89, - "learning_rate": 0.0001659231828707791, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023111247054676099, + "loss": 0.0161, "step": 177170 }, { - "epoch": 0.89, - "learning_rate": 0.0001659156151777651, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002311085823303895, + "loss": 0.0209, "step": 177180 }, { - "epoch": 0.89, - "learning_rate": 0.0001659080474847511, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023110469411401804, + "loss": 0.017, "step": 177190 }, { - "epoch": 0.89, - "learning_rate": 0.00016590047979173707, - "loss": 0.0091, + "epoch": 0.46, + "learning_rate": 0.00023110080589764656, + "loss": 0.016, "step": 177200 }, { - "epoch": 0.89, - "learning_rate": 0.00016589291209872305, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023109691768127512, + "loss": 0.02, "step": 177210 }, { - "epoch": 0.89, - "learning_rate": 0.00016588534440570906, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023109302946490364, + "loss": 0.0143, "step": 177220 }, { - "epoch": 0.89, - "learning_rate": 0.00016587777671269504, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.00023108914124853218, + "loss": 0.0188, "step": 177230 }, { - "epoch": 0.89, - "learning_rate": 0.00016587020901968102, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.0002310852530321607, + "loss": 0.0174, "step": 177240 }, { - "epoch": 0.89, - "learning_rate": 0.00016586264132666703, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023108136481578926, + "loss": 0.0157, "step": 177250 }, { - "epoch": 0.89, - "learning_rate": 0.000165855073633653, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023107747659941778, + "loss": 0.0236, "step": 177260 }, { - "epoch": 0.89, - "learning_rate": 0.000165847505940639, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023107358838304632, + "loss": 0.0224, "step": 177270 }, { - "epoch": 0.89, - "learning_rate": 0.000165839938247625, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.00023106970016667483, + "loss": 0.0243, "step": 177280 }, { - "epoch": 0.89, - "learning_rate": 0.00016583237055461098, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.0002310658119503034, + "loss": 0.0238, "step": 177290 }, { - "epoch": 0.89, - "learning_rate": 0.00016582480286159696, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023106192373393192, + "loss": 0.0156, "step": 177300 }, { - "epoch": 0.89, - "learning_rate": 0.00016581723516858297, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023105803551756046, + "loss": 0.0168, "step": 177310 }, { - "epoch": 0.89, - "learning_rate": 0.00016580966747556895, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023105414730118897, + "loss": 0.0166, "step": 177320 }, { - "epoch": 0.89, - "learning_rate": 0.00016580209978255494, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023105025908481754, + "loss": 0.0173, "step": 177330 }, { - "epoch": 0.89, - "learning_rate": 0.00016579453208954094, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023104637086844608, + "loss": 0.0244, "step": 177340 }, { - "epoch": 0.89, - "learning_rate": 0.00016578696439652693, - "loss": 0.0089, + "epoch": 0.46, + "learning_rate": 0.0002310424826520746, + "loss": 0.0164, "step": 177350 }, { - "epoch": 0.89, - "learning_rate": 0.0001657793967035129, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.00023103859443570314, + "loss": 0.0201, "step": 177360 }, { - "epoch": 0.89, - "learning_rate": 0.0001657718290104989, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.00023103470621933168, + "loss": 0.0168, "step": 177370 }, { - "epoch": 0.89, - "learning_rate": 0.0001657642613174849, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023103081800296022, + "loss": 0.022, "step": 177380 }, { - "epoch": 0.89, - "learning_rate": 0.00016575669362447088, - "loss": 0.0082, + "epoch": 0.46, + "learning_rate": 0.00023102692978658874, + "loss": 0.0291, "step": 177390 }, { - "epoch": 0.9, - "learning_rate": 0.00016574912593145686, - "loss": 0.0158, + "epoch": 0.46, + "learning_rate": 0.00023102304157021728, + "loss": 0.0238, "step": 177400 }, { - "epoch": 0.9, - "learning_rate": 0.00016574155823844287, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.0002310191533538458, + "loss": 0.0196, "step": 177410 }, { - "epoch": 0.9, - "learning_rate": 0.00016573399054542885, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023101526513747436, + "loss": 0.029, "step": 177420 }, { - "epoch": 0.9, - "learning_rate": 0.00016572642285241483, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023101137692110288, + "loss": 0.027, "step": 177430 }, { - "epoch": 0.9, - "learning_rate": 0.00016571885515940084, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023100748870473142, + "loss": 0.0157, "step": 177440 }, { - "epoch": 0.9, - "learning_rate": 0.00016571128746638682, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023100360048835993, + "loss": 0.0147, "step": 177450 }, { - "epoch": 0.9, - "learning_rate": 0.0001657037197733728, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002309997122719885, + "loss": 0.015, "step": 177460 }, { - "epoch": 0.9, - "learning_rate": 0.0001656961520803588, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023099582405561702, + "loss": 0.0377, "step": 177470 }, { - "epoch": 0.9, - "learning_rate": 0.0001656885843873448, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023099193583924556, + "loss": 0.0661, "step": 177480 }, { - "epoch": 0.9, - "learning_rate": 0.00016568101669433077, - "loss": 0.0092, + "epoch": 0.46, + "learning_rate": 0.00023098804762287407, + "loss": 0.0178, "step": 177490 }, { - "epoch": 0.9, - "learning_rate": 0.00016567344900131678, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023098415940650264, + "loss": 0.0147, "step": 177500 }, { - "epoch": 0.9, - "learning_rate": 0.00016566588130830276, - "loss": 0.0098, + "epoch": 0.46, + "learning_rate": 0.00023098027119013118, + "loss": 0.014, "step": 177510 }, { - "epoch": 0.9, - "learning_rate": 0.00016565831361528875, - "loss": 0.0162, + "epoch": 0.46, + "learning_rate": 0.0002309763829737597, + "loss": 0.0189, "step": 177520 }, { - "epoch": 0.9, - "learning_rate": 0.00016565074592227475, - "loss": 0.0133, + "epoch": 0.46, + "learning_rate": 0.00023097249475738824, + "loss": 0.0175, "step": 177530 }, { - "epoch": 0.9, - "learning_rate": 0.00016564317822926074, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023096860654101678, + "loss": 0.0194, "step": 177540 }, { - "epoch": 0.9, - "learning_rate": 0.00016563561053624672, - "loss": 0.0091, + "epoch": 0.46, + "learning_rate": 0.00023096471832464532, + "loss": 0.0175, "step": 177550 }, { - "epoch": 0.9, - "learning_rate": 0.0001656280428432327, - "loss": 0.0135, + "epoch": 0.46, + "learning_rate": 0.00023096083010827384, + "loss": 0.015, "step": 177560 }, { - "epoch": 0.9, - "learning_rate": 0.0001656204751502187, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023095694189190238, + "loss": 0.0151, "step": 177570 }, { - "epoch": 0.9, - "learning_rate": 0.0001656129074572047, - "loss": 0.01, + "epoch": 0.46, + "learning_rate": 0.00023095305367553092, + "loss": 0.0206, "step": 177580 }, { - "epoch": 0.9, - "learning_rate": 0.00016560533976419067, - "loss": 0.0166, + "epoch": 0.46, + "learning_rate": 0.00023094916545915946, + "loss": 0.0188, "step": 177590 }, { - "epoch": 0.9, - "learning_rate": 0.00016559777207117668, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023094527724278798, + "loss": 0.0227, "step": 177600 }, { - "epoch": 0.9, - "learning_rate": 0.00016559020437816266, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023094138902641652, + "loss": 0.0259, "step": 177610 }, { - "epoch": 0.9, - "learning_rate": 0.00016558263668514864, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023093750081004506, + "loss": 0.0185, "step": 177620 }, { - "epoch": 0.9, - "learning_rate": 0.00016557506899213465, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.0002309336125936736, + "loss": 0.02, "step": 177630 }, { - "epoch": 0.9, - "learning_rate": 0.00016556750129912063, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023092972437730212, + "loss": 0.0212, "step": 177640 }, { - "epoch": 0.9, - "learning_rate": 0.0001655599336061066, - "loss": 0.0129, + "epoch": 0.46, + "learning_rate": 0.00023092583616093066, + "loss": 0.0175, "step": 177650 }, { - "epoch": 0.9, - "learning_rate": 0.00016555236591309262, - "loss": 0.0106, + "epoch": 0.46, + "learning_rate": 0.00023092194794455917, + "loss": 0.0176, "step": 177660 }, { - "epoch": 0.9, - "learning_rate": 0.0001655447982200786, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023091805972818774, + "loss": 0.0188, "step": 177670 }, { - "epoch": 0.9, - "learning_rate": 0.00016553723052706458, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023091417151181628, + "loss": 0.0175, "step": 177680 }, { - "epoch": 0.9, - "learning_rate": 0.0001655296628340506, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002309102832954448, + "loss": 0.0167, "step": 177690 }, { - "epoch": 0.9, - "learning_rate": 0.00016552209514103657, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.0002309063950790733, + "loss": 0.0149, "step": 177700 }, { - "epoch": 0.9, - "learning_rate": 0.00016551452744802256, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023090250686270188, + "loss": 0.0167, "step": 177710 }, { - "epoch": 0.9, - "learning_rate": 0.00016550695975500854, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023089861864633042, + "loss": 0.0154, "step": 177720 }, { - "epoch": 0.9, - "learning_rate": 0.00016549939206199455, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023089473042995894, + "loss": 0.0165, "step": 177730 }, { - "epoch": 0.9, - "learning_rate": 0.00016549182436898053, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023089084221358748, + "loss": 0.0153, "step": 177740 }, { - "epoch": 0.9, - "learning_rate": 0.0001654842566759665, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023088695399721602, + "loss": 0.0181, "step": 177750 }, { - "epoch": 0.9, - "learning_rate": 0.00016547668898295252, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023088306578084456, + "loss": 0.021, "step": 177760 }, { - "epoch": 0.9, - "learning_rate": 0.0001654691212899385, - "loss": 0.0077, + "epoch": 0.46, + "learning_rate": 0.00023087917756447308, + "loss": 0.0199, "step": 177770 }, { - "epoch": 0.9, - "learning_rate": 0.00016546155359692448, - "loss": 0.0153, + "epoch": 0.46, + "learning_rate": 0.00023087528934810162, + "loss": 0.0179, "step": 177780 }, { - "epoch": 0.9, - "learning_rate": 0.0001654539859039105, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023087140113173016, + "loss": 0.0164, "step": 177790 }, { - "epoch": 0.9, - "learning_rate": 0.00016544641821089647, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002308675129153587, + "loss": 0.0189, "step": 177800 }, { - "epoch": 0.9, - "learning_rate": 0.00016543885051788245, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023086362469898722, + "loss": 0.018, "step": 177810 }, { - "epoch": 0.9, - "learning_rate": 0.00016543128282486846, - "loss": 0.0144, + "epoch": 0.46, + "learning_rate": 0.00023085973648261576, + "loss": 0.022, "step": 177820 }, { - "epoch": 0.9, - "learning_rate": 0.00016542371513185444, - "loss": 0.0089, + "epoch": 0.46, + "learning_rate": 0.00023085584826624433, + "loss": 0.0193, "step": 177830 }, { - "epoch": 0.9, - "learning_rate": 0.00016541614743884042, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023085196004987284, + "loss": 0.0152, "step": 177840 }, { - "epoch": 0.9, - "learning_rate": 0.00016540857974582638, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.00023084807183350136, + "loss": 0.0175, "step": 177850 }, { - "epoch": 0.9, - "learning_rate": 0.00016540101205281239, - "loss": 0.0095, - "step": 177860 + "epoch": 0.46, + "learning_rate": 0.0002308441836171299, + "loss": 0.0161, + "step": 177860 }, { - "epoch": 0.9, - "learning_rate": 0.00016539344435979837, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023084029540075847, + "loss": 0.018, "step": 177870 }, { - "epoch": 0.9, - "learning_rate": 0.00016538587666678435, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023083640718438698, + "loss": 0.0157, "step": 177880 }, { - "epoch": 0.9, - "learning_rate": 0.00016537830897377036, - "loss": 0.0156, + "epoch": 0.46, + "learning_rate": 0.00023083251896801552, + "loss": 0.0174, "step": 177890 }, { - "epoch": 0.9, - "learning_rate": 0.00016537074128075634, - "loss": 0.0145, + "epoch": 0.46, + "learning_rate": 0.00023082863075164404, + "loss": 0.0158, "step": 177900 }, { - "epoch": 0.9, - "learning_rate": 0.00016536317358774232, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023082474253527258, + "loss": 0.0157, "step": 177910 }, { - "epoch": 0.9, - "learning_rate": 0.00016535560589472833, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023082085431890112, + "loss": 0.012, "step": 177920 }, { - "epoch": 0.9, - "learning_rate": 0.0001653480382017143, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023081696610252966, + "loss": 0.0153, "step": 177930 }, { - "epoch": 0.9, - "learning_rate": 0.0001653404705087003, - "loss": 0.0139, + "epoch": 0.46, + "learning_rate": 0.00023081307788615818, + "loss": 0.0143, "step": 177940 }, { - "epoch": 0.9, - "learning_rate": 0.00016533290281568627, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023080918966978672, + "loss": 0.0185, "step": 177950 }, { - "epoch": 0.9, - "learning_rate": 0.00016532533512267228, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023080530145341526, + "loss": 0.0155, "step": 177960 }, { - "epoch": 0.9, - "learning_rate": 0.00016531776742965826, - "loss": 0.014, + "epoch": 0.46, + "learning_rate": 0.0002308014132370438, + "loss": 0.0145, "step": 177970 }, { - "epoch": 0.9, - "learning_rate": 0.00016531019973664424, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023079752502067232, + "loss": 0.0178, "step": 177980 }, { - "epoch": 0.9, - "learning_rate": 0.00016530263204363025, - "loss": 0.0126, + "epoch": 0.46, + "learning_rate": 0.00023079363680430086, + "loss": 0.0188, "step": 177990 }, { - "epoch": 0.9, - "learning_rate": 0.00016529506435061623, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023078974858792943, + "loss": 0.0162, "step": 178000 }, { - "epoch": 0.9, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.008248904719948769, - "eval_runtime": 116.6185, - "eval_samples_per_second": 17.15, - "eval_steps_per_second": 4.287, + "epoch": 0.46, + "eval_cer": 0.8817698688960084, + "eval_loss": 0.012205556035041809, + "eval_runtime": 108.0603, + "eval_samples_per_second": 18.508, + "eval_steps_per_second": 4.627, "step": 178000 }, { - "epoch": 0.9, - "learning_rate": 0.00016528749665760222, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023078586037155794, + "loss": 0.0186, "step": 178010 }, { - "epoch": 0.9, - "learning_rate": 0.00016527992896458822, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023078197215518646, + "loss": 0.0161, "step": 178020 }, { - "epoch": 0.9, - "learning_rate": 0.0001652723612715742, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.000230778083938815, + "loss": 0.021, "step": 178030 }, { - "epoch": 0.9, - "learning_rate": 0.0001652647935785602, - "loss": 0.0159, + "epoch": 0.46, + "learning_rate": 0.00023077419572244357, + "loss": 0.0192, "step": 178040 }, { - "epoch": 0.9, - "learning_rate": 0.0001652572258855462, - "loss": 0.0093, + "epoch": 0.46, + "learning_rate": 0.00023077030750607208, + "loss": 0.0163, "step": 178050 }, { - "epoch": 0.9, - "learning_rate": 0.00016524965819253218, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023076641928970062, + "loss": 0.0176, "step": 178060 }, { - "epoch": 0.9, - "learning_rate": 0.00016524209049951816, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023076253107332914, + "loss": 0.018, "step": 178070 }, { - "epoch": 0.9, - "learning_rate": 0.00016523452280650417, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.0002307586428569577, + "loss": 0.0179, "step": 178080 }, { - "epoch": 0.9, - "learning_rate": 0.00016522695511349015, - "loss": 0.0162, + "epoch": 0.46, + "learning_rate": 0.00023075475464058622, + "loss": 0.018, "step": 178090 }, { - "epoch": 0.9, - "learning_rate": 0.00016521938742047613, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.00023075086642421476, + "loss": 0.0154, "step": 178100 }, { - "epoch": 0.9, - "learning_rate": 0.0001652118197274621, - "loss": 0.0091, + "epoch": 0.46, + "learning_rate": 0.00023074697820784328, + "loss": 0.0198, "step": 178110 }, { - "epoch": 0.9, - "learning_rate": 0.00016520425203444812, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023074308999147184, + "loss": 0.0348, "step": 178120 }, { - "epoch": 0.9, - "learning_rate": 0.0001651966843414341, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023073920177510036, + "loss": 0.019, "step": 178130 }, { - "epoch": 0.9, - "learning_rate": 0.00016518911664842008, - "loss": 0.0081, + "epoch": 0.46, + "learning_rate": 0.0002307353135587289, + "loss": 0.0224, "step": 178140 }, { - "epoch": 0.9, - "learning_rate": 0.0001651815489554061, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023073142534235742, + "loss": 0.0216, "step": 178150 }, { - "epoch": 0.9, - "learning_rate": 0.00016517398126239207, - "loss": 0.0127, + "epoch": 0.46, + "learning_rate": 0.00023072753712598596, + "loss": 0.0172, "step": 178160 }, { - "epoch": 0.9, - "learning_rate": 0.00016516641356937805, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.0002307236489096145, + "loss": 0.0143, "step": 178170 }, { - "epoch": 0.9, - "learning_rate": 0.00016515884587636406, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023071976069324304, + "loss": 0.0223, "step": 178180 }, { - "epoch": 0.9, - "learning_rate": 0.00016515127818335004, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023071587247687155, + "loss": 0.0182, "step": 178190 }, { - "epoch": 0.9, - "learning_rate": 0.00016514371049033603, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.0002307119842605001, + "loss": 0.0173, "step": 178200 }, { - "epoch": 0.9, - "learning_rate": 0.00016513614279732203, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023070809604412867, + "loss": 0.0213, "step": 178210 }, { - "epoch": 0.9, - "learning_rate": 0.00016512857510430802, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023070420782775718, + "loss": 0.0195, "step": 178220 }, { - "epoch": 0.9, - "learning_rate": 0.000165121007411294, - "loss": 0.0114, + "epoch": 0.46, + "learning_rate": 0.00023070031961138572, + "loss": 0.0156, "step": 178230 }, { - "epoch": 0.9, - "learning_rate": 0.00016511343971828, - "loss": 0.0152, + "epoch": 0.46, + "learning_rate": 0.00023069643139501424, + "loss": 0.0213, "step": 178240 }, { - "epoch": 0.9, - "learning_rate": 0.000165105872025266, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.0002306925431786428, + "loss": 0.0241, "step": 178250 }, { - "epoch": 0.9, - "learning_rate": 0.00016509830433225197, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023068865496227132, + "loss": 0.0165, "step": 178260 }, { - "epoch": 0.9, - "learning_rate": 0.00016509073663923795, - "loss": 0.0172, + "epoch": 0.46, + "learning_rate": 0.00023068476674589986, + "loss": 0.0162, "step": 178270 }, { - "epoch": 0.9, - "learning_rate": 0.00016508316894622396, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023068087852952838, + "loss": 0.0222, "step": 178280 }, { - "epoch": 0.9, - "learning_rate": 0.00016507560125320994, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023067699031315694, + "loss": 0.0125, "step": 178290 }, { - "epoch": 0.9, - "learning_rate": 0.00016506803356019592, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023067310209678546, + "loss": 0.0184, "step": 178300 }, { - "epoch": 0.9, - "learning_rate": 0.00016506046586718193, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.000230669213880414, + "loss": 0.0156, "step": 178310 }, { - "epoch": 0.9, - "learning_rate": 0.0001650528981741679, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023066532566404251, + "loss": 0.0161, "step": 178320 }, { - "epoch": 0.9, - "learning_rate": 0.0001650453304811539, - "loss": 0.0095, + "epoch": 0.46, + "learning_rate": 0.00023066143744767108, + "loss": 0.0137, "step": 178330 }, { - "epoch": 0.9, - "learning_rate": 0.0001650377627881399, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.0002306575492312996, + "loss": 0.0228, "step": 178340 }, { - "epoch": 0.9, - "learning_rate": 0.00016503019509512588, - "loss": 0.0137, + "epoch": 0.46, + "learning_rate": 0.00023065366101492814, + "loss": 0.0265, "step": 178350 }, { - "epoch": 0.9, - "learning_rate": 0.00016502262740211186, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023064977279855665, + "loss": 0.0169, "step": 178360 }, { - "epoch": 0.9, - "learning_rate": 0.00016501505970909787, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.00023064588458218522, + "loss": 0.0174, "step": 178370 }, { - "epoch": 0.9, - "learning_rate": 0.00016500749201608385, - "loss": 0.0089, + "epoch": 0.46, + "learning_rate": 0.00023064199636581376, + "loss": 0.0237, "step": 178380 }, { - "epoch": 0.9, - "learning_rate": 0.00016499992432306984, - "loss": 0.0141, + "epoch": 0.46, + "learning_rate": 0.00023063810814944228, + "loss": 0.015, "step": 178390 }, { - "epoch": 0.9, - "learning_rate": 0.00016499235663005584, - "loss": 0.0121, + "epoch": 0.46, + "learning_rate": 0.00023063421993307082, + "loss": 0.017, "step": 178400 }, { - "epoch": 0.9, - "learning_rate": 0.00016498478893704183, - "loss": 0.013, + "epoch": 0.46, + "learning_rate": 0.00023063033171669934, + "loss": 0.0204, "step": 178410 }, { - "epoch": 0.9, - "learning_rate": 0.0001649772212440278, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.0002306264435003279, + "loss": 0.0179, "step": 178420 }, { - "epoch": 0.9, - "learning_rate": 0.00016496965355101382, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.00023062255528395642, + "loss": 0.0163, "step": 178430 }, { - "epoch": 0.9, - "learning_rate": 0.0001649620858579998, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.00023061866706758496, + "loss": 0.015, "step": 178440 }, { - "epoch": 0.9, - "learning_rate": 0.00016495451816498578, - "loss": 0.0133, + "epoch": 0.46, + "learning_rate": 0.00023061477885121347, + "loss": 0.0226, "step": 178450 }, { - "epoch": 0.9, - "learning_rate": 0.00016494695047197176, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023061089063484204, + "loss": 0.0232, "step": 178460 }, { - "epoch": 0.9, - "learning_rate": 0.00016493938277895777, - "loss": 0.0093, + "epoch": 0.46, + "learning_rate": 0.00023060700241847056, + "loss": 0.0203, "step": 178470 }, { - "epoch": 0.9, - "learning_rate": 0.00016493181508594375, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002306031142020991, + "loss": 0.0138, "step": 178480 }, { - "epoch": 0.9, - "learning_rate": 0.00016492424739292973, - "loss": 0.0208, + "epoch": 0.46, + "learning_rate": 0.00023059922598572761, + "loss": 0.0187, "step": 178490 }, { - "epoch": 0.9, - "learning_rate": 0.00016491667969991574, - "loss": 0.0219, + "epoch": 0.46, + "learning_rate": 0.00023059533776935618, + "loss": 0.0148, "step": 178500 }, { - "epoch": 0.9, - "learning_rate": 0.00016490911200690172, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.0002305914495529847, + "loss": 0.0155, "step": 178510 }, { - "epoch": 0.9, - "learning_rate": 0.0001649015443138877, - "loss": 0.0267, + "epoch": 0.46, + "learning_rate": 0.00023058756133661324, + "loss": 0.0157, "step": 178520 }, { - "epoch": 0.9, - "learning_rate": 0.0001648939766208737, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023058367312024175, + "loss": 0.0191, "step": 178530 }, { - "epoch": 0.9, - "learning_rate": 0.0001648864089278597, - "loss": 0.0128, + "epoch": 0.46, + "learning_rate": 0.00023057978490387032, + "loss": 0.0177, "step": 178540 }, { - "epoch": 0.9, - "learning_rate": 0.00016487884123484567, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023057589668749886, + "loss": 0.0128, "step": 178550 }, { - "epoch": 0.9, - "learning_rate": 0.00016487127354183168, - "loss": 0.0133, + "epoch": 0.46, + "learning_rate": 0.00023057200847112738, + "loss": 0.0155, "step": 178560 }, { - "epoch": 0.9, - "learning_rate": 0.00016486370584881766, - "loss": 0.0131, + "epoch": 0.46, + "learning_rate": 0.0002305681202547559, + "loss": 0.0184, "step": 178570 }, { - "epoch": 0.9, - "learning_rate": 0.00016485613815580365, - "loss": 0.0102, + "epoch": 0.46, + "learning_rate": 0.00023056423203838446, + "loss": 0.0172, "step": 178580 }, { - "epoch": 0.9, - "learning_rate": 0.00016484857046278965, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.000230560343822013, + "loss": 0.0193, "step": 178590 }, { - "epoch": 0.9, - "learning_rate": 0.00016484100276977564, - "loss": 0.0111, + "epoch": 0.46, + "learning_rate": 0.00023055645560564152, + "loss": 0.0177, "step": 178600 }, { - "epoch": 0.9, - "learning_rate": 0.00016483343507676162, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.00023055256738927006, + "loss": 0.0179, "step": 178610 }, { - "epoch": 0.9, - "learning_rate": 0.0001648258673837476, - "loss": 0.0086, + "epoch": 0.46, + "learning_rate": 0.0002305486791728986, + "loss": 0.0209, "step": 178620 }, { - "epoch": 0.9, - "learning_rate": 0.0001648182996907336, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023054479095652714, + "loss": 0.0197, "step": 178630 }, { - "epoch": 0.9, - "learning_rate": 0.0001648107319977196, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.00023054090274015566, + "loss": 0.0171, "step": 178640 }, { - "epoch": 0.9, - "learning_rate": 0.00016480316430470557, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.0002305370145237842, + "loss": 0.0192, "step": 178650 }, { - "epoch": 0.9, - "learning_rate": 0.00016479559661169158, - "loss": 0.0107, + "epoch": 0.46, + "learning_rate": 0.0002305331263074127, + "loss": 0.0181, "step": 178660 }, { - "epoch": 0.9, - "learning_rate": 0.00016478802891867756, - "loss": 0.0094, + "epoch": 0.46, + "learning_rate": 0.00023052923809104128, + "loss": 0.0172, "step": 178670 }, { - "epoch": 0.9, - "learning_rate": 0.00016478046122566354, - "loss": 0.0101, + "epoch": 0.46, + "learning_rate": 0.0002305253498746698, + "loss": 0.0187, "step": 178680 }, { - "epoch": 0.9, - "learning_rate": 0.00016477289353264955, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023052146165829834, + "loss": 0.0199, "step": 178690 }, { - "epoch": 0.9, - "learning_rate": 0.00016476532583963553, - "loss": 0.01, + "epoch": 0.46, + "learning_rate": 0.00023051757344192685, + "loss": 0.0156, "step": 178700 }, { - "epoch": 0.9, - "learning_rate": 0.0001647577581466215, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023051368522555542, + "loss": 0.0206, "step": 178710 }, { - "epoch": 0.9, - "learning_rate": 0.00016475019045360752, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023050979700918394, + "loss": 0.0161, "step": 178720 }, { - "epoch": 0.9, - "learning_rate": 0.0001647426227605935, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023050590879281248, + "loss": 0.0167, "step": 178730 }, { - "epoch": 0.9, - "learning_rate": 0.00016473505506757948, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.000230502020576441, + "loss": 0.0187, "step": 178740 }, { - "epoch": 0.9, - "learning_rate": 0.0001647274873745655, - "loss": 0.0158, + "epoch": 0.46, + "learning_rate": 0.00023049813236006956, + "loss": 0.0207, "step": 178750 }, { - "epoch": 0.9, - "learning_rate": 0.00016471991968155147, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002304942441436981, + "loss": 0.0168, "step": 178760 }, { - "epoch": 0.9, - "learning_rate": 0.00016471235198853746, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023049035592732662, + "loss": 0.0234, "step": 178770 }, { - "epoch": 0.9, - "learning_rate": 0.00016470478429552344, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023048646771095516, + "loss": 0.0169, "step": 178780 }, { - "epoch": 0.9, - "learning_rate": 0.00016469721660250945, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.0002304825794945837, + "loss": 0.0163, "step": 178790 }, { - "epoch": 0.9, - "learning_rate": 0.00016468964890949543, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023047869127821224, + "loss": 0.0151, "step": 178800 }, { - "epoch": 0.9, - "learning_rate": 0.0001646820812164814, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.00023047480306184076, + "loss": 0.0164, "step": 178810 }, { - "epoch": 0.9, - "learning_rate": 0.00016467451352346742, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.0002304709148454693, + "loss": 0.0136, "step": 178820 }, { - "epoch": 0.9, - "learning_rate": 0.0001646669458304534, - "loss": 0.0146, + "epoch": 0.46, + "learning_rate": 0.00023046702662909784, + "loss": 0.0201, "step": 178830 }, { - "epoch": 0.9, - "learning_rate": 0.00016465937813743938, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023046313841272638, + "loss": 0.0149, "step": 178840 }, { - "epoch": 0.9, - "learning_rate": 0.0001646518104444254, - "loss": 0.012, + "epoch": 0.46, + "learning_rate": 0.0002304592501963549, + "loss": 0.0172, "step": 178850 }, { - "epoch": 0.9, - "learning_rate": 0.00016464424275141137, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023045536197998344, + "loss": 0.0168, "step": 178860 }, { - "epoch": 0.9, - "learning_rate": 0.00016463667505839735, - "loss": 0.0084, + "epoch": 0.46, + "learning_rate": 0.000230451473763612, + "loss": 0.022, "step": 178870 }, { - "epoch": 0.9, - "learning_rate": 0.00016462910736538336, - "loss": 0.0092, + "epoch": 0.46, + "learning_rate": 0.00023044758554724052, + "loss": 0.0174, "step": 178880 }, { - "epoch": 0.9, - "learning_rate": 0.00016462153967236934, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.00023044369733086904, + "loss": 0.0209, "step": 178890 }, { - "epoch": 0.9, - "learning_rate": 0.00016461397197935532, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023043980911449758, + "loss": 0.0179, "step": 178900 }, { - "epoch": 0.9, - "learning_rate": 0.00016460640428634133, - "loss": 0.0132, + "epoch": 0.46, + "learning_rate": 0.0002304359208981261, + "loss": 0.0188, "step": 178910 }, { - "epoch": 0.9, - "learning_rate": 0.0001645988365933273, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023043203268175466, + "loss": 0.0172, "step": 178920 }, { - "epoch": 0.9, - "learning_rate": 0.0001645912689003133, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.0002304281444653832, + "loss": 0.0202, "step": 178930 }, { - "epoch": 0.9, - "learning_rate": 0.0001645837012072993, - "loss": 0.0108, + "epoch": 0.46, + "learning_rate": 0.00023042425624901172, + "loss": 0.0203, "step": 178940 }, { - "epoch": 0.9, - "learning_rate": 0.00016457613351428528, - "loss": 0.0109, + "epoch": 0.46, + "learning_rate": 0.00023042036803264026, + "loss": 0.0182, "step": 178950 }, { - "epoch": 0.9, - "learning_rate": 0.00016456856582127127, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.0002304164798162688, + "loss": 0.0284, "step": 178960 }, { - "epoch": 0.9, - "learning_rate": 0.00016456099812825725, - "loss": 0.0142, + "epoch": 0.46, + "learning_rate": 0.00023041259159989734, + "loss": 0.0226, "step": 178970 }, { - "epoch": 0.9, - "learning_rate": 0.00016455343043524326, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023040870338352586, + "loss": 0.0167, "step": 178980 }, { - "epoch": 0.9, - "learning_rate": 0.00016454586274222924, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.0002304048151671544, + "loss": 0.0144, "step": 178990 }, { - "epoch": 0.9, - "learning_rate": 0.00016453829504921522, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023040092695078294, + "loss": 0.0166, "step": 179000 }, { - "epoch": 0.9, - "eval_cer": 0.914462492734159, - "eval_loss": 0.008126331493258476, - "eval_runtime": 116.7985, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.46, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.012226469814777374, + "eval_runtime": 108.116, + "eval_samples_per_second": 18.499, + "eval_steps_per_second": 4.625, "step": 179000 }, { - "epoch": 0.9, - "learning_rate": 0.00016453072735620123, - "loss": 0.0122, + "epoch": 0.46, + "learning_rate": 0.00023039703873441148, + "loss": 0.0176, "step": 179010 }, { - "epoch": 0.9, - "learning_rate": 0.0001645231596631872, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023039315051804, + "loss": 0.0151, "step": 179020 }, { - "epoch": 0.9, - "learning_rate": 0.0001645155919701732, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.00023038926230166854, + "loss": 0.021, "step": 179030 }, { - "epoch": 0.9, - "learning_rate": 0.0001645080242771592, - "loss": 0.0118, + "epoch": 0.46, + "learning_rate": 0.00023038537408529708, + "loss": 0.0225, "step": 179040 }, { - "epoch": 0.9, - "learning_rate": 0.00016450045658414518, - "loss": 0.0124, + "epoch": 0.46, + "learning_rate": 0.00023038148586892562, + "loss": 0.0185, "step": 179050 }, { - "epoch": 0.9, - "learning_rate": 0.00016449288889113116, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023037759765255414, + "loss": 0.0163, "step": 179060 }, { - "epoch": 0.9, - "learning_rate": 0.00016448532119811717, - "loss": 0.0093, + "epoch": 0.46, + "learning_rate": 0.00023037370943618268, + "loss": 0.0141, "step": 179070 }, { - "epoch": 0.9, - "learning_rate": 0.00016447775350510315, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023036982121981125, + "loss": 0.0185, "step": 179080 }, { - "epoch": 0.9, - "learning_rate": 0.00016447018581208913, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023036593300343976, + "loss": 0.0155, "step": 179090 }, { - "epoch": 0.9, - "learning_rate": 0.00016446261811907514, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.0002303620447870683, + "loss": 0.0151, "step": 179100 }, { - "epoch": 0.9, - "learning_rate": 0.0001644550504260611, - "loss": 0.0172, + "epoch": 0.46, + "learning_rate": 0.00023035815657069682, + "loss": 0.0149, "step": 179110 }, { - "epoch": 0.9, - "learning_rate": 0.00016444748273304708, - "loss": 0.0158, + "epoch": 0.46, + "learning_rate": 0.00023035426835432538, + "loss": 0.0195, "step": 179120 }, { - "epoch": 0.9, - "learning_rate": 0.00016443991504003306, - "loss": 0.0119, + "epoch": 0.46, + "learning_rate": 0.0002303503801379539, + "loss": 0.0186, "step": 179130 }, { - "epoch": 0.9, - "learning_rate": 0.00016443234734701907, - "loss": 0.0134, + "epoch": 0.46, + "learning_rate": 0.00023034649192158244, + "loss": 0.0196, "step": 179140 }, { - "epoch": 0.9, - "learning_rate": 0.00016442477965400505, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023034260370521096, + "loss": 0.0166, "step": 179150 }, { - "epoch": 0.9, - "learning_rate": 0.00016441721196099103, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.0002303387154888395, + "loss": 0.019, "step": 179160 }, { - "epoch": 0.9, - "learning_rate": 0.000164409644267977, - "loss": 0.0117, + "epoch": 0.46, + "learning_rate": 0.00023033482727246804, + "loss": 0.0222, "step": 179170 }, { - "epoch": 0.9, - "learning_rate": 0.00016440207657496302, - "loss": 0.0097, + "epoch": 0.46, + "learning_rate": 0.00023033093905609658, + "loss": 0.0189, "step": 179180 }, { - "epoch": 0.9, - "learning_rate": 0.000164394508881949, - "loss": 0.0103, + "epoch": 0.46, + "learning_rate": 0.0002303270508397251, + "loss": 0.0173, "step": 179190 }, { - "epoch": 0.9, - "learning_rate": 0.00016438694118893498, - "loss": 0.0105, + "epoch": 0.46, + "learning_rate": 0.00023032316262335364, + "loss": 0.0197, "step": 179200 }, { - "epoch": 0.9, - "learning_rate": 0.000164379373495921, - "loss": 0.0112, + "epoch": 0.46, + "learning_rate": 0.00023031927440698218, + "loss": 0.0209, "step": 179210 }, { - "epoch": 0.9, - "learning_rate": 0.00016437180580290697, - "loss": 0.0147, + "epoch": 0.46, + "learning_rate": 0.00023031538619061072, + "loss": 0.0207, "step": 179220 }, { - "epoch": 0.9, - "learning_rate": 0.00016436423810989295, - "loss": 0.0154, + "epoch": 0.46, + "learning_rate": 0.00023031149797423923, + "loss": 0.0193, "step": 179230 }, { - "epoch": 0.9, - "learning_rate": 0.00016435667041687896, - "loss": 0.0091, + "epoch": 0.46, + "learning_rate": 0.00023030760975786778, + "loss": 0.0139, "step": 179240 }, { - "epoch": 0.9, - "learning_rate": 0.00016434910272386494, - "loss": 0.0099, + "epoch": 0.46, + "learning_rate": 0.00023030372154149634, + "loss": 0.02, "step": 179250 }, { - "epoch": 0.9, - "learning_rate": 0.00016434153503085093, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.00023029983332512486, + "loss": 0.0165, "step": 179260 }, { - "epoch": 0.9, - "learning_rate": 0.00016433396733783693, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.0002302959451087534, + "loss": 0.018, "step": 179270 }, { - "epoch": 0.9, - "learning_rate": 0.00016432639964482292, - "loss": 0.0116, + "epoch": 0.46, + "learning_rate": 0.00023029205689238192, + "loss": 0.0149, "step": 179280 }, { - "epoch": 0.9, - "learning_rate": 0.0001643188319518089, - "loss": 0.0104, + "epoch": 0.46, + "learning_rate": 0.00023028816867601048, + "loss": 0.0134, "step": 179290 }, { - "epoch": 0.9, - "learning_rate": 0.0001643112642587949, - "loss": 0.0115, + "epoch": 0.46, + "learning_rate": 0.000230284280459639, + "loss": 0.0178, "step": 179300 }, { - "epoch": 0.9, - "learning_rate": 0.0001643036965657809, - "loss": 0.0136, + "epoch": 0.46, + "learning_rate": 0.00023028039224326754, + "loss": 0.0158, "step": 179310 }, { - "epoch": 0.9, - "learning_rate": 0.00016429612887276687, - "loss": 0.0123, + "epoch": 0.46, + "learning_rate": 0.00023027650402689605, + "loss": 0.0164, "step": 179320 }, { - "epoch": 0.9, - "learning_rate": 0.00016428856117975288, - "loss": 0.0089, + "epoch": 0.46, + "learning_rate": 0.00023027261581052462, + "loss": 0.021, "step": 179330 }, { - "epoch": 0.9, - "learning_rate": 0.00016428099348673886, - "loss": 0.0113, + "epoch": 0.46, + "learning_rate": 0.00023026872759415314, + "loss": 0.0153, "step": 179340 }, { - "epoch": 0.9, - "learning_rate": 0.00016427342579372484, - "loss": 0.0096, + "epoch": 0.46, + "learning_rate": 0.00023026483937778168, + "loss": 0.0206, "step": 179350 }, { - "epoch": 0.9, - "learning_rate": 0.00016426585810071082, - "loss": 0.0138, + "epoch": 0.46, + "learning_rate": 0.0002302609511614102, + "loss": 0.0175, "step": 179360 }, { - "epoch": 0.9, - "learning_rate": 0.00016425829040769683, - "loss": 0.0143, + "epoch": 0.46, + "learning_rate": 0.00023025706294503876, + "loss": 0.0168, "step": 179370 }, { - "epoch": 0.9, - "learning_rate": 0.0001642507227146828, - "loss": 0.011, + "epoch": 0.46, + "learning_rate": 0.00023025317472866728, + "loss": 0.0231, "step": 179380 }, { - "epoch": 0.91, - "learning_rate": 0.0001642431550216688, - "loss": 0.016, + "epoch": 0.47, + "learning_rate": 0.00023024928651229582, + "loss": 0.0155, "step": 179390 }, { - "epoch": 0.91, - "learning_rate": 0.0001642355873286548, - "loss": 0.0085, + "epoch": 0.47, + "learning_rate": 0.00023024539829592433, + "loss": 0.0149, "step": 179400 }, { - "epoch": 0.91, - "learning_rate": 0.00016422801963564078, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00023024151007955288, + "loss": 0.0138, "step": 179410 }, { - "epoch": 0.91, - "learning_rate": 0.00016422045194262676, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.00023023762186318144, + "loss": 0.0166, "step": 179420 }, { - "epoch": 0.91, - "learning_rate": 0.00016421288424961277, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00023023373364680996, + "loss": 0.0213, "step": 179430 }, { - "epoch": 0.91, - "learning_rate": 0.00016420531655659875, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.00023022984543043847, + "loss": 0.0194, "step": 179440 }, { - "epoch": 0.91, - "learning_rate": 0.00016419774886358474, - "loss": 0.0133, + "epoch": 0.47, + "learning_rate": 0.00023022595721406701, + "loss": 0.0174, "step": 179450 }, { - "epoch": 0.91, - "learning_rate": 0.00016419018117057074, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00023022206899769558, + "loss": 0.0183, "step": 179460 }, { - "epoch": 0.91, - "learning_rate": 0.00016418261347755673, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.0002302181807813241, + "loss": 0.0178, "step": 179470 }, { - "epoch": 0.91, - "learning_rate": 0.0001641750457845427, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00023021429256495264, + "loss": 0.0156, "step": 179480 }, { - "epoch": 0.91, - "learning_rate": 0.00016416747809152872, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.00023021040434858115, + "loss": 0.0175, "step": 179490 }, { - "epoch": 0.91, - "learning_rate": 0.0001641599103985147, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.00023020651613220972, + "loss": 0.0212, "step": 179500 }, { - "epoch": 0.91, - "learning_rate": 0.00016415234270550068, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00023020262791583824, + "loss": 0.017, "step": 179510 }, { - "epoch": 0.91, - "learning_rate": 0.00016414477501248666, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00023019873969946678, + "loss": 0.0177, "step": 179520 }, { - "epoch": 0.91, - "learning_rate": 0.00016413720731947267, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.0002301948514830953, + "loss": 0.0193, "step": 179530 }, { - "epoch": 0.91, - "learning_rate": 0.00016412963962645865, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00023019096326672386, + "loss": 0.0166, "step": 179540 }, { - "epoch": 0.91, - "learning_rate": 0.00016412207193344463, - "loss": 0.0153, + "epoch": 0.47, + "learning_rate": 0.00023018707505035238, + "loss": 0.0182, "step": 179550 }, { - "epoch": 0.91, - "learning_rate": 0.00016411450424043064, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00023018318683398092, + "loss": 0.0203, "step": 179560 }, { - "epoch": 0.91, - "learning_rate": 0.00016410693654741662, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00023017929861760943, + "loss": 0.0155, "step": 179570 }, { - "epoch": 0.91, - "learning_rate": 0.0001640993688544026, - "loss": 0.0216, + "epoch": 0.47, + "learning_rate": 0.000230175410401238, + "loss": 0.0186, "step": 179580 }, { - "epoch": 0.91, - "learning_rate": 0.0001640918011613886, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00023017152218486654, + "loss": 0.0168, "step": 179590 }, { - "epoch": 0.91, - "learning_rate": 0.0001640842334683746, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00023016763396849506, + "loss": 0.0186, "step": 179600 }, { - "epoch": 0.91, - "learning_rate": 0.00016407666577536058, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00023016374575212357, + "loss": 0.0195, "step": 179610 }, { - "epoch": 0.91, - "learning_rate": 0.00016406909808234658, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00023015985753575214, + "loss": 0.0196, "step": 179620 }, { - "epoch": 0.91, - "learning_rate": 0.00016406153038933257, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.00023015596931938068, + "loss": 0.0212, "step": 179630 }, { - "epoch": 0.91, - "learning_rate": 0.00016405396269631855, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.0002301520811030092, + "loss": 0.0136, "step": 179640 }, { - "epoch": 0.91, - "learning_rate": 0.00016404639500330455, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.00023014819288663774, + "loss": 0.0197, "step": 179650 }, { - "epoch": 0.91, - "learning_rate": 0.00016403882731029054, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00023014430467026625, + "loss": 0.0141, "step": 179660 }, { - "epoch": 0.91, - "learning_rate": 0.00016403125961727652, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00023014041645389482, + "loss": 0.0187, "step": 179670 }, { - "epoch": 0.91, - "learning_rate": 0.0001640236919242625, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00023013652823752334, + "loss": 0.0141, "step": 179680 }, { - "epoch": 0.91, - "learning_rate": 0.0001640161242312485, - "loss": 0.017, + "epoch": 0.47, + "learning_rate": 0.00023013264002115188, + "loss": 0.0209, "step": 179690 }, { - "epoch": 0.91, - "learning_rate": 0.0001640085565382345, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.0002301287518047804, + "loss": 0.0221, "step": 179700 }, { - "epoch": 0.91, - "learning_rate": 0.00016400098884522047, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.00023012486358840896, + "loss": 0.0166, "step": 179710 }, { - "epoch": 0.91, - "learning_rate": 0.00016399342115220648, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00023012097537203748, + "loss": 0.0177, "step": 179720 }, { - "epoch": 0.91, - "learning_rate": 0.00016398585345919246, - "loss": 0.0084, + "epoch": 0.47, + "learning_rate": 0.00023011708715566602, + "loss": 0.0195, "step": 179730 }, { - "epoch": 0.91, - "learning_rate": 0.00016397828576617844, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00023011319893929453, + "loss": 0.0176, "step": 179740 }, { - "epoch": 0.91, - "learning_rate": 0.00016397071807316445, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.0002301093107229231, + "loss": 0.0188, "step": 179750 }, { - "epoch": 0.91, - "learning_rate": 0.00016396315038015043, - "loss": 0.0088, + "epoch": 0.47, + "learning_rate": 0.00023010542250655162, + "loss": 0.0225, "step": 179760 }, { - "epoch": 0.91, - "learning_rate": 0.00016395558268713641, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00023010153429018016, + "loss": 0.0221, "step": 179770 }, { - "epoch": 0.91, - "learning_rate": 0.00016394801499412242, - "loss": 0.0152, + "epoch": 0.47, + "learning_rate": 0.00023009764607380867, + "loss": 0.0183, "step": 179780 }, { - "epoch": 0.91, - "learning_rate": 0.0001639404473011084, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00023009375785743724, + "loss": 0.0176, "step": 179790 }, { - "epoch": 0.91, - "learning_rate": 0.00016393287960809439, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00023008986964106578, + "loss": 0.0215, "step": 179800 }, { - "epoch": 0.91, - "learning_rate": 0.0001639253119150804, - "loss": 0.0165, + "epoch": 0.47, + "learning_rate": 0.0002300859814246943, + "loss": 0.0224, "step": 179810 }, { - "epoch": 0.91, - "learning_rate": 0.00016391774422206638, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00023008209320832284, + "loss": 0.0189, "step": 179820 }, { - "epoch": 0.91, - "learning_rate": 0.00016391017652905236, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00023007820499195138, + "loss": 0.0172, "step": 179830 }, { - "epoch": 0.91, - "learning_rate": 0.00016390260883603837, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00023007431677557992, + "loss": 0.0181, "step": 179840 }, { - "epoch": 0.91, - "learning_rate": 0.00016389504114302435, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00023007042855920844, + "loss": 0.0143, "step": 179850 }, { - "epoch": 0.91, - "learning_rate": 0.00016388747345001033, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00023006654034283698, + "loss": 0.0141, "step": 179860 }, { - "epoch": 0.91, - "learning_rate": 0.0001638799057569963, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00023006265212646552, + "loss": 0.0173, "step": 179870 }, { - "epoch": 0.91, - "learning_rate": 0.00016387233806398232, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.00023005876391009406, + "loss": 0.0183, "step": 179880 }, { - "epoch": 0.91, - "learning_rate": 0.0001638647703709683, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.00023005487569372258, + "loss": 0.0153, "step": 179890 }, { - "epoch": 0.91, - "learning_rate": 0.00016385720267795428, - "loss": 0.0081, + "epoch": 0.47, + "learning_rate": 0.00023005098747735112, + "loss": 0.0153, "step": 179900 }, { - "epoch": 0.91, - "learning_rate": 0.0001638496349849403, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00023004709926097963, + "loss": 0.0174, "step": 179910 }, { - "epoch": 0.91, - "learning_rate": 0.00016384206729192627, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.0002300432110446082, + "loss": 0.0193, "step": 179920 }, { - "epoch": 0.91, - "learning_rate": 0.00016383449959891225, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00023003932282823672, + "loss": 0.0169, "step": 179930 }, { - "epoch": 0.91, - "learning_rate": 0.00016382693190589826, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00023003543461186526, + "loss": 0.0147, "step": 179940 }, { - "epoch": 0.91, - "learning_rate": 0.00016381936421288424, - "loss": 0.0149, + "epoch": 0.47, + "learning_rate": 0.00023003154639549377, + "loss": 0.0146, "step": 179950 }, { - "epoch": 0.91, - "learning_rate": 0.00016381179651987022, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00023002765817912234, + "loss": 0.0161, "step": 179960 }, { - "epoch": 0.91, - "learning_rate": 0.00016380422882685623, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.00023002376996275088, + "loss": 0.0184, "step": 179970 }, { - "epoch": 0.91, - "learning_rate": 0.00016379666113384221, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.0002300198817463794, + "loss": 0.0213, "step": 179980 }, { - "epoch": 0.91, - "learning_rate": 0.0001637890934408282, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00023001599353000794, + "loss": 0.0198, "step": 179990 }, { - "epoch": 0.91, - "learning_rate": 0.0001637815257478142, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00023001210531363648, + "loss": 0.0192, "step": 180000 }, { - "epoch": 0.91, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.008224265649914742, - "eval_runtime": 116.6551, - "eval_samples_per_second": 17.145, - "eval_steps_per_second": 4.286, + "epoch": 0.47, + "eval_cer": 0.881821655462573, + "eval_loss": 0.012280810624361038, + "eval_runtime": 108.0099, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 180000 }, { - "epoch": 0.91, - "learning_rate": 0.00016377395805480019, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00023000821709726502, + "loss": 0.0165, "step": 180010 }, { - "epoch": 0.91, - "learning_rate": 0.00016376639036178617, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00023000432888089354, + "loss": 0.0186, "step": 180020 }, { - "epoch": 0.91, - "learning_rate": 0.00016375882266877215, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.00023000044066452208, + "loss": 0.0208, "step": 180030 }, { - "epoch": 0.91, - "learning_rate": 0.00016375125497575816, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.00022999655244815062, + "loss": 0.0213, "step": 180040 }, { - "epoch": 0.91, - "learning_rate": 0.00016374368728274414, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022999266423177916, + "loss": 0.0197, "step": 180050 }, { - "epoch": 0.91, - "learning_rate": 0.00016373611958973012, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.00022998877601540768, + "loss": 0.0195, "step": 180060 }, { - "epoch": 0.91, - "learning_rate": 0.00016372855189671613, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.00022998488779903622, + "loss": 0.0176, "step": 180070 }, { - "epoch": 0.91, - "learning_rate": 0.0001637209842037021, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022998099958266476, + "loss": 0.0195, "step": 180080 }, { - "epoch": 0.91, - "learning_rate": 0.0001637134165106881, - "loss": 0.0144, + "epoch": 0.47, + "learning_rate": 0.0002299771113662933, + "loss": 0.0199, "step": 180090 }, { - "epoch": 0.91, - "learning_rate": 0.0001637058488176741, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022997322314992181, + "loss": 0.0144, "step": 180100 }, { - "epoch": 0.91, - "learning_rate": 0.00016369828112466008, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022996933493355036, + "loss": 0.0158, "step": 180110 }, { - "epoch": 0.91, - "learning_rate": 0.00016369071343164606, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022996544671717893, + "loss": 0.0175, "step": 180120 }, { - "epoch": 0.91, - "learning_rate": 0.00016368314573863207, - "loss": 0.0141, + "epoch": 0.47, + "learning_rate": 0.00022996155850080744, + "loss": 0.0186, "step": 180130 }, { - "epoch": 0.91, - "learning_rate": 0.00016367557804561805, - "loss": 0.0137, + "epoch": 0.47, + "learning_rate": 0.00022995767028443598, + "loss": 0.0203, "step": 180140 }, { - "epoch": 0.91, - "learning_rate": 0.00016366801035260403, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.0002299537820680645, + "loss": 0.0167, "step": 180150 }, { - "epoch": 0.91, - "learning_rate": 0.00016366044265959004, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.000229949893851693, + "loss": 0.018, "step": 180160 }, { - "epoch": 0.91, - "learning_rate": 0.00016365287496657602, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00022994600563532158, + "loss": 0.0169, "step": 180170 }, { - "epoch": 0.91, - "learning_rate": 0.000163645307273562, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.00022994211741895012, + "loss": 0.0217, "step": 180180 }, { - "epoch": 0.91, - "learning_rate": 0.000163637739580548, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022993822920257864, + "loss": 0.0166, "step": 180190 }, { - "epoch": 0.91, - "learning_rate": 0.000163630171887534, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.00022993434098620718, + "loss": 0.018, "step": 180200 }, { - "epoch": 0.91, - "learning_rate": 0.00016362260419451998, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022993045276983572, + "loss": 0.0148, "step": 180210 }, { - "epoch": 0.91, - "learning_rate": 0.00016361503650150596, - "loss": 0.0133, + "epoch": 0.47, + "learning_rate": 0.00022992656455346426, + "loss": 0.016, "step": 180220 }, { - "epoch": 0.91, - "learning_rate": 0.00016360746880849197, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022992267633709277, + "loss": 0.0169, "step": 180230 }, { - "epoch": 0.91, - "learning_rate": 0.00016359990111547795, - "loss": 0.0166, + "epoch": 0.47, + "learning_rate": 0.00022991878812072132, + "loss": 0.0167, "step": 180240 }, { - "epoch": 0.91, - "learning_rate": 0.00016359233342246393, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022991489990434986, + "loss": 0.0179, "step": 180250 }, { - "epoch": 0.91, - "learning_rate": 0.00016358476572944994, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.0002299110116879784, + "loss": 0.0163, "step": 180260 }, { - "epoch": 0.91, - "learning_rate": 0.00016357719803643592, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022990712347160691, + "loss": 0.0177, "step": 180270 }, { - "epoch": 0.91, - "learning_rate": 0.0001635696303434219, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022990323525523546, + "loss": 0.0167, "step": 180280 }, { - "epoch": 0.91, - "learning_rate": 0.0001635620626504079, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022989934703886402, + "loss": 0.0173, "step": 180290 }, { - "epoch": 0.91, - "learning_rate": 0.0001635544949573939, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022989545882249254, + "loss": 0.0237, "step": 180300 }, { - "epoch": 0.91, - "learning_rate": 0.00016354692726437987, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022989157060612105, + "loss": 0.0175, "step": 180310 }, { - "epoch": 0.91, - "learning_rate": 0.00016353935957136588, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.0002298876823897496, + "loss": 0.0195, "step": 180320 }, { - "epoch": 0.91, - "learning_rate": 0.00016353179187835186, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022988379417337816, + "loss": 0.0191, "step": 180330 }, { - "epoch": 0.91, - "learning_rate": 0.00016352422418533784, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00022987990595700668, + "loss": 0.0174, "step": 180340 }, { - "epoch": 0.91, - "learning_rate": 0.00016351665649232383, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022987601774063522, + "loss": 0.0159, "step": 180350 }, { - "epoch": 0.91, - "learning_rate": 0.00016350908879930983, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022987212952426373, + "loss": 0.0174, "step": 180360 }, { - "epoch": 0.91, - "learning_rate": 0.0001635015211062958, - "loss": 0.0081, + "epoch": 0.47, + "learning_rate": 0.0002298682413078923, + "loss": 0.0166, "step": 180370 }, { - "epoch": 0.91, - "learning_rate": 0.00016349395341328177, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022986435309152082, + "loss": 0.0183, "step": 180380 }, { - "epoch": 0.91, - "learning_rate": 0.00016348638572026778, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00022986046487514936, + "loss": 0.0182, "step": 180390 }, { - "epoch": 0.91, - "learning_rate": 0.00016347881802725376, - "loss": 0.0102, - "step": 180400 + "epoch": 0.47, + "learning_rate": 0.00022985657665877787, + "loss": 0.0178, + "step": 180400 }, { - "epoch": 0.91, - "learning_rate": 0.00016347125033423974, - "loss": 0.0083, + "epoch": 0.47, + "learning_rate": 0.00022985268844240642, + "loss": 0.0183, "step": 180410 }, { - "epoch": 0.91, - "learning_rate": 0.00016346368264122572, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022984880022603496, + "loss": 0.019, "step": 180420 }, { - "epoch": 0.91, - "learning_rate": 0.00016345611494821173, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.0002298449120096635, + "loss": 0.0168, "step": 180430 }, { - "epoch": 0.91, - "learning_rate": 0.0001634485472551977, - "loss": 0.0153, + "epoch": 0.47, + "learning_rate": 0.00022984102379329201, + "loss": 0.018, "step": 180440 }, { - "epoch": 0.91, - "learning_rate": 0.0001634409795621837, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.00022983713557692056, + "loss": 0.0181, "step": 180450 }, { - "epoch": 0.91, - "learning_rate": 0.0001634334118691697, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.00022983324736054912, + "loss": 0.0195, "step": 180460 }, { - "epoch": 0.91, - "learning_rate": 0.00016342584417615568, - "loss": 0.0147, + "epoch": 0.47, + "learning_rate": 0.00022982935914417764, + "loss": 0.0163, "step": 180470 }, { - "epoch": 0.91, - "learning_rate": 0.00016341827648314167, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022982547092780615, + "loss": 0.0173, "step": 180480 }, { - "epoch": 0.91, - "learning_rate": 0.00016341070879012767, - "loss": 0.0176, + "epoch": 0.47, + "learning_rate": 0.0002298215827114347, + "loss": 0.0179, "step": 180490 }, { - "epoch": 0.91, - "learning_rate": 0.00016340314109711366, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022981769449506326, + "loss": 0.0207, "step": 180500 }, { - "epoch": 0.91, - "learning_rate": 0.00016339557340409964, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00022981380627869178, + "loss": 0.0189, "step": 180510 }, { - "epoch": 0.91, - "learning_rate": 0.00016338800571108565, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022980991806232032, + "loss": 0.0218, "step": 180520 }, { - "epoch": 0.91, - "learning_rate": 0.00016338043801807163, - "loss": 0.014, + "epoch": 0.47, + "learning_rate": 0.00022980602984594883, + "loss": 0.0193, "step": 180530 }, { - "epoch": 0.91, - "learning_rate": 0.0001633728703250576, - "loss": 0.0174, + "epoch": 0.47, + "learning_rate": 0.0002298021416295774, + "loss": 0.0193, "step": 180540 }, { - "epoch": 0.91, - "learning_rate": 0.00016336530263204362, - "loss": 0.0089, + "epoch": 0.47, + "learning_rate": 0.00022979825341320592, + "loss": 0.0199, "step": 180550 }, { - "epoch": 0.91, - "learning_rate": 0.0001633577349390296, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022979436519683446, + "loss": 0.0225, "step": 180560 }, { - "epoch": 0.91, - "learning_rate": 0.00016335016724601558, - "loss": 0.0146, + "epoch": 0.47, + "learning_rate": 0.00022979047698046297, + "loss": 0.0231, "step": 180570 }, { - "epoch": 0.91, - "learning_rate": 0.00016334259955300156, - "loss": 0.0176, + "epoch": 0.47, + "learning_rate": 0.00022978658876409154, + "loss": 0.0154, "step": 180580 }, { - "epoch": 0.91, - "learning_rate": 0.00016333503185998757, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022978270054772006, + "loss": 0.0166, "step": 180590 }, { - "epoch": 0.91, - "learning_rate": 0.00016332746416697355, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002297788123313486, + "loss": 0.0203, "step": 180600 }, { - "epoch": 0.91, - "learning_rate": 0.00016331989647395953, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.0002297749241149771, + "loss": 0.0172, "step": 180610 }, { - "epoch": 0.91, - "learning_rate": 0.00016331232878094554, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022977103589860568, + "loss": 0.019, "step": 180620 }, { - "epoch": 0.91, - "learning_rate": 0.00016330476108793152, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.0002297671476822342, + "loss": 0.0181, "step": 180630 }, { - "epoch": 0.91, - "learning_rate": 0.0001632971933949175, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022976325946586274, + "loss": 0.0166, "step": 180640 }, { - "epoch": 0.91, - "learning_rate": 0.0001632896257019035, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022975937124949125, + "loss": 0.0162, "step": 180650 }, { - "epoch": 0.91, - "learning_rate": 0.0001632820580088895, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.0002297554830331198, + "loss": 0.0193, "step": 180660 }, { - "epoch": 0.91, - "learning_rate": 0.00016327449031587548, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022975159481674836, + "loss": 0.0182, "step": 180670 }, { - "epoch": 0.91, - "learning_rate": 0.00016326692262286148, - "loss": 0.0089, + "epoch": 0.47, + "learning_rate": 0.00022974770660037688, + "loss": 0.0207, "step": 180680 }, { - "epoch": 0.91, - "learning_rate": 0.00016325935492984747, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022974381838400542, + "loss": 0.0158, "step": 180690 }, { - "epoch": 0.91, - "learning_rate": 0.00016325178723683345, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022973993016763393, + "loss": 0.0162, "step": 180700 }, { - "epoch": 0.91, - "learning_rate": 0.00016324421954381946, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.0002297360419512625, + "loss": 0.0204, "step": 180710 }, { - "epoch": 0.91, - "learning_rate": 0.00016323665185080544, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022973215373489102, + "loss": 0.0172, "step": 180720 }, { - "epoch": 0.91, - "learning_rate": 0.00016322908415779142, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022972826551851956, + "loss": 0.0257, "step": 180730 }, { - "epoch": 0.91, - "learning_rate": 0.00016322151646477743, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022972437730214807, + "loss": 0.0185, "step": 180740 }, { - "epoch": 0.91, - "learning_rate": 0.0001632139487717634, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022972048908577664, + "loss": 0.0172, "step": 180750 }, { - "epoch": 0.91, - "learning_rate": 0.0001632063810787494, - "loss": 0.0158, + "epoch": 0.47, + "learning_rate": 0.00022971660086940516, + "loss": 0.0214, "step": 180760 }, { - "epoch": 0.91, - "learning_rate": 0.00016319881338573537, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.0002297127126530337, + "loss": 0.02, "step": 180770 }, { - "epoch": 0.91, - "learning_rate": 0.00016319124569272138, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.0002297088244366622, + "loss": 0.0184, "step": 180780 }, { - "epoch": 0.91, - "learning_rate": 0.00016318367799970736, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00022970493622029078, + "loss": 0.0206, "step": 180790 }, { - "epoch": 0.91, - "learning_rate": 0.00016317611030669334, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002297010480039193, + "loss": 0.0179, "step": 180800 }, { - "epoch": 0.91, - "learning_rate": 0.00016316854261367935, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022969715978754784, + "loss": 0.0173, "step": 180810 }, { - "epoch": 0.91, - "learning_rate": 0.00016316097492066533, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022969327157117635, + "loss": 0.0186, "step": 180820 }, { - "epoch": 0.91, - "learning_rate": 0.00016315340722765131, - "loss": 0.0127, + "epoch": 0.47, + "learning_rate": 0.00022968938335480492, + "loss": 0.018, "step": 180830 }, { - "epoch": 0.91, - "learning_rate": 0.00016314583953463732, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00022968549513843346, + "loss": 0.0158, "step": 180840 }, { - "epoch": 0.91, - "learning_rate": 0.0001631382718416233, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022968160692206198, + "loss": 0.019, "step": 180850 }, { - "epoch": 0.91, - "learning_rate": 0.00016313070414860929, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022967771870569052, + "loss": 0.0206, "step": 180860 }, { - "epoch": 0.91, - "learning_rate": 0.0001631231364555953, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022967383048931903, + "loss": 0.0214, "step": 180870 }, { - "epoch": 0.91, - "learning_rate": 0.00016311556876258128, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.0002296699422729476, + "loss": 0.0155, "step": 180880 }, { - "epoch": 0.91, - "learning_rate": 0.00016310800106956726, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022966605405657612, + "loss": 0.0221, "step": 180890 }, { - "epoch": 0.91, - "learning_rate": 0.00016310043337655327, - "loss": 0.0144, + "epoch": 0.47, + "learning_rate": 0.00022966216584020466, + "loss": 0.0189, "step": 180900 }, { - "epoch": 0.91, - "learning_rate": 0.00016309286568353925, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022965827762383317, + "loss": 0.0156, "step": 180910 }, { - "epoch": 0.91, - "learning_rate": 0.00016308529799052523, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022965438940746174, + "loss": 0.0173, "step": 180920 }, { - "epoch": 0.91, - "learning_rate": 0.0001630777302975112, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022965050119109026, + "loss": 0.0162, "step": 180930 }, { - "epoch": 0.91, - "learning_rate": 0.00016307016260449722, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.0002296466129747188, + "loss": 0.0203, "step": 180940 }, { - "epoch": 0.91, - "learning_rate": 0.0001630625949114832, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.0002296427247583473, + "loss": 0.0179, "step": 180950 }, { - "epoch": 0.91, - "learning_rate": 0.00016305502721846918, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022963883654197588, + "loss": 0.0212, "step": 180960 }, { - "epoch": 0.91, - "learning_rate": 0.0001630474595254552, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.0002296349483256044, + "loss": 0.0187, "step": 180970 }, { - "epoch": 0.91, - "learning_rate": 0.00016303989183244117, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.00022963106010923294, + "loss": 0.0162, "step": 180980 }, { - "epoch": 0.91, - "learning_rate": 0.00016303232413942715, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022962717189286145, + "loss": 0.0156, "step": 180990 }, { - "epoch": 0.91, - "learning_rate": 0.00016302475644641316, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022962328367649002, + "loss": 0.025, "step": 181000 }, { - "epoch": 0.91, - "eval_cer": 0.9144751078837893, - "eval_loss": 0.008274085819721222, - "eval_runtime": 116.712, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.47, + "eval_cer": 0.881782465628416, + "eval_loss": 0.012816259637475014, + "eval_runtime": 107.9694, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, "step": 181000 }, { - "epoch": 0.91, - "learning_rate": 0.00016301718875339914, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00022961939546011856, + "loss": 0.018, "step": 181010 }, { - "epoch": 0.91, - "learning_rate": 0.00016300962106038512, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022961550724374708, + "loss": 0.0241, "step": 181020 }, { - "epoch": 0.91, - "learning_rate": 0.00016300205336737113, - "loss": 0.0161, + "epoch": 0.47, + "learning_rate": 0.0002296116190273756, + "loss": 0.0196, "step": 181030 }, { - "epoch": 0.91, - "learning_rate": 0.00016299448567435711, - "loss": 0.0133, + "epoch": 0.47, + "learning_rate": 0.00022960773081100416, + "loss": 0.0194, "step": 181040 }, { - "epoch": 0.91, - "learning_rate": 0.0001629869179813431, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.0002296038425946327, + "loss": 0.0173, "step": 181050 }, { - "epoch": 0.91, - "learning_rate": 0.0001629793502883291, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022959995437826122, + "loss": 0.0203, "step": 181060 }, { - "epoch": 0.91, - "learning_rate": 0.00016297178259531509, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022959606616188976, + "loss": 0.0193, "step": 181070 }, { - "epoch": 0.91, - "learning_rate": 0.00016296421490230107, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.0002295921779455183, + "loss": 0.0178, "step": 181080 }, { - "epoch": 0.91, - "learning_rate": 0.00016295664720928705, - "loss": 0.0172, + "epoch": 0.47, + "learning_rate": 0.00022958828972914684, + "loss": 0.0145, "step": 181090 }, { - "epoch": 0.91, - "learning_rate": 0.00016294907951627306, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00022958440151277536, + "loss": 0.0201, "step": 181100 }, { - "epoch": 0.91, - "learning_rate": 0.00016294151182325904, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.0002295805132964039, + "loss": 0.0185, "step": 181110 }, { - "epoch": 0.91, - "learning_rate": 0.00016293394413024502, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.0002295766250800324, + "loss": 0.0237, "step": 181120 }, { - "epoch": 0.91, - "learning_rate": 0.00016292637643723103, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022957273686366098, + "loss": 0.0197, "step": 181130 }, { - "epoch": 0.91, - "learning_rate": 0.000162918808744217, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002295688486472895, + "loss": 0.0172, "step": 181140 }, { - "epoch": 0.91, - "learning_rate": 0.000162911241051203, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.00022956496043091804, + "loss": 0.0174, "step": 181150 }, { - "epoch": 0.91, - "learning_rate": 0.000162903673358189, - "loss": 0.0085, + "epoch": 0.47, + "learning_rate": 0.00022956107221454655, + "loss": 0.0147, "step": 181160 }, { - "epoch": 0.91, - "learning_rate": 0.00016289610566517498, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.00022955718399817512, + "loss": 0.0202, "step": 181170 }, { - "epoch": 0.91, - "learning_rate": 0.00016288853797216096, + "epoch": 0.47, + "learning_rate": 0.00022955329578180366, "loss": 0.0177, "step": 181180 }, { - "epoch": 0.91, - "learning_rate": 0.00016288097027914697, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022954940756543218, + "loss": 0.0153, "step": 181190 }, { - "epoch": 0.91, - "learning_rate": 0.00016287340258613295, - "loss": 0.0179, + "epoch": 0.47, + "learning_rate": 0.0002295455193490607, + "loss": 0.0192, "step": 181200 }, { - "epoch": 0.91, - "learning_rate": 0.00016286583489311893, - "loss": 0.0151, + "epoch": 0.47, + "learning_rate": 0.00022954163113268926, + "loss": 0.0227, "step": 181210 }, { - "epoch": 0.91, - "learning_rate": 0.00016285826720010494, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.0002295377429163178, + "loss": 0.0203, "step": 181220 }, { - "epoch": 0.91, - "learning_rate": 0.00016285069950709092, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.00022953385469994632, + "loss": 0.0187, "step": 181230 }, { - "epoch": 0.91, - "learning_rate": 0.0001628431318140769, - "loss": 0.0148, + "epoch": 0.47, + "learning_rate": 0.00022952996648357486, + "loss": 0.0194, "step": 181240 }, { - "epoch": 0.91, - "learning_rate": 0.0001628355641210629, - "loss": 0.0166, + "epoch": 0.47, + "learning_rate": 0.0002295260782672034, + "loss": 0.0235, "step": 181250 }, { - "epoch": 0.91, - "learning_rate": 0.0001628279964280489, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.00022952219005083194, + "loss": 0.014, "step": 181260 }, { - "epoch": 0.91, - "learning_rate": 0.00016282042873503488, - "loss": 0.0088, + "epoch": 0.47, + "learning_rate": 0.00022951830183446045, + "loss": 0.017, "step": 181270 }, { - "epoch": 0.91, - "learning_rate": 0.00016281286104202086, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.000229514413618089, + "loss": 0.0171, "step": 181280 }, { - "epoch": 0.91, - "learning_rate": 0.00016280529334900687, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022951052540171754, + "loss": 0.017, "step": 181290 }, { - "epoch": 0.91, - "learning_rate": 0.00016279772565599285, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022950663718534608, + "loss": 0.0158, "step": 181300 }, { - "epoch": 0.91, - "learning_rate": 0.00016279015796297883, - "loss": 0.0119, + "epoch": 0.47, + "learning_rate": 0.0002295027489689746, + "loss": 0.0194, "step": 181310 }, { - "epoch": 0.91, - "learning_rate": 0.00016278259026996484, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.00022949886075260314, + "loss": 0.0164, "step": 181320 }, { - "epoch": 0.91, - "learning_rate": 0.00016277502257695082, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002294949725362317, + "loss": 0.02, "step": 181330 }, { - "epoch": 0.91, - "learning_rate": 0.0001627674548839368, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.00022949108431986022, + "loss": 0.0224, "step": 181340 }, { - "epoch": 0.91, - "learning_rate": 0.0001627598871909228, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022948719610348873, + "loss": 0.0163, "step": 181350 }, { - "epoch": 0.91, - "learning_rate": 0.0001627523194979088, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022948330788711728, + "loss": 0.019, "step": 181360 }, { - "epoch": 0.92, - "learning_rate": 0.00016274475180489477, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002294794196707458, + "loss": 0.0125, "step": 181370 }, { - "epoch": 0.92, - "learning_rate": 0.00016273718411188078, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022947553145437436, + "loss": 0.0208, "step": 181380 }, { - "epoch": 0.92, - "learning_rate": 0.00016272961641886676, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.0002294716432380029, + "loss": 0.0167, "step": 181390 }, { - "epoch": 0.92, - "learning_rate": 0.00016272204872585274, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022946775502163141, + "loss": 0.0155, "step": 181400 }, { - "epoch": 0.92, - "learning_rate": 0.00016271448103283875, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022946386680525996, + "loss": 0.0178, "step": 181410 }, { - "epoch": 0.92, - "learning_rate": 0.00016270691333982473, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.0002294599785888885, + "loss": 0.0177, "step": 181420 }, { - "epoch": 0.92, - "learning_rate": 0.00016269934564681072, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022945609037251704, + "loss": 0.0159, "step": 181430 }, { - "epoch": 0.92, - "learning_rate": 0.0001626917779537967, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022945220215614555, + "loss": 0.0223, "step": 181440 }, { - "epoch": 0.92, - "learning_rate": 0.0001626842102607827, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.0002294483139397741, + "loss": 0.0148, "step": 181450 }, { - "epoch": 0.92, - "learning_rate": 0.0001626766425677687, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022944442572340264, + "loss": 0.0259, "step": 181460 }, { - "epoch": 0.92, - "learning_rate": 0.00016266907487475467, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022944053750703118, + "loss": 0.0211, "step": 181470 }, { - "epoch": 0.92, - "learning_rate": 0.00016266150718174068, - "loss": 0.0087, + "epoch": 0.47, + "learning_rate": 0.0002294366492906597, + "loss": 0.0227, "step": 181480 }, { - "epoch": 0.92, - "learning_rate": 0.00016265393948872666, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022943276107428824, + "loss": 0.0206, "step": 181490 }, { - "epoch": 0.92, - "learning_rate": 0.00016264637179571264, - "loss": 0.0088, + "epoch": 0.47, + "learning_rate": 0.00022942887285791678, + "loss": 0.017, "step": 181500 }, { - "epoch": 0.92, - "learning_rate": 0.00016263880410269865, - "loss": 0.0153, + "epoch": 0.47, + "learning_rate": 0.00022942498464154532, + "loss": 0.0145, "step": 181510 }, { - "epoch": 0.92, - "learning_rate": 0.00016263123640968463, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022942109642517383, + "loss": 0.016, "step": 181520 }, { - "epoch": 0.92, - "learning_rate": 0.0001626236687166706, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022941720820880237, + "loss": 0.018, "step": 181530 }, { - "epoch": 0.92, - "learning_rate": 0.00016261610102365662, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022941331999243094, + "loss": 0.0173, "step": 181540 }, { - "epoch": 0.92, - "learning_rate": 0.0001626085333306426, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022940943177605946, + "loss": 0.0168, "step": 181550 }, { - "epoch": 0.92, - "learning_rate": 0.00016260096563762858, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.000229405543559688, + "loss": 0.0179, "step": 181560 }, { - "epoch": 0.92, - "learning_rate": 0.0001625933979446146, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022940165534331651, + "loss": 0.0163, "step": 181570 }, { - "epoch": 0.92, - "learning_rate": 0.00016258583025160057, - "loss": 0.0148, + "epoch": 0.47, + "learning_rate": 0.00022939776712694508, + "loss": 0.0174, "step": 181580 }, { - "epoch": 0.92, - "learning_rate": 0.00016257826255858655, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.0002293938789105736, + "loss": 0.0177, "step": 181590 }, { - "epoch": 0.92, - "learning_rate": 0.00016257069486557254, - "loss": 0.0137, + "epoch": 0.47, + "learning_rate": 0.00022938999069420214, + "loss": 0.0153, "step": 181600 }, { - "epoch": 0.92, - "learning_rate": 0.00016256312717255854, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022938610247783065, + "loss": 0.0201, "step": 181610 }, { - "epoch": 0.92, - "learning_rate": 0.00016255555947954453, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.0002293822142614592, + "loss": 0.0159, "step": 181620 }, { - "epoch": 0.92, - "learning_rate": 0.00016254799178653048, - "loss": 0.0162, + "epoch": 0.47, + "learning_rate": 0.00022937832604508774, + "loss": 0.0178, "step": 181630 }, { - "epoch": 0.92, - "learning_rate": 0.00016254042409351646, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022937443782871628, + "loss": 0.016, "step": 181640 }, { - "epoch": 0.92, - "learning_rate": 0.00016253285640050247, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.0002293705496123448, + "loss": 0.0158, "step": 181650 }, { - "epoch": 0.92, - "learning_rate": 0.00016252528870748845, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022936666139597333, + "loss": 0.0182, "step": 181660 }, { - "epoch": 0.92, - "learning_rate": 0.00016251772101447443, - "loss": 0.0139, + "epoch": 0.47, + "learning_rate": 0.00022936277317960188, + "loss": 0.0217, "step": 181670 }, { - "epoch": 0.92, - "learning_rate": 0.00016251015332146044, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.00022935888496323042, + "loss": 0.0231, "step": 181680 }, { - "epoch": 0.92, - "learning_rate": 0.00016250258562844642, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00022935499674685893, + "loss": 0.0179, "step": 181690 }, { - "epoch": 0.92, - "learning_rate": 0.0001624950179354324, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022935110853048747, + "loss": 0.0196, "step": 181700 }, { - "epoch": 0.92, - "learning_rate": 0.0001624874502424184, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022934722031411604, + "loss": 0.0159, "step": 181710 }, { - "epoch": 0.92, - "learning_rate": 0.0001624798825494044, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022934333209774456, + "loss": 0.0153, "step": 181720 }, { - "epoch": 0.92, - "learning_rate": 0.00016247231485639038, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.0002293394438813731, + "loss": 0.0185, "step": 181730 }, { - "epoch": 0.92, - "learning_rate": 0.00016246474716337638, - "loss": 0.0124, + "epoch": 0.47, + "learning_rate": 0.0002293355556650016, + "loss": 0.018, "step": 181740 }, { - "epoch": 0.92, - "learning_rate": 0.00016245717947036237, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022933166744863018, + "loss": 0.0176, "step": 181750 }, { - "epoch": 0.92, - "learning_rate": 0.00016244961177734835, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.0002293277792322587, + "loss": 0.0241, "step": 181760 }, { - "epoch": 0.92, - "learning_rate": 0.00016244204408433436, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.00022932389101588724, + "loss": 0.0181, "step": 181770 }, { - "epoch": 0.92, - "learning_rate": 0.00016243447639132034, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00022932000279951575, + "loss": 0.0191, "step": 181780 }, { - "epoch": 0.92, - "learning_rate": 0.00016242690869830632, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022931611458314432, + "loss": 0.0169, "step": 181790 }, { - "epoch": 0.92, - "learning_rate": 0.00016241934100529233, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.00022931222636677284, + "loss": 0.0182, "step": 181800 }, { - "epoch": 0.92, - "learning_rate": 0.0001624117733122783, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00022930833815040138, + "loss": 0.0137, "step": 181810 }, { - "epoch": 0.92, - "learning_rate": 0.0001624042056192643, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.0002293044499340299, + "loss": 0.0223, "step": 181820 }, { - "epoch": 0.92, - "learning_rate": 0.00016239663792625027, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022930056171765846, + "loss": 0.0169, "step": 181830 }, { - "epoch": 0.92, - "learning_rate": 0.00016238907023323628, - "loss": 0.0132, + "epoch": 0.47, + "learning_rate": 0.00022929667350128698, + "loss": 0.0195, "step": 181840 }, { - "epoch": 0.92, - "learning_rate": 0.00016238150254022226, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022929278528491552, + "loss": 0.0164, "step": 181850 }, { - "epoch": 0.92, - "learning_rate": 0.00016237393484720824, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022928889706854403, + "loss": 0.02, "step": 181860 }, { - "epoch": 0.92, - "learning_rate": 0.00016236636715419425, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022928500885217257, + "loss": 0.0197, "step": 181870 }, { - "epoch": 0.92, - "learning_rate": 0.00016235879946118023, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022928112063580114, + "loss": 0.0224, "step": 181880 }, { - "epoch": 0.92, - "learning_rate": 0.00016235123176816621, - "loss": 0.0159, + "epoch": 0.47, + "learning_rate": 0.00022927723241942966, + "loss": 0.0188, "step": 181890 }, { - "epoch": 0.92, - "learning_rate": 0.00016234366407515222, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022927334420305817, + "loss": 0.018, "step": 181900 }, { - "epoch": 0.92, - "learning_rate": 0.0001623360963821382, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.0002292694559866867, + "loss": 0.0189, "step": 181910 }, { - "epoch": 0.92, - "learning_rate": 0.00016232852868912419, - "loss": 0.0142, + "epoch": 0.47, + "learning_rate": 0.00022926556777031528, + "loss": 0.0193, "step": 181920 }, { - "epoch": 0.92, - "learning_rate": 0.0001623209609961102, - "loss": 0.0138, + "epoch": 0.47, + "learning_rate": 0.0002292616795539438, + "loss": 0.0144, "step": 181930 }, { - "epoch": 0.92, - "learning_rate": 0.00016231339330309618, - "loss": 0.0173, + "epoch": 0.47, + "learning_rate": 0.00022925779133757234, + "loss": 0.017, "step": 181940 }, { - "epoch": 0.92, - "learning_rate": 0.00016230582561008216, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.00022925390312120085, + "loss": 0.0192, "step": 181950 }, { - "epoch": 0.92, - "learning_rate": 0.00016229825791706817, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022925001490482942, + "loss": 0.0208, "step": 181960 }, { - "epoch": 0.92, - "learning_rate": 0.00016229069022405415, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00022924612668845794, + "loss": 0.021, "step": 181970 }, { - "epoch": 0.92, - "learning_rate": 0.00016228312253104013, - "loss": 0.0156, + "epoch": 0.47, + "learning_rate": 0.00022924223847208648, + "loss": 0.0162, "step": 181980 }, { - "epoch": 0.92, - "learning_rate": 0.0001622755548380261, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.000229238350255715, + "loss": 0.0151, "step": 181990 }, { - "epoch": 0.92, - "learning_rate": 0.00016226798714501212, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022923446203934356, + "loss": 0.018, "step": 182000 }, { - "epoch": 0.92, - "eval_cer": 0.9144857822411687, - "eval_loss": 0.008326300419867039, - "eval_runtime": 116.6222, - "eval_samples_per_second": 17.149, - "eval_steps_per_second": 4.287, + "epoch": 0.47, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.012949470430612564, + "eval_runtime": 108.1298, + "eval_samples_per_second": 18.496, + "eval_steps_per_second": 4.624, "step": 182000 }, { - "epoch": 0.92, - "learning_rate": 0.0001622604194519981, - "loss": 0.0137, + "epoch": 0.47, + "learning_rate": 0.00022923057382297208, + "loss": 0.0161, "step": 182010 }, { - "epoch": 0.92, - "learning_rate": 0.00016225285175898408, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022922668560660062, + "loss": 0.0174, "step": 182020 }, { - "epoch": 0.92, - "learning_rate": 0.0001622452840659701, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00022922279739022913, + "loss": 0.024, "step": 182030 }, { - "epoch": 0.92, - "learning_rate": 0.00016223771637295607, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.0002292189091738577, + "loss": 0.0201, "step": 182040 }, { - "epoch": 0.92, - "learning_rate": 0.00016223014867994205, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022921502095748624, + "loss": 0.0182, "step": 182050 }, { - "epoch": 0.92, - "learning_rate": 0.00016222258098692806, - "loss": 0.0127, + "epoch": 0.47, + "learning_rate": 0.00022921113274111476, + "loss": 0.0183, "step": 182060 }, { - "epoch": 0.92, - "learning_rate": 0.00016221501329391404, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022920724452474327, + "loss": 0.02, "step": 182070 }, { - "epoch": 0.92, - "learning_rate": 0.00016220744560090002, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022920335630837184, + "loss": 0.0218, "step": 182080 }, { - "epoch": 0.92, - "learning_rate": 0.00016219987790788603, - "loss": 0.0126, + "epoch": 0.47, + "learning_rate": 0.00022919946809200038, + "loss": 0.0166, "step": 182090 }, { - "epoch": 0.92, - "learning_rate": 0.00016219231021487201, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.0002291955798756289, + "loss": 0.015, "step": 182100 }, { - "epoch": 0.92, - "learning_rate": 0.000162184742521858, - "loss": 0.014, + "epoch": 0.47, + "learning_rate": 0.00022919169165925744, + "loss": 0.0169, "step": 182110 }, { - "epoch": 0.92, - "learning_rate": 0.000162177174828844, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022918780344288595, + "loss": 0.0181, "step": 182120 }, { - "epoch": 0.92, - "learning_rate": 0.00016216960713582999, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022918391522651452, + "loss": 0.024, "step": 182130 }, { - "epoch": 0.92, - "learning_rate": 0.00016216203944281597, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022918002701014303, + "loss": 0.0142, "step": 182140 }, { - "epoch": 0.92, - "learning_rate": 0.00016215447174980195, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022917613879377158, + "loss": 0.0245, "step": 182150 }, { - "epoch": 0.92, - "learning_rate": 0.00016214690405678796, - "loss": 0.0099, + "epoch": 0.47, + "learning_rate": 0.0002291722505774001, + "loss": 0.014, "step": 182160 }, { - "epoch": 0.92, - "learning_rate": 0.00016213933636377394, - "loss": 0.0134, + "epoch": 0.47, + "learning_rate": 0.00022916836236102866, + "loss": 0.0199, "step": 182170 }, { - "epoch": 0.92, - "learning_rate": 0.00016213176867075992, - "loss": 0.0115, + "epoch": 0.47, + "learning_rate": 0.00022916447414465717, + "loss": 0.0221, "step": 182180 }, { - "epoch": 0.92, - "learning_rate": 0.00016212420097774593, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.00022916058592828572, + "loss": 0.0221, "step": 182190 }, { - "epoch": 0.92, - "learning_rate": 0.0001621166332847319, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022915669771191423, + "loss": 0.0216, "step": 182200 }, { - "epoch": 0.92, - "learning_rate": 0.0001621090655917179, - "loss": 0.0168, + "epoch": 0.47, + "learning_rate": 0.0002291528094955428, + "loss": 0.0171, "step": 182210 }, { - "epoch": 0.92, - "learning_rate": 0.0001621014978987039, - "loss": 0.0137, + "epoch": 0.47, + "learning_rate": 0.00022914892127917131, + "loss": 0.0159, "step": 182220 }, { - "epoch": 0.92, - "learning_rate": 0.00016209393020568988, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022914503306279986, + "loss": 0.0154, "step": 182230 }, { - "epoch": 0.92, - "learning_rate": 0.00016208636251267586, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022914114484642837, + "loss": 0.0202, "step": 182240 }, { - "epoch": 0.92, - "learning_rate": 0.00016207879481966187, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.00022913725663005694, + "loss": 0.0167, "step": 182250 }, { - "epoch": 0.92, - "learning_rate": 0.00016207122712664785, - "loss": 0.0173, + "epoch": 0.47, + "learning_rate": 0.00022913336841368548, + "loss": 0.0182, "step": 182260 }, { - "epoch": 0.92, - "learning_rate": 0.00016206365943363383, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.000229129480197314, + "loss": 0.0182, "step": 182270 }, { - "epoch": 0.92, - "learning_rate": 0.00016205609174061984, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00022912559198094254, + "loss": 0.0222, "step": 182280 }, { - "epoch": 0.92, - "learning_rate": 0.00016204852404760582, - "loss": 0.0148, + "epoch": 0.47, + "learning_rate": 0.00022912170376457108, + "loss": 0.0257, "step": 182290 }, { - "epoch": 0.92, - "learning_rate": 0.0001620409563545918, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022911781554819962, + "loss": 0.0185, "step": 182300 }, { - "epoch": 0.92, - "learning_rate": 0.00016203338866157781, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00022911392733182813, + "loss": 0.0185, "step": 182310 }, { - "epoch": 0.92, - "learning_rate": 0.0001620258209685638, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022911003911545668, + "loss": 0.0191, "step": 182320 }, { - "epoch": 0.92, - "learning_rate": 0.00016201825327554978, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022910615089908522, + "loss": 0.0168, "step": 182330 }, { - "epoch": 0.92, - "learning_rate": 0.00016201068558253576, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022910226268271376, + "loss": 0.0185, "step": 182340 }, { - "epoch": 0.92, - "learning_rate": 0.00016200311788952177, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022909837446634227, + "loss": 0.0201, "step": 182350 }, { - "epoch": 0.92, - "learning_rate": 0.00016199555019650775, - "loss": 0.0144, + "epoch": 0.47, + "learning_rate": 0.00022909448624997082, + "loss": 0.0142, "step": 182360 }, { - "epoch": 0.92, - "learning_rate": 0.00016198798250349373, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022909059803359933, + "loss": 0.0233, "step": 182370 }, { - "epoch": 0.92, - "learning_rate": 0.00016198041481047974, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.0002290867098172279, + "loss": 0.015, "step": 182380 }, { - "epoch": 0.92, - "learning_rate": 0.00016197284711746572, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.0002290828216008564, + "loss": 0.0189, "step": 182390 }, { - "epoch": 0.92, - "learning_rate": 0.0001619652794244517, - "loss": 0.013, + "epoch": 0.47, + "learning_rate": 0.00022907893338448495, + "loss": 0.0215, "step": 182400 }, { - "epoch": 0.92, - "learning_rate": 0.0001619577117314377, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022907504516811347, + "loss": 0.0181, "step": 182410 }, { - "epoch": 0.92, - "learning_rate": 0.0001619501440384237, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.00022907115695174204, + "loss": 0.0162, "step": 182420 }, { - "epoch": 0.92, - "learning_rate": 0.00016194257634540967, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022906726873537058, + "loss": 0.0189, "step": 182430 }, { - "epoch": 0.92, - "learning_rate": 0.00016193500865239568, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002290633805189991, + "loss": 0.0238, "step": 182440 }, { - "epoch": 0.92, - "learning_rate": 0.00016192744095938166, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022905949230262764, + "loss": 0.0191, "step": 182450 }, { - "epoch": 0.92, - "learning_rate": 0.00016191987326636764, - "loss": 0.0128, + "epoch": 0.47, + "learning_rate": 0.00022905560408625618, + "loss": 0.0188, "step": 182460 }, { - "epoch": 0.92, - "learning_rate": 0.00016191230557335365, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022905171586988472, + "loss": 0.0178, "step": 182470 }, { - "epoch": 0.92, - "learning_rate": 0.00016190473788033963, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022904782765351323, + "loss": 0.0187, "step": 182480 }, { - "epoch": 0.92, - "learning_rate": 0.00016189717018732562, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.00022904393943714178, + "loss": 0.0183, "step": 182490 }, { - "epoch": 0.92, - "learning_rate": 0.0001618896024943116, - "loss": 0.0104, + "epoch": 0.47, + "learning_rate": 0.00022904005122077032, + "loss": 0.0165, "step": 182500 }, { - "epoch": 0.92, - "learning_rate": 0.0001618820348012976, - "loss": 0.0094, + "epoch": 0.47, + "learning_rate": 0.00022903616300439886, + "loss": 0.0174, "step": 182510 }, { - "epoch": 0.92, - "learning_rate": 0.0001618744671082836, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.00022903227478802737, + "loss": 0.0182, "step": 182520 }, { - "epoch": 0.92, - "learning_rate": 0.00016186689941526957, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022902838657165591, + "loss": 0.0147, "step": 182530 }, { - "epoch": 0.92, - "learning_rate": 0.00016185933172225558, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022902449835528446, + "loss": 0.0224, "step": 182540 }, { - "epoch": 0.92, - "learning_rate": 0.00016185176402924156, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.000229020610138913, + "loss": 0.0195, "step": 182550 }, { - "epoch": 0.92, - "learning_rate": 0.00016184419633622754, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.0002290167219225415, + "loss": 0.0169, "step": 182560 }, { - "epoch": 0.92, - "learning_rate": 0.00016183662864321355, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022901283370617005, + "loss": 0.0175, "step": 182570 }, { - "epoch": 0.92, - "learning_rate": 0.00016182906095019953, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.00022900894548979862, + "loss": 0.018, "step": 182580 }, { - "epoch": 0.92, - "learning_rate": 0.0001618214932571855, - "loss": 0.009, + "epoch": 0.47, + "learning_rate": 0.00022900505727342714, + "loss": 0.0183, "step": 182590 }, { - "epoch": 0.92, - "learning_rate": 0.00016181392556417152, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.00022900116905705568, + "loss": 0.015, "step": 182600 }, { - "epoch": 0.92, - "learning_rate": 0.0001618063578711575, - "loss": 0.0111, + "epoch": 0.47, + "learning_rate": 0.0002289972808406842, + "loss": 0.0247, "step": 182610 }, { - "epoch": 0.92, - "learning_rate": 0.00016179879017814348, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.0002289933926243127, + "loss": 0.0181, "step": 182620 }, { - "epoch": 0.92, - "learning_rate": 0.0001617912224851295, - "loss": 0.0121, + "epoch": 0.47, + "learning_rate": 0.00022898950440794128, + "loss": 0.0222, "step": 182630 }, { - "epoch": 0.92, - "learning_rate": 0.00016178365479211547, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022898561619156982, + "loss": 0.0157, "step": 182640 }, { - "epoch": 0.92, - "learning_rate": 0.00016177608709910145, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022898172797519833, + "loss": 0.0206, "step": 182650 }, { - "epoch": 0.92, - "learning_rate": 0.00016176851940608744, - "loss": 0.0107, + "epoch": 0.47, + "learning_rate": 0.00022897783975882687, + "loss": 0.0138, "step": 182660 }, { - "epoch": 0.92, - "learning_rate": 0.00016176095171307344, - "loss": 0.0109, + "epoch": 0.47, + "learning_rate": 0.00022897395154245542, + "loss": 0.0152, "step": 182670 }, { - "epoch": 0.92, - "learning_rate": 0.00016175338402005943, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022897006332608396, + "loss": 0.0162, "step": 182680 }, { - "epoch": 0.92, - "learning_rate": 0.0001617458163270454, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022896617510971247, + "loss": 0.0155, "step": 182690 }, { - "epoch": 0.92, - "learning_rate": 0.00016173824863403142, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022896228689334101, + "loss": 0.0163, "step": 182700 }, { - "epoch": 0.92, - "learning_rate": 0.0001617306809410174, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022895839867696956, + "loss": 0.0177, "step": 182710 }, { - "epoch": 0.92, - "learning_rate": 0.00016172311324800338, - "loss": 0.0114, + "epoch": 0.47, + "learning_rate": 0.0002289545104605981, + "loss": 0.0195, "step": 182720 }, { - "epoch": 0.92, - "learning_rate": 0.0001617155455549894, - "loss": 0.014, + "epoch": 0.47, + "learning_rate": 0.0002289506222442266, + "loss": 0.0182, "step": 182730 }, { - "epoch": 0.92, - "learning_rate": 0.00016170797786197537, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022894673402785515, + "loss": 0.0155, "step": 182740 }, { - "epoch": 0.92, - "learning_rate": 0.00016170041016896135, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022894284581148372, + "loss": 0.0166, "step": 182750 }, { - "epoch": 0.92, - "learning_rate": 0.00016169284247594736, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022893895759511224, + "loss": 0.0181, "step": 182760 }, { - "epoch": 0.92, - "learning_rate": 0.00016168527478293334, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.00022893506937874078, + "loss": 0.0217, "step": 182770 }, { - "epoch": 0.92, - "learning_rate": 0.00016167770708991932, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.0002289311811623693, + "loss": 0.0184, "step": 182780 }, { - "epoch": 0.92, - "learning_rate": 0.00016167013939690533, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022892729294599786, + "loss": 0.0147, "step": 182790 }, { - "epoch": 0.92, - "learning_rate": 0.0001616625717038913, - "loss": 0.0112, + "epoch": 0.47, + "learning_rate": 0.00022892340472962638, + "loss": 0.0178, "step": 182800 }, { - "epoch": 0.92, - "learning_rate": 0.0001616550040108773, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00022891951651325492, + "loss": 0.015, "step": 182810 }, { - "epoch": 0.92, - "learning_rate": 0.0001616474363178633, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.00022891562829688343, + "loss": 0.018, "step": 182820 }, { - "epoch": 0.92, - "learning_rate": 0.00016163986862484928, - "loss": 0.0122, + "epoch": 0.47, + "learning_rate": 0.000228911740080512, + "loss": 0.0191, "step": 182830 }, { - "epoch": 0.92, - "learning_rate": 0.00016163230093183526, - "loss": 0.01, + "epoch": 0.47, + "learning_rate": 0.00022890785186414052, + "loss": 0.0145, "step": 182840 }, { - "epoch": 0.92, - "learning_rate": 0.00016162473323882125, - "loss": 0.0095, + "epoch": 0.47, + "learning_rate": 0.00022890396364776906, + "loss": 0.0149, "step": 182850 }, { - "epoch": 0.92, - "learning_rate": 0.00016161716554580725, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022890007543139757, + "loss": 0.0203, "step": 182860 }, { - "epoch": 0.92, - "learning_rate": 0.00016160959785279324, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022889618721502611, + "loss": 0.0216, "step": 182870 }, { - "epoch": 0.92, - "learning_rate": 0.0001616020301597792, - "loss": 0.0093, + "epoch": 0.47, + "learning_rate": 0.00022889229899865466, + "loss": 0.0132, "step": 182880 }, { - "epoch": 0.92, - "learning_rate": 0.00016159446246676517, - "loss": 0.0098, + "epoch": 0.47, + "learning_rate": 0.0002288884107822832, + "loss": 0.0192, "step": 182890 }, { - "epoch": 0.92, - "learning_rate": 0.00016158689477375118, - "loss": 0.0131, + "epoch": 0.47, + "learning_rate": 0.0002288845225659117, + "loss": 0.0156, "step": 182900 }, { - "epoch": 0.92, - "learning_rate": 0.00016157932708073716, - "loss": 0.0083, + "epoch": 0.47, + "learning_rate": 0.00022888063434954025, + "loss": 0.0163, "step": 182910 }, { - "epoch": 0.92, - "learning_rate": 0.00016157175938772314, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022887674613316882, + "loss": 0.0152, "step": 182920 }, { - "epoch": 0.92, - "learning_rate": 0.00016156419169470915, - "loss": 0.0119, + "epoch": 0.47, + "learning_rate": 0.00022887285791679734, + "loss": 0.0204, "step": 182930 }, { - "epoch": 0.92, - "learning_rate": 0.00016155662400169513, - "loss": 0.0091, + "epoch": 0.47, + "learning_rate": 0.00022886896970042585, + "loss": 0.0181, "step": 182940 }, { - "epoch": 0.92, - "learning_rate": 0.00016154905630868111, - "loss": 0.0129, - "step": 182950 + "epoch": 0.47, + "learning_rate": 0.0002288650814840544, + "loss": 0.0182, + "step": 182950 }, { - "epoch": 0.92, - "learning_rate": 0.00016154148861566712, - "loss": 0.012, + "epoch": 0.47, + "learning_rate": 0.00022886119326768296, + "loss": 0.0229, "step": 182960 }, { - "epoch": 0.92, - "learning_rate": 0.0001615339209226531, - "loss": 0.0135, + "epoch": 0.47, + "learning_rate": 0.00022885730505131148, + "loss": 0.0249, "step": 182970 }, { - "epoch": 0.92, - "learning_rate": 0.00016152635322963909, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022885341683494002, + "loss": 0.0163, "step": 182980 }, { - "epoch": 0.92, - "learning_rate": 0.0001615187855366251, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022884952861856853, + "loss": 0.0155, "step": 182990 }, { - "epoch": 0.92, - "learning_rate": 0.00016151121784361108, - "loss": 0.0101, + "epoch": 0.47, + "learning_rate": 0.0002288456404021971, + "loss": 0.0191, "step": 183000 }, { - "epoch": 0.92, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.00819355621933937, - "eval_runtime": 116.6466, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.286, + "epoch": 0.47, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.012429905124008656, + "eval_runtime": 108.0004, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.63, "step": 183000 }, { - "epoch": 0.92, - "learning_rate": 0.00016150365015059706, - "loss": 0.0082, + "epoch": 0.47, + "learning_rate": 0.00022884175218582562, + "loss": 0.0171, "step": 183010 }, { - "epoch": 0.92, - "learning_rate": 0.00016149608245758307, - "loss": 0.0146, + "epoch": 0.47, + "learning_rate": 0.00022883786396945416, + "loss": 0.0166, "step": 183020 }, { - "epoch": 0.92, - "learning_rate": 0.00016148851476456905, - "loss": 0.0106, + "epoch": 0.47, + "learning_rate": 0.00022883397575308267, + "loss": 0.016, "step": 183030 }, { - "epoch": 0.92, - "learning_rate": 0.00016148094707155503, - "loss": 0.0108, + "epoch": 0.47, + "learning_rate": 0.00022883008753671124, + "loss": 0.0215, "step": 183040 }, { - "epoch": 0.92, - "learning_rate": 0.000161473379378541, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022882619932033975, + "loss": 0.0163, "step": 183050 }, { - "epoch": 0.92, - "learning_rate": 0.00016146581168552702, - "loss": 0.0125, + "epoch": 0.47, + "learning_rate": 0.0002288223111039683, + "loss": 0.0202, "step": 183060 }, { - "epoch": 0.92, - "learning_rate": 0.000161458243992513, - "loss": 0.0097, + "epoch": 0.47, + "learning_rate": 0.0002288184228875968, + "loss": 0.0281, "step": 183070 }, { - "epoch": 0.92, - "learning_rate": 0.00016145067629949898, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022881453467122538, + "loss": 0.0182, "step": 183080 }, { - "epoch": 0.92, - "learning_rate": 0.000161443108606485, - "loss": 0.0116, + "epoch": 0.47, + "learning_rate": 0.0002288106464548539, + "loss": 0.0171, "step": 183090 }, { - "epoch": 0.92, - "learning_rate": 0.00016143554091347097, - "loss": 0.0129, + "epoch": 0.47, + "learning_rate": 0.00022880675823848244, + "loss": 0.0202, "step": 183100 }, { - "epoch": 0.92, - "learning_rate": 0.00016142797322045695, - "loss": 0.0113, + "epoch": 0.47, + "learning_rate": 0.00022880287002211095, + "loss": 0.0167, "step": 183110 }, { - "epoch": 0.92, - "learning_rate": 0.00016142040552744296, - "loss": 0.0136, + "epoch": 0.47, + "learning_rate": 0.0002287989818057395, + "loss": 0.0193, "step": 183120 }, { - "epoch": 0.92, - "learning_rate": 0.00016141283783442894, - "loss": 0.0117, + "epoch": 0.47, + "learning_rate": 0.00022879509358936806, + "loss": 0.0147, "step": 183130 }, { - "epoch": 0.92, - "learning_rate": 0.00016140527014141492, - "loss": 0.0092, + "epoch": 0.47, + "learning_rate": 0.00022879120537299658, + "loss": 0.0162, "step": 183140 }, { - "epoch": 0.92, - "learning_rate": 0.00016139770244840093, - "loss": 0.0105, + "epoch": 0.47, + "learning_rate": 0.00022878731715662512, + "loss": 0.0167, "step": 183150 }, { - "epoch": 0.92, - "learning_rate": 0.00016139013475538691, - "loss": 0.0102, + "epoch": 0.47, + "learning_rate": 0.00022878342894025363, + "loss": 0.0168, "step": 183160 }, { - "epoch": 0.92, - "learning_rate": 0.0001613825670623729, - "loss": 0.0096, + "epoch": 0.47, + "learning_rate": 0.0002287795407238822, + "loss": 0.0169, "step": 183170 }, { - "epoch": 0.92, - "learning_rate": 0.0001613749993693589, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022877565250751071, + "loss": 0.0151, "step": 183180 }, { - "epoch": 0.92, - "learning_rate": 0.00016136743167634489, - "loss": 0.011, + "epoch": 0.47, + "learning_rate": 0.00022877176429113926, + "loss": 0.0224, "step": 183190 }, { - "epoch": 0.92, - "learning_rate": 0.00016135986398333087, - "loss": 0.0123, + "epoch": 0.47, + "learning_rate": 0.00022876787607476777, + "loss": 0.0184, "step": 183200 }, { - "epoch": 0.92, - "learning_rate": 0.00016135229629031688, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022876398785839634, + "loss": 0.0187, "step": 183210 }, { - "epoch": 0.92, - "learning_rate": 0.00016134472859730286, - "loss": 0.0118, + "epoch": 0.47, + "learning_rate": 0.00022876009964202485, + "loss": 0.0183, "step": 183220 }, { - "epoch": 0.92, - "learning_rate": 0.00016133716090428884, - "loss": 0.0127, + "epoch": 0.47, + "learning_rate": 0.0002287562114256534, + "loss": 0.0135, "step": 183230 }, { - "epoch": 0.92, - "learning_rate": 0.00016132959321127482, - "loss": 0.0103, + "epoch": 0.47, + "learning_rate": 0.0002287523232092819, + "loss": 0.0153, "step": 183240 }, { - "epoch": 0.92, - "learning_rate": 0.00016132202551826083, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022874843499291048, + "loss": 0.0201, "step": 183250 }, { - "epoch": 0.92, - "learning_rate": 0.0001613144578252468, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.000228744546776539, + "loss": 0.0169, "step": 183260 }, { - "epoch": 0.92, - "learning_rate": 0.0001613068901322328, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022874065856016754, + "loss": 0.0157, "step": 183270 }, { - "epoch": 0.92, - "learning_rate": 0.0001612993224392188, - "loss": 0.0092, + "epoch": 0.48, + "learning_rate": 0.00022873677034379605, + "loss": 0.0244, "step": 183280 }, { - "epoch": 0.92, - "learning_rate": 0.00016129175474620478, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022873288212742462, + "loss": 0.0182, "step": 183290 }, { - "epoch": 0.92, - "learning_rate": 0.00016128418705319076, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022872899391105316, + "loss": 0.0175, "step": 183300 }, { - "epoch": 0.92, - "learning_rate": 0.00016127661936017677, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022872510569468167, + "loss": 0.0234, "step": 183310 }, { - "epoch": 0.92, - "learning_rate": 0.00016126905166716275, - "loss": 0.0088, + "epoch": 0.48, + "learning_rate": 0.00022872121747831022, + "loss": 0.0155, "step": 183320 }, { - "epoch": 0.92, - "learning_rate": 0.00016126148397414873, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022871732926193876, + "loss": 0.018, "step": 183330 }, { - "epoch": 0.92, - "learning_rate": 0.00016125391628113474, - "loss": 0.015, + "epoch": 0.48, + "learning_rate": 0.0002287134410455673, + "loss": 0.0234, "step": 183340 }, { - "epoch": 0.93, - "learning_rate": 0.00016124634858812072, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022870955282919581, + "loss": 0.017, "step": 183350 }, { - "epoch": 0.93, - "learning_rate": 0.0001612387808951067, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022870566461282436, + "loss": 0.0183, "step": 183360 }, { - "epoch": 0.93, - "learning_rate": 0.00016123121320209271, - "loss": 0.0171, + "epoch": 0.48, + "learning_rate": 0.00022870177639645287, + "loss": 0.0195, "step": 183370 }, { - "epoch": 0.93, - "learning_rate": 0.0001612236455090787, - "loss": 0.0222, + "epoch": 0.48, + "learning_rate": 0.00022869788818008144, + "loss": 0.0228, "step": 183380 }, { - "epoch": 0.93, - "learning_rate": 0.00016121607781606468, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022869399996370995, + "loss": 0.0192, "step": 183390 }, { - "epoch": 0.93, - "learning_rate": 0.00016120851012305066, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.0002286901117473385, + "loss": 0.0195, "step": 183400 }, { - "epoch": 0.93, - "learning_rate": 0.00016120094243003667, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.000228686223530967, + "loss": 0.0173, "step": 183410 }, { - "epoch": 0.93, - "learning_rate": 0.00016119337473702265, - "loss": 0.0157, + "epoch": 0.48, + "learning_rate": 0.00022868233531459558, + "loss": 0.0162, "step": 183420 }, { - "epoch": 0.93, - "learning_rate": 0.00016118580704400863, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.0002286784470982241, + "loss": 0.0242, "step": 183430 }, { - "epoch": 0.93, - "learning_rate": 0.00016117823935099464, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022867455888185263, + "loss": 0.0168, "step": 183440 }, { - "epoch": 0.93, - "learning_rate": 0.00016117067165798062, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.00022867067066548115, + "loss": 0.0153, "step": 183450 }, { - "epoch": 0.93, - "learning_rate": 0.0001611631039649666, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022866678244910972, + "loss": 0.0174, "step": 183460 }, { - "epoch": 0.93, - "learning_rate": 0.0001611555362719526, - "loss": 0.0089, + "epoch": 0.48, + "learning_rate": 0.00022866289423273826, + "loss": 0.0195, "step": 183470 }, { - "epoch": 0.93, - "learning_rate": 0.0001611479685789386, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022865900601636677, + "loss": 0.0162, "step": 183480 }, { - "epoch": 0.93, - "learning_rate": 0.00016114040088592457, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.0002286551177999953, + "loss": 0.0181, "step": 183490 }, { - "epoch": 0.93, - "learning_rate": 0.00016113283319291058, - "loss": 0.0132, + "epoch": 0.48, + "learning_rate": 0.00022865122958362386, + "loss": 0.0177, "step": 183500 }, { - "epoch": 0.93, - "learning_rate": 0.00016112526549989656, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.0002286473413672524, + "loss": 0.0165, "step": 183510 }, { - "epoch": 0.93, - "learning_rate": 0.00016111769780688254, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022864345315088091, + "loss": 0.0184, "step": 183520 }, { - "epoch": 0.93, - "learning_rate": 0.00016111013011386855, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022863956493450946, + "loss": 0.013, "step": 183530 }, { - "epoch": 0.93, - "learning_rate": 0.00016110256242085453, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.000228635676718138, + "loss": 0.0131, "step": 183540 }, { - "epoch": 0.93, - "learning_rate": 0.00016109499472784052, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022863178850176654, + "loss": 0.0182, "step": 183550 }, { - "epoch": 0.93, - "learning_rate": 0.0001610874270348265, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022862790028539505, + "loss": 0.0162, "step": 183560 }, { - "epoch": 0.93, - "learning_rate": 0.0001610798593418125, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002286240120690236, + "loss": 0.019, "step": 183570 }, { - "epoch": 0.93, - "learning_rate": 0.0001610722916487985, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.00022862012385265214, + "loss": 0.0154, "step": 183580 }, { - "epoch": 0.93, - "learning_rate": 0.00016106472395578447, - "loss": 0.0158, + "epoch": 0.48, + "learning_rate": 0.00022861623563628068, + "loss": 0.0169, "step": 183590 }, { - "epoch": 0.93, - "learning_rate": 0.00016105715626277048, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.0002286123474199092, + "loss": 0.0188, "step": 183600 }, { - "epoch": 0.93, - "learning_rate": 0.00016104958856975646, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022860845920353773, + "loss": 0.0161, "step": 183610 }, { - "epoch": 0.93, - "learning_rate": 0.00016104202087674244, - "loss": 0.0147, + "epoch": 0.48, + "learning_rate": 0.00022860457098716625, + "loss": 0.0177, "step": 183620 }, { - "epoch": 0.93, - "learning_rate": 0.00016103445318372845, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022860068277079482, + "loss": 0.0164, "step": 183630 }, { - "epoch": 0.93, - "learning_rate": 0.00016102688549071443, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022859679455442336, + "loss": 0.0157, "step": 183640 }, { - "epoch": 0.93, - "learning_rate": 0.0001610193177977004, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022859290633805187, + "loss": 0.0148, "step": 183650 }, { - "epoch": 0.93, - "learning_rate": 0.00016101175010468642, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.0002285890181216804, + "loss": 0.0167, "step": 183660 }, { - "epoch": 0.93, - "learning_rate": 0.0001610041824116724, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022858512990530896, + "loss": 0.0178, "step": 183670 }, { - "epoch": 0.93, - "learning_rate": 0.00016099661471865838, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002285812416889375, + "loss": 0.017, "step": 183680 }, { - "epoch": 0.93, - "learning_rate": 0.0001609890470256444, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.000228577353472566, + "loss": 0.02, "step": 183690 }, { - "epoch": 0.93, - "learning_rate": 0.00016098147933263037, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022857346525619455, + "loss": 0.0153, "step": 183700 }, { - "epoch": 0.93, - "learning_rate": 0.00016097391163961635, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002285695770398231, + "loss": 0.0185, "step": 183710 }, { - "epoch": 0.93, - "learning_rate": 0.00016096634394660236, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022856568882345164, + "loss": 0.0247, "step": 183720 }, { - "epoch": 0.93, - "learning_rate": 0.00016095877625358834, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022856180060708015, + "loss": 0.0234, "step": 183730 }, { - "epoch": 0.93, - "learning_rate": 0.00016095120856057433, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002285579123907087, + "loss": 0.018, "step": 183740 }, { - "epoch": 0.93, - "learning_rate": 0.0001609436408675603, - "loss": 0.014, + "epoch": 0.48, + "learning_rate": 0.00022855402417433724, + "loss": 0.019, "step": 183750 }, { - "epoch": 0.93, - "learning_rate": 0.00016093607317454632, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022855013595796578, + "loss": 0.0157, "step": 183760 }, { - "epoch": 0.93, - "learning_rate": 0.0001609285054815323, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002285462477415943, + "loss": 0.021, "step": 183770 }, { - "epoch": 0.93, - "learning_rate": 0.00016092093778851828, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022854235952522283, + "loss": 0.0217, "step": 183780 }, { - "epoch": 0.93, - "learning_rate": 0.0001609133700955043, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.0002285384713088514, + "loss": 0.0218, "step": 183790 }, { - "epoch": 0.93, - "learning_rate": 0.00016090580240249027, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022853458309247992, + "loss": 0.0271, "step": 183800 }, { - "epoch": 0.93, - "learning_rate": 0.00016089823470947625, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022853069487610843, + "loss": 0.0169, "step": 183810 }, { - "epoch": 0.93, - "learning_rate": 0.00016089066701646226, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022852680665973697, + "loss": 0.0187, "step": 183820 }, { - "epoch": 0.93, - "learning_rate": 0.00016088309932344824, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022852291844336554, + "loss": 0.0164, "step": 183830 }, { - "epoch": 0.93, - "learning_rate": 0.00016087553163043422, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022851903022699406, + "loss": 0.0224, "step": 183840 }, { - "epoch": 0.93, - "learning_rate": 0.00016086796393742023, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.0002285151420106226, + "loss": 0.0183, "step": 183850 }, { - "epoch": 0.93, - "learning_rate": 0.0001608603962444062, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.0002285112537942511, + "loss": 0.0151, "step": 183860 }, { - "epoch": 0.93, - "learning_rate": 0.0001608528285513922, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022850736557787965, + "loss": 0.0183, "step": 183870 }, { - "epoch": 0.93, - "learning_rate": 0.0001608452608583782, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.0002285034773615082, + "loss": 0.0229, "step": 183880 }, { - "epoch": 0.93, - "learning_rate": 0.00016083769316536418, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022849958914513674, + "loss": 0.0209, "step": 183890 }, { - "epoch": 0.93, - "learning_rate": 0.00016083012547235016, - "loss": 0.009, + "epoch": 0.48, + "learning_rate": 0.00022849570092876525, + "loss": 0.037, "step": 183900 }, { - "epoch": 0.93, - "learning_rate": 0.00016082255777933615, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002284918127123938, + "loss": 0.0236, "step": 183910 }, { - "epoch": 0.93, - "learning_rate": 0.00016081499008632215, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022848792449602234, + "loss": 0.0194, "step": 183920 }, { - "epoch": 0.93, - "learning_rate": 0.00016080742239330814, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022848403627965088, + "loss": 0.0197, "step": 183930 }, { - "epoch": 0.93, - "learning_rate": 0.00016079985470029412, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.0002284801480632794, + "loss": 0.0233, "step": 183940 }, { - "epoch": 0.93, - "learning_rate": 0.00016079228700728013, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.00022847625984690793, + "loss": 0.0178, "step": 183950 }, { - "epoch": 0.93, - "learning_rate": 0.0001607847193142661, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.00022847237163053647, + "loss": 0.0197, "step": 183960 }, { - "epoch": 0.93, - "learning_rate": 0.0001607771516212521, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022846848341416502, + "loss": 0.0154, "step": 183970 }, { - "epoch": 0.93, - "learning_rate": 0.0001607695839282381, - "loss": 0.0076, + "epoch": 0.48, + "learning_rate": 0.00022846459519779353, + "loss": 0.0155, "step": 183980 }, { - "epoch": 0.93, - "learning_rate": 0.00016076201623522408, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022846070698142207, + "loss": 0.0206, "step": 183990 }, { - "epoch": 0.93, - "learning_rate": 0.00016075444854221006, - "loss": 0.0133, + "epoch": 0.48, + "learning_rate": 0.00022845681876505064, + "loss": 0.021, "step": 184000 }, { - "epoch": 0.93, - "eval_cer": 0.9144731670915385, - "eval_loss": 0.00799303688108921, - "eval_runtime": 116.5635, - "eval_samples_per_second": 17.158, - "eval_steps_per_second": 4.29, + "epoch": 0.48, + "eval_cer": 0.8817712685329425, + "eval_loss": 0.012564102187752724, + "eval_runtime": 108.043, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, "step": 184000 }, { - "epoch": 0.93, - "learning_rate": 0.00016074688084919607, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022845293054867916, + "loss": 0.0193, "step": 184010 }, { - "epoch": 0.93, - "learning_rate": 0.00016073931315618205, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002284490423323077, + "loss": 0.0184, "step": 184020 }, { - "epoch": 0.93, - "learning_rate": 0.00016073174546316803, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.0002284451541159362, + "loss": 0.0251, "step": 184030 }, { - "epoch": 0.93, - "learning_rate": 0.00016072417777015404, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022844126589956478, + "loss": 0.0248, "step": 184040 }, { - "epoch": 0.93, - "learning_rate": 0.00016071661007714002, - "loss": 0.0088, + "epoch": 0.48, + "learning_rate": 0.0002284373776831933, + "loss": 0.0146, "step": 184050 }, { - "epoch": 0.93, - "learning_rate": 0.000160709042384126, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022843348946682184, + "loss": 0.0184, "step": 184060 }, { - "epoch": 0.93, - "learning_rate": 0.00016070147469111198, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022842960125045035, + "loss": 0.0198, "step": 184070 }, { - "epoch": 0.93, - "learning_rate": 0.000160693906998098, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022842571303407892, + "loss": 0.0143, "step": 184080 }, { - "epoch": 0.93, - "learning_rate": 0.00016068633930508397, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022842182481770743, + "loss": 0.0214, "step": 184090 }, { - "epoch": 0.93, - "learning_rate": 0.00016067877161206996, - "loss": 0.0156, + "epoch": 0.48, + "learning_rate": 0.00022841793660133598, + "loss": 0.0181, "step": 184100 }, { - "epoch": 0.93, - "learning_rate": 0.00016067120391905596, - "loss": 0.0137, + "epoch": 0.48, + "learning_rate": 0.0002284140483849645, + "loss": 0.0179, "step": 184110 }, { - "epoch": 0.93, - "learning_rate": 0.00016066363622604195, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022841016016859303, + "loss": 0.0183, "step": 184120 }, { - "epoch": 0.93, - "learning_rate": 0.00016065606853302793, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022840627195222157, + "loss": 0.0171, "step": 184130 }, { - "epoch": 0.93, - "learning_rate": 0.00016064850084001388, - "loss": 0.0084, + "epoch": 0.48, + "learning_rate": 0.00022840238373585012, + "loss": 0.0186, "step": 184140 }, { - "epoch": 0.93, - "learning_rate": 0.0001606409331469999, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022839849551947863, + "loss": 0.0143, "step": 184150 }, { - "epoch": 0.93, - "learning_rate": 0.00016063336545398587, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022839460730310717, + "loss": 0.0148, "step": 184160 }, { - "epoch": 0.93, - "learning_rate": 0.00016062579776097185, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022839071908673574, + "loss": 0.0158, "step": 184170 }, { - "epoch": 0.93, - "learning_rate": 0.00016061823006795786, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.00022838683087036426, + "loss": 0.0134, "step": 184180 }, { - "epoch": 0.93, - "learning_rate": 0.00016061066237494384, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002283829426539928, + "loss": 0.0179, "step": 184190 }, { - "epoch": 0.93, - "learning_rate": 0.00016060309468192982, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.0002283790544376213, + "loss": 0.017, "step": 184200 }, { - "epoch": 0.93, - "learning_rate": 0.00016059552698891583, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022837516622124988, + "loss": 0.0172, "step": 184210 }, { - "epoch": 0.93, - "learning_rate": 0.00016058795929590181, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002283712780048784, + "loss": 0.016, "step": 184220 }, { - "epoch": 0.93, - "learning_rate": 0.0001605803916028878, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022836738978850694, + "loss": 0.0148, "step": 184230 }, { - "epoch": 0.93, - "learning_rate": 0.0001605728239098738, - "loss": 0.0124, + "epoch": 0.48, + "learning_rate": 0.00022836350157213545, + "loss": 0.0182, "step": 184240 }, { - "epoch": 0.93, - "learning_rate": 0.00016056525621685979, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022835961335576402, + "loss": 0.0172, "step": 184250 }, { - "epoch": 0.93, - "learning_rate": 0.00016055768852384577, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.00022835572513939253, + "loss": 0.0159, "step": 184260 }, { - "epoch": 0.93, - "learning_rate": 0.00016055012083083178, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.00022835183692302108, + "loss": 0.0164, "step": 184270 }, { - "epoch": 0.93, - "learning_rate": 0.00016054255313781776, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002283479487066496, + "loss": 0.0224, "step": 184280 }, { - "epoch": 0.93, - "learning_rate": 0.00016053498544480374, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022834406049027816, + "loss": 0.0218, "step": 184290 }, { - "epoch": 0.93, - "learning_rate": 0.00016052741775178972, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022834017227390667, + "loss": 0.0139, "step": 184300 }, { - "epoch": 0.93, - "learning_rate": 0.00016051985005877573, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022833628405753522, + "loss": 0.0212, "step": 184310 }, { - "epoch": 0.93, - "learning_rate": 0.0001605122823657617, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022833239584116373, + "loss": 0.0153, "step": 184320 }, { - "epoch": 0.93, - "learning_rate": 0.0001605047146727477, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.0002283285076247923, + "loss": 0.02, "step": 184330 }, { - "epoch": 0.93, - "learning_rate": 0.0001604971469797337, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022832461940842084, + "loss": 0.0202, "step": 184340 }, { - "epoch": 0.93, - "learning_rate": 0.00016048957928671968, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022832073119204935, + "loss": 0.0225, "step": 184350 }, { - "epoch": 0.93, - "learning_rate": 0.00016048201159370566, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002283168429756779, + "loss": 0.022, "step": 184360 }, { - "epoch": 0.93, - "learning_rate": 0.00016047444390069167, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.0002283129547593064, + "loss": 0.0142, "step": 184370 }, { - "epoch": 0.93, - "learning_rate": 0.00016046687620767765, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.00022830906654293498, + "loss": 0.0177, "step": 184380 }, { - "epoch": 0.93, - "learning_rate": 0.00016045930851466363, - "loss": 0.0134, + "epoch": 0.48, + "learning_rate": 0.0002283051783265635, + "loss": 0.0173, "step": 184390 }, { - "epoch": 0.93, - "learning_rate": 0.00016045174082164964, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.00022830129011019204, + "loss": 0.0153, "step": 184400 }, { - "epoch": 0.93, - "learning_rate": 0.00016044417312863562, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022829740189382055, + "loss": 0.0197, "step": 184410 }, { - "epoch": 0.93, - "learning_rate": 0.0001604366054356216, - "loss": 0.0129, + "epoch": 0.48, + "learning_rate": 0.00022829351367744912, + "loss": 0.0178, "step": 184420 }, { - "epoch": 0.93, - "learning_rate": 0.00016042903774260761, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022828962546107763, + "loss": 0.0172, "step": 184430 }, { - "epoch": 0.93, - "learning_rate": 0.0001604214700495936, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022828573724470618, + "loss": 0.0153, "step": 184440 }, { - "epoch": 0.93, - "learning_rate": 0.00016041390235657958, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.0002282818490283347, + "loss": 0.0195, "step": 184450 }, { - "epoch": 0.93, - "learning_rate": 0.00016040633466356556, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022827796081196326, + "loss": 0.0173, "step": 184460 }, { - "epoch": 0.93, - "learning_rate": 0.00016039876697055157, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022827407259559177, + "loss": 0.017, "step": 184470 }, { - "epoch": 0.93, - "learning_rate": 0.00016039119927753755, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022827018437922031, + "loss": 0.0178, "step": 184480 }, { - "epoch": 0.93, - "learning_rate": 0.00016038363158452353, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022826629616284883, + "loss": 0.0128, "step": 184490 }, { - "epoch": 0.93, - "learning_rate": 0.00016037606389150954, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.0002282624079464774, + "loss": 0.0185, "step": 184500 }, { - "epoch": 0.93, - "learning_rate": 0.00016036849619849552, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022825851973010594, + "loss": 0.0255, "step": 184510 }, { - "epoch": 0.93, - "learning_rate": 0.0001603609285054815, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022825463151373445, + "loss": 0.0163, "step": 184520 }, { - "epoch": 0.93, - "learning_rate": 0.0001603533608124675, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022825074329736297, + "loss": 0.0171, "step": 184530 }, { - "epoch": 0.93, - "learning_rate": 0.0001603457931194535, - "loss": 0.0141, + "epoch": 0.48, + "learning_rate": 0.00022824685508099154, + "loss": 0.0155, "step": 184540 }, { - "epoch": 0.93, - "learning_rate": 0.00016033822542643947, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022824296686462008, + "loss": 0.0167, "step": 184550 }, { - "epoch": 0.93, - "learning_rate": 0.00016033065773342548, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.0002282390786482486, + "loss": 0.015, "step": 184560 }, { - "epoch": 0.93, - "learning_rate": 0.00016032309004041146, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022823519043187714, + "loss": 0.021, "step": 184570 }, { - "epoch": 0.93, - "learning_rate": 0.00016031552234739744, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.00022823130221550568, + "loss": 0.0172, "step": 184580 }, { - "epoch": 0.93, - "learning_rate": 0.00016030795465438345, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022822741399913422, + "loss": 0.0199, "step": 184590 }, { - "epoch": 0.93, - "learning_rate": 0.00016030038696136943, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.00022822352578276273, + "loss": 0.0155, "step": 184600 }, { - "epoch": 0.93, - "learning_rate": 0.00016029281926835542, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.00022821963756639127, + "loss": 0.0175, "step": 184610 }, { - "epoch": 0.93, - "learning_rate": 0.00016028525157534142, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.0002282157493500198, + "loss": 0.0205, "step": 184620 }, { - "epoch": 0.93, - "learning_rate": 0.0001602776838823274, - "loss": 0.0155, + "epoch": 0.48, + "learning_rate": 0.00022821186113364836, + "loss": 0.0183, "step": 184630 }, { - "epoch": 0.93, - "learning_rate": 0.0001602701161893134, - "loss": 0.0135, + "epoch": 0.48, + "learning_rate": 0.00022820797291727687, + "loss": 0.0179, "step": 184640 }, { - "epoch": 0.93, - "learning_rate": 0.00016026254849629937, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022820408470090541, + "loss": 0.0165, "step": 184650 }, { - "epoch": 0.93, - "learning_rate": 0.00016025498080328538, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022820019648453393, + "loss": 0.0177, "step": 184660 }, { - "epoch": 0.93, - "learning_rate": 0.00016024741311027136, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.0002281963082681625, + "loss": 0.0197, "step": 184670 }, { - "epoch": 0.93, - "learning_rate": 0.00016023984541725734, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.000228192420051791, + "loss": 0.0217, "step": 184680 }, { - "epoch": 0.93, - "learning_rate": 0.00016023227772424335, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022818853183541955, + "loss": 0.018, "step": 184690 }, { - "epoch": 0.93, - "learning_rate": 0.00016022471003122933, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022818464361904807, + "loss": 0.0169, "step": 184700 }, { - "epoch": 0.93, - "learning_rate": 0.0001602171423382153, - "loss": 0.0085, + "epoch": 0.48, + "learning_rate": 0.00022818075540267664, + "loss": 0.0159, "step": 184710 }, { - "epoch": 0.93, - "learning_rate": 0.00016020957464520132, - "loss": 0.0135, + "epoch": 0.48, + "learning_rate": 0.00022817686718630518, + "loss": 0.0168, "step": 184720 }, { - "epoch": 0.93, - "learning_rate": 0.0001602020069521873, - "loss": 0.0145, + "epoch": 0.48, + "learning_rate": 0.0002281729789699337, + "loss": 0.0214, "step": 184730 }, { - "epoch": 0.93, - "learning_rate": 0.00016019443925917328, - "loss": 0.0088, + "epoch": 0.48, + "learning_rate": 0.00022816909075356223, + "loss": 0.02, "step": 184740 }, { - "epoch": 0.93, - "learning_rate": 0.0001601868715661593, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022816520253719078, + "loss": 0.0169, "step": 184750 }, { - "epoch": 0.93, - "learning_rate": 0.00016017930387314527, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022816131432081932, + "loss": 0.0211, "step": 184760 }, { - "epoch": 0.93, - "learning_rate": 0.00016017173618013125, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022815742610444783, + "loss": 0.0156, "step": 184770 }, { - "epoch": 0.93, - "learning_rate": 0.00016016416848711726, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022815353788807637, + "loss": 0.0216, "step": 184780 }, { - "epoch": 0.93, - "learning_rate": 0.00016015660079410324, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022814964967170492, + "loss": 0.019, "step": 184790 }, { - "epoch": 0.93, - "learning_rate": 0.00016014903310108923, - "loss": 0.0148, + "epoch": 0.48, + "learning_rate": 0.00022814576145533346, + "loss": 0.0187, "step": 184800 }, { - "epoch": 0.93, - "learning_rate": 0.0001601414654080752, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022814187323896197, + "loss": 0.0188, "step": 184810 }, { - "epoch": 0.93, - "learning_rate": 0.00016013389771506122, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.0002281379850225905, + "loss": 0.0161, "step": 184820 }, { - "epoch": 0.93, - "learning_rate": 0.0001601263300220472, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022813409680621908, + "loss": 0.0196, "step": 184830 }, { - "epoch": 0.93, - "learning_rate": 0.00016011876232903318, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.0002281302085898476, + "loss": 0.0189, "step": 184840 }, { - "epoch": 0.93, - "learning_rate": 0.0001601111946360192, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002281263203734761, + "loss": 0.0225, "step": 184850 }, { - "epoch": 0.93, - "learning_rate": 0.00016010362694300517, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022812243215710465, + "loss": 0.0191, "step": 184860 }, { - "epoch": 0.93, - "learning_rate": 0.00016009605924999115, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022811854394073317, + "loss": 0.0166, "step": 184870 }, { - "epoch": 0.93, - "learning_rate": 0.00016008849155697716, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.00022811465572436174, + "loss": 0.0141, "step": 184880 }, { - "epoch": 0.93, - "learning_rate": 0.00016008092386396314, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.00022811076750799028, + "loss": 0.0202, "step": 184890 }, { - "epoch": 0.93, - "learning_rate": 0.00016007335617094912, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.0002281068792916188, + "loss": 0.0207, "step": 184900 }, { - "epoch": 0.93, - "learning_rate": 0.00016006578847793513, - "loss": 0.0155, + "epoch": 0.48, + "learning_rate": 0.00022810299107524733, + "loss": 0.0214, "step": 184910 }, { - "epoch": 0.93, - "learning_rate": 0.0001600582207849211, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022809910285887588, + "loss": 0.0155, "step": 184920 }, { - "epoch": 0.93, - "learning_rate": 0.0001600506530919071, - "loss": 0.0155, + "epoch": 0.48, + "learning_rate": 0.00022809521464250442, + "loss": 0.0165, "step": 184930 }, { - "epoch": 0.93, - "learning_rate": 0.0001600430853988931, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022809132642613293, + "loss": 0.0167, "step": 184940 }, { - "epoch": 0.93, - "learning_rate": 0.00016003551770587908, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.00022808743820976147, + "loss": 0.016, "step": 184950 }, { - "epoch": 0.93, - "learning_rate": 0.00016002795001286506, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022808354999339002, + "loss": 0.0156, "step": 184960 }, { - "epoch": 0.93, - "learning_rate": 0.00016002038231985105, - "loss": 0.0149, + "epoch": 0.48, + "learning_rate": 0.00022807966177701856, + "loss": 0.025, "step": 184970 }, { - "epoch": 0.93, - "learning_rate": 0.00016001281462683705, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.00022807577356064707, + "loss": 0.018, "step": 184980 }, { - "epoch": 0.93, - "learning_rate": 0.00016000524693382304, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.0002280718853442756, + "loss": 0.0206, "step": 184990 }, { - "epoch": 0.93, - "learning_rate": 0.00015999767924080902, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022806799712790415, + "loss": 0.0197, "step": 185000 }, { - "epoch": 0.93, - "eval_cer": 0.914462492734159, - "eval_loss": 0.007860948331654072, - "eval_runtime": 116.6063, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.48, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.01203981600701809, + "eval_runtime": 108.1177, + "eval_samples_per_second": 18.498, + "eval_steps_per_second": 4.625, "step": 185000 }, { - "epoch": 0.93, - "learning_rate": 0.00015999011154779503, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002280641089115327, + "loss": 0.0149, "step": 185010 }, { - "epoch": 0.93, - "learning_rate": 0.000159982543854781, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.0002280602206951612, + "loss": 0.0135, "step": 185020 }, { - "epoch": 0.93, - "learning_rate": 0.000159974976161767, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.00022805633247878975, + "loss": 0.0166, "step": 185030 }, { - "epoch": 0.93, - "learning_rate": 0.000159967408468753, - "loss": 0.0079, + "epoch": 0.48, + "learning_rate": 0.00022805244426241832, + "loss": 0.0182, "step": 185040 }, { - "epoch": 0.93, - "learning_rate": 0.00015995984077573898, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.00022804855604604684, + "loss": 0.0178, "step": 185050 }, { - "epoch": 0.93, - "learning_rate": 0.00015995227308272496, - "loss": 0.0135, + "epoch": 0.48, + "learning_rate": 0.00022804466782967538, + "loss": 0.0176, "step": 185060 }, { - "epoch": 0.93, - "learning_rate": 0.00015994470538971097, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.0002280407796133039, + "loss": 0.0178, "step": 185070 }, { - "epoch": 0.93, - "learning_rate": 0.00015993713769669695, - "loss": 0.014, + "epoch": 0.48, + "learning_rate": 0.00022803689139693246, + "loss": 0.0207, "step": 185080 }, { - "epoch": 0.93, - "learning_rate": 0.00015992957000368293, - "loss": 0.0133, + "epoch": 0.48, + "learning_rate": 0.00022803300318056097, + "loss": 0.0163, "step": 185090 }, { - "epoch": 0.93, - "learning_rate": 0.00015992200231066894, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022802911496418952, + "loss": 0.017, "step": 185100 }, { - "epoch": 0.93, - "learning_rate": 0.00015991443461765492, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022802522674781803, + "loss": 0.0147, "step": 185110 }, { - "epoch": 0.93, - "learning_rate": 0.0001599068669246409, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022802133853144657, + "loss": 0.0204, "step": 185120 }, { - "epoch": 0.93, - "learning_rate": 0.00015989929923162688, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022801745031507511, + "loss": 0.0174, "step": 185130 }, { - "epoch": 0.93, - "learning_rate": 0.0001598917315386129, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022801356209870366, + "loss": 0.0138, "step": 185140 }, { - "epoch": 0.93, - "learning_rate": 0.00015988416384559887, - "loss": 0.0139, + "epoch": 0.48, + "learning_rate": 0.00022800967388233217, + "loss": 0.0171, "step": 185150 }, { - "epoch": 0.93, - "learning_rate": 0.00015987659615258486, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.0002280057856659607, + "loss": 0.0171, "step": 185160 }, { - "epoch": 0.93, - "learning_rate": 0.00015986902845957086, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022800189744958925, + "loss": 0.0173, "step": 185170 }, { - "epoch": 0.93, - "learning_rate": 0.00015986146076655685, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.0002279980092332178, + "loss": 0.0207, "step": 185180 }, { - "epoch": 0.93, - "learning_rate": 0.00015985389307354283, - "loss": 0.0153, + "epoch": 0.48, + "learning_rate": 0.0002279941210168463, + "loss": 0.0171, "step": 185190 }, { - "epoch": 0.93, - "learning_rate": 0.00015984632538052884, - "loss": 0.0131, + "epoch": 0.48, + "learning_rate": 0.00022799023280047485, + "loss": 0.0227, "step": 185200 }, { - "epoch": 0.93, - "learning_rate": 0.00015983875768751482, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022798634458410342, + "loss": 0.0162, "step": 185210 }, { - "epoch": 0.93, - "learning_rate": 0.0001598311899945008, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022798245636773193, + "loss": 0.0169, "step": 185220 }, { - "epoch": 0.93, - "learning_rate": 0.0001598236223014868, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.00022797856815136048, + "loss": 0.0186, "step": 185230 }, { - "epoch": 0.93, - "learning_rate": 0.0001598160546084728, - "loss": 0.008, + "epoch": 0.48, + "learning_rate": 0.000227974679934989, + "loss": 0.0226, "step": 185240 }, { - "epoch": 0.93, - "learning_rate": 0.00015980848691545877, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022797079171861756, + "loss": 0.0177, "step": 185250 }, { - "epoch": 0.93, - "learning_rate": 0.00015980091922244478, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.00022796690350224607, + "loss": 0.0134, "step": 185260 }, { - "epoch": 0.93, - "learning_rate": 0.00015979335152943076, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022796301528587462, + "loss": 0.017, "step": 185270 }, { - "epoch": 0.93, - "learning_rate": 0.00015978578383641674, - "loss": 0.0146, + "epoch": 0.48, + "learning_rate": 0.00022795912706950313, + "loss": 0.0205, "step": 185280 }, { - "epoch": 0.93, - "learning_rate": 0.00015977821614340275, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.0002279552388531317, + "loss": 0.0156, "step": 185290 }, { - "epoch": 0.93, - "learning_rate": 0.00015977064845038873, - "loss": 0.0132, + "epoch": 0.48, + "learning_rate": 0.00022795135063676021, + "loss": 0.0201, "step": 185300 }, { - "epoch": 0.93, - "learning_rate": 0.0001597630807573747, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022794746242038876, + "loss": 0.0184, "step": 185310 }, { - "epoch": 0.93, - "learning_rate": 0.0001597555130643607, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022794357420401727, + "loss": 0.0169, "step": 185320 }, { - "epoch": 0.94, - "learning_rate": 0.0001597479453713467, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022793968598764584, + "loss": 0.0167, "step": 185330 }, { - "epoch": 0.94, - "learning_rate": 0.00015974037767833268, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022793579777127435, + "loss": 0.0174, "step": 185340 }, { - "epoch": 0.94, - "learning_rate": 0.00015973280998531867, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.0002279319095549029, + "loss": 0.0208, "step": 185350 }, { - "epoch": 0.94, - "learning_rate": 0.00015972524229230467, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002279280213385314, + "loss": 0.0157, "step": 185360 }, { - "epoch": 0.94, - "learning_rate": 0.00015971767459929066, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022792413312215995, + "loss": 0.017, "step": 185370 }, { - "epoch": 0.94, - "learning_rate": 0.00015971010690627664, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022792024490578852, + "loss": 0.0165, "step": 185380 }, { - "epoch": 0.94, - "learning_rate": 0.00015970253921326265, - "loss": 0.0129, + "epoch": 0.48, + "learning_rate": 0.00022791635668941703, + "loss": 0.0163, "step": 185390 }, { - "epoch": 0.94, - "learning_rate": 0.0001596949715202486, - "loss": 0.0131, + "epoch": 0.48, + "learning_rate": 0.00022791246847304555, + "loss": 0.0187, "step": 185400 }, { - "epoch": 0.94, - "learning_rate": 0.00015968740382723458, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002279085802566741, + "loss": 0.0163, "step": 185410 }, { - "epoch": 0.94, - "learning_rate": 0.00015967983613422056, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022790469204030266, + "loss": 0.0151, "step": 185420 }, { - "epoch": 0.94, - "learning_rate": 0.00015967226844120657, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022790080382393117, + "loss": 0.0153, "step": 185430 }, { - "epoch": 0.94, - "learning_rate": 0.00015966470074819255, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022789691560755972, + "loss": 0.0227, "step": 185440 }, { - "epoch": 0.94, - "learning_rate": 0.00015965713305517854, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022789302739118823, + "loss": 0.0177, "step": 185450 }, { - "epoch": 0.94, - "learning_rate": 0.00015964956536216454, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.0002278891391748168, + "loss": 0.0154, "step": 185460 }, { - "epoch": 0.94, - "learning_rate": 0.00015964199766915053, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002278852509584453, + "loss": 0.0246, "step": 185470 }, { - "epoch": 0.94, - "learning_rate": 0.0001596344299761365, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022788136274207385, + "loss": 0.0154, "step": 185480 }, { - "epoch": 0.94, - "learning_rate": 0.00015962686228312252, - "loss": 0.0096, - "step": 185490 + "epoch": 0.48, + "learning_rate": 0.00022787747452570237, + "loss": 0.0181, + "step": 185490 }, { - "epoch": 0.94, - "learning_rate": 0.0001596192945901085, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022787358630933094, + "loss": 0.0189, "step": 185500 }, { - "epoch": 0.94, - "learning_rate": 0.00015961172689709448, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022786969809295945, + "loss": 0.0256, "step": 185510 }, { - "epoch": 0.94, - "learning_rate": 0.00015960415920408046, - "loss": 0.0134, + "epoch": 0.48, + "learning_rate": 0.000227865809876588, + "loss": 0.0211, "step": 185520 }, { - "epoch": 0.94, - "learning_rate": 0.00015959659151106647, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002278619216602165, + "loss": 0.017, "step": 185530 }, { - "epoch": 0.94, - "learning_rate": 0.00015958902381805245, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022785803344384508, + "loss": 0.0169, "step": 185540 }, { - "epoch": 0.94, - "learning_rate": 0.00015958145612503843, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.0002278541452274736, + "loss": 0.0152, "step": 185550 }, { - "epoch": 0.94, - "learning_rate": 0.00015957388843202444, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022785025701110213, + "loss": 0.02, "step": 185560 }, { - "epoch": 0.94, - "learning_rate": 0.00015956632073901042, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.00022784636879473065, + "loss": 0.0194, "step": 185570 }, { - "epoch": 0.94, - "learning_rate": 0.0001595587530459964, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.00022784248057835922, + "loss": 0.0173, "step": 185580 }, { - "epoch": 0.94, - "learning_rate": 0.0001595511853529824, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022783859236198776, + "loss": 0.0182, "step": 185590 }, { - "epoch": 0.94, - "learning_rate": 0.0001595436176599684, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022783470414561627, + "loss": 0.0175, "step": 185600 }, { - "epoch": 0.94, - "learning_rate": 0.00015953604996695437, - "loss": 0.0132, + "epoch": 0.48, + "learning_rate": 0.00022783081592924481, + "loss": 0.0172, "step": 185610 }, { - "epoch": 0.94, - "learning_rate": 0.00015952848227394038, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022782692771287333, + "loss": 0.0182, "step": 185620 }, { - "epoch": 0.94, - "learning_rate": 0.00015952091458092636, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.0002278230394965019, + "loss": 0.0167, "step": 185630 }, { - "epoch": 0.94, - "learning_rate": 0.00015951334688791235, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.0002278191512801304, + "loss": 0.019, "step": 185640 }, { - "epoch": 0.94, - "learning_rate": 0.00015950577919489835, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022781526306375895, + "loss": 0.0182, "step": 185650 }, { - "epoch": 0.94, - "learning_rate": 0.00015949821150188434, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022781137484738747, + "loss": 0.0177, "step": 185660 }, { - "epoch": 0.94, - "learning_rate": 0.00015949064380887032, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022780748663101604, + "loss": 0.0154, "step": 185670 }, { - "epoch": 0.94, - "learning_rate": 0.00015948307611585633, - "loss": 0.0143, + "epoch": 0.48, + "learning_rate": 0.00022780359841464455, + "loss": 0.0215, "step": 185680 }, { - "epoch": 0.94, - "learning_rate": 0.0001594755084228423, - "loss": 0.0089, + "epoch": 0.48, + "learning_rate": 0.0002277997101982731, + "loss": 0.0165, "step": 185690 }, { - "epoch": 0.94, - "learning_rate": 0.0001594679407298283, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002277958219819016, + "loss": 0.019, "step": 185700 }, { - "epoch": 0.94, - "learning_rate": 0.00015946037303681427, - "loss": 0.0129, + "epoch": 0.48, + "learning_rate": 0.00022779193376553018, + "loss": 0.0186, "step": 185710 }, { - "epoch": 0.94, - "learning_rate": 0.00015945280534380028, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.0002277880455491587, + "loss": 0.0144, "step": 185720 }, { - "epoch": 0.94, - "learning_rate": 0.00015944523765078626, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.00022778415733278723, + "loss": 0.0182, "step": 185730 }, { - "epoch": 0.94, - "learning_rate": 0.00015943766995777224, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022778026911641575, + "loss": 0.0178, "step": 185740 }, { - "epoch": 0.94, - "learning_rate": 0.00015943010226475825, - "loss": 0.0141, + "epoch": 0.48, + "learning_rate": 0.00022777638090004432, + "loss": 0.0159, "step": 185750 }, { - "epoch": 0.94, - "learning_rate": 0.00015942253457174423, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022777249268367286, + "loss": 0.0205, "step": 185760 }, { - "epoch": 0.94, - "learning_rate": 0.0001594149668787302, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.00022776860446730137, + "loss": 0.017, "step": 185770 }, { - "epoch": 0.94, - "learning_rate": 0.00015940739918571622, - "loss": 0.0082, + "epoch": 0.48, + "learning_rate": 0.00022776471625092991, + "loss": 0.0225, "step": 185780 }, { - "epoch": 0.94, - "learning_rate": 0.0001593998314927022, - "loss": 0.0079, + "epoch": 0.48, + "learning_rate": 0.00022776082803455846, + "loss": 0.015, "step": 185790 }, { - "epoch": 0.94, - "learning_rate": 0.00015939226379968818, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.000227756939818187, + "loss": 0.0185, "step": 185800 }, { - "epoch": 0.94, - "learning_rate": 0.0001593846961066742, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.0002277530516018155, + "loss": 0.0193, "step": 185810 }, { - "epoch": 0.94, - "learning_rate": 0.00015937712841366017, - "loss": 0.0099, + "epoch": 0.48, + "learning_rate": 0.00022774916338544405, + "loss": 0.0139, "step": 185820 }, { - "epoch": 0.94, - "learning_rate": 0.00015936956072064616, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.0002277452751690726, + "loss": 0.0157, "step": 185830 }, { - "epoch": 0.94, - "learning_rate": 0.00015936199302763216, - "loss": 0.0145, + "epoch": 0.48, + "learning_rate": 0.00022774138695270114, + "loss": 0.016, "step": 185840 }, { - "epoch": 0.94, - "learning_rate": 0.00015935442533461815, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022773749873632965, + "loss": 0.0212, "step": 185850 }, { - "epoch": 0.94, - "learning_rate": 0.00015934685764160413, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.0002277336105199582, + "loss": 0.0161, "step": 185860 }, { - "epoch": 0.94, - "learning_rate": 0.0001593392899485901, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.0002277297223035867, + "loss": 0.017, "step": 185870 }, { - "epoch": 0.94, - "learning_rate": 0.00015933172225557612, - "loss": 0.0136, + "epoch": 0.48, + "learning_rate": 0.00022772583408721528, + "loss": 0.017, "step": 185880 }, { - "epoch": 0.94, - "learning_rate": 0.0001593241545625621, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.0002277219458708438, + "loss": 0.0168, "step": 185890 }, { - "epoch": 0.94, - "learning_rate": 0.00015931658686954808, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022771805765447233, + "loss": 0.0166, "step": 185900 }, { - "epoch": 0.94, - "learning_rate": 0.0001593090191765341, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022771416943810085, + "loss": 0.0174, "step": 185910 }, { - "epoch": 0.94, - "learning_rate": 0.00015930145148352007, - "loss": 0.0132, + "epoch": 0.48, + "learning_rate": 0.00022771028122172942, + "loss": 0.0178, "step": 185920 }, { - "epoch": 0.94, - "learning_rate": 0.00015929388379050605, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022770639300535796, + "loss": 0.0171, "step": 185930 }, { - "epoch": 0.94, - "learning_rate": 0.00015928631609749206, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022770250478898647, + "loss": 0.0175, "step": 185940 }, { - "epoch": 0.94, - "learning_rate": 0.00015927874840447804, - "loss": 0.0119, + "epoch": 0.48, + "learning_rate": 0.00022769861657261501, + "loss": 0.0173, "step": 185950 }, { - "epoch": 0.94, - "learning_rate": 0.00015927118071146402, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022769472835624356, + "loss": 0.018, "step": 185960 }, { - "epoch": 0.94, - "learning_rate": 0.00015926361301845003, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.0002276908401398721, + "loss": 0.0178, "step": 185970 }, { - "epoch": 0.94, - "learning_rate": 0.000159256045325436, - "loss": 0.0141, + "epoch": 0.48, + "learning_rate": 0.0002276869519235006, + "loss": 0.0134, "step": 185980 }, { - "epoch": 0.94, - "learning_rate": 0.000159248477632422, - "loss": 0.015, + "epoch": 0.48, + "learning_rate": 0.00022768306370712915, + "loss": 0.0168, "step": 185990 }, { - "epoch": 0.94, - "learning_rate": 0.000159240909939408, - "loss": 0.009, + "epoch": 0.48, + "learning_rate": 0.0002276791754907577, + "loss": 0.0172, "step": 186000 }, { - "epoch": 0.94, - "eval_cer": 0.9144770486760401, - "eval_loss": 0.007943259552121162, - "eval_runtime": 116.7604, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.48, + "eval_cer": 0.8818188561887047, + "eval_loss": 0.012164667248725891, + "eval_runtime": 107.6778, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, "step": 186000 }, { - "epoch": 0.94, - "learning_rate": 0.00015923334224639398, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022767528727438624, + "loss": 0.0175, "step": 186010 }, { - "epoch": 0.94, - "learning_rate": 0.00015922577455337997, - "loss": 0.0079, + "epoch": 0.48, + "learning_rate": 0.00022767139905801475, + "loss": 0.0145, "step": 186020 }, { - "epoch": 0.94, - "learning_rate": 0.00015921820686036595, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.0002276675108416433, + "loss": 0.0205, "step": 186030 }, { - "epoch": 0.94, - "learning_rate": 0.00015921063916735196, - "loss": 0.0144, + "epoch": 0.48, + "learning_rate": 0.00022766362262527183, + "loss": 0.0171, "step": 186040 }, { - "epoch": 0.94, - "learning_rate": 0.00015920307147433794, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022765973440890038, + "loss": 0.0157, "step": 186050 }, { - "epoch": 0.94, - "learning_rate": 0.00015919550378132392, - "loss": 0.0096, + "epoch": 0.48, + "learning_rate": 0.0002276558461925289, + "loss": 0.0181, "step": 186060 }, { - "epoch": 0.94, - "learning_rate": 0.00015918793608830993, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.00022765195797615743, + "loss": 0.0179, "step": 186070 }, { - "epoch": 0.94, - "learning_rate": 0.0001591803683952959, - "loss": 0.0161, + "epoch": 0.48, + "learning_rate": 0.00022764806975978595, + "loss": 0.0172, "step": 186080 }, { - "epoch": 0.94, - "learning_rate": 0.0001591728007022819, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022764418154341452, + "loss": 0.0225, "step": 186090 }, { - "epoch": 0.94, - "learning_rate": 0.0001591652330092679, - "loss": 0.0094, + "epoch": 0.48, + "learning_rate": 0.00022764029332704306, + "loss": 0.0223, "step": 186100 }, { - "epoch": 0.94, - "learning_rate": 0.00015915766531625388, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022763640511067157, + "loss": 0.0181, "step": 186110 }, { - "epoch": 0.94, - "learning_rate": 0.00015915009762323986, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022763251689430009, + "loss": 0.0131, "step": 186120 }, { - "epoch": 0.94, - "learning_rate": 0.00015914252993022587, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.00022762862867792865, + "loss": 0.0188, "step": 186130 }, { - "epoch": 0.94, - "learning_rate": 0.00015913496223721185, - "loss": 0.0088, + "epoch": 0.48, + "learning_rate": 0.0002276247404615572, + "loss": 0.0203, "step": 186140 }, { - "epoch": 0.94, - "learning_rate": 0.00015912739454419783, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.0002276208522451857, + "loss": 0.0185, "step": 186150 }, { - "epoch": 0.94, - "learning_rate": 0.00015911982685118384, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022761696402881425, + "loss": 0.0139, "step": 186160 }, { - "epoch": 0.94, - "learning_rate": 0.00015911225915816982, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.0002276130758124428, + "loss": 0.0175, "step": 186170 }, { - "epoch": 0.94, - "learning_rate": 0.0001591046914651558, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.00022760918759607134, + "loss": 0.0156, "step": 186180 }, { - "epoch": 0.94, - "learning_rate": 0.0001590971237721418, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022760529937969985, + "loss": 0.0221, "step": 186190 }, { - "epoch": 0.94, - "learning_rate": 0.0001590895560791278, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.0002276014111633284, + "loss": 0.0163, "step": 186200 }, { - "epoch": 0.94, - "learning_rate": 0.00015908198838611378, - "loss": 0.0102, + "epoch": 0.48, + "learning_rate": 0.00022759752294695693, + "loss": 0.0141, "step": 186210 }, { - "epoch": 0.94, - "learning_rate": 0.00015907442069309976, - "loss": 0.0135, + "epoch": 0.48, + "learning_rate": 0.00022759363473058548, + "loss": 0.0197, "step": 186220 }, { - "epoch": 0.94, - "learning_rate": 0.00015906685300008577, - "loss": 0.0086, + "epoch": 0.48, + "learning_rate": 0.000227589746514214, + "loss": 0.0169, "step": 186230 }, { - "epoch": 0.94, - "learning_rate": 0.00015905928530707175, - "loss": 0.0155, + "epoch": 0.48, + "learning_rate": 0.00022758585829784253, + "loss": 0.0183, "step": 186240 }, { - "epoch": 0.94, - "learning_rate": 0.00015905171761405773, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.0002275819700814711, + "loss": 0.0164, "step": 186250 }, { - "epoch": 0.94, - "learning_rate": 0.00015904414992104374, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.00022757808186509961, + "loss": 0.0191, "step": 186260 }, { - "epoch": 0.94, - "learning_rate": 0.00015903658222802972, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022757419364872813, + "loss": 0.016, "step": 186270 }, { - "epoch": 0.94, - "learning_rate": 0.0001590290145350157, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.00022757030543235667, + "loss": 0.0161, "step": 186280 }, { - "epoch": 0.94, - "learning_rate": 0.0001590214468420017, - "loss": 0.0091, + "epoch": 0.48, + "learning_rate": 0.00022756641721598524, + "loss": 0.0179, "step": 186290 }, { - "epoch": 0.94, - "learning_rate": 0.0001590138791489877, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.00022756252899961375, + "loss": 0.0165, "step": 186300 }, { - "epoch": 0.94, - "learning_rate": 0.00015900631145597367, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002275586407832423, + "loss": 0.0166, "step": 186310 }, { - "epoch": 0.94, - "learning_rate": 0.00015899874376295968, - "loss": 0.0112, + "epoch": 0.48, + "learning_rate": 0.0002275547525668708, + "loss": 0.0172, "step": 186320 }, { - "epoch": 0.94, - "learning_rate": 0.00015899117606994566, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022755086435049935, + "loss": 0.018, "step": 186330 }, { - "epoch": 0.94, - "learning_rate": 0.00015898360837693164, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.0002275469761341279, + "loss": 0.0174, "step": 186340 }, { - "epoch": 0.94, - "learning_rate": 0.00015897604068391765, - "loss": 0.0103, + "epoch": 0.48, + "learning_rate": 0.00022754308791775644, + "loss": 0.0177, "step": 186350 }, { - "epoch": 0.94, - "learning_rate": 0.00015896847299090363, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022753919970138495, + "loss": 0.0165, "step": 186360 }, { - "epoch": 0.94, - "learning_rate": 0.00015896090529788961, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.0002275353114850135, + "loss": 0.0153, "step": 186370 }, { - "epoch": 0.94, - "learning_rate": 0.0001589533376048756, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022753142326864203, + "loss": 0.0159, "step": 186380 }, { - "epoch": 0.94, - "learning_rate": 0.0001589457699118616, - "loss": 0.0124, + "epoch": 0.48, + "learning_rate": 0.00022752753505227057, + "loss": 0.0221, "step": 186390 }, { - "epoch": 0.94, - "learning_rate": 0.00015893820221884759, - "loss": 0.0153, + "epoch": 0.48, + "learning_rate": 0.0002275236468358991, + "loss": 0.019, "step": 186400 }, { - "epoch": 0.94, - "learning_rate": 0.00015893063452583357, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022751975861952763, + "loss": 0.0155, "step": 186410 }, { - "epoch": 0.94, - "learning_rate": 0.00015892306683281958, - "loss": 0.012, + "epoch": 0.48, + "learning_rate": 0.0002275158704031562, + "loss": 0.0136, "step": 186420 }, { - "epoch": 0.94, - "learning_rate": 0.00015891549913980556, - "loss": 0.009, + "epoch": 0.48, + "learning_rate": 0.00022751198218678471, + "loss": 0.0206, "step": 186430 }, { - "epoch": 0.94, - "learning_rate": 0.00015890793144679154, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022750809397041323, + "loss": 0.0208, "step": 186440 }, { - "epoch": 0.94, - "learning_rate": 0.00015890036375377755, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022750420575404177, + "loss": 0.0189, "step": 186450 }, { - "epoch": 0.94, - "learning_rate": 0.00015889279606076353, - "loss": 0.0138, + "epoch": 0.48, + "learning_rate": 0.00022750031753767034, + "loss": 0.0209, "step": 186460 }, { - "epoch": 0.94, - "learning_rate": 0.0001588852283677495, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.00022749642932129885, + "loss": 0.0167, "step": 186470 }, { - "epoch": 0.94, - "learning_rate": 0.00015887766067473552, - "loss": 0.0121, + "epoch": 0.48, + "learning_rate": 0.0002274925411049274, + "loss": 0.0181, "step": 186480 }, { - "epoch": 0.94, - "learning_rate": 0.0001588700929817215, - "loss": 0.0104, + "epoch": 0.48, + "learning_rate": 0.0002274886528885559, + "loss": 0.0177, "step": 186490 }, { - "epoch": 0.94, - "learning_rate": 0.00015886252528870748, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022748476467218448, + "loss": 0.0198, "step": 186500 }, { - "epoch": 0.94, - "learning_rate": 0.0001588549575956935, - "loss": 0.0085, + "epoch": 0.48, + "learning_rate": 0.000227480876455813, + "loss": 0.0165, "step": 186510 }, { - "epoch": 0.94, - "learning_rate": 0.00015884738990267947, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022747698823944153, + "loss": 0.0137, "step": 186520 }, { - "epoch": 0.94, - "learning_rate": 0.00015883982220966545, - "loss": 0.0113, + "epoch": 0.48, + "learning_rate": 0.00022747310002307005, + "loss": 0.015, "step": 186530 }, { - "epoch": 0.94, - "learning_rate": 0.00015883225451665143, - "loss": 0.0158, + "epoch": 0.48, + "learning_rate": 0.00022746921180669862, + "loss": 0.0191, "step": 186540 }, { - "epoch": 0.94, - "learning_rate": 0.00015882468682363744, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.00022746532359032713, + "loss": 0.0202, "step": 186550 }, { - "epoch": 0.94, - "learning_rate": 0.00015881711913062342, - "loss": 0.0126, + "epoch": 0.48, + "learning_rate": 0.00022746143537395567, + "loss": 0.0176, "step": 186560 }, { - "epoch": 0.94, - "learning_rate": 0.0001588095514376094, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.0002274575471575842, + "loss": 0.0184, "step": 186570 }, { - "epoch": 0.94, - "learning_rate": 0.00015880198374459541, - "loss": 0.0081, + "epoch": 0.48, + "learning_rate": 0.00022745365894121273, + "loss": 0.0186, "step": 186580 }, { - "epoch": 0.94, - "learning_rate": 0.0001587944160515814, - "loss": 0.0106, + "epoch": 0.48, + "learning_rate": 0.00022744977072484127, + "loss": 0.0178, "step": 186590 }, { - "epoch": 0.94, - "learning_rate": 0.00015878684835856738, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022744588250846981, + "loss": 0.0192, "step": 186600 }, { - "epoch": 0.94, - "learning_rate": 0.00015877928066555339, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022744199429209833, + "loss": 0.0164, "step": 186610 }, { - "epoch": 0.94, - "learning_rate": 0.00015877171297253937, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.00022743810607572687, + "loss": 0.0174, "step": 186620 }, { - "epoch": 0.94, - "learning_rate": 0.00015876414527952535, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022743421785935544, + "loss": 0.0204, "step": 186630 }, { - "epoch": 0.94, - "learning_rate": 0.00015875657758651136, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022743032964298395, + "loss": 0.0152, "step": 186640 }, { - "epoch": 0.94, - "learning_rate": 0.0001587490098934973, - "loss": 0.0127, + "epoch": 0.48, + "learning_rate": 0.0002274264414266125, + "loss": 0.0194, "step": 186650 }, { - "epoch": 0.94, - "learning_rate": 0.0001587414422004833, - "loss": 0.0122, + "epoch": 0.48, + "learning_rate": 0.000227422553210241, + "loss": 0.0277, "step": 186660 }, { - "epoch": 0.94, - "learning_rate": 0.00015873387450746927, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.00022741866499386958, + "loss": 0.0201, "step": 186670 }, { - "epoch": 0.94, - "learning_rate": 0.00015872630681445528, - "loss": 0.0083, + "epoch": 0.48, + "learning_rate": 0.0002274147767774981, + "loss": 0.0146, "step": 186680 }, { - "epoch": 0.94, - "learning_rate": 0.00015871873912144126, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.00022741088856112663, + "loss": 0.018, "step": 186690 }, { - "epoch": 0.94, - "learning_rate": 0.00015871117142842725, - "loss": 0.0109, + "epoch": 0.48, + "learning_rate": 0.00022740700034475515, + "loss": 0.0154, "step": 186700 }, { - "epoch": 0.94, - "learning_rate": 0.00015870360373541325, - "loss": 0.0138, + "epoch": 0.48, + "learning_rate": 0.00022740311212838372, + "loss": 0.0199, "step": 186710 }, { - "epoch": 0.94, - "learning_rate": 0.00015869603604239924, - "loss": 0.0147, + "epoch": 0.48, + "learning_rate": 0.00022739922391201223, + "loss": 0.019, "step": 186720 }, { - "epoch": 0.94, - "learning_rate": 0.00015868846834938522, - "loss": 0.0085, + "epoch": 0.48, + "learning_rate": 0.00022739533569564077, + "loss": 0.0158, "step": 186730 }, { - "epoch": 0.94, - "learning_rate": 0.00015868090065637123, - "loss": 0.0137, + "epoch": 0.48, + "learning_rate": 0.0002273914474792693, + "loss": 0.0203, "step": 186740 }, { - "epoch": 0.94, - "learning_rate": 0.0001586733329633572, - "loss": 0.009, + "epoch": 0.48, + "learning_rate": 0.00022738755926289786, + "loss": 0.02, "step": 186750 }, { - "epoch": 0.94, - "learning_rate": 0.0001586657652703432, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022738367104652637, + "loss": 0.0169, "step": 186760 }, { - "epoch": 0.94, - "learning_rate": 0.00015865819757732917, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.0002273797828301549, + "loss": 0.0239, "step": 186770 }, { - "epoch": 0.94, - "learning_rate": 0.00015865062988431518, - "loss": 0.0125, + "epoch": 0.48, + "learning_rate": 0.00022737589461378343, + "loss": 0.0175, "step": 186780 }, { - "epoch": 0.94, - "learning_rate": 0.00015864306219130116, - "loss": 0.0111, + "epoch": 0.48, + "learning_rate": 0.000227372006397412, + "loss": 0.0174, "step": 186790 }, { - "epoch": 0.94, - "learning_rate": 0.00015863549449828714, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022736811818104054, + "loss": 0.0169, "step": 186800 }, { - "epoch": 0.94, - "learning_rate": 0.00015862792680527315, - "loss": 0.0077, + "epoch": 0.48, + "learning_rate": 0.00022736422996466905, + "loss": 0.0185, "step": 186810 }, { - "epoch": 0.94, - "learning_rate": 0.00015862035911225913, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.0002273603417482976, + "loss": 0.0154, "step": 186820 }, { - "epoch": 0.94, - "learning_rate": 0.0001586127914192451, - "loss": 0.0151, + "epoch": 0.48, + "learning_rate": 0.0002273564535319261, + "loss": 0.0193, "step": 186830 }, { - "epoch": 0.94, - "learning_rate": 0.00015860522372623112, - "loss": 0.0114, + "epoch": 0.48, + "learning_rate": 0.00022735256531555468, + "loss": 0.0279, "step": 186840 }, { - "epoch": 0.94, - "learning_rate": 0.0001585976560332171, - "loss": 0.0116, + "epoch": 0.48, + "learning_rate": 0.0002273486770991832, + "loss": 0.0169, "step": 186850 }, { - "epoch": 0.94, - "learning_rate": 0.00015859008834020308, - "loss": 0.0129, + "epoch": 0.48, + "learning_rate": 0.00022734478888281173, + "loss": 0.0222, "step": 186860 }, { - "epoch": 0.94, - "learning_rate": 0.0001585825206471891, - "loss": 0.0098, + "epoch": 0.48, + "learning_rate": 0.00022734090066644025, + "loss": 0.0135, "step": 186870 }, { - "epoch": 0.94, - "learning_rate": 0.00015857495295417507, - "loss": 0.0087, + "epoch": 0.48, + "learning_rate": 0.00022733701245006882, + "loss": 0.0186, "step": 186880 }, { - "epoch": 0.94, - "learning_rate": 0.00015856738526116106, - "loss": 0.01, + "epoch": 0.48, + "learning_rate": 0.00022733312423369733, + "loss": 0.016, "step": 186890 }, { - "epoch": 0.94, - "learning_rate": 0.00015855981756814706, - "loss": 0.0097, + "epoch": 0.48, + "learning_rate": 0.00022732923601732587, + "loss": 0.0248, "step": 186900 }, { - "epoch": 0.94, - "learning_rate": 0.00015855224987513305, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.0002273253478009544, + "loss": 0.0158, "step": 186910 }, { - "epoch": 0.94, - "learning_rate": 0.00015854468218211903, - "loss": 0.0258, + "epoch": 0.48, + "learning_rate": 0.00022732145958458296, + "loss": 0.018, "step": 186920 }, { - "epoch": 0.94, - "learning_rate": 0.000158537114489105, - "loss": 0.0128, + "epoch": 0.48, + "learning_rate": 0.00022731757136821147, + "loss": 0.0163, "step": 186930 }, { - "epoch": 0.94, - "learning_rate": 0.00015852954679609102, - "loss": 0.0108, + "epoch": 0.48, + "learning_rate": 0.00022731368315184, + "loss": 0.0312, "step": 186940 }, { - "epoch": 0.94, - "learning_rate": 0.000158521979103077, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.00022730979493546853, + "loss": 0.0182, "step": 186950 }, { - "epoch": 0.94, - "learning_rate": 0.00015851441141006298, - "loss": 0.0141, + "epoch": 0.48, + "learning_rate": 0.0002273059067190971, + "loss": 0.0152, "step": 186960 }, { - "epoch": 0.94, - "learning_rate": 0.000158506843717049, - "loss": 0.0093, + "epoch": 0.48, + "learning_rate": 0.00022730201850272564, + "loss": 0.0179, "step": 186970 }, { - "epoch": 0.94, - "learning_rate": 0.00015849927602403497, - "loss": 0.013, + "epoch": 0.48, + "learning_rate": 0.00022729813028635415, + "loss": 0.0194, "step": 186980 }, { - "epoch": 0.94, - "learning_rate": 0.00015849170833102095, - "loss": 0.0117, + "epoch": 0.48, + "learning_rate": 0.00022729424206998267, + "loss": 0.0162, "step": 186990 }, { - "epoch": 0.94, - "learning_rate": 0.00015848414063800696, - "loss": 0.0092, + "epoch": 0.48, + "learning_rate": 0.00022729035385361124, + "loss": 0.0229, "step": 187000 }, { - "epoch": 0.94, - "eval_cer": 0.9144683151109114, - "eval_loss": 0.008203052915632725, - "eval_runtime": 116.5799, - "eval_samples_per_second": 17.156, - "eval_steps_per_second": 4.289, + "epoch": 0.48, + "eval_cer": 0.8818174565517705, + "eval_loss": 0.01267703715711832, + "eval_runtime": 107.8484, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, "step": 187000 }, { - "epoch": 0.94, - "learning_rate": 0.00015847657294499294, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022728646563723978, + "loss": 0.0177, "step": 187010 }, { - "epoch": 0.94, - "learning_rate": 0.00015846900525197892, - "loss": 0.0123, + "epoch": 0.48, + "learning_rate": 0.0002272825774208683, + "loss": 0.0146, "step": 187020 }, { - "epoch": 0.94, - "learning_rate": 0.00015846143755896493, - "loss": 0.0105, + "epoch": 0.48, + "learning_rate": 0.00022727868920449683, + "loss": 0.0159, "step": 187030 }, { - "epoch": 0.94, - "learning_rate": 0.0001584538698659509, - "loss": 0.0101, + "epoch": 0.48, + "learning_rate": 0.00022727480098812537, + "loss": 0.0196, "step": 187040 }, { - "epoch": 0.94, - "learning_rate": 0.0001584463021729369, - "loss": 0.011, + "epoch": 0.48, + "learning_rate": 0.00022727091277175392, + "loss": 0.0188, "step": 187050 }, { - "epoch": 0.94, - "learning_rate": 0.0001584387344799229, - "loss": 0.0118, + "epoch": 0.48, + "learning_rate": 0.00022726702455538243, + "loss": 0.0213, "step": 187060 }, { - "epoch": 0.94, - "learning_rate": 0.00015843116678690888, - "loss": 0.0107, + "epoch": 0.48, + "learning_rate": 0.00022726313633901097, + "loss": 0.02, "step": 187070 }, { - "epoch": 0.94, - "learning_rate": 0.00015842359909389487, - "loss": 0.0115, + "epoch": 0.48, + "learning_rate": 0.0002272592481226395, + "loss": 0.0169, "step": 187080 }, { - "epoch": 0.94, - "learning_rate": 0.00015841603140088087, - "loss": 0.0144, + "epoch": 0.48, + "learning_rate": 0.00022725535990626806, + "loss": 0.018, "step": 187090 }, { - "epoch": 0.94, - "learning_rate": 0.00015840846370786686, - "loss": 0.0095, + "epoch": 0.48, + "learning_rate": 0.00022725147168989657, + "loss": 0.016, "step": 187100 }, { - "epoch": 0.94, - "learning_rate": 0.00015840089601485284, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.0002272475834735251, + "loss": 0.0275, "step": 187110 }, { - "epoch": 0.94, - "learning_rate": 0.00015839332832183882, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022724369525715363, + "loss": 0.0154, "step": 187120 }, { - "epoch": 0.94, - "learning_rate": 0.00015838576062882483, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.0002272398070407822, + "loss": 0.0194, "step": 187130 }, { - "epoch": 0.94, - "learning_rate": 0.0001583781929358108, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002272359188244107, + "loss": 0.0182, "step": 187140 }, { - "epoch": 0.94, - "learning_rate": 0.0001583706252427968, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.00022723203060803925, + "loss": 0.0164, "step": 187150 }, { - "epoch": 0.94, - "learning_rate": 0.0001583630575497828, - "loss": 0.0154, + "epoch": 0.49, + "learning_rate": 0.00022722814239166777, + "loss": 0.016, "step": 187160 }, { - "epoch": 0.94, - "learning_rate": 0.00015835548985676878, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022722425417529633, + "loss": 0.019, "step": 187170 }, { - "epoch": 0.94, - "learning_rate": 0.00015834792216375476, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022722036595892488, + "loss": 0.0182, "step": 187180 }, { - "epoch": 0.94, - "learning_rate": 0.00015834035447074077, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.0002272164777425534, + "loss": 0.0171, "step": 187190 }, { - "epoch": 0.94, - "learning_rate": 0.00015833278677772675, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022721258952618193, + "loss": 0.0215, "step": 187200 }, { - "epoch": 0.94, - "learning_rate": 0.00015832521908471273, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022720870130981047, + "loss": 0.0157, "step": 187210 }, { - "epoch": 0.94, - "learning_rate": 0.00015831765139169874, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022720481309343902, + "loss": 0.0202, "step": 187220 }, { - "epoch": 0.94, - "learning_rate": 0.00015831008369868472, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.00022720092487706753, + "loss": 0.0175, "step": 187230 }, { - "epoch": 0.94, - "learning_rate": 0.0001583025160056707, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022719703666069607, + "loss": 0.0197, "step": 187240 }, { - "epoch": 0.94, - "learning_rate": 0.0001582949483126567, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.0002271931484443246, + "loss": 0.0178, "step": 187250 }, { - "epoch": 0.94, - "learning_rate": 0.0001582873806196427, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.00022718926022795316, + "loss": 0.0194, "step": 187260 }, { - "epoch": 0.94, - "learning_rate": 0.00015827981292662868, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.00022718537201158167, + "loss": 0.0149, "step": 187270 }, { - "epoch": 0.94, - "learning_rate": 0.00015827224523361466, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002271814837952102, + "loss": 0.0188, "step": 187280 }, { - "epoch": 0.94, - "learning_rate": 0.00015826467754060067, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022717759557883878, + "loss": 0.0171, "step": 187290 }, { - "epoch": 0.94, - "learning_rate": 0.00015825710984758665, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.0002271737073624673, + "loss": 0.019, "step": 187300 }, { - "epoch": 0.94, - "learning_rate": 0.00015824954215457263, - "loss": 0.0137, + "epoch": 0.49, + "learning_rate": 0.0002271698191460958, + "loss": 0.0211, "step": 187310 }, { - "epoch": 0.95, - "learning_rate": 0.00015824197446155864, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022716593092972435, + "loss": 0.0176, "step": 187320 }, { - "epoch": 0.95, - "learning_rate": 0.00015823440676854462, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022716204271335287, + "loss": 0.0164, "step": 187330 }, { - "epoch": 0.95, - "learning_rate": 0.0001582268390755306, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.00022715815449698143, + "loss": 0.0157, "step": 187340 }, { - "epoch": 0.95, - "learning_rate": 0.0001582192713825166, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022715426628060998, + "loss": 0.0192, "step": 187350 }, { - "epoch": 0.95, - "learning_rate": 0.0001582117036895026, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.0002271503780642385, + "loss": 0.0148, "step": 187360 }, { - "epoch": 0.95, - "learning_rate": 0.00015820413599648857, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022714648984786703, + "loss": 0.0164, "step": 187370 }, { - "epoch": 0.95, - "learning_rate": 0.00015819656830347458, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022714260163149557, + "loss": 0.0143, "step": 187380 }, { - "epoch": 0.95, - "learning_rate": 0.00015818900061046056, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022713871341512412, + "loss": 0.02, "step": 187390 }, { - "epoch": 0.95, - "learning_rate": 0.00015818143291744654, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022713482519875263, + "loss": 0.0196, "step": 187400 }, { - "epoch": 0.95, - "learning_rate": 0.00015817386522443255, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022713093698238117, + "loss": 0.0164, "step": 187410 }, { - "epoch": 0.95, - "learning_rate": 0.00015816629753141853, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002271270487660097, + "loss": 0.0192, "step": 187420 }, { - "epoch": 0.95, - "learning_rate": 0.00015815872983840451, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022712316054963825, + "loss": 0.0182, "step": 187430 }, { - "epoch": 0.95, - "learning_rate": 0.0001581511621453905, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022711927233326677, + "loss": 0.0192, "step": 187440 }, { - "epoch": 0.95, - "learning_rate": 0.0001581435944523765, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.0002271153841168953, + "loss": 0.0182, "step": 187450 }, { - "epoch": 0.95, - "learning_rate": 0.00015813602675936249, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022711149590052385, + "loss": 0.0141, "step": 187460 }, { - "epoch": 0.95, - "learning_rate": 0.00015812845906634847, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.0002271076076841524, + "loss": 0.0245, "step": 187470 }, { - "epoch": 0.95, - "learning_rate": 0.00015812089137333448, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002271037194677809, + "loss": 0.0191, "step": 187480 }, { - "epoch": 0.95, - "learning_rate": 0.00015811332368032046, - "loss": 0.014, + "epoch": 0.49, + "learning_rate": 0.00022709983125140945, + "loss": 0.0182, "step": 187490 }, { - "epoch": 0.95, - "learning_rate": 0.00015810575598730644, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022709594303503802, + "loss": 0.0175, "step": 187500 }, { - "epoch": 0.95, - "learning_rate": 0.00015809818829429245, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022709205481866653, + "loss": 0.0189, "step": 187510 }, { - "epoch": 0.95, - "learning_rate": 0.00015809062060127843, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022708816660229508, + "loss": 0.0139, "step": 187520 }, { - "epoch": 0.95, - "learning_rate": 0.0001580830529082644, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.0002270842783859236, + "loss": 0.0211, "step": 187530 }, { - "epoch": 0.95, - "learning_rate": 0.00015807548521525042, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022708039016955216, + "loss": 0.0238, "step": 187540 }, { - "epoch": 0.95, - "learning_rate": 0.0001580679175222364, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022707650195318067, + "loss": 0.0162, "step": 187550 }, { - "epoch": 0.95, - "learning_rate": 0.00015806034982922238, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022707261373680921, + "loss": 0.0181, "step": 187560 }, { - "epoch": 0.95, - "learning_rate": 0.0001580527821362084, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022706872552043773, + "loss": 0.0171, "step": 187570 }, { - "epoch": 0.95, - "learning_rate": 0.00015804521444319437, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022706483730406627, + "loss": 0.0198, "step": 187580 }, { - "epoch": 0.95, - "learning_rate": 0.00015803764675018035, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.0002270609490876948, + "loss": 0.0191, "step": 187590 }, { - "epoch": 0.95, - "learning_rate": 0.00015803007905716636, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022705706087132335, + "loss": 0.0167, "step": 187600 }, { - "epoch": 0.95, - "learning_rate": 0.00015802251136415234, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.00022705317265495187, + "loss": 0.0183, "step": 187610 }, { - "epoch": 0.95, - "learning_rate": 0.00015801494367113832, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.0002270492844385804, + "loss": 0.0157, "step": 187620 }, { - "epoch": 0.95, - "learning_rate": 0.0001580073759781243, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022704539622220895, + "loss": 0.0163, "step": 187630 }, { - "epoch": 0.95, - "learning_rate": 0.00015799980828511031, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002270415080058375, + "loss": 0.0151, "step": 187640 }, { - "epoch": 0.95, - "learning_rate": 0.0001579922405920963, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.000227037619789466, + "loss": 0.0183, "step": 187650 }, { - "epoch": 0.95, - "learning_rate": 0.00015798467289908228, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022703373157309455, + "loss": 0.0198, "step": 187660 }, { - "epoch": 0.95, - "learning_rate": 0.00015797710520606829, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022702984335672312, + "loss": 0.0175, "step": 187670 }, { - "epoch": 0.95, - "learning_rate": 0.00015796953751305427, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022702595514035163, + "loss": 0.0218, "step": 187680 }, { - "epoch": 0.95, - "learning_rate": 0.00015796196982004025, - "loss": 0.0162, + "epoch": 0.49, + "learning_rate": 0.00022702206692398017, + "loss": 0.0203, "step": 187690 }, { - "epoch": 0.95, - "learning_rate": 0.00015795440212702626, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.0002270181787076087, + "loss": 0.0183, "step": 187700 }, { - "epoch": 0.95, - "learning_rate": 0.00015794683443401224, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022701429049123726, + "loss": 0.0148, "step": 187710 }, { - "epoch": 0.95, - "learning_rate": 0.00015793926674099822, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022701040227486577, + "loss": 0.018, "step": 187720 }, { - "epoch": 0.95, - "learning_rate": 0.00015793169904798423, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022700651405849431, + "loss": 0.0174, "step": 187730 }, { - "epoch": 0.95, - "learning_rate": 0.0001579241313549702, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022700262584212283, + "loss": 0.0189, "step": 187740 }, { - "epoch": 0.95, - "learning_rate": 0.0001579165636619562, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002269987376257514, + "loss": 0.0142, "step": 187750 }, { - "epoch": 0.95, - "learning_rate": 0.0001579089959689422, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002269948494093799, + "loss": 0.0244, "step": 187760 }, { - "epoch": 0.95, - "learning_rate": 0.00015790142827592818, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.00022699096119300845, + "loss": 0.0181, "step": 187770 }, { - "epoch": 0.95, - "learning_rate": 0.00015789386058291416, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022698707297663697, + "loss": 0.0186, "step": 187780 }, { - "epoch": 0.95, - "learning_rate": 0.00015788629288990014, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022698318476026554, + "loss": 0.0164, "step": 187790 }, { - "epoch": 0.95, - "learning_rate": 0.00015787872519688615, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.00022697929654389405, + "loss": 0.0214, "step": 187800 }, { - "epoch": 0.95, - "learning_rate": 0.00015787115750387213, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.0002269754083275226, + "loss": 0.014, "step": 187810 }, { - "epoch": 0.95, - "learning_rate": 0.00015786358981085812, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.0002269715201111511, + "loss": 0.0142, "step": 187820 }, { - "epoch": 0.95, - "learning_rate": 0.00015785602211784412, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022696763189477965, + "loss": 0.0169, "step": 187830 }, { - "epoch": 0.95, - "learning_rate": 0.0001578484544248301, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022696374367840822, + "loss": 0.0181, "step": 187840 }, { - "epoch": 0.95, - "learning_rate": 0.0001578408867318161, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022695985546203673, + "loss": 0.0198, "step": 187850 }, { - "epoch": 0.95, - "learning_rate": 0.0001578333190388021, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.00022695596724566525, + "loss": 0.0173, "step": 187860 }, { - "epoch": 0.95, - "learning_rate": 0.00015782575134578808, - "loss": 0.0133, + "epoch": 0.49, + "learning_rate": 0.0002269520790292938, + "loss": 0.0196, "step": 187870 }, { - "epoch": 0.95, - "learning_rate": 0.00015781818365277406, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022694819081292236, + "loss": 0.0214, "step": 187880 }, { - "epoch": 0.95, - "learning_rate": 0.00015781061595976007, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022694430259655087, + "loss": 0.0255, "step": 187890 }, { - "epoch": 0.95, - "learning_rate": 0.00015780304826674605, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.0002269404143801794, + "loss": 0.0138, "step": 187900 }, { - "epoch": 0.95, - "learning_rate": 0.000157795480573732, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022693652616380793, + "loss": 0.0194, "step": 187910 }, { - "epoch": 0.95, - "learning_rate": 0.00015778791288071798, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002269326379474365, + "loss": 0.0142, "step": 187920 }, { - "epoch": 0.95, - "learning_rate": 0.000157780345187704, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.000226928749731065, + "loss": 0.0195, "step": 187930 }, { - "epoch": 0.95, - "learning_rate": 0.00015777277749468997, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022692486151469355, + "loss": 0.027, "step": 187940 }, { - "epoch": 0.95, - "learning_rate": 0.00015776520980167596, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022692097329832207, + "loss": 0.0178, "step": 187950 }, { - "epoch": 0.95, - "learning_rate": 0.00015775764210866196, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022691708508195064, + "loss": 0.0208, "step": 187960 }, { - "epoch": 0.95, - "learning_rate": 0.00015775007441564795, - "loss": 0.0136, + "epoch": 0.49, + "learning_rate": 0.00022691319686557915, + "loss": 0.021, "step": 187970 }, { - "epoch": 0.95, - "learning_rate": 0.00015774250672263393, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.0002269093086492077, + "loss": 0.0188, "step": 187980 }, { - "epoch": 0.95, - "learning_rate": 0.00015773493902961994, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.0002269054204328362, + "loss": 0.017, "step": 187990 }, { - "epoch": 0.95, - "learning_rate": 0.00015772737133660592, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022690153221646478, + "loss": 0.0159, "step": 188000 }, { - "epoch": 0.95, - "eval_cer": 0.9144634631302844, - "eval_loss": 0.007855391129851341, - "eval_runtime": 116.599, - "eval_samples_per_second": 17.153, - "eval_steps_per_second": 4.288, + "epoch": 0.49, + "eval_cer": 0.8818286536472439, + "eval_loss": 0.012727465480566025, + "eval_runtime": 108.1818, + "eval_samples_per_second": 18.487, + "eval_steps_per_second": 4.622, "step": 188000 }, { - "epoch": 0.95, - "learning_rate": 0.0001577198036435919, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022689764400009332, + "loss": 0.0225, "step": 188010 }, { - "epoch": 0.95, - "learning_rate": 0.00015771223595057788, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.00022689375578372183, + "loss": 0.021, "step": 188020 }, { - "epoch": 0.95, - "learning_rate": 0.0001577046682575639, - "loss": 0.0094, - "step": 188030 + "epoch": 0.49, + "learning_rate": 0.00022688986756735035, + "loss": 0.0155, + "step": 188030 }, { - "epoch": 0.95, - "learning_rate": 0.00015769710056454987, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022688597935097891, + "loss": 0.0185, "step": 188040 }, { - "epoch": 0.95, - "learning_rate": 0.00015768953287153585, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.00022688209113460746, + "loss": 0.0184, "step": 188050 }, { - "epoch": 0.95, - "learning_rate": 0.00015768196517852186, - "loss": 0.0144, + "epoch": 0.49, + "learning_rate": 0.00022687820291823597, + "loss": 0.0232, "step": 188060 }, { - "epoch": 0.95, - "learning_rate": 0.00015767439748550784, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.0002268743147018645, + "loss": 0.0157, "step": 188070 }, { - "epoch": 0.95, - "learning_rate": 0.00015766682979249382, - "loss": 0.0162, + "epoch": 0.49, + "learning_rate": 0.00022687042648549303, + "loss": 0.0272, "step": 188080 }, { - "epoch": 0.95, - "learning_rate": 0.00015765926209947983, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.0002268665382691216, + "loss": 0.0194, "step": 188090 }, { - "epoch": 0.95, - "learning_rate": 0.0001576516944064658, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.0002268626500527501, + "loss": 0.024, "step": 188100 }, { - "epoch": 0.95, - "learning_rate": 0.0001576441267134518, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022685876183637865, + "loss": 0.0192, "step": 188110 }, { - "epoch": 0.95, - "learning_rate": 0.0001576365590204378, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022685487362000717, + "loss": 0.0222, "step": 188120 }, { - "epoch": 0.95, - "learning_rate": 0.00015762899132742378, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022685098540363574, + "loss": 0.0156, "step": 188130 }, { - "epoch": 0.95, - "learning_rate": 0.00015762142363440977, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.00022684709718726425, + "loss": 0.0211, "step": 188140 }, { - "epoch": 0.95, - "learning_rate": 0.00015761385594139577, - "loss": 0.0193, + "epoch": 0.49, + "learning_rate": 0.0002268432089708928, + "loss": 0.0176, "step": 188150 }, { - "epoch": 0.95, - "learning_rate": 0.00015760628824838176, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.0002268393207545213, + "loss": 0.0195, "step": 188160 }, { - "epoch": 0.95, - "learning_rate": 0.00015759872055536774, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022683543253814987, + "loss": 0.0188, "step": 188170 }, { - "epoch": 0.95, - "learning_rate": 0.00015759115286235372, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.0002268315443217784, + "loss": 0.0177, "step": 188180 }, { - "epoch": 0.95, - "learning_rate": 0.00015758358516933973, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.00022682765610540693, + "loss": 0.0152, "step": 188190 }, { - "epoch": 0.95, - "learning_rate": 0.0001575760174763257, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022682376788903545, + "loss": 0.0135, "step": 188200 }, { - "epoch": 0.95, - "learning_rate": 0.0001575684497833117, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022681987967266401, + "loss": 0.0257, "step": 188210 }, { - "epoch": 0.95, - "learning_rate": 0.0001575608820902977, - "loss": 0.0177, + "epoch": 0.49, + "learning_rate": 0.00022681599145629256, + "loss": 0.0191, "step": 188220 }, { - "epoch": 0.95, - "learning_rate": 0.00015755331439728368, - "loss": 0.0131, + "epoch": 0.49, + "learning_rate": 0.00022681210323992107, + "loss": 0.0179, "step": 188230 }, { - "epoch": 0.95, - "learning_rate": 0.00015754574670426966, - "loss": 0.0095, + "epoch": 0.49, + "learning_rate": 0.0002268082150235496, + "loss": 0.0185, "step": 188240 }, { - "epoch": 0.95, - "learning_rate": 0.00015753817901125567, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022680432680717815, + "loss": 0.0169, "step": 188250 }, { - "epoch": 0.95, - "learning_rate": 0.00015753061131824165, - "loss": 0.0136, + "epoch": 0.49, + "learning_rate": 0.0002268004385908067, + "loss": 0.0173, "step": 188260 }, { - "epoch": 0.95, - "learning_rate": 0.00015752304362522763, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.0002267965503744352, + "loss": 0.0178, "step": 188270 }, { - "epoch": 0.95, - "learning_rate": 0.00015751547593221364, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022679266215806375, + "loss": 0.021, "step": 188280 }, { - "epoch": 0.95, - "learning_rate": 0.00015750790823919962, - "loss": 0.008, + "epoch": 0.49, + "learning_rate": 0.0002267887739416923, + "loss": 0.0199, "step": 188290 }, { - "epoch": 0.95, - "learning_rate": 0.0001575003405461856, - "loss": 0.0145, + "epoch": 0.49, + "learning_rate": 0.00022678488572532083, + "loss": 0.0155, "step": 188300 }, { - "epoch": 0.95, - "learning_rate": 0.0001574927728531716, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022678099750894935, + "loss": 0.0155, "step": 188310 }, { - "epoch": 0.95, - "learning_rate": 0.0001574852051601576, - "loss": 0.0074, + "epoch": 0.49, + "learning_rate": 0.0002267771092925779, + "loss": 0.0162, "step": 188320 }, { - "epoch": 0.95, - "learning_rate": 0.00015747763746714358, - "loss": 0.0131, + "epoch": 0.49, + "learning_rate": 0.0002267732210762064, + "loss": 0.0186, "step": 188330 }, { - "epoch": 0.95, - "learning_rate": 0.00015747006977412956, - "loss": 0.0084, + "epoch": 0.49, + "learning_rate": 0.00022676933285983497, + "loss": 0.0181, "step": 188340 }, { - "epoch": 0.95, - "learning_rate": 0.00015746250208111557, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.0002267654446434635, + "loss": 0.0178, "step": 188350 }, { - "epoch": 0.95, - "learning_rate": 0.00015745493438810155, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.00022676155642709203, + "loss": 0.0199, "step": 188360 }, { - "epoch": 0.95, - "learning_rate": 0.00015744736669508753, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022675766821072055, + "loss": 0.0148, "step": 188370 }, { - "epoch": 0.95, - "learning_rate": 0.00015743979900207354, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022675377999434911, + "loss": 0.0195, "step": 188380 }, { - "epoch": 0.95, - "learning_rate": 0.00015743223130905952, - "loss": 0.0141, + "epoch": 0.49, + "learning_rate": 0.00022674989177797766, + "loss": 0.0161, "step": 188390 }, { - "epoch": 0.95, - "learning_rate": 0.0001574246636160455, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022674600356160617, + "loss": 0.0153, "step": 188400 }, { - "epoch": 0.95, - "learning_rate": 0.0001574170959230315, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002267421153452347, + "loss": 0.0189, "step": 188410 }, { - "epoch": 0.95, - "learning_rate": 0.0001574095282300175, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022673822712886325, + "loss": 0.024, "step": 188420 }, { - "epoch": 0.95, - "learning_rate": 0.00015740196053700347, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002267343389124918, + "loss": 0.0157, "step": 188430 }, { - "epoch": 0.95, - "learning_rate": 0.00015739439284398948, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.0002267304506961203, + "loss": 0.0217, "step": 188440 }, { - "epoch": 0.95, - "learning_rate": 0.00015738682515097546, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022672656247974885, + "loss": 0.0173, "step": 188450 }, { - "epoch": 0.95, - "learning_rate": 0.00015737925745796144, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.0002267226742633774, + "loss": 0.0182, "step": 188460 }, { - "epoch": 0.95, - "learning_rate": 0.00015737168976494745, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022671878604700593, + "loss": 0.0208, "step": 188470 }, { - "epoch": 0.95, - "learning_rate": 0.00015736412207193343, - "loss": 0.0145, + "epoch": 0.49, + "learning_rate": 0.00022671489783063445, + "loss": 0.0155, "step": 188480 }, { - "epoch": 0.95, - "learning_rate": 0.00015735655437891941, - "loss": 0.0085, + "epoch": 0.49, + "learning_rate": 0.000226711009614263, + "loss": 0.0214, "step": 188490 }, { - "epoch": 0.95, - "learning_rate": 0.00015734898668590542, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022670712139789153, + "loss": 0.0165, "step": 188500 }, { - "epoch": 0.95, - "learning_rate": 0.0001573414189928914, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022670323318152007, + "loss": 0.0148, "step": 188510 }, { - "epoch": 0.95, - "learning_rate": 0.00015733385129987739, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.0002266993449651486, + "loss": 0.0177, "step": 188520 }, { - "epoch": 0.95, - "learning_rate": 0.00015732628360686337, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022669545674877713, + "loss": 0.0231, "step": 188530 }, { - "epoch": 0.95, - "learning_rate": 0.00015731871591384938, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.0002266915685324057, + "loss": 0.0152, "step": 188540 }, { - "epoch": 0.95, - "learning_rate": 0.00015731114822083536, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002266876803160342, + "loss": 0.0154, "step": 188550 }, { - "epoch": 0.95, - "learning_rate": 0.00015730358052782134, - "loss": 0.0083, + "epoch": 0.49, + "learning_rate": 0.00022668379209966275, + "loss": 0.0202, "step": 188560 }, { - "epoch": 0.95, - "learning_rate": 0.00015729601283480735, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022667990388329127, + "loss": 0.0223, "step": 188570 }, { - "epoch": 0.95, - "learning_rate": 0.00015728844514179333, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022667601566691978, + "loss": 0.0194, "step": 188580 }, { - "epoch": 0.95, - "learning_rate": 0.0001572808774487793, - "loss": 0.0147, + "epoch": 0.49, + "learning_rate": 0.00022667212745054835, + "loss": 0.0176, "step": 188590 }, { - "epoch": 0.95, - "learning_rate": 0.00015727330975576532, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.0002266682392341769, + "loss": 0.0196, "step": 188600 }, { - "epoch": 0.95, - "learning_rate": 0.0001572657420627513, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.0002266643510178054, + "loss": 0.026, "step": 188610 }, { - "epoch": 0.95, - "learning_rate": 0.00015725817436973728, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022666046280143395, + "loss": 0.0162, "step": 188620 }, { - "epoch": 0.95, - "learning_rate": 0.0001572506066767233, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.0002266565745850625, + "loss": 0.0174, "step": 188630 }, { - "epoch": 0.95, - "learning_rate": 0.00015724303898370927, - "loss": 0.0146, + "epoch": 0.49, + "learning_rate": 0.00022665268636869103, + "loss": 0.0159, "step": 188640 }, { - "epoch": 0.95, - "learning_rate": 0.00015723547129069525, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022664879815231955, + "loss": 0.0171, "step": 188650 }, { - "epoch": 0.95, - "learning_rate": 0.00015722790359768126, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.0002266449099359481, + "loss": 0.0162, "step": 188660 }, { - "epoch": 0.95, - "learning_rate": 0.00015722033590466724, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022664102171957663, + "loss": 0.0178, "step": 188670 }, { - "epoch": 0.95, - "learning_rate": 0.00015721276821165322, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022663713350320517, + "loss": 0.0189, "step": 188680 }, { - "epoch": 0.95, - "learning_rate": 0.0001572052005186392, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002266332452868337, + "loss": 0.0182, "step": 188690 }, { - "epoch": 0.95, - "learning_rate": 0.00015719763282562521, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022662935707046223, + "loss": 0.0207, "step": 188700 }, { - "epoch": 0.95, - "learning_rate": 0.0001571900651326112, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.0002266254688540908, + "loss": 0.02, "step": 188710 }, { - "epoch": 0.95, - "learning_rate": 0.00015718249743959718, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.0002266215806377193, + "loss": 0.0136, "step": 188720 }, { - "epoch": 0.95, - "learning_rate": 0.00015717492974658319, - "loss": 0.0149, + "epoch": 0.49, + "learning_rate": 0.00022661769242134783, + "loss": 0.0174, "step": 188730 }, { - "epoch": 0.95, - "learning_rate": 0.00015716736205356917, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022661380420497637, + "loss": 0.0237, "step": 188740 }, { - "epoch": 0.95, - "learning_rate": 0.00015715979436055515, - "loss": 0.0145, + "epoch": 0.49, + "learning_rate": 0.00022660991598860494, + "loss": 0.0172, "step": 188750 }, { - "epoch": 0.95, - "learning_rate": 0.00015715222666754116, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022660602777223345, + "loss": 0.0236, "step": 188760 }, { - "epoch": 0.95, - "learning_rate": 0.00015714465897452714, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.000226602139555862, + "loss": 0.0171, "step": 188770 }, { - "epoch": 0.95, - "learning_rate": 0.00015713709128151312, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.0002265982513394905, + "loss": 0.0186, "step": 188780 }, { - "epoch": 0.95, - "learning_rate": 0.00015712952358849913, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022659436312311908, + "loss": 0.0206, "step": 188790 }, { - "epoch": 0.95, - "learning_rate": 0.0001571219558954851, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.0002265904749067476, + "loss": 0.0192, "step": 188800 }, { - "epoch": 0.95, - "learning_rate": 0.0001571143882024711, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022658658669037613, + "loss": 0.0163, "step": 188810 }, { - "epoch": 0.95, - "learning_rate": 0.0001571068205094571, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022658269847400465, + "loss": 0.0201, "step": 188820 }, { - "epoch": 0.95, - "learning_rate": 0.00015709925281644308, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.0002265788102576332, + "loss": 0.0179, "step": 188830 }, { - "epoch": 0.95, - "learning_rate": 0.00015709168512342906, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.00022657492204126173, + "loss": 0.0171, "step": 188840 }, { - "epoch": 0.95, - "learning_rate": 0.00015708411743041504, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022657103382489027, + "loss": 0.0156, "step": 188850 }, { - "epoch": 0.95, - "learning_rate": 0.00015707654973740105, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002265671456085188, + "loss": 0.017, "step": 188860 }, { - "epoch": 0.95, - "learning_rate": 0.00015706898204438703, - "loss": 0.0091, + "epoch": 0.49, + "learning_rate": 0.00022656325739214733, + "loss": 0.0167, "step": 188870 }, { - "epoch": 0.95, - "learning_rate": 0.00015706141435137302, - "loss": 0.0136, + "epoch": 0.49, + "learning_rate": 0.0002265593691757759, + "loss": 0.0197, "step": 188880 }, { - "epoch": 0.95, - "learning_rate": 0.00015705384665835902, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.0002265554809594044, + "loss": 0.0194, "step": 188890 }, { - "epoch": 0.95, - "learning_rate": 0.000157046278965345, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.00022655159274303293, + "loss": 0.0192, "step": 188900 }, { - "epoch": 0.95, - "learning_rate": 0.000157038711272331, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022654770452666147, + "loss": 0.018, "step": 188910 }, { - "epoch": 0.95, - "learning_rate": 0.000157031143579317, - "loss": 0.0139, + "epoch": 0.49, + "learning_rate": 0.00022654381631029004, + "loss": 0.0182, "step": 188920 }, { - "epoch": 0.95, - "learning_rate": 0.00015702357588630298, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022653992809391855, + "loss": 0.0242, "step": 188930 }, { - "epoch": 0.95, - "learning_rate": 0.00015701600819328896, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002265360398775471, + "loss": 0.0183, "step": 188940 }, { - "epoch": 0.95, - "learning_rate": 0.00015700844050027497, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002265321516611756, + "loss": 0.0257, "step": 188950 }, { - "epoch": 0.95, - "learning_rate": 0.00015700087280726095, - "loss": 0.014, + "epoch": 0.49, + "learning_rate": 0.00022652826344480418, + "loss": 0.0172, "step": 188960 }, { - "epoch": 0.95, - "learning_rate": 0.00015699330511424693, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.0002265243752284327, + "loss": 0.0141, "step": 188970 }, { - "epoch": 0.95, - "learning_rate": 0.00015698573742123294, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022652048701206123, + "loss": 0.0169, "step": 188980 }, { - "epoch": 0.95, - "learning_rate": 0.00015697816972821892, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022651659879568975, + "loss": 0.0193, "step": 188990 }, { - "epoch": 0.95, - "learning_rate": 0.0001569706020352049, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022651271057931832, + "loss": 0.0195, "step": 189000 }, { - "epoch": 0.95, - "eval_cer": 0.914452788772905, - "eval_loss": 0.00806601531803608, - "eval_runtime": 116.7489, - "eval_samples_per_second": 17.131, - "eval_steps_per_second": 4.283, + "epoch": 0.49, + "eval_cer": 0.8818104583670996, + "eval_loss": 0.012447088025510311, + "eval_runtime": 108.0069, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 189000 }, { - "epoch": 0.95, - "learning_rate": 0.00015696303434219088, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022650882236294683, + "loss": 0.0172, "step": 189010 }, { - "epoch": 0.95, - "learning_rate": 0.0001569554666491769, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.00022650493414657537, + "loss": 0.0156, "step": 189020 }, { - "epoch": 0.95, - "learning_rate": 0.00015694789895616287, - "loss": 0.0139, + "epoch": 0.49, + "learning_rate": 0.0002265010459302039, + "loss": 0.0192, "step": 189030 }, { - "epoch": 0.95, - "learning_rate": 0.00015694033126314885, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022649715771383246, + "loss": 0.0197, "step": 189040 }, { - "epoch": 0.95, - "learning_rate": 0.00015693276357013486, - "loss": 0.0078, + "epoch": 0.49, + "learning_rate": 0.00022649326949746097, + "loss": 0.0157, "step": 189050 }, { - "epoch": 0.95, - "learning_rate": 0.00015692519587712084, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.0002264893812810895, + "loss": 0.0168, "step": 189060 }, { - "epoch": 0.95, - "learning_rate": 0.00015691762818410683, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022648549306471803, + "loss": 0.0237, "step": 189070 }, { - "epoch": 0.95, - "learning_rate": 0.00015691006049109283, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022648160484834657, + "loss": 0.0191, "step": 189080 }, { - "epoch": 0.95, - "learning_rate": 0.00015690249279807882, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.00022647771663197514, + "loss": 0.0166, "step": 189090 }, { - "epoch": 0.95, - "learning_rate": 0.0001568949251050648, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022647382841560365, + "loss": 0.0166, "step": 189100 }, { - "epoch": 0.95, - "learning_rate": 0.0001568873574120508, - "loss": 0.0137, + "epoch": 0.49, + "learning_rate": 0.0002264699401992322, + "loss": 0.0231, "step": 189110 }, { - "epoch": 0.95, - "learning_rate": 0.0001568797897190368, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002264660519828607, + "loss": 0.0157, "step": 189120 }, { - "epoch": 0.95, - "learning_rate": 0.00015687222202602277, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022646216376648928, + "loss": 0.0156, "step": 189130 }, { - "epoch": 0.95, - "learning_rate": 0.00015686465433300878, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.0002264582755501178, + "loss": 0.0182, "step": 189140 }, { - "epoch": 0.95, - "learning_rate": 0.00015685708663999476, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022645438733374633, + "loss": 0.0185, "step": 189150 }, { - "epoch": 0.95, - "learning_rate": 0.00015684951894698074, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.00022645049911737485, + "loss": 0.018, "step": 189160 }, { - "epoch": 0.95, - "learning_rate": 0.0001568419512539667, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.00022644661090100342, + "loss": 0.0176, "step": 189170 }, { - "epoch": 0.95, - "learning_rate": 0.0001568343835609527, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022644272268463193, + "loss": 0.0159, "step": 189180 }, { - "epoch": 0.95, - "learning_rate": 0.00015682681586793868, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022643883446826047, + "loss": 0.0163, "step": 189190 }, { - "epoch": 0.95, - "learning_rate": 0.00015681924817492467, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022643494625188899, + "loss": 0.0168, "step": 189200 }, { - "epoch": 0.95, - "learning_rate": 0.00015681168048191067, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022643105803551755, + "loss": 0.0176, "step": 189210 }, { - "epoch": 0.95, - "learning_rate": 0.00015680411278889666, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.00022642716981914607, + "loss": 0.0258, "step": 189220 }, { - "epoch": 0.95, - "learning_rate": 0.00015679654509588264, - "loss": 0.0202, + "epoch": 0.49, + "learning_rate": 0.0002264232816027746, + "loss": 0.0156, "step": 189230 }, { - "epoch": 0.95, - "learning_rate": 0.00015678897740286862, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022641939338640313, + "loss": 0.0214, "step": 189240 }, { - "epoch": 0.95, - "learning_rate": 0.00015678140970985463, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002264155051700317, + "loss": 0.0164, "step": 189250 }, { - "epoch": 0.95, - "learning_rate": 0.0001567738420168406, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.00022641161695366024, + "loss": 0.0171, "step": 189260 }, { - "epoch": 0.95, - "learning_rate": 0.0001567662743238266, - "loss": 0.0149, + "epoch": 0.49, + "learning_rate": 0.00022640772873728875, + "loss": 0.0173, "step": 189270 }, { - "epoch": 0.95, - "learning_rate": 0.0001567587066308126, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002264038405209173, + "loss": 0.0181, "step": 189280 }, { - "epoch": 0.95, - "learning_rate": 0.00015675113893779858, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022639995230454583, + "loss": 0.016, "step": 189290 }, { - "epoch": 0.96, - "learning_rate": 0.00015674357124478456, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022639606408817438, + "loss": 0.0222, "step": 189300 }, { - "epoch": 0.96, - "learning_rate": 0.00015673600355177057, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002263921758718029, + "loss": 0.0154, "step": 189310 }, { - "epoch": 0.96, - "learning_rate": 0.00015672843585875655, - "loss": 0.0077, + "epoch": 0.49, + "learning_rate": 0.00022638828765543143, + "loss": 0.0194, "step": 189320 }, { - "epoch": 0.96, - "learning_rate": 0.00015672086816574253, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022638439943905995, + "loss": 0.0337, "step": 189330 }, { - "epoch": 0.96, - "learning_rate": 0.00015671330047272854, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022638051122268851, + "loss": 0.0191, "step": 189340 }, { - "epoch": 0.96, - "learning_rate": 0.00015670573277971452, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022637662300631703, + "loss": 0.0146, "step": 189350 }, { - "epoch": 0.96, - "learning_rate": 0.0001566981650867005, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022637273478994557, + "loss": 0.0184, "step": 189360 }, { - "epoch": 0.96, - "learning_rate": 0.0001566905973936865, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022636884657357409, + "loss": 0.0175, "step": 189370 }, { - "epoch": 0.96, - "learning_rate": 0.0001566830297006725, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022636495835720265, + "loss": 0.0163, "step": 189380 }, { - "epoch": 0.96, - "learning_rate": 0.00015667546200765848, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.00022636107014083117, + "loss": 0.017, "step": 189390 }, { - "epoch": 0.96, - "learning_rate": 0.00015666789431464446, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.0002263571819244597, + "loss": 0.014, "step": 189400 }, { - "epoch": 0.96, - "learning_rate": 0.00015666032662163047, - "loss": 0.0137, + "epoch": 0.49, + "learning_rate": 0.00022635329370808822, + "loss": 0.0201, "step": 189410 }, { - "epoch": 0.96, - "learning_rate": 0.00015665275892861645, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.0002263494054917168, + "loss": 0.0186, "step": 189420 }, { - "epoch": 0.96, - "learning_rate": 0.00015664519123560243, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.00022634551727534534, + "loss": 0.0183, "step": 189430 }, { - "epoch": 0.96, - "learning_rate": 0.00015663762354258844, - "loss": 0.012, + "epoch": 0.49, + "learning_rate": 0.00022634162905897385, + "loss": 0.0222, "step": 189440 }, { - "epoch": 0.96, - "learning_rate": 0.00015663005584957442, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022633774084260236, + "loss": 0.0156, "step": 189450 }, { - "epoch": 0.96, - "learning_rate": 0.0001566224881565604, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022633385262623093, + "loss": 0.0155, "step": 189460 }, { - "epoch": 0.96, - "learning_rate": 0.0001566149204635464, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.00022632996440985947, + "loss": 0.0159, "step": 189470 }, { - "epoch": 0.96, - "learning_rate": 0.0001566073527705324, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.000226326076193488, + "loss": 0.0202, "step": 189480 }, { - "epoch": 0.96, - "learning_rate": 0.00015659978507751837, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022632218797711653, + "loss": 0.0144, "step": 189490 }, { - "epoch": 0.96, - "learning_rate": 0.00015659221738450438, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.00022631829976074507, + "loss": 0.0163, "step": 189500 }, { - "epoch": 0.96, - "learning_rate": 0.00015658464969149036, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022631441154437361, + "loss": 0.0174, "step": 189510 }, { - "epoch": 0.96, - "learning_rate": 0.00015657708199847634, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022631052332800213, + "loss": 0.0182, "step": 189520 }, { - "epoch": 0.96, - "learning_rate": 0.00015656951430546235, - "loss": 0.0119, + "epoch": 0.49, + "learning_rate": 0.00022630663511163067, + "loss": 0.018, "step": 189530 }, { - "epoch": 0.96, - "learning_rate": 0.00015656194661244833, - "loss": 0.0144, + "epoch": 0.49, + "learning_rate": 0.0002263027468952592, + "loss": 0.0192, "step": 189540 }, { - "epoch": 0.96, - "learning_rate": 0.00015655437891943431, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022629885867888775, + "loss": 0.019, "step": 189550 }, { - "epoch": 0.96, - "learning_rate": 0.00015654681122642032, - "loss": 0.0141, + "epoch": 0.49, + "learning_rate": 0.00022629497046251627, + "loss": 0.0145, "step": 189560 }, { - "epoch": 0.96, - "learning_rate": 0.0001565392435334063, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.0002262910822461448, + "loss": 0.021, "step": 189570 }, { - "epoch": 0.96, - "learning_rate": 0.00015653167584039229, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.00022628719402977332, + "loss": 0.0143, "step": 189580 }, { - "epoch": 0.96, - "learning_rate": 0.00015652410814737827, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002262833058134019, + "loss": 0.0171, "step": 189590 }, { - "epoch": 0.96, - "learning_rate": 0.00015651654045436428, - "loss": 0.0164, + "epoch": 0.49, + "learning_rate": 0.00022627941759703043, + "loss": 0.0146, "step": 189600 }, { - "epoch": 0.96, - "learning_rate": 0.00015650897276135026, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022627552938065895, + "loss": 0.0159, "step": 189610 }, { - "epoch": 0.96, - "learning_rate": 0.00015650140506833624, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022627164116428746, + "loss": 0.0156, "step": 189620 }, { - "epoch": 0.96, - "learning_rate": 0.00015649383737532225, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022626775294791603, + "loss": 0.0165, "step": 189630 }, { - "epoch": 0.96, - "learning_rate": 0.00015648626968230823, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.00022626386473154457, + "loss": 0.0146, "step": 189640 }, { - "epoch": 0.96, - "learning_rate": 0.0001564787019892942, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.0002262599765151731, + "loss": 0.0168, "step": 189650 }, { - "epoch": 0.96, - "learning_rate": 0.00015647113429628022, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022625608829880163, + "loss": 0.0143, "step": 189660 }, { - "epoch": 0.96, - "learning_rate": 0.0001564635666032662, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022625220008243017, + "loss": 0.0195, "step": 189670 }, { - "epoch": 0.96, - "learning_rate": 0.00015645599891025218, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022624831186605871, + "loss": 0.0218, "step": 189680 }, { - "epoch": 0.96, - "learning_rate": 0.0001564484312172382, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022624442364968723, + "loss": 0.0154, "step": 189690 }, { - "epoch": 0.96, - "learning_rate": 0.00015644086352422417, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022624053543331577, + "loss": 0.0177, "step": 189700 }, { - "epoch": 0.96, - "learning_rate": 0.00015643329583121015, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.0002262366472169443, + "loss": 0.0207, "step": 189710 }, { - "epoch": 0.96, - "learning_rate": 0.00015642572813819616, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022623275900057285, + "loss": 0.0165, "step": 189720 }, { - "epoch": 0.96, - "learning_rate": 0.00015641816044518214, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022622887078420137, + "loss": 0.0188, "step": 189730 }, { - "epoch": 0.96, - "learning_rate": 0.00015641059275216812, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002262249825678299, + "loss": 0.0173, "step": 189740 }, { - "epoch": 0.96, - "learning_rate": 0.0001564030250591541, - "loss": 0.0146, + "epoch": 0.49, + "learning_rate": 0.00022622109435145848, + "loss": 0.0207, "step": 189750 }, { - "epoch": 0.96, - "learning_rate": 0.00015639545736614011, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.000226217206135087, + "loss": 0.0183, "step": 189760 }, { - "epoch": 0.96, - "learning_rate": 0.0001563878896731261, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.0002262133179187155, + "loss": 0.017, "step": 189770 }, { - "epoch": 0.96, - "learning_rate": 0.00015638032198011208, - "loss": 0.0087, + "epoch": 0.49, + "learning_rate": 0.00022620942970234405, + "loss": 0.0175, "step": 189780 }, { - "epoch": 0.96, - "learning_rate": 0.00015637275428709809, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.00022620554148597262, + "loss": 0.0208, "step": 189790 }, { - "epoch": 0.96, - "learning_rate": 0.00015636518659408407, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022620165326960113, + "loss": 0.0169, "step": 189800 }, { - "epoch": 0.96, - "learning_rate": 0.00015635761890107005, - "loss": 0.0089, + "epoch": 0.49, + "learning_rate": 0.00022619776505322967, + "loss": 0.0183, "step": 189810 }, { - "epoch": 0.96, - "learning_rate": 0.00015635005120805606, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.0002261938768368582, + "loss": 0.0228, "step": 189820 }, { - "epoch": 0.96, - "learning_rate": 0.00015634248351504204, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.00022618998862048673, + "loss": 0.0166, "step": 189830 }, { - "epoch": 0.96, - "learning_rate": 0.00015633491582202802, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022618610040411527, + "loss": 0.0206, "step": 189840 }, { - "epoch": 0.96, - "learning_rate": 0.00015632734812901403, - "loss": 0.0128, + "epoch": 0.49, + "learning_rate": 0.0002261822121877438, + "loss": 0.0226, "step": 189850 }, { - "epoch": 0.96, - "learning_rate": 0.000156319780436, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022617832397137233, + "loss": 0.018, "step": 189860 }, { - "epoch": 0.96, - "learning_rate": 0.000156312212742986, - "loss": 0.0146, + "epoch": 0.49, + "learning_rate": 0.00022617443575500087, + "loss": 0.0158, "step": 189870 }, { - "epoch": 0.96, - "learning_rate": 0.000156304645049972, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.0002261705475386294, + "loss": 0.0188, "step": 189880 }, { - "epoch": 0.96, - "learning_rate": 0.00015629707735695798, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022616665932225795, + "loss": 0.0179, "step": 189890 }, { - "epoch": 0.96, - "learning_rate": 0.00015628950966394396, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022616277110588647, + "loss": 0.0162, "step": 189900 }, { - "epoch": 0.96, - "learning_rate": 0.00015628194197092994, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.000226158882889515, + "loss": 0.0147, "step": 189910 }, { - "epoch": 0.96, - "learning_rate": 0.00015627437427791595, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022615499467314355, + "loss": 0.0192, "step": 189920 }, { - "epoch": 0.96, - "learning_rate": 0.00015626680658490193, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.0002261511064567721, + "loss": 0.0198, "step": 189930 }, { - "epoch": 0.96, - "learning_rate": 0.00015625923889188792, - "loss": 0.0134, + "epoch": 0.49, + "learning_rate": 0.0002261472182404006, + "loss": 0.0176, "step": 189940 }, { - "epoch": 0.96, - "learning_rate": 0.00015625167119887392, - "loss": 0.0137, + "epoch": 0.49, + "learning_rate": 0.00022614333002402915, + "loss": 0.0178, "step": 189950 }, { - "epoch": 0.96, - "learning_rate": 0.0001562441035058599, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.00022613944180765772, + "loss": 0.0161, "step": 189960 }, { - "epoch": 0.96, - "learning_rate": 0.0001562365358128459, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022613555359128623, + "loss": 0.0195, "step": 189970 }, { - "epoch": 0.96, - "learning_rate": 0.0001562289681198319, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.00022613166537491477, + "loss": 0.0185, "step": 189980 }, { - "epoch": 0.96, - "learning_rate": 0.00015622140042681788, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.0002261277771585433, + "loss": 0.0233, "step": 189990 }, { - "epoch": 0.96, - "learning_rate": 0.00015621383273380386, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.00022612388894217186, + "loss": 0.0184, "step": 190000 }, { - "epoch": 0.96, - "eval_cer": 0.9144372624348985, - "eval_loss": 0.007905209437012672, - "eval_runtime": 116.6163, - "eval_samples_per_second": 17.15, - "eval_steps_per_second": 4.288, + "epoch": 0.49, + "eval_cer": 0.8817894638130869, + "eval_loss": 0.01178650464862585, + "eval_runtime": 107.62, + "eval_samples_per_second": 18.584, + "eval_steps_per_second": 4.646, "step": 190000 }, { - "epoch": 0.96, - "learning_rate": 0.00015620626504078987, - "loss": 0.0084, + "epoch": 0.49, + "learning_rate": 0.00022612000072580037, + "loss": 0.0157, "step": 190010 }, { - "epoch": 0.96, - "learning_rate": 0.00015619869734777585, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.0002261161125094289, + "loss": 0.0139, "step": 190020 }, { - "epoch": 0.96, - "learning_rate": 0.00015619112965476183, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022611222429305743, + "loss": 0.0165, "step": 190030 }, { - "epoch": 0.96, - "learning_rate": 0.00015618356196174784, - "loss": 0.0118, + "epoch": 0.49, + "learning_rate": 0.000226108336076686, + "loss": 0.0176, "step": 190040 }, { - "epoch": 0.96, - "learning_rate": 0.00015617599426873382, - "loss": 0.0215, + "epoch": 0.49, + "learning_rate": 0.0002261044478603145, + "loss": 0.0134, "step": 190050 }, { - "epoch": 0.96, - "learning_rate": 0.0001561684265757198, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022610055964394305, + "loss": 0.0154, "step": 190060 }, { - "epoch": 0.96, - "learning_rate": 0.0001561608588827058, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022609667142757157, + "loss": 0.0162, "step": 190070 }, { - "epoch": 0.96, - "learning_rate": 0.0001561532911896918, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.0002260927832112001, + "loss": 0.0177, "step": 190080 }, { - "epoch": 0.96, - "learning_rate": 0.00015614572349667777, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022608889499482865, + "loss": 0.0165, "step": 190090 }, { - "epoch": 0.96, - "learning_rate": 0.00015613815580366375, - "loss": 0.0092, + "epoch": 0.49, + "learning_rate": 0.0002260850067784572, + "loss": 0.0159, "step": 190100 }, { - "epoch": 0.96, - "learning_rate": 0.00015613058811064976, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002260811185620857, + "loss": 0.0164, "step": 190110 }, { - "epoch": 0.96, - "learning_rate": 0.00015612302041763574, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022607723034571425, + "loss": 0.0188, "step": 190120 }, { - "epoch": 0.96, - "learning_rate": 0.00015611545272462173, - "loss": 0.0126, + "epoch": 0.49, + "learning_rate": 0.00022607334212934282, + "loss": 0.0153, "step": 190130 }, { - "epoch": 0.96, - "learning_rate": 0.00015610788503160773, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022606945391297133, + "loss": 0.0182, "step": 190140 }, { - "epoch": 0.96, - "learning_rate": 0.00015610031733859372, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022606556569659987, + "loss": 0.0145, "step": 190150 }, { - "epoch": 0.96, - "learning_rate": 0.0001560927496455797, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.0002260616774802284, + "loss": 0.0173, "step": 190160 }, { - "epoch": 0.96, - "learning_rate": 0.0001560851819525657, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022605778926385696, + "loss": 0.0145, "step": 190170 }, { - "epoch": 0.96, - "learning_rate": 0.0001560776142595517, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.00022605390104748547, + "loss": 0.0188, "step": 190180 }, { - "epoch": 0.96, - "learning_rate": 0.00015607004656653767, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.000226050012831114, + "loss": 0.0167, "step": 190190 }, { - "epoch": 0.96, - "learning_rate": 0.00015606247887352368, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022604612461474253, + "loss": 0.0193, "step": 190200 }, { - "epoch": 0.96, - "learning_rate": 0.00015605491118050966, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.0002260422363983711, + "loss": 0.0194, "step": 190210 }, { - "epoch": 0.96, - "learning_rate": 0.00015604734348749564, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.0002260383481819996, + "loss": 0.0138, "step": 190220 }, { - "epoch": 0.96, - "learning_rate": 0.00015603977579448165, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.00022603445996562815, + "loss": 0.0165, "step": 190230 }, { - "epoch": 0.96, - "learning_rate": 0.00015603220810146763, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022603057174925667, + "loss": 0.0153, "step": 190240 }, { - "epoch": 0.96, - "learning_rate": 0.0001560246404084536, - "loss": 0.0106, + "epoch": 0.49, + "learning_rate": 0.00022602668353288523, + "loss": 0.0202, "step": 190250 }, { - "epoch": 0.96, - "learning_rate": 0.0001560170727154396, - "loss": 0.0122, + "epoch": 0.49, + "learning_rate": 0.00022602279531651375, + "loss": 0.0155, "step": 190260 }, { - "epoch": 0.96, - "learning_rate": 0.0001560095050224256, - "loss": 0.009, + "epoch": 0.49, + "learning_rate": 0.0002260189071001423, + "loss": 0.0193, "step": 190270 }, { - "epoch": 0.96, - "learning_rate": 0.00015600193732941158, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002260150188837708, + "loss": 0.0205, "step": 190280 }, { - "epoch": 0.96, - "learning_rate": 0.00015599436963639756, - "loss": 0.0135, + "epoch": 0.49, + "learning_rate": 0.00022601113066739937, + "loss": 0.0186, "step": 190290 }, { - "epoch": 0.96, - "learning_rate": 0.00015598680194338357, - "loss": 0.01, + "epoch": 0.49, + "learning_rate": 0.00022600724245102792, + "loss": 0.0158, "step": 190300 }, { - "epoch": 0.96, - "learning_rate": 0.00015597923425036955, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.00022600335423465643, + "loss": 0.0177, "step": 190310 }, { - "epoch": 0.96, - "learning_rate": 0.00015597166655735554, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.00022599946601828494, + "loss": 0.0161, "step": 190320 }, { - "epoch": 0.96, - "learning_rate": 0.00015596409886434154, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.00022599557780191349, + "loss": 0.0164, "step": 190330 }, { - "epoch": 0.96, - "learning_rate": 0.00015595653117132753, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022599168958554206, + "loss": 0.0169, "step": 190340 }, { - "epoch": 0.96, - "learning_rate": 0.0001559489634783135, - "loss": 0.0144, + "epoch": 0.49, + "learning_rate": 0.00022598780136917057, + "loss": 0.0189, "step": 190350 }, { - "epoch": 0.96, - "learning_rate": 0.00015594139578529952, - "loss": 0.0136, + "epoch": 0.49, + "learning_rate": 0.0002259839131527991, + "loss": 0.0186, "step": 190360 }, { - "epoch": 0.96, - "learning_rate": 0.0001559338280922855, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022598002493642763, + "loss": 0.0174, "step": 190370 }, { - "epoch": 0.96, - "learning_rate": 0.00015592626039927148, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.0002259761367200562, + "loss": 0.0237, "step": 190380 }, { - "epoch": 0.96, - "learning_rate": 0.0001559186927062575, - "loss": 0.0101, + "epoch": 0.49, + "learning_rate": 0.0002259722485036847, + "loss": 0.0225, "step": 190390 }, { - "epoch": 0.96, - "learning_rate": 0.00015591112501324347, - "loss": 0.0085, + "epoch": 0.49, + "learning_rate": 0.00022596836028731325, + "loss": 0.0152, "step": 190400 }, { - "epoch": 0.96, - "learning_rate": 0.00015590355732022945, - "loss": 0.0114, + "epoch": 0.49, + "learning_rate": 0.00022596447207094177, + "loss": 0.0172, "step": 190410 }, { - "epoch": 0.96, - "learning_rate": 0.0001558959896272154, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.00022596058385457033, + "loss": 0.0171, "step": 190420 }, { - "epoch": 0.96, - "learning_rate": 0.0001558884219342014, - "loss": 0.0115, + "epoch": 0.49, + "learning_rate": 0.00022595669563819885, + "loss": 0.0201, "step": 190430 }, { - "epoch": 0.96, - "learning_rate": 0.0001558808542411874, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002259528074218274, + "loss": 0.014, "step": 190440 }, { - "epoch": 0.96, - "learning_rate": 0.00015587328654817338, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.0002259489192054559, + "loss": 0.0207, "step": 190450 }, { - "epoch": 0.96, - "learning_rate": 0.00015586571885515938, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022594503098908447, + "loss": 0.0164, "step": 190460 }, { - "epoch": 0.96, - "learning_rate": 0.00015585815116214537, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022594114277271302, + "loss": 0.016, "step": 190470 }, { - "epoch": 0.96, - "learning_rate": 0.00015585058346913135, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022593725455634153, + "loss": 0.0341, "step": 190480 }, { - "epoch": 0.96, - "learning_rate": 0.00015584301577611733, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022593336633997004, + "loss": 0.0191, "step": 190490 }, { - "epoch": 0.96, - "learning_rate": 0.00015583544808310334, - "loss": 0.0102, + "epoch": 0.49, + "learning_rate": 0.0002259294781235986, + "loss": 0.016, "step": 190500 }, { - "epoch": 0.96, - "learning_rate": 0.00015582788039008932, - "loss": 0.0087, + "epoch": 0.49, + "learning_rate": 0.00022592558990722715, + "loss": 0.0212, "step": 190510 }, { - "epoch": 0.96, - "learning_rate": 0.0001558203126970753, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.00022592170169085567, + "loss": 0.0186, "step": 190520 }, { - "epoch": 0.96, - "learning_rate": 0.0001558127450040613, - "loss": 0.013, + "epoch": 0.49, + "learning_rate": 0.0002259178134744842, + "loss": 0.0185, "step": 190530 }, { - "epoch": 0.96, - "learning_rate": 0.0001558051773110473, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.00022591392525811275, + "loss": 0.0189, "step": 190540 }, { - "epoch": 0.96, - "learning_rate": 0.00015579760961803327, - "loss": 0.0135, + "epoch": 0.49, + "learning_rate": 0.0002259100370417413, + "loss": 0.0157, "step": 190550 }, { - "epoch": 0.96, - "learning_rate": 0.00015579004192501928, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.0002259061488253698, + "loss": 0.0184, "step": 190560 }, { - "epoch": 0.96, - "learning_rate": 0.00015578247423200526, - "loss": 0.0109, + "epoch": 0.49, + "learning_rate": 0.00022590226060899835, + "loss": 0.0184, "step": 190570 }, { - "epoch": 0.96, - "learning_rate": 0.00015577490653899124, - "loss": 0.0144, + "epoch": 0.49, + "learning_rate": 0.00022589837239262686, + "loss": 0.0189, "step": 190580 }, { - "epoch": 0.96, - "learning_rate": 0.00015576733884597725, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022589448417625543, + "loss": 0.0184, "step": 190590 }, { - "epoch": 0.96, - "learning_rate": 0.00015575977115296323, - "loss": 0.0139, + "epoch": 0.49, + "learning_rate": 0.00022589059595988395, + "loss": 0.0173, "step": 190600 }, { - "epoch": 0.96, - "learning_rate": 0.00015575220345994921, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.0002258867077435125, + "loss": 0.0189, "step": 190610 }, { - "epoch": 0.96, - "learning_rate": 0.00015574463576693522, - "loss": 0.0121, + "epoch": 0.49, + "learning_rate": 0.000225882819527141, + "loss": 0.0127, "step": 190620 }, { - "epoch": 0.96, - "learning_rate": 0.0001557370680739212, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022587893131076957, + "loss": 0.016, "step": 190630 }, { - "epoch": 0.96, - "learning_rate": 0.00015572950038090719, - "loss": 0.0127, + "epoch": 0.49, + "learning_rate": 0.0002258750430943981, + "loss": 0.0175, "step": 190640 }, { - "epoch": 0.96, - "learning_rate": 0.00015572193268789317, - "loss": 0.0088, + "epoch": 0.49, + "learning_rate": 0.00022587115487802663, + "loss": 0.0163, "step": 190650 }, { - "epoch": 0.96, - "learning_rate": 0.00015571436499487918, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022586726666165514, + "loss": 0.0155, "step": 190660 }, { - "epoch": 0.96, - "learning_rate": 0.00015570679730186516, - "loss": 0.0117, + "epoch": 0.49, + "learning_rate": 0.0002258633784452837, + "loss": 0.0214, "step": 190670 }, { - "epoch": 0.96, - "learning_rate": 0.00015569922960885114, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022585949022891225, + "loss": 0.0182, "step": 190680 }, { - "epoch": 0.96, - "learning_rate": 0.00015569166191583715, - "loss": 0.0086, + "epoch": 0.49, + "learning_rate": 0.00022585560201254077, + "loss": 0.0211, "step": 190690 }, { - "epoch": 0.96, - "learning_rate": 0.00015568409422282313, - "loss": 0.0094, + "epoch": 0.49, + "learning_rate": 0.0002258517137961693, + "loss": 0.0142, "step": 190700 }, { - "epoch": 0.96, - "learning_rate": 0.0001556765265298091, - "loss": 0.0124, + "epoch": 0.49, + "learning_rate": 0.00022584782557979785, + "loss": 0.0182, "step": 190710 }, { - "epoch": 0.96, - "learning_rate": 0.00015566895883679512, - "loss": 0.0153, + "epoch": 0.49, + "learning_rate": 0.0002258439373634264, + "loss": 0.0195, "step": 190720 }, { - "epoch": 0.96, - "learning_rate": 0.0001556613911437811, - "loss": 0.0129, + "epoch": 0.49, + "learning_rate": 0.0002258400491470549, + "loss": 0.0182, "step": 190730 }, { - "epoch": 0.96, - "learning_rate": 0.00015565382345076708, - "loss": 0.0149, + "epoch": 0.49, + "learning_rate": 0.00022583616093068345, + "loss": 0.0171, "step": 190740 }, { - "epoch": 0.96, - "learning_rate": 0.0001556462557577531, - "loss": 0.0097, + "epoch": 0.49, + "learning_rate": 0.000225832272714312, + "loss": 0.0161, "step": 190750 }, { - "epoch": 0.96, - "learning_rate": 0.00015563868806473907, - "loss": 0.0132, + "epoch": 0.49, + "learning_rate": 0.00022582838449794053, + "loss": 0.0144, "step": 190760 }, { - "epoch": 0.96, - "learning_rate": 0.00015563112037172505, - "loss": 0.0123, + "epoch": 0.49, + "learning_rate": 0.00022582449628156905, + "loss": 0.0265, "step": 190770 }, { - "epoch": 0.96, - "learning_rate": 0.00015562355267871106, - "loss": 0.0087, + "epoch": 0.49, + "learning_rate": 0.0002258206080651976, + "loss": 0.0155, "step": 190780 }, { - "epoch": 0.96, - "learning_rate": 0.00015561598498569704, - "loss": 0.0105, + "epoch": 0.49, + "learning_rate": 0.00022581671984882616, + "loss": 0.0161, "step": 190790 }, { - "epoch": 0.96, - "learning_rate": 0.00015560841729268302, - "loss": 0.011, + "epoch": 0.49, + "learning_rate": 0.00022581283163245467, + "loss": 0.0141, "step": 190800 }, { - "epoch": 0.96, - "learning_rate": 0.000155600849599669, - "loss": 0.0134, + "epoch": 0.49, + "learning_rate": 0.0002258089434160832, + "loss": 0.0164, "step": 190810 }, { - "epoch": 0.96, - "learning_rate": 0.00015559328190665501, - "loss": 0.0107, + "epoch": 0.49, + "learning_rate": 0.00022580505519971173, + "loss": 0.0191, "step": 190820 }, { - "epoch": 0.96, - "learning_rate": 0.000155585714213641, - "loss": 0.0108, + "epoch": 0.49, + "learning_rate": 0.00022580116698334024, + "loss": 0.0202, "step": 190830 }, { - "epoch": 0.96, - "learning_rate": 0.00015557814652062698, - "loss": 0.0093, + "epoch": 0.49, + "learning_rate": 0.0002257972787669688, + "loss": 0.0206, "step": 190840 }, { - "epoch": 0.96, - "learning_rate": 0.00015557057882761299, - "loss": 0.0116, + "epoch": 0.49, + "learning_rate": 0.00022579339055059735, + "loss": 0.0181, "step": 190850 }, { - "epoch": 0.96, - "learning_rate": 0.00015556301113459897, - "loss": 0.0125, + "epoch": 0.49, + "learning_rate": 0.00022578950233422587, + "loss": 0.0202, "step": 190860 }, { - "epoch": 0.96, - "learning_rate": 0.00015555544344158495, - "loss": 0.0064, + "epoch": 0.49, + "learning_rate": 0.0002257856141178544, + "loss": 0.0312, "step": 190870 }, { - "epoch": 0.96, - "learning_rate": 0.00015554787574857096, - "loss": 0.0104, + "epoch": 0.49, + "learning_rate": 0.00022578172590148295, + "loss": 0.0134, "step": 190880 }, { - "epoch": 0.96, - "learning_rate": 0.00015554030805555694, - "loss": 0.0098, + "epoch": 0.49, + "learning_rate": 0.0002257778376851115, + "loss": 0.0152, "step": 190890 }, { - "epoch": 0.96, - "learning_rate": 0.00015553274036254292, - "loss": 0.0099, + "epoch": 0.49, + "learning_rate": 0.00022577394946874, + "loss": 0.0157, "step": 190900 }, { - "epoch": 0.96, - "learning_rate": 0.00015552517266952893, - "loss": 0.0113, + "epoch": 0.49, + "learning_rate": 0.00022577006125236855, + "loss": 0.0152, "step": 190910 }, { - "epoch": 0.96, - "learning_rate": 0.0001555176049765149, - "loss": 0.0112, + "epoch": 0.49, + "learning_rate": 0.0002257661730359971, + "loss": 0.0197, "step": 190920 }, { - "epoch": 0.96, - "learning_rate": 0.0001555100372835009, - "loss": 0.0103, + "epoch": 0.49, + "learning_rate": 0.00022576228481962563, + "loss": 0.0199, "step": 190930 }, { - "epoch": 0.96, - "learning_rate": 0.0001555024695904869, - "loss": 0.0096, + "epoch": 0.49, + "learning_rate": 0.00022575839660325415, + "loss": 0.0204, "step": 190940 }, { - "epoch": 0.96, - "learning_rate": 0.00015549490189747288, - "loss": 0.0077, + "epoch": 0.49, + "learning_rate": 0.0002257545083868827, + "loss": 0.0242, "step": 190950 }, { - "epoch": 0.96, - "learning_rate": 0.00015548733420445886, - "loss": 0.0111, + "epoch": 0.49, + "learning_rate": 0.00022575062017051123, + "loss": 0.0165, "step": 190960 }, { - "epoch": 0.96, - "learning_rate": 0.00015547976651144487, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022574673195413977, + "loss": 0.018, "step": 190970 }, { - "epoch": 0.96, - "learning_rate": 0.00015547219881843085, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022574284373776829, + "loss": 0.0175, "step": 190980 }, { - "epoch": 0.96, - "learning_rate": 0.00015546463112541683, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022573895552139683, + "loss": 0.0174, "step": 190990 }, { - "epoch": 0.96, - "learning_rate": 0.00015545706343240282, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.0002257350673050254, + "loss": 0.0218, "step": 191000 }, { - "epoch": 0.96, - "eval_cer": 0.9144634631302844, - "eval_loss": 0.007862123660743237, - "eval_runtime": 115.5241, - "eval_samples_per_second": 17.312, - "eval_steps_per_second": 4.328, + "epoch": 0.5, + "eval_cer": 0.8817964619977577, + "eval_loss": 0.01211930438876152, + "eval_runtime": 107.8599, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, "step": 191000 }, { - "epoch": 0.96, - "learning_rate": 0.00015544949573938882, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.0002257311790886539, + "loss": 0.0167, "step": 191010 }, { - "epoch": 0.96, - "learning_rate": 0.0001554419280463748, - "loss": 0.0134, + "epoch": 0.5, + "learning_rate": 0.00022572729087228245, + "loss": 0.0167, "step": 191020 }, { - "epoch": 0.96, - "learning_rate": 0.0001554343603533608, - "loss": 0.0088, + "epoch": 0.5, + "learning_rate": 0.00022572340265591097, + "loss": 0.0185, "step": 191030 }, { - "epoch": 0.96, - "learning_rate": 0.0001554267926603468, - "loss": 0.0132, + "epoch": 0.5, + "learning_rate": 0.00022571951443953954, + "loss": 0.0151, "step": 191040 }, { - "epoch": 0.96, - "learning_rate": 0.00015541922496733278, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022571562622316805, + "loss": 0.0177, "step": 191050 }, { - "epoch": 0.96, - "learning_rate": 0.00015541165727431876, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002257117380067966, + "loss": 0.0188, "step": 191060 }, { - "epoch": 0.96, - "learning_rate": 0.00015540408958130477, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002257078497904251, + "loss": 0.0203, "step": 191070 }, { - "epoch": 0.96, - "learning_rate": 0.00015539652188829075, - "loss": 0.0157, + "epoch": 0.5, + "learning_rate": 0.00022570396157405365, + "loss": 0.0205, "step": 191080 }, { - "epoch": 0.96, - "learning_rate": 0.00015538895419527673, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.0002257000733576822, + "loss": 0.0177, "step": 191090 }, { - "epoch": 0.96, - "learning_rate": 0.00015538138650226274, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022569618514131073, + "loss": 0.0242, "step": 191100 }, { - "epoch": 0.96, - "learning_rate": 0.00015537381880924872, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022569229692493925, + "loss": 0.0136, "step": 191110 }, { - "epoch": 0.96, - "learning_rate": 0.0001553662511162347, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.0002256884087085678, + "loss": 0.021, "step": 191120 }, { - "epoch": 0.96, - "learning_rate": 0.0001553586834232207, - "loss": 0.0174, + "epoch": 0.5, + "learning_rate": 0.00022568452049219633, + "loss": 0.0241, "step": 191130 }, { - "epoch": 0.96, - "learning_rate": 0.0001553511157302067, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022568063227582487, + "loss": 0.0181, "step": 191140 }, { - "epoch": 0.96, - "learning_rate": 0.00015534354803719267, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022567674405945339, + "loss": 0.0193, "step": 191150 }, { - "epoch": 0.96, - "learning_rate": 0.00015533598034417865, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022567285584308193, + "loss": 0.0201, "step": 191160 }, { - "epoch": 0.96, - "learning_rate": 0.00015532841265116466, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.0002256689676267105, + "loss": 0.0184, "step": 191170 }, { - "epoch": 0.96, - "learning_rate": 0.00015532084495815064, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.000225665079410339, + "loss": 0.0258, "step": 191180 }, { - "epoch": 0.96, - "learning_rate": 0.00015531327726513663, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.00022566119119396755, + "loss": 0.0159, "step": 191190 }, { - "epoch": 0.96, - "learning_rate": 0.00015530570957212263, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022565730297759607, + "loss": 0.0195, "step": 191200 }, { - "epoch": 0.96, - "learning_rate": 0.00015529814187910862, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022565341476122464, + "loss": 0.0178, "step": 191210 }, { - "epoch": 0.96, - "learning_rate": 0.0001552905741860946, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022564952654485315, + "loss": 0.0153, "step": 191220 }, { - "epoch": 0.96, - "learning_rate": 0.0001552830064930806, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002256456383284817, + "loss": 0.0174, "step": 191230 }, { - "epoch": 0.96, - "learning_rate": 0.0001552754388000666, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.0002256417501121102, + "loss": 0.017, "step": 191240 }, { - "epoch": 0.96, - "learning_rate": 0.00015526787110705257, - "loss": 0.0149, + "epoch": 0.5, + "learning_rate": 0.00022563786189573877, + "loss": 0.0241, "step": 191250 }, { - "epoch": 0.96, - "learning_rate": 0.00015526030341403858, - "loss": 0.014, + "epoch": 0.5, + "learning_rate": 0.0002256339736793673, + "loss": 0.0183, "step": 191260 }, { - "epoch": 0.96, - "learning_rate": 0.00015525273572102456, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022563008546299583, + "loss": 0.0211, "step": 191270 }, { - "epoch": 0.97, - "learning_rate": 0.00015524516802801054, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022562619724662435, + "loss": 0.0192, "step": 191280 }, { - "epoch": 0.97, - "learning_rate": 0.00015523760033499655, - "loss": 0.0139, + "epoch": 0.5, + "learning_rate": 0.00022562230903025291, + "loss": 0.0183, "step": 191290 }, { - "epoch": 0.97, - "learning_rate": 0.00015523003264198253, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022561842081388143, + "loss": 0.0176, "step": 191300 }, { - "epoch": 0.97, - "learning_rate": 0.0001552224649489685, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022561453259750997, + "loss": 0.0182, "step": 191310 }, { - "epoch": 0.97, - "learning_rate": 0.0001552148972559545, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022561064438113849, + "loss": 0.0128, "step": 191320 }, { - "epoch": 0.97, - "learning_rate": 0.0001552073295629405, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022560675616476703, + "loss": 0.0117, "step": 191330 }, { - "epoch": 0.97, - "learning_rate": 0.00015519976186992648, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002256028679483956, + "loss": 0.0254, "step": 191340 }, { - "epoch": 0.97, - "learning_rate": 0.00015519219417691247, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002255989797320241, + "loss": 0.0169, "step": 191350 }, { - "epoch": 0.97, - "learning_rate": 0.00015518462648389847, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.00022559509151565262, + "loss": 0.0166, "step": 191360 }, { - "epoch": 0.97, - "learning_rate": 0.00015517705879088446, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022559120329928117, + "loss": 0.0185, "step": 191370 }, { - "epoch": 0.97, - "learning_rate": 0.00015516949109787044, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022558731508290973, + "loss": 0.0175, "step": 191380 }, { - "epoch": 0.97, - "learning_rate": 0.00015516192340485645, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022558342686653825, + "loss": 0.0156, "step": 191390 }, { - "epoch": 0.97, - "learning_rate": 0.00015515435571184243, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.0002255795386501668, + "loss": 0.0189, "step": 191400 }, { - "epoch": 0.97, - "learning_rate": 0.0001551467880188284, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.0002255756504337953, + "loss": 0.0242, "step": 191410 }, { - "epoch": 0.97, - "learning_rate": 0.00015513922032581442, - "loss": 0.0136, + "epoch": 0.5, + "learning_rate": 0.00022557176221742387, + "loss": 0.0176, "step": 191420 }, { - "epoch": 0.97, - "learning_rate": 0.0001551316526328004, - "loss": 0.015, + "epoch": 0.5, + "learning_rate": 0.0002255678740010524, + "loss": 0.0204, "step": 191430 }, { - "epoch": 0.97, - "learning_rate": 0.00015512408493978638, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022556398578468093, + "loss": 0.0232, "step": 191440 }, { - "epoch": 0.97, - "learning_rate": 0.0001551165172467724, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022556009756830945, + "loss": 0.0199, "step": 191450 }, { - "epoch": 0.97, - "learning_rate": 0.00015510894955375837, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022555620935193801, + "loss": 0.0179, "step": 191460 }, { - "epoch": 0.97, - "learning_rate": 0.00015510138186074435, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022555232113556653, + "loss": 0.0216, "step": 191470 }, { - "epoch": 0.97, - "learning_rate": 0.00015509381416773036, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022554843291919507, + "loss": 0.0176, "step": 191480 }, { - "epoch": 0.97, - "learning_rate": 0.00015508624647471634, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022554454470282358, + "loss": 0.0185, "step": 191490 }, { - "epoch": 0.97, - "learning_rate": 0.00015507867878170232, - "loss": 0.0143, + "epoch": 0.5, + "learning_rate": 0.00022554065648645215, + "loss": 0.0219, "step": 191500 }, { - "epoch": 0.97, - "learning_rate": 0.0001550711110886883, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022553676827008067, + "loss": 0.0168, "step": 191510 }, { - "epoch": 0.97, - "learning_rate": 0.0001550635433956743, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.0002255328800537092, + "loss": 0.0185, "step": 191520 }, { - "epoch": 0.97, - "learning_rate": 0.0001550559757026603, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022552899183733772, + "loss": 0.017, "step": 191530 }, { - "epoch": 0.97, - "learning_rate": 0.00015504840800964628, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.00022552510362096627, + "loss": 0.0176, "step": 191540 }, { - "epoch": 0.97, - "learning_rate": 0.00015504084031663228, - "loss": 0.0136, + "epoch": 0.5, + "learning_rate": 0.00022552121540459483, + "loss": 0.017, "step": 191550 }, { - "epoch": 0.97, - "learning_rate": 0.00015503327262361827, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022551732718822335, + "loss": 0.0169, "step": 191560 }, { - "epoch": 0.97, - "learning_rate": 0.00015502570493060425, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.0002255134389718519, + "loss": 0.0159, "step": 191570 }, { - "epoch": 0.97, - "learning_rate": 0.00015501813723759026, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002255095507554804, + "loss": 0.0202, "step": 191580 }, { - "epoch": 0.97, - "learning_rate": 0.00015501056954457624, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022550566253910897, + "loss": 0.0173, "step": 191590 }, { - "epoch": 0.97, - "learning_rate": 0.00015500300185156222, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.0002255017743227375, + "loss": 0.0221, "step": 191600 }, { - "epoch": 0.97, - "learning_rate": 0.00015499543415854823, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022549788610636603, + "loss": 0.0164, "step": 191610 }, { - "epoch": 0.97, - "learning_rate": 0.0001549878664655342, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022549399788999454, + "loss": 0.018, "step": 191620 }, { - "epoch": 0.97, - "learning_rate": 0.0001549802987725202, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002254901096736231, + "loss": 0.0212, "step": 191630 }, { - "epoch": 0.97, - "learning_rate": 0.0001549727310795062, - "loss": 0.0141, + "epoch": 0.5, + "learning_rate": 0.00022548622145725163, + "loss": 0.0197, "step": 191640 }, { - "epoch": 0.97, - "learning_rate": 0.00015496516338649218, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022548233324088017, + "loss": 0.0178, "step": 191650 }, { - "epoch": 0.97, - "learning_rate": 0.00015495759569347816, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.00022547844502450868, + "loss": 0.0191, "step": 191660 }, { - "epoch": 0.97, - "learning_rate": 0.00015495002800046414, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022547455680813725, + "loss": 0.0163, "step": 191670 }, { - "epoch": 0.97, - "learning_rate": 0.00015494246030745012, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022547066859176577, + "loss": 0.019, "step": 191680 }, { - "epoch": 0.97, - "learning_rate": 0.0001549348926144361, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.0002254667803753943, + "loss": 0.0166, "step": 191690 }, { - "epoch": 0.97, - "learning_rate": 0.0001549273249214221, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022546289215902282, + "loss": 0.0165, "step": 191700 }, { - "epoch": 0.97, - "learning_rate": 0.00015491975722840807, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.0002254590039426514, + "loss": 0.0153, "step": 191710 }, { - "epoch": 0.97, - "learning_rate": 0.00015491218953539408, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022545511572627993, + "loss": 0.0172, "step": 191720 }, { - "epoch": 0.97, - "learning_rate": 0.00015490462184238006, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022545122750990845, + "loss": 0.013, "step": 191730 }, { - "epoch": 0.97, - "learning_rate": 0.00015489705414936604, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.000225447339293537, + "loss": 0.0136, "step": 191740 }, { - "epoch": 0.97, - "learning_rate": 0.00015488948645635205, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022544345107716553, + "loss": 0.0124, "step": 191750 }, { - "epoch": 0.97, - "learning_rate": 0.00015488191876333803, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022543956286079407, + "loss": 0.0182, "step": 191760 }, { - "epoch": 0.97, - "learning_rate": 0.000154874351070324, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002254356746444226, + "loss": 0.016, "step": 191770 }, { - "epoch": 0.97, - "learning_rate": 0.00015486678337731002, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022543178642805113, + "loss": 0.0184, "step": 191780 }, { - "epoch": 0.97, - "learning_rate": 0.000154859215684296, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022542789821167964, + "loss": 0.0142, "step": 191790 }, { - "epoch": 0.97, - "learning_rate": 0.00015485164799128198, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.0002254240099953082, + "loss": 0.0131, "step": 191800 }, { - "epoch": 0.97, - "learning_rate": 0.000154844080298268, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022542012177893673, + "loss": 0.0189, "step": 191810 }, { - "epoch": 0.97, - "learning_rate": 0.00015483651260525397, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022541623356256527, + "loss": 0.0145, "step": 191820 }, { - "epoch": 0.97, - "learning_rate": 0.00015482894491223995, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022541234534619378, + "loss": 0.0169, "step": 191830 }, { - "epoch": 0.97, - "learning_rate": 0.00015482137721922596, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.00022540845712982235, + "loss": 0.0191, "step": 191840 }, { - "epoch": 0.97, - "learning_rate": 0.00015481380952621194, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022540456891345087, + "loss": 0.0144, "step": 191850 }, { - "epoch": 0.97, - "learning_rate": 0.00015480624183319793, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002254006806970794, + "loss": 0.0191, "step": 191860 }, { - "epoch": 0.97, - "learning_rate": 0.00015479867414018393, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022539679248070792, + "loss": 0.0146, "step": 191870 }, { - "epoch": 0.97, - "learning_rate": 0.00015479110644716992, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.0002253929042643365, + "loss": 0.0201, "step": 191880 }, { - "epoch": 0.97, - "learning_rate": 0.0001547835387541559, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022538901604796503, + "loss": 0.0185, "step": 191890 }, { - "epoch": 0.97, - "learning_rate": 0.00015477597106114188, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022538512783159355, + "loss": 0.0191, "step": 191900 }, { - "epoch": 0.97, - "learning_rate": 0.0001547684033681279, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022538123961522206, + "loss": 0.0163, "step": 191910 }, { - "epoch": 0.97, - "learning_rate": 0.00015476083567511387, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022537735139885063, + "loss": 0.0197, "step": 191920 }, { - "epoch": 0.97, - "learning_rate": 0.00015475326798209985, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022537346318247917, + "loss": 0.0192, "step": 191930 }, { - "epoch": 0.97, - "learning_rate": 0.00015474570028908586, - "loss": 0.0072, + "epoch": 0.5, + "learning_rate": 0.0002253695749661077, + "loss": 0.0205, "step": 191940 }, { - "epoch": 0.97, - "learning_rate": 0.00015473813259607184, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022536568674973623, + "loss": 0.0181, "step": 191950 }, { - "epoch": 0.97, - "learning_rate": 0.00015473056490305782, - "loss": 0.0141, + "epoch": 0.5, + "learning_rate": 0.00022536179853336477, + "loss": 0.0172, "step": 191960 }, { - "epoch": 0.97, - "learning_rate": 0.00015472299721004383, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002253579103169933, + "loss": 0.0187, "step": 191970 }, { - "epoch": 0.97, - "learning_rate": 0.0001547154295170298, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022535402210062183, + "loss": 0.022, "step": 191980 }, { - "epoch": 0.97, - "learning_rate": 0.0001547078618240158, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022535013388425037, + "loss": 0.0179, "step": 191990 }, { - "epoch": 0.97, - "learning_rate": 0.0001547002941310018, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.0002253462456678789, + "loss": 0.0161, "step": 192000 }, { - "epoch": 0.97, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.008027549833059311, - "eval_runtime": 116.6747, - "eval_samples_per_second": 17.142, - "eval_steps_per_second": 4.285, + "epoch": 0.5, + "eval_cer": 0.8818188561887047, + "eval_loss": 0.012052525766193867, + "eval_runtime": 108.244, + "eval_samples_per_second": 18.477, + "eval_steps_per_second": 4.619, "step": 192000 }, { - "epoch": 0.97, - "learning_rate": 0.00015469272643798778, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022534235745150745, + "loss": 0.0164, "step": 192010 }, { - "epoch": 0.97, - "learning_rate": 0.00015468515874497376, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022533846923513597, + "loss": 0.0162, "step": 192020 }, { - "epoch": 0.97, - "learning_rate": 0.00015467759105195977, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002253345810187645, + "loss": 0.0144, "step": 192030 }, { - "epoch": 0.97, - "learning_rate": 0.00015467002335894575, - "loss": 0.008, + "epoch": 0.5, + "learning_rate": 0.00022533069280239302, + "loss": 0.0217, "step": 192040 }, { - "epoch": 0.97, - "learning_rate": 0.00015466245566593174, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.0002253268045860216, + "loss": 0.0189, "step": 192050 }, { - "epoch": 0.97, - "learning_rate": 0.00015465488797291772, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022532291636965013, + "loss": 0.0167, "step": 192060 }, { - "epoch": 0.97, - "learning_rate": 0.00015464732027990373, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022531902815327865, + "loss": 0.0193, "step": 192070 }, { - "epoch": 0.97, - "learning_rate": 0.0001546397525868897, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022531513993690716, + "loss": 0.0212, "step": 192080 }, { - "epoch": 0.97, - "learning_rate": 0.0001546321848938757, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022531125172053573, + "loss": 0.0168, "step": 192090 }, { - "epoch": 0.97, - "learning_rate": 0.0001546246172008617, - "loss": 0.0163, + "epoch": 0.5, + "learning_rate": 0.00022530736350416427, + "loss": 0.0196, "step": 192100 }, { - "epoch": 0.97, - "learning_rate": 0.00015461704950784768, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.0002253034752877928, + "loss": 0.018, "step": 192110 }, { - "epoch": 0.97, - "learning_rate": 0.00015460948181483366, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022529958707142133, + "loss": 0.0241, "step": 192120 }, { - "epoch": 0.97, - "learning_rate": 0.00015460191412181967, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022529569885504987, + "loss": 0.0176, "step": 192130 }, { - "epoch": 0.97, - "learning_rate": 0.00015459434642880565, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002252918106386784, + "loss": 0.0175, "step": 192140 }, { - "epoch": 0.97, - "learning_rate": 0.00015458677873579163, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022528792242230693, + "loss": 0.019, "step": 192150 }, { - "epoch": 0.97, - "learning_rate": 0.00015457921104277764, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022528403420593547, + "loss": 0.0202, "step": 192160 }, { - "epoch": 0.97, - "learning_rate": 0.00015457164334976362, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.000225280145989564, + "loss": 0.018, "step": 192170 }, { - "epoch": 0.97, - "learning_rate": 0.0001545640756567496, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022527625777319255, + "loss": 0.0175, "step": 192180 }, { - "epoch": 0.97, - "learning_rate": 0.0001545565079637356, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022527236955682107, + "loss": 0.0182, "step": 192190 }, { - "epoch": 0.97, - "learning_rate": 0.0001545489402707216, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.0002252684813404496, + "loss": 0.0132, "step": 192200 }, { - "epoch": 0.97, - "learning_rate": 0.00015454137257770757, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022526459312407818, + "loss": 0.0191, "step": 192210 }, { - "epoch": 0.97, - "learning_rate": 0.00015453380488469356, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.0002252607049077067, + "loss": 0.0192, "step": 192220 }, { - "epoch": 0.97, - "learning_rate": 0.00015452623719167956, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002252568166913352, + "loss": 0.0173, "step": 192230 }, { - "epoch": 0.97, - "learning_rate": 0.00015451866949866555, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.00022525292847496375, + "loss": 0.0194, "step": 192240 }, { - "epoch": 0.97, - "learning_rate": 0.00015451110180565153, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022524904025859232, + "loss": 0.014, "step": 192250 }, { - "epoch": 0.97, - "learning_rate": 0.00015450353411263754, - "loss": 0.0085, + "epoch": 0.5, + "learning_rate": 0.00022524515204222083, + "loss": 0.0161, "step": 192260 }, { - "epoch": 0.97, - "learning_rate": 0.00015449596641962352, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022524126382584937, + "loss": 0.0149, "step": 192270 }, { - "epoch": 0.97, - "learning_rate": 0.0001544883987266095, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022523737560947789, + "loss": 0.0164, "step": 192280 }, { - "epoch": 0.97, - "learning_rate": 0.0001544808310335955, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.00022523348739310643, + "loss": 0.0148, "step": 192290 }, { - "epoch": 0.97, - "learning_rate": 0.0001544732633405815, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022522959917673497, + "loss": 0.0152, "step": 192300 }, { - "epoch": 0.97, - "learning_rate": 0.00015446569564756747, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.0002252257109603635, + "loss": 0.0177, "step": 192310 }, { - "epoch": 0.97, - "learning_rate": 0.00015445812795455348, - "loss": 0.0088, + "epoch": 0.5, + "learning_rate": 0.00022522182274399203, + "loss": 0.0218, "step": 192320 }, { - "epoch": 0.97, - "learning_rate": 0.00015445056026153946, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022521793452762057, + "loss": 0.0176, "step": 192330 }, { - "epoch": 0.97, - "learning_rate": 0.00015444299256852544, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.0002252140463112491, + "loss": 0.0173, "step": 192340 }, { - "epoch": 0.97, - "learning_rate": 0.00015443542487551145, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022521015809487765, + "loss": 0.0173, "step": 192350 }, { - "epoch": 0.97, - "learning_rate": 0.00015442785718249743, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022520626987850616, + "loss": 0.0191, "step": 192360 }, { - "epoch": 0.97, - "learning_rate": 0.0001544202894894834, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.0002252023816621347, + "loss": 0.0146, "step": 192370 }, { - "epoch": 0.97, - "learning_rate": 0.00015441272179646942, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022519849344576325, + "loss": 0.0201, "step": 192380 }, { - "epoch": 0.97, - "learning_rate": 0.0001544051541034554, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.0002251946052293918, + "loss": 0.0148, "step": 192390 }, { - "epoch": 0.97, - "learning_rate": 0.00015439758641044138, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002251907170130203, + "loss": 0.0177, "step": 192400 }, { - "epoch": 0.97, - "learning_rate": 0.00015439001871742737, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022518682879664885, + "loss": 0.0167, "step": 192410 }, { - "epoch": 0.97, - "learning_rate": 0.00015438245102441337, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022518294058027741, + "loss": 0.0156, "step": 192420 }, { - "epoch": 0.97, - "learning_rate": 0.00015437488333139936, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022517905236390593, + "loss": 0.0145, "step": 192430 }, { - "epoch": 0.97, - "learning_rate": 0.00015436731563838534, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022517516414753447, + "loss": 0.0156, "step": 192440 }, { - "epoch": 0.97, - "learning_rate": 0.00015435974794537135, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022517127593116299, + "loss": 0.0226, "step": 192450 }, { - "epoch": 0.97, - "learning_rate": 0.00015435218025235733, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022516738771479155, + "loss": 0.0207, "step": 192460 }, { - "epoch": 0.97, - "learning_rate": 0.0001543446125593433, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022516349949842007, + "loss": 0.0185, "step": 192470 }, { - "epoch": 0.97, - "learning_rate": 0.00015433704486632932, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002251596112820486, + "loss": 0.0191, "step": 192480 }, { - "epoch": 0.97, - "learning_rate": 0.0001543294771733153, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.00022515572306567712, + "loss": 0.0182, "step": 192490 }, { - "epoch": 0.97, - "learning_rate": 0.00015432190948030128, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.0002251518348493057, + "loss": 0.0167, "step": 192500 }, { - "epoch": 0.97, - "learning_rate": 0.0001543143417872873, - "loss": 0.0088, + "epoch": 0.5, + "learning_rate": 0.0002251479466329342, + "loss": 0.0167, "step": 192510 }, { - "epoch": 0.97, - "learning_rate": 0.00015430677409427327, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.00022514405841656275, + "loss": 0.0159, "step": 192520 }, { - "epoch": 0.97, - "learning_rate": 0.00015429920640125925, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022514017020019126, + "loss": 0.0176, "step": 192530 }, { - "epoch": 0.97, - "learning_rate": 0.00015429163870824526, - "loss": 0.0144, + "epoch": 0.5, + "learning_rate": 0.0002251362819838198, + "loss": 0.0165, "step": 192540 }, { - "epoch": 0.97, - "learning_rate": 0.00015428407101523124, - "loss": 0.0077, + "epoch": 0.5, + "learning_rate": 0.00022513239376744835, + "loss": 0.0199, "step": 192550 }, { - "epoch": 0.97, - "learning_rate": 0.00015427650332221722, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.0002251285055510769, + "loss": 0.0181, "step": 192560 }, { - "epoch": 0.97, - "learning_rate": 0.0001542689356292032, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.0002251246173347054, + "loss": 0.0173, "step": 192570 }, { - "epoch": 0.97, - "learning_rate": 0.0001542613679361892, - "loss": 0.007, + "epoch": 0.5, + "learning_rate": 0.00022512072911833395, + "loss": 0.0151, "step": 192580 }, { - "epoch": 0.97, - "learning_rate": 0.0001542538002431752, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022511684090196251, + "loss": 0.0214, "step": 192590 }, { - "epoch": 0.97, - "learning_rate": 0.00015424623255016118, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022511295268559103, + "loss": 0.0255, "step": 192600 }, { - "epoch": 0.97, - "learning_rate": 0.00015423866485714718, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022510906446921957, + "loss": 0.0172, "step": 192610 }, { - "epoch": 0.97, - "learning_rate": 0.00015423109716413317, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022510517625284808, + "loss": 0.0148, "step": 192620 }, { - "epoch": 0.97, - "learning_rate": 0.00015422352947111915, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022510128803647665, + "loss": 0.017, "step": 192630 }, { - "epoch": 0.97, - "learning_rate": 0.00015421596177810516, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022509739982010517, + "loss": 0.0227, "step": 192640 }, { - "epoch": 0.97, - "learning_rate": 0.00015420839408509114, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.0002250935116037337, + "loss": 0.0161, "step": 192650 }, { - "epoch": 0.97, - "learning_rate": 0.00015420082639207712, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022508962338736222, + "loss": 0.0181, "step": 192660 }, { - "epoch": 0.97, - "learning_rate": 0.00015419325869906313, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002250857351709908, + "loss": 0.0174, "step": 192670 }, { - "epoch": 0.97, - "learning_rate": 0.0001541856910060491, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.0002250818469546193, + "loss": 0.0202, "step": 192680 }, { - "epoch": 0.97, - "learning_rate": 0.0001541781233130351, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.00022507795873824785, + "loss": 0.0178, "step": 192690 }, { - "epoch": 0.97, - "learning_rate": 0.0001541705556200211, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022507407052187636, + "loss": 0.0183, "step": 192700 }, { - "epoch": 0.97, - "learning_rate": 0.00015416298792700708, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022507018230550493, + "loss": 0.0237, "step": 192710 }, { - "epoch": 0.97, - "learning_rate": 0.00015415542023399306, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022506629408913345, + "loss": 0.0165, "step": 192720 }, { - "epoch": 0.97, - "learning_rate": 0.00015414785254097904, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.000225062405872762, + "loss": 0.0258, "step": 192730 }, { - "epoch": 0.97, - "learning_rate": 0.00015414028484796505, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002250585176563905, + "loss": 0.0201, "step": 192740 }, { - "epoch": 0.97, - "learning_rate": 0.00015413271715495103, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.00022505462944001907, + "loss": 0.0226, "step": 192750 }, { - "epoch": 0.97, - "learning_rate": 0.00015412514946193701, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022505074122364761, + "loss": 0.0196, "step": 192760 }, { - "epoch": 0.97, - "learning_rate": 0.00015411758176892302, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022504685300727613, + "loss": 0.0212, "step": 192770 }, { - "epoch": 0.97, - "learning_rate": 0.000154110014075909, - "loss": 0.0153, + "epoch": 0.5, + "learning_rate": 0.00022504296479090467, + "loss": 0.0192, "step": 192780 }, { - "epoch": 0.97, - "learning_rate": 0.00015410244638289499, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022503907657453318, + "loss": 0.0163, "step": 192790 }, { - "epoch": 0.97, - "learning_rate": 0.000154094878689881, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022503518835816175, + "loss": 0.0191, "step": 192800 }, { - "epoch": 0.97, - "learning_rate": 0.00015408731099686698, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022503130014179027, + "loss": 0.0183, "step": 192810 }, { - "epoch": 0.97, - "learning_rate": 0.00015407974330385296, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.0002250274119254188, + "loss": 0.0183, "step": 192820 }, { - "epoch": 0.97, - "learning_rate": 0.00015407217561083897, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022502352370904732, + "loss": 0.0185, "step": 192830 }, { - "epoch": 0.97, - "learning_rate": 0.00015406460791782495, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.0002250196354926759, + "loss": 0.0236, "step": 192840 }, { - "epoch": 0.97, - "learning_rate": 0.00015405704022481093, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.0002250157472763044, + "loss": 0.0191, "step": 192850 }, { - "epoch": 0.97, - "learning_rate": 0.00015404947253179694, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022501185905993295, + "loss": 0.016, "step": 192860 }, { - "epoch": 0.97, - "learning_rate": 0.00015404190483878292, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022500797084356146, + "loss": 0.0146, "step": 192870 }, { - "epoch": 0.97, - "learning_rate": 0.0001540343371457689, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022500408262719003, + "loss": 0.0177, "step": 192880 }, { - "epoch": 0.97, - "learning_rate": 0.00015402676945275488, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022500019441081855, + "loss": 0.0156, "step": 192890 }, { - "epoch": 0.97, - "learning_rate": 0.0001540192017597409, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.0002249963061944471, + "loss": 0.0171, "step": 192900 }, { - "epoch": 0.97, - "learning_rate": 0.00015401163406672687, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002249924179780756, + "loss": 0.0178, "step": 192910 }, { - "epoch": 0.97, - "learning_rate": 0.00015400406637371285, - "loss": 0.0079, + "epoch": 0.5, + "learning_rate": 0.00022498852976170417, + "loss": 0.0154, "step": 192920 }, { - "epoch": 0.97, - "learning_rate": 0.00015399649868069886, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.0002249846415453327, + "loss": 0.0204, "step": 192930 }, { - "epoch": 0.97, - "learning_rate": 0.00015398893098768482, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022498075332896123, + "loss": 0.0214, "step": 192940 }, { - "epoch": 0.97, - "learning_rate": 0.0001539813632946708, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022497686511258974, + "loss": 0.023, "step": 192950 }, { - "epoch": 0.97, - "learning_rate": 0.00015397379560165678, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.0002249729768962183, + "loss": 0.0152, "step": 192960 }, { - "epoch": 0.97, - "learning_rate": 0.0001539662279086428, - "loss": 0.008, + "epoch": 0.5, + "learning_rate": 0.00022496908867984685, + "loss": 0.0155, "step": 192970 }, { - "epoch": 0.97, - "learning_rate": 0.00015395866021562877, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022496520046347537, + "loss": 0.0185, "step": 192980 }, { - "epoch": 0.97, - "learning_rate": 0.00015395109252261475, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.0002249613122471039, + "loss": 0.022, "step": 192990 }, { - "epoch": 0.97, - "learning_rate": 0.00015394352482960076, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022495742403073245, + "loss": 0.0187, "step": 193000 }, { - "epoch": 0.97, - "eval_cer": 0.9144644335264098, - "eval_loss": 0.008065390400588512, - "eval_runtime": 116.6291, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.5, + "eval_cer": 0.8818286536472439, + "eval_loss": 0.012139668688178062, + "eval_runtime": 108.0099, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 193000 }, { - "epoch": 0.97, - "learning_rate": 0.00015393595713658674, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.000224953535814361, + "loss": 0.02, "step": 193010 }, { - "epoch": 0.97, - "learning_rate": 0.00015392838944357272, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.0002249496475979895, + "loss": 0.0183, "step": 193020 }, { - "epoch": 0.97, - "learning_rate": 0.00015392082175055873, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022494575938161805, + "loss": 0.0223, "step": 193030 }, { - "epoch": 0.97, - "learning_rate": 0.0001539132540575447, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.00022494187116524656, + "loss": 0.0189, "step": 193040 }, { - "epoch": 0.97, - "learning_rate": 0.0001539056863645307, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022493798294887513, + "loss": 0.018, "step": 193050 }, { - "epoch": 0.97, - "learning_rate": 0.0001538981186715167, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022493409473250365, + "loss": 0.0212, "step": 193060 }, { - "epoch": 0.97, - "learning_rate": 0.00015389055097850268, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.0002249302065161322, + "loss": 0.0206, "step": 193070 }, { - "epoch": 0.97, - "learning_rate": 0.00015388298328548866, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.0002249263182997607, + "loss": 0.0182, "step": 193080 }, { - "epoch": 0.97, - "learning_rate": 0.00015387541559247467, - "loss": 0.0118, + "epoch": 0.5, + "learning_rate": 0.00022492243008338927, + "loss": 0.018, "step": 193090 }, { - "epoch": 0.97, - "learning_rate": 0.00015386784789946065, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022491854186701779, + "loss": 0.0207, "step": 193100 }, { - "epoch": 0.97, - "learning_rate": 0.00015386028020644664, - "loss": 0.0134, + "epoch": 0.5, + "learning_rate": 0.00022491465365064633, + "loss": 0.0244, "step": 193110 }, { - "epoch": 0.97, - "learning_rate": 0.00015385271251343262, - "loss": 0.0149, - "step": 193120 + "epoch": 0.5, + "learning_rate": 0.00022491076543427484, + "loss": 0.018, + "step": 193120 }, { - "epoch": 0.97, - "learning_rate": 0.00015384514482041863, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.0002249068772179034, + "loss": 0.0194, "step": 193130 }, { - "epoch": 0.97, - "learning_rate": 0.0001538375771274046, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022490298900153195, + "loss": 0.0173, "step": 193140 }, { - "epoch": 0.97, - "learning_rate": 0.0001538300094343906, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022489910078516047, + "loss": 0.0192, "step": 193150 }, { - "epoch": 0.97, - "learning_rate": 0.0001538224417413766, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.000224895212568789, + "loss": 0.015, "step": 193160 }, { - "epoch": 0.97, - "learning_rate": 0.00015381487404836258, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022489132435241755, + "loss": 0.0149, "step": 193170 }, { - "epoch": 0.97, - "learning_rate": 0.00015380730635534856, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002248874361360461, + "loss": 0.0198, "step": 193180 }, { - "epoch": 0.97, - "learning_rate": 0.00015379973866233457, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.0002248835479196746, + "loss": 0.0187, "step": 193190 }, { - "epoch": 0.97, - "learning_rate": 0.00015379217096932055, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022487965970330315, + "loss": 0.0157, "step": 193200 }, { - "epoch": 0.97, - "learning_rate": 0.00015378460327630653, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.0002248757714869317, + "loss": 0.0207, "step": 193210 }, { - "epoch": 0.97, - "learning_rate": 0.00015377703558329254, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022487188327056023, + "loss": 0.0228, "step": 193220 }, { - "epoch": 0.97, - "learning_rate": 0.00015376946789027852, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022486799505418875, + "loss": 0.0184, "step": 193230 }, { - "epoch": 0.97, - "learning_rate": 0.0001537619001972645, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.0002248641068378173, + "loss": 0.0178, "step": 193240 }, { - "epoch": 0.97, - "learning_rate": 0.0001537543325042505, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022486021862144586, + "loss": 0.0164, "step": 193250 }, { - "epoch": 0.98, - "learning_rate": 0.0001537467648112365, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022485633040507437, + "loss": 0.0156, "step": 193260 }, { - "epoch": 0.98, - "learning_rate": 0.00015373919711822247, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022485244218870288, + "loss": 0.0157, "step": 193270 }, { - "epoch": 0.98, - "learning_rate": 0.00015373162942520846, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022484855397233143, + "loss": 0.0184, "step": 193280 }, { - "epoch": 0.98, - "learning_rate": 0.00015372406173219446, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022484466575595994, + "loss": 0.0198, "step": 193290 }, { - "epoch": 0.98, - "learning_rate": 0.00015371649403918045, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.0002248407775395885, + "loss": 0.0162, "step": 193300 }, { - "epoch": 0.98, - "learning_rate": 0.00015370892634616643, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.00022483688932321705, + "loss": 0.0208, "step": 193310 }, { - "epoch": 0.98, - "learning_rate": 0.00015370135865315244, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022483300110684557, + "loss": 0.0167, "step": 193320 }, { - "epoch": 0.98, - "learning_rate": 0.00015369379096013842, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002248291128904741, + "loss": 0.0132, "step": 193330 }, { - "epoch": 0.98, - "learning_rate": 0.0001536862232671244, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022482522467410265, + "loss": 0.0154, "step": 193340 }, { - "epoch": 0.98, - "learning_rate": 0.0001536786555741104, - "loss": 0.0152, + "epoch": 0.5, + "learning_rate": 0.0002248213364577312, + "loss": 0.018, "step": 193350 }, { - "epoch": 0.98, - "learning_rate": 0.0001536710878810964, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002248174482413597, + "loss": 0.0173, "step": 193360 }, { - "epoch": 0.98, - "learning_rate": 0.00015366352018808237, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022481356002498825, + "loss": 0.0193, "step": 193370 }, { - "epoch": 0.98, - "learning_rate": 0.00015365595249506838, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002248096718086168, + "loss": 0.0152, "step": 193380 }, { - "epoch": 0.98, - "learning_rate": 0.00015364838480205436, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.00022480578359224533, + "loss": 0.0167, "step": 193390 }, { - "epoch": 0.98, - "learning_rate": 0.00015364081710904034, - "loss": 0.0136, + "epoch": 0.5, + "learning_rate": 0.00022480189537587384, + "loss": 0.0213, "step": 193400 }, { - "epoch": 0.98, - "learning_rate": 0.00015363324941602635, - "loss": 0.0138, + "epoch": 0.5, + "learning_rate": 0.00022479800715950239, + "loss": 0.0185, "step": 193410 }, { - "epoch": 0.98, - "learning_rate": 0.00015362568172301233, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022479411894313093, + "loss": 0.0153, "step": 193420 }, { - "epoch": 0.98, - "learning_rate": 0.0001536181140299983, - "loss": 0.013, + "epoch": 0.5, + "learning_rate": 0.00022479023072675947, + "loss": 0.0171, "step": 193430 }, { - "epoch": 0.98, - "learning_rate": 0.00015361054633698432, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022478634251038798, + "loss": 0.0194, "step": 193440 }, { - "epoch": 0.98, - "learning_rate": 0.0001536029786439703, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022478245429401653, + "loss": 0.0143, "step": 193450 }, { - "epoch": 0.98, - "learning_rate": 0.00015359541095095628, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.0002247785660776451, + "loss": 0.0223, "step": 193460 }, { - "epoch": 0.98, - "learning_rate": 0.00015358784325794227, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.0002247746778612736, + "loss": 0.0202, "step": 193470 }, { - "epoch": 0.98, - "learning_rate": 0.00015358027556492827, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022477078964490215, + "loss": 0.0149, "step": 193480 }, { - "epoch": 0.98, - "learning_rate": 0.00015357270787191426, - "loss": 0.008, + "epoch": 0.5, + "learning_rate": 0.00022476690142853067, + "loss": 0.0143, "step": 193490 }, { - "epoch": 0.98, - "learning_rate": 0.00015356514017890024, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.00022476301321215923, + "loss": 0.0161, "step": 193500 }, { - "epoch": 0.98, - "learning_rate": 0.00015355757248588625, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022475912499578775, + "loss": 0.016, "step": 193510 }, { - "epoch": 0.98, - "learning_rate": 0.00015355000479287223, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.0002247552367794163, + "loss": 0.0197, "step": 193520 }, { - "epoch": 0.98, - "learning_rate": 0.0001535424370998582, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.0002247513485630448, + "loss": 0.017, "step": 193530 }, { - "epoch": 0.98, - "learning_rate": 0.00015353486940684422, - "loss": 0.015, + "epoch": 0.5, + "learning_rate": 0.00022474746034667335, + "loss": 0.0184, "step": 193540 }, { - "epoch": 0.98, - "learning_rate": 0.0001535273017138302, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.0002247435721303019, + "loss": 0.0188, "step": 193550 }, { - "epoch": 0.98, - "learning_rate": 0.00015351973402081618, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022473968391393043, + "loss": 0.0229, "step": 193560 }, { - "epoch": 0.98, - "learning_rate": 0.0001535121663278022, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022473579569755894, + "loss": 0.0186, "step": 193570 }, { - "epoch": 0.98, - "learning_rate": 0.00015350459863478817, - "loss": 0.0124, + "epoch": 0.5, + "learning_rate": 0.00022473190748118749, + "loss": 0.0146, "step": 193580 }, { - "epoch": 0.98, - "learning_rate": 0.00015349703094177415, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022472801926481603, + "loss": 0.0184, "step": 193590 }, { - "epoch": 0.98, - "learning_rate": 0.00015348946324876016, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022472413104844457, + "loss": 0.017, "step": 193600 }, { - "epoch": 0.98, - "learning_rate": 0.00015348189555574614, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022472024283207308, + "loss": 0.0188, "step": 193610 }, { - "epoch": 0.98, - "learning_rate": 0.00015347432786273212, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.00022471635461570163, + "loss": 0.0202, "step": 193620 }, { - "epoch": 0.98, - "learning_rate": 0.0001534667601697181, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.0002247124663993302, + "loss": 0.0214, "step": 193630 }, { - "epoch": 0.98, - "learning_rate": 0.0001534591924767041, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.0002247085781829587, + "loss": 0.0228, "step": 193640 }, { - "epoch": 0.98, - "learning_rate": 0.0001534516247836901, - "loss": 0.0126, + "epoch": 0.5, + "learning_rate": 0.00022470468996658725, + "loss": 0.0209, "step": 193650 }, { - "epoch": 0.98, - "learning_rate": 0.00015344405709067608, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022470080175021576, + "loss": 0.0183, "step": 193660 }, { - "epoch": 0.98, - "learning_rate": 0.00015343648939766208, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.00022469691353384433, + "loss": 0.0173, "step": 193670 }, { - "epoch": 0.98, - "learning_rate": 0.00015342892170464807, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022469302531747285, + "loss": 0.0178, "step": 193680 }, { - "epoch": 0.98, - "learning_rate": 0.00015342135401163405, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.0002246891371011014, + "loss": 0.0204, "step": 193690 }, { - "epoch": 0.98, - "learning_rate": 0.00015341378631862006, - "loss": 0.0143, + "epoch": 0.5, + "learning_rate": 0.0002246852488847299, + "loss": 0.0166, "step": 193700 }, { - "epoch": 0.98, - "learning_rate": 0.00015340621862560604, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022468136066835847, + "loss": 0.0152, "step": 193710 }, { - "epoch": 0.98, - "learning_rate": 0.00015339865093259202, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.000224677472451987, + "loss": 0.0137, "step": 193720 }, { - "epoch": 0.98, - "learning_rate": 0.00015339108323957803, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022467358423561553, + "loss": 0.0165, "step": 193730 }, { - "epoch": 0.98, - "learning_rate": 0.000153383515546564, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.00022466969601924404, + "loss": 0.0182, "step": 193740 }, { - "epoch": 0.98, - "learning_rate": 0.00015337594785355, - "loss": 0.0155, + "epoch": 0.5, + "learning_rate": 0.0002246658078028726, + "loss": 0.0167, "step": 193750 }, { - "epoch": 0.98, - "learning_rate": 0.000153368380160536, - "loss": 0.0095, + "epoch": 0.5, + "learning_rate": 0.00022466191958650113, + "loss": 0.0131, "step": 193760 }, { - "epoch": 0.98, - "learning_rate": 0.00015336081246752198, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022465803137012967, + "loss": 0.0181, "step": 193770 }, { - "epoch": 0.98, - "learning_rate": 0.00015335324477450796, - "loss": 0.0157, + "epoch": 0.5, + "learning_rate": 0.00022465414315375818, + "loss": 0.0186, "step": 193780 }, { - "epoch": 0.98, - "learning_rate": 0.00015334567708149394, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022465025493738672, + "loss": 0.0199, "step": 193790 }, { - "epoch": 0.98, - "learning_rate": 0.00015333810938847995, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.0002246463667210153, + "loss": 0.0205, "step": 193800 }, { - "epoch": 0.98, - "learning_rate": 0.00015333054169546593, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.0002246424785046438, + "loss": 0.0178, "step": 193810 }, { - "epoch": 0.98, - "learning_rate": 0.00015332297400245191, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022463859028827232, + "loss": 0.0186, "step": 193820 }, { - "epoch": 0.98, - "learning_rate": 0.00015331540630943792, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.00022463470207190086, + "loss": 0.0176, "step": 193830 }, { - "epoch": 0.98, - "learning_rate": 0.0001533078386164239, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022463081385552943, + "loss": 0.018, "step": 193840 }, { - "epoch": 0.98, - "learning_rate": 0.00015330027092340989, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022462692563915795, + "loss": 0.0182, "step": 193850 }, { - "epoch": 0.98, - "learning_rate": 0.0001532927032303959, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.0002246230374227865, + "loss": 0.0174, "step": 193860 }, { - "epoch": 0.98, - "learning_rate": 0.00015328513553738188, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.000224619149206415, + "loss": 0.0206, "step": 193870 }, { - "epoch": 0.98, - "learning_rate": 0.00015327756784436786, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022461526099004357, + "loss": 0.0193, "step": 193880 }, { - "epoch": 0.98, - "learning_rate": 0.00015327000015135387, - "loss": 0.013, + "epoch": 0.5, + "learning_rate": 0.0002246113727736721, + "loss": 0.0166, "step": 193890 }, { - "epoch": 0.98, - "learning_rate": 0.00015326243245833985, - "loss": 0.0127, + "epoch": 0.5, + "learning_rate": 0.00022460748455730063, + "loss": 0.0177, "step": 193900 }, { - "epoch": 0.98, - "learning_rate": 0.00015325486476532583, - "loss": 0.0122, + "epoch": 0.5, + "learning_rate": 0.00022460359634092914, + "loss": 0.0184, "step": 193910 }, { - "epoch": 0.98, - "learning_rate": 0.00015324729707231184, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.0002245997081245577, + "loss": 0.0194, "step": 193920 }, { - "epoch": 0.98, - "learning_rate": 0.00015323972937929782, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.00022459581990818623, + "loss": 0.0191, "step": 193930 }, { - "epoch": 0.98, - "learning_rate": 0.0001532321616862838, - "loss": 0.0139, + "epoch": 0.5, + "learning_rate": 0.00022459193169181477, + "loss": 0.0232, "step": 193940 }, { - "epoch": 0.98, - "learning_rate": 0.0001532245939932698, - "loss": 0.0138, + "epoch": 0.5, + "learning_rate": 0.00022458804347544328, + "loss": 0.016, "step": 193950 }, { - "epoch": 0.98, - "learning_rate": 0.0001532170263002558, - "loss": 0.0119, + "epoch": 0.5, + "learning_rate": 0.00022458415525907185, + "loss": 0.0116, "step": 193960 }, { - "epoch": 0.98, - "learning_rate": 0.00015320945860724177, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.00022458026704270037, + "loss": 0.0209, "step": 193970 }, { - "epoch": 0.98, - "learning_rate": 0.00015320189091422775, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.0002245763788263289, + "loss": 0.018, "step": 193980 }, { - "epoch": 0.98, - "learning_rate": 0.00015319432322121376, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.00022457249060995742, + "loss": 0.0169, "step": 193990 }, { - "epoch": 0.98, - "learning_rate": 0.00015318675552819974, - "loss": 0.0134, + "epoch": 0.5, + "learning_rate": 0.000224568602393586, + "loss": 0.0127, "step": 194000 }, { - "epoch": 0.98, - "eval_cer": 0.9144683151109114, - "eval_loss": 0.007887054234743118, - "eval_runtime": 116.7404, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.5, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.012113718315958977, + "eval_runtime": 108.1959, + "eval_samples_per_second": 18.485, + "eval_steps_per_second": 4.621, "step": 194000 }, { - "epoch": 0.98, - "learning_rate": 0.00015317918783518572, - "loss": 0.0082, + "epoch": 0.5, + "learning_rate": 0.00022456471417721453, + "loss": 0.0165, "step": 194010 }, { - "epoch": 0.98, - "learning_rate": 0.00015317162014217173, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022456082596084305, + "loss": 0.0167, "step": 194020 }, { - "epoch": 0.98, - "learning_rate": 0.00015316405244915771, - "loss": 0.0106, + "epoch": 0.5, + "learning_rate": 0.0002245569377444716, + "loss": 0.0252, "step": 194030 }, { - "epoch": 0.98, - "learning_rate": 0.0001531564847561437, - "loss": 0.0085, + "epoch": 0.5, + "learning_rate": 0.0002245530495281001, + "loss": 0.0184, "step": 194040 }, { - "epoch": 0.98, - "learning_rate": 0.0001531489170631297, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022454916131172867, + "loss": 0.022, "step": 194050 }, { - "epoch": 0.98, - "learning_rate": 0.00015314134937011569, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022454527309535719, + "loss": 0.0152, "step": 194060 }, { - "epoch": 0.98, - "learning_rate": 0.00015313378167710167, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.00022454138487898573, + "loss": 0.0152, "step": 194070 }, { - "epoch": 0.98, - "learning_rate": 0.00015312621398408768, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022453749666261424, + "loss": 0.0147, "step": 194080 }, { - "epoch": 0.98, - "learning_rate": 0.00015311864629107366, - "loss": 0.0121, + "epoch": 0.5, + "learning_rate": 0.0002245336084462428, + "loss": 0.0146, "step": 194090 }, { - "epoch": 0.98, - "learning_rate": 0.00015311107859805964, - "loss": 0.0137, + "epoch": 0.5, + "learning_rate": 0.00022452972022987133, + "loss": 0.0203, "step": 194100 }, { - "epoch": 0.98, - "learning_rate": 0.00015310351090504565, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022452583201349987, + "loss": 0.0177, "step": 194110 }, { - "epoch": 0.98, - "learning_rate": 0.00015309594321203163, - "loss": 0.0129, + "epoch": 0.5, + "learning_rate": 0.00022452194379712838, + "loss": 0.0196, "step": 194120 }, { - "epoch": 0.98, - "learning_rate": 0.0001530883755190176, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.00022451805558075695, + "loss": 0.0168, "step": 194130 }, { - "epoch": 0.98, - "learning_rate": 0.0001530808078260036, - "loss": 0.0109, + "epoch": 0.5, + "learning_rate": 0.00022451416736438547, + "loss": 0.0202, "step": 194140 }, { - "epoch": 0.98, - "learning_rate": 0.0001530732401329896, - "loss": 0.0101, + "epoch": 0.5, + "learning_rate": 0.000224510279148014, + "loss": 0.015, "step": 194150 }, { - "epoch": 0.98, - "learning_rate": 0.00015306567243997558, - "loss": 0.0143, + "epoch": 0.5, + "learning_rate": 0.00022450639093164252, + "loss": 0.0176, "step": 194160 }, { - "epoch": 0.98, - "learning_rate": 0.00015305810474696156, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.0002245025027152711, + "loss": 0.0177, "step": 194170 }, { - "epoch": 0.98, - "learning_rate": 0.00015305053705394757, - "loss": 0.0096, + "epoch": 0.5, + "learning_rate": 0.00022449861449889963, + "loss": 0.0179, "step": 194180 }, { - "epoch": 0.98, - "learning_rate": 0.00015304296936093353, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022449472628252815, + "loss": 0.0176, "step": 194190 }, { - "epoch": 0.98, - "learning_rate": 0.0001530354016679195, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.0002244908380661567, + "loss": 0.0152, "step": 194200 }, { - "epoch": 0.98, - "learning_rate": 0.0001530278339749055, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022448694984978523, + "loss": 0.0166, "step": 194210 }, { - "epoch": 0.98, - "learning_rate": 0.0001530202662818915, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.00022448306163341377, + "loss": 0.0144, "step": 194220 }, { - "epoch": 0.98, - "learning_rate": 0.00015301269858887748, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022447917341704229, + "loss": 0.0247, "step": 194230 }, { - "epoch": 0.98, - "learning_rate": 0.00015300513089586346, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022447528520067083, + "loss": 0.0166, "step": 194240 }, { - "epoch": 0.98, - "learning_rate": 0.00015299756320284947, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022447139698429937, + "loss": 0.0166, "step": 194250 }, { - "epoch": 0.98, - "learning_rate": 0.00015298999550983545, - "loss": 0.0093, + "epoch": 0.5, + "learning_rate": 0.0002244675087679279, + "loss": 0.0285, "step": 194260 }, { - "epoch": 0.98, - "learning_rate": 0.00015298242781682143, - "loss": 0.0135, + "epoch": 0.5, + "learning_rate": 0.00022446362055155643, + "loss": 0.0176, "step": 194270 }, { - "epoch": 0.98, - "learning_rate": 0.00015297486012380744, - "loss": 0.0088, + "epoch": 0.5, + "learning_rate": 0.00022445973233518497, + "loss": 0.019, "step": 194280 }, { - "epoch": 0.98, - "learning_rate": 0.00015296729243079342, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022445584411881348, + "loss": 0.019, "step": 194290 }, { - "epoch": 0.98, - "learning_rate": 0.0001529597247377794, - "loss": 0.0091, + "epoch": 0.5, + "learning_rate": 0.00022445195590244205, + "loss": 0.0163, "step": 194300 }, { - "epoch": 0.98, - "learning_rate": 0.0001529521570447654, - "loss": 0.0092, + "epoch": 0.5, + "learning_rate": 0.00022444806768607056, + "loss": 0.018, "step": 194310 }, { - "epoch": 0.98, - "learning_rate": 0.0001529445893517514, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.0002244441794696991, + "loss": 0.0183, "step": 194320 }, { - "epoch": 0.98, - "learning_rate": 0.00015293702165873737, - "loss": 0.0114, + "epoch": 0.5, + "learning_rate": 0.00022444029125332762, + "loss": 0.0163, "step": 194330 }, { - "epoch": 0.98, - "learning_rate": 0.00015292945396572338, - "loss": 0.012, + "epoch": 0.5, + "learning_rate": 0.0002244364030369562, + "loss": 0.0142, "step": 194340 }, { - "epoch": 0.98, - "learning_rate": 0.00015292188627270936, - "loss": 0.0145, + "epoch": 0.5, + "learning_rate": 0.00022443251482058473, + "loss": 0.0166, "step": 194350 }, { - "epoch": 0.98, - "learning_rate": 0.00015291431857969535, - "loss": 0.01, + "epoch": 0.5, + "learning_rate": 0.00022442862660421325, + "loss": 0.0221, "step": 194360 }, { - "epoch": 0.98, - "learning_rate": 0.00015290675088668133, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.0002244247383878418, + "loss": 0.0226, "step": 194370 }, { - "epoch": 0.98, - "learning_rate": 0.00015289918319366734, - "loss": 0.0097, + "epoch": 0.5, + "learning_rate": 0.00022442085017147033, + "loss": 0.0152, "step": 194380 }, { - "epoch": 0.98, - "learning_rate": 0.00015289161550065332, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022441696195509887, + "loss": 0.0188, "step": 194390 }, { - "epoch": 0.98, - "learning_rate": 0.0001528840478076393, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022441307373872739, + "loss": 0.0152, "step": 194400 }, { - "epoch": 0.98, - "learning_rate": 0.0001528764801146253, - "loss": 0.0139, + "epoch": 0.5, + "learning_rate": 0.00022440918552235593, + "loss": 0.0192, "step": 194410 }, { - "epoch": 0.98, - "learning_rate": 0.0001528689124216113, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022440529730598447, + "loss": 0.0174, "step": 194420 }, { - "epoch": 0.98, - "learning_rate": 0.00015286134472859727, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.000224401409089613, + "loss": 0.0165, "step": 194430 }, { - "epoch": 0.98, - "learning_rate": 0.00015285377703558328, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022439752087324152, + "loss": 0.0172, "step": 194440 }, { - "epoch": 0.98, - "learning_rate": 0.00015284620934256926, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022439363265687007, + "loss": 0.0173, "step": 194450 }, { - "epoch": 0.98, - "learning_rate": 0.00015283864164955524, - "loss": 0.0131, + "epoch": 0.5, + "learning_rate": 0.0002243897444404986, + "loss": 0.0182, "step": 194460 }, { - "epoch": 0.98, - "learning_rate": 0.00015283107395654125, - "loss": 0.0117, + "epoch": 0.5, + "learning_rate": 0.00022438585622412715, + "loss": 0.012, "step": 194470 }, { - "epoch": 0.98, - "learning_rate": 0.00015282350626352723, - "loss": 0.0105, + "epoch": 0.5, + "learning_rate": 0.00022438196800775566, + "loss": 0.0156, "step": 194480 }, { - "epoch": 0.98, - "learning_rate": 0.0001528159385705132, - "loss": 0.0112, + "epoch": 0.5, + "learning_rate": 0.0002243780797913842, + "loss": 0.0193, "step": 194490 }, { - "epoch": 0.98, - "learning_rate": 0.00015280837087749922, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022437419157501277, + "loss": 0.0189, "step": 194500 }, { - "epoch": 0.98, - "learning_rate": 0.0001528008031844852, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.0002243703033586413, + "loss": 0.0154, "step": 194510 }, { - "epoch": 0.98, - "learning_rate": 0.00015279323549147118, - "loss": 0.0178, + "epoch": 0.5, + "learning_rate": 0.00022436641514226983, + "loss": 0.0126, "step": 194520 }, { - "epoch": 0.98, - "learning_rate": 0.00015278566779845717, - "loss": 0.0098, + "epoch": 0.5, + "learning_rate": 0.00022436252692589835, + "loss": 0.0172, "step": 194530 }, { - "epoch": 0.98, - "learning_rate": 0.00015277810010544317, - "loss": 0.0131, + "epoch": 0.5, + "learning_rate": 0.00022435863870952686, + "loss": 0.0166, "step": 194540 }, { - "epoch": 0.98, - "learning_rate": 0.00015277053241242916, - "loss": 0.0108, + "epoch": 0.5, + "learning_rate": 0.00022435475049315543, + "loss": 0.0155, "step": 194550 }, { - "epoch": 0.98, - "learning_rate": 0.00015276296471941514, - "loss": 0.0086, + "epoch": 0.5, + "learning_rate": 0.00022435086227678397, + "loss": 0.0189, "step": 194560 }, { - "epoch": 0.98, - "learning_rate": 0.00015275539702640115, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022434697406041248, + "loss": 0.0171, "step": 194570 }, { - "epoch": 0.98, - "learning_rate": 0.00015274782933338713, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022434308584404103, + "loss": 0.0118, "step": 194580 }, { - "epoch": 0.98, - "learning_rate": 0.0001527402616403731, - "loss": 0.0123, + "epoch": 0.5, + "learning_rate": 0.00022433919762766957, + "loss": 0.0138, "step": 194590 }, { - "epoch": 0.98, - "learning_rate": 0.00015273269394735912, - "loss": 0.009, + "epoch": 0.5, + "learning_rate": 0.0002243353094112981, + "loss": 0.0161, "step": 194600 }, { - "epoch": 0.98, - "learning_rate": 0.0001527251262543451, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.00022433142119492662, + "loss": 0.0218, "step": 194610 }, { - "epoch": 0.98, - "learning_rate": 0.00015271755856133108, - "loss": 0.0107, + "epoch": 0.5, + "learning_rate": 0.00022432753297855517, + "loss": 0.0197, "step": 194620 }, { - "epoch": 0.98, - "learning_rate": 0.0001527099908683171, - "loss": 0.0152, + "epoch": 0.5, + "learning_rate": 0.0002243236447621837, + "loss": 0.0161, "step": 194630 }, { - "epoch": 0.98, - "learning_rate": 0.00015270242317530307, - "loss": 0.0113, + "epoch": 0.5, + "learning_rate": 0.00022431975654581225, + "loss": 0.017, "step": 194640 }, { - "epoch": 0.98, - "learning_rate": 0.00015269485548228905, - "loss": 0.0099, + "epoch": 0.5, + "learning_rate": 0.00022431586832944076, + "loss": 0.0169, "step": 194650 }, { - "epoch": 0.98, - "learning_rate": 0.00015268728778927506, - "loss": 0.014, + "epoch": 0.5, + "learning_rate": 0.0002243119801130693, + "loss": 0.0195, "step": 194660 }, { - "epoch": 0.98, - "learning_rate": 0.00015267972009626104, - "loss": 0.0133, + "epoch": 0.5, + "learning_rate": 0.00022430809189669787, + "loss": 0.0206, "step": 194670 }, { - "epoch": 0.98, - "learning_rate": 0.00015267215240324702, - "loss": 0.0085, + "epoch": 0.5, + "learning_rate": 0.0002243042036803264, + "loss": 0.0161, "step": 194680 }, { - "epoch": 0.98, - "learning_rate": 0.000152664584710233, - "loss": 0.0111, + "epoch": 0.5, + "learning_rate": 0.0002243003154639549, + "loss": 0.0151, "step": 194690 }, { - "epoch": 0.98, - "learning_rate": 0.000152657017017219, - "loss": 0.0128, + "epoch": 0.5, + "learning_rate": 0.00022429642724758344, + "loss": 0.0157, "step": 194700 }, { - "epoch": 0.98, - "learning_rate": 0.000152649449324205, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.000224292539031212, + "loss": 0.0176, "step": 194710 }, { - "epoch": 0.98, - "learning_rate": 0.00015264188163119098, - "loss": 0.0094, + "epoch": 0.5, + "learning_rate": 0.00022428865081484053, + "loss": 0.0151, "step": 194720 }, { - "epoch": 0.98, - "learning_rate": 0.00015263431393817698, - "loss": 0.0116, + "epoch": 0.5, + "learning_rate": 0.00022428476259846907, + "loss": 0.0166, "step": 194730 }, { - "epoch": 0.98, - "learning_rate": 0.00015262674624516297, - "loss": 0.0089, + "epoch": 0.5, + "learning_rate": 0.00022428087438209758, + "loss": 0.02, "step": 194740 }, { - "epoch": 0.98, - "learning_rate": 0.00015261917855214895, - "loss": 0.011, + "epoch": 0.5, + "learning_rate": 0.00022427698616572615, + "loss": 0.0177, "step": 194750 }, { - "epoch": 0.98, - "learning_rate": 0.00015261161085913496, - "loss": 0.0102, + "epoch": 0.5, + "learning_rate": 0.00022427309794935467, + "loss": 0.0201, "step": 194760 }, { - "epoch": 0.98, - "learning_rate": 0.00015260404316612094, - "loss": 0.0115, + "epoch": 0.5, + "learning_rate": 0.0002242692097329832, + "loss": 0.0189, "step": 194770 }, { - "epoch": 0.98, - "learning_rate": 0.00015259647547310692, - "loss": 0.0125, + "epoch": 0.5, + "learning_rate": 0.00022426532151661172, + "loss": 0.0226, "step": 194780 }, { - "epoch": 0.98, - "learning_rate": 0.00015258890778009293, - "loss": 0.0104, + "epoch": 0.5, + "learning_rate": 0.00022426143330024026, + "loss": 0.0243, "step": 194790 }, { - "epoch": 0.98, - "learning_rate": 0.0001525813400870789, - "loss": 0.0103, + "epoch": 0.5, + "learning_rate": 0.0002242575450838688, + "loss": 0.0151, "step": 194800 }, { - "epoch": 0.98, - "learning_rate": 0.0001525737723940649, - "loss": 0.0087, + "epoch": 0.5, + "learning_rate": 0.00022425365686749735, + "loss": 0.0165, "step": 194810 }, { - "epoch": 0.98, - "learning_rate": 0.0001525662047010509, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022424976865112586, + "loss": 0.0152, "step": 194820 }, { - "epoch": 0.98, - "learning_rate": 0.00015255863700803688, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002242458804347544, + "loss": 0.0162, "step": 194830 }, { - "epoch": 0.98, - "learning_rate": 0.00015255106931502286, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.00022424199221838297, + "loss": 0.0168, "step": 194840 }, { - "epoch": 0.98, - "learning_rate": 0.00015254350162200887, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.0002242381040020115, + "loss": 0.0172, "step": 194850 }, { - "epoch": 0.98, - "learning_rate": 0.00015253593392899485, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022423421578564, + "loss": 0.0129, "step": 194860 }, { - "epoch": 0.98, - "learning_rate": 0.00015252836623598083, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022423032756926854, + "loss": 0.0209, "step": 194870 }, { - "epoch": 0.98, - "learning_rate": 0.00015252079854296681, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.0002242264393528971, + "loss": 0.019, "step": 194880 }, { - "epoch": 0.98, - "learning_rate": 0.00015251323084995282, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022422255113652563, + "loss": 0.0177, "step": 194890 }, { - "epoch": 0.98, - "learning_rate": 0.0001525056631569388, - "loss": 0.014, + "epoch": 0.51, + "learning_rate": 0.00022421866292015417, + "loss": 0.0168, "step": 194900 }, { - "epoch": 0.98, - "learning_rate": 0.00015249809546392479, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022421477470378268, + "loss": 0.0197, "step": 194910 }, { - "epoch": 0.98, - "learning_rate": 0.0001524905277709108, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022421088648741125, + "loss": 0.0141, "step": 194920 }, { - "epoch": 0.98, - "learning_rate": 0.00015248296007789678, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022420699827103977, + "loss": 0.0183, "step": 194930 }, { - "epoch": 0.98, - "learning_rate": 0.00015247539238488276, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.0002242031100546683, + "loss": 0.0176, "step": 194940 }, { - "epoch": 0.98, - "learning_rate": 0.00015246782469186877, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022419922183829682, + "loss": 0.0166, "step": 194950 }, { - "epoch": 0.98, - "learning_rate": 0.00015246025699885475, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.0002241953336219254, + "loss": 0.0129, "step": 194960 }, { - "epoch": 0.98, - "learning_rate": 0.00015245268930584073, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.0002241914454055539, + "loss": 0.0168, "step": 194970 }, { - "epoch": 0.98, - "learning_rate": 0.00015244512161282674, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022418755718918245, + "loss": 0.014, "step": 194980 }, { - "epoch": 0.98, - "learning_rate": 0.00015243755391981272, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022418366897281096, + "loss": 0.016, "step": 194990 }, { - "epoch": 0.98, - "learning_rate": 0.0001524299862267987, - "loss": 0.0132, + "epoch": 0.51, + "learning_rate": 0.00022417978075643953, + "loss": 0.0182, "step": 195000 }, { - "epoch": 0.98, - "eval_cer": 0.9144712262992877, - "eval_loss": 0.007762947119772434, - "eval_runtime": 116.6633, - "eval_samples_per_second": 17.143, - "eval_steps_per_second": 4.286, + "epoch": 0.51, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.012146620079874992, + "eval_runtime": 108.1358, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 4.624, "step": 195000 }, { - "epoch": 0.98, - "learning_rate": 0.0001524224185337847, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022417589254006805, + "loss": 0.0212, "step": 195010 }, { - "epoch": 0.98, - "learning_rate": 0.0001524148508407707, - "loss": 0.0135, + "epoch": 0.51, + "learning_rate": 0.0002241720043236966, + "loss": 0.0181, "step": 195020 }, { - "epoch": 0.98, - "learning_rate": 0.00015240728314775667, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.0002241681161073251, + "loss": 0.0192, "step": 195030 }, { - "epoch": 0.98, - "learning_rate": 0.00015239971545474265, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022416422789095364, + "loss": 0.0177, "step": 195040 }, { - "epoch": 0.98, - "learning_rate": 0.00015239214776172866, - "loss": 0.0137, + "epoch": 0.51, + "learning_rate": 0.0002241603396745822, + "loss": 0.0194, "step": 195050 }, { - "epoch": 0.98, - "learning_rate": 0.00015238458006871464, - "loss": 0.0117, + "epoch": 0.51, + "learning_rate": 0.00022415645145821073, + "loss": 0.0192, "step": 195060 }, { - "epoch": 0.98, - "learning_rate": 0.00015237701237570062, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022415256324183927, + "loss": 0.018, "step": 195070 }, { - "epoch": 0.98, - "learning_rate": 0.00015236944468268663, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022414867502546778, + "loss": 0.0203, "step": 195080 }, { - "epoch": 0.98, - "learning_rate": 0.00015236187698967261, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022414478680909635, + "loss": 0.023, "step": 195090 }, { - "epoch": 0.98, - "learning_rate": 0.0001523543092966586, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022414089859272487, + "loss": 0.0159, "step": 195100 }, { - "epoch": 0.98, - "learning_rate": 0.0001523467416036446, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.0002241370103763534, + "loss": 0.0168, "step": 195110 }, { - "epoch": 0.98, - "learning_rate": 0.00015233917391063059, - "loss": 0.0126, + "epoch": 0.51, + "learning_rate": 0.00022413312215998192, + "loss": 0.0222, "step": 195120 }, { - "epoch": 0.98, - "learning_rate": 0.00015233160621761657, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.0002241292339436105, + "loss": 0.0131, "step": 195130 }, { - "epoch": 0.98, - "learning_rate": 0.00015232403852460258, - "loss": 0.0135, + "epoch": 0.51, + "learning_rate": 0.000224125345727239, + "loss": 0.0172, "step": 195140 }, { - "epoch": 0.98, - "learning_rate": 0.00015231647083158856, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022412145751086755, + "loss": 0.026, "step": 195150 }, { - "epoch": 0.98, - "learning_rate": 0.00015230890313857454, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022411756929449606, + "loss": 0.0171, "step": 195160 }, { - "epoch": 0.98, - "learning_rate": 0.00015230133544556055, - "loss": 0.0138, + "epoch": 0.51, + "learning_rate": 0.00022411368107812463, + "loss": 0.0179, "step": 195170 }, { - "epoch": 0.98, - "learning_rate": 0.00015229376775254653, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022410979286175314, + "loss": 0.0146, "step": 195180 }, { - "epoch": 0.98, - "learning_rate": 0.0001522862000595325, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002241059046453817, + "loss": 0.0203, "step": 195190 }, { - "epoch": 0.98, - "learning_rate": 0.0001522786323665185, - "loss": 0.0143, + "epoch": 0.51, + "learning_rate": 0.0002241020164290102, + "loss": 0.0163, "step": 195200 }, { - "epoch": 0.98, - "learning_rate": 0.0001522710646735045, - "loss": 0.0134, + "epoch": 0.51, + "learning_rate": 0.00022409812821263877, + "loss": 0.017, "step": 195210 }, { - "epoch": 0.98, - "learning_rate": 0.00015226349698049048, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.0002240942399962673, + "loss": 0.0172, "step": 195220 }, { - "epoch": 0.98, - "learning_rate": 0.00015225592928747646, - "loss": 0.012, + "epoch": 0.51, + "learning_rate": 0.00022409035177989583, + "loss": 0.0186, "step": 195230 }, { - "epoch": 0.99, - "learning_rate": 0.00015224836159446247, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022408646356352437, + "loss": 0.0195, "step": 195240 }, { - "epoch": 0.99, - "learning_rate": 0.00015224079390144845, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002240825753471529, + "loss": 0.0173, "step": 195250 }, { - "epoch": 0.99, - "learning_rate": 0.00015223322620843443, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022407868713078145, + "loss": 0.0207, "step": 195260 }, { - "epoch": 0.99, - "learning_rate": 0.00015222565851542044, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022407479891440997, + "loss": 0.0195, "step": 195270 }, { - "epoch": 0.99, - "learning_rate": 0.00015221809082240642, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.0002240709106980385, + "loss": 0.0152, "step": 195280 }, { - "epoch": 0.99, - "learning_rate": 0.0001522105231293924, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022406702248166702, + "loss": 0.0163, "step": 195290 }, { - "epoch": 0.99, - "learning_rate": 0.00015220295543637841, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.0002240631342652956, + "loss": 0.0212, "step": 195300 }, { - "epoch": 0.99, - "learning_rate": 0.0001521953877433644, - "loss": 0.0132, + "epoch": 0.51, + "learning_rate": 0.0002240592460489241, + "loss": 0.0208, "step": 195310 }, { - "epoch": 0.99, - "learning_rate": 0.00015218782005035038, - "loss": 0.0126, + "epoch": 0.51, + "learning_rate": 0.00022405535783255265, + "loss": 0.0158, "step": 195320 }, { - "epoch": 0.99, - "learning_rate": 0.00015218025235733639, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.00022405146961618116, + "loss": 0.017, "step": 195330 }, { - "epoch": 0.99, - "learning_rate": 0.00015217268466432237, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022404758139980973, + "loss": 0.0183, "step": 195340 }, { - "epoch": 0.99, - "learning_rate": 0.00015216511697130835, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022404369318343824, + "loss": 0.0131, "step": 195350 }, { - "epoch": 0.99, - "learning_rate": 0.00015215754927829436, - "loss": 0.0133, + "epoch": 0.51, + "learning_rate": 0.00022403980496706679, + "loss": 0.0163, "step": 195360 }, { - "epoch": 0.99, - "learning_rate": 0.00015214998158528034, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.0002240359167506953, + "loss": 0.02, "step": 195370 }, { - "epoch": 0.99, - "learning_rate": 0.00015214241389226632, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022403202853432387, + "loss": 0.0198, "step": 195380 }, { - "epoch": 0.99, - "learning_rate": 0.0001521348461992523, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.0002240281403179524, + "loss": 0.0188, "step": 195390 }, { - "epoch": 0.99, - "learning_rate": 0.0001521272785062383, - "loss": 0.0075, + "epoch": 0.51, + "learning_rate": 0.00022402425210158093, + "loss": 0.0184, "step": 195400 }, { - "epoch": 0.99, - "learning_rate": 0.0001521197108132243, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022402036388520944, + "loss": 0.0206, "step": 195410 }, { - "epoch": 0.99, - "learning_rate": 0.00015211214312021027, - "loss": 0.0077, + "epoch": 0.51, + "learning_rate": 0.000224016475668838, + "loss": 0.0189, "step": 195420 }, { - "epoch": 0.99, - "learning_rate": 0.00015210457542719628, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022401258745246655, + "loss": 0.0155, "step": 195430 }, { - "epoch": 0.99, - "learning_rate": 0.00015209700773418226, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022400869923609506, + "loss": 0.0215, "step": 195440 }, { - "epoch": 0.99, - "learning_rate": 0.00015208944004116822, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.0002240048110197236, + "loss": 0.0152, "step": 195450 }, { - "epoch": 0.99, - "learning_rate": 0.0001520818723481542, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022400092280335215, + "loss": 0.0169, "step": 195460 }, { - "epoch": 0.99, - "learning_rate": 0.0001520743046551402, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.0002239970345869807, + "loss": 0.0201, "step": 195470 }, { - "epoch": 0.99, - "learning_rate": 0.0001520667369621262, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.0002239931463706092, + "loss": 0.0208, "step": 195480 }, { - "epoch": 0.99, - "learning_rate": 0.00015205916926911217, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.00022398925815423775, + "loss": 0.0219, "step": 195490 }, { - "epoch": 0.99, - "learning_rate": 0.00015205160157609818, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.0002239853699378663, + "loss": 0.0349, "step": 195500 }, { - "epoch": 0.99, - "learning_rate": 0.00015204403388308416, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022398148172149483, + "loss": 0.0163, "step": 195510 }, { - "epoch": 0.99, - "learning_rate": 0.00015203646619007014, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022397759350512334, + "loss": 0.0181, "step": 195520 }, { - "epoch": 0.99, - "learning_rate": 0.00015202889849705615, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022397370528875189, + "loss": 0.0157, "step": 195530 }, { - "epoch": 0.99, - "learning_rate": 0.00015202133080404213, - "loss": 0.0157, + "epoch": 0.51, + "learning_rate": 0.0002239698170723804, + "loss": 0.0141, "step": 195540 }, { - "epoch": 0.99, - "learning_rate": 0.0001520137631110281, - "loss": 0.0133, + "epoch": 0.51, + "learning_rate": 0.00022396592885600897, + "loss": 0.0164, "step": 195550 }, { - "epoch": 0.99, - "learning_rate": 0.00015200619541801412, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022396204063963748, + "loss": 0.0193, "step": 195560 }, { - "epoch": 0.99, - "learning_rate": 0.0001519986277250001, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022395815242326602, + "loss": 0.0216, "step": 195570 }, { - "epoch": 0.99, - "learning_rate": 0.00015199106003198608, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022395426420689454, + "loss": 0.0164, "step": 195580 }, { - "epoch": 0.99, - "learning_rate": 0.00015198349233897207, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.0002239503759905231, + "loss": 0.0191, "step": 195590 }, { - "epoch": 0.99, - "learning_rate": 0.00015197592464595807, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.00022394648777415165, + "loss": 0.0168, "step": 195600 }, { - "epoch": 0.99, - "learning_rate": 0.00015196835695294406, - "loss": 0.0136, + "epoch": 0.51, + "learning_rate": 0.00022394259955778016, + "loss": 0.02, "step": 195610 }, { - "epoch": 0.99, - "learning_rate": 0.00015196078925993004, - "loss": 0.0123, + "epoch": 0.51, + "learning_rate": 0.0002239387113414087, + "loss": 0.0172, "step": 195620 }, { - "epoch": 0.99, - "learning_rate": 0.00015195322156691605, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022393482312503725, + "loss": 0.0174, "step": 195630 }, { - "epoch": 0.99, - "learning_rate": 0.00015194565387390203, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.0002239309349086658, + "loss": 0.0162, "step": 195640 }, { - "epoch": 0.99, - "learning_rate": 0.000151938086180888, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002239270466922943, + "loss": 0.0139, "step": 195650 }, { - "epoch": 0.99, - "learning_rate": 0.00015193051848787402, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.00022392315847592285, + "loss": 0.0176, "step": 195660 }, { - "epoch": 0.99, - "learning_rate": 0.00015192295079486, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002239192702595514, + "loss": 0.0154, "step": 195670 }, { - "epoch": 0.99, - "learning_rate": 0.00015191538310184598, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022391538204317993, + "loss": 0.0157, "step": 195680 }, { - "epoch": 0.99, - "learning_rate": 0.000151907815408832, - "loss": 0.0131, + "epoch": 0.51, + "learning_rate": 0.00022391149382680844, + "loss": 0.0465, "step": 195690 }, { - "epoch": 0.99, - "learning_rate": 0.00015190024771581797, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.00022390760561043698, + "loss": 0.0235, "step": 195700 }, { - "epoch": 0.99, - "learning_rate": 0.00015189268002280395, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022390371739406555, + "loss": 0.0192, "step": 195710 }, { - "epoch": 0.99, - "learning_rate": 0.00015188511232978996, - "loss": 0.0131, + "epoch": 0.51, + "learning_rate": 0.00022389982917769407, + "loss": 0.02, "step": 195720 }, { - "epoch": 0.99, - "learning_rate": 0.00015187754463677594, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022389594096132258, + "loss": 0.0176, "step": 195730 }, { - "epoch": 0.99, - "learning_rate": 0.00015186997694376192, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022389205274495112, + "loss": 0.0214, "step": 195740 }, { - "epoch": 0.99, - "learning_rate": 0.00015186240925074793, - "loss": 0.0141, + "epoch": 0.51, + "learning_rate": 0.0002238881645285797, + "loss": 0.0203, "step": 195750 }, { - "epoch": 0.99, - "learning_rate": 0.0001518548415577339, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002238842763122082, + "loss": 0.0405, "step": 195760 }, { - "epoch": 0.99, - "learning_rate": 0.0001518472738647199, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022388038809583675, + "loss": 0.0177, "step": 195770 }, { - "epoch": 0.99, - "learning_rate": 0.00015183970617170588, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022387649987946526, + "loss": 0.0172, "step": 195780 }, { - "epoch": 0.99, - "learning_rate": 0.00015183213847869188, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.0002238726116630938, + "loss": 0.0189, "step": 195790 }, { - "epoch": 0.99, - "learning_rate": 0.00015182457078567787, - "loss": 0.0139, + "epoch": 0.51, + "learning_rate": 0.00022386872344672235, + "loss": 0.0168, "step": 195800 }, { - "epoch": 0.99, - "learning_rate": 0.00015181700309266385, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002238648352303509, + "loss": 0.0244, "step": 195810 }, { - "epoch": 0.99, - "learning_rate": 0.00015180943539964986, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.0002238609470139794, + "loss": 0.0133, "step": 195820 }, { - "epoch": 0.99, - "learning_rate": 0.00015180186770663584, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022385705879760794, + "loss": 0.0157, "step": 195830 }, { - "epoch": 0.99, - "learning_rate": 0.00015179430001362182, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.00022385317058123649, + "loss": 0.0177, "step": 195840 }, { - "epoch": 0.99, - "learning_rate": 0.00015178673232060783, - "loss": 0.0149, + "epoch": 0.51, + "learning_rate": 0.00022384928236486503, + "loss": 0.0185, "step": 195850 }, { - "epoch": 0.99, - "learning_rate": 0.0001517791646275938, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022384539414849354, + "loss": 0.0156, "step": 195860 }, { - "epoch": 0.99, - "learning_rate": 0.0001517715969345798, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022384150593212208, + "loss": 0.0215, "step": 195870 }, { - "epoch": 0.99, - "learning_rate": 0.0001517640292415658, - "loss": 0.0137, + "epoch": 0.51, + "learning_rate": 0.00022383761771575063, + "loss": 0.0199, "step": 195880 }, { - "epoch": 0.99, - "learning_rate": 0.00015175646154855178, - "loss": 0.0138, + "epoch": 0.51, + "learning_rate": 0.00022383372949937917, + "loss": 0.0179, "step": 195890 }, { - "epoch": 0.99, - "learning_rate": 0.00015174889385553776, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022382984128300768, + "loss": 0.0207, "step": 195900 }, { - "epoch": 0.99, - "learning_rate": 0.00015174132616252377, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022382595306663622, + "loss": 0.0162, "step": 195910 }, { - "epoch": 0.99, - "learning_rate": 0.00015173375846950975, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.0002238220648502648, + "loss": 0.0188, "step": 195920 }, { - "epoch": 0.99, - "learning_rate": 0.00015172619077649573, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002238181766338933, + "loss": 0.0157, "step": 195930 }, { - "epoch": 0.99, - "learning_rate": 0.00015171862308348171, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.00022381428841752185, + "loss": 0.0175, "step": 195940 }, { - "epoch": 0.99, - "learning_rate": 0.00015171105539046772, - "loss": 0.0135, + "epoch": 0.51, + "learning_rate": 0.00022381040020115036, + "loss": 0.0153, "step": 195950 }, { - "epoch": 0.99, - "learning_rate": 0.0001517034876974537, - "loss": 0.0157, + "epoch": 0.51, + "learning_rate": 0.00022380651198477893, + "loss": 0.0214, "step": 195960 }, { - "epoch": 0.99, - "learning_rate": 0.00015169592000443969, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022380262376840745, + "loss": 0.0178, "step": 195970 }, { - "epoch": 0.99, - "learning_rate": 0.0001516883523114257, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.000223798735552036, + "loss": 0.0208, "step": 195980 }, { - "epoch": 0.99, - "learning_rate": 0.00015168078461841168, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.0002237948473356645, + "loss": 0.019, "step": 195990 }, { - "epoch": 0.99, - "learning_rate": 0.00015167321692539766, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022379095911929307, + "loss": 0.0157, "step": 196000 }, { - "epoch": 0.99, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.007811464369297028, - "eval_runtime": 116.6323, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.51, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.012171548791229725, + "eval_runtime": 107.9343, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.632, "step": 196000 }, { - "epoch": 0.99, - "learning_rate": 0.00015166564923238367, - "loss": 0.008, + "epoch": 0.51, + "learning_rate": 0.00022378707090292159, + "loss": 0.0186, "step": 196010 }, { - "epoch": 0.99, - "learning_rate": 0.00015165808153936965, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022378318268655013, + "loss": 0.0173, "step": 196020 }, { - "epoch": 0.99, - "learning_rate": 0.00015165051384635563, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022377929447017864, + "loss": 0.0196, "step": 196030 }, { - "epoch": 0.99, - "learning_rate": 0.00015164294615334164, - "loss": 0.012, + "epoch": 0.51, + "learning_rate": 0.00022377540625380718, + "loss": 0.0192, "step": 196040 }, { - "epoch": 0.99, - "learning_rate": 0.00015163537846032762, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022377151803743573, + "loss": 0.0177, "step": 196050 }, { - "epoch": 0.99, - "learning_rate": 0.0001516278107673136, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022376762982106427, + "loss": 0.0166, "step": 196060 }, { - "epoch": 0.99, - "learning_rate": 0.0001516202430742996, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022376374160469278, + "loss": 0.0195, "step": 196070 }, { - "epoch": 0.99, - "learning_rate": 0.0001516126753812856, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022375985338832132, + "loss": 0.0172, "step": 196080 }, { - "epoch": 0.99, - "learning_rate": 0.00015160510768827157, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002237559651719499, + "loss": 0.018, "step": 196090 }, { - "epoch": 0.99, - "learning_rate": 0.00015159753999525755, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002237520769555784, + "loss": 0.0148, "step": 196100 }, { - "epoch": 0.99, - "learning_rate": 0.00015158997230224356, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022374818873920695, + "loss": 0.0175, "step": 196110 }, { - "epoch": 0.99, - "learning_rate": 0.00015158240460922954, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022374430052283546, + "loss": 0.0185, "step": 196120 }, { - "epoch": 0.99, - "learning_rate": 0.00015157483691621552, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022374041230646403, + "loss": 0.018, "step": 196130 }, { - "epoch": 0.99, - "learning_rate": 0.00015156726922320153, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022373652409009255, + "loss": 0.017, "step": 196140 }, { - "epoch": 0.99, - "learning_rate": 0.00015155970153018751, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.0002237326358737211, + "loss": 0.0149, "step": 196150 }, { - "epoch": 0.99, - "learning_rate": 0.0001515521338371735, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.0002237287476573496, + "loss": 0.0178, "step": 196160 }, { - "epoch": 0.99, - "learning_rate": 0.0001515445661441595, - "loss": 0.0139, + "epoch": 0.51, + "learning_rate": 0.00022372485944097817, + "loss": 0.0155, "step": 196170 }, { - "epoch": 0.99, - "learning_rate": 0.00015153699845114549, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022372097122460669, + "loss": 0.0177, "step": 196180 }, { - "epoch": 0.99, - "learning_rate": 0.00015152943075813147, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.00022371708300823523, + "loss": 0.0231, "step": 196190 }, { - "epoch": 0.99, - "learning_rate": 0.00015152186306511748, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.00022371319479186374, + "loss": 0.0169, "step": 196200 }, { - "epoch": 0.99, - "learning_rate": 0.00015151429537210346, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002237093065754923, + "loss": 0.0196, "step": 196210 }, { - "epoch": 0.99, - "learning_rate": 0.00015150672767908944, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022370541835912082, + "loss": 0.0176, "step": 196220 }, { - "epoch": 0.99, - "learning_rate": 0.00015149915998607545, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022370153014274937, + "loss": 0.0184, "step": 196230 }, { - "epoch": 0.99, - "learning_rate": 0.00015149159229306143, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.00022369764192637788, + "loss": 0.0205, "step": 196240 }, { - "epoch": 0.99, - "learning_rate": 0.0001514840246000474, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022369375371000645, + "loss": 0.0155, "step": 196250 }, { - "epoch": 0.99, - "learning_rate": 0.00015147645690703342, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.000223689865493635, + "loss": 0.0211, "step": 196260 }, { - "epoch": 0.99, - "learning_rate": 0.0001514688892140194, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.0002236859772772635, + "loss": 0.0165, "step": 196270 }, { - "epoch": 0.99, - "learning_rate": 0.00015146132152100538, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022368208906089202, + "loss": 0.0131, "step": 196280 }, { - "epoch": 0.99, - "learning_rate": 0.00015145375382799136, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022367820084452056, + "loss": 0.0165, "step": 196290 }, { - "epoch": 0.99, - "learning_rate": 0.00015144618613497737, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022367431262814913, + "loss": 0.0169, "step": 196300 }, { - "epoch": 0.99, - "learning_rate": 0.00015143861844196335, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022367042441177765, + "loss": 0.022, "step": 196310 }, { - "epoch": 0.99, - "learning_rate": 0.00015143105074894933, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.0002236665361954062, + "loss": 0.018, "step": 196320 }, { - "epoch": 0.99, - "learning_rate": 0.00015142348305593534, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002236626479790347, + "loss": 0.0244, "step": 196330 }, { - "epoch": 0.99, - "learning_rate": 0.00015141591536292132, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022365875976266327, + "loss": 0.018, "step": 196340 }, { - "epoch": 0.99, - "learning_rate": 0.0001514083476699073, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022365487154629178, + "loss": 0.0196, "step": 196350 }, { - "epoch": 0.99, - "learning_rate": 0.00015140077997689331, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022365098332992033, + "loss": 0.0157, "step": 196360 }, { - "epoch": 0.99, - "learning_rate": 0.0001513932122838793, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022364709511354884, + "loss": 0.0202, "step": 196370 }, { - "epoch": 0.99, - "learning_rate": 0.00015138564459086528, - "loss": 0.012, + "epoch": 0.51, + "learning_rate": 0.0002236432068971774, + "loss": 0.0152, "step": 196380 }, { - "epoch": 0.99, - "learning_rate": 0.00015137807689785129, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022363931868080592, + "loss": 0.0218, "step": 196390 }, { - "epoch": 0.99, - "learning_rate": 0.00015137050920483727, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022363543046443447, + "loss": 0.0185, "step": 196400 }, { - "epoch": 0.99, - "learning_rate": 0.00015136294151182325, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022363154224806298, + "loss": 0.0143, "step": 196410 }, { - "epoch": 0.99, - "learning_rate": 0.00015135537381880926, - "loss": 0.0084, + "epoch": 0.51, + "learning_rate": 0.00022362765403169155, + "loss": 0.0161, "step": 196420 }, { - "epoch": 0.99, - "learning_rate": 0.00015134780612579524, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.0002236237658153201, + "loss": 0.0198, "step": 196430 }, { - "epoch": 0.99, - "learning_rate": 0.00015134023843278122, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.0002236198775989486, + "loss": 0.0204, "step": 196440 }, { - "epoch": 0.99, - "learning_rate": 0.0001513326707397672, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022361598938257712, + "loss": 0.0183, "step": 196450 }, { - "epoch": 0.99, - "learning_rate": 0.0001513251030467532, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.0002236121011662057, + "loss": 0.0178, "step": 196460 }, { - "epoch": 0.99, - "learning_rate": 0.0001513175353537392, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.00022360821294983423, + "loss": 0.0182, "step": 196470 }, { - "epoch": 0.99, - "learning_rate": 0.00015130996766072517, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022360432473346274, + "loss": 0.0161, "step": 196480 }, { - "epoch": 0.99, - "learning_rate": 0.00015130239996771118, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022360043651709129, + "loss": 0.0189, "step": 196490 }, { - "epoch": 0.99, - "learning_rate": 0.00015129483227469716, - "loss": 0.0163, + "epoch": 0.51, + "learning_rate": 0.00022359654830071983, + "loss": 0.0142, "step": 196500 }, { - "epoch": 0.99, - "learning_rate": 0.00015128726458168314, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022359266008434837, + "loss": 0.017, "step": 196510 }, { - "epoch": 0.99, - "learning_rate": 0.00015127969688866915, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022358877186797688, + "loss": 0.0174, "step": 196520 }, { - "epoch": 0.99, - "learning_rate": 0.00015127212919565513, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.00022358488365160543, + "loss": 0.0167, "step": 196530 }, { - "epoch": 0.99, - "learning_rate": 0.00015126456150264112, - "loss": 0.0082, + "epoch": 0.51, + "learning_rate": 0.00022358099543523394, + "loss": 0.0161, "step": 196540 }, { - "epoch": 0.99, - "learning_rate": 0.00015125699380962712, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002235771072188625, + "loss": 0.0155, "step": 196550 }, { - "epoch": 0.99, - "learning_rate": 0.0001512494261166131, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022357321900249102, + "loss": 0.0221, "step": 196560 }, { - "epoch": 0.99, - "learning_rate": 0.0001512418584235991, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022356933078611957, + "loss": 0.0151, "step": 196570 }, { - "epoch": 0.99, - "learning_rate": 0.0001512342907305851, - "loss": 0.0079, + "epoch": 0.51, + "learning_rate": 0.00022356544256974808, + "loss": 0.0145, "step": 196580 }, { - "epoch": 0.99, - "learning_rate": 0.00015122672303757108, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022356155435337665, + "loss": 0.0154, "step": 196590 }, { - "epoch": 0.99, - "learning_rate": 0.00015121915534455706, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022355766613700516, + "loss": 0.0163, "step": 196600 }, { - "epoch": 0.99, - "learning_rate": 0.00015121158765154304, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.0002235537779206337, + "loss": 0.0153, "step": 196610 }, { - "epoch": 0.99, - "learning_rate": 0.00015120401995852905, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.00022354988970426222, + "loss": 0.0167, "step": 196620 }, { - "epoch": 0.99, - "learning_rate": 0.00015119645226551503, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.0002235460014878908, + "loss": 0.0173, "step": 196630 }, { - "epoch": 0.99, - "learning_rate": 0.000151188884572501, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022354211327151933, + "loss": 0.0137, "step": 196640 }, { - "epoch": 0.99, - "learning_rate": 0.00015118131687948702, - "loss": 0.0148, + "epoch": 0.51, + "learning_rate": 0.00022353822505514784, + "loss": 0.0149, "step": 196650 }, { - "epoch": 0.99, - "learning_rate": 0.000151173749186473, - "loss": 0.0133, + "epoch": 0.51, + "learning_rate": 0.00022353433683877639, + "loss": 0.0174, "step": 196660 }, { - "epoch": 0.99, - "learning_rate": 0.00015116618149345898, - "loss": 0.0141, + "epoch": 0.51, + "learning_rate": 0.00022353044862240493, + "loss": 0.018, "step": 196670 }, { - "epoch": 0.99, - "learning_rate": 0.000151158613800445, - "loss": 0.0078, + "epoch": 0.51, + "learning_rate": 0.00022352656040603347, + "loss": 0.0174, "step": 196680 }, { - "epoch": 0.99, - "learning_rate": 0.00015115104610743097, - "loss": 0.0129, + "epoch": 0.51, + "learning_rate": 0.00022352267218966198, + "loss": 0.0193, "step": 196690 }, { - "epoch": 0.99, - "learning_rate": 0.00015114347841441695, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.00022351878397329053, + "loss": 0.0168, "step": 196700 }, { - "epoch": 0.99, - "learning_rate": 0.0001511359107214029, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022351489575691907, + "loss": 0.0172, "step": 196710 }, { - "epoch": 0.99, - "learning_rate": 0.00015112834302838892, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.0002235110075405476, + "loss": 0.0167, "step": 196720 }, { - "epoch": 0.99, - "learning_rate": 0.0001511207753353749, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022350711932417612, + "loss": 0.0175, "step": 196730 }, { - "epoch": 0.99, - "learning_rate": 0.00015111320764236088, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022350323110780466, + "loss": 0.019, "step": 196740 }, { - "epoch": 0.99, - "learning_rate": 0.0001511056399493469, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022349934289143318, + "loss": 0.0175, "step": 196750 }, { - "epoch": 0.99, - "learning_rate": 0.00015109807225633287, - "loss": 0.0135, + "epoch": 0.51, + "learning_rate": 0.00022349545467506175, + "loss": 0.0226, "step": 196760 }, { - "epoch": 0.99, - "learning_rate": 0.00015109050456331885, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022349156645869026, + "loss": 0.0158, "step": 196770 }, { - "epoch": 0.99, - "learning_rate": 0.00015108293687030486, - "loss": 0.0173, + "epoch": 0.51, + "learning_rate": 0.0002234876782423188, + "loss": 0.0138, "step": 196780 }, { - "epoch": 0.99, - "learning_rate": 0.00015107536917729084, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022348379002594732, + "loss": 0.0168, "step": 196790 }, { - "epoch": 0.99, - "learning_rate": 0.00015106780148427682, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.0002234799018095759, + "loss": 0.0174, "step": 196800 }, { - "epoch": 0.99, - "learning_rate": 0.00015106023379126283, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.00022347601359320443, + "loss": 0.0159, "step": 196810 }, { - "epoch": 0.99, - "learning_rate": 0.0001510526660982488, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022347212537683294, + "loss": 0.0182, "step": 196820 }, { - "epoch": 0.99, - "learning_rate": 0.0001510450984052348, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022346823716046149, + "loss": 0.0173, "step": 196830 }, { - "epoch": 0.99, - "learning_rate": 0.00015103753071222078, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022346434894409003, + "loss": 0.0193, "step": 196840 }, { - "epoch": 0.99, - "learning_rate": 0.00015102996301920678, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.00022346046072771857, + "loss": 0.0169, "step": 196850 }, { - "epoch": 0.99, - "learning_rate": 0.00015102239532619277, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022345657251134708, + "loss": 0.0202, "step": 196860 }, { - "epoch": 0.99, - "learning_rate": 0.00015101482763317875, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022345268429497562, + "loss": 0.0223, "step": 196870 }, { - "epoch": 0.99, - "learning_rate": 0.00015100725994016476, - "loss": 0.0132, + "epoch": 0.51, + "learning_rate": 0.00022344879607860417, + "loss": 0.0175, "step": 196880 }, { - "epoch": 0.99, - "learning_rate": 0.00015099969224715074, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.0002234449078622327, + "loss": 0.0167, "step": 196890 }, { - "epoch": 0.99, - "learning_rate": 0.00015099212455413672, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022344101964586122, + "loss": 0.0146, "step": 196900 }, { - "epoch": 0.99, - "learning_rate": 0.00015098455686112273, - "loss": 0.0134, + "epoch": 0.51, + "learning_rate": 0.00022343713142948976, + "loss": 0.0171, "step": 196910 }, { - "epoch": 0.99, - "learning_rate": 0.0001509769891681087, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.0002234332432131183, + "loss": 0.0171, "step": 196920 }, { - "epoch": 0.99, - "learning_rate": 0.0001509694214750947, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.00022342935499674685, + "loss": 0.0125, "step": 196930 }, { - "epoch": 0.99, - "learning_rate": 0.0001509618537820807, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022342546678037536, + "loss": 0.0182, "step": 196940 }, { - "epoch": 0.99, - "learning_rate": 0.00015095428608906668, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.0002234215785640039, + "loss": 0.0189, "step": 196950 }, { - "epoch": 0.99, - "learning_rate": 0.00015094671839605266, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022341769034763247, + "loss": 0.0157, "step": 196960 }, { - "epoch": 0.99, - "learning_rate": 0.00015093915070303867, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.000223413802131261, + "loss": 0.0172, "step": 196970 }, { - "epoch": 0.99, - "learning_rate": 0.00015093158301002465, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022340991391488953, + "loss": 0.0164, "step": 196980 }, { - "epoch": 0.99, - "learning_rate": 0.00015092401531701063, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.00022340602569851804, + "loss": 0.014, "step": 196990 }, { - "epoch": 0.99, - "learning_rate": 0.00015091644762399662, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022340213748214656, + "loss": 0.0163, "step": 197000 }, { - "epoch": 0.99, - "eval_cer": 0.9144877230334195, - "eval_loss": 0.007818542420864105, - "eval_runtime": 116.7928, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.51, + "eval_cer": 0.8818160569148363, + "eval_loss": 0.011719505302608013, + "eval_runtime": 107.9068, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, "step": 197000 }, { - "epoch": 0.99, - "learning_rate": 0.00015090887993098262, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022339824926577513, + "loss": 0.0164, "step": 197010 }, { - "epoch": 0.99, - "learning_rate": 0.0001509013122379686, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.00022339436104940367, + "loss": 0.0196, "step": 197020 }, { - "epoch": 0.99, - "learning_rate": 0.0001508937445449546, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022339047283303218, + "loss": 0.0201, "step": 197030 }, { - "epoch": 0.99, - "learning_rate": 0.0001508861768519406, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022338658461666072, + "loss": 0.0158, "step": 197040 }, { - "epoch": 0.99, - "learning_rate": 0.00015087860915892658, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022338269640028927, + "loss": 0.0208, "step": 197050 }, { - "epoch": 0.99, - "learning_rate": 0.00015087104146591256, - "loss": 0.0121, + "epoch": 0.51, + "learning_rate": 0.0002233788081839178, + "loss": 0.0196, "step": 197060 }, { - "epoch": 0.99, - "learning_rate": 0.00015086347377289857, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022337491996754632, + "loss": 0.0179, "step": 197070 }, { - "epoch": 0.99, - "learning_rate": 0.00015085590607988455, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022337103175117486, + "loss": 0.0175, "step": 197080 }, { - "epoch": 0.99, - "learning_rate": 0.00015084833838687053, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.0002233671435348034, + "loss": 0.0174, "step": 197090 }, { - "epoch": 0.99, - "learning_rate": 0.00015084077069385654, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022336325531843195, + "loss": 0.0177, "step": 197100 }, { - "epoch": 0.99, - "learning_rate": 0.00015083320300084252, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022335936710206046, + "loss": 0.0206, "step": 197110 }, { - "epoch": 0.99, - "learning_rate": 0.0001508256353078285, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.000223355478885689, + "loss": 0.0142, "step": 197120 }, { - "epoch": 0.99, - "learning_rate": 0.0001508180676148145, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022335159066931757, + "loss": 0.0141, "step": 197130 }, { - "epoch": 0.99, - "learning_rate": 0.0001508104999218005, - "loss": 0.0127, + "epoch": 0.51, + "learning_rate": 0.00022334770245294609, + "loss": 0.0178, "step": 197140 }, { - "epoch": 0.99, - "learning_rate": 0.00015080293222878647, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.0002233438142365746, + "loss": 0.0161, "step": 197150 }, { - "epoch": 0.99, - "learning_rate": 0.00015079536453577245, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022333992602020314, + "loss": 0.0143, "step": 197160 }, { - "epoch": 0.99, - "learning_rate": 0.00015078779684275846, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.0002233360378038317, + "loss": 0.0168, "step": 197170 }, { - "epoch": 0.99, - "learning_rate": 0.00015078022914974444, - "loss": 0.0134, + "epoch": 0.51, + "learning_rate": 0.00022333214958746023, + "loss": 0.0171, "step": 197180 }, { - "epoch": 0.99, - "learning_rate": 0.00015077266145673043, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022332826137108877, + "loss": 0.0165, "step": 197190 }, { - "epoch": 0.99, - "learning_rate": 0.00015076509376371643, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022332437315471728, + "loss": 0.0194, "step": 197200 }, { - "epoch": 0.99, - "learning_rate": 0.00015075752607070242, - "loss": 0.016, + "epoch": 0.51, + "learning_rate": 0.00022332048493834585, + "loss": 0.0176, "step": 197210 }, { - "epoch": 0.99, - "learning_rate": 0.0001507499583776884, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022331659672197437, + "loss": 0.0182, "step": 197220 }, { - "epoch": 1.0, - "learning_rate": 0.0001507423906846744, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002233127085056029, + "loss": 0.0211, "step": 197230 }, { - "epoch": 1.0, - "learning_rate": 0.0001507348229916604, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.00022330882028923142, + "loss": 0.0167, "step": 197240 }, { - "epoch": 1.0, - "learning_rate": 0.00015072725529864637, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022330493207285996, + "loss": 0.0167, "step": 197250 }, { - "epoch": 1.0, - "learning_rate": 0.00015071968760563238, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002233010438564885, + "loss": 0.0156, "step": 197260 }, { - "epoch": 1.0, - "learning_rate": 0.00015071211991261836, - "loss": 0.0135, + "epoch": 0.51, + "learning_rate": 0.00022329715564011705, + "loss": 0.0175, "step": 197270 }, { - "epoch": 1.0, - "learning_rate": 0.00015070455221960434, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022329326742374556, + "loss": 0.0145, "step": 197280 }, { - "epoch": 1.0, - "learning_rate": 0.00015069698452659035, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.0002232893792073741, + "loss": 0.0178, "step": 197290 }, { - "epoch": 1.0, - "learning_rate": 0.00015068941683357633, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022328549099100267, + "loss": 0.0147, "step": 197300 }, { - "epoch": 1.0, - "learning_rate": 0.0001506818491405623, - "loss": 0.0117, + "epoch": 0.51, + "learning_rate": 0.00022328160277463119, + "loss": 0.0144, "step": 197310 }, { - "epoch": 1.0, - "learning_rate": 0.00015067428144754832, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.0002232777145582597, + "loss": 0.0159, "step": 197320 }, { - "epoch": 1.0, - "learning_rate": 0.0001506667137545343, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.00022327382634188824, + "loss": 0.0172, "step": 197330 }, { - "epoch": 1.0, - "learning_rate": 0.00015065914606152028, - "loss": 0.0129, + "epoch": 0.51, + "learning_rate": 0.0002232699381255168, + "loss": 0.0166, "step": 197340 }, { - "epoch": 1.0, - "learning_rate": 0.00015065157836850626, - "loss": 0.0166, + "epoch": 0.51, + "learning_rate": 0.00022326604990914533, + "loss": 0.0153, "step": 197350 }, { - "epoch": 1.0, - "learning_rate": 0.00015064401067549227, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022326216169277387, + "loss": 0.0174, "step": 197360 }, { - "epoch": 1.0, - "learning_rate": 0.00015063644298247825, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022325827347640238, + "loss": 0.0163, "step": 197370 }, { - "epoch": 1.0, - "learning_rate": 0.00015062887528946424, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022325438526003095, + "loss": 0.0159, "step": 197380 }, { - "epoch": 1.0, - "learning_rate": 0.00015062130759645024, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022325049704365946, + "loss": 0.0174, "step": 197390 }, { - "epoch": 1.0, - "learning_rate": 0.00015061373990343623, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.000223246608827288, + "loss": 0.0156, "step": 197400 }, { - "epoch": 1.0, - "learning_rate": 0.0001506061722104222, - "loss": 0.008, + "epoch": 0.51, + "learning_rate": 0.00022324272061091652, + "loss": 0.0225, "step": 197410 }, { - "epoch": 1.0, - "learning_rate": 0.00015059860451740822, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002232388323945451, + "loss": 0.0176, "step": 197420 }, { - "epoch": 1.0, - "learning_rate": 0.0001505910368243942, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.0002232349441781736, + "loss": 0.0211, "step": 197430 }, { - "epoch": 1.0, - "learning_rate": 0.00015058346913138018, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022323105596180215, + "loss": 0.016, "step": 197440 }, { - "epoch": 1.0, - "learning_rate": 0.0001505759014383662, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022322716774543066, + "loss": 0.0153, "step": 197450 }, { - "epoch": 1.0, - "learning_rate": 0.00015056833374535217, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022322327952905923, + "loss": 0.0143, "step": 197460 }, { - "epoch": 1.0, - "learning_rate": 0.00015056076605233815, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022321939131268774, + "loss": 0.0132, "step": 197470 }, { - "epoch": 1.0, - "learning_rate": 0.00015055319835932416, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022321550309631629, + "loss": 0.0166, "step": 197480 }, { - "epoch": 1.0, - "learning_rate": 0.00015054563066631014, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.0002232116148799448, + "loss": 0.0166, "step": 197490 }, { - "epoch": 1.0, - "learning_rate": 0.00015053806297329612, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022320772666357334, + "loss": 0.0165, "step": 197500 }, { - "epoch": 1.0, - "learning_rate": 0.0001505304952802821, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.0002232038384472019, + "loss": 0.0196, "step": 197510 }, { - "epoch": 1.0, - "learning_rate": 0.0001505229275872681, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022319995023083042, + "loss": 0.0185, "step": 197520 }, { - "epoch": 1.0, - "learning_rate": 0.0001505153598942541, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022319606201445897, + "loss": 0.016, "step": 197530 }, { - "epoch": 1.0, - "learning_rate": 0.00015050779220124007, - "loss": 0.0116, + "epoch": 0.51, + "learning_rate": 0.00022319217379808748, + "loss": 0.0149, "step": 197540 }, { - "epoch": 1.0, - "learning_rate": 0.00015050022450822608, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022318828558171605, + "loss": 0.016, "step": 197550 }, { - "epoch": 1.0, - "learning_rate": 0.00015049265681521206, - "loss": 0.0085, + "epoch": 0.51, + "learning_rate": 0.00022318439736534456, + "loss": 0.0195, "step": 197560 }, { - "epoch": 1.0, - "learning_rate": 0.00015048508912219805, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.0002231805091489731, + "loss": 0.0255, "step": 197570 }, { - "epoch": 1.0, - "learning_rate": 0.00015047752142918405, - "loss": 0.0131, + "epoch": 0.51, + "learning_rate": 0.00022317662093260162, + "loss": 0.0231, "step": 197580 }, { - "epoch": 1.0, - "learning_rate": 0.00015046995373617004, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.0002231727327162302, + "loss": 0.0153, "step": 197590 }, { - "epoch": 1.0, - "learning_rate": 0.00015046238604315602, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002231688444998587, + "loss": 0.0148, "step": 197600 }, { - "epoch": 1.0, - "learning_rate": 0.00015045481835014203, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022316495628348725, + "loss": 0.0179, "step": 197610 }, { - "epoch": 1.0, - "learning_rate": 0.000150447250657128, - "loss": 0.0079, + "epoch": 0.51, + "learning_rate": 0.00022316106806711576, + "loss": 0.0162, "step": 197620 }, { - "epoch": 1.0, - "learning_rate": 0.000150439682964114, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022315717985074433, + "loss": 0.0182, "step": 197630 }, { - "epoch": 1.0, - "learning_rate": 0.0001504321152711, - "loss": 0.0078, + "epoch": 0.51, + "learning_rate": 0.00022315329163437284, + "loss": 0.0218, "step": 197640 }, { - "epoch": 1.0, - "learning_rate": 0.00015042454757808598, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022314940341800138, + "loss": 0.0153, "step": 197650 }, { - "epoch": 1.0, - "learning_rate": 0.00015041697988507196, - "loss": 0.0119, + "epoch": 0.51, + "learning_rate": 0.0002231455152016299, + "loss": 0.0183, "step": 197660 }, { - "epoch": 1.0, - "learning_rate": 0.00015040941219205794, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022314162698525847, + "loss": 0.0176, "step": 197670 }, { - "epoch": 1.0, - "learning_rate": 0.00015040184449904395, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.000223137738768887, + "loss": 0.0187, "step": 197680 }, { - "epoch": 1.0, - "learning_rate": 0.00015039427680602993, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022313385055251552, + "loss": 0.016, "step": 197690 }, { - "epoch": 1.0, - "learning_rate": 0.0001503867091130159, - "loss": 0.0098, + "epoch": 0.51, + "learning_rate": 0.00022312996233614407, + "loss": 0.0176, "step": 197700 }, { - "epoch": 1.0, - "learning_rate": 0.00015037914142000192, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.0002231260741197726, + "loss": 0.02, "step": 197710 }, { - "epoch": 1.0, - "learning_rate": 0.0001503715737269879, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022312218590340115, + "loss": 0.0234, "step": 197720 }, { - "epoch": 1.0, - "learning_rate": 0.00015036400603397388, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022311829768702966, + "loss": 0.018, "step": 197730 }, { - "epoch": 1.0, - "learning_rate": 0.0001503564383409599, - "loss": 0.0112, + "epoch": 0.51, + "learning_rate": 0.0002231144094706582, + "loss": 0.0165, "step": 197740 }, { - "epoch": 1.0, - "learning_rate": 0.00015034887064794587, - "loss": 0.0099, + "epoch": 0.51, + "learning_rate": 0.00022311052125428672, + "loss": 0.0195, "step": 197750 }, { - "epoch": 1.0, - "learning_rate": 0.00015034130295493186, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.0002231066330379153, + "loss": 0.0179, "step": 197760 }, { - "epoch": 1.0, - "learning_rate": 0.00015033373526191786, - "loss": 0.0073, + "epoch": 0.51, + "learning_rate": 0.0002231027448215438, + "loss": 0.0159, "step": 197770 }, { - "epoch": 1.0, - "learning_rate": 0.00015032616756890385, - "loss": 0.0081, + "epoch": 0.51, + "learning_rate": 0.00022309885660517234, + "loss": 0.0126, "step": 197780 }, { - "epoch": 1.0, - "learning_rate": 0.00015031859987588983, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022309496838880086, + "loss": 0.0162, "step": 197790 }, { - "epoch": 1.0, - "learning_rate": 0.00015031103218287584, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022309108017242943, + "loss": 0.0172, "step": 197800 }, { - "epoch": 1.0, - "learning_rate": 0.00015030346448986182, - "loss": 0.0136, + "epoch": 0.51, + "learning_rate": 0.00022308719195605794, + "loss": 0.0194, "step": 197810 }, { - "epoch": 1.0, - "learning_rate": 0.0001502958967968478, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022308330373968648, + "loss": 0.0181, "step": 197820 }, { - "epoch": 1.0, - "learning_rate": 0.0001502883291038338, - "loss": 0.013, + "epoch": 0.51, + "learning_rate": 0.000223079415523315, + "loss": 0.0191, "step": 197830 }, { - "epoch": 1.0, - "learning_rate": 0.0001502807614108198, - "loss": 0.0079, + "epoch": 0.51, + "learning_rate": 0.00022307552730694357, + "loss": 0.0193, "step": 197840 }, { - "epoch": 1.0, - "learning_rate": 0.00015027319371780577, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.0002230716390905721, + "loss": 0.0223, "step": 197850 }, { - "epoch": 1.0, - "learning_rate": 0.00015026562602479175, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022306775087420062, + "loss": 0.0153, "step": 197860 }, { - "epoch": 1.0, - "learning_rate": 0.00015025805833177776, - "loss": 0.0102, + "epoch": 0.51, + "learning_rate": 0.00022306386265782914, + "loss": 0.0202, "step": 197870 }, { - "epoch": 1.0, - "learning_rate": 0.00015025049063876374, - "loss": 0.0104, + "epoch": 0.51, + "learning_rate": 0.0002230599744414577, + "loss": 0.0157, "step": 197880 }, { - "epoch": 1.0, - "learning_rate": 0.00015024292294574972, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022305608622508625, + "loss": 0.0172, "step": 197890 }, { - "epoch": 1.0, - "learning_rate": 0.00015023535525273573, - "loss": 0.0141, + "epoch": 0.51, + "learning_rate": 0.00022305219800871476, + "loss": 0.0197, "step": 197900 }, { - "epoch": 1.0, - "learning_rate": 0.0001502277875597217, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002230483097923433, + "loss": 0.0177, "step": 197910 }, { - "epoch": 1.0, - "learning_rate": 0.0001502202198667077, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022304442157597185, + "loss": 0.02, "step": 197920 }, { - "epoch": 1.0, - "learning_rate": 0.0001502126521736937, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.0002230405333596004, + "loss": 0.0171, "step": 197930 }, { - "epoch": 1.0, - "learning_rate": 0.00015020508448067968, - "loss": 0.0118, + "epoch": 0.51, + "learning_rate": 0.0002230366451432289, + "loss": 0.0185, "step": 197940 }, { - "epoch": 1.0, - "learning_rate": 0.00015019751678766567, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.00022303275692685744, + "loss": 0.0162, "step": 197950 }, { - "epoch": 1.0, - "learning_rate": 0.00015018994909465162, - "loss": 0.0109, + "epoch": 0.51, + "learning_rate": 0.00022302886871048599, + "loss": 0.0172, "step": 197960 }, { - "epoch": 1.0, - "learning_rate": 0.00015018238140163763, - "loss": 0.0111, + "epoch": 0.51, + "learning_rate": 0.00022302498049411453, + "loss": 0.0163, "step": 197970 }, { - "epoch": 1.0, - "learning_rate": 0.0001501748137086236, - "loss": 0.0077, + "epoch": 0.51, + "learning_rate": 0.00022302109227774304, + "loss": 0.0201, "step": 197980 }, { - "epoch": 1.0, - "learning_rate": 0.0001501672460156096, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.00022301720406137158, + "loss": 0.0158, "step": 197990 }, { - "epoch": 1.0, - "learning_rate": 0.0001501596783225956, - "loss": 0.0091, + "epoch": 0.51, + "learning_rate": 0.0002230133158450001, + "loss": 0.0157, "step": 198000 }, { - "epoch": 1.0, - "eval_cer": 0.9144508479806542, - "eval_loss": 0.007899566553533077, - "eval_runtime": 116.6273, - "eval_samples_per_second": 17.149, - "eval_steps_per_second": 4.287, + "epoch": 0.51, + "eval_cer": 0.8818356518319148, + "eval_loss": 0.011476157233119011, + "eval_runtime": 107.9405, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, "step": 198000 }, { - "epoch": 1.0, - "learning_rate": 0.00015015211062958158, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022300942762862867, + "loss": 0.0173, "step": 198010 }, { - "epoch": 1.0, - "learning_rate": 0.00015014454293656756, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.0002230055394122572, + "loss": 0.0132, "step": 198020 }, { - "epoch": 1.0, - "learning_rate": 0.00015013697524355357, - "loss": 0.0132, + "epoch": 0.51, + "learning_rate": 0.00022300165119588572, + "loss": 0.0172, "step": 198030 }, { - "epoch": 1.0, - "learning_rate": 0.00015012940755053955, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022299776297951424, + "loss": 0.0177, "step": 198040 }, { - "epoch": 1.0, - "learning_rate": 0.00015012183985752553, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.0002229938747631428, + "loss": 0.0204, "step": 198050 }, { - "epoch": 1.0, - "learning_rate": 0.00015011427216451152, - "loss": 0.0122, + "epoch": 0.51, + "learning_rate": 0.00022298998654677135, + "loss": 0.0165, "step": 198060 }, { - "epoch": 1.0, - "learning_rate": 0.00015010670447149752, - "loss": 0.013, + "epoch": 0.51, + "learning_rate": 0.00022298609833039986, + "loss": 0.0208, "step": 198070 }, { - "epoch": 1.0, - "learning_rate": 0.0001500991367784835, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.0002229822101140284, + "loss": 0.0165, "step": 198080 }, { - "epoch": 1.0, - "learning_rate": 0.0001500915690854695, - "loss": 0.007, + "epoch": 0.51, + "learning_rate": 0.00022297832189765695, + "loss": 0.0182, "step": 198090 }, { - "epoch": 1.0, - "learning_rate": 0.0001500840013924555, - "loss": 0.0124, + "epoch": 0.51, + "learning_rate": 0.0002229744336812855, + "loss": 0.018, "step": 198100 }, { - "epoch": 1.0, - "learning_rate": 0.00015007643369944148, - "loss": 0.0075, + "epoch": 0.51, + "learning_rate": 0.000222970545464914, + "loss": 0.0174, "step": 198110 }, { - "epoch": 1.0, - "learning_rate": 0.00015006886600642746, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022296665724854254, + "loss": 0.0179, "step": 198120 }, { - "epoch": 1.0, - "learning_rate": 0.00015006129831341347, - "loss": 0.0134, + "epoch": 0.51, + "learning_rate": 0.00022296276903217108, + "loss": 0.0202, "step": 198130 }, { - "epoch": 1.0, - "learning_rate": 0.00015005373062039945, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022295888081579963, + "loss": 0.0211, "step": 198140 }, { - "epoch": 1.0, - "learning_rate": 0.00015004616292738543, - "loss": 0.0164, + "epoch": 0.51, + "learning_rate": 0.00022295499259942814, + "loss": 0.0166, "step": 198150 }, { - "epoch": 1.0, - "learning_rate": 0.00015003859523437144, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022295110438305668, + "loss": 0.0158, "step": 198160 }, { - "epoch": 1.0, - "learning_rate": 0.00015003102754135742, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022294721616668525, + "loss": 0.0176, "step": 198170 }, { - "epoch": 1.0, - "learning_rate": 0.0001500234598483434, - "loss": 0.0145, + "epoch": 0.51, + "learning_rate": 0.00022294332795031377, + "loss": 0.0164, "step": 198180 }, { - "epoch": 1.0, - "learning_rate": 0.0001500158921553294, - "loss": 0.0115, + "epoch": 0.51, + "learning_rate": 0.00022293943973394228, + "loss": 0.0162, "step": 198190 }, { - "epoch": 1.0, - "learning_rate": 0.0001500083244623154, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022293555151757082, + "loss": 0.0196, "step": 198200 }, { - "epoch": 1.0, - "learning_rate": 0.00015000075676930137, - "loss": 0.0138, - "step": 198210 + "epoch": 0.51, + "learning_rate": 0.0002229316633011994, + "loss": 0.0165, + "step": 198210 }, { - "epoch": 1.0, - "learning_rate": 0.00014999318907628738, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.0002229277750848279, + "loss": 0.0251, "step": 198220 }, { - "epoch": 1.0, - "learning_rate": 0.00014998562138327336, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022292388686845645, + "loss": 0.0219, "step": 198230 }, { - "epoch": 1.0, - "learning_rate": 0.00014997805369025937, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022291999865208496, + "loss": 0.0182, "step": 198240 }, { - "epoch": 1.0, - "learning_rate": 0.00014997048599724535, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.0002229161104357135, + "loss": 0.0158, "step": 198250 }, { - "epoch": 1.0, - "learning_rate": 0.00014996291830423133, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022291222221934204, + "loss": 0.0154, "step": 198260 }, { - "epoch": 1.0, - "learning_rate": 0.00014995535061121734, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.0002229083340029706, + "loss": 0.0152, "step": 198270 }, { - "epoch": 1.0, - "learning_rate": 0.0001499477829182033, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.0002229044457865991, + "loss": 0.0158, "step": 198280 }, { - "epoch": 1.0, - "learning_rate": 0.0001499402152251893, - "loss": 0.0107, + "epoch": 0.51, + "learning_rate": 0.00022290055757022764, + "loss": 0.0161, "step": 198290 }, { - "epoch": 1.0, - "learning_rate": 0.0001499326475321753, - "loss": 0.0087, + "epoch": 0.51, + "learning_rate": 0.00022289666935385618, + "loss": 0.0193, "step": 198300 }, { - "epoch": 1.0, - "learning_rate": 0.00014992507983916127, - "loss": 0.0094, + "epoch": 0.51, + "learning_rate": 0.00022289278113748473, + "loss": 0.0181, "step": 198310 }, { - "epoch": 1.0, - "learning_rate": 0.00014991751214614728, - "loss": 0.0105, + "epoch": 0.51, + "learning_rate": 0.00022288889292111324, + "loss": 0.0189, "step": 198320 }, { - "epoch": 1.0, - "learning_rate": 0.00014990994445313326, - "loss": 0.0088, + "epoch": 0.51, + "learning_rate": 0.00022288500470474178, + "loss": 0.014, "step": 198330 }, { - "epoch": 1.0, - "learning_rate": 0.00014990237676011924, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022288111648837032, + "loss": 0.0167, "step": 198340 }, { - "epoch": 1.0, - "learning_rate": 0.00014989480906710525, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.00022287722827199887, + "loss": 0.0161, "step": 198350 }, { - "epoch": 1.0, - "learning_rate": 0.00014988724137409123, - "loss": 0.0106, + "epoch": 0.51, + "learning_rate": 0.00022287334005562738, + "loss": 0.0198, "step": 198360 }, { - "epoch": 1.0, - "learning_rate": 0.0001498796736810772, - "loss": 0.0083, + "epoch": 0.51, + "learning_rate": 0.00022286945183925592, + "loss": 0.0143, "step": 198370 }, { - "epoch": 1.0, - "learning_rate": 0.00014987210598806322, - "loss": 0.0092, + "epoch": 0.51, + "learning_rate": 0.0002228655636228845, + "loss": 0.0139, "step": 198380 }, { - "epoch": 1.0, - "learning_rate": 0.0001498645382950492, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.000222861675406513, + "loss": 0.0189, "step": 198390 }, { - "epoch": 1.0, - "learning_rate": 0.00014985697060203518, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022285778719014155, + "loss": 0.0262, "step": 198400 }, { - "epoch": 1.0, - "learning_rate": 0.00014984940290902116, - "loss": 0.0117, + "epoch": 0.51, + "learning_rate": 0.00022285389897377006, + "loss": 0.0191, "step": 198410 }, { - "epoch": 1.0, - "learning_rate": 0.00014984183521600717, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022285001075739863, + "loss": 0.0195, "step": 198420 }, { - "epoch": 1.0, - "learning_rate": 0.00014983426752299315, - "loss": 0.0067, + "epoch": 0.51, + "learning_rate": 0.00022284612254102714, + "loss": 0.0175, "step": 198430 }, { - "epoch": 1.0, - "learning_rate": 0.00014982669982997914, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022284223432465569, + "loss": 0.0143, "step": 198440 }, { - "epoch": 1.0, - "learning_rate": 0.00014981913213696514, - "loss": 0.0089, + "epoch": 0.51, + "learning_rate": 0.0002228383461082842, + "loss": 0.0163, "step": 198450 }, { - "epoch": 1.0, - "learning_rate": 0.00014981156444395113, - "loss": 0.0103, + "epoch": 0.51, + "learning_rate": 0.00022283445789191277, + "loss": 0.0202, "step": 198460 }, { - "epoch": 1.0, - "learning_rate": 0.0001498039967509371, - "loss": 0.0125, + "epoch": 0.51, + "learning_rate": 0.00022283056967554128, + "loss": 0.0151, "step": 198470 }, { - "epoch": 1.0, - "learning_rate": 0.00014979642905792312, - "loss": 0.0086, + "epoch": 0.51, + "learning_rate": 0.00022282668145916983, + "loss": 0.0167, "step": 198480 }, { - "epoch": 1.0, - "learning_rate": 0.0001497888613649091, - "loss": 0.0097, + "epoch": 0.51, + "learning_rate": 0.00022282279324279834, + "loss": 0.018, "step": 198490 }, { - "epoch": 1.0, - "learning_rate": 0.00014978129367189508, - "loss": 0.0067, + "epoch": 0.51, + "learning_rate": 0.00022281890502642688, + "loss": 0.0183, "step": 198500 }, { - "epoch": 1.0, - "learning_rate": 0.0001497737259788811, - "loss": 0.0101, + "epoch": 0.51, + "learning_rate": 0.00022281501681005542, + "loss": 0.0228, "step": 198510 }, { - "epoch": 1.0, - "learning_rate": 0.00014976615828586707, - "loss": 0.0114, + "epoch": 0.51, + "learning_rate": 0.00022281112859368396, + "loss": 0.0176, "step": 198520 }, { - "epoch": 1.0, - "learning_rate": 0.00014975859059285305, - "loss": 0.009, + "epoch": 0.51, + "learning_rate": 0.00022280724037731248, + "loss": 0.0166, "step": 198530 }, { - "epoch": 1.0, - "learning_rate": 0.00014975102289983906, - "loss": 0.0081, + "epoch": 0.51, + "learning_rate": 0.00022280335216094102, + "loss": 0.0168, "step": 198540 }, { - "epoch": 1.0, - "learning_rate": 0.00014974345520682504, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.0002227994639445696, + "loss": 0.0184, "step": 198550 }, { - "epoch": 1.0, - "learning_rate": 0.00014973588751381102, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.0002227955757281981, + "loss": 0.0168, "step": 198560 }, { - "epoch": 1.0, - "learning_rate": 0.000149728319820797, - "loss": 0.0093, + "epoch": 0.51, + "learning_rate": 0.00022279168751182665, + "loss": 0.0187, "step": 198570 }, { - "epoch": 1.0, - "learning_rate": 0.000149720752127783, - "loss": 0.01, + "epoch": 0.51, + "learning_rate": 0.00022278779929545516, + "loss": 0.0135, "step": 198580 }, { - "epoch": 1.0, - "learning_rate": 0.000149713184434769, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.00022278391107908373, + "loss": 0.0212, "step": 198590 }, { - "epoch": 1.0, - "learning_rate": 0.00014970561674175497, - "loss": 0.0158, + "epoch": 0.51, + "learning_rate": 0.00022278002286271224, + "loss": 0.0187, "step": 198600 }, { - "epoch": 1.0, - "learning_rate": 0.00014969804904874098, - "loss": 0.015, + "epoch": 0.51, + "learning_rate": 0.00022277613464634079, + "loss": 0.017, "step": 198610 }, { - "epoch": 1.0, - "learning_rate": 0.00014969048135572696, - "loss": 0.0128, + "epoch": 0.51, + "learning_rate": 0.0002227722464299693, + "loss": 0.0198, "step": 198620 }, { - "epoch": 1.0, - "learning_rate": 0.00014968291366271295, - "loss": 0.011, + "epoch": 0.51, + "learning_rate": 0.00022276835821359787, + "loss": 0.0175, "step": 198630 }, { - "epoch": 1.0, - "learning_rate": 0.00014967534596969895, - "loss": 0.0096, + "epoch": 0.51, + "learning_rate": 0.00022276446999722638, + "loss": 0.0175, "step": 198640 }, { - "epoch": 1.0, - "learning_rate": 0.00014966777827668494, - "loss": 0.0108, + "epoch": 0.51, + "learning_rate": 0.00022276058178085492, + "loss": 0.0168, "step": 198650 }, { - "epoch": 1.0, - "learning_rate": 0.00014966021058367092, - "loss": 0.0095, + "epoch": 0.51, + "learning_rate": 0.00022275669356448344, + "loss": 0.0174, "step": 198660 }, { - "epoch": 1.0, - "learning_rate": 0.00014965264289065693, - "loss": 0.0113, + "epoch": 0.51, + "learning_rate": 0.000222752805348112, + "loss": 0.0167, "step": 198670 }, { - "epoch": 1.0, - "learning_rate": 0.0001496450751976429, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022274891713174052, + "loss": 0.0178, "step": 198680 }, { - "epoch": 1.0, - "learning_rate": 0.0001496375075046289, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022274502891536906, + "loss": 0.0145, "step": 198690 }, { - "epoch": 1.0, - "learning_rate": 0.0001496299398116149, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022274114069899758, + "loss": 0.0183, "step": 198700 }, { - "epoch": 1.0, - "learning_rate": 0.00014962237211860088, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022273725248262615, + "loss": 0.015, "step": 198710 }, { - "epoch": 1.0, - "learning_rate": 0.00014961480442558686, - "loss": 0.0074, + "epoch": 0.52, + "learning_rate": 0.0002227333642662547, + "loss": 0.0199, "step": 198720 }, { - "epoch": 1.0, - "learning_rate": 0.00014960723673257287, - "loss": 0.0135, + "epoch": 0.52, + "learning_rate": 0.0002227294760498832, + "loss": 0.0205, "step": 198730 }, { - "epoch": 1.0, - "learning_rate": 0.00014959966903955885, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022272558783351172, + "loss": 0.0177, "step": 198740 }, { - "epoch": 1.0, - "learning_rate": 0.00014959210134654483, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.00022272169961714026, + "loss": 0.0152, "step": 198750 }, { - "epoch": 1.0, - "learning_rate": 0.0001495845336535308, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022271781140076883, + "loss": 0.0213, "step": 198760 }, { - "epoch": 1.0, - "learning_rate": 0.00014957696596051682, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022271392318439734, + "loss": 0.0164, "step": 198770 }, { - "epoch": 1.0, - "learning_rate": 0.0001495693982675028, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022271003496802588, + "loss": 0.0171, "step": 198780 }, { - "epoch": 1.0, - "learning_rate": 0.00014956183057448878, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.0002227061467516544, + "loss": 0.0234, "step": 198790 }, { - "epoch": 1.0, - "learning_rate": 0.0001495542628814748, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.00022270225853528297, + "loss": 0.021, "step": 198800 }, { - "epoch": 1.0, - "learning_rate": 0.00014954669518846077, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022269837031891148, + "loss": 0.0175, "step": 198810 }, { - "epoch": 1.0, - "learning_rate": 0.00014953912749544676, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022269448210254002, + "loss": 0.0179, "step": 198820 }, { - "epoch": 1.0, - "learning_rate": 0.00014953155980243276, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.00022269059388616854, + "loss": 0.0166, "step": 198830 }, { - "epoch": 1.0, - "learning_rate": 0.00014952399210941875, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.0002226867056697971, + "loss": 0.0189, "step": 198840 }, { - "epoch": 1.0, - "learning_rate": 0.00014951642441640473, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022268281745342562, + "loss": 0.0187, "step": 198850 }, { - "epoch": 1.0, - "learning_rate": 0.00014950885672339074, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022267892923705416, + "loss": 0.0185, "step": 198860 }, { - "epoch": 1.0, - "learning_rate": 0.00014950128903037672, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022267504102068268, + "loss": 0.0163, "step": 198870 }, { - "epoch": 1.0, - "learning_rate": 0.0001494937213373627, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022267115280431125, + "loss": 0.0137, "step": 198880 }, { - "epoch": 1.0, - "learning_rate": 0.0001494861536443487, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.0002226672645879398, + "loss": 0.0205, "step": 198890 }, { - "epoch": 1.0, - "learning_rate": 0.0001494785859513347, - "loss": 0.0116, + "epoch": 0.52, + "learning_rate": 0.0002226633763715683, + "loss": 0.0175, "step": 198900 }, { - "epoch": 1.0, - "learning_rate": 0.00014947101825832067, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022265948815519682, + "loss": 0.0138, "step": 198910 }, { - "epoch": 1.0, - "learning_rate": 0.00014946345056530665, - "loss": 0.0067, + "epoch": 0.52, + "learning_rate": 0.00022265559993882539, + "loss": 0.0154, "step": 198920 }, { - "epoch": 1.0, - "learning_rate": 0.00014945588287229263, - "loss": 0.0138, + "epoch": 0.52, + "learning_rate": 0.00022265171172245393, + "loss": 0.0156, "step": 198930 }, { - "epoch": 1.0, - "learning_rate": 0.00014944831517927861, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022264782350608244, + "loss": 0.0165, "step": 198940 }, { - "epoch": 1.0, - "learning_rate": 0.00014944074748626462, - "loss": 0.0139, + "epoch": 0.52, + "learning_rate": 0.00022264393528971098, + "loss": 0.0198, "step": 198950 }, { - "epoch": 1.0, - "learning_rate": 0.0001494331797932506, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022264004707333953, + "loss": 0.0208, "step": 198960 }, { - "epoch": 1.0, - "learning_rate": 0.00014942561210023659, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022263615885696807, + "loss": 0.0168, "step": 198970 }, { - "epoch": 1.0, - "learning_rate": 0.0001494180444072226, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022263227064059658, + "loss": 0.0174, "step": 198980 }, { - "epoch": 1.0, - "learning_rate": 0.00014941047671420858, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022262838242422512, + "loss": 0.0187, "step": 198990 }, { - "epoch": 1.0, - "learning_rate": 0.00014940290902119456, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022262449420785364, + "loss": 0.0176, "step": 199000 }, { - "epoch": 1.0, - "eval_cer": 0.914462492734159, - "eval_loss": 0.00810973159968853, - "eval_runtime": 117.6891, - "eval_samples_per_second": 16.994, - "eval_steps_per_second": 4.248, + "epoch": 0.52, + "eval_cer": 0.8817992612716261, + "eval_loss": 0.012197881937026978, + "eval_runtime": 107.9744, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, "step": 199000 }, { - "epoch": 1.0, - "learning_rate": 0.00014939534132818057, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.0002226206059914822, + "loss": 0.0189, "step": 199010 }, { - "epoch": 1.0, - "learning_rate": 0.00014938777363516655, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022261671777511072, + "loss": 0.0175, "step": 199020 }, { - "epoch": 1.0, - "learning_rate": 0.00014938020594215253, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022261282955873926, + "loss": 0.0192, "step": 199030 }, { - "epoch": 1.0, - "learning_rate": 0.00014937263824913854, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022260894134236778, + "loss": 0.0169, "step": 199040 }, { - "epoch": 1.0, - "learning_rate": 0.00014936507055612452, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022260505312599635, + "loss": 0.0182, "step": 199050 }, { - "epoch": 1.0, - "learning_rate": 0.0001493575028631105, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022260116490962486, + "loss": 0.017, "step": 199060 }, { - "epoch": 1.0, - "learning_rate": 0.0001493499351700965, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.0002225972766932534, + "loss": 0.0141, "step": 199070 }, { - "epoch": 1.0, - "learning_rate": 0.0001493423674770825, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022259338847688192, + "loss": 0.0136, "step": 199080 }, { - "epoch": 1.0, - "learning_rate": 0.00014933479978406847, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022258950026051049, + "loss": 0.018, "step": 199090 }, { - "epoch": 1.0, - "learning_rate": 0.00014932723209105445, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022258561204413903, + "loss": 0.0148, "step": 199100 }, { - "epoch": 1.0, - "learning_rate": 0.00014931966439804046, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022258172382776754, + "loss": 0.0197, "step": 199110 }, { - "epoch": 1.0, - "learning_rate": 0.00014931209670502644, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022257783561139608, + "loss": 0.0169, "step": 199120 }, { - "epoch": 1.0, - "learning_rate": 0.00014930452901201242, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022257394739502463, + "loss": 0.0187, "step": 199130 }, { - "epoch": 1.0, - "learning_rate": 0.00014929696131899843, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022257005917865317, + "loss": 0.019, "step": 199140 }, { - "epoch": 1.0, - "learning_rate": 0.00014928939362598441, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022256617096228168, + "loss": 0.0192, "step": 199150 }, { - "epoch": 1.0, - "learning_rate": 0.0001492818259329704, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022256228274591022, + "loss": 0.0161, "step": 199160 }, { - "epoch": 1.0, - "learning_rate": 0.0001492742582399564, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022255839452953876, + "loss": 0.0146, "step": 199170 }, { - "epoch": 1.0, - "learning_rate": 0.00014926669054694239, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.0002225545063131673, + "loss": 0.0201, "step": 199180 }, { - "epoch": 1.0, - "learning_rate": 0.00014925912285392837, - "loss": 0.0162, + "epoch": 0.52, + "learning_rate": 0.00022255061809679582, + "loss": 0.0196, "step": 199190 }, { - "epoch": 1.0, - "learning_rate": 0.00014925155516091438, - "loss": 0.0074, + "epoch": 0.52, + "learning_rate": 0.00022254672988042436, + "loss": 0.0162, "step": 199200 }, { - "epoch": 1.01, - "learning_rate": 0.00014924398746790036, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.0002225428416640529, + "loss": 0.0199, "step": 199210 }, { - "epoch": 1.01, - "learning_rate": 0.00014923641977488634, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022253895344768145, + "loss": 0.0189, "step": 199220 }, { - "epoch": 1.01, - "learning_rate": 0.00014922885208187235, - "loss": 0.0081, + "epoch": 0.52, + "learning_rate": 0.00022253506523130996, + "loss": 0.0214, "step": 199230 }, { - "epoch": 1.01, - "learning_rate": 0.00014922128438885833, - "loss": 0.0115, + "epoch": 0.52, + "learning_rate": 0.0002225311770149385, + "loss": 0.0196, "step": 199240 }, { - "epoch": 1.01, - "learning_rate": 0.0001492137166958443, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.00022252728879856702, + "loss": 0.0143, "step": 199250 }, { - "epoch": 1.01, - "learning_rate": 0.00014920614900283032, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022252340058219559, + "loss": 0.018, "step": 199260 }, { - "epoch": 1.01, - "learning_rate": 0.0001491985813098163, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022251951236582413, + "loss": 0.0171, "step": 199270 }, { - "epoch": 1.01, - "learning_rate": 0.00014919101361680228, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022251562414945264, + "loss": 0.0173, "step": 199280 }, { - "epoch": 1.01, - "learning_rate": 0.00014918344592378826, - "loss": 0.0078, + "epoch": 0.52, + "learning_rate": 0.00022251173593308118, + "loss": 0.0153, "step": 199290 }, { - "epoch": 1.01, - "learning_rate": 0.00014917587823077427, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022250784771670972, + "loss": 0.0207, "step": 199300 }, { - "epoch": 1.01, - "learning_rate": 0.00014916831053776025, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022250395950033827, + "loss": 0.0165, "step": 199310 }, { - "epoch": 1.01, - "learning_rate": 0.00014916074284474623, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022250007128396678, + "loss": 0.0176, "step": 199320 }, { - "epoch": 1.01, - "learning_rate": 0.00014915317515173224, - "loss": 0.0081, + "epoch": 0.52, + "learning_rate": 0.00022249618306759532, + "loss": 0.014, "step": 199330 }, { - "epoch": 1.01, - "learning_rate": 0.00014914560745871822, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022249229485122386, + "loss": 0.0171, "step": 199340 }, { - "epoch": 1.01, - "learning_rate": 0.0001491380397657042, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.0002224884066348524, + "loss": 0.0161, "step": 199350 }, { - "epoch": 1.01, - "learning_rate": 0.00014913047207269021, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022248451841848092, + "loss": 0.0155, "step": 199360 }, { - "epoch": 1.01, - "learning_rate": 0.0001491229043796762, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022248063020210946, + "loss": 0.0178, "step": 199370 }, { - "epoch": 1.01, - "learning_rate": 0.00014911533668666218, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.000222476741985738, + "loss": 0.0155, "step": 199380 }, { - "epoch": 1.01, - "learning_rate": 0.00014910776899364819, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022247285376936655, + "loss": 0.0212, "step": 199390 }, { - "epoch": 1.01, - "learning_rate": 0.00014910020130063417, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022246896555299506, + "loss": 0.0204, "step": 199400 }, { - "epoch": 1.01, - "learning_rate": 0.00014909263360762015, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.0002224650773366236, + "loss": 0.0158, "step": 199410 }, { - "epoch": 1.01, - "learning_rate": 0.00014908506591460616, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022246118912025217, + "loss": 0.0128, "step": 199420 }, { - "epoch": 1.01, - "learning_rate": 0.00014907749822159214, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022245730090388068, + "loss": 0.0158, "step": 199430 }, { - "epoch": 1.01, - "learning_rate": 0.00014906993052857812, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022245341268750923, + "loss": 0.0205, "step": 199440 }, { - "epoch": 1.01, - "learning_rate": 0.0001490623628355641, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022244952447113774, + "loss": 0.0217, "step": 199450 }, { - "epoch": 1.01, - "learning_rate": 0.0001490547951425501, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.0002224456362547663, + "loss": 0.0194, "step": 199460 }, { - "epoch": 1.01, - "learning_rate": 0.0001490472274495361, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022244174803839482, + "loss": 0.0179, "step": 199470 }, { - "epoch": 1.01, - "learning_rate": 0.00014903965975652207, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022243785982202337, + "loss": 0.0189, "step": 199480 }, { - "epoch": 1.01, - "learning_rate": 0.00014903209206350808, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022243397160565188, + "loss": 0.0162, "step": 199490 }, { - "epoch": 1.01, - "learning_rate": 0.00014902452437049406, - "loss": 0.0127, + "epoch": 0.52, + "learning_rate": 0.00022243008338928042, + "loss": 0.0151, "step": 199500 }, { - "epoch": 1.01, - "learning_rate": 0.00014901695667748004, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022242619517290896, + "loss": 0.018, "step": 199510 }, { - "epoch": 1.01, - "learning_rate": 0.00014900938898446605, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.0002224223069565375, + "loss": 0.0196, "step": 199520 }, { - "epoch": 1.01, - "learning_rate": 0.00014900182129145203, - "loss": 0.0153, + "epoch": 0.52, + "learning_rate": 0.00022241841874016602, + "loss": 0.0167, "step": 199530 }, { - "epoch": 1.01, - "learning_rate": 0.00014899425359843802, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022241453052379456, + "loss": 0.0188, "step": 199540 }, { - "epoch": 1.01, - "learning_rate": 0.000148986685905424, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002224106423074231, + "loss": 0.0193, "step": 199550 }, { - "epoch": 1.01, - "learning_rate": 0.00014897911821240998, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022240675409105164, + "loss": 0.0175, "step": 199560 }, { - "epoch": 1.01, - "learning_rate": 0.000148971550519396, - "loss": 0.0081, + "epoch": 0.52, + "learning_rate": 0.00022240286587468016, + "loss": 0.0233, "step": 199570 }, { - "epoch": 1.01, - "learning_rate": 0.00014896398282638197, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.0002223989776583087, + "loss": 0.023, "step": 199580 }, { - "epoch": 1.01, - "learning_rate": 0.00014895641513336795, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022239508944193727, + "loss": 0.0167, "step": 199590 }, { - "epoch": 1.01, - "learning_rate": 0.00014894884744035396, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022239120122556578, + "loss": 0.0191, "step": 199600 }, { - "epoch": 1.01, - "learning_rate": 0.00014894127974733994, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022238731300919433, + "loss": 0.0137, "step": 199610 }, { - "epoch": 1.01, - "learning_rate": 0.00014893371205432592, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022238342479282284, + "loss": 0.0151, "step": 199620 }, { - "epoch": 1.01, - "learning_rate": 0.00014892614436131193, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.0002223795365764514, + "loss": 0.0183, "step": 199630 }, { - "epoch": 1.01, - "learning_rate": 0.0001489185766682979, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022237564836007992, + "loss": 0.0207, "step": 199640 }, { - "epoch": 1.01, - "learning_rate": 0.0001489110089752839, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022237176014370847, + "loss": 0.0188, "step": 199650 }, { - "epoch": 1.01, - "learning_rate": 0.00014890344128226987, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022236787192733698, + "loss": 0.019, "step": 199660 }, { - "epoch": 1.01, - "learning_rate": 0.00014889587358925588, - "loss": 0.0142, + "epoch": 0.52, + "learning_rate": 0.00022236398371096555, + "loss": 0.018, "step": 199670 }, { - "epoch": 1.01, - "learning_rate": 0.00014888830589624186, - "loss": 0.0162, + "epoch": 0.52, + "learning_rate": 0.00022236009549459406, + "loss": 0.0173, "step": 199680 }, { - "epoch": 1.01, - "learning_rate": 0.00014888073820322785, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.0002223562072782226, + "loss": 0.0174, "step": 199690 }, { - "epoch": 1.01, - "learning_rate": 0.00014887317051021385, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022235231906185112, + "loss": 0.0166, "step": 199700 }, { - "epoch": 1.01, - "learning_rate": 0.00014886560281719984, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.0002223484308454797, + "loss": 0.0192, "step": 199710 }, { - "epoch": 1.01, - "learning_rate": 0.00014885803512418582, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.0002223445426291082, + "loss": 0.0154, "step": 199720 }, { - "epoch": 1.01, - "learning_rate": 0.00014885046743117183, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022234065441273674, + "loss": 0.0207, "step": 199730 }, { - "epoch": 1.01, - "learning_rate": 0.0001488428997381578, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022233676619636526, + "loss": 0.0192, "step": 199740 }, { - "epoch": 1.01, - "learning_rate": 0.0001488353320451438, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.0002223328779799938, + "loss": 0.0154, "step": 199750 }, { - "epoch": 1.01, - "learning_rate": 0.0001488277643521298, - "loss": 0.0069, + "epoch": 0.52, + "learning_rate": 0.00022232898976362237, + "loss": 0.0225, "step": 199760 }, { - "epoch": 1.01, - "learning_rate": 0.00014882019665911578, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022232510154725088, + "loss": 0.02, "step": 199770 }, { - "epoch": 1.01, - "learning_rate": 0.00014881262896610176, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.0002223212133308794, + "loss": 0.0164, "step": 199780 }, { - "epoch": 1.01, - "learning_rate": 0.00014880506127308777, - "loss": 0.0082, + "epoch": 0.52, + "learning_rate": 0.00022231732511450794, + "loss": 0.0162, "step": 199790 }, { - "epoch": 1.01, - "learning_rate": 0.00014879749358007375, - "loss": 0.0137, + "epoch": 0.52, + "learning_rate": 0.0002223134368981365, + "loss": 0.0176, "step": 199800 }, { - "epoch": 1.01, - "learning_rate": 0.00014878992588705973, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022230954868176502, + "loss": 0.0165, "step": 199810 }, { - "epoch": 1.01, - "learning_rate": 0.0001487823581940457, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022230566046539356, + "loss": 0.02, "step": 199820 }, { - "epoch": 1.01, - "learning_rate": 0.00014877479050103172, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022230177224902208, + "loss": 0.016, "step": 199830 }, { - "epoch": 1.01, - "learning_rate": 0.0001487672228080177, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.00022229788403265065, + "loss": 0.015, "step": 199840 }, { - "epoch": 1.01, - "learning_rate": 0.00014875965511500368, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022229399581627916, + "loss": 0.0201, "step": 199850 }, { - "epoch": 1.01, - "learning_rate": 0.0001487520874219897, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.0002222901075999077, + "loss": 0.0214, "step": 199860 }, { - "epoch": 1.01, - "learning_rate": 0.00014874451972897567, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022228621938353622, + "loss": 0.024, "step": 199870 }, { - "epoch": 1.01, - "learning_rate": 0.00014873695203596166, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.0002222823311671648, + "loss": 0.0152, "step": 199880 }, { - "epoch": 1.01, - "learning_rate": 0.00014872938434294766, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.0002222784429507933, + "loss": 0.018, "step": 199890 }, { - "epoch": 1.01, - "learning_rate": 0.00014872181664993365, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022227455473442184, + "loss": 0.0154, "step": 199900 }, { - "epoch": 1.01, - "learning_rate": 0.00014871424895691963, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022227066651805036, + "loss": 0.0183, "step": 199910 }, { - "epoch": 1.01, - "learning_rate": 0.00014870668126390564, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022226677830167893, + "loss": 0.0169, "step": 199920 }, { - "epoch": 1.01, - "learning_rate": 0.00014869911357089162, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022226289008530744, + "loss": 0.0183, "step": 199930 }, { - "epoch": 1.01, - "learning_rate": 0.0001486915458778776, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022225900186893598, + "loss": 0.0151, "step": 199940 }, { - "epoch": 1.01, - "learning_rate": 0.0001486839781848636, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.0002222551136525645, + "loss": 0.0181, "step": 199950 }, { - "epoch": 1.01, - "learning_rate": 0.0001486764104918496, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022225122543619307, + "loss": 0.0179, "step": 199960 }, { - "epoch": 1.01, - "learning_rate": 0.00014866884279883557, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.0002222473372198216, + "loss": 0.0153, "step": 199970 }, { - "epoch": 1.01, - "learning_rate": 0.00014866127510582155, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022224344900345012, + "loss": 0.0164, "step": 199980 }, { - "epoch": 1.01, - "learning_rate": 0.00014865370741280756, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022223956078707866, + "loss": 0.0148, "step": 199990 }, { - "epoch": 1.01, - "learning_rate": 0.00014864613971979354, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022223567257070718, + "loss": 0.0183, "step": 200000 }, { - "epoch": 1.01, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.007801192346960306, - "eval_runtime": 117.4252, - "eval_samples_per_second": 17.032, - "eval_steps_per_second": 4.258, + "epoch": 0.52, + "eval_cer": 0.8817880641761527, + "eval_loss": 0.012208198197185993, + "eval_runtime": 108.0565, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, "step": 200000 }, { - "epoch": 1.01, - "learning_rate": 0.00014863857202677952, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022223178435433575, + "loss": 0.0196, "step": 200010 }, { - "epoch": 1.01, - "learning_rate": 0.00014863100433376553, - "loss": 0.0116, + "epoch": 0.52, + "learning_rate": 0.00022222789613796426, + "loss": 0.021, "step": 200020 }, { - "epoch": 1.01, - "learning_rate": 0.0001486234366407515, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.0002222240079215928, + "loss": 0.016, "step": 200030 }, { - "epoch": 1.01, - "learning_rate": 0.0001486158689477375, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022222011970522132, + "loss": 0.0178, "step": 200040 }, { - "epoch": 1.01, - "learning_rate": 0.0001486083012547235, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.0002222162314888499, + "loss": 0.0136, "step": 200050 }, { - "epoch": 1.01, - "learning_rate": 0.00014860073356170948, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.0002222123432724784, + "loss": 0.0163, "step": 200060 }, { - "epoch": 1.01, - "learning_rate": 0.00014859316586869547, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022220845505610694, + "loss": 0.0175, "step": 200070 }, { - "epoch": 1.01, - "learning_rate": 0.00014858559817568147, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022220456683973546, + "loss": 0.0194, "step": 200080 }, { - "epoch": 1.01, - "learning_rate": 0.00014857803048266746, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022220067862336403, + "loss": 0.0196, "step": 200090 }, { - "epoch": 1.01, - "learning_rate": 0.00014857046278965344, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022219679040699254, + "loss": 0.0191, "step": 200100 }, { - "epoch": 1.01, - "learning_rate": 0.00014856289509663945, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022219290219062108, + "loss": 0.0164, "step": 200110 }, { - "epoch": 1.01, - "learning_rate": 0.00014855532740362543, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.0002221890139742496, + "loss": 0.0188, "step": 200120 }, { - "epoch": 1.01, - "learning_rate": 0.0001485477597106114, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022218512575787817, + "loss": 0.0189, "step": 200130 }, { - "epoch": 1.01, - "learning_rate": 0.00014854019201759742, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.0002221812375415067, + "loss": 0.0172, "step": 200140 }, { - "epoch": 1.01, - "learning_rate": 0.0001485326243245834, - "loss": 0.0074, + "epoch": 0.52, + "learning_rate": 0.00022217734932513522, + "loss": 0.0166, "step": 200150 }, { - "epoch": 1.01, - "learning_rate": 0.00014852505663156938, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022217346110876376, + "loss": 0.0209, "step": 200160 }, { - "epoch": 1.01, - "learning_rate": 0.00014851748893855536, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.0002221695728923923, + "loss": 0.0152, "step": 200170 }, { - "epoch": 1.01, - "learning_rate": 0.00014850992124554134, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022216568467602085, + "loss": 0.0198, "step": 200180 }, { - "epoch": 1.01, - "learning_rate": 0.00014850235355252732, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022216179645964936, + "loss": 0.0181, "step": 200190 }, { - "epoch": 1.01, - "learning_rate": 0.00014849478585951333, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.0002221579082432779, + "loss": 0.0168, "step": 200200 }, { - "epoch": 1.01, - "learning_rate": 0.00014848721816649931, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022215402002690644, + "loss": 0.0184, "step": 200210 }, { - "epoch": 1.01, - "learning_rate": 0.0001484796504734853, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022215013181053499, + "loss": 0.024, "step": 200220 }, { - "epoch": 1.01, - "learning_rate": 0.0001484720827804713, - "loss": 0.0075, + "epoch": 0.52, + "learning_rate": 0.0002221462435941635, + "loss": 0.0496, "step": 200230 }, { - "epoch": 1.01, - "learning_rate": 0.00014846451508745729, - "loss": 0.0082, + "epoch": 0.52, + "learning_rate": 0.00022214235537779204, + "loss": 0.0284, "step": 200240 }, { - "epoch": 1.01, - "learning_rate": 0.00014845694739444327, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022213846716142056, + "loss": 0.016, "step": 200250 }, { - "epoch": 1.01, - "learning_rate": 0.00014844937970142928, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022213457894504913, + "loss": 0.0203, "step": 200260 }, { - "epoch": 1.01, - "learning_rate": 0.00014844181200841526, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022213069072867764, + "loss": 0.0208, "step": 200270 }, { - "epoch": 1.01, - "learning_rate": 0.00014843424431540124, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022212680251230618, + "loss": 0.0184, "step": 200280 }, { - "epoch": 1.01, - "learning_rate": 0.00014842667662238725, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.0002221229142959347, + "loss": 0.0161, "step": 200290 }, { - "epoch": 1.01, - "learning_rate": 0.00014841910892937323, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022211902607956327, + "loss": 0.0209, "step": 200300 }, { - "epoch": 1.01, - "learning_rate": 0.0001484115412363592, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.0002221151378631918, + "loss": 0.0183, "step": 200310 }, { - "epoch": 1.01, - "learning_rate": 0.00014840397354334522, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022211124964682032, + "loss": 0.0181, "step": 200320 }, { - "epoch": 1.01, - "learning_rate": 0.0001483964058503312, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022210736143044884, + "loss": 0.019, "step": 200330 }, { - "epoch": 1.01, - "learning_rate": 0.00014838883815731718, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.0002221034732140774, + "loss": 0.0152, "step": 200340 }, { - "epoch": 1.01, - "learning_rate": 0.00014838127046430316, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022209958499770595, + "loss": 0.0183, "step": 200350 }, { - "epoch": 1.01, - "learning_rate": 0.00014837370277128917, - "loss": 0.0074, + "epoch": 0.52, + "learning_rate": 0.00022209569678133446, + "loss": 0.0164, "step": 200360 }, { - "epoch": 1.01, - "learning_rate": 0.00014836613507827515, - "loss": 0.0176, + "epoch": 0.52, + "learning_rate": 0.000222091808564963, + "loss": 0.0239, "step": 200370 }, { - "epoch": 1.01, - "learning_rate": 0.00014835856738526113, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022208792034859154, + "loss": 0.0138, "step": 200380 }, { - "epoch": 1.01, - "learning_rate": 0.00014835099969224714, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022208403213222009, + "loss": 0.0192, "step": 200390 }, { - "epoch": 1.01, - "learning_rate": 0.00014834343199923312, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.0002220801439158486, + "loss": 0.0154, "step": 200400 }, { - "epoch": 1.01, - "learning_rate": 0.0001483358643062191, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022207625569947714, + "loss": 0.0181, "step": 200410 }, { - "epoch": 1.01, - "learning_rate": 0.00014832829661320511, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022207236748310568, + "loss": 0.018, "step": 200420 }, { - "epoch": 1.01, - "learning_rate": 0.0001483207289201911, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022206847926673423, + "loss": 0.0235, "step": 200430 }, { - "epoch": 1.01, - "learning_rate": 0.00014831316122717708, - "loss": 0.015, + "epoch": 0.52, + "learning_rate": 0.00022206459105036274, + "loss": 0.023, "step": 200440 }, { - "epoch": 1.01, - "learning_rate": 0.00014830559353416309, - "loss": 0.0131, + "epoch": 0.52, + "learning_rate": 0.00022206070283399128, + "loss": 0.0251, "step": 200450 }, { - "epoch": 1.01, - "learning_rate": 0.00014829802584114907, - "loss": 0.0498, + "epoch": 0.52, + "learning_rate": 0.00022205681461761985, + "loss": 0.0182, "step": 200460 }, { - "epoch": 1.01, - "learning_rate": 0.00014829045814813505, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.00022205292640124836, + "loss": 0.0168, "step": 200470 }, { - "epoch": 1.01, - "learning_rate": 0.00014828289045512106, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002220490381848769, + "loss": 0.0182, "step": 200480 }, { - "epoch": 1.01, - "learning_rate": 0.00014827532276210704, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022204514996850542, + "loss": 0.0203, "step": 200490 }, { - "epoch": 1.01, - "learning_rate": 0.00014826775506909302, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022204126175213394, + "loss": 0.0189, "step": 200500 }, { - "epoch": 1.01, - "learning_rate": 0.000148260187376079, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002220373735357625, + "loss": 0.0145, "step": 200510 }, { - "epoch": 1.01, - "learning_rate": 0.000148252619683065, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022203348531939105, + "loss": 0.0162, "step": 200520 }, { - "epoch": 1.01, - "learning_rate": 0.000148245051990051, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022202959710301956, + "loss": 0.0197, "step": 200530 }, { - "epoch": 1.01, - "learning_rate": 0.00014823748429703697, - "loss": 0.0123, + "epoch": 0.52, + "learning_rate": 0.0002220257088866481, + "loss": 0.0184, "step": 200540 }, { - "epoch": 1.01, - "learning_rate": 0.00014822991660402298, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022202182067027664, + "loss": 0.0228, "step": 200550 }, { - "epoch": 1.01, - "learning_rate": 0.00014822234891100896, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022201793245390519, + "loss": 0.0123, "step": 200560 }, { - "epoch": 1.01, - "learning_rate": 0.00014821478121799494, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.0002220140442375337, + "loss": 0.0186, "step": 200570 }, { - "epoch": 1.01, - "learning_rate": 0.00014820721352498095, - "loss": 0.0071, + "epoch": 0.52, + "learning_rate": 0.00022201015602116224, + "loss": 0.0172, "step": 200580 }, { - "epoch": 1.01, - "learning_rate": 0.00014819964583196693, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022200626780479078, + "loss": 0.0153, "step": 200590 }, { - "epoch": 1.01, - "learning_rate": 0.00014819207813895292, - "loss": 0.0127, + "epoch": 0.52, + "learning_rate": 0.00022200237958841932, + "loss": 0.0225, "step": 200600 }, { - "epoch": 1.01, - "learning_rate": 0.00014818451044593892, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.00022199849137204784, + "loss": 0.0175, "step": 200610 }, { - "epoch": 1.01, - "learning_rate": 0.0001481769427529249, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022199460315567638, + "loss": 0.019, "step": 200620 }, { - "epoch": 1.01, - "learning_rate": 0.0001481693750599109, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022199071493930495, + "loss": 0.0189, "step": 200630 }, { - "epoch": 1.01, - "learning_rate": 0.0001481618073668969, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022198682672293346, + "loss": 0.0162, "step": 200640 }, { - "epoch": 1.01, - "learning_rate": 0.00014815423967388288, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.00022198293850656198, + "loss": 0.0165, "step": 200650 }, { - "epoch": 1.01, - "learning_rate": 0.00014814667198086886, - "loss": 0.0076, + "epoch": 0.52, + "learning_rate": 0.00022197905029019052, + "loss": 0.0181, "step": 200660 }, { - "epoch": 1.01, - "learning_rate": 0.00014813910428785487, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.0002219751620738191, + "loss": 0.0239, "step": 200670 }, { - "epoch": 1.01, - "learning_rate": 0.00014813153659484085, - "loss": 0.0104, + "epoch": 0.52, + "learning_rate": 0.0002219712738574476, + "loss": 0.0181, "step": 200680 }, { - "epoch": 1.01, - "learning_rate": 0.00014812396890182683, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022196738564107614, + "loss": 0.0207, "step": 200690 }, { - "epoch": 1.01, - "learning_rate": 0.0001481164012088128, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022196349742470466, + "loss": 0.0178, "step": 200700 }, { - "epoch": 1.01, - "learning_rate": 0.00014810883351579882, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022195960920833323, + "loss": 0.0156, "step": 200710 }, { - "epoch": 1.01, - "learning_rate": 0.0001481012658227848, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022195572099196174, + "loss": 0.0135, "step": 200720 }, { - "epoch": 1.01, - "learning_rate": 0.00014809369812977078, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022195183277559028, + "loss": 0.0214, "step": 200730 }, { - "epoch": 1.01, - "learning_rate": 0.0001480861304367568, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.0002219479445592188, + "loss": 0.0165, "step": 200740 }, { - "epoch": 1.01, - "learning_rate": 0.00014807856274374277, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022194405634284734, + "loss": 0.0142, "step": 200750 }, { - "epoch": 1.01, - "learning_rate": 0.00014807099505072875, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022194016812647588, + "loss": 0.0159, "step": 200760 }, { - "epoch": 1.01, - "learning_rate": 0.00014806342735771476, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022193627991010442, + "loss": 0.0215, "step": 200770 }, { - "epoch": 1.01, - "learning_rate": 0.00014805585966470074, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022193239169373294, + "loss": 0.0219, "step": 200780 }, { - "epoch": 1.01, - "learning_rate": 0.00014804829197168673, - "loss": 0.0124, + "epoch": 0.52, + "learning_rate": 0.00022192850347736148, + "loss": 0.0185, "step": 200790 }, { - "epoch": 1.01, - "learning_rate": 0.0001480407242786727, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022192461526099002, + "loss": 0.0192, "step": 200800 }, { - "epoch": 1.01, - "learning_rate": 0.0001480331565856587, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022192072704461856, + "loss": 0.0179, "step": 200810 }, { - "epoch": 1.01, - "learning_rate": 0.0001480255888926447, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022191683882824708, + "loss": 0.0156, "step": 200820 }, { - "epoch": 1.01, - "learning_rate": 0.00014801802119963068, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022191295061187562, + "loss": 0.0168, "step": 200830 }, { - "epoch": 1.01, - "learning_rate": 0.00014801045350661666, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.0002219090623955042, + "loss": 0.0167, "step": 200840 }, { - "epoch": 1.01, - "learning_rate": 0.00014800288581360267, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002219051741791327, + "loss": 0.0259, "step": 200850 }, { - "epoch": 1.01, - "learning_rate": 0.00014799531812058865, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022190128596276124, + "loss": 0.0182, "step": 200860 }, { - "epoch": 1.01, - "learning_rate": 0.00014798775042757463, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022189739774638976, + "loss": 0.0175, "step": 200870 }, { - "epoch": 1.01, - "learning_rate": 0.0001479801827345606, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.00022189350953001833, + "loss": 0.0175, "step": 200880 }, { - "epoch": 1.01, - "learning_rate": 0.00014797261504154662, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.00022188962131364684, + "loss": 0.0151, "step": 200890 }, { - "epoch": 1.01, - "learning_rate": 0.0001479650473485326, - "loss": 0.0112, + "epoch": 0.52, + "learning_rate": 0.00022188573309727538, + "loss": 0.0176, "step": 200900 }, { - "epoch": 1.01, - "learning_rate": 0.00014795747965551858, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.0002218818448809039, + "loss": 0.015, "step": 200910 }, { - "epoch": 1.01, - "learning_rate": 0.0001479499119625046, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022187795666453247, + "loss": 0.0207, "step": 200920 }, { - "epoch": 1.01, - "learning_rate": 0.00014794234426949057, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022187406844816098, + "loss": 0.0207, "step": 200930 }, { - "epoch": 1.01, - "learning_rate": 0.00014793477657647656, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022187018023178952, + "loss": 0.0206, "step": 200940 }, { - "epoch": 1.01, - "learning_rate": 0.00014792720888346256, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022186629201541804, + "loss": 0.0171, "step": 200950 }, { - "epoch": 1.01, - "learning_rate": 0.00014791964119044855, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.0002218624037990466, + "loss": 0.0172, "step": 200960 }, { - "epoch": 1.01, - "learning_rate": 0.00014791207349743453, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022185851558267512, + "loss": 0.0187, "step": 200970 }, { - "epoch": 1.01, - "learning_rate": 0.00014790450580442054, - "loss": 0.0159, + "epoch": 0.52, + "learning_rate": 0.00022185462736630366, + "loss": 0.0195, "step": 200980 }, { - "epoch": 1.01, - "learning_rate": 0.00014789693811140652, - "loss": 0.0129, + "epoch": 0.52, + "learning_rate": 0.00022185073914993218, + "loss": 0.0185, "step": 200990 }, { - "epoch": 1.01, - "learning_rate": 0.0001478893704183925, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022184685093356072, + "loss": 0.0169, "step": 201000 }, { - "epoch": 1.01, - "eval_cer": 0.914447936792278, - "eval_loss": 0.007961818017065525, - "eval_runtime": 117.347, - "eval_samples_per_second": 17.043, - "eval_steps_per_second": 4.261, + "epoch": 0.52, + "eval_cer": 0.8817600714374692, + "eval_loss": 0.011896415613591671, + "eval_runtime": 108.2669, + "eval_samples_per_second": 18.473, + "eval_steps_per_second": 4.618, "step": 201000 }, { - "epoch": 1.01, - "learning_rate": 0.0001478818027253785, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.0002218429627171893, + "loss": 0.0207, "step": 201010 }, { - "epoch": 1.01, - "learning_rate": 0.0001478742350323645, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.0002218390745008178, + "loss": 0.028, "step": 201020 }, { - "epoch": 1.01, - "learning_rate": 0.00014786666733935047, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022183518628444634, + "loss": 0.0166, "step": 201030 }, { - "epoch": 1.01, - "learning_rate": 0.00014785909964633645, - "loss": 0.0135, + "epoch": 0.52, + "learning_rate": 0.00022183129806807486, + "loss": 0.017, "step": 201040 }, { - "epoch": 1.01, - "learning_rate": 0.00014785153195332246, - "loss": 0.0141, + "epoch": 0.52, + "learning_rate": 0.00022182740985170343, + "loss": 0.0207, "step": 201050 }, { - "epoch": 1.01, - "learning_rate": 0.00014784396426030844, - "loss": 0.0078, + "epoch": 0.52, + "learning_rate": 0.00022182352163533194, + "loss": 0.0169, "step": 201060 }, { - "epoch": 1.01, - "learning_rate": 0.00014783639656729442, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022181963341896048, + "loss": 0.0153, "step": 201070 }, { - "epoch": 1.01, - "learning_rate": 0.00014782882887428043, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.000221815745202589, + "loss": 0.0116, "step": 201080 }, { - "epoch": 1.01, - "learning_rate": 0.0001478212611812664, - "loss": 0.01, + "epoch": 0.52, + "learning_rate": 0.00022181185698621757, + "loss": 0.0135, "step": 201090 }, { - "epoch": 1.01, - "learning_rate": 0.0001478136934882524, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022180796876984608, + "loss": 0.0184, "step": 201100 }, { - "epoch": 1.01, - "learning_rate": 0.0001478061257952384, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022180408055347462, + "loss": 0.0157, "step": 201110 }, { - "epoch": 1.01, - "learning_rate": 0.00014779855810222438, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022180019233710314, + "loss": 0.0191, "step": 201120 }, { - "epoch": 1.01, - "learning_rate": 0.00014779099040921037, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.0002217963041207317, + "loss": 0.0149, "step": 201130 }, { - "epoch": 1.01, - "learning_rate": 0.00014778342271619637, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022179241590436022, + "loss": 0.0159, "step": 201140 }, { - "epoch": 1.01, - "learning_rate": 0.00014777585502318236, - "loss": 0.0116, + "epoch": 0.52, + "learning_rate": 0.00022178852768798876, + "loss": 0.017, "step": 201150 }, { - "epoch": 1.01, - "learning_rate": 0.00014776828733016834, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022178463947161728, + "loss": 0.0182, "step": 201160 }, { - "epoch": 1.01, - "learning_rate": 0.00014776071963715435, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022178075125524585, + "loss": 0.0161, "step": 201170 }, { - "epoch": 1.01, - "learning_rate": 0.00014775315194414033, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.0002217768630388744, + "loss": 0.0169, "step": 201180 }, { - "epoch": 1.02, - "learning_rate": 0.0001477455842511263, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.0002217729748225029, + "loss": 0.0142, "step": 201190 }, { - "epoch": 1.02, - "learning_rate": 0.00014773801655811232, - "loss": 0.0082, + "epoch": 0.52, + "learning_rate": 0.00022176908660613144, + "loss": 0.0165, "step": 201200 }, { - "epoch": 1.02, - "learning_rate": 0.0001477304488650983, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022176519838975998, + "loss": 0.0138, "step": 201210 }, { - "epoch": 1.02, - "learning_rate": 0.00014772288117208428, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022176131017338853, + "loss": 0.0174, "step": 201220 }, { - "epoch": 1.02, - "learning_rate": 0.00014771531347907026, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022175742195701704, + "loss": 0.0131, "step": 201230 }, { - "epoch": 1.02, - "learning_rate": 0.00014770774578605627, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022175353374064558, + "loss": 0.021, "step": 201240 }, { - "epoch": 1.02, - "learning_rate": 0.00014770017809304225, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.0002217496455242741, + "loss": 0.0198, "step": 201250 }, { - "epoch": 1.02, - "learning_rate": 0.00014769261040002823, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.00022174575730790267, + "loss": 0.0176, "step": 201260 }, { - "epoch": 1.02, - "learning_rate": 0.00014768504270701424, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.00022174186909153118, + "loss": 0.0157, "step": 201270 }, { - "epoch": 1.02, - "learning_rate": 0.00014767747501400022, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022173798087515972, + "loss": 0.0172, "step": 201280 }, { - "epoch": 1.02, - "learning_rate": 0.0001476699073209862, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022173409265878824, + "loss": 0.0243, "step": 201290 }, { - "epoch": 1.02, - "learning_rate": 0.0001476623396279722, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.0002217302044424168, + "loss": 0.0173, "step": 201300 }, { - "epoch": 1.02, - "learning_rate": 0.0001476547719349582, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022172631622604532, + "loss": 0.0169, "step": 201310 }, { - "epoch": 1.02, - "learning_rate": 0.00014764720424194418, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022172242800967386, + "loss": 0.0192, "step": 201320 }, { - "epoch": 1.02, - "learning_rate": 0.00014763963654893018, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022171853979330238, + "loss": 0.02, "step": 201330 }, { - "epoch": 1.02, - "learning_rate": 0.00014763206885591617, - "loss": 0.0078, + "epoch": 0.52, + "learning_rate": 0.00022171465157693094, + "loss": 0.0189, "step": 201340 }, { - "epoch": 1.02, - "learning_rate": 0.00014762450116290215, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.0002217107633605595, + "loss": 0.0142, "step": 201350 }, { - "epoch": 1.02, - "learning_rate": 0.00014761693346988816, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.000221706875144188, + "loss": 0.0197, "step": 201360 }, { - "epoch": 1.02, - "learning_rate": 0.00014760936577687414, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022170298692781652, + "loss": 0.0196, "step": 201370 }, { - "epoch": 1.02, - "learning_rate": 0.00014760179808386012, - "loss": 0.0086, + "epoch": 0.52, + "learning_rate": 0.00022169909871144508, + "loss": 0.0146, "step": 201380 }, { - "epoch": 1.02, - "learning_rate": 0.0001475942303908461, - "loss": 0.0102, + "epoch": 0.52, + "learning_rate": 0.00022169521049507363, + "loss": 0.0147, "step": 201390 }, { - "epoch": 1.02, - "learning_rate": 0.0001475866626978321, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022169132227870214, + "loss": 0.0175, "step": 201400 }, { - "epoch": 1.02, - "learning_rate": 0.0001475790950048181, - "loss": 0.0143, + "epoch": 0.52, + "learning_rate": 0.00022168743406233068, + "loss": 0.0181, "step": 201410 }, { - "epoch": 1.02, - "learning_rate": 0.00014757152731180407, - "loss": 0.0086, + "epoch": 0.52, + "learning_rate": 0.00022168354584595922, + "loss": 0.0148, "step": 201420 }, { - "epoch": 1.02, - "learning_rate": 0.00014756395961879005, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022167965762958777, + "loss": 0.0188, "step": 201430 }, { - "epoch": 1.02, - "learning_rate": 0.00014755639192577603, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022167576941321628, + "loss": 0.0184, "step": 201440 }, { - "epoch": 1.02, - "learning_rate": 0.00014754882423276204, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022167188119684482, + "loss": 0.0174, "step": 201450 }, { - "epoch": 1.02, - "learning_rate": 0.00014754125653974802, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022166799298047336, + "loss": 0.018, "step": 201460 }, { - "epoch": 1.02, - "learning_rate": 0.000147533688846734, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.0002216641047641019, + "loss": 0.0196, "step": 201470 }, { - "epoch": 1.02, - "learning_rate": 0.00014752612115372001, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022166021654773042, + "loss": 0.0168, "step": 201480 }, { - "epoch": 1.02, - "learning_rate": 0.000147518553460706, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022165632833135896, + "loss": 0.0195, "step": 201490 }, { - "epoch": 1.02, - "learning_rate": 0.00014751098576769198, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022165244011498748, + "loss": 0.0158, "step": 201500 }, { - "epoch": 1.02, - "learning_rate": 0.00014750341807467799, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022164855189861604, + "loss": 0.0183, "step": 201510 }, { - "epoch": 1.02, - "learning_rate": 0.00014749585038166397, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022164466368224456, + "loss": 0.0186, "step": 201520 }, { - "epoch": 1.02, - "learning_rate": 0.00014748828268864995, - "loss": 0.0117, + "epoch": 0.52, + "learning_rate": 0.0002216407754658731, + "loss": 0.017, "step": 201530 }, { - "epoch": 1.02, - "learning_rate": 0.00014748071499563596, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022163688724950161, + "loss": 0.0204, "step": 201540 }, { - "epoch": 1.02, - "learning_rate": 0.00014747314730262194, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022163299903313018, + "loss": 0.0152, "step": 201550 }, { - "epoch": 1.02, - "learning_rate": 0.00014746557960960792, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022162911081675873, + "loss": 0.03, "step": 201560 }, { - "epoch": 1.02, - "learning_rate": 0.00014745801191659393, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022162522260038724, + "loss": 0.0166, "step": 201570 }, { - "epoch": 1.02, - "learning_rate": 0.0001474504442235799, - "loss": 0.0122, + "epoch": 0.52, + "learning_rate": 0.00022162133438401578, + "loss": 0.0193, "step": 201580 }, { - "epoch": 1.02, - "learning_rate": 0.0001474428765305659, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022161744616764432, + "loss": 0.0355, "step": 201590 }, { - "epoch": 1.02, - "learning_rate": 0.00014743530883755187, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022161355795127286, + "loss": 0.0154, "step": 201600 }, { - "epoch": 1.02, - "learning_rate": 0.00014742774114453788, - "loss": 0.0069, + "epoch": 0.52, + "learning_rate": 0.00022160966973490138, + "loss": 0.0166, "step": 201610 }, { - "epoch": 1.02, - "learning_rate": 0.00014742017345152386, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022160578151852992, + "loss": 0.0142, "step": 201620 }, { - "epoch": 1.02, - "learning_rate": 0.00014741260575850984, - "loss": 0.0137, + "epoch": 0.52, + "learning_rate": 0.00022160189330215846, + "loss": 0.0162, "step": 201630 }, { - "epoch": 1.02, - "learning_rate": 0.00014740503806549585, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.000221598005085787, + "loss": 0.0181, "step": 201640 }, { - "epoch": 1.02, - "learning_rate": 0.00014739747037248183, - "loss": 0.0082, + "epoch": 0.52, + "learning_rate": 0.00022159411686941552, + "loss": 0.0184, "step": 201650 }, { - "epoch": 1.02, - "learning_rate": 0.00014738990267946782, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022159022865304406, + "loss": 0.0197, "step": 201660 }, { - "epoch": 1.02, - "learning_rate": 0.00014738233498645382, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022158634043667263, + "loss": 0.0167, "step": 201670 }, { - "epoch": 1.02, - "learning_rate": 0.0001473747672934398, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.00022158245222030114, + "loss": 0.0184, "step": 201680 }, { - "epoch": 1.02, - "learning_rate": 0.0001473671996004258, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022157856400392966, + "loss": 0.018, "step": 201690 }, { - "epoch": 1.02, - "learning_rate": 0.0001473596319074118, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.0002215746757875582, + "loss": 0.0155, "step": 201700 }, { - "epoch": 1.02, - "learning_rate": 0.00014735206421439778, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.00022157078757118677, + "loss": 0.0171, "step": 201710 }, { - "epoch": 1.02, - "learning_rate": 0.00014734449652138376, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022156689935481528, + "loss": 0.0152, "step": 201720 }, { - "epoch": 1.02, - "learning_rate": 0.00014733692882836977, - "loss": 0.015, + "epoch": 0.52, + "learning_rate": 0.00022156301113844382, + "loss": 0.0196, "step": 201730 }, { - "epoch": 1.02, - "learning_rate": 0.00014732936113535575, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022155912292207234, + "loss": 0.0183, "step": 201740 }, { - "epoch": 1.02, - "learning_rate": 0.00014732179344234173, - "loss": 0.0091, + "epoch": 0.52, + "learning_rate": 0.00022155523470570088, + "loss": 0.0167, "step": 201750 }, { - "epoch": 1.02, - "learning_rate": 0.0001473142257493277, - "loss": 0.0131, + "epoch": 0.52, + "learning_rate": 0.00022155134648932942, + "loss": 0.0176, "step": 201760 }, { - "epoch": 1.02, - "learning_rate": 0.00014730665805631372, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022154745827295796, + "loss": 0.0151, "step": 201770 }, { - "epoch": 1.02, - "learning_rate": 0.0001472990903632997, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.00022154357005658648, + "loss": 0.0138, "step": 201780 }, { - "epoch": 1.02, - "learning_rate": 0.00014729152267028568, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022153968184021502, + "loss": 0.0168, "step": 201790 }, { - "epoch": 1.02, - "learning_rate": 0.0001472839549772717, - "loss": 0.0139, + "epoch": 0.52, + "learning_rate": 0.00022153579362384356, + "loss": 0.0159, "step": 201800 }, { - "epoch": 1.02, - "learning_rate": 0.00014727638728425767, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.0002215319054074721, + "loss": 0.0159, "step": 201810 }, { - "epoch": 1.02, - "learning_rate": 0.00014726881959124365, - "loss": 0.0109, + "epoch": 0.52, + "learning_rate": 0.00022152801719110062, + "loss": 0.0166, "step": 201820 }, { - "epoch": 1.02, - "learning_rate": 0.00014726125189822966, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022152412897472916, + "loss": 0.0177, "step": 201830 }, { - "epoch": 1.02, - "learning_rate": 0.00014725368420521564, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.0002215202407583577, + "loss": 0.0156, "step": 201840 }, { - "epoch": 1.02, - "learning_rate": 0.00014724611651220163, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022151635254198624, + "loss": 0.0202, "step": 201850 }, { - "epoch": 1.02, - "learning_rate": 0.00014723854881918763, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022151246432561476, + "loss": 0.0173, "step": 201860 }, { - "epoch": 1.02, - "learning_rate": 0.00014723098112617362, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.0002215085761092433, + "loss": 0.0174, "step": 201870 }, { - "epoch": 1.02, - "learning_rate": 0.0001472234134331596, - "loss": 0.012, + "epoch": 0.52, + "learning_rate": 0.00022150468789287187, + "loss": 0.0183, "step": 201880 }, { - "epoch": 1.02, - "learning_rate": 0.0001472158457401456, - "loss": 0.0085, + "epoch": 0.52, + "learning_rate": 0.00022150079967650038, + "loss": 0.0208, "step": 201890 }, { - "epoch": 1.02, - "learning_rate": 0.0001472082780471316, - "loss": 0.0081, + "epoch": 0.52, + "learning_rate": 0.00022149691146012892, + "loss": 0.0155, "step": 201900 }, { - "epoch": 1.02, - "learning_rate": 0.00014720071035411757, - "loss": 0.0077, + "epoch": 0.52, + "learning_rate": 0.00022149302324375744, + "loss": 0.0185, "step": 201910 }, { - "epoch": 1.02, - "learning_rate": 0.00014719314266110355, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.000221489135027386, + "loss": 0.0158, "step": 201920 }, { - "epoch": 1.02, - "learning_rate": 0.00014718557496808956, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.00022148524681101452, + "loss": 0.0185, "step": 201930 }, { - "epoch": 1.02, - "learning_rate": 0.00014717800727507554, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022148135859464306, + "loss": 0.0179, "step": 201940 }, { - "epoch": 1.02, - "learning_rate": 0.00014717043958206152, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022147747037827158, + "loss": 0.0138, "step": 201950 }, { - "epoch": 1.02, - "learning_rate": 0.00014716287188904753, - "loss": 0.0086, + "epoch": 0.52, + "learning_rate": 0.00022147358216190012, + "loss": 0.0157, "step": 201960 }, { - "epoch": 1.02, - "learning_rate": 0.0001471553041960335, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022146969394552866, + "loss": 0.0132, "step": 201970 }, { - "epoch": 1.02, - "learning_rate": 0.0001471477365030195, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.0002214658057291572, + "loss": 0.0147, "step": 201980 }, { - "epoch": 1.02, - "learning_rate": 0.0001471401688100055, - "loss": 0.008, + "epoch": 0.52, + "learning_rate": 0.00022146191751278572, + "loss": 0.0142, "step": 201990 }, { - "epoch": 1.02, - "learning_rate": 0.00014713260111699148, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022145802929641426, + "loss": 0.0185, "step": 202000 }, { - "epoch": 1.02, - "eval_cer": 0.9144954862024227, - "eval_loss": 0.007912137545645237, - "eval_runtime": 117.0882, - "eval_samples_per_second": 17.081, - "eval_steps_per_second": 4.27, + "epoch": 0.52, + "eval_cer": 0.8818104583670996, + "eval_loss": 0.011379092931747437, + "eval_runtime": 107.8594, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, "step": 202000 }, { - "epoch": 1.02, - "learning_rate": 0.00014712503342397746, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.0002214541410800428, + "loss": 0.0207, "step": 202010 }, { - "epoch": 1.02, - "learning_rate": 0.00014711746573096347, - "loss": 0.0106, + "epoch": 0.52, + "learning_rate": 0.00022145025286367134, + "loss": 0.015, "step": 202020 }, { - "epoch": 1.02, - "learning_rate": 0.00014710989803794945, - "loss": 0.0126, + "epoch": 0.52, + "learning_rate": 0.00022144636464729986, + "loss": 0.0144, "step": 202030 }, { - "epoch": 1.02, - "learning_rate": 0.00014710233034493544, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.0002214424764309284, + "loss": 0.0168, "step": 202040 }, { - "epoch": 1.02, - "learning_rate": 0.00014709476265192142, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022143858821455697, + "loss": 0.014, "step": 202050 }, { - "epoch": 1.02, - "learning_rate": 0.0001470871949589074, - "loss": 0.0086, + "epoch": 0.52, + "learning_rate": 0.00022143469999818548, + "loss": 0.0175, "step": 202060 }, { - "epoch": 1.02, - "learning_rate": 0.0001470796272658934, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022143081178181402, + "loss": 0.0181, "step": 202070 }, { - "epoch": 1.02, - "learning_rate": 0.0001470720595728794, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022142692356544254, + "loss": 0.0131, "step": 202080 }, { - "epoch": 1.02, - "learning_rate": 0.00014706449187986537, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.0002214230353490711, + "loss": 0.0222, "step": 202090 }, { - "epoch": 1.02, - "learning_rate": 0.00014705692418685138, - "loss": 0.0099, + "epoch": 0.52, + "learning_rate": 0.00022141914713269962, + "loss": 0.018, "step": 202100 }, { - "epoch": 1.02, - "learning_rate": 0.00014704935649383736, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022141525891632816, + "loss": 0.0162, "step": 202110 }, { - "epoch": 1.02, - "learning_rate": 0.00014704178880082334, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022141137069995668, + "loss": 0.0148, "step": 202120 }, { - "epoch": 1.02, - "learning_rate": 0.00014703422110780932, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.00022140748248358525, + "loss": 0.0136, "step": 202130 }, { - "epoch": 1.02, - "learning_rate": 0.00014702665341479533, - "loss": 0.0092, + "epoch": 0.52, + "learning_rate": 0.00022140359426721376, + "loss": 0.0191, "step": 202140 }, { - "epoch": 1.02, - "learning_rate": 0.0001470190857217813, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.0002213997060508423, + "loss": 0.0174, "step": 202150 }, { - "epoch": 1.02, - "learning_rate": 0.0001470115180287673, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022139581783447082, + "loss": 0.0158, "step": 202160 }, { - "epoch": 1.02, - "learning_rate": 0.0001470039503357533, - "loss": 0.0118, + "epoch": 0.52, + "learning_rate": 0.00022139192961809939, + "loss": 0.018, "step": 202170 }, { - "epoch": 1.02, - "learning_rate": 0.00014699638264273928, - "loss": 0.0094, + "epoch": 0.52, + "learning_rate": 0.0002213880414017279, + "loss": 0.0213, "step": 202180 }, { - "epoch": 1.02, - "learning_rate": 0.00014698881494972527, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022138415318535644, + "loss": 0.0162, "step": 202190 }, { - "epoch": 1.02, - "learning_rate": 0.00014698124725671127, - "loss": 0.0129, + "epoch": 0.52, + "learning_rate": 0.00022138026496898496, + "loss": 0.0227, "step": 202200 }, { - "epoch": 1.02, - "learning_rate": 0.00014697367956369726, - "loss": 0.0133, + "epoch": 0.52, + "learning_rate": 0.0002213763767526135, + "loss": 0.0216, "step": 202210 }, { - "epoch": 1.02, - "learning_rate": 0.00014696611187068324, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022137248853624207, + "loss": 0.0169, "step": 202220 }, { - "epoch": 1.02, - "learning_rate": 0.00014695854417766925, - "loss": 0.0078, + "epoch": 0.52, + "learning_rate": 0.00022136860031987058, + "loss": 0.0166, "step": 202230 }, { - "epoch": 1.02, - "learning_rate": 0.00014695097648465523, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002213647121034991, + "loss": 0.0232, "step": 202240 }, { - "epoch": 1.02, - "learning_rate": 0.0001469434087916412, - "loss": 0.0114, + "epoch": 0.52, + "learning_rate": 0.00022136082388712764, + "loss": 0.0207, "step": 202250 }, { - "epoch": 1.02, - "learning_rate": 0.00014693584109862722, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.0002213569356707562, + "loss": 0.0146, "step": 202260 }, { - "epoch": 1.02, - "learning_rate": 0.0001469282734056132, - "loss": 0.0074, + "epoch": 0.52, + "learning_rate": 0.00022135304745438472, + "loss": 0.0155, "step": 202270 }, { - "epoch": 1.02, - "learning_rate": 0.00014692070571259918, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022134915923801326, + "loss": 0.0162, "step": 202280 }, { - "epoch": 1.02, - "learning_rate": 0.00014691313801958516, - "loss": 0.0101, + "epoch": 0.52, + "learning_rate": 0.00022134527102164178, + "loss": 0.0177, "step": 202290 }, { - "epoch": 1.02, - "learning_rate": 0.00014690557032657117, - "loss": 0.0098, + "epoch": 0.52, + "learning_rate": 0.00022134138280527035, + "loss": 0.0146, "step": 202300 }, { - "epoch": 1.02, - "learning_rate": 0.00014689800263355715, - "loss": 0.0111, + "epoch": 0.52, + "learning_rate": 0.00022133749458889886, + "loss": 0.0133, "step": 202310 }, { - "epoch": 1.02, - "learning_rate": 0.00014689043494054313, - "loss": 0.0127, + "epoch": 0.52, + "learning_rate": 0.0002213336063725274, + "loss": 0.015, "step": 202320 }, { - "epoch": 1.02, - "learning_rate": 0.00014688286724752914, - "loss": 0.0075, + "epoch": 0.52, + "learning_rate": 0.00022132971815615592, + "loss": 0.0186, "step": 202330 }, { - "epoch": 1.02, - "learning_rate": 0.00014687529955451512, - "loss": 0.0084, + "epoch": 0.52, + "learning_rate": 0.00022132582993978449, + "loss": 0.0219, "step": 202340 }, { - "epoch": 1.02, - "learning_rate": 0.0001468677318615011, - "loss": 0.0105, + "epoch": 0.52, + "learning_rate": 0.000221321941723413, + "loss": 0.0171, "step": 202350 }, { - "epoch": 1.02, - "learning_rate": 0.0001468601641684871, - "loss": 0.0088, + "epoch": 0.52, + "learning_rate": 0.00022131805350704154, + "loss": 0.0205, "step": 202360 }, { - "epoch": 1.02, - "learning_rate": 0.0001468525964754731, - "loss": 0.0096, + "epoch": 0.52, + "learning_rate": 0.00022131416529067006, + "loss": 0.0154, "step": 202370 }, { - "epoch": 1.02, - "learning_rate": 0.00014684502878245908, - "loss": 0.0097, + "epoch": 0.52, + "learning_rate": 0.00022131027707429862, + "loss": 0.0182, "step": 202380 }, { - "epoch": 1.02, - "learning_rate": 0.00014683746108944508, - "loss": 0.0119, + "epoch": 0.52, + "learning_rate": 0.00022130638885792714, + "loss": 0.017, "step": 202390 }, { - "epoch": 1.02, - "learning_rate": 0.00014682989339643107, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022130250064155568, + "loss": 0.0166, "step": 202400 }, { - "epoch": 1.02, - "learning_rate": 0.00014682232570341705, - "loss": 0.0113, + "epoch": 0.52, + "learning_rate": 0.0002212986124251842, + "loss": 0.0176, "step": 202410 }, { - "epoch": 1.02, - "learning_rate": 0.00014681475801040306, - "loss": 0.0093, + "epoch": 0.52, + "learning_rate": 0.00022129472420881276, + "loss": 0.0218, "step": 202420 }, { - "epoch": 1.02, - "learning_rate": 0.00014680719031738904, - "loss": 0.0107, + "epoch": 0.52, + "learning_rate": 0.0002212908359924413, + "loss": 0.0218, "step": 202430 }, { - "epoch": 1.02, - "learning_rate": 0.00014679962262437502, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.00022128694777606982, + "loss": 0.0193, "step": 202440 }, { - "epoch": 1.02, - "learning_rate": 0.000146792054931361, - "loss": 0.0079, + "epoch": 0.52, + "learning_rate": 0.00022128305955969836, + "loss": 0.0202, "step": 202450 }, { - "epoch": 1.02, - "learning_rate": 0.000146784487238347, - "loss": 0.0108, + "epoch": 0.52, + "learning_rate": 0.00022127917134332688, + "loss": 0.0216, "step": 202460 }, { - "epoch": 1.02, - "learning_rate": 0.000146776919545333, - "loss": 0.011, + "epoch": 0.52, + "learning_rate": 0.00022127528312695545, + "loss": 0.0183, "step": 202470 }, { - "epoch": 1.02, - "learning_rate": 0.00014676935185231897, - "loss": 0.0095, + "epoch": 0.52, + "learning_rate": 0.00022127139491058396, + "loss": 0.0132, "step": 202480 }, { - "epoch": 1.02, - "learning_rate": 0.00014676178415930498, - "loss": 0.0083, + "epoch": 0.52, + "learning_rate": 0.0002212675066942125, + "loss": 0.0229, "step": 202490 }, { - "epoch": 1.02, - "learning_rate": 0.00014675421646629096, - "loss": 0.0087, + "epoch": 0.52, + "learning_rate": 0.00022126361847784102, + "loss": 0.0224, "step": 202500 }, { - "epoch": 1.02, - "learning_rate": 0.00014674664877327694, - "loss": 0.009, + "epoch": 0.52, + "learning_rate": 0.00022125973026146958, + "loss": 0.0206, "step": 202510 }, { - "epoch": 1.02, - "learning_rate": 0.00014673908108026295, - "loss": 0.0089, + "epoch": 0.52, + "learning_rate": 0.0002212558420450981, + "loss": 0.0163, "step": 202520 }, { - "epoch": 1.02, - "learning_rate": 0.00014673151338724893, - "loss": 0.0103, + "epoch": 0.52, + "learning_rate": 0.00022125195382872664, + "loss": 0.0214, "step": 202530 }, { - "epoch": 1.02, - "learning_rate": 0.00014672394569423491, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022124806561235516, + "loss": 0.0169, "step": 202540 }, { - "epoch": 1.02, - "learning_rate": 0.00014671637800122092, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.00022124417739598372, + "loss": 0.019, "step": 202550 }, { - "epoch": 1.02, - "learning_rate": 0.0001467088103082069, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.00022124028917961224, + "loss": 0.0175, "step": 202560 }, { - "epoch": 1.02, - "learning_rate": 0.00014670124261519289, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022123640096324078, + "loss": 0.0176, "step": 202570 }, { - "epoch": 1.02, - "learning_rate": 0.0001466936749221789, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.0002212325127468693, + "loss": 0.0225, "step": 202580 }, { - "epoch": 1.02, - "learning_rate": 0.00014668610722916488, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.00022122862453049786, + "loss": 0.0151, "step": 202590 }, { - "epoch": 1.02, - "learning_rate": 0.00014667853953615086, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.0002212247363141264, + "loss": 0.0151, "step": 202600 }, { - "epoch": 1.02, - "learning_rate": 0.00014667097184313687, - "loss": 0.0124, + "epoch": 0.53, + "learning_rate": 0.00022122084809775492, + "loss": 0.0197, "step": 202610 }, { - "epoch": 1.02, - "learning_rate": 0.00014666340415012285, - "loss": 0.0125, + "epoch": 0.53, + "learning_rate": 0.00022121695988138346, + "loss": 0.0174, "step": 202620 }, { - "epoch": 1.02, - "learning_rate": 0.00014665583645710883, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.000221213071665012, + "loss": 0.0175, "step": 202630 }, { - "epoch": 1.02, - "learning_rate": 0.0001466482687640948, - "loss": 0.0127, + "epoch": 0.53, + "learning_rate": 0.00022120918344864054, + "loss": 0.0161, "step": 202640 }, { - "epoch": 1.02, - "learning_rate": 0.00014664070107108082, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022120529523226906, + "loss": 0.0157, "step": 202650 }, { - "epoch": 1.02, - "learning_rate": 0.0001466331333780668, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.0002212014070158976, + "loss": 0.0161, "step": 202660 }, { - "epoch": 1.02, - "learning_rate": 0.00014662556568505278, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022119751879952614, + "loss": 0.019, "step": 202670 }, { - "epoch": 1.02, - "learning_rate": 0.00014661799799203876, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022119363058315468, + "loss": 0.0176, "step": 202680 }, { - "epoch": 1.02, - "learning_rate": 0.00014661043029902474, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.0002211897423667832, + "loss": 0.0193, "step": 202690 }, { - "epoch": 1.02, - "learning_rate": 0.00014660286260601075, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00022118585415041174, + "loss": 0.0152, "step": 202700 }, { - "epoch": 1.02, - "learning_rate": 0.00014659529491299673, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022118196593404025, + "loss": 0.0177, "step": 202710 }, { - "epoch": 1.02, - "learning_rate": 0.00014658772721998272, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00022117807771766882, + "loss": 0.0188, "step": 202720 }, { - "epoch": 1.02, - "learning_rate": 0.00014658015952696872, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022117418950129734, + "loss": 0.0173, "step": 202730 }, { - "epoch": 1.02, - "learning_rate": 0.0001465725918339547, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.00022117030128492588, + "loss": 0.0166, "step": 202740 }, { - "epoch": 1.02, - "learning_rate": 0.0001465650241409407, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.0002211664130685544, + "loss": 0.0151, "step": 202750 }, { - "epoch": 1.02, - "learning_rate": 0.0001465574564479267, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022116252485218296, + "loss": 0.0185, "step": 202760 }, { - "epoch": 1.02, - "learning_rate": 0.00014654988875491268, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.0002211586366358115, + "loss": 0.0134, "step": 202770 }, { - "epoch": 1.02, - "learning_rate": 0.00014654232106189866, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022115474841944002, + "loss": 0.0177, "step": 202780 }, { - "epoch": 1.02, - "learning_rate": 0.00014653475336888467, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022115086020306856, + "loss": 0.0134, "step": 202790 }, { - "epoch": 1.02, - "learning_rate": 0.00014652718567587065, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002211469719866971, + "loss": 0.0159, "step": 202800 }, { - "epoch": 1.02, - "learning_rate": 0.00014651961798285663, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022114308377032564, + "loss": 0.0213, "step": 202810 }, { - "epoch": 1.02, - "learning_rate": 0.0001465120502898426, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022113919555395416, + "loss": 0.0207, "step": 202820 }, { - "epoch": 1.02, - "learning_rate": 0.00014650448259682862, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002211353073375827, + "loss": 0.0201, "step": 202830 }, { - "epoch": 1.02, - "learning_rate": 0.0001464969149038146, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.00022113141912121124, + "loss": 0.0167, "step": 202840 }, { - "epoch": 1.02, - "learning_rate": 0.00014648934721080058, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022112753090483978, + "loss": 0.0165, "step": 202850 }, { - "epoch": 1.02, - "learning_rate": 0.0001464817795177866, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002211236426884683, + "loss": 0.0191, "step": 202860 }, { - "epoch": 1.02, - "learning_rate": 0.00014647421182477257, - "loss": 0.0074, + "epoch": 0.53, + "learning_rate": 0.00022111975447209684, + "loss": 0.0185, "step": 202870 }, { - "epoch": 1.02, - "learning_rate": 0.00014646664413175856, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022111586625572538, + "loss": 0.0191, "step": 202880 }, { - "epoch": 1.02, - "learning_rate": 0.00014645907643874456, - "loss": 0.0068, + "epoch": 0.53, + "learning_rate": 0.00022111197803935392, + "loss": 0.0241, "step": 202890 }, { - "epoch": 1.02, - "learning_rate": 0.00014645150874573055, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022110808982298244, + "loss": 0.0172, "step": 202900 }, { - "epoch": 1.02, - "learning_rate": 0.00014644394105271653, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.00022110420160661098, + "loss": 0.0184, "step": 202910 }, { - "epoch": 1.02, - "learning_rate": 0.00014643637335970254, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022110031339023955, + "loss": 0.0182, "step": 202920 }, { - "epoch": 1.02, - "learning_rate": 0.00014642880566668852, - "loss": 0.0073, + "epoch": 0.53, + "learning_rate": 0.00022109642517386806, + "loss": 0.0161, "step": 202930 }, { - "epoch": 1.02, - "learning_rate": 0.0001464212379736745, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.0002210925369574966, + "loss": 0.0154, "step": 202940 }, { - "epoch": 1.02, - "learning_rate": 0.0001464136702806605, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.00022108864874112512, + "loss": 0.0136, "step": 202950 }, { - "epoch": 1.02, - "learning_rate": 0.0001464061025876465, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00022108476052475363, + "loss": 0.0157, "step": 202960 }, { - "epoch": 1.02, - "learning_rate": 0.00014639853489463247, - "loss": 0.0143, + "epoch": 0.53, + "learning_rate": 0.0002210808723083822, + "loss": 0.0189, "step": 202970 }, { - "epoch": 1.02, - "learning_rate": 0.00014639096720161845, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022107698409201074, + "loss": 0.0197, "step": 202980 }, { - "epoch": 1.02, - "learning_rate": 0.00014638339950860446, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022107309587563926, + "loss": 0.0154, "step": 202990 }, { - "epoch": 1.02, - "learning_rate": 0.00014637583181559044, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.0002210692076592678, + "loss": 0.0149, "step": 203000 }, { - "epoch": 1.02, - "eval_cer": 0.9144663743186606, - "eval_loss": 0.0076591866090893745, - "eval_runtime": 117.2192, - "eval_samples_per_second": 17.062, - "eval_steps_per_second": 4.266, + "epoch": 0.53, + "eval_cer": 0.8817866645392185, + "eval_loss": 0.011468823999166489, + "eval_runtime": 107.5391, + "eval_samples_per_second": 18.598, + "eval_steps_per_second": 4.649, "step": 203000 }, { - "epoch": 1.02, - "learning_rate": 0.00014636826412257642, - "loss": 0.0068, + "epoch": 0.53, + "learning_rate": 0.00022106531944289634, + "loss": 0.02, "step": 203010 }, { - "epoch": 1.02, - "learning_rate": 0.00014636069642956243, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.00022106143122652488, + "loss": 0.0127, "step": 203020 }, { - "epoch": 1.02, - "learning_rate": 0.0001463531287365484, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.0002210575430101534, + "loss": 0.019, "step": 203030 }, { - "epoch": 1.02, - "learning_rate": 0.0001463455610435344, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022105365479378194, + "loss": 0.0138, "step": 203040 }, { - "epoch": 1.02, - "learning_rate": 0.0001463379933505204, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022104976657741048, + "loss": 0.016, "step": 203050 }, { - "epoch": 1.02, - "learning_rate": 0.00014633042565750638, - "loss": 0.0069, + "epoch": 0.53, + "learning_rate": 0.00022104587836103902, + "loss": 0.0183, "step": 203060 }, { - "epoch": 1.02, - "learning_rate": 0.00014632285796449237, - "loss": 0.0126, + "epoch": 0.53, + "learning_rate": 0.00022104199014466754, + "loss": 0.0164, "step": 203070 }, { - "epoch": 1.02, - "learning_rate": 0.00014631529027147837, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022103810192829608, + "loss": 0.0179, "step": 203080 }, { - "epoch": 1.02, - "learning_rate": 0.00014630772257846436, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022103421371192465, + "loss": 0.0173, "step": 203090 }, { - "epoch": 1.02, - "learning_rate": 0.00014630015488545034, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022103032549555316, + "loss": 0.0193, "step": 203100 }, { - "epoch": 1.02, - "learning_rate": 0.00014629258719243635, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022102643727918168, + "loss": 0.0225, "step": 203110 }, { - "epoch": 1.02, - "learning_rate": 0.00014628501949942233, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00022102254906281022, + "loss": 0.0158, "step": 203120 }, { - "epoch": 1.02, - "learning_rate": 0.0001462774518064083, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.0002210186608464388, + "loss": 0.0169, "step": 203130 }, { - "epoch": 1.02, - "learning_rate": 0.00014626988411339432, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.0002210147726300673, + "loss": 0.0273, "step": 203140 }, { - "epoch": 1.02, - "learning_rate": 0.0001462623164203803, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022101088441369584, + "loss": 0.0196, "step": 203150 }, { - "epoch": 1.02, - "learning_rate": 0.00014625474872736628, - "loss": 0.0124, + "epoch": 0.53, + "learning_rate": 0.00022100699619732436, + "loss": 0.0126, "step": 203160 }, { - "epoch": 1.03, - "learning_rate": 0.00014624718103435226, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022100310798095293, + "loss": 0.0133, "step": 203170 }, { - "epoch": 1.03, - "learning_rate": 0.00014623961334133827, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.00022099921976458144, + "loss": 0.0187, "step": 203180 }, { - "epoch": 1.03, - "learning_rate": 0.00014623204564832425, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00022099533154820998, + "loss": 0.0183, "step": 203190 }, { - "epoch": 1.03, - "learning_rate": 0.00014622447795531023, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.0002209914433318385, + "loss": 0.0174, "step": 203200 }, { - "epoch": 1.03, - "learning_rate": 0.00014621691026229624, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022098755511546704, + "loss": 0.0171, "step": 203210 }, { - "epoch": 1.03, - "learning_rate": 0.00014620934256928222, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022098366689909558, + "loss": 0.0161, "step": 203220 }, { - "epoch": 1.03, - "learning_rate": 0.0001462017748762682, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022097977868272412, + "loss": 0.0141, "step": 203230 }, { - "epoch": 1.03, - "learning_rate": 0.0001461942071832542, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022097589046635264, + "loss": 0.0164, "step": 203240 }, { - "epoch": 1.03, - "learning_rate": 0.0001461866394902402, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022097200224998118, + "loss": 0.0217, "step": 203250 }, { - "epoch": 1.03, - "learning_rate": 0.00014617907179722618, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022096811403360975, + "loss": 0.0207, "step": 203260 }, { - "epoch": 1.03, - "learning_rate": 0.00014617150410421218, - "loss": 0.0121, + "epoch": 0.53, + "learning_rate": 0.00022096422581723826, + "loss": 0.0187, "step": 203270 }, { - "epoch": 1.03, - "learning_rate": 0.00014616393641119817, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022096033760086678, + "loss": 0.0193, "step": 203280 }, { - "epoch": 1.03, - "learning_rate": 0.00014615636871818415, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.00022095644938449532, + "loss": 0.0174, "step": 203290 }, { - "epoch": 1.03, - "learning_rate": 0.00014614880102517016, - "loss": 0.0086, - "step": 203300 + "epoch": 0.53, + "learning_rate": 0.00022095256116812389, + "loss": 0.0162, + "step": 203300 }, { - "epoch": 1.03, - "learning_rate": 0.0001461412333321561, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.0002209486729517524, + "loss": 0.014, "step": 203310 }, { - "epoch": 1.03, - "learning_rate": 0.00014613366563914212, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022094478473538094, + "loss": 0.014, "step": 203320 }, { - "epoch": 1.03, - "learning_rate": 0.0001461260979461281, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022094089651900946, + "loss": 0.0205, "step": 203330 }, { - "epoch": 1.03, - "learning_rate": 0.00014611853025311408, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022093700830263803, + "loss": 0.0188, "step": 203340 }, { - "epoch": 1.03, - "learning_rate": 0.00014611096256010006, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022093312008626654, + "loss": 0.0212, "step": 203350 }, { - "epoch": 1.03, - "learning_rate": 0.00014610339486708607, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022092923186989508, + "loss": 0.0195, "step": 203360 }, { - "epoch": 1.03, - "learning_rate": 0.00014609582717407205, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.0002209253436535236, + "loss": 0.0118, "step": 203370 }, { - "epoch": 1.03, - "learning_rate": 0.00014608825948105803, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022092145543715217, + "loss": 0.0157, "step": 203380 }, { - "epoch": 1.03, - "learning_rate": 0.00014608069178804404, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022091756722078068, + "loss": 0.0169, "step": 203390 }, { - "epoch": 1.03, - "learning_rate": 0.00014607312409503002, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022091367900440922, + "loss": 0.0154, "step": 203400 }, { - "epoch": 1.03, - "learning_rate": 0.000146065556402016, - "loss": 0.0063, + "epoch": 0.53, + "learning_rate": 0.00022090979078803774, + "loss": 0.0164, "step": 203410 }, { - "epoch": 1.03, - "learning_rate": 0.00014605798870900201, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.0002209059025716663, + "loss": 0.0164, "step": 203420 }, { - "epoch": 1.03, - "learning_rate": 0.000146050421015988, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022090201435529482, + "loss": 0.0243, "step": 203430 }, { - "epoch": 1.03, - "learning_rate": 0.00014604285332297398, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022089812613892336, + "loss": 0.0247, "step": 203440 }, { - "epoch": 1.03, - "learning_rate": 0.00014603528562995999, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022089423792255188, + "loss": 0.022, "step": 203450 }, { - "epoch": 1.03, - "learning_rate": 0.00014602771793694597, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022089034970618042, + "loss": 0.0153, "step": 203460 }, { - "epoch": 1.03, - "learning_rate": 0.00014602015024393195, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022088646148980899, + "loss": 0.0162, "step": 203470 }, { - "epoch": 1.03, - "learning_rate": 0.00014601258255091796, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.0002208825732734375, + "loss": 0.022, "step": 203480 }, { - "epoch": 1.03, - "learning_rate": 0.00014600501485790394, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022087868505706604, + "loss": 0.0156, "step": 203490 }, { - "epoch": 1.03, - "learning_rate": 0.00014599744716488992, - "loss": 0.0069, + "epoch": 0.53, + "learning_rate": 0.00022087479684069456, + "loss": 0.0227, "step": 203500 }, { - "epoch": 1.03, - "learning_rate": 0.00014598987947187593, - "loss": 0.0118, + "epoch": 0.53, + "learning_rate": 0.00022087090862432313, + "loss": 0.0156, "step": 203510 }, { - "epoch": 1.03, - "learning_rate": 0.0001459823117788619, - "loss": 0.0086, + "epoch": 0.53, + "learning_rate": 0.00022086702040795164, + "loss": 0.0137, "step": 203520 }, { - "epoch": 1.03, - "learning_rate": 0.0001459747440858479, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022086313219158018, + "loss": 0.0186, "step": 203530 }, { - "epoch": 1.03, - "learning_rate": 0.00014596717639283387, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002208592439752087, + "loss": 0.0172, "step": 203540 }, { - "epoch": 1.03, - "learning_rate": 0.00014595960869981988, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022085535575883726, + "loss": 0.0187, "step": 203550 }, { - "epoch": 1.03, - "learning_rate": 0.00014595204100680586, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00022085146754246578, + "loss": 0.0182, "step": 203560 }, { - "epoch": 1.03, - "learning_rate": 0.00014594447331379184, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022084757932609432, + "loss": 0.0176, "step": 203570 }, { - "epoch": 1.03, - "learning_rate": 0.00014593690562077785, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022084369110972284, + "loss": 0.0183, "step": 203580 }, { - "epoch": 1.03, - "learning_rate": 0.00014592933792776383, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.0002208398028933514, + "loss": 0.0145, "step": 203590 }, { - "epoch": 1.03, - "learning_rate": 0.00014592177023474982, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022083591467697992, + "loss": 0.0226, "step": 203600 }, { - "epoch": 1.03, - "learning_rate": 0.00014591420254173582, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022083202646060846, + "loss": 0.0149, "step": 203610 }, { - "epoch": 1.03, - "learning_rate": 0.0001459066348487218, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00022082813824423697, + "loss": 0.013, "step": 203620 }, { - "epoch": 1.03, - "learning_rate": 0.0001458990671557078, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022082425002786554, + "loss": 0.0212, "step": 203630 }, { - "epoch": 1.03, - "learning_rate": 0.0001458914994626938, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022082036181149408, + "loss": 0.0159, "step": 203640 }, { - "epoch": 1.03, - "learning_rate": 0.00014588393176967978, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.0002208164735951226, + "loss": 0.016, "step": 203650 }, { - "epoch": 1.03, - "learning_rate": 0.00014587636407666576, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022081258537875114, + "loss": 0.0151, "step": 203660 }, { - "epoch": 1.03, - "learning_rate": 0.00014586879638365177, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022080869716237968, + "loss": 0.0171, "step": 203670 }, { - "epoch": 1.03, - "learning_rate": 0.00014586122869063775, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022080480894600822, + "loss": 0.0134, "step": 203680 }, { - "epoch": 1.03, - "learning_rate": 0.00014585366099762373, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.00022080092072963674, + "loss": 0.017, "step": 203690 }, { - "epoch": 1.03, - "learning_rate": 0.0001458460933046097, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022079703251326528, + "loss": 0.0188, "step": 203700 }, { - "epoch": 1.03, - "learning_rate": 0.00014583852561159572, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.0002207931442968938, + "loss": 0.0191, "step": 203710 }, { - "epoch": 1.03, - "learning_rate": 0.0001458309579185817, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022078925608052236, + "loss": 0.0182, "step": 203720 }, { - "epoch": 1.03, - "learning_rate": 0.00014582339022556768, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022078536786415088, + "loss": 0.0128, "step": 203730 }, { - "epoch": 1.03, - "learning_rate": 0.0001458158225325537, - "loss": 0.0086, + "epoch": 0.53, + "learning_rate": 0.00022078147964777942, + "loss": 0.0155, "step": 203740 }, { - "epoch": 1.03, - "learning_rate": 0.00014580825483953967, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00022077759143140793, + "loss": 0.0169, "step": 203750 }, { - "epoch": 1.03, - "learning_rate": 0.00014580068714652565, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.0002207737032150365, + "loss": 0.0156, "step": 203760 }, { - "epoch": 1.03, - "learning_rate": 0.00014579311945351166, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022076981499866502, + "loss": 0.0172, "step": 203770 }, { - "epoch": 1.03, - "learning_rate": 0.00014578555176049764, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00022076592678229356, + "loss": 0.019, "step": 203780 }, { - "epoch": 1.03, - "learning_rate": 0.00014577798406748363, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022076203856592207, + "loss": 0.0208, "step": 203790 }, { - "epoch": 1.03, - "learning_rate": 0.00014577041637446963, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022075815034955064, + "loss": 0.0195, "step": 203800 }, { - "epoch": 1.03, - "learning_rate": 0.00014576284868145562, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00022075426213317918, + "loss": 0.0125, "step": 203810 }, { - "epoch": 1.03, - "learning_rate": 0.0001457552809884416, - "loss": 0.0124, + "epoch": 0.53, + "learning_rate": 0.0002207503739168077, + "loss": 0.0169, "step": 203820 }, { - "epoch": 1.03, - "learning_rate": 0.0001457477132954276, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.0002207464857004362, + "loss": 0.0156, "step": 203830 }, { - "epoch": 1.03, - "learning_rate": 0.0001457401456024136, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.00022074259748406478, + "loss": 0.016, "step": 203840 }, { - "epoch": 1.03, - "learning_rate": 0.00014573257790939957, - "loss": 0.0132, + "epoch": 0.53, + "learning_rate": 0.00022073870926769332, + "loss": 0.0174, "step": 203850 }, { - "epoch": 1.03, - "learning_rate": 0.00014572501021638555, - "loss": 0.0131, + "epoch": 0.53, + "learning_rate": 0.00022073482105132184, + "loss": 0.0182, "step": 203860 }, { - "epoch": 1.03, - "learning_rate": 0.00014571744252337156, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022073093283495038, + "loss": 0.0151, "step": 203870 }, { - "epoch": 1.03, - "learning_rate": 0.00014570987483035754, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022072704461857892, + "loss": 0.0167, "step": 203880 }, { - "epoch": 1.03, - "learning_rate": 0.00014570230713734352, - "loss": 0.0121, + "epoch": 0.53, + "learning_rate": 0.00022072315640220746, + "loss": 0.0153, "step": 203890 }, { - "epoch": 1.03, - "learning_rate": 0.00014569473944432953, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.00022071926818583598, + "loss": 0.0167, "step": 203900 }, { - "epoch": 1.03, - "learning_rate": 0.0001456871717513155, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022071537996946452, + "loss": 0.0152, "step": 203910 }, { - "epoch": 1.03, - "learning_rate": 0.0001456796040583015, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00022071149175309306, + "loss": 0.0166, "step": 203920 }, { - "epoch": 1.03, - "learning_rate": 0.00014567203636528747, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.0002207076035367216, + "loss": 0.0173, "step": 203930 }, { - "epoch": 1.03, - "learning_rate": 0.00014566446867227346, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022070371532035012, + "loss": 0.0204, "step": 203940 }, { - "epoch": 1.03, - "learning_rate": 0.00014565690097925946, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022069982710397866, + "loss": 0.0142, "step": 203950 }, { - "epoch": 1.03, - "learning_rate": 0.00014564933328624545, - "loss": 0.0073, + "epoch": 0.53, + "learning_rate": 0.00022069593888760717, + "loss": 0.0164, "step": 203960 }, { - "epoch": 1.03, - "learning_rate": 0.00014564176559323143, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022069205067123574, + "loss": 0.0158, "step": 203970 }, { - "epoch": 1.03, - "learning_rate": 0.00014563419790021744, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022068816245486426, + "loss": 0.017, "step": 203980 }, { - "epoch": 1.03, - "learning_rate": 0.00014562663020720342, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002206842742384928, + "loss": 0.0134, "step": 203990 }, { - "epoch": 1.03, - "learning_rate": 0.0001456190625141894, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.0002206803860221213, + "loss": 0.0158, "step": 204000 }, { - "epoch": 1.03, - "eval_cer": 0.9144741374876638, - "eval_loss": 0.007685788441449404, - "eval_runtime": 116.7131, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.53, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.01144192460924387, + "eval_runtime": 107.6151, + "eval_samples_per_second": 18.585, + "eval_steps_per_second": 4.646, "step": 204000 }, { - "epoch": 1.03, - "learning_rate": 0.0001456114948211754, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022067649780574988, + "loss": 0.0132, "step": 204010 }, { - "epoch": 1.03, - "learning_rate": 0.0001456039271281614, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00022067260958937842, + "loss": 0.0235, "step": 204020 }, { - "epoch": 1.03, - "learning_rate": 0.00014559635943514737, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.00022066872137300694, + "loss": 0.022, "step": 204030 }, { - "epoch": 1.03, - "learning_rate": 0.00014558879174213338, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022066483315663548, + "loss": 0.0167, "step": 204040 }, { - "epoch": 1.03, - "learning_rate": 0.00014558122404911936, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022066094494026402, + "loss": 0.016, "step": 204050 }, { - "epoch": 1.03, - "learning_rate": 0.00014557365635610534, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022065705672389256, + "loss": 0.0141, "step": 204060 }, { - "epoch": 1.03, - "learning_rate": 0.00014556608866309132, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022065316850752108, + "loss": 0.0168, "step": 204070 }, { - "epoch": 1.03, - "learning_rate": 0.00014555852097007733, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022064928029114962, + "loss": 0.0184, "step": 204080 }, { - "epoch": 1.03, - "learning_rate": 0.0001455509532770633, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022064539207477816, + "loss": 0.0174, "step": 204090 }, { - "epoch": 1.03, - "learning_rate": 0.0001455433855840493, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.0002206415038584067, + "loss": 0.0167, "step": 204100 }, { - "epoch": 1.03, - "learning_rate": 0.0001455358178910353, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022063761564203522, + "loss": 0.0183, "step": 204110 }, { - "epoch": 1.03, - "learning_rate": 0.00014552825019802128, - "loss": 0.0133, + "epoch": 0.53, + "learning_rate": 0.00022063372742566376, + "loss": 0.017, "step": 204120 }, { - "epoch": 1.03, - "learning_rate": 0.00014552068250500727, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00022062983920929233, + "loss": 0.0145, "step": 204130 }, { - "epoch": 1.03, - "learning_rate": 0.00014551311481199327, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022062595099292084, + "loss": 0.0191, "step": 204140 }, { - "epoch": 1.03, - "learning_rate": 0.00014550554711897926, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022062206277654936, + "loss": 0.0284, "step": 204150 }, { - "epoch": 1.03, - "learning_rate": 0.00014549797942596524, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.0002206181745601779, + "loss": 0.0155, "step": 204160 }, { - "epoch": 1.03, - "learning_rate": 0.00014549041173295125, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022061428634380647, + "loss": 0.0172, "step": 204170 }, { - "epoch": 1.03, - "learning_rate": 0.00014548284403993723, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022061039812743498, + "loss": 0.0156, "step": 204180 }, { - "epoch": 1.03, - "learning_rate": 0.0001454752763469232, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022060650991106352, + "loss": 0.018, "step": 204190 }, { - "epoch": 1.03, - "learning_rate": 0.00014546770865390922, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022060262169469204, + "loss": 0.0153, "step": 204200 }, { - "epoch": 1.03, - "learning_rate": 0.0001454601409608952, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022059873347832058, + "loss": 0.0164, "step": 204210 }, { - "epoch": 1.03, - "learning_rate": 0.00014545257326788118, - "loss": 0.0134, + "epoch": 0.53, + "learning_rate": 0.00022059484526194912, + "loss": 0.0182, "step": 204220 }, { - "epoch": 1.03, - "learning_rate": 0.00014544500557486716, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00022059095704557766, + "loss": 0.0133, "step": 204230 }, { - "epoch": 1.03, - "learning_rate": 0.00014543743788185317, - "loss": 0.0145, + "epoch": 0.53, + "learning_rate": 0.00022058706882920618, + "loss": 0.0154, "step": 204240 }, { - "epoch": 1.03, - "learning_rate": 0.00014542987018883915, - "loss": 0.0131, + "epoch": 0.53, + "learning_rate": 0.00022058318061283472, + "loss": 0.0161, "step": 204250 }, { - "epoch": 1.03, - "learning_rate": 0.00014542230249582513, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022057929239646326, + "loss": 0.0173, "step": 204260 }, { - "epoch": 1.03, - "learning_rate": 0.00014541473480281114, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.0002205754041800918, + "loss": 0.0166, "step": 204270 }, { - "epoch": 1.03, - "learning_rate": 0.00014540716710979712, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022057151596372032, + "loss": 0.0169, "step": 204280 }, { - "epoch": 1.03, - "learning_rate": 0.0001453995994167831, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022056762774734886, + "loss": 0.0153, "step": 204290 }, { - "epoch": 1.03, - "learning_rate": 0.0001453920317237691, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.0002205637395309774, + "loss": 0.0161, "step": 204300 }, { - "epoch": 1.03, - "learning_rate": 0.0001453844640307551, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022055985131460594, + "loss": 0.0208, "step": 204310 }, { - "epoch": 1.03, - "learning_rate": 0.00014537689633774108, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00022055596309823446, + "loss": 0.0164, "step": 204320 }, { - "epoch": 1.03, - "learning_rate": 0.00014536932864472708, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.000220552074881863, + "loss": 0.0197, "step": 204330 }, { - "epoch": 1.03, - "learning_rate": 0.00014536176095171307, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022054818666549157, + "loss": 0.0141, "step": 204340 }, { - "epoch": 1.03, - "learning_rate": 0.00014535419325869905, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022054429844912008, + "loss": 0.0166, "step": 204350 }, { - "epoch": 1.03, - "learning_rate": 0.00014534662556568506, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00022054041023274862, + "loss": 0.0168, "step": 204360 }, { - "epoch": 1.03, - "learning_rate": 0.00014533905787267104, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.00022053652201637714, + "loss": 0.0143, "step": 204370 }, { - "epoch": 1.03, - "learning_rate": 0.00014533149017965702, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.0002205326338000057, + "loss": 0.0196, "step": 204380 }, { - "epoch": 1.03, - "learning_rate": 0.000145323922486643, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022052874558363422, + "loss": 0.0134, "step": 204390 }, { - "epoch": 1.03, - "learning_rate": 0.000145316354793629, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022052485736726276, + "loss": 0.0143, "step": 204400 }, { - "epoch": 1.03, - "learning_rate": 0.000145308787100615, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.00022052096915089128, + "loss": 0.0163, "step": 204410 }, { - "epoch": 1.03, - "learning_rate": 0.00014530121940760097, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022051708093451984, + "loss": 0.0184, "step": 204420 }, { - "epoch": 1.03, - "learning_rate": 0.00014529365171458698, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00022051319271814836, + "loss": 0.0153, "step": 204430 }, { - "epoch": 1.03, - "learning_rate": 0.00014528608402157296, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.0002205093045017769, + "loss": 0.0186, "step": 204440 }, { - "epoch": 1.03, - "learning_rate": 0.00014527851632855894, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00022050541628540542, + "loss": 0.0147, "step": 204450 }, { - "epoch": 1.03, - "learning_rate": 0.00014527094863554495, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022050152806903396, + "loss": 0.0153, "step": 204460 }, { - "epoch": 1.03, - "learning_rate": 0.00014526338094253093, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.0002204976398526625, + "loss": 0.0219, "step": 204470 }, { - "epoch": 1.03, - "learning_rate": 0.00014525581324951691, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00022049375163629104, + "loss": 0.0161, "step": 204480 }, { - "epoch": 1.03, - "learning_rate": 0.00014524824555650292, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022048986341991955, + "loss": 0.0153, "step": 204490 }, { - "epoch": 1.03, - "learning_rate": 0.0001452406778634889, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002204859752035481, + "loss": 0.0218, "step": 204500 }, { - "epoch": 1.03, - "learning_rate": 0.00014523311017047489, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00022048208698717667, + "loss": 0.0184, "step": 204510 }, { - "epoch": 1.03, - "learning_rate": 0.0001452255424774609, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022047819877080518, + "loss": 0.0219, "step": 204520 }, { - "epoch": 1.03, - "learning_rate": 0.00014521797478444688, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022047431055443372, + "loss": 0.0202, "step": 204530 }, { - "epoch": 1.03, - "learning_rate": 0.00014521040709143286, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022047042233806224, + "loss": 0.0232, "step": 204540 }, { - "epoch": 1.03, - "learning_rate": 0.00014520283939841887, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.0002204665341216908, + "loss": 0.0133, "step": 204550 }, { - "epoch": 1.03, - "learning_rate": 0.00014519527170540482, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022046264590531932, + "loss": 0.015, "step": 204560 }, { - "epoch": 1.03, - "learning_rate": 0.00014518770401239083, - "loss": 0.0155, + "epoch": 0.53, + "learning_rate": 0.00022045875768894786, + "loss": 0.0151, "step": 204570 }, { - "epoch": 1.03, - "learning_rate": 0.0001451801363193768, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022045486947257638, + "loss": 0.0198, "step": 204580 }, { - "epoch": 1.03, - "learning_rate": 0.0001451725686263628, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022045098125620494, + "loss": 0.0172, "step": 204590 }, { - "epoch": 1.03, - "learning_rate": 0.00014516500093334877, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00022044709303983346, + "loss": 0.0209, "step": 204600 }, { - "epoch": 1.03, - "learning_rate": 0.00014515743324033478, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.000220443204823462, + "loss": 0.0154, "step": 204610 }, { - "epoch": 1.03, - "learning_rate": 0.00014514986554732076, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.00022043931660709051, + "loss": 0.0209, "step": 204620 }, { - "epoch": 1.03, - "learning_rate": 0.00014514229785430674, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.00022043542839071908, + "loss": 0.0241, "step": 204630 }, { - "epoch": 1.03, - "learning_rate": 0.00014513473016129275, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.0002204315401743476, + "loss": 0.0161, "step": 204640 }, { - "epoch": 1.03, - "learning_rate": 0.00014512716246827873, - "loss": 0.013, + "epoch": 0.53, + "learning_rate": 0.00022042765195797614, + "loss": 0.0179, "step": 204650 }, { - "epoch": 1.03, - "learning_rate": 0.00014511959477526472, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022042376374160465, + "loss": 0.0167, "step": 204660 }, { - "epoch": 1.03, - "learning_rate": 0.00014511202708225072, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022041987552523322, + "loss": 0.0153, "step": 204670 }, { - "epoch": 1.03, - "learning_rate": 0.0001451044593892367, - "loss": 0.0136, + "epoch": 0.53, + "learning_rate": 0.00022041598730886176, + "loss": 0.0202, "step": 204680 }, { - "epoch": 1.03, - "learning_rate": 0.0001450968916962227, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022041209909249028, + "loss": 0.0149, "step": 204690 }, { - "epoch": 1.03, - "learning_rate": 0.0001450893240032087, - "loss": 0.0125, + "epoch": 0.53, + "learning_rate": 0.0002204082108761188, + "loss": 0.0164, "step": 204700 }, { - "epoch": 1.03, - "learning_rate": 0.00014508175631019468, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022040432265974734, + "loss": 0.0177, "step": 204710 }, { - "epoch": 1.03, - "learning_rate": 0.00014507418861718066, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.0002204004344433759, + "loss": 0.0155, "step": 204720 }, { - "epoch": 1.03, - "learning_rate": 0.00014506662092416667, - "loss": 0.0129, + "epoch": 0.53, + "learning_rate": 0.00022039654622700442, + "loss": 0.0176, "step": 204730 }, { - "epoch": 1.03, - "learning_rate": 0.00014505905323115265, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022039265801063296, + "loss": 0.014, "step": 204740 }, { - "epoch": 1.03, - "learning_rate": 0.00014505148553813863, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.00022038876979426147, + "loss": 0.0158, "step": 204750 }, { - "epoch": 1.03, - "learning_rate": 0.0001450439178451246, - "loss": 0.0156, + "epoch": 0.53, + "learning_rate": 0.00022038488157789004, + "loss": 0.0163, "step": 204760 }, { - "epoch": 1.03, - "learning_rate": 0.00014503635015211062, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00022038099336151856, + "loss": 0.0143, "step": 204770 }, { - "epoch": 1.03, - "learning_rate": 0.0001450287824590966, - "loss": 0.0073, + "epoch": 0.53, + "learning_rate": 0.0002203771051451471, + "loss": 0.0172, "step": 204780 }, { - "epoch": 1.03, - "learning_rate": 0.00014502121476608258, - "loss": 0.008, + "epoch": 0.53, + "learning_rate": 0.00022037321692877561, + "loss": 0.0167, "step": 204790 }, { - "epoch": 1.03, - "learning_rate": 0.0001450136470730686, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.00022036932871240418, + "loss": 0.0159, "step": 204800 }, { - "epoch": 1.03, - "learning_rate": 0.00014500607938005457, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.0002203654404960327, + "loss": 0.0177, "step": 204810 }, { - "epoch": 1.03, - "learning_rate": 0.00014499851168704055, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022036155227966124, + "loss": 0.0177, "step": 204820 }, { - "epoch": 1.03, - "learning_rate": 0.00014499094399402656, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022035766406328975, + "loss": 0.0193, "step": 204830 }, { - "epoch": 1.03, - "learning_rate": 0.00014498337630101254, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022035377584691832, + "loss": 0.0174, "step": 204840 }, { - "epoch": 1.03, - "learning_rate": 0.00014497580860799853, - "loss": 0.0086, + "epoch": 0.53, + "learning_rate": 0.00022034988763054686, + "loss": 0.0179, "step": 204850 }, { - "epoch": 1.03, - "learning_rate": 0.00014496824091498453, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.00022034599941417538, + "loss": 0.0165, "step": 204860 }, { - "epoch": 1.03, - "learning_rate": 0.00014496067322197052, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.0002203421111978039, + "loss": 0.0208, "step": 204870 }, { - "epoch": 1.03, - "learning_rate": 0.0001449531055289565, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00022033822298143246, + "loss": 0.0178, "step": 204880 }, { - "epoch": 1.03, - "learning_rate": 0.0001449455378359425, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.000220334334765061, + "loss": 0.0195, "step": 204890 }, { - "epoch": 1.03, - "learning_rate": 0.0001449379701429285, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00022033044654868952, + "loss": 0.0177, "step": 204900 }, { - "epoch": 1.03, - "learning_rate": 0.00014493040244991447, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00022032655833231806, + "loss": 0.0155, "step": 204910 }, { - "epoch": 1.03, - "learning_rate": 0.00014492283475690045, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.0002203226701159466, + "loss": 0.019, "step": 204920 }, { - "epoch": 1.03, - "learning_rate": 0.00014491526706388646, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022031878189957514, + "loss": 0.0114, "step": 204930 }, { - "epoch": 1.03, - "learning_rate": 0.00014490769937087244, - "loss": 0.0086, + "epoch": 0.53, + "learning_rate": 0.00022031489368320366, + "loss": 0.0178, "step": 204940 }, { - "epoch": 1.03, - "learning_rate": 0.00014490013167785842, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002203110054668322, + "loss": 0.0142, "step": 204950 }, { - "epoch": 1.03, - "learning_rate": 0.00014489256398484443, - "loss": 0.0114, + "epoch": 0.53, + "learning_rate": 0.00022030711725046071, + "loss": 0.0147, "step": 204960 }, { - "epoch": 1.03, - "learning_rate": 0.0001448849962918304, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022030322903408928, + "loss": 0.0167, "step": 204970 }, { - "epoch": 1.03, - "learning_rate": 0.0001448774285988164, - "loss": 0.0073, + "epoch": 0.53, + "learning_rate": 0.0002202993408177178, + "loss": 0.0163, "step": 204980 }, { - "epoch": 1.03, - "learning_rate": 0.0001448698609058024, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.00022029545260134634, + "loss": 0.016, "step": 204990 }, { - "epoch": 1.03, - "learning_rate": 0.00014486229321278838, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022029156438497485, + "loss": 0.021, "step": 205000 }, { - "epoch": 1.03, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.007726417388767004, - "eval_runtime": 116.6083, - "eval_samples_per_second": 17.151, - "eval_steps_per_second": 4.288, + "epoch": 0.53, + "eval_cer": 0.8817810659914818, + "eval_loss": 0.011213579215109348, + "eval_runtime": 107.384, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, "step": 205000 }, { - "epoch": 1.03, - "learning_rate": 0.00014485472551977436, - "loss": 0.0074, + "epoch": 0.53, + "learning_rate": 0.00022028767616860342, + "loss": 0.0162, "step": 205010 }, { - "epoch": 1.03, - "learning_rate": 0.00014484715782676037, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00022028378795223194, + "loss": 0.0163, "step": 205020 }, { - "epoch": 1.03, - "learning_rate": 0.00014483959013374635, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022027989973586048, + "loss": 0.018, "step": 205030 }, { - "epoch": 1.03, - "learning_rate": 0.00014483202244073234, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.000220276011519489, + "loss": 0.0197, "step": 205040 }, { - "epoch": 1.03, - "learning_rate": 0.00014482445474771834, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.00022027212330311756, + "loss": 0.0169, "step": 205050 }, { - "epoch": 1.03, - "learning_rate": 0.00014481688705470433, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.0002202682350867461, + "loss": 0.0147, "step": 205060 }, { - "epoch": 1.03, - "learning_rate": 0.0001448093193616903, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.00022026434687037462, + "loss": 0.014, "step": 205070 }, { - "epoch": 1.03, - "learning_rate": 0.00014480175166867632, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022026045865400316, + "loss": 0.0181, "step": 205080 }, { - "epoch": 1.03, - "learning_rate": 0.0001447941839756623, - "loss": 0.013, + "epoch": 0.53, + "learning_rate": 0.0002202565704376317, + "loss": 0.0184, "step": 205090 }, { - "epoch": 1.03, - "learning_rate": 0.00014478661628264828, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.00022025268222126024, + "loss": 0.0179, "step": 205100 }, { - "epoch": 1.03, - "learning_rate": 0.00014477904858963426, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022024879400488876, + "loss": 0.0103, "step": 205110 }, { - "epoch": 1.03, - "learning_rate": 0.00014477148089662027, - "loss": 0.0107, + "epoch": 0.53, + "learning_rate": 0.0002202449057885173, + "loss": 0.0176, "step": 205120 }, { - "epoch": 1.03, - "learning_rate": 0.00014476391320360625, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022024101757214584, + "loss": 0.0137, "step": 205130 }, { - "epoch": 1.03, - "learning_rate": 0.00014475634551059223, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.00022023712935577438, + "loss": 0.0173, "step": 205140 }, { - "epoch": 1.04, - "learning_rate": 0.00014474877781757824, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002202332411394029, + "loss": 0.0205, "step": 205150 }, { - "epoch": 1.04, - "learning_rate": 0.00014474121012456422, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.00022022935292303144, + "loss": 0.0159, "step": 205160 }, { - "epoch": 1.04, - "learning_rate": 0.0001447336424315502, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.00022022546470665998, + "loss": 0.0166, "step": 205170 }, { - "epoch": 1.04, - "learning_rate": 0.0001447260747385362, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.00022022157649028852, + "loss": 0.0155, "step": 205180 }, { - "epoch": 1.04, - "learning_rate": 0.00014471850704552217, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.00022021768827391704, + "loss": 0.0119, "step": 205190 }, { - "epoch": 1.04, - "learning_rate": 0.00014471093935250817, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.00022021380005754558, + "loss": 0.0137, "step": 205200 }, { - "epoch": 1.04, - "learning_rate": 0.00014470337165949416, - "loss": 0.0123, + "epoch": 0.53, + "learning_rate": 0.0002202099118411741, + "loss": 0.0188, "step": 205210 }, { - "epoch": 1.04, - "learning_rate": 0.00014469580396648014, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00022020602362480266, + "loss": 0.0164, "step": 205220 }, { - "epoch": 1.04, - "learning_rate": 0.00014468823627346615, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.0002202021354084312, + "loss": 0.0205, "step": 205230 }, { - "epoch": 1.04, - "learning_rate": 0.00014468066858045213, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00022019824719205972, + "loss": 0.0222, "step": 205240 }, { - "epoch": 1.04, - "learning_rate": 0.0001446731008874381, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022019435897568826, + "loss": 0.0308, "step": 205250 }, { - "epoch": 1.04, - "learning_rate": 0.00014466553319442412, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.0002201904707593168, + "loss": 0.0202, "step": 205260 }, { - "epoch": 1.04, - "learning_rate": 0.0001446579655014101, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022018658254294534, + "loss": 0.017, "step": 205270 }, { - "epoch": 1.04, - "learning_rate": 0.00014465039780839608, - "loss": 0.0119, + "epoch": 0.53, + "learning_rate": 0.00022018269432657386, + "loss": 0.0187, "step": 205280 }, { - "epoch": 1.04, - "learning_rate": 0.00014464283011538206, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.0002201788061102024, + "loss": 0.0216, "step": 205290 }, { - "epoch": 1.04, - "learning_rate": 0.00014463526242236807, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00022017491789383094, + "loss": 0.0177, "step": 205300 }, { - "epoch": 1.04, - "learning_rate": 0.00014462769472935405, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00022017102967745948, + "loss": 0.0161, "step": 205310 }, { - "epoch": 1.04, - "learning_rate": 0.00014462012703634003, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.000220167141461088, + "loss": 0.0183, "step": 205320 }, { - "epoch": 1.04, - "learning_rate": 0.00014461255934332604, - "loss": 0.009, + "epoch": 0.53, + "learning_rate": 0.00022016325324471654, + "loss": 0.0183, "step": 205330 }, { - "epoch": 1.04, - "learning_rate": 0.00014460499165031202, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022015936502834508, + "loss": 0.0177, "step": 205340 }, { - "epoch": 1.04, - "learning_rate": 0.000144597423957298, - "loss": 0.0134, + "epoch": 0.53, + "learning_rate": 0.00022015547681197362, + "loss": 0.0194, "step": 205350 }, { - "epoch": 1.04, - "learning_rate": 0.000144589856264284, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.00022015158859560214, + "loss": 0.0169, "step": 205360 }, { - "epoch": 1.04, - "learning_rate": 0.00014458228857127, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00022014770037923068, + "loss": 0.0159, "step": 205370 }, { - "epoch": 1.04, - "learning_rate": 0.00014457472087825598, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022014381216285925, + "loss": 0.0188, "step": 205380 }, { - "epoch": 1.04, - "learning_rate": 0.00014456715318524198, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00022013992394648776, + "loss": 0.0188, "step": 205390 }, { - "epoch": 1.04, - "learning_rate": 0.00014455958549222797, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.0002201360357301163, + "loss": 0.0172, "step": 205400 }, { - "epoch": 1.04, - "learning_rate": 0.00014455201779921395, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00022013214751374482, + "loss": 0.0186, "step": 205410 }, { - "epoch": 1.04, - "learning_rate": 0.00014454445010619996, - "loss": 0.0136, + "epoch": 0.53, + "learning_rate": 0.00022012825929737339, + "loss": 0.0195, "step": 205420 }, { - "epoch": 1.04, - "learning_rate": 0.00014453688241318594, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.0002201243710810019, + "loss": 0.025, "step": 205430 }, { - "epoch": 1.04, - "learning_rate": 0.00014452931472017192, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00022012048286463044, + "loss": 0.0184, "step": 205440 }, { - "epoch": 1.04, - "learning_rate": 0.00014452174702715793, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022011659464825896, + "loss": 0.0203, "step": 205450 }, { - "epoch": 1.04, - "learning_rate": 0.0001445141793341439, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.0002201127064318875, + "loss": 0.0212, "step": 205460 }, { - "epoch": 1.04, - "learning_rate": 0.0001445066116411299, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00022010881821551604, + "loss": 0.0222, "step": 205470 }, { - "epoch": 1.04, - "learning_rate": 0.00014449904394811587, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00022010492999914458, + "loss": 0.0172, "step": 205480 }, { - "epoch": 1.04, - "learning_rate": 0.00014449147625510188, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.0002201010417827731, + "loss": 0.0152, "step": 205490 }, { - "epoch": 1.04, - "learning_rate": 0.00014448390856208786, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022009715356640164, + "loss": 0.0187, "step": 205500 }, { - "epoch": 1.04, - "learning_rate": 0.00014447634086907384, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.00022009326535003018, + "loss": 0.0189, "step": 205510 }, { - "epoch": 1.04, - "learning_rate": 0.00014446877317605985, - "loss": 0.0077, + "epoch": 0.53, + "learning_rate": 0.00022008937713365872, + "loss": 0.0175, "step": 205520 }, { - "epoch": 1.04, - "learning_rate": 0.00014446120548304583, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022008548891728723, + "loss": 0.0198, "step": 205530 }, { - "epoch": 1.04, - "learning_rate": 0.00014445363779003181, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00022008160070091578, + "loss": 0.02, "step": 205540 }, { - "epoch": 1.04, - "learning_rate": 0.00014444607009701782, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00022007771248454435, + "loss": 0.0192, "step": 205550 }, { - "epoch": 1.04, - "learning_rate": 0.0001444385024040038, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.00022007382426817286, + "loss": 0.0197, "step": 205560 }, { - "epoch": 1.04, - "learning_rate": 0.00014443093471098979, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022006993605180137, + "loss": 0.0194, "step": 205570 }, { - "epoch": 1.04, - "learning_rate": 0.0001444233670179758, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00022006604783542992, + "loss": 0.0173, "step": 205580 }, { - "epoch": 1.04, - "learning_rate": 0.00014441579932496178, - "loss": 0.0076, + "epoch": 0.53, + "learning_rate": 0.00022006215961905848, + "loss": 0.0142, "step": 205590 }, { - "epoch": 1.04, - "learning_rate": 0.00014440823163194776, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.000220058271402687, + "loss": 0.0159, "step": 205600 }, { - "epoch": 1.04, - "learning_rate": 0.00014440066393893377, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00022005438318631554, + "loss": 0.0197, "step": 205610 }, { - "epoch": 1.04, - "learning_rate": 0.00014439309624591975, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00022005049496994406, + "loss": 0.0195, "step": 205620 }, { - "epoch": 1.04, - "learning_rate": 0.00014438552855290573, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00022004660675357262, + "loss": 0.0181, "step": 205630 }, { - "epoch": 1.04, - "learning_rate": 0.0001443779608598917, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00022004271853720114, + "loss": 0.0146, "step": 205640 }, { - "epoch": 1.04, - "learning_rate": 0.00014437039316687772, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00022003883032082968, + "loss": 0.0205, "step": 205650 }, { - "epoch": 1.04, - "learning_rate": 0.0001443628254738637, - "loss": 0.0078, + "epoch": 0.53, + "learning_rate": 0.0002200349421044582, + "loss": 0.0164, "step": 205660 }, { - "epoch": 1.04, - "learning_rate": 0.00014435525778084968, - "loss": 0.0135, + "epoch": 0.53, + "learning_rate": 0.00022003105388808676, + "loss": 0.0157, "step": 205670 }, { - "epoch": 1.04, - "learning_rate": 0.0001443476900878357, - "loss": 0.0093, + "epoch": 0.53, + "learning_rate": 0.00022002716567171528, + "loss": 0.016, "step": 205680 }, { - "epoch": 1.04, - "learning_rate": 0.00014434012239482167, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00022002327745534382, + "loss": 0.015, "step": 205690 }, { - "epoch": 1.04, - "learning_rate": 0.00014433255470180765, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022001938923897233, + "loss": 0.0174, "step": 205700 }, { - "epoch": 1.04, - "learning_rate": 0.00014432498700879366, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00022001550102260088, + "loss": 0.0192, "step": 205710 }, { - "epoch": 1.04, - "learning_rate": 0.00014431741931577964, - "loss": 0.011, + "epoch": 0.53, + "learning_rate": 0.00022001161280622944, + "loss": 0.0172, "step": 205720 }, { - "epoch": 1.04, - "learning_rate": 0.00014430985162276562, - "loss": 0.0096, + "epoch": 0.53, + "learning_rate": 0.00022000772458985796, + "loss": 0.0188, "step": 205730 }, { - "epoch": 1.04, - "learning_rate": 0.00014430228392975163, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.00022000383637348647, + "loss": 0.0198, "step": 205740 }, { - "epoch": 1.04, - "learning_rate": 0.00014429471623673761, - "loss": 0.0117, + "epoch": 0.53, + "learning_rate": 0.00021999994815711502, + "loss": 0.0175, "step": 205750 }, { - "epoch": 1.04, - "learning_rate": 0.0001442871485437236, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00021999605994074358, + "loss": 0.0176, "step": 205760 }, { - "epoch": 1.04, - "learning_rate": 0.0001442795808507096, - "loss": 0.01, + "epoch": 0.53, + "learning_rate": 0.0002199921717243721, + "loss": 0.0205, "step": 205770 }, { - "epoch": 1.04, - "learning_rate": 0.00014427201315769559, - "loss": 0.0115, + "epoch": 0.53, + "learning_rate": 0.00021998828350800064, + "loss": 0.0195, "step": 205780 }, { - "epoch": 1.04, - "learning_rate": 0.00014426444546468157, - "loss": 0.0081, + "epoch": 0.53, + "learning_rate": 0.00021998439529162915, + "loss": 0.0208, "step": 205790 }, { - "epoch": 1.04, - "learning_rate": 0.00014425687777166755, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00021998050707525772, + "loss": 0.0174, "step": 205800 }, { - "epoch": 1.04, - "learning_rate": 0.00014424931007865356, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00021997661885888624, + "loss": 0.0184, "step": 205810 }, { - "epoch": 1.04, - "learning_rate": 0.0001442417423856395, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00021997273064251478, + "loss": 0.0223, "step": 205820 }, { - "epoch": 1.04, - "learning_rate": 0.00014423417469262552, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.0002199688424261433, + "loss": 0.0148, "step": 205830 }, { - "epoch": 1.04, - "learning_rate": 0.0001442266069996115, - "loss": 0.0065, + "epoch": 0.53, + "learning_rate": 0.00021996495420977186, + "loss": 0.0155, "step": 205840 }, { - "epoch": 1.04, - "learning_rate": 0.00014421903930659748, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021996106599340038, + "loss": 0.0188, "step": 205850 }, { - "epoch": 1.04, - "learning_rate": 0.0001442114716135835, - "loss": 0.0092, + "epoch": 0.53, + "learning_rate": 0.00021995717777702892, + "loss": 0.0187, "step": 205860 }, { - "epoch": 1.04, - "learning_rate": 0.00014420390392056947, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00021995328956065743, + "loss": 0.0178, "step": 205870 }, { - "epoch": 1.04, - "learning_rate": 0.00014419633622755545, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.000219949401344286, + "loss": 0.0131, "step": 205880 }, { - "epoch": 1.04, - "learning_rate": 0.00014418876853454146, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00021994551312791452, + "loss": 0.02, "step": 205890 }, { - "epoch": 1.04, - "learning_rate": 0.00014418120084152744, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021994162491154306, + "loss": 0.0178, "step": 205900 }, { - "epoch": 1.04, - "learning_rate": 0.00014417363314851343, - "loss": 0.0106, + "epoch": 0.53, + "learning_rate": 0.00021993773669517157, + "loss": 0.0195, "step": 205910 }, { - "epoch": 1.04, - "learning_rate": 0.00014416606545549943, - "loss": 0.0135, + "epoch": 0.53, + "learning_rate": 0.00021993384847880014, + "loss": 0.0196, "step": 205920 }, { - "epoch": 1.04, - "learning_rate": 0.00014415849776248542, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00021992996026242868, + "loss": 0.0177, "step": 205930 }, { - "epoch": 1.04, - "learning_rate": 0.0001441509300694714, - "loss": 0.0085, + "epoch": 0.53, + "learning_rate": 0.0002199260720460572, + "loss": 0.0195, "step": 205940 }, { - "epoch": 1.04, - "learning_rate": 0.0001441433623764574, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00021992218382968574, + "loss": 0.0174, "step": 205950 }, { - "epoch": 1.04, - "learning_rate": 0.0001441357946834434, - "loss": 0.0073, + "epoch": 0.53, + "learning_rate": 0.00021991829561331425, + "loss": 0.0162, "step": 205960 }, { - "epoch": 1.04, - "learning_rate": 0.00014412822699042937, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00021991440739694282, + "loss": 0.014, "step": 205970 }, { - "epoch": 1.04, - "learning_rate": 0.00014412065929741538, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00021991051918057134, + "loss": 0.0143, "step": 205980 }, { - "epoch": 1.04, - "learning_rate": 0.00014411309160440136, - "loss": 0.0084, + "epoch": 0.53, + "learning_rate": 0.00021990663096419988, + "loss": 0.0159, "step": 205990 }, { - "epoch": 1.04, - "learning_rate": 0.00014410552391138734, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.0002199027427478284, + "loss": 0.0159, "step": 206000 }, { - "epoch": 1.04, - "eval_cer": 0.914452788772905, - "eval_loss": 0.007414559833705425, - "eval_runtime": 116.657, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.53, + "eval_cer": 0.8817754674437451, + "eval_loss": 0.011567558161914349, + "eval_runtime": 107.5415, + "eval_samples_per_second": 18.597, + "eval_steps_per_second": 4.649, "step": 206000 }, { - "epoch": 1.04, - "learning_rate": 0.00014409795621837332, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.00021989885453145696, + "loss": 0.0163, "step": 206010 }, { - "epoch": 1.04, - "learning_rate": 0.00014409038852535933, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00021989496631508548, + "loss": 0.0139, "step": 206020 }, { - "epoch": 1.04, - "learning_rate": 0.0001440828208323453, - "loss": 0.0149, + "epoch": 0.53, + "learning_rate": 0.00021989107809871402, + "loss": 0.02, "step": 206030 }, { - "epoch": 1.04, - "learning_rate": 0.0001440752531393313, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00021988718988234253, + "loss": 0.0173, "step": 206040 }, { - "epoch": 1.04, - "learning_rate": 0.0001440676854463173, - "loss": 0.0074, + "epoch": 0.53, + "learning_rate": 0.0002198833016659711, + "loss": 0.0161, "step": 206050 }, { - "epoch": 1.04, - "learning_rate": 0.00014406011775330328, - "loss": 0.0079, + "epoch": 0.53, + "learning_rate": 0.00021987941344959962, + "loss": 0.0148, "step": 206060 }, { - "epoch": 1.04, - "learning_rate": 0.00014405255006028926, - "loss": 0.0116, + "epoch": 0.53, + "learning_rate": 0.00021987552523322816, + "loss": 0.0142, "step": 206070 }, { - "epoch": 1.04, - "learning_rate": 0.00014404498236727527, - "loss": 0.0102, + "epoch": 0.53, + "learning_rate": 0.00021987163701685667, + "loss": 0.0211, "step": 206080 }, { - "epoch": 1.04, - "learning_rate": 0.00014403741467426125, - "loss": 0.0083, + "epoch": 0.53, + "learning_rate": 0.00021986774880048524, + "loss": 0.0182, "step": 206090 }, { - "epoch": 1.04, - "learning_rate": 0.00014402984698124724, - "loss": 0.0103, + "epoch": 0.53, + "learning_rate": 0.00021986386058411378, + "loss": 0.0127, "step": 206100 }, { - "epoch": 1.04, - "learning_rate": 0.00014402227928823324, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.0002198599723677423, + "loss": 0.0173, "step": 206110 }, { - "epoch": 1.04, - "learning_rate": 0.00014401471159521923, - "loss": 0.0131, + "epoch": 0.53, + "learning_rate": 0.00021985608415137084, + "loss": 0.0228, "step": 206120 }, { - "epoch": 1.04, - "learning_rate": 0.0001440071439022052, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00021985219593499938, + "loss": 0.0155, "step": 206130 }, { - "epoch": 1.04, - "learning_rate": 0.00014399957620919122, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00021984830771862792, + "loss": 0.0194, "step": 206140 }, { - "epoch": 1.04, - "learning_rate": 0.0001439920085161772, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.00021984441950225644, + "loss": 0.0175, "step": 206150 }, { - "epoch": 1.04, - "learning_rate": 0.00014398444082316318, - "loss": 0.0097, + "epoch": 0.53, + "learning_rate": 0.00021984053128588498, + "loss": 0.02, "step": 206160 }, { - "epoch": 1.04, - "learning_rate": 0.00014397687313014916, - "loss": 0.0098, + "epoch": 0.53, + "learning_rate": 0.00021983664306951352, + "loss": 0.0172, "step": 206170 }, { - "epoch": 1.04, - "learning_rate": 0.00014396930543713517, - "loss": 0.0089, + "epoch": 0.53, + "learning_rate": 0.00021983275485314206, + "loss": 0.0179, "step": 206180 }, { - "epoch": 1.04, - "learning_rate": 0.00014396173774412115, - "loss": 0.0111, + "epoch": 0.53, + "learning_rate": 0.00021982886663677058, + "loss": 0.019, "step": 206190 }, { - "epoch": 1.04, - "learning_rate": 0.00014395417005110713, - "loss": 0.0104, + "epoch": 0.53, + "learning_rate": 0.00021982497842039912, + "loss": 0.0195, "step": 206200 }, { - "epoch": 1.04, - "learning_rate": 0.00014394660235809314, - "loss": 0.0091, + "epoch": 0.53, + "learning_rate": 0.00021982109020402763, + "loss": 0.017, "step": 206210 }, { - "epoch": 1.04, - "learning_rate": 0.00014393903466507912, - "loss": 0.0094, + "epoch": 0.53, + "learning_rate": 0.0002198172019876562, + "loss": 0.0202, "step": 206220 }, { - "epoch": 1.04, - "learning_rate": 0.0001439314669720651, - "loss": 0.0101, + "epoch": 0.53, + "learning_rate": 0.00021981331377128472, + "loss": 0.0177, "step": 206230 }, { - "epoch": 1.04, - "learning_rate": 0.0001439238992790511, - "loss": 0.0108, + "epoch": 0.53, + "learning_rate": 0.00021980942555491326, + "loss": 0.0188, "step": 206240 }, { - "epoch": 1.04, - "learning_rate": 0.0001439163315860371, - "loss": 0.0113, + "epoch": 0.53, + "learning_rate": 0.00021980553733854177, + "loss": 0.0215, "step": 206250 }, { - "epoch": 1.04, - "learning_rate": 0.00014390876389302307, - "loss": 0.0099, + "epoch": 0.53, + "learning_rate": 0.00021980164912217034, + "loss": 0.0151, "step": 206260 }, { - "epoch": 1.04, - "learning_rate": 0.00014390119620000908, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.00021979776090579888, + "loss": 0.0154, "step": 206270 }, { - "epoch": 1.04, - "learning_rate": 0.00014389362850699506, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.0002197938726894274, + "loss": 0.0174, "step": 206280 }, { - "epoch": 1.04, - "learning_rate": 0.00014388606081398105, - "loss": 0.0105, + "epoch": 0.53, + "learning_rate": 0.0002197899844730559, + "loss": 0.0161, "step": 206290 }, { - "epoch": 1.04, - "learning_rate": 0.00014387849312096705, - "loss": 0.0109, + "epoch": 0.53, + "learning_rate": 0.00021978609625668448, + "loss": 0.0171, "step": 206300 }, { - "epoch": 1.04, - "learning_rate": 0.00014387092542795304, - "loss": 0.0121, + "epoch": 0.53, + "learning_rate": 0.00021978220804031302, + "loss": 0.016, "step": 206310 }, { - "epoch": 1.04, - "learning_rate": 0.00014386335773493902, - "loss": 0.012, + "epoch": 0.53, + "learning_rate": 0.00021977831982394154, + "loss": 0.0225, "step": 206320 }, { - "epoch": 1.04, - "learning_rate": 0.000143855790041925, - "loss": 0.0095, + "epoch": 0.53, + "learning_rate": 0.00021977443160757008, + "loss": 0.0194, "step": 206330 }, { - "epoch": 1.04, - "learning_rate": 0.000143848222348911, - "loss": 0.0087, + "epoch": 0.53, + "learning_rate": 0.00021977054339119862, + "loss": 0.0196, "step": 206340 }, { - "epoch": 1.04, - "learning_rate": 0.000143840654655897, - "loss": 0.0126, + "epoch": 0.53, + "learning_rate": 0.00021976665517482716, + "loss": 0.0187, "step": 206350 }, { - "epoch": 1.04, - "learning_rate": 0.00014383308696288297, - "loss": 0.0082, + "epoch": 0.53, + "learning_rate": 0.00021976276695845568, + "loss": 0.0166, "step": 206360 }, { - "epoch": 1.04, - "learning_rate": 0.00014382551926986898, - "loss": 0.0112, + "epoch": 0.53, + "learning_rate": 0.00021975887874208422, + "loss": 0.0151, "step": 206370 }, { - "epoch": 1.04, - "learning_rate": 0.00014381795157685496, - "loss": 0.0122, + "epoch": 0.53, + "learning_rate": 0.00021975499052571276, + "loss": 0.0144, "step": 206380 }, { - "epoch": 1.04, - "learning_rate": 0.00014381038388384094, - "loss": 0.0088, + "epoch": 0.53, + "learning_rate": 0.0002197511023093413, + "loss": 0.0114, "step": 206390 }, { - "epoch": 1.04, - "learning_rate": 0.00014380281619082695, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021974721409296982, + "loss": 0.0199, "step": 206400 }, { - "epoch": 1.04, - "learning_rate": 0.00014379524849781293, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021974332587659836, + "loss": 0.0175, "step": 206410 }, { - "epoch": 1.04, - "learning_rate": 0.0001437876808047989, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021973943766022693, + "loss": 0.0127, "step": 206420 }, { - "epoch": 1.04, - "learning_rate": 0.00014378011311178492, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.00021973554944385544, + "loss": 0.0169, "step": 206430 }, { - "epoch": 1.04, - "learning_rate": 0.0001437725454187709, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.00021973166122748398, + "loss": 0.0158, "step": 206440 }, { - "epoch": 1.04, - "learning_rate": 0.00014376497772575688, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.0002197277730111125, + "loss": 0.0131, "step": 206450 }, { - "epoch": 1.04, - "learning_rate": 0.00014375741003274287, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.000219723884794741, + "loss": 0.019, "step": 206460 }, { - "epoch": 1.04, - "learning_rate": 0.00014374984233972885, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021971999657836958, + "loss": 0.0168, "step": 206470 }, { - "epoch": 1.04, - "learning_rate": 0.00014374227464671486, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.00021971610836199812, + "loss": 0.0154, "step": 206480 }, { - "epoch": 1.04, - "learning_rate": 0.00014373470695370084, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021971222014562664, + "loss": 0.0165, "step": 206490 }, { - "epoch": 1.04, - "learning_rate": 0.00014372713926068682, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021970833192925518, + "loss": 0.0155, "step": 206500 }, { - "epoch": 1.04, - "learning_rate": 0.00014371957156767283, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021970444371288372, + "loss": 0.0156, "step": 206510 }, { - "epoch": 1.04, - "learning_rate": 0.0001437120038746588, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021970055549651226, + "loss": 0.0154, "step": 206520 }, { - "epoch": 1.04, - "learning_rate": 0.0001437044361816448, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021969666728014078, + "loss": 0.0153, "step": 206530 }, { - "epoch": 1.04, - "learning_rate": 0.00014369686848863077, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021969277906376932, + "loss": 0.0161, "step": 206540 }, { - "epoch": 1.04, - "learning_rate": 0.00014368930079561678, - "loss": 0.0127, + "epoch": 0.54, + "learning_rate": 0.00021968889084739786, + "loss": 0.0212, "step": 206550 }, { - "epoch": 1.04, - "learning_rate": 0.00014368173310260276, - "loss": 0.0067, + "epoch": 0.54, + "learning_rate": 0.0002196850026310264, + "loss": 0.0192, "step": 206560 }, { - "epoch": 1.04, - "learning_rate": 0.00014367416540958874, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021968111441465491, + "loss": 0.0208, "step": 206570 }, { - "epoch": 1.04, - "learning_rate": 0.00014366659771657475, - "loss": 0.0078, + "epoch": 0.54, + "learning_rate": 0.00021967722619828346, + "loss": 0.0232, "step": 206580 }, { - "epoch": 1.04, - "learning_rate": 0.00014365903002356073, - "loss": 0.0135, + "epoch": 0.54, + "learning_rate": 0.00021967333798191202, + "loss": 0.0189, "step": 206590 }, { - "epoch": 1.04, - "learning_rate": 0.00014365146233054671, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021966944976554054, + "loss": 0.0161, "step": 206600 }, { - "epoch": 1.04, - "learning_rate": 0.00014364389463753272, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021966556154916905, + "loss": 0.0151, "step": 206610 }, { - "epoch": 1.04, - "learning_rate": 0.0001436363269445187, - "loss": 0.0074, + "epoch": 0.54, + "learning_rate": 0.0002196616733327976, + "loss": 0.0153, "step": 206620 }, { - "epoch": 1.04, - "learning_rate": 0.00014362875925150469, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021965778511642616, + "loss": 0.0157, "step": 206630 }, { - "epoch": 1.04, - "learning_rate": 0.0001436211915584907, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021965389690005468, + "loss": 0.0132, "step": 206640 }, { - "epoch": 1.04, - "learning_rate": 0.00014361362386547668, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021965000868368322, + "loss": 0.0168, "step": 206650 }, { - "epoch": 1.04, - "learning_rate": 0.00014360605617246266, - "loss": 0.0078, + "epoch": 0.54, + "learning_rate": 0.00021964612046731174, + "loss": 0.0176, "step": 206660 }, { - "epoch": 1.04, - "learning_rate": 0.00014359848847944867, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.0002196422322509403, + "loss": 0.0154, "step": 206670 }, { - "epoch": 1.04, - "learning_rate": 0.00014359092078643465, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021963834403456882, + "loss": 0.0154, "step": 206680 }, { - "epoch": 1.04, - "learning_rate": 0.00014358335309342063, - "loss": 0.0138, + "epoch": 0.54, + "learning_rate": 0.00021963445581819736, + "loss": 0.0141, "step": 206690 }, { - "epoch": 1.04, - "learning_rate": 0.0001435757854004066, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021963056760182587, + "loss": 0.0194, "step": 206700 }, { - "epoch": 1.04, - "learning_rate": 0.00014356821770739262, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021962667938545442, + "loss": 0.0174, "step": 206710 }, { - "epoch": 1.04, - "learning_rate": 0.0001435606500143786, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021962279116908296, + "loss": 0.0155, "step": 206720 }, { - "epoch": 1.04, - "learning_rate": 0.00014355308232136458, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.0002196189029527115, + "loss": 0.0129, "step": 206730 }, { - "epoch": 1.04, - "learning_rate": 0.0001435455146283506, - "loss": 0.007, + "epoch": 0.54, + "learning_rate": 0.00021961501473634001, + "loss": 0.0152, "step": 206740 }, { - "epoch": 1.04, - "learning_rate": 0.00014353794693533657, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021961112651996856, + "loss": 0.0189, "step": 206750 }, { - "epoch": 1.04, - "learning_rate": 0.00014353037924232255, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.0002196072383035971, + "loss": 0.0208, "step": 206760 }, { - "epoch": 1.04, - "learning_rate": 0.00014352281154930856, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021960335008722564, + "loss": 0.0174, "step": 206770 }, { - "epoch": 1.04, - "learning_rate": 0.00014351524385629454, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021959946187085415, + "loss": 0.019, "step": 206780 }, { - "epoch": 1.04, - "learning_rate": 0.00014350767616328052, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.0002195955736544827, + "loss": 0.02, "step": 206790 }, { - "epoch": 1.04, - "learning_rate": 0.00014350010847026653, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.00021959168543811126, + "loss": 0.0192, "step": 206800 }, { - "epoch": 1.04, - "learning_rate": 0.00014349254077725251, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021958779722173978, + "loss": 0.0186, "step": 206810 }, { - "epoch": 1.04, - "learning_rate": 0.0001434849730842385, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.00021958390900536832, + "loss": 0.0167, "step": 206820 }, { - "epoch": 1.04, - "learning_rate": 0.0001434774053912245, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021958002078899683, + "loss": 0.0134, "step": 206830 }, { - "epoch": 1.04, - "learning_rate": 0.00014346983769821049, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.0002195761325726254, + "loss": 0.0175, "step": 206840 }, { - "epoch": 1.04, - "learning_rate": 0.00014346227000519647, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021957224435625392, + "loss": 0.0164, "step": 206850 }, { - "epoch": 1.04, - "learning_rate": 0.00014345470231218245, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021956835613988246, + "loss": 0.0182, "step": 206860 }, { - "epoch": 1.04, - "learning_rate": 0.00014344713461916846, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021956446792351097, + "loss": 0.0142, "step": 206870 }, { - "epoch": 1.04, - "learning_rate": 0.00014343956692615444, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021956057970713954, + "loss": 0.0138, "step": 206880 }, { - "epoch": 1.04, - "learning_rate": 0.00014343199923314042, - "loss": 0.0076, + "epoch": 0.54, + "learning_rate": 0.00021955669149076806, + "loss": 0.0135, "step": 206890 }, { - "epoch": 1.04, - "learning_rate": 0.00014342443154012643, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.0002195528032743966, + "loss": 0.0183, "step": 206900 }, { - "epoch": 1.04, - "learning_rate": 0.0001434168638471124, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.0002195489150580251, + "loss": 0.0115, "step": 206910 }, { - "epoch": 1.04, - "learning_rate": 0.0001434092961540984, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021954502684165368, + "loss": 0.0168, "step": 206920 }, { - "epoch": 1.04, - "learning_rate": 0.0001434017284610844, - "loss": 0.0116, + "epoch": 0.54, + "learning_rate": 0.0002195411386252822, + "loss": 0.0187, "step": 206930 }, { - "epoch": 1.04, - "learning_rate": 0.00014339416076807038, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021953725040891074, + "loss": 0.0177, "step": 206940 }, { - "epoch": 1.04, - "learning_rate": 0.00014338659307505636, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021953336219253925, + "loss": 0.0154, "step": 206950 }, { - "epoch": 1.04, - "learning_rate": 0.00014337902538204237, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.0002195294739761678, + "loss": 0.0157, "step": 206960 }, { - "epoch": 1.04, - "learning_rate": 0.00014337145768902835, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021952558575979636, + "loss": 0.0168, "step": 206970 }, { - "epoch": 1.04, - "learning_rate": 0.00014336388999601433, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021952169754342488, + "loss": 0.0146, "step": 206980 }, { - "epoch": 1.04, - "learning_rate": 0.00014335632230300034, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021951780932705342, + "loss": 0.0163, "step": 206990 }, { - "epoch": 1.04, - "learning_rate": 0.00014334875460998632, - "loss": 0.0136, + "epoch": 0.54, + "learning_rate": 0.00021951392111068193, + "loss": 0.0188, "step": 207000 }, { - "epoch": 1.04, - "eval_cer": 0.9144566703574066, - "eval_loss": 0.0076129864901304245, - "eval_runtime": 116.5362, - "eval_samples_per_second": 17.162, - "eval_steps_per_second": 4.291, + "epoch": 0.54, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.011343833990395069, + "eval_runtime": 107.8464, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, "step": 207000 }, { - "epoch": 1.04, - "learning_rate": 0.0001433411869169723, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.0002195100328943105, + "loss": 0.017, "step": 207010 }, { - "epoch": 1.04, - "learning_rate": 0.00014333361922395831, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021950614467793902, + "loss": 0.0183, "step": 207020 }, { - "epoch": 1.04, - "learning_rate": 0.0001433260515309443, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.00021950225646156756, + "loss": 0.0125, "step": 207030 }, { - "epoch": 1.04, - "learning_rate": 0.00014331848383793028, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021949836824519607, + "loss": 0.0171, "step": 207040 }, { - "epoch": 1.04, - "learning_rate": 0.00014331091614491626, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021949448002882464, + "loss": 0.0192, "step": 207050 }, { - "epoch": 1.04, - "learning_rate": 0.00014330334845190227, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021949059181245316, + "loss": 0.0168, "step": 207060 }, { - "epoch": 1.04, - "learning_rate": 0.00014329578075888825, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.0002194867035960817, + "loss": 0.0241, "step": 207070 }, { - "epoch": 1.04, - "learning_rate": 0.00014328821306587423, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002194828153797102, + "loss": 0.017, "step": 207080 }, { - "epoch": 1.04, - "learning_rate": 0.0001432806453728602, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021947892716333878, + "loss": 0.0142, "step": 207090 }, { - "epoch": 1.04, - "learning_rate": 0.0001432730776798462, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.0002194750389469673, + "loss": 0.0146, "step": 207100 }, { - "epoch": 1.04, - "learning_rate": 0.0001432655099868322, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021947115073059584, + "loss": 0.0179, "step": 207110 }, { - "epoch": 1.04, - "learning_rate": 0.00014325794229381818, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021946726251422435, + "loss": 0.0164, "step": 207120 }, { - "epoch": 1.04, - "learning_rate": 0.00014325037460080416, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021946337429785292, + "loss": 0.0191, "step": 207130 }, { - "epoch": 1.05, - "learning_rate": 0.00014324280690779017, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021945948608148146, + "loss": 0.0168, "step": 207140 }, { - "epoch": 1.05, - "learning_rate": 0.00014323523921477615, - "loss": 0.0075, + "epoch": 0.54, + "learning_rate": 0.00021945559786510998, + "loss": 0.0136, "step": 207150 }, { - "epoch": 1.05, - "learning_rate": 0.00014322767152176214, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.0002194517096487385, + "loss": 0.0152, "step": 207160 }, { - "epoch": 1.05, - "learning_rate": 0.00014322010382874814, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021944782143236703, + "loss": 0.016, "step": 207170 }, { - "epoch": 1.05, - "learning_rate": 0.00014321253613573413, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.0002194439332159956, + "loss": 0.0189, "step": 207180 }, { - "epoch": 1.05, - "learning_rate": 0.0001432049684427201, - "loss": 0.0074, + "epoch": 0.54, + "learning_rate": 0.00021944004499962412, + "loss": 0.0148, "step": 207190 }, { - "epoch": 1.05, - "learning_rate": 0.00014319740074970612, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021943615678325266, + "loss": 0.0119, "step": 207200 }, { - "epoch": 1.05, - "learning_rate": 0.0001431898330566921, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021943226856688117, + "loss": 0.0195, "step": 207210 }, { - "epoch": 1.05, - "learning_rate": 0.00014318226536367808, - "loss": 0.0128, + "epoch": 0.54, + "learning_rate": 0.00021942838035050974, + "loss": 0.0176, "step": 207220 }, { - "epoch": 1.05, - "learning_rate": 0.00014317469767066406, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021942449213413826, + "loss": 0.0187, "step": 207230 }, { - "epoch": 1.05, - "learning_rate": 0.00014316712997765007, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.0002194206039177668, + "loss": 0.015, "step": 207240 }, { - "epoch": 1.05, - "learning_rate": 0.00014315956228463605, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.0002194167157013953, + "loss": 0.0212, "step": 207250 }, { - "epoch": 1.05, - "learning_rate": 0.00014315199459162203, - "loss": 0.0119, + "epoch": 0.54, + "learning_rate": 0.00021941282748502388, + "loss": 0.0142, "step": 207260 }, { - "epoch": 1.05, - "learning_rate": 0.00014314442689860804, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.0002194089392686524, + "loss": 0.0153, "step": 207270 }, { - "epoch": 1.05, - "learning_rate": 0.00014313685920559402, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021940505105228094, + "loss": 0.0161, "step": 207280 }, { - "epoch": 1.05, - "learning_rate": 0.00014312929151258, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021940116283590945, + "loss": 0.0147, "step": 207290 }, { - "epoch": 1.05, - "learning_rate": 0.000143121723819566, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021939727461953802, + "loss": 0.0169, "step": 207300 }, { - "epoch": 1.05, - "learning_rate": 0.000143114156126552, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.00021939338640316656, + "loss": 0.0158, "step": 207310 }, { - "epoch": 1.05, - "learning_rate": 0.00014310658843353797, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021938949818679508, + "loss": 0.0153, "step": 207320 }, { - "epoch": 1.05, - "learning_rate": 0.00014309902074052398, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.0002193856099704236, + "loss": 0.019, "step": 207330 }, { - "epoch": 1.05, - "learning_rate": 0.00014309145304750996, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021938172175405216, + "loss": 0.0178, "step": 207340 }, { - "epoch": 1.05, - "learning_rate": 0.00014308388535449595, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.0002193778335376807, + "loss": 0.0173, "step": 207350 }, { - "epoch": 1.05, - "learning_rate": 0.00014307631766148195, - "loss": 0.0163, + "epoch": 0.54, + "learning_rate": 0.00021937394532130922, + "loss": 0.0169, "step": 207360 }, { - "epoch": 1.05, - "learning_rate": 0.00014306874996846794, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021937005710493776, + "loss": 0.019, "step": 207370 }, { - "epoch": 1.05, - "learning_rate": 0.00014306118227545392, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002193661688885663, + "loss": 0.0154, "step": 207380 }, { - "epoch": 1.05, - "learning_rate": 0.00014305361458243993, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.00021936228067219484, + "loss": 0.0172, "step": 207390 }, { - "epoch": 1.05, - "learning_rate": 0.0001430460468894259, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021935839245582336, + "loss": 0.0139, "step": 207400 }, { - "epoch": 1.05, - "learning_rate": 0.0001430384791964119, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.0002193545042394519, + "loss": 0.0156, "step": 207410 }, { - "epoch": 1.05, - "learning_rate": 0.00014303091150339787, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.0002193506160230804, + "loss": 0.0176, "step": 207420 }, { - "epoch": 1.05, - "learning_rate": 0.00014302334381038388, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021934672780670898, + "loss": 0.0347, "step": 207430 }, { - "epoch": 1.05, - "learning_rate": 0.00014301577611736986, - "loss": 0.0116, + "epoch": 0.54, + "learning_rate": 0.0002193428395903375, + "loss": 0.0158, "step": 207440 }, { - "epoch": 1.05, - "learning_rate": 0.00014300820842435584, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021933895137396604, + "loss": 0.018, "step": 207450 }, { - "epoch": 1.05, - "learning_rate": 0.00014300064073134185, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021933506315759455, + "loss": 0.0166, "step": 207460 }, { - "epoch": 1.05, - "learning_rate": 0.00014299307303832783, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021933117494122312, + "loss": 0.0169, "step": 207470 }, { - "epoch": 1.05, - "learning_rate": 0.0001429855053453138, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021932728672485163, + "loss": 0.0202, "step": 207480 }, { - "epoch": 1.05, - "learning_rate": 0.00014297793765229982, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021932339850848018, + "loss": 0.0148, "step": 207490 }, { - "epoch": 1.05, - "learning_rate": 0.0001429703699592858, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002193195102921087, + "loss": 0.0227, "step": 207500 }, { - "epoch": 1.05, - "learning_rate": 0.00014296280226627178, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021931562207573726, + "loss": 0.0187, "step": 207510 }, { - "epoch": 1.05, - "learning_rate": 0.0001429552345732578, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.0002193117338593658, + "loss": 0.0155, "step": 207520 }, { - "epoch": 1.05, - "learning_rate": 0.00014294766688024377, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021930784564299432, + "loss": 0.0134, "step": 207530 }, { - "epoch": 1.05, - "learning_rate": 0.00014294009918722976, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.00021930395742662286, + "loss": 0.0158, "step": 207540 }, { - "epoch": 1.05, - "learning_rate": 0.00014293253149421576, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.0002193000692102514, + "loss": 0.0142, "step": 207550 }, { - "epoch": 1.05, - "learning_rate": 0.00014292496380120175, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021929618099387994, + "loss": 0.0169, "step": 207560 }, { - "epoch": 1.05, - "learning_rate": 0.00014291739610818773, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.00021929229277750845, + "loss": 0.0116, "step": 207570 }, { - "epoch": 1.05, - "learning_rate": 0.0001429098284151737, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.000219288404561137, + "loss": 0.0156, "step": 207580 }, { - "epoch": 1.05, - "learning_rate": 0.00014290226072215972, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021928451634476554, + "loss": 0.0187, "step": 207590 }, { - "epoch": 1.05, - "learning_rate": 0.0001428946930291457, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021928062812839408, + "loss": 0.0271, "step": 207600 }, { - "epoch": 1.05, - "learning_rate": 0.00014288712533613168, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.0002192767399120226, + "loss": 0.0172, "step": 207610 }, { - "epoch": 1.05, - "learning_rate": 0.0001428795576431177, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021927285169565114, + "loss": 0.0154, "step": 207620 }, { - "epoch": 1.05, - "learning_rate": 0.00014287198995010367, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021926896347927968, + "loss": 0.022, "step": 207630 }, { - "epoch": 1.05, - "learning_rate": 0.00014286442225708965, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021926507526290822, + "loss": 0.0182, "step": 207640 }, { - "epoch": 1.05, - "learning_rate": 0.00014285685456407566, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021926118704653673, + "loss": 0.0139, "step": 207650 }, { - "epoch": 1.05, - "learning_rate": 0.00014284928687106164, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021925729883016528, + "loss": 0.0167, "step": 207660 }, { - "epoch": 1.05, - "learning_rate": 0.00014284171917804762, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.0002192534106137938, + "loss": 0.0161, "step": 207670 }, { - "epoch": 1.05, - "learning_rate": 0.00014283415148503363, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021924952239742236, + "loss": 0.0187, "step": 207680 }, { - "epoch": 1.05, - "learning_rate": 0.0001428265837920196, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.0002192456341810509, + "loss": 0.0202, "step": 207690 }, { - "epoch": 1.05, - "learning_rate": 0.0001428190160990056, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021924174596467941, + "loss": 0.0177, "step": 207700 }, { - "epoch": 1.05, - "learning_rate": 0.00014281144840599158, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021923785774830796, + "loss": 0.0171, "step": 207710 }, { - "epoch": 1.05, - "learning_rate": 0.00014280388071297756, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.0002192339695319365, + "loss": 0.0165, "step": 207720 }, { - "epoch": 1.05, - "learning_rate": 0.00014279631301996357, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021923008131556504, + "loss": 0.0144, "step": 207730 }, { - "epoch": 1.05, - "learning_rate": 0.00014278874532694955, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021922619309919355, + "loss": 0.0125, "step": 207740 }, { - "epoch": 1.05, - "learning_rate": 0.00014278117763393553, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.0002192223048828221, + "loss": 0.0156, "step": 207750 }, { - "epoch": 1.05, - "learning_rate": 0.0001427736099409215, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021921841666645064, + "loss": 0.0147, "step": 207760 }, { - "epoch": 1.05, - "learning_rate": 0.00014276604224790752, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021921452845007918, + "loss": 0.0231, "step": 207770 }, { - "epoch": 1.05, - "learning_rate": 0.0001427584745548935, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.0002192106402337077, + "loss": 0.0166, "step": 207780 }, { - "epoch": 1.05, - "learning_rate": 0.00014275090686187948, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.00021920675201733624, + "loss": 0.0153, "step": 207790 }, { - "epoch": 1.05, - "learning_rate": 0.0001427433391688655, - "loss": 0.007, + "epoch": 0.54, + "learning_rate": 0.00021920286380096478, + "loss": 0.0155, "step": 207800 }, { - "epoch": 1.05, - "learning_rate": 0.00014273577147585147, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021919897558459332, + "loss": 0.0168, "step": 207810 }, { - "epoch": 1.05, - "learning_rate": 0.00014272820378283745, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021919508736822183, + "loss": 0.0161, "step": 207820 }, { - "epoch": 1.05, - "learning_rate": 0.00014272063608982346, - "loss": 0.0121, + "epoch": 0.54, + "learning_rate": 0.00021919119915185037, + "loss": 0.0254, "step": 207830 }, { - "epoch": 1.05, - "learning_rate": 0.00014271306839680944, - "loss": 0.0121, + "epoch": 0.54, + "learning_rate": 0.00021918731093547894, + "loss": 0.0152, "step": 207840 }, { - "epoch": 1.05, - "learning_rate": 0.00014270550070379542, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021918342271910746, + "loss": 0.0177, "step": 207850 }, { - "epoch": 1.05, - "learning_rate": 0.00014269793301078143, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.000219179534502736, + "loss": 0.0184, "step": 207860 }, { - "epoch": 1.05, - "learning_rate": 0.00014269036531776741, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021917564628636451, + "loss": 0.0187, "step": 207870 }, { - "epoch": 1.05, - "learning_rate": 0.0001426827976247534, - "loss": 0.0085, + "epoch": 0.54, + "learning_rate": 0.00021917175806999308, + "loss": 0.0158, "step": 207880 }, { - "epoch": 1.05, - "learning_rate": 0.0001426752299317394, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002191678698536216, + "loss": 0.0181, "step": 207890 }, { - "epoch": 1.05, - "learning_rate": 0.00014266766223872539, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021916398163725014, + "loss": 0.016, "step": 207900 }, { - "epoch": 1.05, - "learning_rate": 0.00014266009454571137, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021916009342087865, + "loss": 0.0181, "step": 207910 }, { - "epoch": 1.05, - "learning_rate": 0.00014265252685269738, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.0002191562052045072, + "loss": 0.0194, "step": 207920 }, { - "epoch": 1.05, - "learning_rate": 0.00014264495915968336, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021915231698813574, + "loss": 0.0166, "step": 207930 }, { - "epoch": 1.05, - "learning_rate": 0.00014263739146666934, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021914842877176428, + "loss": 0.0134, "step": 207940 }, { - "epoch": 1.05, - "learning_rate": 0.00014262982377365532, - "loss": 0.0067, + "epoch": 0.54, + "learning_rate": 0.0002191445405553928, + "loss": 0.0167, "step": 207950 }, { - "epoch": 1.05, - "learning_rate": 0.00014262225608064133, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021914065233902133, + "loss": 0.0225, "step": 207960 }, { - "epoch": 1.05, - "learning_rate": 0.0001426146883876273, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.00021913676412264988, + "loss": 0.0157, "step": 207970 }, { - "epoch": 1.05, - "learning_rate": 0.0001426071206946133, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021913287590627842, + "loss": 0.0178, "step": 207980 }, { - "epoch": 1.05, - "learning_rate": 0.0001425995530015993, - "loss": 0.0123, + "epoch": 0.54, + "learning_rate": 0.00021912898768990693, + "loss": 0.0149, "step": 207990 }, { - "epoch": 1.05, - "learning_rate": 0.00014259198530858528, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021912509947353547, + "loss": 0.0187, "step": 208000 }, { - "epoch": 1.05, - "eval_cer": 0.914462492734159, - "eval_loss": 0.007478554733097553, - "eval_runtime": 116.5491, - "eval_samples_per_second": 17.16, - "eval_steps_per_second": 4.29, + "epoch": 0.54, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.011146793141961098, + "eval_runtime": 108.0067, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 208000 }, { - "epoch": 1.05, - "learning_rate": 0.00014258441761557126, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021912121125716404, + "loss": 0.0137, "step": 208010 }, { - "epoch": 1.05, - "learning_rate": 0.00014257684992255727, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021911732304079256, + "loss": 0.0167, "step": 208020 }, { - "epoch": 1.05, - "learning_rate": 0.00014256928222954325, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.0002191134348244211, + "loss": 0.0143, "step": 208030 }, { - "epoch": 1.05, - "learning_rate": 0.00014256171453652923, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.00021910954660804961, + "loss": 0.0174, "step": 208040 }, { - "epoch": 1.05, - "learning_rate": 0.00014255414684351524, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021910565839167818, + "loss": 0.0166, "step": 208050 }, { - "epoch": 1.05, - "learning_rate": 0.00014254657915050122, - "loss": 0.0114, + "epoch": 0.54, + "learning_rate": 0.0002191017701753067, + "loss": 0.0151, "step": 208060 }, { - "epoch": 1.05, - "learning_rate": 0.0001425390114574872, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021909788195893524, + "loss": 0.0177, "step": 208070 }, { - "epoch": 1.05, - "learning_rate": 0.00014253144376447321, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021909399374256375, + "loss": 0.0164, "step": 208080 }, { - "epoch": 1.05, - "learning_rate": 0.0001425238760714592, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021909010552619232, + "loss": 0.021, "step": 208090 }, { - "epoch": 1.05, - "learning_rate": 0.00014251630837844518, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021908621730982084, + "loss": 0.0135, "step": 208100 }, { - "epoch": 1.05, - "learning_rate": 0.00014250874068543116, - "loss": 0.0063, + "epoch": 0.54, + "learning_rate": 0.00021908232909344938, + "loss": 0.016, "step": 208110 }, { - "epoch": 1.05, - "learning_rate": 0.00014250117299241717, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.0002190784408770779, + "loss": 0.0168, "step": 208120 }, { - "epoch": 1.05, - "learning_rate": 0.00014249360529940315, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021907455266070646, + "loss": 0.0148, "step": 208130 }, { - "epoch": 1.05, - "learning_rate": 0.00014248603760638913, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021907066444433498, + "loss": 0.0151, "step": 208140 }, { - "epoch": 1.05, - "learning_rate": 0.00014247846991337514, - "loss": 0.0078, + "epoch": 0.54, + "learning_rate": 0.00021906677622796352, + "loss": 0.0177, "step": 208150 }, { - "epoch": 1.05, - "learning_rate": 0.00014247090222036112, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021906288801159203, + "loss": 0.0155, "step": 208160 }, { - "epoch": 1.05, - "learning_rate": 0.0001424633345273471, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021905899979522057, + "loss": 0.0165, "step": 208170 }, { - "epoch": 1.05, - "learning_rate": 0.0001424557668343331, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021905511157884914, + "loss": 0.0168, "step": 208180 }, { - "epoch": 1.05, - "learning_rate": 0.0001424481991413191, - "loss": 0.012, + "epoch": 0.54, + "learning_rate": 0.00021905122336247766, + "loss": 0.0135, "step": 208190 }, { - "epoch": 1.05, - "learning_rate": 0.00014244063144830507, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021904733514610617, + "loss": 0.017, "step": 208200 }, { - "epoch": 1.05, - "learning_rate": 0.00014243306375529108, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002190434469297347, + "loss": 0.0173, "step": 208210 }, { - "epoch": 1.05, - "learning_rate": 0.00014242549606227706, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021903955871336328, + "loss": 0.0154, "step": 208220 }, { - "epoch": 1.05, - "learning_rate": 0.00014241792836926304, - "loss": 0.0125, + "epoch": 0.54, + "learning_rate": 0.0002190356704969918, + "loss": 0.0167, "step": 208230 }, { - "epoch": 1.05, - "learning_rate": 0.00014241036067624905, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021903178228062034, + "loss": 0.0184, "step": 208240 }, { - "epoch": 1.05, - "learning_rate": 0.00014240279298323503, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021902789406424885, + "loss": 0.0189, "step": 208250 }, { - "epoch": 1.05, - "learning_rate": 0.00014239522529022102, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021902400584787742, + "loss": 0.0166, "step": 208260 }, { - "epoch": 1.05, - "learning_rate": 0.000142387657597207, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.00021902011763150594, + "loss": 0.0173, "step": 208270 }, { - "epoch": 1.05, - "learning_rate": 0.000142380089904193, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021901622941513448, + "loss": 0.0174, "step": 208280 }, { - "epoch": 1.05, - "learning_rate": 0.000142372522211179, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.000219012341198763, + "loss": 0.0165, "step": 208290 }, { - "epoch": 1.05, - "learning_rate": 0.00014236495451816497, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.00021900845298239156, + "loss": 0.0141, "step": 208300 }, { - "epoch": 1.05, - "learning_rate": 0.00014235738682515098, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021900456476602008, + "loss": 0.0185, "step": 208310 }, { - "epoch": 1.05, - "learning_rate": 0.00014234981913213696, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021900067654964862, + "loss": 0.0152, "step": 208320 }, { - "epoch": 1.05, - "learning_rate": 0.00014234225143912294, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021899678833327713, + "loss": 0.0175, "step": 208330 }, { - "epoch": 1.05, - "learning_rate": 0.00014233468374610892, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.0002189929001169057, + "loss": 0.0161, "step": 208340 }, { - "epoch": 1.05, - "learning_rate": 0.0001423271160530949, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021898901190053421, + "loss": 0.0178, "step": 208350 }, { - "epoch": 1.05, - "learning_rate": 0.0001423195483600809, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021898512368416276, + "loss": 0.0162, "step": 208360 }, { - "epoch": 1.05, - "learning_rate": 0.0001423119806670669, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021898123546779127, + "loss": 0.0138, "step": 208370 }, { - "epoch": 1.05, - "learning_rate": 0.00014230441297405287, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021897734725141984, + "loss": 0.0211, "step": 208380 }, { - "epoch": 1.05, - "learning_rate": 0.00014229684528103888, - "loss": 0.0084, - "step": 208390 + "epoch": 0.54, + "learning_rate": 0.00021897345903504838, + "loss": 0.0176, + "step": 208390 }, { - "epoch": 1.05, - "learning_rate": 0.00014228927758802486, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.0002189695708186769, + "loss": 0.0172, "step": 208400 }, { - "epoch": 1.05, - "learning_rate": 0.00014228170989501085, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021896568260230544, + "loss": 0.0136, "step": 208410 }, { - "epoch": 1.05, - "learning_rate": 0.00014227414220199685, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021896179438593395, + "loss": 0.0159, "step": 208420 }, { - "epoch": 1.05, - "learning_rate": 0.00014226657450898284, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.00021895790616956252, + "loss": 0.0176, "step": 208430 }, { - "epoch": 1.05, - "learning_rate": 0.00014225900681596882, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021895401795319104, + "loss": 0.017, "step": 208440 }, { - "epoch": 1.05, - "learning_rate": 0.00014225143912295483, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.00021895012973681958, + "loss": 0.0133, "step": 208450 }, { - "epoch": 1.05, - "learning_rate": 0.0001422438714299408, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.0002189462415204481, + "loss": 0.0185, "step": 208460 }, { - "epoch": 1.05, - "learning_rate": 0.0001422363037369268, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021894235330407666, + "loss": 0.0152, "step": 208470 }, { - "epoch": 1.05, - "learning_rate": 0.00014222873604391277, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021893846508770517, + "loss": 0.0211, "step": 208480 }, { - "epoch": 1.05, - "learning_rate": 0.00014222116835089878, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021893457687133372, + "loss": 0.0172, "step": 208490 }, { - "epoch": 1.05, - "learning_rate": 0.00014221360065788476, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.00021893068865496223, + "loss": 0.0158, "step": 208500 }, { - "epoch": 1.05, - "learning_rate": 0.00014220603296487074, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.0002189268004385908, + "loss": 0.0197, "step": 208510 }, { - "epoch": 1.05, - "learning_rate": 0.00014219846527185675, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021892291222221931, + "loss": 0.0171, "step": 208520 }, { - "epoch": 1.05, - "learning_rate": 0.00014219089757884273, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021891902400584786, + "loss": 0.0175, "step": 208530 }, { - "epoch": 1.05, - "learning_rate": 0.00014218332988582871, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021891513578947637, + "loss": 0.0162, "step": 208540 }, { - "epoch": 1.05, - "learning_rate": 0.00014217576219281472, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021891124757310494, + "loss": 0.0157, "step": 208550 }, { - "epoch": 1.05, - "learning_rate": 0.0001421681944998007, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021890735935673348, + "loss": 0.0166, "step": 208560 }, { - "epoch": 1.05, - "learning_rate": 0.00014216062680678668, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.000218903471140362, + "loss": 0.0186, "step": 208570 }, { - "epoch": 1.05, - "learning_rate": 0.0001421530591137727, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021889958292399054, + "loss": 0.0161, "step": 208580 }, { - "epoch": 1.05, - "learning_rate": 0.00014214549142075867, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021889569470761908, + "loss": 0.0154, "step": 208590 }, { - "epoch": 1.05, - "learning_rate": 0.00014213792372774466, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021889180649124762, + "loss": 0.0189, "step": 208600 }, { - "epoch": 1.05, - "learning_rate": 0.00014213035603473066, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021888791827487613, + "loss": 0.0156, "step": 208610 }, { - "epoch": 1.05, - "learning_rate": 0.00014212278834171665, - "loss": 0.0065, + "epoch": 0.54, + "learning_rate": 0.00021888403005850468, + "loss": 0.016, "step": 208620 }, { - "epoch": 1.05, - "learning_rate": 0.00014211522064870263, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021888014184213322, + "loss": 0.0213, "step": 208630 }, { - "epoch": 1.05, - "learning_rate": 0.0001421076529556886, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021887625362576176, + "loss": 0.0207, "step": 208640 }, { - "epoch": 1.05, - "learning_rate": 0.00014210008526267462, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021887236540939027, + "loss": 0.014, "step": 208650 }, { - "epoch": 1.05, - "learning_rate": 0.0001420925175696606, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021886847719301882, + "loss": 0.0157, "step": 208660 }, { - "epoch": 1.05, - "learning_rate": 0.00014208494987664658, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.00021886458897664733, + "loss": 0.0189, "step": 208670 }, { - "epoch": 1.05, - "learning_rate": 0.0001420773821836326, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002188607007602759, + "loss": 0.0158, "step": 208680 }, { - "epoch": 1.05, - "learning_rate": 0.00014206981449061857, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.00021885681254390441, + "loss": 0.0135, "step": 208690 }, { - "epoch": 1.05, - "learning_rate": 0.00014206224679760455, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.00021885292432753296, + "loss": 0.0144, "step": 208700 }, { - "epoch": 1.05, - "learning_rate": 0.00014205467910459056, - "loss": 0.0131, + "epoch": 0.54, + "learning_rate": 0.00021884903611116147, + "loss": 0.0196, "step": 208710 }, { - "epoch": 1.05, - "learning_rate": 0.00014204711141157654, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021884514789479004, + "loss": 0.0218, "step": 208720 }, { - "epoch": 1.05, - "learning_rate": 0.00014203954371856252, - "loss": 0.0116, + "epoch": 0.54, + "learning_rate": 0.00021884125967841858, + "loss": 0.0161, "step": 208730 }, { - "epoch": 1.05, - "learning_rate": 0.00014203197602554853, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.0002188373714620471, + "loss": 0.0131, "step": 208740 }, { - "epoch": 1.05, - "learning_rate": 0.00014202440833253451, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002188334832456756, + "loss": 0.0147, "step": 208750 }, { - "epoch": 1.05, - "learning_rate": 0.0001420168406395205, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021882959502930418, + "loss": 0.0159, "step": 208760 }, { - "epoch": 1.05, - "learning_rate": 0.0001420092729465065, - "loss": 0.0074, + "epoch": 0.54, + "learning_rate": 0.00021882570681293272, + "loss": 0.0172, "step": 208770 }, { - "epoch": 1.05, - "learning_rate": 0.00014200170525349249, - "loss": 0.0122, + "epoch": 0.54, + "learning_rate": 0.00021882181859656123, + "loss": 0.0169, "step": 208780 }, { - "epoch": 1.05, - "learning_rate": 0.00014199413756047847, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021881793038018978, + "loss": 0.0162, "step": 208790 }, { - "epoch": 1.05, - "learning_rate": 0.00014198656986746445, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.00021881404216381832, + "loss": 0.0148, "step": 208800 }, { - "epoch": 1.05, - "learning_rate": 0.00014197900217445046, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021881015394744686, + "loss": 0.0189, "step": 208810 }, { - "epoch": 1.05, - "learning_rate": 0.00014197143448143644, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.00021880626573107537, + "loss": 0.0146, "step": 208820 }, { - "epoch": 1.05, - "learning_rate": 0.00014196386678842242, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021880237751470392, + "loss": 0.0176, "step": 208830 }, { - "epoch": 1.05, - "learning_rate": 0.00014195629909540843, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021879848929833246, + "loss": 0.0227, "step": 208840 }, { - "epoch": 1.05, - "learning_rate": 0.0001419487314023944, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.000218794601081961, + "loss": 0.0174, "step": 208850 }, { - "epoch": 1.05, - "learning_rate": 0.0001419411637093804, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.0002187907128655895, + "loss": 0.018, "step": 208860 }, { - "epoch": 1.05, - "learning_rate": 0.0001419335960163664, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.00021878682464921805, + "loss": 0.0189, "step": 208870 }, { - "epoch": 1.05, - "learning_rate": 0.00014192602832335238, - "loss": 0.0148, + "epoch": 0.54, + "learning_rate": 0.00021878293643284662, + "loss": 0.0184, "step": 208880 }, { - "epoch": 1.05, - "learning_rate": 0.00014191846063033836, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021877904821647514, + "loss": 0.0168, "step": 208890 }, { - "epoch": 1.05, - "learning_rate": 0.00014191089293732437, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021877516000010368, + "loss": 0.0174, "step": 208900 }, { - "epoch": 1.05, - "learning_rate": 0.00014190332524431035, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.0002187712717837322, + "loss": 0.0142, "step": 208910 }, { - "epoch": 1.05, - "learning_rate": 0.00014189575755129633, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.0002187673835673607, + "loss": 0.0185, "step": 208920 }, { - "epoch": 1.05, - "learning_rate": 0.00014188818985828234, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021876349535098928, + "loss": 0.0177, "step": 208930 }, { - "epoch": 1.05, - "learning_rate": 0.00014188062216526832, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021875960713461782, + "loss": 0.0166, "step": 208940 }, { - "epoch": 1.05, - "learning_rate": 0.0001418730544722543, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021875571891824633, + "loss": 0.0142, "step": 208950 }, { - "epoch": 1.05, - "learning_rate": 0.0001418654867792403, - "loss": 0.0115, + "epoch": 0.54, + "learning_rate": 0.00021875183070187488, + "loss": 0.0142, "step": 208960 }, { - "epoch": 1.05, - "learning_rate": 0.00014185791908622627, - "loss": 0.008, + "epoch": 0.54, + "learning_rate": 0.00021874794248550342, + "loss": 0.0184, "step": 208970 }, { - "epoch": 1.05, - "learning_rate": 0.00014185035139321228, - "loss": 0.0119, + "epoch": 0.54, + "learning_rate": 0.00021874405426913196, + "loss": 0.0192, "step": 208980 }, { - "epoch": 1.05, - "learning_rate": 0.00014184278370019826, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021874016605276047, + "loss": 0.0176, "step": 208990 }, { - "epoch": 1.05, - "learning_rate": 0.00014183521600718424, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021873627783638901, + "loss": 0.0197, "step": 209000 }, { - "epoch": 1.05, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.007373651955276728, - "eval_runtime": 116.5945, - "eval_samples_per_second": 17.153, - "eval_steps_per_second": 4.288, + "epoch": 0.54, + "eval_cer": 0.8817362776095881, + "eval_loss": 0.011807015165686607, + "eval_runtime": 107.3317, + "eval_samples_per_second": 18.634, + "eval_steps_per_second": 4.658, "step": 209000 }, { - "epoch": 1.05, - "learning_rate": 0.00014182764831417022, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021873238962001756, + "loss": 0.0188, "step": 209010 }, { - "epoch": 1.05, - "learning_rate": 0.00014182008062115623, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.0002187285014036461, + "loss": 0.016, "step": 209020 }, { - "epoch": 1.05, - "learning_rate": 0.0001418125129281422, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.0002187246131872746, + "loss": 0.0207, "step": 209030 }, { - "epoch": 1.05, - "learning_rate": 0.0001418049452351282, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021872072497090315, + "loss": 0.0159, "step": 209040 }, { - "epoch": 1.05, - "learning_rate": 0.0001417973775421142, - "loss": 0.0074, + "epoch": 0.54, + "learning_rate": 0.00021871683675453172, + "loss": 0.0173, "step": 209050 }, { - "epoch": 1.05, - "learning_rate": 0.00014178980984910018, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021871294853816024, + "loss": 0.0207, "step": 209060 }, { - "epoch": 1.05, - "learning_rate": 0.00014178224215608616, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021870906032178875, + "loss": 0.0154, "step": 209070 }, { - "epoch": 1.05, - "learning_rate": 0.00014177467446307217, - "loss": 0.013, + "epoch": 0.54, + "learning_rate": 0.0002187051721054173, + "loss": 0.0165, "step": 209080 }, { - "epoch": 1.05, - "learning_rate": 0.00014176710677005815, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021870128388904586, + "loss": 0.0142, "step": 209090 }, { - "epoch": 1.05, - "learning_rate": 0.00014175953907704414, - "loss": 0.011, + "epoch": 0.54, + "learning_rate": 0.00021869739567267438, + "loss": 0.0173, "step": 209100 }, { - "epoch": 1.05, - "learning_rate": 0.00014175197138403014, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021869350745630292, + "loss": 0.0206, "step": 209110 }, { - "epoch": 1.06, - "learning_rate": 0.00014174440369101613, - "loss": 0.0117, + "epoch": 0.54, + "learning_rate": 0.00021868961923993143, + "loss": 0.0246, "step": 209120 }, { - "epoch": 1.06, - "learning_rate": 0.0001417368359980021, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021868573102356, + "loss": 0.0159, "step": 209130 }, { - "epoch": 1.06, - "learning_rate": 0.00014172926830498812, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021868184280718852, + "loss": 0.0179, "step": 209140 }, { - "epoch": 1.06, - "learning_rate": 0.0001417217006119741, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021867795459081706, + "loss": 0.0208, "step": 209150 }, { - "epoch": 1.06, - "learning_rate": 0.00014171413291896008, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.00021867406637444557, + "loss": 0.0214, "step": 209160 }, { - "epoch": 1.06, - "learning_rate": 0.00014170656522594606, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021867017815807411, + "loss": 0.0167, "step": 209170 }, { - "epoch": 1.06, - "learning_rate": 0.00014169899753293207, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021866628994170266, + "loss": 0.0189, "step": 209180 }, { - "epoch": 1.06, - "learning_rate": 0.00014169142983991805, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002186624017253312, + "loss": 0.0188, "step": 209190 }, { - "epoch": 1.06, - "learning_rate": 0.00014168386214690403, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002186585135089597, + "loss": 0.0206, "step": 209200 }, { - "epoch": 1.06, - "learning_rate": 0.00014167629445389004, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021865462529258825, + "loss": 0.0254, "step": 209210 }, { - "epoch": 1.06, - "learning_rate": 0.00014166872676087602, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.0002186507370762168, + "loss": 0.0152, "step": 209220 }, { - "epoch": 1.06, - "learning_rate": 0.000141661159067862, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021864684885984534, + "loss": 0.0186, "step": 209230 }, { - "epoch": 1.06, - "learning_rate": 0.000141653591374848, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021864296064347385, + "loss": 0.0189, "step": 209240 }, { - "epoch": 1.06, - "learning_rate": 0.000141646023681834, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.0002186390724271024, + "loss": 0.0144, "step": 209250 }, { - "epoch": 1.06, - "learning_rate": 0.00014163845598881997, - "loss": 0.0073, + "epoch": 0.54, + "learning_rate": 0.00021863518421073096, + "loss": 0.0173, "step": 209260 }, { - "epoch": 1.06, - "learning_rate": 0.00014163088829580598, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021863129599435948, + "loss": 0.0169, "step": 209270 }, { - "epoch": 1.06, - "learning_rate": 0.00014162332060279196, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021862740777798802, + "loss": 0.0191, "step": 209280 }, { - "epoch": 1.06, - "learning_rate": 0.00014161575290977795, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021862351956161653, + "loss": 0.0184, "step": 209290 }, { - "epoch": 1.06, - "learning_rate": 0.00014160818521676395, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.0002186196313452451, + "loss": 0.0173, "step": 209300 }, { - "epoch": 1.06, - "learning_rate": 0.00014160061752374994, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021861574312887362, + "loss": 0.0209, "step": 209310 }, { - "epoch": 1.06, - "learning_rate": 0.00014159304983073592, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021861185491250216, + "loss": 0.0165, "step": 209320 }, { - "epoch": 1.06, - "learning_rate": 0.00014158548213772193, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021860796669613067, + "loss": 0.0151, "step": 209330 }, { - "epoch": 1.06, - "learning_rate": 0.0001415779144447079, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021860407847975924, + "loss": 0.0145, "step": 209340 }, { - "epoch": 1.06, - "learning_rate": 0.0001415703467516939, - "loss": 0.0123, + "epoch": 0.54, + "learning_rate": 0.00021860019026338776, + "loss": 0.0229, "step": 209350 }, { - "epoch": 1.06, - "learning_rate": 0.00014156277905867987, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.0002185963020470163, + "loss": 0.0176, "step": 209360 }, { - "epoch": 1.06, - "learning_rate": 0.00014155521136566588, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.0002185924138306448, + "loss": 0.0174, "step": 209370 }, { - "epoch": 1.06, - "learning_rate": 0.00014154764367265186, - "loss": 0.0084, + "epoch": 0.54, + "learning_rate": 0.00021858852561427338, + "loss": 0.0163, "step": 209380 }, { - "epoch": 1.06, - "learning_rate": 0.00014154007597963784, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.0002185846373979019, + "loss": 0.0155, "step": 209390 }, { - "epoch": 1.06, - "learning_rate": 0.00014153250828662385, - "loss": 0.0075, + "epoch": 0.54, + "learning_rate": 0.00021858074918153044, + "loss": 0.0176, "step": 209400 }, { - "epoch": 1.06, - "learning_rate": 0.00014152494059360983, - "loss": 0.0126, + "epoch": 0.54, + "learning_rate": 0.00021857686096515895, + "loss": 0.0187, "step": 209410 }, { - "epoch": 1.06, - "learning_rate": 0.0001415173729005958, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.0002185729727487875, + "loss": 0.0198, "step": 209420 }, { - "epoch": 1.06, - "learning_rate": 0.00014150980520758182, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021856908453241606, + "loss": 0.0155, "step": 209430 }, { - "epoch": 1.06, - "learning_rate": 0.0001415022375145678, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021856519631604458, + "loss": 0.0188, "step": 209440 }, { - "epoch": 1.06, - "learning_rate": 0.00014149466982155378, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021856130809967312, + "loss": 0.0175, "step": 209450 }, { - "epoch": 1.06, - "learning_rate": 0.0001414871021285398, - "loss": 0.0138, + "epoch": 0.54, + "learning_rate": 0.00021855741988330163, + "loss": 0.0162, "step": 209460 }, { - "epoch": 1.06, - "learning_rate": 0.00014147953443552577, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.0002185535316669302, + "loss": 0.016, "step": 209470 }, { - "epoch": 1.06, - "learning_rate": 0.00014147196674251176, - "loss": 0.0156, + "epoch": 0.54, + "learning_rate": 0.00021854964345055872, + "loss": 0.0132, "step": 209480 }, { - "epoch": 1.06, - "learning_rate": 0.00014146439904949776, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021854575523418726, + "loss": 0.0118, "step": 209490 }, { - "epoch": 1.06, - "learning_rate": 0.00014145683135648375, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021854186701781577, + "loss": 0.0187, "step": 209500 }, { - "epoch": 1.06, - "learning_rate": 0.00014144926366346973, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021853797880144434, + "loss": 0.0108, "step": 209510 }, { - "epoch": 1.06, - "learning_rate": 0.0001414416959704557, - "loss": 0.0106, + "epoch": 0.54, + "learning_rate": 0.00021853409058507285, + "loss": 0.0167, "step": 209520 }, { - "epoch": 1.06, - "learning_rate": 0.00014143412827744172, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002185302023687014, + "loss": 0.0128, "step": 209530 }, { - "epoch": 1.06, - "learning_rate": 0.0001414265605844277, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.0002185263141523299, + "loss": 0.0185, "step": 209540 }, { - "epoch": 1.06, - "learning_rate": 0.00014141899289141368, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021852242593595848, + "loss": 0.0115, "step": 209550 }, { - "epoch": 1.06, - "learning_rate": 0.0001414114251983997, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.000218518537719587, + "loss": 0.0183, "step": 209560 }, { - "epoch": 1.06, - "learning_rate": 0.00014140385750538567, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021851464950321554, + "loss": 0.0164, "step": 209570 }, { - "epoch": 1.06, - "learning_rate": 0.00014139628981237165, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021851076128684405, + "loss": 0.0231, "step": 209580 }, { - "epoch": 1.06, - "learning_rate": 0.00014138872211935763, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021850687307047262, + "loss": 0.0159, "step": 209590 }, { - "epoch": 1.06, - "learning_rate": 0.00014138115442634361, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021850298485410116, + "loss": 0.0175, "step": 209600 }, { - "epoch": 1.06, - "learning_rate": 0.00014137358673332962, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021849909663772968, + "loss": 0.0158, "step": 209610 }, { - "epoch": 1.06, - "learning_rate": 0.0001413660190403156, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021849520842135822, + "loss": 0.0196, "step": 209620 }, { - "epoch": 1.06, - "learning_rate": 0.00014135845134730159, - "loss": 0.009, + "epoch": 0.54, + "learning_rate": 0.00021849132020498676, + "loss": 0.0139, "step": 209630 }, { - "epoch": 1.06, - "learning_rate": 0.0001413508836542876, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.0002184874319886153, + "loss": 0.0198, "step": 209640 }, { - "epoch": 1.06, - "learning_rate": 0.00014134331596127358, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021848354377224381, + "loss": 0.0157, "step": 209650 }, { - "epoch": 1.06, - "learning_rate": 0.00014133574826825956, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021847965555587236, + "loss": 0.0227, "step": 209660 }, { - "epoch": 1.06, - "learning_rate": 0.00014132818057524557, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021847576733950087, + "loss": 0.0155, "step": 209670 }, { - "epoch": 1.06, - "learning_rate": 0.00014132061288223155, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.00021847187912312944, + "loss": 0.0142, "step": 209680 }, { - "epoch": 1.06, - "learning_rate": 0.00014131304518921753, - "loss": 0.0107, + "epoch": 0.54, + "learning_rate": 0.00021846799090675795, + "loss": 0.0161, "step": 209690 }, { - "epoch": 1.06, - "learning_rate": 0.0001413054774962035, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.0002184641026903865, + "loss": 0.0183, "step": 209700 }, { - "epoch": 1.06, - "learning_rate": 0.00014129790980318952, - "loss": 0.0076, + "epoch": 0.54, + "learning_rate": 0.000218460214474015, + "loss": 0.0166, "step": 209710 }, { - "epoch": 1.06, - "learning_rate": 0.0001412903421101755, - "loss": 0.0125, + "epoch": 0.54, + "learning_rate": 0.00021845632625764358, + "loss": 0.0193, "step": 209720 }, { - "epoch": 1.06, - "learning_rate": 0.00014128277441716148, - "loss": 0.0078, + "epoch": 0.54, + "learning_rate": 0.0002184524380412721, + "loss": 0.0155, "step": 209730 }, { - "epoch": 1.06, - "learning_rate": 0.0001412752067241475, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021844854982490064, + "loss": 0.0175, "step": 209740 }, { - "epoch": 1.06, - "learning_rate": 0.00014126763903113347, - "loss": 0.0124, + "epoch": 0.54, + "learning_rate": 0.00021844466160852915, + "loss": 0.016, "step": 209750 }, { - "epoch": 1.06, - "learning_rate": 0.00014126007133811945, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021844077339215772, + "loss": 0.0167, "step": 209760 }, { - "epoch": 1.06, - "learning_rate": 0.00014125250364510546, - "loss": 0.0086, + "epoch": 0.54, + "learning_rate": 0.00021843688517578626, + "loss": 0.0127, "step": 209770 }, { - "epoch": 1.06, - "learning_rate": 0.00014124493595209144, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021843299695941477, + "loss": 0.0161, "step": 209780 }, { - "epoch": 1.06, - "learning_rate": 0.00014123736825907742, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.0002184291087430433, + "loss": 0.015, "step": 209790 }, { - "epoch": 1.06, - "learning_rate": 0.00014122980056606343, - "loss": 0.0079, + "epoch": 0.54, + "learning_rate": 0.00021842522052667186, + "loss": 0.0151, "step": 209800 }, { - "epoch": 1.06, - "learning_rate": 0.00014122223287304941, - "loss": 0.0103, + "epoch": 0.54, + "learning_rate": 0.0002184213323103004, + "loss": 0.0123, "step": 209810 }, { - "epoch": 1.06, - "learning_rate": 0.0001412146651800354, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021841744409392891, + "loss": 0.0175, "step": 209820 }, { - "epoch": 1.06, - "learning_rate": 0.0001412070974870214, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.00021841355587755746, + "loss": 0.0197, "step": 209830 }, { - "epoch": 1.06, - "learning_rate": 0.00014119952979400739, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.000218409667661186, + "loss": 0.0215, "step": 209840 }, { - "epoch": 1.06, - "learning_rate": 0.00014119196210099337, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021840577944481454, + "loss": 0.0196, "step": 209850 }, { - "epoch": 1.06, - "learning_rate": 0.00014118439440797938, - "loss": 0.0099, + "epoch": 0.54, + "learning_rate": 0.00021840189122844305, + "loss": 0.0145, "step": 209860 }, { - "epoch": 1.06, - "learning_rate": 0.00014117682671496536, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002183980030120716, + "loss": 0.0141, "step": 209870 }, { - "epoch": 1.06, - "learning_rate": 0.00014116925902195134, - "loss": 0.0096, + "epoch": 0.54, + "learning_rate": 0.00021839411479570014, + "loss": 0.0181, "step": 209880 }, { - "epoch": 1.06, - "learning_rate": 0.00014116169132893732, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021839022657932868, + "loss": 0.0124, "step": 209890 }, { - "epoch": 1.06, - "learning_rate": 0.00014115412363592333, - "loss": 0.0088, + "epoch": 0.54, + "learning_rate": 0.0002183863383629572, + "loss": 0.0185, "step": 209900 }, { - "epoch": 1.06, - "learning_rate": 0.0001411465559429093, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021838245014658573, + "loss": 0.0191, "step": 209910 }, { - "epoch": 1.06, - "learning_rate": 0.0001411389882498953, - "loss": 0.0077, + "epoch": 0.54, + "learning_rate": 0.00021837856193021425, + "loss": 0.0193, "step": 209920 }, { - "epoch": 1.06, - "learning_rate": 0.0001411314205568813, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.00021837467371384282, + "loss": 0.0153, "step": 209930 }, { - "epoch": 1.06, - "learning_rate": 0.00014112385286386728, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021837078549747133, + "loss": 0.014, "step": 209940 }, { - "epoch": 1.06, - "learning_rate": 0.00014111628517085326, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.00021836689728109987, + "loss": 0.0179, "step": 209950 }, { - "epoch": 1.06, - "learning_rate": 0.00014110871747783927, - "loss": 0.0087, + "epoch": 0.54, + "learning_rate": 0.0002183630090647284, + "loss": 0.0153, "step": 209960 }, { - "epoch": 1.06, - "learning_rate": 0.00014110114978482525, - "loss": 0.0097, + "epoch": 0.54, + "learning_rate": 0.00021835912084835696, + "loss": 0.0175, "step": 209970 }, { - "epoch": 1.06, - "learning_rate": 0.00014109358209181123, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.0002183552326319855, + "loss": 0.0163, "step": 209980 }, { - "epoch": 1.06, - "learning_rate": 0.00014108601439879724, - "loss": 0.0225, + "epoch": 0.54, + "learning_rate": 0.000218351344415614, + "loss": 0.0202, "step": 209990 }, { - "epoch": 1.06, - "learning_rate": 0.00014107844670578322, - "loss": 0.0091, + "epoch": 0.54, + "learning_rate": 0.00021834745619924256, + "loss": 0.0165, "step": 210000 }, { - "epoch": 1.06, - "eval_cer": 0.9144906342217957, - "eval_loss": 0.007647486869245768, - "eval_runtime": 116.648, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.286, + "epoch": 0.54, + "eval_cer": 0.8817362776095881, + "eval_loss": 0.011167431250214577, + "eval_runtime": 108.0029, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.63, "step": 210000 }, { - "epoch": 1.06, - "learning_rate": 0.0001410708790127692, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.0002183435679828711, + "loss": 0.018, "step": 210010 }, { - "epoch": 1.06, - "learning_rate": 0.00014106331131975521, - "loss": 0.0083, + "epoch": 0.54, + "learning_rate": 0.00021833967976649964, + "loss": 0.0149, "step": 210020 }, { - "epoch": 1.06, - "learning_rate": 0.0001410557436267412, - "loss": 0.0113, + "epoch": 0.54, + "learning_rate": 0.00021833579155012815, + "loss": 0.016, "step": 210030 }, { - "epoch": 1.06, - "learning_rate": 0.00014104817593372718, - "loss": 0.0092, + "epoch": 0.54, + "learning_rate": 0.0002183319033337567, + "loss": 0.0151, "step": 210040 }, { - "epoch": 1.06, - "learning_rate": 0.00014104060824071316, - "loss": 0.0101, + "epoch": 0.54, + "learning_rate": 0.00021832801511738524, + "loss": 0.0152, "step": 210050 }, { - "epoch": 1.06, - "learning_rate": 0.00014103304054769917, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021832412690101378, + "loss": 0.019, "step": 210060 }, { - "epoch": 1.06, - "learning_rate": 0.00014102547285468515, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.0002183202386846423, + "loss": 0.0211, "step": 210070 }, { - "epoch": 1.06, - "learning_rate": 0.00014101790516167113, - "loss": 0.0081, + "epoch": 0.54, + "learning_rate": 0.00021831635046827083, + "loss": 0.0162, "step": 210080 }, { - "epoch": 1.06, - "learning_rate": 0.00014101033746865714, - "loss": 0.0111, + "epoch": 0.54, + "learning_rate": 0.0002183124622518994, + "loss": 0.0307, "step": 210090 }, { - "epoch": 1.06, - "learning_rate": 0.00014100276977564312, - "loss": 0.0109, + "epoch": 0.54, + "learning_rate": 0.00021830857403552792, + "loss": 0.0206, "step": 210100 }, { - "epoch": 1.06, - "learning_rate": 0.0001409952020826291, - "loss": 0.0108, + "epoch": 0.54, + "learning_rate": 0.00021830468581915643, + "loss": 0.0198, "step": 210110 }, { - "epoch": 1.06, - "learning_rate": 0.0001409876343896151, - "loss": 0.0102, + "epoch": 0.54, + "learning_rate": 0.00021830079760278497, + "loss": 0.0153, "step": 210120 }, { - "epoch": 1.06, - "learning_rate": 0.0001409800666966011, - "loss": 0.0094, + "epoch": 0.54, + "learning_rate": 0.00021829690938641354, + "loss": 0.014, "step": 210130 }, { - "epoch": 1.06, - "learning_rate": 0.00014097249900358707, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.00021829302117004206, + "loss": 0.0169, "step": 210140 }, { - "epoch": 1.06, - "learning_rate": 0.00014096493131057308, - "loss": 0.0104, + "epoch": 0.54, + "learning_rate": 0.0002182891329536706, + "loss": 0.0287, "step": 210150 }, { - "epoch": 1.06, - "learning_rate": 0.00014095736361755906, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.0002182852447372991, + "loss": 0.0176, "step": 210160 }, { - "epoch": 1.06, - "learning_rate": 0.00014094979592454504, - "loss": 0.0112, + "epoch": 0.54, + "learning_rate": 0.00021828135652092765, + "loss": 0.0178, "step": 210170 }, { - "epoch": 1.06, - "learning_rate": 0.00014094222823153105, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002182774683045562, + "loss": 0.0176, "step": 210180 }, { - "epoch": 1.06, - "learning_rate": 0.00014093466053851703, - "loss": 0.0105, + "epoch": 0.54, + "learning_rate": 0.00021827358008818474, + "loss": 0.0193, "step": 210190 }, { - "epoch": 1.06, - "learning_rate": 0.00014092709284550302, - "loss": 0.0095, + "epoch": 0.54, + "learning_rate": 0.00021826969187181325, + "loss": 0.0175, "step": 210200 }, { - "epoch": 1.06, - "learning_rate": 0.000140919525152489, - "loss": 0.0093, + "epoch": 0.54, + "learning_rate": 0.0002182658036554418, + "loss": 0.0181, "step": 210210 }, { - "epoch": 1.06, - "learning_rate": 0.00014091195745947498, - "loss": 0.0089, + "epoch": 0.54, + "learning_rate": 0.00021826191543907034, + "loss": 0.0207, "step": 210220 }, { - "epoch": 1.06, - "learning_rate": 0.000140904389766461, - "loss": 0.0156, + "epoch": 0.54, + "learning_rate": 0.00021825802722269888, + "loss": 0.0158, "step": 210230 }, { - "epoch": 1.06, - "learning_rate": 0.00014089682207344697, - "loss": 0.0098, + "epoch": 0.54, + "learning_rate": 0.0002182541390063274, + "loss": 0.0178, "step": 210240 }, { - "epoch": 1.06, - "learning_rate": 0.00014088925438043295, - "loss": 0.01, + "epoch": 0.54, + "learning_rate": 0.00021825025078995593, + "loss": 0.0141, "step": 210250 }, { - "epoch": 1.06, - "learning_rate": 0.00014088168668741893, - "loss": 0.0125, + "epoch": 0.55, + "learning_rate": 0.00021824636257358448, + "loss": 0.0158, "step": 210260 }, { - "epoch": 1.06, - "learning_rate": 0.00014087411899440494, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021824247435721302, + "loss": 0.0184, "step": 210270 }, { - "epoch": 1.06, - "learning_rate": 0.00014086655130139092, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021823858614084153, + "loss": 0.0175, "step": 210280 }, { - "epoch": 1.06, - "learning_rate": 0.0001408589836083769, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021823469792447007, + "loss": 0.015, "step": 210290 }, { - "epoch": 1.06, - "learning_rate": 0.0001408514159153629, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.00021823080970809864, + "loss": 0.0178, "step": 210300 }, { - "epoch": 1.06, - "learning_rate": 0.0001408438482223489, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021822692149172716, + "loss": 0.022, "step": 210310 }, { - "epoch": 1.06, - "learning_rate": 0.00014083628052933487, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.0002182230332753557, + "loss": 0.016, "step": 210320 }, { - "epoch": 1.06, - "learning_rate": 0.00014082871283632088, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.0002182191450589842, + "loss": 0.0162, "step": 210330 }, { - "epoch": 1.06, - "learning_rate": 0.00014082114514330686, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021821525684261278, + "loss": 0.0184, "step": 210340 }, { - "epoch": 1.06, - "learning_rate": 0.00014081357745029285, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.0002182113686262413, + "loss": 0.0161, "step": 210350 }, { - "epoch": 1.06, - "learning_rate": 0.00014080600975727885, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021820748040986984, + "loss": 0.0178, "step": 210360 }, { - "epoch": 1.06, - "learning_rate": 0.00014079844206426484, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.00021820359219349835, + "loss": 0.0171, "step": 210370 }, { - "epoch": 1.06, - "learning_rate": 0.00014079087437125082, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021819970397712692, + "loss": 0.0232, "step": 210380 }, { - "epoch": 1.06, - "learning_rate": 0.00014078330667823683, - "loss": 0.0134, + "epoch": 0.55, + "learning_rate": 0.00021819581576075543, + "loss": 0.0169, "step": 210390 }, { - "epoch": 1.06, - "learning_rate": 0.0001407757389852228, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021819192754438398, + "loss": 0.0153, "step": 210400 }, { - "epoch": 1.06, - "learning_rate": 0.0001407681712922088, - "loss": 0.0121, + "epoch": 0.55, + "learning_rate": 0.0002181880393280125, + "loss": 0.0244, "step": 210410 }, { - "epoch": 1.06, - "learning_rate": 0.00014076060359919477, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021818415111164103, + "loss": 0.0186, "step": 210420 }, { - "epoch": 1.06, - "learning_rate": 0.00014075303590618078, - "loss": 0.0126, + "epoch": 0.55, + "learning_rate": 0.00021818026289526957, + "loss": 0.0306, "step": 210430 }, { - "epoch": 1.06, - "learning_rate": 0.00014074546821316676, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021817637467889812, + "loss": 0.0153, "step": 210440 }, { - "epoch": 1.06, - "learning_rate": 0.00014073790052015274, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021817248646252663, + "loss": 0.0207, "step": 210450 }, { - "epoch": 1.06, - "learning_rate": 0.00014073033282713875, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021816859824615517, + "loss": 0.0149, "step": 210460 }, { - "epoch": 1.06, - "learning_rate": 0.00014072276513412473, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021816471002978374, + "loss": 0.0227, "step": 210470 }, { - "epoch": 1.06, - "learning_rate": 0.0001407151974411107, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021816082181341226, + "loss": 0.0203, "step": 210480 }, { - "epoch": 1.06, - "learning_rate": 0.00014070762974809672, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002181569335970408, + "loss": 0.0188, "step": 210490 }, { - "epoch": 1.06, - "learning_rate": 0.0001407000620550827, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.0002181530453806693, + "loss": 0.0183, "step": 210500 }, { - "epoch": 1.06, - "learning_rate": 0.00014069249436206868, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021814915716429788, + "loss": 0.0183, "step": 210510 }, { - "epoch": 1.06, - "learning_rate": 0.0001406849266690547, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002181452689479264, + "loss": 0.0127, "step": 210520 }, { - "epoch": 1.06, - "learning_rate": 0.00014067735897604067, - "loss": 0.013, + "epoch": 0.55, + "learning_rate": 0.00021814138073155494, + "loss": 0.0204, "step": 210530 }, { - "epoch": 1.06, - "learning_rate": 0.00014066979128302666, - "loss": 0.0165, + "epoch": 0.55, + "learning_rate": 0.00021813749251518345, + "loss": 0.0157, "step": 210540 }, { - "epoch": 1.06, - "learning_rate": 0.00014066222359001266, - "loss": 0.0072, + "epoch": 0.55, + "learning_rate": 0.00021813360429881202, + "loss": 0.0172, "step": 210550 }, { - "epoch": 1.06, - "learning_rate": 0.00014065465589699865, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021812971608244053, + "loss": 0.0163, "step": 210560 }, { - "epoch": 1.06, - "learning_rate": 0.00014064708820398463, - "loss": 0.0121, + "epoch": 0.55, + "learning_rate": 0.00021812582786606908, + "loss": 0.0155, "step": 210570 }, { - "epoch": 1.06, - "learning_rate": 0.0001406395205109706, - "loss": 0.015, + "epoch": 0.55, + "learning_rate": 0.0002181219396496976, + "loss": 0.0176, "step": 210580 }, { - "epoch": 1.06, - "learning_rate": 0.00014063195281795662, - "loss": 0.0078, + "epoch": 0.55, + "learning_rate": 0.00021811805143332616, + "loss": 0.0161, "step": 210590 }, { - "epoch": 1.06, - "learning_rate": 0.0001406243851249426, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021811416321695467, + "loss": 0.0155, "step": 210600 }, { - "epoch": 1.06, - "learning_rate": 0.00014061681743192858, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021811027500058322, + "loss": 0.0162, "step": 210610 }, { - "epoch": 1.06, - "learning_rate": 0.0001406092497389146, - "loss": 0.014, + "epoch": 0.55, + "learning_rate": 0.00021810638678421173, + "loss": 0.0199, "step": 210620 }, { - "epoch": 1.06, - "learning_rate": 0.00014060168204590057, - "loss": 0.0131, + "epoch": 0.55, + "learning_rate": 0.0002181024985678403, + "loss": 0.0205, "step": 210630 }, { - "epoch": 1.06, - "learning_rate": 0.00014059411435288655, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021809861035146884, + "loss": 0.0201, "step": 210640 }, { - "epoch": 1.06, - "learning_rate": 0.00014058654665987256, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021809472213509735, + "loss": 0.0118, "step": 210650 }, { - "epoch": 1.06, - "learning_rate": 0.00014057897896685854, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021809083391872587, + "loss": 0.0191, "step": 210660 }, { - "epoch": 1.06, - "learning_rate": 0.00014057141127384452, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.0002180869457023544, + "loss": 0.0165, "step": 210670 }, { - "epoch": 1.06, - "learning_rate": 0.00014056384358083053, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.00021808305748598298, + "loss": 0.0153, "step": 210680 }, { - "epoch": 1.06, - "learning_rate": 0.0001405562758878165, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002180791692696115, + "loss": 0.0127, "step": 210690 }, { - "epoch": 1.06, - "learning_rate": 0.0001405487081948025, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021807528105324004, + "loss": 0.0164, "step": 210700 }, { - "epoch": 1.06, - "learning_rate": 0.0001405411405017885, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021807139283686855, + "loss": 0.0138, "step": 210710 }, { - "epoch": 1.06, - "learning_rate": 0.00014053357280877448, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021806750462049712, + "loss": 0.0207, "step": 210720 }, { - "epoch": 1.06, - "learning_rate": 0.00014052600511576047, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021806361640412563, + "loss": 0.0201, "step": 210730 }, { - "epoch": 1.06, - "learning_rate": 0.00014051843742274645, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.00021805972818775418, + "loss": 0.0181, "step": 210740 }, { - "epoch": 1.06, - "learning_rate": 0.00014051086972973246, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.0002180558399713827, + "loss": 0.0206, "step": 210750 }, { - "epoch": 1.06, - "learning_rate": 0.00014050330203671844, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021805195175501126, + "loss": 0.0131, "step": 210760 }, { - "epoch": 1.06, - "learning_rate": 0.00014049573434370442, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021804806353863977, + "loss": 0.0141, "step": 210770 }, { - "epoch": 1.06, - "learning_rate": 0.00014048816665069043, - "loss": 0.0125, + "epoch": 0.55, + "learning_rate": 0.00021804417532226831, + "loss": 0.0152, "step": 210780 }, { - "epoch": 1.06, - "learning_rate": 0.0001404805989576764, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021804028710589683, + "loss": 0.0172, "step": 210790 }, { - "epoch": 1.06, - "learning_rate": 0.0001404730312646624, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.0002180363988895254, + "loss": 0.0206, "step": 210800 }, { - "epoch": 1.06, - "learning_rate": 0.0001404654635716484, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.0002180325106731539, + "loss": 0.0148, "step": 210810 }, { - "epoch": 1.06, - "learning_rate": 0.00014045789587863438, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021802862245678245, + "loss": 0.0201, "step": 210820 }, { - "epoch": 1.06, - "learning_rate": 0.00014045032818562036, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021802473424041097, + "loss": 0.0172, "step": 210830 }, { - "epoch": 1.06, - "learning_rate": 0.00014044276049260637, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021802084602403954, + "loss": 0.0144, "step": 210840 }, { - "epoch": 1.06, - "learning_rate": 0.00014043519279959232, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021801695780766808, + "loss": 0.0207, "step": 210850 }, { - "epoch": 1.06, - "learning_rate": 0.00014042762510657833, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.0002180130695912966, + "loss": 0.0167, "step": 210860 }, { - "epoch": 1.06, - "learning_rate": 0.00014042005741356431, - "loss": 0.0128, + "epoch": 0.55, + "learning_rate": 0.00021800918137492514, + "loss": 0.0239, "step": 210870 }, { - "epoch": 1.06, - "learning_rate": 0.0001404124897205503, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021800529315855368, + "loss": 0.017, "step": 210880 }, { - "epoch": 1.06, - "learning_rate": 0.0001404049220275363, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021800140494218222, + "loss": 0.017, "step": 210890 }, { - "epoch": 1.06, - "learning_rate": 0.00014039735433452229, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021799751672581073, + "loss": 0.0154, "step": 210900 }, { - "epoch": 1.06, - "learning_rate": 0.00014038978664150827, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021799362850943927, + "loss": 0.0132, "step": 210910 }, { - "epoch": 1.06, - "learning_rate": 0.00014038221894849428, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.0002179897402930678, + "loss": 0.0162, "step": 210920 }, { - "epoch": 1.06, - "learning_rate": 0.00014037465125548026, - "loss": 0.0076, + "epoch": 0.55, + "learning_rate": 0.00021798585207669636, + "loss": 0.0175, "step": 210930 }, { - "epoch": 1.06, - "learning_rate": 0.00014036708356246624, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021798196386032487, + "loss": 0.0119, "step": 210940 }, { - "epoch": 1.06, - "learning_rate": 0.00014035951586945222, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021797807564395341, + "loss": 0.0165, "step": 210950 }, { - "epoch": 1.06, - "learning_rate": 0.00014035194817643823, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021797418742758193, + "loss": 0.0221, "step": 210960 }, { - "epoch": 1.06, - "learning_rate": 0.0001403443804834242, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.0002179702992112105, + "loss": 0.0133, "step": 210970 }, { - "epoch": 1.06, - "learning_rate": 0.0001403368127904102, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.000217966410994839, + "loss": 0.0173, "step": 210980 }, { - "epoch": 1.06, - "learning_rate": 0.0001403292450973962, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021796252277846755, + "loss": 0.0183, "step": 210990 }, { - "epoch": 1.06, - "learning_rate": 0.00014032167740438218, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.00021795863456209607, + "loss": 0.015, "step": 211000 }, { - "epoch": 1.06, - "eval_cer": 0.9144489071884033, - "eval_loss": 0.007559832185506821, - "eval_runtime": 116.7132, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.55, + "eval_cer": 0.8817600714374692, + "eval_loss": 0.011309986002743244, + "eval_runtime": 107.7403, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, "step": 211000 }, { - "epoch": 1.06, - "learning_rate": 0.00014031410971136816, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021795474634572464, + "loss": 0.016, "step": 211010 }, { - "epoch": 1.06, - "learning_rate": 0.00014030654201835417, - "loss": 0.007, + "epoch": 0.55, + "learning_rate": 0.00021795085812935318, + "loss": 0.0133, "step": 211020 }, { - "epoch": 1.06, - "learning_rate": 0.00014029897432534015, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002179469699129817, + "loss": 0.0176, "step": 211030 }, { - "epoch": 1.06, - "learning_rate": 0.00014029140663232613, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021794308169661023, + "loss": 0.0176, "step": 211040 }, { - "epoch": 1.06, - "learning_rate": 0.00014028383893931214, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021793919348023878, + "loss": 0.0149, "step": 211050 }, { - "epoch": 1.06, - "learning_rate": 0.00014027627124629812, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021793530526386732, + "loss": 0.02, "step": 211060 }, { - "epoch": 1.06, - "learning_rate": 0.0001402687035532841, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021793141704749583, + "loss": 0.0199, "step": 211070 }, { - "epoch": 1.06, - "learning_rate": 0.00014026113586027011, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021792752883112437, + "loss": 0.019, "step": 211080 }, { - "epoch": 1.06, - "learning_rate": 0.0001402535681672561, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021792364061475292, + "loss": 0.0177, "step": 211090 }, { - "epoch": 1.07, - "learning_rate": 0.00014024600047424208, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021791975239838146, + "loss": 0.019, "step": 211100 }, { - "epoch": 1.07, - "learning_rate": 0.00014023843278122806, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.00021791586418200997, + "loss": 0.022, "step": 211110 }, { - "epoch": 1.07, - "learning_rate": 0.00014023086508821407, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021791197596563851, + "loss": 0.0188, "step": 211120 }, { - "epoch": 1.07, - "learning_rate": 0.00014022329739520005, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021790808774926706, + "loss": 0.017, "step": 211130 }, { - "epoch": 1.07, - "learning_rate": 0.00014021572970218603, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002179041995328956, + "loss": 0.0182, "step": 211140 }, { - "epoch": 1.07, - "learning_rate": 0.00014020816200917204, - "loss": 0.0081, + "epoch": 0.55, + "learning_rate": 0.0002179003113165241, + "loss": 0.0125, "step": 211150 }, { - "epoch": 1.07, - "learning_rate": 0.00014020059431615802, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021789642310015265, + "loss": 0.0171, "step": 211160 }, { - "epoch": 1.07, - "learning_rate": 0.000140193026623144, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021789253488378117, + "loss": 0.0148, "step": 211170 }, { - "epoch": 1.07, - "learning_rate": 0.00014018545893013, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.00021788864666740974, + "loss": 0.0191, "step": 211180 }, { - "epoch": 1.07, - "learning_rate": 0.000140177891237116, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021788475845103828, + "loss": 0.0156, "step": 211190 }, { - "epoch": 1.07, - "learning_rate": 0.00014017032354410197, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002178808702346668, + "loss": 0.0189, "step": 211200 }, { - "epoch": 1.07, - "learning_rate": 0.00014016275585108798, - "loss": 0.0076, + "epoch": 0.55, + "learning_rate": 0.00021787698201829533, + "loss": 0.0165, "step": 211210 }, { - "epoch": 1.07, - "learning_rate": 0.00014015518815807396, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021787309380192388, + "loss": 0.0203, "step": 211220 }, { - "epoch": 1.07, - "learning_rate": 0.00014014762046505994, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021786920558555242, + "loss": 0.0145, "step": 211230 }, { - "epoch": 1.07, - "learning_rate": 0.00014014005277204595, - "loss": 0.0172, + "epoch": 0.55, + "learning_rate": 0.00021786531736918093, + "loss": 0.017, "step": 211240 }, { - "epoch": 1.07, - "learning_rate": 0.00014013248507903193, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021786142915280947, + "loss": 0.0188, "step": 211250 }, { - "epoch": 1.07, - "learning_rate": 0.00014012491738601792, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021785754093643802, + "loss": 0.0156, "step": 211260 }, { - "epoch": 1.07, - "learning_rate": 0.00014011734969300392, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021785365272006656, + "loss": 0.0145, "step": 211270 }, { - "epoch": 1.07, - "learning_rate": 0.0001401097819999899, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021784976450369507, + "loss": 0.015, "step": 211280 }, { - "epoch": 1.07, - "learning_rate": 0.0001401022143069759, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.0002178458762873236, + "loss": 0.0171, "step": 211290 }, { - "epoch": 1.07, - "learning_rate": 0.00014009464661396187, - "loss": 0.013, + "epoch": 0.55, + "learning_rate": 0.00021784198807095215, + "loss": 0.0158, "step": 211300 }, { - "epoch": 1.07, - "learning_rate": 0.00014008707892094788, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002178380998545807, + "loss": 0.016, "step": 211310 }, { - "epoch": 1.07, - "learning_rate": 0.00014007951122793386, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.0002178342116382092, + "loss": 0.021, "step": 211320 }, { - "epoch": 1.07, - "learning_rate": 0.00014007194353491984, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021783032342183775, + "loss": 0.0162, "step": 211330 }, { - "epoch": 1.07, - "learning_rate": 0.00014006437584190585, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.00021782643520546632, + "loss": 0.018, "step": 211340 }, { - "epoch": 1.07, - "learning_rate": 0.00014005680814889183, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021782254698909484, + "loss": 0.0149, "step": 211350 }, { - "epoch": 1.07, - "learning_rate": 0.0001400492404558778, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021781865877272338, + "loss": 0.0185, "step": 211360 }, { - "epoch": 1.07, - "learning_rate": 0.00014004167276286382, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.0002178147705563519, + "loss": 0.0177, "step": 211370 }, { - "epoch": 1.07, - "learning_rate": 0.0001400341050698498, - "loss": 0.0115, + "epoch": 0.55, + "learning_rate": 0.00021781088233998046, + "loss": 0.0128, "step": 211380 }, { - "epoch": 1.07, - "learning_rate": 0.00014002653737683578, - "loss": 0.007, + "epoch": 0.55, + "learning_rate": 0.00021780699412360898, + "loss": 0.018, "step": 211390 }, { - "epoch": 1.07, - "learning_rate": 0.0001400189696838218, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021780310590723752, + "loss": 0.0176, "step": 211400 }, { - "epoch": 1.07, - "learning_rate": 0.00014001140199080777, - "loss": 0.0162, + "epoch": 0.55, + "learning_rate": 0.00021779921769086603, + "loss": 0.0137, "step": 211410 }, { - "epoch": 1.07, - "learning_rate": 0.00014000383429779375, - "loss": 0.0088, + "epoch": 0.55, + "learning_rate": 0.00021779532947449457, + "loss": 0.0185, "step": 211420 }, { - "epoch": 1.07, - "learning_rate": 0.00013999626660477976, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021779144125812311, + "loss": 0.0161, "step": 211430 }, { - "epoch": 1.07, - "learning_rate": 0.00013998869891176574, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021778755304175166, + "loss": 0.0161, "step": 211440 }, { - "epoch": 1.07, - "learning_rate": 0.00013998113121875173, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021778366482538017, + "loss": 0.0195, "step": 211450 }, { - "epoch": 1.07, - "learning_rate": 0.0001399735635257377, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002177797766090087, + "loss": 0.0153, "step": 211460 }, { - "epoch": 1.07, - "learning_rate": 0.00013996599583272372, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021777588839263725, + "loss": 0.0148, "step": 211470 }, { - "epoch": 1.07, - "learning_rate": 0.00013995842813970967, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002177720001762658, + "loss": 0.0186, "step": 211480 }, { - "epoch": 1.07, - "learning_rate": 0.00013995086044669568, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.0002177681119598943, + "loss": 0.0162, "step": 211490 }, { - "epoch": 1.07, - "learning_rate": 0.00013994329275368166, - "loss": 0.0121, + "epoch": 0.55, + "learning_rate": 0.00021776422374352285, + "loss": 0.0173, "step": 211500 }, { - "epoch": 1.07, - "learning_rate": 0.00013993572506066764, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021776033552715142, + "loss": 0.0184, "step": 211510 }, { - "epoch": 1.07, - "learning_rate": 0.00013992815736765365, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021775644731077994, + "loss": 0.0148, "step": 211520 }, { - "epoch": 1.07, - "learning_rate": 0.00013992058967463963, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021775255909440845, + "loss": 0.0192, "step": 211530 }, { - "epoch": 1.07, - "learning_rate": 0.0001399130219816256, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.000217748670878037, + "loss": 0.0172, "step": 211540 }, { - "epoch": 1.07, - "learning_rate": 0.00013990545428861162, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021774478266166556, + "loss": 0.0181, "step": 211550 }, { - "epoch": 1.07, - "learning_rate": 0.0001398978865955976, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021774089444529407, + "loss": 0.0181, "step": 211560 }, { - "epoch": 1.07, - "learning_rate": 0.00013989031890258358, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021773700622892262, + "loss": 0.0129, "step": 211570 }, { - "epoch": 1.07, - "learning_rate": 0.0001398827512095696, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021773311801255113, + "loss": 0.0164, "step": 211580 }, { - "epoch": 1.07, - "learning_rate": 0.00013987518351655557, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002177292297961797, + "loss": 0.0157, "step": 211590 }, { - "epoch": 1.07, - "learning_rate": 0.00013986761582354156, - "loss": 0.0127, + "epoch": 0.55, + "learning_rate": 0.00021772534157980821, + "loss": 0.0154, "step": 211600 }, { - "epoch": 1.07, - "learning_rate": 0.00013986004813052756, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021772145336343676, + "loss": 0.0188, "step": 211610 }, { - "epoch": 1.07, - "learning_rate": 0.00013985248043751355, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021771756514706527, + "loss": 0.0172, "step": 211620 }, { - "epoch": 1.07, - "learning_rate": 0.00013984491274449953, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021771367693069384, + "loss": 0.0198, "step": 211630 }, { - "epoch": 1.07, - "learning_rate": 0.0001398373450514855, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021770978871432235, + "loss": 0.0188, "step": 211640 }, { - "epoch": 1.07, - "learning_rate": 0.00013982977735847152, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.0002177059004979509, + "loss": 0.0155, "step": 211650 }, { - "epoch": 1.07, - "learning_rate": 0.0001398222096654575, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.0002177020122815794, + "loss": 0.0196, "step": 211660 }, { - "epoch": 1.07, - "learning_rate": 0.00013981464197244348, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021769812406520795, + "loss": 0.0171, "step": 211670 }, { - "epoch": 1.07, - "learning_rate": 0.0001398070742794295, - "loss": 0.0078, + "epoch": 0.55, + "learning_rate": 0.00021769423584883652, + "loss": 0.0173, "step": 211680 }, { - "epoch": 1.07, - "learning_rate": 0.00013979950658641547, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021769034763246503, + "loss": 0.021, "step": 211690 }, { - "epoch": 1.07, - "learning_rate": 0.00013979193889340145, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021768645941609355, + "loss": 0.0173, "step": 211700 }, { - "epoch": 1.07, - "learning_rate": 0.00013978437120038746, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.0002176825711997221, + "loss": 0.0194, "step": 211710 }, { - "epoch": 1.07, - "learning_rate": 0.00013977680350737344, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021767868298335066, + "loss": 0.0184, "step": 211720 }, { - "epoch": 1.07, - "learning_rate": 0.00013976923581435942, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021767479476697917, + "loss": 0.0197, "step": 211730 }, { - "epoch": 1.07, - "learning_rate": 0.00013976166812134543, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021767090655060772, + "loss": 0.0162, "step": 211740 }, { - "epoch": 1.07, - "learning_rate": 0.0001397541004283314, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021766701833423623, + "loss": 0.018, "step": 211750 }, { - "epoch": 1.07, - "learning_rate": 0.0001397465327353174, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.0002176631301178648, + "loss": 0.0165, "step": 211760 }, { - "epoch": 1.07, - "learning_rate": 0.0001397389650423034, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021765924190149331, + "loss": 0.0151, "step": 211770 }, { - "epoch": 1.07, - "learning_rate": 0.00013973139734928938, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021765535368512186, + "loss": 0.0145, "step": 211780 }, { - "epoch": 1.07, - "learning_rate": 0.00013972382965627537, - "loss": 0.0141, + "epoch": 0.55, + "learning_rate": 0.00021765146546875037, + "loss": 0.0158, "step": 211790 }, { - "epoch": 1.07, - "learning_rate": 0.00013971626196326137, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021764757725237894, + "loss": 0.0183, "step": 211800 }, { - "epoch": 1.07, - "learning_rate": 0.00013970869427024736, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021764368903600745, + "loss": 0.0208, "step": 211810 }, { - "epoch": 1.07, - "learning_rate": 0.00013970112657723334, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.000217639800819636, + "loss": 0.0153, "step": 211820 }, { - "epoch": 1.07, - "learning_rate": 0.00013969355888421932, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.0002176359126032645, + "loss": 0.0181, "step": 211830 }, { - "epoch": 1.07, - "learning_rate": 0.00013968599119120533, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021763202438689308, + "loss": 0.0157, "step": 211840 }, { - "epoch": 1.07, - "learning_rate": 0.0001396784234981913, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.0002176281361705216, + "loss": 0.0134, "step": 211850 }, { - "epoch": 1.07, - "learning_rate": 0.0001396708558051773, - "loss": 0.0123, + "epoch": 0.55, + "learning_rate": 0.00021762424795415013, + "loss": 0.0181, "step": 211860 }, { - "epoch": 1.07, - "learning_rate": 0.0001396632881121633, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.00021762035973777865, + "loss": 0.0192, "step": 211870 }, { - "epoch": 1.07, - "learning_rate": 0.00013965572041914928, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021761647152140722, + "loss": 0.0159, "step": 211880 }, { - "epoch": 1.07, - "learning_rate": 0.00013964815272613526, - "loss": 0.0076, + "epoch": 0.55, + "learning_rate": 0.00021761258330503576, + "loss": 0.0139, "step": 211890 }, { - "epoch": 1.07, - "learning_rate": 0.00013964058503312127, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.00021760869508866427, + "loss": 0.0138, "step": 211900 }, { - "epoch": 1.07, - "learning_rate": 0.00013963301734010725, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021760480687229282, + "loss": 0.0175, "step": 211910 }, { - "epoch": 1.07, - "learning_rate": 0.00013962544964709323, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021760091865592133, + "loss": 0.0146, "step": 211920 }, { - "epoch": 1.07, - "learning_rate": 0.00013961788195407924, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.0002175970304395499, + "loss": 0.0169, "step": 211930 }, { - "epoch": 1.07, - "learning_rate": 0.00013961031426106522, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.0002175931422231784, + "loss": 0.0178, "step": 211940 }, { - "epoch": 1.07, - "learning_rate": 0.0001396027465680512, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021758925400680695, + "loss": 0.0181, "step": 211950 }, { - "epoch": 1.07, - "learning_rate": 0.0001395951788750372, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021758536579043547, + "loss": 0.0169, "step": 211960 }, { - "epoch": 1.07, - "learning_rate": 0.0001395876111820232, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021758147757406404, + "loss": 0.0172, "step": 211970 }, { - "epoch": 1.07, - "learning_rate": 0.00013958004348900918, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.00021757758935769255, + "loss": 0.0165, "step": 211980 }, { - "epoch": 1.07, - "learning_rate": 0.00013957247579599516, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002175737011413211, + "loss": 0.0224, "step": 211990 }, { - "epoch": 1.07, - "learning_rate": 0.00013956490810298117, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.0002175698129249496, + "loss": 0.0168, "step": 212000 }, { - "epoch": 1.07, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.007792965974658728, - "eval_runtime": 116.6797, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.55, + "eval_cer": 0.8817446754311932, + "eval_loss": 0.011121110990643501, + "eval_runtime": 107.2308, + "eval_samples_per_second": 18.651, + "eval_steps_per_second": 4.663, "step": 212000 }, { - "epoch": 1.07, - "learning_rate": 0.00013955734040996715, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021756592470857818, + "loss": 0.0188, "step": 212010 }, { - "epoch": 1.07, - "learning_rate": 0.00013954977271695313, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.0002175620364922067, + "loss": 0.0154, "step": 212020 }, { - "epoch": 1.07, - "learning_rate": 0.00013954220502393914, - "loss": 0.0078, + "epoch": 0.55, + "learning_rate": 0.00021755814827583523, + "loss": 0.0143, "step": 212030 }, { - "epoch": 1.07, - "learning_rate": 0.00013953463733092512, - "loss": 0.0154, + "epoch": 0.55, + "learning_rate": 0.00021755426005946375, + "loss": 0.0141, "step": 212040 }, { - "epoch": 1.07, - "learning_rate": 0.0001395270696379111, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021755037184309232, + "loss": 0.0171, "step": 212050 }, { - "epoch": 1.07, - "learning_rate": 0.0001395195019448971, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021754648362672086, + "loss": 0.0209, "step": 212060 }, { - "epoch": 1.07, - "learning_rate": 0.0001395119342518831, - "loss": 0.0071, + "epoch": 0.55, + "learning_rate": 0.00021754259541034937, + "loss": 0.0235, "step": 212070 }, { - "epoch": 1.07, - "learning_rate": 0.00013950436655886907, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021753870719397791, + "loss": 0.0169, "step": 212080 }, { - "epoch": 1.07, - "learning_rate": 0.00013949679886585508, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021753481897760646, + "loss": 0.0176, "step": 212090 }, { - "epoch": 1.07, - "learning_rate": 0.00013948923117284103, - "loss": 0.0074, + "epoch": 0.55, + "learning_rate": 0.000217530930761235, + "loss": 0.0141, "step": 212100 }, { - "epoch": 1.07, - "learning_rate": 0.00013948166347982704, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.0002175270425448635, + "loss": 0.018, "step": 212110 }, { - "epoch": 1.07, - "learning_rate": 0.00013947409578681302, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021752315432849205, + "loss": 0.0165, "step": 212120 }, { - "epoch": 1.07, - "learning_rate": 0.000139466528093799, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002175192661121206, + "loss": 0.017, "step": 212130 }, { - "epoch": 1.07, - "learning_rate": 0.00013945896040078501, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.00021751537789574914, + "loss": 0.016, "step": 212140 }, { - "epoch": 1.07, - "learning_rate": 0.000139451392707771, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021751148967937765, + "loss": 0.0176, "step": 212150 }, { - "epoch": 1.07, - "learning_rate": 0.00013944382501475698, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.0002175076014630062, + "loss": 0.0189, "step": 212160 }, { - "epoch": 1.07, - "learning_rate": 0.00013943625732174299, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.0002175037132466347, + "loss": 0.0157, "step": 212170 }, { - "epoch": 1.07, - "learning_rate": 0.00013942868962872897, - "loss": 0.0081, + "epoch": 0.55, + "learning_rate": 0.00021749982503026328, + "loss": 0.016, "step": 212180 }, { - "epoch": 1.07, - "learning_rate": 0.00013942112193571495, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002174959368138918, + "loss": 0.0188, "step": 212190 }, { - "epoch": 1.07, - "learning_rate": 0.00013941355424270093, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021749204859752033, + "loss": 0.0154, "step": 212200 }, { - "epoch": 1.07, - "learning_rate": 0.00013940598654968694, - "loss": 0.0124, + "epoch": 0.55, + "learning_rate": 0.00021748816038114885, + "loss": 0.0158, "step": 212210 }, { - "epoch": 1.07, - "learning_rate": 0.00013939841885667292, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021748427216477742, + "loss": 0.0134, "step": 212220 }, { - "epoch": 1.07, - "learning_rate": 0.0001393908511636589, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021748038394840596, + "loss": 0.0188, "step": 212230 }, { - "epoch": 1.07, - "learning_rate": 0.0001393832834706449, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021747649573203447, + "loss": 0.016, "step": 212240 }, { - "epoch": 1.07, - "learning_rate": 0.0001393757157776309, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.000217472607515663, + "loss": 0.0153, "step": 212250 }, { - "epoch": 1.07, - "learning_rate": 0.00013936814808461687, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021746871929929156, + "loss": 0.0188, "step": 212260 }, { - "epoch": 1.07, - "learning_rate": 0.00013936058039160288, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002174648310829201, + "loss": 0.0165, "step": 212270 }, { - "epoch": 1.07, - "learning_rate": 0.00013935301269858886, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.0002174609428665486, + "loss": 0.0174, "step": 212280 }, { - "epoch": 1.07, - "learning_rate": 0.00013934544500557484, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021745705465017715, + "loss": 0.0203, "step": 212290 }, { - "epoch": 1.07, - "learning_rate": 0.00013933787731256085, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002174531664338057, + "loss": 0.0201, "step": 212300 }, { - "epoch": 1.07, - "learning_rate": 0.00013933030961954683, - "loss": 0.008, + "epoch": 0.55, + "learning_rate": 0.00021744927821743424, + "loss": 0.0196, "step": 212310 }, { - "epoch": 1.07, - "learning_rate": 0.00013932274192653282, - "loss": 0.0113, + "epoch": 0.55, + "learning_rate": 0.00021744539000106275, + "loss": 0.0208, "step": 212320 }, { - "epoch": 1.07, - "learning_rate": 0.00013931517423351882, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.0002174415017846913, + "loss": 0.0173, "step": 212330 }, { - "epoch": 1.07, - "learning_rate": 0.0001393076065405048, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021743761356831983, + "loss": 0.011, "step": 212340 }, { - "epoch": 1.07, - "learning_rate": 0.0001393000388474908, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.00021743372535194838, + "loss": 0.0181, "step": 212350 }, { - "epoch": 1.07, - "learning_rate": 0.00013929247115447677, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002174298371355769, + "loss": 0.0183, "step": 212360 }, { - "epoch": 1.07, - "learning_rate": 0.00013928490346146278, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021742594891920543, + "loss": 0.0152, "step": 212370 }, { - "epoch": 1.07, - "learning_rate": 0.00013927733576844876, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021742206070283395, + "loss": 0.0177, "step": 212380 }, { - "epoch": 1.07, - "learning_rate": 0.00013926976807543474, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021741817248646252, + "loss": 0.0164, "step": 212390 }, { - "epoch": 1.07, - "learning_rate": 0.00013926220038242075, - "loss": 0.0068, + "epoch": 0.55, + "learning_rate": 0.00021741428427009103, + "loss": 0.022, "step": 212400 }, { - "epoch": 1.07, - "learning_rate": 0.00013925463268940673, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.00021741039605371957, + "loss": 0.0193, "step": 212410 }, { - "epoch": 1.07, - "learning_rate": 0.0001392470649963927, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021740650783734809, + "loss": 0.0173, "step": 212420 }, { - "epoch": 1.07, - "learning_rate": 0.00013923949730337872, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021740261962097666, + "loss": 0.0208, "step": 212430 }, { - "epoch": 1.07, - "learning_rate": 0.0001392319296103647, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.0002173987314046052, + "loss": 0.0136, "step": 212440 }, { - "epoch": 1.07, - "learning_rate": 0.00013922436191735068, - "loss": 0.0139, + "epoch": 0.55, + "learning_rate": 0.0002173948431882337, + "loss": 0.0165, "step": 212450 }, { - "epoch": 1.07, - "learning_rate": 0.0001392167942243367, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021739095497186225, + "loss": 0.0199, "step": 212460 }, { - "epoch": 1.07, - "learning_rate": 0.00013920922653132267, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002173870667554908, + "loss": 0.0111, "step": 212470 }, { - "epoch": 1.07, - "learning_rate": 0.00013920165883830865, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021738317853911934, + "loss": 0.0149, "step": 212480 }, { - "epoch": 1.07, - "learning_rate": 0.00013919409114529466, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021737929032274785, + "loss": 0.0176, "step": 212490 }, { - "epoch": 1.07, - "learning_rate": 0.00013918652345228064, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.0002173754021063764, + "loss": 0.0162, "step": 212500 }, { - "epoch": 1.07, - "learning_rate": 0.00013917895575926663, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.00021737151389000493, + "loss": 0.0179, "step": 212510 }, { - "epoch": 1.07, - "learning_rate": 0.0001391713880662526, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.00021736762567363348, + "loss": 0.0162, "step": 212520 }, { - "epoch": 1.07, - "learning_rate": 0.00013916382037323862, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.000217363737457262, + "loss": 0.0166, "step": 212530 }, { - "epoch": 1.07, - "learning_rate": 0.0001391562526802246, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021735984924089053, + "loss": 0.0149, "step": 212540 }, { - "epoch": 1.07, - "learning_rate": 0.00013914868498721058, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.0002173559610245191, + "loss": 0.0167, "step": 212550 }, { - "epoch": 1.07, - "learning_rate": 0.0001391411172941966, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021735207280814762, + "loss": 0.0189, "step": 212560 }, { - "epoch": 1.07, - "learning_rate": 0.00013913354960118257, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.00021734818459177613, + "loss": 0.0149, "step": 212570 }, { - "epoch": 1.07, - "learning_rate": 0.00013912598190816855, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021734429637540467, + "loss": 0.0155, "step": 212580 }, { - "epoch": 1.07, - "learning_rate": 0.00013911841421515456, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021734040815903324, + "loss": 0.0148, "step": 212590 }, { - "epoch": 1.07, - "learning_rate": 0.00013911084652214054, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021733651994266175, + "loss": 0.0162, "step": 212600 }, { - "epoch": 1.07, - "learning_rate": 0.00013910327882912652, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.0002173326317262903, + "loss": 0.0184, "step": 212610 }, { - "epoch": 1.07, - "learning_rate": 0.00013909571113611253, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.0002173287435099188, + "loss": 0.0165, "step": 212620 }, { - "epoch": 1.07, - "learning_rate": 0.0001390881434430985, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021732485529354735, + "loss": 0.0175, "step": 212630 }, { - "epoch": 1.07, - "learning_rate": 0.0001390805757500845, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002173209670771759, + "loss": 0.0178, "step": 212640 }, { - "epoch": 1.07, - "learning_rate": 0.0001390730080570705, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021731707886080444, + "loss": 0.0183, "step": 212650 }, { - "epoch": 1.07, - "learning_rate": 0.00013906544036405648, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.00021731319064443295, + "loss": 0.0139, "step": 212660 }, { - "epoch": 1.07, - "learning_rate": 0.00013905787267104246, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.0002173093024280615, + "loss": 0.0216, "step": 212670 }, { - "epoch": 1.07, - "learning_rate": 0.00013905030497802845, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021730541421169003, + "loss": 0.0168, "step": 212680 }, { - "epoch": 1.07, - "learning_rate": 0.00013904273728501445, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021730152599531858, + "loss": 0.0176, "step": 212690 }, { - "epoch": 1.07, - "learning_rate": 0.00013903516959200044, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.0002172976377789471, + "loss": 0.0181, "step": 212700 }, { - "epoch": 1.07, - "learning_rate": 0.00013902760189898642, - "loss": 0.0072, + "epoch": 0.55, + "learning_rate": 0.00021729374956257563, + "loss": 0.0179, "step": 212710 }, { - "epoch": 1.07, - "learning_rate": 0.00013902003420597243, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021728986134620417, + "loss": 0.0122, "step": 212720 }, { - "epoch": 1.07, - "learning_rate": 0.00013901246651295838, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021728597312983271, + "loss": 0.0116, "step": 212730 }, { - "epoch": 1.07, - "learning_rate": 0.0001390048988199444, - "loss": 0.0127, + "epoch": 0.55, + "learning_rate": 0.00021728208491346123, + "loss": 0.0154, "step": 212740 }, { - "epoch": 1.07, - "learning_rate": 0.00013899733112693037, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021727819669708977, + "loss": 0.0135, "step": 212750 }, { - "epoch": 1.07, - "learning_rate": 0.00013898976343391635, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.00021727430848071834, + "loss": 0.0159, "step": 212760 }, { - "epoch": 1.07, - "learning_rate": 0.00013898219574090236, - "loss": 0.0123, + "epoch": 0.55, + "learning_rate": 0.00021727042026434685, + "loss": 0.0199, "step": 212770 }, { - "epoch": 1.07, - "learning_rate": 0.00013897462804788834, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.0002172665320479754, + "loss": 0.0156, "step": 212780 }, { - "epoch": 1.07, - "learning_rate": 0.00013896706035487432, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.0002172626438316039, + "loss": 0.0147, "step": 212790 }, { - "epoch": 1.07, - "learning_rate": 0.00013895949266186033, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021725875561523248, + "loss": 0.0157, "step": 212800 }, { - "epoch": 1.07, - "learning_rate": 0.0001389519249688463, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.000217254867398861, + "loss": 0.0214, "step": 212810 }, { - "epoch": 1.07, - "learning_rate": 0.0001389443572758323, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021725097918248954, + "loss": 0.0143, "step": 212820 }, { - "epoch": 1.07, - "learning_rate": 0.0001389367895828183, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.00021724709096611805, + "loss": 0.0207, "step": 212830 }, { - "epoch": 1.07, - "learning_rate": 0.00013892922188980428, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021724320274974662, + "loss": 0.0172, "step": 212840 }, { - "epoch": 1.07, - "learning_rate": 0.00013892165419679027, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021723931453337513, + "loss": 0.0162, "step": 212850 }, { - "epoch": 1.07, - "learning_rate": 0.00013891408650377627, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021723542631700367, + "loss": 0.0164, "step": 212860 }, { - "epoch": 1.07, - "learning_rate": 0.00013890651881076226, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.0002172315381006322, + "loss": 0.023, "step": 212870 }, { - "epoch": 1.07, - "learning_rate": 0.00013889895111774824, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021722764988426073, + "loss": 0.0188, "step": 212880 }, { - "epoch": 1.07, - "learning_rate": 0.00013889138342473422, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021722376166788927, + "loss": 0.0131, "step": 212890 }, { - "epoch": 1.07, - "learning_rate": 0.00013888381573172023, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021721987345151781, + "loss": 0.0155, "step": 212900 }, { - "epoch": 1.07, - "learning_rate": 0.0001388762480387062, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021721598523514633, + "loss": 0.0168, "step": 212910 }, { - "epoch": 1.07, - "learning_rate": 0.0001388686803456922, - "loss": 0.0089, + "epoch": 0.55, + "learning_rate": 0.00021721209701877487, + "loss": 0.0152, "step": 212920 }, { - "epoch": 1.07, - "learning_rate": 0.0001388611126526782, - "loss": 0.0129, + "epoch": 0.55, + "learning_rate": 0.00021720820880240344, + "loss": 0.0168, "step": 212930 }, { - "epoch": 1.07, - "learning_rate": 0.00013885354495966418, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021720432058603195, + "loss": 0.02, "step": 212940 }, { - "epoch": 1.07, - "learning_rate": 0.00013884597726665016, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.0002172004323696605, + "loss": 0.0149, "step": 212950 }, { - "epoch": 1.07, - "learning_rate": 0.00013883840957363617, - "loss": 0.0133, + "epoch": 0.55, + "learning_rate": 0.000217196544153289, + "loss": 0.016, "step": 212960 }, { - "epoch": 1.07, - "learning_rate": 0.00013883084188062215, - "loss": 0.0119, + "epoch": 0.55, + "learning_rate": 0.00021719265593691758, + "loss": 0.0228, "step": 212970 }, { - "epoch": 1.07, - "learning_rate": 0.00013882327418760813, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.0002171887677205461, + "loss": 0.0157, "step": 212980 }, { - "epoch": 1.07, - "learning_rate": 0.00013881570649459414, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021718487950417463, + "loss": 0.0197, "step": 212990 }, { - "epoch": 1.07, - "learning_rate": 0.00013880813880158012, - "loss": 0.0184, + "epoch": 0.55, + "learning_rate": 0.00021718099128780315, + "loss": 0.018, "step": 213000 }, { - "epoch": 1.07, - "eval_cer": 0.914481900656667, - "eval_loss": 0.007489955984055996, - "eval_runtime": 116.6491, - "eval_samples_per_second": 17.145, - "eval_steps_per_second": 4.286, + "epoch": 0.55, + "eval_cer": 0.8817586718005349, + "eval_loss": 0.01114367600530386, + "eval_runtime": 107.9769, + "eval_samples_per_second": 18.522, + "eval_steps_per_second": 4.631, "step": 213000 }, { - "epoch": 1.07, - "learning_rate": 0.0001388005711085661, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021717710307143172, + "loss": 0.0153, "step": 213010 }, { - "epoch": 1.07, - "learning_rate": 0.0001387930034155521, - "loss": 0.0117, + "epoch": 0.55, + "learning_rate": 0.00021717321485506023, + "loss": 0.0135, "step": 213020 }, { - "epoch": 1.07, - "learning_rate": 0.0001387854357225381, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021716932663868877, + "loss": 0.0158, "step": 213030 }, { - "epoch": 1.07, - "learning_rate": 0.00013877786802952408, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002171654384223173, + "loss": 0.0152, "step": 213040 }, { - "epoch": 1.07, - "learning_rate": 0.00013877030033651006, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021716155020594586, + "loss": 0.0231, "step": 213050 }, { - "epoch": 1.07, - "learning_rate": 0.00013876273264349607, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021715766198957437, + "loss": 0.0182, "step": 213060 }, { - "epoch": 1.07, - "learning_rate": 0.00013875516495048205, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.0002171537737732029, + "loss": 0.0122, "step": 213070 }, { - "epoch": 1.08, - "learning_rate": 0.00013874759725746803, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021714988555683143, + "loss": 0.0183, "step": 213080 }, { - "epoch": 1.08, - "learning_rate": 0.00013874002956445404, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021714599734046, + "loss": 0.0146, "step": 213090 }, { - "epoch": 1.08, - "learning_rate": 0.00013873246187144002, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021714210912408854, + "loss": 0.0211, "step": 213100 }, { - "epoch": 1.08, - "learning_rate": 0.000138724894178426, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021713822090771705, + "loss": 0.015, "step": 213110 }, { - "epoch": 1.08, - "learning_rate": 0.000138717326485412, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021713433269134557, + "loss": 0.0161, "step": 213120 }, { - "epoch": 1.08, - "learning_rate": 0.000138709758792398, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.0002171304444749741, + "loss": 0.0148, "step": 213130 }, { - "epoch": 1.08, - "learning_rate": 0.00013870219109938397, - "loss": 0.0071, + "epoch": 0.55, + "learning_rate": 0.00021712655625860268, + "loss": 0.0153, "step": 213140 }, { - "epoch": 1.08, - "learning_rate": 0.00013869462340636998, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.0002171226680422312, + "loss": 0.0135, "step": 213150 }, { - "epoch": 1.08, - "learning_rate": 0.00013868705571335596, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021711877982585973, + "loss": 0.0201, "step": 213160 }, { - "epoch": 1.08, - "learning_rate": 0.00013867948802034194, - "loss": 0.0134, + "epoch": 0.55, + "learning_rate": 0.00021711489160948825, + "loss": 0.0158, "step": 213170 }, { - "epoch": 1.08, - "learning_rate": 0.00013867192032732795, - "loss": 0.0127, + "epoch": 0.55, + "learning_rate": 0.00021711100339311682, + "loss": 0.0183, "step": 213180 }, { - "epoch": 1.08, - "learning_rate": 0.00013866435263431393, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.00021710711517674533, + "loss": 0.0127, "step": 213190 }, { - "epoch": 1.08, - "learning_rate": 0.00013865678494129991, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.00021710322696037387, + "loss": 0.0172, "step": 213200 }, { - "epoch": 1.08, - "learning_rate": 0.00013864921724828592, - "loss": 0.0071, + "epoch": 0.55, + "learning_rate": 0.0002170993387440024, + "loss": 0.0212, "step": 213210 }, { - "epoch": 1.08, - "learning_rate": 0.0001386416495552719, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.00021709545052763096, + "loss": 0.0175, "step": 213220 }, { - "epoch": 1.08, - "learning_rate": 0.00013863408186225789, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021709156231125947, + "loss": 0.0169, "step": 213230 }, { - "epoch": 1.08, - "learning_rate": 0.00013862651416924387, - "loss": 0.0122, + "epoch": 0.55, + "learning_rate": 0.000217087674094888, + "loss": 0.0178, "step": 213240 }, { - "epoch": 1.08, - "learning_rate": 0.00013861894647622988, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.00021708378587851653, + "loss": 0.0139, "step": 213250 }, { - "epoch": 1.08, - "learning_rate": 0.00013861137878321586, - "loss": 0.0061, + "epoch": 0.55, + "learning_rate": 0.0002170798976621451, + "loss": 0.0214, "step": 213260 }, { - "epoch": 1.08, - "learning_rate": 0.00013860381109020184, - "loss": 0.0101, + "epoch": 0.55, + "learning_rate": 0.00021707600944577364, + "loss": 0.0176, "step": 213270 }, { - "epoch": 1.08, - "learning_rate": 0.00013859624339718785, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.00021707212122940215, + "loss": 0.017, "step": 213280 }, { - "epoch": 1.08, - "learning_rate": 0.00013858867570417383, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021706823301303067, + "loss": 0.0142, "step": 213290 }, { - "epoch": 1.08, - "learning_rate": 0.0001385811080111598, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021706434479665924, + "loss": 0.0139, "step": 213300 }, { - "epoch": 1.08, - "learning_rate": 0.00013857354031814582, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021706045658028778, + "loss": 0.0138, "step": 213310 }, { - "epoch": 1.08, - "learning_rate": 0.0001385659726251318, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002170565683639163, + "loss": 0.017, "step": 213320 }, { - "epoch": 1.08, - "learning_rate": 0.00013855840493211778, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021705268014754483, + "loss": 0.0164, "step": 213330 }, { - "epoch": 1.08, - "learning_rate": 0.0001385508372391038, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021704879193117337, + "loss": 0.0198, "step": 213340 }, { - "epoch": 1.08, - "learning_rate": 0.00013854326954608977, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021704490371480192, + "loss": 0.0163, "step": 213350 }, { - "epoch": 1.08, - "learning_rate": 0.00013853570185307575, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021704101549843043, + "loss": 0.0162, "step": 213360 }, { - "epoch": 1.08, - "learning_rate": 0.00013852813416006173, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021703712728205897, + "loss": 0.0157, "step": 213370 }, { - "epoch": 1.08, - "learning_rate": 0.00013852056646704772, - "loss": 0.0107, + "epoch": 0.55, + "learning_rate": 0.0002170332390656875, + "loss": 0.0173, "step": 213380 }, { - "epoch": 1.08, - "learning_rate": 0.00013851299877403372, - "loss": 0.0112, + "epoch": 0.55, + "learning_rate": 0.00021702935084931606, + "loss": 0.0162, "step": 213390 }, { - "epoch": 1.08, - "learning_rate": 0.0001385054310810197, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021702546263294457, + "loss": 0.0166, "step": 213400 }, { - "epoch": 1.08, - "learning_rate": 0.0001384978633880057, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.0002170215744165731, + "loss": 0.0176, "step": 213410 }, { - "epoch": 1.08, - "learning_rate": 0.00013849029569499167, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021701768620020163, + "loss": 0.0155, "step": 213420 }, { - "epoch": 1.08, - "learning_rate": 0.00013848272800197768, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.0002170137979838302, + "loss": 0.0189, "step": 213430 }, { - "epoch": 1.08, - "learning_rate": 0.00013847516030896366, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.0002170099097674587, + "loss": 0.0168, "step": 213440 }, { - "epoch": 1.08, - "learning_rate": 0.00013846759261594964, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021700602155108725, + "loss": 0.0148, "step": 213450 }, { - "epoch": 1.08, - "learning_rate": 0.00013846002492293565, - "loss": 0.0084, + "epoch": 0.55, + "learning_rate": 0.00021700213333471577, + "loss": 0.0151, "step": 213460 }, { - "epoch": 1.08, - "learning_rate": 0.00013845245722992163, - "loss": 0.0083, + "epoch": 0.55, + "learning_rate": 0.00021699824511834433, + "loss": 0.0142, "step": 213470 }, { - "epoch": 1.08, - "learning_rate": 0.0001384448895369076, - "loss": 0.0076, - "step": 213480 + "epoch": 0.55, + "learning_rate": 0.00021699435690197288, + "loss": 0.0159, + "step": 213480 }, { - "epoch": 1.08, - "learning_rate": 0.00013843732184389362, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.0002169904686856014, + "loss": 0.0168, "step": 213490 }, { - "epoch": 1.08, - "learning_rate": 0.0001384297541508796, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021698658046922993, + "loss": 0.0154, "step": 213500 }, { - "epoch": 1.08, - "learning_rate": 0.00013842218645786558, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021698269225285847, + "loss": 0.0151, "step": 213510 }, { - "epoch": 1.08, - "learning_rate": 0.0001384146187648516, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021697880403648702, + "loss": 0.0125, "step": 213520 }, { - "epoch": 1.08, - "learning_rate": 0.00013840705107183757, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021697491582011553, + "loss": 0.0157, "step": 213530 }, { - "epoch": 1.08, - "learning_rate": 0.00013839948337882355, - "loss": 0.0075, + "epoch": 0.55, + "learning_rate": 0.00021697102760374407, + "loss": 0.0175, "step": 213540 }, { - "epoch": 1.08, - "learning_rate": 0.00013839191568580956, - "loss": 0.0081, + "epoch": 0.55, + "learning_rate": 0.00021696713938737261, + "loss": 0.0126, "step": 213550 }, { - "epoch": 1.08, - "learning_rate": 0.00013838434799279554, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021696325117100116, + "loss": 0.0179, "step": 213560 }, { - "epoch": 1.08, - "learning_rate": 0.00013837678029978153, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021695936295462967, + "loss": 0.0178, "step": 213570 }, { - "epoch": 1.08, - "learning_rate": 0.0001383692126067675, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.0002169554747382582, + "loss": 0.0195, "step": 213580 }, { - "epoch": 1.08, - "learning_rate": 0.00013836164491375352, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021695158652188675, + "loss": 0.0172, "step": 213590 }, { - "epoch": 1.08, - "learning_rate": 0.0001383540772207395, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.0002169476983055153, + "loss": 0.0138, "step": 213600 }, { - "epoch": 1.08, - "learning_rate": 0.00013834650952772548, - "loss": 0.0096, + "epoch": 0.55, + "learning_rate": 0.0002169438100891438, + "loss": 0.0192, "step": 213610 }, { - "epoch": 1.08, - "learning_rate": 0.0001383389418347115, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021693992187277235, + "loss": 0.017, "step": 213620 }, { - "epoch": 1.08, - "learning_rate": 0.00013833137414169747, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021693603365640087, + "loss": 0.0172, "step": 213630 }, { - "epoch": 1.08, - "learning_rate": 0.00013832380644868345, - "loss": 0.008, + "epoch": 0.55, + "learning_rate": 0.00021693214544002943, + "loss": 0.0141, "step": 213640 }, { - "epoch": 1.08, - "learning_rate": 0.00013831623875566946, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021692825722365798, + "loss": 0.0137, "step": 213650 }, { - "epoch": 1.08, - "learning_rate": 0.00013830867106265544, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.0002169243690072865, + "loss": 0.0146, "step": 213660 }, { - "epoch": 1.08, - "learning_rate": 0.00013830110336964142, - "loss": 0.0099, + "epoch": 0.55, + "learning_rate": 0.00021692048079091503, + "loss": 0.0139, "step": 213670 }, { - "epoch": 1.08, - "learning_rate": 0.00013829353567662743, - "loss": 0.0108, + "epoch": 0.55, + "learning_rate": 0.00021691659257454357, + "loss": 0.0143, "step": 213680 }, { - "epoch": 1.08, - "learning_rate": 0.0001382859679836134, - "loss": 0.0082, + "epoch": 0.55, + "learning_rate": 0.00021691270435817212, + "loss": 0.0177, "step": 213690 }, { - "epoch": 1.08, - "learning_rate": 0.0001382784002905994, - "loss": 0.0095, + "epoch": 0.55, + "learning_rate": 0.00021690881614180063, + "loss": 0.0148, "step": 213700 }, { - "epoch": 1.08, - "learning_rate": 0.0001382708325975854, - "loss": 0.0093, + "epoch": 0.55, + "learning_rate": 0.00021690492792542917, + "loss": 0.0181, "step": 213710 }, { - "epoch": 1.08, - "learning_rate": 0.00013826326490457138, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.0002169010397090577, + "loss": 0.0162, "step": 213720 }, { - "epoch": 1.08, - "learning_rate": 0.00013825569721155736, - "loss": 0.0087, + "epoch": 0.55, + "learning_rate": 0.00021689715149268625, + "loss": 0.0164, "step": 213730 }, { - "epoch": 1.08, - "learning_rate": 0.00013824812951854337, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021689326327631477, + "loss": 0.0163, "step": 213740 }, { - "epoch": 1.08, - "learning_rate": 0.00013824056182552935, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002168893750599433, + "loss": 0.0151, "step": 213750 }, { - "epoch": 1.08, - "learning_rate": 0.00013823299413251534, - "loss": 0.0118, + "epoch": 0.55, + "learning_rate": 0.00021688548684357185, + "loss": 0.0172, "step": 213760 }, { - "epoch": 1.08, - "learning_rate": 0.00013822542643950132, - "loss": 0.0106, + "epoch": 0.55, + "learning_rate": 0.0002168815986272004, + "loss": 0.0184, "step": 213770 }, { - "epoch": 1.08, - "learning_rate": 0.00013821785874648733, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.0002168777104108289, + "loss": 0.0119, "step": 213780 }, { - "epoch": 1.08, - "learning_rate": 0.0001382102910534733, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.00021687382219445745, + "loss": 0.0241, "step": 213790 }, { - "epoch": 1.08, - "learning_rate": 0.0001382027233604593, - "loss": 0.0074, + "epoch": 0.55, + "learning_rate": 0.00021686993397808602, + "loss": 0.0164, "step": 213800 }, { - "epoch": 1.08, - "learning_rate": 0.0001381951556674453, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021686604576171453, + "loss": 0.0145, "step": 213810 }, { - "epoch": 1.08, - "learning_rate": 0.00013818758797443128, - "loss": 0.0124, + "epoch": 0.55, + "learning_rate": 0.00021686215754534308, + "loss": 0.0145, "step": 213820 }, { - "epoch": 1.08, - "learning_rate": 0.00013818002028141726, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.0002168582693289716, + "loss": 0.0144, "step": 213830 }, { - "epoch": 1.08, - "learning_rate": 0.00013817245258840327, - "loss": 0.0077, + "epoch": 0.55, + "learning_rate": 0.00021685438111260016, + "loss": 0.014, "step": 213840 }, { - "epoch": 1.08, - "learning_rate": 0.00013816488489538925, - "loss": 0.0114, + "epoch": 0.55, + "learning_rate": 0.00021685049289622867, + "loss": 0.0156, "step": 213850 }, { - "epoch": 1.08, - "learning_rate": 0.00013815731720237523, - "loss": 0.0116, + "epoch": 0.55, + "learning_rate": 0.00021684660467985721, + "loss": 0.0186, "step": 213860 }, { - "epoch": 1.08, - "learning_rate": 0.00013814974950936124, - "loss": 0.0092, + "epoch": 0.55, + "learning_rate": 0.00021684271646348573, + "loss": 0.0183, "step": 213870 }, { - "epoch": 1.08, - "learning_rate": 0.00013814218181634722, - "loss": 0.0102, + "epoch": 0.55, + "learning_rate": 0.00021683882824711427, + "loss": 0.0344, "step": 213880 }, { - "epoch": 1.08, - "learning_rate": 0.0001381346141233332, - "loss": 0.0085, + "epoch": 0.55, + "learning_rate": 0.0002168349400307428, + "loss": 0.0184, "step": 213890 }, { - "epoch": 1.08, - "learning_rate": 0.0001381270464303192, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021683105181437135, + "loss": 0.0183, "step": 213900 }, { - "epoch": 1.08, - "learning_rate": 0.0001381194787373052, - "loss": 0.0079, + "epoch": 0.55, + "learning_rate": 0.00021682716359799987, + "loss": 0.0184, "step": 213910 }, { - "epoch": 1.08, - "learning_rate": 0.00013811191104429117, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.0002168232753816284, + "loss": 0.0158, "step": 213920 }, { - "epoch": 1.08, - "learning_rate": 0.00013810434335127716, - "loss": 0.0097, + "epoch": 0.55, + "learning_rate": 0.00021681938716525695, + "loss": 0.0132, "step": 213930 }, { - "epoch": 1.08, - "learning_rate": 0.00013809677565826316, - "loss": 0.009, + "epoch": 0.55, + "learning_rate": 0.0002168154989488855, + "loss": 0.0166, "step": 213940 }, { - "epoch": 1.08, - "learning_rate": 0.00013808920796524915, - "loss": 0.0091, + "epoch": 0.55, + "learning_rate": 0.000216811610732514, + "loss": 0.0205, "step": 213950 }, { - "epoch": 1.08, - "learning_rate": 0.00013808164027223513, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021680772251614255, + "loss": 0.0173, "step": 213960 }, { - "epoch": 1.08, - "learning_rate": 0.00013807407257922114, - "loss": 0.0152, + "epoch": 0.55, + "learning_rate": 0.00021680383429977112, + "loss": 0.0186, "step": 213970 }, { - "epoch": 1.08, - "learning_rate": 0.00013806650488620712, - "loss": 0.0104, + "epoch": 0.55, + "learning_rate": 0.00021679994608339963, + "loss": 0.0197, "step": 213980 }, { - "epoch": 1.08, - "learning_rate": 0.0001380589371931931, + "epoch": 0.55, + "learning_rate": 0.00021679605786702815, "loss": 0.0146, "step": 213990 }, { - "epoch": 1.08, - "learning_rate": 0.00013805136950017908, - "loss": 0.0098, + "epoch": 0.55, + "learning_rate": 0.0002167921696506567, + "loss": 0.0189, "step": 214000 }, { - "epoch": 1.08, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.0074865869246423244, - "eval_runtime": 116.6822, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.55, + "eval_cer": 0.8817418761573248, + "eval_loss": 0.01149623654782772, + "eval_runtime": 107.8487, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, "step": 214000 }, { - "epoch": 1.08, - "learning_rate": 0.00013804380180716506, - "loss": 0.0103, + "epoch": 0.55, + "learning_rate": 0.00021678828143428526, + "loss": 0.0176, "step": 214010 }, { - "epoch": 1.08, - "learning_rate": 0.00013803623411415107, - "loss": 0.0094, + "epoch": 0.55, + "learning_rate": 0.00021678439321791377, + "loss": 0.0185, "step": 214020 }, { - "epoch": 1.08, - "learning_rate": 0.00013802866642113705, - "loss": 0.0128, + "epoch": 0.55, + "learning_rate": 0.00021678050500154231, + "loss": 0.0148, "step": 214030 }, { - "epoch": 1.08, - "learning_rate": 0.00013802109872812303, - "loss": 0.011, + "epoch": 0.55, + "learning_rate": 0.00021677661678517083, + "loss": 0.0218, "step": 214040 }, { - "epoch": 1.08, - "learning_rate": 0.00013801353103510904, - "loss": 0.0086, + "epoch": 0.55, + "learning_rate": 0.0002167727285687994, + "loss": 0.0146, "step": 214050 }, { - "epoch": 1.08, - "learning_rate": 0.00013800596334209502, - "loss": 0.01, + "epoch": 0.55, + "learning_rate": 0.0002167688403524279, + "loss": 0.0157, "step": 214060 }, { - "epoch": 1.08, - "learning_rate": 0.000137998395649081, - "loss": 0.0124, + "epoch": 0.55, + "learning_rate": 0.00021676495213605645, + "loss": 0.0136, "step": 214070 }, { - "epoch": 1.08, - "learning_rate": 0.000137990827956067, - "loss": 0.0109, + "epoch": 0.55, + "learning_rate": 0.00021676106391968497, + "loss": 0.0162, "step": 214080 }, { - "epoch": 1.08, - "learning_rate": 0.000137983260263053, - "loss": 0.0105, + "epoch": 0.55, + "learning_rate": 0.00021675717570331354, + "loss": 0.0186, "step": 214090 }, { - "epoch": 1.08, - "learning_rate": 0.00013797569257003898, - "loss": 0.0111, + "epoch": 0.55, + "learning_rate": 0.00021675328748694205, + "loss": 0.0148, "step": 214100 }, { - "epoch": 1.08, - "learning_rate": 0.00013796812487702498, - "loss": 0.0144, + "epoch": 0.56, + "learning_rate": 0.0002167493992705706, + "loss": 0.0162, "step": 214110 }, { - "epoch": 1.08, - "learning_rate": 0.00013796055718401097, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.0002167455110541991, + "loss": 0.0184, "step": 214120 }, { - "epoch": 1.08, - "learning_rate": 0.00013795298949099695, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021674162283782765, + "loss": 0.0185, "step": 214130 }, { - "epoch": 1.08, - "learning_rate": 0.00013794542179798293, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021673773462145622, + "loss": 0.0155, "step": 214140 }, { - "epoch": 1.08, - "learning_rate": 0.00013793785410496894, - "loss": 0.0135, + "epoch": 0.56, + "learning_rate": 0.00021673384640508473, + "loss": 0.0198, "step": 214150 }, { - "epoch": 1.08, - "learning_rate": 0.00013793028641195492, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021672995818871325, + "loss": 0.0214, "step": 214160 }, { - "epoch": 1.08, - "learning_rate": 0.0001379227187189409, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002167260699723418, + "loss": 0.0177, "step": 214170 }, { - "epoch": 1.08, - "learning_rate": 0.0001379151510259269, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021672218175597036, + "loss": 0.0154, "step": 214180 }, { - "epoch": 1.08, - "learning_rate": 0.0001379075833329129, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.00021671829353959887, + "loss": 0.0162, "step": 214190 }, { - "epoch": 1.08, - "learning_rate": 0.00013790001563989887, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021671440532322741, + "loss": 0.0169, "step": 214200 }, { - "epoch": 1.08, - "learning_rate": 0.00013789244794688488, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021671051710685593, + "loss": 0.0231, "step": 214210 }, { - "epoch": 1.08, - "learning_rate": 0.00013788488025387086, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.0002167066288904845, + "loss": 0.0166, "step": 214220 }, { - "epoch": 1.08, - "learning_rate": 0.00013787731256085684, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.000216702740674113, + "loss": 0.0165, "step": 214230 }, { - "epoch": 1.08, - "learning_rate": 0.00013786974486784285, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021669885245774155, + "loss": 0.0181, "step": 214240 }, { - "epoch": 1.08, - "learning_rate": 0.00013786217717482883, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021669496424137007, + "loss": 0.0158, "step": 214250 }, { - "epoch": 1.08, - "learning_rate": 0.00013785460948181481, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021669107602499864, + "loss": 0.0229, "step": 214260 }, { - "epoch": 1.08, - "learning_rate": 0.00013784704178880082, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021668718780862715, + "loss": 0.0194, "step": 214270 }, { - "epoch": 1.08, - "learning_rate": 0.0001378394740957868, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.0002166832995922557, + "loss": 0.0161, "step": 214280 }, { - "epoch": 1.08, - "learning_rate": 0.00013783190640277279, - "loss": 0.007, + "epoch": 0.56, + "learning_rate": 0.0002166794113758842, + "loss": 0.0161, "step": 214290 }, { - "epoch": 1.08, - "learning_rate": 0.00013782433870975877, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021667552315951278, + "loss": 0.018, "step": 214300 }, { - "epoch": 1.08, - "learning_rate": 0.00013781677101674478, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.0002166716349431413, + "loss": 0.0168, "step": 214310 }, { - "epoch": 1.08, - "learning_rate": 0.00013780920332373076, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.00021666774672676983, + "loss": 0.0163, "step": 214320 }, { - "epoch": 1.08, - "learning_rate": 0.00013780163563071674, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021666385851039835, + "loss": 0.0173, "step": 214330 }, { - "epoch": 1.08, - "learning_rate": 0.00013779406793770275, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021665997029402692, + "loss": 0.0145, "step": 214340 }, { - "epoch": 1.08, - "learning_rate": 0.00013778650024468873, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021665608207765546, + "loss": 0.0169, "step": 214350 }, { - "epoch": 1.08, - "learning_rate": 0.0001377789325516747, - "loss": 0.0122, + "epoch": 0.56, + "learning_rate": 0.00021665219386128397, + "loss": 0.0136, "step": 214360 }, { - "epoch": 1.08, - "learning_rate": 0.00013777136485866072, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.0002166483056449125, + "loss": 0.0151, "step": 214370 }, { - "epoch": 1.08, - "learning_rate": 0.0001377637971656467, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021664441742854103, + "loss": 0.0172, "step": 214380 }, { - "epoch": 1.08, - "learning_rate": 0.00013775622947263268, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.0002166405292121696, + "loss": 0.0235, "step": 214390 }, { - "epoch": 1.08, - "learning_rate": 0.0001377486617796187, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.0002166366409957981, + "loss": 0.017, "step": 214400 }, { - "epoch": 1.08, - "learning_rate": 0.00013774109408660467, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021663275277942665, + "loss": 0.0196, "step": 214410 }, { - "epoch": 1.08, - "learning_rate": 0.00013773352639359065, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.00021662886456305517, + "loss": 0.019, "step": 214420 }, { - "epoch": 1.08, - "learning_rate": 0.00013772595870057666, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021662497634668374, + "loss": 0.0193, "step": 214430 }, { - "epoch": 1.08, - "learning_rate": 0.00013771839100756264, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021662108813031225, + "loss": 0.0147, "step": 214440 }, { - "epoch": 1.08, - "learning_rate": 0.00013771082331454862, - "loss": 0.0075, + "epoch": 0.56, + "learning_rate": 0.0002166171999139408, + "loss": 0.0169, "step": 214450 }, { - "epoch": 1.08, - "learning_rate": 0.0001377032556215346, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.0002166133116975693, + "loss": 0.0152, "step": 214460 }, { - "epoch": 1.08, - "learning_rate": 0.00013769568792852061, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021660942348119788, + "loss": 0.0175, "step": 214470 }, { - "epoch": 1.08, - "learning_rate": 0.0001376881202355066, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002166055352648264, + "loss": 0.0202, "step": 214480 }, { - "epoch": 1.08, - "learning_rate": 0.00013768055254249258, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021660164704845493, + "loss": 0.02, "step": 214490 }, { - "epoch": 1.08, - "learning_rate": 0.00013767298484947859, - "loss": 0.014, + "epoch": 0.56, + "learning_rate": 0.00021659775883208345, + "loss": 0.017, "step": 214500 }, { - "epoch": 1.08, - "learning_rate": 0.00013766541715646457, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021659387061571201, + "loss": 0.0166, "step": 214510 }, { - "epoch": 1.08, - "learning_rate": 0.00013765784946345055, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021658998239934056, + "loss": 0.0263, "step": 214520 }, { - "epoch": 1.08, - "learning_rate": 0.00013765028177043656, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021658609418296907, + "loss": 0.0191, "step": 214530 }, { - "epoch": 1.08, - "learning_rate": 0.00013764271407742254, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002165822059665976, + "loss": 0.0155, "step": 214540 }, { - "epoch": 1.08, - "learning_rate": 0.00013763514638440852, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021657831775022615, + "loss": 0.0204, "step": 214550 }, { - "epoch": 1.08, - "learning_rate": 0.00013762757869139453, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.0002165744295338547, + "loss": 0.0172, "step": 214560 }, { - "epoch": 1.08, - "learning_rate": 0.0001376200109983805, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.0002165705413174832, + "loss": 0.0176, "step": 214570 }, { - "epoch": 1.08, - "learning_rate": 0.0001376124433053665, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021656665310111175, + "loss": 0.018, "step": 214580 }, { - "epoch": 1.08, - "learning_rate": 0.0001376048756123525, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.0002165627648847403, + "loss": 0.0171, "step": 214590 }, { - "epoch": 1.08, - "learning_rate": 0.00013759730791933848, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021655887666836884, + "loss": 0.0218, "step": 214600 }, { - "epoch": 1.08, - "learning_rate": 0.00013758974022632446, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021655498845199735, + "loss": 0.0154, "step": 214610 }, { - "epoch": 1.08, - "learning_rate": 0.00013758217253331045, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.0002165511002356259, + "loss": 0.0166, "step": 214620 }, { - "epoch": 1.08, - "learning_rate": 0.00013757460484029643, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.0002165472120192544, + "loss": 0.0182, "step": 214630 }, { - "epoch": 1.08, - "learning_rate": 0.00013756703714728244, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021654332380288297, + "loss": 0.0181, "step": 214640 }, { - "epoch": 1.08, - "learning_rate": 0.00013755946945426842, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.0002165394355865115, + "loss": 0.0155, "step": 214650 }, { - "epoch": 1.08, - "learning_rate": 0.0001375519017612544, - "loss": 0.0121, + "epoch": 0.56, + "learning_rate": 0.00021653554737014003, + "loss": 0.0149, "step": 214660 }, { - "epoch": 1.08, - "learning_rate": 0.00013754433406824038, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021653165915376855, + "loss": 0.0175, "step": 214670 }, { - "epoch": 1.08, - "learning_rate": 0.0001375367663752264, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.00021652777093739711, + "loss": 0.0202, "step": 214680 }, { - "epoch": 1.08, - "learning_rate": 0.00013752919868221237, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021652388272102566, + "loss": 0.0122, "step": 214690 }, { - "epoch": 1.08, - "learning_rate": 0.00013752163098919835, - "loss": 0.0136, + "epoch": 0.56, + "learning_rate": 0.00021651999450465417, + "loss": 0.0191, "step": 214700 }, { - "epoch": 1.08, - "learning_rate": 0.00013751406329618436, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021651610628828268, + "loss": 0.0125, "step": 214710 }, { - "epoch": 1.08, - "learning_rate": 0.00013750649560317034, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.00021651221807191125, + "loss": 0.0153, "step": 214720 }, { - "epoch": 1.08, - "learning_rate": 0.00013749892791015632, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002165083298555398, + "loss": 0.0138, "step": 214730 }, { - "epoch": 1.08, - "learning_rate": 0.00013749136021714233, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.0002165044416391683, + "loss": 0.0172, "step": 214740 }, { - "epoch": 1.08, - "learning_rate": 0.0001374837925241283, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021650055342279685, + "loss": 0.0165, "step": 214750 }, { - "epoch": 1.08, - "learning_rate": 0.0001374762248311143, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.0002164966652064254, + "loss": 0.0161, "step": 214760 }, { - "epoch": 1.08, - "learning_rate": 0.0001374686571381003, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021649277699005393, + "loss": 0.0198, "step": 214770 }, { - "epoch": 1.08, - "learning_rate": 0.00013746108944508628, - "loss": 0.0078, + "epoch": 0.56, + "learning_rate": 0.00021648888877368245, + "loss": 0.0179, "step": 214780 }, { - "epoch": 1.08, - "learning_rate": 0.00013745352175207227, - "loss": 0.0073, + "epoch": 0.56, + "learning_rate": 0.000216485000557311, + "loss": 0.013, "step": 214790 }, { - "epoch": 1.08, - "learning_rate": 0.00013744595405905827, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021648111234093953, + "loss": 0.0169, "step": 214800 }, { - "epoch": 1.08, - "learning_rate": 0.00013743838636604426, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021647722412456807, + "loss": 0.0184, "step": 214810 }, { - "epoch": 1.08, - "learning_rate": 0.00013743081867303024, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.0002164733359081966, + "loss": 0.0209, "step": 214820 }, { - "epoch": 1.08, - "learning_rate": 0.00013742325098001622, - "loss": 0.0073, + "epoch": 0.56, + "learning_rate": 0.00021646944769182513, + "loss": 0.0179, "step": 214830 }, { - "epoch": 1.08, - "learning_rate": 0.00013741568328700223, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.0002164655594754537, + "loss": 0.0149, "step": 214840 }, { - "epoch": 1.08, - "learning_rate": 0.0001374081155939882, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021646167125908221, + "loss": 0.0164, "step": 214850 }, { - "epoch": 1.08, - "learning_rate": 0.0001374005479009742, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021645778304271076, + "loss": 0.0137, "step": 214860 }, { - "epoch": 1.08, - "learning_rate": 0.0001373929802079602, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021645389482633927, + "loss": 0.0142, "step": 214870 }, { - "epoch": 1.08, - "learning_rate": 0.00013738541251494618, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021645000660996778, + "loss": 0.0179, "step": 214880 }, { - "epoch": 1.08, - "learning_rate": 0.00013737784482193216, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021644611839359635, + "loss": 0.0156, "step": 214890 }, { - "epoch": 1.08, - "learning_rate": 0.00013737027712891817, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.0002164422301772249, + "loss": 0.0143, "step": 214900 }, { - "epoch": 1.08, - "learning_rate": 0.00013736270943590415, - "loss": 0.0077, + "epoch": 0.56, + "learning_rate": 0.0002164383419608534, + "loss": 0.0188, "step": 214910 }, { - "epoch": 1.08, - "learning_rate": 0.00013735514174289013, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021643445374448195, + "loss": 0.0142, "step": 214920 }, { - "epoch": 1.08, - "learning_rate": 0.00013734757404987614, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002164305655281105, + "loss": 0.0165, "step": 214930 }, { - "epoch": 1.08, - "learning_rate": 0.00013734000635686212, - "loss": 0.0137, + "epoch": 0.56, + "learning_rate": 0.00021642667731173903, + "loss": 0.0185, "step": 214940 }, { - "epoch": 1.08, - "learning_rate": 0.0001373324386638481, - "loss": 0.0117, + "epoch": 0.56, + "learning_rate": 0.00021642278909536755, + "loss": 0.0132, "step": 214950 }, { - "epoch": 1.08, - "learning_rate": 0.0001373248709708341, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.0002164189008789961, + "loss": 0.0207, "step": 214960 }, { - "epoch": 1.08, - "learning_rate": 0.0001373173032778201, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021641501266262463, + "loss": 0.0184, "step": 214970 }, { - "epoch": 1.08, - "learning_rate": 0.00013730973558480608, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021641112444625317, + "loss": 0.0213, "step": 214980 }, { - "epoch": 1.08, - "learning_rate": 0.00013730216789179206, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.0002164072362298817, + "loss": 0.0148, "step": 214990 }, { - "epoch": 1.08, - "learning_rate": 0.00013729460019877807, - "loss": 0.0132, + "epoch": 0.56, + "learning_rate": 0.00021640334801351023, + "loss": 0.0152, "step": 215000 }, { - "epoch": 1.08, - "eval_cer": 0.9144809302605417, - "eval_loss": 0.0071860929019749165, - "eval_runtime": 116.5447, - "eval_samples_per_second": 17.161, - "eval_steps_per_second": 4.29, + "epoch": 0.56, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.011770045384764671, + "eval_runtime": 107.7843, + "eval_samples_per_second": 18.556, + "eval_steps_per_second": 4.639, "step": 215000 }, { - "epoch": 1.08, - "learning_rate": 0.00013728703250576405, - "loss": 0.013, + "epoch": 0.56, + "learning_rate": 0.0002163994597971388, + "loss": 0.0123, "step": 215010 }, { - "epoch": 1.08, - "learning_rate": 0.00013727946481275003, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.0002163955715807673, + "loss": 0.0195, "step": 215020 }, { - "epoch": 1.08, - "learning_rate": 0.00013727189711973604, - "loss": 0.0118, + "epoch": 0.56, + "learning_rate": 0.00021639168336439583, + "loss": 0.0231, "step": 215030 }, { - "epoch": 1.08, - "learning_rate": 0.00013726432942672202, - "loss": 0.0071, + "epoch": 0.56, + "learning_rate": 0.00021638779514802437, + "loss": 0.0146, "step": 215040 }, { - "epoch": 1.08, - "learning_rate": 0.000137256761733708, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021638390693165294, + "loss": 0.015, "step": 215050 }, { - "epoch": 1.09, - "learning_rate": 0.000137249194040694, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021638001871528145, + "loss": 0.0146, "step": 215060 }, { - "epoch": 1.09, - "learning_rate": 0.00013724162634768, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021637613049891, + "loss": 0.0158, "step": 215070 }, { - "epoch": 1.09, - "learning_rate": 0.00013723405865466597, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.0002163722422825385, + "loss": 0.0238, "step": 215080 }, { - "epoch": 1.09, - "learning_rate": 0.00013722649096165198, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021636835406616708, + "loss": 0.0197, "step": 215090 }, { - "epoch": 1.09, - "learning_rate": 0.00013721892326863796, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.0002163644658497956, + "loss": 0.0186, "step": 215100 }, { - "epoch": 1.09, - "learning_rate": 0.00013721135557562394, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021636057763342413, + "loss": 0.0187, "step": 215110 }, { - "epoch": 1.09, - "learning_rate": 0.00013720378788260995, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021635668941705265, + "loss": 0.0184, "step": 215120 }, { - "epoch": 1.09, - "learning_rate": 0.00013719622018959593, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002163528012006812, + "loss": 0.0169, "step": 215130 }, { - "epoch": 1.09, - "learning_rate": 0.00013718865249658191, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021634891298430973, + "loss": 0.0151, "step": 215140 }, { - "epoch": 1.09, - "learning_rate": 0.00013718108480356792, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021634502476793827, + "loss": 0.0169, "step": 215150 }, { - "epoch": 1.09, - "learning_rate": 0.0001371735171105539, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.0002163411365515668, + "loss": 0.0213, "step": 215160 }, { - "epoch": 1.09, - "learning_rate": 0.00013716594941753989, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021633724833519533, + "loss": 0.0193, "step": 215170 }, { - "epoch": 1.09, - "learning_rate": 0.00013715838172452587, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021633336011882387, + "loss": 0.0173, "step": 215180 }, { - "epoch": 1.09, - "learning_rate": 0.00013715081403151188, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002163294719024524, + "loss": 0.0164, "step": 215190 }, { - "epoch": 1.09, - "learning_rate": 0.00013714324633849786, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021632558368608093, + "loss": 0.0142, "step": 215200 }, { - "epoch": 1.09, - "learning_rate": 0.00013713567864548384, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021632169546970947, + "loss": 0.0129, "step": 215210 }, { - "epoch": 1.09, - "learning_rate": 0.00013712811095246985, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021631780725333804, + "loss": 0.0167, "step": 215220 }, { - "epoch": 1.09, - "learning_rate": 0.00013712054325945583, - "loss": 0.0078, + "epoch": 0.56, + "learning_rate": 0.00021631391903696655, + "loss": 0.0128, "step": 215230 }, { - "epoch": 1.09, - "learning_rate": 0.0001371129755664418, - "loss": 0.0113, + "epoch": 0.56, + "learning_rate": 0.0002163100308205951, + "loss": 0.0187, "step": 215240 }, { - "epoch": 1.09, - "learning_rate": 0.0001371054078734278, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002163061426042236, + "loss": 0.0167, "step": 215250 }, { - "epoch": 1.09, - "learning_rate": 0.00013709784018041377, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021630225438785218, + "loss": 0.0154, "step": 215260 }, { - "epoch": 1.09, - "learning_rate": 0.00013709027248739978, - "loss": 0.0121, + "epoch": 0.56, + "learning_rate": 0.0002162983661714807, + "loss": 0.017, "step": 215270 }, { - "epoch": 1.09, - "learning_rate": 0.00013708270479438576, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021629447795510923, + "loss": 0.0157, "step": 215280 }, { - "epoch": 1.09, - "learning_rate": 0.00013707513710137174, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021629058973873775, + "loss": 0.0153, "step": 215290 }, { - "epoch": 1.09, - "learning_rate": 0.00013706756940835775, - "loss": 0.0075, + "epoch": 0.56, + "learning_rate": 0.00021628670152236632, + "loss": 0.0158, "step": 215300 }, { - "epoch": 1.09, - "learning_rate": 0.00013706000171534373, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021628281330599483, + "loss": 0.0137, "step": 215310 }, { - "epoch": 1.09, - "learning_rate": 0.00013705243402232972, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021627892508962337, + "loss": 0.0192, "step": 215320 }, { - "epoch": 1.09, - "learning_rate": 0.00013704486632931572, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.0002162750368732519, + "loss": 0.0133, "step": 215330 }, { - "epoch": 1.09, - "learning_rate": 0.0001370372986363017, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021627114865688046, + "loss": 0.0158, "step": 215340 }, { - "epoch": 1.09, - "learning_rate": 0.0001370297309432877, - "loss": 0.0125, + "epoch": 0.56, + "learning_rate": 0.00021626726044050897, + "loss": 0.0126, "step": 215350 }, { - "epoch": 1.09, - "learning_rate": 0.00013702216325027367, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.0002162633722241375, + "loss": 0.0137, "step": 215360 }, { - "epoch": 1.09, - "learning_rate": 0.00013701459555725968, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021625948400776603, + "loss": 0.0178, "step": 215370 }, { - "epoch": 1.09, - "learning_rate": 0.00013700702786424566, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021625559579139457, + "loss": 0.0203, "step": 215380 }, { - "epoch": 1.09, - "learning_rate": 0.00013699946017123164, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021625170757502314, + "loss": 0.0195, "step": 215390 }, { - "epoch": 1.09, - "learning_rate": 0.00013699189247821765, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021624781935865165, + "loss": 0.0129, "step": 215400 }, { - "epoch": 1.09, - "learning_rate": 0.00013698432478520363, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.0002162439311422802, + "loss": 0.016, "step": 215410 }, { - "epoch": 1.09, - "learning_rate": 0.0001369767570921896, - "loss": 0.014, + "epoch": 0.56, + "learning_rate": 0.0002162400429259087, + "loss": 0.0162, "step": 215420 }, { - "epoch": 1.09, - "learning_rate": 0.00013696918939917562, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021623615470953728, + "loss": 0.0141, "step": 215430 }, { - "epoch": 1.09, - "learning_rate": 0.0001369616217061616, - "loss": 0.0123, + "epoch": 0.56, + "learning_rate": 0.0002162322664931658, + "loss": 0.0139, "step": 215440 }, { - "epoch": 1.09, - "learning_rate": 0.00013695405401314758, - "loss": 0.0127, + "epoch": 0.56, + "learning_rate": 0.00021622837827679433, + "loss": 0.0155, "step": 215450 }, { - "epoch": 1.09, - "learning_rate": 0.0001369464863201336, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021622449006042285, + "loss": 0.0199, "step": 215460 }, { - "epoch": 1.09, - "learning_rate": 0.00013693891862711957, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.00021622060184405142, + "loss": 0.0144, "step": 215470 }, { - "epoch": 1.09, - "learning_rate": 0.00013693135093410555, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.00021621671362767993, + "loss": 0.0215, "step": 215480 }, { - "epoch": 1.09, - "learning_rate": 0.00013692378324109156, - "loss": 0.0138, + "epoch": 0.56, + "learning_rate": 0.00021621282541130847, + "loss": 0.0156, "step": 215490 }, { - "epoch": 1.09, - "learning_rate": 0.00013691621554807754, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021620893719493699, + "loss": 0.0153, "step": 215500 }, { - "epoch": 1.09, - "learning_rate": 0.00013690864785506353, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021620504897856556, + "loss": 0.0157, "step": 215510 }, { - "epoch": 1.09, - "learning_rate": 0.0001369010801620495, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021620116076219407, + "loss": 0.0168, "step": 215520 }, { - "epoch": 1.09, - "learning_rate": 0.00013689351246903552, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.0002161972725458226, + "loss": 0.0218, "step": 215530 }, { - "epoch": 1.09, - "learning_rate": 0.0001368859447760215, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021619338432945113, + "loss": 0.0199, "step": 215540 }, { - "epoch": 1.09, - "learning_rate": 0.00013687837708300748, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.0002161894961130797, + "loss": 0.017, "step": 215550 }, { - "epoch": 1.09, - "learning_rate": 0.0001368708093899935, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021618560789670824, + "loss": 0.0174, "step": 215560 }, { - "epoch": 1.09, - "learning_rate": 0.00013686324169697947, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021618171968033675, + "loss": 0.0189, "step": 215570 }, { - "epoch": 1.09, - "learning_rate": 0.00013685567400396545, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021617783146396527, + "loss": 0.019, "step": 215580 }, { - "epoch": 1.09, - "learning_rate": 0.00013684810631095146, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021617394324759383, + "loss": 0.0153, "step": 215590 }, { - "epoch": 1.09, - "learning_rate": 0.00013684053861793744, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.00021617005503122238, + "loss": 0.0119, "step": 215600 }, { - "epoch": 1.09, - "learning_rate": 0.00013683297092492342, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002161661668148509, + "loss": 0.0186, "step": 215610 }, { - "epoch": 1.09, - "learning_rate": 0.00013682540323190943, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021616227859847943, + "loss": 0.0146, "step": 215620 }, { - "epoch": 1.09, - "learning_rate": 0.0001368178355388954, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021615839038210795, + "loss": 0.0141, "step": 215630 }, { - "epoch": 1.09, - "learning_rate": 0.0001368102678458814, - "loss": 0.0116, + "epoch": 0.56, + "learning_rate": 0.00021615450216573652, + "loss": 0.0173, "step": 215640 }, { - "epoch": 1.09, - "learning_rate": 0.0001368027001528674, - "loss": 0.0128, + "epoch": 0.56, + "learning_rate": 0.00021615061394936503, + "loss": 0.0139, "step": 215650 }, { - "epoch": 1.09, - "learning_rate": 0.00013679513245985338, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021614672573299357, + "loss": 0.0157, "step": 215660 }, { - "epoch": 1.09, - "learning_rate": 0.00013678756476683936, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021614283751662209, + "loss": 0.0155, "step": 215670 }, { - "epoch": 1.09, - "learning_rate": 0.00013677999707382537, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021613894930025065, + "loss": 0.0178, "step": 215680 }, { - "epoch": 1.09, - "learning_rate": 0.00013677242938081135, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021613506108387917, + "loss": 0.0159, "step": 215690 }, { - "epoch": 1.09, - "learning_rate": 0.00013676486168779734, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002161311728675077, + "loss": 0.0185, "step": 215700 }, { - "epoch": 1.09, - "learning_rate": 0.00013675729399478332, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021612728465113623, + "loss": 0.0139, "step": 215710 }, { - "epoch": 1.09, - "learning_rate": 0.00013674972630176933, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.0002161233964347648, + "loss": 0.0175, "step": 215720 }, { - "epoch": 1.09, - "learning_rate": 0.0001367421586087553, - "loss": 0.012, + "epoch": 0.56, + "learning_rate": 0.00021611950821839334, + "loss": 0.0151, "step": 215730 }, { - "epoch": 1.09, - "learning_rate": 0.0001367345909157413, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021611562000202185, + "loss": 0.0189, "step": 215740 }, { - "epoch": 1.09, - "learning_rate": 0.0001367270232227273, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021611173178565036, + "loss": 0.0131, "step": 215750 }, { - "epoch": 1.09, - "learning_rate": 0.00013671945552971328, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021610784356927893, + "loss": 0.0191, "step": 215760 }, { - "epoch": 1.09, - "learning_rate": 0.00013671188783669926, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021610395535290748, + "loss": 0.0182, "step": 215770 }, { - "epoch": 1.09, - "learning_rate": 0.00013670432014368527, - "loss": 0.0066, + "epoch": 0.56, + "learning_rate": 0.000216100067136536, + "loss": 0.0162, "step": 215780 }, { - "epoch": 1.09, - "learning_rate": 0.00013669675245067125, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021609617892016453, + "loss": 0.0149, "step": 215790 }, { - "epoch": 1.09, - "learning_rate": 0.00013668918475765723, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021609229070379307, + "loss": 0.0164, "step": 215800 }, { - "epoch": 1.09, - "learning_rate": 0.00013668161706464324, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021608840248742161, + "loss": 0.0155, "step": 215810 }, { - "epoch": 1.09, - "learning_rate": 0.00013667404937162922, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021608451427105013, + "loss": 0.0145, "step": 215820 }, { - "epoch": 1.09, - "learning_rate": 0.0001366664816786152, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021608062605467867, + "loss": 0.0143, "step": 215830 }, { - "epoch": 1.09, - "learning_rate": 0.0001366589139856012, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002160767378383072, + "loss": 0.0165, "step": 215840 }, { - "epoch": 1.09, - "learning_rate": 0.0001366513462925872, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021607284962193575, + "loss": 0.0139, "step": 215850 }, { - "epoch": 1.09, - "learning_rate": 0.00013664377859957317, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021606896140556427, + "loss": 0.0141, "step": 215860 }, { - "epoch": 1.09, - "learning_rate": 0.00013663621090655916, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.0002160650731891928, + "loss": 0.0154, "step": 215870 }, { - "epoch": 1.09, - "learning_rate": 0.00013662864321354514, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021606118497282132, + "loss": 0.0187, "step": 215880 }, { - "epoch": 1.09, - "learning_rate": 0.00013662107552053112, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002160572967564499, + "loss": 0.0146, "step": 215890 }, { - "epoch": 1.09, - "learning_rate": 0.00013661350782751713, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002160534085400784, + "loss": 0.0146, "step": 215900 }, { - "epoch": 1.09, - "learning_rate": 0.0001366059401345031, - "loss": 0.0145, + "epoch": 0.56, + "learning_rate": 0.00021604952032370695, + "loss": 0.0144, "step": 215910 }, { - "epoch": 1.09, - "learning_rate": 0.0001365983724414891, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021604563210733546, + "loss": 0.0162, "step": 215920 }, { - "epoch": 1.09, - "learning_rate": 0.0001365908047484751, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021604174389096403, + "loss": 0.0204, "step": 215930 }, { - "epoch": 1.09, - "learning_rate": 0.00013658323705546108, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021603785567459257, + "loss": 0.0179, "step": 215940 }, { - "epoch": 1.09, - "learning_rate": 0.00013657566936244706, - "loss": 0.0074, + "epoch": 0.56, + "learning_rate": 0.0002160339674582211, + "loss": 0.0167, "step": 215950 }, { - "epoch": 1.09, - "learning_rate": 0.00013656810166943307, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021603007924184963, + "loss": 0.0194, "step": 215960 }, { - "epoch": 1.09, - "learning_rate": 0.00013656053397641905, - "loss": 0.0076, + "epoch": 0.56, + "learning_rate": 0.00021602619102547817, + "loss": 0.0174, "step": 215970 }, { - "epoch": 1.09, - "learning_rate": 0.00013655296628340503, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021602230280910671, + "loss": 0.022, "step": 215980 }, { - "epoch": 1.09, - "learning_rate": 0.00013654539859039104, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021601841459273523, + "loss": 0.0158, "step": 215990 }, { - "epoch": 1.09, - "learning_rate": 0.00013653783089737702, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021601452637636377, + "loss": 0.0189, "step": 216000 }, { - "epoch": 1.09, - "eval_cer": 0.9144760782799146, - "eval_loss": 0.0073201656341552734, - "eval_runtime": 116.5986, - "eval_samples_per_second": 17.153, - "eval_steps_per_second": 4.288, + "epoch": 0.56, + "eval_cer": 0.8817712685329425, + "eval_loss": 0.011435981839895248, + "eval_runtime": 108.0861, + "eval_samples_per_second": 18.504, + "eval_steps_per_second": 4.626, "step": 216000 }, { - "epoch": 1.09, - "learning_rate": 0.000136530263204363, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002160106381599923, + "loss": 0.0162, "step": 216010 }, { - "epoch": 1.09, - "learning_rate": 0.000136522695511349, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021600674994362085, + "loss": 0.0178, "step": 216020 }, { - "epoch": 1.09, - "learning_rate": 0.000136515127818335, - "loss": 0.0064, + "epoch": 0.56, + "learning_rate": 0.00021600286172724937, + "loss": 0.0162, "step": 216030 }, { - "epoch": 1.09, - "learning_rate": 0.00013650756012532098, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.0002159989735108779, + "loss": 0.0152, "step": 216040 }, { - "epoch": 1.09, - "learning_rate": 0.00013649999243230698, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021599508529450645, + "loss": 0.016, "step": 216050 }, { - "epoch": 1.09, - "learning_rate": 0.00013649242473929297, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.000215991197078135, + "loss": 0.0154, "step": 216060 }, { - "epoch": 1.09, - "learning_rate": 0.00013648485704627895, - "loss": 0.0128, + "epoch": 0.56, + "learning_rate": 0.0002159873088617635, + "loss": 0.0139, "step": 216070 }, { - "epoch": 1.09, - "learning_rate": 0.00013647728935326493, - "loss": 0.012, + "epoch": 0.56, + "learning_rate": 0.00021598342064539205, + "loss": 0.0188, "step": 216080 }, { - "epoch": 1.09, - "learning_rate": 0.00013646972166025094, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021597953242902062, + "loss": 0.0194, "step": 216090 }, { - "epoch": 1.09, - "learning_rate": 0.00013646215396723692, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021597564421264913, + "loss": 0.0159, "step": 216100 }, { - "epoch": 1.09, - "learning_rate": 0.0001364545862742229, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021597175599627767, + "loss": 0.0159, "step": 216110 }, { - "epoch": 1.09, - "learning_rate": 0.0001364470185812089, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.0002159678677799062, + "loss": 0.017, "step": 216120 }, { - "epoch": 1.09, - "learning_rate": 0.0001364394508881949, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021596397956353473, + "loss": 0.0148, "step": 216130 }, { - "epoch": 1.09, - "learning_rate": 0.00013643188319518087, - "loss": 0.0068, + "epoch": 0.56, + "learning_rate": 0.00021596009134716327, + "loss": 0.0176, "step": 216140 }, { - "epoch": 1.09, - "learning_rate": 0.00013642431550216688, - "loss": 0.012, + "epoch": 0.56, + "learning_rate": 0.0002159562031307918, + "loss": 0.0171, "step": 216150 }, { - "epoch": 1.09, - "learning_rate": 0.00013641674780915286, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021595231491442033, + "loss": 0.0158, "step": 216160 }, { - "epoch": 1.09, - "learning_rate": 0.00013640918011613884, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021594842669804887, + "loss": 0.0202, "step": 216170 }, { - "epoch": 1.09, - "learning_rate": 0.00013640161242312485, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.0002159445384816774, + "loss": 0.0155, "step": 216180 }, { - "epoch": 1.09, - "learning_rate": 0.00013639404473011083, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021594065026530595, + "loss": 0.0147, "step": 216190 }, { - "epoch": 1.09, - "learning_rate": 0.00013638647703709681, - "loss": 0.0068, + "epoch": 0.56, + "learning_rate": 0.00021593676204893447, + "loss": 0.0213, "step": 216200 }, { - "epoch": 1.09, - "learning_rate": 0.00013637890934408282, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.000215932873832563, + "loss": 0.0169, "step": 216210 }, { - "epoch": 1.09, - "learning_rate": 0.0001363713416510688, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021592898561619155, + "loss": 0.0203, "step": 216220 }, { - "epoch": 1.09, - "learning_rate": 0.00013636377395805479, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.0002159250973998201, + "loss": 0.0192, "step": 216230 }, { - "epoch": 1.09, - "learning_rate": 0.00013635620626504077, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.0002159212091834486, + "loss": 0.0175, "step": 216240 }, { - "epoch": 1.09, - "learning_rate": 0.00013634863857202678, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021591732096707715, + "loss": 0.016, "step": 216250 }, { - "epoch": 1.09, - "learning_rate": 0.00013634107087901276, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021591343275070572, + "loss": 0.0241, "step": 216260 }, { - "epoch": 1.09, - "learning_rate": 0.00013633350318599874, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.00021590954453433423, + "loss": 0.0153, "step": 216270 }, { - "epoch": 1.09, - "learning_rate": 0.00013632593549298475, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021590565631796277, + "loss": 0.0167, "step": 216280 }, { - "epoch": 1.09, - "learning_rate": 0.00013631836779997073, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.0002159017681015913, + "loss": 0.0158, "step": 216290 }, { - "epoch": 1.09, - "learning_rate": 0.0001363108001069567, - "loss": 0.0129, + "epoch": 0.56, + "learning_rate": 0.00021589787988521986, + "loss": 0.0149, "step": 216300 }, { - "epoch": 1.09, - "learning_rate": 0.00013630323241394272, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021589399166884837, + "loss": 0.0212, "step": 216310 }, { - "epoch": 1.09, - "learning_rate": 0.0001362956647209287, - "loss": 0.0076, + "epoch": 0.56, + "learning_rate": 0.0002158901034524769, + "loss": 0.0153, "step": 216320 }, { - "epoch": 1.09, - "learning_rate": 0.00013628809702791468, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021588621523610543, + "loss": 0.0177, "step": 216330 }, { - "epoch": 1.09, - "learning_rate": 0.0001362805293349007, - "loss": 0.0075, + "epoch": 0.56, + "learning_rate": 0.000215882327019734, + "loss": 0.0144, "step": 216340 }, { - "epoch": 1.09, - "learning_rate": 0.00013627296164188667, - "loss": 0.0076, + "epoch": 0.56, + "learning_rate": 0.0002158784388033625, + "loss": 0.0143, "step": 216350 }, { - "epoch": 1.09, - "learning_rate": 0.00013626539394887265, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021587455058699105, + "loss": 0.021, "step": 216360 }, { - "epoch": 1.09, - "learning_rate": 0.00013625782625585866, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021587066237061957, + "loss": 0.016, "step": 216370 }, { - "epoch": 1.09, - "learning_rate": 0.00013625025856284464, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002158667741542481, + "loss": 0.0164, "step": 216380 }, { - "epoch": 1.09, - "learning_rate": 0.00013624269086983062, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021586288593787665, + "loss": 0.0159, "step": 216390 }, { - "epoch": 1.09, - "learning_rate": 0.0001362351231768166, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.0002158589977215052, + "loss": 0.019, "step": 216400 }, { - "epoch": 1.09, - "learning_rate": 0.00013622755548380261, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.0002158551095051337, + "loss": 0.0173, "step": 216410 }, { - "epoch": 1.09, - "learning_rate": 0.0001362199877907886, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021585122128876225, + "loss": 0.0177, "step": 216420 }, { - "epoch": 1.09, - "learning_rate": 0.00013621242009777458, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021584733307239082, + "loss": 0.0165, "step": 216430 }, { - "epoch": 1.09, - "learning_rate": 0.00013620485240476059, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021584344485601933, + "loss": 0.0168, "step": 216440 }, { - "epoch": 1.09, - "learning_rate": 0.00013619728471174657, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021583955663964787, + "loss": 0.0225, "step": 216450 }, { - "epoch": 1.09, - "learning_rate": 0.00013618971701873255, - "loss": 0.0067, + "epoch": 0.56, + "learning_rate": 0.0002158356684232764, + "loss": 0.0191, "step": 216460 }, { - "epoch": 1.09, - "learning_rate": 0.00013618214932571856, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021583178020690496, + "loss": 0.02, "step": 216470 }, { - "epoch": 1.09, - "learning_rate": 0.00013617458163270454, - "loss": 0.0074, + "epoch": 0.56, + "learning_rate": 0.00021582789199053347, + "loss": 0.015, "step": 216480 }, { - "epoch": 1.09, - "learning_rate": 0.00013616701393969052, - "loss": 0.0127, + "epoch": 0.56, + "learning_rate": 0.000215824003774162, + "loss": 0.0189, "step": 216490 }, { - "epoch": 1.09, - "learning_rate": 0.0001361594462466765, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021582011555779053, + "loss": 0.0147, "step": 216500 }, { - "epoch": 1.09, - "learning_rate": 0.00013615187855366248, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.0002158162273414191, + "loss": 0.0164, "step": 216510 }, { - "epoch": 1.09, - "learning_rate": 0.0001361443108606485, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.0002158123391250476, + "loss": 0.0144, "step": 216520 }, { - "epoch": 1.09, - "learning_rate": 0.00013613674316763447, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021580845090867615, + "loss": 0.0142, "step": 216530 }, { - "epoch": 1.09, - "learning_rate": 0.00013612917547462045, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021580456269230467, + "loss": 0.0132, "step": 216540 }, { - "epoch": 1.09, - "learning_rate": 0.00013612160778160646, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021580067447593323, + "loss": 0.0212, "step": 216550 }, { - "epoch": 1.09, - "learning_rate": 0.00013611404008859244, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021579678625956175, + "loss": 0.0174, "step": 216560 }, { - "epoch": 1.09, - "learning_rate": 0.00013610647239557843, - "loss": 0.007, + "epoch": 0.56, + "learning_rate": 0.0002157928980431903, + "loss": 0.0172, "step": 216570 }, { - "epoch": 1.09, - "learning_rate": 0.00013609890470256443, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.0002157890098268188, + "loss": 0.0221, "step": 216580 }, { - "epoch": 1.09, - "learning_rate": 0.00013609133700955042, - "loss": 0.0122, + "epoch": 0.56, + "learning_rate": 0.00021578512161044737, + "loss": 0.0162, "step": 216590 }, { - "epoch": 1.09, - "learning_rate": 0.0001360837693165364, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021578123339407592, + "loss": 0.016, "step": 216600 }, { - "epoch": 1.09, - "learning_rate": 0.00013607620162352238, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021577734517770443, + "loss": 0.0289, "step": 216610 }, { - "epoch": 1.09, - "learning_rate": 0.0001360686339305084, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021577345696133295, + "loss": 0.0193, "step": 216620 }, { - "epoch": 1.09, - "learning_rate": 0.00013606106623749437, - "loss": 0.0075, + "epoch": 0.56, + "learning_rate": 0.0002157695687449615, + "loss": 0.0157, "step": 216630 }, { - "epoch": 1.09, - "learning_rate": 0.00013605349854448035, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.00021576568052859006, + "loss": 0.0191, "step": 216640 }, { - "epoch": 1.09, - "learning_rate": 0.00013604593085146636, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021576179231221857, + "loss": 0.0185, "step": 216650 }, { - "epoch": 1.09, - "learning_rate": 0.00013603836315845234, - "loss": 0.0107, + "epoch": 0.56, + "learning_rate": 0.0002157579040958471, + "loss": 0.0271, "step": 216660 }, { - "epoch": 1.09, - "learning_rate": 0.00013603079546543832, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021575401587947563, + "loss": 0.019, "step": 216670 }, { - "epoch": 1.09, - "learning_rate": 0.00013602322777242433, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002157501276631042, + "loss": 0.0181, "step": 216680 }, { - "epoch": 1.09, - "learning_rate": 0.0001360156600794103, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002157462394467327, + "loss": 0.0167, "step": 216690 }, { - "epoch": 1.09, - "learning_rate": 0.0001360080923863963, - "loss": 0.0127, + "epoch": 0.56, + "learning_rate": 0.00021574235123036125, + "loss": 0.0199, "step": 216700 }, { - "epoch": 1.09, - "learning_rate": 0.0001360005246933823, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021573846301398977, + "loss": 0.0188, "step": 216710 }, { - "epoch": 1.09, - "learning_rate": 0.00013599295700036828, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021573457479761833, + "loss": 0.02, "step": 216720 }, { - "epoch": 1.09, - "learning_rate": 0.00013598538930735426, - "loss": 0.0153, + "epoch": 0.56, + "learning_rate": 0.00021573068658124685, + "loss": 0.0182, "step": 216730 }, { - "epoch": 1.09, - "learning_rate": 0.00013597782161434027, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.0002157267983648754, + "loss": 0.0152, "step": 216740 }, { - "epoch": 1.09, - "learning_rate": 0.00013597025392132625, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.0002157229101485039, + "loss": 0.0123, "step": 216750 }, { - "epoch": 1.09, - "learning_rate": 0.00013596268622831224, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021571902193213247, + "loss": 0.0177, "step": 216760 }, { - "epoch": 1.09, - "learning_rate": 0.00013595511853529822, - "loss": 0.0076, + "epoch": 0.56, + "learning_rate": 0.000215715133715761, + "loss": 0.017, "step": 216770 }, { - "epoch": 1.09, - "learning_rate": 0.00013594755084228423, - "loss": 0.0112, + "epoch": 0.56, + "learning_rate": 0.00021571124549938953, + "loss": 0.0205, "step": 216780 }, { - "epoch": 1.09, - "learning_rate": 0.0001359399831492702, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.00021570735728301804, + "loss": 0.016, "step": 216790 }, { - "epoch": 1.09, - "learning_rate": 0.0001359324154562562, - "loss": 0.0123, + "epoch": 0.56, + "learning_rate": 0.0002157034690666466, + "loss": 0.0148, "step": 216800 }, { - "epoch": 1.09, - "learning_rate": 0.0001359248477632422, - "loss": 0.0071, + "epoch": 0.56, + "learning_rate": 0.00021569958085027515, + "loss": 0.0143, "step": 216810 }, { - "epoch": 1.09, - "learning_rate": 0.00013591728007022818, - "loss": 0.0074, + "epoch": 0.56, + "learning_rate": 0.00021569569263390367, + "loss": 0.0207, "step": 216820 }, { - "epoch": 1.09, - "learning_rate": 0.00013590971237721416, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.0002156918044175322, + "loss": 0.0192, "step": 216830 }, { - "epoch": 1.09, - "learning_rate": 0.00013590214468420017, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021568791620116075, + "loss": 0.0218, "step": 216840 }, { - "epoch": 1.09, - "learning_rate": 0.00013589457699118615, - "loss": 0.0078, + "epoch": 0.56, + "learning_rate": 0.0002156840279847893, + "loss": 0.0191, "step": 216850 }, { - "epoch": 1.09, - "learning_rate": 0.00013588700929817213, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002156801397684178, + "loss": 0.0153, "step": 216860 }, { - "epoch": 1.09, - "learning_rate": 0.00013587944160515814, - "loss": 0.012, + "epoch": 0.56, + "learning_rate": 0.00021567625155204635, + "loss": 0.0123, "step": 216870 }, { - "epoch": 1.09, - "learning_rate": 0.00013587187391214412, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021567236333567487, + "loss": 0.0201, "step": 216880 }, { - "epoch": 1.09, - "learning_rate": 0.0001358643062191301, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021566847511930343, + "loss": 0.0178, "step": 216890 }, { - "epoch": 1.09, - "learning_rate": 0.0001358567385261161, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021566458690293195, + "loss": 0.0165, "step": 216900 }, { - "epoch": 1.09, - "learning_rate": 0.0001358491708331021, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.0002156606986865605, + "loss": 0.0176, "step": 216910 }, { - "epoch": 1.09, - "learning_rate": 0.00013584160314008807, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.000215656810470189, + "loss": 0.0151, "step": 216920 }, { - "epoch": 1.09, - "learning_rate": 0.00013583403544707406, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021565292225381757, + "loss": 0.0121, "step": 216930 }, { - "epoch": 1.09, - "learning_rate": 0.00013582646775406006, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.0002156490340374461, + "loss": 0.0157, "step": 216940 }, { - "epoch": 1.09, - "learning_rate": 0.00013581890006104605, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.00021564514582107463, + "loss": 0.0154, "step": 216950 }, { - "epoch": 1.09, - "learning_rate": 0.00013581133236803203, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021564125760470314, + "loss": 0.0197, "step": 216960 }, { - "epoch": 1.09, - "learning_rate": 0.00013580376467501804, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.0002156373693883317, + "loss": 0.0195, "step": 216970 }, { - "epoch": 1.09, - "learning_rate": 0.00013579619698200402, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.00021563348117196025, + "loss": 0.016, "step": 216980 }, { - "epoch": 1.09, - "learning_rate": 0.00013578862928899, - "loss": 0.0122, + "epoch": 0.56, + "learning_rate": 0.00021562959295558877, + "loss": 0.0164, "step": 216990 }, { - "epoch": 1.09, - "learning_rate": 0.000135781061595976, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.0002156257047392173, + "loss": 0.0129, "step": 217000 }, { - "epoch": 1.09, - "eval_cer": 0.9144741374876638, - "eval_loss": 0.007423856761306524, - "eval_runtime": 116.6037, - "eval_samples_per_second": 17.152, - "eval_steps_per_second": 4.288, + "epoch": 0.56, + "eval_cer": 0.8817432757942589, + "eval_loss": 0.011607037857174873, + "eval_runtime": 107.7722, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.639, "step": 217000 }, { - "epoch": 1.09, - "learning_rate": 0.000135773493902962, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.00021562181652284585, + "loss": 0.0165, "step": 217010 }, { - "epoch": 1.09, - "learning_rate": 0.00013576592620994797, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002156179283064744, + "loss": 0.0174, "step": 217020 }, { - "epoch": 1.09, - "learning_rate": 0.00013575835851693398, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.0002156140400901029, + "loss": 0.0235, "step": 217030 }, { - "epoch": 1.09, - "learning_rate": 0.00013575079082391996, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021561015187373145, + "loss": 0.0158, "step": 217040 }, { - "epoch": 1.1, - "learning_rate": 0.00013574322313090594, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.00021560626365736, + "loss": 0.0167, "step": 217050 }, { - "epoch": 1.1, - "learning_rate": 0.00013573565543789195, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021560237544098853, + "loss": 0.017, "step": 217060 }, { - "epoch": 1.1, - "learning_rate": 0.00013572808774487793, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021559848722461705, + "loss": 0.0194, "step": 217070 }, { - "epoch": 1.1, - "learning_rate": 0.0001357205200518639, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.0002155945990082456, + "loss": 0.0157, "step": 217080 }, { - "epoch": 1.1, - "learning_rate": 0.00013571295235884992, - "loss": 0.0072, + "epoch": 0.56, + "learning_rate": 0.00021559071079187413, + "loss": 0.0183, "step": 217090 }, { - "epoch": 1.1, - "learning_rate": 0.0001357053846658359, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021558682257550267, + "loss": 0.0169, "step": 217100 }, { - "epoch": 1.1, - "learning_rate": 0.00013569781697282188, - "loss": 0.0097, + "epoch": 0.56, + "learning_rate": 0.0002155829343591312, + "loss": 0.0164, "step": 217110 }, { - "epoch": 1.1, - "learning_rate": 0.00013569024927980787, - "loss": 0.0078, + "epoch": 0.56, + "learning_rate": 0.00021557904614275973, + "loss": 0.017, "step": 217120 }, { - "epoch": 1.1, - "learning_rate": 0.00013568268158679385, - "loss": 0.0118, + "epoch": 0.56, + "learning_rate": 0.00021557515792638824, + "loss": 0.0141, "step": 217130 }, { - "epoch": 1.1, - "learning_rate": 0.00013567511389377983, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.0002155712697100168, + "loss": 0.0162, "step": 217140 }, { - "epoch": 1.1, - "learning_rate": 0.00013566754620076584, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021556738149364535, + "loss": 0.0151, "step": 217150 }, { - "epoch": 1.1, - "learning_rate": 0.00013565997850775182, - "loss": 0.0102, + "epoch": 0.56, + "learning_rate": 0.00021556349327727387, + "loss": 0.0174, "step": 217160 }, { - "epoch": 1.1, - "learning_rate": 0.0001356524108147378, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.00021555960506090238, + "loss": 0.0167, "step": 217170 }, { - "epoch": 1.1, - "learning_rate": 0.0001356448431217238, - "loss": 0.0079, + "epoch": 0.56, + "learning_rate": 0.00021555571684453095, + "loss": 0.0148, "step": 217180 }, { - "epoch": 1.1, - "learning_rate": 0.0001356372754287098, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.0002155518286281595, + "loss": 0.0151, "step": 217190 }, { - "epoch": 1.1, - "learning_rate": 0.00013562970773569577, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.000215547940411788, + "loss": 0.0167, "step": 217200 }, { - "epoch": 1.1, - "learning_rate": 0.00013562214004268178, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021554405219541655, + "loss": 0.0209, "step": 217210 }, { - "epoch": 1.1, - "learning_rate": 0.00013561457234966776, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.0002155401639790451, + "loss": 0.0179, "step": 217220 }, { - "epoch": 1.1, - "learning_rate": 0.00013560700465665374, - "loss": 0.0133, + "epoch": 0.56, + "learning_rate": 0.00021553627576267363, + "loss": 0.018, "step": 217230 }, { - "epoch": 1.1, - "learning_rate": 0.00013559943696363975, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021553238754630215, + "loss": 0.0174, "step": 217240 }, { - "epoch": 1.1, - "learning_rate": 0.00013559186927062573, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.0002155284993299307, + "loss": 0.0145, "step": 217250 }, { - "epoch": 1.1, - "learning_rate": 0.00013558430157761171, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021552461111355923, + "loss": 0.0149, "step": 217260 }, { - "epoch": 1.1, - "learning_rate": 0.00013557673388459772, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021552072289718777, + "loss": 0.0172, "step": 217270 }, { - "epoch": 1.1, - "learning_rate": 0.0001355691661915837, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.0002155168346808163, + "loss": 0.0215, "step": 217280 }, { - "epoch": 1.1, - "learning_rate": 0.00013556159849856969, - "loss": 0.0069, + "epoch": 0.56, + "learning_rate": 0.00021551294646444483, + "loss": 0.02, "step": 217290 }, { - "epoch": 1.1, - "learning_rate": 0.00013555403080555567, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002155090582480734, + "loss": 0.0152, "step": 217300 }, { - "epoch": 1.1, - "learning_rate": 0.00013554646311254168, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.0002155051700317019, + "loss": 0.0184, "step": 217310 }, { - "epoch": 1.1, - "learning_rate": 0.00013553889541952766, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021550128181533045, + "loss": 0.0154, "step": 217320 }, { - "epoch": 1.1, - "learning_rate": 0.00013553132772651364, - "loss": 0.0092, + "epoch": 0.56, + "learning_rate": 0.00021549739359895897, + "loss": 0.0168, "step": 217330 }, { - "epoch": 1.1, - "learning_rate": 0.00013552376003349965, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021549350538258754, + "loss": 0.0238, "step": 217340 }, { - "epoch": 1.1, - "learning_rate": 0.00013551619234048563, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.00021548961716621605, + "loss": 0.0175, "step": 217350 }, { - "epoch": 1.1, - "learning_rate": 0.0001355086246474716, - "loss": 0.0086, + "epoch": 0.56, + "learning_rate": 0.0002154857289498446, + "loss": 0.0177, "step": 217360 }, { - "epoch": 1.1, - "learning_rate": 0.00013550105695445762, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002154818407334731, + "loss": 0.0164, "step": 217370 }, { - "epoch": 1.1, - "learning_rate": 0.0001354934892614436, - "loss": 0.0083, + "epoch": 0.56, + "learning_rate": 0.00021547795251710165, + "loss": 0.0156, "step": 217380 }, { - "epoch": 1.1, - "learning_rate": 0.00013548592156842958, - "loss": 0.007, + "epoch": 0.56, + "learning_rate": 0.0002154740643007302, + "loss": 0.0146, "step": 217390 }, { - "epoch": 1.1, - "learning_rate": 0.0001354783538754156, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021547017608435873, + "loss": 0.0162, "step": 217400 }, { - "epoch": 1.1, - "learning_rate": 0.00013547078618240157, - "loss": 0.0085, + "epoch": 0.56, + "learning_rate": 0.00021546628786798725, + "loss": 0.0151, "step": 217410 }, { - "epoch": 1.1, - "learning_rate": 0.00013546321848938755, - "loss": 0.0073, + "epoch": 0.56, + "learning_rate": 0.0002154623996516158, + "loss": 0.0173, "step": 217420 }, { - "epoch": 1.1, - "learning_rate": 0.00013545565079637356, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.00021545851143524433, + "loss": 0.0197, "step": 217430 }, { - "epoch": 1.1, - "learning_rate": 0.00013544808310335954, - "loss": 0.0106, + "epoch": 0.56, + "learning_rate": 0.00021545462321887287, + "loss": 0.0146, "step": 217440 }, { - "epoch": 1.1, - "learning_rate": 0.00013544051541034552, - "loss": 0.0093, + "epoch": 0.56, + "learning_rate": 0.00021545073500250139, + "loss": 0.0147, "step": 217450 }, { - "epoch": 1.1, - "learning_rate": 0.0001354329477173315, - "loss": 0.0114, + "epoch": 0.56, + "learning_rate": 0.00021544684678612993, + "loss": 0.0187, "step": 217460 }, { - "epoch": 1.1, - "learning_rate": 0.00013542538002431751, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.0002154429585697585, + "loss": 0.0134, "step": 217470 }, { - "epoch": 1.1, - "learning_rate": 0.0001354178123313035, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.000215439070353387, + "loss": 0.0157, "step": 217480 }, { - "epoch": 1.1, - "learning_rate": 0.00013541024463828948, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021543518213701553, + "loss": 0.0159, "step": 217490 }, { - "epoch": 1.1, - "learning_rate": 0.00013540267694527549, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021543129392064407, + "loss": 0.0148, "step": 217500 }, { - "epoch": 1.1, - "learning_rate": 0.00013539510925226147, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021542740570427264, + "loss": 0.0175, "step": 217510 }, { - "epoch": 1.1, - "learning_rate": 0.00013538754155924745, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021542351748790115, + "loss": 0.0139, "step": 217520 }, { - "epoch": 1.1, - "learning_rate": 0.00013537997386623346, - "loss": 0.0128, + "epoch": 0.56, + "learning_rate": 0.0002154196292715297, + "loss": 0.0183, "step": 217530 }, { - "epoch": 1.1, - "learning_rate": 0.00013537240617321944, - "loss": 0.0082, + "epoch": 0.56, + "learning_rate": 0.0002154157410551582, + "loss": 0.02, "step": 217540 }, { - "epoch": 1.1, - "learning_rate": 0.00013536483848020542, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021541185283878678, + "loss": 0.0161, "step": 217550 }, { - "epoch": 1.1, - "learning_rate": 0.00013535727078719143, - "loss": 0.0124, + "epoch": 0.56, + "learning_rate": 0.0002154079646224153, + "loss": 0.0159, "step": 217560 }, { - "epoch": 1.1, - "learning_rate": 0.0001353497030941774, - "loss": 0.0071, + "epoch": 0.56, + "learning_rate": 0.00021540407640604383, + "loss": 0.0162, "step": 217570 }, { - "epoch": 1.1, - "learning_rate": 0.0001353421354011634, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021540018818967235, + "loss": 0.0136, "step": 217580 }, { - "epoch": 1.1, - "learning_rate": 0.0001353345677081494, - "loss": 0.0128, + "epoch": 0.56, + "learning_rate": 0.0002153962999733009, + "loss": 0.0209, "step": 217590 }, { - "epoch": 1.1, - "learning_rate": 0.00013532700001513538, - "loss": 0.0081, + "epoch": 0.56, + "learning_rate": 0.00021539241175692943, + "loss": 0.0162, "step": 217600 }, { - "epoch": 1.1, - "learning_rate": 0.00013531943232212136, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.00021538852354055797, + "loss": 0.0188, "step": 217610 }, { - "epoch": 1.1, - "learning_rate": 0.00013531186462910737, - "loss": 0.0084, + "epoch": 0.56, + "learning_rate": 0.00021538463532418649, + "loss": 0.0204, "step": 217620 }, { - "epoch": 1.1, - "learning_rate": 0.00013530429693609335, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021538074710781503, + "loss": 0.017, "step": 217630 }, { - "epoch": 1.1, - "learning_rate": 0.00013529672924307933, - "loss": 0.0095, + "epoch": 0.56, + "learning_rate": 0.00021537685889144357, + "loss": 0.0159, "step": 217640 }, { - "epoch": 1.1, - "learning_rate": 0.00013528916155006532, - "loss": 0.0091, + "epoch": 0.56, + "learning_rate": 0.0002153729706750721, + "loss": 0.0187, "step": 217650 }, { - "epoch": 1.1, - "learning_rate": 0.00013528159385705132, - "loss": 0.0094, + "epoch": 0.56, + "learning_rate": 0.00021536908245870062, + "loss": 0.0166, "step": 217660 }, { - "epoch": 1.1, - "learning_rate": 0.0001352740261640373, - "loss": 0.0109, + "epoch": 0.56, + "learning_rate": 0.00021536519424232917, + "loss": 0.0184, "step": 217670 }, { - "epoch": 1.1, - "learning_rate": 0.0001352664584710233, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.00021536130602595774, + "loss": 0.0187, "step": 217680 }, { - "epoch": 1.1, - "learning_rate": 0.0001352588907780093, - "loss": 0.01, + "epoch": 0.56, + "learning_rate": 0.00021535741780958625, + "loss": 0.0211, "step": 217690 }, { - "epoch": 1.1, - "learning_rate": 0.00013525132308499528, - "loss": 0.009, + "epoch": 0.56, + "learning_rate": 0.0002153535295932148, + "loss": 0.0223, "step": 217700 }, { - "epoch": 1.1, - "learning_rate": 0.00013524375539198126, - "loss": 0.0098, + "epoch": 0.56, + "learning_rate": 0.0002153496413768433, + "loss": 0.0299, "step": 217710 }, { - "epoch": 1.1, - "learning_rate": 0.00013523618769896727, - "loss": 0.0101, + "epoch": 0.56, + "learning_rate": 0.00021534575316047187, + "loss": 0.021, "step": 217720 }, { - "epoch": 1.1, - "learning_rate": 0.00013522862000595325, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.0002153418649441004, + "loss": 0.0138, "step": 217730 }, { - "epoch": 1.1, - "learning_rate": 0.00013522105231293923, - "loss": 0.0077, + "epoch": 0.56, + "learning_rate": 0.00021533797672772893, + "loss": 0.0155, "step": 217740 }, { - "epoch": 1.1, - "learning_rate": 0.00013521348461992524, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021533408851135745, + "loss": 0.0154, "step": 217750 }, { - "epoch": 1.1, - "learning_rate": 0.0001352059169269112, - "loss": 0.0074, + "epoch": 0.56, + "learning_rate": 0.00021533020029498601, + "loss": 0.0165, "step": 217760 }, { - "epoch": 1.1, - "learning_rate": 0.0001351983492338972, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.00021532631207861453, + "loss": 0.0183, "step": 217770 }, { - "epoch": 1.1, - "learning_rate": 0.00013519078154088318, - "loss": 0.0108, + "epoch": 0.56, + "learning_rate": 0.00021532242386224307, + "loss": 0.0151, "step": 217780 }, { - "epoch": 1.1, - "learning_rate": 0.00013518321384786916, - "loss": 0.0096, + "epoch": 0.56, + "learning_rate": 0.00021531853564587158, + "loss": 0.0171, "step": 217790 }, { - "epoch": 1.1, - "learning_rate": 0.00013517564615485517, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021531464742950015, + "loss": 0.0183, "step": 217800 }, { - "epoch": 1.1, - "learning_rate": 0.00013516807846184115, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021531075921312867, + "loss": 0.0176, "step": 217810 }, { - "epoch": 1.1, - "learning_rate": 0.00013516051076882714, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.0002153068709967572, + "loss": 0.0161, "step": 217820 }, { - "epoch": 1.1, - "learning_rate": 0.00013515294307581312, - "loss": 0.0188, + "epoch": 0.56, + "learning_rate": 0.00021530298278038572, + "loss": 0.014, "step": 217830 }, { - "epoch": 1.1, - "learning_rate": 0.00013514537538279913, - "loss": 0.0099, + "epoch": 0.56, + "learning_rate": 0.00021529909456401427, + "loss": 0.0134, "step": 217840 }, { - "epoch": 1.1, - "learning_rate": 0.0001351378076897851, - "loss": 0.0119, + "epoch": 0.56, + "learning_rate": 0.00021529520634764283, + "loss": 0.0169, "step": 217850 }, { - "epoch": 1.1, - "learning_rate": 0.0001351302399967711, - "loss": 0.0089, + "epoch": 0.56, + "learning_rate": 0.00021529131813127135, + "loss": 0.0183, "step": 217860 }, { - "epoch": 1.1, - "learning_rate": 0.0001351226723037571, - "loss": 0.0105, + "epoch": 0.56, + "learning_rate": 0.0002152874299148999, + "loss": 0.0251, "step": 217870 }, { - "epoch": 1.1, - "learning_rate": 0.00013511510461074308, - "loss": 0.0073, + "epoch": 0.56, + "learning_rate": 0.0002152835416985284, + "loss": 0.0201, "step": 217880 }, { - "epoch": 1.1, - "learning_rate": 0.00013510753691772906, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021527965348215697, + "loss": 0.0177, "step": 217890 }, { - "epoch": 1.1, - "learning_rate": 0.00013509996922471507, - "loss": 0.011, + "epoch": 0.56, + "learning_rate": 0.0002152757652657855, + "loss": 0.0168, "step": 217900 }, { - "epoch": 1.1, - "learning_rate": 0.00013509240153170105, - "loss": 0.0088, + "epoch": 0.56, + "learning_rate": 0.00021527187704941403, + "loss": 0.0141, "step": 217910 }, { - "epoch": 1.1, - "learning_rate": 0.00013508483383868703, - "loss": 0.0103, + "epoch": 0.56, + "learning_rate": 0.00021526798883304254, + "loss": 0.0157, "step": 217920 }, { - "epoch": 1.1, - "learning_rate": 0.00013507726614567304, - "loss": 0.008, + "epoch": 0.56, + "learning_rate": 0.00021526410061667111, + "loss": 0.0162, "step": 217930 }, { - "epoch": 1.1, - "learning_rate": 0.00013506969845265902, - "loss": 0.0104, + "epoch": 0.56, + "learning_rate": 0.00021526021240029963, + "loss": 0.0155, "step": 217940 }, { - "epoch": 1.1, - "learning_rate": 0.000135062130759645, - "loss": 0.0087, + "epoch": 0.56, + "learning_rate": 0.00021525632418392817, + "loss": 0.0151, "step": 217950 }, { - "epoch": 1.1, - "learning_rate": 0.000135054563066631, - "loss": 0.0111, + "epoch": 0.56, + "learning_rate": 0.00021525243596755668, + "loss": 0.0183, "step": 217960 }, { - "epoch": 1.1, - "learning_rate": 0.000135046995373617, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021524854775118525, + "loss": 0.0192, "step": 217970 }, { - "epoch": 1.1, - "learning_rate": 0.00013503942768060297, - "loss": 0.0133, + "epoch": 0.57, + "learning_rate": 0.00021524465953481377, + "loss": 0.0186, "step": 217980 }, { - "epoch": 1.1, - "learning_rate": 0.00013503185998758898, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.0002152407713184423, + "loss": 0.017, "step": 217990 }, { - "epoch": 1.1, - "learning_rate": 0.00013502429229457496, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021523688310207082, + "loss": 0.0165, "step": 218000 }, { - "epoch": 1.1, - "eval_cer": 0.9144867526372941, - "eval_loss": 0.006999760400503874, - "eval_runtime": 116.2125, - "eval_samples_per_second": 17.21, - "eval_steps_per_second": 4.302, + "epoch": 0.57, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.011108589358627796, + "eval_runtime": 107.5987, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 218000 }, { - "epoch": 1.1, - "learning_rate": 0.00013501672460156095, - "loss": 0.0123, + "epoch": 0.57, + "learning_rate": 0.0002152329948856994, + "loss": 0.0141, "step": 218010 }, { - "epoch": 1.1, - "learning_rate": 0.00013500915690854693, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021522910666932793, + "loss": 0.0193, "step": 218020 }, { - "epoch": 1.1, - "learning_rate": 0.00013500158921553294, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021522521845295645, + "loss": 0.0171, "step": 218030 }, { - "epoch": 1.1, - "learning_rate": 0.00013499402152251892, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.000215221330236585, + "loss": 0.0147, "step": 218040 }, { - "epoch": 1.1, - "learning_rate": 0.0001349864538295049, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021521744202021353, + "loss": 0.0178, "step": 218050 }, { - "epoch": 1.1, - "learning_rate": 0.0001349788861364909, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021521355380384207, + "loss": 0.0191, "step": 218060 }, { - "epoch": 1.1, - "learning_rate": 0.0001349713184434769, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.0002152096655874706, + "loss": 0.0162, "step": 218070 }, { - "epoch": 1.1, - "learning_rate": 0.00013496375075046287, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021520577737109913, + "loss": 0.0183, "step": 218080 }, { - "epoch": 1.1, - "learning_rate": 0.00013495618305744888, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021520188915472764, + "loss": 0.0162, "step": 218090 }, { - "epoch": 1.1, - "learning_rate": 0.00013494861536443486, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.0002151980009383562, + "loss": 0.0168, "step": 218100 }, { - "epoch": 1.1, - "learning_rate": 0.00013494104767142084, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021519411272198473, + "loss": 0.0159, "step": 218110 }, { - "epoch": 1.1, - "learning_rate": 0.00013493347997840685, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021519022450561327, + "loss": 0.0161, "step": 218120 }, { - "epoch": 1.1, - "learning_rate": 0.00013492591228539283, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.00021518633628924178, + "loss": 0.0159, "step": 218130 }, { - "epoch": 1.1, - "learning_rate": 0.0001349183445923788, - "loss": 0.0129, + "epoch": 0.57, + "learning_rate": 0.00021518244807287035, + "loss": 0.0128, "step": 218140 }, { - "epoch": 1.1, - "learning_rate": 0.00013491077689936482, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021517855985649887, + "loss": 0.0141, "step": 218150 }, { - "epoch": 1.1, - "learning_rate": 0.0001349032092063508, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002151746716401274, + "loss": 0.0129, "step": 218160 }, { - "epoch": 1.1, - "learning_rate": 0.00013489564151333678, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021517078342375592, + "loss": 0.0138, "step": 218170 }, { - "epoch": 1.1, - "learning_rate": 0.00013488807382032277, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002151668952073845, + "loss": 0.0182, "step": 218180 }, { - "epoch": 1.1, - "learning_rate": 0.00013488050612730877, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021516300699101303, + "loss": 0.0135, "step": 218190 }, { - "epoch": 1.1, - "learning_rate": 0.00013487293843429476, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021515911877464155, + "loss": 0.019, "step": 218200 }, { - "epoch": 1.1, - "learning_rate": 0.00013486537074128074, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021515523055827006, + "loss": 0.0143, "step": 218210 }, { - "epoch": 1.1, - "learning_rate": 0.00013485780304826675, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.00021515134234189863, + "loss": 0.02, "step": 218220 }, { - "epoch": 1.1, - "learning_rate": 0.00013485023535525273, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021514745412552717, + "loss": 0.0185, "step": 218230 }, { - "epoch": 1.1, - "learning_rate": 0.0001348426676622387, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.0002151435659091557, + "loss": 0.0191, "step": 218240 }, { - "epoch": 1.1, - "learning_rate": 0.00013483509996922472, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021513967769278423, + "loss": 0.0146, "step": 218250 }, { - "epoch": 1.1, - "learning_rate": 0.0001348275322762107, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021513578947641277, + "loss": 0.0168, "step": 218260 }, { - "epoch": 1.1, - "learning_rate": 0.00013481996458319668, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.0002151319012600413, + "loss": 0.0172, "step": 218270 }, { - "epoch": 1.1, - "learning_rate": 0.0001348123968901827, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021512801304366983, + "loss": 0.0158, "step": 218280 }, { - "epoch": 1.1, - "learning_rate": 0.00013480482919716867, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021512412482729837, + "loss": 0.0167, "step": 218290 }, { - "epoch": 1.1, - "learning_rate": 0.00013479726150415465, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002151202366109269, + "loss": 0.0159, "step": 218300 }, { - "epoch": 1.1, - "learning_rate": 0.00013478969381114066, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021511634839455545, + "loss": 0.0157, "step": 218310 }, { - "epoch": 1.1, - "learning_rate": 0.00013478212611812664, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021511246017818397, + "loss": 0.0123, "step": 218320 }, { - "epoch": 1.1, - "learning_rate": 0.00013477455842511262, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002151085719618125, + "loss": 0.0163, "step": 218330 }, { - "epoch": 1.1, - "learning_rate": 0.0001347669907320986, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.00021510468374544102, + "loss": 0.0146, "step": 218340 }, { - "epoch": 1.1, - "learning_rate": 0.0001347594230390846, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.0002151007955290696, + "loss": 0.0212, "step": 218350 }, { - "epoch": 1.1, - "learning_rate": 0.0001347518553460706, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.0002150969073126981, + "loss": 0.0174, "step": 218360 }, { - "epoch": 1.1, - "learning_rate": 0.00013474428765305658, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021509301909632665, + "loss": 0.0143, "step": 218370 }, { - "epoch": 1.1, - "learning_rate": 0.00013473671996004258, - "loss": 0.014, + "epoch": 0.57, + "learning_rate": 0.00021508913087995516, + "loss": 0.0175, "step": 218380 }, { - "epoch": 1.1, - "learning_rate": 0.00013472915226702854, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021508524266358373, + "loss": 0.017, "step": 218390 }, { - "epoch": 1.1, - "learning_rate": 0.00013472158457401455, - "loss": 0.0139, + "epoch": 0.57, + "learning_rate": 0.00021508135444721227, + "loss": 0.013, "step": 218400 }, { - "epoch": 1.1, - "learning_rate": 0.00013471401688100053, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.0002150774662308408, + "loss": 0.0179, "step": 218410 }, { - "epoch": 1.1, - "learning_rate": 0.0001347064491879865, - "loss": 0.0074, + "epoch": 0.57, + "learning_rate": 0.00021507357801446933, + "loss": 0.0142, "step": 218420 }, { - "epoch": 1.1, - "learning_rate": 0.00013469888149497252, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021506968979809787, + "loss": 0.0175, "step": 218430 }, { - "epoch": 1.1, - "learning_rate": 0.0001346913138019585, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.0002150658015817264, + "loss": 0.0183, "step": 218440 }, { - "epoch": 1.1, - "learning_rate": 0.00013468374610894448, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021506191336535493, + "loss": 0.0201, "step": 218450 }, { - "epoch": 1.1, - "learning_rate": 0.0001346761784159305, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021505802514898347, + "loss": 0.0169, "step": 218460 }, { - "epoch": 1.1, - "learning_rate": 0.00013466861072291647, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.000215054136932612, + "loss": 0.0195, "step": 218470 }, { - "epoch": 1.1, - "learning_rate": 0.00013466104302990245, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021505024871624055, + "loss": 0.015, "step": 218480 }, { - "epoch": 1.1, - "learning_rate": 0.00013465347533688846, - "loss": 0.0127, + "epoch": 0.57, + "learning_rate": 0.00021504636049986907, + "loss": 0.0174, "step": 218490 }, { - "epoch": 1.1, - "learning_rate": 0.00013464590764387444, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.0002150424722834976, + "loss": 0.022, "step": 218500 }, { - "epoch": 1.1, - "learning_rate": 0.00013463833995086042, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021503858406712618, + "loss": 0.0162, "step": 218510 }, { - "epoch": 1.1, - "learning_rate": 0.00013463077225784643, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.0002150346958507547, + "loss": 0.0161, "step": 218520 }, { - "epoch": 1.1, - "learning_rate": 0.00013462320456483241, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002150308076343832, + "loss": 0.0162, "step": 218530 }, { - "epoch": 1.1, - "learning_rate": 0.0001346156368718184, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.00021502691941801175, + "loss": 0.0142, "step": 218540 }, { - "epoch": 1.1, - "learning_rate": 0.00013460806917880438, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021502303120164032, + "loss": 0.0183, "step": 218550 }, { - "epoch": 1.1, - "learning_rate": 0.00013460050148579039, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021501914298526883, + "loss": 0.02, "step": 218560 }, { - "epoch": 1.1, - "learning_rate": 0.00013459293379277637, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.00021501525476889737, + "loss": 0.0216, "step": 218570 }, { - "epoch": 1.1, - "learning_rate": 0.00013458536609976235, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021501136655252589, + "loss": 0.0168, "step": 218580 }, { - "epoch": 1.1, - "learning_rate": 0.00013457779840674836, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021500747833615443, + "loss": 0.0164, "step": 218590 }, { - "epoch": 1.1, - "learning_rate": 0.00013457023071373434, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021500359011978297, + "loss": 0.0165, "step": 218600 }, { - "epoch": 1.1, - "learning_rate": 0.00013456266302072032, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.0002149997019034115, + "loss": 0.0116, "step": 218610 }, { - "epoch": 1.1, - "learning_rate": 0.00013455509532770633, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021499581368704003, + "loss": 0.0143, "step": 218620 }, { - "epoch": 1.1, - "learning_rate": 0.0001345475276346923, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021499192547066857, + "loss": 0.0192, "step": 218630 }, { - "epoch": 1.1, - "learning_rate": 0.0001345399599416783, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.0002149880372542971, + "loss": 0.0201, "step": 218640 }, { - "epoch": 1.1, - "learning_rate": 0.0001345323922486643, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.00021498414903792565, + "loss": 0.0153, "step": 218650 }, { - "epoch": 1.1, - "learning_rate": 0.00013452482455565028, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021498026082155417, + "loss": 0.0197, "step": 218660 }, { - "epoch": 1.1, - "learning_rate": 0.00013451725686263626, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002149763726051827, + "loss": 0.017, "step": 218670 }, { - "epoch": 1.1, - "learning_rate": 0.00013450968916962227, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021497248438881125, + "loss": 0.0166, "step": 218680 }, { - "epoch": 1.1, - "learning_rate": 0.00013450212147660825, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.0002149685961724398, + "loss": 0.0217, "step": 218690 }, { - "epoch": 1.1, - "learning_rate": 0.00013449455378359423, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.0002149647079560683, + "loss": 0.0192, "step": 218700 }, { - "epoch": 1.1, - "learning_rate": 0.00013448698609058022, - "loss": 0.0128, + "epoch": 0.57, + "learning_rate": 0.00021496081973969685, + "loss": 0.0217, "step": 218710 }, { - "epoch": 1.1, - "learning_rate": 0.00013447941839756622, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021495693152332542, + "loss": 0.0168, "step": 218720 }, { - "epoch": 1.1, - "learning_rate": 0.0001344718507045522, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021495304330695393, + "loss": 0.0155, "step": 218730 }, { - "epoch": 1.1, - "learning_rate": 0.0001344642830115382, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021494915509058247, + "loss": 0.0147, "step": 218740 }, { - "epoch": 1.1, - "learning_rate": 0.0001344567153185242, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021494526687421099, + "loss": 0.0182, "step": 218750 }, { - "epoch": 1.1, - "learning_rate": 0.00013444914762551018, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.00021494137865783955, + "loss": 0.0183, "step": 218760 }, { - "epoch": 1.1, - "learning_rate": 0.00013444157993249616, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021493749044146807, + "loss": 0.0177, "step": 218770 }, { - "epoch": 1.1, - "learning_rate": 0.00013443401223948217, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002149336022250966, + "loss": 0.0176, "step": 218780 }, { - "epoch": 1.1, - "learning_rate": 0.00013442644454646815, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021492971400872513, + "loss": 0.0195, "step": 218790 }, { - "epoch": 1.1, - "learning_rate": 0.00013441887685345413, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002149258257923537, + "loss": 0.0147, "step": 218800 }, { - "epoch": 1.1, - "learning_rate": 0.00013441130916044014, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002149219375759822, + "loss": 0.0178, "step": 218810 }, { - "epoch": 1.1, - "learning_rate": 0.00013440374146742612, - "loss": 0.0119, + "epoch": 0.57, + "learning_rate": 0.00021491804935961075, + "loss": 0.0161, "step": 218820 }, { - "epoch": 1.1, - "learning_rate": 0.0001343961737744121, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021491416114323926, + "loss": 0.0165, "step": 218830 }, { - "epoch": 1.1, - "learning_rate": 0.0001343886060813981, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.0002149102729268678, + "loss": 0.0242, "step": 218840 }, { - "epoch": 1.1, - "learning_rate": 0.0001343810383883841, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.00021490638471049635, + "loss": 0.0185, "step": 218850 }, { - "epoch": 1.1, - "learning_rate": 0.00013437347069537007, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.0002149024964941249, + "loss": 0.0172, "step": 218860 }, { - "epoch": 1.1, - "learning_rate": 0.00013436590300235605, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002148986082777534, + "loss": 0.0164, "step": 218870 }, { - "epoch": 1.1, - "learning_rate": 0.00013435833530934206, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021489472006138195, + "loss": 0.0172, "step": 218880 }, { - "epoch": 1.1, - "learning_rate": 0.00013435076761632804, - "loss": 0.0072, + "epoch": 0.57, + "learning_rate": 0.00021489083184501051, + "loss": 0.0194, "step": 218890 }, { - "epoch": 1.1, - "learning_rate": 0.00013434319992331403, - "loss": 0.0123, + "epoch": 0.57, + "learning_rate": 0.00021488694362863903, + "loss": 0.0205, "step": 218900 }, { - "epoch": 1.1, - "learning_rate": 0.00013433563223030003, - "loss": 0.0066, + "epoch": 0.57, + "learning_rate": 0.00021488305541226757, + "loss": 0.0191, "step": 218910 }, { - "epoch": 1.1, - "learning_rate": 0.00013432806453728602, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021487916719589609, + "loss": 0.0147, "step": 218920 }, { - "epoch": 1.1, - "learning_rate": 0.000134320496844272, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021487527897952465, + "loss": 0.0144, "step": 218930 }, { - "epoch": 1.1, - "learning_rate": 0.000134312929151258, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021487139076315317, + "loss": 0.0179, "step": 218940 }, { - "epoch": 1.1, - "learning_rate": 0.000134305361458244, - "loss": 0.0115, + "epoch": 0.57, + "learning_rate": 0.0002148675025467817, + "loss": 0.018, "step": 218950 }, { - "epoch": 1.1, - "learning_rate": 0.00013429779376522997, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021486361433041022, + "loss": 0.0157, "step": 218960 }, { - "epoch": 1.1, - "learning_rate": 0.00013429022607221598, - "loss": 0.0127, + "epoch": 0.57, + "learning_rate": 0.0002148597261140388, + "loss": 0.0165, "step": 218970 }, { - "epoch": 1.1, - "learning_rate": 0.00013428265837920196, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.0002148558378976673, + "loss": 0.0161, "step": 218980 }, { - "epoch": 1.1, - "learning_rate": 0.00013427509068618794, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021485194968129585, + "loss": 0.0162, "step": 218990 }, { - "epoch": 1.1, - "learning_rate": 0.00013426752299317395, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021484806146492436, + "loss": 0.019, "step": 219000 }, { - "epoch": 1.1, - "eval_cer": 0.9144799598644162, - "eval_loss": 0.007354082074016333, - "eval_runtime": 116.3343, - "eval_samples_per_second": 17.192, - "eval_steps_per_second": 4.298, + "epoch": 0.57, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.011217095889151096, + "eval_runtime": 107.9572, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.631, "step": 219000 }, { - "epoch": 1.1, - "learning_rate": 0.00013425995530015993, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021484417324855293, + "loss": 0.0152, "step": 219010 }, { - "epoch": 1.1, - "learning_rate": 0.0001342523876071459, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021484028503218145, + "loss": 0.0155, "step": 219020 }, { - "epoch": 1.11, - "learning_rate": 0.0001342448199141319, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021483639681581, + "loss": 0.0171, "step": 219030 }, { - "epoch": 1.11, - "learning_rate": 0.00013423725222111787, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.0002148325085994385, + "loss": 0.0151, "step": 219040 }, { - "epoch": 1.11, - "learning_rate": 0.00013422968452810388, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021482862038306707, + "loss": 0.0145, "step": 219050 }, { - "epoch": 1.11, - "learning_rate": 0.00013422211683508986, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021482473216669561, + "loss": 0.0152, "step": 219060 }, { - "epoch": 1.11, - "learning_rate": 0.00013421454914207585, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021482084395032413, + "loss": 0.0168, "step": 219070 }, { - "epoch": 1.11, - "learning_rate": 0.00013420698144906183, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021481695573395264, + "loss": 0.0165, "step": 219080 }, { - "epoch": 1.11, - "learning_rate": 0.00013419941375604784, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021481306751758118, + "loss": 0.0169, "step": 219090 }, { - "epoch": 1.11, - "learning_rate": 0.00013419184606303382, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021480917930120975, + "loss": 0.0129, "step": 219100 }, { - "epoch": 1.11, - "learning_rate": 0.0001341842783700198, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021480529108483827, + "loss": 0.0174, "step": 219110 }, { - "epoch": 1.11, - "learning_rate": 0.0001341767106770058, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002148014028684668, + "loss": 0.0184, "step": 219120 }, { - "epoch": 1.11, - "learning_rate": 0.0001341691429839918, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021479751465209532, + "loss": 0.0156, "step": 219130 }, { - "epoch": 1.11, - "learning_rate": 0.00013416157529097777, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002147936264357239, + "loss": 0.0159, "step": 219140 }, { - "epoch": 1.11, - "learning_rate": 0.00013415400759796378, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.0002147897382193524, + "loss": 0.0157, "step": 219150 }, { - "epoch": 1.11, - "learning_rate": 0.00013414643990494976, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021478585000298095, + "loss": 0.0145, "step": 219160 }, { - "epoch": 1.11, - "learning_rate": 0.00013413887221193574, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021478196178660946, + "loss": 0.0112, "step": 219170 }, { - "epoch": 1.11, - "learning_rate": 0.00013413130451892175, - "loss": 0.0116, + "epoch": 0.57, + "learning_rate": 0.00021477807357023803, + "loss": 0.0163, "step": 219180 }, { - "epoch": 1.11, - "learning_rate": 0.00013412373682590773, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021477418535386655, + "loss": 0.0149, "step": 219190 }, { - "epoch": 1.11, - "learning_rate": 0.0001341161691328937, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002147702971374951, + "loss": 0.0162, "step": 219200 }, { - "epoch": 1.11, - "learning_rate": 0.00013410860143987972, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002147664089211236, + "loss": 0.0204, "step": 219210 }, { - "epoch": 1.11, - "learning_rate": 0.0001341010337468657, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021476252070475217, + "loss": 0.0149, "step": 219220 }, { - "epoch": 1.11, - "learning_rate": 0.00013409346605385168, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021475863248838069, + "loss": 0.0153, "step": 219230 }, { - "epoch": 1.11, - "learning_rate": 0.00013408589836083767, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021475474427200923, + "loss": 0.0174, "step": 219240 }, { - "epoch": 1.11, - "learning_rate": 0.00013407833066782367, - "loss": 0.0076, + "epoch": 0.57, + "learning_rate": 0.00021475085605563774, + "loss": 0.0177, "step": 219250 }, { - "epoch": 1.11, - "learning_rate": 0.00013407076297480966, - "loss": 0.012, + "epoch": 0.57, + "learning_rate": 0.0002147469678392663, + "loss": 0.0176, "step": 219260 }, { - "epoch": 1.11, - "learning_rate": 0.00013406319528179564, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021474307962289485, + "loss": 0.016, "step": 219270 }, { - "epoch": 1.11, - "learning_rate": 0.00013405562758878165, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.00021473919140652337, + "loss": 0.0185, "step": 219280 }, { - "epoch": 1.11, - "learning_rate": 0.00013404805989576763, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002147353031901519, + "loss": 0.0129, "step": 219290 }, { - "epoch": 1.11, - "learning_rate": 0.0001340404922027536, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021473141497378045, + "loss": 0.0181, "step": 219300 }, { - "epoch": 1.11, - "learning_rate": 0.00013403292450973962, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.000214727526757409, + "loss": 0.0162, "step": 219310 }, { - "epoch": 1.11, - "learning_rate": 0.0001340253568167256, - "loss": 0.0069, + "epoch": 0.57, + "learning_rate": 0.0002147236385410375, + "loss": 0.0182, "step": 219320 }, { - "epoch": 1.11, - "learning_rate": 0.00013401778912371158, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021471975032466605, + "loss": 0.0168, "step": 219330 }, { - "epoch": 1.11, - "learning_rate": 0.0001340102214306976, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021471586210829456, + "loss": 0.0185, "step": 219340 }, { - "epoch": 1.11, - "learning_rate": 0.00013400265373768357, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021471197389192313, + "loss": 0.0162, "step": 219350 }, { - "epoch": 1.11, - "learning_rate": 0.00013399508604466955, - "loss": 0.0071, + "epoch": 0.57, + "learning_rate": 0.00021470808567555165, + "loss": 0.0164, "step": 219360 }, { - "epoch": 1.11, - "learning_rate": 0.00013398751835165556, - "loss": 0.0117, + "epoch": 0.57, + "learning_rate": 0.0002147041974591802, + "loss": 0.016, "step": 219370 }, { - "epoch": 1.11, - "learning_rate": 0.00013397995065864154, - "loss": 0.0129, + "epoch": 0.57, + "learning_rate": 0.0002147003092428087, + "loss": 0.0169, "step": 219380 }, { - "epoch": 1.11, - "learning_rate": 0.00013397238296562752, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021469642102643727, + "loss": 0.0171, "step": 219390 }, { - "epoch": 1.11, - "learning_rate": 0.0001339648152726135, - "loss": 0.0109, + "epoch": 0.57, + "learning_rate": 0.00021469253281006579, + "loss": 0.0209, "step": 219400 }, { - "epoch": 1.11, - "learning_rate": 0.0001339572475795995, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021468864459369433, + "loss": 0.0215, "step": 219410 }, { - "epoch": 1.11, - "learning_rate": 0.0001339496798865855, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.00021468475637732284, + "loss": 0.0136, "step": 219420 }, { - "epoch": 1.11, - "learning_rate": 0.00013394211219357148, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.0002146808681609514, + "loss": 0.0143, "step": 219430 }, { - "epoch": 1.11, - "learning_rate": 0.00013393454450055748, - "loss": 0.0119, + "epoch": 0.57, + "learning_rate": 0.00021467697994457995, + "loss": 0.0159, "step": 219440 }, { - "epoch": 1.11, - "learning_rate": 0.00013392697680754347, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021467309172820847, + "loss": 0.0164, "step": 219450 }, { - "epoch": 1.11, - "learning_rate": 0.00013391940911452945, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.000214669203511837, + "loss": 0.0134, "step": 219460 }, { - "epoch": 1.11, - "learning_rate": 0.00013391184142151546, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021466531529546555, + "loss": 0.0172, "step": 219470 }, { - "epoch": 1.11, - "learning_rate": 0.00013390427372850144, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002146614270790941, + "loss": 0.0196, "step": 219480 }, { - "epoch": 1.11, - "learning_rate": 0.00013389670603548742, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.0002146575388627226, + "loss": 0.0168, "step": 219490 }, { - "epoch": 1.11, - "learning_rate": 0.00013388913834247343, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021465365064635115, + "loss": 0.0168, "step": 219500 }, { - "epoch": 1.11, - "learning_rate": 0.0001338815706494594, - "loss": 0.0128, + "epoch": 0.57, + "learning_rate": 0.0002146497624299797, + "loss": 0.0172, "step": 219510 }, { - "epoch": 1.11, - "learning_rate": 0.0001338740029564454, - "loss": 0.0071, + "epoch": 0.57, + "learning_rate": 0.00021464587421360823, + "loss": 0.0215, "step": 219520 }, { - "epoch": 1.11, - "learning_rate": 0.0001338664352634314, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.00021464198599723675, + "loss": 0.0189, "step": 219530 }, { - "epoch": 1.11, - "learning_rate": 0.00013385886757041738, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.0002146380977808653, + "loss": 0.0185, "step": 219540 }, { - "epoch": 1.11, - "learning_rate": 0.00013385129987740336, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021463420956449383, + "loss": 0.0155, "step": 219550 }, { - "epoch": 1.11, - "learning_rate": 0.00013384373218438937, - "loss": 0.007, + "epoch": 0.57, + "learning_rate": 0.00021463032134812237, + "loss": 0.0189, "step": 219560 }, { - "epoch": 1.11, - "learning_rate": 0.00013383616449137535, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021462643313175089, + "loss": 0.0193, "step": 219570 }, { - "epoch": 1.11, - "learning_rate": 0.00013382859679836133, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.00021462254491537943, + "loss": 0.0165, "step": 219580 }, { - "epoch": 1.11, - "learning_rate": 0.00013382102910534731, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021461865669900794, + "loss": 0.0168, "step": 219590 }, { - "epoch": 1.11, - "learning_rate": 0.00013381346141233332, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.0002146147684826365, + "loss": 0.0152, "step": 219600 }, { - "epoch": 1.11, - "learning_rate": 0.0001338058937193193, - "loss": 0.0128, + "epoch": 0.57, + "learning_rate": 0.00021461088026626505, + "loss": 0.0158, "step": 219610 }, { - "epoch": 1.11, - "learning_rate": 0.00013379832602630529, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.00021460699204989357, + "loss": 0.0169, "step": 219620 }, { - "epoch": 1.11, - "learning_rate": 0.0001337907583332913, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.0002146031038335221, + "loss": 0.0152, "step": 219630 }, { - "epoch": 1.11, - "learning_rate": 0.00013378319064027728, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021459921561715065, + "loss": 0.0156, "step": 219640 }, { - "epoch": 1.11, - "learning_rate": 0.00013377562294726326, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002145953274007792, + "loss": 0.0156, "step": 219650 }, { - "epoch": 1.11, - "learning_rate": 0.00013376805525424924, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.0002145914391844077, + "loss": 0.0188, "step": 219660 }, { - "epoch": 1.11, - "learning_rate": 0.00013376048756123522, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021458755096803625, + "loss": 0.0211, "step": 219670 }, { - "epoch": 1.11, - "learning_rate": 0.00013375291986822123, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.0002145836627516648, + "loss": 0.0168, "step": 219680 }, { - "epoch": 1.11, - "learning_rate": 0.0001337453521752072, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021457977453529333, + "loss": 0.0209, "step": 219690 }, { - "epoch": 1.11, - "learning_rate": 0.0001337377844821932, - "loss": 0.012, + "epoch": 0.57, + "learning_rate": 0.00021457588631892185, + "loss": 0.0131, "step": 219700 }, { - "epoch": 1.11, - "learning_rate": 0.0001337302167891792, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002145719981025504, + "loss": 0.0164, "step": 219710 }, { - "epoch": 1.11, - "learning_rate": 0.00013372264909616518, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021456810988617893, + "loss": 0.0163, "step": 219720 }, { - "epoch": 1.11, - "learning_rate": 0.00013371508140315116, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021456422166980747, + "loss": 0.0142, "step": 219730 }, { - "epoch": 1.11, - "learning_rate": 0.00013370751371013717, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021456033345343598, + "loss": 0.0177, "step": 219740 }, { - "epoch": 1.11, - "learning_rate": 0.00013369994601712315, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021455644523706453, + "loss": 0.0147, "step": 219750 }, { - "epoch": 1.11, - "learning_rate": 0.00013369237832410913, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.0002145525570206931, + "loss": 0.0148, "step": 219760 }, { - "epoch": 1.11, - "learning_rate": 0.00013368481063109512, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.0002145486688043216, + "loss": 0.0139, "step": 219770 }, { - "epoch": 1.11, - "learning_rate": 0.00013367724293808112, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021454478058795015, + "loss": 0.0129, "step": 219780 }, { - "epoch": 1.11, - "learning_rate": 0.0001336696752450671, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.00021454089237157867, + "loss": 0.018, "step": 219790 }, { - "epoch": 1.11, - "learning_rate": 0.0001336621075520531, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021453700415520723, + "loss": 0.0174, "step": 219800 }, { - "epoch": 1.11, - "learning_rate": 0.0001336545398590391, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021453311593883575, + "loss": 0.0172, "step": 219810 }, { - "epoch": 1.11, - "learning_rate": 0.00013364697216602508, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002145292277224643, + "loss": 0.0167, "step": 219820 }, { - "epoch": 1.11, - "learning_rate": 0.00013363940447301106, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.0002145253395060928, + "loss": 0.0183, "step": 219830 }, { - "epoch": 1.11, - "learning_rate": 0.00013363183677999707, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.00021452145128972135, + "loss": 0.0179, "step": 219840 }, { - "epoch": 1.11, - "learning_rate": 0.00013362426908698305, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002145175630733499, + "loss": 0.0148, "step": 219850 }, { - "epoch": 1.11, - "learning_rate": 0.00013361670139396903, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021451367485697843, + "loss": 0.0166, "step": 219860 }, { - "epoch": 1.11, - "learning_rate": 0.00013360913370095504, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021450978664060694, + "loss": 0.0178, "step": 219870 }, { - "epoch": 1.11, - "learning_rate": 0.00013360156600794102, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.00021450589842423549, + "loss": 0.0177, "step": 219880 }, { - "epoch": 1.11, - "learning_rate": 0.000133593998314927, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021450201020786403, + "loss": 0.0195, "step": 219890 }, { - "epoch": 1.11, - "learning_rate": 0.000133586430621913, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021449812199149257, + "loss": 0.0133, "step": 219900 }, { - "epoch": 1.11, - "learning_rate": 0.000133578862928899, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021449423377512108, + "loss": 0.015, "step": 219910 }, { - "epoch": 1.11, - "learning_rate": 0.00013357129523588497, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.00021449034555874963, + "loss": 0.0169, "step": 219920 }, { - "epoch": 1.11, - "learning_rate": 0.00013356372754287098, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.0002144864573423782, + "loss": 0.0139, "step": 219930 }, { - "epoch": 1.11, - "learning_rate": 0.00013355615984985696, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.0002144825691260067, + "loss": 0.0149, "step": 219940 }, { - "epoch": 1.11, - "learning_rate": 0.00013354859215684294, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.00021447868090963522, + "loss": 0.0141, "step": 219950 }, { - "epoch": 1.11, - "learning_rate": 0.00013354102446382893, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021447479269326377, + "loss": 0.0193, "step": 219960 }, { - "epoch": 1.11, - "learning_rate": 0.00013353345677081493, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021447090447689233, + "loss": 0.0144, "step": 219970 }, { - "epoch": 1.11, - "learning_rate": 0.00013352588907780092, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021446701626052085, + "loss": 0.0131, "step": 219980 }, { - "epoch": 1.11, - "learning_rate": 0.0001335183213847869, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002144631280441494, + "loss": 0.0141, "step": 219990 }, { - "epoch": 1.11, - "learning_rate": 0.0001335107536917729, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.0002144592398277779, + "loss": 0.0245, "step": 220000 }, { - "epoch": 1.11, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.007259270641952753, - "eval_runtime": 116.3674, - "eval_samples_per_second": 17.187, - "eval_steps_per_second": 4.297, + "epoch": 0.57, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.011034357361495495, + "eval_runtime": 107.3096, + "eval_samples_per_second": 18.638, + "eval_steps_per_second": 4.659, "step": 220000 }, { - "epoch": 1.11, - "learning_rate": 0.0001335031859987589, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021445535161140647, + "loss": 0.0137, "step": 220010 }, { - "epoch": 1.11, - "learning_rate": 0.00013349561830574487, - "loss": 0.0124, + "epoch": 0.57, + "learning_rate": 0.000214451463395035, + "loss": 0.0172, "step": 220020 }, { - "epoch": 1.11, - "learning_rate": 0.00013348805061273088, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021444757517866353, + "loss": 0.0136, "step": 220030 }, { - "epoch": 1.11, - "learning_rate": 0.00013348048291971686, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021444368696229204, + "loss": 0.016, "step": 220040 }, { - "epoch": 1.11, - "learning_rate": 0.00013347291522670284, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002144397987459206, + "loss": 0.0216, "step": 220050 }, { - "epoch": 1.11, - "learning_rate": 0.00013346534753368885, - "loss": 0.0121, + "epoch": 0.57, + "learning_rate": 0.00021443591052954913, + "loss": 0.0157, "step": 220060 }, { - "epoch": 1.11, - "learning_rate": 0.00013345777984067483, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.00021443202231317767, + "loss": 0.0204, "step": 220070 }, { - "epoch": 1.11, - "learning_rate": 0.0001334502121476608, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021442813409680618, + "loss": 0.0219, "step": 220080 }, { - "epoch": 1.11, - "learning_rate": 0.00013344264445464682, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021442424588043472, + "loss": 0.0156, "step": 220090 }, { - "epoch": 1.11, - "learning_rate": 0.0001334350767616328, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.0002144203576640633, + "loss": 0.0173, "step": 220100 }, { - "epoch": 1.11, - "learning_rate": 0.00013342750906861878, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002144164694476918, + "loss": 0.0164, "step": 220110 }, { - "epoch": 1.11, - "learning_rate": 0.00013341994137560476, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021441258123132032, + "loss": 0.0168, "step": 220120 }, { - "epoch": 1.11, - "learning_rate": 0.00013341237368259077, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021440869301494886, + "loss": 0.0161, "step": 220130 }, { - "epoch": 1.11, - "learning_rate": 0.00013340480598957675, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021440480479857743, + "loss": 0.0172, "step": 220140 }, { - "epoch": 1.11, - "learning_rate": 0.00013339723829656274, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021440091658220595, + "loss": 0.0172, "step": 220150 }, { - "epoch": 1.11, - "learning_rate": 0.00013338967060354874, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002143970283658345, + "loss": 0.0171, "step": 220160 }, { - "epoch": 1.11, - "learning_rate": 0.00013338210291053473, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.000214393140149463, + "loss": 0.0181, "step": 220170 }, { - "epoch": 1.11, - "learning_rate": 0.0001333745352175207, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021438925193309157, + "loss": 0.0153, "step": 220180 }, { - "epoch": 1.11, - "learning_rate": 0.00013336696752450672, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002143853637167201, + "loss": 0.015, "step": 220190 }, { - "epoch": 1.11, - "learning_rate": 0.0001333593998314927, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021438147550034863, + "loss": 0.0249, "step": 220200 }, { - "epoch": 1.11, - "learning_rate": 0.00013335183213847868, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021437758728397714, + "loss": 0.0227, "step": 220210 }, { - "epoch": 1.11, - "learning_rate": 0.0001333442644454647, - "loss": 0.0077, + "epoch": 0.57, + "learning_rate": 0.0002143736990676057, + "loss": 0.0157, "step": 220220 }, { - "epoch": 1.11, - "learning_rate": 0.00013333669675245067, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.00021436981085123423, + "loss": 0.0156, "step": 220230 }, { - "epoch": 1.11, - "learning_rate": 0.00013332912905943665, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.00021436592263486277, + "loss": 0.0168, "step": 220240 }, { - "epoch": 1.11, - "learning_rate": 0.00013332156136642266, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021436203441849128, + "loss": 0.0148, "step": 220250 }, { - "epoch": 1.11, - "learning_rate": 0.00013331399367340864, - "loss": 0.007, + "epoch": 0.57, + "learning_rate": 0.00021435814620211985, + "loss": 0.0157, "step": 220260 }, { - "epoch": 1.11, - "learning_rate": 0.00013330642598039462, - "loss": 0.013, + "epoch": 0.57, + "learning_rate": 0.00021435425798574837, + "loss": 0.0154, "step": 220270 }, { - "epoch": 1.11, - "learning_rate": 0.0001332988582873806, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.0002143503697693769, + "loss": 0.0131, "step": 220280 }, { - "epoch": 1.11, - "learning_rate": 0.00013329129059436659, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.00021434648155300542, + "loss": 0.0184, "step": 220290 }, { - "epoch": 1.11, - "learning_rate": 0.00013328372290135257, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.000214342593336634, + "loss": 0.0134, "step": 220300 }, { - "epoch": 1.11, - "learning_rate": 0.00013327615520833858, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021433870512026253, + "loss": 0.0173, "step": 220310 }, { - "epoch": 1.11, - "learning_rate": 0.00013326858751532456, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021433481690389105, + "loss": 0.0188, "step": 220320 }, { - "epoch": 1.11, - "learning_rate": 0.00013326101982231054, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002143309286875196, + "loss": 0.0158, "step": 220330 }, { - "epoch": 1.11, - "learning_rate": 0.00013325345212929655, - "loss": 0.0113, + "epoch": 0.57, + "learning_rate": 0.0002143270404711481, + "loss": 0.0179, "step": 220340 }, { - "epoch": 1.11, - "learning_rate": 0.00013324588443628253, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021432315225477667, + "loss": 0.0183, "step": 220350 }, { - "epoch": 1.11, - "learning_rate": 0.0001332383167432685, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002143192640384052, + "loss": 0.0163, "step": 220360 }, { - "epoch": 1.11, - "learning_rate": 0.00013323074905025452, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021431537582203373, + "loss": 0.0139, "step": 220370 }, { - "epoch": 1.11, - "learning_rate": 0.0001332231813572405, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.00021431148760566224, + "loss": 0.0144, "step": 220380 }, { - "epoch": 1.11, - "learning_rate": 0.00013321561366422648, - "loss": 0.0114, + "epoch": 0.57, + "learning_rate": 0.0002143075993892908, + "loss": 0.0169, "step": 220390 }, { - "epoch": 1.11, - "learning_rate": 0.0001332080459712125, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021430371117291933, + "loss": 0.0136, "step": 220400 }, { - "epoch": 1.11, - "learning_rate": 0.00013320047827819847, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021429982295654787, + "loss": 0.0167, "step": 220410 }, { - "epoch": 1.11, - "learning_rate": 0.00013319291058518445, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021429593474017638, + "loss": 0.0161, "step": 220420 }, { - "epoch": 1.11, - "learning_rate": 0.00013318534289217046, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.00021429204652380495, + "loss": 0.0161, "step": 220430 }, { - "epoch": 1.11, - "learning_rate": 0.00013317777519915644, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021428815830743347, + "loss": 0.0182, "step": 220440 }, { - "epoch": 1.11, - "learning_rate": 0.00013317020750614242, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.000214284270091062, + "loss": 0.0182, "step": 220450 }, { - "epoch": 1.11, - "learning_rate": 0.00013316263981312843, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.00021428038187469052, + "loss": 0.0187, "step": 220460 }, { - "epoch": 1.11, - "learning_rate": 0.00013315507212011441, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.0002142764936583191, + "loss": 0.0166, "step": 220470 }, { - "epoch": 1.11, - "learning_rate": 0.0001331475044271004, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021427260544194763, + "loss": 0.0157, "step": 220480 }, { - "epoch": 1.11, - "learning_rate": 0.00013313993673408638, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021426871722557615, + "loss": 0.0129, "step": 220490 }, { - "epoch": 1.11, - "learning_rate": 0.00013313236904107239, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.0002142648290092047, + "loss": 0.0188, "step": 220500 }, { - "epoch": 1.11, - "learning_rate": 0.00013312480134805837, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021426094079283323, + "loss": 0.0157, "step": 220510 }, { - "epoch": 1.11, - "learning_rate": 0.00013311723365504435, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021425705257646177, + "loss": 0.0135, "step": 220520 }, { - "epoch": 1.11, - "learning_rate": 0.00013310966596203036, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.00021425316436009029, + "loss": 0.0304, "step": 220530 }, { - "epoch": 1.11, - "learning_rate": 0.00013310209826901634, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021424927614371883, + "loss": 0.0189, "step": 220540 }, { - "epoch": 1.11, - "learning_rate": 0.00013309453057600232, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021424538792734737, + "loss": 0.0166, "step": 220550 }, { - "epoch": 1.11, - "learning_rate": 0.00013308696288298833, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.0002142414997109759, + "loss": 0.015, "step": 220560 }, { - "epoch": 1.11, - "learning_rate": 0.0001330793951899743, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021423761149460443, + "loss": 0.0194, "step": 220570 }, { - "epoch": 1.11, - "learning_rate": 0.0001330718274969603, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021423372327823297, + "loss": 0.0166, "step": 220580 }, { - "epoch": 1.11, - "learning_rate": 0.0001330642598039463, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021422983506186148, + "loss": 0.0187, "step": 220590 }, { - "epoch": 1.11, - "learning_rate": 0.00013305669211093228, - "loss": 0.0103, + "epoch": 0.57, + "learning_rate": 0.00021422594684549005, + "loss": 0.0162, "step": 220600 }, { - "epoch": 1.11, - "learning_rate": 0.00013304912441791826, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021422205862911856, + "loss": 0.0156, "step": 220610 }, { - "epoch": 1.11, - "learning_rate": 0.00013304155672490427, - "loss": 0.0079, + "epoch": 0.57, + "learning_rate": 0.0002142181704127471, + "loss": 0.0201, "step": 220620 }, { - "epoch": 1.11, - "learning_rate": 0.00013303398903189025, - "loss": 0.0076, + "epoch": 0.57, + "learning_rate": 0.00021421428219637562, + "loss": 0.0156, "step": 220630 }, { - "epoch": 1.11, - "learning_rate": 0.00013302642133887623, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.0002142103939800042, + "loss": 0.0161, "step": 220640 }, { - "epoch": 1.11, - "learning_rate": 0.00013301885364586222, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021420650576363273, + "loss": 0.0183, "step": 220650 }, { - "epoch": 1.11, - "learning_rate": 0.00013301128595284822, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021420261754726125, + "loss": 0.0186, "step": 220660 }, { - "epoch": 1.11, - "learning_rate": 0.0001330037182598342, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021419872933088976, + "loss": 0.0219, "step": 220670 }, { - "epoch": 1.11, - "learning_rate": 0.0001329961505668202, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021419484111451833, + "loss": 0.0147, "step": 220680 }, { - "epoch": 1.11, - "learning_rate": 0.0001329885828738062, - "loss": 0.0122, + "epoch": 0.57, + "learning_rate": 0.00021419095289814687, + "loss": 0.0179, "step": 220690 }, { - "epoch": 1.11, - "learning_rate": 0.00013298101518079218, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.00021418706468177539, + "loss": 0.0204, "step": 220700 }, { - "epoch": 1.11, - "learning_rate": 0.00013297344748777816, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021418317646540393, + "loss": 0.0188, "step": 220710 }, { - "epoch": 1.11, - "learning_rate": 0.00013296587979476417, - "loss": 0.0101, + "epoch": 0.57, + "learning_rate": 0.00021417928824903247, + "loss": 0.018, "step": 220720 }, { - "epoch": 1.11, - "learning_rate": 0.00013295831210175015, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.000214175400032661, + "loss": 0.019, "step": 220730 }, { - "epoch": 1.11, - "learning_rate": 0.00013295074440873613, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021417151181628952, + "loss": 0.0176, "step": 220740 }, { - "epoch": 1.11, - "learning_rate": 0.00013294317671572214, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021416762359991807, + "loss": 0.0158, "step": 220750 }, { - "epoch": 1.11, - "learning_rate": 0.00013293560902270812, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.0002141637353835466, + "loss": 0.0175, "step": 220760 }, { - "epoch": 1.11, - "learning_rate": 0.0001329280413296941, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.00021415984716717515, + "loss": 0.0188, "step": 220770 }, { - "epoch": 1.11, - "learning_rate": 0.0001329204736366801, - "loss": 0.0127, + "epoch": 0.57, + "learning_rate": 0.00021415595895080366, + "loss": 0.0165, "step": 220780 }, { - "epoch": 1.11, - "learning_rate": 0.0001329129059436661, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002141520707344322, + "loss": 0.0158, "step": 220790 }, { - "epoch": 1.11, - "learning_rate": 0.00013290533825065207, - "loss": 0.0071, + "epoch": 0.57, + "learning_rate": 0.00021414818251806077, + "loss": 0.0175, "step": 220800 }, { - "epoch": 1.11, - "learning_rate": 0.00013289777055763805, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.0002141442943016893, + "loss": 0.0182, "step": 220810 }, { - "epoch": 1.11, - "learning_rate": 0.00013289020286462406, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.0002141404060853178, + "loss": 0.0186, "step": 220820 }, { - "epoch": 1.11, - "learning_rate": 0.00013288263517161004, - "loss": 0.0083, + "epoch": 0.57, + "learning_rate": 0.00021413651786894635, + "loss": 0.02, "step": 220830 }, { - "epoch": 1.11, - "learning_rate": 0.00013287506747859603, - "loss": 0.0131, + "epoch": 0.57, + "learning_rate": 0.00021413262965257486, + "loss": 0.0163, "step": 220840 }, { - "epoch": 1.11, - "learning_rate": 0.00013286749978558203, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021412874143620343, + "loss": 0.0141, "step": 220850 }, { - "epoch": 1.11, - "learning_rate": 0.00013285993209256802, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021412485321983197, + "loss": 0.0159, "step": 220860 }, { - "epoch": 1.11, - "learning_rate": 0.000132852364399554, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021412096500346048, + "loss": 0.0179, "step": 220870 }, { - "epoch": 1.11, - "learning_rate": 0.00013284479670654, - "loss": 0.0118, + "epoch": 0.57, + "learning_rate": 0.00021411707678708903, + "loss": 0.019, "step": 220880 }, { - "epoch": 1.11, - "learning_rate": 0.000132837229013526, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021411318857071757, + "loss": 0.0157, "step": 220890 }, { - "epoch": 1.11, - "learning_rate": 0.00013282966132051197, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002141093003543461, + "loss": 0.0154, "step": 220900 }, { - "epoch": 1.11, - "learning_rate": 0.00013282209362749795, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021410541213797462, + "loss": 0.0168, "step": 220910 }, { - "epoch": 1.11, - "learning_rate": 0.00013281452593448393, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021410152392160317, + "loss": 0.017, "step": 220920 }, { - "epoch": 1.11, - "learning_rate": 0.00013280695824146994, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.0002140976357052317, + "loss": 0.0145, "step": 220930 }, { - "epoch": 1.11, - "learning_rate": 0.00013279939054845592, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.00021409374748886025, + "loss": 0.016, "step": 220940 }, { - "epoch": 1.11, - "learning_rate": 0.0001327918228554419, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021408985927248876, + "loss": 0.0151, "step": 220950 }, { - "epoch": 1.11, - "learning_rate": 0.0001327842551624279, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.0002140859710561173, + "loss": 0.0167, "step": 220960 }, { - "epoch": 1.11, - "learning_rate": 0.0001327766874694139, - "loss": 0.0092, + "epoch": 0.57, + "learning_rate": 0.00021408208283974587, + "loss": 0.0141, "step": 220970 }, { - "epoch": 1.11, - "learning_rate": 0.00013276911977639987, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.0002140781946233744, + "loss": 0.0195, "step": 220980 }, { - "epoch": 1.11, - "learning_rate": 0.00013276155208338588, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.0002140743064070029, + "loss": 0.0174, "step": 220990 }, { - "epoch": 1.11, - "learning_rate": 0.00013275398439037186, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021407041819063144, + "loss": 0.0136, "step": 221000 }, { - "epoch": 1.11, - "eval_cer": 0.9144712262992877, - "eval_loss": 0.007316153962165117, - "eval_runtime": 116.2409, - "eval_samples_per_second": 17.206, - "eval_steps_per_second": 4.301, + "epoch": 0.57, + "eval_cer": 0.8817754674437451, + "eval_loss": 0.011082570999860764, + "eval_runtime": 107.259, + "eval_samples_per_second": 18.646, + "eval_steps_per_second": 4.662, "step": 221000 }, { - "epoch": 1.12, - "learning_rate": 0.00013274641669735785, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021406652997426001, + "loss": 0.0179, "step": 221010 }, { - "epoch": 1.12, - "learning_rate": 0.00013273884900434383, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021406264175788853, + "loss": 0.0198, "step": 221020 }, { - "epoch": 1.12, - "learning_rate": 0.00013273128131132984, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021405875354151707, + "loss": 0.0141, "step": 221030 }, { - "epoch": 1.12, - "learning_rate": 0.00013272371361831582, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021405486532514558, + "loss": 0.0174, "step": 221040 }, { - "epoch": 1.12, - "learning_rate": 0.0001327161459253018, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.00021405097710877415, + "loss": 0.0184, "step": 221050 }, { - "epoch": 1.12, - "learning_rate": 0.0001327085782322878, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.00021404708889240267, + "loss": 0.0134, "step": 221060 }, { - "epoch": 1.12, - "learning_rate": 0.0001327010105392738, - "loss": 0.0076, + "epoch": 0.57, + "learning_rate": 0.0002140432006760312, + "loss": 0.0165, "step": 221070 }, { - "epoch": 1.12, - "learning_rate": 0.00013269344284625977, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021403931245965972, + "loss": 0.0162, "step": 221080 }, { - "epoch": 1.12, - "learning_rate": 0.00013268587515324578, - "loss": 0.007, + "epoch": 0.57, + "learning_rate": 0.00021403542424328827, + "loss": 0.0165, "step": 221090 }, { - "epoch": 1.12, - "learning_rate": 0.00013267830746023176, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.0002140315360269168, + "loss": 0.0138, "step": 221100 }, { - "epoch": 1.12, - "learning_rate": 0.00013267073976721774, - "loss": 0.0145, + "epoch": 0.57, + "learning_rate": 0.00021402764781054535, + "loss": 0.0155, "step": 221110 }, { - "epoch": 1.12, - "learning_rate": 0.00013266317207420375, - "loss": 0.0096, - "step": 221120 + "epoch": 0.57, + "learning_rate": 0.00021402375959417386, + "loss": 0.0162, + "step": 221120 }, { - "epoch": 1.12, - "learning_rate": 0.00013265560438118973, - "loss": 0.0093, + "epoch": 0.57, + "learning_rate": 0.0002140198713778024, + "loss": 0.016, "step": 221130 }, { - "epoch": 1.12, - "learning_rate": 0.0001326480366881757, - "loss": 0.0106, + "epoch": 0.57, + "learning_rate": 0.00021401598316143095, + "loss": 0.0145, "step": 221140 }, { - "epoch": 1.12, - "learning_rate": 0.00013264046899516172, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.0002140120949450595, + "loss": 0.0157, "step": 221150 }, { - "epoch": 1.12, - "learning_rate": 0.0001326329013021477, - "loss": 0.0187, + "epoch": 0.57, + "learning_rate": 0.000214008206728688, + "loss": 0.0159, "step": 221160 }, { - "epoch": 1.12, - "learning_rate": 0.00013262533360913368, - "loss": 0.013, + "epoch": 0.57, + "learning_rate": 0.00021400431851231654, + "loss": 0.0166, "step": 221170 }, { - "epoch": 1.12, - "learning_rate": 0.00013261776591611967, - "loss": 0.0105, + "epoch": 0.57, + "learning_rate": 0.0002140004302959451, + "loss": 0.0143, "step": 221180 }, { - "epoch": 1.12, - "learning_rate": 0.00013261019822310567, - "loss": 0.0121, + "epoch": 0.57, + "learning_rate": 0.00021399654207957363, + "loss": 0.0164, "step": 221190 }, { - "epoch": 1.12, - "learning_rate": 0.00013260263053009166, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021399265386320217, + "loss": 0.0199, "step": 221200 }, { - "epoch": 1.12, - "learning_rate": 0.00013259506283707764, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021398876564683068, + "loss": 0.0198, "step": 221210 }, { - "epoch": 1.12, - "learning_rate": 0.00013258749514406365, - "loss": 0.0065, + "epoch": 0.57, + "learning_rate": 0.00021398487743045925, + "loss": 0.0207, "step": 221220 }, { - "epoch": 1.12, - "learning_rate": 0.00013257992745104963, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021398098921408777, + "loss": 0.0119, "step": 221230 }, { - "epoch": 1.12, - "learning_rate": 0.0001325723597580356, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.0002139771009977163, + "loss": 0.0175, "step": 221240 }, { - "epoch": 1.12, - "learning_rate": 0.00013256479206502162, - "loss": 0.0107, + "epoch": 0.57, + "learning_rate": 0.00021397321278134482, + "loss": 0.0151, "step": 221250 }, { - "epoch": 1.12, - "learning_rate": 0.0001325572243720076, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002139693245649734, + "loss": 0.0164, "step": 221260 }, { - "epoch": 1.12, - "learning_rate": 0.00013254965667899358, - "loss": 0.0091, + "epoch": 0.57, + "learning_rate": 0.0002139654363486019, + "loss": 0.0174, "step": 221270 }, { - "epoch": 1.12, - "learning_rate": 0.0001325420889859796, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.00021396154813223045, + "loss": 0.0153, "step": 221280 }, { - "epoch": 1.12, - "learning_rate": 0.00013253452129296557, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021395765991585896, + "loss": 0.0212, "step": 221290 }, { - "epoch": 1.12, - "learning_rate": 0.00013252695359995155, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021395377169948753, + "loss": 0.017, "step": 221300 }, { - "epoch": 1.12, - "learning_rate": 0.00013251938590693756, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.00021394988348311605, + "loss": 0.0139, "step": 221310 }, { - "epoch": 1.12, - "learning_rate": 0.00013251181821392354, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.0002139459952667446, + "loss": 0.0152, "step": 221320 }, { - "epoch": 1.12, - "learning_rate": 0.00013250425052090952, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.0002139421070503731, + "loss": 0.0148, "step": 221330 }, { - "epoch": 1.12, - "learning_rate": 0.0001324966828278955, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021393821883400164, + "loss": 0.0147, "step": 221340 }, { - "epoch": 1.12, - "learning_rate": 0.0001324891151348815, - "loss": 0.008, + "epoch": 0.57, + "learning_rate": 0.0002139343306176302, + "loss": 0.0146, "step": 221350 }, { - "epoch": 1.12, - "learning_rate": 0.0001324815474418675, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021393044240125873, + "loss": 0.0143, "step": 221360 }, { - "epoch": 1.12, - "learning_rate": 0.00013247397974885348, - "loss": 0.0129, + "epoch": 0.57, + "learning_rate": 0.00021392655418488727, + "loss": 0.0147, "step": 221370 }, { - "epoch": 1.12, - "learning_rate": 0.00013246641205583948, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.00021392266596851578, + "loss": 0.0156, "step": 221380 }, { - "epoch": 1.12, - "learning_rate": 0.00013245884436282547, - "loss": 0.0082, + "epoch": 0.57, + "learning_rate": 0.00021391877775214435, + "loss": 0.0165, "step": 221390 }, { - "epoch": 1.12, - "learning_rate": 0.00013245127666981145, - "loss": 0.0102, + "epoch": 0.57, + "learning_rate": 0.00021391488953577287, + "loss": 0.0153, "step": 221400 }, { - "epoch": 1.12, - "learning_rate": 0.00013244370897679746, - "loss": 0.01, + "epoch": 0.57, + "learning_rate": 0.0002139110013194014, + "loss": 0.015, "step": 221410 }, { - "epoch": 1.12, - "learning_rate": 0.00013243614128378344, - "loss": 0.0097, + "epoch": 0.57, + "learning_rate": 0.00021390711310302992, + "loss": 0.0158, "step": 221420 }, { - "epoch": 1.12, - "learning_rate": 0.00013242857359076942, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002139032248866585, + "loss": 0.0167, "step": 221430 }, { - "epoch": 1.12, - "learning_rate": 0.00013242100589775543, - "loss": 0.0088, + "epoch": 0.57, + "learning_rate": 0.000213899336670287, + "loss": 0.0206, "step": 221440 }, { - "epoch": 1.12, - "learning_rate": 0.0001324134382047414, - "loss": 0.0119, + "epoch": 0.57, + "learning_rate": 0.00021389544845391555, + "loss": 0.0145, "step": 221450 }, { - "epoch": 1.12, - "learning_rate": 0.0001324058705117274, - "loss": 0.0087, + "epoch": 0.57, + "learning_rate": 0.00021389156023754406, + "loss": 0.0147, "step": 221460 }, { - "epoch": 1.12, - "learning_rate": 0.0001323983028187134, - "loss": 0.0078, + "epoch": 0.57, + "learning_rate": 0.00021388767202117263, + "loss": 0.0135, "step": 221470 }, { - "epoch": 1.12, - "learning_rate": 0.00013239073512569938, - "loss": 0.0089, + "epoch": 0.57, + "learning_rate": 0.00021388378380480115, + "loss": 0.0129, "step": 221480 }, { - "epoch": 1.12, - "learning_rate": 0.00013238316743268536, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.0002138798955884297, + "loss": 0.0121, "step": 221490 }, { - "epoch": 1.12, - "learning_rate": 0.00013237559973967137, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.0002138760073720582, + "loss": 0.0173, "step": 221500 }, { - "epoch": 1.12, - "learning_rate": 0.00013236803204665735, - "loss": 0.0108, + "epoch": 0.57, + "learning_rate": 0.00021387211915568677, + "loss": 0.0198, "step": 221510 }, { - "epoch": 1.12, - "learning_rate": 0.00013236046435364333, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.0002138682309393153, + "loss": 0.0193, "step": 221520 }, { - "epoch": 1.12, - "learning_rate": 0.00013235289666062931, - "loss": 0.0085, + "epoch": 0.57, + "learning_rate": 0.00021386434272294383, + "loss": 0.016, "step": 221530 }, { - "epoch": 1.12, - "learning_rate": 0.0001323453289676153, - "loss": 0.0081, + "epoch": 0.57, + "learning_rate": 0.00021386045450657234, + "loss": 0.0155, "step": 221540 }, { - "epoch": 1.12, - "learning_rate": 0.00013233776127460128, - "loss": 0.0098, + "epoch": 0.57, + "learning_rate": 0.0002138565662902009, + "loss": 0.017, "step": 221550 }, { - "epoch": 1.12, - "learning_rate": 0.00013233019358158729, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.00021385267807382945, + "loss": 0.0169, "step": 221560 }, { - "epoch": 1.12, - "learning_rate": 0.00013232262588857327, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021384878985745797, + "loss": 0.0187, "step": 221570 }, { - "epoch": 1.12, - "learning_rate": 0.00013231505819555925, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.0002138449016410865, + "loss": 0.0189, "step": 221580 }, { - "epoch": 1.12, - "learning_rate": 0.00013230749050254526, - "loss": 0.0135, + "epoch": 0.57, + "learning_rate": 0.00021384101342471502, + "loss": 0.0152, "step": 221590 }, { - "epoch": 1.12, - "learning_rate": 0.00013229992280953124, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.0002138371252083436, + "loss": 0.0175, "step": 221600 }, { - "epoch": 1.12, - "learning_rate": 0.00013229235511651722, - "loss": 0.0072, + "epoch": 0.57, + "learning_rate": 0.0002138332369919721, + "loss": 0.0148, "step": 221610 }, { - "epoch": 1.12, - "learning_rate": 0.00013228478742350323, - "loss": 0.0124, + "epoch": 0.57, + "learning_rate": 0.00021382934877560065, + "loss": 0.0158, "step": 221620 }, { - "epoch": 1.12, - "learning_rate": 0.0001322772197304892, - "loss": 0.0096, + "epoch": 0.57, + "learning_rate": 0.00021382546055922916, + "loss": 0.0188, "step": 221630 }, { - "epoch": 1.12, - "learning_rate": 0.0001322696520374752, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021382157234285773, + "loss": 0.0141, "step": 221640 }, { - "epoch": 1.12, - "learning_rate": 0.0001322620843444612, - "loss": 0.0104, + "epoch": 0.57, + "learning_rate": 0.00021381768412648624, + "loss": 0.0149, "step": 221650 }, { - "epoch": 1.12, - "learning_rate": 0.00013225451665144718, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021381379591011479, + "loss": 0.0157, "step": 221660 }, { - "epoch": 1.12, - "learning_rate": 0.00013224694895843316, - "loss": 0.0111, + "epoch": 0.57, + "learning_rate": 0.0002138099076937433, + "loss": 0.0194, "step": 221670 }, { - "epoch": 1.12, - "learning_rate": 0.00013223938126541917, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021380601947737187, + "loss": 0.0182, "step": 221680 }, { - "epoch": 1.12, - "learning_rate": 0.00013223181357240515, - "loss": 0.0112, + "epoch": 0.57, + "learning_rate": 0.0002138021312610004, + "loss": 0.0175, "step": 221690 }, { - "epoch": 1.12, - "learning_rate": 0.00013222424587939113, - "loss": 0.0302, + "epoch": 0.57, + "learning_rate": 0.00021379824304462893, + "loss": 0.0137, "step": 221700 }, { - "epoch": 1.12, - "learning_rate": 0.00013221667818637712, - "loss": 0.0137, + "epoch": 0.57, + "learning_rate": 0.00021379435482825744, + "loss": 0.0174, "step": 221710 }, { - "epoch": 1.12, - "learning_rate": 0.00013220911049336312, - "loss": 0.0125, + "epoch": 0.57, + "learning_rate": 0.000213790466611886, + "loss": 0.0172, "step": 221720 }, { - "epoch": 1.12, - "learning_rate": 0.0001322015428003491, - "loss": 0.0086, + "epoch": 0.57, + "learning_rate": 0.00021378657839551455, + "loss": 0.0174, "step": 221730 }, { - "epoch": 1.12, - "learning_rate": 0.0001321939751073351, - "loss": 0.0094, + "epoch": 0.57, + "learning_rate": 0.00021378269017914307, + "loss": 0.017, "step": 221740 }, { - "epoch": 1.12, - "learning_rate": 0.0001321864074143211, - "loss": 0.0084, + "epoch": 0.57, + "learning_rate": 0.0002137788019627716, + "loss": 0.0149, "step": 221750 }, { - "epoch": 1.12, - "learning_rate": 0.00013217883972130708, - "loss": 0.0071, + "epoch": 0.57, + "learning_rate": 0.00021377491374640015, + "loss": 0.0226, "step": 221760 }, { - "epoch": 1.12, - "learning_rate": 0.00013217127202829306, - "loss": 0.0095, + "epoch": 0.57, + "learning_rate": 0.0002137710255300287, + "loss": 0.0146, "step": 221770 }, { - "epoch": 1.12, - "learning_rate": 0.00013216370433527907, - "loss": 0.0073, + "epoch": 0.57, + "learning_rate": 0.0002137671373136572, + "loss": 0.017, "step": 221780 }, { - "epoch": 1.12, - "learning_rate": 0.00013215613664226505, - "loss": 0.0099, + "epoch": 0.57, + "learning_rate": 0.00021376324909728575, + "loss": 0.0134, "step": 221790 }, { - "epoch": 1.12, - "learning_rate": 0.00013214856894925103, - "loss": 0.011, + "epoch": 0.57, + "learning_rate": 0.0002137593608809143, + "loss": 0.0154, "step": 221800 }, { - "epoch": 1.12, - "learning_rate": 0.00013214100125623704, - "loss": 0.009, + "epoch": 0.57, + "learning_rate": 0.00021375547266454283, + "loss": 0.0192, "step": 221810 }, { - "epoch": 1.12, - "learning_rate": 0.00013213343356322302, - "loss": 0.0075, + "epoch": 0.57, + "learning_rate": 0.00021375158444817134, + "loss": 0.0129, "step": 221820 }, { - "epoch": 1.12, - "learning_rate": 0.000132125865870209, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021374769623179989, + "loss": 0.019, "step": 221830 }, { - "epoch": 1.12, - "learning_rate": 0.000132118298177195, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.0002137438080154284, + "loss": 0.0162, "step": 221840 }, { - "epoch": 1.12, - "learning_rate": 0.000132110730484181, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021373991979905697, + "loss": 0.0189, "step": 221850 }, { - "epoch": 1.12, - "learning_rate": 0.00013210316279116697, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021373603158268548, + "loss": 0.0153, "step": 221860 }, { - "epoch": 1.12, - "learning_rate": 0.00013209559509815298, - "loss": 0.0126, + "epoch": 0.58, + "learning_rate": 0.00021373214336631403, + "loss": 0.0142, "step": 221870 }, { - "epoch": 1.12, - "learning_rate": 0.00013208802740513896, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021372825514994254, + "loss": 0.0184, "step": 221880 }, { - "epoch": 1.12, - "learning_rate": 0.00013208045971212494, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.0002137243669335711, + "loss": 0.0182, "step": 221890 }, { - "epoch": 1.12, - "learning_rate": 0.00013207289201911093, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021372047871719965, + "loss": 0.0164, "step": 221900 }, { - "epoch": 1.12, - "learning_rate": 0.00013206532432609693, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021371659050082816, + "loss": 0.0161, "step": 221910 }, { - "epoch": 1.12, - "learning_rate": 0.00013205775663308292, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.0002137127022844567, + "loss": 0.0167, "step": 221920 }, { - "epoch": 1.12, - "learning_rate": 0.0001320501889400689, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021370881406808525, + "loss": 0.0204, "step": 221930 }, { - "epoch": 1.12, - "learning_rate": 0.0001320426212470549, - "loss": 0.0119, + "epoch": 0.58, + "learning_rate": 0.0002137049258517138, + "loss": 0.019, "step": 221940 }, { - "epoch": 1.12, - "learning_rate": 0.0001320350535540409, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.0002137010376353423, + "loss": 0.0186, "step": 221950 }, { - "epoch": 1.12, - "learning_rate": 0.00013202748586102687, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021369714941897085, + "loss": 0.0164, "step": 221960 }, { - "epoch": 1.12, - "learning_rate": 0.00013201991816801288, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.0002136932612025994, + "loss": 0.018, "step": 221970 }, { - "epoch": 1.12, - "learning_rate": 0.00013201235047499886, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021368937298622793, + "loss": 0.0183, "step": 221980 }, { - "epoch": 1.12, - "learning_rate": 0.00013200478278198484, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021368548476985644, + "loss": 0.0156, "step": 221990 }, { - "epoch": 1.12, - "learning_rate": 0.00013199721508897085, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021368159655348499, + "loss": 0.0141, "step": 222000 }, { - "epoch": 1.12, - "eval_cer": 0.9144731670915385, - "eval_loss": 0.007101530209183693, - "eval_runtime": 116.3424, - "eval_samples_per_second": 17.191, - "eval_steps_per_second": 4.298, + "epoch": 0.58, + "eval_cer": 0.8817600714374692, + "eval_loss": 0.011201182380318642, + "eval_runtime": 107.2894, + "eval_samples_per_second": 18.641, + "eval_steps_per_second": 4.66, "step": 222000 }, { - "epoch": 1.12, - "learning_rate": 0.00013198964739595683, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.00021367770833711353, + "loss": 0.0159, "step": 222010 }, { - "epoch": 1.12, - "learning_rate": 0.0001319820797029428, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021367382012074207, + "loss": 0.0171, "step": 222020 }, { - "epoch": 1.12, - "learning_rate": 0.00013197451200992882, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021366993190437058, + "loss": 0.0216, "step": 222030 }, { - "epoch": 1.12, - "learning_rate": 0.0001319669443169148, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.00021366604368799912, + "loss": 0.0186, "step": 222040 }, { - "epoch": 1.12, - "learning_rate": 0.00013195937662390078, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.0002136621554716277, + "loss": 0.0166, "step": 222050 }, { - "epoch": 1.12, - "learning_rate": 0.00013195180893088676, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.0002136582672552562, + "loss": 0.0178, "step": 222060 }, { - "epoch": 1.12, - "learning_rate": 0.00013194424123787277, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021365437903888475, + "loss": 0.0164, "step": 222070 }, { - "epoch": 1.12, - "learning_rate": 0.00013193667354485875, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021365049082251326, + "loss": 0.0161, "step": 222080 }, { - "epoch": 1.12, - "learning_rate": 0.00013192910585184474, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.0002136466026061418, + "loss": 0.016, "step": 222090 }, { - "epoch": 1.12, - "learning_rate": 0.00013192153815883074, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021364271438977035, + "loss": 0.0152, "step": 222100 }, { - "epoch": 1.12, - "learning_rate": 0.00013191397046581673, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.0002136388261733989, + "loss": 0.0156, "step": 222110 }, { - "epoch": 1.12, - "learning_rate": 0.0001319064027728027, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.0002136349379570274, + "loss": 0.0197, "step": 222120 }, { - "epoch": 1.12, - "learning_rate": 0.00013189883507978872, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021363104974065595, + "loss": 0.0166, "step": 222130 }, { - "epoch": 1.12, - "learning_rate": 0.0001318912673867747, - "loss": 0.0071, + "epoch": 0.58, + "learning_rate": 0.0002136271615242845, + "loss": 0.0171, "step": 222140 }, { - "epoch": 1.12, - "learning_rate": 0.00013188369969376068, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021362327330791303, + "loss": 0.0189, "step": 222150 }, { - "epoch": 1.12, - "learning_rate": 0.00013187613200074666, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021361938509154154, + "loss": 0.0159, "step": 222160 }, { - "epoch": 1.12, - "learning_rate": 0.00013186856430773264, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021361549687517008, + "loss": 0.0224, "step": 222170 }, { - "epoch": 1.12, - "learning_rate": 0.00013186099661471865, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021361160865879863, + "loss": 0.0177, "step": 222180 }, { - "epoch": 1.12, - "learning_rate": 0.00013185342892170463, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021360772044242717, + "loss": 0.0156, "step": 222190 }, { - "epoch": 1.12, - "learning_rate": 0.0001318458612286906, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021360383222605568, + "loss": 0.0176, "step": 222200 }, { - "epoch": 1.12, - "learning_rate": 0.00013183829353567662, - "loss": 0.0074, + "epoch": 0.58, + "learning_rate": 0.00021359994400968422, + "loss": 0.0161, "step": 222210 }, { - "epoch": 1.12, - "learning_rate": 0.0001318307258426626, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.0002135960557933128, + "loss": 0.0174, "step": 222220 }, { - "epoch": 1.12, - "learning_rate": 0.00013182315814964858, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.0002135921675769413, + "loss": 0.0137, "step": 222230 }, { - "epoch": 1.12, - "learning_rate": 0.00013181559045663457, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021358827936056985, + "loss": 0.0147, "step": 222240 }, { - "epoch": 1.12, - "learning_rate": 0.00013180802276362057, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021358439114419836, + "loss": 0.0148, "step": 222250 }, { - "epoch": 1.12, - "learning_rate": 0.00013180045507060656, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021358050292782693, + "loss": 0.0201, "step": 222260 }, { - "epoch": 1.12, - "learning_rate": 0.00013179288737759254, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021357661471145545, + "loss": 0.0176, "step": 222270 }, { - "epoch": 1.12, - "learning_rate": 0.00013178531968457855, - "loss": 0.0102, + "epoch": 0.58, + "learning_rate": 0.000213572726495084, + "loss": 0.0158, "step": 222280 }, { - "epoch": 1.12, - "learning_rate": 0.00013177775199156453, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.0002135688382787125, + "loss": 0.0216, "step": 222290 }, { - "epoch": 1.12, - "learning_rate": 0.0001317701842985505, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021356495006234107, + "loss": 0.0187, "step": 222300 }, { - "epoch": 1.12, - "learning_rate": 0.00013176261660553652, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021356106184596959, + "loss": 0.0156, "step": 222310 }, { - "epoch": 1.12, - "learning_rate": 0.0001317550489125225, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021355717362959813, + "loss": 0.017, "step": 222320 }, { - "epoch": 1.12, - "learning_rate": 0.00013174748121950848, - "loss": 0.0113, + "epoch": 0.58, + "learning_rate": 0.00021355328541322664, + "loss": 0.0184, "step": 222330 }, { - "epoch": 1.12, - "learning_rate": 0.0001317399135264945, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021354939719685518, + "loss": 0.0167, "step": 222340 }, { - "epoch": 1.12, - "learning_rate": 0.00013173234583348047, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021354550898048373, + "loss": 0.0186, "step": 222350 }, { - "epoch": 1.12, - "learning_rate": 0.00013172477814046645, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021354162076411227, + "loss": 0.0243, "step": 222360 }, { - "epoch": 1.12, - "learning_rate": 0.00013171721044745246, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.00021353773254774078, + "loss": 0.0173, "step": 222370 }, { - "epoch": 1.12, - "learning_rate": 0.00013170964275443844, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021353384433136932, + "loss": 0.0157, "step": 222380 }, { - "epoch": 1.12, - "learning_rate": 0.00013170207506142442, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.0002135299561149979, + "loss": 0.0151, "step": 222390 }, { - "epoch": 1.12, - "learning_rate": 0.00013169450736841043, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.0002135260678986264, + "loss": 0.0205, "step": 222400 }, { - "epoch": 1.12, - "learning_rate": 0.0001316869396753964, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021352217968225492, + "loss": 0.0164, "step": 222410 }, { - "epoch": 1.12, - "learning_rate": 0.0001316793719823824, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021351829146588346, + "loss": 0.0137, "step": 222420 }, { - "epoch": 1.12, - "learning_rate": 0.00013167180428936838, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021351440324951203, + "loss": 0.0218, "step": 222430 }, { - "epoch": 1.12, - "learning_rate": 0.00013166423659635438, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021351051503314055, + "loss": 0.0186, "step": 222440 }, { - "epoch": 1.12, - "learning_rate": 0.00013165666890334037, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.0002135066268167691, + "loss": 0.0147, "step": 222450 }, { - "epoch": 1.12, - "learning_rate": 0.00013164910121032635, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002135027386003976, + "loss": 0.0158, "step": 222460 }, { - "epoch": 1.12, - "learning_rate": 0.00013164153351731236, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021349885038402617, + "loss": 0.0154, "step": 222470 }, { - "epoch": 1.12, - "learning_rate": 0.00013163396582429834, - "loss": 0.0102, + "epoch": 0.58, + "learning_rate": 0.00021349496216765469, + "loss": 0.0221, "step": 222480 }, { - "epoch": 1.12, - "learning_rate": 0.00013162639813128432, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021349107395128323, + "loss": 0.0159, "step": 222490 }, { - "epoch": 1.12, - "learning_rate": 0.00013161883043827033, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021348718573491174, + "loss": 0.0163, "step": 222500 }, { - "epoch": 1.12, - "learning_rate": 0.0001316112627452563, - "loss": 0.0152, + "epoch": 0.58, + "learning_rate": 0.0002134832975185403, + "loss": 0.0162, "step": 222510 }, { - "epoch": 1.12, - "learning_rate": 0.0001316036950522423, - "loss": 0.0075, + "epoch": 0.58, + "learning_rate": 0.00021347940930216883, + "loss": 0.0148, "step": 222520 }, { - "epoch": 1.12, - "learning_rate": 0.0001315961273592283, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021347552108579737, + "loss": 0.0167, "step": 222530 }, { - "epoch": 1.12, - "learning_rate": 0.00013158855966621428, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021347163286942588, + "loss": 0.0195, "step": 222540 }, { - "epoch": 1.12, - "learning_rate": 0.00013158099197320026, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021346774465305445, + "loss": 0.0131, "step": 222550 }, { - "epoch": 1.12, - "learning_rate": 0.00013157342428018627, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.000213463856436683, + "loss": 0.0159, "step": 222560 }, { - "epoch": 1.12, - "learning_rate": 0.00013156585658717225, - "loss": 0.0113, + "epoch": 0.58, + "learning_rate": 0.0002134599682203115, + "loss": 0.0165, "step": 222570 }, { - "epoch": 1.12, - "learning_rate": 0.00013155828889415823, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021345608000394002, + "loss": 0.0156, "step": 222580 }, { - "epoch": 1.12, - "learning_rate": 0.00013155072120114421, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021345219178756856, + "loss": 0.0169, "step": 222590 }, { - "epoch": 1.12, - "learning_rate": 0.00013154315350813022, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021344830357119713, + "loss": 0.015, "step": 222600 }, { - "epoch": 1.12, - "learning_rate": 0.0001315355858151162, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021344441535482565, + "loss": 0.016, "step": 222610 }, { - "epoch": 1.12, - "learning_rate": 0.00013152801812210219, - "loss": 0.0108, + "epoch": 0.58, + "learning_rate": 0.0002134405271384542, + "loss": 0.0252, "step": 222620 }, { - "epoch": 1.12, - "learning_rate": 0.0001315204504290882, - "loss": 0.0074, + "epoch": 0.58, + "learning_rate": 0.0002134366389220827, + "loss": 0.0642, "step": 222630 }, { - "epoch": 1.12, - "learning_rate": 0.00013151288273607418, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021343275070571127, + "loss": 0.0169, "step": 222640 }, { - "epoch": 1.12, - "learning_rate": 0.00013150531504306016, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021342886248933979, + "loss": 0.0138, "step": 222650 }, { - "epoch": 1.12, - "learning_rate": 0.00013149774735004617, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021342497427296833, + "loss": 0.0194, "step": 222660 }, { - "epoch": 1.12, - "learning_rate": 0.00013149017965703215, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021342108605659684, + "loss": 0.0156, "step": 222670 }, { - "epoch": 1.12, - "learning_rate": 0.00013148261196401813, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.0002134171978402254, + "loss": 0.0163, "step": 222680 }, { - "epoch": 1.12, - "learning_rate": 0.00013147504427100414, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021341330962385392, + "loss": 0.0155, "step": 222690 }, { - "epoch": 1.12, - "learning_rate": 0.00013146747657799012, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021340942140748247, + "loss": 0.0117, "step": 222700 }, { - "epoch": 1.12, - "learning_rate": 0.0001314599088849761, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021340553319111098, + "loss": 0.018, "step": 222710 }, { - "epoch": 1.12, - "learning_rate": 0.0001314523411919621, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021340164497473955, + "loss": 0.0186, "step": 222720 }, { - "epoch": 1.12, - "learning_rate": 0.0001314447734989481, - "loss": 0.0064, + "epoch": 0.58, + "learning_rate": 0.00021339775675836806, + "loss": 0.0152, "step": 222730 }, { - "epoch": 1.12, - "learning_rate": 0.00013143720580593407, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.0002133938685419966, + "loss": 0.0152, "step": 222740 }, { - "epoch": 1.12, - "learning_rate": 0.00013142963811292005, - "loss": 0.0119, + "epoch": 0.58, + "learning_rate": 0.00021338998032562512, + "loss": 0.0125, "step": 222750 }, { - "epoch": 1.12, - "learning_rate": 0.00013142207041990606, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.0002133860921092537, + "loss": 0.0168, "step": 222760 }, { - "epoch": 1.12, - "learning_rate": 0.00013141450272689204, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021338220389288223, + "loss": 0.0173, "step": 222770 }, { - "epoch": 1.12, - "learning_rate": 0.00013140693503387802, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021337831567651075, + "loss": 0.018, "step": 222780 }, { - "epoch": 1.12, - "learning_rate": 0.000131399367340864, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.0002133744274601393, + "loss": 0.0187, "step": 222790 }, { - "epoch": 1.12, - "learning_rate": 0.00013139179964785, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.0002133705392437678, + "loss": 0.0164, "step": 222800 }, { - "epoch": 1.12, - "learning_rate": 0.000131384231954836, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021336665102739637, + "loss": 0.015, "step": 222810 }, { - "epoch": 1.12, - "learning_rate": 0.00013137666426182198, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021336276281102488, + "loss": 0.0146, "step": 222820 }, { - "epoch": 1.12, - "learning_rate": 0.00013136909656880796, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021335887459465343, + "loss": 0.012, "step": 222830 }, { - "epoch": 1.12, - "learning_rate": 0.00013136152887579397, - "loss": 0.0119, + "epoch": 0.58, + "learning_rate": 0.00021335498637828194, + "loss": 0.0222, "step": 222840 }, { - "epoch": 1.12, - "learning_rate": 0.00013135396118277995, - "loss": 0.0116, + "epoch": 0.58, + "learning_rate": 0.0002133510981619105, + "loss": 0.0164, "step": 222850 }, { - "epoch": 1.12, - "learning_rate": 0.00013134639348976593, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021334720994553902, + "loss": 0.0172, "step": 222860 }, { - "epoch": 1.12, - "learning_rate": 0.00013133882579675194, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021334332172916757, + "loss": 0.0213, "step": 222870 }, { - "epoch": 1.12, - "learning_rate": 0.00013133125810373792, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021333943351279608, + "loss": 0.0153, "step": 222880 }, { - "epoch": 1.12, - "learning_rate": 0.0001313236904107239, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021333554529642465, + "loss": 0.0264, "step": 222890 }, { - "epoch": 1.12, - "learning_rate": 0.0001313161227177099, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021333165708005316, + "loss": 0.0198, "step": 222900 }, { - "epoch": 1.12, - "learning_rate": 0.0001313085550246959, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.0002133277688636817, + "loss": 0.0173, "step": 222910 }, { - "epoch": 1.12, - "learning_rate": 0.00013130098733168187, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021332388064731022, + "loss": 0.0166, "step": 222920 }, { - "epoch": 1.12, - "learning_rate": 0.00013129341963866788, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.0002133199924309388, + "loss": 0.0212, "step": 222930 }, { - "epoch": 1.12, - "learning_rate": 0.00013128585194565386, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021331610421456733, + "loss": 0.017, "step": 222940 }, { - "epoch": 1.12, - "learning_rate": 0.00013127828425263984, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021331221599819584, + "loss": 0.0178, "step": 222950 }, { - "epoch": 1.12, - "learning_rate": 0.00013127071655962583, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021330832778182439, + "loss": 0.0201, "step": 222960 }, { - "epoch": 1.12, - "learning_rate": 0.00013126314886661183, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021330443956545293, + "loss": 0.0148, "step": 222970 }, { - "epoch": 1.12, - "learning_rate": 0.00013125558117359782, - "loss": 0.0117, + "epoch": 0.58, + "learning_rate": 0.00021330055134908147, + "loss": 0.0187, "step": 222980 }, { - "epoch": 1.13, - "learning_rate": 0.0001312480134805838, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021329666313270998, + "loss": 0.0185, "step": 222990 }, { - "epoch": 1.13, - "learning_rate": 0.0001312404457875698, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021329277491633853, + "loss": 0.0171, "step": 223000 }, { - "epoch": 1.13, - "eval_cer": 0.9144547295651558, - "eval_loss": 0.006930416449904442, - "eval_runtime": 115.5739, - "eval_samples_per_second": 17.305, - "eval_steps_per_second": 4.326, + "epoch": 0.58, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.010963888838887215, + "eval_runtime": 107.1777, + "eval_samples_per_second": 18.661, + "eval_steps_per_second": 4.665, "step": 223000 }, { - "epoch": 1.13, - "learning_rate": 0.0001312328780945558, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021328888669996707, + "loss": 0.0147, "step": 223010 }, { - "epoch": 1.13, - "learning_rate": 0.00013122531040154177, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.0002132849984835956, + "loss": 0.0208, "step": 223020 }, { - "epoch": 1.13, - "learning_rate": 0.00013121774270852778, - "loss": 0.0107, + "epoch": 0.58, + "learning_rate": 0.00021328111026722412, + "loss": 0.014, "step": 223030 }, { - "epoch": 1.13, - "learning_rate": 0.00013121017501551376, - "loss": 0.0117, + "epoch": 0.58, + "learning_rate": 0.00021327722205085266, + "loss": 0.0171, "step": 223040 }, { - "epoch": 1.13, - "learning_rate": 0.00013120260732249974, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021327333383448118, + "loss": 0.021, "step": 223050 }, { - "epoch": 1.13, - "learning_rate": 0.00013119503962948575, - "loss": 0.0108, + "epoch": 0.58, + "learning_rate": 0.00021326944561810975, + "loss": 0.0131, "step": 223060 }, { - "epoch": 1.13, - "learning_rate": 0.00013118747193647173, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021326555740173826, + "loss": 0.0159, "step": 223070 }, { - "epoch": 1.13, - "learning_rate": 0.0001311799042434577, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.0002132616691853668, + "loss": 0.0185, "step": 223080 }, { - "epoch": 1.13, - "learning_rate": 0.00013117233655044372, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021325778096899532, + "loss": 0.0158, "step": 223090 }, { - "epoch": 1.13, - "learning_rate": 0.0001311647688574297, - "loss": 0.0115, + "epoch": 0.58, + "learning_rate": 0.0002132538927526239, + "loss": 0.0222, "step": 223100 }, { - "epoch": 1.13, - "learning_rate": 0.00013115720116441568, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021325000453625243, + "loss": 0.0224, "step": 223110 }, { - "epoch": 1.13, - "learning_rate": 0.00013114963347140166, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.00021324611631988094, + "loss": 0.0179, "step": 223120 }, { - "epoch": 1.13, - "learning_rate": 0.00013114206577838767, - "loss": 0.0116, + "epoch": 0.58, + "learning_rate": 0.00021324222810350946, + "loss": 0.0141, "step": 223130 }, { - "epoch": 1.13, - "learning_rate": 0.00013113449808537365, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021323833988713803, + "loss": 0.016, "step": 223140 }, { - "epoch": 1.13, - "learning_rate": 0.00013112693039235964, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021323445167076657, + "loss": 0.0198, "step": 223150 }, { - "epoch": 1.13, - "learning_rate": 0.00013111936269934564, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.00021323056345439508, + "loss": 0.0177, "step": 223160 }, { - "epoch": 1.13, - "learning_rate": 0.00013111179500633163, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021322667523802362, + "loss": 0.0139, "step": 223170 }, { - "epoch": 1.13, - "learning_rate": 0.0001311042273133176, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021322278702165217, + "loss": 0.0173, "step": 223180 }, { - "epoch": 1.13, - "learning_rate": 0.00013109665962030362, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002132188988052807, + "loss": 0.0158, "step": 223190 }, { - "epoch": 1.13, - "learning_rate": 0.0001310890919272896, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021321501058890922, + "loss": 0.0153, "step": 223200 }, { - "epoch": 1.13, - "learning_rate": 0.00013108152423427558, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021321112237253776, + "loss": 0.0159, "step": 223210 }, { - "epoch": 1.13, - "learning_rate": 0.0001310739565412616, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.0002132072341561663, + "loss": 0.0177, "step": 223220 }, { - "epoch": 1.13, - "learning_rate": 0.00013106638884824757, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021320334593979485, + "loss": 0.0174, "step": 223230 }, { - "epoch": 1.13, - "learning_rate": 0.00013105882115523355, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021319945772342336, + "loss": 0.0129, "step": 223240 }, { - "epoch": 1.13, - "learning_rate": 0.00013105125346221956, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.0002131955695070519, + "loss": 0.0144, "step": 223250 }, { - "epoch": 1.13, - "learning_rate": 0.00013104368576920554, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021319168129068047, + "loss": 0.0162, "step": 223260 }, { - "epoch": 1.13, - "learning_rate": 0.00013103611807619152, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.000213187793074309, + "loss": 0.0148, "step": 223270 }, { - "epoch": 1.13, - "learning_rate": 0.0001310285503831775, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021318390485793753, + "loss": 0.0146, "step": 223280 }, { - "epoch": 1.13, - "learning_rate": 0.0001310209826901635, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021318001664156604, + "loss": 0.015, "step": 223290 }, { - "epoch": 1.13, - "learning_rate": 0.0001310134149971495, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021317612842519456, + "loss": 0.0145, "step": 223300 }, { - "epoch": 1.13, - "learning_rate": 0.00013100584730413547, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.00021317224020882313, + "loss": 0.0185, "step": 223310 }, { - "epoch": 1.13, - "learning_rate": 0.00013099827961112148, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021316835199245167, + "loss": 0.0146, "step": 223320 }, { - "epoch": 1.13, - "learning_rate": 0.00013099071191810746, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021316446377608018, + "loss": 0.0161, "step": 223330 }, { - "epoch": 1.13, - "learning_rate": 0.00013098314422509345, - "loss": 0.0116, + "epoch": 0.58, + "learning_rate": 0.00021316057555970872, + "loss": 0.0136, "step": 223340 }, { - "epoch": 1.13, - "learning_rate": 0.00013097557653207945, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021315668734333727, + "loss": 0.0137, "step": 223350 }, { - "epoch": 1.13, - "learning_rate": 0.00013096800883906544, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.0002131527991269658, + "loss": 0.0146, "step": 223360 }, { - "epoch": 1.13, - "learning_rate": 0.00013096044114605142, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.00021314891091059432, + "loss": 0.0202, "step": 223370 }, { - "epoch": 1.13, - "learning_rate": 0.00013095287345303743, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021314502269422286, + "loss": 0.0123, "step": 223380 }, { - "epoch": 1.13, - "learning_rate": 0.0001309453057600234, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.0002131411344778514, + "loss": 0.0152, "step": 223390 }, { - "epoch": 1.13, - "learning_rate": 0.0001309377380670094, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021313724626147995, + "loss": 0.0165, "step": 223400 }, { - "epoch": 1.13, - "learning_rate": 0.0001309301703739954, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021313335804510846, + "loss": 0.0162, "step": 223410 }, { - "epoch": 1.13, - "learning_rate": 0.00013092260268098135, - "loss": 0.0126, + "epoch": 0.58, + "learning_rate": 0.000213129469828737, + "loss": 0.0163, "step": 223420 }, { - "epoch": 1.13, - "learning_rate": 0.00013091503498796736, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021312558161236557, + "loss": 0.0159, "step": 223430 }, { - "epoch": 1.13, - "learning_rate": 0.00013090746729495334, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.0002131216933959941, + "loss": 0.0183, "step": 223440 }, { - "epoch": 1.13, - "learning_rate": 0.00013089989960193932, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.0002131178051796226, + "loss": 0.0147, "step": 223450 }, { - "epoch": 1.13, - "learning_rate": 0.00013089233190892533, - "loss": 0.0126, + "epoch": 0.58, + "learning_rate": 0.00021311391696325114, + "loss": 0.0175, "step": 223460 }, { - "epoch": 1.13, - "learning_rate": 0.0001308847642159113, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.0002131100287468797, + "loss": 0.015, "step": 223470 }, { - "epoch": 1.13, - "learning_rate": 0.0001308771965228973, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021310614053050823, + "loss": 0.015, "step": 223480 }, { - "epoch": 1.13, - "learning_rate": 0.00013086962882988328, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021310225231413677, + "loss": 0.0163, "step": 223490 }, { - "epoch": 1.13, - "learning_rate": 0.00013086206113686928, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021309836409776528, + "loss": 0.0173, "step": 223500 }, { - "epoch": 1.13, - "learning_rate": 0.00013085449344385527, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021309447588139385, + "loss": 0.0168, "step": 223510 }, { - "epoch": 1.13, - "learning_rate": 0.00013084692575084125, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021309058766502237, + "loss": 0.0153, "step": 223520 }, { - "epoch": 1.13, - "learning_rate": 0.00013083935805782726, - "loss": 0.0125, + "epoch": 0.58, + "learning_rate": 0.0002130866994486509, + "loss": 0.0167, "step": 223530 }, { - "epoch": 1.13, - "learning_rate": 0.00013083179036481324, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021308281123227942, + "loss": 0.0187, "step": 223540 }, { - "epoch": 1.13, - "learning_rate": 0.00013082422267179922, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021307892301590796, + "loss": 0.0187, "step": 223550 }, { - "epoch": 1.13, - "learning_rate": 0.00013081665497878523, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.0002130750347995365, + "loss": 0.016, "step": 223560 }, { - "epoch": 1.13, - "learning_rate": 0.0001308090872857712, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021307114658316505, + "loss": 0.0182, "step": 223570 }, { - "epoch": 1.13, - "learning_rate": 0.0001308015195927572, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021306725836679356, + "loss": 0.0152, "step": 223580 }, { - "epoch": 1.13, - "learning_rate": 0.0001307939518997432, - "loss": 0.0146, + "epoch": 0.58, + "learning_rate": 0.0002130633701504221, + "loss": 0.0139, "step": 223590 }, { - "epoch": 1.13, - "learning_rate": 0.00013078638420672918, - "loss": 0.0137, + "epoch": 0.58, + "learning_rate": 0.00021305948193405064, + "loss": 0.0211, "step": 223600 }, { - "epoch": 1.13, - "learning_rate": 0.00013077881651371516, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021305559371767919, + "loss": 0.0184, "step": 223610 }, { - "epoch": 1.13, - "learning_rate": 0.00013077124882070117, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.0002130517055013077, + "loss": 0.0187, "step": 223620 }, { - "epoch": 1.13, - "learning_rate": 0.00013076368112768715, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021304781728493624, + "loss": 0.0157, "step": 223630 }, { - "epoch": 1.13, - "learning_rate": 0.00013075611343467313, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.0002130439290685648, + "loss": 0.0182, "step": 223640 }, { - "epoch": 1.13, - "learning_rate": 0.00013074854574165911, - "loss": 0.0117, + "epoch": 0.58, + "learning_rate": 0.00021304004085219333, + "loss": 0.0201, "step": 223650 }, { - "epoch": 1.13, - "learning_rate": 0.00013074097804864512, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021303615263582187, + "loss": 0.0188, "step": 223660 }, { - "epoch": 1.13, - "learning_rate": 0.0001307334103556311, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021303226441945038, + "loss": 0.0164, "step": 223670 }, { - "epoch": 1.13, - "learning_rate": 0.00013072584266261709, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021302837620307895, + "loss": 0.0165, "step": 223680 }, { - "epoch": 1.13, - "learning_rate": 0.0001307182749696031, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021302448798670746, + "loss": 0.0141, "step": 223690 }, { - "epoch": 1.13, - "learning_rate": 0.00013071070727658908, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.000213020599770336, + "loss": 0.0143, "step": 223700 }, { - "epoch": 1.13, - "learning_rate": 0.00013070313958357506, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021301671155396452, + "loss": 0.016, "step": 223710 }, { - "epoch": 1.13, - "learning_rate": 0.00013069557189056107, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.0002130128233375931, + "loss": 0.016, "step": 223720 }, { - "epoch": 1.13, - "learning_rate": 0.00013068800419754705, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.0002130089351212216, + "loss": 0.0143, "step": 223730 }, { - "epoch": 1.13, - "learning_rate": 0.00013068043650453303, - "loss": 0.0259, + "epoch": 0.58, + "learning_rate": 0.00021300504690485015, + "loss": 0.0119, "step": 223740 }, { - "epoch": 1.13, - "learning_rate": 0.00013067286881151904, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021300115868847866, + "loss": 0.0162, "step": 223750 }, { - "epoch": 1.13, - "learning_rate": 0.00013066530111850502, - "loss": 0.0127, + "epoch": 0.58, + "learning_rate": 0.00021299727047210723, + "loss": 0.0177, "step": 223760 }, { - "epoch": 1.13, - "learning_rate": 0.000130657733425491, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.00021299338225573574, + "loss": 0.0158, "step": 223770 }, { - "epoch": 1.13, - "learning_rate": 0.000130650165732477, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021298949403936429, + "loss": 0.0183, "step": 223780 }, { - "epoch": 1.13, - "learning_rate": 0.000130642598039463, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.0002129856058229928, + "loss": 0.0146, "step": 223790 }, { - "epoch": 1.13, - "learning_rate": 0.00013063503034644897, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021298171760662134, + "loss": 0.0179, "step": 223800 }, { - "epoch": 1.13, - "learning_rate": 0.00013062746265343498, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.0002129778293902499, + "loss": 0.015, "step": 223810 }, { - "epoch": 1.13, - "learning_rate": 0.00013061989496042096, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.00021297394117387842, + "loss": 0.0182, "step": 223820 }, { - "epoch": 1.13, - "learning_rate": 0.00013061232726740694, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021297005295750697, + "loss": 0.0155, "step": 223830 }, { - "epoch": 1.13, - "learning_rate": 0.00013060475957439292, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021296616474113548, + "loss": 0.0159, "step": 223840 }, { - "epoch": 1.13, - "learning_rate": 0.00013059719188137893, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021296227652476405, + "loss": 0.0145, "step": 223850 }, { - "epoch": 1.13, - "learning_rate": 0.00013058962418836491, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021295838830839256, + "loss": 0.0163, "step": 223860 }, { - "epoch": 1.13, - "learning_rate": 0.0001305820564953509, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.0002129545000920211, + "loss": 0.0135, "step": 223870 }, { - "epoch": 1.13, - "learning_rate": 0.0001305744888023369, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021295061187564962, + "loss": 0.0191, "step": 223880 }, { - "epoch": 1.13, - "learning_rate": 0.00013056692110932289, - "loss": 0.0071, + "epoch": 0.58, + "learning_rate": 0.0002129467236592782, + "loss": 0.0199, "step": 223890 }, { - "epoch": 1.13, - "learning_rate": 0.00013055935341630887, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.0002129428354429067, + "loss": 0.0164, "step": 223900 }, { - "epoch": 1.13, - "learning_rate": 0.00013055178572329488, - "loss": 0.007, + "epoch": 0.58, + "learning_rate": 0.00021293894722653525, + "loss": 0.0184, "step": 223910 }, { - "epoch": 1.13, - "learning_rate": 0.00013054421803028086, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021293505901016376, + "loss": 0.0166, "step": 223920 }, { - "epoch": 1.13, - "learning_rate": 0.00013053665033726684, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021293117079379233, + "loss": 0.0189, "step": 223930 }, { - "epoch": 1.13, - "learning_rate": 0.00013052908264425285, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021292728257742084, + "loss": 0.017, "step": 223940 }, { - "epoch": 1.13, - "learning_rate": 0.00013052151495123883, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021292339436104938, + "loss": 0.0172, "step": 223950 }, { - "epoch": 1.13, - "learning_rate": 0.0001305139472582248, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.0002129195061446779, + "loss": 0.0177, "step": 223960 }, { - "epoch": 1.13, - "learning_rate": 0.00013050637956521082, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021291561792830647, + "loss": 0.0165, "step": 223970 }, { - "epoch": 1.13, - "learning_rate": 0.0001304988118721968, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.000212911729711935, + "loss": 0.0172, "step": 223980 }, { - "epoch": 1.13, - "learning_rate": 0.00013049124417918278, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021290784149556352, + "loss": 0.0211, "step": 223990 }, { - "epoch": 1.13, - "learning_rate": 0.00013048367648616876, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021290395327919204, + "loss": 0.0137, "step": 224000 }, { - "epoch": 1.13, - "eval_cer": 0.9144683151109114, - "eval_loss": 0.007022760342806578, - "eval_runtime": 115.4845, - "eval_samples_per_second": 17.318, - "eval_steps_per_second": 4.33, + "epoch": 0.58, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.010993575677275658, + "eval_runtime": 107.4094, + "eval_samples_per_second": 18.62, + "eval_steps_per_second": 4.655, "step": 224000 }, { - "epoch": 1.13, - "learning_rate": 0.00013047610879315477, - "loss": 0.0131, + "epoch": 0.58, + "learning_rate": 0.0002129000650628206, + "loss": 0.0216, "step": 224010 }, { - "epoch": 1.13, - "learning_rate": 0.00013046854110014075, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021289617684644915, + "loss": 0.0132, "step": 224020 }, { - "epoch": 1.13, - "learning_rate": 0.00013046097340712673, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021289228863007766, + "loss": 0.0245, "step": 224030 }, { - "epoch": 1.13, - "learning_rate": 0.00013045340571411274, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.0002128884004137062, + "loss": 0.0217, "step": 224040 }, { - "epoch": 1.13, - "learning_rate": 0.0001304458380210987, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021288451219733472, + "loss": 0.0149, "step": 224050 }, { - "epoch": 1.13, - "learning_rate": 0.0001304382703280847, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.0002128806239809633, + "loss": 0.0179, "step": 224060 }, { - "epoch": 1.13, - "learning_rate": 0.0001304307026350707, - "loss": 0.0097, + "epoch": 0.58, + "learning_rate": 0.0002128767357645918, + "loss": 0.0162, "step": 224070 }, { - "epoch": 1.13, - "learning_rate": 0.00013042313494205667, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021287284754822034, + "loss": 0.0169, "step": 224080 }, { - "epoch": 1.13, - "learning_rate": 0.00013041556724904268, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021286895933184886, + "loss": 0.0115, "step": 224090 }, { - "epoch": 1.13, - "learning_rate": 0.00013040799955602866, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021286507111547743, + "loss": 0.015, "step": 224100 }, { - "epoch": 1.13, - "learning_rate": 0.00013040043186301464, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021286118289910594, + "loss": 0.0178, "step": 224110 }, { - "epoch": 1.13, - "learning_rate": 0.00013039286417000065, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021285729468273448, + "loss": 0.0186, "step": 224120 }, { - "epoch": 1.13, - "learning_rate": 0.00013038529647698663, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.000212853406466363, + "loss": 0.0169, "step": 224130 }, { - "epoch": 1.13, - "learning_rate": 0.0001303777287839726, - "loss": 0.0115, + "epoch": 0.58, + "learning_rate": 0.00021284951824999157, + "loss": 0.0132, "step": 224140 }, { - "epoch": 1.13, - "learning_rate": 0.00013037016109095862, - "loss": 0.013, + "epoch": 0.58, + "learning_rate": 0.0002128456300336201, + "loss": 0.0301, "step": 224150 }, { - "epoch": 1.13, - "learning_rate": 0.0001303625933979446, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021284174181724862, + "loss": 0.0339, "step": 224160 }, { - "epoch": 1.13, - "learning_rate": 0.00013035502570493058, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021283785360087714, + "loss": 0.0134, "step": 224170 }, { - "epoch": 1.13, - "learning_rate": 0.00013034745801191656, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.0002128339653845057, + "loss": 0.0199, "step": 224180 }, { - "epoch": 1.13, - "learning_rate": 0.00013033989031890257, - "loss": 0.0067, + "epoch": 0.58, + "learning_rate": 0.00021283007716813425, + "loss": 0.0174, "step": 224190 }, { - "epoch": 1.13, - "learning_rate": 0.00013033232262588855, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021282618895176276, + "loss": 0.015, "step": 224200 }, { - "epoch": 1.13, - "learning_rate": 0.00013032475493287454, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.0002128223007353913, + "loss": 0.0178, "step": 224210 }, { - "epoch": 1.13, - "learning_rate": 0.00013031718723986054, - "loss": 0.0095, + "epoch": 0.58, + "learning_rate": 0.00021281841251901985, + "loss": 0.0193, "step": 224220 }, { - "epoch": 1.13, - "learning_rate": 0.00013030961954684653, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002128145243026484, + "loss": 0.0225, "step": 224230 }, { - "epoch": 1.13, - "learning_rate": 0.0001303020518538325, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002128106360862769, + "loss": 0.0129, "step": 224240 }, { - "epoch": 1.13, - "learning_rate": 0.00013029448416081852, - "loss": 0.0074, + "epoch": 0.58, + "learning_rate": 0.00021280674786990544, + "loss": 0.0185, "step": 224250 }, { - "epoch": 1.13, - "learning_rate": 0.0001302869164678045, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021280285965353399, + "loss": 0.0165, "step": 224260 }, { - "epoch": 1.13, - "learning_rate": 0.00013027934877479048, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021279897143716253, + "loss": 0.017, "step": 224270 }, { - "epoch": 1.13, - "learning_rate": 0.0001302717810817765, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021279508322079104, + "loss": 0.018, "step": 224280 }, { - "epoch": 1.13, - "learning_rate": 0.00013026421338876247, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.00021279119500441958, + "loss": 0.0162, "step": 224290 }, { - "epoch": 1.13, - "learning_rate": 0.00013025664569574845, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.0002127873067880481, + "loss": 0.0185, "step": 224300 }, { - "epoch": 1.13, - "learning_rate": 0.00013024907800273446, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021278341857167667, + "loss": 0.0153, "step": 224310 }, { - "epoch": 1.13, - "learning_rate": 0.00013024151030972044, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021277953035530518, + "loss": 0.017, "step": 224320 }, { - "epoch": 1.13, - "learning_rate": 0.00013023394261670642, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021277564213893372, + "loss": 0.016, "step": 224330 }, { - "epoch": 1.13, - "learning_rate": 0.00013022637492369243, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021277175392256224, + "loss": 0.0189, "step": 224340 }, { - "epoch": 1.13, - "learning_rate": 0.0001302188072306784, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.0002127678657061908, + "loss": 0.0153, "step": 224350 }, { - "epoch": 1.13, - "learning_rate": 0.0001302112395376644, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021276397748981935, + "loss": 0.015, "step": 224360 }, { - "epoch": 1.13, - "learning_rate": 0.00013020367184465037, - "loss": 0.0117, + "epoch": 0.58, + "learning_rate": 0.00021276008927344786, + "loss": 0.0184, "step": 224370 }, { - "epoch": 1.13, - "learning_rate": 0.00013019610415163638, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.0002127562010570764, + "loss": 0.0187, "step": 224380 }, { - "epoch": 1.13, - "learning_rate": 0.00013018853645862236, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021275231284070495, + "loss": 0.0154, "step": 224390 }, { - "epoch": 1.13, - "learning_rate": 0.00013018096876560835, - "loss": 0.013, + "epoch": 0.58, + "learning_rate": 0.0002127484246243335, + "loss": 0.0143, "step": 224400 }, { - "epoch": 1.13, - "learning_rate": 0.00013017340107259435, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.000212744536407962, + "loss": 0.0148, "step": 224410 }, { - "epoch": 1.13, - "learning_rate": 0.00013016583337958034, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021274064819159054, + "loss": 0.0175, "step": 224420 }, { - "epoch": 1.13, - "learning_rate": 0.00013015826568656632, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021273675997521909, + "loss": 0.0159, "step": 224430 }, { - "epoch": 1.13, - "learning_rate": 0.00013015069799355233, - "loss": 0.0102, + "epoch": 0.58, + "learning_rate": 0.00021273287175884763, + "loss": 0.0152, "step": 224440 }, { - "epoch": 1.13, - "learning_rate": 0.0001301431303005383, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.00021272898354247614, + "loss": 0.0177, "step": 224450 }, { - "epoch": 1.13, - "learning_rate": 0.0001301355626075243, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021272509532610468, + "loss": 0.0158, "step": 224460 }, { - "epoch": 1.13, - "learning_rate": 0.0001301279949145103, - "loss": 0.0104, + "epoch": 0.58, + "learning_rate": 0.00021272120710973322, + "loss": 0.018, "step": 224470 }, { - "epoch": 1.13, - "learning_rate": 0.00013012042722149628, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021271731889336177, + "loss": 0.0203, "step": 224480 }, { - "epoch": 1.13, - "learning_rate": 0.00013011285952848226, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021271343067699028, + "loss": 0.0161, "step": 224490 }, { - "epoch": 1.13, - "learning_rate": 0.00013010529183546827, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021270954246061882, + "loss": 0.0172, "step": 224500 }, { - "epoch": 1.13, - "learning_rate": 0.00013009772414245425, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.0002127056542442474, + "loss": 0.0172, "step": 224510 }, { - "epoch": 1.13, - "learning_rate": 0.00013009015644944023, - "loss": 0.0078, + "epoch": 0.58, + "learning_rate": 0.0002127017660278759, + "loss": 0.0144, "step": 224520 }, { - "epoch": 1.13, - "learning_rate": 0.0001300825887564262, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021269787781150445, + "loss": 0.0196, "step": 224530 }, { - "epoch": 1.13, - "learning_rate": 0.00013007502106341222, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021269398959513296, + "loss": 0.0168, "step": 224540 }, { - "epoch": 1.13, - "learning_rate": 0.0001300674533703982, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.0002126901013787615, + "loss": 0.0185, "step": 224550 }, { - "epoch": 1.13, - "learning_rate": 0.00013005988567738418, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.00021268621316239005, + "loss": 0.0213, "step": 224560 }, { - "epoch": 1.13, - "learning_rate": 0.0001300523179843702, - "loss": 0.0106, + "epoch": 0.58, + "learning_rate": 0.0002126823249460186, + "loss": 0.018, "step": 224570 }, { - "epoch": 1.13, - "learning_rate": 0.00013004475029135617, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002126784367296471, + "loss": 0.0142, "step": 224580 }, { - "epoch": 1.13, - "learning_rate": 0.00013003718259834216, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021267454851327564, + "loss": 0.0172, "step": 224590 }, { - "epoch": 1.13, - "learning_rate": 0.00013002961490532816, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021267066029690418, + "loss": 0.014, "step": 224600 }, { - "epoch": 1.13, - "learning_rate": 0.00013002204721231415, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021266677208053273, + "loss": 0.0158, "step": 224610 }, { - "epoch": 1.13, - "learning_rate": 0.00013001447951930013, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021266288386416124, + "loss": 0.0144, "step": 224620 }, { - "epoch": 1.13, - "learning_rate": 0.00013000691182628614, - "loss": 0.0067, + "epoch": 0.58, + "learning_rate": 0.00021265899564778978, + "loss": 0.0166, "step": 224630 }, { - "epoch": 1.13, - "learning_rate": 0.00012999934413327212, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021265510743141832, + "loss": 0.0169, "step": 224640 }, { - "epoch": 1.13, - "learning_rate": 0.0001299917764402581, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021265121921504687, + "loss": 0.0169, "step": 224650 }, { - "epoch": 1.13, - "learning_rate": 0.0001299842087472441, - "loss": 0.0113, + "epoch": 0.58, + "learning_rate": 0.00021264733099867538, + "loss": 0.0165, "step": 224660 }, { - "epoch": 1.13, - "learning_rate": 0.00012997664105423006, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021264344278230392, + "loss": 0.0176, "step": 224670 }, { - "epoch": 1.13, - "learning_rate": 0.00012996907336121607, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002126395545659325, + "loss": 0.0154, "step": 224680 }, { - "epoch": 1.13, - "learning_rate": 0.00012996150566820205, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.000212635666349561, + "loss": 0.0128, "step": 224690 }, { - "epoch": 1.13, - "learning_rate": 0.00012995393797518803, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021263177813318955, + "loss": 0.0151, "step": 224700 }, { - "epoch": 1.13, - "learning_rate": 0.00012994637028217404, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021262788991681806, + "loss": 0.0154, "step": 224710 }, { - "epoch": 1.13, - "learning_rate": 0.00012993880258916002, - "loss": 0.0115, + "epoch": 0.58, + "learning_rate": 0.00021262400170044663, + "loss": 0.0186, "step": 224720 }, { - "epoch": 1.13, - "learning_rate": 0.000129931234896146, - "loss": 0.0072, + "epoch": 0.58, + "learning_rate": 0.00021262011348407514, + "loss": 0.0136, "step": 224730 }, { - "epoch": 1.13, - "learning_rate": 0.00012992366720313199, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021261622526770369, + "loss": 0.016, "step": 224740 }, { - "epoch": 1.13, - "learning_rate": 0.000129916099510118, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.0002126123370513322, + "loss": 0.0178, "step": 224750 }, { - "epoch": 1.13, - "learning_rate": 0.00012990853181710398, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021260844883496077, + "loss": 0.0132, "step": 224760 }, { - "epoch": 1.13, - "learning_rate": 0.00012990096412408996, - "loss": 0.0114, + "epoch": 0.58, + "learning_rate": 0.00021260456061858928, + "loss": 0.0128, "step": 224770 }, { - "epoch": 1.13, - "learning_rate": 0.00012989339643107597, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021260067240221783, + "loss": 0.0171, "step": 224780 }, { - "epoch": 1.13, - "learning_rate": 0.00012988582873806195, - "loss": 0.007, + "epoch": 0.58, + "learning_rate": 0.00021259678418584634, + "loss": 0.0142, "step": 224790 }, { - "epoch": 1.13, - "learning_rate": 0.00012987826104504793, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021259289596947488, + "loss": 0.0143, "step": 224800 }, { - "epoch": 1.13, - "learning_rate": 0.00012987069335203394, - "loss": 0.0068, + "epoch": 0.58, + "learning_rate": 0.00021258900775310342, + "loss": 0.0144, "step": 224810 }, { - "epoch": 1.13, - "learning_rate": 0.00012986312565901992, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021258511953673197, + "loss": 0.016, "step": 224820 }, { - "epoch": 1.13, - "learning_rate": 0.0001298555579660059, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021258123132036048, + "loss": 0.0147, "step": 224830 }, { - "epoch": 1.13, - "learning_rate": 0.0001298479902729919, - "loss": 0.0108, + "epoch": 0.58, + "learning_rate": 0.00021257734310398902, + "loss": 0.0138, "step": 224840 }, { - "epoch": 1.13, - "learning_rate": 0.0001298404225799779, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002125734548876176, + "loss": 0.0187, "step": 224850 }, { - "epoch": 1.13, - "learning_rate": 0.00012983285488696387, - "loss": 0.0129, + "epoch": 0.58, + "learning_rate": 0.0002125695666712461, + "loss": 0.0173, "step": 224860 }, { - "epoch": 1.13, - "learning_rate": 0.00012982528719394988, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021256567845487465, + "loss": 0.0188, "step": 224870 }, { - "epoch": 1.13, - "learning_rate": 0.00012981771950093586, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021256179023850316, + "loss": 0.0164, "step": 224880 }, { - "epoch": 1.13, - "learning_rate": 0.00012981015180792184, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021255790202213173, + "loss": 0.0108, "step": 224890 }, { - "epoch": 1.13, - "learning_rate": 0.00012980258411490782, - "loss": 0.0103, + "epoch": 0.58, + "learning_rate": 0.00021255401380576024, + "loss": 0.0145, "step": 224900 }, { - "epoch": 1.13, - "learning_rate": 0.00012979501642189383, - "loss": 0.0129, + "epoch": 0.58, + "learning_rate": 0.00021255012558938879, + "loss": 0.0195, "step": 224910 }, { - "epoch": 1.13, - "learning_rate": 0.00012978744872887981, - "loss": 0.0069, + "epoch": 0.58, + "learning_rate": 0.0002125462373730173, + "loss": 0.0159, "step": 224920 }, { - "epoch": 1.13, - "learning_rate": 0.0001297798810358658, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021254234915664587, + "loss": 0.016, "step": 224930 }, { - "epoch": 1.13, - "learning_rate": 0.0001297723133428518, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021253846094027438, + "loss": 0.0192, "step": 224940 }, { - "epoch": 1.13, - "learning_rate": 0.00012976474564983779, - "loss": 0.0154, + "epoch": 0.58, + "learning_rate": 0.00021253457272390293, + "loss": 0.017, "step": 224950 }, { - "epoch": 1.13, - "learning_rate": 0.00012975717795682377, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.00021253068450753144, + "loss": 0.0178, "step": 224960 }, { - "epoch": 1.13, - "learning_rate": 0.00012974961026380978, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.00021252679629116, + "loss": 0.0191, "step": 224970 }, { - "epoch": 1.14, - "learning_rate": 0.00012974204257079576, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.00021252290807478852, + "loss": 0.0184, "step": 224980 }, { - "epoch": 1.14, - "learning_rate": 0.00012973447487778174, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021251901985841706, + "loss": 0.0144, "step": 224990 }, { - "epoch": 1.14, - "learning_rate": 0.00012972690718476775, - "loss": 0.0074, + "epoch": 0.58, + "learning_rate": 0.00021251513164204558, + "loss": 0.0136, "step": 225000 }, { - "epoch": 1.14, - "eval_cer": 0.9144644335264098, - "eval_loss": 0.007108866702765226, - "eval_runtime": 116.0265, - "eval_samples_per_second": 17.237, - "eval_steps_per_second": 4.309, + "epoch": 0.58, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.01163857989013195, + "eval_runtime": 107.3494, + "eval_samples_per_second": 18.631, + "eval_steps_per_second": 4.658, "step": 225000 }, { - "epoch": 1.14, - "learning_rate": 0.00012971933949175373, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021251124342567415, + "loss": 0.0174, "step": 225010 }, { - "epoch": 1.14, - "learning_rate": 0.0001297117717987397, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.0002125073552093027, + "loss": 0.0186, "step": 225020 }, { - "epoch": 1.14, - "learning_rate": 0.00012970420410572572, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002125034669929312, + "loss": 0.0146, "step": 225030 }, { - "epoch": 1.14, - "learning_rate": 0.0001296966364127117, - "loss": 0.0085, + "epoch": 0.58, + "learning_rate": 0.00021249957877655972, + "loss": 0.0133, "step": 225040 }, { - "epoch": 1.14, - "learning_rate": 0.00012968906871969768, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021249569056018826, + "loss": 0.0163, "step": 225050 }, { - "epoch": 1.14, - "learning_rate": 0.00012968150102668366, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021249180234381683, + "loss": 0.0183, "step": 225060 }, { - "epoch": 1.14, - "learning_rate": 0.00012967393333366967, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021248791412744534, + "loss": 0.0141, "step": 225070 }, { - "epoch": 1.14, - "learning_rate": 0.00012966636564065565, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021248402591107389, + "loss": 0.0192, "step": 225080 }, { - "epoch": 1.14, - "learning_rate": 0.00012965879794764163, - "loss": 0.0076, + "epoch": 0.58, + "learning_rate": 0.0002124801376947024, + "loss": 0.0142, "step": 225090 }, { - "epoch": 1.14, - "learning_rate": 0.00012965123025462764, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021247624947833097, + "loss": 0.0186, "step": 225100 }, { - "epoch": 1.14, - "learning_rate": 0.00012964366256161362, - "loss": 0.0099, + "epoch": 0.58, + "learning_rate": 0.00021247236126195948, + "loss": 0.0144, "step": 225110 }, { - "epoch": 1.14, - "learning_rate": 0.0001296360948685996, - "loss": 0.0135, + "epoch": 0.58, + "learning_rate": 0.00021246847304558802, + "loss": 0.0191, "step": 225120 }, { - "epoch": 1.14, - "learning_rate": 0.00012962852717558561, - "loss": 0.012, + "epoch": 0.58, + "learning_rate": 0.00021246458482921654, + "loss": 0.0245, "step": 225130 }, { - "epoch": 1.14, - "learning_rate": 0.0001296209594825716, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.0002124606966128451, + "loss": 0.0208, "step": 225140 }, { - "epoch": 1.14, - "learning_rate": 0.00012961339178955758, - "loss": 0.0111, + "epoch": 0.58, + "learning_rate": 0.00021245680839647362, + "loss": 0.0188, "step": 225150 }, { - "epoch": 1.14, - "learning_rate": 0.00012960582409654359, - "loss": 0.0098, + "epoch": 0.58, + "learning_rate": 0.00021245292018010216, + "loss": 0.0157, "step": 225160 }, { - "epoch": 1.14, - "learning_rate": 0.00012959825640352957, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021244903196373068, + "loss": 0.0217, "step": 225170 }, { - "epoch": 1.14, - "learning_rate": 0.00012959068871051555, - "loss": 0.0087, + "epoch": 0.58, + "learning_rate": 0.00021244514374735925, + "loss": 0.0142, "step": 225180 }, { - "epoch": 1.14, - "learning_rate": 0.00012958312101750156, - "loss": 0.0121, + "epoch": 0.58, + "learning_rate": 0.00021244125553098776, + "loss": 0.0177, "step": 225190 }, { - "epoch": 1.14, - "learning_rate": 0.00012957555332448754, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.0002124373673146163, + "loss": 0.0191, "step": 225200 }, { - "epoch": 1.14, - "learning_rate": 0.00012956798563147352, - "loss": 0.0115, + "epoch": 0.58, + "learning_rate": 0.00021243347909824482, + "loss": 0.0201, "step": 225210 }, { - "epoch": 1.14, - "learning_rate": 0.0001295604179384595, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.0002124295908818734, + "loss": 0.0134, "step": 225220 }, { - "epoch": 1.14, - "learning_rate": 0.0001295528502454455, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.00021242570266550193, + "loss": 0.0142, "step": 225230 }, { - "epoch": 1.14, - "learning_rate": 0.0001295452825524315, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021242181444913044, + "loss": 0.0158, "step": 225240 }, { - "epoch": 1.14, - "learning_rate": 0.00012953771485941747, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021241792623275898, + "loss": 0.018, "step": 225250 }, { - "epoch": 1.14, - "learning_rate": 0.00012953014716640348, - "loss": 0.008, + "epoch": 0.58, + "learning_rate": 0.00021241403801638753, + "loss": 0.0182, "step": 225260 }, { - "epoch": 1.14, - "learning_rate": 0.00012952257947338946, - "loss": 0.0093, + "epoch": 0.58, + "learning_rate": 0.00021241014980001607, + "loss": 0.0146, "step": 225270 }, { - "epoch": 1.14, - "learning_rate": 0.00012951501178037544, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021240626158364458, + "loss": 0.0174, "step": 225280 }, { - "epoch": 1.14, - "learning_rate": 0.00012950744408736145, - "loss": 0.0122, + "epoch": 0.58, + "learning_rate": 0.00021240237336727312, + "loss": 0.0163, "step": 225290 }, { - "epoch": 1.14, - "learning_rate": 0.0001294998763943474, - "loss": 0.01, + "epoch": 0.58, + "learning_rate": 0.00021239848515090164, + "loss": 0.0137, "step": 225300 }, { - "epoch": 1.14, - "learning_rate": 0.00012949230870133342, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.0002123945969345302, + "loss": 0.0152, "step": 225310 }, { - "epoch": 1.14, - "learning_rate": 0.0001294847410083194, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021239070871815872, + "loss": 0.0132, "step": 225320 }, { - "epoch": 1.14, - "learning_rate": 0.00012947717331530538, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021238682050178726, + "loss": 0.0157, "step": 225330 }, { - "epoch": 1.14, - "learning_rate": 0.0001294696056222914, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021238293228541578, + "loss": 0.0182, "step": 225340 }, { - "epoch": 1.14, - "learning_rate": 0.00012946203792927737, - "loss": 0.0116, + "epoch": 0.58, + "learning_rate": 0.00021237904406904435, + "loss": 0.0158, "step": 225350 }, { - "epoch": 1.14, - "learning_rate": 0.00012945447023626335, - "loss": 0.0079, + "epoch": 0.58, + "learning_rate": 0.00021237515585267286, + "loss": 0.02, "step": 225360 }, { - "epoch": 1.14, - "learning_rate": 0.00012944690254324936, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.0002123712676363014, + "loss": 0.0197, "step": 225370 }, { - "epoch": 1.14, - "learning_rate": 0.00012943933485023534, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021236737941992992, + "loss": 0.0157, "step": 225380 }, { - "epoch": 1.14, - "learning_rate": 0.00012943176715722132, - "loss": 0.0096, + "epoch": 0.58, + "learning_rate": 0.00021236349120355849, + "loss": 0.0176, "step": 225390 }, { - "epoch": 1.14, - "learning_rate": 0.00012942419946420733, - "loss": 0.0118, + "epoch": 0.58, + "learning_rate": 0.00021235960298718703, + "loss": 0.0125, "step": 225400 }, { - "epoch": 1.14, - "learning_rate": 0.0001294166317711933, - "loss": 0.0089, + "epoch": 0.58, + "learning_rate": 0.00021235571477081554, + "loss": 0.0177, "step": 225410 }, { - "epoch": 1.14, - "learning_rate": 0.0001294090640781793, - "loss": 0.0092, + "epoch": 0.58, + "learning_rate": 0.00021235182655444408, + "loss": 0.0259, "step": 225420 }, { - "epoch": 1.14, - "learning_rate": 0.00012940149638516527, - "loss": 0.009, + "epoch": 0.58, + "learning_rate": 0.00021234793833807263, + "loss": 0.0169, "step": 225430 }, { - "epoch": 1.14, - "learning_rate": 0.00012939392869215128, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021234405012170117, + "loss": 0.0159, "step": 225440 }, { - "epoch": 1.14, - "learning_rate": 0.00012938636099913726, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021234016190532968, + "loss": 0.0211, "step": 225450 }, { - "epoch": 1.14, - "learning_rate": 0.00012937879330612325, - "loss": 0.0091, + "epoch": 0.58, + "learning_rate": 0.00021233627368895822, + "loss": 0.0155, "step": 225460 }, { - "epoch": 1.14, - "learning_rate": 0.00012937122561310925, - "loss": 0.0101, + "epoch": 0.58, + "learning_rate": 0.00021233238547258677, + "loss": 0.0168, "step": 225470 }, { - "epoch": 1.14, - "learning_rate": 0.00012936365792009524, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.0002123284972562153, + "loss": 0.0185, "step": 225480 }, { - "epoch": 1.14, - "learning_rate": 0.00012935609022708122, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021232460903984382, + "loss": 0.0141, "step": 225490 }, { - "epoch": 1.14, - "learning_rate": 0.00012934852253406723, - "loss": 0.0105, + "epoch": 0.58, + "learning_rate": 0.00021232072082347236, + "loss": 0.0177, "step": 225500 }, { - "epoch": 1.14, - "learning_rate": 0.0001293409548410532, - "loss": 0.0084, + "epoch": 0.58, + "learning_rate": 0.0002123168326071009, + "loss": 0.0213, "step": 225510 }, { - "epoch": 1.14, - "learning_rate": 0.0001293333871480392, - "loss": 0.0075, + "epoch": 0.58, + "learning_rate": 0.00021231294439072945, + "loss": 0.0155, "step": 225520 }, { - "epoch": 1.14, - "learning_rate": 0.0001293258194550252, - "loss": 0.0081, + "epoch": 0.58, + "learning_rate": 0.00021230905617435796, + "loss": 0.0163, "step": 225530 }, { - "epoch": 1.14, - "learning_rate": 0.00012931825176201118, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.0002123051679579865, + "loss": 0.02, "step": 225540 }, { - "epoch": 1.14, - "learning_rate": 0.00012931068406899716, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021230127974161502, + "loss": 0.0153, "step": 225550 }, { - "epoch": 1.14, - "learning_rate": 0.00012930311637598317, - "loss": 0.0153, + "epoch": 0.58, + "learning_rate": 0.00021229739152524359, + "loss": 0.0141, "step": 225560 }, { - "epoch": 1.14, - "learning_rate": 0.00012929554868296915, - "loss": 0.0082, + "epoch": 0.58, + "learning_rate": 0.00021229350330887213, + "loss": 0.0188, "step": 225570 }, { - "epoch": 1.14, - "learning_rate": 0.00012928798098995513, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021228961509250064, + "loss": 0.0148, "step": 225580 }, { - "epoch": 1.14, - "learning_rate": 0.0001292804132969411, - "loss": 0.0088, + "epoch": 0.58, + "learning_rate": 0.00021228572687612916, + "loss": 0.0134, "step": 225590 }, { - "epoch": 1.14, - "learning_rate": 0.00012927284560392712, - "loss": 0.0086, + "epoch": 0.58, + "learning_rate": 0.00021228183865975773, + "loss": 0.0157, "step": 225600 }, { - "epoch": 1.14, - "learning_rate": 0.0001292652779109131, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021227795044338627, + "loss": 0.0128, "step": 225610 }, { - "epoch": 1.14, - "learning_rate": 0.00012925771021789908, - "loss": 0.0094, + "epoch": 0.58, + "learning_rate": 0.00021227406222701478, + "loss": 0.0149, "step": 225620 }, { - "epoch": 1.14, - "learning_rate": 0.0001292501425248851, - "loss": 0.0077, + "epoch": 0.58, + "learning_rate": 0.00021227017401064332, + "loss": 0.0149, "step": 225630 }, { - "epoch": 1.14, - "learning_rate": 0.00012924257483187107, - "loss": 0.0112, + "epoch": 0.58, + "learning_rate": 0.00021226628579427186, + "loss": 0.0173, "step": 225640 }, { - "epoch": 1.14, - "learning_rate": 0.00012923500713885706, - "loss": 0.0068, + "epoch": 0.58, + "learning_rate": 0.0002122623975779004, + "loss": 0.0148, "step": 225650 }, { - "epoch": 1.14, - "learning_rate": 0.00012922743944584306, - "loss": 0.0075, + "epoch": 0.58, + "learning_rate": 0.00021225850936152892, + "loss": 0.0156, "step": 225660 }, { - "epoch": 1.14, - "learning_rate": 0.00012921987175282905, - "loss": 0.0083, + "epoch": 0.58, + "learning_rate": 0.00021225462114515746, + "loss": 0.0163, "step": 225670 }, { - "epoch": 1.14, - "learning_rate": 0.00012921230405981503, - "loss": 0.011, + "epoch": 0.58, + "learning_rate": 0.000212250732928786, + "loss": 0.0151, "step": 225680 }, { - "epoch": 1.14, - "learning_rate": 0.00012920473636680104, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021224684471241455, + "loss": 0.0168, "step": 225690 }, { - "epoch": 1.14, - "learning_rate": 0.00012919716867378702, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021224295649604306, + "loss": 0.0145, "step": 225700 }, { - "epoch": 1.14, - "learning_rate": 0.000129189600980773, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002122390682796716, + "loss": 0.0178, "step": 225710 }, { - "epoch": 1.14, - "learning_rate": 0.000129182033287759, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021223518006330017, + "loss": 0.0193, "step": 225720 }, { - "epoch": 1.14, - "learning_rate": 0.000129174465594745, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021223129184692869, + "loss": 0.0142, "step": 225730 }, { - "epoch": 1.14, - "learning_rate": 0.00012916689790173097, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021222740363055723, + "loss": 0.0184, "step": 225740 }, { - "epoch": 1.14, - "learning_rate": 0.00012915933020871698, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021222351541418574, + "loss": 0.0163, "step": 225750 }, { - "epoch": 1.14, - "learning_rate": 0.00012915176251570296, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.0002122196271978143, + "loss": 0.0126, "step": 225760 }, { - "epoch": 1.14, - "learning_rate": 0.00012914419482268894, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021221573898144282, + "loss": 0.0142, "step": 225770 }, { - "epoch": 1.14, - "learning_rate": 0.00012913662712967492, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021221185076507137, + "loss": 0.0192, "step": 225780 }, { - "epoch": 1.14, - "learning_rate": 0.00012912905943666093, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021220796254869988, + "loss": 0.018, "step": 225790 }, { - "epoch": 1.14, - "learning_rate": 0.0001291214917436469, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021220407433232842, + "loss": 0.0152, "step": 225800 }, { - "epoch": 1.14, - "learning_rate": 0.0001291139240506329, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021220018611595696, + "loss": 0.0168, "step": 225810 }, { - "epoch": 1.14, - "learning_rate": 0.0001291063563576189, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.0002121962978995855, + "loss": 0.0182, "step": 225820 }, { - "epoch": 1.14, - "learning_rate": 0.00012909878866460488, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021219240968321402, + "loss": 0.0179, "step": 225830 }, { - "epoch": 1.14, - "learning_rate": 0.00012909122097159087, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021218852146684256, + "loss": 0.0142, "step": 225840 }, { - "epoch": 1.14, - "learning_rate": 0.00012908365327857687, - "loss": 0.0072, + "epoch": 0.59, + "learning_rate": 0.0002121846332504711, + "loss": 0.0151, "step": 225850 }, { - "epoch": 1.14, - "learning_rate": 0.00012907608558556286, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021218074503409965, + "loss": 0.0146, "step": 225860 }, { - "epoch": 1.14, - "learning_rate": 0.00012906851789254884, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021217685681772816, + "loss": 0.0197, "step": 225870 }, { - "epoch": 1.14, - "learning_rate": 0.00012906095019953485, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.0002121729686013567, + "loss": 0.0161, "step": 225880 }, { - "epoch": 1.14, - "learning_rate": 0.00012905338250652083, - "loss": 0.0067, + "epoch": 0.59, + "learning_rate": 0.00021216908038498527, + "loss": 0.0204, "step": 225890 }, { - "epoch": 1.14, - "learning_rate": 0.0001290458148135068, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021216519216861378, + "loss": 0.0177, "step": 225900 }, { - "epoch": 1.14, - "learning_rate": 0.00012903824712049282, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.0002121613039522423, + "loss": 0.015, "step": 225910 }, { - "epoch": 1.14, - "learning_rate": 0.0001290306794274788, - "loss": 0.0108, + "epoch": 0.59, + "learning_rate": 0.00021215741573587084, + "loss": 0.0241, "step": 225920 }, { - "epoch": 1.14, - "learning_rate": 0.00012902311173446478, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.0002121535275194994, + "loss": 0.0239, "step": 225930 }, { - "epoch": 1.14, - "learning_rate": 0.00012901554404145076, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021214963930312792, + "loss": 0.0159, "step": 225940 }, { - "epoch": 1.14, - "learning_rate": 0.00012900797634843674, - "loss": 0.0117, + "epoch": 0.59, + "learning_rate": 0.00021214575108675647, + "loss": 0.0156, "step": 225950 }, { - "epoch": 1.14, - "learning_rate": 0.00012900040865542272, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021214186287038498, + "loss": 0.012, "step": 225960 }, { - "epoch": 1.14, - "learning_rate": 0.00012899284096240873, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021213797465401355, + "loss": 0.0237, "step": 225970 }, { - "epoch": 1.14, - "learning_rate": 0.00012898527326939471, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021213408643764206, + "loss": 0.0188, "step": 225980 }, { - "epoch": 1.14, - "learning_rate": 0.0001289777055763807, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.0002121301982212706, + "loss": 0.0184, "step": 225990 }, { - "epoch": 1.14, - "learning_rate": 0.0001289701378833667, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021212631000489912, + "loss": 0.0158, "step": 226000 }, { - "epoch": 1.14, - "eval_cer": 0.9144498775845288, - "eval_loss": 0.007178218103945255, - "eval_runtime": 116.0384, - "eval_samples_per_second": 17.236, - "eval_steps_per_second": 4.309, + "epoch": 0.59, + "eval_cer": 0.881821655462573, + "eval_loss": 0.01118859276175499, + "eval_runtime": 107.4296, + "eval_samples_per_second": 18.617, + "eval_steps_per_second": 4.654, "step": 226000 }, { - "epoch": 1.14, - "learning_rate": 0.00012896257019035269, - "loss": 0.006, + "epoch": 0.59, + "learning_rate": 0.0002121224217885277, + "loss": 0.0214, "step": 226010 }, { - "epoch": 1.14, - "learning_rate": 0.00012895500249733867, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002121185335721562, + "loss": 0.0145, "step": 226020 }, { - "epoch": 1.14, - "learning_rate": 0.00012894743480432468, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021211464535578474, + "loss": 0.0178, "step": 226030 }, { - "epoch": 1.14, - "learning_rate": 0.00012893986711131066, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021211075713941326, + "loss": 0.0156, "step": 226040 }, { - "epoch": 1.14, - "learning_rate": 0.00012893229941829664, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.0002121068689230418, + "loss": 0.013, "step": 226050 }, { - "epoch": 1.14, - "learning_rate": 0.00012892473172528265, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021210298070667034, + "loss": 0.0163, "step": 226060 }, { - "epoch": 1.14, - "learning_rate": 0.00012891716403226863, - "loss": 0.0116, + "epoch": 0.59, + "learning_rate": 0.00021209909249029888, + "loss": 0.0157, "step": 226070 }, { - "epoch": 1.14, - "learning_rate": 0.0001289095963392546, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.0002120952042739274, + "loss": 0.0165, "step": 226080 }, { - "epoch": 1.14, - "learning_rate": 0.00012890202864624062, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021209131605755594, + "loss": 0.0164, "step": 226090 }, { - "epoch": 1.14, - "learning_rate": 0.0001288944609532266, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002120874278411845, + "loss": 0.0149, "step": 226100 }, { - "epoch": 1.14, - "learning_rate": 0.00012888689326021258, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021208353962481302, + "loss": 0.0149, "step": 226110 }, { - "epoch": 1.14, - "learning_rate": 0.00012887932556719856, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021207965140844156, + "loss": 0.0157, "step": 226120 }, { - "epoch": 1.14, - "learning_rate": 0.00012887175787418457, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021207576319207008, + "loss": 0.0134, "step": 226130 }, { - "epoch": 1.14, - "learning_rate": 0.00012886419018117055, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021207187497569865, + "loss": 0.014, "step": 226140 }, { - "epoch": 1.14, - "learning_rate": 0.00012885662248815654, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021206798675932716, + "loss": 0.0178, "step": 226150 }, { - "epoch": 1.14, - "learning_rate": 0.00012884905479514254, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002120640985429557, + "loss": 0.0214, "step": 226160 }, { - "epoch": 1.14, - "learning_rate": 0.00012884148710212853, - "loss": 0.0134, + "epoch": 0.59, + "learning_rate": 0.00021206021032658422, + "loss": 0.0141, "step": 226170 }, { - "epoch": 1.14, - "learning_rate": 0.0001288339194091145, - "loss": 0.007, + "epoch": 0.59, + "learning_rate": 0.0002120563221102128, + "loss": 0.014, "step": 226180 }, { - "epoch": 1.14, - "learning_rate": 0.00012882635171610052, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.0002120524338938413, + "loss": 0.0198, "step": 226190 }, { - "epoch": 1.14, - "learning_rate": 0.0001288187840230865, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021204854567746984, + "loss": 0.0176, "step": 226200 }, { - "epoch": 1.14, - "learning_rate": 0.00012881121633007248, - "loss": 0.009, - "step": 226210 + "epoch": 0.59, + "learning_rate": 0.00021204465746109836, + "loss": 0.0181, + "step": 226210 }, { - "epoch": 1.14, - "learning_rate": 0.00012880364863705849, - "loss": 0.0069, + "epoch": 0.59, + "learning_rate": 0.00021204076924472693, + "loss": 0.015, "step": 226220 }, { - "epoch": 1.14, - "learning_rate": 0.00012879608094404447, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021203688102835544, + "loss": 0.0163, "step": 226230 }, { - "epoch": 1.14, - "learning_rate": 0.00012878851325103045, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021203299281198398, + "loss": 0.0154, "step": 226240 }, { - "epoch": 1.14, - "learning_rate": 0.00012878094555801646, - "loss": 0.012, + "epoch": 0.59, + "learning_rate": 0.0002120291045956125, + "loss": 0.0145, "step": 226250 }, { - "epoch": 1.14, - "learning_rate": 0.00012877337786500244, - "loss": 0.0071, + "epoch": 0.59, + "learning_rate": 0.00021202521637924107, + "loss": 0.0203, "step": 226260 }, { - "epoch": 1.14, - "learning_rate": 0.00012876581017198842, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.0002120213281628696, + "loss": 0.0292, "step": 226270 }, { - "epoch": 1.14, - "learning_rate": 0.00012875824247897443, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021201743994649812, + "loss": 0.0227, "step": 226280 }, { - "epoch": 1.14, - "learning_rate": 0.0001287506747859604, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021201355173012666, + "loss": 0.0148, "step": 226290 }, { - "epoch": 1.14, - "learning_rate": 0.0001287431070929464, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021200966351375518, + "loss": 0.02, "step": 226300 }, { - "epoch": 1.14, - "learning_rate": 0.00012873553939993237, - "loss": 0.0113, + "epoch": 0.59, + "learning_rate": 0.00021200577529738375, + "loss": 0.0181, "step": 226310 }, { - "epoch": 1.14, - "learning_rate": 0.00012872797170691838, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021200188708101226, + "loss": 0.0165, "step": 226320 }, { - "epoch": 1.14, - "learning_rate": 0.00012872040401390436, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002119979988646408, + "loss": 0.0153, "step": 226330 }, { - "epoch": 1.14, - "learning_rate": 0.00012871283632089035, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021199411064826932, + "loss": 0.0141, "step": 226340 }, { - "epoch": 1.14, - "learning_rate": 0.00012870526862787635, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.0002119902224318979, + "loss": 0.0167, "step": 226350 }, { - "epoch": 1.14, - "learning_rate": 0.00012869770093486234, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.0002119863342155264, + "loss": 0.0187, "step": 226360 }, { - "epoch": 1.14, - "learning_rate": 0.00012869013324184832, - "loss": 0.0115, + "epoch": 0.59, + "learning_rate": 0.00021198244599915494, + "loss": 0.0157, "step": 226370 }, { - "epoch": 1.14, - "learning_rate": 0.00012868256554883433, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021197855778278346, + "loss": 0.0164, "step": 226380 }, { - "epoch": 1.14, - "learning_rate": 0.0001286749978558203, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021197466956641203, + "loss": 0.0158, "step": 226390 }, { - "epoch": 1.14, - "learning_rate": 0.0001286674301628063, - "loss": 0.0069, + "epoch": 0.59, + "learning_rate": 0.00021197078135004054, + "loss": 0.0183, "step": 226400 }, { - "epoch": 1.14, - "learning_rate": 0.0001286598624697923, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021196689313366908, + "loss": 0.0178, "step": 226410 }, { - "epoch": 1.14, - "learning_rate": 0.00012865229477677828, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.0002119630049172976, + "loss": 0.018, "step": 226420 }, { - "epoch": 1.14, - "learning_rate": 0.00012864472708376426, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021195911670092617, + "loss": 0.0238, "step": 226430 }, { - "epoch": 1.14, - "learning_rate": 0.00012863715939075027, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002119552284845547, + "loss": 0.016, "step": 226440 }, { - "epoch": 1.14, - "learning_rate": 0.00012862959169773625, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021195134026818322, + "loss": 0.0145, "step": 226450 }, { - "epoch": 1.14, - "learning_rate": 0.00012862202400472223, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021194745205181176, + "loss": 0.0176, "step": 226460 }, { - "epoch": 1.14, - "learning_rate": 0.0001286144563117082, - "loss": 0.0068, + "epoch": 0.59, + "learning_rate": 0.0002119435638354403, + "loss": 0.0123, "step": 226470 }, { - "epoch": 1.14, - "learning_rate": 0.00012860688861869422, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021193967561906885, + "loss": 0.0136, "step": 226480 }, { - "epoch": 1.14, - "learning_rate": 0.0001285993209256802, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021193578740269736, + "loss": 0.0191, "step": 226490 }, { - "epoch": 1.14, - "learning_rate": 0.00012859175323266618, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.0002119318991863259, + "loss": 0.0149, "step": 226500 }, { - "epoch": 1.14, - "learning_rate": 0.0001285841855396522, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021192801096995444, + "loss": 0.0169, "step": 226510 }, { - "epoch": 1.14, - "learning_rate": 0.00012857661784663817, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.000211924122753583, + "loss": 0.0111, "step": 226520 }, { - "epoch": 1.14, - "learning_rate": 0.00012856905015362416, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.0002119202345372115, + "loss": 0.0153, "step": 226530 }, { - "epoch": 1.14, - "learning_rate": 0.00012856148246061016, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021191634632084004, + "loss": 0.016, "step": 226540 }, { - "epoch": 1.14, - "learning_rate": 0.00012855391476759615, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021191245810446856, + "loss": 0.0151, "step": 226550 }, { - "epoch": 1.14, - "learning_rate": 0.00012854634707458213, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021190856988809713, + "loss": 0.0168, "step": 226560 }, { - "epoch": 1.14, - "learning_rate": 0.0001285387793815681, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.00021190468167172564, + "loss": 0.013, "step": 226570 }, { - "epoch": 1.14, - "learning_rate": 0.0001285312116885541, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021190079345535418, + "loss": 0.0172, "step": 226580 }, { - "epoch": 1.14, - "learning_rate": 0.0001285236439955401, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002118969052389827, + "loss": 0.0164, "step": 226590 }, { - "epoch": 1.14, - "learning_rate": 0.00012851607630252608, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021189301702261127, + "loss": 0.0166, "step": 226600 }, { - "epoch": 1.14, - "learning_rate": 0.00012850850860951206, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.0002118891288062398, + "loss": 0.0141, "step": 226610 }, { - "epoch": 1.14, - "learning_rate": 0.00012850094091649807, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021188524058986832, + "loss": 0.0132, "step": 226620 }, { - "epoch": 1.14, - "learning_rate": 0.00012849337322348405, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021188135237349684, + "loss": 0.0159, "step": 226630 }, { - "epoch": 1.14, - "learning_rate": 0.00012848580553047003, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002118774641571254, + "loss": 0.02, "step": 226640 }, { - "epoch": 1.14, - "learning_rate": 0.00012847823783745601, - "loss": 0.0121, + "epoch": 0.59, + "learning_rate": 0.00021187357594075395, + "loss": 0.0134, "step": 226650 }, { - "epoch": 1.14, - "learning_rate": 0.00012847067014444202, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021186968772438246, + "loss": 0.018, "step": 226660 }, { - "epoch": 1.14, - "learning_rate": 0.000128463102451428, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.000211865799508011, + "loss": 0.021, "step": 226670 }, { - "epoch": 1.14, - "learning_rate": 0.00012845553475841399, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021186191129163954, + "loss": 0.0145, "step": 226680 }, { - "epoch": 1.14, - "learning_rate": 0.0001284479670654, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021185802307526809, + "loss": 0.0165, "step": 226690 }, { - "epoch": 1.14, - "learning_rate": 0.00012844039937238598, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.0002118541348588966, + "loss": 0.016, "step": 226700 }, { - "epoch": 1.14, - "learning_rate": 0.00012843283167937196, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.00021185024664252514, + "loss": 0.0177, "step": 226710 }, { - "epoch": 1.14, - "learning_rate": 0.00012842526398635797, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021184635842615368, + "loss": 0.0167, "step": 226720 }, { - "epoch": 1.14, - "learning_rate": 0.00012841769629334395, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021184247020978223, + "loss": 0.0169, "step": 226730 }, { - "epoch": 1.14, - "learning_rate": 0.00012841012860032993, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021183858199341074, + "loss": 0.0134, "step": 226740 }, { - "epoch": 1.14, - "learning_rate": 0.00012840256090731594, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021183469377703928, + "loss": 0.0157, "step": 226750 }, { - "epoch": 1.14, - "learning_rate": 0.00012839499321430192, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021183080556066785, + "loss": 0.0203, "step": 226760 }, { - "epoch": 1.14, - "learning_rate": 0.0001283874255212879, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.00021182691734429636, + "loss": 0.0136, "step": 226770 }, { - "epoch": 1.14, - "learning_rate": 0.0001283798578282739, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021182302912792488, + "loss": 0.0204, "step": 226780 }, { - "epoch": 1.14, - "learning_rate": 0.0001283722901352599, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021181914091155342, + "loss": 0.0129, "step": 226790 }, { - "epoch": 1.14, - "learning_rate": 0.00012836472244224587, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021181525269518194, + "loss": 0.0184, "step": 226800 }, { - "epoch": 1.14, - "learning_rate": 0.00012835715474923188, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.0002118113644788105, + "loss": 0.015, "step": 226810 }, { - "epoch": 1.14, - "learning_rate": 0.00012834958705621786, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021180747626243905, + "loss": 0.0153, "step": 226820 }, { - "epoch": 1.14, - "learning_rate": 0.00012834201936320384, - "loss": 0.0064, + "epoch": 0.59, + "learning_rate": 0.00021180358804606756, + "loss": 0.0147, "step": 226830 }, { - "epoch": 1.14, - "learning_rate": 0.00012833445167018982, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.0002117996998296961, + "loss": 0.0159, "step": 226840 }, { - "epoch": 1.14, - "learning_rate": 0.00012832688397717583, - "loss": 0.0109, + "epoch": 0.59, + "learning_rate": 0.00021179581161332464, + "loss": 0.0151, "step": 226850 }, { - "epoch": 1.14, - "learning_rate": 0.00012831931628416181, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021179192339695319, + "loss": 0.0178, "step": 226860 }, { - "epoch": 1.14, - "learning_rate": 0.0001283117485911478, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002117880351805817, + "loss": 0.0176, "step": 226870 }, { - "epoch": 1.14, - "learning_rate": 0.0001283041808981338, - "loss": 0.0068, + "epoch": 0.59, + "learning_rate": 0.00021178414696421024, + "loss": 0.0225, "step": 226880 }, { - "epoch": 1.14, - "learning_rate": 0.00012829661320511979, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021178025874783878, + "loss": 0.0137, "step": 226890 }, { - "epoch": 1.14, - "learning_rate": 0.00012828904551210577, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021177637053146732, + "loss": 0.0204, "step": 226900 }, { - "epoch": 1.14, - "learning_rate": 0.00012828147781909178, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021177248231509584, + "loss": 0.0175, "step": 226910 }, { - "epoch": 1.14, - "learning_rate": 0.00012827391012607776, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021176859409872438, + "loss": 0.0201, "step": 226920 }, { - "epoch": 1.14, - "learning_rate": 0.00012826634243306374, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021176470588235295, + "loss": 0.0173, "step": 226930 }, { - "epoch": 1.14, - "learning_rate": 0.00012825877474004975, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021176081766598146, + "loss": 0.0164, "step": 226940 }, { - "epoch": 1.14, - "learning_rate": 0.00012825120704703573, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021175692944960998, + "loss": 0.0161, "step": 226950 }, { - "epoch": 1.15, - "learning_rate": 0.0001282436393540217, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021175304123323852, + "loss": 0.0164, "step": 226960 }, { - "epoch": 1.15, - "learning_rate": 0.00012823607166100772, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.0002117491530168671, + "loss": 0.0198, "step": 226970 }, { - "epoch": 1.15, - "learning_rate": 0.0001282285039679937, - "loss": 0.0114, + "epoch": 0.59, + "learning_rate": 0.0002117452648004956, + "loss": 0.0211, "step": 226980 }, { - "epoch": 1.15, - "learning_rate": 0.00012822093627497968, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021174137658412415, + "loss": 0.0149, "step": 226990 }, { - "epoch": 1.15, - "learning_rate": 0.00012821336858196566, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021173748836775266, + "loss": 0.0163, "step": 227000 }, { - "epoch": 1.15, - "eval_cer": 0.9144663743186606, - "eval_loss": 0.006952292751520872, - "eval_runtime": 116.2021, - "eval_samples_per_second": 17.211, - "eval_steps_per_second": 4.303, + "epoch": 0.59, + "eval_cer": 0.8817964619977577, + "eval_loss": 0.011157948523759842, + "eval_runtime": 107.4259, + "eval_samples_per_second": 18.617, + "eval_steps_per_second": 4.654, "step": 227000 }, { - "epoch": 1.15, - "learning_rate": 0.00012820580088895167, - "loss": 0.0068, + "epoch": 0.59, + "learning_rate": 0.00021173360015138123, + "loss": 0.0156, "step": 227010 }, { - "epoch": 1.15, - "learning_rate": 0.00012819823319593765, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021172971193500974, + "loss": 0.0143, "step": 227020 }, { - "epoch": 1.15, - "learning_rate": 0.00012819066550292363, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021172582371863828, + "loss": 0.0142, "step": 227030 }, { - "epoch": 1.15, - "learning_rate": 0.00012818309780990964, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.0002117219355022668, + "loss": 0.0143, "step": 227040 }, { - "epoch": 1.15, - "learning_rate": 0.00012817553011689562, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021171804728589534, + "loss": 0.0182, "step": 227050 }, { - "epoch": 1.15, - "learning_rate": 0.0001281679624238816, - "loss": 0.0063, + "epoch": 0.59, + "learning_rate": 0.00021171415906952388, + "loss": 0.0156, "step": 227060 }, { - "epoch": 1.15, - "learning_rate": 0.00012816039473086761, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021171027085315242, + "loss": 0.0184, "step": 227070 }, { - "epoch": 1.15, - "learning_rate": 0.0001281528270378536, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021170638263678094, + "loss": 0.0165, "step": 227080 }, { - "epoch": 1.15, - "learning_rate": 0.00012814525934483958, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021170249442040948, + "loss": 0.0149, "step": 227090 }, { - "epoch": 1.15, - "learning_rate": 0.00012813769165182559, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021169860620403802, + "loss": 0.0135, "step": 227100 }, { - "epoch": 1.15, - "learning_rate": 0.00012813012395881157, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021169471798766656, + "loss": 0.0147, "step": 227110 }, { - "epoch": 1.15, - "learning_rate": 0.00012812255626579755, - "loss": 0.0124, + "epoch": 0.59, + "learning_rate": 0.00021169082977129508, + "loss": 0.0169, "step": 227120 }, { - "epoch": 1.15, - "learning_rate": 0.00012811498857278356, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021168694155492362, + "loss": 0.0152, "step": 227130 }, { - "epoch": 1.15, - "learning_rate": 0.00012810742087976954, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.0002116830533385522, + "loss": 0.0165, "step": 227140 }, { - "epoch": 1.15, - "learning_rate": 0.00012809985318675552, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.0002116791651221807, + "loss": 0.0145, "step": 227150 }, { - "epoch": 1.15, - "learning_rate": 0.0001280922854937415, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021167527690580924, + "loss": 0.0152, "step": 227160 }, { - "epoch": 1.15, - "learning_rate": 0.0001280847178007275, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021167138868943776, + "loss": 0.0171, "step": 227170 }, { - "epoch": 1.15, - "learning_rate": 0.0001280771501077135, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021166750047306633, + "loss": 0.0199, "step": 227180 }, { - "epoch": 1.15, - "learning_rate": 0.00012806958241469947, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021166361225669484, + "loss": 0.0168, "step": 227190 }, { - "epoch": 1.15, - "learning_rate": 0.00012806201472168545, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021165972404032338, + "loss": 0.0141, "step": 227200 }, { - "epoch": 1.15, - "learning_rate": 0.00012805444702867144, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002116558358239519, + "loss": 0.0135, "step": 227210 }, { - "epoch": 1.15, - "learning_rate": 0.00012804687933565744, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021165194760758047, + "loss": 0.0165, "step": 227220 }, { - "epoch": 1.15, - "learning_rate": 0.00012803931164264343, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021164805939120898, + "loss": 0.0176, "step": 227230 }, { - "epoch": 1.15, - "learning_rate": 0.0001280317439496294, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021164417117483752, + "loss": 0.0176, "step": 227240 }, { - "epoch": 1.15, - "learning_rate": 0.00012802417625661542, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021164028295846604, + "loss": 0.0134, "step": 227250 }, { - "epoch": 1.15, - "learning_rate": 0.0001280166085636014, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002116363947420946, + "loss": 0.0201, "step": 227260 }, { - "epoch": 1.15, - "learning_rate": 0.00012800904087058738, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021163250652572312, + "loss": 0.0146, "step": 227270 }, { - "epoch": 1.15, - "learning_rate": 0.0001280014731775734, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021162861830935166, + "loss": 0.0176, "step": 227280 }, { - "epoch": 1.15, - "learning_rate": 0.00012799390548455937, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021162473009298018, + "loss": 0.0153, "step": 227290 }, { - "epoch": 1.15, - "learning_rate": 0.00012798633779154535, - "loss": 0.0072, + "epoch": 0.59, + "learning_rate": 0.00021162084187660872, + "loss": 0.0124, "step": 227300 }, { - "epoch": 1.15, - "learning_rate": 0.00012797877009853136, - "loss": 0.0116, + "epoch": 0.59, + "learning_rate": 0.0002116169536602373, + "loss": 0.0146, "step": 227310 }, { - "epoch": 1.15, - "learning_rate": 0.00012797120240551734, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.0002116130654438658, + "loss": 0.0163, "step": 227320 }, { - "epoch": 1.15, - "learning_rate": 0.00012796363471250332, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021160917722749434, + "loss": 0.0167, "step": 227330 }, { - "epoch": 1.15, - "learning_rate": 0.00012795606701948933, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.00021160528901112286, + "loss": 0.0146, "step": 227340 }, { - "epoch": 1.15, - "learning_rate": 0.0001279484993264753, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021160140079475143, + "loss": 0.0179, "step": 227350 }, { - "epoch": 1.15, - "learning_rate": 0.0001279409316334613, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021159751257837994, + "loss": 0.0146, "step": 227360 }, { - "epoch": 1.15, - "learning_rate": 0.00012793336394044727, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021159362436200848, + "loss": 0.0146, "step": 227370 }, { - "epoch": 1.15, - "learning_rate": 0.00012792579624743328, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.000211589736145637, + "loss": 0.0168, "step": 227380 }, { - "epoch": 1.15, - "learning_rate": 0.00012791822855441926, - "loss": 0.0073, + "epoch": 0.59, + "learning_rate": 0.00021158584792926557, + "loss": 0.0153, "step": 227390 }, { - "epoch": 1.15, - "learning_rate": 0.00012791066086140525, - "loss": 0.007, + "epoch": 0.59, + "learning_rate": 0.00021158195971289408, + "loss": 0.0199, "step": 227400 }, { - "epoch": 1.15, - "learning_rate": 0.00012790309316839125, - "loss": 0.0067, + "epoch": 0.59, + "learning_rate": 0.00021157807149652262, + "loss": 0.0155, "step": 227410 }, { - "epoch": 1.15, - "learning_rate": 0.00012789552547537724, - "loss": 0.0072, + "epoch": 0.59, + "learning_rate": 0.00021157418328015114, + "loss": 0.0162, "step": 227420 }, { - "epoch": 1.15, - "learning_rate": 0.00012788795778236322, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.0002115702950637797, + "loss": 0.0142, "step": 227430 }, { - "epoch": 1.15, - "learning_rate": 0.00012788039008934923, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021156640684740822, + "loss": 0.02, "step": 227440 }, { - "epoch": 1.15, - "learning_rate": 0.0001278728223963352, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021156251863103676, + "loss": 0.0164, "step": 227450 }, { - "epoch": 1.15, - "learning_rate": 0.0001278652547033212, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021155863041466528, + "loss": 0.0134, "step": 227460 }, { - "epoch": 1.15, - "learning_rate": 0.0001278576870103072, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021155474219829385, + "loss": 0.0125, "step": 227470 }, { - "epoch": 1.15, - "learning_rate": 0.00012785011931729318, - "loss": 0.0113, + "epoch": 0.59, + "learning_rate": 0.0002115508539819224, + "loss": 0.0188, "step": 227480 }, { - "epoch": 1.15, - "learning_rate": 0.00012784255162427916, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.0002115469657655509, + "loss": 0.0131, "step": 227490 }, { - "epoch": 1.15, - "learning_rate": 0.00012783498393126517, - "loss": 0.0073, + "epoch": 0.59, + "learning_rate": 0.00021154307754917942, + "loss": 0.0183, "step": 227500 }, { - "epoch": 1.15, - "learning_rate": 0.00012782741623825115, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021153918933280799, + "loss": 0.0157, "step": 227510 }, { - "epoch": 1.15, - "learning_rate": 0.00012781984854523713, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.00021153530111643653, + "loss": 0.0136, "step": 227520 }, { - "epoch": 1.15, - "learning_rate": 0.0001278122808522231, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021153141290006504, + "loss": 0.0274, "step": 227530 }, { - "epoch": 1.15, - "learning_rate": 0.00012780471315920912, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021152752468369358, + "loss": 0.0154, "step": 227540 }, { - "epoch": 1.15, - "learning_rate": 0.0001277971454661951, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.0002115236364673221, + "loss": 0.0177, "step": 227550 }, { - "epoch": 1.15, - "learning_rate": 0.00012778957777318108, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021151974825095067, + "loss": 0.0154, "step": 227560 }, { - "epoch": 1.15, - "learning_rate": 0.0001277820100801671, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021151586003457918, + "loss": 0.0115, "step": 227570 }, { - "epoch": 1.15, - "learning_rate": 0.00012777444238715307, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021151197181820772, + "loss": 0.0156, "step": 227580 }, { - "epoch": 1.15, - "learning_rate": 0.00012776687469413906, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021150808360183624, + "loss": 0.0174, "step": 227590 }, { - "epoch": 1.15, - "learning_rate": 0.00012775930700112506, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.0002115041953854648, + "loss": 0.0174, "step": 227600 }, { - "epoch": 1.15, - "learning_rate": 0.00012775173930811105, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.00021150030716909332, + "loss": 0.0197, "step": 227610 }, { - "epoch": 1.15, - "learning_rate": 0.00012774417161509703, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021149641895272186, + "loss": 0.0173, "step": 227620 }, { - "epoch": 1.15, - "learning_rate": 0.00012773660392208304, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021149253073635038, + "loss": 0.0152, "step": 227630 }, { - "epoch": 1.15, - "learning_rate": 0.00012772903622906902, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021148864251997895, + "loss": 0.0199, "step": 227640 }, { - "epoch": 1.15, - "learning_rate": 0.000127721468536055, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021148475430360746, + "loss": 0.0133, "step": 227650 }, { - "epoch": 1.15, - "learning_rate": 0.000127713900843041, - "loss": 0.007, + "epoch": 0.59, + "learning_rate": 0.000211480866087236, + "loss": 0.0142, "step": 227660 }, { - "epoch": 1.15, - "learning_rate": 0.000127706333150027, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021147697787086452, + "loss": 0.0117, "step": 227670 }, { - "epoch": 1.15, - "learning_rate": 0.00012769876545701297, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021147308965449308, + "loss": 0.0177, "step": 227680 }, { - "epoch": 1.15, - "learning_rate": 0.00012769119776399898, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021146920143812163, + "loss": 0.0141, "step": 227690 }, { - "epoch": 1.15, - "learning_rate": 0.00012768363007098496, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021146531322175014, + "loss": 0.0155, "step": 227700 }, { - "epoch": 1.15, - "learning_rate": 0.00012767606237797094, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021146142500537868, + "loss": 0.0201, "step": 227710 }, { - "epoch": 1.15, - "learning_rate": 0.00012766849468495692, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021145753678900722, + "loss": 0.0142, "step": 227720 }, { - "epoch": 1.15, - "learning_rate": 0.00012766092699194293, - "loss": 0.0127, + "epoch": 0.59, + "learning_rate": 0.00021145364857263577, + "loss": 0.0135, "step": 227730 }, { - "epoch": 1.15, - "learning_rate": 0.0001276533592989289, - "loss": 0.0061, + "epoch": 0.59, + "learning_rate": 0.00021144976035626428, + "loss": 0.0136, "step": 227740 }, { - "epoch": 1.15, - "learning_rate": 0.0001276457916059149, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021144587213989282, + "loss": 0.0158, "step": 227750 }, { - "epoch": 1.15, - "learning_rate": 0.0001276382239129009, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021144198392352136, + "loss": 0.0176, "step": 227760 }, { - "epoch": 1.15, - "learning_rate": 0.00012763065621988688, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.0002114380957071499, + "loss": 0.0167, "step": 227770 }, { - "epoch": 1.15, - "learning_rate": 0.00012762308852687287, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021143420749077842, + "loss": 0.0147, "step": 227780 }, { - "epoch": 1.15, - "learning_rate": 0.00012761552083385887, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021143031927440696, + "loss": 0.0136, "step": 227790 }, { - "epoch": 1.15, - "learning_rate": 0.00012760795314084486, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021142643105803548, + "loss": 0.0148, "step": 227800 }, { - "epoch": 1.15, - "learning_rate": 0.00012760038544783084, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021142254284166404, + "loss": 0.0142, "step": 227810 }, { - "epoch": 1.15, - "learning_rate": 0.00012759281775481682, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.00021141865462529256, + "loss": 0.0166, "step": 227820 }, { - "epoch": 1.15, - "learning_rate": 0.0001275852500618028, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.0002114147664089211, + "loss": 0.0132, "step": 227830 }, { - "epoch": 1.15, - "learning_rate": 0.0001275776823687888, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021141087819254962, + "loss": 0.0153, "step": 227840 }, { - "epoch": 1.15, - "learning_rate": 0.0001275701146757748, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021140698997617818, + "loss": 0.0165, "step": 227850 }, { - "epoch": 1.15, - "learning_rate": 0.00012756254698276077, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.00021140310175980673, + "loss": 0.0171, "step": 227860 }, { - "epoch": 1.15, - "learning_rate": 0.00012755497928974678, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021139921354343524, + "loss": 0.017, "step": 227870 }, { - "epoch": 1.15, - "learning_rate": 0.00012754741159673276, - "loss": 0.012, + "epoch": 0.59, + "learning_rate": 0.00021139532532706378, + "loss": 0.0151, "step": 227880 }, { - "epoch": 1.15, - "learning_rate": 0.00012753984390371874, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021139143711069232, + "loss": 0.015, "step": 227890 }, { - "epoch": 1.15, - "learning_rate": 0.00012753227621070472, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021138754889432087, + "loss": 0.0125, "step": 227900 }, { - "epoch": 1.15, - "learning_rate": 0.00012752470851769073, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021138366067794938, + "loss": 0.0138, "step": 227910 }, { - "epoch": 1.15, - "learning_rate": 0.00012751714082467671, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021137977246157792, + "loss": 0.0154, "step": 227920 }, { - "epoch": 1.15, - "learning_rate": 0.0001275095731316627, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021137588424520646, + "loss": 0.0159, "step": 227930 }, { - "epoch": 1.15, - "learning_rate": 0.0001275020054386487, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.000211371996028835, + "loss": 0.0154, "step": 227940 }, { - "epoch": 1.15, - "learning_rate": 0.00012749443774563469, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021136810781246352, + "loss": 0.0166, "step": 227950 }, { - "epoch": 1.15, - "learning_rate": 0.00012748687005262067, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021136421959609206, + "loss": 0.0177, "step": 227960 }, { - "epoch": 1.15, - "learning_rate": 0.00012747930235960668, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002113603313797206, + "loss": 0.0145, "step": 227970 }, { - "epoch": 1.15, - "learning_rate": 0.00012747173466659266, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021135644316334914, + "loss": 0.0181, "step": 227980 }, { - "epoch": 1.15, - "learning_rate": 0.00012746416697357864, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021135255494697766, + "loss": 0.019, "step": 227990 }, { - "epoch": 1.15, - "learning_rate": 0.00012745659928056465, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.0002113486667306062, + "loss": 0.015, "step": 228000 }, { - "epoch": 1.15, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.006729237735271454, - "eval_runtime": 116.2506, - "eval_samples_per_second": 17.204, - "eval_steps_per_second": 4.301, + "epoch": 0.59, + "eval_cer": 0.8818006609085604, + "eval_loss": 0.011607250198721886, + "eval_runtime": 107.2928, + "eval_samples_per_second": 18.641, + "eval_steps_per_second": 4.66, "step": 228000 }, { - "epoch": 1.15, - "learning_rate": 0.00012744903158755063, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021134477851423471, + "loss": 0.0233, "step": 228010 }, { - "epoch": 1.15, - "learning_rate": 0.0001274414638945366, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021134089029786328, + "loss": 0.0157, "step": 228020 }, { - "epoch": 1.15, - "learning_rate": 0.00012743389620152262, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021133700208149183, + "loss": 0.0207, "step": 228030 }, { - "epoch": 1.15, - "learning_rate": 0.0001274263285085086, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.00021133311386512034, + "loss": 0.0184, "step": 228040 }, { - "epoch": 1.15, - "learning_rate": 0.00012741876081549458, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021132922564874885, + "loss": 0.0155, "step": 228050 }, { - "epoch": 1.15, - "learning_rate": 0.00012741119312248056, - "loss": 0.0112, + "epoch": 0.59, + "learning_rate": 0.00021132533743237742, + "loss": 0.0172, "step": 228060 }, { - "epoch": 1.15, - "learning_rate": 0.00012740362542946657, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021132144921600596, + "loss": 0.0148, "step": 228070 }, { - "epoch": 1.15, - "learning_rate": 0.00012739605773645255, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.00021131756099963448, + "loss": 0.0179, "step": 228080 }, { - "epoch": 1.15, - "learning_rate": 0.00012738849004343853, - "loss": 0.0118, + "epoch": 0.59, + "learning_rate": 0.00021131367278326302, + "loss": 0.0176, "step": 228090 }, { - "epoch": 1.15, - "learning_rate": 0.00012738092235042454, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021130978456689156, + "loss": 0.0151, "step": 228100 }, { - "epoch": 1.15, - "learning_rate": 0.00012737335465741052, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002113058963505201, + "loss": 0.0191, "step": 228110 }, { - "epoch": 1.15, - "learning_rate": 0.0001273657869643965, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021130200813414862, + "loss": 0.0152, "step": 228120 }, { - "epoch": 1.15, - "learning_rate": 0.00012735821927138251, - "loss": 0.0074, + "epoch": 0.59, + "learning_rate": 0.00021129811991777716, + "loss": 0.0171, "step": 228130 }, { - "epoch": 1.15, - "learning_rate": 0.0001273506515783685, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.0002112942317014057, + "loss": 0.0146, "step": 228140 }, { - "epoch": 1.15, - "learning_rate": 0.00012734308388535448, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021129034348503424, + "loss": 0.0153, "step": 228150 }, { - "epoch": 1.15, - "learning_rate": 0.00012733551619234049, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021128645526866276, + "loss": 0.0171, "step": 228160 }, { - "epoch": 1.15, - "learning_rate": 0.00012732794849932647, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002112825670522913, + "loss": 0.0163, "step": 228170 }, { - "epoch": 1.15, - "learning_rate": 0.00012732038080631245, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021127867883591987, + "loss": 0.0207, "step": 228180 }, { - "epoch": 1.15, - "learning_rate": 0.00012731281311329846, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021127479061954838, + "loss": 0.016, "step": 228190 }, { - "epoch": 1.15, - "learning_rate": 0.00012730524542028444, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021127090240317692, + "loss": 0.0169, "step": 228200 }, { - "epoch": 1.15, - "learning_rate": 0.00012729767772727042, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021126701418680544, + "loss": 0.0145, "step": 228210 }, { - "epoch": 1.15, - "learning_rate": 0.00012729011003425643, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.000211263125970434, + "loss": 0.0205, "step": 228220 }, { - "epoch": 1.15, - "learning_rate": 0.0001272825423412424, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021125923775406252, + "loss": 0.016, "step": 228230 }, { - "epoch": 1.15, - "learning_rate": 0.0001272749746482284, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021125534953769106, + "loss": 0.017, "step": 228240 }, { - "epoch": 1.15, - "learning_rate": 0.00012726740695521437, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021125146132131958, + "loss": 0.0139, "step": 228250 }, { - "epoch": 1.15, - "learning_rate": 0.00012725983926220038, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021124757310494812, + "loss": 0.0147, "step": 228260 }, { - "epoch": 1.15, - "learning_rate": 0.00012725227156918636, - "loss": 0.0116, + "epoch": 0.59, + "learning_rate": 0.00021124368488857666, + "loss": 0.0151, "step": 228270 }, { - "epoch": 1.15, - "learning_rate": 0.00012724470387617234, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.0002112397966722052, + "loss": 0.0198, "step": 228280 }, { - "epoch": 1.15, - "learning_rate": 0.00012723713618315835, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021123590845583372, + "loss": 0.0159, "step": 228290 }, { - "epoch": 1.15, - "learning_rate": 0.00012722956849014433, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021123202023946226, + "loss": 0.0183, "step": 228300 }, { - "epoch": 1.15, - "learning_rate": 0.00012722200079713032, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.0002112281320230908, + "loss": 0.0178, "step": 228310 }, { - "epoch": 1.15, - "learning_rate": 0.00012721443310411632, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021122424380671934, + "loss": 0.0176, "step": 228320 }, { - "epoch": 1.15, - "learning_rate": 0.0001272068654111023, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021122035559034786, + "loss": 0.0162, "step": 228330 }, { - "epoch": 1.15, - "learning_rate": 0.0001271992977180883, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.0002112164673739764, + "loss": 0.0166, "step": 228340 }, { - "epoch": 1.15, - "learning_rate": 0.0001271917300250743, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021121257915760497, + "loss": 0.0225, "step": 228350 }, { - "epoch": 1.15, - "learning_rate": 0.00012718416233206028, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021120869094123348, + "loss": 0.0156, "step": 228360 }, { - "epoch": 1.15, - "learning_rate": 0.00012717659463904626, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.000211204802724862, + "loss": 0.0176, "step": 228370 }, { - "epoch": 1.15, - "learning_rate": 0.00012716902694603227, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021120091450849054, + "loss": 0.0129, "step": 228380 }, { - "epoch": 1.15, - "learning_rate": 0.00012716145925301825, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.0002111970262921191, + "loss": 0.0171, "step": 228390 }, { - "epoch": 1.15, - "learning_rate": 0.00012715389156000423, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021119313807574762, + "loss": 0.0189, "step": 228400 }, { - "epoch": 1.15, - "learning_rate": 0.0001271463238669902, - "loss": 0.0094, + "epoch": 0.59, + "learning_rate": 0.00021118924985937616, + "loss": 0.0121, "step": 228410 }, { - "epoch": 1.15, - "learning_rate": 0.00012713875617397622, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021118536164300468, + "loss": 0.0134, "step": 228420 }, { - "epoch": 1.15, - "learning_rate": 0.0001271311884809622, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021118147342663325, + "loss": 0.015, "step": 228430 }, { - "epoch": 1.15, - "learning_rate": 0.00012712362078794818, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021117758521026176, + "loss": 0.0159, "step": 228440 }, { - "epoch": 1.15, - "learning_rate": 0.00012711605309493416, - "loss": 0.0139, + "epoch": 0.59, + "learning_rate": 0.0002111736969938903, + "loss": 0.0157, "step": 228450 }, { - "epoch": 1.15, - "learning_rate": 0.00012710848540192015, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021116980877751882, + "loss": 0.015, "step": 228460 }, { - "epoch": 1.15, - "learning_rate": 0.00012710091770890615, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021116592056114739, + "loss": 0.0129, "step": 228470 }, { - "epoch": 1.15, - "learning_rate": 0.00012709335001589214, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.0002111620323447759, + "loss": 0.0161, "step": 228480 }, { - "epoch": 1.15, - "learning_rate": 0.00012708578232287812, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021115814412840444, + "loss": 0.0151, "step": 228490 }, { - "epoch": 1.15, - "learning_rate": 0.00012707821462986413, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021115425591203296, + "loss": 0.02, "step": 228500 }, { - "epoch": 1.15, - "learning_rate": 0.0001270706469368501, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002111503676956615, + "loss": 0.0153, "step": 228510 }, { - "epoch": 1.15, - "learning_rate": 0.0001270630792438361, - "loss": 0.0122, + "epoch": 0.59, + "learning_rate": 0.00021114647947929007, + "loss": 0.0161, "step": 228520 }, { - "epoch": 1.15, - "learning_rate": 0.0001270555115508221, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021114259126291858, + "loss": 0.0162, "step": 228530 }, { - "epoch": 1.15, - "learning_rate": 0.00012704794385780808, - "loss": 0.012, + "epoch": 0.59, + "learning_rate": 0.0002111387030465471, + "loss": 0.0176, "step": 228540 }, { - "epoch": 1.15, - "learning_rate": 0.00012704037616479406, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021113481483017564, + "loss": 0.0205, "step": 228550 }, { - "epoch": 1.15, - "learning_rate": 0.00012703280847178007, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.0002111309266138042, + "loss": 0.0143, "step": 228560 }, { - "epoch": 1.15, - "learning_rate": 0.00012702524077876605, - "loss": 0.0123, + "epoch": 0.59, + "learning_rate": 0.00021112703839743272, + "loss": 0.0142, "step": 228570 }, { - "epoch": 1.15, - "learning_rate": 0.00012701767308575203, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021112315018106126, + "loss": 0.014, "step": 228580 }, { - "epoch": 1.15, - "learning_rate": 0.000127010105392738, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021111926196468978, + "loss": 0.0158, "step": 228590 }, { - "epoch": 1.15, - "learning_rate": 0.00012700253769972402, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021111537374831835, + "loss": 0.0159, "step": 228600 }, { - "epoch": 1.15, - "learning_rate": 0.00012699497000671, - "loss": 0.0111, + "epoch": 0.59, + "learning_rate": 0.00021111148553194686, + "loss": 0.0113, "step": 228610 }, { - "epoch": 1.15, - "learning_rate": 0.00012698740231369598, - "loss": 0.0104, + "epoch": 0.59, + "learning_rate": 0.0002111075973155754, + "loss": 0.015, "step": 228620 }, { - "epoch": 1.15, - "learning_rate": 0.000126979834620682, - "loss": 0.0139, + "epoch": 0.59, + "learning_rate": 0.00021110370909920392, + "loss": 0.0181, "step": 228630 }, { - "epoch": 1.15, - "learning_rate": 0.00012697226692766797, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021109982088283249, + "loss": 0.0142, "step": 228640 }, { - "epoch": 1.15, - "learning_rate": 0.00012696469923465396, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.000211095932666461, + "loss": 0.0143, "step": 228650 }, { - "epoch": 1.15, - "learning_rate": 0.00012695713154163996, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021109204445008954, + "loss": 0.0212, "step": 228660 }, { - "epoch": 1.15, - "learning_rate": 0.00012694956384862595, - "loss": 0.0107, + "epoch": 0.59, + "learning_rate": 0.00021108815623371806, + "loss": 0.0176, "step": 228670 }, { - "epoch": 1.15, - "learning_rate": 0.00012694199615561193, - "loss": 0.0118, + "epoch": 0.59, + "learning_rate": 0.00021108426801734663, + "loss": 0.0176, "step": 228680 }, { - "epoch": 1.15, - "learning_rate": 0.00012693442846259794, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021108037980097514, + "loss": 0.0174, "step": 228690 }, { - "epoch": 1.15, - "learning_rate": 0.00012692686076958392, - "loss": 0.0079, + "epoch": 0.59, + "learning_rate": 0.00021107649158460368, + "loss": 0.0165, "step": 228700 }, { - "epoch": 1.15, - "learning_rate": 0.0001269192930765699, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.0002110726033682322, + "loss": 0.0166, "step": 228710 }, { - "epoch": 1.15, - "learning_rate": 0.0001269117253835559, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021106871515186076, + "loss": 0.0225, "step": 228720 }, { - "epoch": 1.15, - "learning_rate": 0.0001269041576905419, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.0002110648269354893, + "loss": 0.0146, "step": 228730 }, { - "epoch": 1.15, - "learning_rate": 0.00012689658999752787, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021106093871911782, + "loss": 0.0175, "step": 228740 }, { - "epoch": 1.15, - "learning_rate": 0.00012688902230451388, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021105705050274636, + "loss": 0.0161, "step": 228750 }, { - "epoch": 1.15, - "learning_rate": 0.00012688145461149986, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021105316228637488, + "loss": 0.014, "step": 228760 }, { - "epoch": 1.15, - "learning_rate": 0.00012687388691848584, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021104927407000345, + "loss": 0.0192, "step": 228770 }, { - "epoch": 1.15, - "learning_rate": 0.00012686631922547182, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021104538585363196, + "loss": 0.0134, "step": 228780 }, { - "epoch": 1.15, - "learning_rate": 0.00012685875153245783, - "loss": 0.0108, + "epoch": 0.59, + "learning_rate": 0.0002110414976372605, + "loss": 0.0155, "step": 228790 }, { - "epoch": 1.15, - "learning_rate": 0.0001268511838394438, - "loss": 0.0119, + "epoch": 0.59, + "learning_rate": 0.00021103760942088902, + "loss": 0.0209, "step": 228800 }, { - "epoch": 1.15, - "learning_rate": 0.0001268436161464298, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021103372120451759, + "loss": 0.0188, "step": 228810 }, { - "epoch": 1.15, - "learning_rate": 0.0001268360484534158, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.0002110298329881461, + "loss": 0.0176, "step": 228820 }, { - "epoch": 1.15, - "learning_rate": 0.00012682848076040178, - "loss": 0.0075, + "epoch": 0.59, + "learning_rate": 0.00021102594477177464, + "loss": 0.0153, "step": 228830 }, { - "epoch": 1.15, - "learning_rate": 0.00012682091306738777, - "loss": 0.0106, + "epoch": 0.59, + "learning_rate": 0.00021102205655540316, + "loss": 0.0163, "step": 228840 }, { - "epoch": 1.15, - "learning_rate": 0.00012681334537437377, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021101816833903172, + "loss": 0.0202, "step": 228850 }, { - "epoch": 1.15, - "learning_rate": 0.00012680577768135976, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021101428012266024, + "loss": 0.0137, "step": 228860 }, { - "epoch": 1.15, - "learning_rate": 0.00012679820998834574, - "loss": 0.0083, + "epoch": 0.59, + "learning_rate": 0.00021101039190628878, + "loss": 0.016, "step": 228870 }, { - "epoch": 1.15, - "learning_rate": 0.00012679064229533175, - "loss": 0.0073, + "epoch": 0.59, + "learning_rate": 0.0002110065036899173, + "loss": 0.0159, "step": 228880 }, { - "epoch": 1.15, - "learning_rate": 0.00012678307460231773, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021100261547354586, + "loss": 0.0156, "step": 228890 }, { - "epoch": 1.15, - "learning_rate": 0.0001267755069093037, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.0002109987272571744, + "loss": 0.0161, "step": 228900 }, { - "epoch": 1.15, - "learning_rate": 0.00012676793921628972, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021099483904080292, + "loss": 0.0146, "step": 228910 }, { - "epoch": 1.15, - "learning_rate": 0.0001267603715232757, - "loss": 0.0073, + "epoch": 0.59, + "learning_rate": 0.00021099095082443146, + "loss": 0.0124, "step": 228920 }, { - "epoch": 1.15, - "learning_rate": 0.00012675280383026168, - "loss": 0.0102, + "epoch": 0.59, + "learning_rate": 0.00021098706260806, + "loss": 0.015, "step": 228930 }, { - "epoch": 1.16, - "learning_rate": 0.00012674523613724766, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.00021098317439168854, + "loss": 0.0182, "step": 228940 }, { - "epoch": 1.16, - "learning_rate": 0.00012673766844423367, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021097928617531706, + "loss": 0.0137, "step": 228950 }, { - "epoch": 1.16, - "learning_rate": 0.00012673010075121965, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.0002109753979589456, + "loss": 0.0238, "step": 228960 }, { - "epoch": 1.16, - "learning_rate": 0.00012672253305820563, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021097150974257414, + "loss": 0.0203, "step": 228970 }, { - "epoch": 1.16, - "learning_rate": 0.00012671496536519164, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.00021096762152620268, + "loss": 0.0172, "step": 228980 }, { - "epoch": 1.16, - "learning_rate": 0.00012670739767217762, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002109637333098312, + "loss": 0.0136, "step": 228990 }, { - "epoch": 1.16, - "learning_rate": 0.0001266998299791636, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021095984509345974, + "loss": 0.0171, "step": 229000 }, { - "epoch": 1.16, - "eval_cer": 0.9144634631302844, - "eval_loss": 0.006603468209505081, - "eval_runtime": 116.4012, - "eval_samples_per_second": 17.182, - "eval_steps_per_second": 4.295, + "epoch": 0.59, + "eval_cer": 0.8817838652653501, + "eval_loss": 0.011135715059936047, + "eval_runtime": 107.4098, + "eval_samples_per_second": 18.62, + "eval_steps_per_second": 4.655, "step": 229000 }, { - "epoch": 1.16, - "learning_rate": 0.0001266922622861496, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021095595687708826, + "loss": 0.0183, "step": 229010 }, { - "epoch": 1.16, - "learning_rate": 0.0001266846945931356, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021095206866071682, + "loss": 0.0166, "step": 229020 }, { - "epoch": 1.16, - "learning_rate": 0.00012667712690012158, - "loss": 0.0081, + "epoch": 0.59, + "learning_rate": 0.00021094818044434534, + "loss": 0.0164, "step": 229030 }, { - "epoch": 1.16, - "learning_rate": 0.00012666955920710758, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021094429222797388, + "loss": 0.0171, "step": 229040 }, { - "epoch": 1.16, - "learning_rate": 0.00012666199151409357, - "loss": 0.0112, + "epoch": 0.59, + "learning_rate": 0.0002109404040116024, + "loss": 0.0128, "step": 229050 }, { - "epoch": 1.16, - "learning_rate": 0.00012665442382107955, - "loss": 0.0097, + "epoch": 0.59, + "learning_rate": 0.00021093651579523096, + "loss": 0.0175, "step": 229060 }, { - "epoch": 1.16, - "learning_rate": 0.00012664685612806553, - "loss": 0.0077, + "epoch": 0.59, + "learning_rate": 0.0002109326275788595, + "loss": 0.0183, "step": 229070 }, { - "epoch": 1.16, - "learning_rate": 0.0001266392884350515, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021092873936248802, + "loss": 0.0165, "step": 229080 }, { - "epoch": 1.16, - "learning_rate": 0.00012663172074203752, - "loss": 0.0088, + "epoch": 0.59, + "learning_rate": 0.00021092485114611653, + "loss": 0.0143, "step": 229090 }, { - "epoch": 1.16, - "learning_rate": 0.0001266241530490235, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.0002109209629297451, + "loss": 0.0138, "step": 229100 }, { - "epoch": 1.16, - "learning_rate": 0.00012661658535600948, - "loss": 0.0067, + "epoch": 0.59, + "learning_rate": 0.00021091707471337364, + "loss": 0.0137, "step": 229110 }, { - "epoch": 1.16, - "learning_rate": 0.0001266090176629955, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021091318649700216, + "loss": 0.0123, "step": 229120 }, { - "epoch": 1.16, - "learning_rate": 0.00012660144996998147, - "loss": 0.0105, + "epoch": 0.59, + "learning_rate": 0.0002109092982806307, + "loss": 0.0145, "step": 229130 }, { - "epoch": 1.16, - "learning_rate": 0.00012659388227696745, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021090541006425924, + "loss": 0.0162, "step": 229140 }, { - "epoch": 1.16, - "learning_rate": 0.00012658631458395343, - "loss": 0.0112, + "epoch": 0.59, + "learning_rate": 0.00021090152184788778, + "loss": 0.0162, "step": 229150 }, { - "epoch": 1.16, - "learning_rate": 0.00012657874689093944, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.0002108976336315163, + "loss": 0.0177, "step": 229160 }, { - "epoch": 1.16, - "learning_rate": 0.00012657117919792542, - "loss": 0.0089, + "epoch": 0.59, + "learning_rate": 0.00021089374541514484, + "loss": 0.0146, "step": 229170 }, { - "epoch": 1.16, - "learning_rate": 0.0001265636115049114, - "loss": 0.0076, + "epoch": 0.59, + "learning_rate": 0.00021088985719877338, + "loss": 0.0152, "step": 229180 }, { - "epoch": 1.16, - "learning_rate": 0.00012655604381189741, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021088596898240192, + "loss": 0.0182, "step": 229190 }, { - "epoch": 1.16, - "learning_rate": 0.0001265484761188834, - "loss": 0.0082, + "epoch": 0.59, + "learning_rate": 0.00021088208076603044, + "loss": 0.0145, "step": 229200 }, { - "epoch": 1.16, - "learning_rate": 0.00012654090842586938, - "loss": 0.0065, + "epoch": 0.59, + "learning_rate": 0.00021087819254965898, + "loss": 0.0153, "step": 229210 }, { - "epoch": 1.16, - "learning_rate": 0.00012653334073285539, - "loss": 0.008, + "epoch": 0.59, + "learning_rate": 0.00021087430433328755, + "loss": 0.0165, "step": 229220 }, { - "epoch": 1.16, - "learning_rate": 0.00012652577303984137, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021087041611691606, + "loss": 0.0169, "step": 229230 }, { - "epoch": 1.16, - "learning_rate": 0.00012651820534682735, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021086652790054458, + "loss": 0.0157, "step": 229240 }, { - "epoch": 1.16, - "learning_rate": 0.00012651063765381336, - "loss": 0.0096, + "epoch": 0.59, + "learning_rate": 0.00021086263968417312, + "loss": 0.0147, "step": 229250 }, { - "epoch": 1.16, - "learning_rate": 0.00012650306996079934, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021085875146780163, + "loss": 0.0155, "step": 229260 }, { - "epoch": 1.16, - "learning_rate": 0.00012649550226778532, - "loss": 0.0103, + "epoch": 0.59, + "learning_rate": 0.0002108548632514302, + "loss": 0.015, "step": 229270 }, { - "epoch": 1.16, - "learning_rate": 0.00012648793457477133, - "loss": 0.0085, + "epoch": 0.59, + "learning_rate": 0.00021085097503505874, + "loss": 0.0182, "step": 229280 }, { - "epoch": 1.16, - "learning_rate": 0.0001264803668817573, - "loss": 0.0099, + "epoch": 0.59, + "learning_rate": 0.00021084708681868726, + "loss": 0.0208, "step": 229290 }, { - "epoch": 1.16, - "learning_rate": 0.0001264727991887433, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.0002108431986023158, + "loss": 0.0184, "step": 229300 }, { - "epoch": 1.16, - "learning_rate": 0.00012646523149572927, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021083931038594434, + "loss": 0.0171, "step": 229310 }, { - "epoch": 1.16, - "learning_rate": 0.00012645766380271528, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021083542216957288, + "loss": 0.0189, "step": 229320 }, { - "epoch": 1.16, - "learning_rate": 0.00012645009610970126, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.0002108315339532014, + "loss": 0.014, "step": 229330 }, { - "epoch": 1.16, - "learning_rate": 0.00012644252841668724, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021082764573682994, + "loss": 0.0202, "step": 229340 }, { - "epoch": 1.16, - "learning_rate": 0.00012643496072367325, - "loss": 0.0093, + "epoch": 0.59, + "learning_rate": 0.00021082375752045848, + "loss": 0.0188, "step": 229350 }, { - "epoch": 1.16, - "learning_rate": 0.00012642739303065923, - "loss": 0.0098, + "epoch": 0.59, + "learning_rate": 0.00021081986930408702, + "loss": 0.022, "step": 229360 }, { - "epoch": 1.16, - "learning_rate": 0.00012641982533764522, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021081598108771554, + "loss": 0.0143, "step": 229370 }, { - "epoch": 1.16, - "learning_rate": 0.00012641225764463122, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021081209287134408, + "loss": 0.0175, "step": 229380 }, { - "epoch": 1.16, - "learning_rate": 0.0001264046899516172, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021080820465497265, + "loss": 0.0165, "step": 229390 }, { - "epoch": 1.16, - "learning_rate": 0.0001263971222586032, - "loss": 0.0095, + "epoch": 0.59, + "learning_rate": 0.00021080431643860116, + "loss": 0.0136, "step": 229400 }, { - "epoch": 1.16, - "learning_rate": 0.0001263895545655892, - "loss": 0.0086, + "epoch": 0.59, + "learning_rate": 0.00021080042822222968, + "loss": 0.0139, "step": 229410 }, { - "epoch": 1.16, - "learning_rate": 0.00012638198687257518, - "loss": 0.0078, + "epoch": 0.59, + "learning_rate": 0.00021079654000585822, + "loss": 0.0135, "step": 229420 }, { - "epoch": 1.16, - "learning_rate": 0.00012637441917956116, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.0002107926517894868, + "loss": 0.0159, "step": 229430 }, { - "epoch": 1.16, - "learning_rate": 0.00012636685148654717, - "loss": 0.0092, + "epoch": 0.59, + "learning_rate": 0.0002107887635731153, + "loss": 0.0178, "step": 229440 }, { - "epoch": 1.16, - "learning_rate": 0.00012635928379353315, - "loss": 0.0091, + "epoch": 0.59, + "learning_rate": 0.00021078487535674384, + "loss": 0.0184, "step": 229450 }, { - "epoch": 1.16, - "learning_rate": 0.00012635171610051913, - "loss": 0.01, + "epoch": 0.59, + "learning_rate": 0.00021078098714037236, + "loss": 0.0186, "step": 229460 }, { - "epoch": 1.16, - "learning_rate": 0.0001263441484075051, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.00021077709892400093, + "loss": 0.0166, "step": 229470 }, { - "epoch": 1.16, - "learning_rate": 0.00012633658071449112, - "loss": 0.009, + "epoch": 0.59, + "learning_rate": 0.00021077321070762944, + "loss": 0.017, "step": 229480 }, { - "epoch": 1.16, - "learning_rate": 0.0001263290130214771, - "loss": 0.0101, + "epoch": 0.59, + "learning_rate": 0.00021076932249125798, + "loss": 0.0162, "step": 229490 }, { - "epoch": 1.16, - "learning_rate": 0.00012632144532846308, - "loss": 0.0087, + "epoch": 0.59, + "learning_rate": 0.0002107654342748865, + "loss": 0.0146, "step": 229500 }, { - "epoch": 1.16, - "learning_rate": 0.0001263138776354491, - "loss": 0.0084, + "epoch": 0.59, + "learning_rate": 0.00021076154605851504, + "loss": 0.0153, "step": 229510 }, { - "epoch": 1.16, - "learning_rate": 0.00012630630994243507, - "loss": 0.011, + "epoch": 0.59, + "learning_rate": 0.00021075765784214358, + "loss": 0.0196, "step": 229520 }, { - "epoch": 1.16, - "learning_rate": 0.00012629874224942105, - "loss": 0.0068, + "epoch": 0.59, + "learning_rate": 0.00021075376962577212, + "loss": 0.0157, "step": 229530 }, { - "epoch": 1.16, - "learning_rate": 0.00012629117455640706, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00021074988140940064, + "loss": 0.019, "step": 229540 }, { - "epoch": 1.16, - "learning_rate": 0.00012628360686339304, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.00021074599319302918, + "loss": 0.0152, "step": 229550 }, { - "epoch": 1.16, - "learning_rate": 0.00012627603917037903, - "loss": 0.011, + "epoch": 0.6, + "learning_rate": 0.00021074210497665772, + "loss": 0.0134, "step": 229560 }, { - "epoch": 1.16, - "learning_rate": 0.00012626847147736503, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021073821676028626, + "loss": 0.015, "step": 229570 }, { - "epoch": 1.16, - "learning_rate": 0.00012626090378435102, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021073432854391478, + "loss": 0.0148, "step": 229580 }, { - "epoch": 1.16, - "learning_rate": 0.000126253336091337, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00021073044032754332, + "loss": 0.0167, "step": 229590 }, { - "epoch": 1.16, - "learning_rate": 0.000126245768398323, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.0002107265521111719, + "loss": 0.0144, "step": 229600 }, { - "epoch": 1.16, - "learning_rate": 0.000126238200705309, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002107226638948004, + "loss": 0.0177, "step": 229610 }, { - "epoch": 1.16, - "learning_rate": 0.00012623063301229497, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021071877567842894, + "loss": 0.0152, "step": 229620 }, { - "epoch": 1.16, - "learning_rate": 0.00012622306531928098, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021071488746205746, + "loss": 0.0134, "step": 229630 }, { - "epoch": 1.16, - "learning_rate": 0.00012621549762626696, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021071099924568603, + "loss": 0.0155, "step": 229640 }, { - "epoch": 1.16, - "learning_rate": 0.00012620792993325294, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021070711102931454, + "loss": 0.0183, "step": 229650 }, { - "epoch": 1.16, - "learning_rate": 0.00012620036224023892, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021070322281294308, + "loss": 0.0175, "step": 229660 }, { - "epoch": 1.16, - "learning_rate": 0.00012619279454722493, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.0002106993345965716, + "loss": 0.0175, "step": 229670 }, { - "epoch": 1.16, - "learning_rate": 0.0001261852268542109, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.00021069544638020017, + "loss": 0.0161, "step": 229680 }, { - "epoch": 1.16, - "learning_rate": 0.0001261776591611969, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021069155816382868, + "loss": 0.0181, "step": 229690 }, { - "epoch": 1.16, - "learning_rate": 0.00012617009146818287, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021068766994745722, + "loss": 0.0174, "step": 229700 }, { - "epoch": 1.16, - "learning_rate": 0.00012616252377516886, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00021068378173108574, + "loss": 0.0205, "step": 229710 }, { - "epoch": 1.16, - "learning_rate": 0.00012615495608215486, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002106798935147143, + "loss": 0.0163, "step": 229720 }, { - "epoch": 1.16, - "learning_rate": 0.00012614738838914085, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00021067600529834282, + "loss": 0.0183, "step": 229730 }, { - "epoch": 1.16, - "learning_rate": 0.00012613982069612683, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.00021067211708197136, + "loss": 0.0153, "step": 229740 }, { - "epoch": 1.16, - "learning_rate": 0.00012613225300311284, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021066822886559988, + "loss": 0.0147, "step": 229750 }, { - "epoch": 1.16, - "learning_rate": 0.00012612468531009882, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.00021066434064922842, + "loss": 0.0202, "step": 229760 }, { - "epoch": 1.16, - "learning_rate": 0.0001261171176170848, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021066045243285699, + "loss": 0.0162, "step": 229770 }, { - "epoch": 1.16, - "learning_rate": 0.0001261095499240708, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002106565642164855, + "loss": 0.0183, "step": 229780 }, { - "epoch": 1.16, - "learning_rate": 0.0001261019822310568, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00021065267600011404, + "loss": 0.0175, "step": 229790 }, { - "epoch": 1.16, - "learning_rate": 0.00012609441453804277, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021064878778374256, + "loss": 0.0154, "step": 229800 }, { - "epoch": 1.16, - "learning_rate": 0.00012608684684502878, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00021064489956737113, + "loss": 0.0166, "step": 229810 }, { - "epoch": 1.16, - "learning_rate": 0.00012607927915201476, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.00021064101135099964, + "loss": 0.0151, "step": 229820 }, { - "epoch": 1.16, - "learning_rate": 0.00012607171145900074, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021063712313462818, + "loss": 0.0163, "step": 229830 }, { - "epoch": 1.16, - "learning_rate": 0.00012606414376598672, - "loss": 0.0135, + "epoch": 0.6, + "learning_rate": 0.0002106332349182567, + "loss": 0.0169, "step": 229840 }, { - "epoch": 1.16, - "learning_rate": 0.00012605657607297273, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021062934670188526, + "loss": 0.0192, "step": 229850 }, { - "epoch": 1.16, - "learning_rate": 0.0001260490083799587, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.00021062545848551378, + "loss": 0.0138, "step": 229860 }, { - "epoch": 1.16, - "learning_rate": 0.0001260414406869447, - "loss": 0.0221, + "epoch": 0.6, + "learning_rate": 0.00021062157026914232, + "loss": 0.0147, "step": 229870 }, { - "epoch": 1.16, - "learning_rate": 0.0001260338729939307, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021061768205277084, + "loss": 0.0162, "step": 229880 }, { - "epoch": 1.16, - "learning_rate": 0.00012602630530091668, - "loss": 0.0112, + "epoch": 0.6, + "learning_rate": 0.0002106137938363994, + "loss": 0.0152, "step": 229890 }, { - "epoch": 1.16, - "learning_rate": 0.00012601873760790267, - "loss": 0.0123, + "epoch": 0.6, + "learning_rate": 0.00021060990562002792, + "loss": 0.0173, "step": 229900 }, { - "epoch": 1.16, - "learning_rate": 0.00012601116991488867, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021060601740365646, + "loss": 0.0175, "step": 229910 }, { - "epoch": 1.16, - "learning_rate": 0.00012600360222187466, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021060212918728497, + "loss": 0.0175, "step": 229920 }, { - "epoch": 1.16, - "learning_rate": 0.00012599603452886064, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.00021059824097091354, + "loss": 0.0197, "step": 229930 }, { - "epoch": 1.16, - "learning_rate": 0.00012598846683584665, - "loss": 0.0107, + "epoch": 0.6, + "learning_rate": 0.00021059435275454209, + "loss": 0.0173, "step": 229940 }, { - "epoch": 1.16, - "learning_rate": 0.00012598089914283263, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.0002105904645381706, + "loss": 0.0173, "step": 229950 }, { - "epoch": 1.16, - "learning_rate": 0.0001259733314498186, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.00021058657632179911, + "loss": 0.0142, "step": 229960 }, { - "epoch": 1.16, - "learning_rate": 0.00012596576375680462, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021058268810542768, + "loss": 0.0154, "step": 229970 }, { - "epoch": 1.16, - "learning_rate": 0.0001259581960637906, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00021057879988905622, + "loss": 0.0176, "step": 229980 }, { - "epoch": 1.16, - "learning_rate": 0.00012595062837077658, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.00021057491167268474, + "loss": 0.0161, "step": 229990 }, { - "epoch": 1.16, - "learning_rate": 0.00012594306067776256, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.00021057102345631328, + "loss": 0.0179, "step": 230000 }, { - "epoch": 1.16, - "eval_cer": 0.9144556999612812, - "eval_loss": 0.006792085710912943, - "eval_runtime": 116.2077, - "eval_samples_per_second": 17.211, - "eval_steps_per_second": 4.303, + "epoch": 0.6, + "eval_cer": 0.8817558725266665, + "eval_loss": 0.011123710311949253, + "eval_runtime": 107.2187, + "eval_samples_per_second": 18.653, + "eval_steps_per_second": 4.663, "step": 230000 }, { - "epoch": 1.16, - "learning_rate": 0.00012593549298474857, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002105671352399418, + "loss": 0.0188, "step": 230010 }, { - "epoch": 1.16, - "learning_rate": 0.00012592792529173455, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00021056324702357036, + "loss": 0.0195, "step": 230020 }, { - "epoch": 1.16, - "learning_rate": 0.00012592035759872053, - "loss": 0.0076, + "epoch": 0.6, + "learning_rate": 0.00021055935880719888, + "loss": 0.0151, "step": 230030 }, { - "epoch": 1.16, - "learning_rate": 0.00012591278990570654, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021055547059082742, + "loss": 0.0143, "step": 230040 }, { - "epoch": 1.16, - "learning_rate": 0.00012590522221269252, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00021055158237445593, + "loss": 0.0153, "step": 230050 }, { - "epoch": 1.16, - "learning_rate": 0.0001258976545196785, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002105476941580845, + "loss": 0.0164, "step": 230060 }, { - "epoch": 1.16, - "learning_rate": 0.0001258900868266645, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00021054380594171302, + "loss": 0.0166, "step": 230070 }, { - "epoch": 1.16, - "learning_rate": 0.0001258825191336505, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00021053991772534156, + "loss": 0.0156, "step": 230080 }, { - "epoch": 1.16, - "learning_rate": 0.00012587495144063648, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00021053602950897007, + "loss": 0.012, "step": 230090 }, { - "epoch": 1.16, - "learning_rate": 0.00012586738374762248, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00021053214129259864, + "loss": 0.0153, "step": 230100 }, { - "epoch": 1.16, - "learning_rate": 0.00012585981605460847, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00021052825307622718, + "loss": 0.0209, "step": 230110 }, { - "epoch": 1.16, - "learning_rate": 0.00012585224836159445, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.0002105243648598557, + "loss": 0.0167, "step": 230120 }, { - "epoch": 1.16, - "learning_rate": 0.00012584468066858046, - "loss": 0.0122, + "epoch": 0.6, + "learning_rate": 0.00021052047664348421, + "loss": 0.0151, "step": 230130 }, { - "epoch": 1.16, - "learning_rate": 0.00012583711297556644, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00021051658842711278, + "loss": 0.0137, "step": 230140 }, { - "epoch": 1.16, - "learning_rate": 0.00012582954528255242, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021051270021074132, + "loss": 0.0147, "step": 230150 }, { - "epoch": 1.16, - "learning_rate": 0.00012582197758953843, - "loss": 0.0129, + "epoch": 0.6, + "learning_rate": 0.00021050881199436984, + "loss": 0.0142, "step": 230160 }, { - "epoch": 1.16, - "learning_rate": 0.0001258144098965244, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021050492377799838, + "loss": 0.0167, "step": 230170 }, { - "epoch": 1.16, - "learning_rate": 0.0001258068422035104, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021050103556162692, + "loss": 0.0151, "step": 230180 }, { - "epoch": 1.16, - "learning_rate": 0.00012579927451049637, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021049714734525546, + "loss": 0.0181, "step": 230190 }, { - "epoch": 1.16, - "learning_rate": 0.00012579170681748238, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00021049325912888398, + "loss": 0.0168, "step": 230200 }, { - "epoch": 1.16, - "learning_rate": 0.00012578413912446836, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00021048937091251252, + "loss": 0.0122, "step": 230210 }, { - "epoch": 1.16, - "learning_rate": 0.00012577657143145434, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00021048548269614106, + "loss": 0.0156, "step": 230220 }, { - "epoch": 1.16, - "learning_rate": 0.00012576900373844035, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002104815944797696, + "loss": 0.0183, "step": 230230 }, { - "epoch": 1.16, - "learning_rate": 0.00012576143604542633, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.00021047770626339812, + "loss": 0.0158, "step": 230240 }, { - "epoch": 1.16, - "learning_rate": 0.00012575386835241231, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021047381804702666, + "loss": 0.0163, "step": 230250 }, { - "epoch": 1.16, - "learning_rate": 0.00012574630065939832, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00021046992983065517, + "loss": 0.0219, "step": 230260 }, { - "epoch": 1.16, - "learning_rate": 0.0001257387329663843, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00021046604161428374, + "loss": 0.0192, "step": 230270 }, { - "epoch": 1.16, - "learning_rate": 0.00012573116527337029, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00021046215339791226, + "loss": 0.0146, "step": 230280 }, { - "epoch": 1.16, - "learning_rate": 0.0001257235975803563, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002104582651815408, + "loss": 0.0188, "step": 230290 }, { - "epoch": 1.16, - "learning_rate": 0.00012571602988734228, - "loss": 0.011, + "epoch": 0.6, + "learning_rate": 0.0002104543769651693, + "loss": 0.0118, "step": 230300 }, { - "epoch": 1.16, - "learning_rate": 0.00012570846219432826, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021045048874879788, + "loss": 0.016, "step": 230310 }, { - "epoch": 1.16, - "learning_rate": 0.00012570089450131427, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021044660053242642, + "loss": 0.0162, "step": 230320 }, { - "epoch": 1.16, - "learning_rate": 0.00012569332680830022, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00021044271231605494, + "loss": 0.015, "step": 230330 }, { - "epoch": 1.16, - "learning_rate": 0.00012568575911528623, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00021043882409968348, + "loss": 0.0183, "step": 230340 }, { - "epoch": 1.16, - "learning_rate": 0.0001256781914222722, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.00021043493588331202, + "loss": 0.0145, "step": 230350 }, { - "epoch": 1.16, - "learning_rate": 0.0001256706237292582, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021043104766694056, + "loss": 0.0178, "step": 230360 }, { - "epoch": 1.16, - "learning_rate": 0.00012566305603624417, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00021042715945056908, + "loss": 0.0179, "step": 230370 }, { - "epoch": 1.16, - "learning_rate": 0.00012565548834323018, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021042327123419762, + "loss": 0.0188, "step": 230380 }, { - "epoch": 1.16, - "learning_rate": 0.00012564792065021616, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00021041938301782616, + "loss": 0.0188, "step": 230390 }, { - "epoch": 1.16, - "learning_rate": 0.00012564035295720214, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.0002104154948014547, + "loss": 0.0139, "step": 230400 }, { - "epoch": 1.16, - "learning_rate": 0.00012563278526418815, - "loss": 0.0068, + "epoch": 0.6, + "learning_rate": 0.00021041160658508322, + "loss": 0.0167, "step": 230410 }, { - "epoch": 1.16, - "learning_rate": 0.00012562521757117413, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021040771836871176, + "loss": 0.0211, "step": 230420 }, { - "epoch": 1.16, - "learning_rate": 0.00012561764987816012, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.0002104038301523403, + "loss": 0.0171, "step": 230430 }, { - "epoch": 1.16, - "learning_rate": 0.00012561008218514612, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021039994193596884, + "loss": 0.0114, "step": 230440 }, { - "epoch": 1.16, - "learning_rate": 0.0001256025144921321, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021039605371959736, + "loss": 0.0186, "step": 230450 }, { - "epoch": 1.16, - "learning_rate": 0.0001255949467991181, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.0002103921655032259, + "loss": 0.0131, "step": 230460 }, { - "epoch": 1.16, - "learning_rate": 0.0001255873791061041, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00021038827728685447, + "loss": 0.014, "step": 230470 }, { - "epoch": 1.16, - "learning_rate": 0.00012557981141309008, - "loss": 0.0112, + "epoch": 0.6, + "learning_rate": 0.00021038438907048298, + "loss": 0.0212, "step": 230480 }, { - "epoch": 1.16, - "learning_rate": 0.00012557224372007606, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021038050085411152, + "loss": 0.0142, "step": 230490 }, { - "epoch": 1.16, - "learning_rate": 0.00012556467602706207, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021037661263774004, + "loss": 0.0151, "step": 230500 }, { - "epoch": 1.16, - "learning_rate": 0.00012555710833404805, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00021037272442136858, + "loss": 0.0187, "step": 230510 }, { - "epoch": 1.16, - "learning_rate": 0.00012554954064103403, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.00021036883620499712, + "loss": 0.0156, "step": 230520 }, { - "epoch": 1.16, - "learning_rate": 0.00012554197294802, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021036494798862566, + "loss": 0.0149, "step": 230530 }, { - "epoch": 1.16, - "learning_rate": 0.00012553440525500602, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021036105977225418, + "loss": 0.0125, "step": 230540 }, { - "epoch": 1.16, - "learning_rate": 0.000125526837561992, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00021035717155588272, + "loss": 0.0135, "step": 230550 }, { - "epoch": 1.16, - "learning_rate": 0.00012551926986897798, - "loss": 0.0076, + "epoch": 0.6, + "learning_rate": 0.00021035328333951126, + "loss": 0.0144, "step": 230560 }, { - "epoch": 1.16, - "learning_rate": 0.000125511702175964, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.0002103493951231398, + "loss": 0.0205, "step": 230570 }, { - "epoch": 1.16, - "learning_rate": 0.00012550413448294997, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021034550690676832, + "loss": 0.0164, "step": 230580 }, { - "epoch": 1.16, - "learning_rate": 0.00012549656678993595, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021034161869039686, + "loss": 0.0197, "step": 230590 }, { - "epoch": 1.16, - "learning_rate": 0.00012548899909692196, - "loss": 0.0073, + "epoch": 0.6, + "learning_rate": 0.0002103377304740254, + "loss": 0.0164, "step": 230600 }, { - "epoch": 1.16, - "learning_rate": 0.00012548143140390794, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.00021033384225765394, + "loss": 0.0196, "step": 230610 }, { - "epoch": 1.16, - "learning_rate": 0.00012547386371089393, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021032995404128246, + "loss": 0.0173, "step": 230620 }, { - "epoch": 1.16, - "learning_rate": 0.00012546629601787993, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.000210326065824911, + "loss": 0.0152, "step": 230630 }, { - "epoch": 1.16, - "learning_rate": 0.00012545872832486592, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00021032217760853957, + "loss": 0.0156, "step": 230640 }, { - "epoch": 1.16, - "learning_rate": 0.0001254511606318519, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021031828939216808, + "loss": 0.011, "step": 230650 }, { - "epoch": 1.16, - "learning_rate": 0.0001254435929388379, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021031440117579662, + "loss": 0.0141, "step": 230660 }, { - "epoch": 1.16, - "learning_rate": 0.0001254360252458239, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021031051295942514, + "loss": 0.0134, "step": 230670 }, { - "epoch": 1.16, - "learning_rate": 0.00012542845755280987, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.0002103066247430537, + "loss": 0.0136, "step": 230680 }, { - "epoch": 1.16, - "learning_rate": 0.00012542088985979588, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00021030273652668222, + "loss": 0.0177, "step": 230690 }, { - "epoch": 1.16, - "learning_rate": 0.00012541332216678186, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00021029884831031076, + "loss": 0.0184, "step": 230700 }, { - "epoch": 1.16, - "learning_rate": 0.00012540575447376784, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021029496009393928, + "loss": 0.0171, "step": 230710 }, { - "epoch": 1.16, - "learning_rate": 0.00012539818678075382, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021029107187756785, + "loss": 0.0136, "step": 230720 }, { - "epoch": 1.16, - "learning_rate": 0.00012539061908773983, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021028718366119636, + "loss": 0.0169, "step": 230730 }, { - "epoch": 1.16, - "learning_rate": 0.0001253830513947258, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002102832954448249, + "loss": 0.0153, "step": 230740 }, { - "epoch": 1.16, - "learning_rate": 0.0001253754837017118, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.00021027940722845342, + "loss": 0.0164, "step": 230750 }, { - "epoch": 1.16, - "learning_rate": 0.0001253679160086978, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00021027551901208196, + "loss": 0.0169, "step": 230760 }, { - "epoch": 1.16, - "learning_rate": 0.00012536034831568378, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002102716307957105, + "loss": 0.0164, "step": 230770 }, { - "epoch": 1.16, - "learning_rate": 0.00012535278062266976, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021026774257933904, + "loss": 0.0134, "step": 230780 }, { - "epoch": 1.16, - "learning_rate": 0.00012534521292965577, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021026385436296756, + "loss": 0.0152, "step": 230790 }, { - "epoch": 1.16, - "learning_rate": 0.00012533764523664175, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.0002102599661465961, + "loss": 0.0157, "step": 230800 }, { - "epoch": 1.16, - "learning_rate": 0.00012533007754362774, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021025607793022467, + "loss": 0.0152, "step": 230810 }, { - "epoch": 1.16, - "learning_rate": 0.00012532250985061374, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00021025218971385318, + "loss": 0.0163, "step": 230820 }, { - "epoch": 1.16, - "learning_rate": 0.00012531494215759973, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.0002102483014974817, + "loss": 0.018, "step": 230830 }, { - "epoch": 1.16, - "learning_rate": 0.0001253073744645857, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00021024441328111024, + "loss": 0.0206, "step": 230840 }, { - "epoch": 1.16, - "learning_rate": 0.00012529980677157172, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002102405250647388, + "loss": 0.0153, "step": 230850 }, { - "epoch": 1.16, - "learning_rate": 0.0001252922390785577, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.00021023663684836732, + "loss": 0.021, "step": 230860 }, { - "epoch": 1.16, - "learning_rate": 0.00012528467138554368, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021023274863199586, + "loss": 0.0223, "step": 230870 }, { - "epoch": 1.16, - "learning_rate": 0.00012527710369252966, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00021022886041562438, + "loss": 0.0169, "step": 230880 }, { - "epoch": 1.16, - "learning_rate": 0.00012526953599951567, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021022497219925294, + "loss": 0.0159, "step": 230890 }, { - "epoch": 1.16, - "learning_rate": 0.00012526196830650165, - "loss": 0.0082, + "epoch": 0.6, + "learning_rate": 0.00021022108398288146, + "loss": 0.0201, "step": 230900 }, { - "epoch": 1.16, - "learning_rate": 0.00012525440061348763, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00021021719576651, + "loss": 0.019, "step": 230910 }, { - "epoch": 1.17, - "learning_rate": 0.00012524683292047364, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021021330755013852, + "loss": 0.0151, "step": 230920 }, { - "epoch": 1.17, - "learning_rate": 0.00012523926522745962, - "loss": 0.012, + "epoch": 0.6, + "learning_rate": 0.00021020941933376708, + "loss": 0.0169, "step": 230930 }, { - "epoch": 1.17, - "learning_rate": 0.0001252316975344456, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.0002102055311173956, + "loss": 0.0168, "step": 230940 }, { - "epoch": 1.17, - "learning_rate": 0.0001252241298414316, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00021020164290102414, + "loss": 0.0158, "step": 230950 }, { - "epoch": 1.17, - "learning_rate": 0.00012521656214841757, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00021019775468465265, + "loss": 0.0172, "step": 230960 }, { - "epoch": 1.17, - "learning_rate": 0.00012520899445540357, - "loss": 0.0124, + "epoch": 0.6, + "learning_rate": 0.00021019386646828122, + "loss": 0.0187, "step": 230970 }, { - "epoch": 1.17, - "learning_rate": 0.00012520142676238956, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00021018997825190977, + "loss": 0.0152, "step": 230980 }, { - "epoch": 1.17, - "learning_rate": 0.00012519385906937554, - "loss": 0.011, + "epoch": 0.6, + "learning_rate": 0.00021018609003553828, + "loss": 0.0149, "step": 230990 }, { - "epoch": 1.17, - "learning_rate": 0.00012518629137636155, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002101822018191668, + "loss": 0.0201, "step": 231000 }, { - "epoch": 1.17, - "eval_cer": 0.9144353216426477, - "eval_loss": 0.006772263906896114, - "eval_runtime": 116.0719, - "eval_samples_per_second": 17.231, - "eval_steps_per_second": 4.308, + "epoch": 0.6, + "eval_cer": 0.8817656699852059, + "eval_loss": 0.010918508283793926, + "eval_runtime": 107.5234, + "eval_samples_per_second": 18.601, + "eval_steps_per_second": 4.65, "step": 231000 }, { - "epoch": 1.17, - "learning_rate": 0.00012517872368334753, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00021017831360279534, + "loss": 0.0149, "step": 231010 }, { - "epoch": 1.17, - "learning_rate": 0.0001251711559903335, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.0002101744253864239, + "loss": 0.0154, "step": 231020 }, { - "epoch": 1.17, - "learning_rate": 0.00012516358829731952, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021017053717005242, + "loss": 0.0152, "step": 231030 }, { - "epoch": 1.17, - "learning_rate": 0.0001251560206043055, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00021016664895368096, + "loss": 0.0205, "step": 231040 }, { - "epoch": 1.17, - "learning_rate": 0.00012514845291129148, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021016276073730948, + "loss": 0.0252, "step": 231050 }, { - "epoch": 1.17, - "learning_rate": 0.0001251408852182775, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00021015887252093804, + "loss": 0.0171, "step": 231060 }, { - "epoch": 1.17, - "learning_rate": 0.00012513331752526347, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00021015498430456656, + "loss": 0.0152, "step": 231070 }, { - "epoch": 1.17, - "learning_rate": 0.00012512574983224945, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002101510960881951, + "loss": 0.0117, "step": 231080 }, { - "epoch": 1.17, - "learning_rate": 0.00012511818213923543, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00021014720787182361, + "loss": 0.0147, "step": 231090 }, { - "epoch": 1.17, - "learning_rate": 0.00012511061444622144, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00021014331965545218, + "loss": 0.0149, "step": 231100 }, { - "epoch": 1.17, - "learning_rate": 0.00012510304675320742, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.0002101394314390807, + "loss": 0.0162, "step": 231110 }, { - "epoch": 1.17, - "learning_rate": 0.0001250954790601934, - "loss": 0.0135, + "epoch": 0.6, + "learning_rate": 0.00021013554322270924, + "loss": 0.0148, "step": 231120 }, { - "epoch": 1.17, - "learning_rate": 0.0001250879113671794, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.00021013165500633775, + "loss": 0.0118, "step": 231130 }, { - "epoch": 1.17, - "learning_rate": 0.0001250803436741654, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.00021012776678996632, + "loss": 0.0169, "step": 231140 }, { - "epoch": 1.17, - "learning_rate": 0.00012507277598115138, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00021012387857359484, + "loss": 0.0157, "step": 231150 }, { - "epoch": 1.17, - "learning_rate": 0.00012506520828813738, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00021011999035722338, + "loss": 0.018, "step": 231160 }, { - "epoch": 1.17, - "learning_rate": 0.00012505764059512337, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002101161021408519, + "loss": 0.0165, "step": 231170 }, { - "epoch": 1.17, - "learning_rate": 0.00012505007290210935, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00021011221392448046, + "loss": 0.0174, "step": 231180 }, { - "epoch": 1.17, - "learning_rate": 0.00012504250520909536, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.000210108325708109, + "loss": 0.0137, "step": 231190 }, { - "epoch": 1.17, - "learning_rate": 0.00012503493751608134, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00021010443749173752, + "loss": 0.0247, "step": 231200 }, { - "epoch": 1.17, - "learning_rate": 0.00012502736982306732, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00021010054927536606, + "loss": 0.0136, "step": 231210 }, { - "epoch": 1.17, - "learning_rate": 0.00012501980213005333, - "loss": 0.0116, + "epoch": 0.6, + "learning_rate": 0.0002100966610589946, + "loss": 0.0158, "step": 231220 }, { - "epoch": 1.17, - "learning_rate": 0.0001250122344370393, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00021009277284262314, + "loss": 0.0195, "step": 231230 }, { - "epoch": 1.17, - "learning_rate": 0.0001250046667440253, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00021008888462625166, + "loss": 0.0251, "step": 231240 }, { - "epoch": 1.17, - "learning_rate": 0.00012499709905101127, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.0002100849964098802, + "loss": 0.0148, "step": 231250 }, { - "epoch": 1.17, - "learning_rate": 0.00012498953135799728, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.00021008110819350871, + "loss": 0.0125, "step": 231260 }, { - "epoch": 1.17, - "learning_rate": 0.00012498196366498326, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00021007721997713728, + "loss": 0.015, "step": 231270 }, { - "epoch": 1.17, - "learning_rate": 0.00012497439597196924, - "loss": 0.0112, + "epoch": 0.6, + "learning_rate": 0.0002100733317607658, + "loss": 0.018, "step": 231280 }, { - "epoch": 1.17, - "learning_rate": 0.00012496682827895525, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00021006944354439434, + "loss": 0.0181, "step": 231290 }, { - "epoch": 1.17, - "learning_rate": 0.00012495926058594123, - "loss": 0.0113, - "step": 231300 + "epoch": 0.6, + "learning_rate": 0.00021006555532802285, + "loss": 0.0173, + "step": 231300 }, { - "epoch": 1.17, - "learning_rate": 0.00012495169289292721, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021006166711165142, + "loss": 0.0134, "step": 231310 }, { - "epoch": 1.17, - "learning_rate": 0.00012494412519991322, - "loss": 0.013, + "epoch": 0.6, + "learning_rate": 0.00021005777889527994, + "loss": 0.0172, "step": 231320 }, { - "epoch": 1.17, - "learning_rate": 0.0001249365575068992, - "loss": 0.0074, + "epoch": 0.6, + "learning_rate": 0.00021005389067890848, + "loss": 0.0128, "step": 231330 }, { - "epoch": 1.17, - "learning_rate": 0.00012492898981388519, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.000210050002462537, + "loss": 0.0138, "step": 231340 }, { - "epoch": 1.17, - "learning_rate": 0.0001249214221208712, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00021004611424616556, + "loss": 0.018, "step": 231350 }, { - "epoch": 1.17, - "learning_rate": 0.00012491385442785718, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.0002100422260297941, + "loss": 0.015, "step": 231360 }, { - "epoch": 1.17, - "learning_rate": 0.00012490628673484316, - "loss": 0.0136, + "epoch": 0.6, + "learning_rate": 0.00021003833781342262, + "loss": 0.0194, "step": 231370 }, { - "epoch": 1.17, - "learning_rate": 0.00012489871904182917, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00021003444959705116, + "loss": 0.0156, "step": 231380 }, { - "epoch": 1.17, - "learning_rate": 0.00012489115134881515, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002100305613806797, + "loss": 0.0162, "step": 231390 }, { - "epoch": 1.17, - "learning_rate": 0.00012488358365580113, - "loss": 0.0073, + "epoch": 0.6, + "learning_rate": 0.00021002667316430824, + "loss": 0.0157, "step": 231400 }, { - "epoch": 1.17, - "learning_rate": 0.0001248760159627871, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00021002278494793676, + "loss": 0.0187, "step": 231410 }, { - "epoch": 1.17, - "learning_rate": 0.00012486844826977312, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002100188967315653, + "loss": 0.0154, "step": 231420 }, { - "epoch": 1.17, - "learning_rate": 0.0001248608805767591, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00021001500851519384, + "loss": 0.0176, "step": 231430 }, { - "epoch": 1.17, - "learning_rate": 0.00012485331288374508, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.00021001112029882238, + "loss": 0.0187, "step": 231440 }, { - "epoch": 1.17, - "learning_rate": 0.0001248457451907311, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.0002100072320824509, + "loss": 0.0142, "step": 231450 }, { - "epoch": 1.17, - "learning_rate": 0.00012483817749771707, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00021000334386607944, + "loss": 0.0147, "step": 231460 }, { - "epoch": 1.17, - "learning_rate": 0.00012483060980470305, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00020999945564970798, + "loss": 0.0153, "step": 231470 }, { - "epoch": 1.17, - "learning_rate": 0.00012482304211168906, - "loss": 0.0072, + "epoch": 0.6, + "learning_rate": 0.00020999556743333652, + "loss": 0.015, "step": 231480 }, { - "epoch": 1.17, - "learning_rate": 0.00012481547441867504, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020999167921696504, + "loss": 0.0176, "step": 231490 }, { - "epoch": 1.17, - "learning_rate": 0.00012480790672566102, - "loss": 0.0118, + "epoch": 0.6, + "learning_rate": 0.00020998779100059358, + "loss": 0.0149, "step": 231500 }, { - "epoch": 1.17, - "learning_rate": 0.00012480033903264703, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.0002099839027842221, + "loss": 0.0215, "step": 231510 }, { - "epoch": 1.17, - "learning_rate": 0.00012479277133963301, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00020998001456785066, + "loss": 0.0161, "step": 231520 }, { - "epoch": 1.17, - "learning_rate": 0.000124785203646619, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002099761263514792, + "loss": 0.0123, "step": 231530 }, { - "epoch": 1.17, - "learning_rate": 0.000124777635953605, - "loss": 0.007, + "epoch": 0.6, + "learning_rate": 0.00020997223813510772, + "loss": 0.0175, "step": 231540 }, { - "epoch": 1.17, - "learning_rate": 0.00012477006826059099, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00020996834991873623, + "loss": 0.0183, "step": 231550 }, { - "epoch": 1.17, - "learning_rate": 0.00012476250056757697, - "loss": 0.0116, + "epoch": 0.6, + "learning_rate": 0.0002099644617023648, + "loss": 0.0153, "step": 231560 }, { - "epoch": 1.17, - "learning_rate": 0.00012475493287456298, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020996057348599334, + "loss": 0.0224, "step": 231570 }, { - "epoch": 1.17, - "learning_rate": 0.00012474736518154896, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00020995668526962186, + "loss": 0.016, "step": 231580 }, { - "epoch": 1.17, - "learning_rate": 0.00012473979748853494, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002099527970532504, + "loss": 0.0153, "step": 231590 }, { - "epoch": 1.17, - "learning_rate": 0.00012473222979552092, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00020994890883687894, + "loss": 0.0172, "step": 231600 }, { - "epoch": 1.17, - "learning_rate": 0.0001247246621025069, - "loss": 0.0131, + "epoch": 0.6, + "learning_rate": 0.00020994502062050748, + "loss": 0.0185, "step": 231610 }, { - "epoch": 1.17, - "learning_rate": 0.00012471709440949288, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.000209941132404136, + "loss": 0.0127, "step": 231620 }, { - "epoch": 1.17, - "learning_rate": 0.0001247095267164789, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020993724418776454, + "loss": 0.0175, "step": 231630 }, { - "epoch": 1.17, - "learning_rate": 0.00012470195902346487, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00020993335597139308, + "loss": 0.0188, "step": 231640 }, { - "epoch": 1.17, - "learning_rate": 0.00012469439133045085, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020992946775502162, + "loss": 0.0144, "step": 231650 }, { - "epoch": 1.17, - "learning_rate": 0.00012468682363743686, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00020992557953865014, + "loss": 0.0208, "step": 231660 }, { - "epoch": 1.17, - "learning_rate": 0.00012467925594442284, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00020992169132227868, + "loss": 0.0175, "step": 231670 }, { - "epoch": 1.17, - "learning_rate": 0.00012467168825140883, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020991780310590725, + "loss": 0.0157, "step": 231680 }, { - "epoch": 1.17, - "learning_rate": 0.00012466412055839483, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020991391488953576, + "loss": 0.0155, "step": 231690 }, { - "epoch": 1.17, - "learning_rate": 0.00012465655286538082, - "loss": 0.011, + "epoch": 0.6, + "learning_rate": 0.0002099100266731643, + "loss": 0.018, "step": 231700 }, { - "epoch": 1.17, - "learning_rate": 0.0001246489851723668, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00020990613845679282, + "loss": 0.0158, "step": 231710 }, { - "epoch": 1.17, - "learning_rate": 0.0001246414174793528, - "loss": 0.0109, + "epoch": 0.6, + "learning_rate": 0.00020990225024042139, + "loss": 0.0164, "step": 231720 }, { - "epoch": 1.17, - "learning_rate": 0.0001246338497863388, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.0002098983620240499, + "loss": 0.0148, "step": 231730 }, { - "epoch": 1.17, - "learning_rate": 0.00012462628209332477, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.00020989447380767844, + "loss": 0.0189, "step": 231740 }, { - "epoch": 1.17, - "learning_rate": 0.00012461871440031078, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00020989058559130696, + "loss": 0.0152, "step": 231750 }, { - "epoch": 1.17, - "learning_rate": 0.00012461114670729676, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002098866973749355, + "loss": 0.0171, "step": 231760 }, { - "epoch": 1.17, - "learning_rate": 0.00012460357901428274, - "loss": 0.0066, + "epoch": 0.6, + "learning_rate": 0.00020988280915856404, + "loss": 0.0144, "step": 231770 }, { - "epoch": 1.17, - "learning_rate": 0.00012459601132126872, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020987892094219258, + "loss": 0.0189, "step": 231780 }, { - "epoch": 1.17, - "learning_rate": 0.00012458844362825473, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.0002098750327258211, + "loss": 0.0211, "step": 231790 }, { - "epoch": 1.17, - "learning_rate": 0.0001245808759352407, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020987114450944964, + "loss": 0.0156, "step": 231800 }, { - "epoch": 1.17, - "learning_rate": 0.0001245733082422267, - "loss": 0.0115, + "epoch": 0.6, + "learning_rate": 0.00020986725629307818, + "loss": 0.0116, "step": 231810 }, { - "epoch": 1.17, - "learning_rate": 0.0001245657405492127, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020986336807670672, + "loss": 0.0173, "step": 231820 }, { - "epoch": 1.17, - "learning_rate": 0.00012455817285619868, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.00020985947986033524, + "loss": 0.0186, "step": 231830 }, { - "epoch": 1.17, - "learning_rate": 0.00012455060516318466, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020985559164396378, + "loss": 0.0179, "step": 231840 }, { - "epoch": 1.17, - "learning_rate": 0.00012454303747017067, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020985170342759235, + "loss": 0.0143, "step": 231850 }, { - "epoch": 1.17, - "learning_rate": 0.00012453546977715665, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020984781521122086, + "loss": 0.0204, "step": 231860 }, { - "epoch": 1.17, - "learning_rate": 0.00012452790208414264, - "loss": 0.0113, + "epoch": 0.6, + "learning_rate": 0.00020984392699484937, + "loss": 0.0159, "step": 231870 }, { - "epoch": 1.17, - "learning_rate": 0.00012452033439112864, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00020984003877847792, + "loss": 0.0186, "step": 231880 }, { - "epoch": 1.17, - "learning_rate": 0.00012451276669811463, - "loss": 0.0124, + "epoch": 0.6, + "learning_rate": 0.00020983615056210648, + "loss": 0.0148, "step": 231890 }, { - "epoch": 1.17, - "learning_rate": 0.0001245051990051006, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.000209832262345735, + "loss": 0.0124, "step": 231900 }, { - "epoch": 1.17, - "learning_rate": 0.00012449763131208662, - "loss": 0.0112, + "epoch": 0.6, + "learning_rate": 0.00020982837412936354, + "loss": 0.0154, "step": 231910 }, { - "epoch": 1.17, - "learning_rate": 0.0001244900636190726, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020982448591299206, + "loss": 0.0155, "step": 231920 }, { - "epoch": 1.17, - "learning_rate": 0.00012448249592605858, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020982059769662062, + "loss": 0.02, "step": 231930 }, { - "epoch": 1.17, - "learning_rate": 0.00012447492823304456, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020981670948024914, + "loss": 0.0138, "step": 231940 }, { - "epoch": 1.17, - "learning_rate": 0.00012446736054003057, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020981282126387768, + "loss": 0.0178, "step": 231950 }, { - "epoch": 1.17, - "learning_rate": 0.00012445979284701655, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.0002098089330475062, + "loss": 0.0191, "step": 231960 }, { - "epoch": 1.17, - "learning_rate": 0.00012445222515400253, - "loss": 0.0072, + "epoch": 0.6, + "learning_rate": 0.00020980504483113476, + "loss": 0.0147, "step": 231970 }, { - "epoch": 1.17, - "learning_rate": 0.00012444465746098854, - "loss": 0.0095, + "epoch": 0.6, + "learning_rate": 0.00020980115661476328, + "loss": 0.0202, "step": 231980 }, { - "epoch": 1.17, - "learning_rate": 0.00012443708976797452, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00020979726839839182, + "loss": 0.0165, "step": 231990 }, { - "epoch": 1.17, - "learning_rate": 0.0001244295220749605, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020979338018202033, + "loss": 0.02, "step": 232000 }, { - "epoch": 1.17, - "eval_cer": 0.9144654039225352, - "eval_loss": 0.006733159068971872, - "eval_runtime": 115.9285, - "eval_samples_per_second": 17.252, - "eval_steps_per_second": 4.313, + "epoch": 0.6, + "eval_cer": 0.8817768670806793, + "eval_loss": 0.010772459208965302, + "eval_runtime": 107.4987, + "eval_samples_per_second": 18.605, + "eval_steps_per_second": 4.651, "step": 232000 }, { - "epoch": 1.17, - "learning_rate": 0.0001244219543819465, - "loss": 0.0108, + "epoch": 0.6, + "learning_rate": 0.00020978949196564888, + "loss": 0.0152, "step": 232010 }, { - "epoch": 1.17, - "learning_rate": 0.0001244143866889325, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020978560374927742, + "loss": 0.0174, "step": 232020 }, { - "epoch": 1.17, - "learning_rate": 0.00012440681899591848, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020978171553290596, + "loss": 0.0168, "step": 232030 }, { - "epoch": 1.17, - "learning_rate": 0.00012439925130290448, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020977782731653447, + "loss": 0.0178, "step": 232040 }, { - "epoch": 1.17, - "learning_rate": 0.00012439168360989047, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.00020977393910016302, + "loss": 0.0159, "step": 232050 }, { - "epoch": 1.17, - "learning_rate": 0.00012438411591687645, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.00020977005088379158, + "loss": 0.0132, "step": 232060 }, { - "epoch": 1.17, - "learning_rate": 0.00012437654822386246, - "loss": 0.0072, + "epoch": 0.6, + "learning_rate": 0.0002097661626674201, + "loss": 0.0144, "step": 232070 }, { - "epoch": 1.17, - "learning_rate": 0.00012436898053084844, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020976227445104864, + "loss": 0.0163, "step": 232080 }, { - "epoch": 1.17, - "learning_rate": 0.00012436141283783442, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020975838623467716, + "loss": 0.0154, "step": 232090 }, { - "epoch": 1.17, - "learning_rate": 0.00012435384514482043, - "loss": 0.0129, + "epoch": 0.6, + "learning_rate": 0.00020975449801830572, + "loss": 0.0155, "step": 232100 }, { - "epoch": 1.17, - "learning_rate": 0.0001243462774518064, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020975060980193424, + "loss": 0.0178, "step": 232110 }, { - "epoch": 1.17, - "learning_rate": 0.0001243387097587924, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020974672158556278, + "loss": 0.0178, "step": 232120 }, { - "epoch": 1.17, - "learning_rate": 0.00012433114206577837, - "loss": 0.0117, + "epoch": 0.6, + "learning_rate": 0.0002097428333691913, + "loss": 0.0192, "step": 232130 }, { - "epoch": 1.17, - "learning_rate": 0.00012432357437276438, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020973894515281986, + "loss": 0.0172, "step": 232140 }, { - "epoch": 1.17, - "learning_rate": 0.00012431600667975036, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00020973505693644838, + "loss": 0.0239, "step": 232150 }, { - "epoch": 1.17, - "learning_rate": 0.00012430843898673634, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020973116872007692, + "loss": 0.0184, "step": 232160 }, { - "epoch": 1.17, - "learning_rate": 0.00012430087129372235, - "loss": 0.0131, + "epoch": 0.6, + "learning_rate": 0.00020972728050370543, + "loss": 0.0171, "step": 232170 }, { - "epoch": 1.17, - "learning_rate": 0.00012429330360070833, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.000209723392287334, + "loss": 0.0149, "step": 232180 }, { - "epoch": 1.17, - "learning_rate": 0.00012428573590769431, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020971950407096252, + "loss": 0.0157, "step": 232190 }, { - "epoch": 1.17, - "learning_rate": 0.00012427816821468032, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020971561585459106, + "loss": 0.0184, "step": 232200 }, { - "epoch": 1.17, - "learning_rate": 0.00012427060052166628, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020971172763821957, + "loss": 0.0184, "step": 232210 }, { - "epoch": 1.17, - "learning_rate": 0.00012426303282865229, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020970783942184814, + "loss": 0.0184, "step": 232220 }, { - "epoch": 1.17, - "learning_rate": 0.00012425546513563827, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020970395120547668, + "loss": 0.0149, "step": 232230 }, { - "epoch": 1.17, - "learning_rate": 0.00012424789744262425, - "loss": 0.0123, + "epoch": 0.6, + "learning_rate": 0.0002097000629891052, + "loss": 0.0141, "step": 232240 }, { - "epoch": 1.17, - "learning_rate": 0.00012424032974961026, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00020969617477273374, + "loss": 0.0199, "step": 232250 }, { - "epoch": 1.17, - "learning_rate": 0.00012423276205659624, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.00020969228655636225, + "loss": 0.0155, "step": 232260 }, { - "epoch": 1.17, - "learning_rate": 0.00012422519436358222, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020968839833999082, + "loss": 0.0156, "step": 232270 }, { - "epoch": 1.17, - "learning_rate": 0.00012421762667056823, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020968451012361934, + "loss": 0.0156, "step": 232280 }, { - "epoch": 1.17, - "learning_rate": 0.0001242100589775542, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00020968062190724788, + "loss": 0.0171, "step": 232290 }, { - "epoch": 1.17, - "learning_rate": 0.0001242024912845402, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.0002096767336908764, + "loss": 0.0226, "step": 232300 }, { - "epoch": 1.17, - "learning_rate": 0.00012419492359152617, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00020967284547450496, + "loss": 0.0144, "step": 232310 }, { - "epoch": 1.17, - "learning_rate": 0.00012418735589851218, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020966895725813348, + "loss": 0.0153, "step": 232320 }, { - "epoch": 1.17, - "learning_rate": 0.00012417978820549816, - "loss": 0.0076, + "epoch": 0.6, + "learning_rate": 0.00020966506904176202, + "loss": 0.0173, "step": 232330 }, { - "epoch": 1.17, - "learning_rate": 0.00012417222051248414, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020966118082539053, + "loss": 0.0139, "step": 232340 }, { - "epoch": 1.17, - "learning_rate": 0.00012416465281947015, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.0002096572926090191, + "loss": 0.0164, "step": 232350 }, { - "epoch": 1.17, - "learning_rate": 0.00012415708512645613, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.00020965340439264762, + "loss": 0.0163, "step": 232360 }, { - "epoch": 1.17, - "learning_rate": 0.00012414951743344212, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020964951617627616, + "loss": 0.0153, "step": 232370 }, { - "epoch": 1.17, - "learning_rate": 0.00012414194974042812, - "loss": 0.0116, + "epoch": 0.6, + "learning_rate": 0.00020964562795990467, + "loss": 0.0147, "step": 232380 }, { - "epoch": 1.17, - "learning_rate": 0.0001241343820474141, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020964173974353324, + "loss": 0.0164, "step": 232390 }, { - "epoch": 1.17, - "learning_rate": 0.0001241268143544001, - "loss": 0.0075, + "epoch": 0.6, + "learning_rate": 0.00020963785152716178, + "loss": 0.0155, "step": 232400 }, { - "epoch": 1.17, - "learning_rate": 0.0001241192466613861, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.0002096339633107903, + "loss": 0.0127, "step": 232410 }, { - "epoch": 1.17, - "learning_rate": 0.00012411167896837208, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002096300750944188, + "loss": 0.016, "step": 232420 }, { - "epoch": 1.17, - "learning_rate": 0.00012410411127535806, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020962618687804738, + "loss": 0.014, "step": 232430 }, { - "epoch": 1.17, - "learning_rate": 0.00012409654358234407, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.00020962229866167592, + "loss": 0.0196, "step": 232440 }, { - "epoch": 1.17, - "learning_rate": 0.00012408897588933005, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020961841044530444, + "loss": 0.0118, "step": 232450 }, { - "epoch": 1.17, - "learning_rate": 0.00012408140819631603, - "loss": 0.0155, + "epoch": 0.6, + "learning_rate": 0.00020961452222893298, + "loss": 0.0181, "step": 232460 }, { - "epoch": 1.17, - "learning_rate": 0.000124073840503302, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020961063401256152, + "loss": 0.0154, "step": 232470 }, { - "epoch": 1.17, - "learning_rate": 0.00012406627281028802, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00020960674579619006, + "loss": 0.0202, "step": 232480 }, { - "epoch": 1.17, - "learning_rate": 0.000124058705117274, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020960285757981858, + "loss": 0.017, "step": 232490 }, { - "epoch": 1.17, - "learning_rate": 0.00012405113742425998, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020959896936344712, + "loss": 0.0177, "step": 232500 }, { - "epoch": 1.17, - "learning_rate": 0.000124043569731246, - "loss": 0.0065, + "epoch": 0.6, + "learning_rate": 0.00020959508114707563, + "loss": 0.0154, "step": 232510 }, { - "epoch": 1.17, - "learning_rate": 0.00012403600203823197, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.0002095911929307042, + "loss": 0.0137, "step": 232520 }, { - "epoch": 1.17, - "learning_rate": 0.00012402843434521795, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020958730471433272, + "loss": 0.0194, "step": 232530 }, { - "epoch": 1.17, - "learning_rate": 0.00012402086665220396, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020958341649796126, + "loss": 0.0166, "step": 232540 }, { - "epoch": 1.17, - "learning_rate": 0.00012401329895918994, - "loss": 0.0118, + "epoch": 0.6, + "learning_rate": 0.00020957952828158977, + "loss": 0.0148, "step": 232550 }, { - "epoch": 1.17, - "learning_rate": 0.00012400573126617593, - "loss": 0.007, + "epoch": 0.6, + "learning_rate": 0.00020957564006521834, + "loss": 0.0169, "step": 232560 }, { - "epoch": 1.17, - "learning_rate": 0.00012399816357316193, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.00020957175184884688, + "loss": 0.0163, "step": 232570 }, { - "epoch": 1.17, - "learning_rate": 0.00012399059588014792, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.0002095678636324754, + "loss": 0.0137, "step": 232580 }, { - "epoch": 1.17, - "learning_rate": 0.0001239830281871339, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.0002095639754161039, + "loss": 0.0142, "step": 232590 }, { - "epoch": 1.17, - "learning_rate": 0.0001239754604941199, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00020956008719973248, + "loss": 0.0192, "step": 232600 }, { - "epoch": 1.17, - "learning_rate": 0.0001239678928011059, - "loss": 0.0138, + "epoch": 0.6, + "learning_rate": 0.00020955619898336102, + "loss": 0.0144, "step": 232610 }, { - "epoch": 1.17, - "learning_rate": 0.00012396032510809187, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020955231076698954, + "loss": 0.0202, "step": 232620 }, { - "epoch": 1.17, - "learning_rate": 0.00012395275741507788, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020954842255061808, + "loss": 0.0156, "step": 232630 }, { - "epoch": 1.17, - "learning_rate": 0.00012394518972206386, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020954453433424662, + "loss": 0.0144, "step": 232640 }, { - "epoch": 1.17, - "learning_rate": 0.00012393762202904984, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00020954064611787516, + "loss": 0.0169, "step": 232650 }, { - "epoch": 1.17, - "learning_rate": 0.00012393005433603582, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00020953675790150368, + "loss": 0.0164, "step": 232660 }, { - "epoch": 1.17, - "learning_rate": 0.00012392248664302183, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020953286968513222, + "loss": 0.015, "step": 232670 }, { - "epoch": 1.17, - "learning_rate": 0.0001239149189500078, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.00020952898146876076, + "loss": 0.0131, "step": 232680 }, { - "epoch": 1.17, - "learning_rate": 0.0001239073512569938, - "loss": 0.0119, + "epoch": 0.6, + "learning_rate": 0.0002095250932523893, + "loss": 0.0167, "step": 232690 }, { - "epoch": 1.17, - "learning_rate": 0.0001238997835639798, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.00020952120503601782, + "loss": 0.0175, "step": 232700 }, { - "epoch": 1.17, - "learning_rate": 0.00012389221587096578, - "loss": 0.0098, + "epoch": 0.6, + "learning_rate": 0.00020951731681964636, + "loss": 0.0119, "step": 232710 }, { - "epoch": 1.17, - "learning_rate": 0.00012388464817795176, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.00020951342860327493, + "loss": 0.0158, "step": 232720 }, { - "epoch": 1.17, - "learning_rate": 0.00012387708048493777, - "loss": 0.0117, + "epoch": 0.6, + "learning_rate": 0.00020950954038690344, + "loss": 0.017, "step": 232730 }, { - "epoch": 1.17, - "learning_rate": 0.00012386951279192375, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020950565217053195, + "loss": 0.0156, "step": 232740 }, { - "epoch": 1.17, - "learning_rate": 0.00012386194509890974, - "loss": 0.0105, + "epoch": 0.6, + "learning_rate": 0.0002095017639541605, + "loss": 0.0225, "step": 232750 }, { - "epoch": 1.17, - "learning_rate": 0.00012385437740589574, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.000209497875737789, + "loss": 0.0156, "step": 232760 }, { - "epoch": 1.17, - "learning_rate": 0.00012384680971288173, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020949398752141758, + "loss": 0.014, "step": 232770 }, { - "epoch": 1.17, - "learning_rate": 0.0001238392420198677, - "loss": 0.0071, + "epoch": 0.6, + "learning_rate": 0.00020949009930504612, + "loss": 0.0164, "step": 232780 }, { - "epoch": 1.17, - "learning_rate": 0.00012383167432685372, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.00020948621108867464, + "loss": 0.013, "step": 232790 }, { - "epoch": 1.17, - "learning_rate": 0.0001238241066338397, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020948232287230318, + "loss": 0.0214, "step": 232800 }, { - "epoch": 1.17, - "learning_rate": 0.00012381653894082568, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.00020947843465593172, + "loss": 0.0145, "step": 232810 }, { - "epoch": 1.17, - "learning_rate": 0.00012380897124781166, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.00020947454643956026, + "loss": 0.019, "step": 232820 }, { - "epoch": 1.17, - "learning_rate": 0.00012380140355479767, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020947065822318878, + "loss": 0.0156, "step": 232830 }, { - "epoch": 1.17, - "learning_rate": 0.00012379383586178362, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020946677000681732, + "loss": 0.013, "step": 232840 }, { - "epoch": 1.17, - "learning_rate": 0.00012378626816876963, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020946288179044586, + "loss": 0.0162, "step": 232850 }, { - "epoch": 1.17, - "learning_rate": 0.0001237787004757556, - "loss": 0.0096, + "epoch": 0.6, + "learning_rate": 0.0002094589935740744, + "loss": 0.0157, "step": 232860 }, { - "epoch": 1.17, - "learning_rate": 0.0001237711327827416, - "loss": 0.0117, + "epoch": 0.6, + "learning_rate": 0.00020945510535770291, + "loss": 0.0167, "step": 232870 }, { - "epoch": 1.17, - "learning_rate": 0.0001237635650897276, - "loss": 0.009, + "epoch": 0.6, + "learning_rate": 0.00020945121714133146, + "loss": 0.0162, "step": 232880 }, { - "epoch": 1.17, - "learning_rate": 0.00012375599739671358, - "loss": 0.01, + "epoch": 0.6, + "learning_rate": 0.00020944732892496, + "loss": 0.0148, "step": 232890 }, { - "epoch": 1.18, - "learning_rate": 0.00012374842970369957, - "loss": 0.0089, + "epoch": 0.6, + "learning_rate": 0.00020944344070858854, + "loss": 0.015, "step": 232900 }, { - "epoch": 1.18, - "learning_rate": 0.00012374086201068557, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020943955249221705, + "loss": 0.015, "step": 232910 }, { - "epoch": 1.18, - "learning_rate": 0.00012373329431767156, - "loss": 0.0087, + "epoch": 0.6, + "learning_rate": 0.0002094356642758456, + "loss": 0.014, "step": 232920 }, { - "epoch": 1.18, - "learning_rate": 0.00012372572662465754, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020943177605947416, + "loss": 0.0182, "step": 232930 }, { - "epoch": 1.18, - "learning_rate": 0.00012371815893164355, - "loss": 0.0067, + "epoch": 0.6, + "learning_rate": 0.00020942788784310268, + "loss": 0.0251, "step": 232940 }, { - "epoch": 1.18, - "learning_rate": 0.00012371059123862953, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020942399962673122, + "loss": 0.0151, "step": 232950 }, { - "epoch": 1.18, - "learning_rate": 0.0001237030235456155, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020942011141035974, + "loss": 0.0164, "step": 232960 }, { - "epoch": 1.18, - "learning_rate": 0.00012369545585260152, - "loss": 0.0097, + "epoch": 0.6, + "learning_rate": 0.0002094162231939883, + "loss": 0.0203, "step": 232970 }, { - "epoch": 1.18, - "learning_rate": 0.0001236878881595875, - "loss": 0.008, + "epoch": 0.6, + "learning_rate": 0.00020941233497761682, + "loss": 0.0191, "step": 232980 }, { - "epoch": 1.18, - "learning_rate": 0.00012368032046657348, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020940844676124536, + "loss": 0.0161, "step": 232990 }, { - "epoch": 1.18, - "learning_rate": 0.0001236727527735595, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020940455854487387, + "loss": 0.0171, "step": 233000 }, { - "epoch": 1.18, - "eval_cer": 0.914438232831024, - "eval_loss": 0.006864336784929037, - "eval_runtime": 115.9429, - "eval_samples_per_second": 17.25, - "eval_steps_per_second": 4.312, + "epoch": 0.6, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.011502685025334358, + "eval_runtime": 107.4531, + "eval_samples_per_second": 18.613, + "eval_steps_per_second": 4.653, "step": 233000 }, { - "epoch": 1.18, - "learning_rate": 0.00012366518508054547, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.00020940067032850242, + "loss": 0.0146, "step": 233010 }, { - "epoch": 1.18, - "learning_rate": 0.00012365761738753145, - "loss": 0.0101, + "epoch": 0.6, + "learning_rate": 0.00020939678211213096, + "loss": 0.0184, "step": 233020 }, { - "epoch": 1.18, - "learning_rate": 0.00012365004969451743, - "loss": 0.0131, + "epoch": 0.6, + "learning_rate": 0.0002093928938957595, + "loss": 0.0181, "step": 233030 }, { - "epoch": 1.18, - "learning_rate": 0.00012364248200150344, - "loss": 0.0068, + "epoch": 0.6, + "learning_rate": 0.00020938900567938801, + "loss": 0.016, "step": 233040 }, { - "epoch": 1.18, - "learning_rate": 0.00012363491430848942, - "loss": 0.0107, + "epoch": 0.6, + "learning_rate": 0.00020938511746301656, + "loss": 0.0144, "step": 233050 }, { - "epoch": 1.18, - "learning_rate": 0.0001236273466154754, - "loss": 0.0104, + "epoch": 0.6, + "learning_rate": 0.0002093812292466451, + "loss": 0.0158, "step": 233060 }, { - "epoch": 1.18, - "learning_rate": 0.0001236197789224614, - "loss": 0.0077, + "epoch": 0.6, + "learning_rate": 0.00020937734103027364, + "loss": 0.0174, "step": 233070 }, { - "epoch": 1.18, - "learning_rate": 0.0001236122112294474, - "loss": 0.0091, + "epoch": 0.6, + "learning_rate": 0.00020937345281390215, + "loss": 0.0149, "step": 233080 }, { - "epoch": 1.18, - "learning_rate": 0.00012360464353643338, - "loss": 0.0111, + "epoch": 0.6, + "learning_rate": 0.0002093695645975307, + "loss": 0.0181, "step": 233090 }, { - "epoch": 1.18, - "learning_rate": 0.00012359707584341938, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00020936567638115926, + "loss": 0.0174, "step": 233100 }, { - "epoch": 1.18, - "learning_rate": 0.00012358950815040537, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020936178816478778, + "loss": 0.013, "step": 233110 }, { - "epoch": 1.18, - "learning_rate": 0.00012358194045739135, - "loss": 0.0085, + "epoch": 0.6, + "learning_rate": 0.00020935789994841632, + "loss": 0.0147, "step": 233120 }, { - "epoch": 1.18, - "learning_rate": 0.00012357437276437736, - "loss": 0.0122, + "epoch": 0.6, + "learning_rate": 0.00020935401173204483, + "loss": 0.0169, "step": 233130 }, { - "epoch": 1.18, - "learning_rate": 0.00012356680507136334, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.0002093501235156734, + "loss": 0.0199, "step": 233140 }, { - "epoch": 1.18, - "learning_rate": 0.00012355923737834932, - "loss": 0.0143, + "epoch": 0.6, + "learning_rate": 0.00020934623529930192, + "loss": 0.0171, "step": 233150 }, { - "epoch": 1.18, - "learning_rate": 0.00012355166968533533, - "loss": 0.0093, + "epoch": 0.6, + "learning_rate": 0.00020934234708293046, + "loss": 0.0234, "step": 233160 }, { - "epoch": 1.18, - "learning_rate": 0.0001235441019923213, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020933845886655897, + "loss": 0.0179, "step": 233170 }, { - "epoch": 1.18, - "learning_rate": 0.0001235365342993073, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020933457065018754, + "loss": 0.0154, "step": 233180 }, { - "epoch": 1.18, - "learning_rate": 0.00012352896660629327, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020933068243381606, + "loss": 0.0186, "step": 233190 }, { - "epoch": 1.18, - "learning_rate": 0.00012352139891327928, - "loss": 0.0094, + "epoch": 0.6, + "learning_rate": 0.0002093267942174446, + "loss": 0.0167, "step": 233200 }, { - "epoch": 1.18, - "learning_rate": 0.00012351383122026526, - "loss": 0.0069, + "epoch": 0.6, + "learning_rate": 0.00020932290600107311, + "loss": 0.0176, "step": 233210 }, { - "epoch": 1.18, - "learning_rate": 0.00012350626352725124, - "loss": 0.0081, + "epoch": 0.6, + "learning_rate": 0.00020931901778470168, + "loss": 0.0331, "step": 233220 }, { - "epoch": 1.18, - "learning_rate": 0.00012349869583423725, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.0002093151295683302, + "loss": 0.0127, "step": 233230 }, { - "epoch": 1.18, - "learning_rate": 0.00012349112814122323, - "loss": 0.0092, + "epoch": 0.6, + "learning_rate": 0.00020931124135195874, + "loss": 0.0152, "step": 233240 }, { - "epoch": 1.18, - "learning_rate": 0.00012348356044820921, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.00020930735313558725, + "loss": 0.0173, "step": 233250 }, { - "epoch": 1.18, - "learning_rate": 0.00012347599275519522, - "loss": 0.0086, + "epoch": 0.6, + "learning_rate": 0.0002093034649192158, + "loss": 0.0211, "step": 233260 }, { - "epoch": 1.18, - "learning_rate": 0.0001234684250621812, - "loss": 0.0103, + "epoch": 0.6, + "learning_rate": 0.00020929957670284436, + "loss": 0.0139, "step": 233270 }, { - "epoch": 1.18, - "learning_rate": 0.00012346085736916719, - "loss": 0.0078, + "epoch": 0.6, + "learning_rate": 0.00020929568848647288, + "loss": 0.0176, "step": 233280 }, { - "epoch": 1.18, - "learning_rate": 0.0001234532896761532, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020929180027010142, + "loss": 0.0173, "step": 233290 }, { - "epoch": 1.18, - "learning_rate": 0.00012344572198313918, - "loss": 0.0083, + "epoch": 0.6, + "learning_rate": 0.00020928791205372993, + "loss": 0.0179, "step": 233300 }, { - "epoch": 1.18, - "learning_rate": 0.00012343815429012516, - "loss": 0.0099, + "epoch": 0.6, + "learning_rate": 0.0002092840238373585, + "loss": 0.0162, "step": 233310 }, { - "epoch": 1.18, - "learning_rate": 0.00012343058659711117, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020928013562098702, + "loss": 0.0143, "step": 233320 }, { - "epoch": 1.18, - "learning_rate": 0.00012342301890409715, - "loss": 0.0102, + "epoch": 0.6, + "learning_rate": 0.00020927624740461556, + "loss": 0.0164, "step": 233330 }, { - "epoch": 1.18, - "learning_rate": 0.00012341545121108313, - "loss": 0.0088, + "epoch": 0.6, + "learning_rate": 0.00020927235918824407, + "loss": 0.0194, "step": 233340 }, { - "epoch": 1.18, - "learning_rate": 0.0001234078835180691, - "loss": 0.0065, + "epoch": 0.6, + "learning_rate": 0.00020926847097187264, + "loss": 0.015, "step": 233350 }, { - "epoch": 1.18, - "learning_rate": 0.00012340031582505512, - "loss": 0.0068, + "epoch": 0.6, + "learning_rate": 0.00020926458275550116, + "loss": 0.014, "step": 233360 }, { - "epoch": 1.18, - "learning_rate": 0.0001233927481320411, - "loss": 0.0084, + "epoch": 0.6, + "learning_rate": 0.0002092606945391297, + "loss": 0.0163, "step": 233370 }, { - "epoch": 1.18, - "learning_rate": 0.00012338518043902708, - "loss": 0.0079, + "epoch": 0.6, + "learning_rate": 0.0002092568063227582, + "loss": 0.0112, "step": 233380 }, { - "epoch": 1.18, - "learning_rate": 0.0001233776127460131, - "loss": 0.0106, + "epoch": 0.6, + "learning_rate": 0.00020925291810638678, + "loss": 0.0156, "step": 233390 }, { - "epoch": 1.18, - "learning_rate": 0.00012337004505299907, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.0002092490298900153, + "loss": 0.0159, "step": 233400 }, { - "epoch": 1.18, - "learning_rate": 0.00012336247735998505, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020924514167364384, + "loss": 0.0179, "step": 233410 }, { - "epoch": 1.18, - "learning_rate": 0.00012335490966697106, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020924125345727235, + "loss": 0.0157, "step": 233420 }, { - "epoch": 1.18, - "learning_rate": 0.00012334734197395704, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020923736524090092, + "loss": 0.0165, "step": 233430 }, { - "epoch": 1.18, - "learning_rate": 0.00012333977428094302, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020923347702452946, + "loss": 0.0139, "step": 233440 }, { - "epoch": 1.18, - "learning_rate": 0.00012333220658792903, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020922958880815798, + "loss": 0.015, "step": 233450 }, { - "epoch": 1.18, - "learning_rate": 0.00012332463889491501, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.0002092257005917865, + "loss": 0.0157, "step": 233460 }, { - "epoch": 1.18, - "learning_rate": 0.000123317071201901, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020922181237541503, + "loss": 0.0146, "step": 233470 }, { - "epoch": 1.18, - "learning_rate": 0.00012330950350888698, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.0002092179241590436, + "loss": 0.0194, "step": 233480 }, { - "epoch": 1.18, - "learning_rate": 0.00012330193581587296, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020921403594267212, + "loss": 0.0147, "step": 233490 }, { - "epoch": 1.18, - "learning_rate": 0.00012329436812285897, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020921014772630066, + "loss": 0.0156, "step": 233500 }, { - "epoch": 1.18, - "learning_rate": 0.00012328680042984495, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020920625950992917, + "loss": 0.0129, "step": 233510 }, { - "epoch": 1.18, - "learning_rate": 0.00012327923273683093, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020920237129355774, + "loss": 0.0167, "step": 233520 }, { - "epoch": 1.18, - "learning_rate": 0.00012327166504381694, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020919848307718626, + "loss": 0.0115, "step": 233530 }, { - "epoch": 1.18, - "learning_rate": 0.00012326409735080292, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.0002091945948608148, + "loss": 0.0189, "step": 233540 }, { - "epoch": 1.18, - "learning_rate": 0.0001232565296577889, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.0002091907066444433, + "loss": 0.0172, "step": 233550 }, { - "epoch": 1.18, - "learning_rate": 0.00012324896196477488, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020918681842807188, + "loss": 0.0152, "step": 233560 }, { - "epoch": 1.18, - "learning_rate": 0.0001232413942717609, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002091829302117004, + "loss": 0.0192, "step": 233570 }, { - "epoch": 1.18, - "learning_rate": 0.00012323382657874687, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020917904199532894, + "loss": 0.0163, "step": 233580 }, { - "epoch": 1.18, - "learning_rate": 0.00012322625888573285, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020917515377895745, + "loss": 0.0165, "step": 233590 }, { - "epoch": 1.18, - "learning_rate": 0.00012321869119271886, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020917126556258602, + "loss": 0.0187, "step": 233600 }, { - "epoch": 1.18, - "learning_rate": 0.00012321112349970484, - "loss": 0.0126, + "epoch": 0.61, + "learning_rate": 0.00020916737734621454, + "loss": 0.0167, "step": 233610 }, { - "epoch": 1.18, - "learning_rate": 0.00012320355580669083, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020916348912984308, + "loss": 0.0176, "step": 233620 }, { - "epoch": 1.18, - "learning_rate": 0.00012319598811367683, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.0002091596009134716, + "loss": 0.0141, "step": 233630 }, { - "epoch": 1.18, - "learning_rate": 0.00012318842042066282, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020915571269710016, + "loss": 0.017, "step": 233640 }, { - "epoch": 1.18, - "learning_rate": 0.0001231808527276488, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002091518244807287, + "loss": 0.0225, "step": 233650 }, { - "epoch": 1.18, - "learning_rate": 0.0001231732850346348, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020914793626435722, + "loss": 0.0203, "step": 233660 }, { - "epoch": 1.18, - "learning_rate": 0.0001231657173416208, - "loss": 0.0114, + "epoch": 0.61, + "learning_rate": 0.00020914404804798576, + "loss": 0.017, "step": 233670 }, { - "epoch": 1.18, - "learning_rate": 0.00012315814964860677, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002091401598316143, + "loss": 0.016, "step": 233680 }, { - "epoch": 1.18, - "learning_rate": 0.00012315058195559278, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020913627161524284, + "loss": 0.0202, "step": 233690 }, { - "epoch": 1.18, - "learning_rate": 0.00012314301426257876, - "loss": 0.0157, + "epoch": 0.61, + "learning_rate": 0.00020913238339887136, + "loss": 0.0132, "step": 233700 }, { - "epoch": 1.18, - "learning_rate": 0.00012313544656956474, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002091284951824999, + "loss": 0.0137, "step": 233710 }, { - "epoch": 1.18, - "learning_rate": 0.00012312787887655072, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.0002091246069661284, + "loss": 0.0122, "step": 233720 }, { - "epoch": 1.18, - "learning_rate": 0.00012312031118353673, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020912071874975698, + "loss": 0.0146, "step": 233730 }, { - "epoch": 1.18, - "learning_rate": 0.0001231127434905227, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.0002091168305333855, + "loss": 0.015, "step": 233740 }, { - "epoch": 1.18, - "learning_rate": 0.0001231051757975087, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020911294231701404, + "loss": 0.0152, "step": 233750 }, { - "epoch": 1.18, - "learning_rate": 0.0001230976081044947, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020910905410064255, + "loss": 0.0136, "step": 233760 }, { - "epoch": 1.18, - "learning_rate": 0.00012309004041148068, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020910516588427112, + "loss": 0.0148, "step": 233770 }, { - "epoch": 1.18, - "learning_rate": 0.00012308247271846666, - "loss": 0.0129, + "epoch": 0.61, + "learning_rate": 0.00020910127766789963, + "loss": 0.0164, "step": 233780 }, { - "epoch": 1.18, - "learning_rate": 0.00012307490502545267, - "loss": 0.0113, + "epoch": 0.61, + "learning_rate": 0.00020909738945152818, + "loss": 0.0179, "step": 233790 }, { - "epoch": 1.18, - "learning_rate": 0.00012306733733243865, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.0002090935012351567, + "loss": 0.0167, "step": 233800 }, { - "epoch": 1.18, - "learning_rate": 0.00012305976963942464, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020908961301878526, + "loss": 0.0162, "step": 233810 }, { - "epoch": 1.18, - "learning_rate": 0.00012305220194641064, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002090857248024138, + "loss": 0.0157, "step": 233820 }, { - "epoch": 1.18, - "learning_rate": 0.00012304463425339663, - "loss": 0.0063, + "epoch": 0.61, + "learning_rate": 0.00020908183658604232, + "loss": 0.0153, "step": 233830 }, { - "epoch": 1.18, - "learning_rate": 0.0001230370665603826, - "loss": 0.0061, + "epoch": 0.61, + "learning_rate": 0.00020907794836967086, + "loss": 0.0272, "step": 233840 }, { - "epoch": 1.18, - "learning_rate": 0.00012302949886736862, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002090740601532994, + "loss": 0.0107, "step": 233850 }, { - "epoch": 1.18, - "learning_rate": 0.0001230219311743546, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020907017193692794, + "loss": 0.0169, "step": 233860 }, { - "epoch": 1.18, - "learning_rate": 0.00012301436348134058, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020906628372055646, + "loss": 0.0123, "step": 233870 }, { - "epoch": 1.18, - "learning_rate": 0.00012300679578832656, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.000209062395504185, + "loss": 0.0198, "step": 233880 }, { - "epoch": 1.18, - "learning_rate": 0.00012299922809531257, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020905850728781354, + "loss": 0.0155, "step": 233890 }, { - "epoch": 1.18, - "learning_rate": 0.00012299166040229855, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020905461907144208, + "loss": 0.0162, "step": 233900 }, { - "epoch": 1.18, - "learning_rate": 0.00012298409270928453, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.0002090507308550706, + "loss": 0.0166, "step": 233910 }, { - "epoch": 1.18, - "learning_rate": 0.00012297652501627054, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020904684263869914, + "loss": 0.0173, "step": 233920 }, { - "epoch": 1.18, - "learning_rate": 0.00012296895732325652, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020904295442232768, + "loss": 0.0161, "step": 233930 }, { - "epoch": 1.18, - "learning_rate": 0.0001229613896302425, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020903906620595622, + "loss": 0.0166, "step": 233940 }, { - "epoch": 1.18, - "learning_rate": 0.0001229538219372285, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020903517798958473, + "loss": 0.0197, "step": 233950 }, { - "epoch": 1.18, - "learning_rate": 0.0001229462542442145, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020903128977321328, + "loss": 0.0165, "step": 233960 }, { - "epoch": 1.18, - "learning_rate": 0.00012293868655120047, - "loss": 0.0115, + "epoch": 0.61, + "learning_rate": 0.0002090274015568418, + "loss": 0.0195, "step": 233970 }, { - "epoch": 1.18, - "learning_rate": 0.00012293111885818648, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.00020902351334047036, + "loss": 0.0158, "step": 233980 }, { - "epoch": 1.18, - "learning_rate": 0.00012292355116517246, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.0002090196251240989, + "loss": 0.0127, "step": 233990 }, { - "epoch": 1.18, - "learning_rate": 0.00012291598347215845, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020901573690772742, + "loss": 0.0187, "step": 234000 }, { - "epoch": 1.18, - "eval_cer": 0.9144275584736445, - "eval_loss": 0.0069518680684268475, - "eval_runtime": 115.6903, - "eval_samples_per_second": 17.288, - "eval_steps_per_second": 4.322, + "epoch": 0.61, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.011547002010047436, + "eval_runtime": 107.3826, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, "step": 234000 }, { - "epoch": 1.18, - "learning_rate": 0.00012290841577914445, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020901184869135593, + "loss": 0.0155, "step": 234010 }, { - "epoch": 1.18, - "learning_rate": 0.00012290084808613044, - "loss": 0.0114, + "epoch": 0.61, + "learning_rate": 0.0002090079604749845, + "loss": 0.0163, "step": 234020 }, { - "epoch": 1.18, - "learning_rate": 0.00012289328039311642, - "loss": 0.0118, + "epoch": 0.61, + "learning_rate": 0.00020900407225861304, + "loss": 0.0171, "step": 234030 }, { - "epoch": 1.18, - "learning_rate": 0.00012288571270010243, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020900018404224155, + "loss": 0.0206, "step": 234040 }, { - "epoch": 1.18, - "learning_rate": 0.0001228781450070884, - "loss": 0.0121, + "epoch": 0.61, + "learning_rate": 0.0002089962958258701, + "loss": 0.015, "step": 234050 }, { - "epoch": 1.18, - "learning_rate": 0.0001228705773140744, - "loss": 0.0133, + "epoch": 0.61, + "learning_rate": 0.00020899240760949864, + "loss": 0.0134, "step": 234060 }, { - "epoch": 1.18, - "learning_rate": 0.00012286300962106037, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020898851939312718, + "loss": 0.0202, "step": 234070 }, { - "epoch": 1.18, - "learning_rate": 0.00012285544192804638, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002089846311767557, + "loss": 0.0189, "step": 234080 }, { - "epoch": 1.18, - "learning_rate": 0.00012284787423503236, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020898074296038424, + "loss": 0.0156, "step": 234090 }, { - "epoch": 1.18, - "learning_rate": 0.00012284030654201834, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020897685474401278, + "loss": 0.0193, "step": 234100 }, { - "epoch": 1.18, - "learning_rate": 0.00012283273884900432, - "loss": 0.0122, + "epoch": 0.61, + "learning_rate": 0.00020897296652764132, + "loss": 0.0163, "step": 234110 }, { - "epoch": 1.18, - "learning_rate": 0.0001228251711559903, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020896907831126983, + "loss": 0.0211, "step": 234120 }, { - "epoch": 1.18, - "learning_rate": 0.0001228176034629763, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020896519009489838, + "loss": 0.0175, "step": 234130 }, { - "epoch": 1.18, - "learning_rate": 0.0001228100357699623, - "loss": 0.0132, + "epoch": 0.61, + "learning_rate": 0.00020896130187852694, + "loss": 0.0158, "step": 234140 }, { - "epoch": 1.18, - "learning_rate": 0.00012280246807694828, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020895741366215546, + "loss": 0.0141, "step": 234150 }, { - "epoch": 1.18, - "learning_rate": 0.00012279490038393428, - "loss": 0.0114, + "epoch": 0.61, + "learning_rate": 0.000208953525445784, + "loss": 0.0147, "step": 234160 }, { - "epoch": 1.18, - "learning_rate": 0.00012278733269092027, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020894963722941251, + "loss": 0.017, "step": 234170 }, { - "epoch": 1.18, - "learning_rate": 0.00012277976499790625, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020894574901304108, + "loss": 0.0198, "step": 234180 }, { - "epoch": 1.18, - "learning_rate": 0.00012277219730489226, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.0002089418607966696, + "loss": 0.0139, "step": 234190 }, { - "epoch": 1.18, - "learning_rate": 0.00012276462961187824, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020893797258029814, + "loss": 0.0175, "step": 234200 }, { - "epoch": 1.18, - "learning_rate": 0.00012275706191886422, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020893408436392665, + "loss": 0.0138, "step": 234210 }, { - "epoch": 1.18, - "learning_rate": 0.00012274949422585023, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.0002089301961475552, + "loss": 0.0136, "step": 234220 }, { - "epoch": 1.18, - "learning_rate": 0.0001227419265328362, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020892630793118374, + "loss": 0.0177, "step": 234230 }, { - "epoch": 1.18, - "learning_rate": 0.0001227343588398222, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020892241971481228, + "loss": 0.0137, "step": 234240 }, { - "epoch": 1.18, - "learning_rate": 0.00012272679114680817, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.0002089185314984408, + "loss": 0.0145, "step": 234250 }, { - "epoch": 1.18, - "learning_rate": 0.00012271922345379418, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020891464328206934, + "loss": 0.0165, "step": 234260 }, { - "epoch": 1.18, - "learning_rate": 0.00012271165576078016, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020891075506569788, + "loss": 0.0154, "step": 234270 }, { - "epoch": 1.18, - "learning_rate": 0.00012270408806776614, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020890686684932642, + "loss": 0.0167, "step": 234280 }, { - "epoch": 1.18, - "learning_rate": 0.00012269652037475215, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020890297863295493, + "loss": 0.0146, "step": 234290 }, { - "epoch": 1.18, - "learning_rate": 0.00012268895268173813, - "loss": 0.012, + "epoch": 0.61, + "learning_rate": 0.00020889909041658347, + "loss": 0.0182, "step": 234300 }, { - "epoch": 1.18, - "learning_rate": 0.00012268138498872411, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020889520220021204, + "loss": 0.0159, "step": 234310 }, { - "epoch": 1.18, - "learning_rate": 0.00012267381729571012, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020889131398384056, + "loss": 0.017, "step": 234320 }, { - "epoch": 1.18, - "learning_rate": 0.0001226662496026961, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020888742576746907, + "loss": 0.015, "step": 234330 }, { - "epoch": 1.18, - "learning_rate": 0.00012265868190968209, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020888353755109761, + "loss": 0.0148, "step": 234340 }, { - "epoch": 1.18, - "learning_rate": 0.0001226511142166681, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020887964933472618, + "loss": 0.0171, "step": 234350 }, { - "epoch": 1.18, - "learning_rate": 0.00012264354652365408, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.0002088757611183547, + "loss": 0.0146, "step": 234360 }, { - "epoch": 1.18, - "learning_rate": 0.00012263597883064006, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020887187290198324, + "loss": 0.0176, "step": 234370 }, { - "epoch": 1.18, - "learning_rate": 0.00012262841113762607, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020886798468561175, + "loss": 0.0137, "step": 234380 }, { - "epoch": 1.18, - "learning_rate": 0.00012262084344461205, - "loss": 0.0145, + "epoch": 0.61, + "learning_rate": 0.00020886409646924032, + "loss": 0.0166, "step": 234390 }, { - "epoch": 1.18, - "learning_rate": 0.00012261327575159803, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020886020825286884, + "loss": 0.016, "step": 234400 }, { - "epoch": 1.18, - "learning_rate": 0.000122605708058584, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020885632003649738, + "loss": 0.0161, "step": 234410 }, { - "epoch": 1.18, - "learning_rate": 0.00012259814036557002, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.0002088524318201259, + "loss": 0.0185, "step": 234420 }, { - "epoch": 1.18, - "learning_rate": 0.000122590572672556, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020884854360375446, + "loss": 0.014, "step": 234430 }, { - "epoch": 1.18, - "learning_rate": 0.00012258300497954198, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020884465538738298, + "loss": 0.0163, "step": 234440 }, { - "epoch": 1.18, - "learning_rate": 0.000122575437286528, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020884076717101152, + "loss": 0.0149, "step": 234450 }, { - "epoch": 1.18, - "learning_rate": 0.00012256786959351397, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020883687895464003, + "loss": 0.0162, "step": 234460 }, { - "epoch": 1.18, - "learning_rate": 0.00012256030190049995, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020883299073826857, + "loss": 0.0177, "step": 234470 }, { - "epoch": 1.18, - "learning_rate": 0.00012255273420748596, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020882910252189712, + "loss": 0.0169, "step": 234480 }, { - "epoch": 1.18, - "learning_rate": 0.00012254516651447194, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020882521430552566, + "loss": 0.0171, "step": 234490 }, { - "epoch": 1.18, - "learning_rate": 0.00012253759882145792, - "loss": 0.0068, + "epoch": 0.61, + "learning_rate": 0.00020882132608915417, + "loss": 0.0156, "step": 234500 }, { - "epoch": 1.18, - "learning_rate": 0.00012253003112844393, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020881743787278271, + "loss": 0.0177, "step": 234510 }, { - "epoch": 1.18, - "learning_rate": 0.00012252246343542991, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020881354965641128, + "loss": 0.0194, "step": 234520 }, { - "epoch": 1.18, - "learning_rate": 0.0001225148957424159, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.0002088096614400398, + "loss": 0.0235, "step": 234530 }, { - "epoch": 1.18, - "learning_rate": 0.0001225073280494019, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020880577322366834, + "loss": 0.0154, "step": 234540 }, { - "epoch": 1.18, - "learning_rate": 0.00012249976035638789, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020880188500729685, + "loss": 0.0189, "step": 234550 }, { - "epoch": 1.18, - "learning_rate": 0.00012249219266337387, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020879799679092542, + "loss": 0.0161, "step": 234560 }, { - "epoch": 1.18, - "learning_rate": 0.00012248462497035988, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020879410857455394, + "loss": 0.0121, "step": 234570 }, { - "epoch": 1.18, - "learning_rate": 0.00012247705727734586, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020879022035818248, + "loss": 0.0189, "step": 234580 }, { - "epoch": 1.18, - "learning_rate": 0.00012246948958433184, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.000208786332141811, + "loss": 0.0193, "step": 234590 }, { - "epoch": 1.18, - "learning_rate": 0.00012246192189131782, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020878244392543956, + "loss": 0.0173, "step": 234600 }, { - "epoch": 1.18, - "learning_rate": 0.00012245435419830383, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020877855570906808, + "loss": 0.0148, "step": 234610 }, { - "epoch": 1.18, - "learning_rate": 0.0001224467865052898, - "loss": 0.0123, + "epoch": 0.61, + "learning_rate": 0.00020877466749269662, + "loss": 0.0142, "step": 234620 }, { - "epoch": 1.18, - "learning_rate": 0.0001224392188122758, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020877077927632513, + "loss": 0.0159, "step": 234630 }, { - "epoch": 1.18, - "learning_rate": 0.0001224316511192618, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.0002087668910599537, + "loss": 0.0164, "step": 234640 }, { - "epoch": 1.18, - "learning_rate": 0.00012242408342624778, - "loss": 0.0111, + "epoch": 0.61, + "learning_rate": 0.00020876300284358222, + "loss": 0.0142, "step": 234650 }, { - "epoch": 1.18, - "learning_rate": 0.00012241651573323376, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.00020875911462721076, + "loss": 0.0176, "step": 234660 }, { - "epoch": 1.18, - "learning_rate": 0.00012240894804021977, - "loss": 0.0067, + "epoch": 0.61, + "learning_rate": 0.00020875522641083927, + "loss": 0.0136, "step": 234670 }, { - "epoch": 1.18, - "learning_rate": 0.00012240138034720575, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020875133819446784, + "loss": 0.0167, "step": 234680 }, { - "epoch": 1.18, - "learning_rate": 0.00012239381265419173, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020874744997809638, + "loss": 0.0182, "step": 234690 }, { - "epoch": 1.18, - "learning_rate": 0.00012238624496117774, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.0002087435617617249, + "loss": 0.017, "step": 234700 }, { - "epoch": 1.18, - "learning_rate": 0.00012237867726816372, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020873967354535344, + "loss": 0.0184, "step": 234710 }, { - "epoch": 1.18, - "learning_rate": 0.0001223711095751497, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020873578532898195, + "loss": 0.0181, "step": 234720 }, { - "epoch": 1.18, - "learning_rate": 0.0001223635418821357, - "loss": 0.0126, + "epoch": 0.61, + "learning_rate": 0.00020873189711261052, + "loss": 0.013, "step": 234730 }, { - "epoch": 1.18, - "learning_rate": 0.00012235597418912167, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020872800889623904, + "loss": 0.0168, "step": 234740 }, { - "epoch": 1.18, - "learning_rate": 0.00012234840649610768, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020872412067986758, + "loss": 0.0165, "step": 234750 }, { - "epoch": 1.18, - "learning_rate": 0.00012234083880309366, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.0002087202324634961, + "loss": 0.0163, "step": 234760 }, { - "epoch": 1.18, - "learning_rate": 0.00012233327111007964, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020871634424712466, + "loss": 0.015, "step": 234770 }, { - "epoch": 1.18, - "learning_rate": 0.00012232570341706562, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020871245603075318, + "loss": 0.018, "step": 234780 }, { - "epoch": 1.18, - "learning_rate": 0.00012231813572405163, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020870856781438172, + "loss": 0.0165, "step": 234790 }, { - "epoch": 1.18, - "learning_rate": 0.0001223105680310376, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020870467959801023, + "loss": 0.0141, "step": 234800 }, { - "epoch": 1.18, - "learning_rate": 0.0001223030003380236, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.0002087007913816388, + "loss": 0.0165, "step": 234810 }, { - "epoch": 1.18, - "learning_rate": 0.0001222954326450096, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020869690316526731, + "loss": 0.0173, "step": 234820 }, { - "epoch": 1.18, - "learning_rate": 0.00012228786495199558, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.00020869301494889586, + "loss": 0.0147, "step": 234830 }, { - "epoch": 1.18, - "learning_rate": 0.00012228029725898156, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020868912673252437, + "loss": 0.0171, "step": 234840 }, { - "epoch": 1.18, - "learning_rate": 0.00012227272956596757, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020868523851615294, + "loss": 0.0198, "step": 234850 }, { - "epoch": 1.18, - "learning_rate": 0.00012226516187295355, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020868135029978148, + "loss": 0.0167, "step": 234860 }, { - "epoch": 1.18, - "learning_rate": 0.00012225759417993954, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020867746208341, + "loss": 0.0169, "step": 234870 }, { - "epoch": 1.18, - "learning_rate": 0.00012225002648692554, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.0002086735738670385, + "loss": 0.0135, "step": 234880 }, { - "epoch": 1.19, - "learning_rate": 0.00012224245879391153, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020866968565066708, + "loss": 0.0173, "step": 234890 }, { - "epoch": 1.19, - "learning_rate": 0.0001222348911008975, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020866579743429562, + "loss": 0.016, "step": 234900 }, { - "epoch": 1.19, - "learning_rate": 0.00012222732340788352, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020866190921792414, + "loss": 0.0171, "step": 234910 }, { - "epoch": 1.19, - "learning_rate": 0.0001222197557148695, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020865802100155268, + "loss": 0.021, "step": 234920 }, { - "epoch": 1.19, - "learning_rate": 0.00012221218802185548, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020865413278518122, + "loss": 0.0159, "step": 234930 }, { - "epoch": 1.19, - "learning_rate": 0.0001222046203288415, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020865024456880976, + "loss": 0.0168, "step": 234940 }, { - "epoch": 1.19, - "learning_rate": 0.00012219705263582747, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.00020864635635243827, + "loss": 0.0193, "step": 234950 }, { - "epoch": 1.19, - "learning_rate": 0.00012218948494281345, - "loss": 0.0108, + "epoch": 0.61, + "learning_rate": 0.00020864246813606682, + "loss": 0.0177, "step": 234960 }, { - "epoch": 1.19, - "learning_rate": 0.00012218191724979943, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020863857991969533, + "loss": 0.0151, "step": 234970 }, { - "epoch": 1.19, - "learning_rate": 0.00012217434955678544, - "loss": 0.0071, + "epoch": 0.61, + "learning_rate": 0.0002086346917033239, + "loss": 0.0158, "step": 234980 }, { - "epoch": 1.19, - "learning_rate": 0.00012216678186377142, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020863080348695241, + "loss": 0.0198, "step": 234990 }, { - "epoch": 1.19, - "learning_rate": 0.0001221592141707574, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020862691527058096, + "loss": 0.0213, "step": 235000 }, { - "epoch": 1.19, - "eval_cer": 0.9144362920387732, - "eval_loss": 0.0068534985184669495, - "eval_runtime": 115.6303, - "eval_samples_per_second": 17.297, - "eval_steps_per_second": 4.324, + "epoch": 0.61, + "eval_cer": 0.881704085960102, + "eval_loss": 0.010831459425389767, + "eval_runtime": 107.169, + "eval_samples_per_second": 18.662, + "eval_steps_per_second": 4.666, "step": 235000 }, { - "epoch": 1.19, - "learning_rate": 0.0001221516464777434, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020862302705420947, + "loss": 0.015, "step": 235010 }, { - "epoch": 1.19, - "learning_rate": 0.0001221440787847294, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020861913883783804, + "loss": 0.0163, "step": 235020 }, { - "epoch": 1.19, - "learning_rate": 0.00012213651109171537, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020861525062146658, + "loss": 0.0177, "step": 235030 }, { - "epoch": 1.19, - "learning_rate": 0.00012212894339870138, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.0002086113624050951, + "loss": 0.0129, "step": 235040 }, { - "epoch": 1.19, - "learning_rate": 0.00012212137570568736, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002086074741887236, + "loss": 0.0149, "step": 235050 }, { - "epoch": 1.19, - "learning_rate": 0.00012211380801267335, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020860358597235218, + "loss": 0.0162, "step": 235060 }, { - "epoch": 1.19, - "learning_rate": 0.00012210624031965935, - "loss": 0.0067, + "epoch": 0.61, + "learning_rate": 0.00020859969775598072, + "loss": 0.0159, "step": 235070 }, { - "epoch": 1.19, - "learning_rate": 0.00012209867262664534, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020859580953960923, + "loss": 0.0171, "step": 235080 }, { - "epoch": 1.19, - "learning_rate": 0.00012209110493363132, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020859192132323778, + "loss": 0.0138, "step": 235090 }, { - "epoch": 1.19, - "learning_rate": 0.00012208353724061733, - "loss": 0.0137, + "epoch": 0.61, + "learning_rate": 0.00020858803310686632, + "loss": 0.0185, "step": 235100 }, { - "epoch": 1.19, - "learning_rate": 0.0001220759695476033, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020858414489049486, + "loss": 0.0146, "step": 235110 }, { - "epoch": 1.19, - "learning_rate": 0.00012206840185458929, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020858025667412337, + "loss": 0.0128, "step": 235120 }, { - "epoch": 1.19, - "learning_rate": 0.00012206083416157528, - "loss": 0.0062, + "epoch": 0.61, + "learning_rate": 0.00020857636845775192, + "loss": 0.0142, "step": 235130 }, { - "epoch": 1.19, - "learning_rate": 0.00012205326646856128, - "loss": 0.007, + "epoch": 0.61, + "learning_rate": 0.00020857248024138046, + "loss": 0.0141, "step": 235140 }, { - "epoch": 1.19, - "learning_rate": 0.00012204569877554726, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.000208568592025009, + "loss": 0.0214, "step": 235150 }, { - "epoch": 1.19, - "learning_rate": 0.00012203813108253326, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.0002085647038086375, + "loss": 0.0149, "step": 235160 }, { - "epoch": 1.19, - "learning_rate": 0.00012203056338951924, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020856081559226606, + "loss": 0.0167, "step": 235170 }, { - "epoch": 1.19, - "learning_rate": 0.00012202299569650523, - "loss": 0.0117, + "epoch": 0.61, + "learning_rate": 0.00020855692737589462, + "loss": 0.0168, "step": 235180 }, { - "epoch": 1.19, - "learning_rate": 0.00012201542800349123, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020855303915952314, + "loss": 0.0157, "step": 235190 }, { - "epoch": 1.19, - "learning_rate": 0.00012200786031047721, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020854915094315165, + "loss": 0.0156, "step": 235200 }, { - "epoch": 1.19, - "learning_rate": 0.0001220002926174632, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.0002085452627267802, + "loss": 0.015, "step": 235210 }, { - "epoch": 1.19, - "learning_rate": 0.0001219927249244492, - "loss": 0.0066, + "epoch": 0.61, + "learning_rate": 0.0002085413745104087, + "loss": 0.0183, "step": 235220 }, { - "epoch": 1.19, - "learning_rate": 0.00012198515723143518, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020853748629403728, + "loss": 0.0161, "step": 235230 }, { - "epoch": 1.19, - "learning_rate": 0.00012197758953842117, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.00020853359807766582, + "loss": 0.014, "step": 235240 }, { - "epoch": 1.19, - "learning_rate": 0.00012197002184540716, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020852970986129433, + "loss": 0.0192, "step": 235250 }, { - "epoch": 1.19, - "learning_rate": 0.00012196245415239315, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020852582164492288, + "loss": 0.0152, "step": 235260 }, { - "epoch": 1.19, - "learning_rate": 0.00012195488645937915, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020852193342855142, + "loss": 0.0162, "step": 235270 }, { - "epoch": 1.19, - "learning_rate": 0.00012194731876636513, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020851804521217996, + "loss": 0.015, "step": 235280 }, { - "epoch": 1.19, - "learning_rate": 0.00012193975107335112, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020851415699580847, + "loss": 0.0145, "step": 235290 }, { - "epoch": 1.19, - "learning_rate": 0.00012193218338033712, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.00020851026877943702, + "loss": 0.0149, "step": 235300 }, { - "epoch": 1.19, - "learning_rate": 0.0001219246156873231, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020850638056306556, + "loss": 0.0171, "step": 235310 }, { - "epoch": 1.19, - "learning_rate": 0.0001219170479943091, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.0002085024923466941, + "loss": 0.0137, "step": 235320 }, { - "epoch": 1.19, - "learning_rate": 0.00012190948030129508, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002084986041303226, + "loss": 0.0189, "step": 235330 }, { - "epoch": 1.19, - "learning_rate": 0.00012190191260828107, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020849471591395115, + "loss": 0.0139, "step": 235340 }, { - "epoch": 1.19, - "learning_rate": 0.00012189434491526707, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020849082769757972, + "loss": 0.0126, "step": 235350 }, { - "epoch": 1.19, - "learning_rate": 0.00012188677722225303, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020848693948120824, + "loss": 0.0153, "step": 235360 }, { - "epoch": 1.19, - "learning_rate": 0.00012187920952923903, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020848305126483675, + "loss": 0.0159, "step": 235370 }, { - "epoch": 1.19, - "learning_rate": 0.00012187164183622501, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.0002084791630484653, + "loss": 0.016, "step": 235380 }, { - "epoch": 1.19, - "learning_rate": 0.000121864074143211, - "loss": 0.0115, + "epoch": 0.61, + "learning_rate": 0.00020847527483209386, + "loss": 0.0156, "step": 235390 }, { - "epoch": 1.19, - "learning_rate": 0.000121856506450197, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020847138661572238, + "loss": 0.0178, "step": 235400 }, { - "epoch": 1.19, - "learning_rate": 0.00012184893875718298, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020846749839935092, + "loss": 0.0137, "step": 235410 }, { - "epoch": 1.19, - "learning_rate": 0.00012184137106416898, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020846361018297943, + "loss": 0.0182, "step": 235420 }, { - "epoch": 1.19, - "learning_rate": 0.00012183380337115497, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.000208459721966608, + "loss": 0.0175, "step": 235430 }, { - "epoch": 1.19, - "learning_rate": 0.00012182623567814095, - "loss": 0.0069, + "epoch": 0.61, + "learning_rate": 0.00020845583375023652, + "loss": 0.0165, "step": 235440 }, { - "epoch": 1.19, - "learning_rate": 0.00012181866798512695, - "loss": 0.0111, + "epoch": 0.61, + "learning_rate": 0.00020845194553386506, + "loss": 0.0179, "step": 235450 }, { - "epoch": 1.19, - "learning_rate": 0.00012181110029211293, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020844805731749357, + "loss": 0.0164, "step": 235460 }, { - "epoch": 1.19, - "learning_rate": 0.00012180353259909892, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020844416910112211, + "loss": 0.0155, "step": 235470 }, { - "epoch": 1.19, - "learning_rate": 0.00012179596490608492, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020844028088475066, + "loss": 0.0193, "step": 235480 }, { - "epoch": 1.19, - "learning_rate": 0.0001217883972130709, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.0002084363926683792, + "loss": 0.0152, "step": 235490 }, { - "epoch": 1.19, - "learning_rate": 0.0001217808295200569, - "loss": 0.011, + "epoch": 0.61, + "learning_rate": 0.0002084325044520077, + "loss": 0.0146, "step": 235500 }, { - "epoch": 1.19, - "learning_rate": 0.00012177326182704289, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020842861623563625, + "loss": 0.0233, "step": 235510 }, { - "epoch": 1.19, - "learning_rate": 0.00012176569413402887, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.0002084247280192648, + "loss": 0.0148, "step": 235520 }, { - "epoch": 1.19, - "learning_rate": 0.00012175812644101487, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020842083980289334, + "loss": 0.0204, "step": 235530 }, { - "epoch": 1.19, - "learning_rate": 0.00012175055874800085, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020841695158652185, + "loss": 0.0157, "step": 235540 }, { - "epoch": 1.19, - "learning_rate": 0.00012174299105498684, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.0002084130633701504, + "loss": 0.0183, "step": 235550 }, { - "epoch": 1.19, - "learning_rate": 0.00012173542336197284, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020840917515377896, + "loss": 0.0162, "step": 235560 }, { - "epoch": 1.19, - "learning_rate": 0.00012172785566895882, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020840528693740748, + "loss": 0.016, "step": 235570 }, { - "epoch": 1.19, - "learning_rate": 0.00012172028797594481, - "loss": 0.0065, + "epoch": 0.61, + "learning_rate": 0.00020840139872103602, + "loss": 0.0193, "step": 235580 }, { - "epoch": 1.19, - "learning_rate": 0.00012171272028293081, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020839751050466453, + "loss": 0.0156, "step": 235590 }, { - "epoch": 1.19, - "learning_rate": 0.00012170515258991679, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.0002083936222882931, + "loss": 0.0192, "step": 235600 }, { - "epoch": 1.19, - "learning_rate": 0.00012169758489690279, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020838973407192162, + "loss": 0.0197, "step": 235610 }, { - "epoch": 1.19, - "learning_rate": 0.00012169001720388877, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020838584585555016, + "loss": 0.0125, "step": 235620 }, { - "epoch": 1.19, - "learning_rate": 0.00012168244951087476, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020838195763917867, + "loss": 0.0161, "step": 235630 }, { - "epoch": 1.19, - "learning_rate": 0.00012167488181786076, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020837806942280724, + "loss": 0.0215, "step": 235640 }, { - "epoch": 1.19, - "learning_rate": 0.00012166731412484674, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020837418120643576, + "loss": 0.0176, "step": 235650 }, { - "epoch": 1.19, - "learning_rate": 0.00012165974643183273, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.0002083702929900643, + "loss": 0.0162, "step": 235660 }, { - "epoch": 1.19, - "learning_rate": 0.00012165217873881873, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.0002083664047736928, + "loss": 0.0136, "step": 235670 }, { - "epoch": 1.19, - "learning_rate": 0.00012164461104580471, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020836251655732138, + "loss": 0.0145, "step": 235680 }, { - "epoch": 1.19, - "learning_rate": 0.0001216370433527907, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.0002083586283409499, + "loss": 0.016, "step": 235690 }, { - "epoch": 1.19, - "learning_rate": 0.00012162947565977669, - "loss": 0.0073, + "epoch": 0.61, + "learning_rate": 0.00020835474012457844, + "loss": 0.015, "step": 235700 }, { - "epoch": 1.19, - "learning_rate": 0.00012162190796676268, - "loss": 0.0111, + "epoch": 0.61, + "learning_rate": 0.00020835085190820695, + "loss": 0.015, "step": 235710 }, { - "epoch": 1.19, - "learning_rate": 0.00012161434027374868, - "loss": 0.0104, + "epoch": 0.61, + "learning_rate": 0.0002083469636918355, + "loss": 0.0139, "step": 235720 }, { - "epoch": 1.19, - "learning_rate": 0.00012160677258073466, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020834307547546406, + "loss": 0.0143, "step": 235730 }, { - "epoch": 1.19, - "learning_rate": 0.00012159920488772065, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020833918725909258, + "loss": 0.0166, "step": 235740 }, { - "epoch": 1.19, - "learning_rate": 0.00012159163719470665, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020833529904272112, + "loss": 0.0159, "step": 235750 }, { - "epoch": 1.19, - "learning_rate": 0.00012158406950169263, - "loss": 0.0108, + "epoch": 0.61, + "learning_rate": 0.00020833141082634963, + "loss": 0.0182, "step": 235760 }, { - "epoch": 1.19, - "learning_rate": 0.00012157650180867862, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.0002083275226099782, + "loss": 0.0153, "step": 235770 }, { - "epoch": 1.19, - "learning_rate": 0.0001215689341156646, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020832363439360672, + "loss": 0.0172, "step": 235780 }, { - "epoch": 1.19, - "learning_rate": 0.0001215613664226506, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020831974617723526, + "loss": 0.0156, "step": 235790 }, { - "epoch": 1.19, - "learning_rate": 0.0001215537987296366, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020831585796086377, + "loss": 0.0234, "step": 235800 }, { - "epoch": 1.19, - "learning_rate": 0.00012154623103662258, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020831196974449234, + "loss": 0.0152, "step": 235810 }, { - "epoch": 1.19, - "learning_rate": 0.00012153866334360857, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020830808152812085, + "loss": 0.0164, "step": 235820 }, { - "epoch": 1.19, - "learning_rate": 0.00012153109565059457, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.0002083041933117494, + "loss": 0.0189, "step": 235830 }, { - "epoch": 1.19, - "learning_rate": 0.00012152352795758055, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.0002083003050953779, + "loss": 0.0159, "step": 235840 }, { - "epoch": 1.19, - "learning_rate": 0.00012151596026456654, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020829641687900648, + "loss": 0.0152, "step": 235850 }, { - "epoch": 1.19, - "learning_rate": 0.00012150839257155253, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.000208292528662635, + "loss": 0.0164, "step": 235860 }, { - "epoch": 1.19, - "learning_rate": 0.00012150082487853852, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020828864044626354, + "loss": 0.0138, "step": 235870 }, { - "epoch": 1.19, - "learning_rate": 0.00012149325718552452, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020828475222989205, + "loss": 0.0178, "step": 235880 }, { - "epoch": 1.19, - "learning_rate": 0.0001214856894925105, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020828086401352062, + "loss": 0.0195, "step": 235890 }, { - "epoch": 1.19, - "learning_rate": 0.00012147812179949649, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.00020827697579714916, + "loss": 0.0145, "step": 235900 }, { - "epoch": 1.19, - "learning_rate": 0.00012147055410648249, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020827308758077768, + "loss": 0.0134, "step": 235910 }, { - "epoch": 1.19, - "learning_rate": 0.00012146298641346847, - "loss": 0.0116, + "epoch": 0.61, + "learning_rate": 0.0002082691993644062, + "loss": 0.0168, "step": 235920 }, { - "epoch": 1.19, - "learning_rate": 0.00012145541872045446, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020826531114803476, + "loss": 0.0191, "step": 235930 }, { - "epoch": 1.19, - "learning_rate": 0.00012144785102744046, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.0002082614229316633, + "loss": 0.0144, "step": 235940 }, { - "epoch": 1.19, - "learning_rate": 0.00012144028333442644, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.00020825753471529181, + "loss": 0.0139, "step": 235950 }, { - "epoch": 1.19, - "learning_rate": 0.00012143271564141243, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020825364649892036, + "loss": 0.0177, "step": 235960 }, { - "epoch": 1.19, - "learning_rate": 0.00012142514794839842, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020824975828254887, + "loss": 0.0175, "step": 235970 }, { - "epoch": 1.19, - "learning_rate": 0.00012141758025538441, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020824587006617744, + "loss": 0.0199, "step": 235980 }, { - "epoch": 1.19, - "learning_rate": 0.00012141001256237038, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020824198184980595, + "loss": 0.0114, "step": 235990 }, { - "epoch": 1.19, - "learning_rate": 0.00012140244486935637, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.0002082380936334345, + "loss": 0.0142, "step": 236000 }, { - "epoch": 1.19, - "eval_cer": 0.9144469663961525, - "eval_loss": 0.0067824204452335835, - "eval_runtime": 116.0471, - "eval_samples_per_second": 17.234, - "eval_steps_per_second": 4.309, + "epoch": 0.61, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.011257501319050789, + "eval_runtime": 107.2888, + "eval_samples_per_second": 18.641, + "eval_steps_per_second": 4.66, "step": 236000 }, { - "epoch": 1.19, - "learning_rate": 0.00012139487717634237, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.000208234205417063, + "loss": 0.015, "step": 236010 }, { - "epoch": 1.19, - "learning_rate": 0.00012138730948332835, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020823031720069158, + "loss": 0.0134, "step": 236020 }, { - "epoch": 1.19, - "learning_rate": 0.00012137974179031435, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.0002082264289843201, + "loss": 0.0176, "step": 236030 }, { - "epoch": 1.19, - "learning_rate": 0.00012137217409730034, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020822254076794864, + "loss": 0.0177, "step": 236040 }, { - "epoch": 1.19, - "learning_rate": 0.00012136460640428632, - "loss": 0.0062, + "epoch": 0.61, + "learning_rate": 0.00020821865255157715, + "loss": 0.0164, "step": 236050 }, { - "epoch": 1.19, - "learning_rate": 0.00012135703871127232, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.00020821476433520572, + "loss": 0.0142, "step": 236060 }, { - "epoch": 1.19, - "learning_rate": 0.0001213494710182583, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020821087611883423, + "loss": 0.0172, "step": 236070 }, { - "epoch": 1.19, - "learning_rate": 0.00012134190332524429, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020820698790246277, + "loss": 0.0155, "step": 236080 }, { - "epoch": 1.19, - "learning_rate": 0.00012133433563223029, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.0002082030996860913, + "loss": 0.0167, "step": 236090 }, { - "epoch": 1.19, - "learning_rate": 0.00012132676793921627, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020819921146971986, + "loss": 0.0177, "step": 236100 }, { - "epoch": 1.19, - "learning_rate": 0.00012131920024620226, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.0002081953232533484, + "loss": 0.0201, "step": 236110 }, { - "epoch": 1.19, - "learning_rate": 0.00012131163255318826, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020819143503697691, + "loss": 0.0192, "step": 236120 }, { - "epoch": 1.19, - "learning_rate": 0.00012130406486017424, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020818754682060546, + "loss": 0.0185, "step": 236130 }, { - "epoch": 1.19, - "learning_rate": 0.00012129649716716024, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.000208183658604234, + "loss": 0.0148, "step": 236140 }, { - "epoch": 1.19, - "learning_rate": 0.00012128892947414622, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020817977038786254, + "loss": 0.0174, "step": 236150 }, { - "epoch": 1.19, - "learning_rate": 0.00012128136178113221, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020817588217149105, + "loss": 0.015, "step": 236160 }, { - "epoch": 1.19, - "learning_rate": 0.00012127379408811821, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.0002081719939551196, + "loss": 0.0202, "step": 236170 }, { - "epoch": 1.19, - "learning_rate": 0.00012126622639510419, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020816810573874814, + "loss": 0.0147, "step": 236180 }, { - "epoch": 1.19, - "learning_rate": 0.00012125865870209018, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020816421752237668, + "loss": 0.0117, "step": 236190 }, { - "epoch": 1.19, - "learning_rate": 0.00012125109100907618, - "loss": 0.0105, + "epoch": 0.61, + "learning_rate": 0.0002081603293060052, + "loss": 0.0135, "step": 236200 }, { - "epoch": 1.19, - "learning_rate": 0.00012124352331606216, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020815644108963373, + "loss": 0.0152, "step": 236210 }, { - "epoch": 1.19, - "learning_rate": 0.00012123595562304816, - "loss": 0.0075, + "epoch": 0.61, + "learning_rate": 0.00020815255287326225, + "loss": 0.0143, "step": 236220 }, { - "epoch": 1.19, - "learning_rate": 0.00012122838793003414, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020814866465689082, + "loss": 0.0158, "step": 236230 }, { - "epoch": 1.19, - "learning_rate": 0.00012122082023702013, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020814477644051933, + "loss": 0.0139, "step": 236240 }, { - "epoch": 1.19, - "learning_rate": 0.00012121325254400613, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020814088822414787, + "loss": 0.0179, "step": 236250 }, { - "epoch": 1.19, - "learning_rate": 0.00012120568485099211, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.0002081370000077764, + "loss": 0.0164, "step": 236260 }, { - "epoch": 1.19, - "learning_rate": 0.0001211981171579781, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020813311179140496, + "loss": 0.0185, "step": 236270 }, { - "epoch": 1.19, - "learning_rate": 0.0001211905494649641, - "loss": 0.0066, + "epoch": 0.61, + "learning_rate": 0.0002081292235750335, + "loss": 0.0151, "step": 236280 }, { - "epoch": 1.19, - "learning_rate": 0.00012118298177195008, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.00020812533535866201, + "loss": 0.0189, "step": 236290 }, { - "epoch": 1.19, - "learning_rate": 0.00012117541407893607, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020812144714229056, + "loss": 0.0205, "step": 236300 }, { - "epoch": 1.19, - "learning_rate": 0.00012116784638592206, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.0002081175589259191, + "loss": 0.0183, "step": 236310 }, { - "epoch": 1.19, - "learning_rate": 0.00012116027869290805, - "loss": 0.0092, + "epoch": 0.61, + "learning_rate": 0.00020811367070954764, + "loss": 0.013, "step": 236320 }, { - "epoch": 1.19, - "learning_rate": 0.00012115271099989405, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020810978249317615, + "loss": 0.0135, "step": 236330 }, { - "epoch": 1.19, - "learning_rate": 0.00012114514330688003, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002081058942768047, + "loss": 0.0164, "step": 236340 }, { - "epoch": 1.19, - "learning_rate": 0.00012113757561386602, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020810200606043324, + "loss": 0.0161, "step": 236350 }, { - "epoch": 1.19, - "learning_rate": 0.00012113000792085202, - "loss": 0.0112, + "epoch": 0.61, + "learning_rate": 0.00020809811784406178, + "loss": 0.0128, "step": 236360 }, { - "epoch": 1.19, - "learning_rate": 0.000121122440227838, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.0002080942296276903, + "loss": 0.0182, "step": 236370 }, { - "epoch": 1.19, - "learning_rate": 0.000121114872534824, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020809034141131883, + "loss": 0.0131, "step": 236380 }, { - "epoch": 1.19, - "learning_rate": 0.00012110730484180999, - "loss": 0.008, - "step": 236390 + "epoch": 0.61, + "learning_rate": 0.00020808645319494738, + "loss": 0.0136, + "step": 236390 }, { - "epoch": 1.19, - "learning_rate": 0.00012109973714879597, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020808256497857592, + "loss": 0.016, "step": 236400 }, { - "epoch": 1.19, - "learning_rate": 0.00012109216945578197, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.00020807867676220443, + "loss": 0.0137, "step": 236410 }, { - "epoch": 1.19, - "learning_rate": 0.00012108460176276795, - "loss": 0.0091, + "epoch": 0.61, + "learning_rate": 0.00020807478854583297, + "loss": 0.0166, "step": 236420 }, { - "epoch": 1.19, - "learning_rate": 0.00012107703406975394, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020807090032946154, + "loss": 0.0136, "step": 236430 }, { - "epoch": 1.19, - "learning_rate": 0.00012106946637673994, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020806701211309006, + "loss": 0.0132, "step": 236440 }, { - "epoch": 1.19, - "learning_rate": 0.00012106189868372592, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.0002080631238967186, + "loss": 0.0152, "step": 236450 }, { - "epoch": 1.19, - "learning_rate": 0.00012105433099071191, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.0002080592356803471, + "loss": 0.0168, "step": 236460 }, { - "epoch": 1.19, - "learning_rate": 0.00012104676329769791, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.00020805534746397563, + "loss": 0.0138, "step": 236470 }, { - "epoch": 1.19, - "learning_rate": 0.00012103919560468389, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002080514592476042, + "loss": 0.0127, "step": 236480 }, { - "epoch": 1.19, - "learning_rate": 0.00012103162791166988, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020804757103123274, + "loss": 0.0157, "step": 236490 }, { - "epoch": 1.19, - "learning_rate": 0.00012102406021865587, - "loss": 0.0094, + "epoch": 0.61, + "learning_rate": 0.00020804368281486125, + "loss": 0.0161, "step": 236500 }, { - "epoch": 1.19, - "learning_rate": 0.00012101649252564186, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.0002080397945984898, + "loss": 0.017, "step": 236510 }, { - "epoch": 1.19, - "learning_rate": 0.00012100892483262786, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020803590638211834, + "loss": 0.0132, "step": 236520 }, { - "epoch": 1.19, - "learning_rate": 0.00012100135713961384, - "loss": 0.0103, + "epoch": 0.61, + "learning_rate": 0.00020803201816574688, + "loss": 0.013, "step": 236530 }, { - "epoch": 1.19, - "learning_rate": 0.00012099378944659983, - "loss": 0.0081, + "epoch": 0.61, + "learning_rate": 0.0002080281299493754, + "loss": 0.0197, "step": 236540 }, { - "epoch": 1.19, - "learning_rate": 0.00012098622175358583, - "loss": 0.0068, + "epoch": 0.61, + "learning_rate": 0.00020802424173300393, + "loss": 0.0182, "step": 236550 }, { - "epoch": 1.19, - "learning_rate": 0.00012097865406057181, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020802035351663248, + "loss": 0.0172, "step": 236560 }, { - "epoch": 1.19, - "learning_rate": 0.0001209710863675578, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020801646530026102, + "loss": 0.0132, "step": 236570 }, { - "epoch": 1.19, - "learning_rate": 0.00012096351867454379, - "loss": 0.0062, + "epoch": 0.61, + "learning_rate": 0.00020801257708388953, + "loss": 0.0159, "step": 236580 }, { - "epoch": 1.19, - "learning_rate": 0.00012095595098152978, - "loss": 0.0097, + "epoch": 0.61, + "learning_rate": 0.00020800868886751807, + "loss": 0.0149, "step": 236590 }, { - "epoch": 1.19, - "learning_rate": 0.00012094838328851578, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020800480065114664, + "loss": 0.02, "step": 236600 }, { - "epoch": 1.19, - "learning_rate": 0.00012094081559550174, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020800091243477516, + "loss": 0.0144, "step": 236610 }, { - "epoch": 1.19, - "learning_rate": 0.00012093324790248774, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002079970242184037, + "loss": 0.0133, "step": 236620 }, { - "epoch": 1.19, - "learning_rate": 0.00012092568020947372, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.0002079931360020322, + "loss": 0.016, "step": 236630 }, { - "epoch": 1.19, - "learning_rate": 0.00012091811251645971, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.00020798924778566078, + "loss": 0.0158, "step": 236640 }, { - "epoch": 1.19, - "learning_rate": 0.00012091054482344571, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.0002079853595692893, + "loss": 0.0151, "step": 236650 }, { - "epoch": 1.19, - "learning_rate": 0.00012090297713043169, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020798147135291784, + "loss": 0.0151, "step": 236660 }, { - "epoch": 1.19, - "learning_rate": 0.00012089540943741769, - "loss": 0.0095, + "epoch": 0.61, + "learning_rate": 0.00020797758313654635, + "loss": 0.0161, "step": 236670 }, { - "epoch": 1.19, - "learning_rate": 0.00012088784174440367, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020797369492017492, + "loss": 0.019, "step": 236680 }, { - "epoch": 1.19, - "learning_rate": 0.00012088027405138966, - "loss": 0.0108, + "epoch": 0.61, + "learning_rate": 0.00020796980670380344, + "loss": 0.0125, "step": 236690 }, { - "epoch": 1.19, - "learning_rate": 0.00012087270635837566, - "loss": 0.0072, + "epoch": 0.61, + "learning_rate": 0.00020796591848743198, + "loss": 0.0132, "step": 236700 }, { - "epoch": 1.19, - "learning_rate": 0.00012086513866536164, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.0002079620302710605, + "loss": 0.0148, "step": 236710 }, { - "epoch": 1.19, - "learning_rate": 0.00012085757097234763, - "loss": 0.0084, + "epoch": 0.61, + "learning_rate": 0.00020795814205468903, + "loss": 0.0166, "step": 236720 }, { - "epoch": 1.19, - "learning_rate": 0.00012085000327933363, - "loss": 0.0116, + "epoch": 0.61, + "learning_rate": 0.00020795425383831757, + "loss": 0.0125, "step": 236730 }, { - "epoch": 1.19, - "learning_rate": 0.00012084243558631961, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020795036562194612, + "loss": 0.0172, "step": 236740 }, { - "epoch": 1.19, - "learning_rate": 0.0001208348678933056, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020794647740557463, + "loss": 0.0158, "step": 236750 }, { - "epoch": 1.19, - "learning_rate": 0.00012082730020029159, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020794258918920317, + "loss": 0.0186, "step": 236760 }, { - "epoch": 1.19, - "learning_rate": 0.00012081973250727758, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020793870097283174, + "loss": 0.0167, "step": 236770 }, { - "epoch": 1.19, - "learning_rate": 0.00012081216481426358, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020793481275646026, + "loss": 0.0188, "step": 236780 }, { - "epoch": 1.19, - "learning_rate": 0.00012080459712124956, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020793092454008877, + "loss": 0.0151, "step": 236790 }, { - "epoch": 1.19, - "learning_rate": 0.00012079702942823555, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.0002079270363237173, + "loss": 0.0147, "step": 236800 }, { - "epoch": 1.19, - "learning_rate": 0.00012078946173522155, - "loss": 0.0102, + "epoch": 0.61, + "learning_rate": 0.00020792314810734588, + "loss": 0.0122, "step": 236810 }, { - "epoch": 1.19, - "learning_rate": 0.00012078189404220753, - "loss": 0.0106, + "epoch": 0.61, + "learning_rate": 0.0002079192598909744, + "loss": 0.0174, "step": 236820 }, { - "epoch": 1.19, - "learning_rate": 0.00012077432634919352, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020791537167460294, + "loss": 0.0157, "step": 236830 }, { - "epoch": 1.19, - "learning_rate": 0.00012076675865617952, - "loss": 0.0093, + "epoch": 0.61, + "learning_rate": 0.00020791148345823145, + "loss": 0.0143, "step": 236840 }, { - "epoch": 1.19, - "learning_rate": 0.0001207591909631655, - "loss": 0.0079, + "epoch": 0.61, + "learning_rate": 0.00020790759524186002, + "loss": 0.0129, "step": 236850 }, { - "epoch": 1.19, - "learning_rate": 0.0001207516232701515, - "loss": 0.0105, + "epoch": 0.61, + "learning_rate": 0.00020790370702548853, + "loss": 0.0192, "step": 236860 }, { - "epoch": 1.2, - "learning_rate": 0.00012074405557713748, - "loss": 0.0109, + "epoch": 0.61, + "learning_rate": 0.00020789981880911708, + "loss": 0.019, "step": 236870 }, { - "epoch": 1.2, - "learning_rate": 0.00012073648788412347, - "loss": 0.0144, + "epoch": 0.61, + "learning_rate": 0.0002078959305927456, + "loss": 0.0179, "step": 236880 }, { - "epoch": 1.2, - "learning_rate": 0.00012072892019110947, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020789204237637416, + "loss": 0.0189, "step": 236890 }, { - "epoch": 1.2, - "learning_rate": 0.00012072135249809545, - "loss": 0.0086, + "epoch": 0.61, + "learning_rate": 0.00020788815416000267, + "loss": 0.0164, "step": 236900 }, { - "epoch": 1.2, - "learning_rate": 0.00012071378480508144, - "loss": 0.0076, + "epoch": 0.61, + "learning_rate": 0.00020788426594363122, + "loss": 0.0134, "step": 236910 }, { - "epoch": 1.2, - "learning_rate": 0.00012070621711206744, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020788037772725973, + "loss": 0.0159, "step": 236920 }, { - "epoch": 1.2, - "learning_rate": 0.00012069864941905342, - "loss": 0.0101, + "epoch": 0.61, + "learning_rate": 0.0002078764895108883, + "loss": 0.018, "step": 236930 }, { - "epoch": 1.2, - "learning_rate": 0.00012069108172603942, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.00020787260129451684, + "loss": 0.0144, "step": 236940 }, { - "epoch": 1.2, - "learning_rate": 0.0001206835140330254, - "loss": 0.0107, + "epoch": 0.61, + "learning_rate": 0.00020786871307814536, + "loss": 0.0177, "step": 236950 }, { - "epoch": 1.2, - "learning_rate": 0.00012067594634001139, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020786482486177387, + "loss": 0.0158, "step": 236960 }, { - "epoch": 1.2, - "learning_rate": 0.00012066837864699739, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.0002078609366454024, + "loss": 0.0177, "step": 236970 }, { - "epoch": 1.2, - "learning_rate": 0.00012066081095398337, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020785704842903098, + "loss": 0.0151, "step": 236980 }, { - "epoch": 1.2, - "learning_rate": 0.00012065324326096936, - "loss": 0.008, + "epoch": 0.61, + "learning_rate": 0.0002078531602126595, + "loss": 0.0203, "step": 236990 }, { - "epoch": 1.2, - "learning_rate": 0.00012064567556795536, - "loss": 0.0089, + "epoch": 0.61, + "learning_rate": 0.00020784927199628804, + "loss": 0.0132, "step": 237000 }, { - "epoch": 1.2, - "eval_cer": 0.9144498775845288, - "eval_loss": 0.006527193821966648, - "eval_runtime": 116.0102, - "eval_samples_per_second": 17.24, - "eval_steps_per_second": 4.31, + "epoch": 0.61, + "eval_cer": 0.8817908634500211, + "eval_loss": 0.011273314245045185, + "eval_runtime": 107.1971, + "eval_samples_per_second": 18.657, + "eval_steps_per_second": 4.664, "step": 237000 }, { - "epoch": 1.2, - "learning_rate": 0.00012063810787494134, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020784538377991655, + "loss": 0.0184, "step": 237010 }, { - "epoch": 1.2, - "learning_rate": 0.00012063054018192733, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020784149556354512, + "loss": 0.0164, "step": 237020 }, { - "epoch": 1.2, - "learning_rate": 0.00012062297248891332, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020783760734717363, + "loss": 0.0196, "step": 237030 }, { - "epoch": 1.2, - "learning_rate": 0.00012061540479589931, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020783371913080218, + "loss": 0.0176, "step": 237040 }, { - "epoch": 1.2, - "learning_rate": 0.0001206078371028853, - "loss": 0.0085, + "epoch": 0.61, + "learning_rate": 0.0002078298309144307, + "loss": 0.0153, "step": 237050 }, { - "epoch": 1.2, - "learning_rate": 0.00012060026940987129, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020782594269805926, + "loss": 0.0163, "step": 237060 }, { - "epoch": 1.2, - "learning_rate": 0.00012059270171685728, - "loss": 0.0082, + "epoch": 0.61, + "learning_rate": 0.00020782205448168777, + "loss": 0.0149, "step": 237070 }, { - "epoch": 1.2, - "learning_rate": 0.00012058513402384328, - "loss": 0.009, + "epoch": 0.61, + "learning_rate": 0.00020781816626531632, + "loss": 0.0181, "step": 237080 }, { - "epoch": 1.2, - "learning_rate": 0.00012057756633082926, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020781427804894483, + "loss": 0.0136, "step": 237090 }, { - "epoch": 1.2, - "learning_rate": 0.00012056999863781525, - "loss": 0.0083, + "epoch": 0.61, + "learning_rate": 0.0002078103898325734, + "loss": 0.0215, "step": 237100 }, { - "epoch": 1.2, - "learning_rate": 0.00012056243094480124, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.0002078065016162019, + "loss": 0.0142, "step": 237110 }, { - "epoch": 1.2, - "learning_rate": 0.00012055486325178723, - "loss": 0.0087, + "epoch": 0.61, + "learning_rate": 0.00020780261339983045, + "loss": 0.0179, "step": 237120 }, { - "epoch": 1.2, - "learning_rate": 0.00012054729555877323, - "loss": 0.0056, + "epoch": 0.61, + "learning_rate": 0.00020779872518345897, + "loss": 0.0206, "step": 237130 }, { - "epoch": 1.2, - "learning_rate": 0.00012053972786575921, - "loss": 0.0098, + "epoch": 0.61, + "learning_rate": 0.00020779483696708754, + "loss": 0.0134, "step": 237140 }, { - "epoch": 1.2, - "learning_rate": 0.0001205321601727452, - "loss": 0.0074, + "epoch": 0.61, + "learning_rate": 0.00020779094875071608, + "loss": 0.017, "step": 237150 }, { - "epoch": 1.2, - "learning_rate": 0.0001205245924797312, - "loss": 0.01, + "epoch": 0.61, + "learning_rate": 0.0002077870605343446, + "loss": 0.0202, "step": 237160 }, { - "epoch": 1.2, - "learning_rate": 0.00012051702478671718, - "loss": 0.0059, + "epoch": 0.61, + "learning_rate": 0.00020778317231797314, + "loss": 0.0167, "step": 237170 }, { - "epoch": 1.2, - "learning_rate": 0.00012050945709370317, - "loss": 0.0088, + "epoch": 0.61, + "learning_rate": 0.00020777928410160168, + "loss": 0.0147, "step": 237180 }, { - "epoch": 1.2, - "learning_rate": 0.00012050188940068915, - "loss": 0.0105, + "epoch": 0.61, + "learning_rate": 0.00020777539588523022, + "loss": 0.0198, "step": 237190 }, { - "epoch": 1.2, - "learning_rate": 0.00012049432170767515, - "loss": 0.0096, + "epoch": 0.61, + "learning_rate": 0.00020777150766885873, + "loss": 0.0188, "step": 237200 }, { - "epoch": 1.2, - "learning_rate": 0.00012048675401466114, - "loss": 0.0077, + "epoch": 0.61, + "learning_rate": 0.00020776761945248728, + "loss": 0.0152, "step": 237210 }, { - "epoch": 1.2, - "learning_rate": 0.00012047918632164713, - "loss": 0.0107, + "epoch": 0.61, + "learning_rate": 0.0002077637312361158, + "loss": 0.0217, "step": 237220 }, { - "epoch": 1.2, - "learning_rate": 0.00012047161862863312, - "loss": 0.0078, + "epoch": 0.61, + "learning_rate": 0.00020775984301974436, + "loss": 0.0177, "step": 237230 }, { - "epoch": 1.2, - "learning_rate": 0.00012046405093561909, - "loss": 0.0099, + "epoch": 0.61, + "learning_rate": 0.00020775595480337287, + "loss": 0.0179, "step": 237240 }, { - "epoch": 1.2, - "learning_rate": 0.00012045648324260508, - "loss": 0.0119, + "epoch": 0.61, + "learning_rate": 0.00020775206658700141, + "loss": 0.0174, "step": 237250 }, { - "epoch": 1.2, - "learning_rate": 0.00012044891554959108, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.00020774817837062993, + "loss": 0.0154, "step": 237260 }, { - "epoch": 1.2, - "learning_rate": 0.00012044134785657706, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.0002077442901542585, + "loss": 0.0177, "step": 237270 }, { - "epoch": 1.2, - "learning_rate": 0.00012043378016356306, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.000207740401937887, + "loss": 0.0133, "step": 237280 }, { - "epoch": 1.2, - "learning_rate": 0.00012042621247054905, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020773651372151555, + "loss": 0.0163, "step": 237290 }, { - "epoch": 1.2, - "learning_rate": 0.00012041864477753503, - "loss": 0.0121, + "epoch": 0.62, + "learning_rate": 0.00020773262550514407, + "loss": 0.0136, "step": 237300 }, { - "epoch": 1.2, - "learning_rate": 0.00012041107708452103, - "loss": 0.0133, + "epoch": 0.62, + "learning_rate": 0.00020772873728877264, + "loss": 0.0145, "step": 237310 }, { - "epoch": 1.2, - "learning_rate": 0.00012040350939150701, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020772484907240118, + "loss": 0.0143, "step": 237320 }, { - "epoch": 1.2, - "learning_rate": 0.000120395941698493, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002077209608560297, + "loss": 0.0147, "step": 237330 }, { - "epoch": 1.2, - "learning_rate": 0.000120388374005479, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020771707263965824, + "loss": 0.0192, "step": 237340 }, { - "epoch": 1.2, - "learning_rate": 0.00012038080631246498, - "loss": 0.0112, + "epoch": 0.62, + "learning_rate": 0.00020771318442328678, + "loss": 0.0156, "step": 237350 }, { - "epoch": 1.2, - "learning_rate": 0.00012037323861945097, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020770929620691532, + "loss": 0.0174, "step": 237360 }, { - "epoch": 1.2, - "learning_rate": 0.00012036567092643697, - "loss": 0.0113, + "epoch": 0.62, + "learning_rate": 0.00020770540799054383, + "loss": 0.0151, "step": 237370 }, { - "epoch": 1.2, - "learning_rate": 0.00012035810323342295, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020770151977417237, + "loss": 0.0175, "step": 237380 }, { - "epoch": 1.2, - "learning_rate": 0.00012035053554040895, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020769763155780092, + "loss": 0.0184, "step": 237390 }, { - "epoch": 1.2, - "learning_rate": 0.00012034296784739493, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020769374334142946, + "loss": 0.02, "step": 237400 }, { - "epoch": 1.2, - "learning_rate": 0.00012033540015438092, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020768985512505797, + "loss": 0.0147, "step": 237410 }, { - "epoch": 1.2, - "learning_rate": 0.00012032783246136692, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020768596690868651, + "loss": 0.0147, "step": 237420 }, { - "epoch": 1.2, - "learning_rate": 0.0001203202647683529, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020768207869231506, + "loss": 0.0162, "step": 237430 }, { - "epoch": 1.2, - "learning_rate": 0.0001203126970753389, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.0002076781904759436, + "loss": 0.0178, "step": 237440 }, { - "epoch": 1.2, - "learning_rate": 0.00012030512938232489, - "loss": 0.0109, + "epoch": 0.62, + "learning_rate": 0.0002076743022595721, + "loss": 0.0188, "step": 237450 }, { - "epoch": 1.2, - "learning_rate": 0.00012029756168931087, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020767041404320065, + "loss": 0.0158, "step": 237460 }, { - "epoch": 1.2, - "learning_rate": 0.00012028999399629687, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020766652582682917, + "loss": 0.0171, "step": 237470 }, { - "epoch": 1.2, - "learning_rate": 0.00012028242630328285, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020766263761045774, + "loss": 0.0135, "step": 237480 }, { - "epoch": 1.2, - "learning_rate": 0.00012027485861026884, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020765874939408628, + "loss": 0.018, "step": 237490 }, { - "epoch": 1.2, - "learning_rate": 0.00012026729091725484, - "loss": 0.0116, + "epoch": 0.62, + "learning_rate": 0.0002076548611777148, + "loss": 0.0115, "step": 237500 }, { - "epoch": 1.2, - "learning_rate": 0.00012025972322424082, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002076509729613433, + "loss": 0.0193, "step": 237510 }, { - "epoch": 1.2, - "learning_rate": 0.00012025215553122681, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020764708474497188, + "loss": 0.0169, "step": 237520 }, { - "epoch": 1.2, - "learning_rate": 0.00012024458783821281, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020764319652860042, + "loss": 0.0165, "step": 237530 }, { - "epoch": 1.2, - "learning_rate": 0.00012023702014519879, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020763930831222893, + "loss": 0.016, "step": 237540 }, { - "epoch": 1.2, - "learning_rate": 0.00012022945245218478, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.00020763542009585747, + "loss": 0.0167, "step": 237550 }, { - "epoch": 1.2, - "learning_rate": 0.00012022188475917077, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020763153187948602, + "loss": 0.0224, "step": 237560 }, { - "epoch": 1.2, - "learning_rate": 0.00012021431706615676, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.00020762764366311456, + "loss": 0.0151, "step": 237570 }, { - "epoch": 1.2, - "learning_rate": 0.00012020674937314276, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020762375544674307, + "loss": 0.0125, "step": 237580 }, { - "epoch": 1.2, - "learning_rate": 0.00012019918168012874, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002076198672303716, + "loss": 0.0156, "step": 237590 }, { - "epoch": 1.2, - "learning_rate": 0.00012019161398711473, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020761597901400016, + "loss": 0.018, "step": 237600 }, { - "epoch": 1.2, - "learning_rate": 0.00012018404629410073, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.0002076120907976287, + "loss": 0.0155, "step": 237610 }, { - "epoch": 1.2, - "learning_rate": 0.00012017647860108671, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.0002076082025812572, + "loss": 0.0158, "step": 237620 }, { - "epoch": 1.2, - "learning_rate": 0.0001201689109080727, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020760431436488575, + "loss": 0.0155, "step": 237630 }, { - "epoch": 1.2, - "learning_rate": 0.00012016134321505869, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020760042614851432, + "loss": 0.0173, "step": 237640 }, { - "epoch": 1.2, - "learning_rate": 0.00012015377552204468, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020759653793214284, + "loss": 0.0198, "step": 237650 }, { - "epoch": 1.2, - "learning_rate": 0.00012014620782903068, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.00020759264971577135, + "loss": 0.0182, "step": 237660 }, { - "epoch": 1.2, - "learning_rate": 0.00012013864013601666, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.0002075887614993999, + "loss": 0.0211, "step": 237670 }, { - "epoch": 1.2, - "learning_rate": 0.00012013107244300265, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020758487328302846, + "loss": 0.015, "step": 237680 }, { - "epoch": 1.2, - "learning_rate": 0.00012012350474998865, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020758098506665698, + "loss": 0.0156, "step": 237690 }, { - "epoch": 1.2, - "learning_rate": 0.00012011593705697463, - "loss": 0.0114, + "epoch": 0.62, + "learning_rate": 0.00020757709685028552, + "loss": 0.0172, "step": 237700 }, { - "epoch": 1.2, - "learning_rate": 0.00012010836936396062, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020757320863391403, + "loss": 0.0136, "step": 237710 }, { - "epoch": 1.2, - "learning_rate": 0.0001201008016709466, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020756932041754257, + "loss": 0.0148, "step": 237720 }, { - "epoch": 1.2, - "learning_rate": 0.0001200932339779326, - "loss": 0.0136, + "epoch": 0.62, + "learning_rate": 0.00020756543220117112, + "loss": 0.0158, "step": 237730 }, { - "epoch": 1.2, - "learning_rate": 0.0001200856662849186, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020756154398479966, + "loss": 0.0169, "step": 237740 }, { - "epoch": 1.2, - "learning_rate": 0.00012007809859190458, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020755765576842817, + "loss": 0.0127, "step": 237750 }, { - "epoch": 1.2, - "learning_rate": 0.00012007053089889057, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.0002075537675520567, + "loss": 0.0146, "step": 237760 }, { - "epoch": 1.2, - "learning_rate": 0.00012006296320587657, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020754987933568525, + "loss": 0.0174, "step": 237770 }, { - "epoch": 1.2, - "learning_rate": 0.00012005539551286255, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002075459911193138, + "loss": 0.0169, "step": 237780 }, { - "epoch": 1.2, - "learning_rate": 0.00012004782781984854, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002075421029029423, + "loss": 0.0166, "step": 237790 }, { - "epoch": 1.2, - "learning_rate": 0.00012004026012683452, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020753821468657085, + "loss": 0.0161, "step": 237800 }, { - "epoch": 1.2, - "learning_rate": 0.00012003269243382052, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020753432647019942, + "loss": 0.0141, "step": 237810 }, { - "epoch": 1.2, - "learning_rate": 0.00012002512474080651, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020753043825382794, + "loss": 0.0146, "step": 237820 }, { - "epoch": 1.2, - "learning_rate": 0.0001200175570477925, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020752655003745645, + "loss": 0.0148, "step": 237830 }, { - "epoch": 1.2, - "learning_rate": 0.00012000998935477849, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.000207522661821085, + "loss": 0.013, "step": 237840 }, { - "epoch": 1.2, - "learning_rate": 0.00012000242166176449, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.00020751877360471356, + "loss": 0.0121, "step": 237850 }, { - "epoch": 1.2, - "learning_rate": 0.00011999485396875047, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020751488538834208, + "loss": 0.0161, "step": 237860 }, { - "epoch": 1.2, - "learning_rate": 0.00011998728627573645, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020751099717197062, + "loss": 0.0184, "step": 237870 }, { - "epoch": 1.2, - "learning_rate": 0.00011997971858272243, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020750710895559913, + "loss": 0.0162, "step": 237880 }, { - "epoch": 1.2, - "learning_rate": 0.00011997215088970843, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002075032207392277, + "loss": 0.0142, "step": 237890 }, { - "epoch": 1.2, - "learning_rate": 0.00011996458319669442, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020749933252285621, + "loss": 0.0163, "step": 237900 }, { - "epoch": 1.2, - "learning_rate": 0.0001199570155036804, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020749544430648476, + "loss": 0.0137, "step": 237910 }, { - "epoch": 1.2, - "learning_rate": 0.0001199494478106664, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020749155609011327, + "loss": 0.0207, "step": 237920 }, { - "epoch": 1.2, - "learning_rate": 0.00011994188011765238, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020748766787374184, + "loss": 0.0163, "step": 237930 }, { - "epoch": 1.2, - "learning_rate": 0.00011993431242463837, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020748377965737035, + "loss": 0.0193, "step": 237940 }, { - "epoch": 1.2, - "learning_rate": 0.00011992674473162437, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002074798914409989, + "loss": 0.0161, "step": 237950 }, { - "epoch": 1.2, - "learning_rate": 0.00011991917703861035, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002074760032246274, + "loss": 0.0155, "step": 237960 }, { - "epoch": 1.2, - "learning_rate": 0.00011991160934559634, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020747211500825595, + "loss": 0.0198, "step": 237970 }, { - "epoch": 1.2, - "learning_rate": 0.00011990404165258234, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.0002074682267918845, + "loss": 0.016, "step": 237980 }, { - "epoch": 1.2, - "learning_rate": 0.00011989647395956832, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020746433857551304, + "loss": 0.0142, "step": 237990 }, { - "epoch": 1.2, - "learning_rate": 0.00011988890626655432, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020746045035914155, + "loss": 0.0152, "step": 238000 }, { - "epoch": 1.2, - "eval_cer": 0.9144586111496574, - "eval_loss": 0.006760002113878727, - "eval_runtime": 116.0385, - "eval_samples_per_second": 17.236, - "eval_steps_per_second": 4.309, + "epoch": 0.62, + "eval_cer": 0.8817488743419957, + "eval_loss": 0.01096505206078291, + "eval_runtime": 107.3808, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, "step": 238000 }, { - "epoch": 1.2, - "learning_rate": 0.0001198813385735403, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.0002074565621427701, + "loss": 0.0163, "step": 238010 }, { - "epoch": 1.2, - "learning_rate": 0.00011987377088052629, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020745267392639866, + "loss": 0.0175, "step": 238020 }, { - "epoch": 1.2, - "learning_rate": 0.00011986620318751229, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020744878571002717, + "loss": 0.0179, "step": 238030 }, { - "epoch": 1.2, - "learning_rate": 0.00011985863549449827, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020744489749365572, + "loss": 0.0163, "step": 238040 }, { - "epoch": 1.2, - "learning_rate": 0.00011985106780148426, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020744100927728423, + "loss": 0.0147, "step": 238050 }, { - "epoch": 1.2, - "learning_rate": 0.00011984350010847026, - "loss": 0.0071, + "epoch": 0.62, + "learning_rate": 0.0002074371210609128, + "loss": 0.0256, "step": 238060 }, { - "epoch": 1.2, - "learning_rate": 0.00011983593241545624, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020743323284454131, + "loss": 0.0223, "step": 238070 }, { - "epoch": 1.2, - "learning_rate": 0.00011982836472244224, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020742934462816986, + "loss": 0.0172, "step": 238080 }, { - "epoch": 1.2, - "learning_rate": 0.00011982079702942822, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020742545641179837, + "loss": 0.0153, "step": 238090 }, { - "epoch": 1.2, - "learning_rate": 0.00011981322933641421, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020742156819542694, + "loss": 0.0157, "step": 238100 }, { - "epoch": 1.2, - "learning_rate": 0.0001198056616434002, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020741767997905545, + "loss": 0.0158, "step": 238110 }, { - "epoch": 1.2, - "learning_rate": 0.00011979809395038619, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.000207413791762684, + "loss": 0.0131, "step": 238120 }, { - "epoch": 1.2, - "learning_rate": 0.00011979052625737218, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.0002074099035463125, + "loss": 0.0155, "step": 238130 }, { - "epoch": 1.2, - "learning_rate": 0.00011978295856435818, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.00020740601532994108, + "loss": 0.0161, "step": 238140 }, { - "epoch": 1.2, - "learning_rate": 0.00011977539087134416, - "loss": 0.0115, + "epoch": 0.62, + "learning_rate": 0.0002074021271135696, + "loss": 0.0182, "step": 238150 }, { - "epoch": 1.2, - "learning_rate": 0.00011976782317833015, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020739823889719813, + "loss": 0.0186, "step": 238160 }, { - "epoch": 1.2, - "learning_rate": 0.00011976025548531614, - "loss": 0.0112, + "epoch": 0.62, + "learning_rate": 0.00020739435068082665, + "loss": 0.0176, "step": 238170 }, { - "epoch": 1.2, - "learning_rate": 0.00011975268779230213, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020739046246445522, + "loss": 0.0168, "step": 238180 }, { - "epoch": 1.2, - "learning_rate": 0.00011974512009928813, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020738657424808376, + "loss": 0.0153, "step": 238190 }, { - "epoch": 1.2, - "learning_rate": 0.00011973755240627411, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020738268603171227, + "loss": 0.0147, "step": 238200 }, { - "epoch": 1.2, - "learning_rate": 0.0001197299847132601, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020737879781534082, + "loss": 0.0165, "step": 238210 }, { - "epoch": 1.2, - "learning_rate": 0.0001197224170202461, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020737490959896933, + "loss": 0.0179, "step": 238220 }, { - "epoch": 1.2, - "learning_rate": 0.00011971484932723208, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.0002073710213825979, + "loss": 0.0146, "step": 238230 }, { - "epoch": 1.2, - "learning_rate": 0.00011970728163421807, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002073671331662264, + "loss": 0.0174, "step": 238240 }, { - "epoch": 1.2, - "learning_rate": 0.00011969971394120406, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020736324494985496, + "loss": 0.0138, "step": 238250 }, { - "epoch": 1.2, - "learning_rate": 0.00011969214624819005, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020735935673348347, + "loss": 0.0124, "step": 238260 }, { - "epoch": 1.2, - "learning_rate": 0.00011968457855517605, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020735546851711204, + "loss": 0.0167, "step": 238270 }, { - "epoch": 1.2, - "learning_rate": 0.00011967701086216203, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020735158030074055, + "loss": 0.0171, "step": 238280 }, { - "epoch": 1.2, - "learning_rate": 0.00011966944316914802, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.0002073476920843691, + "loss": 0.0147, "step": 238290 }, { - "epoch": 1.2, - "learning_rate": 0.00011966187547613402, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.0002073438038679976, + "loss": 0.0151, "step": 238300 }, { - "epoch": 1.2, - "learning_rate": 0.00011965430778312, - "loss": 0.0098, + "epoch": 0.62, + "learning_rate": 0.00020733991565162618, + "loss": 0.0145, "step": 238310 }, { - "epoch": 1.2, - "learning_rate": 0.00011964674009010599, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.0002073360274352547, + "loss": 0.0186, "step": 238320 }, { - "epoch": 1.2, - "learning_rate": 0.00011963917239709199, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020733213921888323, + "loss": 0.02, "step": 238330 }, { - "epoch": 1.2, - "learning_rate": 0.00011963160470407797, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.00020732825100251175, + "loss": 0.0177, "step": 238340 }, { - "epoch": 1.2, - "learning_rate": 0.00011962403701106396, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020732436278614032, + "loss": 0.0168, "step": 238350 }, { - "epoch": 1.2, - "learning_rate": 0.00011961646931804995, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.00020732047456976886, + "loss": 0.0124, "step": 238360 }, { - "epoch": 1.2, - "learning_rate": 0.00011960890162503594, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020731658635339737, + "loss": 0.0166, "step": 238370 }, { - "epoch": 1.2, - "learning_rate": 0.00011960133393202194, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.0002073126981370259, + "loss": 0.0106, "step": 238380 }, { - "epoch": 1.2, - "learning_rate": 0.00011959376623900792, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020730880992065446, + "loss": 0.018, "step": 238390 }, { - "epoch": 1.2, - "learning_rate": 0.00011958619854599391, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.000207304921704283, + "loss": 0.0165, "step": 238400 }, { - "epoch": 1.2, - "learning_rate": 0.00011957863085297991, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002073010334879115, + "loss": 0.0175, "step": 238410 }, { - "epoch": 1.2, - "learning_rate": 0.00011957106315996589, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020729714527154005, + "loss": 0.0172, "step": 238420 }, { - "epoch": 1.2, - "learning_rate": 0.00011956349546695188, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.0002072932570551686, + "loss": 0.0213, "step": 238430 }, { - "epoch": 1.2, - "learning_rate": 0.00011955592777393787, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020728936883879714, + "loss": 0.0167, "step": 238440 }, { - "epoch": 1.2, - "learning_rate": 0.00011954836008092386, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020728548062242565, + "loss": 0.0139, "step": 238450 }, { - "epoch": 1.2, - "learning_rate": 0.00011954079238790986, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.0002072815924060542, + "loss": 0.0189, "step": 238460 }, { - "epoch": 1.2, - "learning_rate": 0.00011953322469489584, - "loss": 0.0066, + "epoch": 0.62, + "learning_rate": 0.0002072777041896827, + "loss": 0.0136, "step": 238470 }, { - "epoch": 1.2, - "learning_rate": 0.00011952565700188183, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020727381597331128, + "loss": 0.0181, "step": 238480 }, { - "epoch": 1.2, - "learning_rate": 0.00011951808930886783, - "loss": 0.0117, + "epoch": 0.62, + "learning_rate": 0.0002072699277569398, + "loss": 0.0169, "step": 238490 }, { - "epoch": 1.2, - "learning_rate": 0.0001195105216158538, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020726603954056833, + "loss": 0.0149, "step": 238500 }, { - "epoch": 1.2, - "learning_rate": 0.00011950295392283979, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020726215132419685, + "loss": 0.0157, "step": 238510 }, { - "epoch": 1.2, - "learning_rate": 0.00011949538622982577, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020725826310782542, + "loss": 0.0139, "step": 238520 }, { - "epoch": 1.2, - "learning_rate": 0.00011948781853681177, - "loss": 0.0072, + "epoch": 0.62, + "learning_rate": 0.00020725437489145396, + "loss": 0.0153, "step": 238530 }, { - "epoch": 1.2, - "learning_rate": 0.00011948025084379775, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020725048667508247, + "loss": 0.0112, "step": 238540 }, { - "epoch": 1.2, - "learning_rate": 0.00011947268315078374, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.000207246598458711, + "loss": 0.0126, "step": 238550 }, { - "epoch": 1.2, - "learning_rate": 0.00011946511545776974, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020724271024233956, + "loss": 0.0189, "step": 238560 }, { - "epoch": 1.2, - "learning_rate": 0.00011945754776475572, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.0002072388220259681, + "loss": 0.0143, "step": 238570 }, { - "epoch": 1.2, - "learning_rate": 0.00011944998007174171, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.0002072349338095966, + "loss": 0.0157, "step": 238580 }, { - "epoch": 1.2, - "learning_rate": 0.00011944241237872771, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020723104559322515, + "loss": 0.0127, "step": 238590 }, { - "epoch": 1.2, - "learning_rate": 0.00011943484468571369, - "loss": 0.0134, + "epoch": 0.62, + "learning_rate": 0.0002072271573768537, + "loss": 0.0206, "step": 238600 }, { - "epoch": 1.2, - "learning_rate": 0.00011942727699269969, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020722326916048224, + "loss": 0.0168, "step": 238610 }, { - "epoch": 1.2, - "learning_rate": 0.00011941970929968567, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020721938094411075, + "loss": 0.0131, "step": 238620 }, { - "epoch": 1.2, - "learning_rate": 0.00011941214160667166, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.0002072154927277393, + "loss": 0.0129, "step": 238630 }, { - "epoch": 1.2, - "learning_rate": 0.00011940457391365766, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020721160451136783, + "loss": 0.0146, "step": 238640 }, { - "epoch": 1.2, - "learning_rate": 0.00011939700622064364, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020720771629499638, + "loss": 0.0104, "step": 238650 }, { - "epoch": 1.2, - "learning_rate": 0.00011938943852762963, - "loss": 0.006, + "epoch": 0.62, + "learning_rate": 0.0002072038280786249, + "loss": 0.0157, "step": 238660 }, { - "epoch": 1.2, - "learning_rate": 0.00011938187083461563, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020719993986225343, + "loss": 0.0151, "step": 238670 }, { - "epoch": 1.2, - "learning_rate": 0.00011937430314160161, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020719605164588195, + "loss": 0.0214, "step": 238680 }, { - "epoch": 1.2, - "learning_rate": 0.0001193667354485876, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020719216342951052, + "loss": 0.0167, "step": 238690 }, { - "epoch": 1.2, - "learning_rate": 0.00011935916775557359, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020718827521313903, + "loss": 0.0163, "step": 238700 }, { - "epoch": 1.2, - "learning_rate": 0.00011935160006255958, - "loss": 0.0154, + "epoch": 0.62, + "learning_rate": 0.00020718438699676757, + "loss": 0.0166, "step": 238710 }, { - "epoch": 1.2, - "learning_rate": 0.00011934403236954558, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002071804987803961, + "loss": 0.0189, "step": 238720 }, { - "epoch": 1.2, - "learning_rate": 0.00011933646467653156, - "loss": 0.011, + "epoch": 0.62, + "learning_rate": 0.00020717661056402466, + "loss": 0.0168, "step": 238730 }, { - "epoch": 1.2, - "learning_rate": 0.00011932889698351755, + "epoch": 0.62, + "learning_rate": 0.0002071727223476532, "loss": 0.014, "step": 238740 }, { - "epoch": 1.2, - "learning_rate": 0.00011932132929050355, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.0002071688341312817, + "loss": 0.0184, "step": 238750 }, { - "epoch": 1.2, - "learning_rate": 0.00011931376159748953, - "loss": 0.0136, + "epoch": 0.62, + "learning_rate": 0.00020716494591491025, + "loss": 0.0132, "step": 238760 }, { - "epoch": 1.2, - "learning_rate": 0.00011930619390447552, - "loss": 0.0114, + "epoch": 0.62, + "learning_rate": 0.0002071610576985388, + "loss": 0.0194, "step": 238770 }, { - "epoch": 1.2, - "learning_rate": 0.00011929862621146152, - "loss": 0.0117, + "epoch": 0.62, + "learning_rate": 0.00020715716948216734, + "loss": 0.0154, "step": 238780 }, { - "epoch": 1.2, - "learning_rate": 0.0001192910585184475, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020715328126579585, + "loss": 0.0195, "step": 238790 }, { - "epoch": 1.2, - "learning_rate": 0.0001192834908254335, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002071493930494244, + "loss": 0.018, "step": 238800 }, { - "epoch": 1.2, - "learning_rate": 0.00011927592313241948, - "loss": 0.0109, + "epoch": 0.62, + "learning_rate": 0.00020714550483305293, + "loss": 0.014, "step": 238810 }, { - "epoch": 1.2, - "learning_rate": 0.00011926835543940547, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020714161661668148, + "loss": 0.0128, "step": 238820 }, { - "epoch": 1.2, - "learning_rate": 0.00011926078774639147, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020713772840031, + "loss": 0.0149, "step": 238830 }, { - "epoch": 1.2, - "learning_rate": 0.00011925322005337745, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020713384018393853, + "loss": 0.0185, "step": 238840 }, { - "epoch": 1.21, - "learning_rate": 0.00011924565236036344, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020712995196756707, + "loss": 0.0187, "step": 238850 }, { - "epoch": 1.21, - "learning_rate": 0.00011923808466734944, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020712606375119562, + "loss": 0.0177, "step": 238860 }, { - "epoch": 1.21, - "learning_rate": 0.00011923051697433542, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020712217553482413, + "loss": 0.0138, "step": 238870 }, { - "epoch": 1.21, - "learning_rate": 0.00011922294928132141, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020711828731845267, + "loss": 0.0162, "step": 238880 }, { - "epoch": 1.21, - "learning_rate": 0.0001192153815883074, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020711439910208124, + "loss": 0.0146, "step": 238890 }, { - "epoch": 1.21, - "learning_rate": 0.00011920781389529339, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020711051088570975, + "loss": 0.016, "step": 238900 }, { - "epoch": 1.21, - "learning_rate": 0.00011920024620227939, - "loss": 0.0132, + "epoch": 0.62, + "learning_rate": 0.0002071066226693383, + "loss": 0.0137, "step": 238910 }, { - "epoch": 1.21, - "learning_rate": 0.00011919267850926537, - "loss": 0.0115, + "epoch": 0.62, + "learning_rate": 0.0002071027344529668, + "loss": 0.0151, "step": 238920 }, { - "epoch": 1.21, - "learning_rate": 0.00011918511081625136, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020709884623659535, + "loss": 0.0152, "step": 238930 }, { - "epoch": 1.21, - "learning_rate": 0.00011917754312323736, - "loss": 0.0087, - "step": 238940 + "epoch": 0.62, + "learning_rate": 0.0002070949580202239, + "loss": 0.0196, + "step": 238940 }, { - "epoch": 1.21, - "learning_rate": 0.00011916997543022334, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020709106980385244, + "loss": 0.0142, "step": 238950 }, { - "epoch": 1.21, - "learning_rate": 0.00011916240773720933, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020708718158748095, + "loss": 0.0158, "step": 238960 }, { - "epoch": 1.21, - "learning_rate": 0.00011915484004419532, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002070832933711095, + "loss": 0.0182, "step": 238970 }, { - "epoch": 1.21, - "learning_rate": 0.00011914727235118131, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020707940515473803, + "loss": 0.0156, "step": 238980 }, { - "epoch": 1.21, - "learning_rate": 0.0001191397046581673, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.00020707551693836658, + "loss": 0.0147, "step": 238990 }, { - "epoch": 1.21, - "learning_rate": 0.00011913213696515329, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.0002070716287219951, + "loss": 0.0146, "step": 239000 }, { - "epoch": 1.21, - "eval_cer": 0.914452788772905, - "eval_loss": 0.006802674382925034, - "eval_runtime": 116.1446, - "eval_samples_per_second": 17.22, - "eval_steps_per_second": 4.305, + "epoch": 0.62, + "eval_cer": 0.8817236808771804, + "eval_loss": 0.011040524579584599, + "eval_runtime": 107.4536, + "eval_samples_per_second": 18.613, + "eval_steps_per_second": 4.653, "step": 239000 }, { - "epoch": 1.21, - "learning_rate": 0.00011912456927213928, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020706774050562363, + "loss": 0.0144, "step": 239010 }, { - "epoch": 1.21, - "learning_rate": 0.00011911700157912528, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020706385228925217, + "loss": 0.0217, "step": 239020 }, { - "epoch": 1.21, - "learning_rate": 0.00011910943388611126, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020705996407288071, + "loss": 0.0157, "step": 239030 }, { - "epoch": 1.21, - "learning_rate": 0.00011910186619309725, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020705607585650923, + "loss": 0.0138, "step": 239040 }, { - "epoch": 1.21, - "learning_rate": 0.00011909429850008323, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020705218764013777, + "loss": 0.0167, "step": 239050 }, { - "epoch": 1.21, - "learning_rate": 0.00011908673080706923, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020704829942376634, + "loss": 0.0188, "step": 239060 }, { - "epoch": 1.21, - "learning_rate": 0.00011907916311405522, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020704441120739485, + "loss": 0.0139, "step": 239070 }, { - "epoch": 1.21, - "learning_rate": 0.0001190715954210412, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.0002070405229910234, + "loss": 0.0108, "step": 239080 }, { - "epoch": 1.21, - "learning_rate": 0.0001190640277280272, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002070366347746519, + "loss": 0.015, "step": 239090 }, { - "epoch": 1.21, - "learning_rate": 0.0001190564600350132, - "loss": 0.007, + "epoch": 0.62, + "learning_rate": 0.00020703274655828048, + "loss": 0.017, "step": 239100 }, { - "epoch": 1.21, - "learning_rate": 0.00011904889234199918, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.000207028858341909, + "loss": 0.0127, "step": 239110 }, { - "epoch": 1.21, - "learning_rate": 0.00011904132464898517, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020702497012553754, + "loss": 0.0187, "step": 239120 }, { - "epoch": 1.21, - "learning_rate": 0.00011903375695597114, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020702108190916605, + "loss": 0.0178, "step": 239130 }, { - "epoch": 1.21, - "learning_rate": 0.00011902618926295714, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020701719369279462, + "loss": 0.0116, "step": 239140 }, { - "epoch": 1.21, - "learning_rate": 0.00011901862156994312, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020701330547642313, + "loss": 0.018, "step": 239150 }, { - "epoch": 1.21, - "learning_rate": 0.00011901105387692911, - "loss": 0.0069, + "epoch": 0.62, + "learning_rate": 0.00020700941726005167, + "loss": 0.0163, "step": 239160 }, { - "epoch": 1.21, - "learning_rate": 0.00011900348618391511, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002070055290436802, + "loss": 0.0118, "step": 239170 }, { - "epoch": 1.21, - "learning_rate": 0.00011899591849090109, - "loss": 0.0115, + "epoch": 0.62, + "learning_rate": 0.00020700164082730873, + "loss": 0.0171, "step": 239180 }, { - "epoch": 1.21, - "learning_rate": 0.00011898835079788708, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020699775261093727, + "loss": 0.0176, "step": 239190 }, { - "epoch": 1.21, - "learning_rate": 0.00011898078310487308, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020699386439456581, + "loss": 0.0148, "step": 239200 }, { - "epoch": 1.21, - "learning_rate": 0.00011897321541185906, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020698997617819433, + "loss": 0.0154, "step": 239210 }, { - "epoch": 1.21, - "learning_rate": 0.00011896564771884505, - "loss": 0.0087, + "epoch": 0.62, + "learning_rate": 0.00020698608796182287, + "loss": 0.0136, "step": 239220 }, { - "epoch": 1.21, - "learning_rate": 0.00011895808002583105, - "loss": 0.0114, + "epoch": 0.62, + "learning_rate": 0.00020698219974545144, + "loss": 0.0136, "step": 239230 }, { - "epoch": 1.21, - "learning_rate": 0.00011895051233281703, - "loss": 0.0121, + "epoch": 0.62, + "learning_rate": 0.00020697831152907995, + "loss": 0.0143, "step": 239240 }, { - "epoch": 1.21, - "learning_rate": 0.00011894294463980303, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020697442331270847, + "loss": 0.0135, "step": 239250 }, { - "epoch": 1.21, - "learning_rate": 0.00011893537694678901, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.000206970535096337, + "loss": 0.0133, "step": 239260 }, { - "epoch": 1.21, - "learning_rate": 0.000118927809253775, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020696664687996558, + "loss": 0.0211, "step": 239270 }, { - "epoch": 1.21, - "learning_rate": 0.000118920241560761, - "loss": 0.0069, + "epoch": 0.62, + "learning_rate": 0.0002069627586635941, + "loss": 0.0163, "step": 239280 }, { - "epoch": 1.21, - "learning_rate": 0.00011891267386774698, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020695887044722263, + "loss": 0.0158, "step": 239290 }, { - "epoch": 1.21, - "learning_rate": 0.00011890510617473297, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020695498223085115, + "loss": 0.0159, "step": 239300 }, { - "epoch": 1.21, - "learning_rate": 0.00011889753848171897, - "loss": 0.0109, + "epoch": 0.62, + "learning_rate": 0.00020695109401447972, + "loss": 0.0187, "step": 239310 }, { - "epoch": 1.21, - "learning_rate": 0.00011888997078870495, - "loss": 0.0067, + "epoch": 0.62, + "learning_rate": 0.00020694720579810823, + "loss": 0.0158, "step": 239320 }, { - "epoch": 1.21, - "learning_rate": 0.00011888240309569095, - "loss": 0.0119, + "epoch": 0.62, + "learning_rate": 0.00020694331758173677, + "loss": 0.0164, "step": 239330 }, { - "epoch": 1.21, - "learning_rate": 0.00011887483540267693, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.0002069394293653653, + "loss": 0.0194, "step": 239340 }, { - "epoch": 1.21, - "learning_rate": 0.00011886726770966292, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020693554114899386, + "loss": 0.014, "step": 239350 }, { - "epoch": 1.21, - "learning_rate": 0.00011885970001664892, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020693165293262237, + "loss": 0.0163, "step": 239360 }, { - "epoch": 1.21, - "learning_rate": 0.0001188521323236349, - "loss": 0.0122, + "epoch": 0.62, + "learning_rate": 0.00020692776471625091, + "loss": 0.0197, "step": 239370 }, { - "epoch": 1.21, - "learning_rate": 0.0001188445646306209, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020692387649987943, + "loss": 0.0155, "step": 239380 }, { - "epoch": 1.21, - "learning_rate": 0.00011883699693760689, - "loss": 0.0121, + "epoch": 0.62, + "learning_rate": 0.000206919988283508, + "loss": 0.0142, "step": 239390 }, { - "epoch": 1.21, - "learning_rate": 0.00011882942924459287, - "loss": 0.0157, + "epoch": 0.62, + "learning_rate": 0.00020691610006713654, + "loss": 0.0175, "step": 239400 }, { - "epoch": 1.21, - "learning_rate": 0.00011882186155157886, - "loss": 0.0116, + "epoch": 0.62, + "learning_rate": 0.00020691221185076505, + "loss": 0.0135, "step": 239410 }, { - "epoch": 1.21, - "learning_rate": 0.00011881429385856485, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020690832363439357, + "loss": 0.0155, "step": 239420 }, { - "epoch": 1.21, - "learning_rate": 0.00011880672616555084, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002069044354180221, + "loss": 0.0189, "step": 239430 }, { - "epoch": 1.21, - "learning_rate": 0.00011879915847253684, - "loss": 0.0129, + "epoch": 0.62, + "learning_rate": 0.00020690054720165068, + "loss": 0.0175, "step": 239440 }, { - "epoch": 1.21, - "learning_rate": 0.00011879159077952282, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002068966589852792, + "loss": 0.0157, "step": 239450 }, { - "epoch": 1.21, - "learning_rate": 0.00011878402308650881, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020689277076890773, + "loss": 0.0183, "step": 239460 }, { - "epoch": 1.21, - "learning_rate": 0.00011877645539349481, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020688888255253625, + "loss": 0.0159, "step": 239470 }, { - "epoch": 1.21, - "learning_rate": 0.00011876888770048079, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020688499433616482, + "loss": 0.0165, "step": 239480 }, { - "epoch": 1.21, - "learning_rate": 0.00011876132000746678, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020688110611979333, + "loss": 0.0156, "step": 239490 }, { - "epoch": 1.21, - "learning_rate": 0.00011875375231445277, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020687721790342187, + "loss": 0.0189, "step": 239500 }, { - "epoch": 1.21, - "learning_rate": 0.00011874618462143876, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002068733296870504, + "loss": 0.0172, "step": 239510 }, { - "epoch": 1.21, - "learning_rate": 0.00011873861692842476, - "loss": 0.0069, + "epoch": 0.62, + "learning_rate": 0.00020686944147067896, + "loss": 0.016, "step": 239520 }, { - "epoch": 1.21, - "learning_rate": 0.00011873104923541074, - "loss": 0.0066, + "epoch": 0.62, + "learning_rate": 0.00020686555325430747, + "loss": 0.0191, "step": 239530 }, { - "epoch": 1.21, - "learning_rate": 0.00011872348154239673, - "loss": 0.0062, + "epoch": 0.62, + "learning_rate": 0.000206861665037936, + "loss": 0.0171, "step": 239540 }, { - "epoch": 1.21, - "learning_rate": 0.00011871591384938273, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020685777682156453, + "loss": 0.011, "step": 239550 }, { - "epoch": 1.21, - "learning_rate": 0.00011870834615636871, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.0002068538886051931, + "loss": 0.0122, "step": 239560 }, { - "epoch": 1.21, - "learning_rate": 0.0001187007784633547, - "loss": 0.007, + "epoch": 0.62, + "learning_rate": 0.0002068500003888216, + "loss": 0.0125, "step": 239570 }, { - "epoch": 1.21, - "learning_rate": 0.00011869321077034068, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020684611217245015, + "loss": 0.0137, "step": 239580 }, { - "epoch": 1.21, - "learning_rate": 0.00011868564307732668, - "loss": 0.011, + "epoch": 0.62, + "learning_rate": 0.00020684222395607867, + "loss": 0.0164, "step": 239590 }, { - "epoch": 1.21, - "learning_rate": 0.00011867807538431267, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020683833573970724, + "loss": 0.0172, "step": 239600 }, { - "epoch": 1.21, - "learning_rate": 0.00011867050769129866, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020683444752333578, + "loss": 0.0152, "step": 239610 }, { - "epoch": 1.21, - "learning_rate": 0.00011866293999828465, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002068305593069643, + "loss": 0.0162, "step": 239620 }, { - "epoch": 1.21, - "learning_rate": 0.00011865537230527065, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.00020682667109059283, + "loss": 0.0141, "step": 239630 }, { - "epoch": 1.21, - "learning_rate": 0.00011864780461225663, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020682278287422138, + "loss": 0.0127, "step": 239640 }, { - "epoch": 1.21, - "learning_rate": 0.00011864023691924262, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020681889465784992, + "loss": 0.0135, "step": 239650 }, { - "epoch": 1.21, - "learning_rate": 0.0001186326692262286, - "loss": 0.0107, + "epoch": 0.62, + "learning_rate": 0.00020681500644147843, + "loss": 0.016, "step": 239660 }, { - "epoch": 1.21, - "learning_rate": 0.0001186251015332146, - "loss": 0.0118, + "epoch": 0.62, + "learning_rate": 0.00020681111822510697, + "loss": 0.0126, "step": 239670 }, { - "epoch": 1.21, - "learning_rate": 0.0001186175338402006, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.0002068072300087355, + "loss": 0.0137, "step": 239680 }, { - "epoch": 1.21, - "learning_rate": 0.00011860996614718658, - "loss": 0.0103, + "epoch": 0.62, + "learning_rate": 0.00020680334179236406, + "loss": 0.017, "step": 239690 }, { - "epoch": 1.21, - "learning_rate": 0.00011860239845417257, - "loss": 0.0054, + "epoch": 0.62, + "learning_rate": 0.00020679945357599257, + "loss": 0.0165, "step": 239700 }, { - "epoch": 1.21, - "learning_rate": 0.00011859483076115857, - "loss": 0.0111, + "epoch": 0.62, + "learning_rate": 0.0002067955653596211, + "loss": 0.0149, "step": 239710 }, { - "epoch": 1.21, - "learning_rate": 0.00011858726306814455, - "loss": 0.0119, + "epoch": 0.62, + "learning_rate": 0.00020679167714324963, + "loss": 0.0142, "step": 239720 }, { - "epoch": 1.21, - "learning_rate": 0.00011857969537513054, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.0002067877889268782, + "loss": 0.0146, "step": 239730 }, { - "epoch": 1.21, - "learning_rate": 0.00011857212768211652, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.0002067839007105067, + "loss": 0.0156, "step": 239740 }, { - "epoch": 1.21, - "learning_rate": 0.00011856455998910252, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020678001249413525, + "loss": 0.0186, "step": 239750 }, { - "epoch": 1.21, - "learning_rate": 0.0001185569922960885, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020677612427776377, + "loss": 0.0155, "step": 239760 }, { - "epoch": 1.21, - "learning_rate": 0.00011854942460307448, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020677223606139234, + "loss": 0.0148, "step": 239770 }, { - "epoch": 1.21, - "learning_rate": 0.00011854185691006048, - "loss": 0.0062, + "epoch": 0.62, + "learning_rate": 0.00020676834784502088, + "loss": 0.0152, "step": 239780 }, { - "epoch": 1.21, - "learning_rate": 0.00011853428921704646, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.0002067644596286494, + "loss": 0.0158, "step": 239790 }, { - "epoch": 1.21, - "learning_rate": 0.00011852672152403245, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020676057141227793, + "loss": 0.0197, "step": 239800 }, { - "epoch": 1.21, - "learning_rate": 0.00011851915383101845, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020675668319590647, + "loss": 0.0191, "step": 239810 }, { - "epoch": 1.21, - "learning_rate": 0.00011851158613800443, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020675279497953502, + "loss": 0.0168, "step": 239820 }, { - "epoch": 1.21, - "learning_rate": 0.00011850401844499042, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020674890676316353, + "loss": 0.0154, "step": 239830 }, { - "epoch": 1.21, - "learning_rate": 0.00011849645075197642, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020674501854679207, + "loss": 0.0127, "step": 239840 }, { - "epoch": 1.21, - "learning_rate": 0.0001184888830589624, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020674113033042061, + "loss": 0.0219, "step": 239850 }, { - "epoch": 1.21, - "learning_rate": 0.0001184813153659484, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020673724211404916, + "loss": 0.0139, "step": 239860 }, { - "epoch": 1.21, - "learning_rate": 0.00011847374767293438, - "loss": 0.0067, + "epoch": 0.62, + "learning_rate": 0.00020673335389767767, + "loss": 0.0151, "step": 239870 }, { - "epoch": 1.21, - "learning_rate": 0.00011846617997992037, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.0002067294656813062, + "loss": 0.0134, "step": 239880 }, { - "epoch": 1.21, - "learning_rate": 0.00011845861228690637, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.00020672557746493475, + "loss": 0.0188, "step": 239890 }, { - "epoch": 1.21, - "learning_rate": 0.00011845104459389235, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.0002067216892485633, + "loss": 0.0134, "step": 239900 }, { - "epoch": 1.21, - "learning_rate": 0.00011844347690087834, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.0002067178010321918, + "loss": 0.0166, "step": 239910 }, { - "epoch": 1.21, - "learning_rate": 0.00011843590920786434, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020671391281582035, + "loss": 0.0186, "step": 239920 }, { - "epoch": 1.21, - "learning_rate": 0.00011842834151485032, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020671002459944887, + "loss": 0.0171, "step": 239930 }, { - "epoch": 1.21, - "learning_rate": 0.00011842077382183631, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020670613638307743, + "loss": 0.0179, "step": 239940 }, { - "epoch": 1.21, - "learning_rate": 0.0001184132061288223, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020670224816670598, + "loss": 0.0135, "step": 239950 }, { - "epoch": 1.21, - "learning_rate": 0.00011840563843580829, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.0002066983599503345, + "loss": 0.0156, "step": 239960 }, { - "epoch": 1.21, - "learning_rate": 0.00011839807074279429, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.000206694471733963, + "loss": 0.0138, "step": 239970 }, { - "epoch": 1.21, - "learning_rate": 0.00011839050304978027, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020669058351759157, + "loss": 0.0134, "step": 239980 }, { - "epoch": 1.21, - "learning_rate": 0.00011838293535676626, - "loss": 0.0097, + "epoch": 0.62, + "learning_rate": 0.00020668669530122012, + "loss": 0.0257, "step": 239990 }, { - "epoch": 1.21, - "learning_rate": 0.00011837536766375226, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020668280708484863, + "loss": 0.0143, "step": 240000 }, { - "epoch": 1.21, - "eval_cer": 0.9144537591690304, - "eval_loss": 0.006650357041507959, - "eval_runtime": 116.0541, - "eval_samples_per_second": 17.233, - "eval_steps_per_second": 4.308, + "epoch": 0.62, + "eval_cer": 0.8817922630869552, + "eval_loss": 0.011038198135793209, + "eval_runtime": 107.238, + "eval_samples_per_second": 18.65, + "eval_steps_per_second": 4.663, "step": 240000 }, { - "epoch": 1.21, - "learning_rate": 0.00011836779997073824, - "loss": 0.0113, + "epoch": 0.62, + "learning_rate": 0.00020667891886847717, + "loss": 0.0135, "step": 240010 }, { - "epoch": 1.21, - "learning_rate": 0.00011836023227772423, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020667503065210571, + "loss": 0.0155, "step": 240020 }, { - "epoch": 1.21, - "learning_rate": 0.00011835266458471022, - "loss": 0.0129, + "epoch": 0.62, + "learning_rate": 0.00020667114243573426, + "loss": 0.0183, "step": 240030 }, { - "epoch": 1.21, - "learning_rate": 0.00011834509689169621, - "loss": 0.0065, + "epoch": 0.62, + "learning_rate": 0.00020666725421936277, + "loss": 0.0184, "step": 240040 }, { - "epoch": 1.21, - "learning_rate": 0.0001183375291986822, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.0002066633660029913, + "loss": 0.0147, "step": 240050 }, { - "epoch": 1.21, - "learning_rate": 0.00011832996150566819, - "loss": 0.0102, + "epoch": 0.62, + "learning_rate": 0.00020665947778661985, + "loss": 0.0173, "step": 240060 }, { - "epoch": 1.21, - "learning_rate": 0.00011832239381265418, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.0002066555895702484, + "loss": 0.0188, "step": 240070 }, { - "epoch": 1.21, - "learning_rate": 0.00011831482611964018, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.0002066517013538769, + "loss": 0.0161, "step": 240080 }, { - "epoch": 1.21, - "learning_rate": 0.00011830725842662616, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020664781313750545, + "loss": 0.017, "step": 240090 }, { - "epoch": 1.21, - "learning_rate": 0.00011829969073361215, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.00020664392492113402, + "loss": 0.0173, "step": 240100 }, { - "epoch": 1.21, - "learning_rate": 0.00011829212304059813, - "loss": 0.0067, + "epoch": 0.62, + "learning_rate": 0.00020664003670476253, + "loss": 0.0111, "step": 240110 }, { - "epoch": 1.21, - "learning_rate": 0.00011828455534758413, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020663614848839108, + "loss": 0.0131, "step": 240120 }, { - "epoch": 1.21, - "learning_rate": 0.00011827698765457012, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002066322602720196, + "loss": 0.0159, "step": 240130 }, { - "epoch": 1.21, - "learning_rate": 0.0001182694199615561, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020662837205564816, + "loss": 0.0142, "step": 240140 }, { - "epoch": 1.21, - "learning_rate": 0.0001182618522685421, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020662448383927667, + "loss": 0.0157, "step": 240150 }, { - "epoch": 1.21, - "learning_rate": 0.0001182542845755281, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020662059562290522, + "loss": 0.0148, "step": 240160 }, { - "epoch": 1.21, - "learning_rate": 0.00011824671688251408, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020661670740653373, + "loss": 0.0166, "step": 240170 }, { - "epoch": 1.21, - "learning_rate": 0.00011823914918950007, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020661281919016227, + "loss": 0.016, "step": 240180 }, { - "epoch": 1.21, - "learning_rate": 0.00011823158149648605, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.0002066089309737908, + "loss": 0.0165, "step": 240190 }, { - "epoch": 1.21, - "learning_rate": 0.00011822401380347205, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020660504275741935, + "loss": 0.0119, "step": 240200 }, { - "epoch": 1.21, - "learning_rate": 0.00011821644611045804, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020660115454104787, + "loss": 0.0158, "step": 240210 }, { - "epoch": 1.21, - "learning_rate": 0.00011820887841744403, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.0002065972663246764, + "loss": 0.015, "step": 240220 }, { - "epoch": 1.21, - "learning_rate": 0.00011820131072443002, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020659337810830495, + "loss": 0.0155, "step": 240230 }, { - "epoch": 1.21, - "learning_rate": 0.00011819374303141602, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.0002065894898919335, + "loss": 0.02, "step": 240240 }, { - "epoch": 1.21, - "learning_rate": 0.000118186175338402, - "loss": 0.0079, + "epoch": 0.62, + "learning_rate": 0.000206585601675562, + "loss": 0.0176, "step": 240250 }, { - "epoch": 1.21, - "learning_rate": 0.00011817860764538799, - "loss": 0.0118, + "epoch": 0.62, + "learning_rate": 0.00020658171345919055, + "loss": 0.0152, "step": 240260 }, { - "epoch": 1.21, - "learning_rate": 0.00011817103995237399, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020657782524281912, + "loss": 0.0154, "step": 240270 }, { - "epoch": 1.21, - "learning_rate": 0.00011816347225935997, - "loss": 0.0072, + "epoch": 0.62, + "learning_rate": 0.00020657393702644763, + "loss": 0.0199, "step": 240280 }, { - "epoch": 1.21, - "learning_rate": 0.00011815590456634596, - "loss": 0.0075, + "epoch": 0.62, + "learning_rate": 0.00020657004881007615, + "loss": 0.0153, "step": 240290 }, { - "epoch": 1.21, - "learning_rate": 0.00011814833687333194, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002065661605937047, + "loss": 0.0146, "step": 240300 }, { - "epoch": 1.21, - "learning_rate": 0.00011814076918031794, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.00020656227237733326, + "loss": 0.0175, "step": 240310 }, { - "epoch": 1.21, - "learning_rate": 0.00011813320148730393, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020655838416096177, + "loss": 0.0146, "step": 240320 }, { - "epoch": 1.21, - "learning_rate": 0.00011812563379428992, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.00020655449594459031, + "loss": 0.0195, "step": 240330 }, { - "epoch": 1.21, - "learning_rate": 0.00011811806610127591, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020655060772821883, + "loss": 0.0152, "step": 240340 }, { - "epoch": 1.21, - "learning_rate": 0.0001181104984082619, - "loss": 0.0072, + "epoch": 0.62, + "learning_rate": 0.0002065467195118474, + "loss": 0.0177, "step": 240350 }, { - "epoch": 1.21, - "learning_rate": 0.00011810293071524789, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.0002065428312954759, + "loss": 0.0174, "step": 240360 }, { - "epoch": 1.21, - "learning_rate": 0.00011809536302223388, - "loss": 0.0111, + "epoch": 0.62, + "learning_rate": 0.00020653894307910445, + "loss": 0.0143, "step": 240370 }, { - "epoch": 1.21, - "learning_rate": 0.00011808779532921985, - "loss": 0.0085, + "epoch": 0.62, + "learning_rate": 0.00020653505486273297, + "loss": 0.0142, "step": 240380 }, { - "epoch": 1.21, - "learning_rate": 0.00011808022763620585, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.00020653116664636154, + "loss": 0.0143, "step": 240390 }, { - "epoch": 1.21, - "learning_rate": 0.00011807265994319183, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.00020652727842999005, + "loss": 0.0176, "step": 240400 }, { - "epoch": 1.21, - "learning_rate": 0.00011806509225017782, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.0002065233902136186, + "loss": 0.0199, "step": 240410 }, { - "epoch": 1.21, - "learning_rate": 0.00011805752455716382, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.0002065195019972471, + "loss": 0.0164, "step": 240420 }, { - "epoch": 1.21, - "learning_rate": 0.0001180499568641498, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020651561378087565, + "loss": 0.0173, "step": 240430 }, { - "epoch": 1.21, - "learning_rate": 0.0001180423891711358, - "loss": 0.0111, + "epoch": 0.62, + "learning_rate": 0.0002065117255645042, + "loss": 0.0169, "step": 240440 }, { - "epoch": 1.21, - "learning_rate": 0.00011803482147812179, - "loss": 0.0108, + "epoch": 0.62, + "learning_rate": 0.00020650783734813273, + "loss": 0.0159, "step": 240450 }, { - "epoch": 1.21, - "learning_rate": 0.00011802725378510777, - "loss": 0.0064, + "epoch": 0.62, + "learning_rate": 0.00020650394913176125, + "loss": 0.0192, "step": 240460 }, { - "epoch": 1.21, - "learning_rate": 0.00011801968609209376, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.0002065000609153898, + "loss": 0.0149, "step": 240470 }, { - "epoch": 1.21, - "learning_rate": 0.00011801211839907975, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020649617269901836, + "loss": 0.0154, "step": 240480 }, { - "epoch": 1.21, - "learning_rate": 0.00011800455070606574, - "loss": 0.0115, + "epoch": 0.62, + "learning_rate": 0.00020649228448264687, + "loss": 0.0163, "step": 240490 }, { - "epoch": 1.21, - "learning_rate": 0.00011799698301305174, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020648839626627541, + "loss": 0.0141, "step": 240500 }, { - "epoch": 1.21, - "learning_rate": 0.00011798941532003772, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020648450804990393, + "loss": 0.0234, "step": 240510 }, { - "epoch": 1.21, - "learning_rate": 0.00011798184762702371, - "loss": 0.0067, + "epoch": 0.62, + "learning_rate": 0.0002064806198335325, + "loss": 0.0148, "step": 240520 }, { - "epoch": 1.21, - "learning_rate": 0.00011797427993400971, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.000206476731617161, + "loss": 0.0214, "step": 240530 }, { - "epoch": 1.21, - "learning_rate": 0.00011796671224099569, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020647284340078955, + "loss": 0.0149, "step": 240540 }, { - "epoch": 1.21, - "learning_rate": 0.00011795914454798168, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020646895518441807, + "loss": 0.0157, "step": 240550 }, { - "epoch": 1.21, - "learning_rate": 0.00011795157685496767, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020646506696804664, + "loss": 0.0153, "step": 240560 }, { - "epoch": 1.21, - "learning_rate": 0.00011794400916195366, - "loss": 0.0073, + "epoch": 0.62, + "learning_rate": 0.00020646117875167515, + "loss": 0.0168, "step": 240570 }, { - "epoch": 1.21, - "learning_rate": 0.00011793644146893966, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.0002064572905353037, + "loss": 0.0155, "step": 240580 }, { - "epoch": 1.21, - "learning_rate": 0.00011792887377592564, - "loss": 0.0071, + "epoch": 0.62, + "learning_rate": 0.0002064534023189322, + "loss": 0.0117, "step": 240590 }, { - "epoch": 1.21, - "learning_rate": 0.00011792130608291163, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.00020644951410256078, + "loss": 0.014, "step": 240600 }, { - "epoch": 1.21, - "learning_rate": 0.00011791373838989763, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.0002064456258861893, + "loss": 0.0156, "step": 240610 }, { - "epoch": 1.21, - "learning_rate": 0.00011790617069688361, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020644173766981783, + "loss": 0.0146, "step": 240620 }, { - "epoch": 1.21, - "learning_rate": 0.0001178986030038696, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020643784945344635, + "loss": 0.0133, "step": 240630 }, { - "epoch": 1.21, - "learning_rate": 0.00011789103531085559, - "loss": 0.0082, + "epoch": 0.62, + "learning_rate": 0.00020643396123707492, + "loss": 0.0129, "step": 240640 }, { - "epoch": 1.21, - "learning_rate": 0.00011788346761784158, - "loss": 0.0143, + "epoch": 0.62, + "learning_rate": 0.00020643007302070346, + "loss": 0.0157, "step": 240650 }, { - "epoch": 1.21, - "learning_rate": 0.00011787589992482758, - "loss": 0.0065, + "epoch": 0.62, + "learning_rate": 0.00020642618480433197, + "loss": 0.0161, "step": 240660 }, { - "epoch": 1.21, - "learning_rate": 0.00011786833223181356, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.0002064222965879605, + "loss": 0.0185, "step": 240670 }, { - "epoch": 1.21, - "learning_rate": 0.00011786076453879955, - "loss": 0.0077, + "epoch": 0.62, + "learning_rate": 0.00020641840837158903, + "loss": 0.0147, "step": 240680 }, { - "epoch": 1.21, - "learning_rate": 0.00011785319684578555, - "loss": 0.0119, + "epoch": 0.62, + "learning_rate": 0.0002064145201552176, + "loss": 0.0129, "step": 240690 }, { - "epoch": 1.21, - "learning_rate": 0.00011784562915277153, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002064106319388461, + "loss": 0.0129, "step": 240700 }, { - "epoch": 1.21, - "learning_rate": 0.00011783806145975752, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020640674372247465, + "loss": 0.0162, "step": 240710 }, { - "epoch": 1.21, - "learning_rate": 0.00011783049376674352, - "loss": 0.0078, + "epoch": 0.62, + "learning_rate": 0.00020640285550610317, + "loss": 0.0175, "step": 240720 }, { - "epoch": 1.21, - "learning_rate": 0.0001178229260737295, - "loss": 0.0086, + "epoch": 0.62, + "learning_rate": 0.00020639896728973174, + "loss": 0.0162, "step": 240730 }, { - "epoch": 1.21, - "learning_rate": 0.0001178153583807155, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020639507907336025, + "loss": 0.0172, "step": 240740 }, { - "epoch": 1.21, - "learning_rate": 0.00011780779068770148, - "loss": 0.0095, + "epoch": 0.62, + "learning_rate": 0.0002063911908569888, + "loss": 0.0194, "step": 240750 }, { - "epoch": 1.21, - "learning_rate": 0.00011780022299468747, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.0002063873026406173, + "loss": 0.015, "step": 240760 }, { - "epoch": 1.21, - "learning_rate": 0.00011779265530167347, - "loss": 0.0088, + "epoch": 0.62, + "learning_rate": 0.00020638341442424588, + "loss": 0.0179, "step": 240770 }, { - "epoch": 1.21, - "learning_rate": 0.00011778508760865945, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002063795262078744, + "loss": 0.0183, "step": 240780 }, { - "epoch": 1.21, - "learning_rate": 0.00011777751991564544, - "loss": 0.0105, + "epoch": 0.62, + "learning_rate": 0.00020637563799150293, + "loss": 0.0159, "step": 240790 }, { - "epoch": 1.21, - "learning_rate": 0.00011776995222263144, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020637174977513145, + "loss": 0.0176, "step": 240800 }, { - "epoch": 1.21, - "learning_rate": 0.00011776238452961742, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020636786155876002, + "loss": 0.0145, "step": 240810 }, { - "epoch": 1.21, - "learning_rate": 0.00011775481683660341, - "loss": 0.0067, + "epoch": 0.62, + "learning_rate": 0.00020636397334238856, + "loss": 0.0115, "step": 240820 }, { - "epoch": 1.22, - "learning_rate": 0.0001177472491435894, - "loss": 0.0084, + "epoch": 0.62, + "learning_rate": 0.00020636008512601707, + "loss": 0.0157, "step": 240830 }, { - "epoch": 1.22, - "learning_rate": 0.00011773968145057539, - "loss": 0.0106, + "epoch": 0.62, + "learning_rate": 0.00020635619690964559, + "loss": 0.0163, "step": 240840 }, { - "epoch": 1.22, - "learning_rate": 0.00011773211375756139, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020635230869327415, + "loss": 0.0117, "step": 240850 }, { - "epoch": 1.22, - "learning_rate": 0.00011772454606454737, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.0002063484204769027, + "loss": 0.0129, "step": 240860 }, { - "epoch": 1.22, - "learning_rate": 0.00011771697837153336, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002063445322605312, + "loss": 0.0224, "step": 240870 }, { - "epoch": 1.22, - "learning_rate": 0.00011770941067851936, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020634064404415975, + "loss": 0.0163, "step": 240880 }, { - "epoch": 1.22, - "learning_rate": 0.00011770184298550534, - "loss": 0.0093, + "epoch": 0.62, + "learning_rate": 0.0002063367558277883, + "loss": 0.0175, "step": 240890 }, { - "epoch": 1.22, - "learning_rate": 0.00011769427529249133, - "loss": 0.0081, + "epoch": 0.62, + "learning_rate": 0.00020633286761141684, + "loss": 0.018, "step": 240900 }, { - "epoch": 1.22, - "learning_rate": 0.00011768670759947731, - "loss": 0.0071, + "epoch": 0.62, + "learning_rate": 0.00020632897939504535, + "loss": 0.0153, "step": 240910 }, { - "epoch": 1.22, - "learning_rate": 0.00011767913990646331, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.0002063250911786739, + "loss": 0.0154, "step": 240920 }, { - "epoch": 1.22, - "learning_rate": 0.0001176715722134493, - "loss": 0.0152, + "epoch": 0.62, + "learning_rate": 0.0002063212029623024, + "loss": 0.0161, "step": 240930 }, { - "epoch": 1.22, - "learning_rate": 0.00011766400452043529, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020631731474593098, + "loss": 0.0188, "step": 240940 }, { - "epoch": 1.22, - "learning_rate": 0.00011765643682742128, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.0002063134265295595, + "loss": 0.0177, "step": 240950 }, { - "epoch": 1.22, - "learning_rate": 0.00011764886913440728, - "loss": 0.0083, + "epoch": 0.62, + "learning_rate": 0.00020630953831318803, + "loss": 0.013, "step": 240960 }, { - "epoch": 1.22, - "learning_rate": 0.00011764130144139326, - "loss": 0.0104, + "epoch": 0.62, + "learning_rate": 0.00020630565009681655, + "loss": 0.0143, "step": 240970 }, { - "epoch": 1.22, - "learning_rate": 0.00011763373374837925, - "loss": 0.01, + "epoch": 0.62, + "learning_rate": 0.00020630176188044511, + "loss": 0.0178, "step": 240980 }, { - "epoch": 1.22, - "learning_rate": 0.00011762616605536523, - "loss": 0.0068, + "epoch": 0.62, + "learning_rate": 0.00020629787366407366, + "loss": 0.0134, "step": 240990 }, { - "epoch": 1.22, - "learning_rate": 0.00011761859836235123, - "loss": 0.0096, + "epoch": 0.62, + "learning_rate": 0.00020629398544770217, + "loss": 0.0174, "step": 241000 }, { - "epoch": 1.22, - "eval_cer": 0.9144644335264098, - "eval_loss": 0.00682118721306324, - "eval_runtime": 115.8371, - "eval_samples_per_second": 17.266, - "eval_steps_per_second": 4.316, + "epoch": 0.62, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.011126725003123283, + "eval_runtime": 107.3943, + "eval_samples_per_second": 18.623, + "eval_steps_per_second": 4.656, "step": 241000 }, { - "epoch": 1.22, - "learning_rate": 0.0001176110306693372, - "loss": 0.009, + "epoch": 0.62, + "learning_rate": 0.00020629009723133069, + "loss": 0.0134, "step": 241010 }, { - "epoch": 1.22, - "learning_rate": 0.00011760346297632319, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020628620901495925, + "loss": 0.0136, "step": 241020 }, { - "epoch": 1.22, - "learning_rate": 0.00011759589528330919, - "loss": 0.0101, + "epoch": 0.62, + "learning_rate": 0.0002062823207985878, + "loss": 0.0128, "step": 241030 }, { - "epoch": 1.22, - "learning_rate": 0.00011758832759029517, - "loss": 0.008, + "epoch": 0.62, + "learning_rate": 0.0002062784325822163, + "loss": 0.0169, "step": 241040 }, { - "epoch": 1.22, - "learning_rate": 0.00011758075989728116, - "loss": 0.0074, + "epoch": 0.62, + "learning_rate": 0.00020627454436584485, + "loss": 0.0188, "step": 241050 }, { - "epoch": 1.22, - "learning_rate": 0.00011757319220426716, - "loss": 0.0099, + "epoch": 0.62, + "learning_rate": 0.0002062706561494734, + "loss": 0.0141, "step": 241060 }, { - "epoch": 1.22, - "learning_rate": 0.00011756562451125314, - "loss": 0.0094, + "epoch": 0.62, + "learning_rate": 0.00020626676793310194, + "loss": 0.0154, "step": 241070 }, { - "epoch": 1.22, - "learning_rate": 0.00011755805681823913, - "loss": 0.0089, + "epoch": 0.62, + "learning_rate": 0.00020626287971673045, + "loss": 0.0203, "step": 241080 }, { - "epoch": 1.22, - "learning_rate": 0.00011755048912522512, - "loss": 0.0091, + "epoch": 0.62, + "learning_rate": 0.000206258991500359, + "loss": 0.016, "step": 241090 }, { - "epoch": 1.22, - "learning_rate": 0.00011754292143221111, - "loss": 0.0092, + "epoch": 0.62, + "learning_rate": 0.00020625510328398753, + "loss": 0.0196, "step": 241100 }, { - "epoch": 1.22, - "learning_rate": 0.0001175353537391971, - "loss": 0.0076, + "epoch": 0.62, + "learning_rate": 0.00020625121506761607, + "loss": 0.0176, "step": 241110 }, { - "epoch": 1.22, - "learning_rate": 0.00011752778604618309, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.0002062473268512446, + "loss": 0.0185, "step": 241120 }, { - "epoch": 1.22, - "learning_rate": 0.00011752021835316908, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020624343863487313, + "loss": 0.018, "step": 241130 }, { - "epoch": 1.22, - "learning_rate": 0.00011751265066015508, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002062395504185017, + "loss": 0.0121, "step": 241140 }, { - "epoch": 1.22, - "learning_rate": 0.00011750508296714106, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020623566220213021, + "loss": 0.026, "step": 241150 }, { - "epoch": 1.22, - "learning_rate": 0.00011749751527412705, - "loss": 0.0109, + "epoch": 0.63, + "learning_rate": 0.00020623177398575873, + "loss": 0.0126, "step": 241160 }, { - "epoch": 1.22, - "learning_rate": 0.00011748994758111305, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.00020622788576938727, + "loss": 0.014, "step": 241170 }, { - "epoch": 1.22, - "learning_rate": 0.00011748237988809903, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020622399755301578, + "loss": 0.0172, "step": 241180 }, { - "epoch": 1.22, - "learning_rate": 0.00011747481219508503, - "loss": 0.012, + "epoch": 0.63, + "learning_rate": 0.00020622010933664435, + "loss": 0.0178, "step": 241190 }, { - "epoch": 1.22, - "learning_rate": 0.000117467244502071, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002062162211202729, + "loss": 0.0151, "step": 241200 }, { - "epoch": 1.22, - "learning_rate": 0.000117459676809057, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.0002062123329039014, + "loss": 0.0196, "step": 241210 }, { - "epoch": 1.22, - "learning_rate": 0.000117452109116043, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020620844468752995, + "loss": 0.0151, "step": 241220 }, { - "epoch": 1.22, - "learning_rate": 0.00011744454142302898, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002062045564711585, + "loss": 0.0195, "step": 241230 }, { - "epoch": 1.22, - "learning_rate": 0.00011743697373001497, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020620066825478703, + "loss": 0.0163, "step": 241240 }, { - "epoch": 1.22, - "learning_rate": 0.00011742940603700097, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020619678003841555, + "loss": 0.0163, "step": 241250 }, { - "epoch": 1.22, - "learning_rate": 0.00011742183834398695, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.0002061928918220441, + "loss": 0.016, "step": 241260 }, { - "epoch": 1.22, - "learning_rate": 0.00011741427065097294, - "loss": 0.0064, + "epoch": 0.63, + "learning_rate": 0.00020618900360567263, + "loss": 0.0164, "step": 241270 }, { - "epoch": 1.22, - "learning_rate": 0.00011740670295795893, - "loss": 0.0112, + "epoch": 0.63, + "learning_rate": 0.00020618511538930117, + "loss": 0.0124, "step": 241280 }, { - "epoch": 1.22, - "learning_rate": 0.00011739913526494492, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.0002061812271729297, + "loss": 0.0178, "step": 241290 }, { - "epoch": 1.22, - "learning_rate": 0.00011739156757193092, - "loss": 0.0069, + "epoch": 0.63, + "learning_rate": 0.00020617733895655823, + "loss": 0.0176, "step": 241300 }, { - "epoch": 1.22, - "learning_rate": 0.0001173839998789169, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020617345074018677, + "loss": 0.0151, "step": 241310 }, { - "epoch": 1.22, - "learning_rate": 0.00011737643218590289, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.0002061695625238153, + "loss": 0.0168, "step": 241320 }, { - "epoch": 1.22, - "learning_rate": 0.00011736886449288889, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020616567430744383, + "loss": 0.0135, "step": 241330 }, { - "epoch": 1.22, - "learning_rate": 0.00011736129679987487, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020616178609107237, + "loss": 0.019, "step": 241340 }, { - "epoch": 1.22, - "learning_rate": 0.00011735372910686086, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020615789787470094, + "loss": 0.0141, "step": 241350 }, { - "epoch": 1.22, - "learning_rate": 0.00011734616141384685, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020615400965832945, + "loss": 0.0167, "step": 241360 }, { - "epoch": 1.22, - "learning_rate": 0.00011733859372083284, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.000206150121441958, + "loss": 0.0167, "step": 241370 }, { - "epoch": 1.22, - "learning_rate": 0.00011733102602781884, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.0002061462332255865, + "loss": 0.016, "step": 241380 }, { - "epoch": 1.22, - "learning_rate": 0.00011732345833480482, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020614234500921508, + "loss": 0.0141, "step": 241390 }, { - "epoch": 1.22, - "learning_rate": 0.00011731589064179081, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002061384567928436, + "loss": 0.0223, "step": 241400 }, { - "epoch": 1.22, - "learning_rate": 0.0001173083229487768, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020613456857647213, + "loss": 0.014, "step": 241410 }, { - "epoch": 1.22, - "learning_rate": 0.00011730075525576279, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020613068036010065, + "loss": 0.0135, "step": 241420 }, { - "epoch": 1.22, - "learning_rate": 0.00011729318756274878, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.0002061267921437292, + "loss": 0.0158, "step": 241430 }, { - "epoch": 1.22, - "learning_rate": 0.00011728561986973476, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020612290392735773, + "loss": 0.0163, "step": 241440 }, { - "epoch": 1.22, - "learning_rate": 0.00011727805217672076, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020611901571098627, + "loss": 0.0213, "step": 241450 }, { - "epoch": 1.22, - "learning_rate": 0.00011727048448370675, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002061151274946148, + "loss": 0.0159, "step": 241460 }, { - "epoch": 1.22, - "learning_rate": 0.00011726291679069274, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020611123927824333, + "loss": 0.0146, "step": 241470 }, { - "epoch": 1.22, - "learning_rate": 0.00011725534909767873, - "loss": 0.0072, - "step": 241480 + "epoch": 0.63, + "learning_rate": 0.00020610735106187187, + "loss": 0.0205, + "step": 241480 }, { - "epoch": 1.22, - "learning_rate": 0.00011724778140466473, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.0002061034628455004, + "loss": 0.0115, "step": 241490 }, { - "epoch": 1.22, - "learning_rate": 0.00011724021371165071, - "loss": 0.0069, + "epoch": 0.63, + "learning_rate": 0.00020609957462912893, + "loss": 0.0131, "step": 241500 }, { - "epoch": 1.22, - "learning_rate": 0.0001172326460186367, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020609568641275747, + "loss": 0.0151, "step": 241510 }, { - "epoch": 1.22, - "learning_rate": 0.00011722507832562268, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020609179819638604, + "loss": 0.017, "step": 241520 }, { - "epoch": 1.22, - "learning_rate": 0.00011721751063260868, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020608790998001455, + "loss": 0.0163, "step": 241530 }, { - "epoch": 1.22, - "learning_rate": 0.00011720994293959467, - "loss": 0.0061, + "epoch": 0.63, + "learning_rate": 0.0002060840217636431, + "loss": 0.0137, "step": 241540 }, { - "epoch": 1.22, - "learning_rate": 0.00011720237524658066, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002060801335472716, + "loss": 0.0183, "step": 241550 }, { - "epoch": 1.22, - "learning_rate": 0.00011719480755356665, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020607624533090018, + "loss": 0.0152, "step": 241560 }, { - "epoch": 1.22, - "learning_rate": 0.00011718723986055265, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.0002060723571145287, + "loss": 0.0157, "step": 241570 }, { - "epoch": 1.22, - "learning_rate": 0.00011717967216753863, - "loss": 0.0063, + "epoch": 0.63, + "learning_rate": 0.00020606846889815723, + "loss": 0.0126, "step": 241580 }, { - "epoch": 1.22, - "learning_rate": 0.00011717210447452462, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020606458068178575, + "loss": 0.0203, "step": 241590 }, { - "epoch": 1.22, - "learning_rate": 0.0001171645367815106, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020606069246541432, + "loss": 0.0163, "step": 241600 }, { - "epoch": 1.22, - "learning_rate": 0.0001171569690884966, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020605680424904283, + "loss": 0.0146, "step": 241610 }, { - "epoch": 1.22, - "learning_rate": 0.00011714940139548259, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.00020605291603267137, + "loss": 0.019, "step": 241620 }, { - "epoch": 1.22, - "learning_rate": 0.00011714183370246857, - "loss": 0.0139, + "epoch": 0.63, + "learning_rate": 0.0002060490278162999, + "loss": 0.0192, "step": 241630 }, { - "epoch": 1.22, - "learning_rate": 0.00011713426600945456, - "loss": 0.0063, + "epoch": 0.63, + "learning_rate": 0.00020604513959992846, + "loss": 0.0182, "step": 241640 }, { - "epoch": 1.22, - "learning_rate": 0.00011712669831644054, - "loss": 0.0064, + "epoch": 0.63, + "learning_rate": 0.00020604125138355697, + "loss": 0.0146, "step": 241650 }, { - "epoch": 1.22, - "learning_rate": 0.00011711913062342653, - "loss": 0.0109, + "epoch": 0.63, + "learning_rate": 0.0002060373631671855, + "loss": 0.0196, "step": 241660 }, { - "epoch": 1.22, - "learning_rate": 0.00011711156293041253, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020603347495081403, + "loss": 0.0129, "step": 241670 }, { - "epoch": 1.22, - "learning_rate": 0.00011710399523739851, - "loss": 0.0121, + "epoch": 0.63, + "learning_rate": 0.00020602958673444257, + "loss": 0.0174, "step": 241680 }, { - "epoch": 1.22, - "learning_rate": 0.0001170964275443845, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020602569851807114, + "loss": 0.0175, "step": 241690 }, { - "epoch": 1.22, - "learning_rate": 0.0001170888598513705, - "loss": 0.0068, + "epoch": 0.63, + "learning_rate": 0.00020602181030169965, + "loss": 0.015, "step": 241700 }, { - "epoch": 1.22, - "learning_rate": 0.00011708129215835648, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002060179220853282, + "loss": 0.0128, "step": 241710 }, { - "epoch": 1.22, - "learning_rate": 0.00011707372446534248, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.0002060140338689567, + "loss": 0.0153, "step": 241720 }, { - "epoch": 1.22, - "learning_rate": 0.00011706615677232846, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020601014565258528, + "loss": 0.0178, "step": 241730 }, { - "epoch": 1.22, - "learning_rate": 0.00011705858907931445, - "loss": 0.0067, + "epoch": 0.63, + "learning_rate": 0.0002060062574362138, + "loss": 0.0243, "step": 241740 }, { - "epoch": 1.22, - "learning_rate": 0.00011705102138630045, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020600236921984233, + "loss": 0.0232, "step": 241750 }, { - "epoch": 1.22, - "learning_rate": 0.00011704345369328643, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020599848100347085, + "loss": 0.0209, "step": 241760 }, { - "epoch": 1.22, - "learning_rate": 0.00011703588600027242, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020599459278709942, + "loss": 0.0178, "step": 241770 }, { - "epoch": 1.22, - "learning_rate": 0.00011702831830725842, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020599070457072793, + "loss": 0.0201, "step": 241780 }, { - "epoch": 1.22, - "learning_rate": 0.0001170207506142444, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020598681635435647, + "loss": 0.0181, "step": 241790 }, { - "epoch": 1.22, - "learning_rate": 0.0001170131829212304, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.000205982928137985, + "loss": 0.0158, "step": 241800 }, { - "epoch": 1.22, - "learning_rate": 0.00011700561522821638, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020597903992161356, + "loss": 0.0188, "step": 241810 }, { - "epoch": 1.22, - "learning_rate": 0.00011699804753520237, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020597515170524207, + "loss": 0.0163, "step": 241820 }, { - "epoch": 1.22, - "learning_rate": 0.00011699047984218837, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002059712634888706, + "loss": 0.0154, "step": 241830 }, { - "epoch": 1.22, - "learning_rate": 0.00011698291214917435, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020596737527249913, + "loss": 0.0144, "step": 241840 }, { - "epoch": 1.22, - "learning_rate": 0.00011697534445616034, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.0002059634870561277, + "loss": 0.0169, "step": 241850 }, { - "epoch": 1.22, - "learning_rate": 0.00011696777676314634, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020595959883975624, + "loss": 0.0137, "step": 241860 }, { - "epoch": 1.22, - "learning_rate": 0.00011696020907013232, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020595571062338475, + "loss": 0.0121, "step": 241870 }, { - "epoch": 1.22, - "learning_rate": 0.00011695264137711831, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020595182240701327, + "loss": 0.018, "step": 241880 }, { - "epoch": 1.22, - "learning_rate": 0.0001169450736841043, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020594793419064183, + "loss": 0.0164, "step": 241890 }, { - "epoch": 1.22, - "learning_rate": 0.00011693750599109029, - "loss": 0.0063, + "epoch": 0.63, + "learning_rate": 0.00020594404597427038, + "loss": 0.0181, "step": 241900 }, { - "epoch": 1.22, - "learning_rate": 0.00011692993829807629, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002059401577578989, + "loss": 0.0195, "step": 241910 }, { - "epoch": 1.22, - "learning_rate": 0.00011692237060506227, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020593626954152743, + "loss": 0.0182, "step": 241920 }, { - "epoch": 1.22, - "learning_rate": 0.00011691480291204826, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020593238132515595, + "loss": 0.0152, "step": 241930 }, { - "epoch": 1.22, - "learning_rate": 0.00011690723521903426, - "loss": 0.0111, + "epoch": 0.63, + "learning_rate": 0.00020592849310878452, + "loss": 0.0173, "step": 241940 }, { - "epoch": 1.22, - "learning_rate": 0.00011689966752602024, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020592460489241303, + "loss": 0.0198, "step": 241950 }, { - "epoch": 1.22, - "learning_rate": 0.00011689209983300623, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020592071667604157, + "loss": 0.0147, "step": 241960 }, { - "epoch": 1.22, - "learning_rate": 0.00011688453213999221, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020591682845967009, + "loss": 0.0147, "step": 241970 }, { - "epoch": 1.22, - "learning_rate": 0.00011687696444697821, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.00020591294024329865, + "loss": 0.0153, "step": 241980 }, { - "epoch": 1.22, - "learning_rate": 0.0001168693967539642, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020590905202692717, + "loss": 0.0152, "step": 241990 }, { - "epoch": 1.22, - "learning_rate": 0.00011686182906095019, - "loss": 0.0066, + "epoch": 0.63, + "learning_rate": 0.0002059051638105557, + "loss": 0.0165, "step": 242000 }, { - "epoch": 1.22, - "eval_cer": 0.914452788772905, - "eval_loss": 0.006828702986240387, - "eval_runtime": 115.9715, - "eval_samples_per_second": 17.246, - "eval_steps_per_second": 4.311, + "epoch": 0.63, + "eval_cer": 0.8818272540103097, + "eval_loss": 0.0112527534365654, + "eval_runtime": 107.4809, + "eval_samples_per_second": 18.608, + "eval_steps_per_second": 4.652, "step": 242000 }, { - "epoch": 1.22, - "learning_rate": 0.00011685426136793618, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020590127559418423, + "loss": 0.0226, "step": 242010 }, { - "epoch": 1.22, - "learning_rate": 0.00011684669367492218, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.0002058973873778128, + "loss": 0.0165, "step": 242020 }, { - "epoch": 1.22, - "learning_rate": 0.00011683912598190816, - "loss": 0.0118, + "epoch": 0.63, + "learning_rate": 0.0002058934991614413, + "loss": 0.0154, "step": 242030 }, { - "epoch": 1.22, - "learning_rate": 0.00011683155828889415, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020588961094506985, + "loss": 0.0167, "step": 242040 }, { - "epoch": 1.22, - "learning_rate": 0.00011682399059588013, - "loss": 0.0069, + "epoch": 0.63, + "learning_rate": 0.00020588572272869837, + "loss": 0.0152, "step": 242050 }, { - "epoch": 1.22, - "learning_rate": 0.00011681642290286613, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020588183451232693, + "loss": 0.0181, "step": 242060 }, { - "epoch": 1.22, - "learning_rate": 0.00011680885520985212, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020587794629595548, + "loss": 0.0157, "step": 242070 }, { - "epoch": 1.22, - "learning_rate": 0.0001168012875168381, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.000205874058079584, + "loss": 0.0145, "step": 242080 }, { - "epoch": 1.22, - "learning_rate": 0.0001167937198238241, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020587016986321253, + "loss": 0.0125, "step": 242090 }, { - "epoch": 1.22, - "learning_rate": 0.0001167861521308101, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020586628164684107, + "loss": 0.0173, "step": 242100 }, { - "epoch": 1.22, - "learning_rate": 0.00011677858443779608, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020586239343046961, + "loss": 0.0182, "step": 242110 }, { - "epoch": 1.22, - "learning_rate": 0.00011677101674478207, - "loss": 0.0062, + "epoch": 0.63, + "learning_rate": 0.00020585850521409813, + "loss": 0.0125, "step": 242120 }, { - "epoch": 1.22, - "learning_rate": 0.00011676344905176805, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020585461699772667, + "loss": 0.0155, "step": 242130 }, { - "epoch": 1.22, - "learning_rate": 0.00011675588135875405, - "loss": 0.0175, + "epoch": 0.63, + "learning_rate": 0.0002058507287813552, + "loss": 0.0209, "step": 242140 }, { - "epoch": 1.22, - "learning_rate": 0.00011674831366574004, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020584684056498375, + "loss": 0.015, "step": 242150 }, { - "epoch": 1.22, - "learning_rate": 0.00011674074597272602, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.00020584295234861227, + "loss": 0.0167, "step": 242160 }, { - "epoch": 1.22, - "learning_rate": 0.00011673317827971202, - "loss": 0.0118, + "epoch": 0.63, + "learning_rate": 0.0002058390641322408, + "loss": 0.0138, "step": 242170 }, { - "epoch": 1.22, - "learning_rate": 0.00011672561058669801, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020583517591586933, + "loss": 0.0173, "step": 242180 }, { - "epoch": 1.22, - "learning_rate": 0.000116718042893684, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002058312876994979, + "loss": 0.0158, "step": 242190 }, { - "epoch": 1.22, - "learning_rate": 0.00011671047520066999, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002058273994831264, + "loss": 0.0178, "step": 242200 }, { - "epoch": 1.22, - "learning_rate": 0.00011670290750765599, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020582351126675495, + "loss": 0.0154, "step": 242210 }, { - "epoch": 1.22, - "learning_rate": 0.00011669533981464197, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.00020581962305038346, + "loss": 0.0185, "step": 242220 }, { - "epoch": 1.22, - "learning_rate": 0.00011668777212162796, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020581573483401203, + "loss": 0.0133, "step": 242230 }, { - "epoch": 1.22, - "learning_rate": 0.00011668020442861394, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020581184661764057, + "loss": 0.0146, "step": 242240 }, { - "epoch": 1.22, - "learning_rate": 0.00011667263673559994, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002058079584012691, + "loss": 0.0137, "step": 242250 }, { - "epoch": 1.22, - "learning_rate": 0.00011666506904258593, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020580407018489763, + "loss": 0.0206, "step": 242260 }, { - "epoch": 1.22, - "learning_rate": 0.0001166575013495719, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020580018196852617, + "loss": 0.0133, "step": 242270 }, { - "epoch": 1.22, - "learning_rate": 0.0001166499336565579, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020579629375215471, + "loss": 0.0139, "step": 242280 }, { - "epoch": 1.22, - "learning_rate": 0.00011664236596354388, - "loss": 0.0124, + "epoch": 0.63, + "learning_rate": 0.00020579240553578323, + "loss": 0.0128, "step": 242290 }, { - "epoch": 1.22, - "learning_rate": 0.00011663479827052987, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020578851731941177, + "loss": 0.0153, "step": 242300 }, { - "epoch": 1.22, - "learning_rate": 0.00011662723057751587, - "loss": 0.0122, + "epoch": 0.63, + "learning_rate": 0.0002057846291030403, + "loss": 0.013, "step": 242310 }, { - "epoch": 1.22, - "learning_rate": 0.00011661966288450185, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020578074088666885, + "loss": 0.0169, "step": 242320 }, { - "epoch": 1.22, - "learning_rate": 0.00011661209519148784, - "loss": 0.0117, + "epoch": 0.63, + "learning_rate": 0.00020577685267029737, + "loss": 0.0126, "step": 242330 }, { - "epoch": 1.22, - "learning_rate": 0.00011660452749847383, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002057729644539259, + "loss": 0.0138, "step": 242340 }, { - "epoch": 1.22, - "learning_rate": 0.00011659695980545982, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020576907623755445, + "loss": 0.018, "step": 242350 }, { - "epoch": 1.22, - "learning_rate": 0.00011658939211244582, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.000205765188021183, + "loss": 0.0191, "step": 242360 }, { - "epoch": 1.22, - "learning_rate": 0.0001165818244194318, - "loss": 0.012, + "epoch": 0.63, + "learning_rate": 0.0002057612998048115, + "loss": 0.015, "step": 242370 }, { - "epoch": 1.22, - "learning_rate": 0.00011657425672641779, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020575741158844005, + "loss": 0.0169, "step": 242380 }, { - "epoch": 1.22, - "learning_rate": 0.00011656668903340379, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020575352337206862, + "loss": 0.0169, "step": 242390 }, { - "epoch": 1.22, - "learning_rate": 0.00011655912134038977, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.00020574963515569713, + "loss": 0.0198, "step": 242400 }, { - "epoch": 1.22, - "learning_rate": 0.00011655155364737576, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.00020574574693932567, + "loss": 0.0141, "step": 242410 }, { - "epoch": 1.22, - "learning_rate": 0.00011654398595436175, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.0002057418587229542, + "loss": 0.0117, "step": 242420 }, { - "epoch": 1.22, - "learning_rate": 0.00011653641826134774, - "loss": 0.0113, + "epoch": 0.63, + "learning_rate": 0.0002057379705065827, + "loss": 0.0194, "step": 242430 }, { - "epoch": 1.22, - "learning_rate": 0.00011652885056833374, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020573408229021127, + "loss": 0.0165, "step": 242440 }, { - "epoch": 1.22, - "learning_rate": 0.00011652128287531972, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020573019407383981, + "loss": 0.017, "step": 242450 }, { - "epoch": 1.22, - "learning_rate": 0.00011651371518230571, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020572630585746833, + "loss": 0.0344, "step": 242460 }, { - "epoch": 1.22, - "learning_rate": 0.00011650614748929171, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020572241764109687, + "loss": 0.0155, "step": 242470 }, { - "epoch": 1.22, - "learning_rate": 0.00011649857979627769, - "loss": 0.011, + "epoch": 0.63, + "learning_rate": 0.0002057185294247254, + "loss": 0.0158, "step": 242480 }, { - "epoch": 1.22, - "learning_rate": 0.00011649101210326368, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020571464120835395, + "loss": 0.0152, "step": 242490 }, { - "epoch": 1.22, - "learning_rate": 0.00011648344441024966, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020571075299198247, + "loss": 0.0152, "step": 242500 }, { - "epoch": 1.22, - "learning_rate": 0.00011647587671723566, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.000205706864775611, + "loss": 0.0156, "step": 242510 }, { - "epoch": 1.22, - "learning_rate": 0.00011646830902422165, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020570297655923955, + "loss": 0.015, "step": 242520 }, { - "epoch": 1.22, - "learning_rate": 0.00011646074133120764, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.0002056990883428681, + "loss": 0.0155, "step": 242530 }, { - "epoch": 1.22, - "learning_rate": 0.00011645317363819363, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.0002056952001264966, + "loss": 0.014, "step": 242540 }, { - "epoch": 1.22, - "learning_rate": 0.00011644560594517963, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020569131191012515, + "loss": 0.0154, "step": 242550 }, { - "epoch": 1.22, - "learning_rate": 0.00011643803825216561, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020568742369375372, + "loss": 0.0168, "step": 242560 }, { - "epoch": 1.22, - "learning_rate": 0.0001164304705591516, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020568353547738223, + "loss": 0.0172, "step": 242570 }, { - "epoch": 1.22, - "learning_rate": 0.00011642290286613758, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020567964726101077, + "loss": 0.0166, "step": 242580 }, { - "epoch": 1.22, - "learning_rate": 0.00011641533517312358, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.0002056757590446393, + "loss": 0.0128, "step": 242590 }, { - "epoch": 1.22, - "learning_rate": 0.00011640776748010957, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020567187082826786, + "loss": 0.0132, "step": 242600 }, { - "epoch": 1.22, - "learning_rate": 0.00011640019978709556, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020566798261189637, + "loss": 0.0126, "step": 242610 }, { - "epoch": 1.22, - "learning_rate": 0.00011639263209408155, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002056640943955249, + "loss": 0.0199, "step": 242620 }, { - "epoch": 1.22, - "learning_rate": 0.00011638506440106755, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020566020617915343, + "loss": 0.0158, "step": 242630 }, { - "epoch": 1.22, - "learning_rate": 0.00011637749670805353, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.000205656317962782, + "loss": 0.0187, "step": 242640 }, { - "epoch": 1.22, - "learning_rate": 0.00011636992901503952, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.0002056524297464105, + "loss": 0.0183, "step": 242650 }, { - "epoch": 1.22, - "learning_rate": 0.00011636236132202552, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020564854153003905, + "loss": 0.0167, "step": 242660 }, { - "epoch": 1.22, - "learning_rate": 0.0001163547936290115, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020564465331366757, + "loss": 0.0189, "step": 242670 }, { - "epoch": 1.22, - "learning_rate": 0.0001163472259359975, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.0002056407650972961, + "loss": 0.0171, "step": 242680 }, { - "epoch": 1.22, - "learning_rate": 0.00011633965824298347, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020563687688092465, + "loss": 0.0163, "step": 242690 }, { - "epoch": 1.22, - "learning_rate": 0.00011633209054996947, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.0002056329886645532, + "loss": 0.0118, "step": 242700 }, { - "epoch": 1.22, - "learning_rate": 0.00011632452285695546, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.0002056291004481817, + "loss": 0.0134, "step": 242710 }, { - "epoch": 1.22, - "learning_rate": 0.00011631695516394145, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020562521223181025, + "loss": 0.0128, "step": 242720 }, { - "epoch": 1.22, - "learning_rate": 0.00011630938747092744, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020562132401543882, + "loss": 0.015, "step": 242730 }, { - "epoch": 1.22, - "learning_rate": 0.00011630181977791344, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020561743579906733, + "loss": 0.0152, "step": 242740 }, { - "epoch": 1.22, - "learning_rate": 0.00011629425208489942, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020561354758269585, + "loss": 0.0212, "step": 242750 }, { - "epoch": 1.22, - "learning_rate": 0.00011628668439188541, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002056096593663244, + "loss": 0.0129, "step": 242760 }, { - "epoch": 1.22, - "learning_rate": 0.0001162791166988714, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020560577114995296, + "loss": 0.0122, "step": 242770 }, { - "epoch": 1.22, - "learning_rate": 0.00011627154900585739, - "loss": 0.0114, + "epoch": 0.63, + "learning_rate": 0.00020560188293358147, + "loss": 0.0183, "step": 242780 }, { - "epoch": 1.22, - "learning_rate": 0.00011626398131284338, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020559799471721, + "loss": 0.0134, "step": 242790 }, { - "epoch": 1.22, - "learning_rate": 0.00011625641361982937, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020559410650083853, + "loss": 0.0133, "step": 242800 }, { - "epoch": 1.23, - "learning_rate": 0.00011624884592681536, - "loss": 0.0112, + "epoch": 0.63, + "learning_rate": 0.0002055902182844671, + "loss": 0.0137, "step": 242810 }, { - "epoch": 1.23, - "learning_rate": 0.00011624127823380136, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002055863300680956, + "loss": 0.0183, "step": 242820 }, { - "epoch": 1.23, - "learning_rate": 0.00011623371054078734, - "loss": 0.0068, + "epoch": 0.63, + "learning_rate": 0.00020558244185172415, + "loss": 0.0145, "step": 242830 }, { - "epoch": 1.23, - "learning_rate": 0.00011622614284777333, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020557855363535267, + "loss": 0.0158, "step": 242840 }, { - "epoch": 1.23, - "learning_rate": 0.00011621857515475931, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020557466541898124, + "loss": 0.0122, "step": 242850 }, { - "epoch": 1.23, - "learning_rate": 0.00011621100746174531, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020557077720260975, + "loss": 0.0147, "step": 242860 }, { - "epoch": 1.23, - "learning_rate": 0.0001162034397687313, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.0002055668889862383, + "loss": 0.0176, "step": 242870 }, { - "epoch": 1.23, - "learning_rate": 0.00011619587207571728, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.0002055630007698668, + "loss": 0.0196, "step": 242880 }, { - "epoch": 1.23, - "learning_rate": 0.00011618830438270328, - "loss": 0.0126, + "epoch": 0.63, + "learning_rate": 0.00020555911255349537, + "loss": 0.0166, "step": 242890 }, { - "epoch": 1.23, - "learning_rate": 0.00011618073668968925, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002055552243371239, + "loss": 0.0171, "step": 242900 }, { - "epoch": 1.23, - "learning_rate": 0.00011617316899667524, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020555133612075243, + "loss": 0.0137, "step": 242910 }, { - "epoch": 1.23, - "learning_rate": 0.00011616560130366124, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020554744790438095, + "loss": 0.017, "step": 242920 }, { - "epoch": 1.23, - "learning_rate": 0.00011615803361064722, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.0002055435596880095, + "loss": 0.0164, "step": 242930 }, { - "epoch": 1.23, - "learning_rate": 0.00011615046591763321, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020553967147163806, + "loss": 0.0127, "step": 242940 }, { - "epoch": 1.23, - "learning_rate": 0.0001161428982246192, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020553578325526657, + "loss": 0.0168, "step": 242950 }, { - "epoch": 1.23, - "learning_rate": 0.00011613533053160519, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002055318950388951, + "loss": 0.017, "step": 242960 }, { - "epoch": 1.23, - "learning_rate": 0.00011612776283859119, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.00020552800682252363, + "loss": 0.0168, "step": 242970 }, { - "epoch": 1.23, - "learning_rate": 0.00011612019514557717, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.0002055241186061522, + "loss": 0.0144, "step": 242980 }, { - "epoch": 1.23, - "learning_rate": 0.00011611262745256316, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002055202303897807, + "loss": 0.0154, "step": 242990 }, { - "epoch": 1.23, - "learning_rate": 0.00011610505975954916, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020551634217340925, + "loss": 0.0139, "step": 243000 }, { - "epoch": 1.23, - "eval_cer": 0.9144401736232748, - "eval_loss": 0.006801496725529432, - "eval_runtime": 115.8442, - "eval_samples_per_second": 17.265, - "eval_steps_per_second": 4.316, + "epoch": 0.63, + "eval_cer": 0.8818188561887047, + "eval_loss": 0.011068116873502731, + "eval_runtime": 107.3469, + "eval_samples_per_second": 18.631, + "eval_steps_per_second": 4.658, "step": 243000 }, { - "epoch": 1.23, - "learning_rate": 0.00011609749206653514, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020551245395703777, + "loss": 0.0149, "step": 243010 }, { - "epoch": 1.23, - "learning_rate": 0.00011608992437352113, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020550856574066633, + "loss": 0.0138, "step": 243020 }, { - "epoch": 1.23, - "learning_rate": 0.00011608235668050711, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020550467752429485, + "loss": 0.0134, "step": 243030 }, { - "epoch": 1.23, - "learning_rate": 0.00011607478898749311, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.0002055007893079234, + "loss": 0.0177, "step": 243040 }, { - "epoch": 1.23, - "learning_rate": 0.0001160672212944791, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.0002054969010915519, + "loss": 0.0183, "step": 243050 }, { - "epoch": 1.23, - "learning_rate": 0.00011605965360146509, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020549301287518047, + "loss": 0.0157, "step": 243060 }, { - "epoch": 1.23, - "learning_rate": 0.00011605208590845108, - "loss": 0.0066, + "epoch": 0.63, + "learning_rate": 0.000205489124658809, + "loss": 0.0169, "step": 243070 }, { - "epoch": 1.23, - "learning_rate": 0.00011604451821543708, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020548523644243753, + "loss": 0.0158, "step": 243080 }, { - "epoch": 1.23, - "learning_rate": 0.00011603695052242306, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020548134822606604, + "loss": 0.0157, "step": 243090 }, { - "epoch": 1.23, - "learning_rate": 0.00011602938282940905, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020547746000969461, + "loss": 0.0145, "step": 243100 }, { - "epoch": 1.23, - "learning_rate": 0.00011602181513639505, - "loss": 0.0061, + "epoch": 0.63, + "learning_rate": 0.00020547357179332316, + "loss": 0.0175, "step": 243110 }, { - "epoch": 1.23, - "learning_rate": 0.00011601424744338103, - "loss": 0.0112, + "epoch": 0.63, + "learning_rate": 0.00020546968357695167, + "loss": 0.0141, "step": 243120 }, { - "epoch": 1.23, - "learning_rate": 0.00011600667975036702, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.0002054657953605802, + "loss": 0.0179, "step": 243130 }, { - "epoch": 1.23, - "learning_rate": 0.000115999112057353, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020546190714420875, + "loss": 0.0147, "step": 243140 }, { - "epoch": 1.23, - "learning_rate": 0.000115991544364339, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.0002054580189278373, + "loss": 0.015, "step": 243150 }, { - "epoch": 1.23, - "learning_rate": 0.000115983976671325, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.0002054541307114658, + "loss": 0.0142, "step": 243160 }, { - "epoch": 1.23, - "learning_rate": 0.00011597640897831098, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020545024249509435, + "loss": 0.02, "step": 243170 }, { - "epoch": 1.23, - "learning_rate": 0.00011596884128529697, - "loss": 0.0112, + "epoch": 0.63, + "learning_rate": 0.00020544635427872287, + "loss": 0.0202, "step": 243180 }, { - "epoch": 1.23, - "learning_rate": 0.00011596127359228297, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020544246606235143, + "loss": 0.0137, "step": 243190 }, { - "epoch": 1.23, - "learning_rate": 0.00011595370589926895, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020543857784597995, + "loss": 0.0162, "step": 243200 }, { - "epoch": 1.23, - "learning_rate": 0.00011594613820625494, - "loss": 0.0116, + "epoch": 0.63, + "learning_rate": 0.0002054346896296085, + "loss": 0.0188, "step": 243210 }, { - "epoch": 1.23, - "learning_rate": 0.00011593857051324092, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.000205430801413237, + "loss": 0.013, "step": 243220 }, { - "epoch": 1.23, - "learning_rate": 0.00011593100282022692, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020542691319686557, + "loss": 0.015, "step": 243230 }, { - "epoch": 1.23, - "learning_rate": 0.00011592343512721291, - "loss": 0.0065, + "epoch": 0.63, + "learning_rate": 0.0002054230249804941, + "loss": 0.0154, "step": 243240 }, { - "epoch": 1.23, - "learning_rate": 0.0001159158674341989, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020541913676412263, + "loss": 0.0177, "step": 243250 }, { - "epoch": 1.23, - "learning_rate": 0.00011590829974118489, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020541524854775114, + "loss": 0.0194, "step": 243260 }, { - "epoch": 1.23, - "learning_rate": 0.00011590073204817089, - "loss": 0.0113, + "epoch": 0.63, + "learning_rate": 0.0002054113603313797, + "loss": 0.0137, "step": 243270 }, { - "epoch": 1.23, - "learning_rate": 0.00011589316435515687, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020540747211500825, + "loss": 0.0125, "step": 243280 }, { - "epoch": 1.23, - "learning_rate": 0.00011588559666214286, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020540358389863677, + "loss": 0.0155, "step": 243290 }, { - "epoch": 1.23, - "learning_rate": 0.00011587802896912884, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020539969568226528, + "loss": 0.0158, "step": 243300 }, { - "epoch": 1.23, - "learning_rate": 0.00011587046127611484, - "loss": 0.0114, + "epoch": 0.63, + "learning_rate": 0.00020539580746589385, + "loss": 0.0199, "step": 243310 }, { - "epoch": 1.23, - "learning_rate": 0.00011586289358310083, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.0002053919192495224, + "loss": 0.0143, "step": 243320 }, { - "epoch": 1.23, - "learning_rate": 0.00011585532589008682, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.0002053880310331509, + "loss": 0.0169, "step": 243330 }, { - "epoch": 1.23, - "learning_rate": 0.00011584775819707281, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020538414281677945, + "loss": 0.0136, "step": 243340 }, { - "epoch": 1.23, - "learning_rate": 0.0001158401905040588, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.000205380254600408, + "loss": 0.0134, "step": 243350 }, { - "epoch": 1.23, - "learning_rate": 0.00011583262281104479, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020537636638403653, + "loss": 0.0124, "step": 243360 }, { - "epoch": 1.23, - "learning_rate": 0.00011582505511803078, - "loss": 0.0064, + "epoch": 0.63, + "learning_rate": 0.00020537247816766505, + "loss": 0.0171, "step": 243370 }, { - "epoch": 1.23, - "learning_rate": 0.00011581748742501676, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.0002053685899512936, + "loss": 0.0154, "step": 243380 }, { - "epoch": 1.23, - "learning_rate": 0.00011580991973200276, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020536470173492213, + "loss": 0.0146, "step": 243390 }, { - "epoch": 1.23, - "learning_rate": 0.00011580235203898875, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020536081351855067, + "loss": 0.0154, "step": 243400 }, { - "epoch": 1.23, - "learning_rate": 0.00011579478434597473, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.0002053569253021792, + "loss": 0.0156, "step": 243410 }, { - "epoch": 1.23, - "learning_rate": 0.00011578721665296073, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020535303708580773, + "loss": 0.0155, "step": 243420 }, { - "epoch": 1.23, - "learning_rate": 0.00011577964895994672, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020534914886943624, + "loss": 0.0158, "step": 243430 }, { - "epoch": 1.23, - "learning_rate": 0.0001157720812669327, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.0002053452606530648, + "loss": 0.0172, "step": 243440 }, { - "epoch": 1.23, - "learning_rate": 0.0001157645135739187, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.00020534137243669335, + "loss": 0.0126, "step": 243450 }, { - "epoch": 1.23, - "learning_rate": 0.00011575694588090468, - "loss": 0.0064, + "epoch": 0.63, + "learning_rate": 0.00020533748422032187, + "loss": 0.0171, "step": 243460 }, { - "epoch": 1.23, - "learning_rate": 0.00011574937818789068, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020533359600395038, + "loss": 0.0155, "step": 243470 }, { - "epoch": 1.23, - "learning_rate": 0.00011574181049487667, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020532970778757895, + "loss": 0.0161, "step": 243480 }, { - "epoch": 1.23, - "learning_rate": 0.00011573424280186265, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.0002053258195712075, + "loss": 0.0121, "step": 243490 }, { - "epoch": 1.23, - "learning_rate": 0.00011572667510884865, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.000205321931354836, + "loss": 0.0191, "step": 243500 }, { - "epoch": 1.23, - "learning_rate": 0.00011571910741583464, - "loss": 0.0068, + "epoch": 0.63, + "learning_rate": 0.00020531804313846455, + "loss": 0.0172, "step": 243510 }, { - "epoch": 1.23, - "learning_rate": 0.00011571153972282063, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.0002053141549220931, + "loss": 0.0149, "step": 243520 }, { - "epoch": 1.23, - "learning_rate": 0.00011570397202980661, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020531026670572163, + "loss": 0.0164, "step": 243530 }, { - "epoch": 1.23, - "learning_rate": 0.00011569640433679259, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020530637848935015, + "loss": 0.0129, "step": 243540 }, { - "epoch": 1.23, - "learning_rate": 0.00011568883664377858, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.0002053024902729787, + "loss": 0.012, "step": 243550 }, { - "epoch": 1.23, - "learning_rate": 0.00011568126895076458, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020529860205660723, + "loss": 0.0151, "step": 243560 }, { - "epoch": 1.23, - "learning_rate": 0.00011567370125775056, - "loss": 0.0097, + "epoch": 0.63, + "learning_rate": 0.00020529471384023577, + "loss": 0.0152, "step": 243570 }, { - "epoch": 1.23, - "learning_rate": 0.00011566613356473656, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.0002052908256238643, + "loss": 0.0149, "step": 243580 }, { - "epoch": 1.23, - "learning_rate": 0.00011565856587172254, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020528693740749283, + "loss": 0.0158, "step": 243590 }, { - "epoch": 1.23, - "learning_rate": 0.00011565099817870853, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002052830491911214, + "loss": 0.0167, "step": 243600 }, { - "epoch": 1.23, - "learning_rate": 0.00011564343048569453, - "loss": 0.0128, + "epoch": 0.63, + "learning_rate": 0.0002052791609747499, + "loss": 0.0145, "step": 243610 }, { - "epoch": 1.23, - "learning_rate": 0.00011563586279268051, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020527527275837843, + "loss": 0.0171, "step": 243620 }, { - "epoch": 1.23, - "learning_rate": 0.0001156282950996665, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020527138454200697, + "loss": 0.0154, "step": 243630 }, { - "epoch": 1.23, - "learning_rate": 0.0001156207274066525, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020526749632563554, + "loss": 0.0131, "step": 243640 }, { - "epoch": 1.23, - "learning_rate": 0.00011561315971363848, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020526360810926405, + "loss": 0.0143, "step": 243650 }, { - "epoch": 1.23, - "learning_rate": 0.00011560559202062447, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.0002052597198928926, + "loss": 0.0197, "step": 243660 }, { - "epoch": 1.23, - "learning_rate": 0.00011559802432761046, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.0002052558316765211, + "loss": 0.0201, "step": 243670 }, { - "epoch": 1.23, - "learning_rate": 0.00011559045663459645, - "loss": 0.0084, + "epoch": 0.63, + "learning_rate": 0.00020525194346014965, + "loss": 0.0165, "step": 243680 }, { - "epoch": 1.23, - "learning_rate": 0.00011558288894158245, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.0002052480552437782, + "loss": 0.0161, "step": 243690 }, { - "epoch": 1.23, - "learning_rate": 0.00011557532124856843, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020524416702740673, + "loss": 0.0209, "step": 243700 }, { - "epoch": 1.23, - "learning_rate": 0.00011556775355555442, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.00020524027881103525, + "loss": 0.0152, "step": 243710 }, { - "epoch": 1.23, - "learning_rate": 0.00011556018586254042, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.0002052363905946638, + "loss": 0.0157, "step": 243720 }, { - "epoch": 1.23, - "learning_rate": 0.0001155526181695264, - "loss": 0.0062, + "epoch": 0.63, + "learning_rate": 0.00020523250237829233, + "loss": 0.0136, "step": 243730 }, { - "epoch": 1.23, - "learning_rate": 0.0001155450504765124, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020522861416192087, + "loss": 0.0137, "step": 243740 }, { - "epoch": 1.23, - "learning_rate": 0.00011553748278349838, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020522472594554939, + "loss": 0.0159, "step": 243750 }, { - "epoch": 1.23, - "learning_rate": 0.00011552991509048437, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020522083772917793, + "loss": 0.0144, "step": 243760 }, { - "epoch": 1.23, - "learning_rate": 0.00011552234739747037, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.0002052169495128065, + "loss": 0.0141, "step": 243770 }, { - "epoch": 1.23, - "learning_rate": 0.00011551477970445635, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.000205213061296435, + "loss": 0.0157, "step": 243780 }, { - "epoch": 1.23, - "learning_rate": 0.00011550721201144234, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020520917308006353, + "loss": 0.0235, "step": 243790 }, { - "epoch": 1.23, - "learning_rate": 0.00011549964431842834, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020520528486369207, + "loss": 0.0147, "step": 243800 }, { - "epoch": 1.23, - "learning_rate": 0.00011549207662541432, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020520139664732064, + "loss": 0.0179, "step": 243810 }, { - "epoch": 1.23, - "learning_rate": 0.00011548450893240031, - "loss": 0.0108, + "epoch": 0.63, + "learning_rate": 0.00020519750843094915, + "loss": 0.0112, "step": 243820 }, { - "epoch": 1.23, - "learning_rate": 0.0001154769412393863, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.0002051936202145777, + "loss": 0.0166, "step": 243830 }, { - "epoch": 1.23, - "learning_rate": 0.00011546937354637229, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.0002051897319982062, + "loss": 0.0192, "step": 243840 }, { - "epoch": 1.23, - "learning_rate": 0.00011546180585335828, - "loss": 0.0094, + "epoch": 0.63, + "learning_rate": 0.00020518584378183478, + "loss": 0.0196, "step": 243850 }, { - "epoch": 1.23, - "learning_rate": 0.00011545423816034427, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002051819555654633, + "loss": 0.018, "step": 243860 }, { - "epoch": 1.23, - "learning_rate": 0.00011544667046733026, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020517806734909183, + "loss": 0.0127, "step": 243870 }, { - "epoch": 1.23, - "learning_rate": 0.00011543910277431626, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020517417913272035, + "loss": 0.0117, "step": 243880 }, { - "epoch": 1.23, - "learning_rate": 0.00011543153508130224, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.0002051702909163489, + "loss": 0.013, "step": 243890 }, { - "epoch": 1.23, - "learning_rate": 0.00011542396738828823, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020516640269997743, + "loss": 0.0196, "step": 243900 }, { - "epoch": 1.23, - "learning_rate": 0.00011541639969527421, - "loss": 0.0072, + "epoch": 0.63, + "learning_rate": 0.00020516251448360597, + "loss": 0.0129, "step": 243910 }, { - "epoch": 1.23, - "learning_rate": 0.00011540883200226021, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020515862626723449, + "loss": 0.0168, "step": 243920 }, { - "epoch": 1.23, - "learning_rate": 0.0001154012643092462, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020515473805086303, + "loss": 0.0134, "step": 243930 }, { - "epoch": 1.23, - "learning_rate": 0.00011539369661623219, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020515084983449157, + "loss": 0.0148, "step": 243940 }, { - "epoch": 1.23, - "learning_rate": 0.00011538612892321818, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002051469616181201, + "loss": 0.0114, "step": 243950 }, { - "epoch": 1.23, - "learning_rate": 0.00011537856123020418, - "loss": 0.008, + "epoch": 0.63, + "learning_rate": 0.00020514307340174863, + "loss": 0.0182, "step": 243960 }, { - "epoch": 1.23, - "learning_rate": 0.00011537099353719016, - "loss": 0.006, + "epoch": 0.63, + "learning_rate": 0.00020513918518537717, + "loss": 0.0138, "step": 243970 }, { - "epoch": 1.23, - "learning_rate": 0.00011536342584417615, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020513529696900574, + "loss": 0.0138, "step": 243980 }, { - "epoch": 1.23, - "learning_rate": 0.00011535585815116213, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020513140875263425, + "loss": 0.013, "step": 243990 }, { - "epoch": 1.23, - "learning_rate": 0.00011534829045814813, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.0002051275205362628, + "loss": 0.0155, "step": 244000 }, { - "epoch": 1.23, - "eval_cer": 0.9144731670915385, - "eval_loss": 0.00690747844055295, - "eval_runtime": 116.0173, - "eval_samples_per_second": 17.239, - "eval_steps_per_second": 4.31, + "epoch": 0.63, + "eval_cer": 0.881782465628416, + "eval_loss": 0.01116818655282259, + "eval_runtime": 107.1197, + "eval_samples_per_second": 18.671, + "eval_steps_per_second": 4.668, "step": 244000 }, { - "epoch": 1.23, - "learning_rate": 0.00011534072276513412, - "loss": 0.007, + "epoch": 0.63, + "learning_rate": 0.0002051236323198913, + "loss": 0.0135, "step": 244010 }, { - "epoch": 1.23, - "learning_rate": 0.0001153331550721201, - "loss": 0.0058, - "step": 244020 + "epoch": 0.63, + "learning_rate": 0.00020511974410351988, + "loss": 0.0152, + "step": 244020 }, { - "epoch": 1.23, - "learning_rate": 0.0001153255873791061, - "loss": 0.0058, + "epoch": 0.63, + "learning_rate": 0.0002051158558871484, + "loss": 0.0132, "step": 244030 }, { - "epoch": 1.23, - "learning_rate": 0.0001153180196860921, - "loss": 0.0135, + "epoch": 0.63, + "learning_rate": 0.00020511196767077693, + "loss": 0.0167, "step": 244040 }, { - "epoch": 1.23, - "learning_rate": 0.00011531045199307808, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020510807945440545, + "loss": 0.0162, "step": 244050 }, { - "epoch": 1.23, - "learning_rate": 0.00011530288430006407, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020510419123803401, + "loss": 0.0139, "step": 244060 }, { - "epoch": 1.23, - "learning_rate": 0.00011529531660705005, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.00020510030302166253, + "loss": 0.0149, "step": 244070 }, { - "epoch": 1.23, - "learning_rate": 0.00011528774891403605, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020509641480529107, + "loss": 0.0151, "step": 244080 }, { - "epoch": 1.23, - "learning_rate": 0.00011528018122102204, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020509252658891959, + "loss": 0.0172, "step": 244090 }, { - "epoch": 1.23, - "learning_rate": 0.00011527261352800802, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020508863837254815, + "loss": 0.0158, "step": 244100 }, { - "epoch": 1.23, - "learning_rate": 0.00011526504583499402, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020508475015617667, + "loss": 0.0193, "step": 244110 }, { - "epoch": 1.23, - "learning_rate": 0.00011525747814198001, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.0002050808619398052, + "loss": 0.0132, "step": 244120 }, { - "epoch": 1.23, - "learning_rate": 0.000115249910448966, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020507697372343372, + "loss": 0.0142, "step": 244130 }, { - "epoch": 1.23, - "learning_rate": 0.00011524234275595199, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020507308550706227, + "loss": 0.0164, "step": 244140 }, { - "epoch": 1.23, - "learning_rate": 0.00011523477506293799, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020506919729069084, + "loss": 0.0165, "step": 244150 }, { - "epoch": 1.23, - "learning_rate": 0.00011522720736992395, - "loss": 0.0104, + "epoch": 0.63, + "learning_rate": 0.00020506530907431935, + "loss": 0.0157, "step": 244160 }, { - "epoch": 1.23, - "learning_rate": 0.00011521963967690995, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.0002050614208579479, + "loss": 0.0251, "step": 244170 }, { - "epoch": 1.23, - "learning_rate": 0.00011521207198389593, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.0002050575326415764, + "loss": 0.0166, "step": 244180 }, { - "epoch": 1.23, - "learning_rate": 0.00011520450429088192, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020505364442520497, + "loss": 0.0128, "step": 244190 }, { - "epoch": 1.23, - "learning_rate": 0.0001151969365978679, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.0002050497562088335, + "loss": 0.0135, "step": 244200 }, { - "epoch": 1.23, - "learning_rate": 0.0001151893689048539, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020504586799246203, + "loss": 0.0133, "step": 244210 }, { - "epoch": 1.23, - "learning_rate": 0.0001151818012118399, - "loss": 0.0111, + "epoch": 0.63, + "learning_rate": 0.00020504197977609055, + "loss": 0.0218, "step": 244220 }, { - "epoch": 1.23, - "learning_rate": 0.00011517423351882588, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020503809155971911, + "loss": 0.0167, "step": 244230 }, { - "epoch": 1.23, - "learning_rate": 0.00011516666582581187, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020503420334334763, + "loss": 0.0185, "step": 244240 }, { - "epoch": 1.23, - "learning_rate": 0.00011515909813279787, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020503031512697617, + "loss": 0.016, "step": 244250 }, { - "epoch": 1.23, - "learning_rate": 0.00011515153043978385, - "loss": 0.0116, + "epoch": 0.63, + "learning_rate": 0.00020502642691060468, + "loss": 0.0167, "step": 244260 }, { - "epoch": 1.23, - "learning_rate": 0.00011514396274676984, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020502253869423325, + "loss": 0.0114, "step": 244270 }, { - "epoch": 1.23, - "learning_rate": 0.00011513639505375583, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020501865047786177, + "loss": 0.0182, "step": 244280 }, { - "epoch": 1.23, - "learning_rate": 0.00011512882736074182, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.0002050147622614903, + "loss": 0.0128, "step": 244290 }, { - "epoch": 1.23, - "learning_rate": 0.00011512125966772782, - "loss": 0.0078, + "epoch": 0.63, + "learning_rate": 0.00020501087404511882, + "loss": 0.0167, "step": 244300 }, { - "epoch": 1.23, - "learning_rate": 0.0001151136919747138, - "loss": 0.0082, + "epoch": 0.63, + "learning_rate": 0.0002050069858287474, + "loss": 0.014, "step": 244310 }, { - "epoch": 1.23, - "learning_rate": 0.00011510612428169979, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.00020500309761237593, + "loss": 0.0161, "step": 244320 }, { - "epoch": 1.23, - "learning_rate": 0.00011509855658868579, - "loss": 0.0124, + "epoch": 0.63, + "learning_rate": 0.00020499920939600445, + "loss": 0.0175, "step": 244330 }, { - "epoch": 1.23, - "learning_rate": 0.00011509098889567177, - "loss": 0.0068, + "epoch": 0.63, + "learning_rate": 0.00020499532117963296, + "loss": 0.0182, "step": 244340 }, { - "epoch": 1.23, - "learning_rate": 0.00011508342120265776, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020499143296326153, + "loss": 0.0172, "step": 244350 }, { - "epoch": 1.23, - "learning_rate": 0.00011507585350964374, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020498754474689007, + "loss": 0.0168, "step": 244360 }, { - "epoch": 1.23, - "learning_rate": 0.00011506828581662974, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.0002049836565305186, + "loss": 0.015, "step": 244370 }, { - "epoch": 1.23, - "learning_rate": 0.00011506071812361573, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020497976831414713, + "loss": 0.0141, "step": 244380 }, { - "epoch": 1.23, - "learning_rate": 0.00011505315043060172, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020497588009777564, + "loss": 0.0128, "step": 244390 }, { - "epoch": 1.23, - "learning_rate": 0.00011504558273758771, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.0002049719918814042, + "loss": 0.0159, "step": 244400 }, { - "epoch": 1.23, - "learning_rate": 0.0001150380150445737, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020496810366503273, + "loss": 0.0137, "step": 244410 }, { - "epoch": 1.23, - "learning_rate": 0.00011503044735155969, - "loss": 0.0121, + "epoch": 0.63, + "learning_rate": 0.00020496421544866127, + "loss": 0.0142, "step": 244420 }, { - "epoch": 1.23, - "learning_rate": 0.00011502287965854568, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020496032723228978, + "loss": 0.0127, "step": 244430 }, { - "epoch": 1.23, - "learning_rate": 0.00011501531196553166, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020495643901591835, + "loss": 0.0114, "step": 244440 }, { - "epoch": 1.23, - "learning_rate": 0.00011500774427251766, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.00020495255079954687, + "loss": 0.0125, "step": 244450 }, { - "epoch": 1.23, - "learning_rate": 0.00011500017657950365, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.0002049486625831754, + "loss": 0.013, "step": 244460 }, { - "epoch": 1.23, - "learning_rate": 0.00011499260888648964, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020494477436680392, + "loss": 0.0176, "step": 244470 }, { - "epoch": 1.23, - "learning_rate": 0.00011498504119347563, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.0002049408861504325, + "loss": 0.0137, "step": 244480 }, { - "epoch": 1.23, - "learning_rate": 0.00011497747350046163, - "loss": 0.0102, + "epoch": 0.63, + "learning_rate": 0.000204936997934061, + "loss": 0.0197, "step": 244490 }, { - "epoch": 1.23, - "learning_rate": 0.0001149699058074476, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020493310971768955, + "loss": 0.0124, "step": 244500 }, { - "epoch": 1.23, - "learning_rate": 0.0001149623381144336, - "loss": 0.013, + "epoch": 0.63, + "learning_rate": 0.00020492922150131806, + "loss": 0.0165, "step": 244510 }, { - "epoch": 1.23, - "learning_rate": 0.00011495477042141958, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.00020492533328494663, + "loss": 0.0146, "step": 244520 }, { - "epoch": 1.23, - "learning_rate": 0.00011494720272840558, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.00020492144506857517, + "loss": 0.014, "step": 244530 }, { - "epoch": 1.23, - "learning_rate": 0.00011493963503539157, - "loss": 0.0091, + "epoch": 0.63, + "learning_rate": 0.0002049175568522037, + "loss": 0.0146, "step": 244540 }, { - "epoch": 1.23, - "learning_rate": 0.00011493206734237755, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020491366863583223, + "loss": 0.0212, "step": 244550 }, { - "epoch": 1.23, - "learning_rate": 0.00011492449964936355, - "loss": 0.0096, + "epoch": 0.63, + "learning_rate": 0.00020490978041946077, + "loss": 0.0142, "step": 244560 }, { - "epoch": 1.23, - "learning_rate": 0.00011491693195634954, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.0002049058922030893, + "loss": 0.0166, "step": 244570 }, { - "epoch": 1.23, - "learning_rate": 0.00011490936426333553, - "loss": 0.0098, + "epoch": 0.63, + "learning_rate": 0.00020490200398671783, + "loss": 0.0132, "step": 244580 }, { - "epoch": 1.23, - "learning_rate": 0.00011490179657032152, - "loss": 0.0086, + "epoch": 0.63, + "learning_rate": 0.00020489811577034637, + "loss": 0.0154, "step": 244590 }, { - "epoch": 1.23, - "learning_rate": 0.00011489422887730752, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.0002048942275539749, + "loss": 0.0128, "step": 244600 }, { - "epoch": 1.23, - "learning_rate": 0.0001148866611842935, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020489033933760345, + "loss": 0.0154, "step": 244610 }, { - "epoch": 1.23, - "learning_rate": 0.00011487909349127949, - "loss": 0.0092, + "epoch": 0.63, + "learning_rate": 0.00020488645112123197, + "loss": 0.0151, "step": 244620 }, { - "epoch": 1.23, - "learning_rate": 0.00011487152579826547, - "loss": 0.0105, + "epoch": 0.63, + "learning_rate": 0.0002048825629048605, + "loss": 0.0138, "step": 244630 }, { - "epoch": 1.23, - "learning_rate": 0.00011486395810525147, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.00020487867468848902, + "loss": 0.0169, "step": 244640 }, { - "epoch": 1.23, - "learning_rate": 0.00011485639041223746, - "loss": 0.0071, + "epoch": 0.63, + "learning_rate": 0.0002048747864721176, + "loss": 0.0171, "step": 244650 }, { - "epoch": 1.23, - "learning_rate": 0.00011484882271922345, - "loss": 0.0095, + "epoch": 0.63, + "learning_rate": 0.0002048708982557461, + "loss": 0.018, "step": 244660 }, { - "epoch": 1.23, - "learning_rate": 0.00011484125502620944, - "loss": 0.0117, + "epoch": 0.63, + "learning_rate": 0.00020486701003937465, + "loss": 0.0181, "step": 244670 }, { - "epoch": 1.23, - "learning_rate": 0.00011483368733319544, - "loss": 0.0106, + "epoch": 0.63, + "learning_rate": 0.00020486312182300316, + "loss": 0.0249, "step": 244680 }, { - "epoch": 1.23, - "learning_rate": 0.00011482611964018142, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020485923360663173, + "loss": 0.012, "step": 244690 }, { - "epoch": 1.23, - "learning_rate": 0.00011481855194716741, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020485534539026027, + "loss": 0.0156, "step": 244700 }, { - "epoch": 1.23, - "learning_rate": 0.00011481098425415339, - "loss": 0.0147, + "epoch": 0.63, + "learning_rate": 0.0002048514571738888, + "loss": 0.014, "step": 244710 }, { - "epoch": 1.23, - "learning_rate": 0.00011480341656113939, - "loss": 0.01, + "epoch": 0.63, + "learning_rate": 0.00020484756895751733, + "loss": 0.0159, "step": 244720 }, { - "epoch": 1.23, - "learning_rate": 0.00011479584886812538, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020484368074114587, + "loss": 0.0196, "step": 244730 }, { - "epoch": 1.23, - "learning_rate": 0.00011478828117511136, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.0002048397925247744, + "loss": 0.0195, "step": 244740 }, { - "epoch": 1.23, - "learning_rate": 0.00011478071348209736, - "loss": 0.0076, + "epoch": 0.63, + "learning_rate": 0.00020483590430840293, + "loss": 0.0127, "step": 244750 }, { - "epoch": 1.23, - "learning_rate": 0.00011477314578908335, - "loss": 0.0077, + "epoch": 0.63, + "learning_rate": 0.00020483201609203147, + "loss": 0.0154, "step": 244760 }, { - "epoch": 1.23, - "learning_rate": 0.00011476557809606934, - "loss": 0.0118, + "epoch": 0.63, + "learning_rate": 0.00020482812787566, + "loss": 0.0216, "step": 244770 }, { - "epoch": 1.23, - "learning_rate": 0.00011475801040305532, - "loss": 0.0099, + "epoch": 0.63, + "learning_rate": 0.00020482423965928855, + "loss": 0.015, "step": 244780 }, { - "epoch": 1.23, - "learning_rate": 0.0001147504427100413, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.00020482035144291707, + "loss": 0.017, "step": 244790 }, { - "epoch": 1.24, - "learning_rate": 0.0001147428750170273, - "loss": 0.0093, + "epoch": 0.63, + "learning_rate": 0.0002048164632265456, + "loss": 0.018, "step": 244800 }, { - "epoch": 1.24, - "learning_rate": 0.00011473530732401328, - "loss": 0.0073, + "epoch": 0.63, + "learning_rate": 0.00020481257501017415, + "loss": 0.0169, "step": 244810 }, { - "epoch": 1.24, - "learning_rate": 0.00011472773963099927, - "loss": 0.0087, + "epoch": 0.63, + "learning_rate": 0.0002048086867938027, + "loss": 0.0145, "step": 244820 }, { - "epoch": 1.24, - "learning_rate": 0.00011472017193798527, - "loss": 0.009, + "epoch": 0.63, + "learning_rate": 0.0002048047985774312, + "loss": 0.0245, "step": 244830 }, { - "epoch": 1.24, - "learning_rate": 0.00011471260424497125, - "loss": 0.0075, + "epoch": 0.63, + "learning_rate": 0.00020480091036105975, + "loss": 0.0175, "step": 244840 }, { - "epoch": 1.24, - "learning_rate": 0.00011470503655195724, - "loss": 0.0085, + "epoch": 0.63, + "learning_rate": 0.00020479702214468832, + "loss": 0.0145, "step": 244850 }, { - "epoch": 1.24, - "learning_rate": 0.00011469746885894324, - "loss": 0.0088, + "epoch": 0.63, + "learning_rate": 0.00020479313392831683, + "loss": 0.0165, "step": 244860 }, { - "epoch": 1.24, - "learning_rate": 0.00011468990116592922, - "loss": 0.0071, + "epoch": 0.63, + "learning_rate": 0.00020478924571194537, + "loss": 0.0128, "step": 244870 }, { - "epoch": 1.24, - "learning_rate": 0.00011468233347291521, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.0002047853574955739, + "loss": 0.0171, "step": 244880 }, { - "epoch": 1.24, - "learning_rate": 0.0001146747657799012, - "loss": 0.0101, + "epoch": 0.63, + "learning_rate": 0.0002047814692792024, + "loss": 0.0132, "step": 244890 }, { - "epoch": 1.24, - "learning_rate": 0.00011466719808688719, - "loss": 0.0074, + "epoch": 0.63, + "learning_rate": 0.00020477758106283097, + "loss": 0.015, "step": 244900 }, { - "epoch": 1.24, - "learning_rate": 0.00011465963039387318, - "loss": 0.0117, + "epoch": 0.63, + "learning_rate": 0.0002047736928464595, + "loss": 0.0155, "step": 244910 }, { - "epoch": 1.24, - "learning_rate": 0.00011465206270085917, - "loss": 0.0089, + "epoch": 0.63, + "learning_rate": 0.00020476980463008803, + "loss": 0.0154, "step": 244920 }, { - "epoch": 1.24, - "learning_rate": 0.00011464449500784516, - "loss": 0.0079, + "epoch": 0.63, + "learning_rate": 0.00020476591641371657, + "loss": 0.014, "step": 244930 }, { - "epoch": 1.24, - "learning_rate": 0.00011463692731483116, - "loss": 0.0119, + "epoch": 0.63, + "learning_rate": 0.0002047620281973451, + "loss": 0.021, "step": 244940 }, { - "epoch": 1.24, - "learning_rate": 0.00011462935962181714, - "loss": 0.0103, + "epoch": 0.63, + "learning_rate": 0.00020475813998097365, + "loss": 0.0161, "step": 244950 }, { - "epoch": 1.24, - "learning_rate": 0.00011462179192880313, - "loss": 0.0083, + "epoch": 0.63, + "learning_rate": 0.00020475425176460217, + "loss": 0.0181, "step": 244960 }, { - "epoch": 1.24, - "learning_rate": 0.00011461422423578911, - "loss": 0.0081, + "epoch": 0.63, + "learning_rate": 0.0002047503635482307, + "loss": 0.0152, "step": 244970 }, { - "epoch": 1.24, - "learning_rate": 0.00011460665654277511, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020474647533185925, + "loss": 0.0167, "step": 244980 }, { - "epoch": 1.24, - "learning_rate": 0.0001145990888497611, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.0002047425871154878, + "loss": 0.0157, "step": 244990 }, { - "epoch": 1.24, - "learning_rate": 0.00011459152115674709, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.0002047386988991163, + "loss": 0.0122, "step": 245000 }, { - "epoch": 1.24, - "eval_cer": 0.9144741374876638, - "eval_loss": 0.006758058909326792, - "eval_runtime": 115.9822, - "eval_samples_per_second": 17.244, - "eval_steps_per_second": 4.311, + "epoch": 0.64, + "eval_cer": 0.8817726681698768, + "eval_loss": 0.011478559114038944, + "eval_runtime": 107.2432, + "eval_samples_per_second": 18.649, + "eval_steps_per_second": 4.662, "step": 245000 }, { - "epoch": 1.24, - "learning_rate": 0.00011458395346373308, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020473481068274485, + "loss": 0.0153, "step": 245010 }, { - "epoch": 1.24, - "learning_rate": 0.00011457638577071908, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.00020473092246637342, + "loss": 0.0166, "step": 245020 }, { - "epoch": 1.24, - "learning_rate": 0.00011456881807770506, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020472703425000193, + "loss": 0.0161, "step": 245030 }, { - "epoch": 1.24, - "learning_rate": 0.00011456125038469105, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020472314603363047, + "loss": 0.0147, "step": 245040 }, { - "epoch": 1.24, - "learning_rate": 0.00011455368269167705, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020471925781725899, + "loss": 0.014, "step": 245050 }, { - "epoch": 1.24, - "learning_rate": 0.00011454611499866303, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020471536960088755, + "loss": 0.0186, "step": 245060 }, { - "epoch": 1.24, - "learning_rate": 0.00011453854730564902, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020471148138451607, + "loss": 0.0169, "step": 245070 }, { - "epoch": 1.24, - "learning_rate": 0.000114530979612635, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.0002047075931681446, + "loss": 0.0161, "step": 245080 }, { - "epoch": 1.24, - "learning_rate": 0.000114523411919621, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020470370495177313, + "loss": 0.0151, "step": 245090 }, { - "epoch": 1.24, - "learning_rate": 0.000114515844226607, - "loss": 0.011, + "epoch": 0.64, + "learning_rate": 0.0002046998167354017, + "loss": 0.0149, "step": 245100 }, { - "epoch": 1.24, - "learning_rate": 0.00011450827653359298, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.0002046959285190302, + "loss": 0.0182, "step": 245110 }, { - "epoch": 1.24, - "learning_rate": 0.00011450070884057897, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020469204030265875, + "loss": 0.0186, "step": 245120 }, { - "epoch": 1.24, - "learning_rate": 0.00011449314114756497, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020468815208628727, + "loss": 0.0185, "step": 245130 }, { - "epoch": 1.24, - "learning_rate": 0.00011448557345455095, - "loss": 0.0102, + "epoch": 0.64, + "learning_rate": 0.0002046842638699158, + "loss": 0.0187, "step": 245140 }, { - "epoch": 1.24, - "learning_rate": 0.00011447800576153694, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020468037565354435, + "loss": 0.014, "step": 245150 }, { - "epoch": 1.24, - "learning_rate": 0.00011447043806852292, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.0002046764874371729, + "loss": 0.0187, "step": 245160 }, { - "epoch": 1.24, - "learning_rate": 0.00011446287037550892, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.0002046725992208014, + "loss": 0.0198, "step": 245170 }, { - "epoch": 1.24, - "learning_rate": 0.00011445530268249491, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020466871100442995, + "loss": 0.0141, "step": 245180 }, { - "epoch": 1.24, - "learning_rate": 0.0001144477349894809, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020466482278805851, + "loss": 0.0184, "step": 245190 }, { - "epoch": 1.24, - "learning_rate": 0.00011444016729646689, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020466093457168703, + "loss": 0.0189, "step": 245200 }, { - "epoch": 1.24, - "learning_rate": 0.00011443259960345289, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020465704635531554, + "loss": 0.0163, "step": 245210 }, { - "epoch": 1.24, - "learning_rate": 0.00011442503191043887, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020465315813894409, + "loss": 0.0161, "step": 245220 }, { - "epoch": 1.24, - "learning_rate": 0.00011441746421742486, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020464926992257265, + "loss": 0.015, "step": 245230 }, { - "epoch": 1.24, - "learning_rate": 0.00011440989652441084, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020464538170620117, + "loss": 0.0133, "step": 245240 }, { - "epoch": 1.24, - "learning_rate": 0.00011440232883139684, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002046414934898297, + "loss": 0.0112, "step": 245250 }, { - "epoch": 1.24, - "learning_rate": 0.00011439476113838283, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020463760527345823, + "loss": 0.0164, "step": 245260 }, { - "epoch": 1.24, - "learning_rate": 0.00011438719344536881, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.0002046337170570868, + "loss": 0.0141, "step": 245270 }, { - "epoch": 1.24, - "learning_rate": 0.00011437962575235481, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002046298288407153, + "loss": 0.014, "step": 245280 }, { - "epoch": 1.24, - "learning_rate": 0.0001143720580593408, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020462594062434385, + "loss": 0.0188, "step": 245290 }, { - "epoch": 1.24, - "learning_rate": 0.00011436449036632679, - "loss": 0.0118, + "epoch": 0.64, + "learning_rate": 0.00020462205240797236, + "loss": 0.0184, "step": 245300 }, { - "epoch": 1.24, - "learning_rate": 0.00011435692267331278, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.00020461816419160093, + "loss": 0.0157, "step": 245310 }, { - "epoch": 1.24, - "learning_rate": 0.00011434935498029876, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020461427597522945, + "loss": 0.0158, "step": 245320 }, { - "epoch": 1.24, - "learning_rate": 0.00011434178728728476, - "loss": 0.0175, + "epoch": 0.64, + "learning_rate": 0.000204610387758858, + "loss": 0.017, "step": 245330 }, { - "epoch": 1.24, - "learning_rate": 0.00011433421959427075, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.0002046064995424865, + "loss": 0.0173, "step": 245340 }, { - "epoch": 1.24, - "learning_rate": 0.00011432665190125673, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020460261132611507, + "loss": 0.0132, "step": 245350 }, { - "epoch": 1.24, - "learning_rate": 0.00011431908420824273, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.00020459872310974361, + "loss": 0.0146, "step": 245360 }, { - "epoch": 1.24, - "learning_rate": 0.00011431151651522872, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020459483489337213, + "loss": 0.0158, "step": 245370 }, { - "epoch": 1.24, - "learning_rate": 0.0001143039488222147, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020459094667700064, + "loss": 0.0142, "step": 245380 }, { - "epoch": 1.24, - "learning_rate": 0.0001142963811292007, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020458705846062918, + "loss": 0.0132, "step": 245390 }, { - "epoch": 1.24, - "learning_rate": 0.00011428881343618668, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020458317024425775, + "loss": 0.0148, "step": 245400 }, { - "epoch": 1.24, - "learning_rate": 0.00011428124574317266, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020457928202788627, + "loss": 0.0305, "step": 245410 }, { - "epoch": 1.24, - "learning_rate": 0.00011427367805015864, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002045753938115148, + "loss": 0.0171, "step": 245420 }, { - "epoch": 1.24, - "learning_rate": 0.00011426611035714464, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020457150559514332, + "loss": 0.0151, "step": 245430 }, { - "epoch": 1.24, - "learning_rate": 0.00011425854266413063, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.0002045676173787719, + "loss": 0.0135, "step": 245440 }, { - "epoch": 1.24, - "learning_rate": 0.00011425097497111662, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.0002045637291624004, + "loss": 0.0151, "step": 245450 }, { - "epoch": 1.24, - "learning_rate": 0.00011424340727810261, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020455984094602895, + "loss": 0.0169, "step": 245460 }, { - "epoch": 1.24, - "learning_rate": 0.0001142358395850886, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020455595272965746, + "loss": 0.0175, "step": 245470 }, { - "epoch": 1.24, - "learning_rate": 0.00011422827189207459, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020455206451328603, + "loss": 0.0179, "step": 245480 }, { - "epoch": 1.24, - "learning_rate": 0.00011422070419906058, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020454817629691455, + "loss": 0.0182, "step": 245490 }, { - "epoch": 1.24, - "learning_rate": 0.00011421313650604658, - "loss": 0.0114, + "epoch": 0.64, + "learning_rate": 0.0002045442880805431, + "loss": 0.0139, "step": 245500 }, { - "epoch": 1.24, - "learning_rate": 0.00011420556881303256, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002045403998641716, + "loss": 0.0186, "step": 245510 }, { - "epoch": 1.24, - "learning_rate": 0.00011419800112001855, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020453651164780017, + "loss": 0.0185, "step": 245520 }, { - "epoch": 1.24, - "learning_rate": 0.00011419043342700454, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002045326234314287, + "loss": 0.0174, "step": 245530 }, { - "epoch": 1.24, - "learning_rate": 0.00011418286573399053, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020452873521505723, + "loss": 0.0161, "step": 245540 }, { - "epoch": 1.24, - "learning_rate": 0.00011417529804097653, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020452484699868574, + "loss": 0.0115, "step": 245550 }, { - "epoch": 1.24, - "learning_rate": 0.00011416773034796251, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.0002045209587823143, + "loss": 0.0181, "step": 245560 }, { - "epoch": 1.24, - "learning_rate": 0.0001141601626549485, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020451707056594285, + "loss": 0.0155, "step": 245570 }, { - "epoch": 1.24, - "learning_rate": 0.0001141525949619345, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020451318234957137, + "loss": 0.0162, "step": 245580 }, { - "epoch": 1.24, - "learning_rate": 0.00011414502726892048, - "loss": 0.0068, + "epoch": 0.64, + "learning_rate": 0.0002045092941331999, + "loss": 0.015, "step": 245590 }, { - "epoch": 1.24, - "learning_rate": 0.00011413745957590647, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020450540591682845, + "loss": 0.02, "step": 245600 }, { - "epoch": 1.24, - "learning_rate": 0.00011412989188289245, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.000204501517700457, + "loss": 0.0177, "step": 245610 }, { - "epoch": 1.24, - "learning_rate": 0.00011412232418987845, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.0002044976294840855, + "loss": 0.0164, "step": 245620 }, { - "epoch": 1.24, - "learning_rate": 0.00011411475649686444, - "loss": 0.0121, + "epoch": 0.64, + "learning_rate": 0.00020449374126771405, + "loss": 0.0188, "step": 245630 }, { - "epoch": 1.24, - "learning_rate": 0.00011410718880385043, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020448985305134256, + "loss": 0.0167, "step": 245640 }, { - "epoch": 1.24, - "learning_rate": 0.00011409962111083642, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020448596483497113, + "loss": 0.0144, "step": 245650 }, { - "epoch": 1.24, - "learning_rate": 0.00011409205341782242, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020448207661859965, + "loss": 0.0153, "step": 245660 }, { - "epoch": 1.24, - "learning_rate": 0.0001140844857248084, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.0002044781884022282, + "loss": 0.0201, "step": 245670 }, { - "epoch": 1.24, - "learning_rate": 0.00011407691803179439, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.0002044743001858567, + "loss": 0.0141, "step": 245680 }, { - "epoch": 1.24, - "learning_rate": 0.00011406935033878037, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020447041196948527, + "loss": 0.0148, "step": 245690 }, { - "epoch": 1.24, - "learning_rate": 0.00011406178264576637, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020446652375311379, + "loss": 0.0188, "step": 245700 }, { - "epoch": 1.24, - "learning_rate": 0.00011405421495275236, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020446263553674233, + "loss": 0.0184, "step": 245710 }, { - "epoch": 1.24, - "learning_rate": 0.00011404664725973835, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020445874732037084, + "loss": 0.0158, "step": 245720 }, { - "epoch": 1.24, - "learning_rate": 0.00011403907956672434, - "loss": 0.0108, + "epoch": 0.64, + "learning_rate": 0.0002044548591039994, + "loss": 0.0145, "step": 245730 }, { - "epoch": 1.24, - "learning_rate": 0.00011403151187371034, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020445097088762795, + "loss": 0.016, "step": 245740 }, { - "epoch": 1.24, - "learning_rate": 0.00011402394418069632, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020444708267125647, + "loss": 0.0117, "step": 245750 }, { - "epoch": 1.24, - "learning_rate": 0.00011401637648768231, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.000204443194454885, + "loss": 0.0168, "step": 245760 }, { - "epoch": 1.24, - "learning_rate": 0.0001140088087946683, - "loss": 0.0068, + "epoch": 0.64, + "learning_rate": 0.00020443930623851355, + "loss": 0.0152, "step": 245770 }, { - "epoch": 1.24, - "learning_rate": 0.00011400124110165429, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.0002044354180221421, + "loss": 0.0194, "step": 245780 }, { - "epoch": 1.24, - "learning_rate": 0.00011399367340864028, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.0002044315298057706, + "loss": 0.0176, "step": 245790 }, { - "epoch": 1.24, - "learning_rate": 0.00011398610571562626, - "loss": 0.0109, + "epoch": 0.64, + "learning_rate": 0.00020442764158939915, + "loss": 0.0145, "step": 245800 }, { - "epoch": 1.24, - "learning_rate": 0.00011397853802261226, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.0002044237533730277, + "loss": 0.0159, "step": 245810 }, { - "epoch": 1.24, - "learning_rate": 0.00011397097032959825, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020441986515665623, + "loss": 0.0129, "step": 245820 }, { - "epoch": 1.24, - "learning_rate": 0.00011396340263658424, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020441597694028475, + "loss": 0.0123, "step": 245830 }, { - "epoch": 1.24, - "learning_rate": 0.00011395583494357023, - "loss": 0.0068, + "epoch": 0.64, + "learning_rate": 0.0002044120887239133, + "loss": 0.0149, "step": 245840 }, { - "epoch": 1.24, - "learning_rate": 0.00011394826725055621, - "loss": 0.0118, + "epoch": 0.64, + "learning_rate": 0.00020440820050754183, + "loss": 0.0126, "step": 245850 }, { - "epoch": 1.24, - "learning_rate": 0.00011394069955754221, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020440431229117037, + "loss": 0.0149, "step": 245860 }, { - "epoch": 1.24, - "learning_rate": 0.0001139331318645282, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020440042407479889, + "loss": 0.0203, "step": 245870 }, { - "epoch": 1.24, - "learning_rate": 0.00011392556417151418, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020439653585842743, + "loss": 0.0178, "step": 245880 }, { - "epoch": 1.24, - "learning_rate": 0.00011391799647850018, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020439264764205594, + "loss": 0.0139, "step": 245890 }, { - "epoch": 1.24, - "learning_rate": 0.00011391042878548617, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.0002043887594256845, + "loss": 0.0165, "step": 245900 }, { - "epoch": 1.24, - "learning_rate": 0.00011390286109247216, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020438487120931305, + "loss": 0.0207, "step": 245910 }, { - "epoch": 1.24, - "learning_rate": 0.00011389529339945815, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020438098299294157, + "loss": 0.0173, "step": 245920 }, { - "epoch": 1.24, - "learning_rate": 0.00011388772570644413, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020437709477657008, + "loss": 0.0154, "step": 245930 }, { - "epoch": 1.24, - "learning_rate": 0.00011388015801343013, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020437320656019865, + "loss": 0.0181, "step": 245940 }, { - "epoch": 1.24, - "learning_rate": 0.00011387259032041612, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002043693183438272, + "loss": 0.0189, "step": 245950 }, { - "epoch": 1.24, - "learning_rate": 0.0001138650226274021, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.0002043654301274557, + "loss": 0.0149, "step": 245960 }, { - "epoch": 1.24, - "learning_rate": 0.0001138574549343881, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020436154191108425, + "loss": 0.0143, "step": 245970 }, { - "epoch": 1.24, - "learning_rate": 0.0001138498872413741, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.0002043576536947128, + "loss": 0.0128, "step": 245980 }, { - "epoch": 1.24, - "learning_rate": 0.00011384231954836007, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020435376547834133, + "loss": 0.0153, "step": 245990 }, { - "epoch": 1.24, - "learning_rate": 0.00011383475185534607, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020434987726196985, + "loss": 0.0153, "step": 246000 }, { - "epoch": 1.24, - "eval_cer": 0.9144343512465224, - "eval_loss": 0.006622600369155407, - "eval_runtime": 115.7041, - "eval_samples_per_second": 17.285, - "eval_steps_per_second": 4.321, + "epoch": 0.64, + "eval_cer": 0.8817628707113375, + "eval_loss": 0.011506488546729088, + "eval_runtime": 107.342, + "eval_samples_per_second": 18.632, + "eval_steps_per_second": 4.658, "step": 246000 }, { - "epoch": 1.24, - "learning_rate": 0.00011382718416233205, - "loss": 0.0117, + "epoch": 0.64, + "learning_rate": 0.0002043459890455984, + "loss": 0.0135, "step": 246010 }, { - "epoch": 1.24, - "learning_rate": 0.00011381961646931805, - "loss": 0.011, + "epoch": 0.64, + "learning_rate": 0.00020434210082922693, + "loss": 0.0135, "step": 246020 }, { - "epoch": 1.24, - "learning_rate": 0.00011381204877630404, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020433821261285547, + "loss": 0.018, "step": 246030 }, { - "epoch": 1.24, - "learning_rate": 0.00011380448108329001, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020433432439648398, + "loss": 0.0146, "step": 246040 }, { - "epoch": 1.24, - "learning_rate": 0.000113796913390276, - "loss": 0.0117, + "epoch": 0.64, + "learning_rate": 0.00020433043618011253, + "loss": 0.0136, "step": 246050 }, { - "epoch": 1.24, - "learning_rate": 0.00011378934569726199, - "loss": 0.0121, + "epoch": 0.64, + "learning_rate": 0.0002043265479637411, + "loss": 0.0145, "step": 246060 }, { - "epoch": 1.24, - "learning_rate": 0.00011378177800424798, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002043226597473696, + "loss": 0.017, "step": 246070 }, { - "epoch": 1.24, - "learning_rate": 0.00011377421031123398, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.00020431877153099812, + "loss": 0.0216, "step": 246080 }, { - "epoch": 1.24, - "learning_rate": 0.00011376664261821996, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020431488331462667, + "loss": 0.0151, "step": 246090 }, { - "epoch": 1.24, - "learning_rate": 0.00011375907492520595, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020431099509825523, + "loss": 0.014, "step": 246100 }, { - "epoch": 1.24, - "learning_rate": 0.00011375150723219195, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020430710688188375, + "loss": 0.0177, "step": 246110 }, { - "epoch": 1.24, - "learning_rate": 0.00011374393953917793, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.0002043032186655123, + "loss": 0.0147, "step": 246120 }, { - "epoch": 1.24, - "learning_rate": 0.00011373637184616392, - "loss": 0.0108, + "epoch": 0.64, + "learning_rate": 0.0002042993304491408, + "loss": 0.0142, "step": 246130 }, { - "epoch": 1.24, - "learning_rate": 0.0001137288041531499, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020429544223276935, + "loss": 0.016, "step": 246140 }, { - "epoch": 1.24, - "learning_rate": 0.0001137212364601359, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.0002042915540163979, + "loss": 0.0143, "step": 246150 }, { - "epoch": 1.24, - "learning_rate": 0.0001137136687671219, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020428766580002643, + "loss": 0.0172, "step": 246160 }, { - "epoch": 1.24, - "learning_rate": 0.00011370610107410788, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020428377758365494, + "loss": 0.0115, "step": 246170 }, { - "epoch": 1.24, - "learning_rate": 0.00011369853338109387, - "loss": 0.0102, + "epoch": 0.64, + "learning_rate": 0.0002042798893672835, + "loss": 0.0169, "step": 246180 }, { - "epoch": 1.24, - "learning_rate": 0.00011369096568807987, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.00020427600115091203, + "loss": 0.0147, "step": 246190 }, { - "epoch": 1.24, - "learning_rate": 0.00011368339799506585, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020427211293454057, + "loss": 0.0184, "step": 246200 }, { - "epoch": 1.24, - "learning_rate": 0.00011367583030205184, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020426822471816908, + "loss": 0.0138, "step": 246210 }, { - "epoch": 1.24, - "learning_rate": 0.00011366826260903782, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020426433650179763, + "loss": 0.0151, "step": 246220 }, { - "epoch": 1.24, - "learning_rate": 0.00011366069491602382, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002042604482854262, + "loss": 0.0135, "step": 246230 }, { - "epoch": 1.24, - "learning_rate": 0.00011365312722300981, - "loss": 0.0105, + "epoch": 0.64, + "learning_rate": 0.0002042565600690547, + "loss": 0.0151, "step": 246240 }, { - "epoch": 1.24, - "learning_rate": 0.0001136455595299958, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020425267185268322, + "loss": 0.0198, "step": 246250 }, { - "epoch": 1.24, - "learning_rate": 0.00011363799183698179, - "loss": 0.0107, + "epoch": 0.64, + "learning_rate": 0.00020424878363631177, + "loss": 0.0169, "step": 246260 }, { - "epoch": 1.24, - "learning_rate": 0.00011363042414396779, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020424489541994033, + "loss": 0.0185, "step": 246270 }, { - "epoch": 1.24, - "learning_rate": 0.00011362285645095377, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.00020424100720356885, + "loss": 0.0188, "step": 246280 }, { - "epoch": 1.24, - "learning_rate": 0.00011361528875793976, - "loss": 0.012, + "epoch": 0.64, + "learning_rate": 0.0002042371189871974, + "loss": 0.0148, "step": 246290 }, { - "epoch": 1.24, - "learning_rate": 0.00011360772106492574, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.0002042332307708259, + "loss": 0.0135, "step": 246300 }, { - "epoch": 1.24, - "learning_rate": 0.00011360015337191174, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020422934255445447, + "loss": 0.0154, "step": 246310 }, { - "epoch": 1.24, - "learning_rate": 0.00011359258567889773, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.000204225454338083, + "loss": 0.0181, "step": 246320 }, { - "epoch": 1.24, - "learning_rate": 0.00011358501798588371, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020422156612171153, + "loss": 0.0155, "step": 246330 }, { - "epoch": 1.24, - "learning_rate": 0.00011357745029286971, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020421767790534004, + "loss": 0.0141, "step": 246340 }, { - "epoch": 1.24, - "learning_rate": 0.0001135698825998557, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.0002042137896889686, + "loss": 0.0144, "step": 246350 }, { - "epoch": 1.24, - "learning_rate": 0.00011356231490684169, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020420990147259713, + "loss": 0.0142, "step": 246360 }, { - "epoch": 1.24, - "learning_rate": 0.00011355474721382768, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020420601325622567, + "loss": 0.0156, "step": 246370 }, { - "epoch": 1.24, - "learning_rate": 0.00011354717952081366, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020420212503985418, + "loss": 0.0169, "step": 246380 }, { - "epoch": 1.24, - "learning_rate": 0.00011353961182779966, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020419823682348273, + "loss": 0.0131, "step": 246390 }, { - "epoch": 1.24, - "learning_rate": 0.00011353204413478565, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020419434860711127, + "loss": 0.0162, "step": 246400 }, { - "epoch": 1.24, - "learning_rate": 0.00011352447644177163, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.0002041904603907398, + "loss": 0.0138, "step": 246410 }, { - "epoch": 1.24, - "learning_rate": 0.00011351690874875763, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.00020418657217436832, + "loss": 0.0153, "step": 246420 }, { - "epoch": 1.24, - "learning_rate": 0.00011350934105574362, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020418268395799686, + "loss": 0.0131, "step": 246430 }, { - "epoch": 1.24, - "learning_rate": 0.0001135017733627296, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020417879574162543, + "loss": 0.0127, "step": 246440 }, { - "epoch": 1.24, - "learning_rate": 0.0001134942056697156, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020417490752525395, + "loss": 0.0167, "step": 246450 }, { - "epoch": 1.24, - "learning_rate": 0.00011348663797670158, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002041710193088825, + "loss": 0.015, "step": 246460 }, { - "epoch": 1.24, - "learning_rate": 0.00011347907028368758, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.000204167131092511, + "loss": 0.0145, "step": 246470 }, { - "epoch": 1.24, - "learning_rate": 0.00011347150259067357, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020416324287613957, + "loss": 0.0146, "step": 246480 }, { - "epoch": 1.24, - "learning_rate": 0.00011346393489765955, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002041593546597681, + "loss": 0.0136, "step": 246490 }, { - "epoch": 1.24, - "learning_rate": 0.00011345636720464555, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020415546644339663, + "loss": 0.0156, "step": 246500 }, { - "epoch": 1.24, - "learning_rate": 0.00011344879951163154, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020415157822702514, + "loss": 0.0162, "step": 246510 }, { - "epoch": 1.24, - "learning_rate": 0.00011344123181861753, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002041476900106537, + "loss": 0.0163, "step": 246520 }, { - "epoch": 1.24, - "learning_rate": 0.00011343366412560352, - "loss": 0.0107, + "epoch": 0.64, + "learning_rate": 0.00020414380179428223, + "loss": 0.0172, "step": 246530 }, { - "epoch": 1.24, - "learning_rate": 0.00011342609643258952, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020413991357791077, + "loss": 0.0157, "step": 246540 }, { - "epoch": 1.24, - "learning_rate": 0.0001134185287395755, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020413602536153928, + "loss": 0.013, "step": 246550 }, { - "epoch": 1.24, - "learning_rate": 0.00011341096104656149, - "loss": 0.0064, + "epoch": 0.64, + "learning_rate": 0.00020413213714516785, + "loss": 0.0184, "step": 246560 }, { - "epoch": 1.24, - "learning_rate": 0.00011340339335354747, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020412824892879637, + "loss": 0.0153, "step": 246570 }, { - "epoch": 1.24, - "learning_rate": 0.00011339582566053347, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.0002041243607124249, + "loss": 0.0177, "step": 246580 }, { - "epoch": 1.24, - "learning_rate": 0.00011338825796751946, - "loss": 0.0114, + "epoch": 0.64, + "learning_rate": 0.00020412047249605342, + "loss": 0.0156, "step": 246590 }, { - "epoch": 1.24, - "learning_rate": 0.00011338069027450544, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.000204116584279682, + "loss": 0.0156, "step": 246600 }, { - "epoch": 1.24, - "learning_rate": 0.00011337312258149144, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020411269606331053, + "loss": 0.0165, "step": 246610 }, { - "epoch": 1.24, - "learning_rate": 0.00011336555488847743, - "loss": 0.0109, + "epoch": 0.64, + "learning_rate": 0.00020410880784693905, + "loss": 0.0165, "step": 246620 }, { - "epoch": 1.24, - "learning_rate": 0.00011335798719546342, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.0002041049196305676, + "loss": 0.0146, "step": 246630 }, { - "epoch": 1.24, - "learning_rate": 0.00011335041950244941, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.0002041010314141961, + "loss": 0.0157, "step": 246640 }, { - "epoch": 1.24, - "learning_rate": 0.00011334285180943539, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020409714319782467, + "loss": 0.0212, "step": 246650 }, { - "epoch": 1.24, - "learning_rate": 0.00011333528411642139, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.0002040932549814532, + "loss": 0.0142, "step": 246660 }, { - "epoch": 1.24, - "learning_rate": 0.00011332771642340736, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020408936676508173, + "loss": 0.0138, "step": 246670 }, { - "epoch": 1.24, - "learning_rate": 0.00011332014873039335, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020408547854871024, + "loss": 0.0155, "step": 246680 }, { - "epoch": 1.24, - "learning_rate": 0.00011331258103737935, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002040815903323388, + "loss": 0.0147, "step": 246690 }, { - "epoch": 1.24, - "learning_rate": 0.00011330501334436533, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020407770211596733, + "loss": 0.0129, "step": 246700 }, { - "epoch": 1.24, - "learning_rate": 0.00011329744565135132, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020407381389959587, + "loss": 0.0202, "step": 246710 }, { - "epoch": 1.24, - "learning_rate": 0.00011328987795833732, - "loss": 0.0111, + "epoch": 0.64, + "learning_rate": 0.00020406992568322438, + "loss": 0.0138, "step": 246720 }, { - "epoch": 1.24, - "learning_rate": 0.0001132823102653233, - "loss": 0.0111, + "epoch": 0.64, + "learning_rate": 0.00020406603746685295, + "loss": 0.0155, "step": 246730 }, { - "epoch": 1.24, - "learning_rate": 0.00011327474257230929, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020406214925048147, + "loss": 0.0143, "step": 246740 }, { - "epoch": 1.24, - "learning_rate": 0.00011326717487929527, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020405826103411, + "loss": 0.0133, "step": 246750 }, { - "epoch": 1.24, - "learning_rate": 0.00011325960718628127, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020405437281773852, + "loss": 0.0155, "step": 246760 }, { - "epoch": 1.24, - "learning_rate": 0.00011325203949326726, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.0002040504846013671, + "loss": 0.0132, "step": 246770 }, { - "epoch": 1.25, - "learning_rate": 0.00011324447180025325, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020404659638499563, + "loss": 0.0177, "step": 246780 }, { - "epoch": 1.25, - "learning_rate": 0.00011323690410723924, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020404270816862415, + "loss": 0.0146, "step": 246790 }, { - "epoch": 1.25, - "learning_rate": 0.00011322933641422524, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020403881995225266, + "loss": 0.0144, "step": 246800 }, { - "epoch": 1.25, - "learning_rate": 0.00011322176872121122, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.00020403493173588123, + "loss": 0.0141, "step": 246810 }, { - "epoch": 1.25, - "learning_rate": 0.00011321420102819721, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020403104351950977, + "loss": 0.0197, "step": 246820 }, { - "epoch": 1.25, - "learning_rate": 0.0001132066333351832, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.00020402715530313829, + "loss": 0.0156, "step": 246830 }, { - "epoch": 1.25, - "learning_rate": 0.00011319906564216919, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020402326708676683, + "loss": 0.0179, "step": 246840 }, { - "epoch": 1.25, - "learning_rate": 0.00011319149794915518, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020401937887039537, + "loss": 0.0171, "step": 246850 }, { - "epoch": 1.25, - "learning_rate": 0.00011318393025614117, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.0002040154906540239, + "loss": 0.0153, "step": 246860 }, { - "epoch": 1.25, - "learning_rate": 0.00011317636256312716, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020401160243765243, + "loss": 0.014, "step": 246870 }, { - "epoch": 1.25, - "learning_rate": 0.00011316879487011316, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020400771422128097, + "loss": 0.0168, "step": 246880 }, { - "epoch": 1.25, - "learning_rate": 0.00011316122717709914, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020400382600490948, + "loss": 0.0132, "step": 246890 }, { - "epoch": 1.25, - "learning_rate": 0.00011315365948408513, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020399993778853805, + "loss": 0.0167, "step": 246900 }, { - "epoch": 1.25, - "learning_rate": 0.00011314609179107111, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020399604957216657, + "loss": 0.0185, "step": 246910 }, { - "epoch": 1.25, - "learning_rate": 0.00011313852409805711, - "loss": 0.0114, + "epoch": 0.64, + "learning_rate": 0.0002039921613557951, + "loss": 0.0171, "step": 246920 }, { - "epoch": 1.25, - "learning_rate": 0.0001131309564050431, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020398827313942362, + "loss": 0.0124, "step": 246930 }, { - "epoch": 1.25, - "learning_rate": 0.00011312338871202908, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.0002039843849230522, + "loss": 0.0142, "step": 246940 }, { - "epoch": 1.25, - "learning_rate": 0.00011311582101901508, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020398049670668073, + "loss": 0.0141, "step": 246950 }, { - "epoch": 1.25, - "learning_rate": 0.00011310825332600107, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020397660849030925, + "loss": 0.0164, "step": 246960 }, { - "epoch": 1.25, - "learning_rate": 0.00011310068563298706, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020397272027393776, + "loss": 0.016, "step": 246970 }, { - "epoch": 1.25, - "learning_rate": 0.00011309311793997305, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020396883205756633, + "loss": 0.0165, "step": 246980 }, { - "epoch": 1.25, - "learning_rate": 0.00011308555024695905, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020396494384119487, + "loss": 0.0137, "step": 246990 }, { - "epoch": 1.25, - "learning_rate": 0.00011307798255394503, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020396105562482339, + "loss": 0.0184, "step": 247000 }, { - "epoch": 1.25, - "eval_cer": 0.914457640753532, - "eval_loss": 0.0065944562666118145, - "eval_runtime": 115.9058, - "eval_samples_per_second": 17.255, - "eval_steps_per_second": 4.314, + "epoch": 0.64, + "eval_cer": 0.8817614710744033, + "eval_loss": 0.01131850853562355, + "eval_runtime": 107.4227, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.655, "step": 247000 }, { - "epoch": 1.25, - "learning_rate": 0.00011307041486093102, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020395716740845193, + "loss": 0.0158, "step": 247010 }, { - "epoch": 1.25, - "learning_rate": 0.000113062847167917, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020395327919208047, + "loss": 0.0169, "step": 247020 }, { - "epoch": 1.25, - "learning_rate": 0.000113055279474903, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.000203949390975709, + "loss": 0.0142, "step": 247030 }, { - "epoch": 1.25, - "learning_rate": 0.000113047711781889, - "loss": 0.0117, + "epoch": 0.64, + "learning_rate": 0.00020394550275933753, + "loss": 0.0142, "step": 247040 }, { - "epoch": 1.25, - "learning_rate": 0.00011304014408887498, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020394161454296607, + "loss": 0.0199, "step": 247050 }, { - "epoch": 1.25, - "learning_rate": 0.00011303257639586097, - "loss": 0.0063, + "epoch": 0.64, + "learning_rate": 0.0002039377263265946, + "loss": 0.02, "step": 247060 }, { - "epoch": 1.25, - "learning_rate": 0.00011302500870284697, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020393383811022315, + "loss": 0.0165, "step": 247070 }, { - "epoch": 1.25, - "learning_rate": 0.00011301744100983295, - "loss": 0.0065, + "epoch": 0.64, + "learning_rate": 0.00020392994989385166, + "loss": 0.0178, "step": 247080 }, { - "epoch": 1.25, - "learning_rate": 0.00011300987331681894, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.0002039260616774802, + "loss": 0.0123, "step": 247090 }, { - "epoch": 1.25, - "learning_rate": 0.00011300230562380492, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.00020392217346110878, + "loss": 0.016, "step": 247100 }, { - "epoch": 1.25, - "learning_rate": 0.00011299473793079092, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.0002039182852447373, + "loss": 0.0165, "step": 247110 }, { - "epoch": 1.25, - "learning_rate": 0.00011298717023777691, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.0002039143970283658, + "loss": 0.0141, "step": 247120 }, { - "epoch": 1.25, - "learning_rate": 0.0001129796025447629, - "loss": 0.0125, + "epoch": 0.64, + "learning_rate": 0.00020391050881199435, + "loss": 0.0162, "step": 247130 }, { - "epoch": 1.25, - "learning_rate": 0.00011297203485174889, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020390662059562286, + "loss": 0.0126, "step": 247140 }, { - "epoch": 1.25, - "learning_rate": 0.00011296446715873488, - "loss": 0.013, + "epoch": 0.64, + "learning_rate": 0.00020390273237925143, + "loss": 0.0151, "step": 247150 }, { - "epoch": 1.25, - "learning_rate": 0.00011295689946572087, - "loss": 0.0101, + "epoch": 0.64, + "learning_rate": 0.00020389884416287997, + "loss": 0.0125, "step": 247160 }, { - "epoch": 1.25, - "learning_rate": 0.00011294933177270686, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020389495594650849, + "loss": 0.0157, "step": 247170 }, { - "epoch": 1.25, - "learning_rate": 0.00011294176407969284, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020389106773013703, + "loss": 0.0188, "step": 247180 }, { - "epoch": 1.25, - "learning_rate": 0.00011293419638667884, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.00020388717951376557, + "loss": 0.0155, "step": 247190 }, { - "epoch": 1.25, - "learning_rate": 0.00011292662869366483, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.0002038832912973941, + "loss": 0.0135, "step": 247200 }, { - "epoch": 1.25, - "learning_rate": 0.00011291906100065081, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020387940308102262, + "loss": 0.0131, "step": 247210 }, { - "epoch": 1.25, - "learning_rate": 0.00011291149330763681, - "loss": 0.0114, + "epoch": 0.64, + "learning_rate": 0.00020387551486465117, + "loss": 0.013, "step": 247220 }, { - "epoch": 1.25, - "learning_rate": 0.0001129039256146228, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.0002038716266482797, + "loss": 0.0181, "step": 247230 }, { - "epoch": 1.25, - "learning_rate": 0.00011289635792160879, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020386773843190825, + "loss": 0.0176, "step": 247240 }, { - "epoch": 1.25, - "learning_rate": 0.00011288879022859478, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020386385021553676, + "loss": 0.0132, "step": 247250 }, { - "epoch": 1.25, - "learning_rate": 0.00011288122253558076, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.0002038599619991653, + "loss": 0.0237, "step": 247260 }, { - "epoch": 1.25, - "learning_rate": 0.00011287365484256676, - "loss": 0.0067, + "epoch": 0.64, + "learning_rate": 0.00020385607378279385, + "loss": 0.0177, "step": 247270 }, { - "epoch": 1.25, - "learning_rate": 0.00011286608714955275, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002038521855664224, + "loss": 0.0139, "step": 247280 }, { - "epoch": 1.25, - "learning_rate": 0.00011285851945653873, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.0002038482973500509, + "loss": 0.0179, "step": 247290 }, { - "epoch": 1.25, - "learning_rate": 0.00011285095176352471, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020384440913367945, + "loss": 0.0158, "step": 247300 }, { - "epoch": 1.25, - "learning_rate": 0.0001128433840705107, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020384052091730801, + "loss": 0.0178, "step": 247310 }, { - "epoch": 1.25, - "learning_rate": 0.00011283581637749669, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.00020383663270093653, + "loss": 0.0196, "step": 247320 }, { - "epoch": 1.25, - "learning_rate": 0.00011282824868448269, - "loss": 0.0112, + "epoch": 0.64, + "learning_rate": 0.00020383274448456507, + "loss": 0.0115, "step": 247330 }, { - "epoch": 1.25, - "learning_rate": 0.00011282068099146867, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020382885626819358, + "loss": 0.0156, "step": 247340 }, { - "epoch": 1.25, - "learning_rate": 0.00011281311329845466, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020382496805182215, + "loss": 0.0142, "step": 247350 }, { - "epoch": 1.25, - "learning_rate": 0.00011280554560544064, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020382107983545067, + "loss": 0.0144, "step": 247360 }, { - "epoch": 1.25, - "learning_rate": 0.00011279797791242664, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.0002038171916190792, + "loss": 0.0184, "step": 247370 }, { - "epoch": 1.25, - "learning_rate": 0.00011279041021941263, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.00020381330340270772, + "loss": 0.0143, "step": 247380 }, { - "epoch": 1.25, - "learning_rate": 0.00011278284252639862, - "loss": 0.0105, + "epoch": 0.64, + "learning_rate": 0.00020380941518633627, + "loss": 0.0211, "step": 247390 }, { - "epoch": 1.25, - "learning_rate": 0.00011277527483338461, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002038055269699648, + "loss": 0.0194, "step": 247400 }, { - "epoch": 1.25, - "learning_rate": 0.0001127677071403706, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020380163875359335, + "loss": 0.013, "step": 247410 }, { - "epoch": 1.25, - "learning_rate": 0.00011276013944735659, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020379775053722186, + "loss": 0.0122, "step": 247420 }, { - "epoch": 1.25, - "learning_rate": 0.00011275257175434258, - "loss": 0.0072, + "epoch": 0.64, + "learning_rate": 0.0002037938623208504, + "loss": 0.0178, "step": 247430 }, { - "epoch": 1.25, - "learning_rate": 0.00011274500406132858, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.00020378997410447895, + "loss": 0.0121, "step": 247440 }, { - "epoch": 1.25, - "learning_rate": 0.00011273743636831456, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.0002037860858881075, + "loss": 0.0165, "step": 247450 }, { - "epoch": 1.25, - "learning_rate": 0.00011272986867530055, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.000203782197671736, + "loss": 0.0141, "step": 247460 }, { - "epoch": 1.25, - "learning_rate": 0.00011272230098228653, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.00020377830945536454, + "loss": 0.0133, "step": 247470 }, { - "epoch": 1.25, - "learning_rate": 0.00011271473328927253, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002037744212389931, + "loss": 0.0151, "step": 247480 }, { - "epoch": 1.25, - "learning_rate": 0.00011270716559625852, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.00020377053302262163, + "loss": 0.0154, "step": 247490 }, { - "epoch": 1.25, - "learning_rate": 0.0001126995979032445, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020376664480625017, + "loss": 0.0229, "step": 247500 }, { - "epoch": 1.25, - "learning_rate": 0.0001126920302102305, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020376275658987868, + "loss": 0.0154, "step": 247510 }, { - "epoch": 1.25, - "learning_rate": 0.0001126844625172165, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020375886837350725, + "loss": 0.0148, "step": 247520 }, { - "epoch": 1.25, - "learning_rate": 0.00011267689482420248, - "loss": 0.013, + "epoch": 0.64, + "learning_rate": 0.00020375498015713577, + "loss": 0.0144, "step": 247530 }, { - "epoch": 1.25, - "learning_rate": 0.00011266932713118847, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.0002037510919407643, + "loss": 0.0148, "step": 247540 }, { - "epoch": 1.25, - "learning_rate": 0.00011266175943817445, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020374720372439282, + "loss": 0.0106, "step": 247550 }, { - "epoch": 1.25, - "learning_rate": 0.00011265419174516045, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.0002037433155080214, + "loss": 0.0144, "step": 247560 }, { - "epoch": 1.25, - "learning_rate": 0.00011264662405214644, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.0002037394272916499, + "loss": 0.0206, "step": 247570 }, { - "epoch": 1.25, - "learning_rate": 0.00011263905635913243, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020373553907527845, + "loss": 0.014, "step": 247580 }, { - "epoch": 1.25, - "learning_rate": 0.00011263148866611842, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020373165085890696, + "loss": 0.0136, "step": 247590 }, { - "epoch": 1.25, - "learning_rate": 0.00011262392097310442, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.00020372776264253553, + "loss": 0.0192, "step": 247600 }, { - "epoch": 1.25, - "learning_rate": 0.0001126163532800904, - "loss": 0.0109, + "epoch": 0.64, + "learning_rate": 0.00020372387442616405, + "loss": 0.0211, "step": 247610 }, { - "epoch": 1.25, - "learning_rate": 0.00011260878558707639, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002037199862097926, + "loss": 0.0148, "step": 247620 }, { - "epoch": 1.25, - "learning_rate": 0.00011260121789406237, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002037160979934211, + "loss": 0.0176, "step": 247630 }, { - "epoch": 1.25, - "learning_rate": 0.00011259365020104837, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020371220977704964, + "loss": 0.0166, "step": 247640 }, { - "epoch": 1.25, - "learning_rate": 0.00011258608250803436, - "loss": 0.0097, + "epoch": 0.64, + "learning_rate": 0.0002037083215606782, + "loss": 0.0136, "step": 247650 }, { - "epoch": 1.25, - "learning_rate": 0.00011257851481502034, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.00020370443334430673, + "loss": 0.0188, "step": 247660 }, { - "epoch": 1.25, - "learning_rate": 0.00011257094712200634, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020370054512793524, + "loss": 0.015, "step": 247670 }, { - "epoch": 1.25, - "learning_rate": 0.00011256337942899233, - "loss": 0.0112, + "epoch": 0.64, + "learning_rate": 0.00020369665691156378, + "loss": 0.0145, "step": 247680 }, { - "epoch": 1.25, - "learning_rate": 0.00011255581173597832, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020369276869519235, + "loss": 0.0129, "step": 247690 }, { - "epoch": 1.25, - "learning_rate": 0.00011254824404296431, - "loss": 0.0065, + "epoch": 0.64, + "learning_rate": 0.00020368888047882087, + "loss": 0.0157, "step": 247700 }, { - "epoch": 1.25, - "learning_rate": 0.00011254067634995029, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002036849922624494, + "loss": 0.0194, "step": 247710 }, { - "epoch": 1.25, - "learning_rate": 0.00011253310865693629, - "loss": 0.0067, + "epoch": 0.64, + "learning_rate": 0.00020368110404607792, + "loss": 0.0171, "step": 247720 }, { - "epoch": 1.25, - "learning_rate": 0.00011252554096392228, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.0002036772158297065, + "loss": 0.0133, "step": 247730 }, { - "epoch": 1.25, - "learning_rate": 0.00011251797327090826, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.000203673327613335, + "loss": 0.0194, "step": 247740 }, { - "epoch": 1.25, - "learning_rate": 0.00011251040557789426, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020366943939696355, + "loss": 0.0175, "step": 247750 }, { - "epoch": 1.25, - "learning_rate": 0.00011250283788488025, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020366555118059206, + "loss": 0.0208, "step": 247760 }, { - "epoch": 1.25, - "learning_rate": 0.00011249527019186624, - "loss": 0.008, + "epoch": 0.64, + "learning_rate": 0.00020366166296422063, + "loss": 0.0169, "step": 247770 }, { - "epoch": 1.25, - "learning_rate": 0.00011248770249885223, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.00020365777474784915, + "loss": 0.0147, "step": 247780 }, { - "epoch": 1.25, - "learning_rate": 0.00011248013480583821, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.0002036538865314777, + "loss": 0.0194, "step": 247790 }, { - "epoch": 1.25, - "learning_rate": 0.0001124725671128242, - "loss": 0.0076, + "epoch": 0.64, + "learning_rate": 0.0002036499983151062, + "loss": 0.0217, "step": 247800 }, { - "epoch": 1.25, - "learning_rate": 0.0001124649994198102, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020364611009873477, + "loss": 0.0149, "step": 247810 }, { - "epoch": 1.25, - "learning_rate": 0.00011245743172679618, - "loss": 0.0098, + "epoch": 0.64, + "learning_rate": 0.0002036422218823633, + "loss": 0.0134, "step": 247820 }, { - "epoch": 1.25, - "learning_rate": 0.00011244986403378218, - "loss": 0.0107, + "epoch": 0.64, + "learning_rate": 0.00020363833366599183, + "loss": 0.0152, "step": 247830 }, { - "epoch": 1.25, - "learning_rate": 0.00011244229634076817, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020363444544962034, + "loss": 0.0139, "step": 247840 }, { - "epoch": 1.25, - "learning_rate": 0.00011243472864775415, - "loss": 0.0113, + "epoch": 0.64, + "learning_rate": 0.0002036305572332489, + "loss": 0.0204, "step": 247850 }, { - "epoch": 1.25, - "learning_rate": 0.00011242716095474015, - "loss": 0.0066, + "epoch": 0.64, + "learning_rate": 0.00020362666901687745, + "loss": 0.0137, "step": 247860 }, { - "epoch": 1.25, - "learning_rate": 0.00011241959326172613, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020362278080050597, + "loss": 0.0187, "step": 247870 }, { - "epoch": 1.25, - "learning_rate": 0.00011241202556871213, - "loss": 0.0104, + "epoch": 0.64, + "learning_rate": 0.0002036188925841345, + "loss": 0.0137, "step": 247880 }, { - "epoch": 1.25, - "learning_rate": 0.00011240445787569812, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020361500436776302, + "loss": 0.0145, "step": 247890 }, { - "epoch": 1.25, - "learning_rate": 0.0001123968901826841, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.0002036111161513916, + "loss": 0.015, "step": 247900 }, { - "epoch": 1.25, - "learning_rate": 0.0001123893224896701, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002036072279350201, + "loss": 0.0172, "step": 247910 }, { - "epoch": 1.25, - "learning_rate": 0.00011238175479665609, - "loss": 0.0091, + "epoch": 0.64, + "learning_rate": 0.00020360333971864865, + "loss": 0.0162, "step": 247920 }, { - "epoch": 1.25, - "learning_rate": 0.00011237418710364206, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020359945150227716, + "loss": 0.0152, "step": 247930 }, { - "epoch": 1.25, - "learning_rate": 0.00011236661941062806, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020359556328590573, + "loss": 0.0166, "step": 247940 }, { - "epoch": 1.25, - "learning_rate": 0.00011235905171761404, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020359167506953425, + "loss": 0.0151, "step": 247950 }, { - "epoch": 1.25, - "learning_rate": 0.00011235148402460003, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.0002035877868531628, + "loss": 0.0137, "step": 247960 }, { - "epoch": 1.25, - "learning_rate": 0.00011234391633158603, - "loss": 0.0093, + "epoch": 0.64, + "learning_rate": 0.0002035838986367913, + "loss": 0.0139, "step": 247970 }, { - "epoch": 1.25, - "learning_rate": 0.00011233634863857201, - "loss": 0.0112, + "epoch": 0.64, + "learning_rate": 0.00020358001042041987, + "loss": 0.0153, "step": 247980 }, { - "epoch": 1.25, - "learning_rate": 0.000112328780945558, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.00020357612220404838, + "loss": 0.0156, "step": 247990 }, { - "epoch": 1.25, - "learning_rate": 0.00011232121325254398, - "loss": 0.0083, + "epoch": 0.64, + "learning_rate": 0.00020357223398767693, + "loss": 0.0167, "step": 248000 }, { - "epoch": 1.25, - "eval_cer": 0.914462492734159, - "eval_loss": 0.006537660490721464, - "eval_runtime": 115.8787, - "eval_samples_per_second": 17.259, - "eval_steps_per_second": 4.315, + "epoch": 0.64, + "eval_cer": 0.8818244547364413, + "eval_loss": 0.010956432670354843, + "eval_runtime": 107.4182, + "eval_samples_per_second": 18.619, + "eval_steps_per_second": 4.655, "step": 248000 }, { - "epoch": 1.25, - "learning_rate": 0.00011231364555952998, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020356834577130544, + "loss": 0.0128, "step": 248010 }, { - "epoch": 1.25, - "learning_rate": 0.00011230607786651597, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.000203564457554934, + "loss": 0.018, "step": 248020 }, { - "epoch": 1.25, - "learning_rate": 0.00011229851017350196, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020356056933856255, + "loss": 0.016, "step": 248030 }, { - "epoch": 1.25, - "learning_rate": 0.00011229094248048795, - "loss": 0.0116, + "epoch": 0.64, + "learning_rate": 0.00020355668112219107, + "loss": 0.0149, "step": 248040 }, { - "epoch": 1.25, - "learning_rate": 0.00011228337478747395, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.0002035527929058196, + "loss": 0.0159, "step": 248050 }, { - "epoch": 1.25, - "learning_rate": 0.00011227580709445993, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.00020354890468944815, + "loss": 0.016, "step": 248060 }, { - "epoch": 1.25, - "learning_rate": 0.00011226823940144592, - "loss": 0.0092, + "epoch": 0.64, + "learning_rate": 0.0002035450164730767, + "loss": 0.0149, "step": 248070 }, { - "epoch": 1.25, - "learning_rate": 0.0001122606717084319, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.0002035411282567052, + "loss": 0.0139, "step": 248080 }, { - "epoch": 1.25, - "learning_rate": 0.0001122531040154179, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020353724004033375, + "loss": 0.016, "step": 248090 }, { - "epoch": 1.25, - "learning_rate": 0.0001122455363224039, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002035333518239623, + "loss": 0.016, "step": 248100 }, { - "epoch": 1.25, - "learning_rate": 0.00011223796862938988, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020352946360759083, + "loss": 0.0153, "step": 248110 }, { - "epoch": 1.25, - "learning_rate": 0.00011223040093637587, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020352557539121934, + "loss": 0.0231, "step": 248120 }, { - "epoch": 1.25, - "learning_rate": 0.00011222283324336187, - "loss": 0.0067, + "epoch": 0.64, + "learning_rate": 0.00020352168717484789, + "loss": 0.0148, "step": 248130 }, { - "epoch": 1.25, - "learning_rate": 0.00011221526555034785, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002035177989584764, + "loss": 0.0139, "step": 248140 }, { - "epoch": 1.25, - "learning_rate": 0.00011220769785733384, - "loss": 0.0053, + "epoch": 0.64, + "learning_rate": 0.00020351391074210497, + "loss": 0.0151, "step": 248150 }, { - "epoch": 1.25, - "learning_rate": 0.00011220013016431982, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020351002252573348, + "loss": 0.0125, "step": 248160 }, { - "epoch": 1.25, - "learning_rate": 0.00011219256247130582, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020350613430936203, + "loss": 0.0156, "step": 248170 }, { - "epoch": 1.25, - "learning_rate": 0.00011218499477829181, - "loss": 0.0102, + "epoch": 0.64, + "learning_rate": 0.00020350224609299054, + "loss": 0.0159, "step": 248180 }, { - "epoch": 1.25, - "learning_rate": 0.0001121774270852778, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.0002034983578766191, + "loss": 0.018, "step": 248190 }, { - "epoch": 1.25, - "learning_rate": 0.00011216985939226379, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020349446966024765, + "loss": 0.0171, "step": 248200 }, { - "epoch": 1.25, - "learning_rate": 0.00011216229169924978, - "loss": 0.0106, + "epoch": 0.64, + "learning_rate": 0.00020349058144387617, + "loss": 0.0154, "step": 248210 }, { - "epoch": 1.25, - "learning_rate": 0.00011215472400623577, - "loss": 0.0094, + "epoch": 0.64, + "learning_rate": 0.0002034866932275047, + "loss": 0.0157, "step": 248220 }, { - "epoch": 1.25, - "learning_rate": 0.00011214715631322176, - "loss": 0.0096, + "epoch": 0.64, + "learning_rate": 0.00020348280501113325, + "loss": 0.0163, "step": 248230 }, { - "epoch": 1.25, - "learning_rate": 0.00011213958862020774, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.0002034789167947618, + "loss": 0.0162, "step": 248240 }, { - "epoch": 1.25, - "learning_rate": 0.00011213202092719374, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.0002034750285783903, + "loss": 0.0154, "step": 248250 }, { - "epoch": 1.25, - "learning_rate": 0.00011212445323417973, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020347114036201885, + "loss": 0.0207, "step": 248260 }, { - "epoch": 1.25, - "learning_rate": 0.00011211688554116571, - "loss": 0.0069, + "epoch": 0.64, + "learning_rate": 0.0002034672521456474, + "loss": 0.0157, "step": 248270 }, { - "epoch": 1.25, - "learning_rate": 0.00011210931784815171, - "loss": 0.0086, + "epoch": 0.64, + "learning_rate": 0.00020346336392927593, + "loss": 0.0145, "step": 248280 }, { - "epoch": 1.25, - "learning_rate": 0.0001121017501551377, - "loss": 0.0112, + "epoch": 0.64, + "learning_rate": 0.00020345947571290444, + "loss": 0.0125, "step": 248290 }, { - "epoch": 1.25, - "learning_rate": 0.00011209418246212369, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020345558749653299, + "loss": 0.0134, "step": 248300 }, { - "epoch": 1.25, - "learning_rate": 0.00011208661476910968, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020345169928016153, + "loss": 0.018, "step": 248310 }, { - "epoch": 1.25, - "learning_rate": 0.00011207904707609566, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.00020344781106379007, + "loss": 0.0136, "step": 248320 }, { - "epoch": 1.25, - "learning_rate": 0.00011207147938308166, - "loss": 0.0095, + "epoch": 0.64, + "learning_rate": 0.00020344392284741858, + "loss": 0.0167, "step": 248330 }, { - "epoch": 1.25, - "learning_rate": 0.00011206391169006765, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020344003463104712, + "loss": 0.0136, "step": 248340 }, { - "epoch": 1.25, - "learning_rate": 0.00011205634399705363, - "loss": 0.0157, + "epoch": 0.64, + "learning_rate": 0.0002034361464146757, + "loss": 0.0199, "step": 248350 }, { - "epoch": 1.25, - "learning_rate": 0.00011204877630403963, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.0002034322581983042, + "loss": 0.0166, "step": 248360 }, { - "epoch": 1.25, - "learning_rate": 0.00011204120861102562, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.00020342836998193275, + "loss": 0.0154, "step": 248370 }, { - "epoch": 1.25, - "learning_rate": 0.0001120336409180116, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020342448176556126, + "loss": 0.0154, "step": 248380 }, { - "epoch": 1.25, - "learning_rate": 0.0001120260732249976, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020342059354918978, + "loss": 0.0139, "step": 248390 }, { - "epoch": 1.25, - "learning_rate": 0.00011201850553198358, - "loss": 0.0128, + "epoch": 0.64, + "learning_rate": 0.00020341670533281835, + "loss": 0.0142, "step": 248400 }, { - "epoch": 1.25, - "learning_rate": 0.00011201093783896958, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.0002034128171164469, + "loss": 0.0135, "step": 248410 }, { - "epoch": 1.25, - "learning_rate": 0.00011200337014595557, - "loss": 0.0084, + "epoch": 0.64, + "learning_rate": 0.0002034089289000754, + "loss": 0.0147, "step": 248420 }, { - "epoch": 1.25, - "learning_rate": 0.00011199580245294155, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020340504068370395, + "loss": 0.0143, "step": 248430 }, { - "epoch": 1.25, - "learning_rate": 0.00011198823475992755, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.0002034011524673325, + "loss": 0.0157, "step": 248440 }, { - "epoch": 1.25, - "learning_rate": 0.00011198066706691354, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020339726425096103, + "loss": 0.0125, "step": 248450 }, { - "epoch": 1.25, - "learning_rate": 0.00011197309937389952, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020339337603458954, + "loss": 0.0149, "step": 248460 }, { - "epoch": 1.25, - "learning_rate": 0.00011196553168088552, - "loss": 0.01, + "epoch": 0.64, + "learning_rate": 0.00020338948781821808, + "loss": 0.0154, "step": 248470 }, { - "epoch": 1.25, - "learning_rate": 0.00011195796398787151, - "loss": 0.007, + "epoch": 0.64, + "learning_rate": 0.00020338559960184663, + "loss": 0.015, "step": 248480 }, { - "epoch": 1.25, - "learning_rate": 0.0001119503962948575, - "loss": 0.009, + "epoch": 0.64, + "learning_rate": 0.00020338171138547517, + "loss": 0.016, "step": 248490 }, { - "epoch": 1.25, - "learning_rate": 0.00011194282860184349, - "loss": 0.0088, + "epoch": 0.64, + "learning_rate": 0.00020337782316910368, + "loss": 0.0148, "step": 248500 }, { - "epoch": 1.25, - "learning_rate": 0.00011193526090882947, - "loss": 0.0075, + "epoch": 0.64, + "learning_rate": 0.00020337393495273222, + "loss": 0.0199, "step": 248510 }, { - "epoch": 1.25, - "learning_rate": 0.00011192769321581547, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.0002033700467363608, + "loss": 0.0181, "step": 248520 }, { - "epoch": 1.25, - "learning_rate": 0.00011192012552280146, - "loss": 0.0073, + "epoch": 0.64, + "learning_rate": 0.0002033661585199893, + "loss": 0.0116, "step": 248530 }, { - "epoch": 1.25, - "learning_rate": 0.00011191255782978744, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020336227030361785, + "loss": 0.0127, "step": 248540 }, { - "epoch": 1.25, - "learning_rate": 0.00011190499013677342, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020335838208724636, + "loss": 0.0151, "step": 248550 }, { - "epoch": 1.25, - "learning_rate": 0.0001118974224437594, - "loss": 0.0087, + "epoch": 0.64, + "learning_rate": 0.00020335449387087493, + "loss": 0.015, "step": 248560 }, { - "epoch": 1.25, - "learning_rate": 0.0001118898547507454, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020335060565450345, + "loss": 0.0146, "step": 248570 }, { - "epoch": 1.25, - "learning_rate": 0.0001118822870577314, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.000203346717438132, + "loss": 0.0136, "step": 248580 }, { - "epoch": 1.25, - "learning_rate": 0.00011187471936471738, - "loss": 0.0055, + "epoch": 0.64, + "learning_rate": 0.0002033428292217605, + "loss": 0.0141, "step": 248590 }, { - "epoch": 1.25, - "learning_rate": 0.00011186715167170337, - "loss": 0.0078, + "epoch": 0.64, + "learning_rate": 0.00020333894100538907, + "loss": 0.015, "step": 248600 }, { - "epoch": 1.25, - "learning_rate": 0.00011185958397868935, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.0002033350527890176, + "loss": 0.0144, "step": 248610 }, { - "epoch": 1.25, - "learning_rate": 0.00011185201628567535, - "loss": 0.0065, + "epoch": 0.64, + "learning_rate": 0.00020333116457264613, + "loss": 0.0201, "step": 248620 }, { - "epoch": 1.25, - "learning_rate": 0.00011184444859266134, - "loss": 0.0103, + "epoch": 0.64, + "learning_rate": 0.00020332727635627464, + "loss": 0.0208, "step": 248630 }, { - "epoch": 1.25, - "learning_rate": 0.00011183688089964733, - "loss": 0.0068, + "epoch": 0.64, + "learning_rate": 0.00020332338813990318, + "loss": 0.0178, "step": 248640 }, { - "epoch": 1.25, - "learning_rate": 0.00011182931320663332, - "loss": 0.0089, + "epoch": 0.64, + "learning_rate": 0.00020331949992353173, + "loss": 0.0132, "step": 248650 }, { - "epoch": 1.25, - "learning_rate": 0.00011182174551361932, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.00020331561170716027, + "loss": 0.0157, "step": 248660 }, { - "epoch": 1.25, - "learning_rate": 0.0001118141778206053, - "loss": 0.0066, + "epoch": 0.64, + "learning_rate": 0.00020331172349078878, + "loss": 0.0155, "step": 248670 }, { - "epoch": 1.25, - "learning_rate": 0.00011180661012759129, - "loss": 0.0079, + "epoch": 0.64, + "learning_rate": 0.00020330783527441732, + "loss": 0.0153, "step": 248680 }, { - "epoch": 1.25, - "learning_rate": 0.00011179904243457727, - "loss": 0.0108, + "epoch": 0.64, + "learning_rate": 0.0002033039470580459, + "loss": 0.0165, "step": 248690 }, { - "epoch": 1.25, - "learning_rate": 0.00011179147474156327, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.0002033000588416744, + "loss": 0.0122, "step": 248700 }, { - "epoch": 1.25, - "learning_rate": 0.00011178390704854926, - "loss": 0.0099, + "epoch": 0.64, + "learning_rate": 0.00020329617062530292, + "loss": 0.0133, "step": 248710 }, { - "epoch": 1.25, - "learning_rate": 0.00011177633935553524, - "loss": 0.0077, + "epoch": 0.64, + "learning_rate": 0.00020329228240893146, + "loss": 0.0172, "step": 248720 }, { - "epoch": 1.25, - "learning_rate": 0.00011176877166252124, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020328839419256003, + "loss": 0.0167, "step": 248730 }, { - "epoch": 1.25, - "learning_rate": 0.00011176120396950723, - "loss": 0.0074, + "epoch": 0.64, + "learning_rate": 0.00020328450597618855, + "loss": 0.0135, "step": 248740 }, { - "epoch": 1.25, - "learning_rate": 0.00011175363627649322, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.0002032806177598171, + "loss": 0.0156, "step": 248750 }, { - "epoch": 1.26, - "learning_rate": 0.00011174606858347921, - "loss": 0.0082, + "epoch": 0.64, + "learning_rate": 0.0002032767295434456, + "loss": 0.0194, "step": 248760 }, { - "epoch": 1.26, - "learning_rate": 0.00011173850089046519, - "loss": 0.0071, + "epoch": 0.64, + "learning_rate": 0.00020327284132707417, + "loss": 0.0149, "step": 248770 }, { - "epoch": 1.26, - "learning_rate": 0.00011173093319745119, - "loss": 0.0117, + "epoch": 0.64, + "learning_rate": 0.00020326895311070269, + "loss": 0.0157, "step": 248780 }, { - "epoch": 1.26, - "learning_rate": 0.00011172336550443718, - "loss": 0.0085, + "epoch": 0.64, + "learning_rate": 0.00020326506489433123, + "loss": 0.0128, "step": 248790 }, { - "epoch": 1.26, - "learning_rate": 0.00011171579781142316, - "loss": 0.0081, + "epoch": 0.64, + "learning_rate": 0.00020326117667795974, + "loss": 0.0167, "step": 248800 }, { - "epoch": 1.26, - "learning_rate": 0.00011170823011840916, - "loss": 0.011, + "epoch": 0.64, + "learning_rate": 0.0002032572884615883, + "loss": 0.0133, "step": 248810 }, { - "epoch": 1.26, - "learning_rate": 0.00011170066242539515, - "loss": 0.0055, + "epoch": 0.64, + "learning_rate": 0.00020325340024521683, + "loss": 0.0188, "step": 248820 }, { - "epoch": 1.26, - "learning_rate": 0.00011169309473238114, - "loss": 0.014, + "epoch": 0.65, + "learning_rate": 0.00020324951202884537, + "loss": 0.0189, "step": 248830 }, { - "epoch": 1.26, - "learning_rate": 0.00011168552703936713, - "loss": 0.0116, + "epoch": 0.65, + "learning_rate": 0.00020324562381247388, + "loss": 0.0159, "step": 248840 }, { - "epoch": 1.26, - "learning_rate": 0.00011167795934635311, - "loss": 0.0121, + "epoch": 0.65, + "learning_rate": 0.00020324173559610245, + "loss": 0.0209, "step": 248850 }, { - "epoch": 1.26, - "learning_rate": 0.00011167039165333911, - "loss": 0.0106, + "epoch": 0.65, + "learning_rate": 0.00020323784737973096, + "loss": 0.0142, "step": 248860 }, { - "epoch": 1.26, - "learning_rate": 0.0001116628239603251, - "loss": 0.0061, + "epoch": 0.65, + "learning_rate": 0.0002032339591633595, + "loss": 0.0147, "step": 248870 }, { - "epoch": 1.26, - "learning_rate": 0.00011165525626731108, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020323007094698802, + "loss": 0.015, "step": 248880 }, { - "epoch": 1.26, - "learning_rate": 0.00011164768857429708, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020322618273061656, + "loss": 0.0135, "step": 248890 }, { - "epoch": 1.26, - "learning_rate": 0.00011164012088128307, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020322229451424513, + "loss": 0.0187, "step": 248900 }, { - "epoch": 1.26, - "learning_rate": 0.00011163255318826905, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020321840629787365, + "loss": 0.0146, "step": 248910 }, { - "epoch": 1.26, - "learning_rate": 0.00011162498549525505, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.0002032145180815022, + "loss": 0.0153, "step": 248920 }, { - "epoch": 1.26, - "learning_rate": 0.00011161741780224104, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.0002032106298651307, + "loss": 0.0173, "step": 248930 }, { - "epoch": 1.26, - "learning_rate": 0.00011160985010922703, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020320674164875927, + "loss": 0.0142, "step": 248940 }, { - "epoch": 1.26, - "learning_rate": 0.00011160228241621302, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020320285343238779, + "loss": 0.0195, "step": 248950 }, { - "epoch": 1.26, - "learning_rate": 0.000111594714723199, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020319896521601633, + "loss": 0.0166, "step": 248960 }, { - "epoch": 1.26, - "learning_rate": 0.000111587147030185, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020319507699964484, + "loss": 0.0148, "step": 248970 }, { - "epoch": 1.26, - "learning_rate": 0.00011157957933717099, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.0002031911887832734, + "loss": 0.0167, "step": 248980 }, { - "epoch": 1.26, - "learning_rate": 0.00011157201164415697, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020318730056690192, + "loss": 0.0188, "step": 248990 }, { - "epoch": 1.26, - "learning_rate": 0.00011156444395114297, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020318341235053047, + "loss": 0.0168, "step": 249000 }, { - "epoch": 1.26, - "eval_cer": 0.9144459960000272, - "eval_loss": 0.0065380726009607315, - "eval_runtime": 116.0227, - "eval_samples_per_second": 17.238, - "eval_steps_per_second": 4.31, + "epoch": 0.65, + "eval_cer": 0.8817922630869552, + "eval_loss": 0.011258595623075962, + "eval_runtime": 107.1544, + "eval_samples_per_second": 18.665, + "eval_steps_per_second": 4.666, "step": 249000 }, { - "epoch": 1.26, - "learning_rate": 0.00011155687625812896, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020317952413415898, + "loss": 0.0149, "step": 249010 }, { - "epoch": 1.26, - "learning_rate": 0.00011154930856511495, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020317563591778755, + "loss": 0.0117, "step": 249020 }, { - "epoch": 1.26, - "learning_rate": 0.00011154174087210094, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020317174770141606, + "loss": 0.014, "step": 249030 }, { - "epoch": 1.26, - "learning_rate": 0.00011153417317908692, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002031678594850446, + "loss": 0.0182, "step": 249040 }, { - "epoch": 1.26, - "learning_rate": 0.00011152660548607292, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020316397126867312, + "loss": 0.0152, "step": 249050 }, { - "epoch": 1.26, - "learning_rate": 0.00011151903779305891, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002031600830523017, + "loss": 0.0141, "step": 249060 }, { - "epoch": 1.26, - "learning_rate": 0.0001115114701000449, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020315619483593023, + "loss": 0.0198, "step": 249070 }, { - "epoch": 1.26, - "learning_rate": 0.00011150390240703089, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020315230661955875, + "loss": 0.0133, "step": 249080 }, { - "epoch": 1.26, - "learning_rate": 0.00011149633471401688, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.0002031484184031873, + "loss": 0.0194, "step": 249090 }, { - "epoch": 1.26, - "learning_rate": 0.00011148876702100286, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.0002031445301868158, + "loss": 0.023, "step": 249100 }, { - "epoch": 1.26, - "learning_rate": 0.00011148119932798886, - "loss": 0.0088, - "step": 249110 + "epoch": 0.65, + "learning_rate": 0.00020314064197044437, + "loss": 0.014, + "step": 249110 }, { - "epoch": 1.26, - "learning_rate": 0.00011147363163497484, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.00020313675375407288, + "loss": 0.0126, "step": 249120 }, { - "epoch": 1.26, - "learning_rate": 0.00011146606394196084, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020313286553770143, + "loss": 0.019, "step": 249130 }, { - "epoch": 1.26, - "learning_rate": 0.00011145849624894683, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020312897732132994, + "loss": 0.0196, "step": 249140 }, { - "epoch": 1.26, - "learning_rate": 0.00011145092855593281, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.0002031250891049585, + "loss": 0.0186, "step": 249150 }, { - "epoch": 1.26, - "learning_rate": 0.00011144336086291881, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020312120088858702, + "loss": 0.016, "step": 249160 }, { - "epoch": 1.26, - "learning_rate": 0.0001114357931699048, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020311731267221557, + "loss": 0.0148, "step": 249170 }, { - "epoch": 1.26, - "learning_rate": 0.00011142822547689077, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020311342445584408, + "loss": 0.0179, "step": 249180 }, { - "epoch": 1.26, - "learning_rate": 0.00011142065778387677, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020310953623947265, + "loss": 0.0151, "step": 249190 }, { - "epoch": 1.26, - "learning_rate": 0.00011141309009086275, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020310564802310116, + "loss": 0.0197, "step": 249200 }, { - "epoch": 1.26, - "learning_rate": 0.00011140552239784874, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002031017598067297, + "loss": 0.0199, "step": 249210 }, { - "epoch": 1.26, - "learning_rate": 0.00011139795470483472, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020309787159035822, + "loss": 0.0161, "step": 249220 }, { - "epoch": 1.26, - "learning_rate": 0.00011139038701182072, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.0002030939833739868, + "loss": 0.0156, "step": 249230 }, { - "epoch": 1.26, - "learning_rate": 0.00011138281931880671, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020309009515761533, + "loss": 0.0162, "step": 249240 }, { - "epoch": 1.26, - "learning_rate": 0.0001113752516257927, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020308620694124384, + "loss": 0.0151, "step": 249250 }, { - "epoch": 1.26, - "learning_rate": 0.00011136768393277869, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020308231872487236, + "loss": 0.0144, "step": 249260 }, { - "epoch": 1.26, - "learning_rate": 0.00011136011623976468, - "loss": 0.0131, + "epoch": 0.65, + "learning_rate": 0.00020307843050850093, + "loss": 0.0139, "step": 249270 }, { - "epoch": 1.26, - "learning_rate": 0.00011135254854675067, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020307454229212947, + "loss": 0.0169, "step": 249280 }, { - "epoch": 1.26, - "learning_rate": 0.00011134498085373666, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020307065407575798, + "loss": 0.0165, "step": 249290 }, { - "epoch": 1.26, - "learning_rate": 0.00011133741316072264, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020306676585938653, + "loss": 0.0149, "step": 249300 }, { - "epoch": 1.26, - "learning_rate": 0.00011132984546770864, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020306287764301507, + "loss": 0.012, "step": 249310 }, { - "epoch": 1.26, - "learning_rate": 0.00011132227777469463, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002030589894266436, + "loss": 0.0136, "step": 249320 }, { - "epoch": 1.26, - "learning_rate": 0.00011131471008168061, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020305510121027212, + "loss": 0.013, "step": 249330 }, { - "epoch": 1.26, - "learning_rate": 0.00011130714238866661, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020305121299390067, + "loss": 0.0161, "step": 249340 }, { - "epoch": 1.26, - "learning_rate": 0.0001112995746956526, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020304732477752918, + "loss": 0.0184, "step": 249350 }, { - "epoch": 1.26, - "learning_rate": 0.00011129200700263859, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020304343656115775, + "loss": 0.0132, "step": 249360 }, { - "epoch": 1.26, - "learning_rate": 0.00011128443930962458, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020303954834478626, + "loss": 0.0127, "step": 249370 }, { - "epoch": 1.26, - "learning_rate": 0.00011127687161661056, - "loss": 0.0063, + "epoch": 0.65, + "learning_rate": 0.0002030356601284148, + "loss": 0.0134, "step": 249380 }, { - "epoch": 1.26, - "learning_rate": 0.00011126930392359656, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020303177191204332, + "loss": 0.0136, "step": 249390 }, { - "epoch": 1.26, - "learning_rate": 0.00011126173623058255, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.0002030278836956719, + "loss": 0.0183, "step": 249400 }, { - "epoch": 1.26, - "learning_rate": 0.00011125416853756853, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020302399547930043, + "loss": 0.0162, "step": 249410 }, { - "epoch": 1.26, - "learning_rate": 0.00011124660084455453, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020302010726292894, + "loss": 0.0165, "step": 249420 }, { - "epoch": 1.26, - "learning_rate": 0.00011123903315154052, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020301621904655746, + "loss": 0.0157, "step": 249430 }, { - "epoch": 1.26, - "learning_rate": 0.0001112314654585265, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020301233083018603, + "loss": 0.0142, "step": 249440 }, { - "epoch": 1.26, - "learning_rate": 0.0001112238977655125, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020300844261381457, + "loss": 0.0154, "step": 249450 }, { - "epoch": 1.26, - "learning_rate": 0.0001112163300724985, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020300455439744308, + "loss": 0.0152, "step": 249460 }, { - "epoch": 1.26, - "learning_rate": 0.00011120876237948448, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020300066618107163, + "loss": 0.014, "step": 249470 }, { - "epoch": 1.26, - "learning_rate": 0.00011120119468647047, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020299677796470017, + "loss": 0.0173, "step": 249480 }, { - "epoch": 1.26, - "learning_rate": 0.00011119362699345645, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.0002029928897483287, + "loss": 0.0129, "step": 249490 }, { - "epoch": 1.26, - "learning_rate": 0.00011118605930044245, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020298900153195722, + "loss": 0.0151, "step": 249500 }, { - "epoch": 1.26, - "learning_rate": 0.00011117849160742844, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020298511331558576, + "loss": 0.0185, "step": 249510 }, { - "epoch": 1.26, - "learning_rate": 0.00011117092391441442, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002029812250992143, + "loss": 0.0177, "step": 249520 }, { - "epoch": 1.26, - "learning_rate": 0.00011116335622140042, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020297733688284285, + "loss": 0.0148, "step": 249530 }, { - "epoch": 1.26, - "learning_rate": 0.00011115578852838641, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020297344866647136, + "loss": 0.0146, "step": 249540 }, { - "epoch": 1.26, - "learning_rate": 0.0001111482208353724, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002029695604500999, + "loss": 0.0162, "step": 249550 }, { - "epoch": 1.26, - "learning_rate": 0.00011114065314235839, - "loss": 0.011, + "epoch": 0.65, + "learning_rate": 0.00020296567223372847, + "loss": 0.0148, "step": 249560 }, { - "epoch": 1.26, - "learning_rate": 0.00011113308544934437, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.000202961784017357, + "loss": 0.021, "step": 249570 }, { - "epoch": 1.26, - "learning_rate": 0.00011112551775633037, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.0002029578958009855, + "loss": 0.0175, "step": 249580 }, { - "epoch": 1.26, - "learning_rate": 0.00011111795006331636, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020295400758461404, + "loss": 0.0154, "step": 249590 }, { - "epoch": 1.26, - "learning_rate": 0.00011111038237030234, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.00020295011936824256, + "loss": 0.0128, "step": 249600 }, { - "epoch": 1.26, - "learning_rate": 0.00011110281467728834, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020294623115187113, + "loss": 0.0129, "step": 249610 }, { - "epoch": 1.26, - "learning_rate": 0.00011109524698427433, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020294234293549967, + "loss": 0.0145, "step": 249620 }, { - "epoch": 1.26, - "learning_rate": 0.00011108767929126032, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020293845471912818, + "loss": 0.0129, "step": 249630 }, { - "epoch": 1.26, - "learning_rate": 0.00011108011159824631, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020293456650275672, + "loss": 0.0134, "step": 249640 }, { - "epoch": 1.26, - "learning_rate": 0.00011107254390523229, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020293067828638527, + "loss": 0.0146, "step": 249650 }, { - "epoch": 1.26, - "learning_rate": 0.00011106497621221829, - "loss": 0.0132, + "epoch": 0.65, + "learning_rate": 0.0002029267900700138, + "loss": 0.0158, "step": 249660 }, { - "epoch": 1.26, - "learning_rate": 0.00011105740851920428, - "loss": 0.011, + "epoch": 0.65, + "learning_rate": 0.00020292290185364232, + "loss": 0.0183, "step": 249670 }, { - "epoch": 1.26, - "learning_rate": 0.00011104984082619026, - "loss": 0.0128, + "epoch": 0.65, + "learning_rate": 0.00020291901363727086, + "loss": 0.0163, "step": 249680 }, { - "epoch": 1.26, - "learning_rate": 0.00011104227313317626, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002029151254208994, + "loss": 0.0152, "step": 249690 }, { - "epoch": 1.26, - "learning_rate": 0.00011103470544016225, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020291123720452795, + "loss": 0.0224, "step": 249700 }, { - "epoch": 1.26, - "learning_rate": 0.00011102713774714823, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020290734898815646, + "loss": 0.0212, "step": 249710 }, { - "epoch": 1.26, - "learning_rate": 0.00011101957005413423, - "loss": 0.0105, + "epoch": 0.65, + "learning_rate": 0.000202903460771785, + "loss": 0.0141, "step": 249720 }, { - "epoch": 1.26, - "learning_rate": 0.00011101200236112021, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020289957255541355, + "loss": 0.0136, "step": 249730 }, { - "epoch": 1.26, - "learning_rate": 0.0001110044346681062, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.0002028956843390421, + "loss": 0.0153, "step": 249740 }, { - "epoch": 1.26, - "learning_rate": 0.0001109968669750922, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.0002028917961226706, + "loss": 0.0156, "step": 249750 }, { - "epoch": 1.26, - "learning_rate": 0.00011098929928207818, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020288790790629914, + "loss": 0.0143, "step": 249760 }, { - "epoch": 1.26, - "learning_rate": 0.00011098173158906418, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002028840196899277, + "loss": 0.0172, "step": 249770 }, { - "epoch": 1.26, - "learning_rate": 0.00011097416389605017, - "loss": 0.0066, + "epoch": 0.65, + "learning_rate": 0.00020288013147355623, + "loss": 0.021, "step": 249780 }, { - "epoch": 1.26, - "learning_rate": 0.00011096659620303615, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020287624325718477, + "loss": 0.018, "step": 249790 }, { - "epoch": 1.26, - "learning_rate": 0.00011095902851002215, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020287235504081328, + "loss": 0.0132, "step": 249800 }, { - "epoch": 1.26, - "learning_rate": 0.00011095146081700812, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020286846682444185, + "loss": 0.0172, "step": 249810 }, { - "epoch": 1.26, - "learning_rate": 0.00011094389312399411, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020286457860807037, + "loss": 0.0145, "step": 249820 }, { - "epoch": 1.26, - "learning_rate": 0.00011093632543098009, - "loss": 0.0065, + "epoch": 0.65, + "learning_rate": 0.0002028606903916989, + "loss": 0.0136, "step": 249830 }, { - "epoch": 1.26, - "learning_rate": 0.00011092875773796609, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020285680217532742, + "loss": 0.0168, "step": 249840 }, { - "epoch": 1.26, - "learning_rate": 0.00011092119004495208, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020285291395895596, + "loss": 0.0138, "step": 249850 }, { - "epoch": 1.26, - "learning_rate": 0.00011091362235193806, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.0002028490257425845, + "loss": 0.0138, "step": 249860 }, { - "epoch": 1.26, - "learning_rate": 0.00011090605465892406, - "loss": 0.0113, + "epoch": 0.65, + "learning_rate": 0.00020284513752621305, + "loss": 0.0138, "step": 249870 }, { - "epoch": 1.26, - "learning_rate": 0.00011089848696591005, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020284124930984156, + "loss": 0.0216, "step": 249880 }, { - "epoch": 1.26, - "learning_rate": 0.00011089091927289604, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002028373610934701, + "loss": 0.0176, "step": 249890 }, { - "epoch": 1.26, - "learning_rate": 0.00011088335157988203, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020283347287709864, + "loss": 0.0159, "step": 249900 }, { - "epoch": 1.26, - "learning_rate": 0.00011087578388686803, - "loss": 0.0131, + "epoch": 0.65, + "learning_rate": 0.00020282958466072719, + "loss": 0.0211, "step": 249910 }, { - "epoch": 1.26, - "learning_rate": 0.00011086821619385401, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002028256964443557, + "loss": 0.0151, "step": 249920 }, { - "epoch": 1.26, - "learning_rate": 0.00011086064850084, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020282180822798424, + "loss": 0.017, "step": 249930 }, { - "epoch": 1.26, - "learning_rate": 0.00011085308080782598, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.0002028179200116128, + "loss": 0.0147, "step": 249940 }, { - "epoch": 1.26, - "learning_rate": 0.00011084551311481198, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020281403179524133, + "loss": 0.0153, "step": 249950 }, { - "epoch": 1.26, - "learning_rate": 0.00011083794542179797, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020281014357886987, + "loss": 0.0131, "step": 249960 }, { - "epoch": 1.26, - "learning_rate": 0.00011083037772878396, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020280625536249838, + "loss": 0.0158, "step": 249970 }, { - "epoch": 1.26, - "learning_rate": 0.00011082281003576995, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020280236714612695, + "loss": 0.015, "step": 249980 }, { - "epoch": 1.26, - "learning_rate": 0.00011081524234275595, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020279847892975547, + "loss": 0.0166, "step": 249990 }, { - "epoch": 1.26, - "learning_rate": 0.00011080767464974193, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.000202794590713384, + "loss": 0.0181, "step": 250000 }, { - "epoch": 1.26, - "eval_cer": 0.9144537591690304, - "eval_loss": 0.0067350054159760475, - "eval_runtime": 115.9925, - "eval_samples_per_second": 17.243, - "eval_steps_per_second": 4.311, + "epoch": 0.65, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.010947254486382008, + "eval_runtime": 107.1468, + "eval_samples_per_second": 18.666, + "eval_steps_per_second": 4.666, "step": 250000 }, { - "epoch": 1.26, - "learning_rate": 0.00011080010695672792, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020279070249701252, + "loss": 0.0161, "step": 250010 }, { - "epoch": 1.26, - "learning_rate": 0.0001107925392637139, - "loss": 0.0154, + "epoch": 0.65, + "learning_rate": 0.0002027868142806411, + "loss": 0.0162, "step": 250020 }, { - "epoch": 1.26, - "learning_rate": 0.0001107849715706999, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.0002027829260642696, + "loss": 0.0143, "step": 250030 }, { - "epoch": 1.26, - "learning_rate": 0.00011077740387768589, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020277903784789815, + "loss": 0.0144, "step": 250040 }, { - "epoch": 1.26, - "learning_rate": 0.00011076983618467187, - "loss": 0.0067, + "epoch": 0.65, + "learning_rate": 0.00020277514963152666, + "loss": 0.0159, "step": 250050 }, { - "epoch": 1.26, - "learning_rate": 0.00011076226849165787, - "loss": 0.0066, + "epoch": 0.65, + "learning_rate": 0.00020277126141515523, + "loss": 0.0135, "step": 250060 }, { - "epoch": 1.26, - "learning_rate": 0.00011075470079864386, - "loss": 0.0121, + "epoch": 0.65, + "learning_rate": 0.00020276737319878374, + "loss": 0.0132, "step": 250070 }, { - "epoch": 1.26, - "learning_rate": 0.00011074713310562985, - "loss": 0.0063, + "epoch": 0.65, + "learning_rate": 0.00020276348498241229, + "loss": 0.0167, "step": 250080 }, { - "epoch": 1.26, - "learning_rate": 0.00011073956541261584, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002027595967660408, + "loss": 0.017, "step": 250090 }, { - "epoch": 1.26, - "learning_rate": 0.00011073199771960182, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020275570854966934, + "loss": 0.0169, "step": 250100 }, { - "epoch": 1.26, - "learning_rate": 0.00011072443002658782, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.0002027518203332979, + "loss": 0.0125, "step": 250110 }, { - "epoch": 1.26, - "learning_rate": 0.00011071686233357381, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020274793211692643, + "loss": 0.0158, "step": 250120 }, { - "epoch": 1.26, - "learning_rate": 0.0001107092946405598, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020274404390055494, + "loss": 0.018, "step": 250130 }, { - "epoch": 1.26, - "learning_rate": 0.00011070172694754579, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020274015568418348, + "loss": 0.017, "step": 250140 }, { - "epoch": 1.26, - "learning_rate": 0.00011069415925453178, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020273626746781205, + "loss": 0.0134, "step": 250150 }, { - "epoch": 1.26, - "learning_rate": 0.00011068659156151777, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020273237925144056, + "loss": 0.0144, "step": 250160 }, { - "epoch": 1.26, - "learning_rate": 0.00011067902386850376, - "loss": 0.007, + "epoch": 0.65, + "learning_rate": 0.0002027284910350691, + "loss": 0.0211, "step": 250170 }, { - "epoch": 1.26, - "learning_rate": 0.00011067145617548974, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020272460281869762, + "loss": 0.0185, "step": 250180 }, { - "epoch": 1.26, - "learning_rate": 0.00011066388848247574, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.0002027207146023262, + "loss": 0.0129, "step": 250190 }, { - "epoch": 1.26, - "learning_rate": 0.00011065632078946173, - "loss": 0.0106, + "epoch": 0.65, + "learning_rate": 0.0002027168263859547, + "loss": 0.0175, "step": 250200 }, { - "epoch": 1.26, - "learning_rate": 0.00011064875309644771, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020271293816958325, + "loss": 0.0168, "step": 250210 }, { - "epoch": 1.26, - "learning_rate": 0.00011064118540343371, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020270904995321176, + "loss": 0.0186, "step": 250220 }, { - "epoch": 1.26, - "learning_rate": 0.0001106336177104197, - "loss": 0.007, + "epoch": 0.65, + "learning_rate": 0.00020270516173684033, + "loss": 0.0125, "step": 250230 }, { - "epoch": 1.26, - "learning_rate": 0.00011062605001740568, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020270127352046884, + "loss": 0.0162, "step": 250240 }, { - "epoch": 1.26, - "learning_rate": 0.00011061848232439168, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020269738530409739, + "loss": 0.0198, "step": 250250 }, { - "epoch": 1.26, - "learning_rate": 0.00011061091463137766, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.0002026934970877259, + "loss": 0.0151, "step": 250260 }, { - "epoch": 1.26, - "learning_rate": 0.00011060334693836366, - "loss": 0.0108, + "epoch": 0.65, + "learning_rate": 0.00020268960887135447, + "loss": 0.0131, "step": 250270 }, { - "epoch": 1.26, - "learning_rate": 0.00011059577924534965, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.000202685720654983, + "loss": 0.0163, "step": 250280 }, { - "epoch": 1.26, - "learning_rate": 0.00011058821155233563, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020268183243861152, + "loss": 0.0157, "step": 250290 }, { - "epoch": 1.26, - "learning_rate": 0.00011058064385932163, - "loss": 0.0125, + "epoch": 0.65, + "learning_rate": 0.00020267794422224004, + "loss": 0.0146, "step": 250300 }, { - "epoch": 1.26, - "learning_rate": 0.00011057307616630762, - "loss": 0.006, + "epoch": 0.65, + "learning_rate": 0.0002026740560058686, + "loss": 0.0157, "step": 250310 }, { - "epoch": 1.26, - "learning_rate": 0.0001105655084732936, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020267016778949715, + "loss": 0.0148, "step": 250320 }, { - "epoch": 1.26, - "learning_rate": 0.0001105579407802796, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020266627957312566, + "loss": 0.0152, "step": 250330 }, { - "epoch": 1.26, - "learning_rate": 0.00011055037308726558, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.0002026623913567542, + "loss": 0.0212, "step": 250340 }, { - "epoch": 1.26, - "learning_rate": 0.00011054280539425158, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020265850314038272, + "loss": 0.02, "step": 250350 }, { - "epoch": 1.26, - "learning_rate": 0.00011053523770123757, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.0002026546149240113, + "loss": 0.0154, "step": 250360 }, { - "epoch": 1.26, - "learning_rate": 0.00011052767000822355, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.0002026507267076398, + "loss": 0.0151, "step": 250370 }, { - "epoch": 1.26, - "learning_rate": 0.00011052010231520955, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020264683849126835, + "loss": 0.0166, "step": 250380 }, { - "epoch": 1.26, - "learning_rate": 0.00011051253462219554, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020264295027489686, + "loss": 0.0168, "step": 250390 }, { - "epoch": 1.26, - "learning_rate": 0.00011050496692918152, - "loss": 0.013, + "epoch": 0.65, + "learning_rate": 0.00020263906205852543, + "loss": 0.0147, "step": 250400 }, { - "epoch": 1.26, - "learning_rate": 0.00011049739923616752, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020263517384215394, + "loss": 0.0168, "step": 250410 }, { - "epoch": 1.26, - "learning_rate": 0.00011048983154315351, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.00020263128562578248, + "loss": 0.0193, "step": 250420 }, { - "epoch": 1.26, - "learning_rate": 0.0001104822638501395, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.000202627397409411, + "loss": 0.0148, "step": 250430 }, { - "epoch": 1.26, - "learning_rate": 0.00011047469615712548, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020262350919303957, + "loss": 0.0148, "step": 250440 }, { - "epoch": 1.26, - "learning_rate": 0.00011046712846411146, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020261962097666808, + "loss": 0.0155, "step": 250450 }, { - "epoch": 1.26, - "learning_rate": 0.00011045956077109745, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020261573276029662, + "loss": 0.0147, "step": 250460 }, { - "epoch": 1.26, - "learning_rate": 0.00011045199307808343, - "loss": 0.0065, + "epoch": 0.65, + "learning_rate": 0.00020261184454392514, + "loss": 0.0155, "step": 250470 }, { - "epoch": 1.26, - "learning_rate": 0.00011044442538506943, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002026079563275537, + "loss": 0.0171, "step": 250480 }, { - "epoch": 1.26, - "learning_rate": 0.00011043685769205542, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020260406811118225, + "loss": 0.0163, "step": 250490 }, { - "epoch": 1.26, - "learning_rate": 0.0001104292899990414, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.00020260017989481076, + "loss": 0.0161, "step": 250500 }, { - "epoch": 1.26, - "learning_rate": 0.0001104217223060274, - "loss": 0.0067, + "epoch": 0.65, + "learning_rate": 0.0002025962916784393, + "loss": 0.0134, "step": 250510 }, { - "epoch": 1.26, - "learning_rate": 0.0001104141546130134, - "loss": 0.0116, + "epoch": 0.65, + "learning_rate": 0.00020259240346206785, + "loss": 0.0155, "step": 250520 }, { - "epoch": 1.26, - "learning_rate": 0.00011040658691999938, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.0002025885152456964, + "loss": 0.0146, "step": 250530 }, { - "epoch": 1.26, - "learning_rate": 0.00011039901922698537, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.0002025846270293249, + "loss": 0.0179, "step": 250540 }, { - "epoch": 1.26, - "learning_rate": 0.00011039145153397135, - "loss": 0.0066, + "epoch": 0.65, + "learning_rate": 0.00020258073881295344, + "loss": 0.0181, "step": 250550 }, { - "epoch": 1.26, - "learning_rate": 0.00011038388384095735, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020257685059658199, + "loss": 0.0163, "step": 250560 }, { - "epoch": 1.26, - "learning_rate": 0.00011037631614794334, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020257296238021053, + "loss": 0.0155, "step": 250570 }, { - "epoch": 1.26, - "learning_rate": 0.00011036874845492932, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020256907416383904, + "loss": 0.0196, "step": 250580 }, { - "epoch": 1.26, - "learning_rate": 0.00011036118076191532, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020256518594746758, + "loss": 0.0168, "step": 250590 }, { - "epoch": 1.26, - "learning_rate": 0.00011035361306890131, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.0002025612977310961, + "loss": 0.0177, "step": 250600 }, { - "epoch": 1.26, - "learning_rate": 0.0001103460453758873, - "loss": 0.0147, + "epoch": 0.65, + "learning_rate": 0.00020255740951472467, + "loss": 0.0141, "step": 250610 }, { - "epoch": 1.26, - "learning_rate": 0.00011033847768287329, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020255352129835318, + "loss": 0.0142, "step": 250620 }, { - "epoch": 1.26, - "learning_rate": 0.00011033090998985927, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.00020254963308198172, + "loss": 0.0207, "step": 250630 }, { - "epoch": 1.26, - "learning_rate": 0.00011032334229684527, - "loss": 0.0112, + "epoch": 0.65, + "learning_rate": 0.00020254574486561024, + "loss": 0.0161, "step": 250640 }, { - "epoch": 1.26, - "learning_rate": 0.00011031577460383126, - "loss": 0.007, + "epoch": 0.65, + "learning_rate": 0.0002025418566492388, + "loss": 0.0169, "step": 250650 }, { - "epoch": 1.26, - "learning_rate": 0.00011030820691081724, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020253796843286735, + "loss": 0.0154, "step": 250660 }, { - "epoch": 1.26, - "learning_rate": 0.00011030063921780324, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020253408021649586, + "loss": 0.0167, "step": 250670 }, { - "epoch": 1.26, - "learning_rate": 0.00011029307152478923, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.0002025301920001244, + "loss": 0.0163, "step": 250680 }, { - "epoch": 1.26, - "learning_rate": 0.00011028550383177522, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020252630378375295, + "loss": 0.0116, "step": 250690 }, { - "epoch": 1.26, - "learning_rate": 0.00011027793613876121, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002025224155673815, + "loss": 0.0154, "step": 250700 }, { - "epoch": 1.26, - "learning_rate": 0.00011027036844574719, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020251852735101, + "loss": 0.0153, "step": 250710 }, { - "epoch": 1.26, - "learning_rate": 0.00011026280075273319, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020251463913463854, + "loss": 0.0174, "step": 250720 }, { - "epoch": 1.26, - "learning_rate": 0.00011025523305971918, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020251075091826709, + "loss": 0.0142, "step": 250730 }, { - "epoch": 1.27, - "learning_rate": 0.00011024766536670516, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.00020250686270189563, + "loss": 0.0142, "step": 250740 }, { - "epoch": 1.27, - "learning_rate": 0.00011024009767369116, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020250297448552414, + "loss": 0.0159, "step": 250750 }, { - "epoch": 1.27, - "learning_rate": 0.00011023252998067715, - "loss": 0.0115, + "epoch": 0.65, + "learning_rate": 0.00020249908626915268, + "loss": 0.0136, "step": 250760 }, { - "epoch": 1.27, - "learning_rate": 0.00011022496228766313, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020249519805278123, + "loss": 0.0191, "step": 250770 }, { - "epoch": 1.27, - "learning_rate": 0.00011021739459464913, - "loss": 0.013, + "epoch": 0.65, + "learning_rate": 0.00020249130983640977, + "loss": 0.0175, "step": 250780 }, { - "epoch": 1.27, - "learning_rate": 0.00011020982690163511, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020248742162003828, + "loss": 0.0169, "step": 250790 }, { - "epoch": 1.27, - "learning_rate": 0.0001102022592086211, - "loss": 0.0059, + "epoch": 0.65, + "learning_rate": 0.00020248353340366682, + "loss": 0.014, "step": 250800 }, { - "epoch": 1.27, - "learning_rate": 0.0001101946915156071, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.0002024796451872954, + "loss": 0.017, "step": 250810 }, { - "epoch": 1.27, - "learning_rate": 0.00011018712382259308, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.0002024757569709239, + "loss": 0.0162, "step": 250820 }, { - "epoch": 1.27, - "learning_rate": 0.00011017955612957908, - "loss": 0.0113, + "epoch": 0.65, + "learning_rate": 0.00020247186875455245, + "loss": 0.0125, "step": 250830 }, { - "epoch": 1.27, - "learning_rate": 0.00011017198843656507, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020246798053818096, + "loss": 0.0187, "step": 250840 }, { - "epoch": 1.27, - "learning_rate": 0.00011016442074355105, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.00020246409232180948, + "loss": 0.0155, "step": 250850 }, { - "epoch": 1.27, - "learning_rate": 0.00011015685305053705, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020246020410543805, + "loss": 0.0174, "step": 250860 }, { - "epoch": 1.27, - "learning_rate": 0.00011014928535752304, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.0002024563158890666, + "loss": 0.0171, "step": 250870 }, { - "epoch": 1.27, - "learning_rate": 0.00011014171766450903, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.0002024524276726951, + "loss": 0.0137, "step": 250880 }, { - "epoch": 1.27, - "learning_rate": 0.00011013414997149502, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.00020244853945632364, + "loss": 0.014, "step": 250890 }, { - "epoch": 1.27, - "learning_rate": 0.000110126582278481, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020244465123995219, + "loss": 0.0142, "step": 250900 }, { - "epoch": 1.27, - "learning_rate": 0.000110119014585467, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020244076302358073, + "loss": 0.0141, "step": 250910 }, { - "epoch": 1.27, - "learning_rate": 0.00011011144689245299, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020243687480720924, + "loss": 0.0141, "step": 250920 }, { - "epoch": 1.27, - "learning_rate": 0.00011010387919943897, - "loss": 0.0134, + "epoch": 0.65, + "learning_rate": 0.00020243298659083778, + "loss": 0.016, "step": 250930 }, { - "epoch": 1.27, - "learning_rate": 0.00011009631150642497, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020242909837446632, + "loss": 0.0155, "step": 250940 }, { - "epoch": 1.27, - "learning_rate": 0.00011008874381341096, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020242521015809487, + "loss": 0.0151, "step": 250950 }, { - "epoch": 1.27, - "learning_rate": 0.00011008117612039694, - "loss": 0.0106, + "epoch": 0.65, + "learning_rate": 0.00020242132194172338, + "loss": 0.0145, "step": 250960 }, { - "epoch": 1.27, - "learning_rate": 0.00011007360842738294, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020241743372535192, + "loss": 0.0174, "step": 250970 }, { - "epoch": 1.27, - "learning_rate": 0.00011006604073436892, - "loss": 0.0057, + "epoch": 0.65, + "learning_rate": 0.0002024135455089805, + "loss": 0.018, "step": 250980 }, { - "epoch": 1.27, - "learning_rate": 0.00011005847304135492, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.000202409657292609, + "loss": 0.0154, "step": 250990 }, { - "epoch": 1.27, - "learning_rate": 0.00011005090534834091, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020240576907623755, + "loss": 0.0162, "step": 251000 }, { - "epoch": 1.27, - "eval_cer": 0.9144605519419082, - "eval_loss": 0.0065511371940374374, - "eval_runtime": 116.1225, - "eval_samples_per_second": 17.223, - "eval_steps_per_second": 4.306, + "epoch": 0.65, + "eval_cer": 0.88176706962214, + "eval_loss": 0.011115950532257557, + "eval_runtime": 107.2723, + "eval_samples_per_second": 18.644, + "eval_steps_per_second": 4.661, "step": 251000 }, { - "epoch": 1.27, - "learning_rate": 0.00011004333765532689, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020240188085986606, + "loss": 0.0158, "step": 251010 }, { - "epoch": 1.27, - "learning_rate": 0.00011003576996231289, - "loss": 0.0103, + "epoch": 0.65, + "learning_rate": 0.00020239799264349463, + "loss": 0.0157, "step": 251020 }, { - "epoch": 1.27, - "learning_rate": 0.00011002820226929888, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020239410442712315, + "loss": 0.0159, "step": 251030 }, { - "epoch": 1.27, - "learning_rate": 0.00011002063457628486, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.0002023902162107517, + "loss": 0.0153, "step": 251040 }, { - "epoch": 1.27, - "learning_rate": 0.00011001306688327086, - "loss": 0.0064, + "epoch": 0.65, + "learning_rate": 0.0002023863279943802, + "loss": 0.0164, "step": 251050 }, { - "epoch": 1.27, - "learning_rate": 0.00011000549919025684, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020238243977800877, + "loss": 0.0188, "step": 251060 }, { - "epoch": 1.27, - "learning_rate": 0.00010999793149724282, - "loss": 0.0122, + "epoch": 0.65, + "learning_rate": 0.00020237855156163728, + "loss": 0.013, "step": 251070 }, { - "epoch": 1.27, - "learning_rate": 0.0001099903638042288, - "loss": 0.0112, + "epoch": 0.65, + "learning_rate": 0.00020237466334526583, + "loss": 0.018, "step": 251080 }, { - "epoch": 1.27, - "learning_rate": 0.0001099827961112148, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020237077512889434, + "loss": 0.0146, "step": 251090 }, { - "epoch": 1.27, - "learning_rate": 0.0001099752284182008, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020236688691252288, + "loss": 0.0174, "step": 251100 }, { - "epoch": 1.27, - "learning_rate": 0.00010996766072518677, - "loss": 0.0107, + "epoch": 0.65, + "learning_rate": 0.00020236299869615142, + "loss": 0.0171, "step": 251110 }, { - "epoch": 1.27, - "learning_rate": 0.00010996009303217277, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020235911047977997, + "loss": 0.0173, "step": 251120 }, { - "epoch": 1.27, - "learning_rate": 0.00010995252533915876, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020235522226340848, + "loss": 0.0121, "step": 251130 }, { - "epoch": 1.27, - "learning_rate": 0.00010994495764614475, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020235133404703702, + "loss": 0.0147, "step": 251140 }, { - "epoch": 1.27, - "learning_rate": 0.00010993738995313074, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.0002023474458306656, + "loss": 0.0241, "step": 251150 }, { - "epoch": 1.27, - "learning_rate": 0.00010992982226011672, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002023435576142941, + "loss": 0.0138, "step": 251160 }, { - "epoch": 1.27, - "learning_rate": 0.00010992225456710272, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020233966939792262, + "loss": 0.0151, "step": 251170 }, { - "epoch": 1.27, - "learning_rate": 0.00010991468687408871, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020233578118155116, + "loss": 0.0168, "step": 251180 }, { - "epoch": 1.27, - "learning_rate": 0.0001099071191810747, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020233189296517973, + "loss": 0.0165, "step": 251190 }, { - "epoch": 1.27, - "learning_rate": 0.00010989955148806069, - "loss": 0.007, + "epoch": 0.65, + "learning_rate": 0.00020232800474880824, + "loss": 0.0144, "step": 251200 }, { - "epoch": 1.27, - "learning_rate": 0.00010989198379504668, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020232411653243679, + "loss": 0.0178, "step": 251210 }, { - "epoch": 1.27, - "learning_rate": 0.00010988441610203267, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002023202283160653, + "loss": 0.0134, "step": 251220 }, { - "epoch": 1.27, - "learning_rate": 0.00010987684840901866, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020231634009969387, + "loss": 0.0159, "step": 251230 }, { - "epoch": 1.27, - "learning_rate": 0.00010986928071600464, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.00020231245188332238, + "loss": 0.0154, "step": 251240 }, { - "epoch": 1.27, - "learning_rate": 0.00010986171302299064, - "loss": 0.0115, + "epoch": 0.65, + "learning_rate": 0.00020230856366695093, + "loss": 0.0142, "step": 251250 }, { - "epoch": 1.27, - "learning_rate": 0.00010985414532997663, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020230467545057944, + "loss": 0.0166, "step": 251260 }, { - "epoch": 1.27, - "learning_rate": 0.00010984657763696261, - "loss": 0.0064, + "epoch": 0.65, + "learning_rate": 0.000202300787234208, + "loss": 0.0178, "step": 251270 }, { - "epoch": 1.27, - "learning_rate": 0.00010983900994394861, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020229689901783652, + "loss": 0.0168, "step": 251280 }, { - "epoch": 1.27, - "learning_rate": 0.0001098314422509346, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.00020229301080146506, + "loss": 0.0189, "step": 251290 }, { - "epoch": 1.27, - "learning_rate": 0.00010982387455792058, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020228912258509358, + "loss": 0.0121, "step": 251300 }, { - "epoch": 1.27, - "learning_rate": 0.00010981630686490658, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020228523436872215, + "loss": 0.0146, "step": 251310 }, { - "epoch": 1.27, - "learning_rate": 0.00010980873917189256, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020228134615235066, + "loss": 0.0172, "step": 251320 }, { - "epoch": 1.27, - "learning_rate": 0.00010980117147887856, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002022774579359792, + "loss": 0.0218, "step": 251330 }, { - "epoch": 1.27, - "learning_rate": 0.00010979360378586455, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020227356971960772, + "loss": 0.0132, "step": 251340 }, { - "epoch": 1.27, - "learning_rate": 0.00010978603609285053, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.00020226968150323626, + "loss": 0.0129, "step": 251350 }, { - "epoch": 1.27, - "learning_rate": 0.00010977846839983653, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020226579328686483, + "loss": 0.0153, "step": 251360 }, { - "epoch": 1.27, - "learning_rate": 0.00010977090070682252, - "loss": 0.0067, + "epoch": 0.65, + "learning_rate": 0.00020226190507049334, + "loss": 0.0158, "step": 251370 }, { - "epoch": 1.27, - "learning_rate": 0.0001097633330138085, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020225801685412189, + "loss": 0.0122, "step": 251380 }, { - "epoch": 1.27, - "learning_rate": 0.0001097557653207945, - "loss": 0.0096, + "epoch": 0.65, + "learning_rate": 0.0002022541286377504, + "loss": 0.0153, "step": 251390 }, { - "epoch": 1.27, - "learning_rate": 0.0001097481976277805, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020225024042137897, + "loss": 0.0147, "step": 251400 }, { - "epoch": 1.27, - "learning_rate": 0.00010974062993476648, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020224635220500748, + "loss": 0.0169, "step": 251410 }, { - "epoch": 1.27, - "learning_rate": 0.00010973306224175247, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020224246398863602, + "loss": 0.0163, "step": 251420 }, { - "epoch": 1.27, - "learning_rate": 0.00010972549454873845, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020223857577226454, + "loss": 0.0138, "step": 251430 }, { - "epoch": 1.27, - "learning_rate": 0.00010971792685572445, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.0002022346875558931, + "loss": 0.0164, "step": 251440 }, { - "epoch": 1.27, - "learning_rate": 0.00010971035916271044, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020223079933952162, + "loss": 0.0158, "step": 251450 }, { - "epoch": 1.27, - "learning_rate": 0.00010970279146969642, - "loss": 0.0108, + "epoch": 0.65, + "learning_rate": 0.00020222691112315016, + "loss": 0.0217, "step": 251460 }, { - "epoch": 1.27, - "learning_rate": 0.00010969522377668242, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020222302290677868, + "loss": 0.0126, "step": 251470 }, { - "epoch": 1.27, - "learning_rate": 0.00010968765608366841, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020221913469040725, + "loss": 0.0164, "step": 251480 }, { - "epoch": 1.27, - "learning_rate": 0.0001096800883906544, - "loss": 0.0113, + "epoch": 0.65, + "learning_rate": 0.00020221524647403576, + "loss": 0.0123, "step": 251490 }, { - "epoch": 1.27, - "learning_rate": 0.00010967252069764039, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.0002022113582576643, + "loss": 0.0136, "step": 251500 }, { - "epoch": 1.27, - "learning_rate": 0.00010966495300462637, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020220747004129282, + "loss": 0.0124, "step": 251510 }, { - "epoch": 1.27, - "learning_rate": 0.00010965738531161237, - "loss": 0.0115, + "epoch": 0.65, + "learning_rate": 0.0002022035818249214, + "loss": 0.017, "step": 251520 }, { - "epoch": 1.27, - "learning_rate": 0.00010964981761859836, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020219969360854993, + "loss": 0.0174, "step": 251530 }, { - "epoch": 1.27, - "learning_rate": 0.00010964224992558434, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020219580539217844, + "loss": 0.0149, "step": 251540 }, { - "epoch": 1.27, - "learning_rate": 0.00010963468223257034, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020219191717580698, + "loss": 0.0168, "step": 251550 }, { - "epoch": 1.27, - "learning_rate": 0.00010962711453955633, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020218802895943553, + "loss": 0.0174, "step": 251560 }, { - "epoch": 1.27, - "learning_rate": 0.00010961954684654231, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020218414074306407, + "loss": 0.0153, "step": 251570 }, { - "epoch": 1.27, - "learning_rate": 0.00010961197915352831, - "loss": 0.0104, + "epoch": 0.65, + "learning_rate": 0.00020218025252669258, + "loss": 0.0159, "step": 251580 }, { - "epoch": 1.27, - "learning_rate": 0.00010960441146051429, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020217636431032112, + "loss": 0.0152, "step": 251590 }, { - "epoch": 1.27, - "learning_rate": 0.00010959684376750029, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.00020217247609394964, + "loss": 0.0124, "step": 251600 }, { - "epoch": 1.27, - "learning_rate": 0.00010958927607448628, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.0002021685878775782, + "loss": 0.0185, "step": 251610 }, { - "epoch": 1.27, - "learning_rate": 0.00010958170838147226, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020216469966120672, + "loss": 0.0147, "step": 251620 }, { - "epoch": 1.27, - "learning_rate": 0.00010957414068845826, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.00020216081144483526, + "loss": 0.0177, "step": 251630 }, { - "epoch": 1.27, - "learning_rate": 0.00010956657299544425, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020215692322846378, + "loss": 0.0171, "step": 251640 }, { - "epoch": 1.27, - "learning_rate": 0.00010955900530243023, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020215303501209235, + "loss": 0.0139, "step": 251650 }, { - "epoch": 1.27, - "learning_rate": 0.00010955143760941623, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020214914679572086, + "loss": 0.0121, "step": 251660 }, { - "epoch": 1.27, - "learning_rate": 0.00010954386991640221, - "loss": 0.0068, + "epoch": 0.65, + "learning_rate": 0.0002021452585793494, + "loss": 0.0154, "step": 251670 }, { - "epoch": 1.27, - "learning_rate": 0.0001095363022233882, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020214137036297792, + "loss": 0.0141, "step": 251680 }, { - "epoch": 1.27, - "learning_rate": 0.0001095287345303742, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.0002021374821466065, + "loss": 0.0132, "step": 251690 }, { - "epoch": 1.27, - "learning_rate": 0.00010952116683736017, - "loss": 0.0072, + "epoch": 0.65, + "learning_rate": 0.00020213359393023503, + "loss": 0.0143, "step": 251700 }, { - "epoch": 1.27, - "learning_rate": 0.00010951359914434616, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020212970571386354, + "loss": 0.015, "step": 251710 }, { - "epoch": 1.27, - "learning_rate": 0.00010950603145133214, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020212581749749206, + "loss": 0.016, "step": 251720 }, { - "epoch": 1.27, - "learning_rate": 0.00010949846375831814, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020212192928112063, + "loss": 0.0135, "step": 251730 }, { - "epoch": 1.27, - "learning_rate": 0.00010949089606530413, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020211804106474917, + "loss": 0.0131, "step": 251740 }, { - "epoch": 1.27, - "learning_rate": 0.00010948332837229012, - "loss": 0.0122, + "epoch": 0.65, + "learning_rate": 0.00020211415284837768, + "loss": 0.0175, "step": 251750 }, { - "epoch": 1.27, - "learning_rate": 0.00010947576067927611, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020211026463200622, + "loss": 0.0128, "step": 251760 }, { - "epoch": 1.27, - "learning_rate": 0.00010946819298626209, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020210637641563477, + "loss": 0.0163, "step": 251770 }, { - "epoch": 1.27, - "learning_rate": 0.00010946062529324809, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.0002021024881992633, + "loss": 0.0168, "step": 251780 }, { - "epoch": 1.27, - "learning_rate": 0.00010945305760023408, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020209859998289182, + "loss": 0.0191, "step": 251790 }, { - "epoch": 1.27, - "learning_rate": 0.00010944548990722006, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020209471176652036, + "loss": 0.015, "step": 251800 }, { - "epoch": 1.27, - "learning_rate": 0.00010943792221420606, - "loss": 0.0111, + "epoch": 0.65, + "learning_rate": 0.0002020908235501489, + "loss": 0.0151, "step": 251810 }, { - "epoch": 1.27, - "learning_rate": 0.00010943035452119205, - "loss": 0.0094, + "epoch": 0.65, + "learning_rate": 0.00020208693533377745, + "loss": 0.0143, "step": 251820 }, { - "epoch": 1.27, - "learning_rate": 0.00010942278682817803, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020208304711740596, + "loss": 0.0147, "step": 251830 }, { - "epoch": 1.27, - "learning_rate": 0.00010941521913516403, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002020791589010345, + "loss": 0.0203, "step": 251840 }, { - "epoch": 1.27, - "learning_rate": 0.00010940765144215002, - "loss": 0.0117, + "epoch": 0.65, + "learning_rate": 0.00020207527068466302, + "loss": 0.0149, "step": 251850 }, { - "epoch": 1.27, - "learning_rate": 0.000109400083749136, - "loss": 0.011, + "epoch": 0.65, + "learning_rate": 0.00020207138246829159, + "loss": 0.0149, "step": 251860 }, { - "epoch": 1.27, - "learning_rate": 0.000109392516056122, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020206749425192013, + "loss": 0.0138, "step": 251870 }, { - "epoch": 1.27, - "learning_rate": 0.00010938494836310798, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.00020206360603554864, + "loss": 0.0168, "step": 251880 }, { - "epoch": 1.27, - "learning_rate": 0.00010937738067009398, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020205971781917716, + "loss": 0.0155, "step": 251890 }, { - "epoch": 1.27, - "learning_rate": 0.00010936981297707997, - "loss": 0.0064, + "epoch": 0.65, + "learning_rate": 0.00020205582960280573, + "loss": 0.0157, "step": 251900 }, { - "epoch": 1.27, - "learning_rate": 0.00010936224528406595, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020205194138643427, + "loss": 0.0171, "step": 251910 }, { - "epoch": 1.27, - "learning_rate": 0.00010935467759105195, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020204805317006278, + "loss": 0.0186, "step": 251920 }, { - "epoch": 1.27, - "learning_rate": 0.00010934710989803794, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020204416495369132, + "loss": 0.0158, "step": 251930 }, { - "epoch": 1.27, - "learning_rate": 0.00010933954220502393, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020204027673731986, + "loss": 0.014, "step": 251940 }, { - "epoch": 1.27, - "learning_rate": 0.00010933197451200992, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.0002020363885209484, + "loss": 0.0145, "step": 251950 }, { - "epoch": 1.27, - "learning_rate": 0.0001093244068189959, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020203250030457692, + "loss": 0.0137, "step": 251960 }, { - "epoch": 1.27, - "learning_rate": 0.0001093168391259819, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020202861208820546, + "loss": 0.0216, "step": 251970 }, { - "epoch": 1.27, - "learning_rate": 0.00010930927143296789, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.000202024723871834, + "loss": 0.0146, "step": 251980 }, { - "epoch": 1.27, - "learning_rate": 0.00010930170373995387, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.00020202083565546255, + "loss": 0.0134, "step": 251990 }, { - "epoch": 1.27, - "learning_rate": 0.00010929413604693987, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020201694743909106, + "loss": 0.0167, "step": 252000 }, { - "epoch": 1.27, - "eval_cer": 0.9144789894682909, - "eval_loss": 0.006821473129093647, - "eval_runtime": 116.1992, - "eval_samples_per_second": 17.212, - "eval_steps_per_second": 4.303, + "epoch": 0.65, + "eval_cer": 0.881797861634692, + "eval_loss": 0.010695898905396461, + "eval_runtime": 107.3781, + "eval_samples_per_second": 18.626, + "eval_steps_per_second": 4.656, "step": 252000 }, { - "epoch": 1.27, - "learning_rate": 0.00010928656835392586, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.0002020130592227196, + "loss": 0.0152, "step": 252010 }, { - "epoch": 1.27, - "learning_rate": 0.00010927900066091184, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020200917100634817, + "loss": 0.0138, "step": 252020 }, { - "epoch": 1.27, - "learning_rate": 0.00010927143296789784, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020200528278997669, + "loss": 0.0141, "step": 252030 }, { - "epoch": 1.27, - "learning_rate": 0.00010926386527488382, - "loss": 0.0102, + "epoch": 0.65, + "learning_rate": 0.0002020013945736052, + "loss": 0.0153, "step": 252040 }, { - "epoch": 1.27, - "learning_rate": 0.00010925629758186982, - "loss": 0.0111, + "epoch": 0.65, + "learning_rate": 0.00020199750635723374, + "loss": 0.0171, "step": 252050 }, { - "epoch": 1.27, - "learning_rate": 0.00010924872988885581, - "loss": 0.0092, + "epoch": 0.65, + "learning_rate": 0.0002019936181408623, + "loss": 0.0128, "step": 252060 }, { - "epoch": 1.27, - "learning_rate": 0.00010924116219584179, - "loss": 0.0105, + "epoch": 0.65, + "learning_rate": 0.00020198972992449082, + "loss": 0.0171, "step": 252070 }, { - "epoch": 1.27, - "learning_rate": 0.00010923359450282779, - "loss": 0.0085, + "epoch": 0.65, + "learning_rate": 0.00020198584170811937, + "loss": 0.0131, "step": 252080 }, { - "epoch": 1.27, - "learning_rate": 0.00010922602680981378, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.00020198195349174788, + "loss": 0.0157, "step": 252090 }, { - "epoch": 1.27, - "learning_rate": 0.00010921845911679976, - "loss": 0.0074, + "epoch": 0.65, + "learning_rate": 0.00020197806527537642, + "loss": 0.0201, "step": 252100 }, { - "epoch": 1.27, - "learning_rate": 0.00010921089142378576, - "loss": 0.008, + "epoch": 0.65, + "learning_rate": 0.00020197417705900496, + "loss": 0.017, "step": 252110 }, { - "epoch": 1.27, - "learning_rate": 0.00010920332373077174, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.0002019702888426335, + "loss": 0.0147, "step": 252120 }, { - "epoch": 1.27, - "learning_rate": 0.00010919575603775774, - "loss": 0.0109, + "epoch": 0.65, + "learning_rate": 0.00020196640062626202, + "loss": 0.0167, "step": 252130 }, { - "epoch": 1.27, - "learning_rate": 0.00010918818834474373, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020196251240989056, + "loss": 0.0137, "step": 252140 }, { - "epoch": 1.27, - "learning_rate": 0.00010918062065172971, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002019586241935191, + "loss": 0.0142, "step": 252150 }, { - "epoch": 1.27, - "learning_rate": 0.00010917305295871571, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020195473597714765, + "loss": 0.0173, "step": 252160 }, { - "epoch": 1.27, - "learning_rate": 0.0001091654852657017, - "loss": 0.0081, + "epoch": 0.65, + "learning_rate": 0.00020195084776077616, + "loss": 0.0147, "step": 252170 }, { - "epoch": 1.27, - "learning_rate": 0.00010915791757268768, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.0002019469595444047, + "loss": 0.018, "step": 252180 }, { - "epoch": 1.27, - "learning_rate": 0.00010915034987967368, - "loss": 0.0097, + "epoch": 0.65, + "learning_rate": 0.00020194307132803327, + "loss": 0.0114, "step": 252190 }, { - "epoch": 1.27, - "learning_rate": 0.00010914278218665966, - "loss": 0.0115, + "epoch": 0.65, + "learning_rate": 0.00020193918311166178, + "loss": 0.0153, "step": 252200 }, { - "epoch": 1.27, - "learning_rate": 0.00010913521449364565, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.0002019352948952903, + "loss": 0.0143, "step": 252210 }, { - "epoch": 1.27, - "learning_rate": 0.00010912764680063165, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020193140667891884, + "loss": 0.0164, "step": 252220 }, { - "epoch": 1.27, - "learning_rate": 0.00010912007910761763, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.0002019275184625474, + "loss": 0.0155, "step": 252230 }, { - "epoch": 1.27, - "learning_rate": 0.00010911251141460363, - "loss": 0.0101, + "epoch": 0.65, + "learning_rate": 0.00020192363024617592, + "loss": 0.0141, "step": 252240 }, { - "epoch": 1.27, - "learning_rate": 0.00010910494372158962, - "loss": 0.0114, + "epoch": 0.65, + "learning_rate": 0.00020191974202980447, + "loss": 0.0124, "step": 252250 }, { - "epoch": 1.27, - "learning_rate": 0.0001090973760285756, - "loss": 0.0113, + "epoch": 0.65, + "learning_rate": 0.00020191585381343298, + "loss": 0.0148, "step": 252260 }, { - "epoch": 1.27, - "learning_rate": 0.0001090898083355616, - "loss": 0.0083, + "epoch": 0.65, + "learning_rate": 0.00020191196559706155, + "loss": 0.0162, "step": 252270 }, { - "epoch": 1.27, - "learning_rate": 0.00010908224064254758, - "loss": 0.0098, + "epoch": 0.65, + "learning_rate": 0.00020190807738069006, + "loss": 0.0168, "step": 252280 }, { - "epoch": 1.27, - "learning_rate": 0.00010907467294953357, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002019041891643186, + "loss": 0.0141, "step": 252290 }, { - "epoch": 1.27, - "learning_rate": 0.00010906710525651957, - "loss": 0.0058, + "epoch": 0.65, + "learning_rate": 0.00020190030094794712, + "loss": 0.0154, "step": 252300 }, { - "epoch": 1.27, - "learning_rate": 0.00010905953756350555, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.0002018964127315757, + "loss": 0.0172, "step": 252310 }, { - "epoch": 1.27, - "learning_rate": 0.00010905196987049153, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002018925245152042, + "loss": 0.0142, "step": 252320 }, { - "epoch": 1.27, - "learning_rate": 0.00010904440217747751, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020188863629883274, + "loss": 0.0139, "step": 252330 }, { - "epoch": 1.27, - "learning_rate": 0.00010903683448446351, - "loss": 0.0099, + "epoch": 0.65, + "learning_rate": 0.00020188474808246126, + "loss": 0.0184, "step": 252340 }, { - "epoch": 1.27, - "learning_rate": 0.0001090292667914495, - "loss": 0.013, + "epoch": 0.65, + "learning_rate": 0.0002018808598660898, + "loss": 0.0117, "step": 252350 }, { - "epoch": 1.27, - "learning_rate": 0.00010902169909843549, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.00020187697164971834, + "loss": 0.0139, "step": 252360 }, { - "epoch": 1.27, - "learning_rate": 0.00010901413140542148, - "loss": 0.0077, + "epoch": 0.65, + "learning_rate": 0.00020187308343334688, + "loss": 0.0208, "step": 252370 }, { - "epoch": 1.27, - "learning_rate": 0.00010900656371240748, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002018691952169754, + "loss": 0.0202, "step": 252380 }, { - "epoch": 1.27, - "learning_rate": 0.00010899899601939346, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020186530700060394, + "loss": 0.0137, "step": 252390 }, { - "epoch": 1.27, - "learning_rate": 0.00010899142832637945, - "loss": 0.0079, + "epoch": 0.65, + "learning_rate": 0.0002018614187842325, + "loss": 0.0208, "step": 252400 }, { - "epoch": 1.27, - "learning_rate": 0.00010898386063336543, - "loss": 0.0111, + "epoch": 0.65, + "learning_rate": 0.00020185753056786102, + "loss": 0.0165, "step": 252410 }, { - "epoch": 1.27, - "learning_rate": 0.00010897629294035143, - "loss": 0.009, + "epoch": 0.65, + "learning_rate": 0.00020185364235148957, + "loss": 0.0181, "step": 252420 }, { - "epoch": 1.27, - "learning_rate": 0.00010896872524733742, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020184975413511808, + "loss": 0.0232, "step": 252430 }, { - "epoch": 1.27, - "learning_rate": 0.0001089611575543234, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.00020184586591874665, + "loss": 0.0147, "step": 252440 }, { - "epoch": 1.27, - "learning_rate": 0.0001089535898613094, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020184197770237516, + "loss": 0.0136, "step": 252450 }, { - "epoch": 1.27, - "learning_rate": 0.0001089460221682954, - "loss": 0.007, + "epoch": 0.65, + "learning_rate": 0.0002018380894860037, + "loss": 0.018, "step": 252460 }, { - "epoch": 1.27, - "learning_rate": 0.00010893845447528138, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020183420126963222, + "loss": 0.017, "step": 252470 }, { - "epoch": 1.27, - "learning_rate": 0.00010893088678226737, - "loss": 0.0082, + "epoch": 0.65, + "learning_rate": 0.0002018303130532608, + "loss": 0.0147, "step": 252480 }, { - "epoch": 1.27, - "learning_rate": 0.00010892331908925335, - "loss": 0.0066, + "epoch": 0.65, + "learning_rate": 0.0002018264248368893, + "loss": 0.0145, "step": 252490 }, { - "epoch": 1.27, - "learning_rate": 0.00010891575139623935, - "loss": 0.0091, + "epoch": 0.65, + "learning_rate": 0.00020182253662051784, + "loss": 0.0141, "step": 252500 }, { - "epoch": 1.27, - "learning_rate": 0.00010890818370322534, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.00020181864840414636, + "loss": 0.0148, "step": 252510 }, { - "epoch": 1.27, - "learning_rate": 0.00010890061601021132, - "loss": 0.0069, + "epoch": 0.65, + "learning_rate": 0.00020181476018777493, + "loss": 0.014, "step": 252520 }, { - "epoch": 1.27, - "learning_rate": 0.00010889304831719732, - "loss": 0.0084, + "epoch": 0.65, + "learning_rate": 0.00020181087197140344, + "loss": 0.0199, "step": 252530 }, { - "epoch": 1.27, - "learning_rate": 0.00010888548062418331, - "loss": 0.0076, + "epoch": 0.65, + "learning_rate": 0.00020180698375503198, + "loss": 0.015, "step": 252540 }, { - "epoch": 1.27, - "learning_rate": 0.0001088779129311693, - "loss": 0.0093, + "epoch": 0.65, + "learning_rate": 0.0002018030955386605, + "loss": 0.0132, "step": 252550 }, { - "epoch": 1.27, - "learning_rate": 0.00010887034523815529, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.00020179920732228907, + "loss": 0.0159, "step": 252560 }, { - "epoch": 1.27, - "learning_rate": 0.00010886277754514127, - "loss": 0.0071, + "epoch": 0.65, + "learning_rate": 0.0002017953191059176, + "loss": 0.019, "step": 252570 }, { - "epoch": 1.27, - "learning_rate": 0.00010885520985212727, - "loss": 0.0075, + "epoch": 0.65, + "learning_rate": 0.00020179143088954612, + "loss": 0.0167, "step": 252580 }, { - "epoch": 1.27, - "learning_rate": 0.00010884764215911326, - "loss": 0.0073, + "epoch": 0.65, + "learning_rate": 0.00020178754267317466, + "loss": 0.015, "step": 252590 }, { - "epoch": 1.27, - "learning_rate": 0.00010884007446609924, - "loss": 0.0089, + "epoch": 0.65, + "learning_rate": 0.00020178365445680318, + "loss": 0.0162, "step": 252600 }, { - "epoch": 1.27, - "learning_rate": 0.00010883250677308524, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020177976624043175, + "loss": 0.0164, "step": 252610 }, { - "epoch": 1.27, - "learning_rate": 0.00010882493908007123, - "loss": 0.0087, + "epoch": 0.65, + "learning_rate": 0.00020177587802406026, + "loss": 0.0169, "step": 252620 }, { - "epoch": 1.27, - "learning_rate": 0.00010881737138705721, - "loss": 0.0078, + "epoch": 0.65, + "learning_rate": 0.0002017719898076888, + "loss": 0.0159, "step": 252630 }, { - "epoch": 1.27, - "learning_rate": 0.00010880980369404321, - "loss": 0.0086, + "epoch": 0.65, + "learning_rate": 0.00020176810159131732, + "loss": 0.0186, "step": 252640 }, { - "epoch": 1.27, - "learning_rate": 0.00010880223600102919, - "loss": 0.0088, + "epoch": 0.65, + "learning_rate": 0.0002017642133749459, + "loss": 0.0138, "step": 252650 }, { - "epoch": 1.27, - "learning_rate": 0.00010879466830801519, - "loss": 0.01, + "epoch": 0.65, + "learning_rate": 0.0002017603251585744, + "loss": 0.0142, "step": 252660 }, { - "epoch": 1.27, - "learning_rate": 0.00010878710061500118, - "loss": 0.0066, + "epoch": 0.65, + "learning_rate": 0.00020175643694220294, + "loss": 0.0109, "step": 252670 }, { - "epoch": 1.27, - "learning_rate": 0.00010877953292198716, - "loss": 0.0095, + "epoch": 0.65, + "learning_rate": 0.00020175254872583146, + "loss": 0.0126, "step": 252680 }, { - "epoch": 1.27, - "learning_rate": 0.00010877196522897316, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020174866050946003, + "loss": 0.0127, "step": 252690 }, { - "epoch": 1.27, - "learning_rate": 0.00010876439753595915, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020174477229308854, + "loss": 0.0174, "step": 252700 }, { - "epoch": 1.27, - "learning_rate": 0.00010875682984294513, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020174088407671708, + "loss": 0.0149, "step": 252710 }, { - "epoch": 1.27, - "learning_rate": 0.00010874926214993113, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.0002017369958603456, + "loss": 0.0142, "step": 252720 }, { - "epoch": 1.28, - "learning_rate": 0.00010874169445691711, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020173310764397417, + "loss": 0.0177, "step": 252730 }, { - "epoch": 1.28, - "learning_rate": 0.0001087341267639031, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.0002017292194276027, + "loss": 0.0151, "step": 252740 }, { - "epoch": 1.28, - "learning_rate": 0.0001087265590708891, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020172533121123122, + "loss": 0.0162, "step": 252750 }, { - "epoch": 1.28, - "learning_rate": 0.00010871899137787508, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020172144299485974, + "loss": 0.0148, "step": 252760 }, { - "epoch": 1.28, - "learning_rate": 0.00010871142368486108, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.0002017175547784883, + "loss": 0.0182, "step": 252770 }, { - "epoch": 1.28, - "learning_rate": 0.00010870385599184707, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020171366656211685, + "loss": 0.0155, "step": 252780 }, { - "epoch": 1.28, - "learning_rate": 0.00010869628829883305, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020170977834574536, + "loss": 0.0157, "step": 252790 }, { - "epoch": 1.28, - "learning_rate": 0.00010868872060581905, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.0002017058901293739, + "loss": 0.0197, "step": 252800 }, { - "epoch": 1.28, - "learning_rate": 0.00010868115291280504, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.00020170200191300245, + "loss": 0.0174, "step": 252810 }, { - "epoch": 1.28, - "learning_rate": 0.00010867358521979102, - "loss": 0.0149, + "epoch": 0.66, + "learning_rate": 0.000201698113696631, + "loss": 0.0111, "step": 252820 }, { - "epoch": 1.28, - "learning_rate": 0.00010866601752677702, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.0002016942254802595, + "loss": 0.0137, "step": 252830 }, { - "epoch": 1.28, - "learning_rate": 0.000108658449833763, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020169033726388804, + "loss": 0.0156, "step": 252840 }, { - "epoch": 1.28, - "learning_rate": 0.000108650882140749, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020168644904751656, + "loss": 0.0185, "step": 252850 }, { - "epoch": 1.28, - "learning_rate": 0.00010864331444773499, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020168256083114513, + "loss": 0.0143, "step": 252860 }, { - "epoch": 1.28, - "learning_rate": 0.00010863574675472097, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020167867261477364, + "loss": 0.0179, "step": 252870 }, { - "epoch": 1.28, - "learning_rate": 0.00010862817906170697, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020167478439840218, + "loss": 0.0168, "step": 252880 }, { - "epoch": 1.28, - "learning_rate": 0.00010862061136869296, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.0002016708961820307, + "loss": 0.0118, "step": 252890 }, { - "epoch": 1.28, - "learning_rate": 0.00010861304367567894, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020166700796565927, + "loss": 0.0154, "step": 252900 }, { - "epoch": 1.28, - "learning_rate": 0.00010860547598266494, - "loss": 0.006, + "epoch": 0.66, + "learning_rate": 0.00020166311974928778, + "loss": 0.0149, "step": 252910 }, { - "epoch": 1.28, - "learning_rate": 0.00010859790828965092, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020165923153291632, + "loss": 0.0141, "step": 252920 }, { - "epoch": 1.28, - "learning_rate": 0.00010859034059663692, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020165534331654484, + "loss": 0.0174, "step": 252930 }, { - "epoch": 1.28, - "learning_rate": 0.00010858277290362291, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.0002016514551001734, + "loss": 0.0126, "step": 252940 }, { - "epoch": 1.28, - "learning_rate": 0.00010857520521060888, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020164756688380195, + "loss": 0.0175, "step": 252950 }, { - "epoch": 1.28, - "learning_rate": 0.00010856763751759487, - "loss": 0.0137, + "epoch": 0.66, + "learning_rate": 0.00020164367866743046, + "loss": 0.0169, "step": 252960 }, { - "epoch": 1.28, - "learning_rate": 0.00010856006982458085, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.000201639790451059, + "loss": 0.0137, "step": 252970 }, { - "epoch": 1.28, - "learning_rate": 0.00010855250213156685, - "loss": 0.0133, + "epoch": 0.66, + "learning_rate": 0.00020163590223468754, + "loss": 0.0145, "step": 252980 }, { - "epoch": 1.28, - "learning_rate": 0.00010854493443855284, - "loss": 0.009, + "epoch": 0.66, + "learning_rate": 0.00020163201401831609, + "loss": 0.0146, "step": 252990 }, { - "epoch": 1.28, - "learning_rate": 0.00010853736674553883, - "loss": 0.0104, + "epoch": 0.66, + "learning_rate": 0.0002016281258019446, + "loss": 0.0166, "step": 253000 }, { - "epoch": 1.28, - "eval_cer": 0.914462492734159, - "eval_loss": 0.006441994570195675, - "eval_runtime": 116.0386, - "eval_samples_per_second": 17.236, - "eval_steps_per_second": 4.309, + "epoch": 0.66, + "eval_cer": 0.8817474747050615, + "eval_loss": 0.01099295075982809, + "eval_runtime": 107.2229, + "eval_samples_per_second": 18.653, + "eval_steps_per_second": 4.663, "step": 253000 }, { - "epoch": 1.28, - "learning_rate": 0.00010852979905252482, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020162423758557314, + "loss": 0.0204, "step": 253010 }, { - "epoch": 1.28, - "learning_rate": 0.0001085222313595108, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020162034936920168, + "loss": 0.0127, "step": 253020 }, { - "epoch": 1.28, - "learning_rate": 0.0001085146636664968, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020161646115283023, + "loss": 0.0175, "step": 253030 }, { - "epoch": 1.28, - "learning_rate": 0.00010850709597348279, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020161257293645874, + "loss": 0.0173, "step": 253040 }, { - "epoch": 1.28, - "learning_rate": 0.00010849952828046877, - "loss": 0.0061, + "epoch": 0.66, + "learning_rate": 0.00020160868472008728, + "loss": 0.0143, "step": 253050 }, { - "epoch": 1.28, - "learning_rate": 0.00010849196058745477, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020160479650371585, + "loss": 0.0155, "step": 253060 }, { - "epoch": 1.28, - "learning_rate": 0.00010848439289444076, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020160090828734437, + "loss": 0.0144, "step": 253070 }, { - "epoch": 1.28, - "learning_rate": 0.00010847682520142675, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.00020159702007097288, + "loss": 0.0206, "step": 253080 }, { - "epoch": 1.28, - "learning_rate": 0.00010846925750841274, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020159313185460142, + "loss": 0.0134, "step": 253090 }, { - "epoch": 1.28, - "learning_rate": 0.00010846168981539872, - "loss": 0.0116, + "epoch": 0.66, + "learning_rate": 0.00020158924363822994, + "loss": 0.0153, "step": 253100 }, { - "epoch": 1.28, - "learning_rate": 0.00010845412212238472, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.0002015853554218585, + "loss": 0.0128, "step": 253110 }, { - "epoch": 1.28, - "learning_rate": 0.00010844655442937071, - "loss": 0.0119, + "epoch": 0.66, + "learning_rate": 0.00020158146720548705, + "loss": 0.0214, "step": 253120 }, { - "epoch": 1.28, - "learning_rate": 0.00010843898673635669, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020157757898911556, + "loss": 0.0137, "step": 253130 }, { - "epoch": 1.28, - "learning_rate": 0.00010843141904334269, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.0002015736907727441, + "loss": 0.0133, "step": 253140 }, { - "epoch": 1.28, - "learning_rate": 0.00010842385135032868, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020156980255637264, + "loss": 0.0142, "step": 253150 }, { - "epoch": 1.28, - "learning_rate": 0.00010841628365731466, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020156591434000119, + "loss": 0.0191, "step": 253160 }, { - "epoch": 1.28, - "learning_rate": 0.00010840871596430066, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.0002015620261236297, + "loss": 0.0197, "step": 253170 }, { - "epoch": 1.28, - "learning_rate": 0.00010840114827128664, - "loss": 0.0056, + "epoch": 0.66, + "learning_rate": 0.00020155813790725824, + "loss": 0.0167, "step": 253180 }, { - "epoch": 1.28, - "learning_rate": 0.00010839358057827264, - "loss": 0.0105, + "epoch": 0.66, + "learning_rate": 0.00020155424969088678, + "loss": 0.0157, "step": 253190 }, { - "epoch": 1.28, - "learning_rate": 0.00010838601288525863, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020155036147451533, + "loss": 0.0145, "step": 253200 }, { - "epoch": 1.28, - "learning_rate": 0.00010837844519224461, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020154647325814384, + "loss": 0.0135, "step": 253210 }, { - "epoch": 1.28, - "learning_rate": 0.00010837087749923061, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020154258504177238, + "loss": 0.0172, "step": 253220 }, { - "epoch": 1.28, - "learning_rate": 0.0001083633098062166, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020153869682540092, + "loss": 0.0174, "step": 253230 }, { - "epoch": 1.28, - "learning_rate": 0.00010835574211320258, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020153480860902946, + "loss": 0.0173, "step": 253240 }, { - "epoch": 1.28, - "learning_rate": 0.00010834817442018858, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020153092039265798, + "loss": 0.0148, "step": 253250 }, { - "epoch": 1.28, - "learning_rate": 0.00010834060672717456, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.00020152703217628652, + "loss": 0.0129, "step": 253260 }, { - "epoch": 1.28, - "learning_rate": 0.00010833303903416056, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.0002015231439599151, + "loss": 0.0198, "step": 253270 }, { - "epoch": 1.28, - "learning_rate": 0.00010832547134114655, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.0002015192557435436, + "loss": 0.0142, "step": 253280 }, { - "epoch": 1.28, - "learning_rate": 0.00010831790364813253, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020151536752717215, + "loss": 0.0155, "step": 253290 }, { - "epoch": 1.28, - "learning_rate": 0.00010831033595511853, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020151147931080066, + "loss": 0.0198, "step": 253300 }, { - "epoch": 1.28, - "learning_rate": 0.00010830276826210452, - "loss": 0.0058, + "epoch": 0.66, + "learning_rate": 0.00020150759109442923, + "loss": 0.0132, "step": 253310 }, { - "epoch": 1.28, - "learning_rate": 0.0001082952005690905, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020150370287805774, + "loss": 0.0206, "step": 253320 }, { - "epoch": 1.28, - "learning_rate": 0.0001082876328760765, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020149981466168629, + "loss": 0.0175, "step": 253330 }, { - "epoch": 1.28, - "learning_rate": 0.00010828006518306249, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.0002014959264453148, + "loss": 0.0177, "step": 253340 }, { - "epoch": 1.28, - "learning_rate": 0.00010827249749004847, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020149203822894334, + "loss": 0.0158, "step": 253350 }, { - "epoch": 1.28, - "learning_rate": 0.00010826492979703447, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020148815001257188, + "loss": 0.0167, "step": 253360 }, { - "epoch": 1.28, - "learning_rate": 0.00010825736210402045, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020148426179620042, + "loss": 0.0233, "step": 253370 }, { - "epoch": 1.28, - "learning_rate": 0.00010824979441100645, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020148037357982894, + "loss": 0.0155, "step": 253380 }, { - "epoch": 1.28, - "learning_rate": 0.00010824222671799244, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020147648536345748, + "loss": 0.0182, "step": 253390 }, { - "epoch": 1.28, - "learning_rate": 0.00010823465902497842, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020147259714708602, + "loss": 0.0216, "step": 253400 }, { - "epoch": 1.28, - "learning_rate": 0.00010822709133196442, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020146870893071456, + "loss": 0.0154, "step": 253410 }, { - "epoch": 1.28, - "learning_rate": 0.00010821952363895041, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020146482071434308, + "loss": 0.0154, "step": 253420 }, { - "epoch": 1.28, - "learning_rate": 0.0001082119559459364, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020146093249797162, + "loss": 0.0133, "step": 253430 }, { - "epoch": 1.28, - "learning_rate": 0.00010820438825292239, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.0002014570442816002, + "loss": 0.0173, "step": 253440 }, { - "epoch": 1.28, - "learning_rate": 0.00010819682055990837, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.0002014531560652287, + "loss": 0.0117, "step": 253450 }, { - "epoch": 1.28, - "learning_rate": 0.00010818925286689437, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020144926784885725, + "loss": 0.0172, "step": 253460 }, { - "epoch": 1.28, - "learning_rate": 0.00010818168517388036, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020144537963248576, + "loss": 0.0137, "step": 253470 }, { - "epoch": 1.28, - "learning_rate": 0.00010817411748086634, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020144149141611433, + "loss": 0.0156, "step": 253480 }, { - "epoch": 1.28, - "learning_rate": 0.00010816654978785234, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020143760319974284, + "loss": 0.0168, "step": 253490 }, { - "epoch": 1.28, - "learning_rate": 0.00010815898209483833, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020143371498337138, + "loss": 0.0166, "step": 253500 }, { - "epoch": 1.28, - "learning_rate": 0.00010815141440182431, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.0002014298267669999, + "loss": 0.015, "step": 253510 }, { - "epoch": 1.28, - "learning_rate": 0.00010814384670881031, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020142593855062847, + "loss": 0.0144, "step": 253520 }, { - "epoch": 1.28, - "learning_rate": 0.00010813627901579629, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020142205033425698, + "loss": 0.0177, "step": 253530 }, { - "epoch": 1.28, - "learning_rate": 0.00010812871132278228, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020141816211788552, + "loss": 0.014, "step": 253540 }, { - "epoch": 1.28, - "learning_rate": 0.00010812114362976828, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020141427390151404, + "loss": 0.0185, "step": 253550 }, { - "epoch": 1.28, - "learning_rate": 0.00010811357593675426, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.0002014103856851426, + "loss": 0.0158, "step": 253560 }, { - "epoch": 1.28, - "learning_rate": 0.00010810600824374026, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020140649746877112, + "loss": 0.0159, "step": 253570 }, { - "epoch": 1.28, - "learning_rate": 0.00010809844055072622, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020140260925239966, + "loss": 0.0155, "step": 253580 }, { - "epoch": 1.28, - "learning_rate": 0.00010809087285771222, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020139872103602818, + "loss": 0.0209, "step": 253590 }, { - "epoch": 1.28, - "learning_rate": 0.00010808330516469821, - "loss": 0.0106, + "epoch": 0.66, + "learning_rate": 0.00020139483281965672, + "loss": 0.0128, "step": 253600 }, { - "epoch": 1.28, - "learning_rate": 0.0001080757374716842, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.0002013909446032853, + "loss": 0.0163, "step": 253610 }, { - "epoch": 1.28, - "learning_rate": 0.00010806816977867019, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.0002013870563869138, + "loss": 0.014, "step": 253620 }, { - "epoch": 1.28, - "learning_rate": 0.00010806060208565617, - "loss": 0.0113, + "epoch": 0.66, + "learning_rate": 0.00020138316817054232, + "loss": 0.0204, "step": 253630 }, { - "epoch": 1.28, - "learning_rate": 0.00010805303439264217, - "loss": 0.0108, + "epoch": 0.66, + "learning_rate": 0.00020137927995417086, + "loss": 0.0152, "step": 253640 }, { - "epoch": 1.28, - "learning_rate": 0.00010804546669962816, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020137539173779943, + "loss": 0.0158, "step": 253650 }, { - "epoch": 1.28, - "learning_rate": 0.00010803789900661414, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020137150352142794, + "loss": 0.0186, "step": 253660 }, { - "epoch": 1.28, - "learning_rate": 0.00010803033131360014, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020136761530505648, + "loss": 0.0169, "step": 253670 }, { - "epoch": 1.28, - "learning_rate": 0.00010802276362058613, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.000201363727088685, + "loss": 0.0172, "step": 253680 }, { - "epoch": 1.28, - "learning_rate": 0.00010801519592757211, - "loss": 0.0111, + "epoch": 0.66, + "learning_rate": 0.00020135983887231357, + "loss": 0.0151, "step": 253690 }, { - "epoch": 1.28, - "learning_rate": 0.00010800762823455811, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020135595065594208, + "loss": 0.0153, "step": 253700 }, { - "epoch": 1.28, - "learning_rate": 0.00010800006054154409, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020135206243957062, + "loss": 0.0139, "step": 253710 }, { - "epoch": 1.28, - "learning_rate": 0.00010799249284853009, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020134817422319914, + "loss": 0.0178, "step": 253720 }, { - "epoch": 1.28, - "learning_rate": 0.00010798492515551608, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.0002013442860068277, + "loss": 0.015, "step": 253730 }, { - "epoch": 1.28, - "learning_rate": 0.00010797735746250206, - "loss": 0.0064, + "epoch": 0.66, + "learning_rate": 0.00020134039779045622, + "loss": 0.018, "step": 253740 }, { - "epoch": 1.28, - "learning_rate": 0.00010796978976948806, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020133650957408476, + "loss": 0.0172, "step": 253750 }, { - "epoch": 1.28, - "learning_rate": 0.00010796222207647405, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020133262135771328, + "loss": 0.014, "step": 253760 }, { - "epoch": 1.28, - "learning_rate": 0.00010795465438346003, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020132873314134185, + "loss": 0.0151, "step": 253770 }, { - "epoch": 1.28, - "learning_rate": 0.00010794708669044603, - "loss": 0.0114, + "epoch": 0.66, + "learning_rate": 0.0002013248449249704, + "loss": 0.0165, "step": 253780 }, { - "epoch": 1.28, - "learning_rate": 0.00010793951899743202, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.0002013209567085989, + "loss": 0.0146, "step": 253790 }, { - "epoch": 1.28, - "learning_rate": 0.000107931951304418, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020131706849222742, + "loss": 0.0159, "step": 253800 }, { - "epoch": 1.28, - "learning_rate": 0.000107924383611404, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020131318027585599, + "loss": 0.0156, "step": 253810 }, { - "epoch": 1.28, - "learning_rate": 0.00010791681591838998, - "loss": 0.0109, + "epoch": 0.66, + "learning_rate": 0.00020130929205948453, + "loss": 0.0131, "step": 253820 }, { - "epoch": 1.28, - "learning_rate": 0.00010790924822537598, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020130540384311304, + "loss": 0.0166, "step": 253830 }, { - "epoch": 1.28, - "learning_rate": 0.00010790168053236197, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020130151562674158, + "loss": 0.013, "step": 253840 }, { - "epoch": 1.28, - "learning_rate": 0.00010789411283934795, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.0002012976274103701, + "loss": 0.0133, "step": 253850 }, { - "epoch": 1.28, - "learning_rate": 0.00010788654514633395, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020129373919399867, + "loss": 0.0143, "step": 253860 }, { - "epoch": 1.28, - "learning_rate": 0.00010787897745331994, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020128985097762718, + "loss": 0.0162, "step": 253870 }, { - "epoch": 1.28, - "learning_rate": 0.00010787140976030592, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020128596276125572, + "loss": 0.0159, "step": 253880 }, { - "epoch": 1.28, - "learning_rate": 0.00010786384206729192, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020128207454488424, + "loss": 0.0179, "step": 253890 }, { - "epoch": 1.28, - "learning_rate": 0.0001078562743742779, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.0002012781863285128, + "loss": 0.0172, "step": 253900 }, { - "epoch": 1.28, - "learning_rate": 0.0001078487066812639, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020127429811214132, + "loss": 0.0172, "step": 253910 }, { - "epoch": 1.28, - "learning_rate": 0.00010784113898824989, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.00020127040989576986, + "loss": 0.0153, "step": 253920 }, { - "epoch": 1.28, - "learning_rate": 0.00010783357129523587, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020126652167939838, + "loss": 0.0216, "step": 253930 }, { - "epoch": 1.28, - "learning_rate": 0.00010782600360222187, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.00020126263346302695, + "loss": 0.0136, "step": 253940 }, { - "epoch": 1.28, - "learning_rate": 0.00010781843590920786, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020125874524665546, + "loss": 0.0157, "step": 253950 }, { - "epoch": 1.28, - "learning_rate": 0.00010781086821619384, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.000201254857030284, + "loss": 0.0148, "step": 253960 }, { - "epoch": 1.28, - "learning_rate": 0.00010780330052317984, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020125096881391252, + "loss": 0.0174, "step": 253970 }, { - "epoch": 1.28, - "learning_rate": 0.00010779573283016582, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020124708059754109, + "loss": 0.0191, "step": 253980 }, { - "epoch": 1.28, - "learning_rate": 0.00010778816513715182, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020124319238116963, + "loss": 0.013, "step": 253990 }, { - "epoch": 1.28, - "learning_rate": 0.00010778059744413781, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020123930416479814, + "loss": 0.0141, "step": 254000 }, { - "epoch": 1.28, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.00646965904161334, - "eval_runtime": 116.1648, - "eval_samples_per_second": 17.217, - "eval_steps_per_second": 4.304, + "epoch": 0.66, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.010805866681039333, + "eval_runtime": 107.3516, + "eval_samples_per_second": 18.63, + "eval_steps_per_second": 4.658, "step": 254000 }, { - "epoch": 1.28, - "learning_rate": 0.00010777302975112379, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020123541594842668, + "loss": 0.0205, "step": 254010 }, { - "epoch": 1.28, - "learning_rate": 0.00010776546205810979, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020123152773205522, + "loss": 0.0176, "step": 254020 }, { - "epoch": 1.28, - "learning_rate": 0.00010775789436509578, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020122763951568377, + "loss": 0.0166, "step": 254030 }, { - "epoch": 1.28, - "learning_rate": 0.00010775032667208176, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020122375129931228, + "loss": 0.013, "step": 254040 }, { - "epoch": 1.28, - "learning_rate": 0.00010774275897906776, - "loss": 0.0056, + "epoch": 0.66, + "learning_rate": 0.00020121986308294082, + "loss": 0.0134, "step": 254050 }, { - "epoch": 1.28, - "learning_rate": 0.00010773519128605374, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020121597486656936, + "loss": 0.0142, "step": 254060 }, { - "epoch": 1.28, - "learning_rate": 0.00010772762359303973, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.0002012120866501979, + "loss": 0.0137, "step": 254070 }, { - "epoch": 1.28, - "learning_rate": 0.00010772005590002573, - "loss": 0.0117, + "epoch": 0.66, + "learning_rate": 0.00020120819843382642, + "loss": 0.0142, "step": 254080 }, { - "epoch": 1.28, - "learning_rate": 0.00010771248820701171, - "loss": 0.0115, + "epoch": 0.66, + "learning_rate": 0.00020120431021745496, + "loss": 0.0122, "step": 254090 }, { - "epoch": 1.28, - "learning_rate": 0.0001077049205139977, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020120042200108348, + "loss": 0.0176, "step": 254100 }, { - "epoch": 1.28, - "learning_rate": 0.0001076973528209837, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020119653378471205, + "loss": 0.0149, "step": 254110 }, { - "epoch": 1.28, - "learning_rate": 0.00010768978512796968, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020119264556834056, + "loss": 0.0146, "step": 254120 }, { - "epoch": 1.28, - "learning_rate": 0.00010768221743495568, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.0002011887573519691, + "loss": 0.0158, "step": 254130 }, { - "epoch": 1.28, - "learning_rate": 0.00010767464974194166, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020118486913559762, + "loss": 0.0141, "step": 254140 }, { - "epoch": 1.28, - "learning_rate": 0.00010766708204892765, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020118098091922618, + "loss": 0.012, "step": 254150 }, { - "epoch": 1.28, - "learning_rate": 0.00010765951435591365, - "loss": 0.0119, + "epoch": 0.66, + "learning_rate": 0.00020117709270285473, + "loss": 0.0135, "step": 254160 }, { - "epoch": 1.28, - "learning_rate": 0.00010765194666289963, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020117320448648324, + "loss": 0.0151, "step": 254170 }, { - "epoch": 1.28, - "learning_rate": 0.00010764437896988563, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020116931627011178, + "loss": 0.0219, "step": 254180 }, { - "epoch": 1.28, - "learning_rate": 0.00010763681127687162, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020116542805374032, + "loss": 0.0167, "step": 254190 }, { - "epoch": 1.28, - "learning_rate": 0.0001076292435838576, - "loss": 0.0095, - "step": 254200 + "epoch": 0.66, + "learning_rate": 0.00020116153983736887, + "loss": 0.0172, + "step": 254200 }, { - "epoch": 1.28, - "learning_rate": 0.00010762167589084358, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020115765162099738, + "loss": 0.0163, "step": 254210 }, { - "epoch": 1.28, - "learning_rate": 0.00010761410819782956, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020115376340462592, + "loss": 0.0141, "step": 254220 }, { - "epoch": 1.28, - "learning_rate": 0.00010760654050481556, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020114987518825446, + "loss": 0.0168, "step": 254230 }, { - "epoch": 1.28, - "learning_rate": 0.00010759897281180155, - "loss": 0.0107, + "epoch": 0.66, + "learning_rate": 0.000201145986971883, + "loss": 0.0152, "step": 254240 }, { - "epoch": 1.28, - "learning_rate": 0.00010759140511878754, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020114209875551152, + "loss": 0.013, "step": 254250 }, { - "epoch": 1.28, - "learning_rate": 0.00010758383742577353, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020113821053914006, + "loss": 0.0168, "step": 254260 }, { - "epoch": 1.28, - "learning_rate": 0.00010757626973275951, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002011343223227686, + "loss": 0.0165, "step": 254270 }, { - "epoch": 1.28, - "learning_rate": 0.00010756870203974551, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020113043410639714, + "loss": 0.0132, "step": 254280 }, { - "epoch": 1.28, - "learning_rate": 0.0001075611343467315, - "loss": 0.0054, + "epoch": 0.66, + "learning_rate": 0.00020112654589002566, + "loss": 0.0134, "step": 254290 }, { - "epoch": 1.28, - "learning_rate": 0.00010755356665371748, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.0002011226576736542, + "loss": 0.016, "step": 254300 }, { - "epoch": 1.28, - "learning_rate": 0.00010754599896070348, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020111876945728272, + "loss": 0.0159, "step": 254310 }, { - "epoch": 1.28, - "learning_rate": 0.00010753843126768947, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020111488124091128, + "loss": 0.0178, "step": 254320 }, { - "epoch": 1.28, - "learning_rate": 0.00010753086357467546, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020111099302453983, + "loss": 0.0181, "step": 254330 }, { - "epoch": 1.28, - "learning_rate": 0.00010752329588166145, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020110710480816834, + "loss": 0.0201, "step": 254340 }, { - "epoch": 1.28, - "learning_rate": 0.00010751572818864743, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020110321659179685, + "loss": 0.0175, "step": 254350 }, { - "epoch": 1.28, - "learning_rate": 0.00010750816049563343, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020109932837542542, + "loss": 0.0134, "step": 254360 }, { - "epoch": 1.28, - "learning_rate": 0.00010750059280261942, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020109544015905396, + "loss": 0.0165, "step": 254370 }, { - "epoch": 1.28, - "learning_rate": 0.0001074930251096054, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020109155194268248, + "loss": 0.0126, "step": 254380 }, { - "epoch": 1.28, - "learning_rate": 0.0001074854574165914, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020108766372631102, + "loss": 0.0118, "step": 254390 }, { - "epoch": 1.28, - "learning_rate": 0.0001074778897235774, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020108377550993956, + "loss": 0.0143, "step": 254400 }, { - "epoch": 1.28, - "learning_rate": 0.00010747032203056337, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.0002010798872935681, + "loss": 0.0135, "step": 254410 }, { - "epoch": 1.28, - "learning_rate": 0.00010746275433754937, - "loss": 0.0174, + "epoch": 0.66, + "learning_rate": 0.00020107599907719662, + "loss": 0.0126, "step": 254420 }, { - "epoch": 1.28, - "learning_rate": 0.00010745518664453535, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020107211086082516, + "loss": 0.0135, "step": 254430 }, { - "epoch": 1.28, - "learning_rate": 0.00010744761895152135, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.0002010682226444537, + "loss": 0.0134, "step": 254440 }, { - "epoch": 1.28, - "learning_rate": 0.00010744005125850734, - "loss": 0.0054, + "epoch": 0.66, + "learning_rate": 0.00020106433442808224, + "loss": 0.0169, "step": 254450 }, { - "epoch": 1.28, - "learning_rate": 0.00010743248356549332, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020106044621171076, + "loss": 0.0138, "step": 254460 }, { - "epoch": 1.28, - "learning_rate": 0.00010742491587247932, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.0002010565579953393, + "loss": 0.0155, "step": 254470 }, { - "epoch": 1.28, - "learning_rate": 0.00010741734817946531, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020105266977896787, + "loss": 0.0136, "step": 254480 }, { - "epoch": 1.28, - "learning_rate": 0.0001074097804864513, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020104878156259638, + "loss": 0.0154, "step": 254490 }, { - "epoch": 1.28, - "learning_rate": 0.00010740221279343729, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.0002010448933462249, + "loss": 0.0161, "step": 254500 }, { - "epoch": 1.28, - "learning_rate": 0.00010739464510042327, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020104100512985344, + "loss": 0.0144, "step": 254510 }, { - "epoch": 1.28, - "learning_rate": 0.00010738707740740927, - "loss": 0.011, + "epoch": 0.66, + "learning_rate": 0.000201037116913482, + "loss": 0.014, "step": 254520 }, { - "epoch": 1.28, - "learning_rate": 0.00010737950971439526, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020103322869711052, + "loss": 0.0127, "step": 254530 }, { - "epoch": 1.28, - "learning_rate": 0.00010737194202138124, - "loss": 0.0104, + "epoch": 0.66, + "learning_rate": 0.00020102934048073906, + "loss": 0.0126, "step": 254540 }, { - "epoch": 1.28, - "learning_rate": 0.00010736437432836724, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020102545226436758, + "loss": 0.0143, "step": 254550 }, { - "epoch": 1.28, - "learning_rate": 0.00010735680663535323, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020102156404799612, + "loss": 0.0136, "step": 254560 }, { - "epoch": 1.28, - "learning_rate": 0.00010734923894233921, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020101767583162466, + "loss": 0.0157, "step": 254570 }, { - "epoch": 1.28, - "learning_rate": 0.00010734167124932521, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.0002010137876152532, + "loss": 0.0171, "step": 254580 }, { - "epoch": 1.28, - "learning_rate": 0.00010733410355631119, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020100989939888172, + "loss": 0.0158, "step": 254590 }, { - "epoch": 1.28, - "learning_rate": 0.00010732653586329718, - "loss": 0.0133, + "epoch": 0.66, + "learning_rate": 0.00020100601118251026, + "loss": 0.0177, "step": 254600 }, { - "epoch": 1.28, - "learning_rate": 0.00010731896817028318, - "loss": 0.0108, + "epoch": 0.66, + "learning_rate": 0.0002010021229661388, + "loss": 0.0137, "step": 254610 }, { - "epoch": 1.28, - "learning_rate": 0.00010731140047726916, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020099823474976734, + "loss": 0.0129, "step": 254620 }, { - "epoch": 1.28, - "learning_rate": 0.00010730383278425516, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020099434653339586, + "loss": 0.013, "step": 254630 }, { - "epoch": 1.28, - "learning_rate": 0.00010729626509124115, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.0002009904583170244, + "loss": 0.0169, "step": 254640 }, { - "epoch": 1.28, - "learning_rate": 0.00010728869739822713, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020098657010065297, + "loss": 0.0113, "step": 254650 }, { - "epoch": 1.28, - "learning_rate": 0.00010728112970521313, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020098268188428148, + "loss": 0.0133, "step": 254660 }, { - "epoch": 1.28, - "learning_rate": 0.00010727356201219911, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020097879366791, + "loss": 0.0189, "step": 254670 }, { - "epoch": 1.28, - "learning_rate": 0.0001072659943191851, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020097490545153854, + "loss": 0.0176, "step": 254680 }, { - "epoch": 1.28, - "learning_rate": 0.0001072584266261711, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.0002009710172351671, + "loss": 0.0147, "step": 254690 }, { - "epoch": 1.28, - "learning_rate": 0.00010725085893315708, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.00020096712901879562, + "loss": 0.0142, "step": 254700 }, { - "epoch": 1.29, - "learning_rate": 0.00010724329124014308, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020096324080242416, + "loss": 0.016, "step": 254710 }, { - "epoch": 1.29, - "learning_rate": 0.00010723572354712907, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020095935258605268, + "loss": 0.0205, "step": 254720 }, { - "epoch": 1.29, - "learning_rate": 0.00010722815585411505, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020095546436968125, + "loss": 0.0131, "step": 254730 }, { - "epoch": 1.29, - "learning_rate": 0.00010722058816110105, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020095157615330976, + "loss": 0.0159, "step": 254740 }, { - "epoch": 1.29, - "learning_rate": 0.00010721302046808704, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002009476879369383, + "loss": 0.0127, "step": 254750 }, { - "epoch": 1.29, - "learning_rate": 0.00010720545277507302, - "loss": 0.0093, + "epoch": 0.66, + "learning_rate": 0.00020094379972056682, + "loss": 0.0165, "step": 254760 }, { - "epoch": 1.29, - "learning_rate": 0.00010719788508205902, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.0002009399115041954, + "loss": 0.0133, "step": 254770 }, { - "epoch": 1.29, - "learning_rate": 0.000107190317389045, - "loss": 0.0109, + "epoch": 0.66, + "learning_rate": 0.0002009360232878239, + "loss": 0.0169, "step": 254780 }, { - "epoch": 1.29, - "learning_rate": 0.000107182749696031, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020093213507145244, + "loss": 0.0171, "step": 254790 }, { - "epoch": 1.29, - "learning_rate": 0.00010717518200301699, - "loss": 0.0088, + "epoch": 0.66, + "learning_rate": 0.00020092824685508096, + "loss": 0.0157, "step": 254800 }, { - "epoch": 1.29, - "learning_rate": 0.00010716761431000297, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.0002009243586387095, + "loss": 0.0175, "step": 254810 }, { - "epoch": 1.29, - "learning_rate": 0.00010716004661698897, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020092047042233804, + "loss": 0.017, "step": 254820 }, { - "epoch": 1.29, - "learning_rate": 0.00010715247892397496, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020091658220596658, + "loss": 0.0155, "step": 254830 }, { - "epoch": 1.29, - "learning_rate": 0.00010714491123096093, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.0002009126939895951, + "loss": 0.013, "step": 254840 }, { - "epoch": 1.29, - "learning_rate": 0.00010713734353794692, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020090880577322364, + "loss": 0.017, "step": 254850 }, { - "epoch": 1.29, - "learning_rate": 0.0001071297758449329, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.0002009049175568522, + "loss": 0.0183, "step": 254860 }, { - "epoch": 1.29, - "learning_rate": 0.0001071222081519189, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020090102934048072, + "loss": 0.016, "step": 254870 }, { - "epoch": 1.29, - "learning_rate": 0.00010711464045890488, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020089714112410926, + "loss": 0.0139, "step": 254880 }, { - "epoch": 1.29, - "learning_rate": 0.00010710707276589088, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020089325290773778, + "loss": 0.0163, "step": 254890 }, { - "epoch": 1.29, - "learning_rate": 0.00010709950507287687, - "loss": 0.0063, + "epoch": 0.66, + "learning_rate": 0.00020088936469136635, + "loss": 0.0139, "step": 254900 }, { - "epoch": 1.29, - "learning_rate": 0.00010709193737986285, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020088547647499486, + "loss": 0.0155, "step": 254910 }, { - "epoch": 1.29, - "learning_rate": 0.00010708436968684885, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.0002008815882586234, + "loss": 0.015, "step": 254920 }, { - "epoch": 1.29, - "learning_rate": 0.00010707680199383484, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020087770004225192, + "loss": 0.014, "step": 254930 }, { - "epoch": 1.29, - "learning_rate": 0.00010706923430082082, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020087381182588049, + "loss": 0.0157, "step": 254940 }, { - "epoch": 1.29, - "learning_rate": 0.00010706166660780682, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.000200869923609509, + "loss": 0.0137, "step": 254950 }, { - "epoch": 1.29, - "learning_rate": 0.0001070540989147928, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020086603539313754, + "loss": 0.0126, "step": 254960 }, { - "epoch": 1.29, - "learning_rate": 0.0001070465312217788, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020086214717676606, + "loss": 0.0135, "step": 254970 }, { - "epoch": 1.29, - "learning_rate": 0.00010703896352876479, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020085825896039463, + "loss": 0.0141, "step": 254980 }, { - "epoch": 1.29, - "learning_rate": 0.00010703139583575077, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020085437074402314, + "loss": 0.014, "step": 254990 }, { - "epoch": 1.29, - "learning_rate": 0.00010702382814273677, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020085048252765168, + "loss": 0.0139, "step": 255000 }, { - "epoch": 1.29, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.006503617390990257, - "eval_runtime": 116.441, - "eval_samples_per_second": 17.176, - "eval_steps_per_second": 4.294, + "epoch": 0.66, + "eval_cer": 0.8817488743419957, + "eval_loss": 0.010790371336042881, + "eval_runtime": 107.3987, + "eval_samples_per_second": 18.622, + "eval_steps_per_second": 4.656, "step": 255000 }, { - "epoch": 1.29, - "learning_rate": 0.00010701626044972276, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.0002008465943112802, + "loss": 0.0133, "step": 255010 }, { - "epoch": 1.29, - "learning_rate": 0.00010700869275670874, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020084270609490876, + "loss": 0.0159, "step": 255020 }, { - "epoch": 1.29, - "learning_rate": 0.00010700112506369474, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.0002008388178785373, + "loss": 0.0153, "step": 255030 }, { - "epoch": 1.29, - "learning_rate": 0.00010699355737068072, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020083492966216582, + "loss": 0.0155, "step": 255040 }, { - "epoch": 1.29, - "learning_rate": 0.00010698598967766672, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020083104144579436, + "loss": 0.0147, "step": 255050 }, { - "epoch": 1.29, - "learning_rate": 0.00010697842198465271, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020082715322942288, + "loss": 0.0162, "step": 255060 }, { - "epoch": 1.29, - "learning_rate": 0.00010697085429163869, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020082326501305145, + "loss": 0.0118, "step": 255070 }, { - "epoch": 1.29, - "learning_rate": 0.00010696328659862469, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020081937679667996, + "loss": 0.0139, "step": 255080 }, { - "epoch": 1.29, - "learning_rate": 0.00010695571890561068, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.0002008154885803085, + "loss": 0.0164, "step": 255090 }, { - "epoch": 1.29, - "learning_rate": 0.00010694815121259666, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020081160036393702, + "loss": 0.0166, "step": 255100 }, { - "epoch": 1.29, - "learning_rate": 0.00010694058351958266, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020080771214756559, + "loss": 0.0156, "step": 255110 }, { - "epoch": 1.29, - "learning_rate": 0.00010693301582656864, - "loss": 0.0108, + "epoch": 0.66, + "learning_rate": 0.0002008038239311941, + "loss": 0.0123, "step": 255120 }, { - "epoch": 1.29, - "learning_rate": 0.00010692544813355463, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020079993571482264, + "loss": 0.0141, "step": 255130 }, { - "epoch": 1.29, - "learning_rate": 0.00010691788044054063, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.00020079604749845116, + "loss": 0.0141, "step": 255140 }, { - "epoch": 1.29, - "learning_rate": 0.00010691031274752661, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020079215928207972, + "loss": 0.0199, "step": 255150 }, { - "epoch": 1.29, - "learning_rate": 0.0001069027450545126, - "loss": 0.0064, + "epoch": 0.66, + "learning_rate": 0.00020078827106570824, + "loss": 0.0165, "step": 255160 }, { - "epoch": 1.29, - "learning_rate": 0.0001068951773614986, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020078438284933678, + "loss": 0.0152, "step": 255170 }, { - "epoch": 1.29, - "learning_rate": 0.00010688760966848458, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.0002007804946329653, + "loss": 0.0135, "step": 255180 }, { - "epoch": 1.29, - "learning_rate": 0.00010688004197547058, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020077660641659386, + "loss": 0.0189, "step": 255190 }, { - "epoch": 1.29, - "learning_rate": 0.00010687247428245656, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.0002007727182002224, + "loss": 0.0189, "step": 255200 }, { - "epoch": 1.29, - "learning_rate": 0.00010686490658944255, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.00020076882998385092, + "loss": 0.0133, "step": 255210 }, { - "epoch": 1.29, - "learning_rate": 0.00010685733889642855, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020076494176747943, + "loss": 0.02, "step": 255220 }, { - "epoch": 1.29, - "learning_rate": 0.00010684977120341453, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.000200761053551108, + "loss": 0.0167, "step": 255230 }, { - "epoch": 1.29, - "learning_rate": 0.00010684220351040053, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020075716533473655, + "loss": 0.0172, "step": 255240 }, { - "epoch": 1.29, - "learning_rate": 0.00010683463581738652, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020075327711836506, + "loss": 0.0183, "step": 255250 }, { - "epoch": 1.29, - "learning_rate": 0.0001068270681243725, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.0002007493889019936, + "loss": 0.0128, "step": 255260 }, { - "epoch": 1.29, - "learning_rate": 0.0001068195004313585, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020074550068562214, + "loss": 0.0139, "step": 255270 }, { - "epoch": 1.29, - "learning_rate": 0.00010681193273834449, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020074161246925068, + "loss": 0.0164, "step": 255280 }, { - "epoch": 1.29, - "learning_rate": 0.00010680436504533047, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.0002007377242528792, + "loss": 0.0126, "step": 255290 }, { - "epoch": 1.29, - "learning_rate": 0.00010679679735231647, - "loss": 0.009, + "epoch": 0.66, + "learning_rate": 0.00020073383603650774, + "loss": 0.0184, "step": 255300 }, { - "epoch": 1.29, - "learning_rate": 0.00010678922965930245, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020072994782013626, + "loss": 0.015, "step": 255310 }, { - "epoch": 1.29, - "learning_rate": 0.00010678166196628845, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020072605960376482, + "loss": 0.014, "step": 255320 }, { - "epoch": 1.29, - "learning_rate": 0.00010677409427327444, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020072217138739334, + "loss": 0.0172, "step": 255330 }, { - "epoch": 1.29, - "learning_rate": 0.00010676652658026042, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020071828317102188, + "loss": 0.0137, "step": 255340 }, { - "epoch": 1.29, - "learning_rate": 0.00010675895888724642, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002007143949546504, + "loss": 0.0147, "step": 255350 }, { - "epoch": 1.29, - "learning_rate": 0.00010675139119423241, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020071050673827896, + "loss": 0.0142, "step": 255360 }, { - "epoch": 1.29, - "learning_rate": 0.00010674382350121839, - "loss": 0.0111, + "epoch": 0.66, + "learning_rate": 0.0002007066185219075, + "loss": 0.0157, "step": 255370 }, { - "epoch": 1.29, - "learning_rate": 0.00010673625580820439, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020070273030553602, + "loss": 0.0167, "step": 255380 }, { - "epoch": 1.29, - "learning_rate": 0.00010672868811519037, - "loss": 0.0074, + "epoch": 0.66, + "learning_rate": 0.00020069884208916453, + "loss": 0.0157, "step": 255390 }, { - "epoch": 1.29, - "learning_rate": 0.00010672112042217636, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.0002006949538727931, + "loss": 0.0157, "step": 255400 }, { - "epoch": 1.29, - "learning_rate": 0.00010671355272916236, - "loss": 0.0106, + "epoch": 0.66, + "learning_rate": 0.00020069106565642164, + "loss": 0.0133, "step": 255410 }, { - "epoch": 1.29, - "learning_rate": 0.00010670598503614834, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020068717744005016, + "loss": 0.0178, "step": 255420 }, { - "epoch": 1.29, - "learning_rate": 0.00010669841734313434, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.0002006832892236787, + "loss": 0.0161, "step": 255430 }, { - "epoch": 1.29, - "learning_rate": 0.00010669084965012033, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020067940100730724, + "loss": 0.0141, "step": 255440 }, { - "epoch": 1.29, - "learning_rate": 0.00010668328195710631, - "loss": 0.0077, + "epoch": 0.66, + "learning_rate": 0.00020067551279093578, + "loss": 0.0139, "step": 255450 }, { - "epoch": 1.29, - "learning_rate": 0.00010667571426409231, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.0002006716245745643, + "loss": 0.0165, "step": 255460 }, { - "epoch": 1.29, - "learning_rate": 0.00010666814657107828, - "loss": 0.0067, + "epoch": 0.66, + "learning_rate": 0.00020066773635819284, + "loss": 0.0136, "step": 255470 }, { - "epoch": 1.29, - "learning_rate": 0.00010666057887806427, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020066384814182138, + "loss": 0.017, "step": 255480 }, { - "epoch": 1.29, - "learning_rate": 0.00010665301118505025, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020065995992544992, + "loss": 0.0148, "step": 255490 }, { - "epoch": 1.29, - "learning_rate": 0.00010664544349203625, - "loss": 0.0123, + "epoch": 0.66, + "learning_rate": 0.00020065607170907844, + "loss": 0.0157, "step": 255500 }, { - "epoch": 1.29, - "learning_rate": 0.00010663787579902224, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020065218349270698, + "loss": 0.0146, "step": 255510 }, { - "epoch": 1.29, - "learning_rate": 0.00010663030810600822, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020064829527633555, + "loss": 0.0227, "step": 255520 }, { - "epoch": 1.29, - "learning_rate": 0.00010662274041299422, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020064440705996406, + "loss": 0.0131, "step": 255530 }, { - "epoch": 1.29, - "learning_rate": 0.00010661517271998021, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020064051884359258, + "loss": 0.0119, "step": 255540 }, { - "epoch": 1.29, - "learning_rate": 0.0001066076050269662, - "loss": 0.0059, + "epoch": 0.66, + "learning_rate": 0.00020063663062722112, + "loss": 0.0156, "step": 255550 }, { - "epoch": 1.29, - "learning_rate": 0.00010660003733395219, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020063274241084963, + "loss": 0.0156, "step": 255560 }, { - "epoch": 1.29, - "learning_rate": 0.00010659246964093817, - "loss": 0.0106, + "epoch": 0.66, + "learning_rate": 0.0002006288541944782, + "loss": 0.0135, "step": 255570 }, { - "epoch": 1.29, - "learning_rate": 0.00010658490194792417, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.00020062496597810674, + "loss": 0.0152, "step": 255580 }, { - "epoch": 1.29, - "learning_rate": 0.00010657733425491016, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020062107776173526, + "loss": 0.0184, "step": 255590 }, { - "epoch": 1.29, - "learning_rate": 0.00010656976656189614, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.0002006171895453638, + "loss": 0.0178, "step": 255600 }, { - "epoch": 1.29, - "learning_rate": 0.00010656219886888214, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020061330132899234, + "loss": 0.0174, "step": 255610 }, { - "epoch": 1.29, - "learning_rate": 0.00010655463117586813, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020060941311262088, + "loss": 0.0153, "step": 255620 }, { - "epoch": 1.29, - "learning_rate": 0.00010654706348285411, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.0002006055248962494, + "loss": 0.0203, "step": 255630 }, { - "epoch": 1.29, - "learning_rate": 0.00010653949578984011, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020060163667987794, + "loss": 0.0201, "step": 255640 }, { - "epoch": 1.29, - "learning_rate": 0.00010653192809682609, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020059774846350648, + "loss": 0.0173, "step": 255650 }, { - "epoch": 1.29, - "learning_rate": 0.00010652436040381209, - "loss": 0.0116, + "epoch": 0.66, + "learning_rate": 0.00020059386024713502, + "loss": 0.0183, "step": 255660 }, { - "epoch": 1.29, - "learning_rate": 0.00010651679271079808, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020058997203076354, + "loss": 0.0174, "step": 255670 }, { - "epoch": 1.29, - "learning_rate": 0.00010650922501778406, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020058608381439208, + "loss": 0.0173, "step": 255680 }, { - "epoch": 1.29, - "learning_rate": 0.00010650165732477006, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020058219559802062, + "loss": 0.0134, "step": 255690 }, { - "epoch": 1.29, - "learning_rate": 0.00010649408963175605, - "loss": 0.0062, + "epoch": 0.66, + "learning_rate": 0.00020057830738164916, + "loss": 0.0168, "step": 255700 }, { - "epoch": 1.29, - "learning_rate": 0.00010648652193874203, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020057441916527768, + "loss": 0.0165, "step": 255710 }, { - "epoch": 1.29, - "learning_rate": 0.00010647895424572803, - "loss": 0.006, + "epoch": 0.66, + "learning_rate": 0.00020057053094890622, + "loss": 0.0143, "step": 255720 }, { - "epoch": 1.29, - "learning_rate": 0.00010647138655271402, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.0002005666427325348, + "loss": 0.0157, "step": 255730 }, { - "epoch": 1.29, - "learning_rate": 0.0001064638188597, - "loss": 0.009, + "epoch": 0.66, + "learning_rate": 0.0002005627545161633, + "loss": 0.0165, "step": 255740 }, { - "epoch": 1.29, - "learning_rate": 0.000106456251166686, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.00020055886629979184, + "loss": 0.0195, "step": 255750 }, { - "epoch": 1.29, - "learning_rate": 0.00010644868347367198, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020055497808342036, + "loss": 0.0149, "step": 255760 }, { - "epoch": 1.29, - "learning_rate": 0.00010644111578065798, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020055108986704893, + "loss": 0.0134, "step": 255770 }, { - "epoch": 1.29, - "learning_rate": 0.00010643354808764397, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020054720165067744, + "loss": 0.0146, "step": 255780 }, { - "epoch": 1.29, - "learning_rate": 0.00010642598039462995, - "loss": 0.0097, + "epoch": 0.66, + "learning_rate": 0.00020054331343430598, + "loss": 0.016, "step": 255790 }, { - "epoch": 1.29, - "learning_rate": 0.00010641841270161595, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.0002005394252179345, + "loss": 0.0121, "step": 255800 }, { - "epoch": 1.29, - "learning_rate": 0.00010641084500860194, - "loss": 0.0061, + "epoch": 0.66, + "learning_rate": 0.00020053553700156304, + "loss": 0.0164, "step": 255810 }, { - "epoch": 1.29, - "learning_rate": 0.00010640327731558792, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020053164878519158, + "loss": 0.0148, "step": 255820 }, { - "epoch": 1.29, - "learning_rate": 0.00010639570962257392, - "loss": 0.0111, + "epoch": 0.66, + "learning_rate": 0.00020052776056882012, + "loss": 0.01, "step": 255830 }, { - "epoch": 1.29, - "learning_rate": 0.0001063881419295599, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020052387235244864, + "loss": 0.0147, "step": 255840 }, { - "epoch": 1.29, - "learning_rate": 0.0001063805742365459, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020051998413607718, + "loss": 0.0137, "step": 255850 }, { - "epoch": 1.29, - "learning_rate": 0.00010637300654353189, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020051609591970572, + "loss": 0.0124, "step": 255860 }, { - "epoch": 1.29, - "learning_rate": 0.00010636543885051787, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020051220770333426, + "loss": 0.0137, "step": 255870 }, { - "epoch": 1.29, - "learning_rate": 0.00010635787115750387, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020050831948696278, + "loss": 0.0149, "step": 255880 }, { - "epoch": 1.29, - "learning_rate": 0.00010635030346448986, - "loss": 0.0101, + "epoch": 0.66, + "learning_rate": 0.00020050443127059132, + "loss": 0.016, "step": 255890 }, { - "epoch": 1.29, - "learning_rate": 0.00010634273577147584, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002005005430542199, + "loss": 0.0157, "step": 255900 }, { - "epoch": 1.29, - "learning_rate": 0.00010633516807846184, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.0002004966548378484, + "loss": 0.0159, "step": 255910 }, { - "epoch": 1.29, - "learning_rate": 0.00010632760038544782, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020049276662147694, + "loss": 0.0137, "step": 255920 }, { - "epoch": 1.29, - "learning_rate": 0.00010632003269243381, - "loss": 0.0119, + "epoch": 0.66, + "learning_rate": 0.00020048887840510546, + "loss": 0.0196, "step": 255930 }, { - "epoch": 1.29, - "learning_rate": 0.00010631246499941981, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020048499018873403, + "loss": 0.0144, "step": 255940 }, { - "epoch": 1.29, - "learning_rate": 0.00010630489730640579, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020048110197236254, + "loss": 0.017, "step": 255950 }, { - "epoch": 1.29, - "learning_rate": 0.00010629732961339179, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.00020047721375599108, + "loss": 0.0147, "step": 255960 }, { - "epoch": 1.29, - "learning_rate": 0.00010628976192037778, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.0002004733255396196, + "loss": 0.0191, "step": 255970 }, { - "epoch": 1.29, - "learning_rate": 0.00010628219422736376, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020046943732324817, + "loss": 0.015, "step": 255980 }, { - "epoch": 1.29, - "learning_rate": 0.00010627462653434976, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020046554910687668, + "loss": 0.0153, "step": 255990 }, { - "epoch": 1.29, - "learning_rate": 0.00010626705884133574, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020046166089050522, + "loss": 0.0166, "step": 256000 }, { - "epoch": 1.29, - "eval_cer": 0.9144615223380336, - "eval_loss": 0.00655102264136076, - "eval_runtime": 116.4546, - "eval_samples_per_second": 17.174, - "eval_steps_per_second": 4.294, + "epoch": 0.66, + "eval_cer": 0.8818048598193629, + "eval_loss": 0.010679894126951694, + "eval_runtime": 107.5034, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, "step": 256000 }, { - "epoch": 1.29, - "learning_rate": 0.00010625949114832173, - "loss": 0.0075, + "epoch": 0.66, + "learning_rate": 0.00020045777267413374, + "loss": 0.0164, "step": 256010 }, { - "epoch": 1.29, - "learning_rate": 0.00010625192345530773, - "loss": 0.007, + "epoch": 0.66, + "learning_rate": 0.0002004538844577623, + "loss": 0.0223, "step": 256020 }, { - "epoch": 1.29, - "learning_rate": 0.00010624435576229371, - "loss": 0.01, + "epoch": 0.66, + "learning_rate": 0.00020044999624139082, + "loss": 0.0213, "step": 256030 }, { - "epoch": 1.29, - "learning_rate": 0.0001062367880692797, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020044610802501936, + "loss": 0.0197, "step": 256040 }, { - "epoch": 1.29, - "learning_rate": 0.0001062292203762657, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020044221980864788, + "loss": 0.0167, "step": 256050 }, { - "epoch": 1.29, - "learning_rate": 0.00010622165268325168, - "loss": 0.0081, + "epoch": 0.66, + "learning_rate": 0.00020043833159227642, + "loss": 0.0148, "step": 256060 }, { - "epoch": 1.29, - "learning_rate": 0.00010621408499023768, - "loss": 0.0099, + "epoch": 0.66, + "learning_rate": 0.00020043444337590499, + "loss": 0.0175, "step": 256070 }, { - "epoch": 1.29, - "learning_rate": 0.00010620651729722366, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.0002004305551595335, + "loss": 0.0215, "step": 256080 }, { - "epoch": 1.29, - "learning_rate": 0.00010619894960420965, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020042666694316202, + "loss": 0.019, "step": 256090 }, { - "epoch": 1.29, - "learning_rate": 0.00010619138191119562, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020042277872679056, + "loss": 0.0153, "step": 256100 }, { - "epoch": 1.29, - "learning_rate": 0.00010618381421818162, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020041889051041913, + "loss": 0.0154, "step": 256110 }, { - "epoch": 1.29, - "learning_rate": 0.00010617624652516761, - "loss": 0.008, + "epoch": 0.66, + "learning_rate": 0.00020041500229404764, + "loss": 0.0168, "step": 256120 }, { - "epoch": 1.29, - "learning_rate": 0.00010616867883215359, - "loss": 0.0109, + "epoch": 0.66, + "learning_rate": 0.00020041111407767618, + "loss": 0.017, "step": 256130 }, { - "epoch": 1.29, - "learning_rate": 0.00010616111113913959, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.0002004072258613047, + "loss": 0.0181, "step": 256140 }, { - "epoch": 1.29, - "learning_rate": 0.00010615354344612558, - "loss": 0.0094, + "epoch": 0.66, + "learning_rate": 0.00020040333764493327, + "loss": 0.0143, "step": 256150 }, { - "epoch": 1.29, - "learning_rate": 0.00010614597575311156, - "loss": 0.0076, + "epoch": 0.66, + "learning_rate": 0.00020039944942856178, + "loss": 0.0171, "step": 256160 }, { - "epoch": 1.29, - "learning_rate": 0.00010613840806009756, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.00020039556121219032, + "loss": 0.0115, "step": 256170 }, { - "epoch": 1.29, - "learning_rate": 0.00010613084036708355, - "loss": 0.0084, + "epoch": 0.66, + "learning_rate": 0.00020039167299581884, + "loss": 0.015, "step": 256180 }, { - "epoch": 1.29, - "learning_rate": 0.00010612327267406954, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.0002003877847794474, + "loss": 0.0197, "step": 256190 }, { - "epoch": 1.29, - "learning_rate": 0.00010611570498105553, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020038389656307592, + "loss": 0.0174, "step": 256200 }, { - "epoch": 1.29, - "learning_rate": 0.00010610813728804151, - "loss": 0.0091, + "epoch": 0.66, + "learning_rate": 0.00020038000834670446, + "loss": 0.0139, "step": 256210 }, { - "epoch": 1.29, - "learning_rate": 0.0001061005695950275, - "loss": 0.0086, + "epoch": 0.66, + "learning_rate": 0.00020037612013033298, + "loss": 0.0182, "step": 256220 }, { - "epoch": 1.29, - "learning_rate": 0.0001060930019020135, - "loss": 0.0085, + "epoch": 0.66, + "learning_rate": 0.00020037223191396154, + "loss": 0.0124, "step": 256230 }, { - "epoch": 1.29, - "learning_rate": 0.00010608543420899948, - "loss": 0.0095, + "epoch": 0.66, + "learning_rate": 0.00020036834369759009, + "loss": 0.0136, "step": 256240 }, { - "epoch": 1.29, - "learning_rate": 0.00010607786651598548, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.0002003644554812186, + "loss": 0.0141, "step": 256250 }, { - "epoch": 1.29, - "learning_rate": 0.00010607029882297147, - "loss": 0.0072, + "epoch": 0.66, + "learning_rate": 0.00020036056726484711, + "loss": 0.0195, "step": 256260 }, { - "epoch": 1.29, - "learning_rate": 0.00010606273112995745, - "loss": 0.0059, + "epoch": 0.66, + "learning_rate": 0.00020035667904847568, + "loss": 0.0151, "step": 256270 }, { - "epoch": 1.29, - "learning_rate": 0.00010605516343694345, - "loss": 0.0112, + "epoch": 0.66, + "learning_rate": 0.00020035279083210423, + "loss": 0.0154, "step": 256280 }, { - "epoch": 1.29, - "learning_rate": 0.00010604759574392943, - "loss": 0.0104, + "epoch": 0.66, + "learning_rate": 0.00020034890261573274, + "loss": 0.0221, "step": 256290 }, { - "epoch": 1.29, - "learning_rate": 0.00010604002805091543, - "loss": 0.0111, + "epoch": 0.66, + "learning_rate": 0.00020034501439936128, + "loss": 0.0186, "step": 256300 }, { - "epoch": 1.29, - "learning_rate": 0.00010603246035790142, - "loss": 0.0069, + "epoch": 0.66, + "learning_rate": 0.0002003411261829898, + "loss": 0.0169, "step": 256310 }, { - "epoch": 1.29, - "learning_rate": 0.0001060248926648874, - "loss": 0.0092, + "epoch": 0.66, + "learning_rate": 0.00020033723796661836, + "loss": 0.0169, "step": 256320 }, { - "epoch": 1.29, - "learning_rate": 0.0001060173249718734, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020033334975024688, + "loss": 0.0103, "step": 256330 }, { - "epoch": 1.29, - "learning_rate": 0.00010600975727885939, - "loss": 0.0066, + "epoch": 0.66, + "learning_rate": 0.00020032946153387542, + "loss": 0.015, "step": 256340 }, { - "epoch": 1.29, - "learning_rate": 0.00010600218958584537, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020032557331750394, + "loss": 0.0231, "step": 256350 }, { - "epoch": 1.29, - "learning_rate": 0.00010599462189283137, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.0002003216851011325, + "loss": 0.0178, "step": 256360 }, { - "epoch": 1.29, - "learning_rate": 0.00010598705419981735, - "loss": 0.0079, + "epoch": 0.66, + "learning_rate": 0.00020031779688476102, + "loss": 0.0185, "step": 256370 }, { - "epoch": 1.29, - "learning_rate": 0.00010597948650680335, - "loss": 0.0065, + "epoch": 0.66, + "learning_rate": 0.00020031390866838956, + "loss": 0.0166, "step": 256380 }, { - "epoch": 1.29, - "learning_rate": 0.00010597191881378934, - "loss": 0.0103, + "epoch": 0.66, + "learning_rate": 0.00020031002045201807, + "loss": 0.015, "step": 256390 }, { - "epoch": 1.29, - "learning_rate": 0.00010596435112077532, - "loss": 0.0078, + "epoch": 0.66, + "learning_rate": 0.00020030613223564664, + "loss": 0.0148, "step": 256400 }, { - "epoch": 1.29, - "learning_rate": 0.00010595678342776132, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020030224401927516, + "loss": 0.0136, "step": 256410 }, { - "epoch": 1.29, - "learning_rate": 0.00010594921573474731, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.0002002983558029037, + "loss": 0.0138, "step": 256420 }, { - "epoch": 1.29, - "learning_rate": 0.00010594164804173329, - "loss": 0.0089, + "epoch": 0.66, + "learning_rate": 0.00020029446758653221, + "loss": 0.013, "step": 256430 }, { - "epoch": 1.29, - "learning_rate": 0.00010593408034871929, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020029057937016078, + "loss": 0.0135, "step": 256440 }, { - "epoch": 1.29, - "learning_rate": 0.00010592651265570527, - "loss": 0.0098, + "epoch": 0.66, + "learning_rate": 0.00020028669115378932, + "loss": 0.0181, "step": 256450 }, { - "epoch": 1.29, - "learning_rate": 0.00010591894496269126, - "loss": 0.0068, + "epoch": 0.66, + "learning_rate": 0.00020028280293741784, + "loss": 0.0132, "step": 256460 }, { - "epoch": 1.29, - "learning_rate": 0.00010591137726967726, - "loss": 0.0096, + "epoch": 0.66, + "learning_rate": 0.00020027891472104638, + "loss": 0.0154, "step": 256470 }, { - "epoch": 1.29, - "learning_rate": 0.00010590380957666324, - "loss": 0.0087, + "epoch": 0.66, + "learning_rate": 0.00020027502650467492, + "loss": 0.0141, "step": 256480 }, { - "epoch": 1.29, - "learning_rate": 0.00010589624188364924, - "loss": 0.0102, + "epoch": 0.66, + "learning_rate": 0.00020027113828830346, + "loss": 0.0126, "step": 256490 }, { - "epoch": 1.29, - "learning_rate": 0.00010588867419063523, - "loss": 0.0071, + "epoch": 0.66, + "learning_rate": 0.00020026725007193198, + "loss": 0.0138, "step": 256500 }, { - "epoch": 1.29, - "learning_rate": 0.00010588110649762121, - "loss": 0.0083, + "epoch": 0.66, + "learning_rate": 0.00020026336185556052, + "loss": 0.0156, "step": 256510 }, { - "epoch": 1.29, - "learning_rate": 0.00010587353880460721, - "loss": 0.0073, + "epoch": 0.66, + "learning_rate": 0.00020025947363918906, + "loss": 0.0133, "step": 256520 }, { - "epoch": 1.29, - "learning_rate": 0.00010586597111159319, - "loss": 0.0082, + "epoch": 0.66, + "learning_rate": 0.0002002555854228176, + "loss": 0.0135, "step": 256530 }, { - "epoch": 1.29, - "learning_rate": 0.00010585840341857918, - "loss": 0.0058, + "epoch": 0.66, + "learning_rate": 0.00020025169720644612, + "loss": 0.0143, "step": 256540 }, { - "epoch": 1.29, - "learning_rate": 0.00010585083572556518, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00020024780899007466, + "loss": 0.0168, "step": 256550 }, { - "epoch": 1.29, - "learning_rate": 0.00010584326803255116, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00020024392077370317, + "loss": 0.0142, "step": 256560 }, { - "epoch": 1.29, - "learning_rate": 0.00010583570033953716, - "loss": 0.0111, + "epoch": 0.67, + "learning_rate": 0.00020024003255733174, + "loss": 0.0172, "step": 256570 }, { - "epoch": 1.29, - "learning_rate": 0.00010582813264652315, - "loss": 0.0122, + "epoch": 0.67, + "learning_rate": 0.00020023614434096026, + "loss": 0.0186, "step": 256580 }, { - "epoch": 1.29, - "learning_rate": 0.00010582056495350913, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.0002002322561245888, + "loss": 0.0171, "step": 256590 }, { - "epoch": 1.29, - "learning_rate": 0.00010581299726049513, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00020022836790821731, + "loss": 0.0136, "step": 256600 }, { - "epoch": 1.29, - "learning_rate": 0.00010580542956748111, - "loss": 0.0099, + "epoch": 0.67, + "learning_rate": 0.00020022447969184588, + "loss": 0.0167, "step": 256610 }, { - "epoch": 1.29, - "learning_rate": 0.0001057978618744671, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00020022059147547442, + "loss": 0.0135, "step": 256620 }, { - "epoch": 1.29, - "learning_rate": 0.0001057902941814531, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00020021670325910294, + "loss": 0.0133, "step": 256630 }, { - "epoch": 1.29, - "learning_rate": 0.00010578272648843908, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00020021281504273148, + "loss": 0.0139, "step": 256640 }, { - "epoch": 1.29, - "learning_rate": 0.00010577515879542507, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00020020892682636002, + "loss": 0.0203, "step": 256650 }, { - "epoch": 1.29, - "learning_rate": 0.00010576759110241107, - "loss": 0.0104, + "epoch": 0.67, + "learning_rate": 0.00020020503860998856, + "loss": 0.0154, "step": 256660 }, { - "epoch": 1.29, - "learning_rate": 0.00010576002340939705, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00020020115039361708, + "loss": 0.0141, "step": 256670 }, { - "epoch": 1.29, - "learning_rate": 0.00010575245571638305, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00020019726217724562, + "loss": 0.018, "step": 256680 }, { - "epoch": 1.3, - "learning_rate": 0.00010574488802336904, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00020019337396087416, + "loss": 0.0146, "step": 256690 }, { - "epoch": 1.3, - "learning_rate": 0.00010573732033035502, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.0002001894857445027, + "loss": 0.0154, "step": 256700 }, { - "epoch": 1.3, - "learning_rate": 0.00010572975263734102, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020018559752813122, + "loss": 0.0147, "step": 256710 }, { - "epoch": 1.3, - "learning_rate": 0.00010572218494432699, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00020018170931175976, + "loss": 0.0146, "step": 256720 }, { - "epoch": 1.3, - "learning_rate": 0.00010571461725131298, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0002001778210953883, + "loss": 0.016, "step": 256730 }, { - "epoch": 1.3, - "learning_rate": 0.00010570704955829896, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020017393287901684, + "loss": 0.0139, "step": 256740 }, { - "epoch": 1.3, - "learning_rate": 0.00010569948186528496, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00020017004466264536, + "loss": 0.0147, "step": 256750 }, { - "epoch": 1.3, - "learning_rate": 0.00010569191417227095, - "loss": 0.0103, + "epoch": 0.67, + "learning_rate": 0.0002001661564462739, + "loss": 0.0121, "step": 256760 }, { - "epoch": 1.3, - "learning_rate": 0.00010568434647925693, - "loss": 0.0113, + "epoch": 0.67, + "learning_rate": 0.00020016226822990247, + "loss": 0.0178, "step": 256770 }, { - "epoch": 1.3, - "learning_rate": 0.00010567677878624293, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00020015838001353098, + "loss": 0.0151, "step": 256780 }, { - "epoch": 1.3, - "learning_rate": 0.00010566921109322892, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00020015449179715952, + "loss": 0.0153, "step": 256790 }, { - "epoch": 1.3, - "learning_rate": 0.0001056616434002149, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020015060358078804, + "loss": 0.0151, "step": 256800 }, { - "epoch": 1.3, - "learning_rate": 0.0001056540757072009, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00020014671536441655, + "loss": 0.0165, "step": 256810 }, { - "epoch": 1.3, - "learning_rate": 0.00010564650801418688, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020014282714804512, + "loss": 0.0156, "step": 256820 }, { - "epoch": 1.3, - "learning_rate": 0.00010563894032117288, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00020013893893167366, + "loss": 0.0146, "step": 256830 }, { - "epoch": 1.3, - "learning_rate": 0.00010563137262815887, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00020013505071530218, + "loss": 0.0173, "step": 256840 }, { - "epoch": 1.3, - "learning_rate": 0.00010562380493514485, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00020013116249893072, + "loss": 0.0149, "step": 256850 }, { - "epoch": 1.3, - "learning_rate": 0.00010561623724213085, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00020012727428255926, + "loss": 0.0179, "step": 256860 }, { - "epoch": 1.3, - "learning_rate": 0.00010560866954911684, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.0002001233860661878, + "loss": 0.0232, "step": 256870 }, { - "epoch": 1.3, - "learning_rate": 0.00010560110185610282, - "loss": 0.0058, + "epoch": 0.67, + "learning_rate": 0.00020011949784981632, + "loss": 0.0157, "step": 256880 }, { - "epoch": 1.3, - "learning_rate": 0.00010559353416308882, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00020011560963344486, + "loss": 0.0216, "step": 256890 }, { - "epoch": 1.3, - "learning_rate": 0.0001055859664700748, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.0002001117214170734, + "loss": 0.0155, "step": 256900 }, { - "epoch": 1.3, - "learning_rate": 0.0001055783987770608, - "loss": 0.0109, + "epoch": 0.67, + "learning_rate": 0.00020010783320070194, + "loss": 0.016, "step": 256910 }, { - "epoch": 1.3, - "learning_rate": 0.00010557083108404679, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020010394498433046, + "loss": 0.0178, "step": 256920 }, { - "epoch": 1.3, - "learning_rate": 0.00010556326339103277, - "loss": 0.0121, + "epoch": 0.67, + "learning_rate": 0.000200100056767959, + "loss": 0.0148, "step": 256930 }, { - "epoch": 1.3, - "learning_rate": 0.00010555569569801877, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00020009616855158757, + "loss": 0.0175, "step": 256940 }, { - "epoch": 1.3, - "learning_rate": 0.00010554812800500476, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00020009228033521608, + "loss": 0.0149, "step": 256950 }, { - "epoch": 1.3, - "learning_rate": 0.00010554056031199074, - "loss": 0.0062, + "epoch": 0.67, + "learning_rate": 0.00020008839211884462, + "loss": 0.0161, "step": 256960 }, { - "epoch": 1.3, - "learning_rate": 0.00010553299261897674, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00020008450390247314, + "loss": 0.0136, "step": 256970 }, { - "epoch": 1.3, - "learning_rate": 0.00010552542492596272, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.0002000806156861017, + "loss": 0.015, "step": 256980 }, { - "epoch": 1.3, - "learning_rate": 0.00010551785723294871, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00020007672746973022, + "loss": 0.0142, "step": 256990 }, { - "epoch": 1.3, - "learning_rate": 0.00010551028953993471, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00020007283925335876, + "loss": 0.0115, "step": 257000 }, { - "epoch": 1.3, - "eval_cer": 0.914467344714786, - "eval_loss": 0.006512925960123539, - "eval_runtime": 116.5432, - "eval_samples_per_second": 17.161, - "eval_steps_per_second": 4.29, + "epoch": 0.67, + "eval_cer": 0.8817446754311932, + "eval_loss": 0.010795309208333492, + "eval_runtime": 107.4074, + "eval_samples_per_second": 18.621, + "eval_steps_per_second": 4.655, "step": 257000 }, { - "epoch": 1.3, - "learning_rate": 0.00010550272184692069, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00020006895103698728, + "loss": 0.0141, "step": 257010 }, { - "epoch": 1.3, - "learning_rate": 0.00010549515415390669, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00020006506282061585, + "loss": 0.0179, "step": 257020 }, { - "epoch": 1.3, - "learning_rate": 0.00010548758646089268, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00020006117460424436, + "loss": 0.0136, "step": 257030 }, { - "epoch": 1.3, - "learning_rate": 0.00010548001876787866, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.0002000572863878729, + "loss": 0.0138, "step": 257040 }, { - "epoch": 1.3, - "learning_rate": 0.00010547245107486466, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00020005339817150142, + "loss": 0.0182, "step": 257050 }, { - "epoch": 1.3, - "learning_rate": 0.00010546488338185064, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00020004950995512996, + "loss": 0.0162, "step": 257060 }, { - "epoch": 1.3, - "learning_rate": 0.00010545731568883663, - "loss": 0.0102, + "epoch": 0.67, + "learning_rate": 0.0002000456217387585, + "loss": 0.0189, "step": 257070 }, { - "epoch": 1.3, - "learning_rate": 0.00010544974799582263, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00020004173352238704, + "loss": 0.0127, "step": 257080 }, { - "epoch": 1.3, - "learning_rate": 0.00010544218030280861, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00020003784530601556, + "loss": 0.0176, "step": 257090 }, { - "epoch": 1.3, - "learning_rate": 0.0001054346126097946, - "loss": 0.011, + "epoch": 0.67, + "learning_rate": 0.0002000339570896441, + "loss": 0.0141, "step": 257100 }, { - "epoch": 1.3, - "learning_rate": 0.0001054270449167806, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00020003006887327267, + "loss": 0.0131, "step": 257110 }, { - "epoch": 1.3, - "learning_rate": 0.00010541947722376658, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00020002618065690118, + "loss": 0.0167, "step": 257120 }, { - "epoch": 1.3, - "learning_rate": 0.00010541190953075258, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.0002000222924405297, + "loss": 0.016, "step": 257130 }, { - "epoch": 1.3, - "learning_rate": 0.00010540434183773856, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00020001840422415824, + "loss": 0.015, "step": 257140 }, { - "epoch": 1.3, - "learning_rate": 0.00010539677414472455, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.0002000145160077868, + "loss": 0.013, "step": 257150 }, { - "epoch": 1.3, - "learning_rate": 0.00010538920645171055, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00020001062779141532, + "loss": 0.0134, "step": 257160 }, { - "epoch": 1.3, - "learning_rate": 0.00010538163875869653, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00020000673957504386, + "loss": 0.017, "step": 257170 }, { - "epoch": 1.3, - "learning_rate": 0.00010537407106568252, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00020000285135867238, + "loss": 0.0153, "step": 257180 }, { - "epoch": 1.3, - "learning_rate": 0.00010536650337266852, - "loss": 0.0124, + "epoch": 0.67, + "learning_rate": 0.00019999896314230094, + "loss": 0.0156, "step": 257190 }, { - "epoch": 1.3, - "learning_rate": 0.0001053589356796545, - "loss": 0.0101, + "epoch": 0.67, + "learning_rate": 0.00019999507492592946, + "loss": 0.0182, "step": 257200 }, { - "epoch": 1.3, - "learning_rate": 0.0001053513679866405, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.000199991186709558, + "loss": 0.0163, "step": 257210 }, { - "epoch": 1.3, - "learning_rate": 0.00010534380029362649, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019998729849318652, + "loss": 0.0157, "step": 257220 }, { - "epoch": 1.3, - "learning_rate": 0.00010533623260061247, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019998341027681508, + "loss": 0.0136, "step": 257230 }, { - "epoch": 1.3, - "learning_rate": 0.00010532866490759847, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.0001999795220604436, + "loss": 0.0143, "step": 257240 }, { - "epoch": 1.3, - "learning_rate": 0.00010532109721458445, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019997563384407214, + "loss": 0.0184, "step": 257250 }, { - "epoch": 1.3, - "learning_rate": 0.00010531352952157044, - "loss": 0.0102, + "epoch": 0.67, + "learning_rate": 0.00019997174562770066, + "loss": 0.0158, "step": 257260 }, { - "epoch": 1.3, - "learning_rate": 0.00010530596182855644, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019996785741132922, + "loss": 0.0208, "step": 257270 }, { - "epoch": 1.3, - "learning_rate": 0.00010529839413554242, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019996396919495774, + "loss": 0.0141, "step": 257280 }, { - "epoch": 1.3, - "learning_rate": 0.00010529082644252842, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00019996008097858628, + "loss": 0.0177, "step": 257290 }, { - "epoch": 1.3, - "learning_rate": 0.00010528325874951441, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.0001999561927622148, + "loss": 0.0182, "step": 257300 }, { - "epoch": 1.3, - "learning_rate": 0.00010527569105650039, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019995230454584334, + "loss": 0.0152, "step": 257310 }, { - "epoch": 1.3, - "learning_rate": 0.00010526812336348639, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.0001999484163294719, + "loss": 0.0162, "step": 257320 }, { - "epoch": 1.3, - "learning_rate": 0.00010526055567047237, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019994452811310042, + "loss": 0.0178, "step": 257330 }, { - "epoch": 1.3, - "learning_rate": 0.00010525298797745836, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019994063989672896, + "loss": 0.018, "step": 257340 }, { - "epoch": 1.3, - "learning_rate": 0.00010524542028444433, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019993675168035748, + "loss": 0.0204, "step": 257350 }, { - "epoch": 1.3, - "learning_rate": 0.00010523785259143033, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019993286346398604, + "loss": 0.0154, "step": 257360 }, { - "epoch": 1.3, - "learning_rate": 0.00010523028489841632, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019992897524761456, + "loss": 0.0155, "step": 257370 }, { - "epoch": 1.3, - "learning_rate": 0.0001052227172054023, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.0001999250870312431, + "loss": 0.0181, "step": 257380 }, { - "epoch": 1.3, - "learning_rate": 0.0001052151495123883, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019992119881487162, + "loss": 0.016, "step": 257390 }, { - "epoch": 1.3, - "learning_rate": 0.00010520758181937429, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019991731059850018, + "loss": 0.0145, "step": 257400 }, { - "epoch": 1.3, - "learning_rate": 0.00010520001412636027, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.0001999134223821287, + "loss": 0.0233, "step": 257410 }, { - "epoch": 1.3, - "learning_rate": 0.00010519244643334627, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019990953416575724, + "loss": 0.0139, "step": 257420 }, { - "epoch": 1.3, - "learning_rate": 0.00010518487874033225, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019990564594938575, + "loss": 0.0171, "step": 257430 }, { - "epoch": 1.3, - "learning_rate": 0.00010517731104731825, - "loss": 0.0061, + "epoch": 0.67, + "learning_rate": 0.00019990175773301432, + "loss": 0.011, "step": 257440 }, { - "epoch": 1.3, - "learning_rate": 0.00010516974335430424, - "loss": 0.0104, + "epoch": 0.67, + "learning_rate": 0.00019989786951664284, + "loss": 0.0152, "step": 257450 }, { - "epoch": 1.3, - "learning_rate": 0.00010516217566129022, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019989398130027138, + "loss": 0.0172, "step": 257460 }, { - "epoch": 1.3, - "learning_rate": 0.00010515460796827622, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.0001998900930838999, + "loss": 0.0143, "step": 257470 }, { - "epoch": 1.3, - "learning_rate": 0.00010514704027526221, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019988620486752846, + "loss": 0.0152, "step": 257480 }, { - "epoch": 1.3, - "learning_rate": 0.0001051394725822482, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.000199882316651157, + "loss": 0.012, "step": 257490 }, { - "epoch": 1.3, - "learning_rate": 0.00010513190488923419, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019987842843478552, + "loss": 0.0211, "step": 257500 }, { - "epoch": 1.3, - "learning_rate": 0.00010512433719622017, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019987454021841406, + "loss": 0.015, "step": 257510 }, { - "epoch": 1.3, - "learning_rate": 0.00010511676950320616, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.0001998706520020426, + "loss": 0.0212, "step": 257520 }, { - "epoch": 1.3, - "learning_rate": 0.00010510920181019216, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019986676378567114, + "loss": 0.0164, "step": 257530 }, { - "epoch": 1.3, - "learning_rate": 0.00010510163411717814, - "loss": 0.0059, + "epoch": 0.67, + "learning_rate": 0.00019986287556929966, + "loss": 0.0171, "step": 257540 }, { - "epoch": 1.3, - "learning_rate": 0.00010509406642416414, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.0001998589873529282, + "loss": 0.014, "step": 257550 }, { - "epoch": 1.3, - "learning_rate": 0.00010508649873115013, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019985509913655671, + "loss": 0.0136, "step": 257560 }, { - "epoch": 1.3, - "learning_rate": 0.00010507893103813611, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019985121092018528, + "loss": 0.0157, "step": 257570 }, { - "epoch": 1.3, - "learning_rate": 0.00010507136334512211, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.0001998473227038138, + "loss": 0.0181, "step": 257580 }, { - "epoch": 1.3, - "learning_rate": 0.00010506379565210809, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019984343448744234, + "loss": 0.0157, "step": 257590 }, { - "epoch": 1.3, - "learning_rate": 0.00010505622795909408, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019983954627107085, + "loss": 0.0156, "step": 257600 }, { - "epoch": 1.3, - "learning_rate": 0.00010504866026608008, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019983565805469942, + "loss": 0.0145, "step": 257610 }, { - "epoch": 1.3, - "learning_rate": 0.00010504109257306606, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019983176983832794, + "loss": 0.0204, "step": 257620 }, { - "epoch": 1.3, - "learning_rate": 0.00010503352488005206, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019982788162195648, + "loss": 0.0153, "step": 257630 }, { - "epoch": 1.3, - "learning_rate": 0.00010502595718703805, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.000199823993405585, + "loss": 0.0151, "step": 257640 }, { - "epoch": 1.3, - "learning_rate": 0.00010501838949402403, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019982010518921356, + "loss": 0.0159, "step": 257650 }, { - "epoch": 1.3, - "learning_rate": 0.00010501082180101003, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.0001998162169728421, + "loss": 0.0136, "step": 257660 }, { - "epoch": 1.3, - "learning_rate": 0.00010500325410799602, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019981232875647062, + "loss": 0.0188, "step": 257670 }, { - "epoch": 1.3, - "learning_rate": 0.000104995686414982, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019980844054009913, + "loss": 0.0133, "step": 257680 }, { - "epoch": 1.3, - "learning_rate": 0.000104988118721968, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.0001998045523237277, + "loss": 0.0146, "step": 257690 }, { - "epoch": 1.3, - "learning_rate": 0.00010498055102895398, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019980066410735624, + "loss": 0.0156, "step": 257700 }, { - "epoch": 1.3, - "learning_rate": 0.00010497298333593997, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019979677589098476, + "loss": 0.0152, "step": 257710 }, { - "epoch": 1.3, - "learning_rate": 0.00010496541564292597, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0001997928876746133, + "loss": 0.0143, "step": 257720 }, { - "epoch": 1.3, - "learning_rate": 0.00010495784794991195, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019978899945824184, + "loss": 0.0137, "step": 257730 }, { - "epoch": 1.3, - "learning_rate": 0.00010495028025689795, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019978511124187038, + "loss": 0.0129, "step": 257740 }, { - "epoch": 1.3, - "learning_rate": 0.00010494271256388394, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.0001997812230254989, + "loss": 0.0184, "step": 257750 }, { - "epoch": 1.3, - "learning_rate": 0.00010493514487086992, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019977733480912744, + "loss": 0.0108, "step": 257760 }, { - "epoch": 1.3, - "learning_rate": 0.00010492757717785592, - "loss": 0.0098, + "epoch": 0.67, + "learning_rate": 0.00019977344659275598, + "loss": 0.0173, "step": 257770 }, { - "epoch": 1.3, - "learning_rate": 0.0001049200094848419, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019976955837638452, + "loss": 0.0127, "step": 257780 }, { - "epoch": 1.3, - "learning_rate": 0.0001049124417918279, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019976567016001304, + "loss": 0.0145, "step": 257790 }, { - "epoch": 1.3, - "learning_rate": 0.00010490487409881389, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019976178194364158, + "loss": 0.0158, "step": 257800 }, { - "epoch": 1.3, - "learning_rate": 0.00010489730640579987, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.0001997578937272701, + "loss": 0.0159, "step": 257810 }, { - "epoch": 1.3, - "learning_rate": 0.00010488973871278587, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019975400551089866, + "loss": 0.0158, "step": 257820 }, { - "epoch": 1.3, - "learning_rate": 0.00010488217101977186, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.0001997501172945272, + "loss": 0.0186, "step": 257830 }, { - "epoch": 1.3, - "learning_rate": 0.00010487460332675784, - "loss": 0.0106, + "epoch": 0.67, + "learning_rate": 0.00019974622907815572, + "loss": 0.0135, "step": 257840 }, { - "epoch": 1.3, - "learning_rate": 0.00010486703563374384, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019974234086178423, + "loss": 0.0118, "step": 257850 }, { - "epoch": 1.3, - "learning_rate": 0.00010485946794072982, - "loss": 0.0099, + "epoch": 0.67, + "learning_rate": 0.0001997384526454128, + "loss": 0.0134, "step": 257860 }, { - "epoch": 1.3, - "learning_rate": 0.00010485190024771581, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019973456442904134, + "loss": 0.0141, "step": 257870 }, { - "epoch": 1.3, - "learning_rate": 0.00010484433255470181, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019973067621266986, + "loss": 0.0123, "step": 257880 }, { - "epoch": 1.3, - "learning_rate": 0.00010483676486168779, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.0001997267879962984, + "loss": 0.0139, "step": 257890 }, { - "epoch": 1.3, - "learning_rate": 0.00010482919716867378, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019972289977992694, + "loss": 0.0207, "step": 257900 }, { - "epoch": 1.3, - "learning_rate": 0.00010482162947565978, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00019971901156355548, + "loss": 0.0141, "step": 257910 }, { - "epoch": 1.3, - "learning_rate": 0.00010481406178264576, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.000199715123347184, + "loss": 0.019, "step": 257920 }, { - "epoch": 1.3, - "learning_rate": 0.00010480649408963176, - "loss": 0.011, + "epoch": 0.67, + "learning_rate": 0.00019971123513081254, + "loss": 0.0106, "step": 257930 }, { - "epoch": 1.3, - "learning_rate": 0.00010479892639661774, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019970734691444108, + "loss": 0.0147, "step": 257940 }, { - "epoch": 1.3, - "learning_rate": 0.00010479135870360373, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019970345869806962, + "loss": 0.0135, "step": 257950 }, { - "epoch": 1.3, - "learning_rate": 0.00010478379101058973, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019969957048169814, + "loss": 0.0168, "step": 257960 }, { - "epoch": 1.3, - "learning_rate": 0.00010477622331757571, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019969568226532668, + "loss": 0.0145, "step": 257970 }, { - "epoch": 1.3, - "learning_rate": 0.00010476865562456169, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019969179404895525, + "loss": 0.0151, "step": 257980 }, { - "epoch": 1.3, - "learning_rate": 0.00010476108793154767, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019968790583258376, + "loss": 0.0156, "step": 257990 }, { - "epoch": 1.3, - "learning_rate": 0.00010475352023853367, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019968401761621228, + "loss": 0.0182, "step": 258000 }, { - "epoch": 1.3, - "eval_cer": 0.9144421144155256, - "eval_loss": 0.006312798708677292, - "eval_runtime": 116.232, - "eval_samples_per_second": 17.207, - "eval_steps_per_second": 4.302, + "epoch": 0.67, + "eval_cer": 0.8818202558256388, + "eval_loss": 0.010769709013402462, + "eval_runtime": 107.7755, + "eval_samples_per_second": 18.557, + "eval_steps_per_second": 4.639, "step": 258000 }, { - "epoch": 1.3, - "learning_rate": 0.00010474595254551966, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019968012939984082, + "loss": 0.0188, "step": 258010 }, { - "epoch": 1.3, - "learning_rate": 0.00010473838485250564, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019967624118346939, + "loss": 0.0165, "step": 258020 }, { - "epoch": 1.3, - "learning_rate": 0.00010473081715949164, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.0001996723529670979, + "loss": 0.0138, "step": 258030 }, { - "epoch": 1.3, - "learning_rate": 0.00010472324946647762, - "loss": 0.0103, + "epoch": 0.67, + "learning_rate": 0.00019966846475072644, + "loss": 0.0175, "step": 258040 }, { - "epoch": 1.3, - "learning_rate": 0.00010471568177346362, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.00019966457653435496, + "loss": 0.0143, "step": 258050 }, { - "epoch": 1.3, - "learning_rate": 0.00010470811408044961, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.0001996606883179835, + "loss": 0.0129, "step": 258060 }, { - "epoch": 1.3, - "learning_rate": 0.00010470054638743559, - "loss": 0.0068, + "epoch": 0.67, + "learning_rate": 0.00019965680010161204, + "loss": 0.0146, "step": 258070 }, { - "epoch": 1.3, - "learning_rate": 0.00010469297869442159, - "loss": 0.0113, + "epoch": 0.67, + "learning_rate": 0.00019965291188524058, + "loss": 0.0186, "step": 258080 }, { - "epoch": 1.3, - "learning_rate": 0.00010468541100140758, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.0001996490236688691, + "loss": 0.0141, "step": 258090 }, { - "epoch": 1.3, - "learning_rate": 0.00010467784330839356, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019964513545249764, + "loss": 0.0153, "step": 258100 }, { - "epoch": 1.3, - "learning_rate": 0.00010467027561537956, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019964124723612618, + "loss": 0.0152, "step": 258110 }, { - "epoch": 1.3, - "learning_rate": 0.00010466270792236555, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019963735901975472, + "loss": 0.015, "step": 258120 }, { - "epoch": 1.3, - "learning_rate": 0.00010465514022935153, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019963347080338324, + "loss": 0.0174, "step": 258130 }, { - "epoch": 1.3, - "learning_rate": 0.00010464757253633753, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019962958258701178, + "loss": 0.0134, "step": 258140 }, { - "epoch": 1.3, - "learning_rate": 0.00010464000484332351, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019962569437064032, + "loss": 0.0146, "step": 258150 }, { - "epoch": 1.3, - "learning_rate": 0.0001046324371503095, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019962180615426886, + "loss": 0.0172, "step": 258160 }, { - "epoch": 1.3, - "learning_rate": 0.0001046248694572955, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019961791793789737, + "loss": 0.0131, "step": 258170 }, { - "epoch": 1.3, - "learning_rate": 0.00010461730176428148, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00019961402972152592, + "loss": 0.0182, "step": 258180 }, { - "epoch": 1.3, - "learning_rate": 0.00010460973407126748, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019961014150515449, + "loss": 0.0112, "step": 258190 }, { - "epoch": 1.3, - "learning_rate": 0.00010460216637825347, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.000199606253288783, + "loss": 0.0161, "step": 258200 }, { - "epoch": 1.3, - "learning_rate": 0.00010459459868523945, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019960236507241154, + "loss": 0.0146, "step": 258210 }, { - "epoch": 1.3, - "learning_rate": 0.00010458703099222545, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019959847685604006, + "loss": 0.016, "step": 258220 }, { - "epoch": 1.3, - "learning_rate": 0.00010457946329921143, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019959458863966862, + "loss": 0.0155, "step": 258230 }, { - "epoch": 1.3, - "learning_rate": 0.00010457189560619743, - "loss": 0.011, + "epoch": 0.67, + "learning_rate": 0.00019959070042329714, + "loss": 0.0151, "step": 258240 }, { - "epoch": 1.3, - "learning_rate": 0.00010456432791318342, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019958681220692568, + "loss": 0.0149, "step": 258250 }, { - "epoch": 1.3, - "learning_rate": 0.0001045567602201694, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.0001995829239905542, + "loss": 0.0134, "step": 258260 }, { - "epoch": 1.3, - "learning_rate": 0.0001045491925271554, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019957903577418276, + "loss": 0.0186, "step": 258270 }, { - "epoch": 1.3, - "learning_rate": 0.00010454162483414139, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019957514755781128, + "loss": 0.0171, "step": 258280 }, { - "epoch": 1.3, - "learning_rate": 0.00010453405714112737, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019957125934143982, + "loss": 0.0264, "step": 258290 }, { - "epoch": 1.3, - "learning_rate": 0.00010452648944811337, - "loss": 0.0118, + "epoch": 0.67, + "learning_rate": 0.00019956737112506833, + "loss": 0.0148, "step": 258300 }, { - "epoch": 1.3, - "learning_rate": 0.00010451892175509935, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019956348290869688, + "loss": 0.0176, "step": 258310 }, { - "epoch": 1.3, - "learning_rate": 0.00010451135406208534, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019955959469232542, + "loss": 0.0161, "step": 258320 }, { - "epoch": 1.3, - "learning_rate": 0.00010450378636907134, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019955570647595396, + "loss": 0.0172, "step": 258330 }, { - "epoch": 1.3, - "learning_rate": 0.00010449621867605732, - "loss": 0.006, + "epoch": 0.67, + "learning_rate": 0.00019955181825958247, + "loss": 0.0139, "step": 258340 }, { - "epoch": 1.3, - "learning_rate": 0.00010448865098304332, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019954793004321102, + "loss": 0.0157, "step": 258350 }, { - "epoch": 1.3, - "learning_rate": 0.00010448108329002931, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019954404182683958, + "loss": 0.0197, "step": 258360 }, { - "epoch": 1.3, - "learning_rate": 0.00010447351559701529, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.0001995401536104681, + "loss": 0.014, "step": 258370 }, { - "epoch": 1.3, - "learning_rate": 0.00010446594790400129, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019953626539409664, + "loss": 0.0144, "step": 258380 }, { - "epoch": 1.3, - "learning_rate": 0.00010445838021098727, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.00019953237717772516, + "loss": 0.0172, "step": 258390 }, { - "epoch": 1.3, - "learning_rate": 0.00010445081251797326, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019952848896135372, + "loss": 0.0199, "step": 258400 }, { - "epoch": 1.3, - "learning_rate": 0.00010444324482495926, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019952460074498224, + "loss": 0.0164, "step": 258410 }, { - "epoch": 1.3, - "learning_rate": 0.00010443567713194524, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00019952071252861078, + "loss": 0.0161, "step": 258420 }, { - "epoch": 1.3, - "learning_rate": 0.00010442810943893124, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.0001995168243122393, + "loss": 0.0137, "step": 258430 }, { - "epoch": 1.3, - "learning_rate": 0.00010442054174591723, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019951293609586786, + "loss": 0.0152, "step": 258440 }, { - "epoch": 1.3, - "learning_rate": 0.00010441297405290321, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019950904787949638, + "loss": 0.0146, "step": 258450 }, { - "epoch": 1.3, - "learning_rate": 0.0001044054063598892, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019950515966312492, + "loss": 0.0142, "step": 258460 }, { - "epoch": 1.3, - "learning_rate": 0.00010439783866687519, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019950127144675343, + "loss": 0.0177, "step": 258470 }, { - "epoch": 1.3, - "learning_rate": 0.00010439027097386118, - "loss": 0.0098, + "epoch": 0.67, + "learning_rate": 0.000199497383230382, + "loss": 0.0131, "step": 258480 }, { - "epoch": 1.3, - "learning_rate": 0.00010438270328084718, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019949349501401052, + "loss": 0.0148, "step": 258490 }, { - "epoch": 1.3, - "learning_rate": 0.00010437513558783316, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019948960679763906, + "loss": 0.0154, "step": 258500 }, { - "epoch": 1.3, - "learning_rate": 0.00010436756789481915, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019948571858126757, + "loss": 0.0182, "step": 258510 }, { - "epoch": 1.3, - "learning_rate": 0.00010436000020180515, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.00019948183036489614, + "loss": 0.0146, "step": 258520 }, { - "epoch": 1.3, - "learning_rate": 0.00010435243250879113, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.00019947794214852468, + "loss": 0.0113, "step": 258530 }, { - "epoch": 1.3, - "learning_rate": 0.00010434486481577713, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.0001994740539321532, + "loss": 0.0166, "step": 258540 }, { - "epoch": 1.3, - "learning_rate": 0.00010433729712276311, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.0001994701657157817, + "loss": 0.0122, "step": 258550 }, { - "epoch": 1.3, - "learning_rate": 0.0001043297294297491, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019946627749941025, + "loss": 0.0172, "step": 258560 }, { - "epoch": 1.3, - "learning_rate": 0.0001043221617367351, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019946238928303882, + "loss": 0.0153, "step": 258570 }, { - "epoch": 1.3, - "learning_rate": 0.00010431459404372108, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00019945850106666734, + "loss": 0.0166, "step": 258580 }, { - "epoch": 1.3, - "learning_rate": 0.00010430702635070707, - "loss": 0.0061, + "epoch": 0.67, + "learning_rate": 0.00019945461285029588, + "loss": 0.0151, "step": 258590 }, { - "epoch": 1.3, - "learning_rate": 0.00010429945865769307, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0001994507246339244, + "loss": 0.0168, "step": 258600 }, { - "epoch": 1.3, - "learning_rate": 0.00010429189096467904, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019944683641755296, + "loss": 0.0144, "step": 258610 }, { - "epoch": 1.3, - "learning_rate": 0.00010428432327166503, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019944294820118148, + "loss": 0.0154, "step": 258620 }, { - "epoch": 1.3, - "learning_rate": 0.00010427675557865101, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019943905998481002, + "loss": 0.0156, "step": 258630 }, { - "epoch": 1.3, - "learning_rate": 0.00010426918788563701, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019943517176843853, + "loss": 0.0138, "step": 258640 }, { - "epoch": 1.3, - "learning_rate": 0.000104261620192623, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.0001994312835520671, + "loss": 0.0156, "step": 258650 }, { - "epoch": 1.3, - "learning_rate": 0.00010425405249960898, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019942739533569562, + "loss": 0.0183, "step": 258660 }, { - "epoch": 1.31, - "learning_rate": 0.00010424648480659498, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019942350711932416, + "loss": 0.0163, "step": 258670 }, { - "epoch": 1.31, - "learning_rate": 0.00010423891711358096, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019941961890295267, + "loss": 0.0141, "step": 258680 }, { - "epoch": 1.31, - "learning_rate": 0.00010423134942056696, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019941573068658124, + "loss": 0.0119, "step": 258690 }, { - "epoch": 1.31, - "learning_rate": 0.00010422378172755295, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019941184247020978, + "loss": 0.0146, "step": 258700 }, { - "epoch": 1.31, - "learning_rate": 0.00010421621403453893, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001994079542538383, + "loss": 0.0187, "step": 258710 }, { - "epoch": 1.31, - "learning_rate": 0.00010420864634152493, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.0001994040660374668, + "loss": 0.0128, "step": 258720 }, { - "epoch": 1.31, - "learning_rate": 0.00010420107864851092, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019940017782109538, + "loss": 0.0184, "step": 258730 }, { - "epoch": 1.31, - "learning_rate": 0.0001041935109554969, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019939628960472392, + "loss": 0.0152, "step": 258740 }, { - "epoch": 1.31, - "learning_rate": 0.0001041859432624829, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019939240138835244, + "loss": 0.0136, "step": 258750 }, { - "epoch": 1.31, - "learning_rate": 0.00010417837556946888, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019938851317198098, + "loss": 0.0192, "step": 258760 }, { - "epoch": 1.31, - "learning_rate": 0.00010417080787645488, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019938462495560952, + "loss": 0.0141, "step": 258770 }, { - "epoch": 1.31, - "learning_rate": 0.00010416324018344087, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019938073673923806, + "loss": 0.0139, "step": 258780 }, { - "epoch": 1.31, - "learning_rate": 0.00010415567249042685, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.00019937684852286658, + "loss": 0.0114, "step": 258790 }, { - "epoch": 1.31, - "learning_rate": 0.00010414810479741285, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019937296030649512, + "loss": 0.013, "step": 258800 }, { - "epoch": 1.31, - "learning_rate": 0.00010414053710439884, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019936907209012363, + "loss": 0.0129, "step": 258810 }, { - "epoch": 1.31, - "learning_rate": 0.00010413296941138482, - "loss": 0.011, + "epoch": 0.67, + "learning_rate": 0.0001993651838737522, + "loss": 0.0136, "step": 258820 }, { - "epoch": 1.31, - "learning_rate": 0.00010412540171837082, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019936129565738072, + "loss": 0.0187, "step": 258830 }, { - "epoch": 1.31, - "learning_rate": 0.0001041178340253568, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019935740744100926, + "loss": 0.0154, "step": 258840 }, { - "epoch": 1.31, - "learning_rate": 0.0001041102663323428, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019935351922463777, + "loss": 0.0189, "step": 258850 }, { - "epoch": 1.31, - "learning_rate": 0.00010410269863932879, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019934963100826634, + "loss": 0.0146, "step": 258860 }, { - "epoch": 1.31, - "learning_rate": 0.00010409513094631477, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019934574279189486, + "loss": 0.0171, "step": 258870 }, { - "epoch": 1.31, - "learning_rate": 0.00010408756325330077, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001993418545755234, + "loss": 0.0182, "step": 258880 }, { - "epoch": 1.31, - "learning_rate": 0.00010407999556028676, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.0001993379663591519, + "loss": 0.013, "step": 258890 }, { - "epoch": 1.31, - "learning_rate": 0.00010407242786727274, - "loss": 0.0152, + "epoch": 0.67, + "learning_rate": 0.00019933407814278048, + "loss": 0.016, "step": 258900 }, { - "epoch": 1.31, - "learning_rate": 0.00010406486017425874, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019933018992640902, + "loss": 0.0154, "step": 258910 }, { - "epoch": 1.31, - "learning_rate": 0.00010405729248124472, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019932630171003754, + "loss": 0.0177, "step": 258920 }, { - "epoch": 1.31, - "learning_rate": 0.00010404972478823071, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019932241349366608, + "loss": 0.0152, "step": 258930 }, { - "epoch": 1.31, - "learning_rate": 0.00010404215709521671, - "loss": 0.0058, + "epoch": 0.67, + "learning_rate": 0.00019931852527729462, + "loss": 0.0145, "step": 258940 }, { - "epoch": 1.31, - "learning_rate": 0.00010403458940220269, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019931463706092316, + "loss": 0.0131, "step": 258950 }, { - "epoch": 1.31, - "learning_rate": 0.00010402702170918869, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019931074884455168, + "loss": 0.0147, "step": 258960 }, { - "epoch": 1.31, - "learning_rate": 0.00010401945401617468, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019930686062818022, + "loss": 0.0173, "step": 258970 }, { - "epoch": 1.31, - "learning_rate": 0.00010401188632316066, - "loss": 0.0112, + "epoch": 0.67, + "learning_rate": 0.00019930297241180876, + "loss": 0.0226, "step": 258980 }, { - "epoch": 1.31, - "learning_rate": 0.00010400431863014666, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.0001992990841954373, + "loss": 0.0124, "step": 258990 }, { - "epoch": 1.31, - "learning_rate": 0.00010399675093713264, - "loss": 0.0105, + "epoch": 0.67, + "learning_rate": 0.00019929519597906582, + "loss": 0.0149, "step": 259000 }, { - "epoch": 1.31, - "eval_cer": 0.914452788772905, - "eval_loss": 0.006329988595098257, - "eval_runtime": 116.6658, - "eval_samples_per_second": 17.143, - "eval_steps_per_second": 4.286, + "epoch": 0.67, + "eval_cer": 0.8817740678068109, + "eval_loss": 0.010703030042350292, + "eval_runtime": 107.7387, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, "step": 259000 }, { - "epoch": 1.31, - "learning_rate": 0.00010398918324411863, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019929130776269436, + "loss": 0.0154, "step": 259010 }, { - "epoch": 1.31, - "learning_rate": 0.00010398161555110463, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.00019928741954632293, + "loss": 0.0142, "step": 259020 }, { - "epoch": 1.31, - "learning_rate": 0.00010397404785809061, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019928353132995144, + "loss": 0.0151, "step": 259030 }, { - "epoch": 1.31, - "learning_rate": 0.0001039664801650766, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019927964311357996, + "loss": 0.016, "step": 259040 }, { - "epoch": 1.31, - "learning_rate": 0.0001039589124720626, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001992757548972085, + "loss": 0.0155, "step": 259050 }, { - "epoch": 1.31, - "learning_rate": 0.00010395134477904858, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.000199271866680837, + "loss": 0.0151, "step": 259060 }, { - "epoch": 1.31, - "learning_rate": 0.00010394377708603458, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.00019926797846446558, + "loss": 0.0196, "step": 259070 }, { - "epoch": 1.31, - "learning_rate": 0.00010393620939302056, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019926409024809412, + "loss": 0.014, "step": 259080 }, { - "epoch": 1.31, - "learning_rate": 0.00010392864170000655, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019926020203172264, + "loss": 0.0163, "step": 259090 }, { - "epoch": 1.31, - "learning_rate": 0.00010392107400699255, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019925631381535118, + "loss": 0.0142, "step": 259100 }, { - "epoch": 1.31, - "learning_rate": 0.00010391350631397853, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019925242559897972, + "loss": 0.0134, "step": 259110 }, { - "epoch": 1.31, - "learning_rate": 0.00010390593862096452, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019924853738260826, + "loss": 0.0161, "step": 259120 }, { - "epoch": 1.31, - "learning_rate": 0.00010389837092795052, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019924464916623678, + "loss": 0.0182, "step": 259130 }, { - "epoch": 1.31, - "learning_rate": 0.0001038908032349365, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019924076094986532, + "loss": 0.0138, "step": 259140 }, { - "epoch": 1.31, - "learning_rate": 0.0001038832355419225, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.00019923687273349386, + "loss": 0.0154, "step": 259150 }, { - "epoch": 1.31, - "learning_rate": 0.00010387566784890849, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.0001992329845171224, + "loss": 0.0138, "step": 259160 }, { - "epoch": 1.31, - "learning_rate": 0.00010386810015589447, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019922909630075092, + "loss": 0.0152, "step": 259170 }, { - "epoch": 1.31, - "learning_rate": 0.00010386053246288047, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019922520808437946, + "loss": 0.0145, "step": 259180 }, { - "epoch": 1.31, - "learning_rate": 0.00010385296476986645, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.000199221319868008, + "loss": 0.018, "step": 259190 }, { - "epoch": 1.31, - "learning_rate": 0.00010384539707685244, - "loss": 0.0118, + "epoch": 0.67, + "learning_rate": 0.00019921743165163654, + "loss": 0.0166, "step": 259200 }, { - "epoch": 1.31, - "learning_rate": 0.00010383782938383844, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019921354343526505, + "loss": 0.0141, "step": 259210 }, { - "epoch": 1.31, - "learning_rate": 0.00010383026169082442, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.0001992096552188936, + "loss": 0.0138, "step": 259220 }, { - "epoch": 1.31, - "learning_rate": 0.00010382269399781041, - "loss": 0.0109, + "epoch": 0.67, + "learning_rate": 0.00019920576700252217, + "loss": 0.0157, "step": 259230 }, { - "epoch": 1.31, - "learning_rate": 0.00010381512630479638, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019920187878615068, + "loss": 0.0132, "step": 259240 }, { - "epoch": 1.31, - "learning_rate": 0.00010380755861178238, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019919799056977922, + "loss": 0.0127, "step": 259250 }, { - "epoch": 1.31, - "learning_rate": 0.00010379999091876837, - "loss": 0.007, + "epoch": 0.67, + "learning_rate": 0.00019919410235340774, + "loss": 0.0168, "step": 259260 }, { - "epoch": 1.31, - "learning_rate": 0.00010379242322575435, - "loss": 0.0124, + "epoch": 0.67, + "learning_rate": 0.0001991902141370363, + "loss": 0.0162, "step": 259270 }, { - "epoch": 1.31, - "learning_rate": 0.00010378485553274035, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019918632592066482, + "loss": 0.016, "step": 259280 }, { - "epoch": 1.31, - "learning_rate": 0.00010377728783972633, - "loss": 0.0089, - "step": 259290 + "epoch": 0.67, + "learning_rate": 0.00019918243770429336, + "loss": 0.0158, + "step": 259290 }, { - "epoch": 1.31, - "learning_rate": 0.00010376972014671233, - "loss": 0.0106, + "epoch": 0.67, + "learning_rate": 0.00019917854948792188, + "loss": 0.0197, "step": 259300 }, { - "epoch": 1.31, - "learning_rate": 0.00010376215245369832, - "loss": 0.0071, + "epoch": 0.67, + "learning_rate": 0.00019917466127155042, + "loss": 0.0195, "step": 259310 }, { - "epoch": 1.31, - "learning_rate": 0.0001037545847606843, - "loss": 0.0108, + "epoch": 0.67, + "learning_rate": 0.00019917077305517896, + "loss": 0.0238, "step": 259320 }, { - "epoch": 1.31, - "learning_rate": 0.0001037470170676703, - "loss": 0.0091, + "epoch": 0.67, + "learning_rate": 0.0001991668848388075, + "loss": 0.0174, "step": 259330 }, { - "epoch": 1.31, - "learning_rate": 0.00010373944937465629, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019916299662243601, + "loss": 0.0105, "step": 259340 }, { - "epoch": 1.31, - "learning_rate": 0.00010373188168164227, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019915910840606456, + "loss": 0.0166, "step": 259350 }, { - "epoch": 1.31, - "learning_rate": 0.00010372431398862827, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.0001991552201896931, + "loss": 0.0154, "step": 259360 }, { - "epoch": 1.31, - "learning_rate": 0.00010371674629561425, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.00019915133197332164, + "loss": 0.0151, "step": 259370 }, { - "epoch": 1.31, - "learning_rate": 0.00010370917860260024, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019914744375695015, + "loss": 0.0183, "step": 259380 }, { - "epoch": 1.31, - "learning_rate": 0.00010370161090958624, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001991435555405787, + "loss": 0.0191, "step": 259390 }, { - "epoch": 1.31, - "learning_rate": 0.00010369404321657222, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019913966732420726, + "loss": 0.016, "step": 259400 }, { - "epoch": 1.31, - "learning_rate": 0.00010368647552355822, - "loss": 0.0103, + "epoch": 0.67, + "learning_rate": 0.00019913577910783578, + "loss": 0.0182, "step": 259410 }, { - "epoch": 1.31, - "learning_rate": 0.00010367890783054421, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019913189089146432, + "loss": 0.0138, "step": 259420 }, { - "epoch": 1.31, - "learning_rate": 0.00010367134013753019, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019912800267509284, + "loss": 0.0165, "step": 259430 }, { - "epoch": 1.31, - "learning_rate": 0.00010366377244451619, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.0001991241144587214, + "loss": 0.0143, "step": 259440 }, { - "epoch": 1.31, - "learning_rate": 0.00010365620475150217, - "loss": 0.0096, + "epoch": 0.67, + "learning_rate": 0.00019912022624234992, + "loss": 0.0152, "step": 259450 }, { - "epoch": 1.31, - "learning_rate": 0.00010364863705848816, - "loss": 0.0117, + "epoch": 0.67, + "learning_rate": 0.00019911633802597846, + "loss": 0.0142, "step": 259460 }, { - "epoch": 1.31, - "learning_rate": 0.00010364106936547416, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019911244980960697, + "loss": 0.0142, "step": 259470 }, { - "epoch": 1.31, - "learning_rate": 0.00010363350167246014, - "loss": 0.0068, + "epoch": 0.67, + "learning_rate": 0.00019910856159323554, + "loss": 0.0137, "step": 259480 }, { - "epoch": 1.31, - "learning_rate": 0.00010362593397944614, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019910467337686406, + "loss": 0.019, "step": 259490 }, { - "epoch": 1.31, - "learning_rate": 0.00010361836628643213, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001991007851604926, + "loss": 0.0136, "step": 259500 }, { - "epoch": 1.31, - "learning_rate": 0.00010361079859341811, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019909689694412111, + "loss": 0.0145, "step": 259510 }, { - "epoch": 1.31, - "learning_rate": 0.00010360323090040411, - "loss": 0.0104, + "epoch": 0.67, + "learning_rate": 0.00019909300872774966, + "loss": 0.0163, "step": 259520 }, { - "epoch": 1.31, - "learning_rate": 0.00010359566320739009, - "loss": 0.0086, + "epoch": 0.67, + "learning_rate": 0.0001990891205113782, + "loss": 0.0152, "step": 259530 }, { - "epoch": 1.31, - "learning_rate": 0.00010358809551437608, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.00019908523229500674, + "loss": 0.0113, "step": 259540 }, { - "epoch": 1.31, - "learning_rate": 0.00010358052782136208, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019908134407863525, + "loss": 0.0173, "step": 259550 }, { - "epoch": 1.31, - "learning_rate": 0.00010357296012834806, - "loss": 0.0122, + "epoch": 0.67, + "learning_rate": 0.0001990774558622638, + "loss": 0.0157, "step": 259560 }, { - "epoch": 1.31, - "learning_rate": 0.00010356539243533405, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.00019907356764589236, + "loss": 0.0152, "step": 259570 }, { - "epoch": 1.31, - "learning_rate": 0.00010355782474232005, - "loss": 0.0083, + "epoch": 0.67, + "learning_rate": 0.00019906967942952088, + "loss": 0.014, "step": 259580 }, { - "epoch": 1.31, - "learning_rate": 0.00010355025704930603, - "loss": 0.012, + "epoch": 0.67, + "learning_rate": 0.0001990657912131494, + "loss": 0.0165, "step": 259590 }, { - "epoch": 1.31, - "learning_rate": 0.00010354268935629203, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019906190299677793, + "loss": 0.0164, "step": 259600 }, { - "epoch": 1.31, - "learning_rate": 0.00010353512166327802, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.0001990580147804065, + "loss": 0.0135, "step": 259610 }, { - "epoch": 1.31, - "learning_rate": 0.000103527553970264, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019905412656403502, + "loss": 0.0144, "step": 259620 }, { - "epoch": 1.31, - "learning_rate": 0.00010351998627725, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019905023834766356, + "loss": 0.0125, "step": 259630 }, { - "epoch": 1.31, - "learning_rate": 0.00010351241858423598, - "loss": 0.0114, + "epoch": 0.67, + "learning_rate": 0.00019904635013129207, + "loss": 0.0157, "step": 259640 }, { - "epoch": 1.31, - "learning_rate": 0.00010350485089122197, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019904246191492064, + "loss": 0.0156, "step": 259650 }, { - "epoch": 1.31, - "learning_rate": 0.00010349728319820797, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019903857369854916, + "loss": 0.016, "step": 259660 }, { - "epoch": 1.31, - "learning_rate": 0.00010348971550519395, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.0001990346854821777, + "loss": 0.0135, "step": 259670 }, { - "epoch": 1.31, - "learning_rate": 0.00010348214781217995, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019903079726580621, + "loss": 0.0135, "step": 259680 }, { - "epoch": 1.31, - "learning_rate": 0.00010347458011916594, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019902690904943478, + "loss": 0.0151, "step": 259690 }, { - "epoch": 1.31, - "learning_rate": 0.00010346701242615192, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.0001990230208330633, + "loss": 0.0143, "step": 259700 }, { - "epoch": 1.31, - "learning_rate": 0.00010345944473313792, - "loss": 0.0106, + "epoch": 0.67, + "learning_rate": 0.00019901913261669184, + "loss": 0.0122, "step": 259710 }, { - "epoch": 1.31, - "learning_rate": 0.0001034518770401239, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.00019901524440032035, + "loss": 0.0161, "step": 259720 }, { - "epoch": 1.31, - "learning_rate": 0.0001034443093471099, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019901135618394892, + "loss": 0.0196, "step": 259730 }, { - "epoch": 1.31, - "learning_rate": 0.00010343674165409589, - "loss": 0.0093, + "epoch": 0.67, + "learning_rate": 0.00019900746796757744, + "loss": 0.0131, "step": 259740 }, { - "epoch": 1.31, - "learning_rate": 0.00010342917396108187, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019900357975120598, + "loss": 0.0155, "step": 259750 }, { - "epoch": 1.31, - "learning_rate": 0.00010342160626806786, - "loss": 0.0067, + "epoch": 0.67, + "learning_rate": 0.0001989996915348345, + "loss": 0.013, "step": 259760 }, { - "epoch": 1.31, - "learning_rate": 0.00010341403857505386, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.00019899580331846303, + "loss": 0.0161, "step": 259770 }, { - "epoch": 1.31, - "learning_rate": 0.00010340647088203984, - "loss": 0.0062, + "epoch": 0.67, + "learning_rate": 0.0001989919151020916, + "loss": 0.0148, "step": 259780 }, { - "epoch": 1.31, - "learning_rate": 0.00010339890318902584, - "loss": 0.0058, + "epoch": 0.67, + "learning_rate": 0.00019898802688572012, + "loss": 0.0164, "step": 259790 }, { - "epoch": 1.31, - "learning_rate": 0.00010339133549601182, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019898413866934866, + "loss": 0.0184, "step": 259800 }, { - "epoch": 1.31, - "learning_rate": 0.00010338376780299781, - "loss": 0.0057, + "epoch": 0.67, + "learning_rate": 0.00019898025045297717, + "loss": 0.0132, "step": 259810 }, { - "epoch": 1.31, - "learning_rate": 0.00010337620010998381, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019897636223660574, + "loss": 0.02, "step": 259820 }, { - "epoch": 1.31, - "learning_rate": 0.00010336863241696979, - "loss": 0.0066, + "epoch": 0.67, + "learning_rate": 0.00019897247402023426, + "loss": 0.0138, "step": 259830 }, { - "epoch": 1.31, - "learning_rate": 0.00010336106472395578, - "loss": 0.0107, + "epoch": 0.67, + "learning_rate": 0.0001989685858038628, + "loss": 0.0132, "step": 259840 }, { - "epoch": 1.31, - "learning_rate": 0.00010335349703094178, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.0001989646975874913, + "loss": 0.0152, "step": 259850 }, { - "epoch": 1.31, - "learning_rate": 0.00010334592933792776, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019896080937111988, + "loss": 0.0132, "step": 259860 }, { - "epoch": 1.31, - "learning_rate": 0.00010333836164491374, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.0001989569211547484, + "loss": 0.018, "step": 259870 }, { - "epoch": 1.31, - "learning_rate": 0.00010333079395189972, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.00019895303293837694, + "loss": 0.0155, "step": 259880 }, { - "epoch": 1.31, - "learning_rate": 0.00010332322625888572, - "loss": 0.0097, + "epoch": 0.67, + "learning_rate": 0.00019894914472200545, + "loss": 0.0137, "step": 259890 }, { - "epoch": 1.31, - "learning_rate": 0.0001033156585658717, - "loss": 0.0079, + "epoch": 0.67, + "learning_rate": 0.00019894525650563402, + "loss": 0.018, "step": 259900 }, { - "epoch": 1.31, - "learning_rate": 0.0001033080908728577, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00019894136828926254, + "loss": 0.017, "step": 259910 }, { - "epoch": 1.31, - "learning_rate": 0.00010330052317984369, - "loss": 0.0061, + "epoch": 0.67, + "learning_rate": 0.00019893748007289108, + "loss": 0.0186, "step": 259920 }, { - "epoch": 1.31, - "learning_rate": 0.00010329295548682967, - "loss": 0.0081, + "epoch": 0.67, + "learning_rate": 0.0001989335918565196, + "loss": 0.014, "step": 259930 }, { - "epoch": 1.31, - "learning_rate": 0.00010328538779381567, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019892970364014816, + "loss": 0.018, "step": 259940 }, { - "epoch": 1.31, - "learning_rate": 0.00010327782010080166, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0001989258154237767, + "loss": 0.0148, "step": 259950 }, { - "epoch": 1.31, - "learning_rate": 0.00010327025240778764, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019892192720740522, + "loss": 0.016, "step": 259960 }, { - "epoch": 1.31, - "learning_rate": 0.00010326268471477364, - "loss": 0.0088, + "epoch": 0.67, + "learning_rate": 0.00019891803899103376, + "loss": 0.0147, "step": 259970 }, { - "epoch": 1.31, - "learning_rate": 0.00010325511702175962, - "loss": 0.008, + "epoch": 0.67, + "learning_rate": 0.0001989141507746623, + "loss": 0.0142, "step": 259980 }, { - "epoch": 1.31, - "learning_rate": 0.00010324754932874561, - "loss": 0.0084, + "epoch": 0.67, + "learning_rate": 0.00019891026255829084, + "loss": 0.0168, "step": 259990 }, { - "epoch": 1.31, - "learning_rate": 0.00010323998163573161, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019890637434191936, + "loss": 0.0179, "step": 260000 }, { - "epoch": 1.31, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.006425743922591209, - "eval_runtime": 116.2948, - "eval_samples_per_second": 17.198, - "eval_steps_per_second": 4.299, + "epoch": 0.67, + "eval_cer": 0.881806259456297, + "eval_loss": 0.010559357702732086, + "eval_runtime": 107.5865, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.647, "step": 260000 }, { - "epoch": 1.31, - "learning_rate": 0.00010323241394271759, - "loss": 0.0065, + "epoch": 0.67, + "learning_rate": 0.0001989024861255479, + "loss": 0.0177, "step": 260010 }, { - "epoch": 1.31, - "learning_rate": 0.00010322484624970359, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.0001988985979091764, + "loss": 0.0173, "step": 260020 }, { - "epoch": 1.31, - "learning_rate": 0.00010321727855668958, - "loss": 0.0094, + "epoch": 0.67, + "learning_rate": 0.00019889470969280498, + "loss": 0.0128, "step": 260030 }, { - "epoch": 1.31, - "learning_rate": 0.00010320971086367556, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0001988908214764335, + "loss": 0.0193, "step": 260040 }, { - "epoch": 1.31, - "learning_rate": 0.00010320214317066156, - "loss": 0.0106, + "epoch": 0.67, + "learning_rate": 0.00019888693326006204, + "loss": 0.0116, "step": 260050 }, { - "epoch": 1.31, - "learning_rate": 0.00010319457547764755, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019888304504369055, + "loss": 0.0177, "step": 260060 }, { - "epoch": 1.31, - "learning_rate": 0.00010318700778463353, - "loss": 0.0092, + "epoch": 0.67, + "learning_rate": 0.00019887915682731912, + "loss": 0.0185, "step": 260070 }, { - "epoch": 1.31, - "learning_rate": 0.00010317944009161953, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019887526861094764, + "loss": 0.0139, "step": 260080 }, { - "epoch": 1.31, - "learning_rate": 0.00010317187239860551, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019887138039457618, + "loss": 0.0157, "step": 260090 }, { - "epoch": 1.31, - "learning_rate": 0.0001031643047055915, - "loss": 0.0072, + "epoch": 0.67, + "learning_rate": 0.0001988674921782047, + "loss": 0.0166, "step": 260100 }, { - "epoch": 1.31, - "learning_rate": 0.0001031567370125775, - "loss": 0.0109, + "epoch": 0.67, + "learning_rate": 0.00019886360396183326, + "loss": 0.0172, "step": 260110 }, { - "epoch": 1.31, - "learning_rate": 0.00010314916931956348, - "loss": 0.0062, + "epoch": 0.67, + "learning_rate": 0.0001988597157454618, + "loss": 0.0149, "step": 260120 }, { - "epoch": 1.31, - "learning_rate": 0.00010314160162654948, - "loss": 0.0117, + "epoch": 0.67, + "learning_rate": 0.00019885582752909032, + "loss": 0.0159, "step": 260130 }, { - "epoch": 1.31, - "learning_rate": 0.00010313403393353547, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.00019885193931271883, + "loss": 0.0127, "step": 260140 }, { - "epoch": 1.31, - "learning_rate": 0.00010312646624052145, - "loss": 0.0078, + "epoch": 0.67, + "learning_rate": 0.0001988480510963474, + "loss": 0.0159, "step": 260150 }, { - "epoch": 1.31, - "learning_rate": 0.00010311889854750745, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00019884416287997594, + "loss": 0.0142, "step": 260160 }, { - "epoch": 1.31, - "learning_rate": 0.00010311133085449343, - "loss": 0.0069, + "epoch": 0.67, + "learning_rate": 0.00019884027466360446, + "loss": 0.015, "step": 260170 }, { - "epoch": 1.31, - "learning_rate": 0.00010310376316147942, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.000198836386447233, + "loss": 0.0157, "step": 260180 }, { - "epoch": 1.31, - "learning_rate": 0.00010309619546846542, - "loss": 0.006, + "epoch": 0.67, + "learning_rate": 0.00019883249823086154, + "loss": 0.017, "step": 260190 }, { - "epoch": 1.31, - "learning_rate": 0.0001030886277754514, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.00019882861001449008, + "loss": 0.0125, "step": 260200 }, { - "epoch": 1.31, - "learning_rate": 0.0001030810600824374, - "loss": 0.0125, + "epoch": 0.67, + "learning_rate": 0.0001988247217981186, + "loss": 0.0161, "step": 260210 }, { - "epoch": 1.31, - "learning_rate": 0.00010307349238942339, - "loss": 0.0064, + "epoch": 0.67, + "learning_rate": 0.00019882083358174714, + "loss": 0.0142, "step": 260220 }, { - "epoch": 1.31, - "learning_rate": 0.00010306592469640937, - "loss": 0.0095, + "epoch": 0.67, + "learning_rate": 0.00019881694536537568, + "loss": 0.016, "step": 260230 }, { - "epoch": 1.31, - "learning_rate": 0.00010305835700339537, - "loss": 0.0073, + "epoch": 0.67, + "learning_rate": 0.00019881305714900422, + "loss": 0.0135, "step": 260240 }, { - "epoch": 1.31, - "learning_rate": 0.00010305078931038135, - "loss": 0.009, + "epoch": 0.67, + "learning_rate": 0.00019880916893263273, + "loss": 0.0186, "step": 260250 }, { - "epoch": 1.31, - "learning_rate": 0.00010304322161736734, - "loss": 0.0082, + "epoch": 0.67, + "learning_rate": 0.00019880528071626128, + "loss": 0.0137, "step": 260260 }, { - "epoch": 1.31, - "learning_rate": 0.00010303565392435334, - "loss": 0.0101, + "epoch": 0.67, + "learning_rate": 0.0001988013924998898, + "loss": 0.0168, "step": 260270 }, { - "epoch": 1.31, - "learning_rate": 0.00010302808623133932, - "loss": 0.0089, + "epoch": 0.67, + "learning_rate": 0.00019879750428351836, + "loss": 0.0138, "step": 260280 }, { - "epoch": 1.31, - "learning_rate": 0.00010302051853832531, - "loss": 0.0112, + "epoch": 0.67, + "learning_rate": 0.0001987936160671469, + "loss": 0.0144, "step": 260290 }, { - "epoch": 1.31, - "learning_rate": 0.00010301295084531131, - "loss": 0.01, + "epoch": 0.67, + "learning_rate": 0.00019878972785077542, + "loss": 0.013, "step": 260300 }, { - "epoch": 1.31, - "learning_rate": 0.00010300538315229729, - "loss": 0.0062, + "epoch": 0.67, + "learning_rate": 0.00019878583963440393, + "loss": 0.0121, "step": 260310 }, { - "epoch": 1.31, - "learning_rate": 0.00010299781545928329, - "loss": 0.0077, + "epoch": 0.67, + "learning_rate": 0.0001987819514180325, + "loss": 0.0163, "step": 260320 }, { - "epoch": 1.31, - "learning_rate": 0.00010299024776626927, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019877806320166104, + "loss": 0.0151, "step": 260330 }, { - "epoch": 1.31, - "learning_rate": 0.00010298268007325526, - "loss": 0.0063, + "epoch": 0.67, + "learning_rate": 0.00019877417498528956, + "loss": 0.0145, "step": 260340 }, { - "epoch": 1.31, - "learning_rate": 0.00010297511238024126, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.0001987702867689181, + "loss": 0.0132, "step": 260350 }, { - "epoch": 1.31, - "learning_rate": 0.00010296754468722724, - "loss": 0.0087, + "epoch": 0.67, + "learning_rate": 0.00019876639855254664, + "loss": 0.0138, "step": 260360 }, { - "epoch": 1.31, - "learning_rate": 0.00010295997699421323, - "loss": 0.0085, + "epoch": 0.67, + "learning_rate": 0.00019876251033617518, + "loss": 0.0136, "step": 260370 }, { - "epoch": 1.31, - "learning_rate": 0.00010295240930119923, - "loss": 0.0076, + "epoch": 0.67, + "learning_rate": 0.0001987586221198037, + "loss": 0.0117, "step": 260380 }, { - "epoch": 1.31, - "learning_rate": 0.00010294484160818521, - "loss": 0.0075, + "epoch": 0.67, + "learning_rate": 0.00019875473390343224, + "loss": 0.0121, "step": 260390 }, { - "epoch": 1.31, - "learning_rate": 0.0001029372739151712, - "loss": 0.0074, + "epoch": 0.67, + "learning_rate": 0.00019875084568706078, + "loss": 0.0183, "step": 260400 }, { - "epoch": 1.31, - "learning_rate": 0.00010292970622215719, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019874695747068932, + "loss": 0.0173, "step": 260410 }, { - "epoch": 1.31, - "learning_rate": 0.00010292213852914318, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019874306925431783, + "loss": 0.0169, "step": 260420 }, { - "epoch": 1.31, - "learning_rate": 0.00010291457083612918, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019873918103794638, + "loss": 0.0153, "step": 260430 }, { - "epoch": 1.31, - "learning_rate": 0.00010290700314311516, - "loss": 0.0107, + "epoch": 0.68, + "learning_rate": 0.00019873529282157494, + "loss": 0.0171, "step": 260440 }, { - "epoch": 1.31, - "learning_rate": 0.00010289943545010115, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019873140460520346, + "loss": 0.0166, "step": 260450 }, { - "epoch": 1.31, - "learning_rate": 0.00010289186775708715, - "loss": 0.0061, + "epoch": 0.68, + "learning_rate": 0.00019872751638883197, + "loss": 0.0183, "step": 260460 }, { - "epoch": 1.31, - "learning_rate": 0.00010288430006407313, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019872362817246052, + "loss": 0.0172, "step": 260470 }, { - "epoch": 1.31, - "learning_rate": 0.00010287673237105912, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019871973995608908, + "loss": 0.018, "step": 260480 }, { - "epoch": 1.31, - "learning_rate": 0.00010286916467804509, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001987158517397176, + "loss": 0.0124, "step": 260490 }, { - "epoch": 1.31, - "learning_rate": 0.00010286159698503109, - "loss": 0.011, + "epoch": 0.68, + "learning_rate": 0.00019871196352334614, + "loss": 0.0151, "step": 260500 }, { - "epoch": 1.31, - "learning_rate": 0.00010285402929201708, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019870807530697465, + "loss": 0.0166, "step": 260510 }, { - "epoch": 1.31, - "learning_rate": 0.00010284646159900306, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.0001987041870906032, + "loss": 0.0183, "step": 260520 }, { - "epoch": 1.31, - "learning_rate": 0.00010283889390598906, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019870029887423174, + "loss": 0.0152, "step": 260530 }, { - "epoch": 1.31, - "learning_rate": 0.00010283132621297504, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019869641065786028, + "loss": 0.013, "step": 260540 }, { - "epoch": 1.31, - "learning_rate": 0.00010282375851996104, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.0001986925224414888, + "loss": 0.0186, "step": 260550 }, { - "epoch": 1.31, - "learning_rate": 0.00010281619082694703, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019868863422511734, + "loss": 0.0175, "step": 260560 }, { - "epoch": 1.31, - "learning_rate": 0.00010280862313393301, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019868474600874588, + "loss": 0.0136, "step": 260570 }, { - "epoch": 1.31, - "learning_rate": 0.00010280105544091901, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019868085779237442, + "loss": 0.0145, "step": 260580 }, { - "epoch": 1.31, - "learning_rate": 0.000102793487747905, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019867696957600293, + "loss": 0.0157, "step": 260590 }, { - "epoch": 1.31, - "learning_rate": 0.00010278592005489098, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019867308135963148, + "loss": 0.0178, "step": 260600 }, { - "epoch": 1.31, - "learning_rate": 0.00010277835236187698, - "loss": 0.0064, + "epoch": 0.68, + "learning_rate": 0.00019866919314326004, + "loss": 0.0181, "step": 260610 }, { - "epoch": 1.31, - "learning_rate": 0.00010277078466886296, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019866530492688856, + "loss": 0.0139, "step": 260620 }, { - "epoch": 1.31, - "learning_rate": 0.00010276321697584895, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019866141671051707, + "loss": 0.0132, "step": 260630 }, { - "epoch": 1.31, - "learning_rate": 0.00010275564928283495, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019865752849414561, + "loss": 0.014, "step": 260640 }, { - "epoch": 1.32, - "learning_rate": 0.00010274808158982093, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019865364027777418, + "loss": 0.0148, "step": 260650 }, { - "epoch": 1.32, - "learning_rate": 0.00010274051389680693, - "loss": 0.0098, + "epoch": 0.68, + "learning_rate": 0.0001986497520614027, + "loss": 0.0135, "step": 260660 }, { - "epoch": 1.32, - "learning_rate": 0.00010273294620379292, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019864586384503124, + "loss": 0.0168, "step": 260670 }, { - "epoch": 1.32, - "learning_rate": 0.0001027253785107789, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019864197562865975, + "loss": 0.0127, "step": 260680 }, { - "epoch": 1.32, - "learning_rate": 0.0001027178108177649, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019863808741228832, + "loss": 0.0221, "step": 260690 }, { - "epoch": 1.32, - "learning_rate": 0.00010271024312475088, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019863419919591684, + "loss": 0.0164, "step": 260700 }, { - "epoch": 1.32, - "learning_rate": 0.00010270267543173687, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019863031097954538, + "loss": 0.0157, "step": 260710 }, { - "epoch": 1.32, - "learning_rate": 0.00010269510773872287, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001986264227631739, + "loss": 0.0142, "step": 260720 }, { - "epoch": 1.32, - "learning_rate": 0.00010268754004570885, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019862253454680246, + "loss": 0.0153, "step": 260730 }, { - "epoch": 1.32, - "learning_rate": 0.00010267997235269485, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.00019861864633043098, + "loss": 0.0139, "step": 260740 }, { - "epoch": 1.32, - "learning_rate": 0.00010267240465968084, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019861475811405952, + "loss": 0.0167, "step": 260750 }, { - "epoch": 1.32, - "learning_rate": 0.00010266483696666682, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.00019861086989768803, + "loss": 0.0142, "step": 260760 }, { - "epoch": 1.32, - "learning_rate": 0.00010265726927365282, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019860698168131657, + "loss": 0.0131, "step": 260770 }, { - "epoch": 1.32, - "learning_rate": 0.0001026497015806388, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019860309346494512, + "loss": 0.0137, "step": 260780 }, { - "epoch": 1.32, - "learning_rate": 0.0001026421338876248, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019859920524857366, + "loss": 0.0139, "step": 260790 }, { - "epoch": 1.32, - "learning_rate": 0.00010263456619461079, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019859531703220217, + "loss": 0.0142, "step": 260800 }, { - "epoch": 1.32, - "learning_rate": 0.00010262699850159677, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019859142881583071, + "loss": 0.0159, "step": 260810 }, { - "epoch": 1.32, - "learning_rate": 0.00010261943080858276, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.00019858754059945928, + "loss": 0.0177, "step": 260820 }, { - "epoch": 1.32, - "learning_rate": 0.00010261186311556876, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.0001985836523830878, + "loss": 0.0171, "step": 260830 }, { - "epoch": 1.32, - "learning_rate": 0.00010260429542255474, - "loss": 0.0098, + "epoch": 0.68, + "learning_rate": 0.00019857976416671634, + "loss": 0.0136, "step": 260840 }, { - "epoch": 1.32, - "learning_rate": 0.00010259672772954074, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019857587595034485, + "loss": 0.0117, "step": 260850 }, { - "epoch": 1.32, - "learning_rate": 0.00010258916003652672, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019857198773397342, + "loss": 0.0168, "step": 260860 }, { - "epoch": 1.32, - "learning_rate": 0.00010258159234351271, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019856809951760194, + "loss": 0.017, "step": 260870 }, { - "epoch": 1.32, - "learning_rate": 0.00010257402465049871, - "loss": 0.0052, + "epoch": 0.68, + "learning_rate": 0.00019856421130123048, + "loss": 0.0135, "step": 260880 }, { - "epoch": 1.32, - "learning_rate": 0.00010256645695748469, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.000198560323084859, + "loss": 0.0137, "step": 260890 }, { - "epoch": 1.32, - "learning_rate": 0.00010255888926447068, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019855643486848756, + "loss": 0.0152, "step": 260900 }, { - "epoch": 1.32, - "learning_rate": 0.00010255132157145668, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019855254665211608, + "loss": 0.0121, "step": 260910 }, { - "epoch": 1.32, - "learning_rate": 0.00010254375387844266, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019854865843574462, + "loss": 0.0146, "step": 260920 }, { - "epoch": 1.32, - "learning_rate": 0.00010253618618542866, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019854477021937313, + "loss": 0.0117, "step": 260930 }, { - "epoch": 1.32, - "learning_rate": 0.00010252861849241464, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.0001985408820030017, + "loss": 0.0175, "step": 260940 }, { - "epoch": 1.32, - "learning_rate": 0.00010252105079940063, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019853699378663022, + "loss": 0.0147, "step": 260950 }, { - "epoch": 1.32, - "learning_rate": 0.00010251348310638663, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019853310557025876, + "loss": 0.018, "step": 260960 }, { - "epoch": 1.32, - "learning_rate": 0.00010250591541337261, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019852921735388727, + "loss": 0.0143, "step": 260970 }, { - "epoch": 1.32, - "learning_rate": 0.0001024983477203586, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019852532913751584, + "loss": 0.0128, "step": 260980 }, { - "epoch": 1.32, - "learning_rate": 0.0001024907800273446, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019852144092114438, + "loss": 0.0135, "step": 260990 }, { - "epoch": 1.32, - "learning_rate": 0.00010248321233433058, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.0001985175527047729, + "loss": 0.0119, "step": 261000 }, { - "epoch": 1.32, - "eval_cer": 0.9144343512465224, - "eval_loss": 0.006257697008550167, - "eval_runtime": 116.3265, - "eval_samples_per_second": 17.193, - "eval_steps_per_second": 4.298, + "epoch": 0.68, + "eval_cer": 0.8817236808771804, + "eval_loss": 0.010634180158376694, + "eval_runtime": 107.7642, + "eval_samples_per_second": 18.559, + "eval_steps_per_second": 4.64, "step": 261000 }, { - "epoch": 1.32, - "learning_rate": 0.00010247564464131657, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019851366448840144, + "loss": 0.0155, "step": 261010 }, { - "epoch": 1.32, - "learning_rate": 0.00010246807694830256, - "loss": 0.006, + "epoch": 0.68, + "learning_rate": 0.00019850977627202995, + "loss": 0.0115, "step": 261020 }, { - "epoch": 1.32, - "learning_rate": 0.00010246050925528855, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019850588805565852, + "loss": 0.0165, "step": 261030 }, { - "epoch": 1.32, - "learning_rate": 0.00010245294156227455, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.00019850199983928704, + "loss": 0.0171, "step": 261040 }, { - "epoch": 1.32, - "learning_rate": 0.00010244537386926053, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019849811162291558, + "loss": 0.0189, "step": 261050 }, { - "epoch": 1.32, - "learning_rate": 0.00010243780617624652, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.0001984942234065441, + "loss": 0.0181, "step": 261060 }, { - "epoch": 1.32, - "learning_rate": 0.00010243023848323252, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019849033519017266, + "loss": 0.0197, "step": 261070 }, { - "epoch": 1.32, - "learning_rate": 0.0001024226707902185, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019848644697380118, + "loss": 0.0146, "step": 261080 }, { - "epoch": 1.32, - "learning_rate": 0.0001024151030972045, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019848255875742972, + "loss": 0.0128, "step": 261090 }, { - "epoch": 1.32, - "learning_rate": 0.00010240753540419049, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019847867054105823, + "loss": 0.0161, "step": 261100 }, { - "epoch": 1.32, - "learning_rate": 0.00010239996771117647, - "loss": 0.0109, + "epoch": 0.68, + "learning_rate": 0.0001984747823246868, + "loss": 0.0173, "step": 261110 }, { - "epoch": 1.32, - "learning_rate": 0.00010239240001816245, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019847089410831531, + "loss": 0.0153, "step": 261120 }, { - "epoch": 1.32, - "learning_rate": 0.00010238483232514843, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019846700589194386, + "loss": 0.0111, "step": 261130 }, { - "epoch": 1.32, - "learning_rate": 0.00010237726463213443, - "loss": 0.0107, + "epoch": 0.68, + "learning_rate": 0.00019846311767557237, + "loss": 0.0183, "step": 261140 }, { - "epoch": 1.32, - "learning_rate": 0.00010236969693912041, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019845922945920094, + "loss": 0.0137, "step": 261150 }, { - "epoch": 1.32, - "learning_rate": 0.0001023621292461064, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019845534124282948, + "loss": 0.0196, "step": 261160 }, { - "epoch": 1.32, - "learning_rate": 0.0001023545615530924, - "loss": 0.0109, + "epoch": 0.68, + "learning_rate": 0.000198451453026458, + "loss": 0.0117, "step": 261170 }, { - "epoch": 1.32, - "learning_rate": 0.00010234699386007838, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001984475648100865, + "loss": 0.0153, "step": 261180 }, { - "epoch": 1.32, - "learning_rate": 0.00010233942616706438, - "loss": 0.0108, + "epoch": 0.68, + "learning_rate": 0.00019844367659371508, + "loss": 0.0147, "step": 261190 }, { - "epoch": 1.32, - "learning_rate": 0.00010233185847405037, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019843978837734362, + "loss": 0.0136, "step": 261200 }, { - "epoch": 1.32, - "learning_rate": 0.00010232429078103635, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019843590016097214, + "loss": 0.0157, "step": 261210 }, { - "epoch": 1.32, - "learning_rate": 0.00010231672308802235, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019843201194460068, + "loss": 0.0171, "step": 261220 }, { - "epoch": 1.32, - "learning_rate": 0.00010230915539500833, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019842812372822922, + "loss": 0.0201, "step": 261230 }, { - "epoch": 1.32, - "learning_rate": 0.00010230158770199432, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019842423551185776, + "loss": 0.0166, "step": 261240 }, { - "epoch": 1.32, - "learning_rate": 0.00010229402000898032, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019842034729548627, + "loss": 0.0187, "step": 261250 }, { - "epoch": 1.32, - "learning_rate": 0.0001022864523159663, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019841645907911482, + "loss": 0.0161, "step": 261260 }, { - "epoch": 1.32, - "learning_rate": 0.0001022788846229523, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019841257086274333, + "loss": 0.0159, "step": 261270 }, { - "epoch": 1.32, - "learning_rate": 0.00010227131692993829, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.0001984086826463719, + "loss": 0.0131, "step": 261280 }, { - "epoch": 1.32, - "learning_rate": 0.00010226374923692427, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019840479443000041, + "loss": 0.0149, "step": 261290 }, { - "epoch": 1.32, - "learning_rate": 0.00010225618154391027, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019840090621362896, + "loss": 0.0152, "step": 261300 }, { - "epoch": 1.32, - "learning_rate": 0.00010224861385089625, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019839701799725747, + "loss": 0.0143, "step": 261310 }, { - "epoch": 1.32, - "learning_rate": 0.00010224104615788224, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.00019839312978088604, + "loss": 0.0141, "step": 261320 }, { - "epoch": 1.32, - "learning_rate": 0.00010223347846486824, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019838924156451455, + "loss": 0.0151, "step": 261330 }, { - "epoch": 1.32, - "learning_rate": 0.00010222591077185422, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.0001983853533481431, + "loss": 0.0133, "step": 261340 }, { - "epoch": 1.32, - "learning_rate": 0.00010221834307884022, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.0001983814651317716, + "loss": 0.0163, "step": 261350 }, { - "epoch": 1.32, - "learning_rate": 0.00010221077538582621, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019837757691540018, + "loss": 0.0187, "step": 261360 }, { - "epoch": 1.32, - "learning_rate": 0.00010220320769281219, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019837368869902872, + "loss": 0.016, "step": 261370 }, { - "epoch": 1.32, - "learning_rate": 0.00010219563999979819, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019836980048265723, + "loss": 0.0143, "step": 261380 }, { - "epoch": 1.32, - "learning_rate": 0.00010218807230678417, - "loss": 0.0058, + "epoch": 0.68, + "learning_rate": 0.00019836591226628578, + "loss": 0.0135, "step": 261390 }, { - "epoch": 1.32, - "learning_rate": 0.00010218050461377016, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019836202404991432, + "loss": 0.0137, "step": 261400 }, { - "epoch": 1.32, - "learning_rate": 0.00010217293692075616, - "loss": 0.0111, + "epoch": 0.68, + "learning_rate": 0.00019835813583354286, + "loss": 0.0271, "step": 261410 }, { - "epoch": 1.32, - "learning_rate": 0.00010216536922774214, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019835424761717137, + "loss": 0.012, "step": 261420 }, { - "epoch": 1.32, - "learning_rate": 0.00010215780153472813, - "loss": 0.0102, + "epoch": 0.68, + "learning_rate": 0.00019835035940079992, + "loss": 0.0138, "step": 261430 }, { - "epoch": 1.32, - "learning_rate": 0.00010215023384171413, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019834647118442846, + "loss": 0.0188, "step": 261440 }, { - "epoch": 1.32, - "learning_rate": 0.00010214266614870011, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.000198342582968057, + "loss": 0.0144, "step": 261450 }, { - "epoch": 1.32, - "learning_rate": 0.0001021350984556861, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019833869475168551, + "loss": 0.0163, "step": 261460 }, { - "epoch": 1.32, - "learning_rate": 0.00010212753076267209, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019833480653531406, + "loss": 0.0151, "step": 261470 }, { - "epoch": 1.32, - "learning_rate": 0.00010211996306965808, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019833091831894262, + "loss": 0.0123, "step": 261480 }, { - "epoch": 1.32, - "learning_rate": 0.00010211239537664408, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019832703010257114, + "loss": 0.0144, "step": 261490 }, { - "epoch": 1.32, - "learning_rate": 0.00010210482768363006, - "loss": 0.0124, + "epoch": 0.68, + "learning_rate": 0.00019832314188619965, + "loss": 0.0183, "step": 261500 }, { - "epoch": 1.32, - "learning_rate": 0.00010209725999061605, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.0001983192536698282, + "loss": 0.0197, "step": 261510 }, { - "epoch": 1.32, - "learning_rate": 0.00010208969229760205, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.0001983153654534567, + "loss": 0.0135, "step": 261520 }, { - "epoch": 1.32, - "learning_rate": 0.00010208212460458803, - "loss": 0.0102, + "epoch": 0.68, + "learning_rate": 0.00019831147723708528, + "loss": 0.0159, "step": 261530 }, { - "epoch": 1.32, - "learning_rate": 0.00010207455691157403, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019830758902071382, + "loss": 0.0137, "step": 261540 }, { - "epoch": 1.32, - "learning_rate": 0.00010206698921856002, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019830370080434233, + "loss": 0.0143, "step": 261550 }, { - "epoch": 1.32, - "learning_rate": 0.000102059421525546, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019829981258797088, + "loss": 0.015, "step": 261560 }, { - "epoch": 1.32, - "learning_rate": 0.000102051853832532, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019829592437159942, + "loss": 0.019, "step": 261570 }, { - "epoch": 1.32, - "learning_rate": 0.00010204428613951798, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019829203615522796, + "loss": 0.0168, "step": 261580 }, { - "epoch": 1.32, - "learning_rate": 0.00010203671844650397, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019828814793885647, + "loss": 0.0189, "step": 261590 }, { - "epoch": 1.32, - "learning_rate": 0.00010202915075348997, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019828425972248502, + "loss": 0.015, "step": 261600 }, { - "epoch": 1.32, - "learning_rate": 0.00010202158306047595, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.00019828037150611356, + "loss": 0.0188, "step": 261610 }, { - "epoch": 1.32, - "learning_rate": 0.00010201401536746194, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001982764832897421, + "loss": 0.0157, "step": 261620 }, { - "epoch": 1.32, - "learning_rate": 0.00010200644767444794, - "loss": 0.0104, + "epoch": 0.68, + "learning_rate": 0.0001982725950733706, + "loss": 0.0183, "step": 261630 }, { - "epoch": 1.32, - "learning_rate": 0.00010199887998143392, - "loss": 0.0064, + "epoch": 0.68, + "learning_rate": 0.00019826870685699915, + "loss": 0.0159, "step": 261640 }, { - "epoch": 1.32, - "learning_rate": 0.00010199131228841992, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.0001982648186406277, + "loss": 0.0129, "step": 261650 }, { - "epoch": 1.32, - "learning_rate": 0.0001019837445954059, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019826093042425624, + "loss": 0.018, "step": 261660 }, { - "epoch": 1.32, - "learning_rate": 0.00010197617690239189, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019825704220788475, + "loss": 0.0158, "step": 261670 }, { - "epoch": 1.32, - "learning_rate": 0.00010196860920937789, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.0001982531539915133, + "loss": 0.0183, "step": 261680 }, { - "epoch": 1.32, - "learning_rate": 0.00010196104151636387, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019824926577514186, + "loss": 0.015, "step": 261690 }, { - "epoch": 1.32, - "learning_rate": 0.00010195347382334986, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.00019824537755877038, + "loss": 0.0187, "step": 261700 }, { - "epoch": 1.32, - "learning_rate": 0.00010194590613033586, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019824148934239892, + "loss": 0.0123, "step": 261710 }, { - "epoch": 1.32, - "learning_rate": 0.00010193833843732184, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019823760112602743, + "loss": 0.0171, "step": 261720 }, { - "epoch": 1.32, - "learning_rate": 0.00010193077074430784, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.000198233712909656, + "loss": 0.0137, "step": 261730 }, { - "epoch": 1.32, - "learning_rate": 0.00010192320305129382, - "loss": 0.0121, + "epoch": 0.68, + "learning_rate": 0.00019822982469328452, + "loss": 0.0116, "step": 261740 }, { - "epoch": 1.32, - "learning_rate": 0.0001019156353582798, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019822593647691306, + "loss": 0.0149, "step": 261750 }, { - "epoch": 1.32, - "learning_rate": 0.00010190806766526578, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019822204826054157, + "loss": 0.0119, "step": 261760 }, { - "epoch": 1.32, - "learning_rate": 0.00010190049997225177, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019821816004417011, + "loss": 0.013, "step": 261770 }, { - "epoch": 1.32, - "learning_rate": 0.00010189293227923777, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019821427182779866, + "loss": 0.0203, "step": 261780 }, { - "epoch": 1.32, - "learning_rate": 0.00010188536458622375, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.0001982103836114272, + "loss": 0.0167, "step": 261790 }, { - "epoch": 1.32, - "learning_rate": 0.00010187779689320975, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.0001982064953950557, + "loss": 0.0143, "step": 261800 }, { - "epoch": 1.32, - "learning_rate": 0.00010187022920019574, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019820260717868425, + "loss": 0.0153, "step": 261810 }, { - "epoch": 1.32, - "learning_rate": 0.00010186266150718172, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.0001981987189623128, + "loss": 0.0146, "step": 261820 }, { - "epoch": 1.32, - "learning_rate": 0.00010185509381416772, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019819483074594134, + "loss": 0.0166, "step": 261830 }, { - "epoch": 1.32, - "learning_rate": 0.0001018475261211537, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019819094252956985, + "loss": 0.0159, "step": 261840 }, { - "epoch": 1.32, - "learning_rate": 0.0001018399584281397, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.0001981870543131984, + "loss": 0.0167, "step": 261850 }, { - "epoch": 1.32, - "learning_rate": 0.00010183239073512569, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019818316609682696, + "loss": 0.0149, "step": 261860 }, { - "epoch": 1.32, - "learning_rate": 0.00010182482304211167, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019817927788045548, + "loss": 0.0136, "step": 261870 }, { - "epoch": 1.32, - "learning_rate": 0.00010181725534909767, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019817538966408402, + "loss": 0.015, "step": 261880 }, { - "epoch": 1.32, - "learning_rate": 0.00010180968765608366, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.00019817150144771253, + "loss": 0.0141, "step": 261890 }, { - "epoch": 1.32, - "learning_rate": 0.00010180211996306964, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.0001981676132313411, + "loss": 0.0116, "step": 261900 }, { - "epoch": 1.32, - "learning_rate": 0.00010179455227005564, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019816372501496962, + "loss": 0.0143, "step": 261910 }, { - "epoch": 1.32, - "learning_rate": 0.00010178698457704162, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019815983679859816, + "loss": 0.0188, "step": 261920 }, { - "epoch": 1.32, - "learning_rate": 0.00010177941688402761, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019815594858222667, + "loss": 0.0167, "step": 261930 }, { - "epoch": 1.32, - "learning_rate": 0.00010177184919101361, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019815206036585524, + "loss": 0.0198, "step": 261940 }, { - "epoch": 1.32, - "learning_rate": 0.00010176428149799959, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019814817214948376, + "loss": 0.0126, "step": 261950 }, { - "epoch": 1.32, - "learning_rate": 0.00010175671380498558, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.0001981442839331123, + "loss": 0.0159, "step": 261960 }, { - "epoch": 1.32, - "learning_rate": 0.00010174914611197158, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.0001981403957167408, + "loss": 0.0173, "step": 261970 }, { - "epoch": 1.32, - "learning_rate": 0.00010174157841895756, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019813650750036938, + "loss": 0.0144, "step": 261980 }, { - "epoch": 1.32, - "learning_rate": 0.00010173401072594356, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001981326192839979, + "loss": 0.0188, "step": 261990 }, { - "epoch": 1.32, - "learning_rate": 0.00010172644303292955, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019812873106762644, + "loss": 0.0156, "step": 262000 }, { - "epoch": 1.32, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.006132941693067551, - "eval_runtime": 116.3656, - "eval_samples_per_second": 17.187, - "eval_steps_per_second": 4.297, + "epoch": 0.68, + "eval_cer": 0.8817460750681273, + "eval_loss": 0.010492046363651752, + "eval_runtime": 107.6887, + "eval_samples_per_second": 18.572, + "eval_steps_per_second": 4.643, "step": 262000 }, { - "epoch": 1.32, - "learning_rate": 0.00010171887533991553, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019812484285125495, + "loss": 0.0173, "step": 262010 }, { - "epoch": 1.32, - "learning_rate": 0.00010171130764690153, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001981209546348835, + "loss": 0.0152, "step": 262020 }, { - "epoch": 1.32, - "learning_rate": 0.00010170373995388751, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019811706641851206, + "loss": 0.016, "step": 262030 }, { - "epoch": 1.32, - "learning_rate": 0.0001016961722608735, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019811317820214058, + "loss": 0.0155, "step": 262040 }, { - "epoch": 1.32, - "learning_rate": 0.0001016886045678595, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.0001981092899857691, + "loss": 0.0145, "step": 262050 }, { - "epoch": 1.32, - "learning_rate": 0.00010168103687484548, - "loss": 0.0128, + "epoch": 0.68, + "learning_rate": 0.00019810540176939763, + "loss": 0.0152, "step": 262060 }, { - "epoch": 1.32, - "learning_rate": 0.00010167346918183148, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.0001981015135530262, + "loss": 0.0147, "step": 262070 }, { - "epoch": 1.32, - "learning_rate": 0.00010166590148881747, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019809762533665472, + "loss": 0.0132, "step": 262080 }, { - "epoch": 1.32, - "learning_rate": 0.00010165833379580345, - "loss": 0.01, + "epoch": 0.68, + "learning_rate": 0.00019809373712028326, + "loss": 0.0163, "step": 262090 }, { - "epoch": 1.32, - "learning_rate": 0.00010165076610278945, - "loss": 0.0071, + "epoch": 0.68, + "learning_rate": 0.00019808984890391177, + "loss": 0.0173, "step": 262100 }, { - "epoch": 1.32, - "learning_rate": 0.00010164319840977543, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019808596068754034, + "loss": 0.0186, "step": 262110 }, { - "epoch": 1.32, - "learning_rate": 0.00010163563071676142, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019808207247116886, + "loss": 0.0184, "step": 262120 }, { - "epoch": 1.32, - "learning_rate": 0.00010162806302374742, - "loss": 0.01, + "epoch": 0.68, + "learning_rate": 0.0001980781842547974, + "loss": 0.0157, "step": 262130 }, { - "epoch": 1.32, - "learning_rate": 0.0001016204953307334, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.0001980742960384259, + "loss": 0.0153, "step": 262140 }, { - "epoch": 1.32, - "learning_rate": 0.0001016129276377194, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019807040782205448, + "loss": 0.0146, "step": 262150 }, { - "epoch": 1.32, - "learning_rate": 0.00010160535994470539, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.000198066519605683, + "loss": 0.0162, "step": 262160 }, { - "epoch": 1.32, - "learning_rate": 0.00010159779225169137, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019806263138931154, + "loss": 0.0156, "step": 262170 }, { - "epoch": 1.32, - "learning_rate": 0.00010159022455867737, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019805874317294005, + "loss": 0.0133, "step": 262180 }, { - "epoch": 1.32, - "learning_rate": 0.00010158265686566335, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019805485495656862, + "loss": 0.0137, "step": 262190 }, { - "epoch": 1.32, - "learning_rate": 0.00010157508917264934, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019805096674019716, + "loss": 0.0128, "step": 262200 }, { - "epoch": 1.32, - "learning_rate": 0.00010156752147963534, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019804707852382568, + "loss": 0.0128, "step": 262210 }, { - "epoch": 1.32, - "learning_rate": 0.00010155995378662132, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.0001980431903074542, + "loss": 0.018, "step": 262220 }, { - "epoch": 1.32, - "learning_rate": 0.00010155238609360731, - "loss": 0.0121, + "epoch": 0.68, + "learning_rate": 0.00019803930209108276, + "loss": 0.0172, "step": 262230 }, { - "epoch": 1.32, - "learning_rate": 0.00010154481840059331, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.0001980354138747113, + "loss": 0.0149, "step": 262240 }, { - "epoch": 1.32, - "learning_rate": 0.00010153725070757929, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019803152565833982, + "loss": 0.0134, "step": 262250 }, { - "epoch": 1.32, - "learning_rate": 0.00010152968301456529, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.00019802763744196836, + "loss": 0.0161, "step": 262260 }, { - "epoch": 1.32, - "learning_rate": 0.00010152211532155127, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019802374922559687, + "loss": 0.0144, "step": 262270 }, { - "epoch": 1.32, - "learning_rate": 0.00010151454762853726, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019801986100922544, + "loss": 0.0153, "step": 262280 }, { - "epoch": 1.32, - "learning_rate": 0.00010150697993552326, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019801597279285395, + "loss": 0.0155, "step": 262290 }, { - "epoch": 1.32, - "learning_rate": 0.00010149941224250924, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.0001980120845764825, + "loss": 0.0143, "step": 262300 }, { - "epoch": 1.32, - "learning_rate": 0.00010149184454949523, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.000198008196360111, + "loss": 0.0146, "step": 262310 }, { - "epoch": 1.32, - "learning_rate": 0.00010148427685648123, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019800430814373958, + "loss": 0.0192, "step": 262320 }, { - "epoch": 1.32, - "learning_rate": 0.00010147670916346721, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.0001980004199273681, + "loss": 0.0144, "step": 262330 }, { - "epoch": 1.32, - "learning_rate": 0.0001014691414704532, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019799653171099664, + "loss": 0.0127, "step": 262340 }, { - "epoch": 1.32, - "learning_rate": 0.00010146157377743919, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019799264349462515, + "loss": 0.0164, "step": 262350 }, { - "epoch": 1.32, - "learning_rate": 0.00010145400608442518, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019798875527825372, + "loss": 0.0146, "step": 262360 }, { - "epoch": 1.32, - "learning_rate": 0.00010144643839141118, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019798486706188223, + "loss": 0.0146, "step": 262370 }, { - "epoch": 1.32, - "learning_rate": 0.00010143887069839714, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.00019798097884551078, + "loss": 0.0108, "step": 262380 }, { - "epoch": 1.32, - "learning_rate": 0.00010143130300538314, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.0001979770906291393, + "loss": 0.0159, "step": 262390 }, { - "epoch": 1.32, - "learning_rate": 0.00010142373531236912, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019797320241276786, + "loss": 0.0134, "step": 262400 }, { - "epoch": 1.32, - "learning_rate": 0.00010141616761935512, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.0001979693141963964, + "loss": 0.0145, "step": 262410 }, { - "epoch": 1.32, - "learning_rate": 0.00010140859992634111, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019796542598002491, + "loss": 0.0153, "step": 262420 }, { - "epoch": 1.32, - "learning_rate": 0.00010140103223332709, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019796153776365346, + "loss": 0.0156, "step": 262430 }, { - "epoch": 1.32, - "learning_rate": 0.00010139346454031309, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.000197957649547282, + "loss": 0.0174, "step": 262440 }, { - "epoch": 1.32, - "learning_rate": 0.00010138589684729908, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019795376133091054, + "loss": 0.0155, "step": 262450 }, { - "epoch": 1.32, - "learning_rate": 0.00010137832915428506, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019794987311453905, + "loss": 0.0145, "step": 262460 }, { - "epoch": 1.32, - "learning_rate": 0.00010137076146127106, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001979459848981676, + "loss": 0.0172, "step": 262470 }, { - "epoch": 1.32, - "learning_rate": 0.00010136319376825704, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019794209668179614, + "loss": 0.0181, "step": 262480 }, { - "epoch": 1.32, - "learning_rate": 0.00010135562607524303, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019793820846542468, + "loss": 0.0144, "step": 262490 }, { - "epoch": 1.32, - "learning_rate": 0.00010134805838222903, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.0001979343202490532, + "loss": 0.0166, "step": 262500 }, { - "epoch": 1.32, - "learning_rate": 0.00010134049068921501, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.00019793043203268174, + "loss": 0.0153, "step": 262510 }, { - "epoch": 1.32, - "learning_rate": 0.000101332922996201, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019792654381631025, + "loss": 0.0132, "step": 262520 }, { - "epoch": 1.32, - "learning_rate": 0.000101325355303187, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019792265559993882, + "loss": 0.0119, "step": 262530 }, { - "epoch": 1.32, - "learning_rate": 0.00010131778761017298, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019791876738356733, + "loss": 0.018, "step": 262540 }, { - "epoch": 1.32, - "learning_rate": 0.00010131021991715898, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019791487916719587, + "loss": 0.0106, "step": 262550 }, { - "epoch": 1.32, - "learning_rate": 0.00010130265222414496, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.0001979109909508244, + "loss": 0.013, "step": 262560 }, { - "epoch": 1.32, - "learning_rate": 0.00010129508453113095, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019790710273445296, + "loss": 0.0153, "step": 262570 }, { - "epoch": 1.32, - "learning_rate": 0.00010128751683811695, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.0001979032145180815, + "loss": 0.0171, "step": 262580 }, { - "epoch": 1.32, - "learning_rate": 0.00010127994914510293, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.00019789932630171001, + "loss": 0.0197, "step": 262590 }, { - "epoch": 1.32, - "learning_rate": 0.00010127238145208893, - "loss": 0.0101, + "epoch": 0.68, + "learning_rate": 0.00019789543808533856, + "loss": 0.0112, "step": 262600 }, { - "epoch": 1.32, - "learning_rate": 0.00010126481375907492, - "loss": 0.0104, + "epoch": 0.68, + "learning_rate": 0.0001978915498689671, + "loss": 0.0158, "step": 262610 }, { - "epoch": 1.32, - "learning_rate": 0.0001012572460660609, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019788766165259564, + "loss": 0.0159, "step": 262620 }, { - "epoch": 1.32, - "learning_rate": 0.0001012496783730469, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019788377343622415, + "loss": 0.015, "step": 262630 }, { - "epoch": 1.33, - "learning_rate": 0.00010124211068003288, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.0001978798852198527, + "loss": 0.0154, "step": 262640 }, { - "epoch": 1.33, - "learning_rate": 0.00010123454298701887, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019787599700348124, + "loss": 0.0154, "step": 262650 }, { - "epoch": 1.33, - "learning_rate": 0.00010122697529400487, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019787210878710978, + "loss": 0.0174, "step": 262660 }, { - "epoch": 1.33, - "learning_rate": 0.00010121940760099085, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.0001978682205707383, + "loss": 0.0165, "step": 262670 }, { - "epoch": 1.33, - "learning_rate": 0.00010121183990797684, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019786433235436683, + "loss": 0.0127, "step": 262680 }, { - "epoch": 1.33, - "learning_rate": 0.00010120427221496284, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019786044413799538, + "loss": 0.0143, "step": 262690 }, { - "epoch": 1.33, - "learning_rate": 0.00010119670452194882, - "loss": 0.01, + "epoch": 0.68, + "learning_rate": 0.00019785655592162392, + "loss": 0.0133, "step": 262700 }, { - "epoch": 1.33, - "learning_rate": 0.00010118913682893482, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.00019785266770525243, + "loss": 0.0138, "step": 262710 }, { - "epoch": 1.33, - "learning_rate": 0.0001011815691359208, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019784877948888097, + "loss": 0.0165, "step": 262720 }, { - "epoch": 1.33, - "learning_rate": 0.00010117400144290679, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019784489127250954, + "loss": 0.0181, "step": 262730 }, { - "epoch": 1.33, - "learning_rate": 0.00010116643374989279, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019784100305613806, + "loss": 0.0156, "step": 262740 }, { - "epoch": 1.33, - "learning_rate": 0.00010115886605687877, - "loss": 0.0103, + "epoch": 0.68, + "learning_rate": 0.0001978371148397666, + "loss": 0.0128, "step": 262750 }, { - "epoch": 1.33, - "learning_rate": 0.00010115129836386476, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019783322662339511, + "loss": 0.0171, "step": 262760 }, { - "epoch": 1.33, - "learning_rate": 0.00010114373067085076, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019782933840702363, + "loss": 0.0158, "step": 262770 }, { - "epoch": 1.33, - "learning_rate": 0.00010113616297783674, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.0001978254501906522, + "loss": 0.0179, "step": 262780 }, { - "epoch": 1.33, - "learning_rate": 0.00010112859528482274, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019782156197428074, + "loss": 0.0154, "step": 262790 }, { - "epoch": 1.33, - "learning_rate": 0.00010112102759180872, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019781767375790925, + "loss": 0.0136, "step": 262800 }, { - "epoch": 1.33, - "learning_rate": 0.00010111345989879471, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.0001978137855415378, + "loss": 0.019, "step": 262810 }, { - "epoch": 1.33, - "learning_rate": 0.00010110589220578071, - "loss": 0.0057, + "epoch": 0.68, + "learning_rate": 0.00019780989732516634, + "loss": 0.0216, "step": 262820 }, { - "epoch": 1.33, - "learning_rate": 0.00010109832451276669, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019780600910879488, + "loss": 0.0133, "step": 262830 }, { - "epoch": 1.33, - "learning_rate": 0.00010109075681975268, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.0001978021208924234, + "loss": 0.0178, "step": 262840 }, { - "epoch": 1.33, - "learning_rate": 0.00010108318912673868, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019779823267605193, + "loss": 0.0139, "step": 262850 }, { - "epoch": 1.33, - "learning_rate": 0.00010107562143372466, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019779434445968048, + "loss": 0.0163, "step": 262860 }, { - "epoch": 1.33, - "learning_rate": 0.00010106805374071065, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019779045624330902, + "loss": 0.0137, "step": 262870 }, { - "epoch": 1.33, - "learning_rate": 0.00010106048604769664, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019778656802693753, + "loss": 0.015, "step": 262880 }, { - "epoch": 1.33, - "learning_rate": 0.00010105291835468263, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019778267981056607, + "loss": 0.0169, "step": 262890 }, { - "epoch": 1.33, - "learning_rate": 0.00010104535066166863, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019777879159419464, + "loss": 0.0215, "step": 262900 }, { - "epoch": 1.33, - "learning_rate": 0.00010103778296865461, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019777490337782316, + "loss": 0.0157, "step": 262910 }, { - "epoch": 1.33, - "learning_rate": 0.0001010302152756406, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019777101516145167, + "loss": 0.0177, "step": 262920 }, { - "epoch": 1.33, - "learning_rate": 0.0001010226475826266, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.0001977671269450802, + "loss": 0.0105, "step": 262930 }, { - "epoch": 1.33, - "learning_rate": 0.00010101507988961258, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019776323872870878, + "loss": 0.0122, "step": 262940 }, { - "epoch": 1.33, - "learning_rate": 0.00010100751219659857, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.0001977593505123373, + "loss": 0.0144, "step": 262950 }, { - "epoch": 1.33, - "learning_rate": 0.00010099994450358456, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.00019775546229596584, + "loss": 0.015, "step": 262960 }, { - "epoch": 1.33, - "learning_rate": 0.00010099237681057055, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019775157407959435, + "loss": 0.0197, "step": 262970 }, { - "epoch": 1.33, - "learning_rate": 0.00010098480911755655, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019774768586322292, + "loss": 0.0135, "step": 262980 }, { - "epoch": 1.33, - "learning_rate": 0.00010097724142454253, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019774379764685144, + "loss": 0.0167, "step": 262990 }, { - "epoch": 1.33, - "learning_rate": 0.00010096967373152852, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019773990943047998, + "loss": 0.0161, "step": 263000 }, { - "epoch": 1.33, - "eval_cer": 0.9144459960000272, - "eval_loss": 0.005995141342282295, - "eval_runtime": 116.2956, - "eval_samples_per_second": 17.198, - "eval_steps_per_second": 4.299, + "epoch": 0.68, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.010503942146897316, + "eval_runtime": 107.871, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, "step": 263000 }, { - "epoch": 1.33, - "learning_rate": 0.00010096210603851449, - "loss": 0.0107, + "epoch": 0.68, + "learning_rate": 0.0001977360212141085, + "loss": 0.0146, "step": 263010 }, { - "epoch": 1.33, - "learning_rate": 0.00010095453834550048, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019773213299773703, + "loss": 0.0173, "step": 263020 }, { - "epoch": 1.33, - "learning_rate": 0.00010094697065248648, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019772824478136558, + "loss": 0.0168, "step": 263030 }, { - "epoch": 1.33, - "learning_rate": 0.00010093940295947246, - "loss": 0.0063, + "epoch": 0.68, + "learning_rate": 0.00019772435656499412, + "loss": 0.0169, "step": 263040 }, { - "epoch": 1.33, - "learning_rate": 0.00010093183526645846, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019772046834862263, + "loss": 0.0164, "step": 263050 }, { - "epoch": 1.33, - "learning_rate": 0.00010092426757344445, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019771658013225117, + "loss": 0.0177, "step": 263060 }, { - "epoch": 1.33, - "learning_rate": 0.00010091669988043043, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019771269191587974, + "loss": 0.0146, "step": 263070 }, { - "epoch": 1.33, - "learning_rate": 0.00010090913218741643, - "loss": 0.0068, + "epoch": 0.68, + "learning_rate": 0.00019770880369950826, + "loss": 0.0218, "step": 263080 }, { - "epoch": 1.33, - "learning_rate": 0.00010090156449440241, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.00019770491548313677, + "loss": 0.0142, "step": 263090 }, { - "epoch": 1.33, - "learning_rate": 0.0001008939968013884, - "loss": 0.0061, + "epoch": 0.68, + "learning_rate": 0.0001977010272667653, + "loss": 0.015, "step": 263100 }, { - "epoch": 1.33, - "learning_rate": 0.0001008864291083744, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019769713905039388, + "loss": 0.0125, "step": 263110 }, { - "epoch": 1.33, - "learning_rate": 0.00010087886141536038, - "loss": 0.0059, + "epoch": 0.68, + "learning_rate": 0.0001976932508340224, + "loss": 0.02, "step": 263120 }, { - "epoch": 1.33, - "learning_rate": 0.00010087129372234638, - "loss": 0.0111, + "epoch": 0.68, + "learning_rate": 0.00019768936261765094, + "loss": 0.0167, "step": 263130 }, { - "epoch": 1.33, - "learning_rate": 0.00010086372602933237, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019768547440127945, + "loss": 0.0172, "step": 263140 }, { - "epoch": 1.33, - "learning_rate": 0.00010085615833631835, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019768158618490802, + "loss": 0.0145, "step": 263150 }, { - "epoch": 1.33, - "learning_rate": 0.00010084859064330435, - "loss": 0.0064, + "epoch": 0.68, + "learning_rate": 0.00019767769796853654, + "loss": 0.0158, "step": 263160 }, { - "epoch": 1.33, - "learning_rate": 0.00010084102295029033, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019767380975216508, + "loss": 0.0152, "step": 263170 }, { - "epoch": 1.33, - "learning_rate": 0.00010083345525727632, - "loss": 0.0066, + "epoch": 0.68, + "learning_rate": 0.0001976699215357936, + "loss": 0.019, "step": 263180 }, { - "epoch": 1.33, - "learning_rate": 0.00010082588756426232, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019766603331942216, + "loss": 0.0214, "step": 263190 }, { - "epoch": 1.33, - "learning_rate": 0.0001008183198712483, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.00019766214510305067, + "loss": 0.0148, "step": 263200 }, { - "epoch": 1.33, - "learning_rate": 0.0001008107521782343, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019765825688667922, + "loss": 0.0145, "step": 263210 }, { - "epoch": 1.33, - "learning_rate": 0.00010080318448522029, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019765436867030773, + "loss": 0.0127, "step": 263220 }, { - "epoch": 1.33, - "learning_rate": 0.00010079561679220627, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.0001976504804539363, + "loss": 0.016, "step": 263230 }, { - "epoch": 1.33, - "learning_rate": 0.00010078804909919227, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019764659223756481, + "loss": 0.0179, "step": 263240 }, { - "epoch": 1.33, - "learning_rate": 0.00010078048140617825, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019764270402119336, + "loss": 0.0144, "step": 263250 }, { - "epoch": 1.33, - "learning_rate": 0.00010077291371316424, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.00019763881580482187, + "loss": 0.015, "step": 263260 }, { - "epoch": 1.33, - "learning_rate": 0.00010076534602015024, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.0001976349275884504, + "loss": 0.0177, "step": 263270 }, { - "epoch": 1.33, - "learning_rate": 0.00010075777832713622, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.00019763103937207898, + "loss": 0.0141, "step": 263280 }, { - "epoch": 1.33, - "learning_rate": 0.00010075021063412221, - "loss": 0.0121, + "epoch": 0.68, + "learning_rate": 0.0001976271511557075, + "loss": 0.0155, "step": 263290 }, { - "epoch": 1.33, - "learning_rate": 0.00010074264294110821, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019762326293933604, + "loss": 0.0142, "step": 263300 }, { - "epoch": 1.33, - "learning_rate": 0.00010073507524809419, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019761937472296455, + "loss": 0.011, "step": 263310 }, { - "epoch": 1.33, - "learning_rate": 0.00010072750755508019, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.00019761548650659312, + "loss": 0.0158, "step": 263320 }, { - "epoch": 1.33, - "learning_rate": 0.00010071993986206617, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019761159829022163, + "loss": 0.0144, "step": 263330 }, { - "epoch": 1.33, - "learning_rate": 0.00010071237216905216, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019760771007385018, + "loss": 0.0158, "step": 263340 }, { - "epoch": 1.33, - "learning_rate": 0.00010070480447603816, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.0001976038218574787, + "loss": 0.0144, "step": 263350 }, { - "epoch": 1.33, - "learning_rate": 0.00010069723678302414, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019759993364110726, + "loss": 0.0166, "step": 263360 }, { - "epoch": 1.33, - "learning_rate": 0.00010068966909001013, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019759604542473577, + "loss": 0.0167, "step": 263370 }, { - "epoch": 1.33, - "learning_rate": 0.00010068210139699613, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019759215720836432, + "loss": 0.0137, "step": 263380 }, { - "epoch": 1.33, - "learning_rate": 0.00010067453370398211, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019758826899199283, + "loss": 0.0139, "step": 263390 }, { - "epoch": 1.33, - "learning_rate": 0.0001006669660109681, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.0001975843807756214, + "loss": 0.0141, "step": 263400 }, { - "epoch": 1.33, - "learning_rate": 0.00010065939831795409, - "loss": 0.0103, + "epoch": 0.68, + "learning_rate": 0.0001975804925592499, + "loss": 0.0129, "step": 263410 }, { - "epoch": 1.33, - "learning_rate": 0.00010065183062494008, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019757660434287846, + "loss": 0.0136, "step": 263420 }, { - "epoch": 1.33, - "learning_rate": 0.00010064426293192608, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019757271612650697, + "loss": 0.0167, "step": 263430 }, { - "epoch": 1.33, - "learning_rate": 0.00010063669523891206, - "loss": 0.0127, + "epoch": 0.68, + "learning_rate": 0.00019756882791013554, + "loss": 0.0142, "step": 263440 }, { - "epoch": 1.33, - "learning_rate": 0.00010062912754589805, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019756493969376408, + "loss": 0.0125, "step": 263450 }, { - "epoch": 1.33, - "learning_rate": 0.00010062155985288405, - "loss": 0.0086, + "epoch": 0.68, + "learning_rate": 0.0001975610514773926, + "loss": 0.0146, "step": 263460 }, { - "epoch": 1.33, - "learning_rate": 0.00010061399215987003, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019755716326102114, + "loss": 0.0145, "step": 263470 }, { - "epoch": 1.33, - "learning_rate": 0.00010060642446685602, - "loss": 0.0115, + "epoch": 0.68, + "learning_rate": 0.00019755327504464968, + "loss": 0.0139, "step": 263480 }, { - "epoch": 1.33, - "learning_rate": 0.00010059885677384202, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019754938682827822, + "loss": 0.0173, "step": 263490 }, { - "epoch": 1.33, - "learning_rate": 0.000100591289080828, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019754549861190673, + "loss": 0.017, "step": 263500 }, { - "epoch": 1.33, - "learning_rate": 0.000100583721387814, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019754161039553528, + "loss": 0.0156, "step": 263510 }, { - "epoch": 1.33, - "learning_rate": 0.00010057615369479998, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.0001975377221791638, + "loss": 0.0133, "step": 263520 }, { - "epoch": 1.33, - "learning_rate": 0.00010056858600178597, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019753383396279236, + "loss": 0.0178, "step": 263530 }, { - "epoch": 1.33, - "learning_rate": 0.00010056101830877197, - "loss": 0.011, + "epoch": 0.68, + "learning_rate": 0.00019752994574642087, + "loss": 0.0146, "step": 263540 }, { - "epoch": 1.33, - "learning_rate": 0.00010055345061575795, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019752605753004942, + "loss": 0.0133, "step": 263550 }, { - "epoch": 1.33, - "learning_rate": 0.00010054588292274394, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019752216931367793, + "loss": 0.0155, "step": 263560 }, { - "epoch": 1.33, - "learning_rate": 0.00010053831522972994, - "loss": 0.0069, + "epoch": 0.68, + "learning_rate": 0.0001975182810973065, + "loss": 0.017, "step": 263570 }, { - "epoch": 1.33, - "learning_rate": 0.00010053074753671592, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.000197514392880935, + "loss": 0.0139, "step": 263580 }, { - "epoch": 1.33, - "learning_rate": 0.00010052317984370191, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019751050466456355, + "loss": 0.0133, "step": 263590 }, { - "epoch": 1.33, - "learning_rate": 0.0001005156121506879, - "loss": 0.007, + "epoch": 0.68, + "learning_rate": 0.00019750661644819207, + "loss": 0.0121, "step": 263600 }, { - "epoch": 1.33, - "learning_rate": 0.00010050804445767389, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019750272823182064, + "loss": 0.0141, "step": 263610 }, { - "epoch": 1.33, - "learning_rate": 0.00010050047676465989, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019749884001544918, + "loss": 0.0144, "step": 263620 }, { - "epoch": 1.33, - "learning_rate": 0.00010049290907164587, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.0001974949517990777, + "loss": 0.0173, "step": 263630 }, { - "epoch": 1.33, - "learning_rate": 0.00010048534137863185, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.0001974910635827062, + "loss": 0.0143, "step": 263640 }, { - "epoch": 1.33, - "learning_rate": 0.00010047777368561783, - "loss": 0.0085, + "epoch": 0.68, + "learning_rate": 0.00019748717536633478, + "loss": 0.016, "step": 263650 }, { - "epoch": 1.33, - "learning_rate": 0.00010047020599260383, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019748328714996332, + "loss": 0.0154, "step": 263660 }, { - "epoch": 1.33, - "learning_rate": 0.00010046263829958982, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019747939893359183, + "loss": 0.0131, "step": 263670 }, { - "epoch": 1.33, - "learning_rate": 0.0001004550706065758, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019747551071722038, + "loss": 0.0143, "step": 263680 }, { - "epoch": 1.33, - "learning_rate": 0.0001004475029135618, - "loss": 0.0078, + "epoch": 0.68, + "learning_rate": 0.00019747162250084892, + "loss": 0.0154, "step": 263690 }, { - "epoch": 1.33, - "learning_rate": 0.00010043993522054778, - "loss": 0.0103, + "epoch": 0.68, + "learning_rate": 0.00019746773428447746, + "loss": 0.0149, "step": 263700 }, { - "epoch": 1.33, - "learning_rate": 0.00010043236752753377, - "loss": 0.0103, + "epoch": 0.68, + "learning_rate": 0.00019746384606810597, + "loss": 0.0119, "step": 263710 }, { - "epoch": 1.33, - "learning_rate": 0.00010042479983451977, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.00019745995785173451, + "loss": 0.0142, "step": 263720 }, { - "epoch": 1.33, - "learning_rate": 0.00010041723214150575, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019745606963536306, + "loss": 0.0142, "step": 263730 }, { - "epoch": 1.33, - "learning_rate": 0.00010040966444849174, - "loss": 0.0122, + "epoch": 0.68, + "learning_rate": 0.0001974521814189916, + "loss": 0.0133, "step": 263740 }, { - "epoch": 1.33, - "learning_rate": 0.00010040209675547774, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.0001974482932026201, + "loss": 0.016, "step": 263750 }, { - "epoch": 1.33, - "learning_rate": 0.00010039452906246372, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019744440498624865, + "loss": 0.0167, "step": 263760 }, { - "epoch": 1.33, - "learning_rate": 0.00010038696136944972, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.00019744051676987717, + "loss": 0.0175, "step": 263770 }, { - "epoch": 1.33, - "learning_rate": 0.0001003793936764357, - "loss": 0.0117, + "epoch": 0.68, + "learning_rate": 0.00019743662855350574, + "loss": 0.0147, "step": 263780 }, { - "epoch": 1.33, - "learning_rate": 0.00010037182598342169, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019743274033713428, + "loss": 0.0144, "step": 263790 }, { - "epoch": 1.33, - "learning_rate": 0.00010036425829040769, - "loss": 0.0079, + "epoch": 0.68, + "learning_rate": 0.0001974288521207628, + "loss": 0.0133, "step": 263800 }, { - "epoch": 1.33, - "learning_rate": 0.00010035669059739367, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.0001974249639043913, + "loss": 0.0149, "step": 263810 }, { - "epoch": 1.33, - "learning_rate": 0.00010034912290437966, - "loss": 0.0076, + "epoch": 0.68, + "learning_rate": 0.00019742107568801988, + "loss": 0.013, "step": 263820 }, { - "epoch": 1.33, - "learning_rate": 0.00010034155521136566, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019741718747164842, + "loss": 0.0147, "step": 263830 }, { - "epoch": 1.33, - "learning_rate": 0.00010033398751835164, - "loss": 0.0089, + "epoch": 0.68, + "learning_rate": 0.00019741329925527693, + "loss": 0.0128, "step": 263840 }, { - "epoch": 1.33, - "learning_rate": 0.00010032641982533764, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019740941103890547, + "loss": 0.0168, "step": 263850 }, { - "epoch": 1.33, - "learning_rate": 0.00010031885213232362, - "loss": 0.0075, + "epoch": 0.68, + "learning_rate": 0.00019740552282253402, + "loss": 0.0183, "step": 263860 }, { - "epoch": 1.33, - "learning_rate": 0.00010031128443930961, - "loss": 0.0099, + "epoch": 0.68, + "learning_rate": 0.00019740163460616256, + "loss": 0.0152, "step": 263870 }, { - "epoch": 1.33, - "learning_rate": 0.00010030371674629561, - "loss": 0.0102, + "epoch": 0.68, + "learning_rate": 0.00019739774638979107, + "loss": 0.0146, "step": 263880 }, { - "epoch": 1.33, - "learning_rate": 0.00010029614905328159, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019739385817341961, + "loss": 0.0217, "step": 263890 }, { - "epoch": 1.33, - "learning_rate": 0.00010028858136026758, - "loss": 0.0074, + "epoch": 0.68, + "learning_rate": 0.00019738996995704816, + "loss": 0.0118, "step": 263900 }, { - "epoch": 1.33, - "learning_rate": 0.00010028101366725358, - "loss": 0.0062, + "epoch": 0.68, + "learning_rate": 0.0001973860817406767, + "loss": 0.0133, "step": 263910 }, { - "epoch": 1.33, - "learning_rate": 0.00010027344597423956, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.0001973821935243052, + "loss": 0.0122, "step": 263920 }, { - "epoch": 1.33, - "learning_rate": 0.00010026587828122556, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019737830530793375, + "loss": 0.0169, "step": 263930 }, { - "epoch": 1.33, - "learning_rate": 0.00010025831058821155, - "loss": 0.0059, + "epoch": 0.68, + "learning_rate": 0.00019737441709156232, + "loss": 0.0162, "step": 263940 }, { - "epoch": 1.33, - "learning_rate": 0.00010025074289519753, - "loss": 0.01, + "epoch": 0.68, + "learning_rate": 0.00019737052887519084, + "loss": 0.0188, "step": 263950 }, { - "epoch": 1.33, - "learning_rate": 0.00010024317520218353, - "loss": 0.0073, + "epoch": 0.68, + "learning_rate": 0.00019736664065881935, + "loss": 0.0159, "step": 263960 }, { - "epoch": 1.33, - "learning_rate": 0.00010023560750916951, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.0001973627524424479, + "loss": 0.0135, "step": 263970 }, { - "epoch": 1.33, - "learning_rate": 0.0001002280398161555, - "loss": 0.0095, + "epoch": 0.68, + "learning_rate": 0.00019735886422607646, + "loss": 0.0151, "step": 263980 }, { - "epoch": 1.33, - "learning_rate": 0.0001002204721231415, - "loss": 0.0097, + "epoch": 0.68, + "learning_rate": 0.00019735497600970498, + "loss": 0.0144, "step": 263990 }, { - "epoch": 1.33, - "learning_rate": 0.00010021290443012748, - "loss": 0.0096, + "epoch": 0.68, + "learning_rate": 0.00019735108779333352, + "loss": 0.0157, "step": 264000 }, { - "epoch": 1.33, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.006162929814308882, - "eval_runtime": 116.2184, - "eval_samples_per_second": 17.209, - "eval_steps_per_second": 4.302, + "epoch": 0.68, + "eval_cer": 0.881821655462573, + "eval_loss": 0.010292991995811462, + "eval_runtime": 107.7325, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 264000 }, { - "epoch": 1.33, - "learning_rate": 0.00010020533673711347, - "loss": 0.0106, + "epoch": 0.68, + "learning_rate": 0.00019734719957696203, + "loss": 0.0155, "step": 264010 }, { - "epoch": 1.33, - "learning_rate": 0.00010019776904409947, - "loss": 0.0084, + "epoch": 0.68, + "learning_rate": 0.00019734331136059057, + "loss": 0.0099, "step": 264020 }, { - "epoch": 1.33, - "learning_rate": 0.00010019020135108545, - "loss": 0.0065, + "epoch": 0.68, + "learning_rate": 0.00019733942314421912, + "loss": 0.0145, "step": 264030 }, { - "epoch": 1.33, - "learning_rate": 0.00010018263365807145, - "loss": 0.0059, + "epoch": 0.68, + "learning_rate": 0.00019733553492784766, + "loss": 0.0139, "step": 264040 }, { - "epoch": 1.33, - "learning_rate": 0.00010017506596505743, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019733164671147617, + "loss": 0.0116, "step": 264050 }, { - "epoch": 1.33, - "learning_rate": 0.00010016749827204342, - "loss": 0.0093, + "epoch": 0.68, + "learning_rate": 0.0001973277584951047, + "loss": 0.017, "step": 264060 }, { - "epoch": 1.33, - "learning_rate": 0.00010015993057902942, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019732387027873325, + "loss": 0.0142, "step": 264070 }, { - "epoch": 1.33, - "learning_rate": 0.0001001523628860154, - "loss": 0.0083, + "epoch": 0.68, + "learning_rate": 0.0001973199820623618, + "loss": 0.0161, "step": 264080 }, { - "epoch": 1.33, - "learning_rate": 0.0001001447951930014, - "loss": 0.0107, + "epoch": 0.68, + "learning_rate": 0.0001973160938459903, + "loss": 0.0163, "step": 264090 }, { - "epoch": 1.33, - "learning_rate": 0.00010013722749998739, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019731220562961885, + "loss": 0.0137, "step": 264100 }, { - "epoch": 1.33, - "learning_rate": 0.00010012965980697337, - "loss": 0.0105, + "epoch": 0.68, + "learning_rate": 0.0001973083174132474, + "loss": 0.0095, "step": 264110 }, { - "epoch": 1.33, - "learning_rate": 0.00010012209211395937, - "loss": 0.0081, + "epoch": 0.68, + "learning_rate": 0.00019730442919687594, + "loss": 0.0168, "step": 264120 }, { - "epoch": 1.33, - "learning_rate": 0.00010011452442094535, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019730054098050445, + "loss": 0.0172, "step": 264130 }, { - "epoch": 1.33, - "learning_rate": 0.00010010695672793134, - "loss": 0.0072, + "epoch": 0.68, + "learning_rate": 0.000197296652764133, + "loss": 0.0119, "step": 264140 }, { - "epoch": 1.33, - "learning_rate": 0.00010009938903491734, - "loss": 0.0092, + "epoch": 0.68, + "learning_rate": 0.00019729276454776156, + "loss": 0.0152, "step": 264150 }, { - "epoch": 1.33, - "learning_rate": 0.00010009182134190332, - "loss": 0.0082, + "epoch": 0.68, + "learning_rate": 0.00019728887633139008, + "loss": 0.0192, "step": 264160 }, { - "epoch": 1.33, - "learning_rate": 0.00010008425364888931, - "loss": 0.0091, + "epoch": 0.68, + "learning_rate": 0.00019728498811501862, + "loss": 0.0152, "step": 264170 }, { - "epoch": 1.33, - "learning_rate": 0.00010007668595587531, - "loss": 0.0088, + "epoch": 0.68, + "learning_rate": 0.00019728109989864713, + "loss": 0.0145, "step": 264180 }, { - "epoch": 1.33, - "learning_rate": 0.00010006911826286129, - "loss": 0.0094, + "epoch": 0.68, + "learning_rate": 0.0001972772116822757, + "loss": 0.0174, "step": 264190 }, { - "epoch": 1.33, - "learning_rate": 0.00010006155056984728, - "loss": 0.0067, + "epoch": 0.68, + "learning_rate": 0.00019727332346590421, + "loss": 0.0149, "step": 264200 }, { - "epoch": 1.33, - "learning_rate": 0.00010005398287683327, - "loss": 0.0077, + "epoch": 0.68, + "learning_rate": 0.00019726943524953276, + "loss": 0.0172, "step": 264210 }, { - "epoch": 1.33, - "learning_rate": 0.00010004641518381926, - "loss": 0.0087, + "epoch": 0.68, + "learning_rate": 0.00019726554703316127, + "loss": 0.0145, "step": 264220 }, { - "epoch": 1.33, - "learning_rate": 0.00010003884749080526, - "loss": 0.009, + "epoch": 0.68, + "learning_rate": 0.00019726165881678984, + "loss": 0.019, "step": 264230 }, { - "epoch": 1.33, - "learning_rate": 0.00010003127979779124, - "loss": 0.011, + "epoch": 0.68, + "learning_rate": 0.00019725777060041835, + "loss": 0.0156, "step": 264240 }, { - "epoch": 1.33, - "learning_rate": 0.00010002371210477723, - "loss": 0.008, + "epoch": 0.68, + "learning_rate": 0.0001972538823840469, + "loss": 0.0138, "step": 264250 }, { - "epoch": 1.33, - "learning_rate": 0.00010001614441176323, - "loss": 0.0059, + "epoch": 0.68, + "learning_rate": 0.0001972499941676754, + "loss": 0.0159, "step": 264260 }, { - "epoch": 1.33, - "learning_rate": 0.0001000085767187492, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019724610595130395, + "loss": 0.0132, "step": 264270 }, { - "epoch": 1.33, - "learning_rate": 0.00010000100902573519, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.0001972422177349325, + "loss": 0.0172, "step": 264280 }, { - "epoch": 1.33, - "learning_rate": 9.999344133272117e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019723832951856104, + "loss": 0.017, "step": 264290 }, { - "epoch": 1.33, - "learning_rate": 9.998587363970717e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019723444130218955, + "loss": 0.0172, "step": 264300 }, { - "epoch": 1.33, - "learning_rate": 9.997830594669315e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.0001972305530858181, + "loss": 0.0146, "step": 264310 }, { - "epoch": 1.33, - "learning_rate": 9.997073825367914e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019722666486944666, + "loss": 0.0183, "step": 264320 }, { - "epoch": 1.33, - "learning_rate": 9.996317056066514e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019722277665307517, + "loss": 0.0142, "step": 264330 }, { - "epoch": 1.33, - "learning_rate": 9.995560286765112e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019721888843670372, + "loss": 0.0154, "step": 264340 }, { - "epoch": 1.33, - "learning_rate": 9.994803517463711e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019721500022033223, + "loss": 0.0136, "step": 264350 }, { - "epoch": 1.33, - "learning_rate": 9.994046748162311e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.0001972111120039608, + "loss": 0.02, "step": 264360 }, { - "epoch": 1.33, - "learning_rate": 9.993289978860909e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019720722378758931, + "loss": 0.0153, "step": 264370 }, { - "epoch": 1.33, - "learning_rate": 9.992533209559509e-05, - "loss": 0.0073, - "step": 264380 + "epoch": 0.69, + "learning_rate": 0.00019720333557121786, + "loss": 0.0166, + "step": 264380 }, { - "epoch": 1.33, - "learning_rate": 9.991776440258108e-05, - "loss": 0.0131, + "epoch": 0.69, + "learning_rate": 0.00019719944735484637, + "loss": 0.0155, "step": 264390 }, { - "epoch": 1.33, - "learning_rate": 9.991019670956706e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019719555913847494, + "loss": 0.0153, "step": 264400 }, { - "epoch": 1.33, - "learning_rate": 9.990262901655306e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019719167092210345, + "loss": 0.0129, "step": 264410 }, { - "epoch": 1.33, - "learning_rate": 9.989506132353904e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.000197187782705732, + "loss": 0.0157, "step": 264420 }, { - "epoch": 1.33, - "learning_rate": 9.988749363052503e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001971838944893605, + "loss": 0.0121, "step": 264430 }, { - "epoch": 1.33, - "learning_rate": 9.987992593751103e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019718000627298908, + "loss": 0.0205, "step": 264440 }, { - "epoch": 1.33, - "learning_rate": 9.987235824449701e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001971761180566176, + "loss": 0.0189, "step": 264450 }, { - "epoch": 1.33, - "learning_rate": 9.9864790551483e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019717222984024613, + "loss": 0.0114, "step": 264460 }, { - "epoch": 1.33, - "learning_rate": 9.9857222858469e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019716834162387465, + "loss": 0.0146, "step": 264470 }, { - "epoch": 1.33, - "learning_rate": 9.984965516545498e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019716445340750322, + "loss": 0.0124, "step": 264480 }, { - "epoch": 1.33, - "learning_rate": 9.984208747244098e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019716056519113176, + "loss": 0.0168, "step": 264490 }, { - "epoch": 1.33, - "learning_rate": 9.983451977942696e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019715667697476027, + "loss": 0.0164, "step": 264500 }, { - "epoch": 1.33, - "learning_rate": 9.982695208641295e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001971527887583888, + "loss": 0.0164, "step": 264510 }, { - "epoch": 1.33, - "learning_rate": 9.981938439339895e-05, - "loss": 0.0118, + "epoch": 0.69, + "learning_rate": 0.00019714890054201733, + "loss": 0.0152, "step": 264520 }, { - "epoch": 1.33, - "learning_rate": 9.981181670038493e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001971450123256459, + "loss": 0.0121, "step": 264530 }, { - "epoch": 1.33, - "learning_rate": 9.980424900737092e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019714112410927441, + "loss": 0.0159, "step": 264540 }, { - "epoch": 1.33, - "learning_rate": 9.979668131435692e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019713723589290296, + "loss": 0.0132, "step": 264550 }, { - "epoch": 1.33, - "learning_rate": 9.97891136213429e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019713334767653147, + "loss": 0.0154, "step": 264560 }, { - "epoch": 1.33, - "learning_rate": 9.97815459283289e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019712945946016004, + "loss": 0.014, "step": 264570 }, { - "epoch": 1.33, - "learning_rate": 9.977397823531488e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019712557124378855, + "loss": 0.0215, "step": 264580 }, { - "epoch": 1.33, - "learning_rate": 9.976641054230087e-05, - "loss": 0.0061, + "epoch": 0.69, + "learning_rate": 0.0001971216830274171, + "loss": 0.0162, "step": 264590 }, { - "epoch": 1.33, - "learning_rate": 9.975884284928687e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001971177948110456, + "loss": 0.0151, "step": 264600 }, { - "epoch": 1.33, - "learning_rate": 9.975127515627285e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019711390659467418, + "loss": 0.0153, "step": 264610 }, { - "epoch": 1.34, - "learning_rate": 9.974370746325884e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.0001971100183783027, + "loss": 0.0136, "step": 264620 }, { - "epoch": 1.34, - "learning_rate": 9.973613977024484e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019710613016193123, + "loss": 0.0141, "step": 264630 }, { - "epoch": 1.34, - "learning_rate": 9.972857207723082e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019710224194555975, + "loss": 0.019, "step": 264640 }, { - "epoch": 1.34, - "learning_rate": 9.972100438421682e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019709835372918832, + "loss": 0.0143, "step": 264650 }, { - "epoch": 1.34, - "learning_rate": 9.97134366912028e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.00019709446551281686, + "loss": 0.0121, "step": 264660 }, { - "epoch": 1.34, - "learning_rate": 9.970586899818879e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019709057729644537, + "loss": 0.0141, "step": 264670 }, { - "epoch": 1.34, - "learning_rate": 9.969830130517479e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001970866890800739, + "loss": 0.0291, "step": 264680 }, { - "epoch": 1.34, - "learning_rate": 9.969073361216077e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019708280086370246, + "loss": 0.0203, "step": 264690 }, { - "epoch": 1.34, - "learning_rate": 9.968316591914676e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.000197078912647331, + "loss": 0.0177, "step": 264700 }, { - "epoch": 1.34, - "learning_rate": 9.967559822613276e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.0001970750244309595, + "loss": 0.0127, "step": 264710 }, { - "epoch": 1.34, - "learning_rate": 9.966803053311874e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019707113621458805, + "loss": 0.0134, "step": 264720 }, { - "epoch": 1.34, - "learning_rate": 9.966046284010473e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019706724799821657, + "loss": 0.0128, "step": 264730 }, { - "epoch": 1.34, - "learning_rate": 9.965289514709072e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019706335978184514, + "loss": 0.0139, "step": 264740 }, { - "epoch": 1.34, - "learning_rate": 9.964532745407671e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019705947156547365, + "loss": 0.0137, "step": 264750 }, { - "epoch": 1.34, - "learning_rate": 9.96377597610627e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001970555833491022, + "loss": 0.0179, "step": 264760 }, { - "epoch": 1.34, - "learning_rate": 9.963019206804869e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001970516951327307, + "loss": 0.013, "step": 264770 }, { - "epoch": 1.34, - "learning_rate": 9.962262437503468e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019704780691635928, + "loss": 0.0128, "step": 264780 }, { - "epoch": 1.34, - "learning_rate": 9.961505668202068e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001970439186999878, + "loss": 0.013, "step": 264790 }, { - "epoch": 1.34, - "learning_rate": 9.960748898900666e-05, - "loss": 0.0112, + "epoch": 0.69, + "learning_rate": 0.00019704003048361633, + "loss": 0.0151, "step": 264800 }, { - "epoch": 1.34, - "learning_rate": 9.959992129599265e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019703614226724485, + "loss": 0.0141, "step": 264810 }, { - "epoch": 1.34, - "learning_rate": 9.959235360297864e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019703225405087342, + "loss": 0.0131, "step": 264820 }, { - "epoch": 1.34, - "learning_rate": 9.958478590996463e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019702836583450193, + "loss": 0.0133, "step": 264830 }, { - "epoch": 1.34, - "learning_rate": 9.957721821695063e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019702447761813047, + "loss": 0.0127, "step": 264840 }, { - "epoch": 1.34, - "learning_rate": 9.95696505239366e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.000197020589401759, + "loss": 0.0144, "step": 264850 }, { - "epoch": 1.34, - "learning_rate": 9.95620828309226e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019701670118538756, + "loss": 0.0139, "step": 264860 }, { - "epoch": 1.34, - "learning_rate": 9.95545151379086e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.0001970128129690161, + "loss": 0.0115, "step": 264870 }, { - "epoch": 1.34, - "learning_rate": 9.954694744489458e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.0001970089247526446, + "loss": 0.0123, "step": 264880 }, { - "epoch": 1.34, - "learning_rate": 9.953937975188056e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019700503653627315, + "loss": 0.014, "step": 264890 }, { - "epoch": 1.34, - "learning_rate": 9.953181205886654e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.0001970011483199017, + "loss": 0.0148, "step": 264900 }, { - "epoch": 1.34, - "learning_rate": 9.952424436585254e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019699726010353024, + "loss": 0.0246, "step": 264910 }, { - "epoch": 1.34, - "learning_rate": 9.951667667283853e-05, - "loss": 0.0067, + "epoch": 0.69, + "learning_rate": 0.00019699337188715875, + "loss": 0.0159, "step": 264920 }, { - "epoch": 1.34, - "learning_rate": 9.950910897982451e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001969894836707873, + "loss": 0.012, "step": 264930 }, { - "epoch": 1.34, - "learning_rate": 9.950154128681051e-05, - "loss": 0.0112, + "epoch": 0.69, + "learning_rate": 0.00019698559545441584, + "loss": 0.0156, "step": 264940 }, { - "epoch": 1.34, - "learning_rate": 9.949397359379649e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019698170723804438, + "loss": 0.0166, "step": 264950 }, { - "epoch": 1.34, - "learning_rate": 9.948640590078248e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001969778190216729, + "loss": 0.0148, "step": 264960 }, { - "epoch": 1.34, - "learning_rate": 9.947883820776848e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019697393080530143, + "loss": 0.0157, "step": 264970 }, { - "epoch": 1.34, - "learning_rate": 9.947127051475446e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019697004258892995, + "loss": 0.0221, "step": 264980 }, { - "epoch": 1.34, - "learning_rate": 9.946370282174046e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019696615437255852, + "loss": 0.0145, "step": 264990 }, { - "epoch": 1.34, - "learning_rate": 9.945613512872645e-05, - "loss": 0.0052, + "epoch": 0.69, + "learning_rate": 0.00019696226615618703, + "loss": 0.0125, "step": 265000 }, { - "epoch": 1.34, - "eval_cer": 0.9144372624348985, - "eval_loss": 0.006056656129658222, - "eval_runtime": 116.3287, - "eval_samples_per_second": 17.193, - "eval_steps_per_second": 4.298, + "epoch": 0.69, + "eval_cer": 0.8817404765203906, + "eval_loss": 0.010400773026049137, + "eval_runtime": 107.7966, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, "step": 265000 }, { - "epoch": 1.34, - "learning_rate": 9.944856743571243e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019695837793981557, + "loss": 0.0113, "step": 265010 }, { - "epoch": 1.34, - "learning_rate": 9.944099974269843e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.0001969544897234441, + "loss": 0.0104, "step": 265020 }, { - "epoch": 1.34, - "learning_rate": 9.943343204968441e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019695060150707266, + "loss": 0.0158, "step": 265030 }, { - "epoch": 1.34, - "learning_rate": 9.94258643566704e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.0001969467132907012, + "loss": 0.02, "step": 265040 }, { - "epoch": 1.34, - "learning_rate": 9.94182966636564e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.0001969428250743297, + "loss": 0.0157, "step": 265050 }, { - "epoch": 1.34, - "learning_rate": 9.941072897064238e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019693893685795825, + "loss": 0.0143, "step": 265060 }, { - "epoch": 1.34, - "learning_rate": 9.940316127762837e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.0001969350486415868, + "loss": 0.0168, "step": 265070 }, { - "epoch": 1.34, - "learning_rate": 9.939559358461437e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019693116042521534, + "loss": 0.0158, "step": 265080 }, { - "epoch": 1.34, - "learning_rate": 9.938802589160035e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019692727220884385, + "loss": 0.0125, "step": 265090 }, { - "epoch": 1.34, - "learning_rate": 9.938045819858635e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.0001969233839924724, + "loss": 0.014, "step": 265100 }, { - "epoch": 1.34, - "learning_rate": 9.937289050557233e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019691949577610093, + "loss": 0.0132, "step": 265110 }, { - "epoch": 1.34, - "learning_rate": 9.936532281255832e-05, - "loss": 0.0051, + "epoch": 0.69, + "learning_rate": 0.00019691560755972948, + "loss": 0.0194, "step": 265120 }, { - "epoch": 1.34, - "learning_rate": 9.935775511954432e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.000196911719343358, + "loss": 0.0164, "step": 265130 }, { - "epoch": 1.34, - "learning_rate": 9.93501874265303e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019690783112698653, + "loss": 0.0169, "step": 265140 }, { - "epoch": 1.34, - "learning_rate": 9.93426197335163e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019690394291061507, + "loss": 0.0158, "step": 265150 }, { - "epoch": 1.34, - "learning_rate": 9.933505204050229e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019690005469424362, + "loss": 0.0156, "step": 265160 }, { - "epoch": 1.34, - "learning_rate": 9.932748434748827e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019689616647787213, + "loss": 0.017, "step": 265170 }, { - "epoch": 1.34, - "learning_rate": 9.931991665447427e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019689227826150067, + "loss": 0.0149, "step": 265180 }, { - "epoch": 1.34, - "learning_rate": 9.931234896146025e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019688839004512924, + "loss": 0.0146, "step": 265190 }, { - "epoch": 1.34, - "learning_rate": 9.930478126844624e-05, - "loss": 0.0106, + "epoch": 0.69, + "learning_rate": 0.00019688450182875776, + "loss": 0.0196, "step": 265200 }, { - "epoch": 1.34, - "learning_rate": 9.929721357543224e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001968806136123863, + "loss": 0.0167, "step": 265210 }, { - "epoch": 1.34, - "learning_rate": 9.928964588241822e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.0001968767253960148, + "loss": 0.0119, "step": 265220 }, { - "epoch": 1.34, - "learning_rate": 9.928207818940421e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019687283717964333, + "loss": 0.0114, "step": 265230 }, { - "epoch": 1.34, - "learning_rate": 9.927451049639021e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.0001968689489632719, + "loss": 0.0146, "step": 265240 }, { - "epoch": 1.34, - "learning_rate": 9.926694280337619e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019686506074690044, + "loss": 0.0137, "step": 265250 }, { - "epoch": 1.34, - "learning_rate": 9.925937511036218e-05, - "loss": 0.0057, + "epoch": 0.69, + "learning_rate": 0.00019686117253052895, + "loss": 0.0141, "step": 265260 }, { - "epoch": 1.34, - "learning_rate": 9.925180741734817e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.0001968572843141575, + "loss": 0.0245, "step": 265270 }, { - "epoch": 1.34, - "learning_rate": 9.924423972433416e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019685339609778603, + "loss": 0.0123, "step": 265280 }, { - "epoch": 1.34, - "learning_rate": 9.923667203132016e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019684950788141458, + "loss": 0.0271, "step": 265290 }, { - "epoch": 1.34, - "learning_rate": 9.922910433830614e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.0001968456196650431, + "loss": 0.0165, "step": 265300 }, { - "epoch": 1.34, - "learning_rate": 9.922153664529213e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019684173144867163, + "loss": 0.0155, "step": 265310 }, { - "epoch": 1.34, - "learning_rate": 9.921396895227813e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019683784323230017, + "loss": 0.0156, "step": 265320 }, { - "epoch": 1.34, - "learning_rate": 9.920640125926411e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019683395501592872, + "loss": 0.0123, "step": 265330 }, { - "epoch": 1.34, - "learning_rate": 9.91988335662501e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019683006679955723, + "loss": 0.0177, "step": 265340 }, { - "epoch": 1.34, - "learning_rate": 9.919126587323609e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019682617858318577, + "loss": 0.0137, "step": 265350 }, { - "epoch": 1.34, - "learning_rate": 9.918369818022208e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019682229036681434, + "loss": 0.0179, "step": 265360 }, { - "epoch": 1.34, - "learning_rate": 9.917613048720808e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.00019681840215044285, + "loss": 0.0154, "step": 265370 }, { - "epoch": 1.34, - "learning_rate": 9.916856279419406e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019681451393407137, + "loss": 0.0177, "step": 265380 }, { - "epoch": 1.34, - "learning_rate": 9.916099510118005e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.0001968106257176999, + "loss": 0.0152, "step": 265390 }, { - "epoch": 1.34, - "learning_rate": 9.915342740816605e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019680673750132848, + "loss": 0.0174, "step": 265400 }, { - "epoch": 1.34, - "learning_rate": 9.914585971515203e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.000196802849284957, + "loss": 0.0173, "step": 265410 }, { - "epoch": 1.34, - "learning_rate": 9.913829202213802e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019679896106858554, + "loss": 0.0133, "step": 265420 }, { - "epoch": 1.34, - "learning_rate": 9.913072432912402e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019679507285221405, + "loss": 0.0162, "step": 265430 }, { - "epoch": 1.34, - "learning_rate": 9.912315663611e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019679118463584262, + "loss": 0.0159, "step": 265440 }, { - "epoch": 1.34, - "learning_rate": 9.9115588943096e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019678729641947113, + "loss": 0.0182, "step": 265450 }, { - "epoch": 1.34, - "learning_rate": 9.910802125008198e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.00019678340820309968, + "loss": 0.0171, "step": 265460 }, { - "epoch": 1.34, - "learning_rate": 9.910045355706797e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.0001967795199867282, + "loss": 0.016, "step": 265470 }, { - "epoch": 1.34, - "learning_rate": 9.909288586405397e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019677563177035673, + "loss": 0.0166, "step": 265480 }, { - "epoch": 1.34, - "learning_rate": 9.908531817103995e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019677174355398527, + "loss": 0.0172, "step": 265490 }, { - "epoch": 1.34, - "learning_rate": 9.907775047802594e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019676785533761381, + "loss": 0.0137, "step": 265500 }, { - "epoch": 1.34, - "learning_rate": 9.907018278501194e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019676396712124233, + "loss": 0.0148, "step": 265510 }, { - "epoch": 1.34, - "learning_rate": 9.90626150919979e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019676007890487087, + "loss": 0.0166, "step": 265520 }, { - "epoch": 1.34, - "learning_rate": 9.90550473989839e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019675619068849944, + "loss": 0.0132, "step": 265530 }, { - "epoch": 1.34, - "learning_rate": 9.904747970596988e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019675230247212795, + "loss": 0.0178, "step": 265540 }, { - "epoch": 1.34, - "learning_rate": 9.903991201295588e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019674841425575647, + "loss": 0.0148, "step": 265550 }, { - "epoch": 1.34, - "learning_rate": 9.903234431994186e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.000196744526039385, + "loss": 0.0177, "step": 265560 }, { - "epoch": 1.34, - "learning_rate": 9.902477662692785e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019674063782301358, + "loss": 0.0141, "step": 265570 }, { - "epoch": 1.34, - "learning_rate": 9.901720893391385e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001967367496066421, + "loss": 0.0153, "step": 265580 }, { - "epoch": 1.34, - "learning_rate": 9.900964124089983e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019673286139027064, + "loss": 0.0127, "step": 265590 }, { - "epoch": 1.34, - "learning_rate": 9.900207354788582e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019672897317389915, + "loss": 0.0185, "step": 265600 }, { - "epoch": 1.34, - "learning_rate": 9.899450585487182e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019672508495752772, + "loss": 0.0159, "step": 265610 }, { - "epoch": 1.34, - "learning_rate": 9.89869381618578e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019672119674115623, + "loss": 0.0125, "step": 265620 }, { - "epoch": 1.34, - "learning_rate": 9.89793704688438e-05, - "loss": 0.0109, + "epoch": 0.69, + "learning_rate": 0.00019671730852478477, + "loss": 0.0185, "step": 265630 }, { - "epoch": 1.34, - "learning_rate": 9.897180277582978e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.0001967134203084133, + "loss": 0.0193, "step": 265640 }, { - "epoch": 1.34, - "learning_rate": 9.896423508281577e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019670953209204186, + "loss": 0.0142, "step": 265650 }, { - "epoch": 1.34, - "learning_rate": 9.895666738980177e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019670564387567037, + "loss": 0.0166, "step": 265660 }, { - "epoch": 1.34, - "learning_rate": 9.894909969678775e-05, - "loss": 0.0115, + "epoch": 0.69, + "learning_rate": 0.00019670175565929891, + "loss": 0.0135, "step": 265670 }, { - "epoch": 1.34, - "learning_rate": 9.894153200377374e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019669786744292743, + "loss": 0.0133, "step": 265680 }, { - "epoch": 1.34, - "learning_rate": 9.893396431075974e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.000196693979226556, + "loss": 0.0151, "step": 265690 }, { - "epoch": 1.34, - "learning_rate": 9.892639661774572e-05, - "loss": 0.0103, + "epoch": 0.69, + "learning_rate": 0.0001966900910101845, + "loss": 0.0181, "step": 265700 }, { - "epoch": 1.34, - "learning_rate": 9.891882892473172e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019668620279381305, + "loss": 0.0152, "step": 265710 }, { - "epoch": 1.34, - "learning_rate": 9.89112612317177e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019668231457744157, + "loss": 0.0111, "step": 265720 }, { - "epoch": 1.34, - "learning_rate": 9.890369353870369e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.0001966784263610701, + "loss": 0.0171, "step": 265730 }, { - "epoch": 1.34, - "learning_rate": 9.889612584568969e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.00019667453814469868, + "loss": 0.0138, "step": 265740 }, { - "epoch": 1.34, - "learning_rate": 9.888855815267567e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.0001966706499283272, + "loss": 0.0154, "step": 265750 }, { - "epoch": 1.34, - "learning_rate": 9.888099045966166e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019666676171195573, + "loss": 0.0193, "step": 265760 }, { - "epoch": 1.34, - "learning_rate": 9.887342276664766e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019666287349558425, + "loss": 0.0154, "step": 265770 }, { - "epoch": 1.34, - "learning_rate": 9.886585507363364e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019665898527921282, + "loss": 0.0141, "step": 265780 }, { - "epoch": 1.34, - "learning_rate": 9.885828738061963e-05, - "loss": 0.0105, + "epoch": 0.69, + "learning_rate": 0.00019665509706284133, + "loss": 0.0126, "step": 265790 }, { - "epoch": 1.34, - "learning_rate": 9.885071968760562e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019665120884646987, + "loss": 0.0191, "step": 265800 }, { - "epoch": 1.34, - "learning_rate": 9.884315199459161e-05, - "loss": 0.01, + "epoch": 0.69, + "learning_rate": 0.0001966473206300984, + "loss": 0.0186, "step": 265810 }, { - "epoch": 1.34, - "learning_rate": 9.88355843015776e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019664343241372696, + "loss": 0.0148, "step": 265820 }, { - "epoch": 1.34, - "learning_rate": 9.882801660856359e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019663954419735547, + "loss": 0.0143, "step": 265830 }, { - "epoch": 1.34, - "learning_rate": 9.882044891554958e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.000196635655980984, + "loss": 0.0148, "step": 265840 }, { - "epoch": 1.34, - "learning_rate": 9.881288122253558e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019663176776461253, + "loss": 0.0107, "step": 265850 }, { - "epoch": 1.34, - "learning_rate": 9.880531352952156e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001966278795482411, + "loss": 0.0165, "step": 265860 }, { - "epoch": 1.34, - "learning_rate": 9.879774583650755e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001966239913318696, + "loss": 0.0142, "step": 265870 }, { - "epoch": 1.34, - "learning_rate": 9.879017814349355e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019662010311549815, + "loss": 0.0142, "step": 265880 }, { - "epoch": 1.34, - "learning_rate": 9.878261045047953e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019661621489912667, + "loss": 0.0159, "step": 265890 }, { - "epoch": 1.34, - "learning_rate": 9.877504275746553e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019661232668275524, + "loss": 0.0175, "step": 265900 }, { - "epoch": 1.34, - "learning_rate": 9.876747506445151e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019660843846638378, + "loss": 0.0129, "step": 265910 }, { - "epoch": 1.34, - "learning_rate": 9.87599073714375e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.0001966045502500123, + "loss": 0.0148, "step": 265920 }, { - "epoch": 1.34, - "learning_rate": 9.87523396784235e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019660066203364083, + "loss": 0.0148, "step": 265930 }, { - "epoch": 1.34, - "learning_rate": 9.874477198540948e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019659677381726938, + "loss": 0.0141, "step": 265940 }, { - "epoch": 1.34, - "learning_rate": 9.873720429239547e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019659288560089792, + "loss": 0.0137, "step": 265950 }, { - "epoch": 1.34, - "learning_rate": 9.872963659938147e-05, - "loss": 0.0059, + "epoch": 0.69, + "learning_rate": 0.00019658899738452643, + "loss": 0.015, "step": 265960 }, { - "epoch": 1.34, - "learning_rate": 9.872206890636745e-05, - "loss": 0.0053, + "epoch": 0.69, + "learning_rate": 0.00019658510916815497, + "loss": 0.0153, "step": 265970 }, { - "epoch": 1.34, - "learning_rate": 9.871450121335344e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.0001965812209517835, + "loss": 0.0157, "step": 265980 }, { - "epoch": 1.34, - "learning_rate": 9.870693352033943e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019657733273541206, + "loss": 0.0174, "step": 265990 }, { - "epoch": 1.34, - "learning_rate": 9.869936582732542e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019657344451904057, + "loss": 0.0141, "step": 266000 }, { - "epoch": 1.34, - "eval_cer": 0.9144401736232748, - "eval_loss": 0.0059706708416342735, - "eval_runtime": 116.3669, - "eval_samples_per_second": 17.187, - "eval_steps_per_second": 4.297, + "epoch": 0.69, + "eval_cer": 0.8817782667176135, + "eval_loss": 0.01088875625282526, + "eval_runtime": 107.9649, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, "step": 266000 }, { - "epoch": 1.34, - "learning_rate": 9.869179813431142e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001965695563026691, + "loss": 0.0158, "step": 266010 }, { - "epoch": 1.34, - "learning_rate": 9.86842304412974e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019656566808629763, + "loss": 0.014, "step": 266020 }, { - "epoch": 1.34, - "learning_rate": 9.867666274828339e-05, - "loss": 0.0052, + "epoch": 0.69, + "learning_rate": 0.0001965617798699262, + "loss": 0.0155, "step": 266030 }, { - "epoch": 1.34, - "learning_rate": 9.866909505526939e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.0001965578916535547, + "loss": 0.0136, "step": 266040 }, { - "epoch": 1.34, - "learning_rate": 9.866152736225537e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019655400343718325, + "loss": 0.0157, "step": 266050 }, { - "epoch": 1.34, - "learning_rate": 9.865395966924136e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019655011522081177, + "loss": 0.0154, "step": 266060 }, { - "epoch": 1.34, - "learning_rate": 9.864639197622735e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019654622700444034, + "loss": 0.0129, "step": 266070 }, { - "epoch": 1.34, - "learning_rate": 9.863882428321334e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019654233878806888, + "loss": 0.014, "step": 266080 }, { - "epoch": 1.34, - "learning_rate": 9.863125659019934e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.0001965384505716974, + "loss": 0.0129, "step": 266090 }, { - "epoch": 1.34, - "learning_rate": 9.862368889718532e-05, - "loss": 0.0103, + "epoch": 0.69, + "learning_rate": 0.0001965345623553259, + "loss": 0.0136, "step": 266100 }, { - "epoch": 1.34, - "learning_rate": 9.861612120417131e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019653067413895448, + "loss": 0.0108, "step": 266110 }, { - "epoch": 1.34, - "learning_rate": 9.860855351115731e-05, - "loss": 0.0117, + "epoch": 0.69, + "learning_rate": 0.00019652678592258302, + "loss": 0.0115, "step": 266120 }, { - "epoch": 1.34, - "learning_rate": 9.860098581814329e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019652289770621153, + "loss": 0.0127, "step": 266130 }, { - "epoch": 1.34, - "learning_rate": 9.859341812512928e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.00019651900948984007, + "loss": 0.0144, "step": 266140 }, { - "epoch": 1.34, - "learning_rate": 9.858585043211525e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019651512127346861, + "loss": 0.0156, "step": 266150 }, { - "epoch": 1.34, - "learning_rate": 9.857828273910125e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019651123305709716, + "loss": 0.017, "step": 266160 }, { - "epoch": 1.34, - "learning_rate": 9.857071504608723e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019650734484072567, + "loss": 0.0154, "step": 266170 }, { - "epoch": 1.34, - "learning_rate": 9.856314735307322e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.0001965034566243542, + "loss": 0.0172, "step": 266180 }, { - "epoch": 1.34, - "learning_rate": 9.855557966005922e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019649956840798275, + "loss": 0.0142, "step": 266190 }, { - "epoch": 1.34, - "learning_rate": 9.85480119670452e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.0001964956801916113, + "loss": 0.0133, "step": 266200 }, { - "epoch": 1.34, - "learning_rate": 9.85404442740312e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.0001964917919752398, + "loss": 0.0132, "step": 266210 }, { - "epoch": 1.34, - "learning_rate": 9.853287658101719e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019648790375886835, + "loss": 0.0195, "step": 266220 }, { - "epoch": 1.34, - "learning_rate": 9.852530888800317e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019648401554249687, + "loss": 0.0165, "step": 266230 }, { - "epoch": 1.34, - "learning_rate": 9.851774119498917e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.00019648012732612544, + "loss": 0.0247, "step": 266240 }, { - "epoch": 1.34, - "learning_rate": 9.851017350197515e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019647623910975398, + "loss": 0.014, "step": 266250 }, { - "epoch": 1.34, - "learning_rate": 9.850260580896114e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.0001964723508933825, + "loss": 0.0155, "step": 266260 }, { - "epoch": 1.34, - "learning_rate": 9.849503811594714e-05, - "loss": 0.0057, + "epoch": 0.69, + "learning_rate": 0.000196468462677011, + "loss": 0.0155, "step": 266270 }, { - "epoch": 1.34, - "learning_rate": 9.848747042293312e-05, - "loss": 0.0054, + "epoch": 0.69, + "learning_rate": 0.00019646457446063957, + "loss": 0.0147, "step": 266280 }, { - "epoch": 1.34, - "learning_rate": 9.847990272991911e-05, - "loss": 0.0068, + "epoch": 0.69, + "learning_rate": 0.00019646068624426812, + "loss": 0.0152, "step": 266290 }, { - "epoch": 1.34, - "learning_rate": 9.847233503690511e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019645679802789663, + "loss": 0.0112, "step": 266300 }, { - "epoch": 1.34, - "learning_rate": 9.846476734389109e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019645290981152517, + "loss": 0.0178, "step": 266310 }, { - "epoch": 1.34, - "learning_rate": 9.845719965087708e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019644902159515371, + "loss": 0.014, "step": 266320 }, { - "epoch": 1.34, - "learning_rate": 9.844963195786308e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019644513337878226, + "loss": 0.0167, "step": 266330 }, { - "epoch": 1.34, - "learning_rate": 9.844206426484906e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019644124516241077, + "loss": 0.0214, "step": 266340 }, { - "epoch": 1.34, - "learning_rate": 9.843449657183506e-05, - "loss": 0.006, + "epoch": 0.69, + "learning_rate": 0.0001964373569460393, + "loss": 0.0147, "step": 266350 }, { - "epoch": 1.34, - "learning_rate": 9.842692887882104e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019643346872966785, + "loss": 0.0159, "step": 266360 }, { - "epoch": 1.34, - "learning_rate": 9.841936118580703e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.0001964295805132964, + "loss": 0.0151, "step": 266370 }, { - "epoch": 1.34, - "learning_rate": 9.841179349279303e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001964256922969249, + "loss": 0.0151, "step": 266380 }, { - "epoch": 1.34, - "learning_rate": 9.840422579977901e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019642180408055345, + "loss": 0.0148, "step": 266390 }, { - "epoch": 1.34, - "learning_rate": 9.8396658106765e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019641791586418202, + "loss": 0.0155, "step": 266400 }, { - "epoch": 1.34, - "learning_rate": 9.8389090413751e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019641402764781053, + "loss": 0.0143, "step": 266410 }, { - "epoch": 1.34, - "learning_rate": 9.838152272073698e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019641013943143905, + "loss": 0.0137, "step": 266420 }, { - "epoch": 1.34, - "learning_rate": 9.837395502772298e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.0001964062512150676, + "loss": 0.0145, "step": 266430 }, { - "epoch": 1.34, - "learning_rate": 9.836638733470896e-05, - "loss": 0.0057, + "epoch": 0.69, + "learning_rate": 0.00019640236299869616, + "loss": 0.0125, "step": 266440 }, { - "epoch": 1.34, - "learning_rate": 9.835881964169495e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019639847478232467, + "loss": 0.0168, "step": 266450 }, { - "epoch": 1.34, - "learning_rate": 9.835125194868095e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019639458656595322, + "loss": 0.0154, "step": 266460 }, { - "epoch": 1.34, - "learning_rate": 9.834368425566693e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019639069834958173, + "loss": 0.018, "step": 266470 }, { - "epoch": 1.34, - "learning_rate": 9.833611656265292e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019638681013321027, + "loss": 0.0168, "step": 266480 }, { - "epoch": 1.34, - "learning_rate": 9.832854886963892e-05, - "loss": 0.0102, + "epoch": 0.69, + "learning_rate": 0.0001963829219168388, + "loss": 0.0141, "step": 266490 }, { - "epoch": 1.34, - "learning_rate": 9.83209811766249e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019637903370046736, + "loss": 0.0166, "step": 266500 }, { - "epoch": 1.34, - "learning_rate": 9.83134134836109e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019637514548409587, + "loss": 0.0208, "step": 266510 }, { - "epoch": 1.34, - "learning_rate": 9.830584579059688e-05, - "loss": 0.0062, + "epoch": 0.69, + "learning_rate": 0.0001963712572677244, + "loss": 0.0137, "step": 266520 }, { - "epoch": 1.34, - "learning_rate": 9.829827809758287e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019636736905135295, + "loss": 0.0171, "step": 266530 }, { - "epoch": 1.34, - "learning_rate": 9.829071040456887e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.0001963634808349815, + "loss": 0.0169, "step": 266540 }, { - "epoch": 1.34, - "learning_rate": 9.828314271155485e-05, - "loss": 0.0093, + "epoch": 0.69, + "learning_rate": 0.00019635959261861, + "loss": 0.0158, "step": 266550 }, { - "epoch": 1.34, - "learning_rate": 9.827557501854084e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019635570440223855, + "loss": 0.0107, "step": 266560 }, { - "epoch": 1.34, - "learning_rate": 9.826800732552684e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001963518161858671, + "loss": 0.0154, "step": 266570 }, { - "epoch": 1.34, - "learning_rate": 9.826043963251282e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019634792796949563, + "loss": 0.0149, "step": 266580 }, { - "epoch": 1.34, - "learning_rate": 9.825287193949881e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019634403975312415, + "loss": 0.0142, "step": 266590 }, { - "epoch": 1.35, - "learning_rate": 9.82453042464848e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001963401515367527, + "loss": 0.012, "step": 266600 }, { - "epoch": 1.35, - "learning_rate": 9.823773655347079e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019633626332038126, + "loss": 0.0176, "step": 266610 }, { - "epoch": 1.35, - "learning_rate": 9.823016886045679e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019633237510400977, + "loss": 0.0152, "step": 266620 }, { - "epoch": 1.35, - "learning_rate": 9.822260116744277e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019632848688763832, + "loss": 0.0145, "step": 266630 }, { - "epoch": 1.35, - "learning_rate": 9.821503347442876e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019632459867126683, + "loss": 0.0141, "step": 266640 }, { - "epoch": 1.35, - "learning_rate": 9.820746578141476e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.0001963207104548954, + "loss": 0.0167, "step": 266650 }, { - "epoch": 1.35, - "learning_rate": 9.819989808840074e-05, - "loss": 0.0196, + "epoch": 0.69, + "learning_rate": 0.0001963168222385239, + "loss": 0.0147, "step": 266660 }, { - "epoch": 1.35, - "learning_rate": 9.819233039538673e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.00019631293402215245, + "loss": 0.0121, "step": 266670 }, { - "epoch": 1.35, - "learning_rate": 9.818476270237271e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019630904580578097, + "loss": 0.0185, "step": 266680 }, { - "epoch": 1.35, - "learning_rate": 9.817719500935871e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.00019630515758940954, + "loss": 0.0151, "step": 266690 }, { - "epoch": 1.35, - "learning_rate": 9.81696273163447e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019630126937303805, + "loss": 0.0148, "step": 266700 }, { - "epoch": 1.35, - "learning_rate": 9.816205962333069e-05, - "loss": 0.005, + "epoch": 0.69, + "learning_rate": 0.0001962973811566666, + "loss": 0.0176, "step": 266710 }, { - "epoch": 1.35, - "learning_rate": 9.815449193031668e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.0001962934929402951, + "loss": 0.0122, "step": 266720 }, { - "epoch": 1.35, - "learning_rate": 9.814692423730268e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019628960472392365, + "loss": 0.0176, "step": 266730 }, { - "epoch": 1.35, - "learning_rate": 9.813935654428866e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001962857165075522, + "loss": 0.0145, "step": 266740 }, { - "epoch": 1.35, - "learning_rate": 9.813178885127465e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019628182829118073, + "loss": 0.014, "step": 266750 }, { - "epoch": 1.35, - "learning_rate": 9.812422115826063e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019627794007480925, + "loss": 0.0138, "step": 266760 }, { - "epoch": 1.35, - "learning_rate": 9.811665346524663e-05, - "loss": 0.0131, + "epoch": 0.69, + "learning_rate": 0.0001962740518584378, + "loss": 0.0188, "step": 266770 }, { - "epoch": 1.35, - "learning_rate": 9.810908577223261e-05, - "loss": 0.0096, + "epoch": 0.69, + "learning_rate": 0.00019627016364206636, + "loss": 0.0142, "step": 266780 }, { - "epoch": 1.35, - "learning_rate": 9.810151807921859e-05, - "loss": 0.0064, + "epoch": 0.69, + "learning_rate": 0.00019626627542569487, + "loss": 0.0177, "step": 266790 }, { - "epoch": 1.35, - "learning_rate": 9.809395038620459e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019626238720932341, + "loss": 0.0149, "step": 266800 }, { - "epoch": 1.35, - "learning_rate": 9.808638269319057e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019625849899295193, + "loss": 0.015, "step": 266810 }, { - "epoch": 1.35, - "learning_rate": 9.807881500017656e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.0001962546107765805, + "loss": 0.0154, "step": 266820 }, { - "epoch": 1.35, - "learning_rate": 9.807124730716256e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.000196250722560209, + "loss": 0.0156, "step": 266830 }, { - "epoch": 1.35, - "learning_rate": 9.806367961414854e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019624683434383755, + "loss": 0.0141, "step": 266840 }, { - "epoch": 1.35, - "learning_rate": 9.805611192113454e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019624294612746607, + "loss": 0.0134, "step": 266850 }, { - "epoch": 1.35, - "learning_rate": 9.804854422812053e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019623905791109464, + "loss": 0.0164, "step": 266860 }, { - "epoch": 1.35, - "learning_rate": 9.804097653510651e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019623516969472315, + "loss": 0.0145, "step": 266870 }, { - "epoch": 1.35, - "learning_rate": 9.80334088420925e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001962312814783517, + "loss": 0.0155, "step": 266880 }, { - "epoch": 1.35, - "learning_rate": 9.802584114907849e-05, - "loss": 0.0098, + "epoch": 0.69, + "learning_rate": 0.0001962273932619802, + "loss": 0.019, "step": 266890 }, { - "epoch": 1.35, - "learning_rate": 9.801827345606448e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019622350504560878, + "loss": 0.0174, "step": 266900 }, { - "epoch": 1.35, - "learning_rate": 9.801070576305048e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001962196168292373, + "loss": 0.0176, "step": 266910 }, { - "epoch": 1.35, - "learning_rate": 9.800313807003646e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019621572861286583, + "loss": 0.0149, "step": 266920 }, { - "epoch": 1.35, - "learning_rate": 9.799557037702245e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019621184039649435, + "loss": 0.0125, "step": 266930 }, { - "epoch": 1.35, - "learning_rate": 9.798800268400845e-05, - "loss": 0.0101, + "epoch": 0.69, + "learning_rate": 0.00019620795218012292, + "loss": 0.0136, "step": 266940 }, { - "epoch": 1.35, - "learning_rate": 9.798043499099443e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.00019620406396375146, + "loss": 0.0147, "step": 266950 }, { - "epoch": 1.35, - "learning_rate": 9.797286729798043e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019620017574737997, + "loss": 0.0145, "step": 266960 }, { - "epoch": 1.35, - "learning_rate": 9.796529960496641e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.0001961962875310085, + "loss": 0.0163, "step": 266970 }, { - "epoch": 1.35, - "learning_rate": 9.79577319119524e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019619239931463703, + "loss": 0.0136, "step": 266980 }, { - "epoch": 1.35, - "learning_rate": 9.79501642189384e-05, - "loss": 0.0088, + "epoch": 0.69, + "learning_rate": 0.0001961885110982656, + "loss": 0.0139, "step": 266990 }, { - "epoch": 1.35, - "learning_rate": 9.794259652592438e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.0001961846228818941, + "loss": 0.0137, "step": 267000 }, { - "epoch": 1.35, - "eval_cer": 0.9144362920387732, - "eval_loss": 0.006072907242923975, - "eval_runtime": 116.2245, - "eval_samples_per_second": 17.208, - "eval_steps_per_second": 4.302, + "epoch": 0.69, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.01065248902887106, + "eval_runtime": 107.8983, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, "step": 267000 }, { - "epoch": 1.35, - "learning_rate": 9.793502883291037e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019618073466552265, + "loss": 0.0155, "step": 267010 }, { - "epoch": 1.35, - "learning_rate": 9.792746113989637e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019617684644915117, + "loss": 0.0146, "step": 267020 }, { - "epoch": 1.35, - "learning_rate": 9.791989344688235e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019617295823277974, + "loss": 0.0185, "step": 267030 }, { - "epoch": 1.35, - "learning_rate": 9.791232575386835e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019616907001640825, + "loss": 0.0161, "step": 267040 }, { - "epoch": 1.35, - "learning_rate": 9.790475806085433e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001961651818000368, + "loss": 0.0159, "step": 267050 }, { - "epoch": 1.35, - "learning_rate": 9.789719036784032e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001961612935836653, + "loss": 0.0138, "step": 267060 }, { - "epoch": 1.35, - "learning_rate": 9.788962267482632e-05, - "loss": 0.0071, + "epoch": 0.69, + "learning_rate": 0.00019615740536729388, + "loss": 0.0127, "step": 267070 }, { - "epoch": 1.35, - "learning_rate": 9.78820549818123e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.0001961535171509224, + "loss": 0.0167, "step": 267080 }, { - "epoch": 1.35, - "learning_rate": 9.787448728879829e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019614962893455093, + "loss": 0.0161, "step": 267090 }, { - "epoch": 1.35, - "learning_rate": 9.786691959578429e-05, - "loss": 0.0102, + "epoch": 0.69, + "learning_rate": 0.00019614574071817945, + "loss": 0.0146, "step": 267100 }, { - "epoch": 1.35, - "learning_rate": 9.785935190277027e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019614185250180802, + "loss": 0.0179, "step": 267110 }, { - "epoch": 1.35, - "learning_rate": 9.785178420975626e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019613796428543656, + "loss": 0.0139, "step": 267120 }, { - "epoch": 1.35, - "learning_rate": 9.784421651674225e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019613407606906507, + "loss": 0.016, "step": 267130 }, { - "epoch": 1.35, - "learning_rate": 9.783664882372824e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019613018785269359, + "loss": 0.0155, "step": 267140 }, { - "epoch": 1.35, - "learning_rate": 9.782908113071424e-05, - "loss": 0.0124, + "epoch": 0.69, + "learning_rate": 0.00019612629963632215, + "loss": 0.0156, "step": 267150 }, { - "epoch": 1.35, - "learning_rate": 9.782151343770022e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001961224114199507, + "loss": 0.0182, "step": 267160 }, { - "epoch": 1.35, - "learning_rate": 9.781394574468621e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.0001961185232035792, + "loss": 0.0144, "step": 267170 }, { - "epoch": 1.35, - "learning_rate": 9.780637805167221e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019611463498720775, + "loss": 0.0148, "step": 267180 }, { - "epoch": 1.35, - "learning_rate": 9.779881035865819e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001961107467708363, + "loss": 0.0198, "step": 267190 }, { - "epoch": 1.35, - "learning_rate": 9.779124266564418e-05, - "loss": 0.0057, + "epoch": 0.69, + "learning_rate": 0.00019610685855446484, + "loss": 0.0117, "step": 267200 }, { - "epoch": 1.35, - "learning_rate": 9.778367497263017e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019610297033809335, + "loss": 0.0158, "step": 267210 }, { - "epoch": 1.35, - "learning_rate": 9.777610727961616e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.0001960990821217219, + "loss": 0.0231, "step": 267220 }, { - "epoch": 1.35, - "learning_rate": 9.776853958660216e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.0001960951939053504, + "loss": 0.016, "step": 267230 }, { - "epoch": 1.35, - "learning_rate": 9.776097189358814e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019609130568897898, + "loss": 0.0136, "step": 267240 }, { - "epoch": 1.35, - "learning_rate": 9.775340420057413e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.0001960874174726075, + "loss": 0.0162, "step": 267250 }, { - "epoch": 1.35, - "learning_rate": 9.774583650756013e-05, - "loss": 0.0095, + "epoch": 0.69, + "learning_rate": 0.00019608352925623603, + "loss": 0.0135, "step": 267260 }, { - "epoch": 1.35, - "learning_rate": 9.773826881454611e-05, - "loss": 0.0112, + "epoch": 0.69, + "learning_rate": 0.00019607964103986455, + "loss": 0.0182, "step": 267270 }, { - "epoch": 1.35, - "learning_rate": 9.77307011215321e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019607575282349311, + "loss": 0.0149, "step": 267280 }, { - "epoch": 1.35, - "learning_rate": 9.772313342851808e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019607186460712163, + "loss": 0.0122, "step": 267290 }, { - "epoch": 1.35, - "learning_rate": 9.771556573550408e-05, - "loss": 0.0122, + "epoch": 0.69, + "learning_rate": 0.00019606797639075017, + "loss": 0.0141, "step": 267300 }, { - "epoch": 1.35, - "learning_rate": 9.770799804249007e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019606408817437869, + "loss": 0.0206, "step": 267310 }, { - "epoch": 1.35, - "learning_rate": 9.770043034947606e-05, - "loss": 0.0099, + "epoch": 0.69, + "learning_rate": 0.00019606019995800725, + "loss": 0.0128, "step": 267320 }, { - "epoch": 1.35, - "learning_rate": 9.769286265646205e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.0001960563117416358, + "loss": 0.0159, "step": 267330 }, { - "epoch": 1.35, - "learning_rate": 9.768529496344805e-05, - "loss": 0.0059, + "epoch": 0.69, + "learning_rate": 0.0001960524235252643, + "loss": 0.0153, "step": 267340 }, { - "epoch": 1.35, - "learning_rate": 9.767772727043403e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.00019604853530889285, + "loss": 0.0194, "step": 267350 }, { - "epoch": 1.35, - "learning_rate": 9.767015957742002e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.0001960446470925214, + "loss": 0.0124, "step": 267360 }, { - "epoch": 1.35, - "learning_rate": 9.766259188440602e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019604075887614994, + "loss": 0.0156, "step": 267370 }, { - "epoch": 1.35, - "learning_rate": 9.7655024191392e-05, - "loss": 0.0111, + "epoch": 0.69, + "learning_rate": 0.00019603687065977845, + "loss": 0.0157, "step": 267380 }, { - "epoch": 1.35, - "learning_rate": 9.7647456498378e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.000196032982443407, + "loss": 0.0135, "step": 267390 }, { - "epoch": 1.35, - "learning_rate": 9.763988880536398e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019602909422703553, + "loss": 0.017, "step": 267400 }, { - "epoch": 1.35, - "learning_rate": 9.763232111234996e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019602520601066407, + "loss": 0.0129, "step": 267410 }, { - "epoch": 1.35, - "learning_rate": 9.762475341933594e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001960213177942926, + "loss": 0.0188, "step": 267420 }, { - "epoch": 1.35, - "learning_rate": 9.761718572632193e-05, - "loss": 0.0089, + "epoch": 0.69, + "learning_rate": 0.00019601742957792113, + "loss": 0.0139, "step": 267430 }, { - "epoch": 1.35, - "learning_rate": 9.760961803330793e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.0001960135413615497, + "loss": 0.0121, "step": 267440 }, { - "epoch": 1.35, - "learning_rate": 9.760205034029391e-05, - "loss": 0.0093, + "epoch": 0.69, + "learning_rate": 0.00019600965314517821, + "loss": 0.0131, "step": 267450 }, { - "epoch": 1.35, - "learning_rate": 9.75944826472799e-05, - "loss": 0.0102, + "epoch": 0.69, + "learning_rate": 0.00019600576492880673, + "loss": 0.0132, "step": 267460 }, { - "epoch": 1.35, - "learning_rate": 9.75869149542659e-05, - "loss": 0.0109, + "epoch": 0.69, + "learning_rate": 0.00019600187671243527, + "loss": 0.0173, "step": 267470 }, { - "epoch": 1.35, - "learning_rate": 9.757934726125188e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.00019599798849606379, + "loss": 0.0158, "step": 267480 }, { - "epoch": 1.35, - "learning_rate": 9.757177956823788e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019599410027969235, + "loss": 0.0135, "step": 267490 }, { - "epoch": 1.35, - "learning_rate": 9.756421187522386e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001959902120633209, + "loss": 0.0201, "step": 267500 }, { - "epoch": 1.35, - "learning_rate": 9.755664418220985e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.0001959863238469494, + "loss": 0.0169, "step": 267510 }, { - "epoch": 1.35, - "learning_rate": 9.754907648919585e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019598243563057795, + "loss": 0.0207, "step": 267520 }, { - "epoch": 1.35, - "learning_rate": 9.754150879618183e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001959785474142065, + "loss": 0.0169, "step": 267530 }, { - "epoch": 1.35, - "learning_rate": 9.753394110316782e-05, - "loss": 0.0063, + "epoch": 0.69, + "learning_rate": 0.00019597465919783503, + "loss": 0.0141, "step": 267540 }, { - "epoch": 1.35, - "learning_rate": 9.752637341015382e-05, - "loss": 0.0057, + "epoch": 0.69, + "learning_rate": 0.00019597077098146355, + "loss": 0.0164, "step": 267550 }, { - "epoch": 1.35, - "learning_rate": 9.75188057171398e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.0001959668827650921, + "loss": 0.0168, "step": 267560 }, { - "epoch": 1.35, - "learning_rate": 9.75112380241258e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019596299454872063, + "loss": 0.0137, "step": 267570 }, { - "epoch": 1.35, - "learning_rate": 9.750367033111178e-05, - "loss": 0.007, + "epoch": 0.69, + "learning_rate": 0.00019595910633234917, + "loss": 0.0142, "step": 267580 }, { - "epoch": 1.35, - "learning_rate": 9.749610263809777e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.0001959552181159777, + "loss": 0.0205, "step": 267590 }, { - "epoch": 1.35, - "learning_rate": 9.748853494508377e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019595132989960623, + "loss": 0.016, "step": 267600 }, { - "epoch": 1.35, - "learning_rate": 9.748096725206975e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019594744168323477, + "loss": 0.012, "step": 267610 }, { - "epoch": 1.35, - "learning_rate": 9.747339955905574e-05, - "loss": 0.0081, + "epoch": 0.69, + "learning_rate": 0.00019594355346686331, + "loss": 0.016, "step": 267620 }, { - "epoch": 1.35, - "learning_rate": 9.746583186604174e-05, - "loss": 0.0074, + "epoch": 0.69, + "learning_rate": 0.00019593966525049183, + "loss": 0.0154, "step": 267630 }, { - "epoch": 1.35, - "learning_rate": 9.745826417302772e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019593577703412037, + "loss": 0.0155, "step": 267640 }, { - "epoch": 1.35, - "learning_rate": 9.745069648001371e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019593188881774894, + "loss": 0.0165, "step": 267650 }, { - "epoch": 1.35, - "learning_rate": 9.74431287869997e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019592800060137745, + "loss": 0.0128, "step": 267660 }, { - "epoch": 1.35, - "learning_rate": 9.743556109398569e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.000195924112385006, + "loss": 0.0133, "step": 267670 }, { - "epoch": 1.35, - "learning_rate": 9.742799340097169e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.0001959202241686345, + "loss": 0.0186, "step": 267680 }, { - "epoch": 1.35, - "learning_rate": 9.742042570795767e-05, - "loss": 0.0087, + "epoch": 0.69, + "learning_rate": 0.00019591633595226308, + "loss": 0.0133, "step": 267690 }, { - "epoch": 1.35, - "learning_rate": 9.741285801494366e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001959124477358916, + "loss": 0.0186, "step": 267700 }, { - "epoch": 1.35, - "learning_rate": 9.740529032192966e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.00019590855951952013, + "loss": 0.0146, "step": 267710 }, { - "epoch": 1.35, - "learning_rate": 9.739772262891564e-05, - "loss": 0.008, + "epoch": 0.69, + "learning_rate": 0.00019590467130314865, + "loss": 0.0145, "step": 267720 }, { - "epoch": 1.35, - "learning_rate": 9.739015493590163e-05, - "loss": 0.0072, + "epoch": 0.69, + "learning_rate": 0.0001959007830867772, + "loss": 0.0158, "step": 267730 }, { - "epoch": 1.35, - "learning_rate": 9.738258724288762e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019589689487040573, + "loss": 0.0148, "step": 267740 }, { - "epoch": 1.35, - "learning_rate": 9.737501954987361e-05, - "loss": 0.0073, + "epoch": 0.69, + "learning_rate": 0.00019589300665403427, + "loss": 0.0159, "step": 267750 }, { - "epoch": 1.35, - "learning_rate": 9.73674518568596e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.0001958891184376628, + "loss": 0.0163, "step": 267760 }, { - "epoch": 1.35, - "learning_rate": 9.735988416384559e-05, - "loss": 0.0092, + "epoch": 0.69, + "learning_rate": 0.00019588523022129133, + "loss": 0.0132, "step": 267770 }, { - "epoch": 1.35, - "learning_rate": 9.735231647083158e-05, - "loss": 0.0104, + "epoch": 0.69, + "learning_rate": 0.00019588134200491987, + "loss": 0.0137, "step": 267780 }, { - "epoch": 1.35, - "learning_rate": 9.734474877781758e-05, - "loss": 0.0093, + "epoch": 0.69, + "learning_rate": 0.0001958774537885484, + "loss": 0.0172, "step": 267790 }, { - "epoch": 1.35, - "learning_rate": 9.733718108480356e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019587356557217693, + "loss": 0.017, "step": 267800 }, { - "epoch": 1.35, - "learning_rate": 9.732961339178955e-05, - "loss": 0.0078, + "epoch": 0.69, + "learning_rate": 0.00019586967735580547, + "loss": 0.0164, "step": 267810 }, { - "epoch": 1.35, - "learning_rate": 9.732204569877555e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019586578913943404, + "loss": 0.014, "step": 267820 }, { - "epoch": 1.35, - "learning_rate": 9.731447800576153e-05, - "loss": 0.0108, + "epoch": 0.69, + "learning_rate": 0.00019586190092306255, + "loss": 0.0191, "step": 267830 }, { - "epoch": 1.35, - "learning_rate": 9.730691031274752e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.0001958580127066911, + "loss": 0.0169, "step": 267840 }, { - "epoch": 1.35, - "learning_rate": 9.72993426197335e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.0001958541244903196, + "loss": 0.0137, "step": 267850 }, { - "epoch": 1.35, - "learning_rate": 9.72917749267195e-05, - "loss": 0.0091, + "epoch": 0.69, + "learning_rate": 0.00019585023627394818, + "loss": 0.0165, "step": 267860 }, { - "epoch": 1.35, - "learning_rate": 9.72842072337055e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.0001958463480575767, + "loss": 0.0137, "step": 267870 }, { - "epoch": 1.35, - "learning_rate": 9.727663954069148e-05, - "loss": 0.0076, + "epoch": 0.69, + "learning_rate": 0.00019584245984120523, + "loss": 0.0103, "step": 267880 }, { - "epoch": 1.35, - "learning_rate": 9.726907184767747e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019583857162483375, + "loss": 0.0133, "step": 267890 }, { - "epoch": 1.35, - "learning_rate": 9.726150415466347e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019583468340846232, + "loss": 0.0161, "step": 267900 }, { - "epoch": 1.35, - "learning_rate": 9.725393646164945e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019583079519209083, + "loss": 0.013, "step": 267910 }, { - "epoch": 1.35, - "learning_rate": 9.724636876863544e-05, - "loss": 0.0084, + "epoch": 0.69, + "learning_rate": 0.00019582690697571937, + "loss": 0.0162, "step": 267920 }, { - "epoch": 1.35, - "learning_rate": 9.723880107562143e-05, - "loss": 0.0083, + "epoch": 0.69, + "learning_rate": 0.0001958230187593479, + "loss": 0.0165, "step": 267930 }, { - "epoch": 1.35, - "learning_rate": 9.723123338260742e-05, - "loss": 0.0065, + "epoch": 0.69, + "learning_rate": 0.00019581913054297646, + "loss": 0.0154, "step": 267940 }, { - "epoch": 1.35, - "learning_rate": 9.722366568959342e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019581524232660497, + "loss": 0.0176, "step": 267950 }, { - "epoch": 1.35, - "learning_rate": 9.72160979965794e-05, - "loss": 0.0082, + "epoch": 0.69, + "learning_rate": 0.0001958113541102335, + "loss": 0.0162, "step": 267960 }, { - "epoch": 1.35, - "learning_rate": 9.720853030356539e-05, - "loss": 0.0048, + "epoch": 0.69, + "learning_rate": 0.00019580746589386203, + "loss": 0.0128, "step": 267970 }, { - "epoch": 1.35, - "learning_rate": 9.720096261055139e-05, - "loss": 0.0075, + "epoch": 0.69, + "learning_rate": 0.00019580357767749057, + "loss": 0.0146, "step": 267980 }, { - "epoch": 1.35, - "learning_rate": 9.719339491753737e-05, - "loss": 0.0079, + "epoch": 0.69, + "learning_rate": 0.00019579968946111914, + "loss": 0.0131, "step": 267990 }, { - "epoch": 1.35, - "learning_rate": 9.718582722452336e-05, - "loss": 0.0097, + "epoch": 0.69, + "learning_rate": 0.00019579580124474765, + "loss": 0.0151, "step": 268000 }, { - "epoch": 1.35, - "eval_cer": 0.9144178545123905, - "eval_loss": 0.006040630396455526, - "eval_runtime": 116.1695, - "eval_samples_per_second": 17.216, - "eval_steps_per_second": 4.304, + "epoch": 0.69, + "eval_cer": 0.8817418761573248, + "eval_loss": 0.010366639122366905, + "eval_runtime": 108.2065, + "eval_samples_per_second": 18.483, + "eval_steps_per_second": 4.621, "step": 268000 }, { - "epoch": 1.35, - "learning_rate": 9.717825953150934e-05, - "loss": 0.0077, + "epoch": 0.69, + "learning_rate": 0.00019579191302837617, + "loss": 0.0174, "step": 268010 }, { - "epoch": 1.35, - "learning_rate": 9.717069183849534e-05, - "loss": 0.0066, + "epoch": 0.69, + "learning_rate": 0.0001957880248120047, + "loss": 0.0181, "step": 268020 }, { - "epoch": 1.35, - "learning_rate": 9.716312414548133e-05, - "loss": 0.0069, + "epoch": 0.69, + "learning_rate": 0.00019578413659563328, + "loss": 0.0145, "step": 268030 }, { - "epoch": 1.35, - "learning_rate": 9.71555564524673e-05, - "loss": 0.0067, + "epoch": 0.69, + "learning_rate": 0.0001957802483792618, + "loss": 0.014, "step": 268040 }, { - "epoch": 1.35, - "learning_rate": 9.71479887594533e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019577636016289033, + "loss": 0.0144, "step": 268050 }, { - "epoch": 1.35, - "learning_rate": 9.714042106643928e-05, - "loss": 0.0094, + "epoch": 0.69, + "learning_rate": 0.00019577247194651885, + "loss": 0.0139, "step": 268060 }, { - "epoch": 1.35, - "learning_rate": 9.713285337342527e-05, - "loss": 0.0093, + "epoch": 0.69, + "learning_rate": 0.00019576858373014742, + "loss": 0.0176, "step": 268070 }, { - "epoch": 1.35, - "learning_rate": 9.712528568041127e-05, - "loss": 0.009, + "epoch": 0.69, + "learning_rate": 0.00019576469551377593, + "loss": 0.0154, "step": 268080 }, { - "epoch": 1.35, - "learning_rate": 9.711771798739725e-05, - "loss": 0.0085, + "epoch": 0.69, + "learning_rate": 0.00019576080729740447, + "loss": 0.0175, "step": 268090 }, { - "epoch": 1.35, - "learning_rate": 9.711015029438325e-05, - "loss": 0.006, + "epoch": 0.69, + "learning_rate": 0.000195756919081033, + "loss": 0.0138, "step": 268100 }, { - "epoch": 1.35, - "learning_rate": 9.710258260136923e-05, - "loss": 0.0086, + "epoch": 0.69, + "learning_rate": 0.00019575303086466156, + "loss": 0.0133, "step": 268110 }, { - "epoch": 1.35, - "learning_rate": 9.709501490835522e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019574914264829007, + "loss": 0.0175, "step": 268120 }, { - "epoch": 1.35, - "learning_rate": 9.708744721534122e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.0001957452544319186, + "loss": 0.0146, "step": 268130 }, { - "epoch": 1.35, - "learning_rate": 9.70798795223272e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019574136621554713, + "loss": 0.0132, "step": 268140 }, { - "epoch": 1.35, - "learning_rate": 9.707231182931319e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001957374779991757, + "loss": 0.0173, "step": 268150 }, { - "epoch": 1.35, - "learning_rate": 9.706474413629919e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.0001957335897828042, + "loss": 0.0151, "step": 268160 }, { - "epoch": 1.35, - "learning_rate": 9.705717644328517e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.00019572970156643275, + "loss": 0.0132, "step": 268170 }, { - "epoch": 1.35, - "learning_rate": 9.704960875027116e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.00019572581335006127, + "loss": 0.0154, "step": 268180 }, { - "epoch": 1.35, - "learning_rate": 9.704204105725715e-05, - "loss": 0.011, + "epoch": 0.7, + "learning_rate": 0.00019572192513368983, + "loss": 0.0134, "step": 268190 }, { - "epoch": 1.35, - "learning_rate": 9.703447336424314e-05, - "loss": 0.0117, + "epoch": 0.7, + "learning_rate": 0.00019571803691731838, + "loss": 0.0151, "step": 268200 }, { - "epoch": 1.35, - "learning_rate": 9.702690567122914e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.0001957141487009469, + "loss": 0.0155, "step": 268210 }, { - "epoch": 1.35, - "learning_rate": 9.701933797821512e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019571026048457543, + "loss": 0.016, "step": 268220 }, { - "epoch": 1.35, - "learning_rate": 9.701177028520111e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019570637226820395, + "loss": 0.0128, "step": 268230 }, { - "epoch": 1.35, - "learning_rate": 9.700420259218711e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.00019570248405183252, + "loss": 0.0103, "step": 268240 }, { - "epoch": 1.35, - "learning_rate": 9.699663489917309e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019569859583546103, + "loss": 0.0144, "step": 268250 }, { - "epoch": 1.35, - "learning_rate": 9.698906720615908e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019569470761908957, + "loss": 0.0193, "step": 268260 }, { - "epoch": 1.35, - "learning_rate": 9.698149951314508e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.0001956908194027181, + "loss": 0.0183, "step": 268270 }, { - "epoch": 1.35, - "learning_rate": 9.697393182013106e-05, - "loss": 0.0108, + "epoch": 0.7, + "learning_rate": 0.00019568693118634666, + "loss": 0.0139, "step": 268280 }, { - "epoch": 1.35, - "learning_rate": 9.696636412711706e-05, - "loss": 0.0059, + "epoch": 0.7, + "learning_rate": 0.00019568304296997517, + "loss": 0.0102, "step": 268290 }, { - "epoch": 1.35, - "learning_rate": 9.695879643410304e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.0001956791547536037, + "loss": 0.0141, "step": 268300 }, { - "epoch": 1.35, - "learning_rate": 9.695122874108903e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019567526653723223, + "loss": 0.0133, "step": 268310 }, { - "epoch": 1.35, - "learning_rate": 9.694366104807503e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.0001956713783208608, + "loss": 0.0138, "step": 268320 }, { - "epoch": 1.35, - "learning_rate": 9.693609335506101e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.0001956674901044893, + "loss": 0.0157, "step": 268330 }, { - "epoch": 1.35, - "learning_rate": 9.6928525662047e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019566360188811785, + "loss": 0.0136, "step": 268340 }, { - "epoch": 1.35, - "learning_rate": 9.6920957969033e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019565971367174637, + "loss": 0.0157, "step": 268350 }, { - "epoch": 1.35, - "learning_rate": 9.691339027601898e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019565582545537493, + "loss": 0.0142, "step": 268360 }, { - "epoch": 1.35, - "learning_rate": 9.690582258300497e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.00019565193723900348, + "loss": 0.0146, "step": 268370 }, { - "epoch": 1.35, - "learning_rate": 9.689825488999096e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.000195648049022632, + "loss": 0.0161, "step": 268380 }, { - "epoch": 1.35, - "learning_rate": 9.689068719697695e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019564416080626053, + "loss": 0.0153, "step": 268390 }, { - "epoch": 1.35, - "learning_rate": 9.688311950396295e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019564027258988907, + "loss": 0.0152, "step": 268400 }, { - "epoch": 1.35, - "learning_rate": 9.687555181094893e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019563638437351762, + "loss": 0.0155, "step": 268410 }, { - "epoch": 1.35, - "learning_rate": 9.686798411793492e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019563249615714613, + "loss": 0.0123, "step": 268420 }, { - "epoch": 1.35, - "learning_rate": 9.686041642492092e-05, - "loss": 0.0054, + "epoch": 0.7, + "learning_rate": 0.00019562860794077467, + "loss": 0.0167, "step": 268430 }, { - "epoch": 1.35, - "learning_rate": 9.68528487319069e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001956247197244032, + "loss": 0.0167, "step": 268440 }, { - "epoch": 1.35, - "learning_rate": 9.68452810388929e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.00019562083150803175, + "loss": 0.0144, "step": 268450 }, { - "epoch": 1.35, - "learning_rate": 9.683771334587888e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019561694329166027, + "loss": 0.0118, "step": 268460 }, { - "epoch": 1.35, - "learning_rate": 9.683014565286487e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.0001956130550752888, + "loss": 0.0112, "step": 268470 }, { - "epoch": 1.35, - "learning_rate": 9.682257795985087e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019560916685891733, + "loss": 0.0139, "step": 268480 }, { - "epoch": 1.35, - "learning_rate": 9.681501026683685e-05, - "loss": 0.0107, + "epoch": 0.7, + "learning_rate": 0.0001956052786425459, + "loss": 0.0155, "step": 268490 }, { - "epoch": 1.35, - "learning_rate": 9.680744257382284e-05, - "loss": 0.0106, + "epoch": 0.7, + "learning_rate": 0.0001956013904261744, + "loss": 0.0129, "step": 268500 }, { - "epoch": 1.35, - "learning_rate": 9.679987488080884e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019559750220980295, + "loss": 0.0145, "step": 268510 }, { - "epoch": 1.35, - "learning_rate": 9.679230718779482e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019559361399343146, + "loss": 0.0151, "step": 268520 }, { - "epoch": 1.35, - "learning_rate": 9.678473949478081e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019558972577706003, + "loss": 0.0156, "step": 268530 }, { - "epoch": 1.35, - "learning_rate": 9.67771718017668e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019558583756068858, + "loss": 0.0142, "step": 268540 }, { - "epoch": 1.35, - "learning_rate": 9.676960410875279e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.0001955819493443171, + "loss": 0.0176, "step": 268550 }, { - "epoch": 1.35, - "learning_rate": 9.676203641573878e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001955780611279456, + "loss": 0.0199, "step": 268560 }, { - "epoch": 1.35, - "learning_rate": 9.675446872272477e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019557417291157417, + "loss": 0.0171, "step": 268570 }, { - "epoch": 1.36, - "learning_rate": 9.674690102971076e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019557028469520271, + "loss": 0.0151, "step": 268580 }, { - "epoch": 1.36, - "learning_rate": 9.673933333669676e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019556639647883123, + "loss": 0.0167, "step": 268590 }, { - "epoch": 1.36, - "learning_rate": 9.673176564368274e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019556250826245977, + "loss": 0.0154, "step": 268600 }, { - "epoch": 1.36, - "learning_rate": 9.672419795066873e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.0001955586200460883, + "loss": 0.0139, "step": 268610 }, { - "epoch": 1.36, - "learning_rate": 9.671663025765471e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019555473182971685, + "loss": 0.0149, "step": 268620 }, { - "epoch": 1.36, - "learning_rate": 9.670906256464071e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019555084361334537, + "loss": 0.016, "step": 268630 }, { - "epoch": 1.36, - "learning_rate": 9.67014948716267e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.0001955469553969739, + "loss": 0.015, "step": 268640 }, { - "epoch": 1.36, - "learning_rate": 9.669392717861269e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019554306718060245, + "loss": 0.0168, "step": 268650 }, { - "epoch": 1.36, - "learning_rate": 9.668635948559867e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.000195539178964231, + "loss": 0.015, "step": 268660 }, { - "epoch": 1.36, - "learning_rate": 9.667879179258465e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001955352907478595, + "loss": 0.0174, "step": 268670 }, { - "epoch": 1.36, - "learning_rate": 9.667122409957064e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019553140253148805, + "loss": 0.0138, "step": 268680 }, { - "epoch": 1.36, - "learning_rate": 9.666365640655664e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019552751431511662, + "loss": 0.0107, "step": 268690 }, { - "epoch": 1.36, - "learning_rate": 9.665608871354262e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.00019552362609874513, + "loss": 0.0176, "step": 268700 }, { - "epoch": 1.36, - "learning_rate": 9.664852102052861e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019551973788237367, + "loss": 0.0129, "step": 268710 }, { - "epoch": 1.36, - "learning_rate": 9.664095332751461e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.0001955158496660022, + "loss": 0.0197, "step": 268720 }, { - "epoch": 1.36, - "learning_rate": 9.663338563450059e-05, - "loss": 0.0059, + "epoch": 0.7, + "learning_rate": 0.0001955119614496307, + "loss": 0.0179, "step": 268730 }, { - "epoch": 1.36, - "learning_rate": 9.662581794148659e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019550807323325927, + "loss": 0.0131, "step": 268740 }, { - "epoch": 1.36, - "learning_rate": 9.661825024847257e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019550418501688781, + "loss": 0.0128, "step": 268750 }, { - "epoch": 1.36, - "learning_rate": 9.661068255545856e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019550029680051633, + "loss": 0.0141, "step": 268760 }, { - "epoch": 1.36, - "learning_rate": 9.660311486244456e-05, - "loss": 0.0121, + "epoch": 0.7, + "learning_rate": 0.00019549640858414487, + "loss": 0.0146, "step": 268770 }, { - "epoch": 1.36, - "learning_rate": 9.659554716943054e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.0001954925203677734, + "loss": 0.0217, "step": 268780 }, { - "epoch": 1.36, - "learning_rate": 9.658797947641653e-05, - "loss": 0.0057, + "epoch": 0.7, + "learning_rate": 0.00019548863215140195, + "loss": 0.0112, "step": 268790 }, { - "epoch": 1.36, - "learning_rate": 9.658041178340253e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.00019548474393503047, + "loss": 0.0181, "step": 268800 }, { - "epoch": 1.36, - "learning_rate": 9.657284409038851e-05, - "loss": 0.012, + "epoch": 0.7, + "learning_rate": 0.000195480855718659, + "loss": 0.0163, "step": 268810 }, { - "epoch": 1.36, - "learning_rate": 9.65652763973745e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.00019547696750228755, + "loss": 0.0158, "step": 268820 }, { - "epoch": 1.36, - "learning_rate": 9.655770870436049e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.0001954730792859161, + "loss": 0.0157, "step": 268830 }, { - "epoch": 1.36, - "learning_rate": 9.655014101134648e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.0001954691910695446, + "loss": 0.012, "step": 268840 }, { - "epoch": 1.36, - "learning_rate": 9.654257331833248e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019546530285317315, + "loss": 0.0146, "step": 268850 }, { - "epoch": 1.36, - "learning_rate": 9.653500562531846e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019546141463680172, + "loss": 0.0167, "step": 268860 }, { - "epoch": 1.36, - "learning_rate": 9.652743793230445e-05, - "loss": 0.0055, + "epoch": 0.7, + "learning_rate": 0.00019545752642043023, + "loss": 0.017, "step": 268870 }, { - "epoch": 1.36, - "learning_rate": 9.651987023929045e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019545363820405875, + "loss": 0.0158, "step": 268880 }, { - "epoch": 1.36, - "learning_rate": 9.651230254627643e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.0001954497499876873, + "loss": 0.0139, "step": 268890 }, { - "epoch": 1.36, - "learning_rate": 9.650473485326242e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019544586177131586, + "loss": 0.0159, "step": 268900 }, { - "epoch": 1.36, - "learning_rate": 9.64971671602484e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019544197355494437, + "loss": 0.0148, "step": 268910 }, { - "epoch": 1.36, - "learning_rate": 9.64895994672344e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001954380853385729, + "loss": 0.0157, "step": 268920 }, { - "epoch": 1.36, - "learning_rate": 9.64820317742204e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019543419712220143, + "loss": 0.0162, "step": 268930 }, { - "epoch": 1.36, - "learning_rate": 9.647446408120638e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019543030890583, + "loss": 0.0192, "step": 268940 }, { - "epoch": 1.36, - "learning_rate": 9.646689638819237e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.0001954264206894585, + "loss": 0.0178, "step": 268950 }, { - "epoch": 1.36, - "learning_rate": 9.645932869517837e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019542253247308705, + "loss": 0.0174, "step": 268960 }, { - "epoch": 1.36, - "learning_rate": 9.645176100216435e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019541864425671557, + "loss": 0.0147, "step": 268970 }, { - "epoch": 1.36, - "learning_rate": 9.644419330915034e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001954147560403441, + "loss": 0.0141, "step": 268980 }, { - "epoch": 1.36, - "learning_rate": 9.643662561613633e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019541086782397265, + "loss": 0.0178, "step": 268990 }, { - "epoch": 1.36, - "learning_rate": 9.642905792312232e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001954069796076012, + "loss": 0.0127, "step": 269000 }, { - "epoch": 1.36, - "eval_cer": 0.9144071801550111, - "eval_loss": 0.006098465994000435, - "eval_runtime": 116.3578, - "eval_samples_per_second": 17.188, - "eval_steps_per_second": 4.297, + "epoch": 0.7, + "eval_cer": 0.8817418761573248, + "eval_loss": 0.010232596658170223, + "eval_runtime": 108.1138, + "eval_samples_per_second": 18.499, + "eval_steps_per_second": 4.625, "step": 269000 }, { - "epoch": 1.36, - "learning_rate": 9.642149023010832e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.0001954030913912297, + "loss": 0.0133, "step": 269010 }, { - "epoch": 1.36, - "learning_rate": 9.64139225370943e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019539920317485825, + "loss": 0.0184, "step": 269020 }, { - "epoch": 1.36, - "learning_rate": 9.640635484408029e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019539531495848682, + "loss": 0.016, "step": 269030 }, { - "epoch": 1.36, - "learning_rate": 9.639878715106629e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019539142674211533, + "loss": 0.0139, "step": 269040 }, { - "epoch": 1.36, - "learning_rate": 9.639121945805227e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019538753852574385, + "loss": 0.0158, "step": 269050 }, { - "epoch": 1.36, - "learning_rate": 9.638365176503826e-05, - "loss": 0.0061, + "epoch": 0.7, + "learning_rate": 0.0001953836503093724, + "loss": 0.0153, "step": 269060 }, { - "epoch": 1.36, - "learning_rate": 9.637608407202424e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.00019537976209300096, + "loss": 0.0145, "step": 269070 }, { - "epoch": 1.36, - "learning_rate": 9.636851637901024e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019537587387662947, + "loss": 0.0131, "step": 269080 }, { - "epoch": 1.36, - "learning_rate": 9.636094868599623e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.000195371985660258, + "loss": 0.0134, "step": 269090 }, { - "epoch": 1.36, - "learning_rate": 9.635338099298222e-05, - "loss": 0.0059, + "epoch": 0.7, + "learning_rate": 0.00019536809744388653, + "loss": 0.0159, "step": 269100 }, { - "epoch": 1.36, - "learning_rate": 9.634581329996821e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.0001953642092275151, + "loss": 0.0155, "step": 269110 }, { - "epoch": 1.36, - "learning_rate": 9.63382456069542e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001953603210111436, + "loss": 0.0173, "step": 269120 }, { - "epoch": 1.36, - "learning_rate": 9.633067791394019e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019535643279477215, + "loss": 0.0169, "step": 269130 }, { - "epoch": 1.36, - "learning_rate": 9.632311022092618e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019535254457840067, + "loss": 0.0171, "step": 269140 }, { - "epoch": 1.36, - "learning_rate": 9.631554252791216e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019534865636202924, + "loss": 0.0134, "step": 269150 }, { - "epoch": 1.36, - "learning_rate": 9.630797483489816e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019534476814565775, + "loss": 0.0146, "step": 269160 }, { - "epoch": 1.36, - "learning_rate": 9.630040714188415e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.0001953408799292863, + "loss": 0.014, "step": 269170 }, { - "epoch": 1.36, - "learning_rate": 9.629283944887014e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.0001953369917129148, + "loss": 0.0152, "step": 269180 }, { - "epoch": 1.36, - "learning_rate": 9.628527175585613e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019533310349654338, + "loss": 0.0154, "step": 269190 }, { - "epoch": 1.36, - "learning_rate": 9.627770406284213e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.0001953292152801719, + "loss": 0.0151, "step": 269200 }, { - "epoch": 1.36, - "learning_rate": 9.627013636982811e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019532532706380043, + "loss": 0.0173, "step": 269210 }, { - "epoch": 1.36, - "learning_rate": 9.62625686768141e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019532143884742895, + "loss": 0.014, "step": 269220 }, { - "epoch": 1.36, - "learning_rate": 9.625500098380008e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.0001953175506310575, + "loss": 0.014, "step": 269230 }, { - "epoch": 1.36, - "learning_rate": 9.624743329078608e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019531366241468606, + "loss": 0.0124, "step": 269240 }, { - "epoch": 1.36, - "learning_rate": 9.623986559777207e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.00019530977419831457, + "loss": 0.0126, "step": 269250 }, { - "epoch": 1.36, - "learning_rate": 9.623229790475805e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.0001953058859819431, + "loss": 0.0174, "step": 269260 }, { - "epoch": 1.36, - "learning_rate": 9.622473021174405e-05, - "loss": 0.0118, + "epoch": 0.7, + "learning_rate": 0.00019530199776557163, + "loss": 0.0176, "step": 269270 }, { - "epoch": 1.36, - "learning_rate": 9.621716251873004e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001952981095492002, + "loss": 0.0158, "step": 269280 }, { - "epoch": 1.36, - "learning_rate": 9.620959482571601e-05, - "loss": 0.0121, + "epoch": 0.7, + "learning_rate": 0.0001952942213328287, + "loss": 0.0127, "step": 269290 }, { - "epoch": 1.36, - "learning_rate": 9.620202713270201e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019529033311645725, + "loss": 0.0211, "step": 269300 }, { - "epoch": 1.36, - "learning_rate": 9.619445943968799e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019528644490008577, + "loss": 0.0151, "step": 269310 }, { - "epoch": 1.36, - "learning_rate": 9.618689174667398e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019528255668371434, + "loss": 0.0141, "step": 269320 }, { - "epoch": 1.36, - "learning_rate": 9.617932405365998e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.00019527866846734285, + "loss": 0.0159, "step": 269330 }, { - "epoch": 1.36, - "learning_rate": 9.617175636064596e-05, - "loss": 0.0132, + "epoch": 0.7, + "learning_rate": 0.0001952747802509714, + "loss": 0.0138, "step": 269340 }, { - "epoch": 1.36, - "learning_rate": 9.616418866763196e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.0001952708920345999, + "loss": 0.0126, "step": 269350 }, { - "epoch": 1.36, - "learning_rate": 9.615662097461794e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019526700381822847, + "loss": 0.0158, "step": 269360 }, { - "epoch": 1.36, - "learning_rate": 9.614905328160393e-05, - "loss": 0.0111, + "epoch": 0.7, + "learning_rate": 0.000195263115601857, + "loss": 0.0171, "step": 269370 }, { - "epoch": 1.36, - "learning_rate": 9.614148558858993e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019525922738548553, + "loss": 0.0123, "step": 269380 }, { - "epoch": 1.36, - "learning_rate": 9.613391789557591e-05, - "loss": 0.0058, + "epoch": 0.7, + "learning_rate": 0.00019525533916911405, + "loss": 0.0129, "step": 269390 }, { - "epoch": 1.36, - "learning_rate": 9.61263502025619e-05, - "loss": 0.0119, + "epoch": 0.7, + "learning_rate": 0.00019525145095274261, + "loss": 0.0177, "step": 269400 }, { - "epoch": 1.36, - "learning_rate": 9.61187825095479e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019524756273637116, + "loss": 0.0161, "step": 269410 }, { - "epoch": 1.36, - "learning_rate": 9.611121481653388e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.00019524367451999967, + "loss": 0.0205, "step": 269420 }, { - "epoch": 1.36, - "learning_rate": 9.610364712351987e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.0001952397863036282, + "loss": 0.0169, "step": 269430 }, { - "epoch": 1.36, - "learning_rate": 9.609607943050586e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019523589808725675, + "loss": 0.0184, "step": 269440 }, { - "epoch": 1.36, - "learning_rate": 9.608851173749185e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001952320098708853, + "loss": 0.0129, "step": 269450 }, { - "epoch": 1.36, - "learning_rate": 9.608094404447785e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.0001952281216545138, + "loss": 0.0149, "step": 269460 }, { - "epoch": 1.36, - "learning_rate": 9.607337635146383e-05, - "loss": 0.0076, - "step": 269470 + "epoch": 0.7, + "learning_rate": 0.00019522423343814235, + "loss": 0.0183, + "step": 269470 }, { - "epoch": 1.36, - "learning_rate": 9.606580865844982e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.00019522034522177087, + "loss": 0.0154, "step": 269480 }, { - "epoch": 1.36, - "learning_rate": 9.605824096543582e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.00019521645700539943, + "loss": 0.0142, "step": 269490 }, { - "epoch": 1.36, - "learning_rate": 9.60506732724218e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019521256878902795, + "loss": 0.0157, "step": 269500 }, { - "epoch": 1.36, - "learning_rate": 9.60431055794078e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001952086805726565, + "loss": 0.0151, "step": 269510 }, { - "epoch": 1.36, - "learning_rate": 9.603553788639378e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.000195204792356285, + "loss": 0.0124, "step": 269520 }, { - "epoch": 1.36, - "learning_rate": 9.602797019337977e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019520090413991357, + "loss": 0.0154, "step": 269530 }, { - "epoch": 1.36, - "learning_rate": 9.602040250036577e-05, - "loss": 0.0061, + "epoch": 0.7, + "learning_rate": 0.0001951970159235421, + "loss": 0.0152, "step": 269540 }, { - "epoch": 1.36, - "learning_rate": 9.601283480735175e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019519312770717063, + "loss": 0.0163, "step": 269550 }, { - "epoch": 1.36, - "learning_rate": 9.600526711433774e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019518923949079914, + "loss": 0.0193, "step": 269560 }, { - "epoch": 1.36, - "learning_rate": 9.599769942132374e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001951853512744277, + "loss": 0.0143, "step": 269570 }, { - "epoch": 1.36, - "learning_rate": 9.599013172830972e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019518146305805626, + "loss": 0.0138, "step": 269580 }, { - "epoch": 1.36, - "learning_rate": 9.598256403529571e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019517757484168477, + "loss": 0.0186, "step": 269590 }, { - "epoch": 1.36, - "learning_rate": 9.59749963422817e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.00019517368662531328, + "loss": 0.0105, "step": 269600 }, { - "epoch": 1.36, - "learning_rate": 9.596742864926769e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019516979840894185, + "loss": 0.0141, "step": 269610 }, { - "epoch": 1.36, - "learning_rate": 9.595986095625368e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.0001951659101925704, + "loss": 0.0155, "step": 269620 }, { - "epoch": 1.36, - "learning_rate": 9.595229326323967e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.0001951620219761989, + "loss": 0.0161, "step": 269630 }, { - "epoch": 1.36, - "learning_rate": 9.594472557022566e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019515813375982745, + "loss": 0.0126, "step": 269640 }, { - "epoch": 1.36, - "learning_rate": 9.593715787721166e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.000195154245543456, + "loss": 0.0135, "step": 269650 }, { - "epoch": 1.36, - "learning_rate": 9.592959018419764e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019515035732708453, + "loss": 0.0175, "step": 269660 }, { - "epoch": 1.36, - "learning_rate": 9.592202249118363e-05, - "loss": 0.0098, + "epoch": 0.7, + "learning_rate": 0.00019514646911071305, + "loss": 0.0149, "step": 269670 }, { - "epoch": 1.36, - "learning_rate": 9.591445479816961e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.0001951425808943416, + "loss": 0.0154, "step": 269680 }, { - "epoch": 1.36, - "learning_rate": 9.590688710515561e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019513869267797013, + "loss": 0.016, "step": 269690 }, { - "epoch": 1.36, - "learning_rate": 9.58993194121416e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019513480446159867, + "loss": 0.0176, "step": 269700 }, { - "epoch": 1.36, - "learning_rate": 9.589175171912759e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.0001951309162452272, + "loss": 0.0147, "step": 269710 }, { - "epoch": 1.36, - "learning_rate": 9.588418402611358e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019512702802885573, + "loss": 0.0155, "step": 269720 }, { - "epoch": 1.36, - "learning_rate": 9.587661633309958e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019512313981248424, + "loss": 0.0141, "step": 269730 }, { - "epoch": 1.36, - "learning_rate": 9.586904864008556e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001951192515961128, + "loss": 0.0167, "step": 269740 }, { - "epoch": 1.36, - "learning_rate": 9.586148094707155e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019511536337974133, + "loss": 0.0209, "step": 269750 }, { - "epoch": 1.36, - "learning_rate": 9.585391325405755e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.00019511147516336987, + "loss": 0.0154, "step": 269760 }, { - "epoch": 1.36, - "learning_rate": 9.584634556104353e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019510758694699838, + "loss": 0.0157, "step": 269770 }, { - "epoch": 1.36, - "learning_rate": 9.583877786802952e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019510369873062695, + "loss": 0.0163, "step": 269780 }, { - "epoch": 1.36, - "learning_rate": 9.58312101750155e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001950998105142555, + "loss": 0.0158, "step": 269790 }, { - "epoch": 1.36, - "learning_rate": 9.58236424820015e-05, - "loss": 0.0103, + "epoch": 0.7, + "learning_rate": 0.000195095922297884, + "loss": 0.0166, "step": 269800 }, { - "epoch": 1.36, - "learning_rate": 9.58160747889875e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019509203408151255, + "loss": 0.0159, "step": 269810 }, { - "epoch": 1.36, - "learning_rate": 9.580850709597348e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.0001950881458651411, + "loss": 0.0152, "step": 269820 }, { - "epoch": 1.36, - "learning_rate": 9.580093940295947e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019508425764876963, + "loss": 0.0148, "step": 269830 }, { - "epoch": 1.36, - "learning_rate": 9.579337170994547e-05, - "loss": 0.0057, + "epoch": 0.7, + "learning_rate": 0.00019508036943239815, + "loss": 0.0166, "step": 269840 }, { - "epoch": 1.36, - "learning_rate": 9.578580401693145e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.0001950764812160267, + "loss": 0.015, "step": 269850 }, { - "epoch": 1.36, - "learning_rate": 9.577823632391744e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019507259299965523, + "loss": 0.017, "step": 269860 }, { - "epoch": 1.36, - "learning_rate": 9.577066863090342e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019506870478328377, + "loss": 0.017, "step": 269870 }, { - "epoch": 1.36, - "learning_rate": 9.576310093788942e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.0001950648165669123, + "loss": 0.0126, "step": 269880 }, { - "epoch": 1.36, - "learning_rate": 9.575553324487541e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019506092835054083, + "loss": 0.0188, "step": 269890 }, { - "epoch": 1.36, - "learning_rate": 9.57479655518614e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001950570401341694, + "loss": 0.0189, "step": 269900 }, { - "epoch": 1.36, - "learning_rate": 9.574039785884739e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001950531519177979, + "loss": 0.0135, "step": 269910 }, { - "epoch": 1.36, - "learning_rate": 9.573283016583336e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019504926370142643, + "loss": 0.0147, "step": 269920 }, { - "epoch": 1.36, - "learning_rate": 9.572526247281935e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019504537548505497, + "loss": 0.0176, "step": 269930 }, { - "epoch": 1.36, - "learning_rate": 9.571769477980535e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019504148726868354, + "loss": 0.0187, "step": 269940 }, { - "epoch": 1.36, - "learning_rate": 9.571012708679133e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019503759905231205, + "loss": 0.0167, "step": 269950 }, { - "epoch": 1.36, - "learning_rate": 9.570255939377733e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001950337108359406, + "loss": 0.0158, "step": 269960 }, { - "epoch": 1.36, - "learning_rate": 9.56949917007633e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001950298226195691, + "loss": 0.0152, "step": 269970 }, { - "epoch": 1.36, - "learning_rate": 9.56874240077493e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019502593440319765, + "loss": 0.0167, "step": 269980 }, { - "epoch": 1.36, - "learning_rate": 9.56798563147353e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.0001950220461868262, + "loss": 0.0138, "step": 269990 }, { - "epoch": 1.36, - "learning_rate": 9.567228862172128e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019501815797045473, + "loss": 0.014, "step": 270000 }, { - "epoch": 1.36, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.006005189847201109, - "eval_runtime": 116.1544, - "eval_samples_per_second": 17.218, - "eval_steps_per_second": 4.305, + "epoch": 0.7, + "eval_cer": 0.8817250805141147, + "eval_loss": 0.00999659113585949, + "eval_runtime": 107.9657, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, "step": 270000 }, { - "epoch": 1.36, - "learning_rate": 9.566472092870727e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019501426975408325, + "loss": 0.0118, "step": 270010 }, { - "epoch": 1.36, - "learning_rate": 9.565715323569327e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.0001950103815377118, + "loss": 0.0143, "step": 270020 }, { - "epoch": 1.36, - "learning_rate": 9.564958554267925e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019500649332134033, + "loss": 0.0168, "step": 270030 }, { - "epoch": 1.36, - "learning_rate": 9.564201784966524e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019500260510496887, + "loss": 0.0168, "step": 270040 }, { - "epoch": 1.36, - "learning_rate": 9.563445015665123e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001949987168885974, + "loss": 0.0142, "step": 270050 }, { - "epoch": 1.36, - "learning_rate": 9.562688246363722e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019499482867222593, + "loss": 0.0156, "step": 270060 }, { - "epoch": 1.36, - "learning_rate": 9.561931477062322e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019499094045585447, + "loss": 0.02, "step": 270070 }, { - "epoch": 1.36, - "learning_rate": 9.56117470776092e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.000194987052239483, + "loss": 0.0148, "step": 270080 }, { - "epoch": 1.36, - "learning_rate": 9.560417938459519e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.00019498316402311153, + "loss": 0.0167, "step": 270090 }, { - "epoch": 1.36, - "learning_rate": 9.559661169158119e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.00019497927580674007, + "loss": 0.0145, "step": 270100 }, { - "epoch": 1.36, - "learning_rate": 9.558904399856717e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019497538759036864, + "loss": 0.0151, "step": 270110 }, { - "epoch": 1.36, - "learning_rate": 9.558147630555316e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019497149937399715, + "loss": 0.0138, "step": 270120 }, { - "epoch": 1.36, - "learning_rate": 9.557390861253915e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.0001949676111576257, + "loss": 0.0157, "step": 270130 }, { - "epoch": 1.36, - "learning_rate": 9.556634091952514e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.0001949637229412542, + "loss": 0.0143, "step": 270140 }, { - "epoch": 1.36, - "learning_rate": 9.555877322651114e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019495983472488278, + "loss": 0.0116, "step": 270150 }, { - "epoch": 1.36, - "learning_rate": 9.555120553349712e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.0001949559465085113, + "loss": 0.015, "step": 270160 }, { - "epoch": 1.36, - "learning_rate": 9.554363784048311e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019495205829213983, + "loss": 0.0156, "step": 270170 }, { - "epoch": 1.36, - "learning_rate": 9.55360701474691e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.00019494817007576835, + "loss": 0.0124, "step": 270180 }, { - "epoch": 1.36, - "learning_rate": 9.552850245445509e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001949442818593969, + "loss": 0.022, "step": 270190 }, { - "epoch": 1.36, - "learning_rate": 9.552093476144108e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.00019494039364302543, + "loss": 0.015, "step": 270200 }, { - "epoch": 1.36, - "learning_rate": 9.551336706842708e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019493650542665397, + "loss": 0.0175, "step": 270210 }, { - "epoch": 1.36, - "learning_rate": 9.550579937541306e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019493261721028249, + "loss": 0.0257, "step": 270220 }, { - "epoch": 1.36, - "learning_rate": 9.549823168239905e-05, - "loss": 0.0057, + "epoch": 0.7, + "learning_rate": 0.00019492872899391103, + "loss": 0.0165, "step": 270230 }, { - "epoch": 1.36, - "learning_rate": 9.549066398938504e-05, - "loss": 0.0102, + "epoch": 0.7, + "learning_rate": 0.00019492484077753957, + "loss": 0.0175, "step": 270240 }, { - "epoch": 1.36, - "learning_rate": 9.548309629637103e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.0001949209525611681, + "loss": 0.0141, "step": 270250 }, { - "epoch": 1.36, - "learning_rate": 9.547552860335703e-05, - "loss": 0.0056, + "epoch": 0.7, + "learning_rate": 0.00019491706434479663, + "loss": 0.0137, "step": 270260 }, { - "epoch": 1.36, - "learning_rate": 9.546796091034301e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.00019491317612842517, + "loss": 0.014, "step": 270270 }, { - "epoch": 1.36, - "learning_rate": 9.5460393217329e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019490928791205374, + "loss": 0.0172, "step": 270280 }, { - "epoch": 1.36, - "learning_rate": 9.5452825524315e-05, - "loss": 0.0137, + "epoch": 0.7, + "learning_rate": 0.00019490539969568225, + "loss": 0.0156, "step": 270290 }, { - "epoch": 1.36, - "learning_rate": 9.544525783130098e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.0001949015114793108, + "loss": 0.0121, "step": 270300 }, { - "epoch": 1.36, - "learning_rate": 9.543769013828697e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.0001948976232629393, + "loss": 0.0115, "step": 270310 }, { - "epoch": 1.36, - "learning_rate": 9.543012244527296e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019489373504656788, + "loss": 0.0164, "step": 270320 }, { - "epoch": 1.36, - "learning_rate": 9.542255475225895e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.0001948898468301964, + "loss": 0.0182, "step": 270330 }, { - "epoch": 1.36, - "learning_rate": 9.541498705924495e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019488595861382493, + "loss": 0.0125, "step": 270340 }, { - "epoch": 1.36, - "learning_rate": 9.540741936623093e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019488207039745345, + "loss": 0.0149, "step": 270350 }, { - "epoch": 1.36, - "learning_rate": 9.539985167321692e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019487818218108201, + "loss": 0.0162, "step": 270360 }, { - "epoch": 1.36, - "learning_rate": 9.539228398020292e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019487429396471053, + "loss": 0.0171, "step": 270370 }, { - "epoch": 1.36, - "learning_rate": 9.53847162871889e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019487040574833907, + "loss": 0.0151, "step": 270380 }, { - "epoch": 1.36, - "learning_rate": 9.537714859417489e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019486651753196759, + "loss": 0.016, "step": 270390 }, { - "epoch": 1.36, - "learning_rate": 9.536958090116087e-05, - "loss": 0.0054, + "epoch": 0.7, + "learning_rate": 0.00019486262931559615, + "loss": 0.0143, "step": 270400 }, { - "epoch": 1.36, - "learning_rate": 9.536201320814687e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019485874109922467, + "loss": 0.0139, "step": 270410 }, { - "epoch": 1.36, - "learning_rate": 9.535444551513286e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001948548528828532, + "loss": 0.0167, "step": 270420 }, { - "epoch": 1.36, - "learning_rate": 9.534687782211885e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019485096466648173, + "loss": 0.0112, "step": 270430 }, { - "epoch": 1.36, - "learning_rate": 9.533931012910484e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019484707645011027, + "loss": 0.0151, "step": 270440 }, { - "epoch": 1.36, - "learning_rate": 9.533174243609084e-05, - "loss": 0.0108, + "epoch": 0.7, + "learning_rate": 0.00019484318823373884, + "loss": 0.0316, "step": 270450 }, { - "epoch": 1.36, - "learning_rate": 9.532417474307682e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019483930001736735, + "loss": 0.0137, "step": 270460 }, { - "epoch": 1.36, - "learning_rate": 9.531660705006281e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019483541180099586, + "loss": 0.0122, "step": 270470 }, { - "epoch": 1.36, - "learning_rate": 9.53090393570488e-05, - "loss": 0.0108, + "epoch": 0.7, + "learning_rate": 0.0001948315235846244, + "loss": 0.0198, "step": 270480 }, { - "epoch": 1.36, - "learning_rate": 9.530147166403479e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019482763536825297, + "loss": 0.0141, "step": 270490 }, { - "epoch": 1.36, - "learning_rate": 9.529390397102078e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.0001948237471518815, + "loss": 0.0144, "step": 270500 }, { - "epoch": 1.36, - "learning_rate": 9.528633627800677e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019481985893551003, + "loss": 0.0176, "step": 270510 }, { - "epoch": 1.36, - "learning_rate": 9.527876858499276e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019481597071913855, + "loss": 0.0158, "step": 270520 }, { - "epoch": 1.36, - "learning_rate": 9.527120089197876e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.00019481208250276711, + "loss": 0.0159, "step": 270530 }, { - "epoch": 1.36, - "learning_rate": 9.526363319896474e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019480819428639563, + "loss": 0.0167, "step": 270540 }, { - "epoch": 1.36, - "learning_rate": 9.525606550595072e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.00019480430607002417, + "loss": 0.0136, "step": 270550 }, { - "epoch": 1.37, - "learning_rate": 9.52484978129367e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019480041785365269, + "loss": 0.0141, "step": 270560 }, { - "epoch": 1.37, - "learning_rate": 9.52409301199227e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019479652963728125, + "loss": 0.0159, "step": 270570 }, { - "epoch": 1.37, - "learning_rate": 9.523336242690868e-05, - "loss": 0.0097, + "epoch": 0.7, + "learning_rate": 0.00019479264142090977, + "loss": 0.016, "step": 270580 }, { - "epoch": 1.37, - "learning_rate": 9.522579473389467e-05, - "loss": 0.0063, + "epoch": 0.7, + "learning_rate": 0.0001947887532045383, + "loss": 0.0197, "step": 270590 }, { - "epoch": 1.37, - "learning_rate": 9.521822704088067e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019478486498816682, + "loss": 0.0139, "step": 270600 }, { - "epoch": 1.37, - "learning_rate": 9.521065934786665e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.0001947809767717954, + "loss": 0.0164, "step": 270610 }, { - "epoch": 1.37, - "learning_rate": 9.520309165485264e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019477708855542393, + "loss": 0.0136, "step": 270620 }, { - "epoch": 1.37, - "learning_rate": 9.519552396183864e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.00019477320033905245, + "loss": 0.0125, "step": 270630 }, { - "epoch": 1.37, - "learning_rate": 9.518795626882462e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019476931212268096, + "loss": 0.0235, "step": 270640 }, { - "epoch": 1.37, - "learning_rate": 9.518038857581061e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.00019476542390630953, + "loss": 0.0144, "step": 270650 }, { - "epoch": 1.37, - "learning_rate": 9.517282088279661e-05, - "loss": 0.0066, + "epoch": 0.7, + "learning_rate": 0.00019476153568993807, + "loss": 0.0123, "step": 270660 }, { - "epoch": 1.37, - "learning_rate": 9.516525318978259e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.0001947576474735666, + "loss": 0.0149, "step": 270670 }, { - "epoch": 1.37, - "learning_rate": 9.515768549676859e-05, - "loss": 0.0133, + "epoch": 0.7, + "learning_rate": 0.00019475375925719513, + "loss": 0.0158, "step": 270680 }, { - "epoch": 1.37, - "learning_rate": 9.515011780375457e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019474987104082364, + "loss": 0.0146, "step": 270690 }, { - "epoch": 1.37, - "learning_rate": 9.514255011074056e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019474598282445221, + "loss": 0.0126, "step": 270700 }, { - "epoch": 1.37, - "learning_rate": 9.513498241772656e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019474209460808073, + "loss": 0.0169, "step": 270710 }, { - "epoch": 1.37, - "learning_rate": 9.512741472471254e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019473820639170927, + "loss": 0.0135, "step": 270720 }, { - "epoch": 1.37, - "learning_rate": 9.511984703169853e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019473431817533778, + "loss": 0.0186, "step": 270730 }, { - "epoch": 1.37, - "learning_rate": 9.511227933868453e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.00019473042995896635, + "loss": 0.0097, "step": 270740 }, { - "epoch": 1.37, - "learning_rate": 9.510471164567051e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019472654174259487, + "loss": 0.0124, "step": 270750 }, { - "epoch": 1.37, - "learning_rate": 9.50971439526565e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001947226535262234, + "loss": 0.0138, "step": 270760 }, { - "epoch": 1.37, - "learning_rate": 9.508957625964249e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019471876530985192, + "loss": 0.0137, "step": 270770 }, { - "epoch": 1.37, - "learning_rate": 9.508200856662848e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.0001947148770934805, + "loss": 0.0182, "step": 270780 }, { - "epoch": 1.37, - "learning_rate": 9.507444087361448e-05, - "loss": 0.0117, + "epoch": 0.7, + "learning_rate": 0.000194710988877109, + "loss": 0.0132, "step": 270790 }, { - "epoch": 1.37, - "learning_rate": 9.506687318060046e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019470710066073755, + "loss": 0.0208, "step": 270800 }, { - "epoch": 1.37, - "learning_rate": 9.505930548758645e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.00019470321244436606, + "loss": 0.017, "step": 270810 }, { - "epoch": 1.37, - "learning_rate": 9.505173779457245e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.00019469932422799463, + "loss": 0.0127, "step": 270820 }, { - "epoch": 1.37, - "learning_rate": 9.504417010155843e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019469543601162317, + "loss": 0.0129, "step": 270830 }, { - "epoch": 1.37, - "learning_rate": 9.503660240854442e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.0001946915477952517, + "loss": 0.0166, "step": 270840 }, { - "epoch": 1.37, - "learning_rate": 9.50290347155304e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019468765957888023, + "loss": 0.0197, "step": 270850 }, { - "epoch": 1.37, - "learning_rate": 9.50214670225164e-05, - "loss": 0.0098, + "epoch": 0.7, + "learning_rate": 0.00019468377136250877, + "loss": 0.0116, "step": 270860 }, { - "epoch": 1.37, - "learning_rate": 9.50138993295024e-05, - "loss": 0.006, + "epoch": 0.7, + "learning_rate": 0.0001946798831461373, + "loss": 0.0154, "step": 270870 }, { - "epoch": 1.37, - "learning_rate": 9.500633163648838e-05, - "loss": 0.0139, + "epoch": 0.7, + "learning_rate": 0.00019467599492976583, + "loss": 0.0144, "step": 270880 }, { - "epoch": 1.37, - "learning_rate": 9.499876394347437e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019467210671339437, + "loss": 0.0125, "step": 270890 }, { - "epoch": 1.37, - "learning_rate": 9.499119625046037e-05, - "loss": 0.0115, + "epoch": 0.7, + "learning_rate": 0.0001946682184970229, + "loss": 0.013, "step": 270900 }, { - "epoch": 1.37, - "learning_rate": 9.498362855744635e-05, - "loss": 0.0098, + "epoch": 0.7, + "learning_rate": 0.00019466433028065145, + "loss": 0.0157, "step": 270910 }, { - "epoch": 1.37, - "learning_rate": 9.497606086443234e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019466044206427997, + "loss": 0.0148, "step": 270920 }, { - "epoch": 1.37, - "learning_rate": 9.496849317141832e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001946565538479085, + "loss": 0.0108, "step": 270930 }, { - "epoch": 1.37, - "learning_rate": 9.496092547840432e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019465266563153702, + "loss": 0.0124, "step": 270940 }, { - "epoch": 1.37, - "learning_rate": 9.495335778539031e-05, - "loss": 0.0098, + "epoch": 0.7, + "learning_rate": 0.0001946487774151656, + "loss": 0.0162, "step": 270950 }, { - "epoch": 1.37, - "learning_rate": 9.49457900923763e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001946448891987941, + "loss": 0.0159, "step": 270960 }, { - "epoch": 1.37, - "learning_rate": 9.493822239936229e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019464100098242265, + "loss": 0.0123, "step": 270970 }, { - "epoch": 1.37, - "learning_rate": 9.493065470634829e-05, - "loss": 0.0089, + "epoch": 0.7, + "learning_rate": 0.00019463711276605116, + "loss": 0.0187, "step": 270980 }, { - "epoch": 1.37, - "learning_rate": 9.492308701333427e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019463322454967973, + "loss": 0.0122, "step": 270990 }, { - "epoch": 1.37, - "learning_rate": 9.491551932032026e-05, - "loss": 0.012, + "epoch": 0.7, + "learning_rate": 0.00019462933633330827, + "loss": 0.0186, "step": 271000 }, { - "epoch": 1.37, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.0061246431432664394, - "eval_runtime": 116.2526, - "eval_samples_per_second": 17.204, - "eval_steps_per_second": 4.301, + "epoch": 0.7, + "eval_cer": 0.8817404765203906, + "eval_loss": 0.01013705413788557, + "eval_runtime": 108.1485, + "eval_samples_per_second": 18.493, + "eval_steps_per_second": 4.623, "step": 271000 }, { - "epoch": 1.37, - "learning_rate": 9.490795162730624e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.0001946254481169368, + "loss": 0.0155, "step": 271010 }, { - "epoch": 1.37, - "learning_rate": 9.490038393429224e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019462155990056533, + "loss": 0.0114, "step": 271020 }, { - "epoch": 1.37, - "learning_rate": 9.489281624127823e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019461767168419387, + "loss": 0.0149, "step": 271030 }, { - "epoch": 1.37, - "learning_rate": 9.488524854826422e-05, - "loss": 0.0078, + "epoch": 0.7, + "learning_rate": 0.0001946137834678224, + "loss": 0.0167, "step": 271040 }, { - "epoch": 1.37, - "learning_rate": 9.487768085525021e-05, - "loss": 0.0111, + "epoch": 0.7, + "learning_rate": 0.00019460989525145093, + "loss": 0.0126, "step": 271050 }, { - "epoch": 1.37, - "learning_rate": 9.48701131622362e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019460600703507947, + "loss": 0.0154, "step": 271060 }, { - "epoch": 1.37, - "learning_rate": 9.486254546922219e-05, - "loss": 0.0117, + "epoch": 0.7, + "learning_rate": 0.000194602118818708, + "loss": 0.0183, "step": 271070 }, { - "epoch": 1.37, - "learning_rate": 9.485497777620818e-05, - "loss": 0.005, + "epoch": 0.7, + "learning_rate": 0.00019459823060233655, + "loss": 0.0123, "step": 271080 }, { - "epoch": 1.37, - "learning_rate": 9.484741008319416e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.00019459434238596507, + "loss": 0.0161, "step": 271090 }, { - "epoch": 1.37, - "learning_rate": 9.483984239018016e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.0001945904541695936, + "loss": 0.0151, "step": 271100 }, { - "epoch": 1.37, - "learning_rate": 9.483227469716615e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019458656595322215, + "loss": 0.0137, "step": 271110 }, { - "epoch": 1.37, - "learning_rate": 9.482470700415213e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001945826777368507, + "loss": 0.0129, "step": 271120 }, { - "epoch": 1.37, - "learning_rate": 9.481713931113813e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001945787895204792, + "loss": 0.0139, "step": 271130 }, { - "epoch": 1.37, - "learning_rate": 9.480957161812412e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.00019457490130410775, + "loss": 0.0144, "step": 271140 }, { - "epoch": 1.37, - "learning_rate": 9.48020039251101e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019457101308773632, + "loss": 0.016, "step": 271150 }, { - "epoch": 1.37, - "learning_rate": 9.47944362320961e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019456712487136483, + "loss": 0.0116, "step": 271160 }, { - "epoch": 1.37, - "learning_rate": 9.478686853908208e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019456323665499337, + "loss": 0.0156, "step": 271170 }, { - "epoch": 1.37, - "learning_rate": 9.477930084606806e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.0001945593484386219, + "loss": 0.0155, "step": 271180 }, { - "epoch": 1.37, - "learning_rate": 9.477173315305406e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.0001945554602222504, + "loss": 0.012, "step": 271190 }, { - "epoch": 1.37, - "learning_rate": 9.476416546004004e-05, - "loss": 0.0092, + "epoch": 0.7, + "learning_rate": 0.00019455157200587897, + "loss": 0.0185, "step": 271200 }, { - "epoch": 1.37, - "learning_rate": 9.475659776702604e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001945476837895075, + "loss": 0.0147, "step": 271210 }, { - "epoch": 1.37, - "learning_rate": 9.474903007401202e-05, - "loss": 0.0113, + "epoch": 0.7, + "learning_rate": 0.00019454379557313603, + "loss": 0.0156, "step": 271220 }, { - "epoch": 1.37, - "learning_rate": 9.474146238099801e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.00019453990735676457, + "loss": 0.0162, "step": 271230 }, { - "epoch": 1.37, - "learning_rate": 9.473389468798401e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.0001945360191403931, + "loss": 0.0117, "step": 271240 }, { - "epoch": 1.37, - "learning_rate": 9.472632699496999e-05, - "loss": 0.0095, + "epoch": 0.7, + "learning_rate": 0.00019453213092402165, + "loss": 0.0164, "step": 271250 }, { - "epoch": 1.37, - "learning_rate": 9.471875930195598e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019452824270765017, + "loss": 0.0129, "step": 271260 }, { - "epoch": 1.37, - "learning_rate": 9.471119160894198e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.0001945243544912787, + "loss": 0.0172, "step": 271270 }, { - "epoch": 1.37, - "learning_rate": 9.470362391592796e-05, - "loss": 0.0114, + "epoch": 0.7, + "learning_rate": 0.00019452046627490725, + "loss": 0.0181, "step": 271280 }, { - "epoch": 1.37, - "learning_rate": 9.469605622291395e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001945165780585358, + "loss": 0.0139, "step": 271290 }, { - "epoch": 1.37, - "learning_rate": 9.468848852989994e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.0001945126898421643, + "loss": 0.0171, "step": 271300 }, { - "epoch": 1.37, - "learning_rate": 9.468092083688593e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019450880162579285, + "loss": 0.0149, "step": 271310 }, { - "epoch": 1.37, - "learning_rate": 9.467335314387193e-05, - "loss": 0.0104, + "epoch": 0.7, + "learning_rate": 0.00019450491340942142, + "loss": 0.0132, "step": 271320 }, { - "epoch": 1.37, - "learning_rate": 9.466578545085791e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019450102519304993, + "loss": 0.0111, "step": 271330 }, { - "epoch": 1.37, - "learning_rate": 9.46582177578439e-05, - "loss": 0.0086, + "epoch": 0.7, + "learning_rate": 0.00019449713697667844, + "loss": 0.0155, "step": 271340 }, { - "epoch": 1.37, - "learning_rate": 9.46506500648299e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.000194493248760307, + "loss": 0.015, "step": 271350 }, { - "epoch": 1.37, - "learning_rate": 9.464308237181588e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019448936054393556, + "loss": 0.012, "step": 271360 }, { - "epoch": 1.37, - "learning_rate": 9.463551467880187e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019448547232756407, + "loss": 0.0198, "step": 271370 }, { - "epoch": 1.37, - "learning_rate": 9.462794698578786e-05, - "loss": 0.0065, + "epoch": 0.7, + "learning_rate": 0.0001944815841111926, + "loss": 0.0171, "step": 271380 }, { - "epoch": 1.37, - "learning_rate": 9.462037929277385e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.00019447769589482113, + "loss": 0.0149, "step": 271390 }, { - "epoch": 1.37, - "learning_rate": 9.461281159975985e-05, - "loss": 0.0115, + "epoch": 0.7, + "learning_rate": 0.0001944738076784497, + "loss": 0.0131, "step": 271400 }, { - "epoch": 1.37, - "learning_rate": 9.460524390674583e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001944699194620782, + "loss": 0.0144, "step": 271410 }, { - "epoch": 1.37, - "learning_rate": 9.459767621373182e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019446603124570675, + "loss": 0.0135, "step": 271420 }, { - "epoch": 1.37, - "learning_rate": 9.459010852071782e-05, - "loss": 0.01, + "epoch": 0.7, + "learning_rate": 0.00019446214302933527, + "loss": 0.0155, "step": 271430 }, { - "epoch": 1.37, - "learning_rate": 9.45825408277038e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.0001944582548129638, + "loss": 0.0128, "step": 271440 }, { - "epoch": 1.37, - "learning_rate": 9.45749731346898e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.00019445436659659235, + "loss": 0.0136, "step": 271450 }, { - "epoch": 1.37, - "learning_rate": 9.456740544167577e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.0001944504783802209, + "loss": 0.0239, "step": 271460 }, { - "epoch": 1.37, - "learning_rate": 9.455983774866177e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.0001944465901638494, + "loss": 0.0127, "step": 271470 }, { - "epoch": 1.37, - "learning_rate": 9.455227005564776e-05, - "loss": 0.0082, + "epoch": 0.7, + "learning_rate": 0.00019444270194747795, + "loss": 0.0109, "step": 271480 }, { - "epoch": 1.37, - "learning_rate": 9.454470236263375e-05, - "loss": 0.0071, + "epoch": 0.7, + "learning_rate": 0.00019443881373110652, + "loss": 0.0152, "step": 271490 }, { - "epoch": 1.37, - "learning_rate": 9.453713466961974e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019443492551473503, + "loss": 0.0149, "step": 271500 }, { - "epoch": 1.37, - "learning_rate": 9.452956697660574e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019443103729836354, + "loss": 0.014, "step": 271510 }, { - "epoch": 1.37, - "learning_rate": 9.452199928359172e-05, - "loss": 0.0072, + "epoch": 0.7, + "learning_rate": 0.00019442714908199209, + "loss": 0.0159, "step": 271520 }, { - "epoch": 1.37, - "learning_rate": 9.451443159057771e-05, - "loss": 0.0083, + "epoch": 0.7, + "learning_rate": 0.00019442326086562065, + "loss": 0.0219, "step": 271530 }, { - "epoch": 1.37, - "learning_rate": 9.45068638975637e-05, - "loss": 0.0101, + "epoch": 0.7, + "learning_rate": 0.00019441937264924917, + "loss": 0.0181, "step": 271540 }, { - "epoch": 1.37, - "learning_rate": 9.449929620454969e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.0001944154844328777, + "loss": 0.0148, "step": 271550 }, { - "epoch": 1.37, - "learning_rate": 9.449172851153568e-05, - "loss": 0.007, + "epoch": 0.7, + "learning_rate": 0.00019441159621650623, + "loss": 0.0128, "step": 271560 }, { - "epoch": 1.37, - "learning_rate": 9.448416081852167e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.0001944077080001348, + "loss": 0.0137, "step": 271570 }, { - "epoch": 1.37, - "learning_rate": 9.447659312550766e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.0001944038197837633, + "loss": 0.0153, "step": 271580 }, { - "epoch": 1.37, - "learning_rate": 9.446902543249366e-05, + "epoch": 0.7, + "learning_rate": 0.00019439993156739185, "loss": 0.0113, "step": 271590 }, { - "epoch": 1.37, - "learning_rate": 9.446145773947964e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.00019439604335102036, + "loss": 0.0141, "step": 271600 }, { - "epoch": 1.37, - "learning_rate": 9.445389004646563e-05, - "loss": 0.0099, + "epoch": 0.7, + "learning_rate": 0.00019439215513464893, + "loss": 0.0117, "step": 271610 }, { - "epoch": 1.37, - "learning_rate": 9.444632235345161e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019438826691827745, + "loss": 0.0139, "step": 271620 }, { - "epoch": 1.37, - "learning_rate": 9.443875466043761e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.000194384378701906, + "loss": 0.013, "step": 271630 }, { - "epoch": 1.37, - "learning_rate": 9.44311869674236e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001943804904855345, + "loss": 0.0164, "step": 271640 }, { - "epoch": 1.37, - "learning_rate": 9.442361927440958e-05, - "loss": 0.0093, + "epoch": 0.7, + "learning_rate": 0.00019437660226916307, + "loss": 0.0153, "step": 271650 }, { - "epoch": 1.37, - "learning_rate": 9.441605158139558e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.0001943727140527916, + "loss": 0.0119, "step": 271660 }, { - "epoch": 1.37, - "learning_rate": 9.440848388838157e-05, - "loss": 0.0064, + "epoch": 0.7, + "learning_rate": 0.00019436882583642013, + "loss": 0.014, "step": 271670 }, { - "epoch": 1.37, - "learning_rate": 9.440091619536756e-05, - "loss": 0.0096, + "epoch": 0.7, + "learning_rate": 0.00019436493762004864, + "loss": 0.0134, "step": 271680 }, { - "epoch": 1.37, - "learning_rate": 9.439334850235355e-05, - "loss": 0.0059, + "epoch": 0.7, + "learning_rate": 0.00019436104940367719, + "loss": 0.0127, "step": 271690 }, { - "epoch": 1.37, - "learning_rate": 9.438578080933955e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.00019435716118730575, + "loss": 0.0166, "step": 271700 }, { - "epoch": 1.37, - "learning_rate": 9.437821311632553e-05, - "loss": 0.0067, + "epoch": 0.7, + "learning_rate": 0.00019435327297093427, + "loss": 0.0151, "step": 271710 }, { - "epoch": 1.37, - "learning_rate": 9.437064542331152e-05, - "loss": 0.0079, + "epoch": 0.7, + "learning_rate": 0.0001943493847545628, + "loss": 0.0138, "step": 271720 }, { - "epoch": 1.37, - "learning_rate": 9.43630777302975e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019434549653819132, + "loss": 0.0171, "step": 271730 }, { - "epoch": 1.37, - "learning_rate": 9.43555100372835e-05, - "loss": 0.0068, + "epoch": 0.7, + "learning_rate": 0.0001943416083218199, + "loss": 0.0176, "step": 271740 }, { - "epoch": 1.37, - "learning_rate": 9.43479423442695e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.0001943377201054484, + "loss": 0.0178, "step": 271750 }, { - "epoch": 1.37, - "learning_rate": 9.434037465125548e-05, - "loss": 0.0053, + "epoch": 0.7, + "learning_rate": 0.00019433383188907695, + "loss": 0.0174, "step": 271760 }, { - "epoch": 1.37, - "learning_rate": 9.433280695824147e-05, - "loss": 0.0085, + "epoch": 0.7, + "learning_rate": 0.00019432994367270546, + "loss": 0.0195, "step": 271770 }, { - "epoch": 1.37, - "learning_rate": 9.432523926522747e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019432605545633403, + "loss": 0.0141, "step": 271780 }, { - "epoch": 1.37, - "learning_rate": 9.431767157221345e-05, - "loss": 0.0087, + "epoch": 0.7, + "learning_rate": 0.00019432216723996255, + "loss": 0.0157, "step": 271790 }, { - "epoch": 1.37, - "learning_rate": 9.431010387919944e-05, - "loss": 0.0074, + "epoch": 0.7, + "learning_rate": 0.0001943182790235911, + "loss": 0.016, "step": 271800 }, { - "epoch": 1.37, - "learning_rate": 9.430253618618541e-05, - "loss": 0.0061, + "epoch": 0.7, + "learning_rate": 0.0001943143908072196, + "loss": 0.015, "step": 271810 }, { - "epoch": 1.37, - "learning_rate": 9.42949684931714e-05, - "loss": 0.0081, + "epoch": 0.7, + "learning_rate": 0.00019431050259084817, + "loss": 0.0146, "step": 271820 }, { - "epoch": 1.37, - "learning_rate": 9.428740080015739e-05, - "loss": 0.0084, + "epoch": 0.7, + "learning_rate": 0.0001943066143744767, + "loss": 0.0139, "step": 271830 }, { - "epoch": 1.37, - "learning_rate": 9.427983310714338e-05, - "loss": 0.0134, + "epoch": 0.7, + "learning_rate": 0.00019430272615810523, + "loss": 0.0159, "step": 271840 }, { - "epoch": 1.37, - "learning_rate": 9.427226541412938e-05, - "loss": 0.0075, + "epoch": 0.7, + "learning_rate": 0.00019429883794173374, + "loss": 0.0175, "step": 271850 }, { - "epoch": 1.37, - "learning_rate": 9.426469772111536e-05, - "loss": 0.0069, + "epoch": 0.7, + "learning_rate": 0.0001942949497253623, + "loss": 0.0139, "step": 271860 }, { - "epoch": 1.37, - "learning_rate": 9.425713002810135e-05, - "loss": 0.0091, + "epoch": 0.7, + "learning_rate": 0.00019429106150899085, + "loss": 0.0171, "step": 271870 }, { - "epoch": 1.37, - "learning_rate": 9.424956233508735e-05, - "loss": 0.0076, + "epoch": 0.7, + "learning_rate": 0.00019428717329261937, + "loss": 0.0141, "step": 271880 }, { - "epoch": 1.37, - "learning_rate": 9.424199464207333e-05, - "loss": 0.009, + "epoch": 0.7, + "learning_rate": 0.0001942832850762479, + "loss": 0.0177, "step": 271890 }, { - "epoch": 1.37, - "learning_rate": 9.423442694905932e-05, - "loss": 0.0088, + "epoch": 0.7, + "learning_rate": 0.00019427939685987645, + "loss": 0.013, "step": 271900 }, { - "epoch": 1.37, - "learning_rate": 9.42268592560453e-05, - "loss": 0.008, + "epoch": 0.7, + "learning_rate": 0.000194275508643505, + "loss": 0.0165, "step": 271910 }, { - "epoch": 1.37, - "learning_rate": 9.42192915630313e-05, - "loss": 0.0059, + "epoch": 0.7, + "learning_rate": 0.0001942716204271335, + "loss": 0.0169, "step": 271920 }, { - "epoch": 1.37, - "learning_rate": 9.42117238700173e-05, - "loss": 0.0109, + "epoch": 0.7, + "learning_rate": 0.00019426773221076205, + "loss": 0.0159, "step": 271930 }, { - "epoch": 1.37, - "learning_rate": 9.420415617700328e-05, - "loss": 0.0077, + "epoch": 0.7, + "learning_rate": 0.00019426384399439056, + "loss": 0.0179, "step": 271940 }, { - "epoch": 1.37, - "learning_rate": 9.419658848398927e-05, - "loss": 0.0073, + "epoch": 0.7, + "learning_rate": 0.00019425995577801913, + "loss": 0.0154, "step": 271950 }, { - "epoch": 1.37, - "learning_rate": 9.418902079097527e-05, - "loss": 0.0094, + "epoch": 0.7, + "learning_rate": 0.00019425606756164765, + "loss": 0.0197, "step": 271960 }, { - "epoch": 1.37, - "learning_rate": 9.418145309796125e-05, - "loss": 0.0062, + "epoch": 0.7, + "learning_rate": 0.0001942521793452762, + "loss": 0.0156, "step": 271970 }, { - "epoch": 1.37, - "learning_rate": 9.417388540494724e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.0001942482911289047, + "loss": 0.0162, "step": 271980 }, { - "epoch": 1.37, - "learning_rate": 9.416631771193322e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019424440291253327, + "loss": 0.0129, "step": 271990 }, { - "epoch": 1.37, - "learning_rate": 9.415875001891922e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019424051469616179, + "loss": 0.0181, "step": 272000 }, { - "epoch": 1.37, - "eval_cer": 0.9144265880775191, - "eval_loss": 0.006095241755247116, - "eval_runtime": 116.2589, - "eval_samples_per_second": 17.203, - "eval_steps_per_second": 4.301, + "epoch": 0.71, + "eval_cer": 0.8817656699852059, + "eval_loss": 0.010548959486186504, + "eval_runtime": 108.289, + "eval_samples_per_second": 18.469, + "eval_steps_per_second": 4.617, "step": 272000 }, { - "epoch": 1.37, - "learning_rate": 9.415118232590521e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019423662647979033, + "loss": 0.0167, "step": 272010 }, { - "epoch": 1.37, - "learning_rate": 9.41436146328912e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.00019423273826341884, + "loss": 0.0175, "step": 272020 }, { - "epoch": 1.37, - "learning_rate": 9.413604693987719e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001942288500470474, + "loss": 0.0145, "step": 272030 }, { - "epoch": 1.37, - "learning_rate": 9.412847924686319e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019422496183067595, + "loss": 0.0126, "step": 272040 }, { - "epoch": 1.37, - "learning_rate": 9.412091155384917e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019422107361430447, + "loss": 0.0175, "step": 272050 }, { - "epoch": 1.37, - "learning_rate": 9.411334386083516e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019421718539793298, + "loss": 0.0136, "step": 272060 }, { - "epoch": 1.37, - "learning_rate": 9.410577616782114e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019421329718156155, + "loss": 0.0151, "step": 272070 }, { - "epoch": 1.37, - "learning_rate": 9.409820847480714e-05, - "loss": 0.0093, + "epoch": 0.71, + "learning_rate": 0.0001942094089651901, + "loss": 0.0184, "step": 272080 }, { - "epoch": 1.37, - "learning_rate": 9.409064078179313e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.0001942055207488186, + "loss": 0.0168, "step": 272090 }, { - "epoch": 1.37, - "learning_rate": 9.408307308877912e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019420163253244715, + "loss": 0.0195, "step": 272100 }, { - "epoch": 1.37, - "learning_rate": 9.407550539576511e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.0001941977443160757, + "loss": 0.0186, "step": 272110 }, { - "epoch": 1.37, - "learning_rate": 9.40679377027511e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019419385609970423, + "loss": 0.0138, "step": 272120 }, { - "epoch": 1.37, - "learning_rate": 9.406037000973709e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019418996788333275, + "loss": 0.0148, "step": 272130 }, { - "epoch": 1.37, - "learning_rate": 9.405280231672308e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.0001941860796669613, + "loss": 0.0134, "step": 272140 }, { - "epoch": 1.37, - "learning_rate": 9.404523462370908e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019418219145058983, + "loss": 0.0175, "step": 272150 }, { - "epoch": 1.37, - "learning_rate": 9.403766693069506e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019417830323421837, + "loss": 0.0156, "step": 272160 }, { - "epoch": 1.37, - "learning_rate": 9.403009923768105e-05, - "loss": 0.0103, + "epoch": 0.71, + "learning_rate": 0.00019417441501784689, + "loss": 0.0173, "step": 272170 }, { - "epoch": 1.37, - "learning_rate": 9.402253154466703e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019417052680147543, + "loss": 0.0158, "step": 272180 }, { - "epoch": 1.37, - "learning_rate": 9.401496385165303e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019416663858510394, + "loss": 0.0128, "step": 272190 }, { - "epoch": 1.37, - "learning_rate": 9.400739615863902e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.0001941627503687325, + "loss": 0.0166, "step": 272200 }, { - "epoch": 1.37, - "learning_rate": 9.3999828465625e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019415886215236105, + "loss": 0.0127, "step": 272210 }, { - "epoch": 1.37, - "learning_rate": 9.3992260772611e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019415497393598957, + "loss": 0.0146, "step": 272220 }, { - "epoch": 1.37, - "learning_rate": 9.3984693079597e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019415108571961808, + "loss": 0.0137, "step": 272230 }, { - "epoch": 1.37, - "learning_rate": 9.397712538658298e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019414719750324665, + "loss": 0.0145, "step": 272240 }, { - "epoch": 1.37, - "learning_rate": 9.396955769356897e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001941433092868752, + "loss": 0.012, "step": 272250 }, { - "epoch": 1.37, - "learning_rate": 9.396199000055495e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.0001941394210705037, + "loss": 0.016, "step": 272260 }, { - "epoch": 1.37, - "learning_rate": 9.395442230754095e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019413553285413225, + "loss": 0.0121, "step": 272270 }, { - "epoch": 1.37, - "learning_rate": 9.394685461452694e-05, - "loss": 0.0106, + "epoch": 0.71, + "learning_rate": 0.0001941316446377608, + "loss": 0.0143, "step": 272280 }, { - "epoch": 1.37, - "learning_rate": 9.393928692151293e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019412775642138933, + "loss": 0.0192, "step": 272290 }, { - "epoch": 1.37, - "learning_rate": 9.393171922849892e-05, - "loss": 0.0125, + "epoch": 0.71, + "learning_rate": 0.00019412386820501785, + "loss": 0.014, "step": 272300 }, { - "epoch": 1.37, - "learning_rate": 9.392415153548492e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.0001941199799886464, + "loss": 0.0136, "step": 272310 }, { - "epoch": 1.37, - "learning_rate": 9.39165838424709e-05, - "loss": 0.0095, + "epoch": 0.71, + "learning_rate": 0.00019411609177227493, + "loss": 0.0165, "step": 272320 }, { - "epoch": 1.37, - "learning_rate": 9.390901614945689e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019411220355590347, + "loss": 0.0127, "step": 272330 }, { - "epoch": 1.37, - "learning_rate": 9.390144845644287e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019410831533953199, + "loss": 0.0167, "step": 272340 }, { - "epoch": 1.37, - "learning_rate": 9.389388076342887e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019410442712316053, + "loss": 0.0126, "step": 272350 }, { - "epoch": 1.37, - "learning_rate": 9.388631307041486e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.0001941005389067891, + "loss": 0.0177, "step": 272360 }, { - "epoch": 1.37, - "learning_rate": 9.387874537740084e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001940966506904176, + "loss": 0.0127, "step": 272370 }, { - "epoch": 1.37, - "learning_rate": 9.387117768438684e-05, - "loss": 0.0056, + "epoch": 0.71, + "learning_rate": 0.00019409276247404612, + "loss": 0.0242, "step": 272380 }, { - "epoch": 1.37, - "learning_rate": 9.386360999137283e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019408887425767467, + "loss": 0.0161, "step": 272390 }, { - "epoch": 1.37, - "learning_rate": 9.385604229835882e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019408498604130324, + "loss": 0.0163, "step": 272400 }, { - "epoch": 1.37, - "learning_rate": 9.384847460534481e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019408109782493175, + "loss": 0.0157, "step": 272410 }, { - "epoch": 1.37, - "learning_rate": 9.384090691233079e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001940772096085603, + "loss": 0.018, "step": 272420 }, { - "epoch": 1.37, - "learning_rate": 9.383333921931679e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.0001940733213921888, + "loss": 0.0172, "step": 272430 }, { - "epoch": 1.37, - "learning_rate": 9.382577152630276e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019406943317581735, + "loss": 0.0126, "step": 272440 }, { - "epoch": 1.37, - "learning_rate": 9.381820383328875e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.0001940655449594459, + "loss": 0.0191, "step": 272450 }, { - "epoch": 1.37, - "learning_rate": 9.381063614027475e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019406165674307443, + "loss": 0.0136, "step": 272460 }, { - "epoch": 1.37, - "learning_rate": 9.380306844726073e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.00019405776852670295, + "loss": 0.0123, "step": 272470 }, { - "epoch": 1.37, - "learning_rate": 9.379550075424672e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.0001940538803103315, + "loss": 0.0163, "step": 272480 }, { - "epoch": 1.37, - "learning_rate": 9.378793306123272e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019404999209396003, + "loss": 0.013, "step": 272490 }, { - "epoch": 1.37, - "learning_rate": 9.37803653682187e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019404610387758857, + "loss": 0.0137, "step": 272500 }, { - "epoch": 1.37, - "learning_rate": 9.37727976752047e-05, - "loss": 0.011, + "epoch": 0.71, + "learning_rate": 0.00019404221566121708, + "loss": 0.017, "step": 272510 }, { - "epoch": 1.37, - "learning_rate": 9.376522998219067e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019403832744484563, + "loss": 0.0173, "step": 272520 }, { - "epoch": 1.37, - "learning_rate": 9.375766228917667e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019403443922847417, + "loss": 0.0119, "step": 272530 }, { - "epoch": 1.37, - "learning_rate": 9.375009459616266e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.0001940305510121027, + "loss": 0.0145, "step": 272540 }, { - "epoch": 1.38, - "learning_rate": 9.374252690314865e-05, - "loss": 0.0123, + "epoch": 0.71, + "learning_rate": 0.00019402666279573122, + "loss": 0.0131, "step": 272550 }, { - "epoch": 1.38, - "learning_rate": 9.373495921013464e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019402277457935977, + "loss": 0.0161, "step": 272560 }, { - "epoch": 1.38, - "learning_rate": 9.372739151712064e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.00019401888636298833, + "loss": 0.0161, "step": 272570 }, { - "epoch": 1.38, - "learning_rate": 9.371982382410662e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.00019401499814661685, + "loss": 0.0153, "step": 272580 }, { - "epoch": 1.38, - "learning_rate": 9.371225613109261e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.0001940111099302454, + "loss": 0.0145, "step": 272590 }, { - "epoch": 1.38, - "learning_rate": 9.370468843807861e-05, - "loss": 0.0054, + "epoch": 0.71, + "learning_rate": 0.0001940072217138739, + "loss": 0.0159, "step": 272600 }, { - "epoch": 1.38, - "learning_rate": 9.369712074506459e-05, - "loss": 0.0102, + "epoch": 0.71, + "learning_rate": 0.00019400333349750247, + "loss": 0.0136, "step": 272610 }, { - "epoch": 1.38, - "learning_rate": 9.368955305205058e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.000193999445281131, + "loss": 0.0152, "step": 272620 }, { - "epoch": 1.38, - "learning_rate": 9.368198535903657e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019399555706475953, + "loss": 0.0151, "step": 272630 }, { - "epoch": 1.38, - "learning_rate": 9.367441766602256e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019399166884838804, + "loss": 0.0193, "step": 272640 }, { - "epoch": 1.38, - "learning_rate": 9.366684997300856e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.0001939877806320166, + "loss": 0.0143, "step": 272650 }, { - "epoch": 1.38, - "learning_rate": 9.365928227999454e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019398389241564513, + "loss": 0.0126, "step": 272660 }, { - "epoch": 1.38, - "learning_rate": 9.365171458698053e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019398000419927367, + "loss": 0.0223, "step": 272670 }, { - "epoch": 1.38, - "learning_rate": 9.364414689396653e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019397611598290218, + "loss": 0.0141, "step": 272680 }, { - "epoch": 1.38, - "learning_rate": 9.363657920095251e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.00019397222776653073, + "loss": 0.0141, "step": 272690 }, { - "epoch": 1.38, - "learning_rate": 9.36290115079385e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019396833955015927, + "loss": 0.0162, "step": 272700 }, { - "epoch": 1.38, - "learning_rate": 9.362144381492449e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.0001939644513337878, + "loss": 0.0173, "step": 272710 }, { - "epoch": 1.38, - "learning_rate": 9.361387612191048e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.00019396056311741632, + "loss": 0.017, "step": 272720 }, { - "epoch": 1.38, - "learning_rate": 9.360630842889648e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019395667490104487, + "loss": 0.0148, "step": 272730 }, { - "epoch": 1.38, - "learning_rate": 9.359874073588246e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019395278668467343, + "loss": 0.0151, "step": 272740 }, { - "epoch": 1.38, - "learning_rate": 9.359117304286845e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019394889846830195, + "loss": 0.0114, "step": 272750 }, { - "epoch": 1.38, - "learning_rate": 9.358360534985445e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001939450102519305, + "loss": 0.0216, "step": 272760 }, { - "epoch": 1.38, - "learning_rate": 9.357603765684043e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.000193941122035559, + "loss": 0.0142, "step": 272770 }, { - "epoch": 1.38, - "learning_rate": 9.356846996382642e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019393723381918757, + "loss": 0.0153, "step": 272780 }, { - "epoch": 1.38, - "learning_rate": 9.35609022708124e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001939333456028161, + "loss": 0.0131, "step": 272790 }, { - "epoch": 1.38, - "learning_rate": 9.35533345777984e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019392945738644463, + "loss": 0.0175, "step": 272800 }, { - "epoch": 1.38, - "learning_rate": 9.35457668847844e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019392556917007314, + "loss": 0.0136, "step": 272810 }, { - "epoch": 1.38, - "learning_rate": 9.353819919177038e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001939216809537017, + "loss": 0.012, "step": 272820 }, { - "epoch": 1.38, - "learning_rate": 9.353063149875637e-05, - "loss": 0.0053, + "epoch": 0.71, + "learning_rate": 0.00019391779273733023, + "loss": 0.0155, "step": 272830 }, { - "epoch": 1.38, - "learning_rate": 9.352306380574237e-05, - "loss": 0.0099, + "epoch": 0.71, + "learning_rate": 0.00019391390452095877, + "loss": 0.0158, "step": 272840 }, { - "epoch": 1.38, - "learning_rate": 9.351549611272835e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019391001630458728, + "loss": 0.0168, "step": 272850 }, { - "epoch": 1.38, - "learning_rate": 9.350792841971434e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019390612808821585, + "loss": 0.0167, "step": 272860 }, { - "epoch": 1.38, - "learning_rate": 9.350036072670032e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019390223987184437, + "loss": 0.0152, "step": 272870 }, { - "epoch": 1.38, - "learning_rate": 9.349279303368632e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.0001938983516554729, + "loss": 0.0204, "step": 272880 }, { - "epoch": 1.38, - "learning_rate": 9.348522534067231e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.00019389446343910142, + "loss": 0.0148, "step": 272890 }, { - "epoch": 1.38, - "learning_rate": 9.34776576476583e-05, - "loss": 0.0102, + "epoch": 0.71, + "learning_rate": 0.00019389057522273, + "loss": 0.0151, "step": 272900 }, { - "epoch": 1.38, - "learning_rate": 9.347008995464429e-05, - "loss": 0.0057, + "epoch": 0.71, + "learning_rate": 0.00019388668700635853, + "loss": 0.0142, "step": 272910 }, { - "epoch": 1.38, - "learning_rate": 9.346252226163029e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019388279878998705, + "loss": 0.012, "step": 272920 }, { - "epoch": 1.38, - "learning_rate": 9.345495456861627e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019387891057361556, + "loss": 0.0173, "step": 272930 }, { - "epoch": 1.38, - "learning_rate": 9.344738687560226e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001938750223572441, + "loss": 0.018, "step": 272940 }, { - "epoch": 1.38, - "learning_rate": 9.343981918258824e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019387113414087267, + "loss": 0.0127, "step": 272950 }, { - "epoch": 1.38, - "learning_rate": 9.343225148957424e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.0001938672459245012, + "loss": 0.016, "step": 272960 }, { - "epoch": 1.38, - "learning_rate": 9.342468379656023e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019386335770812973, + "loss": 0.014, "step": 272970 }, { - "epoch": 1.38, - "learning_rate": 9.341711610354621e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019385946949175824, + "loss": 0.0172, "step": 272980 }, { - "epoch": 1.38, - "learning_rate": 9.340954841053221e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.0001938555812753868, + "loss": 0.0159, "step": 272990 }, { - "epoch": 1.38, - "learning_rate": 9.34019807175182e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019385169305901533, + "loss": 0.0182, "step": 273000 }, { - "epoch": 1.38, - "eval_cer": 0.9144256176813937, - "eval_loss": 0.005903230048716068, - "eval_runtime": 116.3214, - "eval_samples_per_second": 17.194, - "eval_steps_per_second": 4.298, + "epoch": 0.71, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.010078651830554008, + "eval_runtime": 108.1362, + "eval_samples_per_second": 18.495, + "eval_steps_per_second": 4.624, "step": 273000 }, { - "epoch": 1.38, - "learning_rate": 9.339441302450419e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019384780484264387, + "loss": 0.0187, "step": 273010 }, { - "epoch": 1.38, - "learning_rate": 9.338684533149018e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.00019384391662627238, + "loss": 0.0127, "step": 273020 }, { - "epoch": 1.38, - "learning_rate": 9.337927763847616e-05, - "loss": 0.0106, + "epoch": 0.71, + "learning_rate": 0.00019384002840990095, + "loss": 0.0135, "step": 273030 }, { - "epoch": 1.38, - "learning_rate": 9.337170994546216e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019383614019352947, + "loss": 0.0144, "step": 273040 }, { - "epoch": 1.38, - "learning_rate": 9.336414225244815e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.000193832251977158, + "loss": 0.016, "step": 273050 }, { - "epoch": 1.38, - "learning_rate": 9.335657455943412e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019382836376078652, + "loss": 0.0188, "step": 273060 }, { - "epoch": 1.38, - "learning_rate": 9.334900686642012e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.0001938244755444151, + "loss": 0.013, "step": 273070 }, { - "epoch": 1.38, - "learning_rate": 9.33414391734061e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019382058732804363, + "loss": 0.0191, "step": 273080 }, { - "epoch": 1.38, - "learning_rate": 9.333387148039209e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019381669911167215, + "loss": 0.0153, "step": 273090 }, { - "epoch": 1.38, - "learning_rate": 9.332630378737809e-05, - "loss": 0.0095, + "epoch": 0.71, + "learning_rate": 0.00019381281089530066, + "loss": 0.0147, "step": 273100 }, { - "epoch": 1.38, - "learning_rate": 9.331873609436407e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019380892267892923, + "loss": 0.016, "step": 273110 }, { - "epoch": 1.38, - "learning_rate": 9.331116840135006e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019380503446255777, + "loss": 0.0163, "step": 273120 }, { - "epoch": 1.38, - "learning_rate": 9.330360070833606e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.0001938011462461863, + "loss": 0.0162, "step": 273130 }, { - "epoch": 1.38, - "learning_rate": 9.329603301532204e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019379725802981483, + "loss": 0.0182, "step": 273140 }, { - "epoch": 1.38, - "learning_rate": 9.328846532230803e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019379336981344337, + "loss": 0.0166, "step": 273150 }, { - "epoch": 1.38, - "learning_rate": 9.328089762929402e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.0001937894815970719, + "loss": 0.014, "step": 273160 }, { - "epoch": 1.38, - "learning_rate": 9.327332993628001e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019378559338070043, + "loss": 0.0157, "step": 273170 }, { - "epoch": 1.38, - "learning_rate": 9.3265762243266e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019378170516432897, + "loss": 0.0145, "step": 273180 }, { - "epoch": 1.38, - "learning_rate": 9.325819455025199e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019377781694795748, + "loss": 0.0158, "step": 273190 }, { - "epoch": 1.38, - "learning_rate": 9.325062685723798e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019377392873158605, + "loss": 0.02, "step": 273200 }, { - "epoch": 1.38, - "learning_rate": 9.324305916422398e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019377004051521457, + "loss": 0.015, "step": 273210 }, { - "epoch": 1.38, - "learning_rate": 9.323549147120996e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.0001937661522988431, + "loss": 0.0154, "step": 273220 }, { - "epoch": 1.38, - "learning_rate": 9.322792377819595e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019376226408247162, + "loss": 0.0177, "step": 273230 }, { - "epoch": 1.38, - "learning_rate": 9.322035608518194e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.0001937583758661002, + "loss": 0.0142, "step": 273240 }, { - "epoch": 1.38, - "learning_rate": 9.321278839216793e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.0001937544876497287, + "loss": 0.0172, "step": 273250 }, { - "epoch": 1.38, - "learning_rate": 9.320522069915393e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019375059943335725, + "loss": 0.0126, "step": 273260 }, { - "epoch": 1.38, - "learning_rate": 9.31976530061399e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.00019374671121698576, + "loss": 0.0138, "step": 273270 }, { - "epoch": 1.38, - "learning_rate": 9.31900853131259e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019374282300061433, + "loss": 0.014, "step": 273280 }, { - "epoch": 1.38, - "learning_rate": 9.31825176201119e-05, - "loss": 0.0058, + "epoch": 0.71, + "learning_rate": 0.00019373893478424287, + "loss": 0.0148, "step": 273290 }, { - "epoch": 1.38, - "learning_rate": 9.317494992709788e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019373504656787139, + "loss": 0.014, "step": 273300 }, { - "epoch": 1.38, - "learning_rate": 9.316738223408387e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019373115835149993, + "loss": 0.0182, "step": 273310 }, { - "epoch": 1.38, - "learning_rate": 9.315981454106985e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019372727013512847, + "loss": 0.0144, "step": 273320 }, { - "epoch": 1.38, - "learning_rate": 9.315224684805585e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.000193723381918757, + "loss": 0.0154, "step": 273330 }, { - "epoch": 1.38, - "learning_rate": 9.314467915504184e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019371949370238553, + "loss": 0.0182, "step": 273340 }, { - "epoch": 1.38, - "learning_rate": 9.313711146202783e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.00019371560548601407, + "loss": 0.0173, "step": 273350 }, { - "epoch": 1.38, - "learning_rate": 9.312954376901382e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.0001937117172696426, + "loss": 0.0175, "step": 273360 }, { - "epoch": 1.38, - "learning_rate": 9.312197607599982e-05, - "loss": 0.0047, + "epoch": 0.71, + "learning_rate": 0.00019370782905327115, + "loss": 0.0208, "step": 273370 }, { - "epoch": 1.38, - "learning_rate": 9.31144083829858e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019370394083689967, + "loss": 0.0151, "step": 273380 }, { - "epoch": 1.38, - "learning_rate": 9.310684068997179e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.0001937000526205282, + "loss": 0.0147, "step": 273390 }, { - "epoch": 1.38, - "learning_rate": 9.309927299695777e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019369616440415675, + "loss": 0.0142, "step": 273400 }, { - "epoch": 1.38, - "learning_rate": 9.309170530394377e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.0001936922761877853, + "loss": 0.014, "step": 273410 }, { - "epoch": 1.38, - "learning_rate": 9.308413761092976e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001936883879714138, + "loss": 0.0139, "step": 273420 }, { - "epoch": 1.38, - "learning_rate": 9.307656991791575e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.00019368449975504235, + "loss": 0.0152, "step": 273430 }, { - "epoch": 1.38, - "learning_rate": 9.306900222490174e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019368061153867086, + "loss": 0.0183, "step": 273440 }, { - "epoch": 1.38, - "learning_rate": 9.306143453188774e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019367672332229943, + "loss": 0.0141, "step": 273450 }, { - "epoch": 1.38, - "learning_rate": 9.305386683887372e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.00019367283510592797, + "loss": 0.0131, "step": 273460 }, { - "epoch": 1.38, - "learning_rate": 9.304629914585971e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019366894688955649, + "loss": 0.0128, "step": 273470 }, { - "epoch": 1.38, - "learning_rate": 9.303873145284569e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019366505867318503, + "loss": 0.0148, "step": 273480 }, { - "epoch": 1.38, - "learning_rate": 9.303116375983169e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019366117045681357, + "loss": 0.0143, "step": 273490 }, { - "epoch": 1.38, - "learning_rate": 9.302359606681768e-05, - "loss": 0.0117, + "epoch": 0.71, + "learning_rate": 0.0001936572822404421, + "loss": 0.0173, "step": 273500 }, { - "epoch": 1.38, - "learning_rate": 9.301602837380366e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019365339402407063, + "loss": 0.0184, "step": 273510 }, { - "epoch": 1.38, - "learning_rate": 9.300846068078966e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019364950580769917, + "loss": 0.0158, "step": 273520 }, { - "epoch": 1.38, - "learning_rate": 9.300089298777565e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001936456175913277, + "loss": 0.018, "step": 273530 }, { - "epoch": 1.38, - "learning_rate": 9.299332529476164e-05, - "loss": 0.0056, + "epoch": 0.71, + "learning_rate": 0.00019364172937495625, + "loss": 0.0137, "step": 273540 }, { - "epoch": 1.38, - "learning_rate": 9.298575760174763e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019363784115858476, + "loss": 0.014, "step": 273550 }, { - "epoch": 1.38, - "learning_rate": 9.297818990873361e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.0001936339529422133, + "loss": 0.0133, "step": 273560 }, { - "epoch": 1.38, - "learning_rate": 9.297062221571961e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019363006472584185, + "loss": 0.018, "step": 273570 }, { - "epoch": 1.38, - "learning_rate": 9.29630545227056e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001936261765094704, + "loss": 0.0163, "step": 273580 }, { - "epoch": 1.38, - "learning_rate": 9.295548682969158e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.0001936222882930989, + "loss": 0.0159, "step": 273590 }, { - "epoch": 1.38, - "learning_rate": 9.294791913667758e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019361840007672745, + "loss": 0.0156, "step": 273600 }, { - "epoch": 1.38, - "learning_rate": 9.294035144366357e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019361451186035601, + "loss": 0.0155, "step": 273610 }, { - "epoch": 1.38, - "learning_rate": 9.293278375064956e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019361062364398453, + "loss": 0.0124, "step": 273620 }, { - "epoch": 1.38, - "learning_rate": 9.292521605763555e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019360673542761307, + "loss": 0.015, "step": 273630 }, { - "epoch": 1.38, - "learning_rate": 9.291764836462155e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019360284721124158, + "loss": 0.014, "step": 273640 }, { - "epoch": 1.38, - "learning_rate": 9.291008067160753e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019359895899487015, + "loss": 0.0127, "step": 273650 }, { - "epoch": 1.38, - "learning_rate": 9.290251297859352e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019359507077849867, + "loss": 0.0163, "step": 273660 }, { - "epoch": 1.38, - "learning_rate": 9.28949452855795e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001935911825621272, + "loss": 0.0132, "step": 273670 }, { - "epoch": 1.38, - "learning_rate": 9.28873775925655e-05, - "loss": 0.0092, + "epoch": 0.71, + "learning_rate": 0.00019358729434575572, + "loss": 0.0141, "step": 273680 }, { - "epoch": 1.38, - "learning_rate": 9.287980989955147e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019358340612938427, + "loss": 0.014, "step": 273690 }, { - "epoch": 1.38, - "learning_rate": 9.287224220653746e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001935795179130128, + "loss": 0.0134, "step": 273700 }, { - "epoch": 1.38, - "learning_rate": 9.286467451352346e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019357562969664135, + "loss": 0.0131, "step": 273710 }, { - "epoch": 1.38, - "learning_rate": 9.285710682050944e-05, - "loss": 0.0105, + "epoch": 0.71, + "learning_rate": 0.00019357174148026986, + "loss": 0.0127, "step": 273720 }, { - "epoch": 1.38, - "learning_rate": 9.284953912749543e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.0001935678532638984, + "loss": 0.0121, "step": 273730 }, { - "epoch": 1.38, - "learning_rate": 9.284197143448143e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019356396504752695, + "loss": 0.0169, "step": 273740 }, { - "epoch": 1.38, - "learning_rate": 9.283440374146741e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.0001935600768311555, + "loss": 0.0152, "step": 273750 }, { - "epoch": 1.38, - "learning_rate": 9.28268360484534e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.000193556188614784, + "loss": 0.0191, "step": 273760 }, { - "epoch": 1.38, - "learning_rate": 9.281926835543939e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019355230039841254, + "loss": 0.0187, "step": 273770 }, { - "epoch": 1.38, - "learning_rate": 9.281170066242538e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019354841218204111, + "loss": 0.0146, "step": 273780 }, { - "epoch": 1.38, - "learning_rate": 9.280413296941138e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019354452396566963, + "loss": 0.0126, "step": 273790 }, { - "epoch": 1.38, - "learning_rate": 9.279656527639736e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019354063574929814, + "loss": 0.0115, "step": 273800 }, { - "epoch": 1.38, - "learning_rate": 9.278899758338335e-05, - "loss": 0.0109, + "epoch": 0.71, + "learning_rate": 0.00019353674753292668, + "loss": 0.0153, "step": 273810 }, { - "epoch": 1.38, - "learning_rate": 9.278142989036935e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019353285931655525, + "loss": 0.0149, "step": 273820 }, { - "epoch": 1.38, - "learning_rate": 9.277386219735533e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019352897110018377, + "loss": 0.0149, "step": 273830 }, { - "epoch": 1.38, - "learning_rate": 9.276629450434132e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.0001935250828838123, + "loss": 0.0197, "step": 273840 }, { - "epoch": 1.38, - "learning_rate": 9.27587268113273e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019352119466744082, + "loss": 0.0147, "step": 273850 }, { - "epoch": 1.38, - "learning_rate": 9.27511591183133e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.0001935173064510694, + "loss": 0.0146, "step": 273860 }, { - "epoch": 1.38, - "learning_rate": 9.27435914252993e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.0001935134182346979, + "loss": 0.0153, "step": 273870 }, { - "epoch": 1.38, - "learning_rate": 9.273602373228528e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.00019350953001832645, + "loss": 0.0176, "step": 273880 }, { - "epoch": 1.38, - "learning_rate": 9.272845603927127e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019350564180195496, + "loss": 0.0145, "step": 273890 }, { - "epoch": 1.38, - "learning_rate": 9.272088834625727e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019350175358558353, + "loss": 0.0156, "step": 273900 }, { - "epoch": 1.38, - "learning_rate": 9.271332065324325e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019349786536921205, + "loss": 0.0146, "step": 273910 }, { - "epoch": 1.38, - "learning_rate": 9.270575296022924e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.0001934939771528406, + "loss": 0.0158, "step": 273920 }, { - "epoch": 1.38, - "learning_rate": 9.269818526721522e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001934900889364691, + "loss": 0.0165, "step": 273930 }, { - "epoch": 1.38, - "learning_rate": 9.269061757420122e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.00019348620072009764, + "loss": 0.0153, "step": 273940 }, { - "epoch": 1.38, - "learning_rate": 9.268304988118721e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.0001934823125037262, + "loss": 0.0152, "step": 273950 }, { - "epoch": 1.38, - "learning_rate": 9.26754821881732e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.00019347842428735473, + "loss": 0.012, "step": 273960 }, { - "epoch": 1.38, - "learning_rate": 9.266791449515919e-05, - "loss": 0.0055, + "epoch": 0.71, + "learning_rate": 0.00019347453607098324, + "loss": 0.0146, "step": 273970 }, { - "epoch": 1.38, - "learning_rate": 9.266034680214519e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019347064785461178, + "loss": 0.0142, "step": 273980 }, { - "epoch": 1.38, - "learning_rate": 9.265277910913117e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019346675963824035, + "loss": 0.0166, "step": 273990 }, { - "epoch": 1.38, - "learning_rate": 9.264521141611716e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019346287142186887, + "loss": 0.0154, "step": 274000 }, { - "epoch": 1.38, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.005893085617572069, - "eval_runtime": 116.3239, - "eval_samples_per_second": 17.193, - "eval_steps_per_second": 4.298, + "epoch": 0.71, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.01036932785063982, + "eval_runtime": 107.9436, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, "step": 274000 }, { - "epoch": 1.38, - "learning_rate": 9.263764372310314e-05, - "loss": 0.005, + "epoch": 0.71, + "learning_rate": 0.0001934589832054974, + "loss": 0.0154, "step": 274010 }, { - "epoch": 1.38, - "learning_rate": 9.263007603008914e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019345509498912592, + "loss": 0.0133, "step": 274020 }, { - "epoch": 1.38, - "learning_rate": 9.262250833707513e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.0001934512067727545, + "loss": 0.0137, "step": 274030 }, { - "epoch": 1.38, - "learning_rate": 9.261494064406111e-05, - "loss": 0.0101, + "epoch": 0.71, + "learning_rate": 0.000193447318556383, + "loss": 0.0134, "step": 274040 }, { - "epoch": 1.38, - "learning_rate": 9.260737295104711e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019344343034001155, + "loss": 0.0189, "step": 274050 }, { - "epoch": 1.38, - "learning_rate": 9.25998052580331e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019343954212364006, + "loss": 0.015, "step": 274060 }, { - "epoch": 1.38, - "learning_rate": 9.259223756501909e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019343565390726863, + "loss": 0.0151, "step": 274070 }, { - "epoch": 1.38, - "learning_rate": 9.258466987200508e-05, - "loss": 0.0155, + "epoch": 0.71, + "learning_rate": 0.00019343176569089715, + "loss": 0.0122, "step": 274080 }, { - "epoch": 1.38, - "learning_rate": 9.257710217899108e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.0001934278774745257, + "loss": 0.0124, "step": 274090 }, { - "epoch": 1.38, - "learning_rate": 9.256953448597706e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001934239892581542, + "loss": 0.0174, "step": 274100 }, { - "epoch": 1.38, - "learning_rate": 9.256196679296305e-05, - "loss": 0.0065, + "epoch": 0.71, + "learning_rate": 0.00019342010104178277, + "loss": 0.0207, "step": 274110 }, { - "epoch": 1.38, - "learning_rate": 9.255439909994903e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.00019341621282541129, + "loss": 0.0154, "step": 274120 }, { - "epoch": 1.38, - "learning_rate": 9.254683140693503e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019341232460903983, + "loss": 0.0145, "step": 274130 }, { - "epoch": 1.38, - "learning_rate": 9.253926371392102e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019340843639266834, + "loss": 0.012, "step": 274140 }, { - "epoch": 1.38, - "learning_rate": 9.2531696020907e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.0001934045481762969, + "loss": 0.0139, "step": 274150 }, { - "epoch": 1.38, - "learning_rate": 9.2524128327893e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019340065995992545, + "loss": 0.0144, "step": 274160 }, { - "epoch": 1.38, - "learning_rate": 9.2516560634879e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019339677174355397, + "loss": 0.0143, "step": 274170 }, { - "epoch": 1.38, - "learning_rate": 9.250899294186498e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.0001933928835271825, + "loss": 0.0157, "step": 274180 }, { - "epoch": 1.38, - "learning_rate": 9.250142524885097e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019338899531081102, + "loss": 0.0167, "step": 274190 }, { - "epoch": 1.38, - "learning_rate": 9.249385755583695e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001933851070944396, + "loss": 0.0115, "step": 274200 }, { - "epoch": 1.38, - "learning_rate": 9.248628986282295e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001933812188780681, + "loss": 0.0149, "step": 274210 }, { - "epoch": 1.38, - "learning_rate": 9.247872216980894e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019337733066169665, + "loss": 0.0145, "step": 274220 }, { - "epoch": 1.38, - "learning_rate": 9.247115447679492e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019337344244532516, + "loss": 0.0144, "step": 274230 }, { - "epoch": 1.38, - "learning_rate": 9.246358678378092e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019336955422895373, + "loss": 0.0159, "step": 274240 }, { - "epoch": 1.38, - "learning_rate": 9.245601909076691e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019336566601258225, + "loss": 0.0121, "step": 274250 }, { - "epoch": 1.38, - "learning_rate": 9.24484513977529e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.0001933617777962108, + "loss": 0.0176, "step": 274260 }, { - "epoch": 1.38, - "learning_rate": 9.244088370473889e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.0001933578895798393, + "loss": 0.0141, "step": 274270 }, { - "epoch": 1.38, - "learning_rate": 9.243331601172487e-05, - "loss": 0.0117, + "epoch": 0.71, + "learning_rate": 0.00019335400136346787, + "loss": 0.0204, "step": 274280 }, { - "epoch": 1.38, - "learning_rate": 9.242574831871087e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019335011314709638, + "loss": 0.011, "step": 274290 }, { - "epoch": 1.38, - "learning_rate": 9.241818062569686e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019334622493072493, + "loss": 0.0181, "step": 274300 }, { - "epoch": 1.38, - "learning_rate": 9.241061293268284e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019334233671435344, + "loss": 0.0135, "step": 274310 }, { - "epoch": 1.38, - "learning_rate": 9.240304523966883e-05, - "loss": 0.0099, + "epoch": 0.71, + "learning_rate": 0.000193338448497982, + "loss": 0.0202, "step": 274320 }, { - "epoch": 1.38, - "learning_rate": 9.239547754665481e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019333456028161055, + "loss": 0.0159, "step": 274330 }, { - "epoch": 1.38, - "learning_rate": 9.23879098536408e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019333067206523907, + "loss": 0.0115, "step": 274340 }, { - "epoch": 1.38, - "learning_rate": 9.23803421606268e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.0001933267838488676, + "loss": 0.0143, "step": 274350 }, { - "epoch": 1.38, - "learning_rate": 9.237277446761278e-05, - "loss": 0.011, + "epoch": 0.71, + "learning_rate": 0.00019332289563249615, + "loss": 0.0153, "step": 274360 }, { - "epoch": 1.38, - "learning_rate": 9.236520677459877e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.0001933190074161247, + "loss": 0.0131, "step": 274370 }, { - "epoch": 1.38, - "learning_rate": 9.235763908158475e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.0001933151191997532, + "loss": 0.0159, "step": 274380 }, { - "epoch": 1.38, - "learning_rate": 9.235007138857075e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019331123098338175, + "loss": 0.0124, "step": 274390 }, { - "epoch": 1.38, - "learning_rate": 9.234250369555674e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001933073427670103, + "loss": 0.0156, "step": 274400 }, { - "epoch": 1.38, - "learning_rate": 9.233493600254273e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.00019330345455063883, + "loss": 0.0146, "step": 274410 }, { - "epoch": 1.38, - "learning_rate": 9.232736830952872e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019329956633426734, + "loss": 0.017, "step": 274420 }, { - "epoch": 1.38, - "learning_rate": 9.231980061651472e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001932956781178959, + "loss": 0.0131, "step": 274430 }, { - "epoch": 1.38, - "learning_rate": 9.23122329235007e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.0001932917899015244, + "loss": 0.0162, "step": 274440 }, { - "epoch": 1.38, - "learning_rate": 9.230466523048669e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019328790168515297, + "loss": 0.0129, "step": 274450 }, { - "epoch": 1.38, - "learning_rate": 9.229709753747267e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019328401346878148, + "loss": 0.0172, "step": 274460 }, { - "epoch": 1.38, - "learning_rate": 9.228952984445867e-05, - "loss": 0.0051, + "epoch": 0.71, + "learning_rate": 0.00019328012525241003, + "loss": 0.0205, "step": 274470 }, { - "epoch": 1.38, - "learning_rate": 9.228196215144466e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019327623703603854, + "loss": 0.0152, "step": 274480 }, { - "epoch": 1.38, - "learning_rate": 9.227439445843065e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.0001932723488196671, + "loss": 0.0151, "step": 274490 }, { - "epoch": 1.38, - "learning_rate": 9.226682676541664e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019326846060329565, + "loss": 0.0149, "step": 274500 }, { - "epoch": 1.38, - "learning_rate": 9.225925907240264e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.00019326457238692417, + "loss": 0.0116, "step": 274510 }, { - "epoch": 1.38, - "learning_rate": 9.225169137938862e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019326068417055268, + "loss": 0.0132, "step": 274520 }, { - "epoch": 1.39, - "learning_rate": 9.224412368637461e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019325679595418125, + "loss": 0.0129, "step": 274530 }, { - "epoch": 1.39, - "learning_rate": 9.223655599336061e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.0001932529077378098, + "loss": 0.0158, "step": 274540 }, { - "epoch": 1.39, - "learning_rate": 9.222898830034659e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001932490195214383, + "loss": 0.0203, "step": 274550 }, { - "epoch": 1.39, - "learning_rate": 9.222142060733258e-05, - "loss": 0.0098, + "epoch": 0.71, + "learning_rate": 0.00019324513130506685, + "loss": 0.0112, "step": 274560 }, { - "epoch": 1.39, - "learning_rate": 9.221385291431856e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.0001932412430886954, + "loss": 0.0135, "step": 274570 }, { - "epoch": 1.39, - "learning_rate": 9.220628522130456e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019323735487232393, + "loss": 0.0164, "step": 274580 }, { - "epoch": 1.39, - "learning_rate": 9.219871752829055e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.00019323346665595244, + "loss": 0.0134, "step": 274590 }, { - "epoch": 1.39, - "learning_rate": 9.219114983527654e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019322957843958099, + "loss": 0.015, "step": 274600 }, { - "epoch": 1.39, - "learning_rate": 9.218358214226253e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019322569022320953, + "loss": 0.0125, "step": 274610 }, { - "epoch": 1.39, - "learning_rate": 9.217601444924853e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019322180200683807, + "loss": 0.0154, "step": 274620 }, { - "epoch": 1.39, - "learning_rate": 9.216844675623451e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019321791379046658, + "loss": 0.014, "step": 274630 }, { - "epoch": 1.39, - "learning_rate": 9.21608790632205e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019321402557409513, + "loss": 0.015, "step": 274640 }, { - "epoch": 1.39, - "learning_rate": 9.215331137020648e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.0001932101373577237, + "loss": 0.0114, "step": 274650 }, { - "epoch": 1.39, - "learning_rate": 9.214574367719248e-05, - "loss": 0.0116, + "epoch": 0.71, + "learning_rate": 0.0001932062491413522, + "loss": 0.0134, "step": 274660 }, { - "epoch": 1.39, - "learning_rate": 9.213817598417847e-05, - "loss": 0.0063, + "epoch": 0.71, + "learning_rate": 0.00019320236092498075, + "loss": 0.0204, "step": 274670 }, { - "epoch": 1.39, - "learning_rate": 9.213060829116446e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019319847270860926, + "loss": 0.0156, "step": 274680 }, { - "epoch": 1.39, - "learning_rate": 9.212304059815045e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019319458449223778, + "loss": 0.0181, "step": 274690 }, { - "epoch": 1.39, - "learning_rate": 9.211547290513645e-05, - "loss": 0.0107, + "epoch": 0.71, + "learning_rate": 0.00019319069627586635, + "loss": 0.0157, "step": 274700 }, { - "epoch": 1.39, - "learning_rate": 9.210790521212243e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001931868080594949, + "loss": 0.0112, "step": 274710 }, { - "epoch": 1.39, - "learning_rate": 9.210033751910842e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.0001931829198431234, + "loss": 0.0162, "step": 274720 }, { - "epoch": 1.39, - "learning_rate": 9.20927698260944e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019317903162675195, + "loss": 0.0156, "step": 274730 }, { - "epoch": 1.39, - "learning_rate": 9.20852021330804e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001931751434103805, + "loss": 0.0152, "step": 274740 }, { - "epoch": 1.39, - "learning_rate": 9.20776344400664e-05, - "loss": 0.0076, + "epoch": 0.71, + "learning_rate": 0.00019317125519400903, + "loss": 0.0109, "step": 274750 }, { - "epoch": 1.39, - "learning_rate": 9.207006674705237e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019316736697763754, + "loss": 0.012, "step": 274760 }, { - "epoch": 1.39, - "learning_rate": 9.206249905403837e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019316347876126609, + "loss": 0.0155, "step": 274770 }, { - "epoch": 1.39, - "learning_rate": 9.205493136102436e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019315959054489463, + "loss": 0.0136, "step": 274780 }, { - "epoch": 1.39, - "learning_rate": 9.204736366801035e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019315570232852317, + "loss": 0.0151, "step": 274790 }, { - "epoch": 1.39, - "learning_rate": 9.203979597499634e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019315181411215168, + "loss": 0.0123, "step": 274800 }, { - "epoch": 1.39, - "learning_rate": 9.203222828198232e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.00019314792589578022, + "loss": 0.0134, "step": 274810 }, { - "epoch": 1.39, - "learning_rate": 9.202466058896832e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.0001931440376794088, + "loss": 0.0135, "step": 274820 }, { - "epoch": 1.39, - "learning_rate": 9.201709289595431e-05, - "loss": 0.0056, + "epoch": 0.71, + "learning_rate": 0.0001931401494630373, + "loss": 0.0113, "step": 274830 }, { - "epoch": 1.39, - "learning_rate": 9.20095252029403e-05, - "loss": 0.0086, + "epoch": 0.71, + "learning_rate": 0.00019313626124666582, + "loss": 0.0161, "step": 274840 }, { - "epoch": 1.39, - "learning_rate": 9.200195750992629e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019313237303029436, + "loss": 0.0119, "step": 274850 }, { - "epoch": 1.39, - "learning_rate": 9.199438981691228e-05, - "loss": 0.0084, + "epoch": 0.71, + "learning_rate": 0.00019312848481392293, + "loss": 0.0173, "step": 274860 }, { - "epoch": 1.39, - "learning_rate": 9.198682212389827e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019312459659755145, + "loss": 0.0141, "step": 274870 }, { - "epoch": 1.39, - "learning_rate": 9.197925443088426e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019312070838118, + "loss": 0.0147, "step": 274880 }, { - "epoch": 1.39, - "learning_rate": 9.197168673787024e-05, - "loss": 0.0087, + "epoch": 0.71, + "learning_rate": 0.0001931168201648085, + "loss": 0.0136, "step": 274890 }, { - "epoch": 1.39, - "learning_rate": 9.196411904485624e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019311293194843707, + "loss": 0.0179, "step": 274900 }, { - "epoch": 1.39, - "learning_rate": 9.195655135184223e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.0001931090437320656, + "loss": 0.0158, "step": 274910 }, { - "epoch": 1.39, - "learning_rate": 9.194898365882821e-05, - "loss": 0.0095, + "epoch": 0.71, + "learning_rate": 0.00019310515551569413, + "loss": 0.016, "step": 274920 }, { - "epoch": 1.39, - "learning_rate": 9.194141596581421e-05, - "loss": 0.0104, + "epoch": 0.71, + "learning_rate": 0.00019310126729932264, + "loss": 0.0195, "step": 274930 }, { - "epoch": 1.39, - "learning_rate": 9.19338482728002e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.00019309737908295118, + "loss": 0.0148, "step": 274940 }, { - "epoch": 1.39, - "learning_rate": 9.192628057978617e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019309349086657973, + "loss": 0.0162, "step": 274950 }, { - "epoch": 1.39, - "learning_rate": 9.191871288677217e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019308960265020827, + "loss": 0.0121, "step": 274960 }, { - "epoch": 1.39, - "learning_rate": 9.191114519375815e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019308571443383678, + "loss": 0.0135, "step": 274970 }, { - "epoch": 1.39, - "learning_rate": 9.190357750074414e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019308182621746532, + "loss": 0.0307, "step": 274980 }, { - "epoch": 1.39, - "learning_rate": 9.189600980773014e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019307793800109387, + "loss": 0.0164, "step": 274990 }, { - "epoch": 1.39, - "learning_rate": 9.188844211471612e-05, - "loss": 0.0088, + "epoch": 0.71, + "learning_rate": 0.0001930740497847224, + "loss": 0.0202, "step": 275000 }, { - "epoch": 1.39, - "eval_cer": 0.9144459960000272, - "eval_loss": 0.005970404949039221, - "eval_runtime": 116.7373, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.71, + "eval_cer": 0.8818006609085604, + "eval_loss": 0.010618000291287899, + "eval_runtime": 108.0775, + "eval_samples_per_second": 18.505, + "eval_steps_per_second": 4.626, "step": 275000 }, { - "epoch": 1.39, - "learning_rate": 9.188087442170211e-05, - "loss": 0.0106, + "epoch": 0.71, + "learning_rate": 0.00019307016156835092, + "loss": 0.0244, "step": 275010 }, { - "epoch": 1.39, - "learning_rate": 9.18733067286881e-05, - "loss": 0.0089, + "epoch": 0.71, + "learning_rate": 0.00019306627335197946, + "loss": 0.0135, "step": 275020 }, { - "epoch": 1.39, - "learning_rate": 9.186573903567409e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019306238513560803, + "loss": 0.0144, "step": 275030 }, { - "epoch": 1.39, - "learning_rate": 9.185817134266009e-05, - "loss": 0.0061, + "epoch": 0.71, + "learning_rate": 0.00019305849691923655, + "loss": 0.0161, "step": 275040 }, { - "epoch": 1.39, - "learning_rate": 9.185060364964607e-05, - "loss": 0.0067, + "epoch": 0.71, + "learning_rate": 0.0001930546087028651, + "loss": 0.0146, "step": 275050 }, { - "epoch": 1.39, - "learning_rate": 9.184303595663206e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.0001930507204864936, + "loss": 0.0172, "step": 275060 }, { - "epoch": 1.39, - "learning_rate": 9.183546826361806e-05, - "loss": 0.0072, + "epoch": 0.71, + "learning_rate": 0.00019304683227012217, + "loss": 0.0122, "step": 275070 }, { - "epoch": 1.39, - "learning_rate": 9.182790057060404e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019304294405375069, + "loss": 0.0158, "step": 275080 }, { - "epoch": 1.39, - "learning_rate": 9.182033287759003e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.00019303905583737923, + "loss": 0.0159, "step": 275090 }, { - "epoch": 1.39, - "learning_rate": 9.181276518457601e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019303516762100774, + "loss": 0.017, "step": 275100 }, { - "epoch": 1.39, - "learning_rate": 9.180519749156201e-05, - "loss": 0.0062, + "epoch": 0.71, + "learning_rate": 0.0001930312794046363, + "loss": 0.0155, "step": 275110 }, { - "epoch": 1.39, - "learning_rate": 9.1797629798548e-05, - "loss": 0.0079, + "epoch": 0.71, + "learning_rate": 0.00019302739118826483, + "loss": 0.0143, "step": 275120 }, { - "epoch": 1.39, - "learning_rate": 9.179006210553399e-05, - "loss": 0.0115, + "epoch": 0.71, + "learning_rate": 0.00019302350297189337, + "loss": 0.0152, "step": 275130 }, { - "epoch": 1.39, - "learning_rate": 9.178249441251998e-05, - "loss": 0.0108, + "epoch": 0.71, + "learning_rate": 0.00019301961475552188, + "loss": 0.0164, "step": 275140 }, { - "epoch": 1.39, - "learning_rate": 9.177492671950598e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019301572653915045, + "loss": 0.014, "step": 275150 }, { - "epoch": 1.39, - "learning_rate": 9.176735902649196e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019301183832277897, + "loss": 0.0137, "step": 275160 }, { - "epoch": 1.39, - "learning_rate": 9.175979133347795e-05, - "loss": 0.0111, + "epoch": 0.71, + "learning_rate": 0.0001930079501064075, + "loss": 0.014, "step": 275170 }, { - "epoch": 1.39, - "learning_rate": 9.175222364046393e-05, - "loss": 0.0105, + "epoch": 0.71, + "learning_rate": 0.00019300406189003602, + "loss": 0.0117, "step": 275180 }, { - "epoch": 1.39, - "learning_rate": 9.174465594744993e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019300017367366456, + "loss": 0.0204, "step": 275190 }, { - "epoch": 1.39, - "learning_rate": 9.173708825443592e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019299628545729313, + "loss": 0.0158, "step": 275200 }, { - "epoch": 1.39, - "learning_rate": 9.17295205614219e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019299239724092165, + "loss": 0.0152, "step": 275210 }, { - "epoch": 1.39, - "learning_rate": 9.17219528684079e-05, - "loss": 0.0051, + "epoch": 0.71, + "learning_rate": 0.0001929885090245502, + "loss": 0.0157, "step": 275220 }, { - "epoch": 1.39, - "learning_rate": 9.17143851753939e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001929846208081787, + "loss": 0.0147, "step": 275230 }, { - "epoch": 1.39, - "learning_rate": 9.170681748237988e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019298073259180727, + "loss": 0.0118, "step": 275240 }, { - "epoch": 1.39, - "learning_rate": 9.169924978936587e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019297684437543579, + "loss": 0.0152, "step": 275250 }, { - "epoch": 1.39, - "learning_rate": 9.169168209635185e-05, - "loss": 0.0075, + "epoch": 0.71, + "learning_rate": 0.00019297295615906433, + "loss": 0.0129, "step": 275260 }, { - "epoch": 1.39, - "learning_rate": 9.168411440333785e-05, - "loss": 0.008, + "epoch": 0.71, + "learning_rate": 0.00019296906794269284, + "loss": 0.016, "step": 275270 }, { - "epoch": 1.39, - "learning_rate": 9.167654671032384e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.0001929651797263214, + "loss": 0.018, "step": 275280 }, { - "epoch": 1.39, - "learning_rate": 9.166897901730982e-05, - "loss": 0.0047, + "epoch": 0.71, + "learning_rate": 0.00019296129150994993, + "loss": 0.0134, "step": 275290 }, { - "epoch": 1.39, - "learning_rate": 9.166141132429582e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019295740329357847, + "loss": 0.0156, "step": 275300 }, { - "epoch": 1.39, - "learning_rate": 9.165384363128181e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019295351507720698, + "loss": 0.0179, "step": 275310 }, { - "epoch": 1.39, - "learning_rate": 9.16462759382678e-05, - "loss": 0.0101, + "epoch": 0.71, + "learning_rate": 0.00019294962686083555, + "loss": 0.0143, "step": 275320 }, { - "epoch": 1.39, - "learning_rate": 9.163870824525379e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019294573864446406, + "loss": 0.0112, "step": 275330 }, { - "epoch": 1.39, - "learning_rate": 9.163114055223977e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.0001929418504280926, + "loss": 0.0134, "step": 275340 }, { - "epoch": 1.39, - "learning_rate": 9.162357285922577e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019293796221172112, + "loss": 0.0138, "step": 275350 }, { - "epoch": 1.39, - "learning_rate": 9.161600516621176e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001929340739953497, + "loss": 0.0151, "step": 275360 }, { - "epoch": 1.39, - "learning_rate": 9.160843747319774e-05, - "loss": 0.0074, + "epoch": 0.71, + "learning_rate": 0.00019293018577897823, + "loss": 0.0135, "step": 275370 }, { - "epoch": 1.39, - "learning_rate": 9.160086978018374e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019292629756260675, + "loss": 0.0175, "step": 275380 }, { - "epoch": 1.39, - "learning_rate": 9.159330208716973e-05, - "loss": 0.0094, + "epoch": 0.71, + "learning_rate": 0.00019292240934623526, + "loss": 0.0138, "step": 275390 }, { - "epoch": 1.39, - "learning_rate": 9.158573439415572e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.0001929185211298638, + "loss": 0.013, "step": 275400 }, { - "epoch": 1.39, - "learning_rate": 9.157816670114171e-05, - "loss": 0.0069, + "epoch": 0.71, + "learning_rate": 0.00019291463291349237, + "loss": 0.0146, "step": 275410 }, { - "epoch": 1.39, - "learning_rate": 9.157059900812769e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019291074469712089, + "loss": 0.0122, "step": 275420 }, { - "epoch": 1.39, - "learning_rate": 9.156303131511369e-05, - "loss": 0.0096, + "epoch": 0.71, + "learning_rate": 0.00019290685648074943, + "loss": 0.0157, "step": 275430 }, { - "epoch": 1.39, - "learning_rate": 9.155546362209968e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019290296826437794, + "loss": 0.0152, "step": 275440 }, { - "epoch": 1.39, - "learning_rate": 9.154789592908566e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.0001928990800480065, + "loss": 0.0212, "step": 275450 }, { - "epoch": 1.39, - "learning_rate": 9.154032823607166e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.00019289519183163502, + "loss": 0.0204, "step": 275460 }, { - "epoch": 1.39, - "learning_rate": 9.153276054305765e-05, - "loss": 0.0097, + "epoch": 0.71, + "learning_rate": 0.00019289130361526357, + "loss": 0.0127, "step": 275470 }, { - "epoch": 1.39, - "learning_rate": 9.152519285004363e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.00019288741539889208, + "loss": 0.0152, "step": 275480 }, { - "epoch": 1.39, - "learning_rate": 9.151762515702963e-05, - "loss": 0.0117, + "epoch": 0.71, + "learning_rate": 0.00019288352718252065, + "loss": 0.0152, "step": 275490 }, { - "epoch": 1.39, - "learning_rate": 9.151005746401561e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019287963896614916, + "loss": 0.0131, "step": 275500 }, { - "epoch": 1.39, - "learning_rate": 9.15024897710016e-05, - "loss": 0.0064, + "epoch": 0.71, + "learning_rate": 0.0001928757507497777, + "loss": 0.0161, "step": 275510 }, { - "epoch": 1.39, - "learning_rate": 9.14949220779876e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019287186253340622, + "loss": 0.0137, "step": 275520 }, { - "epoch": 1.39, - "learning_rate": 9.148735438497358e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.0001928679743170348, + "loss": 0.0152, "step": 275530 }, { - "epoch": 1.39, - "learning_rate": 9.147978669195958e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019286408610066333, + "loss": 0.0138, "step": 275540 }, { - "epoch": 1.39, - "learning_rate": 9.147221899894557e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019286019788429185, + "loss": 0.0133, "step": 275550 }, { - "epoch": 1.39, - "learning_rate": 9.146465130593155e-05, - "loss": 0.0073, + "epoch": 0.71, + "learning_rate": 0.00019285630966792036, + "loss": 0.0131, "step": 275560 }, { - "epoch": 1.39, - "learning_rate": 9.145708361291755e-05, - "loss": 0.0081, + "epoch": 0.71, + "learning_rate": 0.00019285242145154893, + "loss": 0.0162, "step": 275570 }, { - "epoch": 1.39, - "learning_rate": 9.144951591990352e-05, - "loss": 0.009, + "epoch": 0.71, + "learning_rate": 0.00019284853323517747, + "loss": 0.0157, "step": 275580 }, { - "epoch": 1.39, - "learning_rate": 9.144194822688951e-05, - "loss": 0.0093, + "epoch": 0.71, + "learning_rate": 0.00019284464501880598, + "loss": 0.0151, "step": 275590 }, { - "epoch": 1.39, - "learning_rate": 9.143438053387551e-05, - "loss": 0.0077, + "epoch": 0.71, + "learning_rate": 0.00019284075680243453, + "loss": 0.0149, "step": 275600 }, { - "epoch": 1.39, - "learning_rate": 9.142681284086149e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019283686858606307, + "loss": 0.0128, "step": 275610 }, { - "epoch": 1.39, - "learning_rate": 9.141924514784748e-05, - "loss": 0.0078, + "epoch": 0.71, + "learning_rate": 0.0001928329803696916, + "loss": 0.0158, "step": 275620 }, { - "epoch": 1.39, - "learning_rate": 9.141167745483347e-05, - "loss": 0.006, + "epoch": 0.71, + "learning_rate": 0.00019282909215332012, + "loss": 0.0147, "step": 275630 }, { - "epoch": 1.39, - "learning_rate": 9.140410976181946e-05, - "loss": 0.0066, + "epoch": 0.71, + "learning_rate": 0.00019282520393694867, + "loss": 0.0178, "step": 275640 }, { - "epoch": 1.39, - "learning_rate": 9.139654206880546e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.00019282131572057718, + "loss": 0.0128, "step": 275650 }, { - "epoch": 1.39, - "learning_rate": 9.138897437579144e-05, - "loss": 0.0071, + "epoch": 0.71, + "learning_rate": 0.00019281742750420575, + "loss": 0.0148, "step": 275660 }, { - "epoch": 1.39, - "learning_rate": 9.138140668277743e-05, - "loss": 0.0107, + "epoch": 0.71, + "learning_rate": 0.00019281353928783426, + "loss": 0.013, "step": 275670 }, { - "epoch": 1.39, - "learning_rate": 9.137383898976343e-05, - "loss": 0.0103, + "epoch": 0.71, + "learning_rate": 0.0001928096510714628, + "loss": 0.0146, "step": 275680 }, { - "epoch": 1.39, - "learning_rate": 9.136627129674941e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019280576285509132, + "loss": 0.0145, "step": 275690 }, { - "epoch": 1.39, - "learning_rate": 9.13587036037354e-05, - "loss": 0.0083, + "epoch": 0.71, + "learning_rate": 0.0001928018746387199, + "loss": 0.0121, "step": 275700 }, { - "epoch": 1.39, - "learning_rate": 9.135113591072138e-05, - "loss": 0.0082, + "epoch": 0.71, + "learning_rate": 0.0001927979864223484, + "loss": 0.0124, "step": 275710 }, { - "epoch": 1.39, - "learning_rate": 9.134356821770738e-05, - "loss": 0.0095, + "epoch": 0.71, + "learning_rate": 0.00019279409820597694, + "loss": 0.0169, "step": 275720 }, { - "epoch": 1.39, - "learning_rate": 9.133600052469337e-05, - "loss": 0.0103, + "epoch": 0.71, + "learning_rate": 0.00019279020998960546, + "loss": 0.0141, "step": 275730 }, { - "epoch": 1.39, - "learning_rate": 9.132843283167936e-05, - "loss": 0.0112, + "epoch": 0.71, + "learning_rate": 0.00019278632177323403, + "loss": 0.0167, "step": 275740 }, { - "epoch": 1.39, - "learning_rate": 9.132086513866535e-05, - "loss": 0.0059, + "epoch": 0.71, + "learning_rate": 0.00019278243355686257, + "loss": 0.0135, "step": 275750 }, { - "epoch": 1.39, - "learning_rate": 9.131329744565135e-05, - "loss": 0.01, + "epoch": 0.71, + "learning_rate": 0.00019277854534049108, + "loss": 0.0145, "step": 275760 }, { - "epoch": 1.39, - "learning_rate": 9.130572975263733e-05, - "loss": 0.0091, + "epoch": 0.71, + "learning_rate": 0.00019277465712411963, + "loss": 0.0147, "step": 275770 }, { - "epoch": 1.39, - "learning_rate": 9.129816205962332e-05, - "loss": 0.0085, + "epoch": 0.71, + "learning_rate": 0.00019277076890774817, + "loss": 0.0132, "step": 275780 }, { - "epoch": 1.39, - "learning_rate": 9.12905943666093e-05, - "loss": 0.007, + "epoch": 0.71, + "learning_rate": 0.0001927668806913767, + "loss": 0.0141, "step": 275790 }, { - "epoch": 1.39, - "learning_rate": 9.12830266735953e-05, - "loss": 0.0058, + "epoch": 0.71, + "learning_rate": 0.00019276299247500522, + "loss": 0.0181, "step": 275800 }, { - "epoch": 1.39, - "learning_rate": 9.12754589805813e-05, - "loss": 0.0095, + "epoch": 0.71, + "learning_rate": 0.00019275910425863377, + "loss": 0.0141, "step": 275810 }, { - "epoch": 1.39, - "learning_rate": 9.126789128756728e-05, - "loss": 0.0068, + "epoch": 0.71, + "learning_rate": 0.0001927552160422623, + "loss": 0.0164, "step": 275820 }, { - "epoch": 1.39, - "learning_rate": 9.126032359455327e-05, - "loss": 0.0052, + "epoch": 0.71, + "learning_rate": 0.00019275132782589085, + "loss": 0.0157, "step": 275830 }, { - "epoch": 1.39, - "learning_rate": 9.125275590153927e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019274743960951936, + "loss": 0.0142, "step": 275840 }, { - "epoch": 1.39, - "learning_rate": 9.124518820852525e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001927435513931479, + "loss": 0.0161, "step": 275850 }, { - "epoch": 1.39, - "learning_rate": 9.123762051551124e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019273966317677647, + "loss": 0.0143, "step": 275860 }, { - "epoch": 1.39, - "learning_rate": 9.123005282249722e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.000192735774960405, + "loss": 0.0138, "step": 275870 }, { - "epoch": 1.39, - "learning_rate": 9.122248512948322e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001927318867440335, + "loss": 0.0173, "step": 275880 }, { - "epoch": 1.39, - "learning_rate": 9.121491743646921e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019272799852766204, + "loss": 0.0144, "step": 275890 }, { - "epoch": 1.39, - "learning_rate": 9.12073497434552e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019272411031129056, + "loss": 0.02, "step": 275900 }, { - "epoch": 1.39, - "learning_rate": 9.119978205044119e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019272022209491913, + "loss": 0.016, "step": 275910 }, { - "epoch": 1.39, - "learning_rate": 9.119221435742718e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019271633387854767, + "loss": 0.0175, "step": 275920 }, { - "epoch": 1.39, - "learning_rate": 9.118464666441317e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019271244566217618, + "loss": 0.0241, "step": 275930 }, { - "epoch": 1.39, - "learning_rate": 9.117707897139916e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019270855744580473, + "loss": 0.017, "step": 275940 }, { - "epoch": 1.39, - "learning_rate": 9.116951127838514e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.00019270466922943327, + "loss": 0.0132, "step": 275950 }, { - "epoch": 1.39, - "learning_rate": 9.116194358537114e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.0001927007810130618, + "loss": 0.0133, "step": 275960 }, { - "epoch": 1.39, - "learning_rate": 9.115437589235713e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019269689279669032, + "loss": 0.0119, "step": 275970 }, { - "epoch": 1.39, - "learning_rate": 9.114680819934311e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019269300458031886, + "loss": 0.0181, "step": 275980 }, { - "epoch": 1.39, - "learning_rate": 9.113924050632911e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001926891163639474, + "loss": 0.0148, "step": 275990 }, { - "epoch": 1.39, - "learning_rate": 9.11316728133151e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019268522814757595, + "loss": 0.0139, "step": 276000 }, { - "epoch": 1.39, - "eval_cer": 0.9144159137201398, - "eval_loss": 0.006024388130754232, - "eval_runtime": 116.144, - "eval_samples_per_second": 17.22, - "eval_steps_per_second": 4.305, + "epoch": 0.72, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.010350687429308891, + "eval_runtime": 107.9687, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, "step": 276000 }, { - "epoch": 1.39, - "learning_rate": 9.112410512030109e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019268133993120446, + "loss": 0.0166, "step": 276010 }, { - "epoch": 1.39, - "learning_rate": 9.111653742728708e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.000192677451714833, + "loss": 0.0144, "step": 276020 }, { - "epoch": 1.39, - "learning_rate": 9.110896973427308e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019267356349846155, + "loss": 0.0454, "step": 276030 }, { - "epoch": 1.39, - "learning_rate": 9.110140204125906e-05, - "loss": 0.0059, + "epoch": 0.72, + "learning_rate": 0.0001926696752820901, + "loss": 0.0141, "step": 276040 }, { - "epoch": 1.39, - "learning_rate": 9.109383434824505e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001926657870657186, + "loss": 0.0161, "step": 276050 }, { - "epoch": 1.39, - "learning_rate": 9.108626665523103e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019266189884934714, + "loss": 0.0144, "step": 276060 }, { - "epoch": 1.39, - "learning_rate": 9.107869896221703e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.0001926580106329757, + "loss": 0.0129, "step": 276070 }, { - "epoch": 1.39, - "learning_rate": 9.107113126920302e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019265412241660423, + "loss": 0.0179, "step": 276080 }, { - "epoch": 1.39, - "learning_rate": 9.1063563576189e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019265023420023277, + "loss": 0.0126, "step": 276090 }, { - "epoch": 1.39, - "learning_rate": 9.1055995883175e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019264634598386128, + "loss": 0.0142, "step": 276100 }, { - "epoch": 1.39, - "learning_rate": 9.1048428190161e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019264245776748985, + "loss": 0.0182, "step": 276110 }, { - "epoch": 1.39, - "learning_rate": 9.104086049714698e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019263856955111837, + "loss": 0.0138, "step": 276120 }, { - "epoch": 1.39, - "learning_rate": 9.103329280413297e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001926346813347469, + "loss": 0.0124, "step": 276130 }, { - "epoch": 1.39, - "learning_rate": 9.102572511111895e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019263079311837542, + "loss": 0.0141, "step": 276140 }, { - "epoch": 1.39, - "learning_rate": 9.101815741810495e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019262690490200396, + "loss": 0.0152, "step": 276150 }, { - "epoch": 1.39, - "learning_rate": 9.101058972509094e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001926230166856325, + "loss": 0.0142, "step": 276160 }, { - "epoch": 1.39, - "learning_rate": 9.100302203207692e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.00019261912846926105, + "loss": 0.0131, "step": 276170 }, { - "epoch": 1.39, - "learning_rate": 9.099545433906292e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019261524025288956, + "loss": 0.012, "step": 276180 }, { - "epoch": 1.39, - "learning_rate": 9.098788664604891e-05, - "loss": 0.0111, + "epoch": 0.72, + "learning_rate": 0.0001926113520365181, + "loss": 0.0171, "step": 276190 }, { - "epoch": 1.39, - "learning_rate": 9.09803189530349e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019260746382014665, + "loss": 0.0175, "step": 276200 }, { - "epoch": 1.39, - "learning_rate": 9.097275126002088e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.0001926035756037752, + "loss": 0.0211, "step": 276210 }, { - "epoch": 1.39, - "learning_rate": 9.096518356700686e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.0001925996873874037, + "loss": 0.0157, "step": 276220 }, { - "epoch": 1.39, - "learning_rate": 9.095761587399285e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019259579917103224, + "loss": 0.0177, "step": 276230 }, { - "epoch": 1.39, - "learning_rate": 9.095004818097883e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.0001925919109546608, + "loss": 0.0137, "step": 276240 }, { - "epoch": 1.39, - "learning_rate": 9.094248048796483e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019258802273828933, + "loss": 0.017, "step": 276250 }, { - "epoch": 1.39, - "learning_rate": 9.093491279495082e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019258413452191787, + "loss": 0.0149, "step": 276260 }, { - "epoch": 1.39, - "learning_rate": 9.09273451019368e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019258024630554638, + "loss": 0.0169, "step": 276270 }, { - "epoch": 1.39, - "learning_rate": 9.09197774089228e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019257635808917495, + "loss": 0.0116, "step": 276280 }, { - "epoch": 1.39, - "learning_rate": 9.09122097159088e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019257246987280347, + "loss": 0.014, "step": 276290 }, { - "epoch": 1.39, - "learning_rate": 9.090464202289478e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.000192568581656432, + "loss": 0.0135, "step": 276300 }, { - "epoch": 1.39, - "learning_rate": 9.089707432988077e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019256469344006052, + "loss": 0.0124, "step": 276310 }, { - "epoch": 1.39, - "learning_rate": 9.088950663686675e-05, - "loss": 0.0103, + "epoch": 0.72, + "learning_rate": 0.0001925608052236891, + "loss": 0.0138, "step": 276320 }, { - "epoch": 1.39, - "learning_rate": 9.088193894385275e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.0001925569170073176, + "loss": 0.0144, "step": 276330 }, { - "epoch": 1.39, - "learning_rate": 9.087437125083874e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019255302879094615, + "loss": 0.0133, "step": 276340 }, { - "epoch": 1.39, - "learning_rate": 9.086680355782473e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019254914057457466, + "loss": 0.0146, "step": 276350 }, { - "epoch": 1.39, - "learning_rate": 9.085923586481072e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019254525235820323, + "loss": 0.0145, "step": 276360 }, { - "epoch": 1.39, - "learning_rate": 9.085166817179672e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019254136414183174, + "loss": 0.0152, "step": 276370 }, { - "epoch": 1.39, - "learning_rate": 9.08441004787827e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019253747592546029, + "loss": 0.0149, "step": 276380 }, { - "epoch": 1.39, - "learning_rate": 9.083653278576869e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.0001925335877090888, + "loss": 0.0196, "step": 276390 }, { - "epoch": 1.39, - "learning_rate": 9.082896509275467e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019252969949271734, + "loss": 0.0136, "step": 276400 }, { - "epoch": 1.39, - "learning_rate": 9.082139739974067e-05, - "loss": 0.0094, + "epoch": 0.72, + "learning_rate": 0.0001925258112763459, + "loss": 0.0189, "step": 276410 }, { - "epoch": 1.39, - "learning_rate": 9.081382970672666e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019252192305997443, + "loss": 0.0154, "step": 276420 }, { - "epoch": 1.39, - "learning_rate": 9.080626201371264e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019251803484360294, + "loss": 0.0228, "step": 276430 }, { - "epoch": 1.39, - "learning_rate": 9.079869432069864e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019251414662723148, + "loss": 0.0119, "step": 276440 }, { - "epoch": 1.39, - "learning_rate": 9.079112662768463e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019251025841086005, + "loss": 0.0144, "step": 276450 }, { - "epoch": 1.39, - "learning_rate": 9.078355893467062e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019250637019448857, + "loss": 0.0125, "step": 276460 }, { - "epoch": 1.39, - "learning_rate": 9.077599124165661e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.0001925024819781171, + "loss": 0.0145, "step": 276470 }, { - "epoch": 1.39, - "learning_rate": 9.07684235486426e-05, - "loss": 0.0057, + "epoch": 0.72, + "learning_rate": 0.00019249859376174562, + "loss": 0.018, "step": 276480 }, { - "epoch": 1.39, - "learning_rate": 9.076085585562859e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001924947055453742, + "loss": 0.014, "step": 276490 }, { - "epoch": 1.39, - "learning_rate": 9.075328816261458e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.0001924908173290027, + "loss": 0.018, "step": 276500 }, { - "epoch": 1.4, - "learning_rate": 9.074572046960056e-05, - "loss": 0.0112, + "epoch": 0.72, + "learning_rate": 0.00019248692911263125, + "loss": 0.0116, "step": 276510 }, { - "epoch": 1.4, - "learning_rate": 9.073815277658656e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.00019248304089625976, + "loss": 0.0145, "step": 276520 }, { - "epoch": 1.4, - "learning_rate": 9.073058508357255e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019247915267988833, + "loss": 0.0154, "step": 276530 }, { - "epoch": 1.4, - "learning_rate": 9.072301739055854e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019247526446351684, + "loss": 0.0147, "step": 276540 }, { - "epoch": 1.4, - "learning_rate": 9.071544969754453e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019247137624714539, + "loss": 0.0138, "step": 276550 }, { - "epoch": 1.4, - "learning_rate": 9.070788200453053e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001924674880307739, + "loss": 0.0149, "step": 276560 }, { - "epoch": 1.4, - "learning_rate": 9.07003143115165e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019246359981440247, + "loss": 0.0179, "step": 276570 }, { - "epoch": 1.4, - "learning_rate": 9.06927466185025e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019245971159803098, + "loss": 0.0139, "step": 276580 }, { - "epoch": 1.4, - "learning_rate": 9.068517892548848e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019245582338165952, + "loss": 0.0196, "step": 276590 }, { - "epoch": 1.4, - "learning_rate": 9.067761123247448e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019245193516528804, + "loss": 0.0175, "step": 276600 }, { - "epoch": 1.4, - "learning_rate": 9.067004353946047e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.0001924480469489166, + "loss": 0.0119, "step": 276610 }, { - "epoch": 1.4, - "learning_rate": 9.066247584644645e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019244415873254515, + "loss": 0.0145, "step": 276620 }, { - "epoch": 1.4, - "learning_rate": 9.065490815343245e-05, - "loss": 0.0056, + "epoch": 0.72, + "learning_rate": 0.00019244027051617366, + "loss": 0.0107, "step": 276630 }, { - "epoch": 1.4, - "learning_rate": 9.064734046041844e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001924363822998022, + "loss": 0.018, "step": 276640 }, { - "epoch": 1.4, - "learning_rate": 9.063977276740443e-05, - "loss": 0.0062, + "epoch": 0.72, + "learning_rate": 0.00019243249408343072, + "loss": 0.0154, "step": 276650 }, { - "epoch": 1.4, - "learning_rate": 9.063220507439042e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001924286058670593, + "loss": 0.0161, "step": 276660 }, { - "epoch": 1.4, - "learning_rate": 9.06246373813764e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.0001924247176506878, + "loss": 0.0137, "step": 276670 }, { - "epoch": 1.4, - "learning_rate": 9.06170696883624e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019242082943431635, + "loss": 0.0173, "step": 276680 }, { - "epoch": 1.4, - "learning_rate": 9.060950199534839e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019241694121794486, + "loss": 0.0189, "step": 276690 }, { - "epoch": 1.4, - "learning_rate": 9.060193430233437e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019241305300157343, + "loss": 0.0155, "step": 276700 }, { - "epoch": 1.4, - "learning_rate": 9.059436660932037e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019240916478520194, + "loss": 0.0168, "step": 276710 }, { - "epoch": 1.4, - "learning_rate": 9.058679891630636e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019240527656883048, + "loss": 0.0179, "step": 276720 }, { - "epoch": 1.4, - "learning_rate": 9.057923122329235e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.000192401388352459, + "loss": 0.0175, "step": 276730 }, { - "epoch": 1.4, - "learning_rate": 9.057166353027834e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019239750013608757, + "loss": 0.0159, "step": 276740 }, { - "epoch": 1.4, - "learning_rate": 9.056409583726432e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019239361191971608, + "loss": 0.0133, "step": 276750 }, { - "epoch": 1.4, - "learning_rate": 9.055652814425032e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019238972370334462, + "loss": 0.0148, "step": 276760 }, { - "epoch": 1.4, - "learning_rate": 9.054896045123631e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019238583548697314, + "loss": 0.0149, "step": 276770 }, { - "epoch": 1.4, - "learning_rate": 9.054139275822229e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001923819472706017, + "loss": 0.0186, "step": 276780 }, { - "epoch": 1.4, - "learning_rate": 9.053382506520829e-05, - "loss": 0.0057, + "epoch": 0.72, + "learning_rate": 0.00019237805905423025, + "loss": 0.0132, "step": 276790 }, { - "epoch": 1.4, - "learning_rate": 9.052625737219428e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019237417083785876, + "loss": 0.0137, "step": 276800 }, { - "epoch": 1.4, - "learning_rate": 9.051868967918026e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.0001923702826214873, + "loss": 0.0162, "step": 276810 }, { - "epoch": 1.4, - "learning_rate": 9.051112198616626e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019236639440511585, + "loss": 0.0143, "step": 276820 }, { - "epoch": 1.4, - "learning_rate": 9.050355429315223e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.0001923625061887444, + "loss": 0.0169, "step": 276830 }, { - "epoch": 1.4, - "learning_rate": 9.049598660013822e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.0001923586179723729, + "loss": 0.0201, "step": 276840 }, { - "epoch": 1.4, - "learning_rate": 9.04884189071242e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019235472975600144, + "loss": 0.014, "step": 276850 }, { - "epoch": 1.4, - "learning_rate": 9.04808512141102e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019235084153963, + "loss": 0.0176, "step": 276860 }, { - "epoch": 1.4, - "learning_rate": 9.04732835210962e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019234695332325853, + "loss": 0.0142, "step": 276870 }, { - "epoch": 1.4, - "learning_rate": 9.046571582808218e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.00019234306510688704, + "loss": 0.0142, "step": 276880 }, { - "epoch": 1.4, - "learning_rate": 9.045814813506817e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019233917689051558, + "loss": 0.0135, "step": 276890 }, { - "epoch": 1.4, - "learning_rate": 9.045058044205417e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.0001923352886741441, + "loss": 0.0165, "step": 276900 }, { - "epoch": 1.4, - "learning_rate": 9.044301274904015e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019233140045777267, + "loss": 0.0167, "step": 276910 }, { - "epoch": 1.4, - "learning_rate": 9.043544505602614e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019232751224140118, + "loss": 0.0155, "step": 276920 }, { - "epoch": 1.4, - "learning_rate": 9.042787736301214e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019232362402502972, + "loss": 0.0172, "step": 276930 }, { - "epoch": 1.4, - "learning_rate": 9.042030966999812e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.00019231973580865824, + "loss": 0.0227, "step": 276940 }, { - "epoch": 1.4, - "learning_rate": 9.041274197698411e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.0001923158475922868, + "loss": 0.0176, "step": 276950 }, { - "epoch": 1.4, - "learning_rate": 9.04051742839701e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019231195937591535, + "loss": 0.0158, "step": 276960 }, { - "epoch": 1.4, - "learning_rate": 9.039760659095609e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019230807115954386, + "loss": 0.0134, "step": 276970 }, { - "epoch": 1.4, - "learning_rate": 9.039003889794208e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019230418294317238, + "loss": 0.0152, "step": 276980 }, { - "epoch": 1.4, - "learning_rate": 9.038247120492807e-05, - "loss": 0.0109, + "epoch": 0.72, + "learning_rate": 0.00019230029472680095, + "loss": 0.0171, "step": 276990 }, { - "epoch": 1.4, - "learning_rate": 9.037490351191406e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.0001922964065104295, + "loss": 0.0138, "step": 277000 }, { - "epoch": 1.4, - "eval_cer": 0.9144246472852683, - "eval_loss": 0.0058305272832512856, - "eval_runtime": 115.9259, - "eval_samples_per_second": 17.252, - "eval_steps_per_second": 4.313, + "epoch": 0.72, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.010107412934303284, + "eval_runtime": 108.0568, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, "step": 277000 }, { - "epoch": 1.4, - "learning_rate": 9.036733581890006e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.000192292518294058, + "loss": 0.012, "step": 277010 }, { - "epoch": 1.4, - "learning_rate": 9.035976812588604e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019228863007768654, + "loss": 0.0118, "step": 277020 }, { - "epoch": 1.4, - "learning_rate": 9.035220043287203e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019228474186131509, + "loss": 0.0182, "step": 277030 }, { - "epoch": 1.4, - "learning_rate": 9.034463273985801e-05, - "loss": 0.0185, + "epoch": 0.72, + "learning_rate": 0.00019228085364494363, + "loss": 0.0176, "step": 277040 }, { - "epoch": 1.4, - "learning_rate": 9.033706504684401e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019227696542857214, + "loss": 0.0138, "step": 277050 }, { - "epoch": 1.4, - "learning_rate": 9.032949735383e-05, - "loss": 0.0105, + "epoch": 0.72, + "learning_rate": 0.00019227307721220068, + "loss": 0.0124, "step": 277060 }, { - "epoch": 1.4, - "learning_rate": 9.032192966081599e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019226918899582923, + "loss": 0.0124, "step": 277070 }, { - "epoch": 1.4, - "learning_rate": 9.031436196780198e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.00019226530077945777, + "loss": 0.0164, "step": 277080 }, { - "epoch": 1.4, - "learning_rate": 9.030679427478798e-05, - "loss": 0.0111, + "epoch": 0.72, + "learning_rate": 0.00019226141256308628, + "loss": 0.0137, "step": 277090 }, { - "epoch": 1.4, - "learning_rate": 9.029922658177396e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019225752434671482, + "loss": 0.0167, "step": 277100 }, { - "epoch": 1.4, - "learning_rate": 9.029165888875995e-05, - "loss": 0.0076, - "step": 277110 + "epoch": 0.72, + "learning_rate": 0.0001922536361303434, + "loss": 0.0157, + "step": 277110 }, { - "epoch": 1.4, - "learning_rate": 9.028409119574593e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001922497479139719, + "loss": 0.0148, "step": 277120 }, { - "epoch": 1.4, - "learning_rate": 9.027652350273193e-05, - "loss": 0.0106, + "epoch": 0.72, + "learning_rate": 0.00019224585969760045, + "loss": 0.0154, "step": 277130 }, { - "epoch": 1.4, - "learning_rate": 9.026895580971792e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019224197148122896, + "loss": 0.0166, "step": 277140 }, { - "epoch": 1.4, - "learning_rate": 9.02613881167039e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019223808326485748, + "loss": 0.0136, "step": 277150 }, { - "epoch": 1.4, - "learning_rate": 9.02538204236899e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019223419504848605, + "loss": 0.0142, "step": 277160 }, { - "epoch": 1.4, - "learning_rate": 9.02462527306759e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001922303068321146, + "loss": 0.015, "step": 277170 }, { - "epoch": 1.4, - "learning_rate": 9.023868503766188e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001922264186157431, + "loss": 0.0166, "step": 277180 }, { - "epoch": 1.4, - "learning_rate": 9.023111734464787e-05, - "loss": 0.0056, + "epoch": 0.72, + "learning_rate": 0.00019222253039937164, + "loss": 0.0163, "step": 277190 }, { - "epoch": 1.4, - "learning_rate": 9.022354965163385e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019221864218300019, + "loss": 0.0165, "step": 277200 }, { - "epoch": 1.4, - "learning_rate": 9.021598195861985e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019221475396662873, + "loss": 0.0167, "step": 277210 }, { - "epoch": 1.4, - "learning_rate": 9.020841426560584e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019221086575025724, + "loss": 0.0196, "step": 277220 }, { - "epoch": 1.4, - "learning_rate": 9.020084657259182e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019220697753388578, + "loss": 0.015, "step": 277230 }, { - "epoch": 1.4, - "learning_rate": 9.019327887957782e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019220308931751432, + "loss": 0.0203, "step": 277240 }, { - "epoch": 1.4, - "learning_rate": 9.018571118656381e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019219920110114287, + "loss": 0.0171, "step": 277250 }, { - "epoch": 1.4, - "learning_rate": 9.01781434935498e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019219531288477138, + "loss": 0.0163, "step": 277260 }, { - "epoch": 1.4, - "learning_rate": 9.017057580053579e-05, - "loss": 0.0062, + "epoch": 0.72, + "learning_rate": 0.00019219142466839992, + "loss": 0.0175, "step": 277270 }, { - "epoch": 1.4, - "learning_rate": 9.016300810752177e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.0001921875364520285, + "loss": 0.0186, "step": 277280 }, { - "epoch": 1.4, - "learning_rate": 9.015544041450777e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.000192183648235657, + "loss": 0.011, "step": 277290 }, { - "epoch": 1.4, - "learning_rate": 9.014787272149376e-05, - "loss": 0.0109, + "epoch": 0.72, + "learning_rate": 0.00019217976001928552, + "loss": 0.0144, "step": 277300 }, { - "epoch": 1.4, - "learning_rate": 9.014030502847974e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019217587180291406, + "loss": 0.0161, "step": 277310 }, { - "epoch": 1.4, - "learning_rate": 9.013273733546574e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019217198358654263, + "loss": 0.0131, "step": 277320 }, { - "epoch": 1.4, - "learning_rate": 9.012516964245173e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019216809537017115, + "loss": 0.0124, "step": 277330 }, { - "epoch": 1.4, - "learning_rate": 9.011760194943771e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001921642071537997, + "loss": 0.0137, "step": 277340 }, { - "epoch": 1.4, - "learning_rate": 9.011003425642371e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.0001921603189374282, + "loss": 0.0142, "step": 277350 }, { - "epoch": 1.4, - "learning_rate": 9.010246656340969e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019215643072105677, + "loss": 0.0115, "step": 277360 }, { - "epoch": 1.4, - "learning_rate": 9.009489887039569e-05, - "loss": 0.0094, + "epoch": 0.72, + "learning_rate": 0.00019215254250468528, + "loss": 0.0148, "step": 277370 }, { - "epoch": 1.4, - "learning_rate": 9.008733117738168e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019214865428831383, + "loss": 0.0119, "step": 277380 }, { - "epoch": 1.4, - "learning_rate": 9.007976348436766e-05, - "loss": 0.0059, + "epoch": 0.72, + "learning_rate": 0.00019214476607194234, + "loss": 0.0178, "step": 277390 }, { - "epoch": 1.4, - "learning_rate": 9.007219579135366e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019214087785557088, + "loss": 0.0169, "step": 277400 }, { - "epoch": 1.4, - "learning_rate": 9.006462809833965e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019213698963919942, + "loss": 0.0159, "step": 277410 }, { - "epoch": 1.4, - "learning_rate": 9.005706040532563e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019213310142282797, + "loss": 0.0169, "step": 277420 }, { - "epoch": 1.4, - "learning_rate": 9.004949271231163e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019212921320645648, + "loss": 0.0174, "step": 277430 }, { - "epoch": 1.4, - "learning_rate": 9.004192501929761e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.00019212532499008502, + "loss": 0.0124, "step": 277440 }, { - "epoch": 1.4, - "learning_rate": 9.00343573262836e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001921214367737136, + "loss": 0.0172, "step": 277450 }, { - "epoch": 1.4, - "learning_rate": 9.002678963326959e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.0001921175485573421, + "loss": 0.0123, "step": 277460 }, { - "epoch": 1.4, - "learning_rate": 9.001922194025557e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019211366034097062, + "loss": 0.0134, "step": 277470 }, { - "epoch": 1.4, - "learning_rate": 9.001165424724156e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019210977212459916, + "loss": 0.0139, "step": 277480 }, { - "epoch": 1.4, - "learning_rate": 9.000408655422754e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019210588390822773, + "loss": 0.0184, "step": 277490 }, { - "epoch": 1.4, - "learning_rate": 8.999651886121354e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019210199569185624, + "loss": 0.0141, "step": 277500 }, { - "epoch": 1.4, - "learning_rate": 8.998895116819953e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.0001920981074754848, + "loss": 0.0144, "step": 277510 }, { - "epoch": 1.4, - "learning_rate": 8.998138347518552e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001920942192591133, + "loss": 0.0127, "step": 277520 }, { - "epoch": 1.4, - "learning_rate": 8.997381578217151e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019209033104274187, + "loss": 0.0123, "step": 277530 }, { - "epoch": 1.4, - "learning_rate": 8.99662480891575e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019208644282637038, + "loss": 0.0163, "step": 277540 }, { - "epoch": 1.4, - "learning_rate": 8.995868039614349e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019208255460999893, + "loss": 0.0171, "step": 277550 }, { - "epoch": 1.4, - "learning_rate": 8.995111270312948e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019207866639362744, + "loss": 0.0145, "step": 277560 }, { - "epoch": 1.4, - "learning_rate": 8.994354501011546e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.000192074778177256, + "loss": 0.012, "step": 277570 }, { - "epoch": 1.4, - "learning_rate": 8.993597731710146e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019207088996088452, + "loss": 0.0165, "step": 277580 }, { - "epoch": 1.4, - "learning_rate": 8.992840962408745e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019206700174451307, + "loss": 0.0164, "step": 277590 }, { - "epoch": 1.4, - "learning_rate": 8.992084193107344e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019206311352814158, + "loss": 0.0165, "step": 277600 }, { - "epoch": 1.4, - "learning_rate": 8.991327423805943e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019205922531177015, + "loss": 0.0204, "step": 277610 }, { - "epoch": 1.4, - "learning_rate": 8.990570654504543e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019205533709539866, + "loss": 0.0124, "step": 277620 }, { - "epoch": 1.4, - "learning_rate": 8.989813885203141e-05, - "loss": 0.0061, + "epoch": 0.72, + "learning_rate": 0.0001920514488790272, + "loss": 0.0147, "step": 277630 }, { - "epoch": 1.4, - "learning_rate": 8.98905711590174e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019204756066265572, + "loss": 0.0125, "step": 277640 }, { - "epoch": 1.4, - "learning_rate": 8.988300346600338e-05, - "loss": 0.0055, + "epoch": 0.72, + "learning_rate": 0.00019204367244628426, + "loss": 0.0127, "step": 277650 }, { - "epoch": 1.4, - "learning_rate": 8.987543577298938e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019203978422991283, + "loss": 0.0158, "step": 277660 }, { - "epoch": 1.4, - "learning_rate": 8.986786807997537e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019203589601354134, + "loss": 0.0138, "step": 277670 }, { - "epoch": 1.4, - "learning_rate": 8.986030038696135e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019203200779716989, + "loss": 0.0154, "step": 277680 }, { - "epoch": 1.4, - "learning_rate": 8.985273269394735e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.0001920281195807984, + "loss": 0.0184, "step": 277690 }, { - "epoch": 1.4, - "learning_rate": 8.984516500093334e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019202423136442697, + "loss": 0.0141, "step": 277700 }, { - "epoch": 1.4, - "learning_rate": 8.983759730791933e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019202034314805548, + "loss": 0.0165, "step": 277710 }, { - "epoch": 1.4, - "learning_rate": 8.983002961490532e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019201645493168403, + "loss": 0.0154, "step": 277720 }, { - "epoch": 1.4, - "learning_rate": 8.98224619218913e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019201256671531254, + "loss": 0.0163, "step": 277730 }, { - "epoch": 1.4, - "learning_rate": 8.98148942288773e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001920086784989411, + "loss": 0.0162, "step": 277740 }, { - "epoch": 1.4, - "learning_rate": 8.980732653586329e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019200479028256962, + "loss": 0.0169, "step": 277750 }, { - "epoch": 1.4, - "learning_rate": 8.979975884284927e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019200090206619816, + "loss": 0.0128, "step": 277760 }, { - "epoch": 1.4, - "learning_rate": 8.979219114983527e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019199701384982668, + "loss": 0.0167, "step": 277770 }, { - "epoch": 1.4, - "learning_rate": 8.978462345682126e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019199312563345525, + "loss": 0.0165, "step": 277780 }, { - "epoch": 1.4, - "learning_rate": 8.977705576380725e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019198923741708376, + "loss": 0.0121, "step": 277790 }, { - "epoch": 1.4, - "learning_rate": 8.976948807079324e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.0001919853492007123, + "loss": 0.0131, "step": 277800 }, { - "epoch": 1.4, - "learning_rate": 8.976192037777922e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019198146098434082, + "loss": 0.0132, "step": 277810 }, { - "epoch": 1.4, - "learning_rate": 8.975435268476522e-05, - "loss": 0.0098, + "epoch": 0.72, + "learning_rate": 0.0001919775727679694, + "loss": 0.0108, "step": 277820 }, { - "epoch": 1.4, - "learning_rate": 8.974678499175121e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019197368455159793, + "loss": 0.0165, "step": 277830 }, { - "epoch": 1.4, - "learning_rate": 8.97392172987372e-05, - "loss": 0.0104, + "epoch": 0.72, + "learning_rate": 0.00019196979633522644, + "loss": 0.0148, "step": 277840 }, { - "epoch": 1.4, - "learning_rate": 8.973164960572319e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019196590811885499, + "loss": 0.0133, "step": 277850 }, { - "epoch": 1.4, - "learning_rate": 8.972408191270918e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019196201990248353, + "loss": 0.0137, "step": 277860 }, { - "epoch": 1.4, - "learning_rate": 8.971651421969516e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019195813168611207, + "loss": 0.0128, "step": 277870 }, { - "epoch": 1.4, - "learning_rate": 8.970894652668116e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019195424346974058, + "loss": 0.0159, "step": 277880 }, { - "epoch": 1.4, - "learning_rate": 8.970137883366714e-05, - "loss": 0.0055, + "epoch": 0.72, + "learning_rate": 0.00019195035525336912, + "loss": 0.0165, "step": 277890 }, { - "epoch": 1.4, - "learning_rate": 8.969381114065314e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019194646703699764, + "loss": 0.0209, "step": 277900 }, { - "epoch": 1.4, - "learning_rate": 8.968624344763913e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001919425788206262, + "loss": 0.0189, "step": 277910 }, { - "epoch": 1.4, - "learning_rate": 8.967867575462511e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019193869060425472, + "loss": 0.0159, "step": 277920 }, { - "epoch": 1.4, - "learning_rate": 8.967110806161111e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019193480238788326, + "loss": 0.0148, "step": 277930 }, { - "epoch": 1.4, - "learning_rate": 8.96635403685971e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019193091417151178, + "loss": 0.0143, "step": 277940 }, { - "epoch": 1.4, - "learning_rate": 8.965597267558308e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019192702595514035, + "loss": 0.0146, "step": 277950 }, { - "epoch": 1.4, - "learning_rate": 8.964840498256908e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019192313773876886, + "loss": 0.0161, "step": 277960 }, { - "epoch": 1.4, - "learning_rate": 8.964083728955507e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.0001919192495223974, + "loss": 0.0136, "step": 277970 }, { - "epoch": 1.4, - "learning_rate": 8.963326959654106e-05, - "loss": 0.0061, + "epoch": 0.72, + "learning_rate": 0.00019191536130602592, + "loss": 0.0156, "step": 277980 }, { - "epoch": 1.4, - "learning_rate": 8.962570190352705e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.0001919114730896545, + "loss": 0.0179, "step": 277990 }, { - "epoch": 1.4, - "learning_rate": 8.961813421051303e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019190758487328303, + "loss": 0.0139, "step": 278000 }, { - "epoch": 1.4, - "eval_cer": 0.9144246472852683, - "eval_loss": 0.0060167377814650536, - "eval_runtime": 116.7043, - "eval_samples_per_second": 17.137, - "eval_steps_per_second": 4.284, + "epoch": 0.72, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.010161010548472404, + "eval_runtime": 108.0178, + "eval_samples_per_second": 18.515, + "eval_steps_per_second": 4.629, "step": 278000 }, { - "epoch": 1.4, - "learning_rate": 8.961056651749903e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019190369665691154, + "loss": 0.0165, "step": 278010 }, { - "epoch": 1.4, - "learning_rate": 8.960299882448502e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019189980844054006, + "loss": 0.0169, "step": 278020 }, { - "epoch": 1.4, - "learning_rate": 8.9595431131471e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019189592022416863, + "loss": 0.0142, "step": 278030 }, { - "epoch": 1.4, - "learning_rate": 8.9587863438457e-05, - "loss": 0.0053, + "epoch": 0.72, + "learning_rate": 0.00019189203200779717, + "loss": 0.0107, "step": 278040 }, { - "epoch": 1.4, - "learning_rate": 8.9580295745443e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019188814379142568, + "loss": 0.0135, "step": 278050 }, { - "epoch": 1.4, - "learning_rate": 8.957272805242897e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019188425557505422, + "loss": 0.0125, "step": 278060 }, { - "epoch": 1.4, - "learning_rate": 8.956516035941497e-05, - "loss": 0.0333, + "epoch": 0.72, + "learning_rate": 0.00019188036735868277, + "loss": 0.0164, "step": 278070 }, { - "epoch": 1.4, - "learning_rate": 8.955759266640095e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.0001918764791423113, + "loss": 0.0132, "step": 278080 }, { - "epoch": 1.4, - "learning_rate": 8.955002497338693e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.00019187259092593982, + "loss": 0.0191, "step": 278090 }, { - "epoch": 1.4, - "learning_rate": 8.954245728037291e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.00019186870270956836, + "loss": 0.0155, "step": 278100 }, { - "epoch": 1.4, - "learning_rate": 8.953488958735891e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001918648144931969, + "loss": 0.0146, "step": 278110 }, { - "epoch": 1.4, - "learning_rate": 8.95273218943449e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019186092627682545, + "loss": 0.0122, "step": 278120 }, { - "epoch": 1.4, - "learning_rate": 8.951975420133089e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.00019185703806045396, + "loss": 0.0182, "step": 278130 }, { - "epoch": 1.4, - "learning_rate": 8.951218650831688e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.0001918531498440825, + "loss": 0.0146, "step": 278140 }, { - "epoch": 1.4, - "learning_rate": 8.950461881530288e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019184926162771102, + "loss": 0.0137, "step": 278150 }, { - "epoch": 1.4, - "learning_rate": 8.949705112228886e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.00019184537341133959, + "loss": 0.0163, "step": 278160 }, { - "epoch": 1.4, - "learning_rate": 8.948948342927485e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001918414851949681, + "loss": 0.0163, "step": 278170 }, { - "epoch": 1.4, - "learning_rate": 8.948191573626083e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019183759697859664, + "loss": 0.0123, "step": 278180 }, { - "epoch": 1.4, - "learning_rate": 8.947434804324683e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019183370876222516, + "loss": 0.0177, "step": 278190 }, { - "epoch": 1.4, - "learning_rate": 8.946678035023282e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019182982054585373, + "loss": 0.0125, "step": 278200 }, { - "epoch": 1.4, - "learning_rate": 8.94592126572188e-05, - "loss": 0.0058, + "epoch": 0.72, + "learning_rate": 0.00019182593232948227, + "loss": 0.0119, "step": 278210 }, { - "epoch": 1.4, - "learning_rate": 8.94516449642048e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019182204411311078, + "loss": 0.0114, "step": 278220 }, { - "epoch": 1.4, - "learning_rate": 8.94440772711908e-05, - "loss": 0.0097, + "epoch": 0.72, + "learning_rate": 0.00019181815589673932, + "loss": 0.0117, "step": 278230 }, { - "epoch": 1.4, - "learning_rate": 8.943650957817678e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019181426768036787, + "loss": 0.0173, "step": 278240 }, { - "epoch": 1.4, - "learning_rate": 8.942894188516277e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.0001918103794639964, + "loss": 0.0125, "step": 278250 }, { - "epoch": 1.4, - "learning_rate": 8.942137419214875e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019180649124762492, + "loss": 0.0133, "step": 278260 }, { - "epoch": 1.4, - "learning_rate": 8.941380649913475e-05, - "loss": 0.0104, + "epoch": 0.72, + "learning_rate": 0.00019180260303125346, + "loss": 0.0144, "step": 278270 }, { - "epoch": 1.4, - "learning_rate": 8.940623880612074e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.000191798714814882, + "loss": 0.0141, "step": 278280 }, { - "epoch": 1.4, - "learning_rate": 8.939867111310672e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019179482659851055, + "loss": 0.0171, "step": 278290 }, { - "epoch": 1.4, - "learning_rate": 8.939110342009272e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019179093838213906, + "loss": 0.0188, "step": 278300 }, { - "epoch": 1.4, - "learning_rate": 8.938353572707871e-05, - "loss": 0.0117, + "epoch": 0.72, + "learning_rate": 0.0001917870501657676, + "loss": 0.0138, "step": 278310 }, { - "epoch": 1.4, - "learning_rate": 8.93759680340647e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.00019178316194939617, + "loss": 0.0136, "step": 278320 }, { - "epoch": 1.4, - "learning_rate": 8.936840034105069e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019177927373302469, + "loss": 0.015, "step": 278330 }, { - "epoch": 1.4, - "learning_rate": 8.936083264803667e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.0001917753855166532, + "loss": 0.0151, "step": 278340 }, { - "epoch": 1.4, - "learning_rate": 8.935326495502267e-05, - "loss": 0.01, + "epoch": 0.72, + "learning_rate": 0.00019177149730028174, + "loss": 0.0126, "step": 278350 }, { - "epoch": 1.4, - "learning_rate": 8.934569726200866e-05, - "loss": 0.0098, + "epoch": 0.72, + "learning_rate": 0.0001917676090839103, + "loss": 0.0107, "step": 278360 }, { - "epoch": 1.4, - "learning_rate": 8.933812956899464e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019176372086753883, + "loss": 0.0143, "step": 278370 }, { - "epoch": 1.4, - "learning_rate": 8.933056187598064e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019175983265116737, + "loss": 0.0163, "step": 278380 }, { - "epoch": 1.4, - "learning_rate": 8.932299418296663e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019175594443479588, + "loss": 0.0155, "step": 278390 }, { - "epoch": 1.4, - "learning_rate": 8.931542648995261e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019175205621842442, + "loss": 0.0142, "step": 278400 }, { - "epoch": 1.4, - "learning_rate": 8.930785879693861e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019174816800205296, + "loss": 0.013, "step": 278410 }, { - "epoch": 1.4, - "learning_rate": 8.93002911039246e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.0001917442797856815, + "loss": 0.0151, "step": 278420 }, { - "epoch": 1.4, - "learning_rate": 8.929272341091059e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.00019174039156931002, + "loss": 0.0183, "step": 278430 }, { - "epoch": 1.4, - "learning_rate": 8.928515571789658e-05, - "loss": 0.0086, + "epoch": 0.72, + "learning_rate": 0.00019173650335293856, + "loss": 0.015, "step": 278440 }, { - "epoch": 1.4, - "learning_rate": 8.927758802488256e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.0001917326151365671, + "loss": 0.0162, "step": 278450 }, { - "epoch": 1.4, - "learning_rate": 8.927002033186856e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019172872692019565, + "loss": 0.0141, "step": 278460 }, { - "epoch": 1.4, - "learning_rate": 8.926245263885455e-05, - "loss": 0.007, + "epoch": 0.72, + "learning_rate": 0.00019172483870382416, + "loss": 0.0145, "step": 278470 }, { - "epoch": 1.4, - "learning_rate": 8.925488494584053e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.0001917209504874527, + "loss": 0.0138, "step": 278480 }, { - "epoch": 1.41, - "learning_rate": 8.924731725282653e-05, - "loss": 0.0057, + "epoch": 0.72, + "learning_rate": 0.00019171706227108124, + "loss": 0.0133, "step": 278490 }, { - "epoch": 1.41, - "learning_rate": 8.923974955981252e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019171317405470979, + "loss": 0.013, "step": 278500 }, { - "epoch": 1.41, - "learning_rate": 8.92321818667985e-05, - "loss": 0.0075, + "epoch": 0.72, + "learning_rate": 0.0001917092858383383, + "loss": 0.0161, "step": 278510 }, { - "epoch": 1.41, - "learning_rate": 8.92246141737845e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019170539762196684, + "loss": 0.0164, "step": 278520 }, { - "epoch": 1.41, - "learning_rate": 8.921704648077048e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001917015094055954, + "loss": 0.0134, "step": 278530 }, { - "epoch": 1.41, - "learning_rate": 8.920947878775648e-05, - "loss": 0.0058, + "epoch": 0.72, + "learning_rate": 0.00019169762118922392, + "loss": 0.0197, "step": 278540 }, { - "epoch": 1.41, - "learning_rate": 8.920191109474247e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019169373297285247, + "loss": 0.0161, "step": 278550 }, { - "epoch": 1.41, - "learning_rate": 8.919434340172845e-05, - "loss": 0.0095, + "epoch": 0.72, + "learning_rate": 0.00019168984475648098, + "loss": 0.0134, "step": 278560 }, { - "epoch": 1.41, - "learning_rate": 8.918677570871445e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019168595654010955, + "loss": 0.016, "step": 278570 }, { - "epoch": 1.41, - "learning_rate": 8.917920801570044e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019168206832373806, + "loss": 0.0154, "step": 278580 }, { - "epoch": 1.41, - "learning_rate": 8.917164032268643e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.0001916781801073666, + "loss": 0.0162, "step": 278590 }, { - "epoch": 1.41, - "learning_rate": 8.916407262967242e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019167429189099512, + "loss": 0.0133, "step": 278600 }, { - "epoch": 1.41, - "learning_rate": 8.91565049366584e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.0001916704036746237, + "loss": 0.0143, "step": 278610 }, { - "epoch": 1.41, - "learning_rate": 8.91489372436444e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001916665154582522, + "loss": 0.019, "step": 278620 }, { - "epoch": 1.41, - "learning_rate": 8.914136955063039e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019166262724188075, + "loss": 0.0133, "step": 278630 }, { - "epoch": 1.41, - "learning_rate": 8.913380185761637e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019165873902550926, + "loss": 0.0151, "step": 278640 }, { - "epoch": 1.41, - "learning_rate": 8.912623416460237e-05, - "loss": 0.0067, + "epoch": 0.72, + "learning_rate": 0.0001916548508091378, + "loss": 0.0135, "step": 278650 }, { - "epoch": 1.41, - "learning_rate": 8.911866647158836e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019165096259276634, + "loss": 0.0149, "step": 278660 }, { - "epoch": 1.41, - "learning_rate": 8.911109877857434e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019164707437639488, + "loss": 0.0159, "step": 278670 }, { - "epoch": 1.41, - "learning_rate": 8.910353108556034e-05, - "loss": 0.0163, + "epoch": 0.72, + "learning_rate": 0.0001916431861600234, + "loss": 0.0146, "step": 278680 }, { - "epoch": 1.41, - "learning_rate": 8.909596339254632e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019163929794365194, + "loss": 0.0118, "step": 278690 }, { - "epoch": 1.41, - "learning_rate": 8.908839569953232e-05, - "loss": 0.0058, + "epoch": 0.72, + "learning_rate": 0.0001916354097272805, + "loss": 0.0122, "step": 278700 }, { - "epoch": 1.41, - "learning_rate": 8.908082800651831e-05, - "loss": 0.0087, + "epoch": 0.72, + "learning_rate": 0.00019163152151090902, + "loss": 0.0157, "step": 278710 }, { - "epoch": 1.41, - "learning_rate": 8.907326031350428e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019162763329453757, + "loss": 0.0177, "step": 278720 }, { - "epoch": 1.41, - "learning_rate": 8.906569262049027e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019162374507816608, + "loss": 0.0124, "step": 278730 }, { - "epoch": 1.41, - "learning_rate": 8.905812492747626e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019161985686179465, + "loss": 0.0136, "step": 278740 }, { - "epoch": 1.41, - "learning_rate": 8.905055723446225e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019161596864542316, + "loss": 0.0136, "step": 278750 }, { - "epoch": 1.41, - "learning_rate": 8.904298954144825e-05, - "loss": 0.0115, + "epoch": 0.72, + "learning_rate": 0.0001916120804290517, + "loss": 0.0133, "step": 278760 }, { - "epoch": 1.41, - "learning_rate": 8.903542184843423e-05, - "loss": 0.0111, + "epoch": 0.72, + "learning_rate": 0.00019160819221268022, + "loss": 0.0177, "step": 278770 }, { - "epoch": 1.41, - "learning_rate": 8.902785415542022e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.0001916043039963088, + "loss": 0.0153, "step": 278780 }, { - "epoch": 1.41, - "learning_rate": 8.90202864624062e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.0001916004157799373, + "loss": 0.0142, "step": 278790 }, { - "epoch": 1.41, - "learning_rate": 8.90127187693922e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019159652756356584, + "loss": 0.0167, "step": 278800 }, { - "epoch": 1.41, - "learning_rate": 8.900515107637819e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019159263934719436, + "loss": 0.0181, "step": 278810 }, { - "epoch": 1.41, - "learning_rate": 8.899758338336417e-05, - "loss": 0.009, + "epoch": 0.72, + "learning_rate": 0.00019158875113082293, + "loss": 0.0117, "step": 278820 }, { - "epoch": 1.41, - "learning_rate": 8.899001569035017e-05, - "loss": 0.0107, + "epoch": 0.72, + "learning_rate": 0.00019158486291445144, + "loss": 0.0162, "step": 278830 }, { - "epoch": 1.41, - "learning_rate": 8.898244799733616e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.00019158097469807998, + "loss": 0.0138, "step": 278840 }, { - "epoch": 1.41, - "learning_rate": 8.897488030432215e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001915770864817085, + "loss": 0.0188, "step": 278850 }, { - "epoch": 1.41, - "learning_rate": 8.896731261130814e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019157319826533707, + "loss": 0.0164, "step": 278860 }, { - "epoch": 1.41, - "learning_rate": 8.895974491829414e-05, - "loss": 0.0059, + "epoch": 0.72, + "learning_rate": 0.0001915693100489656, + "loss": 0.0143, "step": 278870 }, { - "epoch": 1.41, - "learning_rate": 8.895217722528012e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019156542183259412, + "loss": 0.0171, "step": 278880 }, { - "epoch": 1.41, - "learning_rate": 8.894460953226611e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.00019156153361622264, + "loss": 0.0156, "step": 278890 }, { - "epoch": 1.41, - "learning_rate": 8.89370418392521e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019155764539985118, + "loss": 0.0157, "step": 278900 }, { - "epoch": 1.41, - "learning_rate": 8.892947414623809e-05, - "loss": 0.0057, + "epoch": 0.72, + "learning_rate": 0.00019155375718347975, + "loss": 0.0133, "step": 278910 }, { - "epoch": 1.41, - "learning_rate": 8.892190645322408e-05, - "loss": 0.0089, + "epoch": 0.72, + "learning_rate": 0.00019154986896710826, + "loss": 0.0246, "step": 278920 }, { - "epoch": 1.41, - "learning_rate": 8.891433876021007e-05, - "loss": 0.0064, + "epoch": 0.72, + "learning_rate": 0.0001915459807507368, + "loss": 0.0165, "step": 278930 }, { - "epoch": 1.41, - "learning_rate": 8.890677106719606e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.00019154209253436532, + "loss": 0.0158, "step": 278940 }, { - "epoch": 1.41, - "learning_rate": 8.889920337418206e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.0001915382043179939, + "loss": 0.0173, "step": 278950 }, { - "epoch": 1.41, - "learning_rate": 8.889163568116804e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001915343161016224, + "loss": 0.0147, "step": 278960 }, { - "epoch": 1.41, - "learning_rate": 8.888406798815403e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019153042788525094, + "loss": 0.0155, "step": 278970 }, { - "epoch": 1.41, - "learning_rate": 8.887650029514001e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019152653966887946, + "loss": 0.0135, "step": 278980 }, { - "epoch": 1.41, - "learning_rate": 8.886893260212601e-05, - "loss": 0.0054, + "epoch": 0.72, + "learning_rate": 0.00019152265145250803, + "loss": 0.0136, "step": 278990 }, { - "epoch": 1.41, - "learning_rate": 8.8861364909112e-05, - "loss": 0.0108, + "epoch": 0.72, + "learning_rate": 0.00019151876323613654, + "loss": 0.0186, "step": 279000 }, { - "epoch": 1.41, - "eval_cer": 0.9144304696620207, - "eval_loss": 0.005943993106484413, - "eval_runtime": 116.6988, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.285, + "epoch": 0.72, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.010195926763117313, + "eval_runtime": 107.8323, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, "step": 279000 }, { - "epoch": 1.41, - "learning_rate": 8.885379721609798e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019151487501976508, + "loss": 0.0157, "step": 279010 }, { - "epoch": 1.41, - "learning_rate": 8.884622952308398e-05, - "loss": 0.0072, + "epoch": 0.72, + "learning_rate": 0.0001915109868033936, + "loss": 0.0154, "step": 279020 }, { - "epoch": 1.41, - "learning_rate": 8.883866183006997e-05, - "loss": 0.0059, + "epoch": 0.72, + "learning_rate": 0.00019150709858702217, + "loss": 0.0161, "step": 279030 }, { - "epoch": 1.41, - "learning_rate": 8.883109413705596e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.0001915032103706507, + "loss": 0.0144, "step": 279040 }, { - "epoch": 1.41, - "learning_rate": 8.882352644404195e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019149932215427922, + "loss": 0.0188, "step": 279050 }, { - "epoch": 1.41, - "learning_rate": 8.881595875102793e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019149543393790774, + "loss": 0.0136, "step": 279060 }, { - "epoch": 1.41, - "learning_rate": 8.880839105801393e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001914915457215363, + "loss": 0.0121, "step": 279070 }, { - "epoch": 1.41, - "learning_rate": 8.880082336499992e-05, - "loss": 0.0054, + "epoch": 0.72, + "learning_rate": 0.00019148765750516485, + "loss": 0.0196, "step": 279080 }, { - "epoch": 1.41, - "learning_rate": 8.87932556719859e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019148376928879336, + "loss": 0.015, "step": 279090 }, { - "epoch": 1.41, - "learning_rate": 8.87856879789719e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.0001914798810724219, + "loss": 0.0128, "step": 279100 }, { - "epoch": 1.41, - "learning_rate": 8.87781202859579e-05, - "loss": 0.0065, + "epoch": 0.72, + "learning_rate": 0.00019147599285605045, + "loss": 0.0124, "step": 279110 }, { - "epoch": 1.41, - "learning_rate": 8.877055259294388e-05, - "loss": 0.0083, + "epoch": 0.72, + "learning_rate": 0.000191472104639679, + "loss": 0.0138, "step": 279120 }, { - "epoch": 1.41, - "learning_rate": 8.876298489992987e-05, - "loss": 0.0102, + "epoch": 0.72, + "learning_rate": 0.0001914682164233075, + "loss": 0.0174, "step": 279130 }, { - "epoch": 1.41, - "learning_rate": 8.875541720691585e-05, - "loss": 0.0076, + "epoch": 0.72, + "learning_rate": 0.00019146432820693604, + "loss": 0.0151, "step": 279140 }, { - "epoch": 1.41, - "learning_rate": 8.874784951390185e-05, - "loss": 0.008, + "epoch": 0.72, + "learning_rate": 0.00019146043999056456, + "loss": 0.0117, "step": 279150 }, { - "epoch": 1.41, - "learning_rate": 8.874028182088784e-05, - "loss": 0.0103, + "epoch": 0.72, + "learning_rate": 0.00019145655177419313, + "loss": 0.0133, "step": 279160 }, { - "epoch": 1.41, - "learning_rate": 8.873271412787382e-05, - "loss": 0.0114, + "epoch": 0.72, + "learning_rate": 0.00019145266355782164, + "loss": 0.0146, "step": 279170 }, { - "epoch": 1.41, - "learning_rate": 8.872514643485982e-05, - "loss": 0.011, + "epoch": 0.72, + "learning_rate": 0.00019144877534145018, + "loss": 0.0143, "step": 279180 }, { - "epoch": 1.41, - "learning_rate": 8.871757874184581e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.0001914448871250787, + "loss": 0.0138, "step": 279190 }, { - "epoch": 1.41, - "learning_rate": 8.87100110488318e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019144099890870727, + "loss": 0.0114, "step": 279200 }, { - "epoch": 1.41, - "learning_rate": 8.870244335581779e-05, - "loss": 0.0108, + "epoch": 0.72, + "learning_rate": 0.00019143711069233578, + "loss": 0.0166, "step": 279210 }, { - "epoch": 1.41, - "learning_rate": 8.869487566280377e-05, - "loss": 0.01, + "epoch": 0.72, + "learning_rate": 0.00019143322247596432, + "loss": 0.0165, "step": 279220 }, { - "epoch": 1.41, - "learning_rate": 8.868730796978977e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019142933425959284, + "loss": 0.0125, "step": 279230 }, { - "epoch": 1.41, - "learning_rate": 8.867974027677576e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.0001914254460432214, + "loss": 0.015, "step": 279240 }, { - "epoch": 1.41, - "learning_rate": 8.867217258376174e-05, - "loss": 0.0055, + "epoch": 0.72, + "learning_rate": 0.00019142155782684995, + "loss": 0.0129, "step": 279250 }, { - "epoch": 1.41, - "learning_rate": 8.866460489074774e-05, - "loss": 0.0071, + "epoch": 0.72, + "learning_rate": 0.00019141766961047846, + "loss": 0.0146, "step": 279260 }, { - "epoch": 1.41, - "learning_rate": 8.865703719773373e-05, - "loss": 0.0096, + "epoch": 0.72, + "learning_rate": 0.000191413781394107, + "loss": 0.0146, "step": 279270 }, { - "epoch": 1.41, - "learning_rate": 8.864946950471971e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019140989317773555, + "loss": 0.0109, "step": 279280 }, { - "epoch": 1.41, - "learning_rate": 8.864190181170571e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001914060049613641, + "loss": 0.0141, "step": 279290 }, { - "epoch": 1.41, - "learning_rate": 8.863433411869169e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.0001914021167449926, + "loss": 0.0164, "step": 279300 }, { - "epoch": 1.41, - "learning_rate": 8.862676642567769e-05, - "loss": 0.0074, + "epoch": 0.72, + "learning_rate": 0.00019139822852862114, + "loss": 0.0126, "step": 279310 }, { - "epoch": 1.41, - "learning_rate": 8.861919873266368e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.00019139434031224968, + "loss": 0.0166, "step": 279320 }, { - "epoch": 1.41, - "learning_rate": 8.861163103964966e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.00019139045209587823, + "loss": 0.0136, "step": 279330 }, { - "epoch": 1.41, - "learning_rate": 8.860406334663566e-05, - "loss": 0.0082, + "epoch": 0.72, + "learning_rate": 0.00019138656387950674, + "loss": 0.0162, "step": 279340 }, { - "epoch": 1.41, - "learning_rate": 8.859649565362162e-05, - "loss": 0.0097, + "epoch": 0.72, + "learning_rate": 0.00019138267566313528, + "loss": 0.0133, "step": 279350 }, { - "epoch": 1.41, - "learning_rate": 8.858892796060762e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019137878744676382, + "loss": 0.0139, "step": 279360 }, { - "epoch": 1.41, - "learning_rate": 8.858136026759361e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019137489923039237, + "loss": 0.0124, "step": 279370 }, { - "epoch": 1.41, - "learning_rate": 8.85737925745796e-05, - "loss": 0.0101, + "epoch": 0.72, + "learning_rate": 0.00019137101101402088, + "loss": 0.0157, "step": 279380 }, { - "epoch": 1.41, - "learning_rate": 8.856622488156559e-05, - "loss": 0.0099, + "epoch": 0.72, + "learning_rate": 0.00019136712279764942, + "loss": 0.0134, "step": 279390 }, { - "epoch": 1.41, - "learning_rate": 8.855865718855159e-05, - "loss": 0.01, + "epoch": 0.72, + "learning_rate": 0.00019136323458127794, + "loss": 0.0151, "step": 279400 }, { - "epoch": 1.41, - "learning_rate": 8.855108949553757e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001913593463649065, + "loss": 0.016, "step": 279410 }, { - "epoch": 1.41, - "learning_rate": 8.854352180252356e-05, - "loss": 0.0092, + "epoch": 0.72, + "learning_rate": 0.00019135545814853505, + "loss": 0.014, "step": 279420 }, { - "epoch": 1.41, - "learning_rate": 8.853595410950954e-05, - "loss": 0.0098, + "epoch": 0.72, + "learning_rate": 0.00019135156993216356, + "loss": 0.0143, "step": 279430 }, { - "epoch": 1.41, - "learning_rate": 8.852838641649554e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001913476817157921, + "loss": 0.0164, "step": 279440 }, { - "epoch": 1.41, - "learning_rate": 8.852081872348153e-05, - "loss": 0.0056, + "epoch": 0.72, + "learning_rate": 0.00019134379349942064, + "loss": 0.0156, "step": 279450 }, { - "epoch": 1.41, - "learning_rate": 8.851325103046752e-05, - "loss": 0.0063, + "epoch": 0.72, + "learning_rate": 0.00019133990528304919, + "loss": 0.0129, "step": 279460 }, { - "epoch": 1.41, - "learning_rate": 8.850568333745351e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.0001913360170666777, + "loss": 0.0214, "step": 279470 }, { - "epoch": 1.41, - "learning_rate": 8.84981156444395e-05, - "loss": 0.0077, + "epoch": 0.72, + "learning_rate": 0.00019133212885030624, + "loss": 0.0105, "step": 279480 }, { - "epoch": 1.41, - "learning_rate": 8.849054795142549e-05, - "loss": 0.0109, + "epoch": 0.72, + "learning_rate": 0.00019132824063393478, + "loss": 0.0181, "step": 279490 }, { - "epoch": 1.41, - "learning_rate": 8.848298025841148e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019132435241756333, + "loss": 0.0135, "step": 279500 }, { - "epoch": 1.41, - "learning_rate": 8.847541256539746e-05, - "loss": 0.0091, + "epoch": 0.72, + "learning_rate": 0.00019132046420119184, + "loss": 0.0152, "step": 279510 }, { - "epoch": 1.41, - "learning_rate": 8.846784487238346e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019131657598482038, + "loss": 0.012, "step": 279520 }, { - "epoch": 1.41, - "learning_rate": 8.846027717936945e-05, - "loss": 0.0068, + "epoch": 0.72, + "learning_rate": 0.00019131268776844892, + "loss": 0.0153, "step": 279530 }, { - "epoch": 1.41, - "learning_rate": 8.845270948635543e-05, - "loss": 0.0084, + "epoch": 0.72, + "learning_rate": 0.00019130879955207746, + "loss": 0.0132, "step": 279540 }, { - "epoch": 1.41, - "learning_rate": 8.844514179334143e-05, - "loss": 0.0085, + "epoch": 0.72, + "learning_rate": 0.00019130491133570598, + "loss": 0.0155, "step": 279550 }, { - "epoch": 1.41, - "learning_rate": 8.843757410032742e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.00019130102311933452, + "loss": 0.0135, "step": 279560 }, { - "epoch": 1.41, - "learning_rate": 8.84300064073134e-05, - "loss": 0.0079, + "epoch": 0.72, + "learning_rate": 0.0001912971349029631, + "loss": 0.0147, "step": 279570 }, { - "epoch": 1.41, - "learning_rate": 8.84224387142994e-05, - "loss": 0.0062, + "epoch": 0.72, + "learning_rate": 0.0001912932466865916, + "loss": 0.0135, "step": 279580 }, { - "epoch": 1.41, - "learning_rate": 8.841487102128538e-05, - "loss": 0.0073, + "epoch": 0.72, + "learning_rate": 0.00019128935847022015, + "loss": 0.0171, "step": 279590 }, { - "epoch": 1.41, - "learning_rate": 8.840730332827138e-05, - "loss": 0.006, + "epoch": 0.72, + "learning_rate": 0.00019128547025384866, + "loss": 0.0159, "step": 279600 }, { - "epoch": 1.41, - "learning_rate": 8.839973563525737e-05, - "loss": 0.0069, + "epoch": 0.72, + "learning_rate": 0.00019128158203747723, + "loss": 0.0124, "step": 279610 }, { - "epoch": 1.41, - "learning_rate": 8.839216794224335e-05, - "loss": 0.0088, + "epoch": 0.72, + "learning_rate": 0.00019127769382110574, + "loss": 0.0162, "step": 279620 }, { - "epoch": 1.41, - "learning_rate": 8.838460024922935e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019127380560473429, + "loss": 0.0142, "step": 279630 }, { - "epoch": 1.41, - "learning_rate": 8.837703255621534e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.0001912699173883628, + "loss": 0.0142, "step": 279640 }, { - "epoch": 1.41, - "learning_rate": 8.836946486320133e-05, - "loss": 0.0078, + "epoch": 0.72, + "learning_rate": 0.00019126602917199134, + "loss": 0.013, "step": 279650 }, { - "epoch": 1.41, - "learning_rate": 8.836189717018732e-05, - "loss": 0.0093, + "epoch": 0.72, + "learning_rate": 0.00019126214095561988, + "loss": 0.0145, "step": 279660 }, { - "epoch": 1.41, - "learning_rate": 8.83543294771733e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019125825273924842, + "loss": 0.0118, "step": 279670 }, { - "epoch": 1.41, - "learning_rate": 8.83467617841593e-05, - "loss": 0.0066, + "epoch": 0.72, + "learning_rate": 0.00019125436452287694, + "loss": 0.0145, "step": 279680 }, { - "epoch": 1.41, - "learning_rate": 8.833919409114529e-05, - "loss": 0.0081, + "epoch": 0.72, + "learning_rate": 0.00019125047630650548, + "loss": 0.0146, "step": 279690 }, { - "epoch": 1.41, - "learning_rate": 8.833162639813127e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019124658809013402, + "loss": 0.0154, "step": 279700 }, { - "epoch": 1.41, - "learning_rate": 8.832405870511727e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019124269987376256, + "loss": 0.0147, "step": 279710 }, { - "epoch": 1.41, - "learning_rate": 8.831649101210326e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019123881165739108, + "loss": 0.0143, "step": 279720 }, { - "epoch": 1.41, - "learning_rate": 8.830892331908924e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019123492344101962, + "loss": 0.0132, "step": 279730 }, { - "epoch": 1.41, - "learning_rate": 8.830135562607524e-05, - "loss": 0.0097, + "epoch": 0.73, + "learning_rate": 0.0001912310352246482, + "loss": 0.014, "step": 279740 }, { - "epoch": 1.41, - "learning_rate": 8.829378793306122e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.0001912271470082767, + "loss": 0.0153, "step": 279750 }, { - "epoch": 1.41, - "learning_rate": 8.828622024004722e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019122325879190522, + "loss": 0.0146, "step": 279760 }, { - "epoch": 1.41, - "learning_rate": 8.827865254703321e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019121937057553376, + "loss": 0.0138, "step": 279770 }, { - "epoch": 1.41, - "learning_rate": 8.827108485401919e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019121548235916233, + "loss": 0.013, "step": 279780 }, { - "epoch": 1.41, - "learning_rate": 8.826351716100519e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.00019121159414279084, + "loss": 0.0111, "step": 279790 }, { - "epoch": 1.41, - "learning_rate": 8.825594946799118e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019120770592641938, + "loss": 0.0108, "step": 279800 }, { - "epoch": 1.41, - "learning_rate": 8.824838177497716e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.0001912038177100479, + "loss": 0.0159, "step": 279810 }, { - "epoch": 1.41, - "learning_rate": 8.824081408196316e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019119992949367647, + "loss": 0.0155, "step": 279820 }, { - "epoch": 1.41, - "learning_rate": 8.823324638894914e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019119604127730498, + "loss": 0.0137, "step": 279830 }, { - "epoch": 1.41, - "learning_rate": 8.822567869593514e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019119215306093352, + "loss": 0.0183, "step": 279840 }, { - "epoch": 1.41, - "learning_rate": 8.821811100292113e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019118826484456204, + "loss": 0.0176, "step": 279850 }, { - "epoch": 1.41, - "learning_rate": 8.821054330990711e-05, - "loss": 0.0103, + "epoch": 0.73, + "learning_rate": 0.0001911843766281906, + "loss": 0.0154, "step": 279860 }, { - "epoch": 1.41, - "learning_rate": 8.820297561689311e-05, - "loss": 0.0126, + "epoch": 0.73, + "learning_rate": 0.00019118048841181912, + "loss": 0.0148, "step": 279870 }, { - "epoch": 1.41, - "learning_rate": 8.81954079238791e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019117660019544766, + "loss": 0.0156, "step": 279880 }, { - "epoch": 1.41, - "learning_rate": 8.818784023086508e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019117271197907618, + "loss": 0.0136, "step": 279890 }, { - "epoch": 1.41, - "learning_rate": 8.818027253785108e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019116882376270472, + "loss": 0.0185, "step": 279900 }, { - "epoch": 1.41, - "learning_rate": 8.817270484483707e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.0001911649355463333, + "loss": 0.0136, "step": 279910 }, { - "epoch": 1.41, - "learning_rate": 8.816513715182305e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001911610473299618, + "loss": 0.0154, "step": 279920 }, { - "epoch": 1.41, - "learning_rate": 8.815756945880905e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019115715911359032, + "loss": 0.0159, "step": 279930 }, { - "epoch": 1.41, - "learning_rate": 8.815000176579503e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019115327089721886, + "loss": 0.0156, "step": 279940 }, { - "epoch": 1.41, - "learning_rate": 8.814243407278103e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019114938268084743, + "loss": 0.0156, "step": 279950 }, { - "epoch": 1.41, - "learning_rate": 8.813486637976702e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019114549446447594, + "loss": 0.0147, "step": 279960 }, { - "epoch": 1.41, - "learning_rate": 8.8127298686753e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019114160624810448, + "loss": 0.018, "step": 279970 }, { - "epoch": 1.41, - "learning_rate": 8.811973099373898e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.000191137718031733, + "loss": 0.0225, "step": 279980 }, { - "epoch": 1.41, - "learning_rate": 8.811216330072497e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019113382981536157, + "loss": 0.0128, "step": 279990 }, { - "epoch": 1.41, - "learning_rate": 8.810459560771096e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019112994159899008, + "loss": 0.0165, "step": 280000 }, { - "epoch": 1.41, - "eval_cer": 0.914423676889143, - "eval_loss": 0.005915849469602108, - "eval_runtime": 116.6786, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.73, + "eval_cer": 0.8817152830555753, + "eval_loss": 0.010195476934313774, + "eval_runtime": 108.0537, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, "step": 280000 }, { - "epoch": 1.41, - "learning_rate": 8.809702791469696e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019112605338261862, + "loss": 0.0211, "step": 280010 }, { - "epoch": 1.41, - "learning_rate": 8.808946022168294e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019112216516624714, + "loss": 0.0153, "step": 280020 }, { - "epoch": 1.41, - "learning_rate": 8.808189252866893e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.0001911182769498757, + "loss": 0.0141, "step": 280030 }, { - "epoch": 1.41, - "learning_rate": 8.807432483565491e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019111438873350422, + "loss": 0.015, "step": 280040 }, { - "epoch": 1.41, - "learning_rate": 8.806675714264091e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019111050051713276, + "loss": 0.0182, "step": 280050 }, { - "epoch": 1.41, - "learning_rate": 8.80591894496269e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019110661230076128, + "loss": 0.014, "step": 280060 }, { - "epoch": 1.41, - "learning_rate": 8.805162175661288e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019110272408438985, + "loss": 0.0166, "step": 280070 }, { - "epoch": 1.41, - "learning_rate": 8.804405406359888e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.00019109883586801836, + "loss": 0.0144, "step": 280080 }, { - "epoch": 1.41, - "learning_rate": 8.803648637058487e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.0001910949476516469, + "loss": 0.0145, "step": 280090 }, { - "epoch": 1.41, - "learning_rate": 8.802891867757086e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00019109105943527542, + "loss": 0.0162, "step": 280100 }, { - "epoch": 1.41, - "learning_rate": 8.802135098455685e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.00019108717121890399, + "loss": 0.0169, "step": 280110 }, { - "epoch": 1.41, - "learning_rate": 8.801378329154283e-05, - "loss": 0.0122, + "epoch": 0.73, + "learning_rate": 0.00019108328300253253, + "loss": 0.016, "step": 280120 }, { - "epoch": 1.41, - "learning_rate": 8.800621559852883e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019107939478616104, + "loss": 0.0235, "step": 280130 }, { - "epoch": 1.41, - "learning_rate": 8.799864790551482e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019107550656978958, + "loss": 0.032, "step": 280140 }, { - "epoch": 1.41, - "learning_rate": 8.79910802125008e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.0001910716183534181, + "loss": 0.0134, "step": 280150 }, { - "epoch": 1.41, - "learning_rate": 8.79835125194868e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019106773013704667, + "loss": 0.0124, "step": 280160 }, { - "epoch": 1.41, - "learning_rate": 8.79759448264728e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019106384192067518, + "loss": 0.0107, "step": 280170 }, { - "epoch": 1.41, - "learning_rate": 8.796837713345878e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019105995370430372, + "loss": 0.0157, "step": 280180 }, { - "epoch": 1.41, - "learning_rate": 8.796080944044477e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019105606548793224, + "loss": 0.0127, "step": 280190 }, { - "epoch": 1.41, - "learning_rate": 8.795324174743075e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001910521772715608, + "loss": 0.0135, "step": 280200 }, { - "epoch": 1.41, - "learning_rate": 8.794567405441675e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019104828905518932, + "loss": 0.0175, "step": 280210 }, { - "epoch": 1.41, - "learning_rate": 8.793810636140274e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.00019104440083881786, + "loss": 0.0162, "step": 280220 }, { - "epoch": 1.41, - "learning_rate": 8.793053866838872e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019104051262244638, + "loss": 0.0156, "step": 280230 }, { - "epoch": 1.41, - "learning_rate": 8.792297097537472e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019103662440607495, + "loss": 0.0172, "step": 280240 }, { - "epoch": 1.41, - "learning_rate": 8.791540328236071e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.00019103273618970346, + "loss": 0.0169, "step": 280250 }, { - "epoch": 1.41, - "learning_rate": 8.79078355893467e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.000191028847973332, + "loss": 0.0134, "step": 280260 }, { - "epoch": 1.41, - "learning_rate": 8.790026789633269e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019102495975696052, + "loss": 0.0184, "step": 280270 }, { - "epoch": 1.41, - "learning_rate": 8.789270020331867e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019102107154058909, + "loss": 0.0172, "step": 280280 }, { - "epoch": 1.41, - "learning_rate": 8.788513251030467e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019101718332421763, + "loss": 0.0126, "step": 280290 }, { - "epoch": 1.41, - "learning_rate": 8.787756481729066e-05, - "loss": 0.0112, + "epoch": 0.73, + "learning_rate": 0.00019101329510784614, + "loss": 0.0117, "step": 280300 }, { - "epoch": 1.41, - "learning_rate": 8.786999712427664e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00019100940689147468, + "loss": 0.0147, "step": 280310 }, { - "epoch": 1.41, - "learning_rate": 8.786242943126264e-05, - "loss": 0.0099, + "epoch": 0.73, + "learning_rate": 0.00019100551867510322, + "loss": 0.0138, "step": 280320 }, { - "epoch": 1.41, - "learning_rate": 8.785486173824863e-05, - "loss": 0.0113, + "epoch": 0.73, + "learning_rate": 0.00019100163045873177, + "loss": 0.0158, "step": 280330 }, { - "epoch": 1.41, - "learning_rate": 8.784729404523461e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00019099774224236028, + "loss": 0.0142, "step": 280340 }, { - "epoch": 1.41, - "learning_rate": 8.783972635222061e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019099385402598882, + "loss": 0.0195, "step": 280350 }, { - "epoch": 1.41, - "learning_rate": 8.78321586592066e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019098996580961736, + "loss": 0.0155, "step": 280360 }, { - "epoch": 1.41, - "learning_rate": 8.782459096619259e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.0001909860775932459, + "loss": 0.0134, "step": 280370 }, { - "epoch": 1.41, - "learning_rate": 8.781702327317858e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019098218937687442, + "loss": 0.0128, "step": 280380 }, { - "epoch": 1.41, - "learning_rate": 8.780945558016456e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019097830116050296, + "loss": 0.0174, "step": 280390 }, { - "epoch": 1.41, - "learning_rate": 8.780188788715056e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019097441294413148, + "loss": 0.0157, "step": 280400 }, { - "epoch": 1.41, - "learning_rate": 8.779432019413655e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019097052472776005, + "loss": 0.013, "step": 280410 }, { - "epoch": 1.41, - "learning_rate": 8.778675250112253e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019096663651138856, + "loss": 0.0121, "step": 280420 }, { - "epoch": 1.41, - "learning_rate": 8.777918480810853e-05, - "loss": 0.0049, + "epoch": 0.73, + "learning_rate": 0.0001909627482950171, + "loss": 0.0151, "step": 280430 }, { - "epoch": 1.41, - "learning_rate": 8.777161711509452e-05, - "loss": 0.0099, + "epoch": 0.73, + "learning_rate": 0.00019095886007864562, + "loss": 0.0199, "step": 280440 }, { - "epoch": 1.41, - "learning_rate": 8.77640494220805e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019095497186227418, + "loss": 0.0145, "step": 280450 }, { - "epoch": 1.41, - "learning_rate": 8.77564817290665e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.00019095108364590273, + "loss": 0.0121, "step": 280460 }, { - "epoch": 1.42, - "learning_rate": 8.774891403605248e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019094719542953124, + "loss": 0.0159, "step": 280470 }, { - "epoch": 1.42, - "learning_rate": 8.774134634303848e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00019094330721315976, + "loss": 0.0155, "step": 280480 }, { - "epoch": 1.42, - "learning_rate": 8.773377865002447e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019093941899678832, + "loss": 0.0162, "step": 280490 }, { - "epoch": 1.42, - "learning_rate": 8.772621095701045e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019093553078041687, + "loss": 0.0162, "step": 280500 }, { - "epoch": 1.42, - "learning_rate": 8.771864326399645e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019093164256404538, + "loss": 0.0155, "step": 280510 }, { - "epoch": 1.42, - "learning_rate": 8.771107557098244e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019092775434767392, + "loss": 0.0153, "step": 280520 }, { - "epoch": 1.42, - "learning_rate": 8.770350787796842e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019092386613130246, + "loss": 0.0152, "step": 280530 }, { - "epoch": 1.42, - "learning_rate": 8.769594018495442e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.000190919977914931, + "loss": 0.0137, "step": 280540 }, { - "epoch": 1.42, - "learning_rate": 8.76883724919404e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019091608969855952, + "loss": 0.0123, "step": 280550 }, { - "epoch": 1.42, - "learning_rate": 8.76808047989264e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019091220148218806, + "loss": 0.0149, "step": 280560 }, { - "epoch": 1.42, - "learning_rate": 8.767323710591239e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.0001909083132658166, + "loss": 0.0118, "step": 280570 }, { - "epoch": 1.42, - "learning_rate": 8.766566941289837e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.00019090442504944514, + "loss": 0.0129, "step": 280580 }, { - "epoch": 1.42, - "learning_rate": 8.765810171988437e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019090053683307366, + "loss": 0.0132, "step": 280590 }, { - "epoch": 1.42, - "learning_rate": 8.765053402687033e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.0001908966486167022, + "loss": 0.013, "step": 280600 }, { - "epoch": 1.42, - "learning_rate": 8.764296633385633e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019089276040033072, + "loss": 0.0155, "step": 280610 }, { - "epoch": 1.42, - "learning_rate": 8.763539864084232e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00019088887218395928, + "loss": 0.0131, "step": 280620 }, { - "epoch": 1.42, - "learning_rate": 8.76278309478283e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.0001908849839675878, + "loss": 0.0158, "step": 280630 }, { - "epoch": 1.42, - "learning_rate": 8.76202632548143e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019088109575121634, + "loss": 0.0185, "step": 280640 }, { - "epoch": 1.42, - "learning_rate": 8.761269556180028e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019087720753484485, + "loss": 0.0178, "step": 280650 }, { - "epoch": 1.42, - "learning_rate": 8.760512786878628e-05, - "loss": 0.0095, + "epoch": 0.73, + "learning_rate": 0.00019087331931847342, + "loss": 0.0114, "step": 280660 }, { - "epoch": 1.42, - "learning_rate": 8.759756017577227e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019086943110210197, + "loss": 0.0143, "step": 280670 }, { - "epoch": 1.42, - "learning_rate": 8.758999248275825e-05, - "loss": 0.0133, + "epoch": 0.73, + "learning_rate": 0.00019086554288573048, + "loss": 0.0151, "step": 280680 }, { - "epoch": 1.42, - "learning_rate": 8.758242478974425e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019086165466935902, + "loss": 0.0171, "step": 280690 }, { - "epoch": 1.42, - "learning_rate": 8.757485709673024e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019085776645298756, + "loss": 0.0139, "step": 280700 }, { - "epoch": 1.42, - "learning_rate": 8.756728940371623e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.0001908538782366161, + "loss": 0.0139, "step": 280710 }, { - "epoch": 1.42, - "learning_rate": 8.755972171070222e-05, - "loss": 0.0055, + "epoch": 0.73, + "learning_rate": 0.00019084999002024462, + "loss": 0.0139, "step": 280720 }, { - "epoch": 1.42, - "learning_rate": 8.75521540176882e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019084610180387316, + "loss": 0.0183, "step": 280730 }, { - "epoch": 1.42, - "learning_rate": 8.75445863246742e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.0001908422135875017, + "loss": 0.0135, "step": 280740 }, { - "epoch": 1.42, - "learning_rate": 8.753701863166019e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019083832537113024, + "loss": 0.0157, "step": 280750 }, { - "epoch": 1.42, - "learning_rate": 8.752945093864617e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019083443715475876, + "loss": 0.0118, "step": 280760 }, { - "epoch": 1.42, - "learning_rate": 8.752188324563217e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.0001908305489383873, + "loss": 0.0185, "step": 280770 }, { - "epoch": 1.42, - "learning_rate": 8.751431555261816e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019082666072201587, + "loss": 0.0136, "step": 280780 }, { - "epoch": 1.42, - "learning_rate": 8.750674785960414e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019082277250564438, + "loss": 0.0126, "step": 280790 }, { - "epoch": 1.42, - "learning_rate": 8.749918016659014e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001908188842892729, + "loss": 0.0157, "step": 280800 }, { - "epoch": 1.42, - "learning_rate": 8.749161247357613e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019081499607290144, + "loss": 0.0156, "step": 280810 }, { - "epoch": 1.42, - "learning_rate": 8.748404478056212e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019081110785653, + "loss": 0.0117, "step": 280820 }, { - "epoch": 1.42, - "learning_rate": 8.747647708754811e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00019080721964015852, + "loss": 0.0145, "step": 280830 }, { - "epoch": 1.42, - "learning_rate": 8.746890939453409e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019080333142378706, + "loss": 0.0137, "step": 280840 }, { - "epoch": 1.42, - "learning_rate": 8.746134170152009e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00019079944320741558, + "loss": 0.0166, "step": 280850 }, { - "epoch": 1.42, - "learning_rate": 8.745377400850608e-05, - "loss": 0.0055, + "epoch": 0.73, + "learning_rate": 0.00019079555499104412, + "loss": 0.0142, "step": 280860 }, { - "epoch": 1.42, - "learning_rate": 8.744620631549206e-05, - "loss": 0.011, + "epoch": 0.73, + "learning_rate": 0.00019079166677467266, + "loss": 0.0161, "step": 280870 }, { - "epoch": 1.42, - "learning_rate": 8.743863862247806e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.0001907877785583012, + "loss": 0.0152, "step": 280880 }, { - "epoch": 1.42, - "learning_rate": 8.743107092946405e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019078389034192972, + "loss": 0.0178, "step": 280890 }, { - "epoch": 1.42, - "learning_rate": 8.742350323645004e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019078000212555826, + "loss": 0.011, "step": 280900 }, { - "epoch": 1.42, - "learning_rate": 8.741593554343603e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001907761139091868, + "loss": 0.0145, "step": 280910 }, { - "epoch": 1.42, - "learning_rate": 8.740836785042201e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019077222569281534, + "loss": 0.0168, "step": 280920 }, { - "epoch": 1.42, - "learning_rate": 8.740080015740801e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019076833747644386, + "loss": 0.0149, "step": 280930 }, { - "epoch": 1.42, - "learning_rate": 8.7393232464394e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.0001907644492600724, + "loss": 0.0135, "step": 280940 }, { - "epoch": 1.42, - "learning_rate": 8.738566477137998e-05, - "loss": 0.0059, + "epoch": 0.73, + "learning_rate": 0.00019076056104370094, + "loss": 0.019, "step": 280950 }, { - "epoch": 1.42, - "learning_rate": 8.737809707836598e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019075667282732948, + "loss": 0.0133, "step": 280960 }, { - "epoch": 1.42, - "learning_rate": 8.737052938535197e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.000190752784610958, + "loss": 0.0153, "step": 280970 }, { - "epoch": 1.42, - "learning_rate": 8.736296169233795e-05, - "loss": 0.0103, + "epoch": 0.73, + "learning_rate": 0.00019074889639458654, + "loss": 0.0193, "step": 280980 }, { - "epoch": 1.42, - "learning_rate": 8.735539399932395e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001907450081782151, + "loss": 0.013, "step": 280990 }, { - "epoch": 1.42, - "learning_rate": 8.734782630630993e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00019074111996184362, + "loss": 0.0145, "step": 281000 }, { - "epoch": 1.42, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.0056717172265052795, - "eval_runtime": 115.6852, - "eval_samples_per_second": 17.288, - "eval_steps_per_second": 4.322, + "epoch": 0.73, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.010047990828752518, + "eval_runtime": 108.1788, + "eval_samples_per_second": 18.488, + "eval_steps_per_second": 4.622, "step": 281000 }, { - "epoch": 1.42, - "learning_rate": 8.734025861329593e-05, - "loss": 0.013, + "epoch": 0.73, + "learning_rate": 0.00019073723174547216, + "loss": 0.0189, "step": 281010 }, { - "epoch": 1.42, - "learning_rate": 8.733269092028192e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019073334352910068, + "loss": 0.015, "step": 281020 }, { - "epoch": 1.42, - "learning_rate": 8.73251232272679e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019072945531272925, + "loss": 0.0122, "step": 281030 }, { - "epoch": 1.42, - "learning_rate": 8.73175555342539e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019072556709635776, + "loss": 0.0158, "step": 281040 }, { - "epoch": 1.42, - "learning_rate": 8.730998784123989e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001907216788799863, + "loss": 0.0164, "step": 281050 }, { - "epoch": 1.42, - "learning_rate": 8.730242014822587e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019071779066361482, + "loss": 0.0149, "step": 281060 }, { - "epoch": 1.42, - "learning_rate": 8.729485245521187e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.0001907139024472434, + "loss": 0.0125, "step": 281070 }, { - "epoch": 1.42, - "learning_rate": 8.728728476219785e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.0001907100142308719, + "loss": 0.0146, "step": 281080 }, { - "epoch": 1.42, - "learning_rate": 8.727971706918385e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019070612601450044, + "loss": 0.0176, "step": 281090 }, { - "epoch": 1.42, - "learning_rate": 8.727214937616984e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019070223779812896, + "loss": 0.0165, "step": 281100 }, { - "epoch": 1.42, - "learning_rate": 8.726458168315582e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.0001906983495817575, + "loss": 0.0114, "step": 281110 }, { - "epoch": 1.42, - "learning_rate": 8.725701399014182e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019069446136538604, + "loss": 0.0165, "step": 281120 }, { - "epoch": 1.42, - "learning_rate": 8.724944629712781e-05, - "loss": 0.0095, + "epoch": 0.73, + "learning_rate": 0.00019069057314901458, + "loss": 0.0144, "step": 281130 }, { - "epoch": 1.42, - "learning_rate": 8.72418786041138e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.0001906866849326431, + "loss": 0.0157, "step": 281140 }, { - "epoch": 1.42, - "learning_rate": 8.723431091109979e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00019068279671627164, + "loss": 0.0141, "step": 281150 }, { - "epoch": 1.42, - "learning_rate": 8.722674321808577e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.0001906789084999002, + "loss": 0.0148, "step": 281160 }, { - "epoch": 1.42, - "learning_rate": 8.721917552507176e-05, - "loss": 0.0051, + "epoch": 0.73, + "learning_rate": 0.00019067502028352872, + "loss": 0.0156, "step": 281170 }, { - "epoch": 1.42, - "learning_rate": 8.721160783205776e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019067113206715726, + "loss": 0.014, "step": 281180 }, { - "epoch": 1.42, - "learning_rate": 8.720404013904374e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019066724385078578, + "loss": 0.0116, "step": 281190 }, { - "epoch": 1.42, - "learning_rate": 8.719647244602974e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019066335563441435, + "loss": 0.0144, "step": 281200 }, { - "epoch": 1.42, - "learning_rate": 8.718890475301573e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019065946741804286, + "loss": 0.0135, "step": 281210 }, { - "epoch": 1.42, - "learning_rate": 8.718133706000171e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.0001906555792016714, + "loss": 0.0153, "step": 281220 }, { - "epoch": 1.42, - "learning_rate": 8.71737693669877e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.00019065169098529992, + "loss": 0.0201, "step": 281230 }, { - "epoch": 1.42, - "learning_rate": 8.716620167397368e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.00019064780276892849, + "loss": 0.0114, "step": 281240 }, { - "epoch": 1.42, - "learning_rate": 8.715863398095967e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.000190643914552557, + "loss": 0.0143, "step": 281250 }, { - "epoch": 1.42, - "learning_rate": 8.715106628794567e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019064002633618554, + "loss": 0.0143, "step": 281260 }, { - "epoch": 1.42, - "learning_rate": 8.714349859493165e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00019063613811981406, + "loss": 0.0174, "step": 281270 }, { - "epoch": 1.42, - "learning_rate": 8.713593090191764e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019063224990344263, + "loss": 0.018, "step": 281280 }, { - "epoch": 1.42, - "learning_rate": 8.712836320890362e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019062836168707114, + "loss": 0.017, "step": 281290 }, { - "epoch": 1.42, - "learning_rate": 8.712079551588962e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019062447347069968, + "loss": 0.0121, "step": 281300 }, { - "epoch": 1.42, - "learning_rate": 8.711322782287561e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.0001906205852543282, + "loss": 0.0122, "step": 281310 }, { - "epoch": 1.42, - "learning_rate": 8.71056601298616e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019061669703795677, + "loss": 0.0159, "step": 281320 }, { - "epoch": 1.42, - "learning_rate": 8.709809243684759e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.0001906128088215853, + "loss": 0.0146, "step": 281330 }, { - "epoch": 1.42, - "learning_rate": 8.709052474383359e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019060892060521382, + "loss": 0.0152, "step": 281340 }, { - "epoch": 1.42, - "learning_rate": 8.708295705081957e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019060503238884234, + "loss": 0.0172, "step": 281350 }, { - "epoch": 1.42, - "learning_rate": 8.707538935780556e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019060114417247088, + "loss": 0.0174, "step": 281360 }, { - "epoch": 1.42, - "learning_rate": 8.706782166479154e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019059725595609945, + "loss": 0.0141, "step": 281370 }, { - "epoch": 1.42, - "learning_rate": 8.706025397177754e-05, - "loss": 0.0046, + "epoch": 0.73, + "learning_rate": 0.00019059336773972796, + "loss": 0.0177, "step": 281380 }, { - "epoch": 1.42, - "learning_rate": 8.705268627876353e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.0001905894795233565, + "loss": 0.0122, "step": 281390 }, { - "epoch": 1.42, - "learning_rate": 8.704511858574951e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.00019058559130698502, + "loss": 0.0151, "step": 281400 }, { - "epoch": 1.42, - "learning_rate": 8.703755089273551e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019058170309061359, + "loss": 0.0141, "step": 281410 }, { - "epoch": 1.42, - "learning_rate": 8.70299831997215e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.0001905778148742421, + "loss": 0.0171, "step": 281420 }, { - "epoch": 1.42, - "learning_rate": 8.702241550670749e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019057392665787064, + "loss": 0.0141, "step": 281430 }, { - "epoch": 1.42, - "learning_rate": 8.701484781369348e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019057003844149916, + "loss": 0.013, "step": 281440 }, { - "epoch": 1.42, - "learning_rate": 8.700728012067946e-05, - "loss": 0.0126, + "epoch": 0.73, + "learning_rate": 0.00019056615022512773, + "loss": 0.0134, "step": 281450 }, { - "epoch": 1.42, - "learning_rate": 8.699971242766546e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019056226200875624, + "loss": 0.0148, "step": 281460 }, { - "epoch": 1.42, - "learning_rate": 8.699214473465145e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019055837379238478, + "loss": 0.0134, "step": 281470 }, { - "epoch": 1.42, - "learning_rate": 8.698457704163743e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.0001905544855760133, + "loss": 0.0179, "step": 281480 }, { - "epoch": 1.42, - "learning_rate": 8.697700934862343e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019055059735964186, + "loss": 0.0156, "step": 281490 }, { - "epoch": 1.42, - "learning_rate": 8.696944165560942e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.0001905467091432704, + "loss": 0.01, "step": 281500 }, { - "epoch": 1.42, - "learning_rate": 8.69618739625954e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019054282092689892, + "loss": 0.0147, "step": 281510 }, { - "epoch": 1.42, - "learning_rate": 8.69543062695814e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019053893271052744, + "loss": 0.0145, "step": 281520 }, { - "epoch": 1.42, - "learning_rate": 8.694673857656738e-05, - "loss": 0.0061, + "epoch": 0.73, + "learning_rate": 0.000190535044494156, + "loss": 0.01, "step": 281530 }, { - "epoch": 1.42, - "learning_rate": 8.693917088355338e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019053115627778455, + "loss": 0.0117, "step": 281540 }, { - "epoch": 1.42, - "learning_rate": 8.693160319053937e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019052726806141306, + "loss": 0.0158, "step": 281550 }, { - "epoch": 1.42, - "learning_rate": 8.692403549752535e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.0001905233798450416, + "loss": 0.0133, "step": 281560 }, { - "epoch": 1.42, - "learning_rate": 8.691646780451135e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.00019051949162867014, + "loss": 0.0128, "step": 281570 }, { - "epoch": 1.42, - "learning_rate": 8.690890011149734e-05, - "loss": 0.0055, + "epoch": 0.73, + "learning_rate": 0.00019051560341229869, + "loss": 0.0171, "step": 281580 }, { - "epoch": 1.42, - "learning_rate": 8.690133241848332e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.0001905117151959272, + "loss": 0.0108, "step": 281590 }, { - "epoch": 1.42, - "learning_rate": 8.689376472546932e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019050782697955574, + "loss": 0.018, "step": 281600 }, { - "epoch": 1.42, - "learning_rate": 8.68861970324553e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019050393876318426, + "loss": 0.0165, "step": 281610 }, { - "epoch": 1.42, - "learning_rate": 8.68786293394413e-05, - "loss": 0.0119, + "epoch": 0.73, + "learning_rate": 0.00019050005054681282, + "loss": 0.0144, "step": 281620 }, { - "epoch": 1.42, - "learning_rate": 8.687106164642729e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019049616233044134, + "loss": 0.0168, "step": 281630 }, { - "epoch": 1.42, - "learning_rate": 8.686349395341327e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019049227411406988, + "loss": 0.0178, "step": 281640 }, { - "epoch": 1.42, - "learning_rate": 8.685592626039927e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.0001904883858976984, + "loss": 0.0169, "step": 281650 }, { - "epoch": 1.42, - "learning_rate": 8.684835856738526e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.00019048449768132696, + "loss": 0.0129, "step": 281660 }, { - "epoch": 1.42, - "learning_rate": 8.684079087437124e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019048060946495548, + "loss": 0.0169, "step": 281670 }, { - "epoch": 1.42, - "learning_rate": 8.683322318135724e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019047672124858402, + "loss": 0.0171, "step": 281680 }, { - "epoch": 1.42, - "learning_rate": 8.682565548834322e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019047283303221253, + "loss": 0.0126, "step": 281690 }, { - "epoch": 1.42, - "learning_rate": 8.681808779532922e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.0001904689448158411, + "loss": 0.0137, "step": 281700 }, { - "epoch": 1.42, - "learning_rate": 8.681052010231521e-05, - "loss": 0.0157, + "epoch": 0.73, + "learning_rate": 0.00019046505659946965, + "loss": 0.0178, "step": 281710 }, { - "epoch": 1.42, - "learning_rate": 8.680295240930119e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019046116838309816, + "loss": 0.0145, "step": 281720 }, { - "epoch": 1.42, - "learning_rate": 8.679538471628719e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.0001904572801667267, + "loss": 0.0157, "step": 281730 }, { - "epoch": 1.42, - "learning_rate": 8.678781702327318e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.00019045339195035524, + "loss": 0.012, "step": 281740 }, { - "epoch": 1.42, - "learning_rate": 8.678024933025916e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019044950373398378, + "loss": 0.0136, "step": 281750 }, { - "epoch": 1.42, - "learning_rate": 8.677268163724516e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001904456155176123, + "loss": 0.0145, "step": 281760 }, { - "epoch": 1.42, - "learning_rate": 8.676511394423114e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019044172730124084, + "loss": 0.0142, "step": 281770 }, { - "epoch": 1.42, - "learning_rate": 8.675754625121713e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019043783908486938, + "loss": 0.0283, "step": 281780 }, { - "epoch": 1.42, - "learning_rate": 8.674997855820313e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00019043395086849792, + "loss": 0.0161, "step": 281790 }, { - "epoch": 1.42, - "learning_rate": 8.674241086518911e-05, - "loss": 0.0058, + "epoch": 0.73, + "learning_rate": 0.00019043006265212644, + "loss": 0.0145, "step": 281800 }, { - "epoch": 1.42, - "learning_rate": 8.67348431721751e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019042617443575498, + "loss": 0.0174, "step": 281810 }, { - "epoch": 1.42, - "learning_rate": 8.67272754791611e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019042228621938352, + "loss": 0.0128, "step": 281820 }, { - "epoch": 1.42, - "learning_rate": 8.671970778614708e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019041839800301206, + "loss": 0.0145, "step": 281830 }, { - "epoch": 1.42, - "learning_rate": 8.671214009313308e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.00019041450978664058, + "loss": 0.0177, "step": 281840 }, { - "epoch": 1.42, - "learning_rate": 8.670457240011907e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019041062157026912, + "loss": 0.0167, "step": 281850 }, { - "epoch": 1.42, - "learning_rate": 8.669700470710504e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019040673335389763, + "loss": 0.0154, "step": 281860 }, { - "epoch": 1.42, - "learning_rate": 8.668943701409104e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.0001904028451375262, + "loss": 0.0108, "step": 281870 }, { - "epoch": 1.42, - "learning_rate": 8.668186932107702e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019039895692115474, + "loss": 0.0149, "step": 281880 }, { - "epoch": 1.42, - "learning_rate": 8.667430162806301e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00019039506870478326, + "loss": 0.0156, "step": 281890 }, { - "epoch": 1.42, - "learning_rate": 8.666673393504899e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.0001903911804884118, + "loss": 0.0129, "step": 281900 }, { - "epoch": 1.42, - "learning_rate": 8.665916624203499e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019038729227204034, + "loss": 0.0135, "step": 281910 }, { - "epoch": 1.42, - "learning_rate": 8.665159854902098e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00019038340405566888, + "loss": 0.0144, "step": 281920 }, { - "epoch": 1.42, - "learning_rate": 8.664403085600696e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.0001903795158392974, + "loss": 0.0146, "step": 281930 }, { - "epoch": 1.42, - "learning_rate": 8.663646316299296e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019037562762292594, + "loss": 0.0166, "step": 281940 }, { - "epoch": 1.42, - "learning_rate": 8.662889546997895e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019037173940655448, + "loss": 0.0114, "step": 281950 }, { - "epoch": 1.42, - "learning_rate": 8.662132777696494e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019036785119018302, + "loss": 0.013, "step": 281960 }, { - "epoch": 1.42, - "learning_rate": 8.661376008395093e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019036396297381154, + "loss": 0.0163, "step": 281970 }, { - "epoch": 1.42, - "learning_rate": 8.660619239093691e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00019036007475744008, + "loss": 0.0141, "step": 281980 }, { - "epoch": 1.42, - "learning_rate": 8.659862469792291e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019035618654106862, + "loss": 0.0136, "step": 281990 }, { - "epoch": 1.42, - "learning_rate": 8.65910570049089e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019035229832469716, + "loss": 0.0137, "step": 282000 }, { - "epoch": 1.42, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.005825493950396776, - "eval_runtime": 115.8458, - "eval_samples_per_second": 17.264, - "eval_steps_per_second": 4.316, + "epoch": 0.73, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.009928989224135876, + "eval_runtime": 108.1846, + "eval_samples_per_second": 18.487, + "eval_steps_per_second": 4.622, "step": 282000 }, { - "epoch": 1.42, - "learning_rate": 8.658348931189488e-05, - "loss": 0.0092, + "epoch": 0.73, + "learning_rate": 0.00019034841010832568, + "loss": 0.0146, "step": 282010 }, { - "epoch": 1.42, - "learning_rate": 8.657592161888088e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019034452189195422, + "loss": 0.012, "step": 282020 }, { - "epoch": 1.42, - "learning_rate": 8.656835392586687e-05, - "loss": 0.0086, + "epoch": 0.73, + "learning_rate": 0.0001903406336755828, + "loss": 0.0128, "step": 282030 }, { - "epoch": 1.42, - "learning_rate": 8.656078623285286e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.0001903367454592113, + "loss": 0.0145, "step": 282040 }, { - "epoch": 1.42, - "learning_rate": 8.655321853983885e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019033285724283984, + "loss": 0.0155, "step": 282050 }, { - "epoch": 1.42, - "learning_rate": 8.654565084682483e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019032896902646836, + "loss": 0.0133, "step": 282060 }, { - "epoch": 1.42, - "learning_rate": 8.653808315381083e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019032508081009693, + "loss": 0.0159, "step": 282070 }, { - "epoch": 1.42, - "learning_rate": 8.653051546079682e-05, - "loss": 0.0097, + "epoch": 0.73, + "learning_rate": 0.00019032119259372544, + "loss": 0.0148, "step": 282080 }, { - "epoch": 1.42, - "learning_rate": 8.65229477677828e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019031730437735398, + "loss": 0.0127, "step": 282090 }, { - "epoch": 1.42, - "learning_rate": 8.65153800747688e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.0001903134161609825, + "loss": 0.0153, "step": 282100 }, { - "epoch": 1.42, - "learning_rate": 8.650781238175479e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019030952794461104, + "loss": 0.0137, "step": 282110 }, { - "epoch": 1.42, - "learning_rate": 8.650024468874077e-05, - "loss": 0.0104, + "epoch": 0.73, + "learning_rate": 0.00019030563972823958, + "loss": 0.0109, "step": 282120 }, { - "epoch": 1.42, - "learning_rate": 8.649267699572677e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019030175151186812, + "loss": 0.018, "step": 282130 }, { - "epoch": 1.42, - "learning_rate": 8.648510930271275e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00019029786329549664, + "loss": 0.0142, "step": 282140 }, { - "epoch": 1.42, - "learning_rate": 8.647754160969875e-05, - "loss": 0.0108, + "epoch": 0.73, + "learning_rate": 0.00019029397507912518, + "loss": 0.0119, "step": 282150 }, { - "epoch": 1.42, - "learning_rate": 8.646997391668474e-05, - "loss": 0.0059, + "epoch": 0.73, + "learning_rate": 0.00019029008686275372, + "loss": 0.0152, "step": 282160 }, { - "epoch": 1.42, - "learning_rate": 8.646240622367072e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019028619864638226, + "loss": 0.0132, "step": 282170 }, { - "epoch": 1.42, - "learning_rate": 8.645483853065672e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019028231043001078, + "loss": 0.0144, "step": 282180 }, { - "epoch": 1.42, - "learning_rate": 8.644727083764271e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00019027842221363932, + "loss": 0.0173, "step": 282190 }, { - "epoch": 1.42, - "learning_rate": 8.64397031446287e-05, - "loss": 0.0103, - "step": 282200 + "epoch": 0.73, + "learning_rate": 0.0001902745339972679, + "loss": 0.015, + "step": 282200 }, { - "epoch": 1.42, - "learning_rate": 8.643213545161469e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.0001902706457808964, + "loss": 0.0188, "step": 282210 }, { - "epoch": 1.42, - "learning_rate": 8.642456775860067e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019026675756452492, + "loss": 0.0127, "step": 282220 }, { - "epoch": 1.42, - "learning_rate": 8.641700006558667e-05, - "loss": 0.0054, + "epoch": 0.73, + "learning_rate": 0.00019026286934815346, + "loss": 0.0142, "step": 282230 }, { - "epoch": 1.42, - "learning_rate": 8.640943237257266e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.00019025898113178203, + "loss": 0.0137, "step": 282240 }, { - "epoch": 1.42, - "learning_rate": 8.640186467955864e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019025509291541054, + "loss": 0.018, "step": 282250 }, { - "epoch": 1.42, - "learning_rate": 8.639429698654464e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019025120469903908, + "loss": 0.0155, "step": 282260 }, { - "epoch": 1.42, - "learning_rate": 8.638672929353063e-05, - "loss": 0.0095, + "epoch": 0.73, + "learning_rate": 0.0001902473164826676, + "loss": 0.0125, "step": 282270 }, { - "epoch": 1.42, - "learning_rate": 8.637916160051661e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019024342826629617, + "loss": 0.013, "step": 282280 }, { - "epoch": 1.42, - "learning_rate": 8.637159390750261e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019023954004992468, + "loss": 0.017, "step": 282290 }, { - "epoch": 1.42, - "learning_rate": 8.63640262144886e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019023565183355322, + "loss": 0.0139, "step": 282300 }, { - "epoch": 1.42, - "learning_rate": 8.635645852147458e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019023176361718174, + "loss": 0.0181, "step": 282310 }, { - "epoch": 1.42, - "learning_rate": 8.634889082846058e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.0001902278754008103, + "loss": 0.0136, "step": 282320 }, { - "epoch": 1.42, - "learning_rate": 8.634132313544656e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019022398718443882, + "loss": 0.0188, "step": 282330 }, { - "epoch": 1.42, - "learning_rate": 8.633375544243256e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019022009896806736, + "loss": 0.0142, "step": 282340 }, { - "epoch": 1.42, - "learning_rate": 8.632618774941855e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019021621075169588, + "loss": 0.015, "step": 282350 }, { - "epoch": 1.42, - "learning_rate": 8.631862005640453e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.00019021232253532442, + "loss": 0.0137, "step": 282360 }, { - "epoch": 1.42, - "learning_rate": 8.631105236339053e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.000190208434318953, + "loss": 0.0141, "step": 282370 }, { - "epoch": 1.42, - "learning_rate": 8.630348467037652e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.0001902045461025815, + "loss": 0.0126, "step": 282380 }, { - "epoch": 1.42, - "learning_rate": 8.62959169773625e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00019020065788621002, + "loss": 0.0144, "step": 282390 }, { - "epoch": 1.42, - "learning_rate": 8.62883492843485e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019019676966983856, + "loss": 0.0126, "step": 282400 }, { - "epoch": 1.42, - "learning_rate": 8.628078159133448e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019019288145346713, + "loss": 0.0168, "step": 282410 }, { - "epoch": 1.42, - "learning_rate": 8.627321389832048e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019018899323709564, + "loss": 0.0207, "step": 282420 }, { - "epoch": 1.42, - "learning_rate": 8.626564620530647e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019018510502072418, + "loss": 0.0141, "step": 282430 }, { - "epoch": 1.42, - "learning_rate": 8.625807851229245e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.0001901812168043527, + "loss": 0.0115, "step": 282440 }, { - "epoch": 1.42, - "learning_rate": 8.625051081927845e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019017732858798127, + "loss": 0.019, "step": 282450 }, { - "epoch": 1.43, - "learning_rate": 8.624294312626444e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019017344037160978, + "loss": 0.0172, "step": 282460 }, { - "epoch": 1.43, - "learning_rate": 8.623537543325042e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.00019016955215523832, + "loss": 0.0135, "step": 282470 }, { - "epoch": 1.43, - "learning_rate": 8.622780774023642e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.00019016566393886684, + "loss": 0.0144, "step": 282480 }, { - "epoch": 1.43, - "learning_rate": 8.622024004722239e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.0001901617757224954, + "loss": 0.0167, "step": 282490 }, { - "epoch": 1.43, - "learning_rate": 8.621267235420838e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019015788750612392, + "loss": 0.0137, "step": 282500 }, { - "epoch": 1.43, - "learning_rate": 8.620510466119436e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.00019015399928975246, + "loss": 0.0149, "step": 282510 }, { - "epoch": 1.43, - "learning_rate": 8.619753696818036e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019015011107338098, + "loss": 0.0149, "step": 282520 }, { - "epoch": 1.43, - "learning_rate": 8.618996927516635e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019014622285700954, + "loss": 0.0138, "step": 282530 }, { - "epoch": 1.43, - "learning_rate": 8.618240158215233e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00019014233464063806, + "loss": 0.0138, "step": 282540 }, { - "epoch": 1.43, - "learning_rate": 8.617483388913833e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.0001901384464242666, + "loss": 0.0146, "step": 282550 }, { - "epoch": 1.43, - "learning_rate": 8.616726619612432e-05, - "loss": 0.0066, + "epoch": 0.73, + "learning_rate": 0.00019013455820789512, + "loss": 0.0116, "step": 282560 }, { - "epoch": 1.43, - "learning_rate": 8.61596985031103e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019013066999152368, + "loss": 0.0157, "step": 282570 }, { - "epoch": 1.43, - "learning_rate": 8.61521308100963e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00019012678177515223, + "loss": 0.015, "step": 282580 }, { - "epoch": 1.43, - "learning_rate": 8.614456311708228e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019012289355878074, + "loss": 0.0146, "step": 282590 }, { - "epoch": 1.43, - "learning_rate": 8.613699542406828e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00019011900534240928, + "loss": 0.0172, "step": 282600 }, { - "epoch": 1.43, - "learning_rate": 8.612942773105427e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.0001901151171260378, + "loss": 0.0105, "step": 282610 }, { - "epoch": 1.43, - "learning_rate": 8.612186003804025e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019011122890966636, + "loss": 0.0162, "step": 282620 }, { - "epoch": 1.43, - "learning_rate": 8.611429234502625e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00019010734069329488, + "loss": 0.0174, "step": 282630 }, { - "epoch": 1.43, - "learning_rate": 8.610672465201224e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00019010345247692342, + "loss": 0.0159, "step": 282640 }, { - "epoch": 1.43, - "learning_rate": 8.609915695899822e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019009956426055194, + "loss": 0.0173, "step": 282650 }, { - "epoch": 1.43, - "learning_rate": 8.609158926598422e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.0001900956760441805, + "loss": 0.0162, "step": 282660 }, { - "epoch": 1.43, - "learning_rate": 8.60840215729702e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019009178782780902, + "loss": 0.0158, "step": 282670 }, { - "epoch": 1.43, - "learning_rate": 8.60764538799562e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00019008789961143756, + "loss": 0.0133, "step": 282680 }, { - "epoch": 1.43, - "learning_rate": 8.606888618694219e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019008401139506608, + "loss": 0.015, "step": 282690 }, { - "epoch": 1.43, - "learning_rate": 8.606131849392817e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00019008012317869464, + "loss": 0.0128, "step": 282700 }, { - "epoch": 1.43, - "learning_rate": 8.605375080091417e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019007623496232316, + "loss": 0.0198, "step": 282710 }, { - "epoch": 1.43, - "learning_rate": 8.604618310790016e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.0001900723467459517, + "loss": 0.0139, "step": 282720 }, { - "epoch": 1.43, - "learning_rate": 8.603861541488614e-05, - "loss": 0.009, + "epoch": 0.73, + "learning_rate": 0.00019006845852958021, + "loss": 0.0136, "step": 282730 }, { - "epoch": 1.43, - "learning_rate": 8.603104772187214e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00019006457031320878, + "loss": 0.0149, "step": 282740 }, { - "epoch": 1.43, - "learning_rate": 8.602348002885813e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019006068209683732, + "loss": 0.0208, "step": 282750 }, { - "epoch": 1.43, - "learning_rate": 8.601591233584412e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019005679388046584, + "loss": 0.0158, "step": 282760 }, { - "epoch": 1.43, - "learning_rate": 8.600834464283011e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00019005290566409438, + "loss": 0.0135, "step": 282770 }, { - "epoch": 1.43, - "learning_rate": 8.600077694981609e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00019004901744772292, + "loss": 0.0143, "step": 282780 }, { - "epoch": 1.43, - "learning_rate": 8.599320925680209e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.00019004512923135146, + "loss": 0.0169, "step": 282790 }, { - "epoch": 1.43, - "learning_rate": 8.598564156378808e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00019004124101497998, + "loss": 0.0147, "step": 282800 }, { - "epoch": 1.43, - "learning_rate": 8.597807387077406e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00019003735279860852, + "loss": 0.0179, "step": 282810 }, { - "epoch": 1.43, - "learning_rate": 8.597050617776006e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00019003346458223706, + "loss": 0.0153, "step": 282820 }, { - "epoch": 1.43, - "learning_rate": 8.596293848474605e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.0001900295763658656, + "loss": 0.0148, "step": 282830 }, { - "epoch": 1.43, - "learning_rate": 8.595537079173203e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019002568814949412, + "loss": 0.0153, "step": 282840 }, { - "epoch": 1.43, - "learning_rate": 8.594780309871803e-05, - "loss": 0.0053, + "epoch": 0.73, + "learning_rate": 0.00019002179993312266, + "loss": 0.0141, "step": 282850 }, { - "epoch": 1.43, - "learning_rate": 8.594023540570401e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00019001791171675117, + "loss": 0.0137, "step": 282860 }, { - "epoch": 1.43, - "learning_rate": 8.593266771269e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00019001402350037974, + "loss": 0.0179, "step": 282870 }, { - "epoch": 1.43, - "learning_rate": 8.5925100019676e-05, - "loss": 0.0084, + "epoch": 0.73, + "learning_rate": 0.00019001013528400826, + "loss": 0.0119, "step": 282880 }, { - "epoch": 1.43, - "learning_rate": 8.591753232666198e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.0001900062470676368, + "loss": 0.0169, "step": 282890 }, { - "epoch": 1.43, - "learning_rate": 8.590996463364798e-05, - "loss": 0.0077, + "epoch": 0.73, + "learning_rate": 0.00019000235885126531, + "loss": 0.0175, "step": 282900 }, { - "epoch": 1.43, - "learning_rate": 8.590239694063397e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00018999847063489388, + "loss": 0.0166, "step": 282910 }, { - "epoch": 1.43, - "learning_rate": 8.589482924761995e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00018999458241852242, + "loss": 0.0143, "step": 282920 }, { - "epoch": 1.43, - "learning_rate": 8.588726155460595e-05, - "loss": 0.0072, + "epoch": 0.73, + "learning_rate": 0.00018999069420215094, + "loss": 0.0175, "step": 282930 }, { - "epoch": 1.43, - "learning_rate": 8.587969386159193e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00018998680598577945, + "loss": 0.0133, "step": 282940 }, { - "epoch": 1.43, - "learning_rate": 8.587212616857793e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00018998291776940802, + "loss": 0.0127, "step": 282950 }, { - "epoch": 1.43, - "learning_rate": 8.586455847556392e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00018997902955303656, + "loss": 0.0162, "step": 282960 }, { - "epoch": 1.43, - "learning_rate": 8.58569907825499e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00018997514133666508, + "loss": 0.0181, "step": 282970 }, { - "epoch": 1.43, - "learning_rate": 8.58494230895359e-05, - "loss": 0.0056, + "epoch": 0.73, + "learning_rate": 0.00018997125312029362, + "loss": 0.0156, "step": 282980 }, { - "epoch": 1.43, - "learning_rate": 8.584185539652189e-05, - "loss": 0.0069, + "epoch": 0.73, + "learning_rate": 0.00018996736490392216, + "loss": 0.0151, "step": 282990 }, { - "epoch": 1.43, - "learning_rate": 8.583428770350787e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.0001899634766875507, + "loss": 0.0129, "step": 283000 }, { - "epoch": 1.43, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.005669817794114351, - "eval_runtime": 115.6754, - "eval_samples_per_second": 17.29, - "eval_steps_per_second": 4.322, + "epoch": 0.73, + "eval_cer": 0.8817348779726539, + "eval_loss": 0.010007109493017197, + "eval_runtime": 108.1539, + "eval_samples_per_second": 18.492, + "eval_steps_per_second": 4.623, "step": 283000 }, { - "epoch": 1.43, - "learning_rate": 8.582672001049387e-05, - "loss": 0.01, + "epoch": 0.73, + "learning_rate": 0.00018995958847117922, + "loss": 0.0133, "step": 283010 }, { - "epoch": 1.43, - "learning_rate": 8.581915231747985e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00018995570025480776, + "loss": 0.0122, "step": 283020 }, { - "epoch": 1.43, - "learning_rate": 8.581158462446584e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.0001899518120384363, + "loss": 0.0172, "step": 283030 }, { - "epoch": 1.43, - "learning_rate": 8.580401693145184e-05, - "loss": 0.007, + "epoch": 0.73, + "learning_rate": 0.00018994792382206484, + "loss": 0.014, "step": 283040 }, { - "epoch": 1.43, - "learning_rate": 8.579644923843782e-05, - "loss": 0.0098, + "epoch": 0.73, + "learning_rate": 0.00018994403560569336, + "loss": 0.0189, "step": 283050 }, { - "epoch": 1.43, - "learning_rate": 8.578888154542382e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.0001899401473893219, + "loss": 0.0127, "step": 283060 }, { - "epoch": 1.43, - "learning_rate": 8.578131385240981e-05, - "loss": 0.0091, + "epoch": 0.73, + "learning_rate": 0.00018993625917295047, + "loss": 0.0132, "step": 283070 }, { - "epoch": 1.43, - "learning_rate": 8.577374615939579e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00018993237095657898, + "loss": 0.0149, "step": 283080 }, { - "epoch": 1.43, - "learning_rate": 8.576617846638179e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00018992848274020752, + "loss": 0.0166, "step": 283090 }, { - "epoch": 1.43, - "learning_rate": 8.575861077336777e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00018992459452383604, + "loss": 0.0141, "step": 283100 }, { - "epoch": 1.43, - "learning_rate": 8.575104308035376e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00018992070630746455, + "loss": 0.0146, "step": 283110 }, { - "epoch": 1.43, - "learning_rate": 8.574347538733973e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00018991681809109312, + "loss": 0.0183, "step": 283120 }, { - "epoch": 1.43, - "learning_rate": 8.573590769432573e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.00018991292987472166, + "loss": 0.0169, "step": 283130 }, { - "epoch": 1.43, - "learning_rate": 8.572834000131172e-05, - "loss": 0.0102, + "epoch": 0.73, + "learning_rate": 0.00018990904165835018, + "loss": 0.0137, "step": 283140 }, { - "epoch": 1.43, - "learning_rate": 8.57207723082977e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00018990515344197872, + "loss": 0.0177, "step": 283150 }, { - "epoch": 1.43, - "learning_rate": 8.57132046152837e-05, - "loss": 0.008, + "epoch": 0.73, + "learning_rate": 0.00018990126522560726, + "loss": 0.0156, "step": 283160 }, { - "epoch": 1.43, - "learning_rate": 8.57056369222697e-05, - "loss": 0.0056, + "epoch": 0.73, + "learning_rate": 0.0001898973770092358, + "loss": 0.0139, "step": 283170 }, { - "epoch": 1.43, - "learning_rate": 8.569806922925567e-05, - "loss": 0.0093, + "epoch": 0.73, + "learning_rate": 0.00018989348879286432, + "loss": 0.0159, "step": 283180 }, { - "epoch": 1.43, - "learning_rate": 8.569050153624167e-05, - "loss": 0.0057, + "epoch": 0.73, + "learning_rate": 0.00018988960057649286, + "loss": 0.0104, "step": 283190 }, { - "epoch": 1.43, - "learning_rate": 8.568293384322766e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.0001898857123601214, + "loss": 0.0133, "step": 283200 }, { - "epoch": 1.43, - "learning_rate": 8.567536615021365e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00018988182414374994, + "loss": 0.0115, "step": 283210 }, { - "epoch": 1.43, - "learning_rate": 8.566779845719964e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00018987793592737846, + "loss": 0.0191, "step": 283220 }, { - "epoch": 1.43, - "learning_rate": 8.566023076418562e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.000189874047711007, + "loss": 0.0134, "step": 283230 }, { - "epoch": 1.43, - "learning_rate": 8.565266307117162e-05, - "loss": 0.0067, + "epoch": 0.73, + "learning_rate": 0.00018987015949463557, + "loss": 0.012, "step": 283240 }, { - "epoch": 1.43, - "learning_rate": 8.564509537815761e-05, - "loss": 0.0101, + "epoch": 0.73, + "learning_rate": 0.00018986627127826408, + "loss": 0.0124, "step": 283250 }, { - "epoch": 1.43, - "learning_rate": 8.56375276851436e-05, - "loss": 0.0059, + "epoch": 0.73, + "learning_rate": 0.0001898623830618926, + "loss": 0.0152, "step": 283260 }, { - "epoch": 1.43, - "learning_rate": 8.562995999212959e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00018985849484552114, + "loss": 0.0151, "step": 283270 }, { - "epoch": 1.43, - "learning_rate": 8.562239229911558e-05, - "loss": 0.0073, + "epoch": 0.73, + "learning_rate": 0.0001898546066291497, + "loss": 0.0162, "step": 283280 }, { - "epoch": 1.43, - "learning_rate": 8.561482460610157e-05, - "loss": 0.0074, + "epoch": 0.73, + "learning_rate": 0.00018985071841277822, + "loss": 0.0147, "step": 283290 }, { - "epoch": 1.43, - "learning_rate": 8.560725691308756e-05, - "loss": 0.0044, + "epoch": 0.73, + "learning_rate": 0.00018984683019640676, + "loss": 0.0144, "step": 283300 }, { - "epoch": 1.43, - "learning_rate": 8.559968922007354e-05, - "loss": 0.0089, + "epoch": 0.73, + "learning_rate": 0.00018984294198003528, + "loss": 0.0128, "step": 283310 }, { - "epoch": 1.43, - "learning_rate": 8.559212152705954e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00018983905376366385, + "loss": 0.013, "step": 283320 }, { - "epoch": 1.43, - "learning_rate": 8.558455383404553e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00018983516554729236, + "loss": 0.0139, "step": 283330 }, { - "epoch": 1.43, - "learning_rate": 8.557698614103151e-05, - "loss": 0.0064, + "epoch": 0.73, + "learning_rate": 0.0001898312773309209, + "loss": 0.0138, "step": 283340 }, { - "epoch": 1.43, - "learning_rate": 8.556941844801751e-05, - "loss": 0.0078, + "epoch": 0.73, + "learning_rate": 0.00018982738911454942, + "loss": 0.0133, "step": 283350 }, { - "epoch": 1.43, - "learning_rate": 8.55618507550035e-05, - "loss": 0.0079, + "epoch": 0.73, + "learning_rate": 0.00018982350089817796, + "loss": 0.0121, "step": 283360 }, { - "epoch": 1.43, - "learning_rate": 8.555428306198948e-05, - "loss": 0.0071, + "epoch": 0.73, + "learning_rate": 0.0001898196126818065, + "loss": 0.0141, "step": 283370 }, { - "epoch": 1.43, - "learning_rate": 8.554671536897548e-05, - "loss": 0.0076, + "epoch": 0.73, + "learning_rate": 0.00018981572446543504, + "loss": 0.0135, "step": 283380 }, { - "epoch": 1.43, - "learning_rate": 8.553914767596146e-05, - "loss": 0.0082, + "epoch": 0.73, + "learning_rate": 0.00018981183624906356, + "loss": 0.0146, "step": 283390 }, { - "epoch": 1.43, - "learning_rate": 8.553157998294746e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.0001898079480326921, + "loss": 0.0197, "step": 283400 }, { - "epoch": 1.43, - "learning_rate": 8.552401228993345e-05, - "loss": 0.0062, + "epoch": 0.73, + "learning_rate": 0.00018980405981632064, + "loss": 0.019, "step": 283410 }, { - "epoch": 1.43, - "learning_rate": 8.551644459691943e-05, - "loss": 0.0094, + "epoch": 0.73, + "learning_rate": 0.00018980017159994918, + "loss": 0.0171, "step": 283420 }, { - "epoch": 1.43, - "learning_rate": 8.550887690390543e-05, - "loss": 0.0075, + "epoch": 0.73, + "learning_rate": 0.0001897962833835777, + "loss": 0.0189, "step": 283430 }, { - "epoch": 1.43, - "learning_rate": 8.550130921089142e-05, - "loss": 0.0068, + "epoch": 0.73, + "learning_rate": 0.00018979239516720624, + "loss": 0.0136, "step": 283440 }, { - "epoch": 1.43, - "learning_rate": 8.54937415178774e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.0001897885069508348, + "loss": 0.0114, "step": 283450 }, { - "epoch": 1.43, - "learning_rate": 8.54861738248634e-05, - "loss": 0.0087, + "epoch": 0.73, + "learning_rate": 0.00018978461873446332, + "loss": 0.0123, "step": 283460 }, { - "epoch": 1.43, - "learning_rate": 8.547860613184938e-05, - "loss": 0.0081, + "epoch": 0.73, + "learning_rate": 0.00018978073051809186, + "loss": 0.0112, "step": 283470 }, { - "epoch": 1.43, - "learning_rate": 8.547103843883538e-05, - "loss": 0.0083, + "epoch": 0.73, + "learning_rate": 0.00018977684230172038, + "loss": 0.0156, "step": 283480 }, { - "epoch": 1.43, - "learning_rate": 8.546347074582137e-05, - "loss": 0.0088, + "epoch": 0.73, + "learning_rate": 0.00018977295408534895, + "loss": 0.0176, "step": 283490 }, { - "epoch": 1.43, - "learning_rate": 8.545590305280735e-05, - "loss": 0.0065, + "epoch": 0.73, + "learning_rate": 0.00018976906586897746, + "loss": 0.0131, "step": 283500 }, { - "epoch": 1.43, - "learning_rate": 8.544833535979335e-05, - "loss": 0.0096, + "epoch": 0.73, + "learning_rate": 0.000189765177652606, + "loss": 0.0154, "step": 283510 }, { - "epoch": 1.43, - "learning_rate": 8.544076766677934e-05, - "loss": 0.0085, + "epoch": 0.73, + "learning_rate": 0.00018976128943623452, + "loss": 0.0162, "step": 283520 }, { - "epoch": 1.43, - "learning_rate": 8.543319997376532e-05, - "loss": 0.0063, + "epoch": 0.73, + "learning_rate": 0.00018975740121986308, + "loss": 0.0183, "step": 283530 }, { - "epoch": 1.43, - "learning_rate": 8.542563228075132e-05, - "loss": 0.006, + "epoch": 0.73, + "learning_rate": 0.0001897535130034916, + "loss": 0.0169, "step": 283540 }, { - "epoch": 1.43, - "learning_rate": 8.54180645877373e-05, - "loss": 0.005, + "epoch": 0.74, + "learning_rate": 0.00018974962478712014, + "loss": 0.0125, "step": 283550 }, { - "epoch": 1.43, - "learning_rate": 8.54104968947233e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018974573657074866, + "loss": 0.0142, "step": 283560 }, { - "epoch": 1.43, - "learning_rate": 8.540292920170929e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018974184835437722, + "loss": 0.0153, "step": 283570 }, { - "epoch": 1.43, - "learning_rate": 8.539536150869527e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018973796013800574, + "loss": 0.0125, "step": 283580 }, { - "epoch": 1.43, - "learning_rate": 8.538779381568127e-05, - "loss": 0.0055, + "epoch": 0.74, + "learning_rate": 0.00018973407192163428, + "loss": 0.0197, "step": 283590 }, { - "epoch": 1.43, - "learning_rate": 8.538022612266726e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.0001897301837052628, + "loss": 0.0154, "step": 283600 }, { - "epoch": 1.43, - "learning_rate": 8.537265842965324e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018972629548889134, + "loss": 0.0113, "step": 283610 }, { - "epoch": 1.43, - "learning_rate": 8.536509073663924e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.0001897224072725199, + "loss": 0.0133, "step": 283620 }, { - "epoch": 1.43, - "learning_rate": 8.535752304362522e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018971851905614842, + "loss": 0.0173, "step": 283630 }, { - "epoch": 1.43, - "learning_rate": 8.534995535061121e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018971463083977696, + "loss": 0.0144, "step": 283640 }, { - "epoch": 1.43, - "learning_rate": 8.534238765759721e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018971074262340548, + "loss": 0.0145, "step": 283650 }, { - "epoch": 1.43, - "learning_rate": 8.533481996458319e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018970685440703404, + "loss": 0.0151, "step": 283660 }, { - "epoch": 1.43, - "learning_rate": 8.532725227156919e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018970296619066256, + "loss": 0.0177, "step": 283670 }, { - "epoch": 1.43, - "learning_rate": 8.531968457855518e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.0001896990779742911, + "loss": 0.0201, "step": 283680 }, { - "epoch": 1.43, - "learning_rate": 8.531211688554116e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018969518975791962, + "loss": 0.0166, "step": 283690 }, { - "epoch": 1.43, - "learning_rate": 8.530454919252716e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.00018969130154154818, + "loss": 0.0192, "step": 283700 }, { - "epoch": 1.43, - "learning_rate": 8.529698149951314e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.0001896874133251767, + "loss": 0.0135, "step": 283710 }, { - "epoch": 1.43, - "learning_rate": 8.528941380649913e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018968352510880524, + "loss": 0.0123, "step": 283720 }, { - "epoch": 1.43, - "learning_rate": 8.528184611348513e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018967963689243375, + "loss": 0.0144, "step": 283730 }, { - "epoch": 1.43, - "learning_rate": 8.527427842047111e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018967574867606232, + "loss": 0.0155, "step": 283740 }, { - "epoch": 1.43, - "learning_rate": 8.526671072745709e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018967186045969084, + "loss": 0.0155, "step": 283750 }, { - "epoch": 1.43, - "learning_rate": 8.525914303444307e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.00018966797224331938, + "loss": 0.0153, "step": 283760 }, { - "epoch": 1.43, - "learning_rate": 8.525157534142907e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.0001896640840269479, + "loss": 0.0228, "step": 283770 }, { - "epoch": 1.43, - "learning_rate": 8.524400764841506e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018966019581057646, + "loss": 0.0165, "step": 283780 }, { - "epoch": 1.43, - "learning_rate": 8.523643995540104e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.000189656307594205, + "loss": 0.0113, "step": 283790 }, { - "epoch": 1.43, - "learning_rate": 8.522887226238704e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018965241937783352, + "loss": 0.0148, "step": 283800 }, { - "epoch": 1.43, - "learning_rate": 8.522130456937303e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018964853116146203, + "loss": 0.0123, "step": 283810 }, { - "epoch": 1.43, - "learning_rate": 8.521373687635902e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.0001896446429450906, + "loss": 0.0161, "step": 283820 }, { - "epoch": 1.43, - "learning_rate": 8.520616918334501e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018964075472871914, + "loss": 0.0175, "step": 283830 }, { - "epoch": 1.43, - "learning_rate": 8.519860149033099e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018963686651234766, + "loss": 0.0148, "step": 283840 }, { - "epoch": 1.43, - "learning_rate": 8.519103379731699e-05, - "loss": 0.0055, + "epoch": 0.74, + "learning_rate": 0.0001896329782959762, + "loss": 0.0123, "step": 283850 }, { - "epoch": 1.43, - "learning_rate": 8.518346610430298e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018962909007960471, + "loss": 0.0199, "step": 283860 }, { - "epoch": 1.43, - "learning_rate": 8.517589841128896e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018962520186323328, + "loss": 0.0151, "step": 283870 }, { - "epoch": 1.43, - "learning_rate": 8.516833071827496e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.0001896213136468618, + "loss": 0.0154, "step": 283880 }, { - "epoch": 1.43, - "learning_rate": 8.516076302526095e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018961742543049034, + "loss": 0.0162, "step": 283890 }, { - "epoch": 1.43, - "learning_rate": 8.515319533224693e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.00018961353721411885, + "loss": 0.0185, "step": 283900 }, { - "epoch": 1.43, - "learning_rate": 8.514562763923293e-05, - "loss": 0.0061, + "epoch": 0.74, + "learning_rate": 0.00018960964899774742, + "loss": 0.017, "step": 283910 }, { - "epoch": 1.43, - "learning_rate": 8.513805994621891e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018960576078137594, + "loss": 0.015, "step": 283920 }, { - "epoch": 1.43, - "learning_rate": 8.51304922532049e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018960187256500448, + "loss": 0.0139, "step": 283930 }, { - "epoch": 1.43, - "learning_rate": 8.51229245601909e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.000189597984348633, + "loss": 0.0149, "step": 283940 }, { - "epoch": 1.43, - "learning_rate": 8.511535686717688e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018959409613226156, + "loss": 0.0108, "step": 283950 }, { - "epoch": 1.43, - "learning_rate": 8.510778917416288e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.0001895902079158901, + "loss": 0.0158, "step": 283960 }, { - "epoch": 1.43, - "learning_rate": 8.510022148114887e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018958631969951862, + "loss": 0.0154, "step": 283970 }, { - "epoch": 1.43, - "learning_rate": 8.509265378813485e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018958243148314713, + "loss": 0.0139, "step": 283980 }, { - "epoch": 1.43, - "learning_rate": 8.508508609512085e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.0001895785432667757, + "loss": 0.016, "step": 283990 }, { - "epoch": 1.43, - "learning_rate": 8.507751840210683e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018957465505040424, + "loss": 0.0152, "step": 284000 }, { - "epoch": 1.43, - "eval_cer": 0.914452788772905, - "eval_loss": 0.005701255518943071, - "eval_runtime": 115.7531, - "eval_samples_per_second": 17.278, - "eval_steps_per_second": 4.32, + "epoch": 0.74, + "eval_cer": 0.8817432757942589, + "eval_loss": 0.009913179092109203, + "eval_runtime": 108.0964, + "eval_samples_per_second": 18.502, + "eval_steps_per_second": 4.626, "step": 284000 }, { - "epoch": 1.43, - "learning_rate": 8.506995070909283e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018957076683403276, + "loss": 0.0116, "step": 284010 }, { - "epoch": 1.43, - "learning_rate": 8.506238301607882e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.0001895668786176613, + "loss": 0.0192, "step": 284020 }, { - "epoch": 1.43, - "learning_rate": 8.50548153230648e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018956299040128984, + "loss": 0.0149, "step": 284030 }, { - "epoch": 1.43, - "learning_rate": 8.50472476300508e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018955910218491838, + "loss": 0.0188, "step": 284040 }, { - "epoch": 1.43, - "learning_rate": 8.503967993703679e-05, - "loss": 0.0051, + "epoch": 0.74, + "learning_rate": 0.0001895552139685469, + "loss": 0.011, "step": 284050 }, { - "epoch": 1.43, - "learning_rate": 8.503211224402277e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018955132575217544, + "loss": 0.0142, "step": 284060 }, { - "epoch": 1.43, - "learning_rate": 8.502454455100877e-05, - "loss": 0.0053, + "epoch": 0.74, + "learning_rate": 0.00018954743753580398, + "loss": 0.0119, "step": 284070 }, { - "epoch": 1.43, - "learning_rate": 8.501697685799475e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.00018954354931943252, + "loss": 0.0151, "step": 284080 }, { - "epoch": 1.43, - "learning_rate": 8.500940916498074e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018953966110306104, + "loss": 0.0141, "step": 284090 }, { - "epoch": 1.43, - "learning_rate": 8.500184147196674e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018953577288668958, + "loss": 0.0162, "step": 284100 }, { - "epoch": 1.43, - "learning_rate": 8.499427377895272e-05, - "loss": 0.0056, + "epoch": 0.74, + "learning_rate": 0.0001895318846703181, + "loss": 0.0142, "step": 284110 }, { - "epoch": 1.43, - "learning_rate": 8.498670608593872e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018952799645394666, + "loss": 0.016, "step": 284120 }, { - "epoch": 1.43, - "learning_rate": 8.497913839292471e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.00018952410823757518, + "loss": 0.0132, "step": 284130 }, { - "epoch": 1.43, - "learning_rate": 8.497157069991069e-05, - "loss": 0.0098, + "epoch": 0.74, + "learning_rate": 0.00018952022002120372, + "loss": 0.0192, "step": 284140 }, { - "epoch": 1.43, - "learning_rate": 8.496400300689669e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018951633180483223, + "loss": 0.0134, "step": 284150 }, { - "epoch": 1.43, - "learning_rate": 8.495643531388267e-05, - "loss": 0.01, + "epoch": 0.74, + "learning_rate": 0.0001895124435884608, + "loss": 0.0196, "step": 284160 }, { - "epoch": 1.43, - "learning_rate": 8.494886762086866e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018950855537208934, + "loss": 0.0107, "step": 284170 }, { - "epoch": 1.43, - "learning_rate": 8.494129992785466e-05, - "loss": 0.01, + "epoch": 0.74, + "learning_rate": 0.00018950466715571786, + "loss": 0.0164, "step": 284180 }, { - "epoch": 1.43, - "learning_rate": 8.493373223484064e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.0001895007789393464, + "loss": 0.0209, "step": 284190 }, { - "epoch": 1.43, - "learning_rate": 8.492616454182664e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018949689072297494, + "loss": 0.0194, "step": 284200 }, { - "epoch": 1.43, - "learning_rate": 8.491859684881263e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.00018949300250660348, + "loss": 0.0171, "step": 284210 }, { - "epoch": 1.43, - "learning_rate": 8.491102915579861e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.000189489114290232, + "loss": 0.0166, "step": 284220 }, { - "epoch": 1.43, - "learning_rate": 8.490346146278461e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018948522607386054, + "loss": 0.0141, "step": 284230 }, { - "epoch": 1.43, - "learning_rate": 8.48958937697706e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018948133785748908, + "loss": 0.0141, "step": 284240 }, { - "epoch": 1.43, - "learning_rate": 8.488832607675658e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018947744964111762, + "loss": 0.014, "step": 284250 }, { - "epoch": 1.43, - "learning_rate": 8.488075838374258e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018947356142474614, + "loss": 0.0133, "step": 284260 }, { - "epoch": 1.43, - "learning_rate": 8.487319069072856e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018946967320837468, + "loss": 0.0119, "step": 284270 }, { - "epoch": 1.43, - "learning_rate": 8.486562299771456e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018946578499200325, + "loss": 0.0171, "step": 284280 }, { - "epoch": 1.43, - "learning_rate": 8.485805530470055e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018946189677563176, + "loss": 0.0159, "step": 284290 }, { - "epoch": 1.43, - "learning_rate": 8.485048761168653e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018945800855926028, + "loss": 0.02, "step": 284300 }, { - "epoch": 1.43, - "learning_rate": 8.484291991867253e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018945412034288882, + "loss": 0.0154, "step": 284310 }, { - "epoch": 1.43, - "learning_rate": 8.483535222565852e-05, - "loss": 0.0049, + "epoch": 0.74, + "learning_rate": 0.00018945023212651739, + "loss": 0.0133, "step": 284320 }, { - "epoch": 1.43, - "learning_rate": 8.48277845326445e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.0001894463439101459, + "loss": 0.017, "step": 284330 }, { - "epoch": 1.43, - "learning_rate": 8.48202168396305e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018944245569377444, + "loss": 0.0149, "step": 284340 }, { - "epoch": 1.43, - "learning_rate": 8.481264914661648e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018943856747740296, + "loss": 0.0153, "step": 284350 }, { - "epoch": 1.43, - "learning_rate": 8.480508145360247e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.0001894346792610315, + "loss": 0.0118, "step": 284360 }, { - "epoch": 1.43, - "learning_rate": 8.479751376058847e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018943079104466004, + "loss": 0.0158, "step": 284370 }, { - "epoch": 1.43, - "learning_rate": 8.478994606757444e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018942690282828858, + "loss": 0.0148, "step": 284380 }, { - "epoch": 1.43, - "learning_rate": 8.478237837456043e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.0001894230146119171, + "loss": 0.0133, "step": 284390 }, { - "epoch": 1.43, - "learning_rate": 8.477481068154641e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018941912639554564, + "loss": 0.0149, "step": 284400 }, { - "epoch": 1.43, - "learning_rate": 8.476724298853241e-05, - "loss": 0.01, + "epoch": 0.74, + "learning_rate": 0.00018941523817917418, + "loss": 0.0163, "step": 284410 }, { - "epoch": 1.43, - "learning_rate": 8.47596752955184e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018941134996280272, + "loss": 0.0124, "step": 284420 }, { - "epoch": 1.43, - "learning_rate": 8.475210760250439e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018940746174643124, + "loss": 0.012, "step": 284430 }, { - "epoch": 1.44, - "learning_rate": 8.474453990949038e-05, - "loss": 0.0099, + "epoch": 0.74, + "learning_rate": 0.00018940357353005978, + "loss": 0.0135, "step": 284440 }, { - "epoch": 1.44, - "learning_rate": 8.473697221647636e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018939968531368832, + "loss": 0.0139, "step": 284450 }, { - "epoch": 1.44, - "learning_rate": 8.472940452346236e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018939579709731686, + "loss": 0.0129, "step": 284460 }, { - "epoch": 1.44, - "learning_rate": 8.472183683044835e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018939190888094538, + "loss": 0.0142, "step": 284470 }, { - "epoch": 1.44, - "learning_rate": 8.471426913743433e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018938802066457392, + "loss": 0.0157, "step": 284480 }, { - "epoch": 1.44, - "learning_rate": 8.470670144442033e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018938413244820249, + "loss": 0.0198, "step": 284490 }, { - "epoch": 1.44, - "learning_rate": 8.469913375140632e-05, - "loss": 0.0105, + "epoch": 0.74, + "learning_rate": 0.000189380244231831, + "loss": 0.015, "step": 284500 }, { - "epoch": 1.44, - "learning_rate": 8.46915660583923e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018937635601545954, + "loss": 0.0144, "step": 284510 }, { - "epoch": 1.44, - "learning_rate": 8.46839983653783e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018937246779908806, + "loss": 0.0148, "step": 284520 }, { - "epoch": 1.44, - "learning_rate": 8.467643067236428e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018936857958271663, + "loss": 0.0187, "step": 284530 }, { - "epoch": 1.44, - "learning_rate": 8.466886297935028e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018936469136634514, + "loss": 0.0133, "step": 284540 }, { - "epoch": 1.44, - "learning_rate": 8.466129528633627e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018936080314997368, + "loss": 0.0118, "step": 284550 }, { - "epoch": 1.44, - "learning_rate": 8.465372759332225e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.0001893569149336022, + "loss": 0.0167, "step": 284560 }, { - "epoch": 1.44, - "learning_rate": 8.464615990030825e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018935302671723076, + "loss": 0.0214, "step": 284570 }, { - "epoch": 1.44, - "learning_rate": 8.463859220729424e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018934913850085928, + "loss": 0.0154, "step": 284580 }, { - "epoch": 1.44, - "learning_rate": 8.463102451428022e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018934525028448782, + "loss": 0.0151, "step": 284590 }, { - "epoch": 1.44, - "learning_rate": 8.462345682126622e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018934136206811634, + "loss": 0.0169, "step": 284600 }, { - "epoch": 1.44, - "learning_rate": 8.46158891282522e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018933747385174488, + "loss": 0.0127, "step": 284610 }, { - "epoch": 1.44, - "learning_rate": 8.46083214352382e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018933358563537342, + "loss": 0.0151, "step": 284620 }, { - "epoch": 1.44, - "learning_rate": 8.460075374222419e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018932969741900196, + "loss": 0.0113, "step": 284630 }, { - "epoch": 1.44, - "learning_rate": 8.459318604921017e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018932580920263047, + "loss": 0.0128, "step": 284640 }, { - "epoch": 1.44, - "learning_rate": 8.458561835619617e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018932192098625902, + "loss": 0.0152, "step": 284650 }, { - "epoch": 1.44, - "learning_rate": 8.457805066318216e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018931803276988759, + "loss": 0.0132, "step": 284660 }, { - "epoch": 1.44, - "learning_rate": 8.457048297016814e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.0001893141445535161, + "loss": 0.0149, "step": 284670 }, { - "epoch": 1.44, - "learning_rate": 8.456291527715414e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018931025633714464, + "loss": 0.0133, "step": 284680 }, { - "epoch": 1.44, - "learning_rate": 8.455534758414013e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018930636812077316, + "loss": 0.0139, "step": 284690 }, { - "epoch": 1.44, - "learning_rate": 8.454777989112611e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018930247990440172, + "loss": 0.0145, "step": 284700 }, { - "epoch": 1.44, - "learning_rate": 8.454021219811211e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018929859168803024, + "loss": 0.0145, "step": 284710 }, { - "epoch": 1.44, - "learning_rate": 8.453264450509809e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018929470347165878, + "loss": 0.0166, "step": 284720 }, { - "epoch": 1.44, - "learning_rate": 8.452507681208409e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.0001892908152552873, + "loss": 0.0154, "step": 284730 }, { - "epoch": 1.44, - "learning_rate": 8.451750911907008e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018928692703891586, + "loss": 0.0141, "step": 284740 }, { - "epoch": 1.44, - "learning_rate": 8.450994142605606e-05, - "loss": 0.0058, + "epoch": 0.74, + "learning_rate": 0.00018928303882254438, + "loss": 0.0159, "step": 284750 }, { - "epoch": 1.44, - "learning_rate": 8.450237373304206e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018927915060617292, + "loss": 0.0129, "step": 284760 }, { - "epoch": 1.44, - "learning_rate": 8.449480604002805e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018927526238980143, + "loss": 0.0152, "step": 284770 }, { - "epoch": 1.44, - "learning_rate": 8.448723834701403e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018927137417343, + "loss": 0.0151, "step": 284780 }, { - "epoch": 1.44, - "learning_rate": 8.447967065400003e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018926748595705852, + "loss": 0.0131, "step": 284790 }, { - "epoch": 1.44, - "learning_rate": 8.447210296098601e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018926359774068706, + "loss": 0.0158, "step": 284800 }, { - "epoch": 1.44, - "learning_rate": 8.4464535267972e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018925970952431557, + "loss": 0.0123, "step": 284810 }, { - "epoch": 1.44, - "learning_rate": 8.4456967574958e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018925582130794414, + "loss": 0.0136, "step": 284820 }, { - "epoch": 1.44, - "learning_rate": 8.444939988194398e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018925193309157268, + "loss": 0.0143, "step": 284830 }, { - "epoch": 1.44, - "learning_rate": 8.444183218892998e-05, - "loss": 0.0099, + "epoch": 0.74, + "learning_rate": 0.0001892480448752012, + "loss": 0.0164, "step": 284840 }, { - "epoch": 1.44, - "learning_rate": 8.443426449591597e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018924415665882971, + "loss": 0.0176, "step": 284850 }, { - "epoch": 1.44, - "learning_rate": 8.442669680290195e-05, - "loss": 0.0056, + "epoch": 0.74, + "learning_rate": 0.00018924026844245826, + "loss": 0.0154, "step": 284860 }, { - "epoch": 1.44, - "learning_rate": 8.441912910988795e-05, - "loss": 0.0116, + "epoch": 0.74, + "learning_rate": 0.00018923638022608682, + "loss": 0.0147, "step": 284870 }, { - "epoch": 1.44, - "learning_rate": 8.441156141687393e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018923249200971534, + "loss": 0.0141, "step": 284880 }, { - "epoch": 1.44, - "learning_rate": 8.440399372385992e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018922860379334388, + "loss": 0.0113, "step": 284890 }, { - "epoch": 1.44, - "learning_rate": 8.439642603084592e-05, - "loss": 0.0103, + "epoch": 0.74, + "learning_rate": 0.0001892247155769724, + "loss": 0.0183, "step": 284900 }, { - "epoch": 1.44, - "learning_rate": 8.43888583378319e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.00018922082736060096, + "loss": 0.0157, "step": 284910 }, { - "epoch": 1.44, - "learning_rate": 8.43812906448179e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018921693914422948, + "loss": 0.0129, "step": 284920 }, { - "epoch": 1.44, - "learning_rate": 8.437372295180389e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018921305092785802, + "loss": 0.0134, "step": 284930 }, { - "epoch": 1.44, - "learning_rate": 8.436615525878987e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018920916271148653, + "loss": 0.0157, "step": 284940 }, { - "epoch": 1.44, - "learning_rate": 8.435858756577587e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.0001892052744951151, + "loss": 0.0172, "step": 284950 }, { - "epoch": 1.44, - "learning_rate": 8.435101987276185e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018920138627874362, + "loss": 0.0147, "step": 284960 }, { - "epoch": 1.44, - "learning_rate": 8.434345217974784e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018919749806237216, + "loss": 0.0133, "step": 284970 }, { - "epoch": 1.44, - "learning_rate": 8.433588448673384e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018919360984600067, + "loss": 0.0137, "step": 284980 }, { - "epoch": 1.44, - "learning_rate": 8.432831679371982e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018918972162962924, + "loss": 0.0158, "step": 284990 }, { - "epoch": 1.44, - "learning_rate": 8.43207491007058e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018918583341325776, + "loss": 0.0123, "step": 285000 }, { - "epoch": 1.44, - "eval_cer": 0.9144430848116509, - "eval_loss": 0.00582539290189743, - "eval_runtime": 115.8203, - "eval_samples_per_second": 17.268, - "eval_steps_per_second": 4.317, + "epoch": 0.74, + "eval_cer": 0.881704085960102, + "eval_loss": 0.010136989876627922, + "eval_runtime": 108.2121, + "eval_samples_per_second": 18.482, + "eval_steps_per_second": 4.621, "step": 285000 }, { - "epoch": 1.44, - "learning_rate": 8.431318140769178e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.0001891819451968863, + "loss": 0.0153, "step": 285010 }, { - "epoch": 1.44, - "learning_rate": 8.430561371467778e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.0001891780569805148, + "loss": 0.0191, "step": 285020 }, { - "epoch": 1.44, - "learning_rate": 8.429804602166377e-05, - "loss": 0.0053, + "epoch": 0.74, + "learning_rate": 0.00018917416876414338, + "loss": 0.0122, "step": 285030 }, { - "epoch": 1.44, - "learning_rate": 8.429047832864975e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018917028054777192, + "loss": 0.0173, "step": 285040 }, { - "epoch": 1.44, - "learning_rate": 8.428291063563575e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018916639233140044, + "loss": 0.0152, "step": 285050 }, { - "epoch": 1.44, - "learning_rate": 8.427534294262173e-05, - "loss": 0.0098, + "epoch": 0.74, + "learning_rate": 0.00018916250411502898, + "loss": 0.013, "step": 285060 }, { - "epoch": 1.44, - "learning_rate": 8.426777524960773e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018915861589865752, + "loss": 0.0147, "step": 285070 }, { - "epoch": 1.44, - "learning_rate": 8.426020755659372e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018915472768228606, + "loss": 0.0144, "step": 285080 }, { - "epoch": 1.44, - "learning_rate": 8.42526398635797e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.00018915083946591458, + "loss": 0.012, "step": 285090 }, { - "epoch": 1.44, - "learning_rate": 8.42450721705657e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018914695124954312, + "loss": 0.0128, "step": 285100 }, { - "epoch": 1.44, - "learning_rate": 8.423750447755169e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018914306303317163, + "loss": 0.0109, "step": 285110 }, { - "epoch": 1.44, - "learning_rate": 8.422993678453767e-05, - "loss": 0.0112, + "epoch": 0.74, + "learning_rate": 0.0001891391748168002, + "loss": 0.0139, "step": 285120 }, { - "epoch": 1.44, - "learning_rate": 8.422236909152367e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018913528660042872, + "loss": 0.0141, "step": 285130 }, { - "epoch": 1.44, - "learning_rate": 8.421480139850966e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018913139838405726, + "loss": 0.0189, "step": 285140 }, { - "epoch": 1.44, - "learning_rate": 8.420723370549565e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018912751016768577, + "loss": 0.0131, "step": 285150 }, { - "epoch": 1.44, - "learning_rate": 8.419966601248164e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018912362195131434, + "loss": 0.0136, "step": 285160 }, { - "epoch": 1.44, - "learning_rate": 8.419209831946762e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.00018911973373494286, + "loss": 0.0153, "step": 285170 }, { - "epoch": 1.44, - "learning_rate": 8.418453062645362e-05, - "loss": 0.0121, + "epoch": 0.74, + "learning_rate": 0.0001891158455185714, + "loss": 0.0143, "step": 285180 }, { - "epoch": 1.44, - "learning_rate": 8.417696293343961e-05, - "loss": 0.0046, + "epoch": 0.74, + "learning_rate": 0.0001891119573021999, + "loss": 0.0158, "step": 285190 }, { - "epoch": 1.44, - "learning_rate": 8.416939524042559e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018910806908582848, + "loss": 0.0168, "step": 285200 }, { - "epoch": 1.44, - "learning_rate": 8.416182754741159e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018910418086945702, + "loss": 0.0103, "step": 285210 }, { - "epoch": 1.44, - "learning_rate": 8.415425985439758e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018910029265308554, + "loss": 0.0174, "step": 285220 }, { - "epoch": 1.44, - "learning_rate": 8.414669216138356e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018909640443671408, + "loss": 0.0146, "step": 285230 }, { - "epoch": 1.44, - "learning_rate": 8.413912446836956e-05, - "loss": 0.0079, + "epoch": 0.74, + "learning_rate": 0.00018909251622034262, + "loss": 0.0175, "step": 285240 }, { - "epoch": 1.44, - "learning_rate": 8.413155677535554e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018908862800397116, + "loss": 0.0131, "step": 285250 }, { - "epoch": 1.44, - "learning_rate": 8.412398908234154e-05, - "loss": 0.0096, + "epoch": 0.74, + "learning_rate": 0.00018908473978759968, + "loss": 0.0175, "step": 285260 }, { - "epoch": 1.44, - "learning_rate": 8.411642138932753e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018908085157122822, + "loss": 0.0138, "step": 285270 }, { - "epoch": 1.44, - "learning_rate": 8.410885369631351e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018907696335485676, + "loss": 0.018, "step": 285280 }, { - "epoch": 1.44, - "learning_rate": 8.410128600329951e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.0001890730751384853, + "loss": 0.015, "step": 285290 }, { - "epoch": 1.44, - "learning_rate": 8.40937183102855e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018906918692211382, + "loss": 0.0135, "step": 285300 }, { - "epoch": 1.44, - "learning_rate": 8.408615061727148e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018906529870574236, + "loss": 0.0168, "step": 285310 }, { - "epoch": 1.44, - "learning_rate": 8.407858292425748e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.0001890614104893709, + "loss": 0.0182, "step": 285320 }, { - "epoch": 1.44, - "learning_rate": 8.407101523124346e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018905752227299944, + "loss": 0.0153, "step": 285330 }, { - "epoch": 1.44, - "learning_rate": 8.406344753822946e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018905363405662796, + "loss": 0.0171, "step": 285340 }, { - "epoch": 1.44, - "learning_rate": 8.405587984521545e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001890497458402565, + "loss": 0.0151, "step": 285350 }, { - "epoch": 1.44, - "learning_rate": 8.404831215220143e-05, - "loss": 0.0053, + "epoch": 0.74, + "learning_rate": 0.000189045857623885, + "loss": 0.0128, "step": 285360 }, { - "epoch": 1.44, - "learning_rate": 8.404074445918743e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018904196940751358, + "loss": 0.0147, "step": 285370 }, { - "epoch": 1.44, - "learning_rate": 8.403317676617342e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018903808119114212, + "loss": 0.0181, "step": 285380 }, { - "epoch": 1.44, - "learning_rate": 8.40256090731594e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018903419297477064, + "loss": 0.0175, "step": 285390 }, { - "epoch": 1.44, - "learning_rate": 8.40180413801454e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018903030475839915, + "loss": 0.0164, "step": 285400 }, { - "epoch": 1.44, - "learning_rate": 8.401047368713138e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018902641654202772, + "loss": 0.0125, "step": 285410 }, { - "epoch": 1.44, - "learning_rate": 8.400290599411737e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018902252832565626, + "loss": 0.0097, "step": 285420 }, { - "epoch": 1.44, - "learning_rate": 8.399533830110337e-05, - "loss": 0.0058, + "epoch": 0.74, + "learning_rate": 0.00018901864010928478, + "loss": 0.0152, "step": 285430 }, { - "epoch": 1.44, - "learning_rate": 8.398777060808935e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018901475189291332, + "loss": 0.0143, "step": 285440 }, { - "epoch": 1.44, - "learning_rate": 8.398020291507535e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018901086367654186, + "loss": 0.0169, "step": 285450 }, { - "epoch": 1.44, - "learning_rate": 8.397263522206134e-05, - "loss": 0.0121, + "epoch": 0.74, + "learning_rate": 0.0001890069754601704, + "loss": 0.0169, "step": 285460 }, { - "epoch": 1.44, - "learning_rate": 8.396506752904732e-05, - "loss": 0.0099, + "epoch": 0.74, + "learning_rate": 0.00018900308724379892, + "loss": 0.0158, "step": 285470 }, { - "epoch": 1.44, - "learning_rate": 8.395749983603332e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018899919902742746, + "loss": 0.0127, "step": 285480 }, { - "epoch": 1.44, - "learning_rate": 8.39499321430193e-05, - "loss": 0.005, + "epoch": 0.74, + "learning_rate": 0.000188995310811056, + "loss": 0.0171, "step": 285490 }, { - "epoch": 1.44, - "learning_rate": 8.39423644500053e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018899142259468454, + "loss": 0.018, "step": 285500 }, { - "epoch": 1.44, - "learning_rate": 8.393479675699129e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018898753437831306, + "loss": 0.0117, "step": 285510 }, { - "epoch": 1.44, - "learning_rate": 8.392722906397727e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.0001889836461619416, + "loss": 0.0164, "step": 285520 }, { - "epoch": 1.44, - "learning_rate": 8.391966137096327e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018897975794557017, + "loss": 0.0163, "step": 285530 }, { - "epoch": 1.44, - "learning_rate": 8.391209367794926e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.00018897586972919868, + "loss": 0.0153, "step": 285540 }, { - "epoch": 1.44, - "learning_rate": 8.390452598493524e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018897198151282722, + "loss": 0.0167, "step": 285550 }, { - "epoch": 1.44, - "learning_rate": 8.389695829192124e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018896809329645574, + "loss": 0.0168, "step": 285560 }, { - "epoch": 1.44, - "learning_rate": 8.388939059890722e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.0001889642050800843, + "loss": 0.0145, "step": 285570 }, { - "epoch": 1.44, - "learning_rate": 8.388182290589321e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018896031686371282, + "loss": 0.0142, "step": 285580 }, { - "epoch": 1.44, - "learning_rate": 8.387425521287921e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018895642864734136, + "loss": 0.0149, "step": 285590 }, { - "epoch": 1.44, - "learning_rate": 8.386668751986519e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018895254043096988, + "loss": 0.0136, "step": 285600 }, { - "epoch": 1.44, - "learning_rate": 8.385911982685118e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018894865221459842, + "loss": 0.0144, "step": 285610 }, { - "epoch": 1.44, - "learning_rate": 8.385155213383718e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018894476399822696, + "loss": 0.0118, "step": 285620 }, { - "epoch": 1.44, - "learning_rate": 8.384398444082315e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.0001889408757818555, + "loss": 0.0169, "step": 285630 }, { - "epoch": 1.44, - "learning_rate": 8.383641674780914e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018893698756548402, + "loss": 0.0126, "step": 285640 }, { - "epoch": 1.44, - "learning_rate": 8.382884905479512e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018893309934911256, + "loss": 0.0146, "step": 285650 }, { - "epoch": 1.44, - "learning_rate": 8.382128136178112e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.0001889292111327411, + "loss": 0.0155, "step": 285660 }, { - "epoch": 1.44, - "learning_rate": 8.381371366876711e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018892532291636964, + "loss": 0.0177, "step": 285670 }, { - "epoch": 1.44, - "learning_rate": 8.38061459757531e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018892143469999815, + "loss": 0.0151, "step": 285680 }, { - "epoch": 1.44, - "learning_rate": 8.379857828273909e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.0001889175464836267, + "loss": 0.0129, "step": 285690 }, { - "epoch": 1.44, - "learning_rate": 8.379101058972507e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018891365826725526, + "loss": 0.0173, "step": 285700 }, { - "epoch": 1.44, - "learning_rate": 8.378344289671107e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018890977005088378, + "loss": 0.0145, "step": 285710 }, { - "epoch": 1.44, - "learning_rate": 8.377587520369706e-05, - "loss": 0.0121, + "epoch": 0.74, + "learning_rate": 0.0001889058818345123, + "loss": 0.0135, "step": 285720 }, { - "epoch": 1.44, - "learning_rate": 8.376830751068304e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018890199361814084, + "loss": 0.0154, "step": 285730 }, { - "epoch": 1.44, - "learning_rate": 8.376073981766904e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.0001888981054017694, + "loss": 0.0122, "step": 285740 }, { - "epoch": 1.44, - "learning_rate": 8.375317212465503e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018889421718539792, + "loss": 0.0136, "step": 285750 }, { - "epoch": 1.44, - "learning_rate": 8.374560443164101e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018889032896902646, + "loss": 0.0147, "step": 285760 }, { - "epoch": 1.44, - "learning_rate": 8.373803673862701e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018888644075265498, + "loss": 0.0113, "step": 285770 }, { - "epoch": 1.44, - "learning_rate": 8.373046904561299e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018888255253628354, + "loss": 0.0143, "step": 285780 }, { - "epoch": 1.44, - "learning_rate": 8.372290135259899e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.00018887866431991206, + "loss": 0.0132, "step": 285790 }, { - "epoch": 1.44, - "learning_rate": 8.371533365958498e-05, - "loss": 0.0058, + "epoch": 0.74, + "learning_rate": 0.0001888747761035406, + "loss": 0.0179, "step": 285800 }, { - "epoch": 1.44, - "learning_rate": 8.370776596657096e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018887088788716911, + "loss": 0.0159, "step": 285810 }, { - "epoch": 1.44, - "learning_rate": 8.370019827355696e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018886699967079766, + "loss": 0.0157, "step": 285820 }, { - "epoch": 1.44, - "learning_rate": 8.369263058054295e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.0001888631114544262, + "loss": 0.0216, "step": 285830 }, { - "epoch": 1.44, - "learning_rate": 8.368506288752893e-05, - "loss": 0.0089, + "epoch": 0.74, + "learning_rate": 0.00018885922323805474, + "loss": 0.0137, "step": 285840 }, { - "epoch": 1.44, - "learning_rate": 8.367749519451493e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018885533502168325, + "loss": 0.0187, "step": 285850 }, { - "epoch": 1.44, - "learning_rate": 8.366992750150091e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.0001888514468053118, + "loss": 0.0165, "step": 285860 }, { - "epoch": 1.44, - "learning_rate": 8.36623598084869e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018884755858894036, + "loss": 0.0125, "step": 285870 }, { - "epoch": 1.44, - "learning_rate": 8.36547921154729e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018884367037256888, + "loss": 0.0096, "step": 285880 }, { - "epoch": 1.44, - "learning_rate": 8.364722442245888e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.0001888397821561974, + "loss": 0.0175, "step": 285890 }, { - "epoch": 1.44, - "learning_rate": 8.363965672944488e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018883589393982594, + "loss": 0.011, "step": 285900 }, { - "epoch": 1.44, - "learning_rate": 8.363208903643087e-05, - "loss": 0.0097, + "epoch": 0.74, + "learning_rate": 0.0001888320057234545, + "loss": 0.0144, "step": 285910 }, { - "epoch": 1.44, - "learning_rate": 8.362452134341685e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018882811750708302, + "loss": 0.0139, "step": 285920 }, { - "epoch": 1.44, - "learning_rate": 8.361695365040285e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018882422929071156, + "loss": 0.0123, "step": 285930 }, { - "epoch": 1.44, - "learning_rate": 8.360938595738883e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018882034107434007, + "loss": 0.0127, "step": 285940 }, { - "epoch": 1.44, - "learning_rate": 8.360181826437482e-05, - "loss": 0.0112, + "epoch": 0.74, + "learning_rate": 0.00018881645285796864, + "loss": 0.0138, "step": 285950 }, { - "epoch": 1.44, - "learning_rate": 8.359425057136082e-05, - "loss": 0.0101, + "epoch": 0.74, + "learning_rate": 0.00018881256464159716, + "loss": 0.012, "step": 285960 }, { - "epoch": 1.44, - "learning_rate": 8.35866828783468e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.0001888086764252257, + "loss": 0.0152, "step": 285970 }, { - "epoch": 1.44, - "learning_rate": 8.35791151853328e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018880478820885421, + "loss": 0.0156, "step": 285980 }, { - "epoch": 1.44, - "learning_rate": 8.357154749231879e-05, - "loss": 0.011, + "epoch": 0.74, + "learning_rate": 0.00018880089999248278, + "loss": 0.015, "step": 285990 }, { - "epoch": 1.44, - "learning_rate": 8.356397979930477e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.0001887970117761113, + "loss": 0.0144, "step": 286000 }, { - "epoch": 1.44, - "eval_cer": 0.914438232831024, - "eval_loss": 0.005684024654328823, - "eval_runtime": 115.553, - "eval_samples_per_second": 17.308, - "eval_steps_per_second": 4.327, + "epoch": 0.74, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.00980143342167139, + "eval_runtime": 107.852, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, "step": 286000 }, { - "epoch": 1.44, - "learning_rate": 8.355641210629077e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018879312355973984, + "loss": 0.0133, "step": 286010 }, { - "epoch": 1.44, - "learning_rate": 8.354884441327675e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018878923534336835, + "loss": 0.0156, "step": 286020 }, { - "epoch": 1.44, - "learning_rate": 8.354127672026274e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018878534712699692, + "loss": 0.0124, "step": 286030 }, { - "epoch": 1.44, - "learning_rate": 8.353370902724874e-05, - "loss": 0.0087, + "epoch": 0.74, + "learning_rate": 0.00018878145891062544, + "loss": 0.0172, "step": 286040 }, { - "epoch": 1.44, - "learning_rate": 8.352614133423472e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018877757069425398, + "loss": 0.0163, "step": 286050 }, { - "epoch": 1.44, - "learning_rate": 8.351857364122072e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.0001887736824778825, + "loss": 0.0118, "step": 286060 }, { - "epoch": 1.44, - "learning_rate": 8.351100594820671e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018876979426151103, + "loss": 0.0091, "step": 286070 }, { - "epoch": 1.44, - "learning_rate": 8.350343825519269e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001887659060451396, + "loss": 0.0165, "step": 286080 }, { - "epoch": 1.44, - "learning_rate": 8.349587056217869e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018876201782876812, + "loss": 0.0164, "step": 286090 }, { - "epoch": 1.44, - "learning_rate": 8.348830286916467e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018875812961239666, + "loss": 0.0143, "step": 286100 }, { - "epoch": 1.44, - "learning_rate": 8.348073517615066e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018875424139602517, + "loss": 0.0163, "step": 286110 }, { - "epoch": 1.44, - "learning_rate": 8.347316748313666e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.00018875035317965374, + "loss": 0.016, "step": 286120 }, { - "epoch": 1.44, - "learning_rate": 8.346559979012264e-05, - "loss": 0.0099, + "epoch": 0.74, + "learning_rate": 0.00018874646496328226, + "loss": 0.0115, "step": 286130 }, { - "epoch": 1.44, - "learning_rate": 8.345803209710863e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.0001887425767469108, + "loss": 0.0146, "step": 286140 }, { - "epoch": 1.44, - "learning_rate": 8.345046440409463e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.0001887386885305393, + "loss": 0.0121, "step": 286150 }, { - "epoch": 1.44, - "learning_rate": 8.344289671108061e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018873480031416788, + "loss": 0.018, "step": 286160 }, { - "epoch": 1.44, - "learning_rate": 8.34353290180666e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.0001887309120977964, + "loss": 0.0166, "step": 286170 }, { - "epoch": 1.44, - "learning_rate": 8.34277613250526e-05, - "loss": 0.0122, + "epoch": 0.74, + "learning_rate": 0.00018872702388142494, + "loss": 0.014, "step": 286180 }, { - "epoch": 1.44, - "learning_rate": 8.342019363203858e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018872313566505345, + "loss": 0.0131, "step": 286190 }, { - "epoch": 1.44, - "learning_rate": 8.341262593902458e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018871924744868202, + "loss": 0.0142, "step": 286200 }, { - "epoch": 1.44, - "learning_rate": 8.340505824601056e-05, - "loss": 0.0048, + "epoch": 0.74, + "learning_rate": 0.00018871535923231054, + "loss": 0.0153, "step": 286210 }, { - "epoch": 1.44, - "learning_rate": 8.339749055299655e-05, - "loss": 0.0088, + "epoch": 0.74, + "learning_rate": 0.00018871147101593908, + "loss": 0.016, "step": 286220 }, { - "epoch": 1.44, - "learning_rate": 8.338992285998255e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001887075827995676, + "loss": 0.0158, "step": 286230 }, { - "epoch": 1.44, - "learning_rate": 8.338235516696853e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018870369458319616, + "loss": 0.0134, "step": 286240 }, { - "epoch": 1.44, - "learning_rate": 8.337478747395453e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.0001886998063668247, + "loss": 0.0157, "step": 286250 }, { - "epoch": 1.44, - "learning_rate": 8.33672197809405e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018869591815045322, + "loss": 0.0108, "step": 286260 }, { - "epoch": 1.44, - "learning_rate": 8.335965208792649e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018869202993408176, + "loss": 0.014, "step": 286270 }, { - "epoch": 1.44, - "learning_rate": 8.335208439491248e-05, - "loss": 0.0057, + "epoch": 0.74, + "learning_rate": 0.0001886881417177103, + "loss": 0.015, "step": 286280 }, { - "epoch": 1.44, - "learning_rate": 8.334451670189846e-05, - "loss": 0.0098, + "epoch": 0.74, + "learning_rate": 0.00018868425350133884, + "loss": 0.0153, "step": 286290 }, { - "epoch": 1.44, - "learning_rate": 8.333694900888446e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018868036528496736, + "loss": 0.0164, "step": 286300 }, { - "epoch": 1.44, - "learning_rate": 8.332938131587044e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.0001886764770685959, + "loss": 0.0164, "step": 286310 }, { - "epoch": 1.44, - "learning_rate": 8.332181362285644e-05, - "loss": 0.0106, + "epoch": 0.74, + "learning_rate": 0.0001886725888522244, + "loss": 0.019, "step": 286320 }, { - "epoch": 1.44, - "learning_rate": 8.331424592984243e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018866870063585298, + "loss": 0.0138, "step": 286330 }, { - "epoch": 1.44, - "learning_rate": 8.330667823682841e-05, - "loss": 0.005, + "epoch": 0.74, + "learning_rate": 0.0001886648124194815, + "loss": 0.0165, "step": 286340 }, { - "epoch": 1.44, - "learning_rate": 8.329911054381441e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018866092420311004, + "loss": 0.0179, "step": 286350 }, { - "epoch": 1.44, - "learning_rate": 8.32915428508004e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018865703598673855, + "loss": 0.0121, "step": 286360 }, { - "epoch": 1.44, - "learning_rate": 8.328397515778638e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018865314777036712, + "loss": 0.016, "step": 286370 }, { - "epoch": 1.44, - "learning_rate": 8.327640746477238e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018864925955399564, + "loss": 0.0133, "step": 286380 }, { - "epoch": 1.44, - "learning_rate": 8.326883977175836e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018864537133762418, + "loss": 0.0143, "step": 286390 }, { - "epoch": 1.44, - "learning_rate": 8.326127207874436e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.0001886414831212527, + "loss": 0.0151, "step": 286400 }, { - "epoch": 1.44, - "learning_rate": 8.325370438573035e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018863759490488126, + "loss": 0.0155, "step": 286410 }, { - "epoch": 1.45, - "learning_rate": 8.324613669271633e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.0001886337066885098, + "loss": 0.0175, "step": 286420 }, { - "epoch": 1.45, - "learning_rate": 8.323856899970233e-05, - "loss": 0.0073, + "epoch": 0.74, + "learning_rate": 0.00018862981847213832, + "loss": 0.0164, "step": 286430 }, { - "epoch": 1.45, - "learning_rate": 8.323100130668832e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018862593025576683, + "loss": 0.0146, "step": 286440 }, { - "epoch": 1.45, - "learning_rate": 8.32234336136743e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.0001886220420393954, + "loss": 0.0134, "step": 286450 }, { - "epoch": 1.45, - "learning_rate": 8.32158659206603e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018861815382302394, + "loss": 0.0138, "step": 286460 }, { - "epoch": 1.45, - "learning_rate": 8.320829822764628e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018861426560665246, + "loss": 0.0147, "step": 286470 }, { - "epoch": 1.45, - "learning_rate": 8.320073053463227e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.000188610377390281, + "loss": 0.0178, "step": 286480 }, { - "epoch": 1.45, - "learning_rate": 8.319316284161827e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018860648917390954, + "loss": 0.0173, "step": 286490 }, { - "epoch": 1.45, - "learning_rate": 8.318559514860425e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018860260095753808, + "loss": 0.0148, "step": 286500 }, { - "epoch": 1.45, - "learning_rate": 8.317802745559025e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.0001885987127411666, + "loss": 0.0154, "step": 286510 }, { - "epoch": 1.45, - "learning_rate": 8.317045976257624e-05, - "loss": 0.0103, + "epoch": 0.74, + "learning_rate": 0.00018859482452479514, + "loss": 0.015, "step": 286520 }, { - "epoch": 1.45, - "learning_rate": 8.316289206956222e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018859093630842368, + "loss": 0.0143, "step": 286530 }, { - "epoch": 1.45, - "learning_rate": 8.315532437654822e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018858704809205222, + "loss": 0.0168, "step": 286540 }, { - "epoch": 1.45, - "learning_rate": 8.31477566835342e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018858315987568073, + "loss": 0.015, "step": 286550 }, { - "epoch": 1.45, - "learning_rate": 8.31401889905202e-05, - "loss": 0.0103, + "epoch": 0.74, + "learning_rate": 0.00018857927165930928, + "loss": 0.0136, "step": 286560 }, { - "epoch": 1.45, - "learning_rate": 8.313262129750619e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.0001885753834429378, + "loss": 0.0132, "step": 286570 }, { - "epoch": 1.45, - "learning_rate": 8.312505360449217e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018857149522656636, + "loss": 0.0138, "step": 286580 }, { - "epoch": 1.45, - "learning_rate": 8.311748591147817e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018856760701019487, + "loss": 0.0145, "step": 286590 }, { - "epoch": 1.45, - "learning_rate": 8.310991821846416e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018856371879382342, + "loss": 0.0147, "step": 286600 }, { - "epoch": 1.45, - "learning_rate": 8.310235052545014e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.00018855983057745193, + "loss": 0.0131, "step": 286610 }, { - "epoch": 1.45, - "learning_rate": 8.309478283243614e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.0001885559423610805, + "loss": 0.0162, "step": 286620 }, { - "epoch": 1.45, - "learning_rate": 8.308721513942213e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018855205414470904, + "loss": 0.0141, "step": 286630 }, { - "epoch": 1.45, - "learning_rate": 8.307964744640811e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018854816592833756, + "loss": 0.0133, "step": 286640 }, { - "epoch": 1.45, - "learning_rate": 8.307207975339411e-05, - "loss": 0.006, + "epoch": 0.74, + "learning_rate": 0.0001885442777119661, + "loss": 0.0171, "step": 286650 }, { - "epoch": 1.45, - "learning_rate": 8.306451206038009e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.00018854038949559464, + "loss": 0.0151, "step": 286660 }, { - "epoch": 1.45, - "learning_rate": 8.305694436736608e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018853650127922318, + "loss": 0.0132, "step": 286670 }, { - "epoch": 1.45, - "learning_rate": 8.304937667435208e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.0001885326130628517, + "loss": 0.0123, "step": 286680 }, { - "epoch": 1.45, - "learning_rate": 8.304180898133806e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018852872484648024, + "loss": 0.0124, "step": 286690 }, { - "epoch": 1.45, - "learning_rate": 8.303424128832406e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018852483663010878, + "loss": 0.018, "step": 286700 }, { - "epoch": 1.45, - "learning_rate": 8.302667359531005e-05, - "loss": 0.0084, + "epoch": 0.74, + "learning_rate": 0.00018852094841373732, + "loss": 0.0154, "step": 286710 }, { - "epoch": 1.45, - "learning_rate": 8.301910590229603e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018851706019736583, + "loss": 0.0164, "step": 286720 }, { - "epoch": 1.45, - "learning_rate": 8.301153820928203e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018851317198099438, + "loss": 0.013, "step": 286730 }, { - "epoch": 1.45, - "learning_rate": 8.300397051626801e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018850928376462294, + "loss": 0.0136, "step": 286740 }, { - "epoch": 1.45, - "learning_rate": 8.2996402823254e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018850539554825146, + "loss": 0.0149, "step": 286750 }, { - "epoch": 1.45, - "learning_rate": 8.298883513024e-05, - "loss": 0.0093, + "epoch": 0.74, + "learning_rate": 0.00018850150733187997, + "loss": 0.0144, "step": 286760 }, { - "epoch": 1.45, - "learning_rate": 8.298126743722598e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018849761911550852, + "loss": 0.0114, "step": 286770 }, { - "epoch": 1.45, - "learning_rate": 8.297369974421198e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018849373089913708, + "loss": 0.0131, "step": 286780 }, { - "epoch": 1.45, - "learning_rate": 8.296613205119797e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.0001884898426827656, + "loss": 0.0155, "step": 286790 }, { - "epoch": 1.45, - "learning_rate": 8.295856435818395e-05, - "loss": 0.0083, + "epoch": 0.74, + "learning_rate": 0.00018848595446639414, + "loss": 0.0161, "step": 286800 }, { - "epoch": 1.45, - "learning_rate": 8.295099666516995e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018848206625002265, + "loss": 0.0156, "step": 286810 }, { - "epoch": 1.45, - "learning_rate": 8.294342897215593e-05, - "loss": 0.0102, + "epoch": 0.74, + "learning_rate": 0.0001884781780336512, + "loss": 0.0152, "step": 286820 }, { - "epoch": 1.45, - "learning_rate": 8.293586127914192e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018847428981727974, + "loss": 0.0155, "step": 286830 }, { - "epoch": 1.45, - "learning_rate": 8.292829358612792e-05, - "loss": 0.0077, + "epoch": 0.74, + "learning_rate": 0.00018847040160090828, + "loss": 0.0125, "step": 286840 }, { - "epoch": 1.45, - "learning_rate": 8.29207258931139e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.0001884665133845368, + "loss": 0.021, "step": 286850 }, { - "epoch": 1.45, - "learning_rate": 8.29131582000999e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018846262516816534, + "loss": 0.0215, "step": 286860 }, { - "epoch": 1.45, - "learning_rate": 8.290559050708589e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018845873695179388, + "loss": 0.0153, "step": 286870 }, { - "epoch": 1.45, - "learning_rate": 8.289802281407187e-05, - "loss": 0.0063, + "epoch": 0.74, + "learning_rate": 0.00018845484873542242, + "loss": 0.0209, "step": 286880 }, { - "epoch": 1.45, - "learning_rate": 8.289045512105785e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018845096051905093, + "loss": 0.0141, "step": 286890 }, { - "epoch": 1.45, - "learning_rate": 8.288288742804383e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.00018844707230267948, + "loss": 0.0115, "step": 286900 }, { - "epoch": 1.45, - "learning_rate": 8.287531973502983e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018844318408630802, + "loss": 0.0106, "step": 286910 }, { - "epoch": 1.45, - "learning_rate": 8.286775204201581e-05, - "loss": 0.0069, + "epoch": 0.74, + "learning_rate": 0.00018843929586993656, + "loss": 0.014, "step": 286920 }, { - "epoch": 1.45, - "learning_rate": 8.28601843490018e-05, - "loss": 0.0092, + "epoch": 0.74, + "learning_rate": 0.00018843540765356507, + "loss": 0.0173, "step": 286930 }, { - "epoch": 1.45, - "learning_rate": 8.28526166559878e-05, - "loss": 0.0095, + "epoch": 0.74, + "learning_rate": 0.00018843151943719361, + "loss": 0.0147, "step": 286940 }, { - "epoch": 1.45, - "learning_rate": 8.284504896297378e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018842763122082218, + "loss": 0.0183, "step": 286950 }, { - "epoch": 1.45, - "learning_rate": 8.283748126995978e-05, - "loss": 0.0052, + "epoch": 0.74, + "learning_rate": 0.0001884237430044507, + "loss": 0.0168, "step": 286960 }, { - "epoch": 1.45, - "learning_rate": 8.282991357694577e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.00018841985478807924, + "loss": 0.0136, "step": 286970 }, { - "epoch": 1.45, - "learning_rate": 8.282234588393175e-05, - "loss": 0.0081, + "epoch": 0.74, + "learning_rate": 0.00018841596657170775, + "loss": 0.0145, "step": 286980 }, { - "epoch": 1.45, - "learning_rate": 8.281477819091775e-05, - "loss": 0.0067, + "epoch": 0.74, + "learning_rate": 0.00018841207835533632, + "loss": 0.0176, "step": 286990 }, { - "epoch": 1.45, - "learning_rate": 8.280721049790373e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018840819013896484, + "loss": 0.0137, "step": 287000 }, { - "epoch": 1.45, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.0057329838164150715, - "eval_runtime": 115.5304, - "eval_samples_per_second": 17.311, - "eval_steps_per_second": 4.328, + "epoch": 0.74, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.010108675807714462, + "eval_runtime": 107.8967, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, "step": 287000 }, { - "epoch": 1.45, - "learning_rate": 8.279964280488972e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.00018840430192259338, + "loss": 0.0134, "step": 287010 }, { - "epoch": 1.45, - "learning_rate": 8.279207511187572e-05, - "loss": 0.007, + "epoch": 0.74, + "learning_rate": 0.0001884004137062219, + "loss": 0.0159, "step": 287020 }, { - "epoch": 1.45, - "learning_rate": 8.27845074188617e-05, - "loss": 0.0062, + "epoch": 0.74, + "learning_rate": 0.00018839652548985046, + "loss": 0.016, "step": 287030 }, { - "epoch": 1.45, - "learning_rate": 8.27769397258477e-05, - "loss": 0.0058, + "epoch": 0.74, + "learning_rate": 0.00018839263727347898, + "loss": 0.0153, "step": 287040 }, { - "epoch": 1.45, - "learning_rate": 8.276937203283369e-05, - "loss": 0.0082, + "epoch": 0.74, + "learning_rate": 0.00018838874905710752, + "loss": 0.0172, "step": 287050 }, { - "epoch": 1.45, - "learning_rate": 8.276180433981967e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018838486084073603, + "loss": 0.0168, "step": 287060 }, { - "epoch": 1.45, - "learning_rate": 8.275423664680567e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018838097262436457, + "loss": 0.0155, "step": 287070 }, { - "epoch": 1.45, - "learning_rate": 8.274666895379166e-05, - "loss": 0.0094, + "epoch": 0.74, + "learning_rate": 0.00018837708440799312, + "loss": 0.0167, "step": 287080 }, { - "epoch": 1.45, - "learning_rate": 8.273910126077764e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018837319619162166, + "loss": 0.0141, "step": 287090 }, { - "epoch": 1.45, - "learning_rate": 8.273153356776364e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018836930797525017, + "loss": 0.0173, "step": 287100 }, { - "epoch": 1.45, - "learning_rate": 8.272396587474962e-05, - "loss": 0.0054, + "epoch": 0.74, + "learning_rate": 0.00018836541975887871, + "loss": 0.0125, "step": 287110 }, { - "epoch": 1.45, - "learning_rate": 8.271639818173562e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018836153154250728, + "loss": 0.0162, "step": 287120 }, { - "epoch": 1.45, - "learning_rate": 8.270883048872161e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.0001883576433261358, + "loss": 0.0167, "step": 287130 }, { - "epoch": 1.45, - "learning_rate": 8.270126279570759e-05, - "loss": 0.0097, + "epoch": 0.74, + "learning_rate": 0.00018835375510976434, + "loss": 0.0153, "step": 287140 }, { - "epoch": 1.45, - "learning_rate": 8.269369510269359e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018834986689339285, + "loss": 0.0182, "step": 287150 }, { - "epoch": 1.45, - "learning_rate": 8.268612740967958e-05, - "loss": 0.0076, + "epoch": 0.74, + "learning_rate": 0.00018834597867702142, + "loss": 0.0127, "step": 287160 }, { - "epoch": 1.45, - "learning_rate": 8.267855971666556e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018834209046064994, + "loss": 0.0139, "step": 287170 }, { - "epoch": 1.45, - "learning_rate": 8.267099202365156e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018833820224427848, + "loss": 0.0168, "step": 287180 }, { - "epoch": 1.45, - "learning_rate": 8.266342433063754e-05, - "loss": 0.0058, + "epoch": 0.74, + "learning_rate": 0.000188334314027907, + "loss": 0.0133, "step": 287190 }, { - "epoch": 1.45, - "learning_rate": 8.265585663762354e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018833042581153556, + "loss": 0.0171, "step": 287200 }, { - "epoch": 1.45, - "learning_rate": 8.264828894460953e-05, - "loss": 0.0075, + "epoch": 0.74, + "learning_rate": 0.00018832653759516408, + "loss": 0.0137, "step": 287210 }, { - "epoch": 1.45, - "learning_rate": 8.264072125159551e-05, - "loss": 0.0097, + "epoch": 0.74, + "learning_rate": 0.00018832264937879262, + "loss": 0.0137, "step": 287220 }, { - "epoch": 1.45, - "learning_rate": 8.26331535585815e-05, - "loss": 0.0065, + "epoch": 0.74, + "learning_rate": 0.00018831876116242113, + "loss": 0.0144, "step": 287230 }, { - "epoch": 1.45, - "learning_rate": 8.26255858655675e-05, - "loss": 0.0105, + "epoch": 0.74, + "learning_rate": 0.0001883148729460497, + "loss": 0.0158, "step": 287240 }, { - "epoch": 1.45, - "learning_rate": 8.261801817255348e-05, - "loss": 0.0059, + "epoch": 0.74, + "learning_rate": 0.00018831098472967822, + "loss": 0.0134, "step": 287250 }, { - "epoch": 1.45, - "learning_rate": 8.261045047953948e-05, - "loss": 0.0071, + "epoch": 0.74, + "learning_rate": 0.00018830709651330676, + "loss": 0.0112, "step": 287260 }, { - "epoch": 1.45, - "learning_rate": 8.260288278652546e-05, - "loss": 0.0064, + "epoch": 0.74, + "learning_rate": 0.00018830320829693527, + "loss": 0.0119, "step": 287270 }, { - "epoch": 1.45, - "learning_rate": 8.259531509351145e-05, - "loss": 0.0086, + "epoch": 0.74, + "learning_rate": 0.00018829932008056384, + "loss": 0.0154, "step": 287280 }, { - "epoch": 1.45, - "learning_rate": 8.258774740049745e-05, - "loss": 0.0094, - "step": 287290 + "epoch": 0.74, + "learning_rate": 0.00018829543186419238, + "loss": 0.0144, + "step": 287290 }, { - "epoch": 1.45, - "learning_rate": 8.258017970748343e-05, - "loss": 0.0055, + "epoch": 0.74, + "learning_rate": 0.0001882915436478209, + "loss": 0.0123, "step": 287300 }, { - "epoch": 1.45, - "learning_rate": 8.257261201446943e-05, - "loss": 0.0072, + "epoch": 0.74, + "learning_rate": 0.0001882876554314494, + "loss": 0.012, "step": 287310 }, { - "epoch": 1.45, - "learning_rate": 8.256504432145542e-05, - "loss": 0.008, + "epoch": 0.74, + "learning_rate": 0.00018828376721507795, + "loss": 0.0187, "step": 287320 }, { - "epoch": 1.45, - "learning_rate": 8.25574766284414e-05, - "loss": 0.0085, + "epoch": 0.74, + "learning_rate": 0.00018827987899870652, + "loss": 0.014, "step": 287330 }, { - "epoch": 1.45, - "learning_rate": 8.25499089354274e-05, - "loss": 0.009, + "epoch": 0.74, + "learning_rate": 0.00018827599078233504, + "loss": 0.0122, "step": 287340 }, { - "epoch": 1.45, - "learning_rate": 8.254234124241338e-05, - "loss": 0.0091, + "epoch": 0.74, + "learning_rate": 0.00018827210256596358, + "loss": 0.0167, "step": 287350 }, { - "epoch": 1.45, - "learning_rate": 8.253477354939937e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.0001882682143495921, + "loss": 0.0132, "step": 287360 }, { - "epoch": 1.45, - "learning_rate": 8.252720585638537e-05, - "loss": 0.0078, + "epoch": 0.74, + "learning_rate": 0.00018826432613322066, + "loss": 0.0165, "step": 287370 }, { - "epoch": 1.45, - "learning_rate": 8.251963816337135e-05, - "loss": 0.0068, + "epoch": 0.74, + "learning_rate": 0.00018826043791684918, + "loss": 0.0167, "step": 287380 }, { - "epoch": 1.45, - "learning_rate": 8.251207047035735e-05, - "loss": 0.0066, + "epoch": 0.74, + "learning_rate": 0.00018825654970047772, + "loss": 0.0185, "step": 287390 }, { - "epoch": 1.45, - "learning_rate": 8.250450277734334e-05, - "loss": 0.0074, + "epoch": 0.74, + "learning_rate": 0.00018825266148410623, + "loss": 0.0132, "step": 287400 }, { - "epoch": 1.45, - "learning_rate": 8.249693508432932e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.0001882487732677348, + "loss": 0.0175, "step": 287410 }, { - "epoch": 1.45, - "learning_rate": 8.248936739131532e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018824488505136332, + "loss": 0.0118, "step": 287420 }, { - "epoch": 1.45, - "learning_rate": 8.24817996983013e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.00018824099683499186, + "loss": 0.0132, "step": 287430 }, { - "epoch": 1.45, - "learning_rate": 8.247423200528729e-05, - "loss": 0.0096, + "epoch": 0.75, + "learning_rate": 0.00018823710861862037, + "loss": 0.0154, "step": 287440 }, { - "epoch": 1.45, - "learning_rate": 8.246666431227329e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018823322040224894, + "loss": 0.0112, "step": 287450 }, { - "epoch": 1.45, - "learning_rate": 8.245909661925927e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.00018822933218587748, + "loss": 0.0122, "step": 287460 }, { - "epoch": 1.45, - "learning_rate": 8.245152892624526e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.000188225443969506, + "loss": 0.0128, "step": 287470 }, { - "epoch": 1.45, - "learning_rate": 8.244396123323126e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.0001882215557531345, + "loss": 0.016, "step": 287480 }, { - "epoch": 1.45, - "learning_rate": 8.243639354021724e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018821766753676308, + "loss": 0.0125, "step": 287490 }, { - "epoch": 1.45, - "learning_rate": 8.242882584720324e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018821377932039162, + "loss": 0.0145, "step": 287500 }, { - "epoch": 1.45, - "learning_rate": 8.242125815418922e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018820989110402014, + "loss": 0.0167, "step": 287510 }, { - "epoch": 1.45, - "learning_rate": 8.24136904611752e-05, - "loss": 0.0046, + "epoch": 0.75, + "learning_rate": 0.00018820600288764868, + "loss": 0.0138, "step": 287520 }, { - "epoch": 1.45, - "learning_rate": 8.240612276816118e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018820211467127722, + "loss": 0.0136, "step": 287530 }, { - "epoch": 1.45, - "learning_rate": 8.239855507514718e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018819822645490576, + "loss": 0.0113, "step": 287540 }, { - "epoch": 1.45, - "learning_rate": 8.239098738213317e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018819433823853428, + "loss": 0.0129, "step": 287550 }, { - "epoch": 1.45, - "learning_rate": 8.238341968911915e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018819045002216282, + "loss": 0.0147, "step": 287560 }, { - "epoch": 1.45, - "learning_rate": 8.237585199610515e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018818656180579133, + "loss": 0.0172, "step": 287570 }, { - "epoch": 1.45, - "learning_rate": 8.236828430309114e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.0001881826735894199, + "loss": 0.0191, "step": 287580 }, { - "epoch": 1.45, - "learning_rate": 8.236071661007712e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018817878537304841, + "loss": 0.0156, "step": 287590 }, { - "epoch": 1.45, - "learning_rate": 8.235314891706312e-05, - "loss": 0.0054, + "epoch": 0.75, + "learning_rate": 0.00018817489715667696, + "loss": 0.0153, "step": 287600 }, { - "epoch": 1.45, - "learning_rate": 8.234558122404911e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018817100894030547, + "loss": 0.0165, "step": 287610 }, { - "epoch": 1.45, - "learning_rate": 8.23380135310351e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018816712072393404, + "loss": 0.0144, "step": 287620 }, { - "epoch": 1.45, - "learning_rate": 8.233044583802109e-05, - "loss": 0.0093, + "epoch": 0.75, + "learning_rate": 0.00018816323250756255, + "loss": 0.0122, "step": 287630 }, { - "epoch": 1.45, - "learning_rate": 8.232287814500707e-05, - "loss": 0.0099, + "epoch": 0.75, + "learning_rate": 0.0001881593442911911, + "loss": 0.0149, "step": 287640 }, { - "epoch": 1.45, - "learning_rate": 8.231531045199307e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.0001881554560748196, + "loss": 0.0167, "step": 287650 }, { - "epoch": 1.45, - "learning_rate": 8.230774275897906e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018815156785844818, + "loss": 0.0172, "step": 287660 }, { - "epoch": 1.45, - "learning_rate": 8.230017506596504e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018814767964207672, + "loss": 0.0111, "step": 287670 }, { - "epoch": 1.45, - "learning_rate": 8.229260737295104e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018814379142570524, + "loss": 0.0126, "step": 287680 }, { - "epoch": 1.45, - "learning_rate": 8.228503967993703e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018813990320933378, + "loss": 0.0124, "step": 287690 }, { - "epoch": 1.45, - "learning_rate": 8.227747198692301e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018813601499296232, + "loss": 0.0175, "step": 287700 }, { - "epoch": 1.45, - "learning_rate": 8.226990429390901e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018813212677659086, + "loss": 0.0165, "step": 287710 }, { - "epoch": 1.45, - "learning_rate": 8.226233660089499e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018812823856021937, + "loss": 0.0171, "step": 287720 }, { - "epoch": 1.45, - "learning_rate": 8.225476890788099e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018812435034384792, + "loss": 0.0184, "step": 287730 }, { - "epoch": 1.45, - "learning_rate": 8.224720121486698e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018812046212747646, + "loss": 0.0147, "step": 287740 }, { - "epoch": 1.45, - "learning_rate": 8.223963352185296e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.000188116573911105, + "loss": 0.0153, "step": 287750 }, { - "epoch": 1.45, - "learning_rate": 8.223206582883896e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018811268569473351, + "loss": 0.0147, "step": 287760 }, { - "epoch": 1.45, - "learning_rate": 8.222449813582495e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018810879747836206, + "loss": 0.0133, "step": 287770 }, { - "epoch": 1.45, - "learning_rate": 8.221693044281093e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.0001881049092619906, + "loss": 0.0158, "step": 287780 }, { - "epoch": 1.45, - "learning_rate": 8.220936274979693e-05, - "loss": 0.0054, + "epoch": 0.75, + "learning_rate": 0.00018810102104561914, + "loss": 0.0156, "step": 287790 }, { - "epoch": 1.45, - "learning_rate": 8.220179505678291e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018809713282924765, + "loss": 0.0139, "step": 287800 }, { - "epoch": 1.45, - "learning_rate": 8.21942273637689e-05, - "loss": 0.0057, + "epoch": 0.75, + "learning_rate": 0.0001880932446128762, + "loss": 0.0117, "step": 287810 }, { - "epoch": 1.45, - "learning_rate": 8.21866596707549e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.0001880893563965047, + "loss": 0.0139, "step": 287820 }, { - "epoch": 1.45, - "learning_rate": 8.217909197774088e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018808546818013328, + "loss": 0.0116, "step": 287830 }, { - "epoch": 1.45, - "learning_rate": 8.217152428472688e-05, - "loss": 0.0104, + "epoch": 0.75, + "learning_rate": 0.00018808157996376182, + "loss": 0.017, "step": 287840 }, { - "epoch": 1.45, - "learning_rate": 8.216395659171287e-05, - "loss": 0.005, + "epoch": 0.75, + "learning_rate": 0.00018807769174739033, + "loss": 0.0169, "step": 287850 }, { - "epoch": 1.45, - "learning_rate": 8.215638889869885e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.00018807380353101888, + "loss": 0.0175, "step": 287860 }, { - "epoch": 1.45, - "learning_rate": 8.214882120568485e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.00018806991531464742, + "loss": 0.0166, "step": 287870 }, { - "epoch": 1.45, - "learning_rate": 8.214125351267083e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018806602709827596, + "loss": 0.0152, "step": 287880 }, { - "epoch": 1.45, - "learning_rate": 8.213368581965682e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018806213888190447, + "loss": 0.0121, "step": 287890 }, { - "epoch": 1.45, - "learning_rate": 8.212611812664282e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018805825066553302, + "loss": 0.0138, "step": 287900 }, { - "epoch": 1.45, - "learning_rate": 8.21185504336288e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018805436244916156, + "loss": 0.0149, "step": 287910 }, { - "epoch": 1.45, - "learning_rate": 8.21109827406148e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.0001880504742327901, + "loss": 0.0164, "step": 287920 }, { - "epoch": 1.45, - "learning_rate": 8.210341504760079e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018804658601641861, + "loss": 0.0154, "step": 287930 }, { - "epoch": 1.45, - "learning_rate": 8.209584735458677e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018804269780004716, + "loss": 0.0141, "step": 287940 }, { - "epoch": 1.45, - "learning_rate": 8.208827966157277e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.0001880388095836757, + "loss": 0.0136, "step": 287950 }, { - "epoch": 1.45, - "learning_rate": 8.208071196855875e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018803492136730424, + "loss": 0.0178, "step": 287960 }, { - "epoch": 1.45, - "learning_rate": 8.207314427554474e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018803103315093275, + "loss": 0.0142, "step": 287970 }, { - "epoch": 1.45, - "learning_rate": 8.206557658253074e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.0001880271449345613, + "loss": 0.0124, "step": 287980 }, { - "epoch": 1.45, - "learning_rate": 8.205800888951672e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018802325671818986, + "loss": 0.0129, "step": 287990 }, { - "epoch": 1.45, - "learning_rate": 8.205044119650271e-05, - "loss": 0.0098, + "epoch": 0.75, + "learning_rate": 0.00018801936850181838, + "loss": 0.016, "step": 288000 }, { - "epoch": 1.45, - "eval_cer": 0.9144294992658953, - "eval_loss": 0.005808565299957991, - "eval_runtime": 115.5954, - "eval_samples_per_second": 17.302, - "eval_steps_per_second": 4.325, + "epoch": 0.75, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.009974485263228416, + "eval_runtime": 107.8815, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, "step": 288000 }, { - "epoch": 1.45, - "learning_rate": 8.204287350348871e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018801548028544692, + "loss": 0.0131, "step": 288010 }, { - "epoch": 1.45, - "learning_rate": 8.203530581047469e-05, - "loss": 0.005, + "epoch": 0.75, + "learning_rate": 0.00018801159206907543, + "loss": 0.0137, "step": 288020 }, { - "epoch": 1.45, - "learning_rate": 8.202773811746069e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.000188007703852704, + "loss": 0.0153, "step": 288030 }, { - "epoch": 1.45, - "learning_rate": 8.202017042444667e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018800381563633252, + "loss": 0.0122, "step": 288040 }, { - "epoch": 1.45, - "learning_rate": 8.201260273143266e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018799992741996106, + "loss": 0.0142, "step": 288050 }, { - "epoch": 1.45, - "learning_rate": 8.200503503841866e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018799603920358957, + "loss": 0.0153, "step": 288060 }, { - "epoch": 1.45, - "learning_rate": 8.199746734540464e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018799215098721812, + "loss": 0.0135, "step": 288070 }, { - "epoch": 1.45, - "learning_rate": 8.198989965239063e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018798826277084666, + "loss": 0.0201, "step": 288080 }, { - "epoch": 1.45, - "learning_rate": 8.198233195937663e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.0001879843745544752, + "loss": 0.0167, "step": 288090 }, { - "epoch": 1.45, - "learning_rate": 8.197476426636261e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001879804863381037, + "loss": 0.0146, "step": 288100 }, { - "epoch": 1.45, - "learning_rate": 8.19671965733486e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018797659812173225, + "loss": 0.0161, "step": 288110 }, { - "epoch": 1.45, - "learning_rate": 8.19596288803346e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001879727099053608, + "loss": 0.0146, "step": 288120 }, { - "epoch": 1.45, - "learning_rate": 8.195206118732058e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018796882168898934, + "loss": 0.0125, "step": 288130 }, { - "epoch": 1.45, - "learning_rate": 8.194449349430658e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018796493347261785, + "loss": 0.0191, "step": 288140 }, { - "epoch": 1.45, - "learning_rate": 8.193692580129254e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.0001879610452562464, + "loss": 0.0133, "step": 288150 }, { - "epoch": 1.45, - "learning_rate": 8.192935810827854e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018795715703987496, + "loss": 0.0134, "step": 288160 }, { - "epoch": 1.45, - "learning_rate": 8.192179041526452e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018795326882350348, + "loss": 0.0217, "step": 288170 }, { - "epoch": 1.45, - "learning_rate": 8.191422272225052e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.000187949380607132, + "loss": 0.0117, "step": 288180 }, { - "epoch": 1.45, - "learning_rate": 8.190665502923651e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018794549239076053, + "loss": 0.0186, "step": 288190 }, { - "epoch": 1.45, - "learning_rate": 8.189908733622249e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001879416041743891, + "loss": 0.0206, "step": 288200 }, { - "epoch": 1.45, - "learning_rate": 8.189151964320849e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018793771595801762, + "loss": 0.0158, "step": 288210 }, { - "epoch": 1.45, - "learning_rate": 8.188395195019448e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018793382774164616, + "loss": 0.0103, "step": 288220 }, { - "epoch": 1.45, - "learning_rate": 8.187638425718046e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018792993952527467, + "loss": 0.0146, "step": 288230 }, { - "epoch": 1.45, - "learning_rate": 8.186881656416646e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018792605130890324, + "loss": 0.0206, "step": 288240 }, { - "epoch": 1.45, - "learning_rate": 8.186124887115244e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018792216309253176, + "loss": 0.0166, "step": 288250 }, { - "epoch": 1.45, - "learning_rate": 8.185368117813844e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001879182748761603, + "loss": 0.0151, "step": 288260 }, { - "epoch": 1.45, - "learning_rate": 8.184611348512443e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.0001879143866597888, + "loss": 0.015, "step": 288270 }, { - "epoch": 1.45, - "learning_rate": 8.183854579211041e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018791049844341738, + "loss": 0.014, "step": 288280 }, { - "epoch": 1.45, - "learning_rate": 8.18309780990964e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.0001879066102270459, + "loss": 0.0134, "step": 288290 }, { - "epoch": 1.45, - "learning_rate": 8.18234104060824e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018790272201067444, + "loss": 0.0216, "step": 288300 }, { - "epoch": 1.45, - "learning_rate": 8.181584271306838e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018789883379430295, + "loss": 0.017, "step": 288310 }, { - "epoch": 1.45, - "learning_rate": 8.180827502005438e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.0001878949455779315, + "loss": 0.0147, "step": 288320 }, { - "epoch": 1.45, - "learning_rate": 8.180070732704036e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018789105736156006, + "loss": 0.0137, "step": 288330 }, { - "epoch": 1.45, - "learning_rate": 8.179313963402635e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018788716914518858, + "loss": 0.0143, "step": 288340 }, { - "epoch": 1.45, - "learning_rate": 8.178557194101235e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001878832809288171, + "loss": 0.0132, "step": 288350 }, { - "epoch": 1.45, - "learning_rate": 8.177800424799833e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018787939271244563, + "loss": 0.0141, "step": 288360 }, { - "epoch": 1.45, - "learning_rate": 8.177043655498433e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.0001878755044960742, + "loss": 0.0143, "step": 288370 }, { - "epoch": 1.45, - "learning_rate": 8.176286886197032e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018787161627970272, + "loss": 0.02, "step": 288380 }, { - "epoch": 1.45, - "learning_rate": 8.17553011689563e-05, - "loss": 0.0101, + "epoch": 0.75, + "learning_rate": 0.00018786772806333126, + "loss": 0.0139, "step": 288390 }, { - "epoch": 1.46, - "learning_rate": 8.17477334759423e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018786383984695977, + "loss": 0.0134, "step": 288400 }, { - "epoch": 1.46, - "learning_rate": 8.174016578292828e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018785995163058834, + "loss": 0.014, "step": 288410 }, { - "epoch": 1.46, - "learning_rate": 8.173259808991427e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018785606341421686, + "loss": 0.0153, "step": 288420 }, { - "epoch": 1.46, - "learning_rate": 8.172503039690027e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.0001878521751978454, + "loss": 0.0106, "step": 288430 }, { - "epoch": 1.46, - "learning_rate": 8.171746270388625e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001878482869814739, + "loss": 0.0141, "step": 288440 }, { - "epoch": 1.46, - "learning_rate": 8.170989501087225e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.00018784439876510248, + "loss": 0.0134, "step": 288450 }, { - "epoch": 1.46, - "learning_rate": 8.170232731785824e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.000187840510548731, + "loss": 0.0137, "step": 288460 }, { - "epoch": 1.46, - "learning_rate": 8.169475962484422e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018783662233235954, + "loss": 0.0141, "step": 288470 }, { - "epoch": 1.46, - "learning_rate": 8.168719193183022e-05, - "loss": 0.0098, + "epoch": 0.75, + "learning_rate": 0.00018783273411598805, + "loss": 0.0162, "step": 288480 }, { - "epoch": 1.46, - "learning_rate": 8.16796242388162e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018782884589961662, + "loss": 0.0115, "step": 288490 }, { - "epoch": 1.46, - "learning_rate": 8.167205654580219e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018782495768324513, + "loss": 0.0142, "step": 288500 }, { - "epoch": 1.46, - "learning_rate": 8.166448885278819e-05, - "loss": 0.0107, + "epoch": 0.75, + "learning_rate": 0.00018782106946687368, + "loss": 0.0128, "step": 288510 }, { - "epoch": 1.46, - "learning_rate": 8.165692115977417e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.0001878171812505022, + "loss": 0.0123, "step": 288520 }, { - "epoch": 1.46, - "learning_rate": 8.164935346676016e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018781329303413076, + "loss": 0.0137, "step": 288530 }, { - "epoch": 1.46, - "learning_rate": 8.164178577374616e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.0001878094048177593, + "loss": 0.0123, "step": 288540 }, { - "epoch": 1.46, - "learning_rate": 8.163421808073214e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018780551660138782, + "loss": 0.0142, "step": 288550 }, { - "epoch": 1.46, - "learning_rate": 8.162665038771814e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.00018780162838501636, + "loss": 0.014, "step": 288560 }, { - "epoch": 1.46, - "learning_rate": 8.161908269470413e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018779774016864487, + "loss": 0.0131, "step": 288570 }, { - "epoch": 1.46, - "learning_rate": 8.161151500169011e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018779385195227344, + "loss": 0.02, "step": 288580 }, { - "epoch": 1.46, - "learning_rate": 8.160394730867611e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018778996373590196, + "loss": 0.0145, "step": 288590 }, { - "epoch": 1.46, - "learning_rate": 8.159637961566209e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001877860755195305, + "loss": 0.0157, "step": 288600 }, { - "epoch": 1.46, - "learning_rate": 8.158881192264808e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.000187782187303159, + "loss": 0.013, "step": 288610 }, { - "epoch": 1.46, - "learning_rate": 8.158124422963408e-05, - "loss": 0.0055, + "epoch": 0.75, + "learning_rate": 0.00018777829908678758, + "loss": 0.0134, "step": 288620 }, { - "epoch": 1.46, - "learning_rate": 8.157367653662006e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001877744108704161, + "loss": 0.0124, "step": 288630 }, { - "epoch": 1.46, - "learning_rate": 8.156610884360606e-05, - "loss": 0.0053, + "epoch": 0.75, + "learning_rate": 0.00018777052265404464, + "loss": 0.0179, "step": 288640 }, { - "epoch": 1.46, - "learning_rate": 8.155854115059205e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018776663443767315, + "loss": 0.0156, "step": 288650 }, { - "epoch": 1.46, - "learning_rate": 8.155097345757803e-05, - "loss": 0.0053, + "epoch": 0.75, + "learning_rate": 0.00018776274622130172, + "loss": 0.0202, "step": 288660 }, { - "epoch": 1.46, - "learning_rate": 8.154340576456403e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018775885800493023, + "loss": 0.0133, "step": 288670 }, { - "epoch": 1.46, - "learning_rate": 8.153583807155001e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.00018775496978855878, + "loss": 0.014, "step": 288680 }, { - "epoch": 1.46, - "learning_rate": 8.1528270378536e-05, - "loss": 0.0109, + "epoch": 0.75, + "learning_rate": 0.0001877510815721873, + "loss": 0.0146, "step": 288690 }, { - "epoch": 1.46, - "learning_rate": 8.1520702685522e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.00018774719335581586, + "loss": 0.0121, "step": 288700 }, { - "epoch": 1.46, - "learning_rate": 8.151313499250798e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.0001877433051394444, + "loss": 0.0098, "step": 288710 }, { - "epoch": 1.46, - "learning_rate": 8.150556729949397e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.00018773941692307292, + "loss": 0.0146, "step": 288720 }, { - "epoch": 1.46, - "learning_rate": 8.149799960647997e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018773552870670146, + "loss": 0.0142, "step": 288730 }, { - "epoch": 1.46, - "learning_rate": 8.149043191346595e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018773164049033, + "loss": 0.0111, "step": 288740 }, { - "epoch": 1.46, - "learning_rate": 8.148286422045195e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018772775227395854, + "loss": 0.0174, "step": 288750 }, { - "epoch": 1.46, - "learning_rate": 8.147529652743793e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.00018772386405758705, + "loss": 0.0151, "step": 288760 }, { - "epoch": 1.46, - "learning_rate": 8.146772883442391e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.0001877199758412156, + "loss": 0.0149, "step": 288770 }, { - "epoch": 1.46, - "learning_rate": 8.146016114140989e-05, - "loss": 0.0103, + "epoch": 0.75, + "learning_rate": 0.00018771608762484414, + "loss": 0.0173, "step": 288780 }, { - "epoch": 1.46, - "learning_rate": 8.145259344839589e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018771219940847268, + "loss": 0.0156, "step": 288790 }, { - "epoch": 1.46, - "learning_rate": 8.144502575538188e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.0001877083111921012, + "loss": 0.0151, "step": 288800 }, { - "epoch": 1.46, - "learning_rate": 8.143745806236786e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018770442297572974, + "loss": 0.014, "step": 288810 }, { - "epoch": 1.46, - "learning_rate": 8.142989036935386e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018770053475935825, + "loss": 0.0151, "step": 288820 }, { - "epoch": 1.46, - "learning_rate": 8.142232267633985e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018769664654298682, + "loss": 0.0149, "step": 288830 }, { - "epoch": 1.46, - "learning_rate": 8.141475498332583e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018769275832661533, + "loss": 0.0145, "step": 288840 }, { - "epoch": 1.46, - "learning_rate": 8.140718729031183e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018768887011024388, + "loss": 0.0111, "step": 288850 }, { - "epoch": 1.46, - "learning_rate": 8.139961959729781e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.0001876849818938724, + "loss": 0.0137, "step": 288860 }, { - "epoch": 1.46, - "learning_rate": 8.13920519042838e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018768109367750096, + "loss": 0.014, "step": 288870 }, { - "epoch": 1.46, - "learning_rate": 8.13844842112698e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.0001876772054611295, + "loss": 0.0143, "step": 288880 }, { - "epoch": 1.46, - "learning_rate": 8.137691651825578e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018767331724475801, + "loss": 0.0127, "step": 288890 }, { - "epoch": 1.46, - "learning_rate": 8.136934882524178e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018766942902838653, + "loss": 0.0125, "step": 288900 }, { - "epoch": 1.46, - "learning_rate": 8.136178113222777e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.0001876655408120151, + "loss": 0.0123, "step": 288910 }, { - "epoch": 1.46, - "learning_rate": 8.135421343921375e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018766165259564364, + "loss": 0.0168, "step": 288920 }, { - "epoch": 1.46, - "learning_rate": 8.134664574619975e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018765776437927215, + "loss": 0.0143, "step": 288930 }, { - "epoch": 1.46, - "learning_rate": 8.133907805318573e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.0001876538761629007, + "loss": 0.0124, "step": 288940 }, { - "epoch": 1.46, - "learning_rate": 8.133151036017172e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018764998794652924, + "loss": 0.0154, "step": 288950 }, { - "epoch": 1.46, - "learning_rate": 8.132394266715772e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018764609973015778, + "loss": 0.0125, "step": 288960 }, { - "epoch": 1.46, - "learning_rate": 8.13163749741437e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001876422115137863, + "loss": 0.017, "step": 288970 }, { - "epoch": 1.46, - "learning_rate": 8.13088072811297e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018763832329741484, + "loss": 0.0144, "step": 288980 }, { - "epoch": 1.46, - "learning_rate": 8.130123958811569e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018763443508104338, + "loss": 0.0152, "step": 288990 }, { - "epoch": 1.46, - "learning_rate": 8.129367189510167e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018763054686467192, + "loss": 0.0144, "step": 289000 }, { - "epoch": 1.46, - "eval_cer": 0.9144401736232748, - "eval_loss": 0.005669711157679558, - "eval_runtime": 115.6193, - "eval_samples_per_second": 17.298, - "eval_steps_per_second": 4.325, + "epoch": 0.75, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.0096070421859622, + "eval_runtime": 107.8246, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, "step": 289000 }, { - "epoch": 1.46, - "learning_rate": 8.128610420208767e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018762665864830043, + "loss": 0.0106, "step": 289010 }, { - "epoch": 1.46, - "learning_rate": 8.127853650907366e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018762277043192897, + "loss": 0.0159, "step": 289020 }, { - "epoch": 1.46, - "learning_rate": 8.127096881605964e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018761888221555754, + "loss": 0.0164, "step": 289030 }, { - "epoch": 1.46, - "learning_rate": 8.126340112304564e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018761499399918606, + "loss": 0.0135, "step": 289040 }, { - "epoch": 1.46, - "learning_rate": 8.125583343003162e-05, - "loss": 0.0096, + "epoch": 0.75, + "learning_rate": 0.00018761110578281457, + "loss": 0.0144, "step": 289050 }, { - "epoch": 1.46, - "learning_rate": 8.124826573701761e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018760721756644311, + "loss": 0.0161, "step": 289060 }, { - "epoch": 1.46, - "learning_rate": 8.124069804400361e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.00018760332935007163, + "loss": 0.0134, "step": 289070 }, { - "epoch": 1.46, - "learning_rate": 8.123313035098959e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.0001875994411337002, + "loss": 0.0167, "step": 289080 }, { - "epoch": 1.46, - "learning_rate": 8.122556265797559e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018759555291732874, + "loss": 0.0154, "step": 289090 }, { - "epoch": 1.46, - "learning_rate": 8.121799496496158e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018759166470095725, + "loss": 0.0145, "step": 289100 }, { - "epoch": 1.46, - "learning_rate": 8.121042727194756e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.0001875877764845858, + "loss": 0.0154, "step": 289110 }, { - "epoch": 1.46, - "learning_rate": 8.120285957893356e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018758388826821434, + "loss": 0.0192, "step": 289120 }, { - "epoch": 1.46, - "learning_rate": 8.119529188591954e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018758000005184288, + "loss": 0.0141, "step": 289130 }, { - "epoch": 1.46, - "learning_rate": 8.118772419290553e-05, - "loss": 0.0051, + "epoch": 0.75, + "learning_rate": 0.0001875761118354714, + "loss": 0.0129, "step": 289140 }, { - "epoch": 1.46, - "learning_rate": 8.118015649989153e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018757222361909993, + "loss": 0.0112, "step": 289150 }, { - "epoch": 1.46, - "learning_rate": 8.117258880687751e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018756833540272848, + "loss": 0.0115, "step": 289160 }, { - "epoch": 1.46, - "learning_rate": 8.11650211138635e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018756444718635702, + "loss": 0.0163, "step": 289170 }, { - "epoch": 1.46, - "learning_rate": 8.11574534208495e-05, - "loss": 0.0134, + "epoch": 0.75, + "learning_rate": 0.00018756055896998553, + "loss": 0.0175, "step": 289180 }, { - "epoch": 1.46, - "learning_rate": 8.114988572783548e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018755667075361407, + "loss": 0.0139, "step": 289190 }, { - "epoch": 1.46, - "learning_rate": 8.114231803482148e-05, - "loss": 0.0054, + "epoch": 0.75, + "learning_rate": 0.00018755278253724264, + "loss": 0.0131, "step": 289200 }, { - "epoch": 1.46, - "learning_rate": 8.113475034180746e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018754889432087116, + "loss": 0.0179, "step": 289210 }, { - "epoch": 1.46, - "learning_rate": 8.112718264879345e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018754500610449967, + "loss": 0.0128, "step": 289220 }, { - "epoch": 1.46, - "learning_rate": 8.111961495577945e-05, - "loss": 0.0126, + "epoch": 0.75, + "learning_rate": 0.0001875411178881282, + "loss": 0.0149, "step": 289230 }, { - "epoch": 1.46, - "learning_rate": 8.111204726276543e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018753722967175678, + "loss": 0.0134, "step": 289240 }, { - "epoch": 1.46, - "learning_rate": 8.110447956975142e-05, - "loss": 0.0057, + "epoch": 0.75, + "learning_rate": 0.0001875333414553853, + "loss": 0.0151, "step": 289250 }, { - "epoch": 1.46, - "learning_rate": 8.109691187673742e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018752945323901384, + "loss": 0.0142, "step": 289260 }, { - "epoch": 1.46, - "learning_rate": 8.10893441837234e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018752556502264235, + "loss": 0.0121, "step": 289270 }, { - "epoch": 1.46, - "learning_rate": 8.10817764907094e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018752167680627092, + "loss": 0.0119, "step": 289280 }, { - "epoch": 1.46, - "learning_rate": 8.107420879769538e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.00018751778858989944, + "loss": 0.0174, "step": 289290 }, { - "epoch": 1.46, - "learning_rate": 8.106664110468137e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018751390037352798, + "loss": 0.0153, "step": 289300 }, { - "epoch": 1.46, - "learning_rate": 8.105907341166737e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.0001875100121571565, + "loss": 0.0128, "step": 289310 }, { - "epoch": 1.46, - "learning_rate": 8.105150571865335e-05, - "loss": 0.0129, + "epoch": 0.75, + "learning_rate": 0.00018750612394078503, + "loss": 0.0173, "step": 289320 }, { - "epoch": 1.46, - "learning_rate": 8.104393802563934e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018750223572441358, + "loss": 0.0157, "step": 289330 }, { - "epoch": 1.46, - "learning_rate": 8.103637033262534e-05, - "loss": 0.0109, + "epoch": 0.75, + "learning_rate": 0.00018749834750804212, + "loss": 0.0159, "step": 289340 }, { - "epoch": 1.46, - "learning_rate": 8.102880263961132e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018749445929167063, + "loss": 0.0139, "step": 289350 }, { - "epoch": 1.46, - "learning_rate": 8.102123494659732e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018749057107529917, + "loss": 0.0173, "step": 289360 }, { - "epoch": 1.46, - "learning_rate": 8.10136672535833e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018748668285892771, + "loss": 0.0152, "step": 289370 }, { - "epoch": 1.46, - "learning_rate": 8.100609956056929e-05, - "loss": 0.0107, + "epoch": 0.75, + "learning_rate": 0.00018748279464255626, + "loss": 0.0143, "step": 289380 }, { - "epoch": 1.46, - "learning_rate": 8.099853186755529e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018747890642618477, + "loss": 0.0157, "step": 289390 }, { - "epoch": 1.46, - "learning_rate": 8.099096417454125e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001874750182098133, + "loss": 0.0162, "step": 289400 }, { - "epoch": 1.46, - "learning_rate": 8.098339648152725e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018747112999344188, + "loss": 0.014, "step": 289410 }, { - "epoch": 1.46, - "learning_rate": 8.097582878851323e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.0001874672417770704, + "loss": 0.0178, "step": 289420 }, { - "epoch": 1.46, - "learning_rate": 8.096826109549923e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018746335356069894, + "loss": 0.0141, "step": 289430 }, { - "epoch": 1.46, - "learning_rate": 8.096069340248522e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018745946534432745, + "loss": 0.0119, "step": 289440 }, { - "epoch": 1.46, - "learning_rate": 8.09531257094712e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018745557712795602, + "loss": 0.0239, "step": 289450 }, { - "epoch": 1.46, - "learning_rate": 8.09455580164572e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018745168891158454, + "loss": 0.0167, "step": 289460 }, { - "epoch": 1.46, - "learning_rate": 8.093799032344318e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018744780069521308, + "loss": 0.0142, "step": 289470 }, { - "epoch": 1.46, - "learning_rate": 8.093042263042917e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.0001874439124788416, + "loss": 0.0164, "step": 289480 }, { - "epoch": 1.46, - "learning_rate": 8.092285493741517e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018744002426247016, + "loss": 0.0138, "step": 289490 }, { - "epoch": 1.46, - "learning_rate": 8.091528724440115e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018743613604609867, + "loss": 0.0133, "step": 289500 }, { - "epoch": 1.46, - "learning_rate": 8.090771955138715e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018743224782972722, + "loss": 0.0151, "step": 289510 }, { - "epoch": 1.46, - "learning_rate": 8.090015185837314e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018742835961335573, + "loss": 0.0133, "step": 289520 }, { - "epoch": 1.46, - "learning_rate": 8.089258416535912e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001874244713969843, + "loss": 0.0147, "step": 289530 }, { - "epoch": 1.46, - "learning_rate": 8.088501647234512e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018742058318061281, + "loss": 0.0123, "step": 289540 }, { - "epoch": 1.46, - "learning_rate": 8.087744877933111e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018741669496424136, + "loss": 0.0136, "step": 289550 }, { - "epoch": 1.46, - "learning_rate": 8.08698810863171e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018741280674786987, + "loss": 0.0173, "step": 289560 }, { - "epoch": 1.46, - "learning_rate": 8.086231339330309e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.0001874089185314984, + "loss": 0.0164, "step": 289570 }, { - "epoch": 1.46, - "learning_rate": 8.085474570028907e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018740503031512698, + "loss": 0.0165, "step": 289580 }, { - "epoch": 1.46, - "learning_rate": 8.084717800727506e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.0001874011420987555, + "loss": 0.018, "step": 289590 }, { - "epoch": 1.46, - "learning_rate": 8.083961031426106e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018739725388238404, + "loss": 0.0134, "step": 289600 }, { - "epoch": 1.46, - "learning_rate": 8.083204262124704e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018739336566601255, + "loss": 0.0138, "step": 289610 }, { - "epoch": 1.46, - "learning_rate": 8.082447492823304e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018738947744964112, + "loss": 0.0143, "step": 289620 }, { - "epoch": 1.46, - "learning_rate": 8.081690723521903e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.00018738558923326963, + "loss": 0.0149, "step": 289630 }, { - "epoch": 1.46, - "learning_rate": 8.080933954220501e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018738170101689818, + "loss": 0.0204, "step": 289640 }, { - "epoch": 1.46, - "learning_rate": 8.080177184919101e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.0001873778128005267, + "loss": 0.0134, "step": 289650 }, { - "epoch": 1.46, - "learning_rate": 8.079420415617699e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018737392458415526, + "loss": 0.0136, "step": 289660 }, { - "epoch": 1.46, - "learning_rate": 8.078663646316298e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018737003636778377, + "loss": 0.014, "step": 289670 }, { - "epoch": 1.46, - "learning_rate": 8.077906877014898e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.00018736614815141232, + "loss": 0.0156, "step": 289680 }, { - "epoch": 1.46, - "learning_rate": 8.077150107713496e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018736225993504083, + "loss": 0.0136, "step": 289690 }, { - "epoch": 1.46, - "learning_rate": 8.076393338412096e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.0001873583717186694, + "loss": 0.0142, "step": 289700 }, { - "epoch": 1.46, - "learning_rate": 8.075636569110695e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018735448350229791, + "loss": 0.0129, "step": 289710 }, { - "epoch": 1.46, - "learning_rate": 8.074879799809293e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018735059528592646, + "loss": 0.0128, "step": 289720 }, { - "epoch": 1.46, - "learning_rate": 8.074123030507893e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018734670706955497, + "loss": 0.0134, "step": 289730 }, { - "epoch": 1.46, - "learning_rate": 8.073366261206491e-05, - "loss": 0.0057, + "epoch": 0.75, + "learning_rate": 0.00018734281885318354, + "loss": 0.0135, "step": 289740 }, { - "epoch": 1.46, - "learning_rate": 8.07260949190509e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018733893063681208, + "loss": 0.0192, "step": 289750 }, { - "epoch": 1.46, - "learning_rate": 8.07185272260369e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.0001873350424204406, + "loss": 0.0142, "step": 289760 }, { - "epoch": 1.46, - "learning_rate": 8.071095953302288e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001873311542040691, + "loss": 0.0132, "step": 289770 }, { - "epoch": 1.46, - "learning_rate": 8.070339184000887e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018732726598769768, + "loss": 0.0128, "step": 289780 }, { - "epoch": 1.46, - "learning_rate": 8.069582414699487e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018732337777132622, + "loss": 0.0135, "step": 289790 }, { - "epoch": 1.46, - "learning_rate": 8.068825645398085e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018731948955495473, + "loss": 0.0129, "step": 289800 }, { - "epoch": 1.46, - "learning_rate": 8.068068876096685e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018731560133858328, + "loss": 0.0135, "step": 289810 }, { - "epoch": 1.46, - "learning_rate": 8.067312106795283e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.0001873117131222118, + "loss": 0.0129, "step": 289820 }, { - "epoch": 1.46, - "learning_rate": 8.066555337493882e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018730782490584036, + "loss": 0.0165, "step": 289830 }, { - "epoch": 1.46, - "learning_rate": 8.065798568192482e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018730393668946887, + "loss": 0.0134, "step": 289840 }, { - "epoch": 1.46, - "learning_rate": 8.06504179889108e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018730004847309742, + "loss": 0.0123, "step": 289850 }, { - "epoch": 1.46, - "learning_rate": 8.06428502958968e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018729616025672593, + "loss": 0.0153, "step": 289860 }, { - "epoch": 1.46, - "learning_rate": 8.063528260288279e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.0001872922720403545, + "loss": 0.0126, "step": 289870 }, { - "epoch": 1.46, - "learning_rate": 8.062771490986877e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.000187288383823983, + "loss": 0.0176, "step": 289880 }, { - "epoch": 1.46, - "learning_rate": 8.062014721685477e-05, - "loss": 0.0097, + "epoch": 0.75, + "learning_rate": 0.00018728449560761155, + "loss": 0.0145, "step": 289890 }, { - "epoch": 1.46, - "learning_rate": 8.061257952384075e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018728060739124007, + "loss": 0.0102, "step": 289900 }, { - "epoch": 1.46, - "learning_rate": 8.060501183082674e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018727671917486864, + "loss": 0.0143, "step": 289910 }, { - "epoch": 1.46, - "learning_rate": 8.059744413781274e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018727283095849718, + "loss": 0.0164, "step": 289920 }, { - "epoch": 1.46, - "learning_rate": 8.058987644479872e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001872689427421257, + "loss": 0.0149, "step": 289930 }, { - "epoch": 1.46, - "learning_rate": 8.058230875178471e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001872650545257542, + "loss": 0.0137, "step": 289940 }, { - "epoch": 1.46, - "learning_rate": 8.057474105877071e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018726116630938278, + "loss": 0.0122, "step": 289950 }, { - "epoch": 1.46, - "learning_rate": 8.056717336575669e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018725727809301132, + "loss": 0.0119, "step": 289960 }, { - "epoch": 1.46, - "learning_rate": 8.055960567274268e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018725338987663983, + "loss": 0.0172, "step": 289970 }, { - "epoch": 1.46, - "learning_rate": 8.055203797972867e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018724950166026838, + "loss": 0.0324, "step": 289980 }, { - "epoch": 1.46, - "learning_rate": 8.054447028671466e-05, - "loss": 0.0083, + "epoch": 0.75, + "learning_rate": 0.00018724561344389692, + "loss": 0.0143, "step": 289990 }, { - "epoch": 1.46, - "learning_rate": 8.053690259370066e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018724172522752546, + "loss": 0.0155, "step": 290000 }, { - "epoch": 1.46, - "eval_cer": 0.9144586111496574, - "eval_loss": 0.005535100121051073, - "eval_runtime": 115.6597, - "eval_samples_per_second": 17.292, - "eval_steps_per_second": 4.323, + "epoch": 0.75, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.00951974093914032, + "eval_runtime": 107.8612, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.636, "step": 290000 }, { - "epoch": 1.46, - "learning_rate": 8.052933490068664e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.00018723783701115397, + "loss": 0.0136, "step": 290010 }, { - "epoch": 1.46, - "learning_rate": 8.052176720767263e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018723394879478251, + "loss": 0.0121, "step": 290020 }, { - "epoch": 1.46, - "learning_rate": 8.05141995146586e-05, - "loss": 0.0092, + "epoch": 0.75, + "learning_rate": 0.00018723006057841106, + "loss": 0.0122, "step": 290030 }, { - "epoch": 1.46, - "learning_rate": 8.05066318216446e-05, - "loss": 0.01, + "epoch": 0.75, + "learning_rate": 0.0001872261723620396, + "loss": 0.0119, "step": 290040 }, { - "epoch": 1.46, - "learning_rate": 8.049906412863059e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.0001872222841456681, + "loss": 0.0195, "step": 290050 }, { - "epoch": 1.46, - "learning_rate": 8.049149643561657e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018721839592929665, + "loss": 0.0132, "step": 290060 }, { - "epoch": 1.46, - "learning_rate": 8.048392874260257e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.00018721450771292517, + "loss": 0.0152, "step": 290070 }, { - "epoch": 1.46, - "learning_rate": 8.047636104958856e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018721061949655374, + "loss": 0.0145, "step": 290080 }, { - "epoch": 1.46, - "learning_rate": 8.046879335657454e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018720673128018225, + "loss": 0.0156, "step": 290090 }, { - "epoch": 1.46, - "learning_rate": 8.046122566356054e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.0001872028430638108, + "loss": 0.0188, "step": 290100 }, { - "epoch": 1.46, - "learning_rate": 8.045365797054652e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.0001871989548474393, + "loss": 0.0116, "step": 290110 }, { - "epoch": 1.46, - "learning_rate": 8.044609027753252e-05, - "loss": 0.0057, + "epoch": 0.75, + "learning_rate": 0.00018719506663106788, + "loss": 0.0148, "step": 290120 }, { - "epoch": 1.46, - "learning_rate": 8.043852258451851e-05, - "loss": 0.0101, + "epoch": 0.75, + "learning_rate": 0.00018719117841469642, + "loss": 0.011, "step": 290130 }, { - "epoch": 1.46, - "learning_rate": 8.043095489150449e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018718729019832493, + "loss": 0.0148, "step": 290140 }, { - "epoch": 1.46, - "learning_rate": 8.042338719849049e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018718340198195347, + "loss": 0.0148, "step": 290150 }, { - "epoch": 1.46, - "learning_rate": 8.041581950547648e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018717951376558202, + "loss": 0.0141, "step": 290160 }, { - "epoch": 1.46, - "learning_rate": 8.040825181246246e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018717562554921056, + "loss": 0.0142, "step": 290170 }, { - "epoch": 1.46, - "learning_rate": 8.040068411944846e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018717173733283907, + "loss": 0.013, "step": 290180 }, { - "epoch": 1.46, - "learning_rate": 8.039311642643444e-05, - "loss": 0.0089, + "epoch": 0.75, + "learning_rate": 0.00018716784911646761, + "loss": 0.0138, "step": 290190 }, { - "epoch": 1.46, - "learning_rate": 8.038554873342043e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.00018716396090009616, + "loss": 0.0119, "step": 290200 }, { - "epoch": 1.46, - "learning_rate": 8.037798104040643e-05, - "loss": 0.0055, + "epoch": 0.75, + "learning_rate": 0.0001871600726837247, + "loss": 0.0114, "step": 290210 }, { - "epoch": 1.46, - "learning_rate": 8.037041334739241e-05, - "loss": 0.0091, + "epoch": 0.75, + "learning_rate": 0.0001871561844673532, + "loss": 0.0154, "step": 290220 }, { - "epoch": 1.46, - "learning_rate": 8.03628456543784e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018715229625098175, + "loss": 0.0149, "step": 290230 }, { - "epoch": 1.46, - "learning_rate": 8.03552779613644e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.0001871484080346103, + "loss": 0.0165, "step": 290240 }, { - "epoch": 1.46, - "learning_rate": 8.034771026835038e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018714451981823884, + "loss": 0.0132, "step": 290250 }, { - "epoch": 1.46, - "learning_rate": 8.034014257533638e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018714063160186735, + "loss": 0.0134, "step": 290260 }, { - "epoch": 1.46, - "learning_rate": 8.033257488232236e-05, - "loss": 0.006, + "epoch": 0.75, + "learning_rate": 0.0001871367433854959, + "loss": 0.0155, "step": 290270 }, { - "epoch": 1.46, - "learning_rate": 8.032500718930835e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018713285516912446, + "loss": 0.0136, "step": 290280 }, { - "epoch": 1.46, - "learning_rate": 8.031743949629435e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018712896695275298, + "loss": 0.0121, "step": 290290 }, { - "epoch": 1.46, - "learning_rate": 8.030987180328033e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018712507873638152, + "loss": 0.0195, "step": 290300 }, { - "epoch": 1.46, - "learning_rate": 8.030230411026633e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.00018712119052001003, + "loss": 0.0144, "step": 290310 }, { - "epoch": 1.46, - "learning_rate": 8.029473641725232e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018711730230363857, + "loss": 0.0141, "step": 290320 }, { - "epoch": 1.46, - "learning_rate": 8.02871687242383e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018711341408726712, + "loss": 0.0206, "step": 290330 }, { - "epoch": 1.46, - "learning_rate": 8.02796010312243e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018710952587089566, + "loss": 0.0126, "step": 290340 }, { - "epoch": 1.46, - "learning_rate": 8.027203333821028e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018710563765452417, + "loss": 0.0146, "step": 290350 }, { - "epoch": 1.46, - "learning_rate": 8.026446564519627e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018710174943815271, + "loss": 0.011, "step": 290360 }, { - "epoch": 1.46, - "learning_rate": 8.025689795218227e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018709786122178126, + "loss": 0.0106, "step": 290370 }, { - "epoch": 1.46, - "learning_rate": 8.024933025916825e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001870939730054098, + "loss": 0.0139, "step": 290380 }, { - "epoch": 1.47, - "learning_rate": 8.024176256615424e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.0001870900847890383, + "loss": 0.0119, "step": 290390 }, { - "epoch": 1.47, - "learning_rate": 8.023419487314024e-05, - "loss": 0.0057, + "epoch": 0.75, + "learning_rate": 0.00018708619657266685, + "loss": 0.0134, "step": 290400 }, { - "epoch": 1.47, - "learning_rate": 8.022662718012622e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.0001870823083562954, + "loss": 0.017, "step": 290410 }, { - "epoch": 1.47, - "learning_rate": 8.021905948711222e-05, - "loss": 0.0077, + "epoch": 0.75, + "learning_rate": 0.00018707842013992394, + "loss": 0.0133, "step": 290420 }, { - "epoch": 1.47, - "learning_rate": 8.02114917940982e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018707453192355245, + "loss": 0.0127, "step": 290430 }, { - "epoch": 1.47, - "learning_rate": 8.020392410108419e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.000187070643707181, + "loss": 0.0147, "step": 290440 }, { - "epoch": 1.47, - "learning_rate": 8.019635640807019e-05, - "loss": 0.0095, + "epoch": 0.75, + "learning_rate": 0.00018706675549080956, + "loss": 0.0132, "step": 290450 }, { - "epoch": 1.47, - "learning_rate": 8.018878871505617e-05, - "loss": 0.0098, + "epoch": 0.75, + "learning_rate": 0.00018706286727443808, + "loss": 0.0168, "step": 290460 }, { - "epoch": 1.47, - "learning_rate": 8.018122102204216e-05, - "loss": 0.0105, + "epoch": 0.75, + "learning_rate": 0.00018705897905806662, + "loss": 0.0193, "step": 290470 }, { - "epoch": 1.47, - "learning_rate": 8.017365332902816e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018705509084169513, + "loss": 0.015, "step": 290480 }, { - "epoch": 1.47, - "learning_rate": 8.016608563601414e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.0001870512026253237, + "loss": 0.0131, "step": 290490 }, { - "epoch": 1.47, - "learning_rate": 8.015851794300014e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.00018704731440895222, + "loss": 0.0155, "step": 290500 }, { - "epoch": 1.47, - "learning_rate": 8.015095024998613e-05, - "loss": 0.009, + "epoch": 0.75, + "learning_rate": 0.00018704342619258076, + "loss": 0.0165, "step": 290510 }, { - "epoch": 1.47, - "learning_rate": 8.014338255697211e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018703953797620927, + "loss": 0.0153, "step": 290520 }, { - "epoch": 1.47, - "learning_rate": 8.01358148639581e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018703564975983784, + "loss": 0.015, "step": 290530 }, { - "epoch": 1.47, - "learning_rate": 8.012824717094409e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018703176154346635, + "loss": 0.0125, "step": 290540 }, { - "epoch": 1.47, - "learning_rate": 8.012067947793008e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.0001870278733270949, + "loss": 0.0165, "step": 290550 }, { - "epoch": 1.47, - "learning_rate": 8.011311178491608e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001870239851107234, + "loss": 0.0153, "step": 290560 }, { - "epoch": 1.47, - "learning_rate": 8.010554409190206e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.00018702009689435195, + "loss": 0.013, "step": 290570 }, { - "epoch": 1.47, - "learning_rate": 8.009797639888805e-05, - "loss": 0.0099, + "epoch": 0.75, + "learning_rate": 0.0001870162086779805, + "loss": 0.0134, "step": 290580 }, { - "epoch": 1.47, - "learning_rate": 8.009040870587405e-05, - "loss": 0.0081, + "epoch": 0.75, + "learning_rate": 0.00018701232046160904, + "loss": 0.0158, "step": 290590 }, { - "epoch": 1.47, - "learning_rate": 8.008284101286003e-05, - "loss": 0.0058, + "epoch": 0.75, + "learning_rate": 0.00018700843224523755, + "loss": 0.0147, "step": 290600 }, { - "epoch": 1.47, - "learning_rate": 8.007527331984603e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001870045440288661, + "loss": 0.0139, "step": 290610 }, { - "epoch": 1.47, - "learning_rate": 8.006770562683201e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018700065581249466, + "loss": 0.017, "step": 290620 }, { - "epoch": 1.47, - "learning_rate": 8.0060137933818e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018699676759612318, + "loss": 0.0147, "step": 290630 }, { - "epoch": 1.47, - "learning_rate": 8.0052570240804e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.0001869928793797517, + "loss": 0.013, "step": 290640 }, { - "epoch": 1.47, - "learning_rate": 8.004500254778998e-05, - "loss": 0.0066, + "epoch": 0.75, + "learning_rate": 0.00018698899116338023, + "loss": 0.0137, "step": 290650 }, { - "epoch": 1.47, - "learning_rate": 8.003743485477596e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.0001869851029470088, + "loss": 0.0153, "step": 290660 }, { - "epoch": 1.47, - "learning_rate": 8.002986716176194e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.00018698121473063731, + "loss": 0.019, "step": 290670 }, { - "epoch": 1.47, - "learning_rate": 8.002229946874794e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018697732651426586, + "loss": 0.0174, "step": 290680 }, { - "epoch": 1.47, - "learning_rate": 8.001473177573393e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018697343829789437, + "loss": 0.0126, "step": 290690 }, { - "epoch": 1.47, - "learning_rate": 8.000716408271991e-05, - "loss": 0.0054, + "epoch": 0.75, + "learning_rate": 0.00018696955008152294, + "loss": 0.0136, "step": 290700 }, { - "epoch": 1.47, - "learning_rate": 7.999959638970591e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018696566186515145, + "loss": 0.0115, "step": 290710 }, { - "epoch": 1.47, - "learning_rate": 7.999202869669189e-05, - "loss": 0.0099, + "epoch": 0.75, + "learning_rate": 0.00018696177364878, + "loss": 0.0153, "step": 290720 }, { - "epoch": 1.47, - "learning_rate": 7.998446100367788e-05, - "loss": 0.0087, + "epoch": 0.75, + "learning_rate": 0.0001869578854324085, + "loss": 0.0143, "step": 290730 }, { - "epoch": 1.47, - "learning_rate": 7.997689331066388e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018695399721603708, + "loss": 0.0153, "step": 290740 }, { - "epoch": 1.47, - "learning_rate": 7.996932561764986e-05, - "loss": 0.0067, + "epoch": 0.75, + "learning_rate": 0.0001869501089996656, + "loss": 0.0163, "step": 290750 }, { - "epoch": 1.47, - "learning_rate": 7.996175792463586e-05, - "loss": 0.0086, + "epoch": 0.75, + "learning_rate": 0.00018694622078329414, + "loss": 0.0136, "step": 290760 }, { - "epoch": 1.47, - "learning_rate": 7.995419023162185e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.00018694233256692265, + "loss": 0.0151, "step": 290770 }, { - "epoch": 1.47, - "learning_rate": 7.994662253860783e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018693844435055122, + "loss": 0.0164, "step": 290780 }, { - "epoch": 1.47, - "learning_rate": 7.993905484559383e-05, - "loss": 0.0088, + "epoch": 0.75, + "learning_rate": 0.00018693455613417976, + "loss": 0.0177, "step": 290790 }, { - "epoch": 1.47, - "learning_rate": 7.993148715257981e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018693066791780827, + "loss": 0.0139, "step": 290800 }, { - "epoch": 1.47, - "learning_rate": 7.99239194595658e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.0001869267797014368, + "loss": 0.0143, "step": 290810 }, { - "epoch": 1.47, - "learning_rate": 7.99163517665518e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.00018692289148506533, + "loss": 0.0144, "step": 290820 }, { - "epoch": 1.47, - "learning_rate": 7.990878407353778e-05, - "loss": 0.0107, + "epoch": 0.75, + "learning_rate": 0.0001869190032686939, + "loss": 0.016, "step": 290830 }, { - "epoch": 1.47, - "learning_rate": 7.990121638052378e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018691511505232241, + "loss": 0.017, "step": 290840 }, { - "epoch": 1.47, - "learning_rate": 7.989364868750977e-05, - "loss": 0.009, + "epoch": 0.75, + "learning_rate": 0.00018691122683595096, + "loss": 0.0155, "step": 290850 }, { - "epoch": 1.47, - "learning_rate": 7.988608099449575e-05, - "loss": 0.008, + "epoch": 0.75, + "learning_rate": 0.00018690733861957947, + "loss": 0.0144, "step": 290860 }, { - "epoch": 1.47, - "learning_rate": 7.987851330148175e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018690345040320804, + "loss": 0.0126, "step": 290870 }, { - "epoch": 1.47, - "learning_rate": 7.987094560846773e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018689956218683655, + "loss": 0.0146, "step": 290880 }, { - "epoch": 1.47, - "learning_rate": 7.986337791545372e-05, - "loss": 0.0104, + "epoch": 0.75, + "learning_rate": 0.0001868956739704651, + "loss": 0.0168, "step": 290890 }, { - "epoch": 1.47, - "learning_rate": 7.985581022243972e-05, - "loss": 0.0059, + "epoch": 0.75, + "learning_rate": 0.0001868917857540936, + "loss": 0.0139, "step": 290900 }, { - "epoch": 1.47, - "learning_rate": 7.98482425294257e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018688789753772218, + "loss": 0.0133, "step": 290910 }, { - "epoch": 1.47, - "learning_rate": 7.98406748364117e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.0001868840093213507, + "loss": 0.0132, "step": 290920 }, { - "epoch": 1.47, - "learning_rate": 7.983310714339769e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018688012110497923, + "loss": 0.0131, "step": 290930 }, { - "epoch": 1.47, - "learning_rate": 7.982553945038367e-05, - "loss": 0.0061, + "epoch": 0.75, + "learning_rate": 0.00018687623288860775, + "loss": 0.0152, "step": 290940 }, { - "epoch": 1.47, - "learning_rate": 7.981797175736967e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018687234467223632, + "loss": 0.0144, "step": 290950 }, { - "epoch": 1.47, - "learning_rate": 7.981040406435566e-05, - "loss": 0.0078, + "epoch": 0.75, + "learning_rate": 0.00018686845645586483, + "loss": 0.0147, "step": 290960 }, { - "epoch": 1.47, - "learning_rate": 7.980283637134164e-05, - "loss": 0.0056, + "epoch": 0.75, + "learning_rate": 0.00018686456823949337, + "loss": 0.0146, "step": 290970 }, { - "epoch": 1.47, - "learning_rate": 7.979526867832764e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.0001868606800231219, + "loss": 0.0117, "step": 290980 }, { - "epoch": 1.47, - "learning_rate": 7.978770098531362e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018685679180675046, + "loss": 0.0159, "step": 290990 }, { - "epoch": 1.47, - "learning_rate": 7.978013329229961e-05, - "loss": 0.0068, + "epoch": 0.75, + "learning_rate": 0.000186852903590379, + "loss": 0.0129, "step": 291000 }, { - "epoch": 1.47, - "eval_cer": 0.9144314400581461, - "eval_loss": 0.00572578888386488, - "eval_runtime": 115.7089, - "eval_samples_per_second": 17.285, - "eval_steps_per_second": 4.321, + "epoch": 0.75, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.009270302951335907, + "eval_runtime": 107.7514, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, "step": 291000 }, { - "epoch": 1.47, - "learning_rate": 7.977256559928561e-05, - "loss": 0.0074, + "epoch": 0.75, + "learning_rate": 0.00018684901537400751, + "loss": 0.0247, "step": 291010 }, { - "epoch": 1.47, - "learning_rate": 7.976499790627159e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018684512715763606, + "loss": 0.0235, "step": 291020 }, { - "epoch": 1.47, - "learning_rate": 7.975743021325759e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018684123894126457, + "loss": 0.0144, "step": 291030 }, { - "epoch": 1.47, - "learning_rate": 7.974986252024358e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.00018683735072489314, + "loss": 0.0151, "step": 291040 }, { - "epoch": 1.47, - "learning_rate": 7.974229482722956e-05, - "loss": 0.0063, + "epoch": 0.75, + "learning_rate": 0.00018683346250852165, + "loss": 0.0149, "step": 291050 }, { - "epoch": 1.47, - "learning_rate": 7.973472713421556e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.0001868295742921502, + "loss": 0.0155, "step": 291060 }, { - "epoch": 1.47, - "learning_rate": 7.972715944120154e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.0001868256860757787, + "loss": 0.0135, "step": 291070 }, { - "epoch": 1.47, - "learning_rate": 7.971959174818753e-05, - "loss": 0.0079, + "epoch": 0.75, + "learning_rate": 0.00018682179785940728, + "loss": 0.0153, "step": 291080 }, { - "epoch": 1.47, - "learning_rate": 7.971202405517353e-05, - "loss": 0.0082, + "epoch": 0.75, + "learning_rate": 0.0001868179096430358, + "loss": 0.0165, "step": 291090 }, { - "epoch": 1.47, - "learning_rate": 7.970445636215951e-05, - "loss": 0.0075, + "epoch": 0.75, + "learning_rate": 0.00018681402142666433, + "loss": 0.0131, "step": 291100 }, { - "epoch": 1.47, - "learning_rate": 7.96968886691455e-05, - "loss": 0.0072, + "epoch": 0.75, + "learning_rate": 0.00018681013321029285, + "loss": 0.0151, "step": 291110 }, { - "epoch": 1.47, - "learning_rate": 7.96893209761315e-05, - "loss": 0.0062, + "epoch": 0.75, + "learning_rate": 0.00018680624499392142, + "loss": 0.0183, "step": 291120 }, { - "epoch": 1.47, - "learning_rate": 7.968175328311748e-05, - "loss": 0.0069, + "epoch": 0.75, + "learning_rate": 0.00018680235677754993, + "loss": 0.0157, "step": 291130 }, { - "epoch": 1.47, - "learning_rate": 7.967418559010348e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018679846856117847, + "loss": 0.0175, "step": 291140 }, { - "epoch": 1.47, - "learning_rate": 7.966661789708946e-05, - "loss": 0.0064, + "epoch": 0.75, + "learning_rate": 0.000186794580344807, + "loss": 0.0135, "step": 291150 }, { - "epoch": 1.47, - "learning_rate": 7.965905020407545e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018679069212843556, + "loss": 0.0188, "step": 291160 }, { - "epoch": 1.47, - "learning_rate": 7.965148251106145e-05, - "loss": 0.0084, + "epoch": 0.75, + "learning_rate": 0.0001867868039120641, + "loss": 0.0169, "step": 291170 }, { - "epoch": 1.47, - "learning_rate": 7.964391481804743e-05, - "loss": 0.0071, + "epoch": 0.75, + "learning_rate": 0.0001867829156956926, + "loss": 0.0126, "step": 291180 }, { - "epoch": 1.47, - "learning_rate": 7.963634712503342e-05, - "loss": 0.0065, + "epoch": 0.75, + "learning_rate": 0.00018677902747932115, + "loss": 0.0164, "step": 291190 }, { - "epoch": 1.47, - "learning_rate": 7.962877943201942e-05, - "loss": 0.0054, + "epoch": 0.75, + "learning_rate": 0.0001867751392629497, + "loss": 0.0158, "step": 291200 }, { - "epoch": 1.47, - "learning_rate": 7.96212117390054e-05, - "loss": 0.0094, + "epoch": 0.75, + "learning_rate": 0.00018677125104657824, + "loss": 0.0136, "step": 291210 }, { - "epoch": 1.47, - "learning_rate": 7.96136440459914e-05, - "loss": 0.0073, + "epoch": 0.75, + "learning_rate": 0.00018676736283020675, + "loss": 0.0143, "step": 291220 }, { - "epoch": 1.47, - "learning_rate": 7.960607635297738e-05, - "loss": 0.0085, + "epoch": 0.75, + "learning_rate": 0.0001867634746138353, + "loss": 0.0158, "step": 291230 }, { - "epoch": 1.47, - "learning_rate": 7.959850865996337e-05, - "loss": 0.007, + "epoch": 0.75, + "learning_rate": 0.00018675958639746384, + "loss": 0.0166, "step": 291240 }, { - "epoch": 1.47, - "learning_rate": 7.959094096694937e-05, - "loss": 0.0076, + "epoch": 0.75, + "learning_rate": 0.00018675569818109238, + "loss": 0.0133, "step": 291250 }, { - "epoch": 1.47, - "learning_rate": 7.958337327393535e-05, - "loss": 0.0101, + "epoch": 0.75, + "learning_rate": 0.0001867518099647209, + "loss": 0.0171, "step": 291260 }, { - "epoch": 1.47, - "learning_rate": 7.957580558092134e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018674792174834943, + "loss": 0.0125, "step": 291270 }, { - "epoch": 1.47, - "learning_rate": 7.956823788790734e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018674403353197795, + "loss": 0.0133, "step": 291280 }, { - "epoch": 1.47, - "learning_rate": 7.95606701948933e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018674014531560652, + "loss": 0.0159, "step": 291290 }, { - "epoch": 1.47, - "learning_rate": 7.95531025018793e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018673625709923503, + "loss": 0.0133, "step": 291300 }, { - "epoch": 1.47, - "learning_rate": 7.954553480886528e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018673236888286357, + "loss": 0.0147, "step": 291310 }, { - "epoch": 1.47, - "learning_rate": 7.953796711585128e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001867284806664921, + "loss": 0.0135, "step": 291320 }, { - "epoch": 1.47, - "learning_rate": 7.953039942283726e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018672459245012066, + "loss": 0.0139, "step": 291330 }, { - "epoch": 1.47, - "learning_rate": 7.952283172982325e-05, - "loss": 0.0048, + "epoch": 0.76, + "learning_rate": 0.0001867207042337492, + "loss": 0.0146, "step": 291340 }, { - "epoch": 1.47, - "learning_rate": 7.951526403680925e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.0001867168160173777, + "loss": 0.0179, "step": 291350 }, { - "epoch": 1.47, - "learning_rate": 7.950769634379523e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018671292780100623, + "loss": 0.0201, "step": 291360 }, { - "epoch": 1.47, - "learning_rate": 7.950012865078123e-05, - "loss": 0.0103, + "epoch": 0.76, + "learning_rate": 0.0001867090395846348, + "loss": 0.0114, "step": 291370 }, { - "epoch": 1.47, - "learning_rate": 7.949256095776722e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018670515136826334, + "loss": 0.0147, "step": 291380 }, { - "epoch": 1.47, - "learning_rate": 7.94849932647532e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018670126315189185, + "loss": 0.0147, "step": 291390 }, { - "epoch": 1.47, - "learning_rate": 7.94774255717392e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.0001866973749355204, + "loss": 0.0158, "step": 291400 }, { - "epoch": 1.47, - "learning_rate": 7.946985787872518e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018669348671914894, + "loss": 0.0144, "step": 291410 }, { - "epoch": 1.47, - "learning_rate": 7.946229018571117e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.00018668959850277748, + "loss": 0.0122, "step": 291420 }, { - "epoch": 1.47, - "learning_rate": 7.945472249269717e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.000186685710286406, + "loss": 0.0127, "step": 291430 }, { - "epoch": 1.47, - "learning_rate": 7.944715479968315e-05, - "loss": 0.0101, + "epoch": 0.76, + "learning_rate": 0.00018668182207003453, + "loss": 0.0145, "step": 291440 }, { - "epoch": 1.47, - "learning_rate": 7.943958710666914e-05, - "loss": 0.0093, + "epoch": 0.76, + "learning_rate": 0.00018667793385366307, + "loss": 0.0139, "step": 291450 }, { - "epoch": 1.47, - "learning_rate": 7.943201941365514e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018667404563729162, + "loss": 0.0188, "step": 291460 }, { - "epoch": 1.47, - "learning_rate": 7.942445172064112e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018667015742092013, + "loss": 0.0147, "step": 291470 }, { - "epoch": 1.47, - "learning_rate": 7.941688402762712e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018666626920454867, + "loss": 0.0145, "step": 291480 }, { - "epoch": 1.47, - "learning_rate": 7.940931633461311e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018666238098817724, + "loss": 0.0118, "step": 291490 }, { - "epoch": 1.47, - "learning_rate": 7.940174864159909e-05, - "loss": 0.0118, + "epoch": 0.76, + "learning_rate": 0.00018665849277180576, + "loss": 0.0159, "step": 291500 }, { - "epoch": 1.47, - "learning_rate": 7.939418094858509e-05, - "loss": 0.0119, + "epoch": 0.76, + "learning_rate": 0.0001866546045554343, + "loss": 0.0131, "step": 291510 }, { - "epoch": 1.47, - "learning_rate": 7.938661325557107e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.0001866507163390628, + "loss": 0.0183, "step": 291520 }, { - "epoch": 1.47, - "learning_rate": 7.937904556255706e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018664682812269133, + "loss": 0.018, "step": 291530 }, { - "epoch": 1.47, - "learning_rate": 7.937147786954306e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.0001866429399063199, + "loss": 0.0169, "step": 291540 }, { - "epoch": 1.47, - "learning_rate": 7.936391017652904e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018663905168994844, + "loss": 0.0156, "step": 291550 }, { - "epoch": 1.47, - "learning_rate": 7.935634248351504e-05, - "loss": 0.0099, + "epoch": 0.76, + "learning_rate": 0.00018663516347357695, + "loss": 0.0169, "step": 291560 }, { - "epoch": 1.47, - "learning_rate": 7.934877479050103e-05, - "loss": 0.0138, + "epoch": 0.76, + "learning_rate": 0.0001866312752572055, + "loss": 0.0151, "step": 291570 }, { - "epoch": 1.47, - "learning_rate": 7.934120709748701e-05, - "loss": 0.0103, + "epoch": 0.76, + "learning_rate": 0.00018662738704083403, + "loss": 0.0138, "step": 291580 }, { - "epoch": 1.47, - "learning_rate": 7.933363940447301e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018662349882446258, + "loss": 0.0153, "step": 291590 }, { - "epoch": 1.47, - "learning_rate": 7.932607171145899e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.0001866196106080911, + "loss": 0.0149, "step": 291600 }, { - "epoch": 1.47, - "learning_rate": 7.931850401844498e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018661572239171963, + "loss": 0.0124, "step": 291610 }, { - "epoch": 1.47, - "learning_rate": 7.931093632543098e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018661183417534817, + "loss": 0.0129, "step": 291620 }, { - "epoch": 1.47, - "learning_rate": 7.930336863241696e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018660794595897672, + "loss": 0.0124, "step": 291630 }, { - "epoch": 1.47, - "learning_rate": 7.929580093940295e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018660405774260523, + "loss": 0.0139, "step": 291640 }, { - "epoch": 1.47, - "learning_rate": 7.928823324638895e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018660016952623377, + "loss": 0.0192, "step": 291650 }, { - "epoch": 1.47, - "learning_rate": 7.928066555337493e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018659628130986234, + "loss": 0.0154, "step": 291660 }, { - "epoch": 1.47, - "learning_rate": 7.927309786036093e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018659239309349086, + "loss": 0.015, "step": 291670 }, { - "epoch": 1.47, - "learning_rate": 7.926553016734691e-05, - "loss": 0.0107, + "epoch": 0.76, + "learning_rate": 0.00018658850487711937, + "loss": 0.0143, "step": 291680 }, { - "epoch": 1.47, - "learning_rate": 7.92579624743329e-05, - "loss": 0.0096, + "epoch": 0.76, + "learning_rate": 0.0001865846166607479, + "loss": 0.0195, "step": 291690 }, { - "epoch": 1.47, - "learning_rate": 7.92503947813189e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018658072844437648, + "loss": 0.0112, "step": 291700 }, { - "epoch": 1.47, - "learning_rate": 7.924282708830488e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.000186576840228005, + "loss": 0.0134, "step": 291710 }, { - "epoch": 1.47, - "learning_rate": 7.923525939529087e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018657295201163354, + "loss": 0.0144, "step": 291720 }, { - "epoch": 1.47, - "learning_rate": 7.922769170227687e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018656906379526205, + "loss": 0.0133, "step": 291730 }, { - "epoch": 1.47, - "learning_rate": 7.922012400926285e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018656517557889062, + "loss": 0.0144, "step": 291740 }, { - "epoch": 1.47, - "learning_rate": 7.921255631624885e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018656128736251913, + "loss": 0.0125, "step": 291750 }, { - "epoch": 1.47, - "learning_rate": 7.920498862323483e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018655739914614768, + "loss": 0.0125, "step": 291760 }, { - "epoch": 1.47, - "learning_rate": 7.919742093022082e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001865535109297762, + "loss": 0.0151, "step": 291770 }, { - "epoch": 1.47, - "learning_rate": 7.918985323720682e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018654962271340473, + "loss": 0.0123, "step": 291780 }, { - "epoch": 1.47, - "learning_rate": 7.91822855441928e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018654573449703327, + "loss": 0.0124, "step": 291790 }, { - "epoch": 1.47, - "learning_rate": 7.91747178511788e-05, - "loss": 0.0103, + "epoch": 0.76, + "learning_rate": 0.00018654184628066182, + "loss": 0.0175, "step": 291800 }, { - "epoch": 1.47, - "learning_rate": 7.916715015816479e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018653795806429033, + "loss": 0.0146, "step": 291810 }, { - "epoch": 1.47, - "learning_rate": 7.915958246515077e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018653406984791887, + "loss": 0.049, "step": 291820 }, { - "epoch": 1.47, - "learning_rate": 7.915201477213676e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.0001865301816315474, + "loss": 0.0281, "step": 291830 }, { - "epoch": 1.47, - "learning_rate": 7.914444707912275e-05, - "loss": 0.0095, + "epoch": 0.76, + "learning_rate": 0.00018652629341517595, + "loss": 0.0168, "step": 291840 }, { - "epoch": 1.47, - "learning_rate": 7.913687938610874e-05, - "loss": 0.0098, + "epoch": 0.76, + "learning_rate": 0.00018652240519880447, + "loss": 0.014, "step": 291850 }, { - "epoch": 1.47, - "learning_rate": 7.912931169309474e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.000186518516982433, + "loss": 0.016, "step": 291860 }, { - "epoch": 1.47, - "learning_rate": 7.912174400008072e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018651462876606158, + "loss": 0.0118, "step": 291870 }, { - "epoch": 1.47, - "learning_rate": 7.911417630706671e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.0001865107405496901, + "loss": 0.0105, "step": 291880 }, { - "epoch": 1.47, - "learning_rate": 7.910660861405271e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.00018650685233331864, + "loss": 0.0158, "step": 291890 }, { - "epoch": 1.47, - "learning_rate": 7.909904092103869e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018650296411694715, + "loss": 0.0147, "step": 291900 }, { - "epoch": 1.47, - "learning_rate": 7.909147322802468e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018649907590057572, + "loss": 0.0125, "step": 291910 }, { - "epoch": 1.47, - "learning_rate": 7.908390553501065e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018649518768420423, + "loss": 0.0169, "step": 291920 }, { - "epoch": 1.47, - "learning_rate": 7.907633784199665e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018649129946783278, + "loss": 0.0154, "step": 291930 }, { - "epoch": 1.47, - "learning_rate": 7.906877014898264e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.0001864874112514613, + "loss": 0.0126, "step": 291940 }, { - "epoch": 1.47, - "learning_rate": 7.906120245596862e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018648352303508986, + "loss": 0.0136, "step": 291950 }, { - "epoch": 1.47, - "learning_rate": 7.905363476295462e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018647963481871837, + "loss": 0.0139, "step": 291960 }, { - "epoch": 1.47, - "learning_rate": 7.90460670699406e-05, - "loss": 0.0057, + "epoch": 0.76, + "learning_rate": 0.00018647574660234691, + "loss": 0.0132, "step": 291970 }, { - "epoch": 1.47, - "learning_rate": 7.90384993769266e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.00018647185838597543, + "loss": 0.0157, "step": 291980 }, { - "epoch": 1.47, - "learning_rate": 7.903093168391259e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.000186467970169604, + "loss": 0.0148, "step": 291990 }, { - "epoch": 1.47, - "learning_rate": 7.902336399089857e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.0001864640819532325, + "loss": 0.0138, "step": 292000 }, { - "epoch": 1.47, - "eval_cer": 0.9144362920387732, - "eval_loss": 0.0056129819713532925, - "eval_runtime": 115.8149, - "eval_samples_per_second": 17.269, - "eval_steps_per_second": 4.317, + "epoch": 0.76, + "eval_cer": 0.8817208816033121, + "eval_loss": 0.009960480034351349, + "eval_runtime": 107.9451, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, "step": 292000 }, { - "epoch": 1.47, - "learning_rate": 7.901579629788457e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018646019373686105, + "loss": 0.0124, "step": 292010 }, { - "epoch": 1.47, - "learning_rate": 7.900822860487056e-05, - "loss": 0.0053, + "epoch": 0.76, + "learning_rate": 0.00018645630552048957, + "loss": 0.0127, "step": 292020 }, { - "epoch": 1.47, - "learning_rate": 7.900066091185654e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.0001864524173041181, + "loss": 0.0188, "step": 292030 }, { - "epoch": 1.47, - "learning_rate": 7.899309321884254e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018644852908774668, + "loss": 0.0161, "step": 292040 }, { - "epoch": 1.47, - "learning_rate": 7.898552552582852e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.0001864446408713752, + "loss": 0.0164, "step": 292050 }, { - "epoch": 1.47, - "learning_rate": 7.897795783281451e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018644075265500374, + "loss": 0.0177, "step": 292060 }, { - "epoch": 1.47, - "learning_rate": 7.897039013980051e-05, - "loss": 0.0095, + "epoch": 0.76, + "learning_rate": 0.00018643686443863225, + "loss": 0.0172, "step": 292070 }, { - "epoch": 1.47, - "learning_rate": 7.896282244678649e-05, - "loss": 0.0099, + "epoch": 0.76, + "learning_rate": 0.00018643297622226082, + "loss": 0.0166, "step": 292080 }, { - "epoch": 1.47, - "learning_rate": 7.895525475377249e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018642908800588933, + "loss": 0.0154, "step": 292090 }, { - "epoch": 1.47, - "learning_rate": 7.894768706075848e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018642519978951787, + "loss": 0.0128, "step": 292100 }, { - "epoch": 1.47, - "learning_rate": 7.894011936774446e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.0001864213115731464, + "loss": 0.0172, "step": 292110 }, { - "epoch": 1.47, - "learning_rate": 7.893255167473046e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018641742335677496, + "loss": 0.0125, "step": 292120 }, { - "epoch": 1.47, - "learning_rate": 7.892498398171644e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018641353514040347, + "loss": 0.0159, "step": 292130 }, { - "epoch": 1.47, - "learning_rate": 7.891741628870243e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018640964692403201, + "loss": 0.0145, "step": 292140 }, { - "epoch": 1.47, - "learning_rate": 7.890984859568843e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.00018640575870766053, + "loss": 0.0143, "step": 292150 }, { - "epoch": 1.47, - "learning_rate": 7.890228090267441e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.0001864018704912891, + "loss": 0.0114, "step": 292160 }, { - "epoch": 1.47, - "learning_rate": 7.88947132096604e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001863979822749176, + "loss": 0.0139, "step": 292170 }, { - "epoch": 1.47, - "learning_rate": 7.88871455166464e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018639409405854615, + "loss": 0.0128, "step": 292180 }, { - "epoch": 1.47, - "learning_rate": 7.887957782363238e-05, - "loss": 0.0096, + "epoch": 0.76, + "learning_rate": 0.00018639020584217467, + "loss": 0.0121, "step": 292190 }, { - "epoch": 1.47, - "learning_rate": 7.887201013061838e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018638631762580324, + "loss": 0.0137, "step": 292200 }, { - "epoch": 1.47, - "learning_rate": 7.886444243760436e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018638242940943178, + "loss": 0.0181, "step": 292210 }, { - "epoch": 1.47, - "learning_rate": 7.885687474459035e-05, - "loss": 0.0093, + "epoch": 0.76, + "learning_rate": 0.0001863785411930603, + "loss": 0.0152, "step": 292220 }, { - "epoch": 1.47, - "learning_rate": 7.884930705157635e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001863746529766888, + "loss": 0.0157, "step": 292230 }, { - "epoch": 1.47, - "learning_rate": 7.884173935856233e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018637076476031738, + "loss": 0.0147, "step": 292240 }, { - "epoch": 1.47, - "learning_rate": 7.883417166554832e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018636687654394592, + "loss": 0.0174, "step": 292250 }, { - "epoch": 1.47, - "learning_rate": 7.882660397253432e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018636298832757443, + "loss": 0.0156, "step": 292260 }, { - "epoch": 1.47, - "learning_rate": 7.88190362795203e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018635910011120297, + "loss": 0.017, "step": 292270 }, { - "epoch": 1.47, - "learning_rate": 7.88114685865063e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.0001863552118948315, + "loss": 0.0183, "step": 292280 }, { - "epoch": 1.47, - "learning_rate": 7.880390089349228e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018635132367846006, + "loss": 0.0107, "step": 292290 }, { - "epoch": 1.47, - "learning_rate": 7.879633320047827e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018634743546208857, + "loss": 0.0141, "step": 292300 }, { - "epoch": 1.47, - "learning_rate": 7.878876550746427e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.0001863435472457171, + "loss": 0.0132, "step": 292310 }, { - "epoch": 1.47, - "learning_rate": 7.878119781445025e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018633965902934563, + "loss": 0.0145, "step": 292320 }, { - "epoch": 1.47, - "learning_rate": 7.877363012143624e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.0001863357708129742, + "loss": 0.0147, "step": 292330 }, { - "epoch": 1.47, - "learning_rate": 7.876606242842224e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.0001863318825966027, + "loss": 0.012, "step": 292340 }, { - "epoch": 1.47, - "learning_rate": 7.875849473540822e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018632799438023125, + "loss": 0.0154, "step": 292350 }, { - "epoch": 1.47, - "learning_rate": 7.875092704239421e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018632410616385977, + "loss": 0.0133, "step": 292360 }, { - "epoch": 1.48, - "learning_rate": 7.87433593493802e-05, - "loss": 0.0094, + "epoch": 0.76, + "learning_rate": 0.00018632021794748834, + "loss": 0.0145, "step": 292370 }, { - "epoch": 1.48, - "learning_rate": 7.873579165636619e-05, - "loss": 0.0057, - "step": 292380 + "epoch": 0.76, + "learning_rate": 0.00018631632973111688, + "loss": 0.0145, + "step": 292380 }, { - "epoch": 1.48, - "learning_rate": 7.872822396335219e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.0001863124415147454, + "loss": 0.0131, "step": 292390 }, { - "epoch": 1.48, - "learning_rate": 7.872065627033817e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.0001863085532983739, + "loss": 0.0178, "step": 292400 }, { - "epoch": 1.48, - "learning_rate": 7.871308857732416e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018630466508200248, + "loss": 0.0129, "step": 292410 }, { - "epoch": 1.48, - "learning_rate": 7.870552088431016e-05, - "loss": 0.0052, + "epoch": 0.76, + "learning_rate": 0.00018630077686563102, + "loss": 0.0147, "step": 292420 }, { - "epoch": 1.48, - "learning_rate": 7.869795319129614e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018629688864925953, + "loss": 0.0135, "step": 292430 }, { - "epoch": 1.48, - "learning_rate": 7.869038549828213e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018629300043288807, + "loss": 0.0155, "step": 292440 }, { - "epoch": 1.48, - "learning_rate": 7.868281780526813e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.00018628911221651661, + "loss": 0.0128, "step": 292450 }, { - "epoch": 1.48, - "learning_rate": 7.867525011225411e-05, - "loss": 0.0094, + "epoch": 0.76, + "learning_rate": 0.00018628522400014516, + "loss": 0.0144, "step": 292460 }, { - "epoch": 1.48, - "learning_rate": 7.86676824192401e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018628133578377367, + "loss": 0.0149, "step": 292470 }, { - "epoch": 1.48, - "learning_rate": 7.866011472622609e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.0001862774475674022, + "loss": 0.0118, "step": 292480 }, { - "epoch": 1.48, - "learning_rate": 7.865254703321208e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018627355935103075, + "loss": 0.0121, "step": 292490 }, { - "epoch": 1.48, - "learning_rate": 7.864497934019808e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.0001862696711346593, + "loss": 0.0175, "step": 292500 }, { - "epoch": 1.48, - "learning_rate": 7.863741164718406e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.0001862657829182878, + "loss": 0.0146, "step": 292510 }, { - "epoch": 1.48, - "learning_rate": 7.862984395417005e-05, - "loss": 0.0045, + "epoch": 0.76, + "learning_rate": 0.00018626189470191635, + "loss": 0.0119, "step": 292520 }, { - "epoch": 1.48, - "learning_rate": 7.862227626115605e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018625800648554487, + "loss": 0.0136, "step": 292530 }, { - "epoch": 1.48, - "learning_rate": 7.861470856814203e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018625411826917344, + "loss": 0.0114, "step": 292540 }, { - "epoch": 1.48, - "learning_rate": 7.860714087512801e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018625023005280195, + "loss": 0.0149, "step": 292550 }, { - "epoch": 1.48, - "learning_rate": 7.859957318211399e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001862463418364305, + "loss": 0.0133, "step": 292560 }, { - "epoch": 1.48, - "learning_rate": 7.859200548909999e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.000186242453620059, + "loss": 0.0149, "step": 292570 }, { - "epoch": 1.48, - "learning_rate": 7.858443779608597e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018623856540368757, + "loss": 0.0167, "step": 292580 }, { - "epoch": 1.48, - "learning_rate": 7.857687010307196e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018623467718731612, + "loss": 0.0124, "step": 292590 }, { - "epoch": 1.48, - "learning_rate": 7.856930241005796e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018623078897094463, + "loss": 0.0178, "step": 292600 }, { - "epoch": 1.48, - "learning_rate": 7.856173471704394e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018622690075457317, + "loss": 0.0144, "step": 292610 }, { - "epoch": 1.48, - "learning_rate": 7.855416702402994e-05, - "loss": 0.0094, + "epoch": 0.76, + "learning_rate": 0.00018622301253820171, + "loss": 0.015, "step": 292620 }, { - "epoch": 1.48, - "learning_rate": 7.854659933101593e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018621912432183026, + "loss": 0.0162, "step": 292630 }, { - "epoch": 1.48, - "learning_rate": 7.853903163800191e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018621523610545877, + "loss": 0.0146, "step": 292640 }, { - "epoch": 1.48, - "learning_rate": 7.853146394498791e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.0001862113478890873, + "loss": 0.0202, "step": 292650 }, { - "epoch": 1.48, - "learning_rate": 7.852389625197389e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018620745967271585, + "loss": 0.0155, "step": 292660 }, { - "epoch": 1.48, - "learning_rate": 7.851632855895988e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.0001862035714563444, + "loss": 0.0138, "step": 292670 }, { - "epoch": 1.48, - "learning_rate": 7.850876086594588e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001861996832399729, + "loss": 0.015, "step": 292680 }, { - "epoch": 1.48, - "learning_rate": 7.850119317293186e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018619579502360145, + "loss": 0.0131, "step": 292690 }, { - "epoch": 1.48, - "learning_rate": 7.849362547991785e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018619190680723002, + "loss": 0.0149, "step": 292700 }, { - "epoch": 1.48, - "learning_rate": 7.848605778690385e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018618801859085853, + "loss": 0.0152, "step": 292710 }, { - "epoch": 1.48, - "learning_rate": 7.847849009388983e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018618413037448705, + "loss": 0.0147, "step": 292720 }, { - "epoch": 1.48, - "learning_rate": 7.847092240087583e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.0001861802421581156, + "loss": 0.0159, "step": 292730 }, { - "epoch": 1.48, - "learning_rate": 7.846335470786181e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018617635394174416, + "loss": 0.0204, "step": 292740 }, { - "epoch": 1.48, - "learning_rate": 7.84557870148478e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018617246572537267, + "loss": 0.0126, "step": 292750 }, { - "epoch": 1.48, - "learning_rate": 7.84482193218338e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018616857750900122, + "loss": 0.0131, "step": 292760 }, { - "epoch": 1.48, - "learning_rate": 7.844065162881978e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018616468929262973, + "loss": 0.0175, "step": 292770 }, { - "epoch": 1.48, - "learning_rate": 7.843308393580577e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018616080107625827, + "loss": 0.0167, "step": 292780 }, { - "epoch": 1.48, - "learning_rate": 7.842551624279177e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.00018615691285988681, + "loss": 0.0139, "step": 292790 }, { - "epoch": 1.48, - "learning_rate": 7.841794854977775e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018615302464351536, + "loss": 0.0222, "step": 292800 }, { - "epoch": 1.48, - "learning_rate": 7.841038085676375e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.00018614913642714387, + "loss": 0.0144, "step": 292810 }, { - "epoch": 1.48, - "learning_rate": 7.840281316374973e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.0001861452482107724, + "loss": 0.0117, "step": 292820 }, { - "epoch": 1.48, - "learning_rate": 7.839524547073572e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018614135999440095, + "loss": 0.0187, "step": 292830 }, { - "epoch": 1.48, - "learning_rate": 7.838767777772172e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.0001861374717780295, + "loss": 0.0172, "step": 292840 }, { - "epoch": 1.48, - "learning_rate": 7.83801100847077e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.000186133583561658, + "loss": 0.0192, "step": 292850 }, { - "epoch": 1.48, - "learning_rate": 7.83725423916937e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018612969534528655, + "loss": 0.0145, "step": 292860 }, { - "epoch": 1.48, - "learning_rate": 7.836497469867969e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.0001861258071289151, + "loss": 0.0114, "step": 292870 }, { - "epoch": 1.48, - "learning_rate": 7.835740700566567e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018612191891254363, + "loss": 0.0147, "step": 292880 }, { - "epoch": 1.48, - "learning_rate": 7.834983931265166e-05, - "loss": 0.0042, + "epoch": 0.76, + "learning_rate": 0.00018611803069617215, + "loss": 0.0149, "step": 292890 }, { - "epoch": 1.48, - "learning_rate": 7.834227161963765e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.0001861141424798007, + "loss": 0.0127, "step": 292900 }, { - "epoch": 1.48, - "learning_rate": 7.833470392662364e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.00018611025426342926, + "loss": 0.0219, "step": 292910 }, { - "epoch": 1.48, - "learning_rate": 7.832713623360964e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018610636604705777, + "loss": 0.017, "step": 292920 }, { - "epoch": 1.48, - "learning_rate": 7.831956854059562e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018610247783068632, + "loss": 0.0222, "step": 292930 }, { - "epoch": 1.48, - "learning_rate": 7.831200084758161e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018609858961431483, + "loss": 0.0167, "step": 292940 }, { - "epoch": 1.48, - "learning_rate": 7.830443315456761e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.0001860947013979434, + "loss": 0.0134, "step": 292950 }, { - "epoch": 1.48, - "learning_rate": 7.829686546155359e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.0001860908131815719, + "loss": 0.012, "step": 292960 }, { - "epoch": 1.48, - "learning_rate": 7.828929776853958e-05, - "loss": 0.0108, + "epoch": 0.76, + "learning_rate": 0.00018608692496520045, + "loss": 0.0142, "step": 292970 }, { - "epoch": 1.48, - "learning_rate": 7.828173007552558e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018608303674882897, + "loss": 0.0138, "step": 292980 }, { - "epoch": 1.48, - "learning_rate": 7.827416238251156e-05, - "loss": 0.0047, + "epoch": 0.76, + "learning_rate": 0.00018607914853245754, + "loss": 0.013, "step": 292990 }, { - "epoch": 1.48, - "learning_rate": 7.826659468949756e-05, - "loss": 0.0053, + "epoch": 0.76, + "learning_rate": 0.00018607526031608605, + "loss": 0.0135, "step": 293000 }, { - "epoch": 1.48, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.005583611316978931, - "eval_runtime": 116.624, - "eval_samples_per_second": 17.149, - "eval_steps_per_second": 4.287, + "epoch": 0.76, + "eval_cer": 0.8817320786987856, + "eval_loss": 0.009882713668048382, + "eval_runtime": 108.0807, + "eval_samples_per_second": 18.505, + "eval_steps_per_second": 4.626, "step": 293000 }, { - "epoch": 1.48, - "learning_rate": 7.825902699648354e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.0001860713720997146, + "loss": 0.0113, "step": 293010 }, { - "epoch": 1.48, - "learning_rate": 7.825145930346953e-05, - "loss": 0.0113, + "epoch": 0.76, + "learning_rate": 0.0001860674838833431, + "loss": 0.0217, "step": 293020 }, { - "epoch": 1.48, - "learning_rate": 7.824389161045553e-05, - "loss": 0.0055, + "epoch": 0.76, + "learning_rate": 0.00018606359566697165, + "loss": 0.0152, "step": 293030 }, { - "epoch": 1.48, - "learning_rate": 7.823632391744151e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.0001860597074506002, + "loss": 0.0135, "step": 293040 }, { - "epoch": 1.48, - "learning_rate": 7.82287562244275e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018605581923422873, + "loss": 0.0136, "step": 293050 }, { - "epoch": 1.48, - "learning_rate": 7.82211885314135e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018605193101785725, + "loss": 0.0158, "step": 293060 }, { - "epoch": 1.48, - "learning_rate": 7.821362083839948e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.0001860480428014858, + "loss": 0.0142, "step": 293070 }, { - "epoch": 1.48, - "learning_rate": 7.820605314538548e-05, - "loss": 0.0097, + "epoch": 0.76, + "learning_rate": 0.00018604415458511436, + "loss": 0.0123, "step": 293080 }, { - "epoch": 1.48, - "learning_rate": 7.819848545237146e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.00018604026636874287, + "loss": 0.0141, "step": 293090 }, { - "epoch": 1.48, - "learning_rate": 7.819091775935745e-05, - "loss": 0.0094, + "epoch": 0.76, + "learning_rate": 0.00018603637815237141, + "loss": 0.0153, "step": 293100 }, { - "epoch": 1.48, - "learning_rate": 7.818335006634345e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018603248993599993, + "loss": 0.0136, "step": 293110 }, { - "epoch": 1.48, - "learning_rate": 7.817578237332943e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.0001860286017196285, + "loss": 0.018, "step": 293120 }, { - "epoch": 1.48, - "learning_rate": 7.816821468031542e-05, - "loss": 0.0096, + "epoch": 0.76, + "learning_rate": 0.000186024713503257, + "loss": 0.0142, "step": 293130 }, { - "epoch": 1.48, - "learning_rate": 7.816064698730142e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018602082528688555, + "loss": 0.0191, "step": 293140 }, { - "epoch": 1.48, - "learning_rate": 7.81530792942874e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018601693707051407, + "loss": 0.0117, "step": 293150 }, { - "epoch": 1.48, - "learning_rate": 7.81455116012734e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018601304885414264, + "loss": 0.0151, "step": 293160 }, { - "epoch": 1.48, - "learning_rate": 7.813794390825936e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018600916063777115, + "loss": 0.0145, "step": 293170 }, { - "epoch": 1.48, - "learning_rate": 7.813037621524536e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.0001860052724213997, + "loss": 0.0147, "step": 293180 }, { - "epoch": 1.48, - "learning_rate": 7.812280852223134e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001860013842050282, + "loss": 0.014, "step": 293190 }, { - "epoch": 1.48, - "learning_rate": 7.811524082921733e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018599749598865678, + "loss": 0.0148, "step": 293200 }, { - "epoch": 1.48, - "learning_rate": 7.810767313620333e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.0001859936077722853, + "loss": 0.0128, "step": 293210 }, { - "epoch": 1.48, - "learning_rate": 7.810010544318931e-05, - "loss": 0.0053, + "epoch": 0.76, + "learning_rate": 0.00018598971955591383, + "loss": 0.0148, "step": 293220 }, { - "epoch": 1.48, - "learning_rate": 7.80925377501753e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.00018598583133954235, + "loss": 0.0158, "step": 293230 }, { - "epoch": 1.48, - "learning_rate": 7.80849700571613e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018598194312317092, + "loss": 0.0143, "step": 293240 }, { - "epoch": 1.48, - "learning_rate": 7.807740236414728e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018597805490679946, + "loss": 0.0147, "step": 293250 }, { - "epoch": 1.48, - "learning_rate": 7.806983467113328e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018597416669042797, + "loss": 0.0137, "step": 293260 }, { - "epoch": 1.48, - "learning_rate": 7.806226697811926e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.0001859702784740565, + "loss": 0.0127, "step": 293270 }, { - "epoch": 1.48, - "learning_rate": 7.805469928510525e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018596639025768503, + "loss": 0.0163, "step": 293280 }, { - "epoch": 1.48, - "learning_rate": 7.804713159209125e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.0001859625020413136, + "loss": 0.016, "step": 293290 }, { - "epoch": 1.48, - "learning_rate": 7.803956389907723e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.0001859586138249421, + "loss": 0.0145, "step": 293300 }, { - "epoch": 1.48, - "learning_rate": 7.803199620606322e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018595472560857065, + "loss": 0.0115, "step": 293310 }, { - "epoch": 1.48, - "learning_rate": 7.802442851304922e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018595083739219917, + "loss": 0.0158, "step": 293320 }, { - "epoch": 1.48, - "learning_rate": 7.80168608200352e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018594694917582774, + "loss": 0.0119, "step": 293330 }, { - "epoch": 1.48, - "learning_rate": 7.80092931270212e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018594306095945625, + "loss": 0.0139, "step": 293340 }, { - "epoch": 1.48, - "learning_rate": 7.800172543400718e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.0001859391727430848, + "loss": 0.0186, "step": 293350 }, { - "epoch": 1.48, - "learning_rate": 7.799415774099317e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001859352845267133, + "loss": 0.0182, "step": 293360 }, { - "epoch": 1.48, - "learning_rate": 7.798659004797917e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018593139631034188, + "loss": 0.0164, "step": 293370 }, { - "epoch": 1.48, - "learning_rate": 7.797902235496515e-05, - "loss": 0.0057, + "epoch": 0.76, + "learning_rate": 0.0001859275080939704, + "loss": 0.0156, "step": 293380 }, { - "epoch": 1.48, - "learning_rate": 7.797145466195114e-05, - "loss": 0.0112, + "epoch": 0.76, + "learning_rate": 0.00018592361987759893, + "loss": 0.0136, "step": 293390 }, { - "epoch": 1.48, - "learning_rate": 7.796388696893714e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018591973166122745, + "loss": 0.0126, "step": 293400 }, { - "epoch": 1.48, - "learning_rate": 7.795631927592312e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018591584344485602, + "loss": 0.0127, "step": 293410 }, { - "epoch": 1.48, - "learning_rate": 7.794875158290912e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018591195522848453, + "loss": 0.0174, "step": 293420 }, { - "epoch": 1.48, - "learning_rate": 7.794118388989511e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018590806701211307, + "loss": 0.0131, "step": 293430 }, { - "epoch": 1.48, - "learning_rate": 7.793361619688109e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.0001859041787957416, + "loss": 0.0128, "step": 293440 }, { - "epoch": 1.48, - "learning_rate": 7.792604850386709e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018590029057937016, + "loss": 0.0146, "step": 293450 }, { - "epoch": 1.48, - "learning_rate": 7.791848081085307e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.0001858964023629987, + "loss": 0.0144, "step": 293460 }, { - "epoch": 1.48, - "learning_rate": 7.791091311783906e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.0001858925141466272, + "loss": 0.0158, "step": 293470 }, { - "epoch": 1.48, - "learning_rate": 7.790334542482506e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018588862593025575, + "loss": 0.0131, "step": 293480 }, { - "epoch": 1.48, - "learning_rate": 7.789577773181104e-05, - "loss": 0.0092, + "epoch": 0.76, + "learning_rate": 0.0001858847377138843, + "loss": 0.0192, "step": 293490 }, { - "epoch": 1.48, - "learning_rate": 7.788821003879703e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018588084949751284, + "loss": 0.0169, "step": 293500 }, { - "epoch": 1.48, - "learning_rate": 7.788064234578303e-05, - "loss": 0.0095, + "epoch": 0.76, + "learning_rate": 0.00018587696128114135, + "loss": 0.0115, "step": 293510 }, { - "epoch": 1.48, - "learning_rate": 7.787307465276901e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.0001858730730647699, + "loss": 0.0127, "step": 293520 }, { - "epoch": 1.48, - "learning_rate": 7.7865506959755e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.0001858691848483984, + "loss": 0.0173, "step": 293530 }, { - "epoch": 1.48, - "learning_rate": 7.785793926674099e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018586529663202698, + "loss": 0.0145, "step": 293540 }, { - "epoch": 1.48, - "learning_rate": 7.785037157372698e-05, - "loss": 0.0111, + "epoch": 0.76, + "learning_rate": 0.0001858614084156555, + "loss": 0.0144, "step": 293550 }, { - "epoch": 1.48, - "learning_rate": 7.784280388071298e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018585752019928403, + "loss": 0.0151, "step": 293560 }, { - "epoch": 1.48, - "learning_rate": 7.783523618769896e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018585363198291255, + "loss": 0.0196, "step": 293570 }, { - "epoch": 1.48, - "learning_rate": 7.782766849468495e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018584974376654112, + "loss": 0.0142, "step": 293580 }, { - "epoch": 1.48, - "learning_rate": 7.782010080167095e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018584585555016963, + "loss": 0.0133, "step": 293590 }, { - "epoch": 1.48, - "learning_rate": 7.781253310865693e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018584196733379817, + "loss": 0.0143, "step": 293600 }, { - "epoch": 1.48, - "learning_rate": 7.780496541564293e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018583807911742669, + "loss": 0.0134, "step": 293610 }, { - "epoch": 1.48, - "learning_rate": 7.77973977226289e-05, - "loss": 0.0093, + "epoch": 0.76, + "learning_rate": 0.00018583419090105525, + "loss": 0.0143, "step": 293620 }, { - "epoch": 1.48, - "learning_rate": 7.77898300296149e-05, - "loss": 0.0089, + "epoch": 0.76, + "learning_rate": 0.0001858303026846838, + "loss": 0.0134, "step": 293630 }, { - "epoch": 1.48, - "learning_rate": 7.77822623366009e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001858264144683123, + "loss": 0.0174, "step": 293640 }, { - "epoch": 1.48, - "learning_rate": 7.777469464358688e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018582252625194085, + "loss": 0.0144, "step": 293650 }, { - "epoch": 1.48, - "learning_rate": 7.776712695057287e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.0001858186380355694, + "loss": 0.0168, "step": 293660 }, { - "epoch": 1.48, - "learning_rate": 7.775955925755887e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018581474981919794, + "loss": 0.011, "step": 293670 }, { - "epoch": 1.48, - "learning_rate": 7.775199156454485e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018581086160282645, + "loss": 0.0136, "step": 293680 }, { - "epoch": 1.48, - "learning_rate": 7.774442387153084e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.000185806973386455, + "loss": 0.0153, "step": 293690 }, { - "epoch": 1.48, - "learning_rate": 7.773685617851683e-05, - "loss": 0.0106, + "epoch": 0.76, + "learning_rate": 0.00018580308517008353, + "loss": 0.0166, "step": 293700 }, { - "epoch": 1.48, - "learning_rate": 7.772928848550282e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018579919695371208, + "loss": 0.0121, "step": 293710 }, { - "epoch": 1.48, - "learning_rate": 7.772172079248882e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.0001857953087373406, + "loss": 0.018, "step": 293720 }, { - "epoch": 1.48, - "learning_rate": 7.77141530994748e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018579142052096913, + "loss": 0.0138, "step": 293730 }, { - "epoch": 1.48, - "learning_rate": 7.770658540646079e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018578753230459767, + "loss": 0.0188, "step": 293740 }, { - "epoch": 1.48, - "learning_rate": 7.769901771344679e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018578364408822621, + "loss": 0.0167, "step": 293750 }, { - "epoch": 1.48, - "learning_rate": 7.769145002043277e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018577975587185473, + "loss": 0.0106, "step": 293760 }, { - "epoch": 1.48, - "learning_rate": 7.768388232741876e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018577586765548327, + "loss": 0.0151, "step": 293770 }, { - "epoch": 1.48, - "learning_rate": 7.767631463440475e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018577197943911179, + "loss": 0.0173, "step": 293780 }, { - "epoch": 1.48, - "learning_rate": 7.766874694139074e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018576809122274035, + "loss": 0.0142, "step": 293790 }, { - "epoch": 1.48, - "learning_rate": 7.766117924837671e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.0001857642030063689, + "loss": 0.0187, "step": 293800 }, { - "epoch": 1.48, - "learning_rate": 7.76536115553627e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.0001857603147899974, + "loss": 0.0155, "step": 293810 }, { - "epoch": 1.48, - "learning_rate": 7.76460438623487e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018575642657362592, + "loss": 0.0148, "step": 293820 }, { - "epoch": 1.48, - "learning_rate": 7.763847616933468e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.0001857525383572545, + "loss": 0.0183, "step": 293830 }, { - "epoch": 1.48, - "learning_rate": 7.763090847632067e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018574865014088304, + "loss": 0.0163, "step": 293840 }, { - "epoch": 1.48, - "learning_rate": 7.762334078330667e-05, - "loss": 0.01, + "epoch": 0.76, + "learning_rate": 0.00018574476192451155, + "loss": 0.017, "step": 293850 }, { - "epoch": 1.48, - "learning_rate": 7.761577309029265e-05, - "loss": 0.0086, + "epoch": 0.76, + "learning_rate": 0.0001857408737081401, + "loss": 0.0161, "step": 293860 }, { - "epoch": 1.48, - "learning_rate": 7.760820539727865e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018573698549176863, + "loss": 0.0103, "step": 293870 }, { - "epoch": 1.48, - "learning_rate": 7.760063770426464e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018573309727539717, + "loss": 0.0132, "step": 293880 }, { - "epoch": 1.48, - "learning_rate": 7.759307001125062e-05, - "loss": 0.0053, + "epoch": 0.76, + "learning_rate": 0.0001857292090590257, + "loss": 0.0148, "step": 293890 }, { - "epoch": 1.48, - "learning_rate": 7.758550231823662e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018572532084265423, + "loss": 0.0157, "step": 293900 }, { - "epoch": 1.48, - "learning_rate": 7.75779346252226e-05, - "loss": 0.0094, + "epoch": 0.76, + "learning_rate": 0.00018572143262628277, + "loss": 0.0175, "step": 293910 }, { - "epoch": 1.48, - "learning_rate": 7.75703669322086e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018571754440991131, + "loss": 0.0118, "step": 293920 }, { - "epoch": 1.48, - "learning_rate": 7.756279923919459e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018571365619353983, + "loss": 0.0133, "step": 293930 }, { - "epoch": 1.48, - "learning_rate": 7.755523154618057e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018570976797716837, + "loss": 0.0165, "step": 293940 }, { - "epoch": 1.48, - "learning_rate": 7.754766385316657e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018570587976079694, + "loss": 0.0136, "step": 293950 }, { - "epoch": 1.48, - "learning_rate": 7.754009616015256e-05, - "loss": 0.0053, + "epoch": 0.76, + "learning_rate": 0.00018570199154442545, + "loss": 0.0171, "step": 293960 }, { - "epoch": 1.48, - "learning_rate": 7.753252846713854e-05, - "loss": 0.0091, + "epoch": 0.76, + "learning_rate": 0.000185698103328054, + "loss": 0.0164, "step": 293970 }, { - "epoch": 1.48, - "learning_rate": 7.752496077412454e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.0001856942151116825, + "loss": 0.017, "step": 293980 }, { - "epoch": 1.48, - "learning_rate": 7.751739308111052e-05, - "loss": 0.009, + "epoch": 0.76, + "learning_rate": 0.00018569032689531108, + "loss": 0.0141, "step": 293990 }, { - "epoch": 1.48, - "learning_rate": 7.750982538809651e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.0001856864386789396, + "loss": 0.0123, "step": 294000 }, { - "epoch": 1.48, - "eval_cer": 0.9144294992658953, - "eval_loss": 0.005396208260208368, - "eval_runtime": 116.6359, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.76, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.010044018737971783, + "eval_runtime": 108.1094, + "eval_samples_per_second": 18.5, + "eval_steps_per_second": 4.625, "step": 294000 }, { - "epoch": 1.48, - "learning_rate": 7.750225769508251e-05, - "loss": 0.0058, + "epoch": 0.76, + "learning_rate": 0.00018568255046256813, + "loss": 0.0099, "step": 294010 }, { - "epoch": 1.48, - "learning_rate": 7.749469000206849e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018567866224619665, + "loss": 0.0134, "step": 294020 }, { - "epoch": 1.48, - "learning_rate": 7.748712230905448e-05, - "loss": 0.0066, + "epoch": 0.76, + "learning_rate": 0.0001856747740298252, + "loss": 0.0173, "step": 294030 }, { - "epoch": 1.48, - "learning_rate": 7.747955461604048e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018567088581345373, + "loss": 0.0127, "step": 294040 }, { - "epoch": 1.48, - "learning_rate": 7.747198692302646e-05, - "loss": 0.0048, + "epoch": 0.76, + "learning_rate": 0.00018566699759708227, + "loss": 0.0113, "step": 294050 }, { - "epoch": 1.48, - "learning_rate": 7.746441923001246e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001856631093807108, + "loss": 0.0164, "step": 294060 }, { - "epoch": 1.48, - "learning_rate": 7.745685153699844e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018565922116433933, + "loss": 0.0167, "step": 294070 }, { - "epoch": 1.48, - "learning_rate": 7.744928384398443e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018565533294796787, + "loss": 0.014, "step": 294080 }, { - "epoch": 1.48, - "learning_rate": 7.744171615097043e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.0001856514447315964, + "loss": 0.012, "step": 294090 }, { - "epoch": 1.48, - "learning_rate": 7.743414845795641e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018564755651522493, + "loss": 0.0161, "step": 294100 }, { - "epoch": 1.48, - "learning_rate": 7.74265807649424e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018564366829885347, + "loss": 0.0159, "step": 294110 }, { - "epoch": 1.48, - "learning_rate": 7.74190130719284e-05, - "loss": 0.0055, + "epoch": 0.76, + "learning_rate": 0.00018563978008248204, + "loss": 0.0147, "step": 294120 }, { - "epoch": 1.48, - "learning_rate": 7.741144537891438e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.00018563589186611055, + "loss": 0.0134, "step": 294130 }, { - "epoch": 1.48, - "learning_rate": 7.740387768590038e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018563200364973907, + "loss": 0.0125, "step": 294140 }, { - "epoch": 1.48, - "learning_rate": 7.739630999288636e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.0001856281154333676, + "loss": 0.0143, "step": 294150 }, { - "epoch": 1.48, - "learning_rate": 7.738874229987235e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018562422721699618, + "loss": 0.0137, "step": 294160 }, { - "epoch": 1.48, - "learning_rate": 7.738117460685835e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.0001856203390006247, + "loss": 0.0151, "step": 294170 }, { - "epoch": 1.48, - "learning_rate": 7.737360691384433e-05, - "loss": 0.0088, + "epoch": 0.76, + "learning_rate": 0.00018561645078425323, + "loss": 0.0132, "step": 294180 }, { - "epoch": 1.48, - "learning_rate": 7.736603922083032e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018561256256788175, + "loss": 0.0126, "step": 294190 }, { - "epoch": 1.48, - "learning_rate": 7.735847152781632e-05, - "loss": 0.0126, + "epoch": 0.76, + "learning_rate": 0.00018560867435151032, + "loss": 0.0154, "step": 294200 }, { - "epoch": 1.48, - "learning_rate": 7.73509038348023e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018560478613513883, + "loss": 0.0146, "step": 294210 }, { - "epoch": 1.48, - "learning_rate": 7.73433361417883e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018560089791876737, + "loss": 0.015, "step": 294220 }, { - "epoch": 1.48, - "learning_rate": 7.733576844877428e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001855970097023959, + "loss": 0.0184, "step": 294230 }, { - "epoch": 1.48, - "learning_rate": 7.732820075576027e-05, - "loss": 0.0084, + "epoch": 0.76, + "learning_rate": 0.00018559312148602446, + "loss": 0.0123, "step": 294240 }, { - "epoch": 1.48, - "learning_rate": 7.732063306274627e-05, - "loss": 0.0106, + "epoch": 0.76, + "learning_rate": 0.00018558923326965297, + "loss": 0.013, "step": 294250 }, { - "epoch": 1.48, - "learning_rate": 7.731306536973225e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.0001855853450532815, + "loss": 0.0138, "step": 294260 }, { - "epoch": 1.48, - "learning_rate": 7.730549767671824e-05, - "loss": 0.0064, + "epoch": 0.76, + "learning_rate": 0.00018558145683691003, + "loss": 0.0135, "step": 294270 }, { - "epoch": 1.48, - "learning_rate": 7.729792998370424e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018557756862053857, + "loss": 0.0116, "step": 294280 }, { - "epoch": 1.48, - "learning_rate": 7.729036229069022e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018557368040416714, + "loss": 0.0118, "step": 294290 }, { - "epoch": 1.48, - "learning_rate": 7.728279459767621e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018556979218779565, + "loss": 0.0149, "step": 294300 }, { - "epoch": 1.48, - "learning_rate": 7.72752269046622e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.00018556590397142417, + "loss": 0.015, "step": 294310 }, { - "epoch": 1.48, - "learning_rate": 7.726765921164819e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.0001855620157550527, + "loss": 0.0163, "step": 294320 }, { - "epoch": 1.48, - "learning_rate": 7.726009151863419e-05, - "loss": 0.0085, + "epoch": 0.76, + "learning_rate": 0.00018555812753868128, + "loss": 0.0172, "step": 294330 }, { - "epoch": 1.48, - "learning_rate": 7.725252382562017e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.0001855542393223098, + "loss": 0.0166, "step": 294340 }, { - "epoch": 1.49, - "learning_rate": 7.724495613260616e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018555035110593833, + "loss": 0.0144, "step": 294350 }, { - "epoch": 1.49, - "learning_rate": 7.723738843959216e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018554646288956685, + "loss": 0.011, "step": 294360 }, { - "epoch": 1.49, - "learning_rate": 7.722982074657814e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018554257467319542, + "loss": 0.0117, "step": 294370 }, { - "epoch": 1.49, - "learning_rate": 7.722225305356413e-05, - "loss": 0.0072, + "epoch": 0.76, + "learning_rate": 0.00018553868645682393, + "loss": 0.0127, "step": 294380 }, { - "epoch": 1.49, - "learning_rate": 7.721468536055013e-05, - "loss": 0.0113, + "epoch": 0.76, + "learning_rate": 0.00018553479824045247, + "loss": 0.0132, "step": 294390 }, { - "epoch": 1.49, - "learning_rate": 7.720711766753611e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.000185530910024081, + "loss": 0.0159, "step": 294400 }, { - "epoch": 1.49, - "learning_rate": 7.71995499745221e-05, - "loss": 0.0138, + "epoch": 0.76, + "learning_rate": 0.00018552702180770956, + "loss": 0.013, "step": 294410 }, { - "epoch": 1.49, - "learning_rate": 7.719198228150809e-05, - "loss": 0.0105, + "epoch": 0.76, + "learning_rate": 0.00018552313359133807, + "loss": 0.0125, "step": 294420 }, { - "epoch": 1.49, - "learning_rate": 7.718441458849407e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001855192453749666, + "loss": 0.0149, "step": 294430 }, { - "epoch": 1.49, - "learning_rate": 7.717684689548005e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018551535715859513, + "loss": 0.015, "step": 294440 }, { - "epoch": 1.49, - "learning_rate": 7.716927920246604e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.0001855114689422237, + "loss": 0.0165, "step": 294450 }, { - "epoch": 1.49, - "learning_rate": 7.716171150945204e-05, - "loss": 0.0069, + "epoch": 0.76, + "learning_rate": 0.0001855075807258522, + "loss": 0.019, "step": 294460 }, { - "epoch": 1.49, - "learning_rate": 7.715414381643802e-05, - "loss": 0.0057, + "epoch": 0.76, + "learning_rate": 0.00018550369250948075, + "loss": 0.0111, "step": 294470 }, { - "epoch": 1.49, - "learning_rate": 7.714657612342402e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018549980429310927, + "loss": 0.016, "step": 294480 }, { - "epoch": 1.49, - "learning_rate": 7.713900843041001e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018549591607673784, + "loss": 0.0166, "step": 294490 }, { - "epoch": 1.49, - "learning_rate": 7.713144073739599e-05, - "loss": 0.0054, + "epoch": 0.76, + "learning_rate": 0.00018549202786036638, + "loss": 0.0166, "step": 294500 }, { - "epoch": 1.49, - "learning_rate": 7.712387304438199e-05, - "loss": 0.005, + "epoch": 0.76, + "learning_rate": 0.0001854881396439949, + "loss": 0.0144, "step": 294510 }, { - "epoch": 1.49, - "learning_rate": 7.711630535136797e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018548425142762343, + "loss": 0.0163, "step": 294520 }, { - "epoch": 1.49, - "learning_rate": 7.710873765835396e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018548036321125195, + "loss": 0.0159, "step": 294530 }, { - "epoch": 1.49, - "learning_rate": 7.710116996533996e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018547647499488052, + "loss": 0.0129, "step": 294540 }, { - "epoch": 1.49, - "learning_rate": 7.709360227232594e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.00018547258677850903, + "loss": 0.0146, "step": 294550 }, { - "epoch": 1.49, - "learning_rate": 7.708603457931193e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018546869856213757, + "loss": 0.0123, "step": 294560 }, { - "epoch": 1.49, - "learning_rate": 7.707846688629793e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001854648103457661, + "loss": 0.0142, "step": 294570 }, { - "epoch": 1.49, - "learning_rate": 7.707089919328391e-05, - "loss": 0.0074, + "epoch": 0.76, + "learning_rate": 0.00018546092212939466, + "loss": 0.0145, "step": 294580 }, { - "epoch": 1.49, - "learning_rate": 7.70633315002699e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018545703391302317, + "loss": 0.0145, "step": 294590 }, { - "epoch": 1.49, - "learning_rate": 7.705576380725589e-05, - "loss": 0.0102, + "epoch": 0.76, + "learning_rate": 0.0001854531456966517, + "loss": 0.0121, "step": 294600 }, { - "epoch": 1.49, - "learning_rate": 7.704819611424188e-05, - "loss": 0.0057, + "epoch": 0.76, + "learning_rate": 0.00018544925748028023, + "loss": 0.0134, "step": 294610 }, { - "epoch": 1.49, - "learning_rate": 7.704062842122788e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001854453692639088, + "loss": 0.012, "step": 294620 }, { - "epoch": 1.49, - "learning_rate": 7.703306072821386e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.0001854414810475373, + "loss": 0.0116, "step": 294630 }, { - "epoch": 1.49, - "learning_rate": 7.702549303519985e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018543759283116585, + "loss": 0.0161, "step": 294640 }, { - "epoch": 1.49, - "learning_rate": 7.701792534218585e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018543370461479437, + "loss": 0.0132, "step": 294650 }, { - "epoch": 1.49, - "learning_rate": 7.701035764917183e-05, - "loss": 0.01, + "epoch": 0.76, + "learning_rate": 0.00018542981639842293, + "loss": 0.0149, "step": 294660 }, { - "epoch": 1.49, - "learning_rate": 7.700278995615783e-05, - "loss": 0.008, + "epoch": 0.76, + "learning_rate": 0.00018542592818205148, + "loss": 0.0125, "step": 294670 }, { - "epoch": 1.49, - "learning_rate": 7.699522226314381e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.00018542203996568, + "loss": 0.0114, "step": 294680 }, { - "epoch": 1.49, - "learning_rate": 7.69876545701298e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018541815174930853, + "loss": 0.0163, "step": 294690 }, { - "epoch": 1.49, - "learning_rate": 7.69800868771158e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.00018541426353293707, + "loss": 0.016, "step": 294700 }, { - "epoch": 1.49, - "learning_rate": 7.697251918410178e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018541037531656562, + "loss": 0.0152, "step": 294710 }, { - "epoch": 1.49, - "learning_rate": 7.696495149108777e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.00018540648710019413, + "loss": 0.0131, "step": 294720 }, { - "epoch": 1.49, - "learning_rate": 7.695738379807377e-05, - "loss": 0.0099, + "epoch": 0.76, + "learning_rate": 0.00018540259888382267, + "loss": 0.017, "step": 294730 }, { - "epoch": 1.49, - "learning_rate": 7.694981610505975e-05, - "loss": 0.0068, + "epoch": 0.76, + "learning_rate": 0.0001853987106674512, + "loss": 0.0151, "step": 294740 }, { - "epoch": 1.49, - "learning_rate": 7.694224841204574e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.00018539482245107976, + "loss": 0.0133, "step": 294750 }, { - "epoch": 1.49, - "learning_rate": 7.693468071903173e-05, - "loss": 0.0087, + "epoch": 0.76, + "learning_rate": 0.00018539093423470827, + "loss": 0.0133, "step": 294760 }, { - "epoch": 1.49, - "learning_rate": 7.692711302601772e-05, - "loss": 0.01, + "epoch": 0.76, + "learning_rate": 0.0001853870460183368, + "loss": 0.0136, "step": 294770 }, { - "epoch": 1.49, - "learning_rate": 7.691954533300372e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018538315780196533, + "loss": 0.0129, "step": 294780 }, { - "epoch": 1.49, - "learning_rate": 7.69119776399897e-05, - "loss": 0.0075, + "epoch": 0.76, + "learning_rate": 0.0001853792695855939, + "loss": 0.0129, "step": 294790 }, { - "epoch": 1.49, - "learning_rate": 7.690440994697569e-05, - "loss": 0.0076, + "epoch": 0.76, + "learning_rate": 0.0001853753813692224, + "loss": 0.0195, "step": 294800 }, { - "epoch": 1.49, - "learning_rate": 7.689684225396169e-05, - "loss": 0.006, + "epoch": 0.76, + "learning_rate": 0.00018537149315285095, + "loss": 0.0135, "step": 294810 }, { - "epoch": 1.49, - "learning_rate": 7.688927456094767e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018536760493647947, + "loss": 0.0152, "step": 294820 }, { - "epoch": 1.49, - "learning_rate": 7.688170686793366e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018536371672010803, + "loss": 0.0141, "step": 294830 }, { - "epoch": 1.49, - "learning_rate": 7.687413917491965e-05, - "loss": 0.0082, + "epoch": 0.76, + "learning_rate": 0.00018535982850373658, + "loss": 0.0137, "step": 294840 }, { - "epoch": 1.49, - "learning_rate": 7.686657148190564e-05, - "loss": 0.0059, + "epoch": 0.76, + "learning_rate": 0.0001853559402873651, + "loss": 0.0138, "step": 294850 }, { - "epoch": 1.49, - "learning_rate": 7.685900378889164e-05, - "loss": 0.0101, + "epoch": 0.76, + "learning_rate": 0.0001853520520709936, + "loss": 0.0137, "step": 294860 }, { - "epoch": 1.49, - "learning_rate": 7.685143609587762e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018534816385462217, + "loss": 0.0128, "step": 294870 }, { - "epoch": 1.49, - "learning_rate": 7.684386840286361e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.00018534427563825072, + "loss": 0.0133, "step": 294880 }, { - "epoch": 1.49, - "learning_rate": 7.683630070984961e-05, - "loss": 0.0071, + "epoch": 0.76, + "learning_rate": 0.00018534038742187923, + "loss": 0.0154, "step": 294890 }, { - "epoch": 1.49, - "learning_rate": 7.682873301683559e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018533649920550777, + "loss": 0.0142, "step": 294900 }, { - "epoch": 1.49, - "learning_rate": 7.682116532382158e-05, - "loss": 0.0056, + "epoch": 0.76, + "learning_rate": 0.0001853326109891363, + "loss": 0.0101, "step": 294910 }, { - "epoch": 1.49, - "learning_rate": 7.681359763080758e-05, - "loss": 0.0062, + "epoch": 0.76, + "learning_rate": 0.00018532872277276485, + "loss": 0.016, "step": 294920 }, { - "epoch": 1.49, - "learning_rate": 7.680602993779356e-05, - "loss": 0.0079, + "epoch": 0.76, + "learning_rate": 0.00018532483455639337, + "loss": 0.0136, "step": 294930 }, { - "epoch": 1.49, - "learning_rate": 7.679846224477955e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.0001853209463400219, + "loss": 0.0211, "step": 294940 }, { - "epoch": 1.49, - "learning_rate": 7.679089455176554e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018531705812365045, + "loss": 0.014, "step": 294950 }, { - "epoch": 1.49, - "learning_rate": 7.678332685875153e-05, - "loss": 0.0073, + "epoch": 0.76, + "learning_rate": 0.000185313169907279, + "loss": 0.0136, "step": 294960 }, { - "epoch": 1.49, - "learning_rate": 7.677575916573753e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001853092816909075, + "loss": 0.0171, "step": 294970 }, { - "epoch": 1.49, - "learning_rate": 7.676819147272351e-05, - "loss": 0.0083, + "epoch": 0.76, + "learning_rate": 0.00018530539347453605, + "loss": 0.0174, "step": 294980 }, { - "epoch": 1.49, - "learning_rate": 7.67606237797095e-05, - "loss": 0.0077, + "epoch": 0.76, + "learning_rate": 0.00018530150525816462, + "loss": 0.0119, "step": 294990 }, { - "epoch": 1.49, - "learning_rate": 7.67530560866955e-05, - "loss": 0.0065, + "epoch": 0.76, + "learning_rate": 0.00018529761704179313, + "loss": 0.0135, "step": 295000 }, { - "epoch": 1.49, - "eval_cer": 0.9144304696620207, - "eval_loss": 0.005469324998557568, - "eval_runtime": 116.6115, - "eval_samples_per_second": 17.151, - "eval_steps_per_second": 4.288, + "epoch": 0.76, + "eval_cer": 0.881688689953826, + "eval_loss": 0.00990963727235794, + "eval_runtime": 107.8953, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, "step": 295000 }, { - "epoch": 1.49, - "learning_rate": 7.674548839368148e-05, - "loss": 0.0067, + "epoch": 0.76, + "learning_rate": 0.00018529372882542165, + "loss": 0.0182, "step": 295010 }, { - "epoch": 1.49, - "learning_rate": 7.673792070066747e-05, - "loss": 0.0055, + "epoch": 0.76, + "learning_rate": 0.0001852898406090502, + "loss": 0.0148, "step": 295020 }, { - "epoch": 1.49, - "learning_rate": 7.673035300765346e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001852859523926787, + "loss": 0.0116, "step": 295030 }, { - "epoch": 1.49, - "learning_rate": 7.672278531463945e-05, - "loss": 0.01, + "epoch": 0.76, + "learning_rate": 0.00018528206417630727, + "loss": 0.0166, "step": 295040 }, { - "epoch": 1.49, - "learning_rate": 7.671521762162545e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018527817595993581, + "loss": 0.0164, "step": 295050 }, { - "epoch": 1.49, - "learning_rate": 7.670764992861141e-05, - "loss": 0.0081, + "epoch": 0.76, + "learning_rate": 0.00018527428774356433, + "loss": 0.0121, "step": 295060 }, { - "epoch": 1.49, - "learning_rate": 7.670008223559741e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.00018527039952719287, + "loss": 0.0115, "step": 295070 }, { - "epoch": 1.49, - "learning_rate": 7.669251454258339e-05, - "loss": 0.007, + "epoch": 0.76, + "learning_rate": 0.0001852665113108214, + "loss": 0.0162, "step": 295080 }, { - "epoch": 1.49, - "learning_rate": 7.668494684956938e-05, - "loss": 0.0096, + "epoch": 0.76, + "learning_rate": 0.00018526262309444995, + "loss": 0.0168, "step": 295090 }, { - "epoch": 1.49, - "learning_rate": 7.667737915655538e-05, - "loss": 0.0078, + "epoch": 0.76, + "learning_rate": 0.00018525873487807847, + "loss": 0.015, "step": 295100 }, { - "epoch": 1.49, - "learning_rate": 7.666981146354136e-05, - "loss": 0.0063, + "epoch": 0.76, + "learning_rate": 0.000185254846661707, + "loss": 0.014, "step": 295110 }, { - "epoch": 1.49, - "learning_rate": 7.666224377052736e-05, - "loss": 0.0061, + "epoch": 0.76, + "learning_rate": 0.00018525095844533555, + "loss": 0.0162, "step": 295120 }, { - "epoch": 1.49, - "learning_rate": 7.665467607751334e-05, - "loss": 0.0099, + "epoch": 0.77, + "learning_rate": 0.0001852470702289641, + "loss": 0.0123, "step": 295130 }, { - "epoch": 1.49, - "learning_rate": 7.664710838449933e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001852431820125926, + "loss": 0.019, "step": 295140 }, { - "epoch": 1.49, - "learning_rate": 7.663954069148533e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018523929379622115, + "loss": 0.0133, "step": 295150 }, { - "epoch": 1.49, - "learning_rate": 7.663197299847131e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018523540557984972, + "loss": 0.015, "step": 295160 }, { - "epoch": 1.49, - "learning_rate": 7.66244053054573e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018523151736347823, + "loss": 0.0191, "step": 295170 }, { - "epoch": 1.49, - "learning_rate": 7.66168376124433e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018522762914710675, + "loss": 0.0169, "step": 295180 }, { - "epoch": 1.49, - "learning_rate": 7.660926991942928e-05, - "loss": 0.0104, + "epoch": 0.77, + "learning_rate": 0.0001852237409307353, + "loss": 0.0154, "step": 295190 }, { - "epoch": 1.49, - "learning_rate": 7.660170222641528e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018521985271436386, + "loss": 0.0157, "step": 295200 }, { - "epoch": 1.49, - "learning_rate": 7.659413453340126e-05, - "loss": 0.0116, + "epoch": 0.77, + "learning_rate": 0.00018521596449799237, + "loss": 0.0157, "step": 295210 }, { - "epoch": 1.49, - "learning_rate": 7.658656684038725e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018521207628162091, + "loss": 0.0138, "step": 295220 }, { - "epoch": 1.49, - "learning_rate": 7.657899914737325e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018520818806524943, + "loss": 0.0132, "step": 295230 }, { - "epoch": 1.49, - "learning_rate": 7.657143145435923e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.000185204299848878, + "loss": 0.014, "step": 295240 }, { - "epoch": 1.49, - "learning_rate": 7.656386376134522e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001852004116325065, + "loss": 0.0108, "step": 295250 }, { - "epoch": 1.49, - "learning_rate": 7.655629606833122e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018519652341613505, + "loss": 0.0173, "step": 295260 }, { - "epoch": 1.49, - "learning_rate": 7.65487283753172e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.00018519263519976357, + "loss": 0.0174, "step": 295270 }, { - "epoch": 1.49, - "learning_rate": 7.65411606823032e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.0001851887469833921, + "loss": 0.0128, "step": 295280 }, { - "epoch": 1.49, - "learning_rate": 7.653359298928918e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018518485876702065, + "loss": 0.015, "step": 295290 }, { - "epoch": 1.49, - "learning_rate": 7.652602529627517e-05, - "loss": 0.0094, + "epoch": 0.77, + "learning_rate": 0.0001851809705506492, + "loss": 0.0117, "step": 295300 }, { - "epoch": 1.49, - "learning_rate": 7.651845760326117e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001851770823342777, + "loss": 0.0134, "step": 295310 }, { - "epoch": 1.49, - "learning_rate": 7.651088991024715e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018517319411790625, + "loss": 0.0125, "step": 295320 }, { - "epoch": 1.49, - "learning_rate": 7.650332221723314e-05, - "loss": 0.0115, + "epoch": 0.77, + "learning_rate": 0.0001851693059015348, + "loss": 0.0132, "step": 295330 }, { - "epoch": 1.49, - "learning_rate": 7.649575452421914e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018516541768516333, + "loss": 0.0134, "step": 295340 }, { - "epoch": 1.49, - "learning_rate": 7.648818683120512e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018516152946879185, + "loss": 0.0143, "step": 295350 }, { - "epoch": 1.49, - "learning_rate": 7.648061913819111e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001851576412524204, + "loss": 0.0209, "step": 295360 }, { - "epoch": 1.49, - "learning_rate": 7.647305144517711e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018515375303604896, + "loss": 0.0184, "step": 295370 }, { - "epoch": 1.49, - "learning_rate": 7.646548375216309e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018514986481967747, + "loss": 0.0122, "step": 295380 }, { - "epoch": 1.49, - "learning_rate": 7.645791605914909e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.000185145976603306, + "loss": 0.0123, "step": 295390 }, { - "epoch": 1.49, - "learning_rate": 7.645034836613507e-05, - "loss": 0.004, + "epoch": 0.77, + "learning_rate": 0.00018514208838693453, + "loss": 0.0153, "step": 295400 }, { - "epoch": 1.49, - "learning_rate": 7.644278067312106e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.0001851382001705631, + "loss": 0.0165, "step": 295410 }, { - "epoch": 1.49, - "learning_rate": 7.643521298010706e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.0001851343119541916, + "loss": 0.0181, "step": 295420 }, { - "epoch": 1.49, - "learning_rate": 7.642764528709304e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018513042373782015, + "loss": 0.015, "step": 295430 }, { - "epoch": 1.49, - "learning_rate": 7.642007759407903e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018512653552144867, + "loss": 0.013, "step": 295440 }, { - "epoch": 1.49, - "learning_rate": 7.641250990106503e-05, - "loss": 0.0112, + "epoch": 0.77, + "learning_rate": 0.00018512264730507724, + "loss": 0.0154, "step": 295450 }, { - "epoch": 1.49, - "learning_rate": 7.640494220805101e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018511875908870575, + "loss": 0.0101, "step": 295460 }, { - "epoch": 1.49, - "learning_rate": 7.6397374515037e-05, - "loss": 0.0088, + "epoch": 0.77, + "learning_rate": 0.0001851148708723343, + "loss": 0.0161, "step": 295470 }, { - "epoch": 1.49, - "learning_rate": 7.638980682202299e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.0001851109826559628, + "loss": 0.0175, "step": 295480 }, { - "epoch": 1.49, - "learning_rate": 7.638223912900898e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018510709443959138, + "loss": 0.0193, "step": 295490 }, { - "epoch": 1.49, - "learning_rate": 7.637467143599498e-05, - "loss": 0.0092, + "epoch": 0.77, + "learning_rate": 0.0001851032062232199, + "loss": 0.0131, "step": 295500 }, { - "epoch": 1.49, - "learning_rate": 7.636710374298096e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.00018509931800684843, + "loss": 0.0164, "step": 295510 }, { - "epoch": 1.49, - "learning_rate": 7.635953604996695e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.00018509542979047695, + "loss": 0.0137, "step": 295520 }, { - "epoch": 1.49, - "learning_rate": 7.635196835695295e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001850915415741055, + "loss": 0.0139, "step": 295530 }, { - "epoch": 1.49, - "learning_rate": 7.634440066393893e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018508765335773406, + "loss": 0.0112, "step": 295540 }, { - "epoch": 1.49, - "learning_rate": 7.633683297092492e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018508376514136257, + "loss": 0.0139, "step": 295550 }, { - "epoch": 1.49, - "learning_rate": 7.63292652779109e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.0001850798769249911, + "loss": 0.014, "step": 295560 }, { - "epoch": 1.49, - "learning_rate": 7.63216975848969e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018507598870861963, + "loss": 0.0141, "step": 295570 }, { - "epoch": 1.49, - "learning_rate": 7.63141298918829e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.0001850721004922482, + "loss": 0.0162, "step": 295580 }, { - "epoch": 1.49, - "learning_rate": 7.630656219886888e-05, - "loss": 0.0091, + "epoch": 0.77, + "learning_rate": 0.0001850682122758767, + "loss": 0.0153, "step": 295590 }, { - "epoch": 1.49, - "learning_rate": 7.629899450585487e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018506432405950525, + "loss": 0.0167, "step": 295600 }, { - "epoch": 1.49, - "learning_rate": 7.629142681284087e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018506043584313377, + "loss": 0.0254, "step": 295610 }, { - "epoch": 1.49, - "learning_rate": 7.628385911982685e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018505654762676234, + "loss": 0.0158, "step": 295620 }, { - "epoch": 1.49, - "learning_rate": 7.627629142681284e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018505265941039085, + "loss": 0.0132, "step": 295630 }, { - "epoch": 1.49, - "learning_rate": 7.626872373379882e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001850487711940194, + "loss": 0.0185, "step": 295640 }, { - "epoch": 1.49, - "learning_rate": 7.626115604078482e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001850448829776479, + "loss": 0.0179, "step": 295650 }, { - "epoch": 1.49, - "learning_rate": 7.625358834777081e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018504099476127647, + "loss": 0.014, "step": 295660 }, { - "epoch": 1.49, - "learning_rate": 7.62460206547568e-05, - "loss": 0.0048, + "epoch": 0.77, + "learning_rate": 0.000185037106544905, + "loss": 0.0156, "step": 295670 }, { - "epoch": 1.49, - "learning_rate": 7.623845296174279e-05, - "loss": 0.0106, + "epoch": 0.77, + "learning_rate": 0.00018503321832853353, + "loss": 0.013, "step": 295680 }, { - "epoch": 1.49, - "learning_rate": 7.623088526872876e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018502933011216205, + "loss": 0.0157, "step": 295690 }, { - "epoch": 1.49, - "learning_rate": 7.622331757571475e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018502544189579061, + "loss": 0.0142, "step": 295700 }, { - "epoch": 1.49, - "learning_rate": 7.621574988270075e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018502155367941916, + "loss": 0.0106, "step": 295710 }, { - "epoch": 1.49, - "learning_rate": 7.620818218968673e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018501766546304767, + "loss": 0.012, "step": 295720 }, { - "epoch": 1.49, - "learning_rate": 7.620061449667273e-05, - "loss": 0.0092, + "epoch": 0.77, + "learning_rate": 0.00018501377724667619, + "loss": 0.0152, "step": 295730 }, { - "epoch": 1.49, - "learning_rate": 7.619304680365871e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018500988903030475, + "loss": 0.0161, "step": 295740 }, { - "epoch": 1.49, - "learning_rate": 7.61854791106447e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001850060008139333, + "loss": 0.0133, "step": 295750 }, { - "epoch": 1.49, - "learning_rate": 7.61779114176307e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.0001850021125975618, + "loss": 0.0138, "step": 295760 }, { - "epoch": 1.49, - "learning_rate": 7.617034372461668e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018499822438119035, + "loss": 0.0131, "step": 295770 }, { - "epoch": 1.49, - "learning_rate": 7.616277603160267e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018499433616481887, + "loss": 0.0143, "step": 295780 }, { - "epoch": 1.49, - "learning_rate": 7.615520833858867e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018499044794844743, + "loss": 0.0151, "step": 295790 }, { - "epoch": 1.49, - "learning_rate": 7.614764064557465e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018498655973207595, + "loss": 0.0126, "step": 295800 }, { - "epoch": 1.49, - "learning_rate": 7.614007295256064e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.0001849826715157045, + "loss": 0.0122, "step": 295810 }, { - "epoch": 1.49, - "learning_rate": 7.613250525954664e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.000184978783299333, + "loss": 0.0159, "step": 295820 }, { - "epoch": 1.49, - "learning_rate": 7.612493756653262e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018497489508296157, + "loss": 0.0164, "step": 295830 }, { - "epoch": 1.49, - "learning_rate": 7.611736987351862e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001849710068665901, + "loss": 0.0173, "step": 295840 }, { - "epoch": 1.49, - "learning_rate": 7.61098021805046e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018496711865021863, + "loss": 0.0132, "step": 295850 }, { - "epoch": 1.49, - "learning_rate": 7.610223448749059e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018496323043384715, + "loss": 0.0125, "step": 295860 }, { - "epoch": 1.49, - "learning_rate": 7.609466679447659e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018495934221747571, + "loss": 0.0155, "step": 295870 }, { - "epoch": 1.49, - "learning_rate": 7.608709910146257e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018495545400110423, + "loss": 0.0111, "step": 295880 }, { - "epoch": 1.49, - "learning_rate": 7.607953140844856e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018495156578473277, + "loss": 0.0156, "step": 295890 }, { - "epoch": 1.49, - "learning_rate": 7.607196371543456e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.00018494767756836128, + "loss": 0.0118, "step": 295900 }, { - "epoch": 1.49, - "learning_rate": 7.606439602242054e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018494378935198985, + "loss": 0.0151, "step": 295910 }, { - "epoch": 1.49, - "learning_rate": 7.605682832940654e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.0001849399011356184, + "loss": 0.0125, "step": 295920 }, { - "epoch": 1.49, - "learning_rate": 7.604926063639252e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.0001849360129192469, + "loss": 0.0144, "step": 295930 }, { - "epoch": 1.49, - "learning_rate": 7.604169294337851e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018493212470287545, + "loss": 0.0151, "step": 295940 }, { - "epoch": 1.49, - "learning_rate": 7.603412525036451e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.000184928236486504, + "loss": 0.0136, "step": 295950 }, { - "epoch": 1.49, - "learning_rate": 7.602655755735049e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018492434827013253, + "loss": 0.013, "step": 295960 }, { - "epoch": 1.49, - "learning_rate": 7.601898986433648e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018492046005376105, + "loss": 0.0131, "step": 295970 }, { - "epoch": 1.49, - "learning_rate": 7.601142217132248e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.0001849165718373896, + "loss": 0.0119, "step": 295980 }, { - "epoch": 1.49, - "learning_rate": 7.600385447830846e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018491268362101813, + "loss": 0.0113, "step": 295990 }, { - "epoch": 1.49, - "learning_rate": 7.599628678529446e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018490879540464667, + "loss": 0.0132, "step": 296000 }, { - "epoch": 1.49, - "eval_cer": 0.9144605519419082, - "eval_loss": 0.005476477090269327, - "eval_runtime": 116.6265, - "eval_samples_per_second": 17.149, - "eval_steps_per_second": 4.287, + "epoch": 0.77, + "eval_cer": 0.881727879787983, + "eval_loss": 0.00943910051137209, + "eval_runtime": 107.9554, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.632, "step": 296000 }, { - "epoch": 1.49, - "learning_rate": 7.598871909228044e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001849049071882752, + "loss": 0.012, "step": 296010 }, { - "epoch": 1.49, - "learning_rate": 7.598115139926643e-05, - "loss": 0.0109, + "epoch": 0.77, + "learning_rate": 0.00018490101897190373, + "loss": 0.0153, "step": 296020 }, { - "epoch": 1.49, - "learning_rate": 7.597358370625243e-05, - "loss": 0.012, + "epoch": 0.77, + "learning_rate": 0.00018489713075553224, + "loss": 0.0116, "step": 296030 }, { - "epoch": 1.49, - "learning_rate": 7.596601601323841e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.0001848932425391608, + "loss": 0.0146, "step": 296040 }, { - "epoch": 1.49, - "learning_rate": 7.59584483202244e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018488935432278933, + "loss": 0.0132, "step": 296050 }, { - "epoch": 1.49, - "learning_rate": 7.59508806272104e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018488546610641787, + "loss": 0.0139, "step": 296060 }, { - "epoch": 1.49, - "learning_rate": 7.594331293419638e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018488157789004638, + "loss": 0.0164, "step": 296070 }, { - "epoch": 1.49, - "learning_rate": 7.593574524118237e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018487768967367495, + "loss": 0.0123, "step": 296080 }, { - "epoch": 1.49, - "learning_rate": 7.592817754816836e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.0001848738014573035, + "loss": 0.0144, "step": 296090 }, { - "epoch": 1.49, - "learning_rate": 7.592060985515435e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.000184869913240932, + "loss": 0.0167, "step": 296100 }, { - "epoch": 1.49, - "learning_rate": 7.591304216214035e-05, - "loss": 0.0106, + "epoch": 0.77, + "learning_rate": 0.00018486602502456055, + "loss": 0.0174, "step": 296110 }, { - "epoch": 1.49, - "learning_rate": 7.590547446912633e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001848621368081891, + "loss": 0.0149, "step": 296120 }, { - "epoch": 1.49, - "learning_rate": 7.589790677611232e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018485824859181763, + "loss": 0.0193, "step": 296130 }, { - "epoch": 1.49, - "learning_rate": 7.589033908309832e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018485436037544615, + "loss": 0.0133, "step": 296140 }, { - "epoch": 1.49, - "learning_rate": 7.58827713900843e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.0001848504721590747, + "loss": 0.0143, "step": 296150 }, { - "epoch": 1.49, - "learning_rate": 7.58752036970703e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018484658394270323, + "loss": 0.0139, "step": 296160 }, { - "epoch": 1.49, - "learning_rate": 7.586763600405628e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018484269572633177, + "loss": 0.0163, "step": 296170 }, { - "epoch": 1.49, - "learning_rate": 7.586006831104227e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.0001848388075099603, + "loss": 0.0142, "step": 296180 }, { - "epoch": 1.49, - "learning_rate": 7.585250061802827e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018483491929358883, + "loss": 0.0134, "step": 296190 }, { - "epoch": 1.49, - "learning_rate": 7.584493292501425e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018483103107721737, + "loss": 0.0151, "step": 296200 }, { - "epoch": 1.49, - "learning_rate": 7.583736523200024e-05, - "loss": 0.0053, + "epoch": 0.77, + "learning_rate": 0.0001848271428608459, + "loss": 0.0162, "step": 296210 }, { - "epoch": 1.49, - "learning_rate": 7.582979753898624e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018482325464447443, + "loss": 0.0181, "step": 296220 }, { - "epoch": 1.49, - "learning_rate": 7.582222984597222e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018481936642810297, + "loss": 0.0171, "step": 296230 }, { - "epoch": 1.49, - "learning_rate": 7.581466215295821e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018481547821173148, + "loss": 0.0143, "step": 296240 }, { - "epoch": 1.49, - "learning_rate": 7.58070944599442e-05, - "loss": 0.0102, + "epoch": 0.77, + "learning_rate": 0.00018481158999536005, + "loss": 0.0142, "step": 296250 }, { - "epoch": 1.49, - "learning_rate": 7.579952676693019e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.0001848077017789886, + "loss": 0.0146, "step": 296260 }, { - "epoch": 1.49, - "learning_rate": 7.579195907391618e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001848038135626171, + "loss": 0.0149, "step": 296270 }, { - "epoch": 1.49, - "learning_rate": 7.578439138090217e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018479992534624565, + "loss": 0.0126, "step": 296280 }, { - "epoch": 1.49, - "learning_rate": 7.577682368788816e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.0001847960371298742, + "loss": 0.0146, "step": 296290 }, { - "epoch": 1.49, - "learning_rate": 7.576925599487416e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018479214891350273, + "loss": 0.0165, "step": 296300 }, { - "epoch": 1.49, - "learning_rate": 7.576168830186014e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018478826069713125, + "loss": 0.0147, "step": 296310 }, { - "epoch": 1.49, - "learning_rate": 7.575412060884612e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.0001847843724807598, + "loss": 0.0128, "step": 296320 }, { - "epoch": 1.5, - "learning_rate": 7.57465529158321e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018478048426438833, + "loss": 0.0128, "step": 296330 }, { - "epoch": 1.5, - "learning_rate": 7.57389852228181e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018477659604801687, + "loss": 0.0131, "step": 296340 }, { - "epoch": 1.5, - "learning_rate": 7.573141752980409e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.0001847727078316454, + "loss": 0.0126, "step": 296350 }, { - "epoch": 1.5, - "learning_rate": 7.572384983679007e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018476881961527393, + "loss": 0.011, "step": 296360 }, { - "epoch": 1.5, - "learning_rate": 7.571628214377607e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018476493139890247, + "loss": 0.015, "step": 296370 }, { - "epoch": 1.5, - "learning_rate": 7.570871445076205e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.000184761043182531, + "loss": 0.0167, "step": 296380 }, { - "epoch": 1.5, - "learning_rate": 7.570114675774804e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018475715496615953, + "loss": 0.0146, "step": 296390 }, { - "epoch": 1.5, - "learning_rate": 7.569357906473404e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018475326674978807, + "loss": 0.0234, "step": 296400 }, { - "epoch": 1.5, - "learning_rate": 7.568601137172002e-05, - "loss": 0.0053, + "epoch": 0.77, + "learning_rate": 0.00018474937853341664, + "loss": 0.0167, "step": 296410 }, { - "epoch": 1.5, - "learning_rate": 7.567844367870601e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018474549031704515, + "loss": 0.012, "step": 296420 }, { - "epoch": 1.5, - "learning_rate": 7.567087598569201e-05, - "loss": 0.0101, + "epoch": 0.77, + "learning_rate": 0.0001847416021006737, + "loss": 0.0161, "step": 296430 }, { - "epoch": 1.5, - "learning_rate": 7.566330829267799e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001847377138843022, + "loss": 0.0139, "step": 296440 }, { - "epoch": 1.5, - "learning_rate": 7.565574059966399e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018473382566793078, + "loss": 0.0135, "step": 296450 }, { - "epoch": 1.5, - "learning_rate": 7.564817290664997e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001847299374515593, + "loss": 0.0125, "step": 296460 }, { - "epoch": 1.5, - "learning_rate": 7.564060521363596e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018472604923518783, + "loss": 0.0173, "step": 296470 }, { - "epoch": 1.5, - "learning_rate": 7.563303752062196e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018472216101881635, + "loss": 0.0153, "step": 296480 }, { - "epoch": 1.5, - "learning_rate": 7.562546982760794e-05, - "loss": 0.0094, + "epoch": 0.77, + "learning_rate": 0.0001847182728024449, + "loss": 0.0133, "step": 296490 }, { - "epoch": 1.5, - "learning_rate": 7.561790213459393e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018471438458607343, + "loss": 0.0156, "step": 296500 }, { - "epoch": 1.5, - "learning_rate": 7.561033444157993e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018471049636970197, + "loss": 0.0136, "step": 296510 }, { - "epoch": 1.5, - "learning_rate": 7.560276674856591e-05, - "loss": 0.0052, + "epoch": 0.77, + "learning_rate": 0.0001847066081533305, + "loss": 0.0193, "step": 296520 }, { - "epoch": 1.5, - "learning_rate": 7.55951990555519e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018470271993695903, + "loss": 0.0152, "step": 296530 }, { - "epoch": 1.5, - "learning_rate": 7.558763136253789e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018469883172058757, + "loss": 0.0119, "step": 296540 }, { - "epoch": 1.5, - "learning_rate": 7.558006366952388e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001846949435042161, + "loss": 0.0161, "step": 296550 }, { - "epoch": 1.5, - "learning_rate": 7.557249597650988e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018469105528784463, + "loss": 0.0176, "step": 296560 }, { - "epoch": 1.5, - "learning_rate": 7.556492828349586e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.00018468716707147317, + "loss": 0.0182, "step": 296570 }, { - "epoch": 1.5, - "learning_rate": 7.555736059048185e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018468327885510174, + "loss": 0.0121, "step": 296580 }, { - "epoch": 1.5, - "learning_rate": 7.554979289746785e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018467939063873025, + "loss": 0.0158, "step": 296590 }, { - "epoch": 1.5, - "learning_rate": 7.554222520445383e-05, - "loss": 0.0112, + "epoch": 0.77, + "learning_rate": 0.00018467550242235877, + "loss": 0.0139, "step": 296600 }, { - "epoch": 1.5, - "learning_rate": 7.553465751143982e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001846716142059873, + "loss": 0.0134, "step": 296610 }, { - "epoch": 1.5, - "learning_rate": 7.55270898184258e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018466772598961588, + "loss": 0.0175, "step": 296620 }, { - "epoch": 1.5, - "learning_rate": 7.55195221254118e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.0001846638377732444, + "loss": 0.0124, "step": 296630 }, { - "epoch": 1.5, - "learning_rate": 7.55119544323978e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018465994955687293, + "loss": 0.0115, "step": 296640 }, { - "epoch": 1.5, - "learning_rate": 7.550438673938378e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018465606134050145, + "loss": 0.0173, "step": 296650 }, { - "epoch": 1.5, - "learning_rate": 7.549681904636977e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018465217312413002, + "loss": 0.014, "step": 296660 }, { - "epoch": 1.5, - "learning_rate": 7.548925135335577e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018464828490775853, + "loss": 0.0145, "step": 296670 }, { - "epoch": 1.5, - "learning_rate": 7.548168366034175e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018464439669138707, + "loss": 0.0153, "step": 296680 }, { - "epoch": 1.5, - "learning_rate": 7.547411596732774e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018464050847501559, + "loss": 0.0153, "step": 296690 }, { - "epoch": 1.5, - "learning_rate": 7.546654827431373e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018463662025864415, + "loss": 0.0127, "step": 296700 }, { - "epoch": 1.5, - "learning_rate": 7.545898058129972e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018463273204227267, + "loss": 0.0147, "step": 296710 }, { - "epoch": 1.5, - "learning_rate": 7.545141288828572e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.0001846288438259012, + "loss": 0.0146, "step": 296720 }, { - "epoch": 1.5, - "learning_rate": 7.54438451952717e-05, - "loss": 0.009, + "epoch": 0.77, + "learning_rate": 0.00018462495560952973, + "loss": 0.0124, "step": 296730 }, { - "epoch": 1.5, - "learning_rate": 7.543627750225769e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018462106739315827, + "loss": 0.0134, "step": 296740 }, { - "epoch": 1.5, - "learning_rate": 7.542870980924369e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.00018461717917678684, + "loss": 0.0141, "step": 296750 }, { - "epoch": 1.5, - "learning_rate": 7.542114211622967e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018461329096041535, + "loss": 0.0137, "step": 296760 }, { - "epoch": 1.5, - "learning_rate": 7.541357442321566e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.00018460940274404386, + "loss": 0.016, "step": 296770 }, { - "epoch": 1.5, - "learning_rate": 7.540600673020164e-05, - "loss": 0.0113, + "epoch": 0.77, + "learning_rate": 0.0001846055145276724, + "loss": 0.0157, "step": 296780 }, { - "epoch": 1.5, - "learning_rate": 7.539843903718764e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018460162631130098, + "loss": 0.0134, "step": 296790 }, { - "epoch": 1.5, - "learning_rate": 7.539087134417363e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001845977380949295, + "loss": 0.0104, "step": 296800 }, { - "epoch": 1.5, - "learning_rate": 7.538330365115962e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018459384987855803, + "loss": 0.015, "step": 296810 }, { - "epoch": 1.5, - "learning_rate": 7.537573595814561e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.00018458996166218655, + "loss": 0.0158, "step": 296820 }, { - "epoch": 1.5, - "learning_rate": 7.53681682651316e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018458607344581511, + "loss": 0.0179, "step": 296830 }, { - "epoch": 1.5, - "learning_rate": 7.536060057211759e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018458218522944363, + "loss": 0.015, "step": 296840 }, { - "epoch": 1.5, - "learning_rate": 7.535303287910358e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018457829701307217, + "loss": 0.0152, "step": 296850 }, { - "epoch": 1.5, - "learning_rate": 7.534546518608958e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018457440879670069, + "loss": 0.0128, "step": 296860 }, { - "epoch": 1.5, - "learning_rate": 7.533789749307556e-05, - "loss": 0.0105, + "epoch": 0.77, + "learning_rate": 0.00018457052058032925, + "loss": 0.0183, "step": 296870 }, { - "epoch": 1.5, - "learning_rate": 7.533032980006155e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018456663236395777, + "loss": 0.0131, "step": 296880 }, { - "epoch": 1.5, - "learning_rate": 7.532276210704754e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001845627441475863, + "loss": 0.0154, "step": 296890 }, { - "epoch": 1.5, - "learning_rate": 7.531519441403353e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018455885593121482, + "loss": 0.0163, "step": 296900 }, { - "epoch": 1.5, - "learning_rate": 7.530762672101953e-05, - "loss": 0.0054, + "epoch": 0.77, + "learning_rate": 0.0001845549677148434, + "loss": 0.0159, "step": 296910 }, { - "epoch": 1.5, - "learning_rate": 7.53000590280055e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001845510794984719, + "loss": 0.0148, "step": 296920 }, { - "epoch": 1.5, - "learning_rate": 7.52924913349915e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018454719128210045, + "loss": 0.0179, "step": 296930 }, { - "epoch": 1.5, - "learning_rate": 7.528492364197747e-05, - "loss": 0.0098, + "epoch": 0.77, + "learning_rate": 0.00018454330306572896, + "loss": 0.0171, "step": 296940 }, { - "epoch": 1.5, - "learning_rate": 7.527735594896346e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018453941484935753, + "loss": 0.013, "step": 296950 }, { - "epoch": 1.5, - "learning_rate": 7.526978825594946e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018453552663298607, + "loss": 0.0114, "step": 296960 }, { - "epoch": 1.5, - "learning_rate": 7.526222056293544e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.0001845316384166146, + "loss": 0.0117, "step": 296970 }, { - "epoch": 1.5, - "learning_rate": 7.525465286992144e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018452775020024313, + "loss": 0.0127, "step": 296980 }, { - "epoch": 1.5, - "learning_rate": 7.524708517690742e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.00018452386198387165, + "loss": 0.0157, "step": 296990 }, { - "epoch": 1.5, - "learning_rate": 7.523951748389341e-05, - "loss": 0.0049, + "epoch": 0.77, + "learning_rate": 0.00018451997376750021, + "loss": 0.0137, "step": 297000 }, { - "epoch": 1.5, - "eval_cer": 0.9144440552077764, - "eval_loss": 0.005415515974164009, - "eval_runtime": 116.5765, - "eval_samples_per_second": 17.156, - "eval_steps_per_second": 4.289, + "epoch": 0.77, + "eval_cer": 0.8817432757942589, + "eval_loss": 0.010051160119473934, + "eval_runtime": 108.1046, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, "step": 297000 }, { - "epoch": 1.5, - "learning_rate": 7.523194979087941e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018451608555112873, + "loss": 0.0122, "step": 297010 }, { - "epoch": 1.5, - "learning_rate": 7.522438209786539e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018451219733475727, + "loss": 0.0184, "step": 297020 }, { - "epoch": 1.5, - "learning_rate": 7.521681440485138e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018450830911838578, + "loss": 0.0161, "step": 297030 }, { - "epoch": 1.5, - "learning_rate": 7.520924671183738e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018450442090201435, + "loss": 0.0141, "step": 297040 }, { - "epoch": 1.5, - "learning_rate": 7.520167901882336e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018450053268564287, + "loss": 0.0119, "step": 297050 }, { - "epoch": 1.5, - "learning_rate": 7.519411132580936e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001844966444692714, + "loss": 0.0152, "step": 297060 }, { - "epoch": 1.5, - "learning_rate": 7.518654363279534e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018449275625289992, + "loss": 0.0156, "step": 297070 }, { - "epoch": 1.5, - "learning_rate": 7.517897593978133e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001844888680365285, + "loss": 0.0131, "step": 297080 }, { - "epoch": 1.5, - "learning_rate": 7.517140824676733e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.000184484979820157, + "loss": 0.0135, "step": 297090 }, { - "epoch": 1.5, - "learning_rate": 7.516384055375331e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018448109160378555, + "loss": 0.0134, "step": 297100 }, { - "epoch": 1.5, - "learning_rate": 7.51562728607393e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018447720338741406, + "loss": 0.012, "step": 297110 }, { - "epoch": 1.5, - "learning_rate": 7.51487051677253e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018447331517104263, + "loss": 0.014, "step": 297120 }, { - "epoch": 1.5, - "learning_rate": 7.514113747471128e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018446942695467117, + "loss": 0.0163, "step": 297130 }, { - "epoch": 1.5, - "learning_rate": 7.513356978169727e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.0001844655387382997, + "loss": 0.0184, "step": 297140 }, { - "epoch": 1.5, - "learning_rate": 7.512600208868326e-05, - "loss": 0.0102, + "epoch": 0.77, + "learning_rate": 0.00018446165052192823, + "loss": 0.016, "step": 297150 }, { - "epoch": 1.5, - "learning_rate": 7.511843439566925e-05, - "loss": 0.005, + "epoch": 0.77, + "learning_rate": 0.00018445776230555677, + "loss": 0.0128, "step": 297160 }, { - "epoch": 1.5, - "learning_rate": 7.511086670265525e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.0001844538740891853, + "loss": 0.0139, "step": 297170 }, { - "epoch": 1.5, - "learning_rate": 7.510329900964123e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018444998587281383, + "loss": 0.0119, "step": 297180 }, { - "epoch": 1.5, - "learning_rate": 7.509573131662722e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018444609765644237, + "loss": 0.0118, "step": 297190 }, { - "epoch": 1.5, - "learning_rate": 7.508816362361322e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.0001844422094400709, + "loss": 0.0153, "step": 297200 }, { - "epoch": 1.5, - "learning_rate": 7.50805959305992e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018443832122369945, + "loss": 0.0115, "step": 297210 }, { - "epoch": 1.5, - "learning_rate": 7.50730282375852e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018443443300732797, + "loss": 0.0168, "step": 297220 }, { - "epoch": 1.5, - "learning_rate": 7.506546054457118e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.0001844305447909565, + "loss": 0.0147, "step": 297230 }, { - "epoch": 1.5, - "learning_rate": 7.505789285155717e-05, - "loss": 0.0052, + "epoch": 0.77, + "learning_rate": 0.00018442665657458502, + "loss": 0.0155, "step": 297240 }, { - "epoch": 1.5, - "learning_rate": 7.505032515854317e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001844227683582136, + "loss": 0.015, "step": 297250 }, { - "epoch": 1.5, - "learning_rate": 7.504275746552915e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.0001844188801418421, + "loss": 0.016, "step": 297260 }, { - "epoch": 1.5, - "learning_rate": 7.503518977251514e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018441499192547065, + "loss": 0.0164, "step": 297270 }, { - "epoch": 1.5, - "learning_rate": 7.502762207950114e-05, - "loss": 0.0098, + "epoch": 0.77, + "learning_rate": 0.00018441110370909916, + "loss": 0.0164, "step": 297280 }, { - "epoch": 1.5, - "learning_rate": 7.502005438648712e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018440721549272773, + "loss": 0.0114, "step": 297290 }, { - "epoch": 1.5, - "learning_rate": 7.501248669347311e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018440332727635627, + "loss": 0.0168, "step": 297300 }, { - "epoch": 1.5, - "learning_rate": 7.500491900045911e-05, - "loss": 0.0093, + "epoch": 0.77, + "learning_rate": 0.0001843994390599848, + "loss": 0.0112, "step": 297310 }, { - "epoch": 1.5, - "learning_rate": 7.499735130744509e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001843955508436133, + "loss": 0.015, "step": 297320 }, { - "epoch": 1.5, - "learning_rate": 7.498978361443108e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018439166262724187, + "loss": 0.0153, "step": 297330 }, { - "epoch": 1.5, - "learning_rate": 7.498221592141707e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.0001843877744108704, + "loss": 0.0117, "step": 297340 }, { - "epoch": 1.5, - "learning_rate": 7.497464822840306e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.00018438388619449893, + "loss": 0.0176, "step": 297350 }, { - "epoch": 1.5, - "learning_rate": 7.496708053538906e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018437999797812747, + "loss": 0.0167, "step": 297360 }, { - "epoch": 1.5, - "learning_rate": 7.495951284237504e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.000184376109761756, + "loss": 0.0136, "step": 297370 }, { - "epoch": 1.5, - "learning_rate": 7.495194514936103e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018437222154538455, + "loss": 0.0136, "step": 297380 }, { - "epoch": 1.5, - "learning_rate": 7.494437745634703e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018436833332901307, + "loss": 0.0164, "step": 297390 }, { - "epoch": 1.5, - "learning_rate": 7.493680976333301e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.0001843644451126416, + "loss": 0.0158, "step": 297400 }, { - "epoch": 1.5, - "learning_rate": 7.4929242070319e-05, - "loss": 0.0105, + "epoch": 0.77, + "learning_rate": 0.00018436055689627015, + "loss": 0.014, "step": 297410 }, { - "epoch": 1.5, - "learning_rate": 7.492167437730499e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.0001843566686798987, + "loss": 0.0142, "step": 297420 }, { - "epoch": 1.5, - "learning_rate": 7.491410668429097e-05, - "loss": 0.0091, + "epoch": 0.77, + "learning_rate": 0.0001843527804635272, + "loss": 0.0146, "step": 297430 }, { - "epoch": 1.5, - "learning_rate": 7.490653899127696e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018434889224715575, + "loss": 0.0143, "step": 297440 }, { - "epoch": 1.5, - "learning_rate": 7.489897129826296e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018434500403078432, + "loss": 0.0154, "step": 297450 }, { - "epoch": 1.5, - "learning_rate": 7.489140360524894e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018434111581441283, + "loss": 0.018, "step": 297460 }, { - "epoch": 1.5, - "learning_rate": 7.488383591223493e-05, - "loss": 0.012, - "step": 297470 + "epoch": 0.77, + "learning_rate": 0.00018433722759804135, + "loss": 0.0127, + "step": 297470 }, { - "epoch": 1.5, - "learning_rate": 7.487626821922093e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.0001843333393816699, + "loss": 0.0138, "step": 297480 }, { - "epoch": 1.5, - "learning_rate": 7.486870052620691e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.0001843294511652984, + "loss": 0.0144, "step": 297490 }, { - "epoch": 1.5, - "learning_rate": 7.48611328331929e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018432556294892697, + "loss": 0.0141, "step": 297500 }, { - "epoch": 1.5, - "learning_rate": 7.485356514017889e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001843216747325555, + "loss": 0.0154, "step": 297510 }, { - "epoch": 1.5, - "learning_rate": 7.484599744716488e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018431778651618403, + "loss": 0.0115, "step": 297520 }, { - "epoch": 1.5, - "learning_rate": 7.483842975415088e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018431389829981257, + "loss": 0.0117, "step": 297530 }, { - "epoch": 1.5, - "learning_rate": 7.483086206113686e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.0001843100100834411, + "loss": 0.0126, "step": 297540 }, { - "epoch": 1.5, - "learning_rate": 7.482329436812285e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018430612186706965, + "loss": 0.0129, "step": 297550 }, { - "epoch": 1.5, - "learning_rate": 7.481572667510885e-05, - "loss": 0.0094, + "epoch": 0.77, + "learning_rate": 0.00018430223365069817, + "loss": 0.0138, "step": 297560 }, { - "epoch": 1.5, - "learning_rate": 7.480815898209483e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.0001842983454343267, + "loss": 0.0132, "step": 297570 }, { - "epoch": 1.5, - "learning_rate": 7.480059128908082e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.00018429445721795525, + "loss": 0.018, "step": 297580 }, { - "epoch": 1.5, - "learning_rate": 7.47930235960668e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.0001842905690015838, + "loss": 0.0142, "step": 297590 }, { - "epoch": 1.5, - "learning_rate": 7.47854559030528e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.0001842866807852123, + "loss": 0.0145, "step": 297600 }, { - "epoch": 1.5, - "learning_rate": 7.47778882100388e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018428279256884085, + "loss": 0.0155, "step": 297610 }, { - "epoch": 1.5, - "learning_rate": 7.477032051702478e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018427890435246942, + "loss": 0.0147, "step": 297620 }, { - "epoch": 1.5, - "learning_rate": 7.476275282401077e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018427501613609793, + "loss": 0.0156, "step": 297630 }, { - "epoch": 1.5, - "learning_rate": 7.475518513099677e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018427112791972645, + "loss": 0.0126, "step": 297640 }, { - "epoch": 1.5, - "learning_rate": 7.474761743798275e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.000184267239703355, + "loss": 0.0137, "step": 297650 }, { - "epoch": 1.5, - "learning_rate": 7.474004974496874e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018426335148698356, + "loss": 0.0135, "step": 297660 }, { - "epoch": 1.5, - "learning_rate": 7.473248205195472e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018425946327061207, + "loss": 0.0126, "step": 297670 }, { - "epoch": 1.5, - "learning_rate": 7.472491435894072e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.0001842555750542406, + "loss": 0.0133, "step": 297680 }, { - "epoch": 1.5, - "learning_rate": 7.471734666592671e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018425168683786913, + "loss": 0.0133, "step": 297690 }, { - "epoch": 1.5, - "learning_rate": 7.47097789729127e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001842477986214977, + "loss": 0.017, "step": 297700 }, { - "epoch": 1.5, - "learning_rate": 7.470221127989869e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.0001842439104051262, + "loss": 0.0128, "step": 297710 }, { - "epoch": 1.5, - "learning_rate": 7.469464358688469e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018424002218875475, + "loss": 0.0124, "step": 297720 }, { - "epoch": 1.5, - "learning_rate": 7.468707589387067e-05, - "loss": 0.0093, + "epoch": 0.77, + "learning_rate": 0.00018423613397238327, + "loss": 0.0138, "step": 297730 }, { - "epoch": 1.5, - "learning_rate": 7.467950820085665e-05, - "loss": 0.0127, + "epoch": 0.77, + "learning_rate": 0.0001842322457560118, + "loss": 0.0161, "step": 297740 }, { - "epoch": 1.5, - "learning_rate": 7.467194050784264e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018422835753964035, + "loss": 0.0128, "step": 297750 }, { - "epoch": 1.5, - "learning_rate": 7.466437281482864e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001842244693232689, + "loss": 0.0205, "step": 297760 }, { - "epoch": 1.5, - "learning_rate": 7.465680512181462e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001842205811068974, + "loss": 0.0132, "step": 297770 }, { - "epoch": 1.5, - "learning_rate": 7.464923742880062e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018421669289052595, + "loss": 0.0121, "step": 297780 }, { - "epoch": 1.5, - "learning_rate": 7.46416697357866e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.0001842128046741545, + "loss": 0.0142, "step": 297790 }, { - "epoch": 1.5, - "learning_rate": 7.463410204277259e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018420891645778303, + "loss": 0.0136, "step": 297800 }, { - "epoch": 1.5, - "learning_rate": 7.462653434975859e-05, - "loss": 0.0099, + "epoch": 0.77, + "learning_rate": 0.00018420502824141154, + "loss": 0.0162, "step": 297810 }, { - "epoch": 1.5, - "learning_rate": 7.461896665674457e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018420114002504009, + "loss": 0.0148, "step": 297820 }, { - "epoch": 1.5, - "learning_rate": 7.461139896373056e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018419725180866866, + "loss": 0.0139, "step": 297830 }, { - "epoch": 1.5, - "learning_rate": 7.460383127071656e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018419336359229717, + "loss": 0.0138, "step": 297840 }, { - "epoch": 1.5, - "learning_rate": 7.459626357770254e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001841894753759257, + "loss": 0.0129, "step": 297850 }, { - "epoch": 1.5, - "learning_rate": 7.458869588468853e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018418558715955423, + "loss": 0.0205, "step": 297860 }, { - "epoch": 1.5, - "learning_rate": 7.458112819167452e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001841816989431828, + "loss": 0.0159, "step": 297870 }, { - "epoch": 1.5, - "learning_rate": 7.457356049866051e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.0001841778107268113, + "loss": 0.0129, "step": 297880 }, { - "epoch": 1.5, - "learning_rate": 7.45659928056465e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018417392251043985, + "loss": 0.014, "step": 297890 }, { - "epoch": 1.5, - "learning_rate": 7.455842511263249e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.00018417003429406837, + "loss": 0.0124, "step": 297900 }, { - "epoch": 1.5, - "learning_rate": 7.455085741961848e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018416614607769693, + "loss": 0.013, "step": 297910 }, { - "epoch": 1.5, - "learning_rate": 7.454328972660448e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018416225786132545, + "loss": 0.0186, "step": 297920 }, { - "epoch": 1.5, - "learning_rate": 7.453572203359046e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.000184158369644954, + "loss": 0.0104, "step": 297930 }, { - "epoch": 1.5, - "learning_rate": 7.452815434057645e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.0001841544814285825, + "loss": 0.0163, "step": 297940 }, { - "epoch": 1.5, - "learning_rate": 7.452058664756244e-05, - "loss": 0.0095, + "epoch": 0.77, + "learning_rate": 0.00018415059321221107, + "loss": 0.0149, "step": 297950 }, { - "epoch": 1.5, - "learning_rate": 7.451301895454843e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.0001841467049958396, + "loss": 0.0108, "step": 297960 }, { - "epoch": 1.5, - "learning_rate": 7.450545126153443e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018414281677946813, + "loss": 0.0181, "step": 297970 }, { - "epoch": 1.5, - "learning_rate": 7.449788356852041e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018413892856309664, + "loss": 0.011, "step": 297980 }, { - "epoch": 1.5, - "learning_rate": 7.44903158755064e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018413504034672519, + "loss": 0.0185, "step": 297990 }, { - "epoch": 1.5, - "learning_rate": 7.44827481824924e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018413115213035375, + "loss": 0.0159, "step": 298000 }, { - "epoch": 1.5, - "eval_cer": 0.9144489071884033, - "eval_loss": 0.0054661910980939865, - "eval_runtime": 116.6326, - "eval_samples_per_second": 17.148, - "eval_steps_per_second": 4.287, + "epoch": 0.77, + "eval_cer": 0.8817348779726539, + "eval_loss": 0.00948801077902317, + "eval_runtime": 107.7174, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, "step": 298000 }, { - "epoch": 1.5, - "learning_rate": 7.447518048947838e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018412726391398227, + "loss": 0.0123, "step": 298010 }, { - "epoch": 1.5, - "learning_rate": 7.446761279646437e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001841233756976108, + "loss": 0.013, "step": 298020 }, { - "epoch": 1.5, - "learning_rate": 7.446004510345035e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018411948748123933, + "loss": 0.0125, "step": 298030 }, { - "epoch": 1.5, - "learning_rate": 7.445247741043634e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.0001841155992648679, + "loss": 0.0146, "step": 298040 }, { - "epoch": 1.5, - "learning_rate": 7.444490971742233e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.0001841117110484964, + "loss": 0.0128, "step": 298050 }, { - "epoch": 1.5, - "learning_rate": 7.443734202440833e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.00018410782283212495, + "loss": 0.0143, "step": 298060 }, { - "epoch": 1.5, - "learning_rate": 7.442977433139431e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018410393461575346, + "loss": 0.0162, "step": 298070 }, { - "epoch": 1.5, - "learning_rate": 7.44222066383803e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018410004639938203, + "loss": 0.018, "step": 298080 }, { - "epoch": 1.5, - "learning_rate": 7.44146389453663e-05, - "loss": 0.0055, + "epoch": 0.77, + "learning_rate": 0.00018409615818301055, + "loss": 0.0158, "step": 298090 }, { - "epoch": 1.5, - "learning_rate": 7.440707125235228e-05, - "loss": 0.0058, + "epoch": 0.77, + "learning_rate": 0.0001840922699666391, + "loss": 0.0127, "step": 298100 }, { - "epoch": 1.5, - "learning_rate": 7.439950355933827e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.0001840883817502676, + "loss": 0.0159, "step": 298110 }, { - "epoch": 1.5, - "learning_rate": 7.439193586632426e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018408449353389617, + "loss": 0.0159, "step": 298120 }, { - "epoch": 1.5, - "learning_rate": 7.438436817331025e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.0001840806053175247, + "loss": 0.0144, "step": 298130 }, { - "epoch": 1.5, - "learning_rate": 7.437680048029625e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.00018407671710115323, + "loss": 0.013, "step": 298140 }, { - "epoch": 1.5, - "learning_rate": 7.436923278728223e-05, - "loss": 0.0079, + "epoch": 0.77, + "learning_rate": 0.00018407282888478174, + "loss": 0.0126, "step": 298150 }, { - "epoch": 1.5, - "learning_rate": 7.436166509426822e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.0001840689406684103, + "loss": 0.0142, "step": 298160 }, { - "epoch": 1.5, - "learning_rate": 7.435409740125422e-05, - "loss": 0.0096, + "epoch": 0.77, + "learning_rate": 0.00018406505245203885, + "loss": 0.0151, "step": 298170 }, { - "epoch": 1.5, - "learning_rate": 7.43465297082402e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018406116423566737, + "loss": 0.0141, "step": 298180 }, { - "epoch": 1.5, - "learning_rate": 7.43389620152262e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018405727601929588, + "loss": 0.0158, "step": 298190 }, { - "epoch": 1.5, - "learning_rate": 7.433139432221217e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018405338780292445, + "loss": 0.0161, "step": 298200 }, { - "epoch": 1.5, - "learning_rate": 7.432382662919817e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.000184049499586553, + "loss": 0.0113, "step": 298210 }, { - "epoch": 1.5, - "learning_rate": 7.431625893618416e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001840456113701815, + "loss": 0.0099, "step": 298220 }, { - "epoch": 1.5, - "learning_rate": 7.430869124317015e-05, - "loss": 0.0086, + "epoch": 0.77, + "learning_rate": 0.00018404172315381005, + "loss": 0.017, "step": 298230 }, { - "epoch": 1.5, - "learning_rate": 7.430112355015614e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.00018403783493743856, + "loss": 0.0158, "step": 298240 }, { - "epoch": 1.5, - "learning_rate": 7.429355585714214e-05, - "loss": 0.0069, + "epoch": 0.77, + "learning_rate": 0.00018403394672106713, + "loss": 0.0148, "step": 298250 }, { - "epoch": 1.5, - "learning_rate": 7.428598816412812e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018403005850469565, + "loss": 0.0128, "step": 298260 }, { - "epoch": 1.5, - "learning_rate": 7.427842047111411e-05, - "loss": 0.0106, + "epoch": 0.77, + "learning_rate": 0.0001840261702883242, + "loss": 0.0122, "step": 298270 }, { - "epoch": 1.5, - "learning_rate": 7.427085277810011e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.0001840222820719527, + "loss": 0.0152, "step": 298280 }, { - "epoch": 1.5, - "learning_rate": 7.426328508508609e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018401839385558127, + "loss": 0.0138, "step": 298290 }, { - "epoch": 1.5, - "learning_rate": 7.425571739207208e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.0001840145056392098, + "loss": 0.0165, "step": 298300 }, { - "epoch": 1.51, - "learning_rate": 7.424814969905807e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018401061742283833, + "loss": 0.0164, "step": 298310 }, { - "epoch": 1.51, - "learning_rate": 7.424058200604406e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018400672920646684, + "loss": 0.0183, "step": 298320 }, { - "epoch": 1.51, - "learning_rate": 7.423301431303006e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001840028409900954, + "loss": 0.0143, "step": 298330 }, { - "epoch": 1.51, - "learning_rate": 7.422544662001604e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018399895277372395, + "loss": 0.0146, "step": 298340 }, { - "epoch": 1.51, - "learning_rate": 7.421787892700203e-05, - "loss": 0.0063, + "epoch": 0.77, + "learning_rate": 0.00018399506455735247, + "loss": 0.0132, "step": 298350 }, { - "epoch": 1.51, - "learning_rate": 7.421031123398801e-05, - "loss": 0.0066, + "epoch": 0.77, + "learning_rate": 0.00018399117634098098, + "loss": 0.0129, "step": 298360 }, { - "epoch": 1.51, - "learning_rate": 7.420274354097401e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018398728812460955, + "loss": 0.0145, "step": 298370 }, { - "epoch": 1.51, - "learning_rate": 7.419517584795999e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.0001839833999082381, + "loss": 0.0122, "step": 298380 }, { - "epoch": 1.51, - "learning_rate": 7.418760815494598e-05, + "epoch": 0.77, + "learning_rate": 0.0001839795116918666, "loss": 0.0134, "step": 298390 }, { - "epoch": 1.51, - "learning_rate": 7.418004046193197e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018397562347549515, + "loss": 0.0151, "step": 298400 }, { - "epoch": 1.51, - "learning_rate": 7.417247276891796e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.0001839717352591237, + "loss": 0.0117, "step": 298410 }, { - "epoch": 1.51, - "learning_rate": 7.416490507590396e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.00018396784704275223, + "loss": 0.0138, "step": 298420 }, { - "epoch": 1.51, - "learning_rate": 7.415733738288994e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018396395882638075, + "loss": 0.0149, "step": 298430 }, { - "epoch": 1.51, - "learning_rate": 7.414976968987593e-05, - "loss": 0.0089, + "epoch": 0.77, + "learning_rate": 0.0001839600706100093, + "loss": 0.0157, "step": 298440 }, { - "epoch": 1.51, - "learning_rate": 7.414220199686193e-05, - "loss": 0.0081, + "epoch": 0.77, + "learning_rate": 0.00018395618239363783, + "loss": 0.0128, "step": 298450 }, { - "epoch": 1.51, - "learning_rate": 7.413463430384791e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.00018395229417726637, + "loss": 0.017, "step": 298460 }, { - "epoch": 1.51, - "learning_rate": 7.41270666108339e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018394840596089489, + "loss": 0.0174, "step": 298470 }, { - "epoch": 1.51, - "learning_rate": 7.411949891781989e-05, - "loss": 0.0088, + "epoch": 0.77, + "learning_rate": 0.00018394451774452343, + "loss": 0.013, "step": 298480 }, { - "epoch": 1.51, - "learning_rate": 7.411193122480588e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018394062952815194, + "loss": 0.0109, "step": 298490 }, { - "epoch": 1.51, - "learning_rate": 7.410436353179188e-05, - "loss": 0.0078, + "epoch": 0.77, + "learning_rate": 0.0001839367413117805, + "loss": 0.0151, "step": 298500 }, { - "epoch": 1.51, - "learning_rate": 7.409679583877786e-05, - "loss": 0.0046, + "epoch": 0.77, + "learning_rate": 0.00018393285309540903, + "loss": 0.0151, "step": 298510 }, { - "epoch": 1.51, - "learning_rate": 7.408922814576385e-05, - "loss": 0.0084, + "epoch": 0.77, + "learning_rate": 0.00018392896487903757, + "loss": 0.0128, "step": 298520 }, { - "epoch": 1.51, - "learning_rate": 7.408166045274985e-05, - "loss": 0.0057, + "epoch": 0.77, + "learning_rate": 0.00018392507666266608, + "loss": 0.0158, "step": 298530 }, { - "epoch": 1.51, - "learning_rate": 7.407409275973583e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018392118844629465, + "loss": 0.0107, "step": 298540 }, { - "epoch": 1.51, - "learning_rate": 7.406652506672182e-05, - "loss": 0.0077, + "epoch": 0.77, + "learning_rate": 0.0001839173002299232, + "loss": 0.0142, "step": 298550 }, { - "epoch": 1.51, - "learning_rate": 7.40589573737078e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.0001839134120135517, + "loss": 0.0126, "step": 298560 }, { - "epoch": 1.51, - "learning_rate": 7.40513896806938e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018390952379718025, + "loss": 0.0121, "step": 298570 }, { - "epoch": 1.51, - "learning_rate": 7.40438219876798e-05, - "loss": 0.0076, + "epoch": 0.77, + "learning_rate": 0.0001839056355808088, + "loss": 0.0145, "step": 298580 }, { - "epoch": 1.51, - "learning_rate": 7.403625429466578e-05, - "loss": 0.0083, + "epoch": 0.77, + "learning_rate": 0.00018390174736443733, + "loss": 0.0146, "step": 298590 }, { - "epoch": 1.51, - "learning_rate": 7.402868660165177e-05, - "loss": 0.0087, + "epoch": 0.77, + "learning_rate": 0.00018389785914806585, + "loss": 0.0159, "step": 298600 }, { - "epoch": 1.51, - "learning_rate": 7.402111890863777e-05, - "loss": 0.008, + "epoch": 0.77, + "learning_rate": 0.0001838939709316944, + "loss": 0.016, "step": 298610 }, { - "epoch": 1.51, - "learning_rate": 7.401355121562375e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.00018389008271532293, + "loss": 0.0115, "step": 298620 }, { - "epoch": 1.51, - "learning_rate": 7.400598352260974e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018388619449895147, + "loss": 0.0128, "step": 298630 }, { - "epoch": 1.51, - "learning_rate": 7.399841582959572e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018388230628257999, + "loss": 0.0136, "step": 298640 }, { - "epoch": 1.51, - "learning_rate": 7.399084813658172e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018387841806620853, + "loss": 0.0158, "step": 298650 }, { - "epoch": 1.51, - "learning_rate": 7.398328044356771e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018387452984983707, + "loss": 0.0145, "step": 298660 }, { - "epoch": 1.51, - "learning_rate": 7.39757127505537e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.0001838706416334656, + "loss": 0.0146, "step": 298670 }, { - "epoch": 1.51, - "learning_rate": 7.396814505753968e-05, - "loss": 0.0072, + "epoch": 0.77, + "learning_rate": 0.00018386675341709413, + "loss": 0.0153, "step": 298680 }, { - "epoch": 1.51, - "learning_rate": 7.396057736452567e-05, - "loss": 0.0092, + "epoch": 0.77, + "learning_rate": 0.00018386286520072267, + "loss": 0.0141, "step": 298690 }, { - "epoch": 1.51, - "learning_rate": 7.395300967151167e-05, - "loss": 0.0088, + "epoch": 0.77, + "learning_rate": 0.00018385897698435124, + "loss": 0.0134, "step": 298700 }, { - "epoch": 1.51, - "learning_rate": 7.394544197849765e-05, - "loss": 0.0065, + "epoch": 0.77, + "learning_rate": 0.00018385508876797975, + "loss": 0.0141, "step": 298710 }, { - "epoch": 1.51, - "learning_rate": 7.393787428548364e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.0001838512005516083, + "loss": 0.0114, "step": 298720 }, { - "epoch": 1.51, - "learning_rate": 7.393030659246964e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001838473123352368, + "loss": 0.0153, "step": 298730 }, { - "epoch": 1.51, - "learning_rate": 7.392273889945562e-05, - "loss": 0.0048, + "epoch": 0.77, + "learning_rate": 0.00018384342411886535, + "loss": 0.014, "step": 298740 }, { - "epoch": 1.51, - "learning_rate": 7.391517120644161e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.0001838395359024939, + "loss": 0.0096, "step": 298750 }, { - "epoch": 1.51, - "learning_rate": 7.39076035134276e-05, - "loss": 0.0092, + "epoch": 0.77, + "learning_rate": 0.00018383564768612243, + "loss": 0.0162, "step": 298760 }, { - "epoch": 1.51, - "learning_rate": 7.390003582041359e-05, - "loss": 0.0059, + "epoch": 0.77, + "learning_rate": 0.00018383175946975095, + "loss": 0.0136, "step": 298770 }, { - "epoch": 1.51, - "learning_rate": 7.389246812739959e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.0001838278712533795, + "loss": 0.0146, "step": 298780 }, { - "epoch": 1.51, - "learning_rate": 7.388490043438557e-05, - "loss": 0.0073, + "epoch": 0.77, + "learning_rate": 0.00018382398303700803, + "loss": 0.0143, "step": 298790 }, { - "epoch": 1.51, - "learning_rate": 7.387733274137156e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018382009482063657, + "loss": 0.0129, "step": 298800 }, { - "epoch": 1.51, - "learning_rate": 7.386976504835756e-05, - "loss": 0.0064, + "epoch": 0.77, + "learning_rate": 0.00018381620660426509, + "loss": 0.0153, "step": 298810 }, { - "epoch": 1.51, - "learning_rate": 7.386219735534354e-05, - "loss": 0.0075, + "epoch": 0.77, + "learning_rate": 0.00018381231838789363, + "loss": 0.0119, "step": 298820 }, { - "epoch": 1.51, - "learning_rate": 7.385462966232953e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018380843017152217, + "loss": 0.0164, "step": 298830 }, { - "epoch": 1.51, - "learning_rate": 7.384706196931552e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.0001838045419551507, + "loss": 0.0155, "step": 298840 }, { - "epoch": 1.51, - "learning_rate": 7.383949427630151e-05, - "loss": 0.0055, + "epoch": 0.77, + "learning_rate": 0.00018380065373877922, + "loss": 0.0151, "step": 298850 }, { - "epoch": 1.51, - "learning_rate": 7.38319265832875e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018379676552240777, + "loss": 0.0146, "step": 298860 }, { - "epoch": 1.51, - "learning_rate": 7.382435889027349e-05, - "loss": 0.0062, + "epoch": 0.77, + "learning_rate": 0.00018379287730603633, + "loss": 0.0147, "step": 298870 }, { - "epoch": 1.51, - "learning_rate": 7.381679119725948e-05, - "loss": 0.0074, + "epoch": 0.77, + "learning_rate": 0.00018378898908966485, + "loss": 0.0158, "step": 298880 }, { - "epoch": 1.51, - "learning_rate": 7.380922350424548e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.0001837851008732934, + "loss": 0.0157, "step": 298890 }, { - "epoch": 1.51, - "learning_rate": 7.380165581123146e-05, - "loss": 0.007, + "epoch": 0.77, + "learning_rate": 0.0001837812126569219, + "loss": 0.0178, "step": 298900 }, { - "epoch": 1.51, - "learning_rate": 7.379408811821745e-05, - "loss": 0.0056, + "epoch": 0.77, + "learning_rate": 0.00018377732444055047, + "loss": 0.0147, "step": 298910 }, { - "epoch": 1.51, - "learning_rate": 7.378652042520344e-05, - "loss": 0.0082, + "epoch": 0.77, + "learning_rate": 0.000183773436224179, + "loss": 0.0132, "step": 298920 }, { - "epoch": 1.51, - "learning_rate": 7.377895273218943e-05, - "loss": 0.0061, + "epoch": 0.77, + "learning_rate": 0.00018376954800780753, + "loss": 0.0132, "step": 298930 }, { - "epoch": 1.51, - "learning_rate": 7.377138503917543e-05, - "loss": 0.0068, + "epoch": 0.77, + "learning_rate": 0.00018376565979143604, + "loss": 0.0153, "step": 298940 }, { - "epoch": 1.51, - "learning_rate": 7.37638173461614e-05, - "loss": 0.0071, + "epoch": 0.77, + "learning_rate": 0.00018376177157506461, + "loss": 0.0132, "step": 298950 }, { - "epoch": 1.51, - "learning_rate": 7.37562496531474e-05, - "loss": 0.006, + "epoch": 0.77, + "learning_rate": 0.00018375788335869313, + "loss": 0.0186, "step": 298960 }, { - "epoch": 1.51, - "learning_rate": 7.37486819601334e-05, - "loss": 0.0085, + "epoch": 0.77, + "learning_rate": 0.00018375399514232167, + "loss": 0.011, "step": 298970 }, { - "epoch": 1.51, - "learning_rate": 7.374111426711938e-05, - "loss": 0.0067, + "epoch": 0.77, + "learning_rate": 0.00018375010692595018, + "loss": 0.0177, "step": 298980 }, { - "epoch": 1.51, - "learning_rate": 7.373354657410536e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018374621870957873, + "loss": 0.0142, "step": 298990 }, { - "epoch": 1.51, - "learning_rate": 7.372597888109135e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018374233049320727, + "loss": 0.0109, "step": 299000 }, { - "epoch": 1.51, - "eval_cer": 0.9144362920387732, - "eval_loss": 0.005306443199515343, - "eval_runtime": 116.5784, - "eval_samples_per_second": 17.156, - "eval_steps_per_second": 4.289, + "epoch": 0.78, + "eval_cer": 0.881657897941274, + "eval_loss": 0.009355046786367893, + "eval_runtime": 107.8593, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, "step": 299000 }, { - "epoch": 1.51, - "learning_rate": 7.371841118807734e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.0001837384422768358, + "loss": 0.0178, "step": 299010 }, { - "epoch": 1.51, - "learning_rate": 7.371084349506333e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.00018373455406046432, + "loss": 0.017, "step": 299020 }, { - "epoch": 1.51, - "learning_rate": 7.370327580204933e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018373066584409287, + "loss": 0.0144, "step": 299030 }, { - "epoch": 1.51, - "learning_rate": 7.369570810903531e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018372677762772143, + "loss": 0.0134, "step": 299040 }, { - "epoch": 1.51, - "learning_rate": 7.36881404160213e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018372288941134995, + "loss": 0.0155, "step": 299050 }, { - "epoch": 1.51, - "learning_rate": 7.36805727230073e-05, - "loss": 0.0088, + "epoch": 0.78, + "learning_rate": 0.00018371900119497846, + "loss": 0.0134, "step": 299060 }, { - "epoch": 1.51, - "learning_rate": 7.367300502999328e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.000183715112978607, + "loss": 0.0108, "step": 299070 }, { - "epoch": 1.51, - "learning_rate": 7.366543733697927e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018371122476223557, + "loss": 0.0145, "step": 299080 }, { - "epoch": 1.51, - "learning_rate": 7.365786964396526e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001837073365458641, + "loss": 0.0139, "step": 299090 }, { - "epoch": 1.51, - "learning_rate": 7.365030195095125e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018370344832949263, + "loss": 0.0143, "step": 299100 }, { - "epoch": 1.51, - "learning_rate": 7.364273425793725e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018369956011312114, + "loss": 0.0124, "step": 299110 }, { - "epoch": 1.51, - "learning_rate": 7.363516656492323e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001836956718967497, + "loss": 0.0218, "step": 299120 }, { - "epoch": 1.51, - "learning_rate": 7.362759887190922e-05, - "loss": 0.0091, + "epoch": 0.78, + "learning_rate": 0.00018369178368037823, + "loss": 0.0157, "step": 299130 }, { - "epoch": 1.51, - "learning_rate": 7.362003117889522e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018368789546400677, + "loss": 0.0127, "step": 299140 }, { - "epoch": 1.51, - "learning_rate": 7.36124634858812e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018368400724763528, + "loss": 0.0161, "step": 299150 }, { - "epoch": 1.51, - "learning_rate": 7.360489579286719e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018368011903126385, + "loss": 0.0168, "step": 299160 }, { - "epoch": 1.51, - "learning_rate": 7.359732809985317e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018367623081489237, + "loss": 0.0125, "step": 299170 }, { - "epoch": 1.51, - "learning_rate": 7.358976040683917e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.0001836723425985209, + "loss": 0.0122, "step": 299180 }, { - "epoch": 1.51, - "learning_rate": 7.358219271382516e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018366845438214942, + "loss": 0.0142, "step": 299190 }, { - "epoch": 1.51, - "learning_rate": 7.357462502081115e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.000183664566165778, + "loss": 0.0144, "step": 299200 }, { - "epoch": 1.51, - "learning_rate": 7.356705732779714e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018366067794940653, + "loss": 0.0136, "step": 299210 }, { - "epoch": 1.51, - "learning_rate": 7.355948963478314e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018365678973303505, + "loss": 0.0148, "step": 299220 }, { - "epoch": 1.51, - "learning_rate": 7.355192194176912e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018365290151666356, + "loss": 0.0142, "step": 299230 }, { - "epoch": 1.51, - "learning_rate": 7.354435424875511e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001836490133002921, + "loss": 0.0165, "step": 299240 }, { - "epoch": 1.51, - "learning_rate": 7.353678655574111e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018364512508392067, + "loss": 0.0141, "step": 299250 }, { - "epoch": 1.51, - "learning_rate": 7.352921886272709e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001836412368675492, + "loss": 0.0153, "step": 299260 }, { - "epoch": 1.51, - "learning_rate": 7.352165116971308e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018363734865117773, + "loss": 0.0174, "step": 299270 }, { - "epoch": 1.51, - "learning_rate": 7.351408347669907e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018363346043480624, + "loss": 0.0142, "step": 299280 }, { - "epoch": 1.51, - "learning_rate": 7.350651578368506e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001836295722184348, + "loss": 0.0192, "step": 299290 }, { - "epoch": 1.51, - "learning_rate": 7.349894809067104e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018362568400206333, + "loss": 0.0117, "step": 299300 }, { - "epoch": 1.51, - "learning_rate": 7.349138039765704e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018362179578569187, + "loss": 0.0115, "step": 299310 }, { - "epoch": 1.51, - "learning_rate": 7.348381270464302e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018361790756932038, + "loss": 0.0132, "step": 299320 }, { - "epoch": 1.51, - "learning_rate": 7.347624501162901e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018361401935294895, + "loss": 0.0188, "step": 299330 }, { - "epoch": 1.51, - "learning_rate": 7.346867731861501e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018361013113657747, + "loss": 0.0129, "step": 299340 }, { - "epoch": 1.51, - "learning_rate": 7.346110962560099e-05, - "loss": 0.0052, + "epoch": 0.78, + "learning_rate": 0.000183606242920206, + "loss": 0.0161, "step": 299350 }, { - "epoch": 1.51, - "learning_rate": 7.345354193258698e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018360235470383452, + "loss": 0.0128, "step": 299360 }, { - "epoch": 1.51, - "learning_rate": 7.344597423957297e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001835984664874631, + "loss": 0.0182, "step": 299370 }, { - "epoch": 1.51, - "learning_rate": 7.343840654655896e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.0001835945782710916, + "loss": 0.0145, "step": 299380 }, { - "epoch": 1.51, - "learning_rate": 7.343083885354496e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.00018359069005472015, + "loss": 0.0137, "step": 299390 }, { - "epoch": 1.51, - "learning_rate": 7.342327116053094e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018358680183834866, + "loss": 0.0131, "step": 299400 }, { - "epoch": 1.51, - "learning_rate": 7.341570346751693e-05, - "loss": 0.0111, + "epoch": 0.78, + "learning_rate": 0.00018358291362197723, + "loss": 0.0151, "step": 299410 }, { - "epoch": 1.51, - "learning_rate": 7.340813577450293e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018357902540560577, + "loss": 0.0126, "step": 299420 }, { - "epoch": 1.51, - "learning_rate": 7.340056808148891e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001835751371892343, + "loss": 0.0105, "step": 299430 }, { - "epoch": 1.51, - "learning_rate": 7.33930003884749e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018357124897286283, + "loss": 0.0146, "step": 299440 }, { - "epoch": 1.51, - "learning_rate": 7.338543269546089e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018356736075649137, + "loss": 0.0155, "step": 299450 }, { - "epoch": 1.51, - "learning_rate": 7.337786500244688e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001835634725401199, + "loss": 0.0116, "step": 299460 }, { - "epoch": 1.51, - "learning_rate": 7.337029730943288e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018355958432374843, + "loss": 0.0149, "step": 299470 }, { - "epoch": 1.51, - "learning_rate": 7.336272961641886e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018355569610737697, + "loss": 0.0179, "step": 299480 }, { - "epoch": 1.51, - "learning_rate": 7.335516192340485e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018355180789100548, + "loss": 0.0153, "step": 299490 }, { - "epoch": 1.51, - "learning_rate": 7.334759423039085e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018354791967463405, + "loss": 0.0108, "step": 299500 }, { - "epoch": 1.51, - "learning_rate": 7.334002653737683e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018354403145826257, + "loss": 0.0163, "step": 299510 }, { - "epoch": 1.51, - "learning_rate": 7.333245884436282e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001835401432418911, + "loss": 0.0164, "step": 299520 }, { - "epoch": 1.51, - "learning_rate": 7.33248911513488e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018353625502551962, + "loss": 0.0172, "step": 299530 }, { - "epoch": 1.51, - "learning_rate": 7.33173234583348e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.0001835323668091482, + "loss": 0.0145, "step": 299540 }, { - "epoch": 1.51, - "learning_rate": 7.33097557653208e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.0001835284785927767, + "loss": 0.0117, "step": 299550 }, { - "epoch": 1.51, - "learning_rate": 7.330218807230678e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018352459037640525, + "loss": 0.0129, "step": 299560 }, { - "epoch": 1.51, - "learning_rate": 7.329462037929277e-05, - "loss": 0.0046, + "epoch": 0.78, + "learning_rate": 0.00018352070216003376, + "loss": 0.0145, "step": 299570 }, { - "epoch": 1.51, - "learning_rate": 7.328705268627877e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018351681394366233, + "loss": 0.0151, "step": 299580 }, { - "epoch": 1.51, - "learning_rate": 7.327948499326475e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018351292572729087, + "loss": 0.0112, "step": 299590 }, { - "epoch": 1.51, - "learning_rate": 7.327191730025074e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.0001835090375109194, + "loss": 0.0144, "step": 299600 }, { - "epoch": 1.51, - "learning_rate": 7.326434960723672e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018350514929454793, + "loss": 0.012, "step": 299610 }, { - "epoch": 1.51, - "learning_rate": 7.32567819142227e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.00018350126107817647, + "loss": 0.0135, "step": 299620 }, { - "epoch": 1.51, - "learning_rate": 7.32492142212087e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.000183497372861805, + "loss": 0.0158, "step": 299630 }, { - "epoch": 1.51, - "learning_rate": 7.32416465281947e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018349348464543353, + "loss": 0.018, "step": 299640 }, { - "epoch": 1.51, - "learning_rate": 7.323407883518068e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018348959642906207, + "loss": 0.0158, "step": 299650 }, { - "epoch": 1.51, - "learning_rate": 7.322651114216667e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.0001834857082126906, + "loss": 0.014, "step": 299660 }, { - "epoch": 1.51, - "learning_rate": 7.321894344915267e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018348181999631915, + "loss": 0.0159, "step": 299670 }, { - "epoch": 1.51, - "learning_rate": 7.321137575613865e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018347793177994767, + "loss": 0.0106, "step": 299680 }, { - "epoch": 1.51, - "learning_rate": 7.320380806312464e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001834740435635762, + "loss": 0.0166, "step": 299690 }, { - "epoch": 1.51, - "learning_rate": 7.319624037011064e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018347015534720475, + "loss": 0.0147, "step": 299700 }, { - "epoch": 1.51, - "learning_rate": 7.318867267709662e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.0001834662671308333, + "loss": 0.0149, "step": 299710 }, { - "epoch": 1.51, - "learning_rate": 7.318110498408261e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.0001834623789144618, + "loss": 0.0137, "step": 299720 }, { - "epoch": 1.51, - "learning_rate": 7.31735372910686e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018345849069809035, + "loss": 0.0124, "step": 299730 }, { - "epoch": 1.51, - "learning_rate": 7.316596959805459e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018345460248171886, + "loss": 0.0136, "step": 299740 }, { - "epoch": 1.51, - "learning_rate": 7.315840190504059e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018345071426534743, + "loss": 0.0094, "step": 299750 }, { - "epoch": 1.51, - "learning_rate": 7.315083421202657e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018344682604897597, + "loss": 0.0159, "step": 299760 }, { - "epoch": 1.51, - "learning_rate": 7.314326651901256e-05, - "loss": 0.0051, + "epoch": 0.78, + "learning_rate": 0.00018344293783260449, + "loss": 0.013, "step": 299770 }, { - "epoch": 1.51, - "learning_rate": 7.313569882599856e-05, - "loss": 0.0086, + "epoch": 0.78, + "learning_rate": 0.000183439049616233, + "loss": 0.0149, "step": 299780 }, { - "epoch": 1.51, - "learning_rate": 7.312813113298454e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018343516139986157, + "loss": 0.0126, "step": 299790 }, { - "epoch": 1.51, - "learning_rate": 7.312056343997053e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.0001834312731834901, + "loss": 0.0181, "step": 299800 }, { - "epoch": 1.51, - "learning_rate": 7.311299574695652e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018342738496711863, + "loss": 0.0138, "step": 299810 }, { - "epoch": 1.51, - "learning_rate": 7.310542805394251e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018342349675074717, + "loss": 0.0138, "step": 299820 }, { - "epoch": 1.51, - "learning_rate": 7.30978603609285e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001834196085343757, + "loss": 0.0135, "step": 299830 }, { - "epoch": 1.51, - "learning_rate": 7.309029266791449e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018341572031800425, + "loss": 0.0153, "step": 299840 }, { - "epoch": 1.51, - "learning_rate": 7.308272497490048e-05, - "loss": 0.0091, + "epoch": 0.78, + "learning_rate": 0.00018341183210163276, + "loss": 0.0107, "step": 299850 }, { - "epoch": 1.51, - "learning_rate": 7.307515728188648e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.0001834079438852613, + "loss": 0.0152, "step": 299860 }, { - "epoch": 1.51, - "learning_rate": 7.306758958887246e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018340405566888985, + "loss": 0.0162, "step": 299870 }, { - "epoch": 1.51, - "learning_rate": 7.306002189585845e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001834001674525184, + "loss": 0.0114, "step": 299880 }, { - "epoch": 1.51, - "learning_rate": 7.305245420284443e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001833962792361469, + "loss": 0.0147, "step": 299890 }, { - "epoch": 1.51, - "learning_rate": 7.304488650983043e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018339239101977545, + "loss": 0.0143, "step": 299900 }, { - "epoch": 1.51, - "learning_rate": 7.303731881681642e-05, - "loss": 0.0049, + "epoch": 0.78, + "learning_rate": 0.00018338850280340401, + "loss": 0.0176, "step": 299910 }, { - "epoch": 1.51, - "learning_rate": 7.30297511238024e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018338461458703253, + "loss": 0.0151, "step": 299920 }, { - "epoch": 1.51, - "learning_rate": 7.302218343078839e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018338072637066107, + "loss": 0.0125, "step": 299930 }, { - "epoch": 1.51, - "learning_rate": 7.301461573777438e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018337683815428959, + "loss": 0.0187, "step": 299940 }, { - "epoch": 1.51, - "learning_rate": 7.300704804476038e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.00018337294993791815, + "loss": 0.0145, "step": 299950 }, { - "epoch": 1.51, - "learning_rate": 7.299948035174636e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018336906172154667, + "loss": 0.0156, "step": 299960 }, { - "epoch": 1.51, - "learning_rate": 7.299191265873235e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.0001833651735051752, + "loss": 0.0169, "step": 299970 }, { - "epoch": 1.51, - "learning_rate": 7.298434496571834e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018336128528880372, + "loss": 0.0149, "step": 299980 }, { - "epoch": 1.51, - "learning_rate": 7.297677727270433e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018335739707243227, + "loss": 0.0106, "step": 299990 }, { - "epoch": 1.51, - "learning_rate": 7.296920957969033e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.0001833535088560608, + "loss": 0.0111, "step": 300000 }, { - "epoch": 1.51, - "eval_cer": 0.9144518183767796, - "eval_loss": 0.0054466393776237965, - "eval_runtime": 116.3507, - "eval_samples_per_second": 17.189, - "eval_steps_per_second": 4.297, + "epoch": 0.78, + "eval_cer": 0.881688689953826, + "eval_loss": 0.009534839540719986, + "eval_runtime": 107.6279, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 300000 }, { - "epoch": 1.51, - "learning_rate": 7.29616418866763e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018334962063968935, + "loss": 0.0164, "step": 300010 }, { - "epoch": 1.51, - "learning_rate": 7.29540741936623e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018334573242331786, + "loss": 0.0125, "step": 300020 }, { - "epoch": 1.51, - "learning_rate": 7.29465065006483e-05, - "loss": 0.0092, + "epoch": 0.78, + "learning_rate": 0.0001833418442069464, + "loss": 0.0183, "step": 300030 }, { - "epoch": 1.51, - "learning_rate": 7.293893880763428e-05, - "loss": 0.014, + "epoch": 0.78, + "learning_rate": 0.00018333795599057495, + "loss": 0.0127, "step": 300040 }, { - "epoch": 1.51, - "learning_rate": 7.293137111462027e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001833340677742035, + "loss": 0.0168, "step": 300050 }, { - "epoch": 1.51, - "learning_rate": 7.292380342160625e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.000183330179557832, + "loss": 0.0135, "step": 300060 }, { - "epoch": 1.51, - "learning_rate": 7.291623572859225e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018332629134146055, + "loss": 0.02, "step": 300070 }, { - "epoch": 1.51, - "learning_rate": 7.290866803557824e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018332240312508911, + "loss": 0.0152, "step": 300080 }, { - "epoch": 1.51, - "learning_rate": 7.290110034256423e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018331851490871763, + "loss": 0.0216, "step": 300090 }, { - "epoch": 1.51, - "learning_rate": 7.289353264955022e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018331462669234614, + "loss": 0.015, "step": 300100 }, { - "epoch": 1.51, - "learning_rate": 7.288596495653622e-05, - "loss": 0.0047, + "epoch": 0.78, + "learning_rate": 0.00018331073847597468, + "loss": 0.0151, "step": 300110 }, { - "epoch": 1.51, - "learning_rate": 7.28783972635222e-05, - "loss": 0.01, + "epoch": 0.78, + "learning_rate": 0.00018330685025960325, + "loss": 0.0157, "step": 300120 }, { - "epoch": 1.51, - "learning_rate": 7.287082957050819e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018330296204323177, + "loss": 0.0107, "step": 300130 }, { - "epoch": 1.51, - "learning_rate": 7.286326187749417e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.0001832990738268603, + "loss": 0.012, "step": 300140 }, { - "epoch": 1.51, - "learning_rate": 7.285569418448017e-05, - "loss": 0.0104, + "epoch": 0.78, + "learning_rate": 0.00018329518561048882, + "loss": 0.0145, "step": 300150 }, { - "epoch": 1.51, - "learning_rate": 7.284812649146616e-05, - "loss": 0.0045, + "epoch": 0.78, + "learning_rate": 0.0001832912973941174, + "loss": 0.0135, "step": 300160 }, { - "epoch": 1.51, - "learning_rate": 7.284055879845215e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001832874091777459, + "loss": 0.0143, "step": 300170 }, { - "epoch": 1.51, - "learning_rate": 7.283299110543814e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018328352096137445, + "loss": 0.0153, "step": 300180 }, { - "epoch": 1.51, - "learning_rate": 7.282542341242414e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018327963274500296, + "loss": 0.0134, "step": 300190 }, { - "epoch": 1.51, - "learning_rate": 7.281785571941012e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018327574452863153, + "loss": 0.0143, "step": 300200 }, { - "epoch": 1.51, - "learning_rate": 7.281028802639611e-05, - "loss": 0.0055, + "epoch": 0.78, + "learning_rate": 0.00018327185631226005, + "loss": 0.0149, "step": 300210 }, { - "epoch": 1.51, - "learning_rate": 7.28027203333821e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.0001832679680958886, + "loss": 0.0162, "step": 300220 }, { - "epoch": 1.51, - "learning_rate": 7.279515264036809e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001832640798795171, + "loss": 0.0125, "step": 300230 }, { - "epoch": 1.51, - "learning_rate": 7.278758494735407e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018326019166314564, + "loss": 0.0116, "step": 300240 }, { - "epoch": 1.51, - "learning_rate": 7.278001725434006e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018325630344677419, + "loss": 0.0161, "step": 300250 }, { - "epoch": 1.51, - "learning_rate": 7.277244956132605e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018325241523040273, + "loss": 0.0176, "step": 300260 }, { - "epoch": 1.51, - "learning_rate": 7.276488186831204e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018324852701403124, + "loss": 0.0125, "step": 300270 }, { - "epoch": 1.51, - "learning_rate": 7.275731417529804e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018324463879765978, + "loss": 0.0146, "step": 300280 }, { - "epoch": 1.51, - "learning_rate": 7.274974648228402e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018324075058128835, + "loss": 0.0132, "step": 300290 }, { - "epoch": 1.52, - "learning_rate": 7.274217878927001e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.00018323686236491687, + "loss": 0.0105, "step": 300300 }, { - "epoch": 1.52, - "learning_rate": 7.273461109625601e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001832329741485454, + "loss": 0.021, "step": 300310 }, { - "epoch": 1.52, - "learning_rate": 7.272704340324199e-05, - "loss": 0.005, + "epoch": 0.78, + "learning_rate": 0.00018322908593217392, + "loss": 0.0197, "step": 300320 }, { - "epoch": 1.52, - "learning_rate": 7.271947571022798e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.0001832251977158025, + "loss": 0.0161, "step": 300330 }, { - "epoch": 1.52, - "learning_rate": 7.271190801721397e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.000183221309499431, + "loss": 0.015, "step": 300340 }, { - "epoch": 1.52, - "learning_rate": 7.270434032419996e-05, - "loss": 0.0092, + "epoch": 0.78, + "learning_rate": 0.00018321742128305955, + "loss": 0.015, "step": 300350 }, { - "epoch": 1.52, - "learning_rate": 7.269677263118596e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018321353306668806, + "loss": 0.0138, "step": 300360 }, { - "epoch": 1.52, - "learning_rate": 7.268920493817194e-05, - "loss": 0.0102, + "epoch": 0.78, + "learning_rate": 0.00018320964485031663, + "loss": 0.014, "step": 300370 }, { - "epoch": 1.52, - "learning_rate": 7.268163724515793e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018320575663394515, + "loss": 0.0191, "step": 300380 }, { - "epoch": 1.52, - "learning_rate": 7.267406955214393e-05, - "loss": 0.0042, + "epoch": 0.78, + "learning_rate": 0.0001832018684175737, + "loss": 0.0115, "step": 300390 }, { - "epoch": 1.52, - "learning_rate": 7.266650185912991e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001831979802012022, + "loss": 0.0129, "step": 300400 }, { - "epoch": 1.52, - "learning_rate": 7.26589341661159e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018319409198483077, + "loss": 0.0136, "step": 300410 }, { - "epoch": 1.52, - "learning_rate": 7.265136647310188e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018319020376845929, + "loss": 0.0133, "step": 300420 }, { - "epoch": 1.52, - "learning_rate": 7.264379878008788e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018318631555208783, + "loss": 0.0132, "step": 300430 }, { - "epoch": 1.52, - "learning_rate": 7.263623108707387e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018318242733571634, + "loss": 0.018, "step": 300440 }, { - "epoch": 1.52, - "learning_rate": 7.262866339405986e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001831785391193449, + "loss": 0.0134, "step": 300450 }, { - "epoch": 1.52, - "learning_rate": 7.262109570104585e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018317465090297345, + "loss": 0.0159, "step": 300460 }, { - "epoch": 1.52, - "learning_rate": 7.261352800803185e-05, - "loss": 0.0055, + "epoch": 0.78, + "learning_rate": 0.00018317076268660197, + "loss": 0.0168, "step": 300470 }, { - "epoch": 1.52, - "learning_rate": 7.260596031501783e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.0001831668744702305, + "loss": 0.0136, "step": 300480 }, { - "epoch": 1.52, - "learning_rate": 7.259839262200382e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018316298625385902, + "loss": 0.0172, "step": 300490 }, { - "epoch": 1.52, - "learning_rate": 7.25908249289898e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.0001831590980374876, + "loss": 0.0123, "step": 300500 }, { - "epoch": 1.52, - "learning_rate": 7.25832572359758e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001831552098211161, + "loss": 0.0162, "step": 300510 }, { - "epoch": 1.52, - "learning_rate": 7.25756895429618e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018315132160474465, + "loss": 0.0148, "step": 300520 }, { - "epoch": 1.52, - "learning_rate": 7.256812184994778e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018314743338837316, + "loss": 0.0157, "step": 300530 }, { - "epoch": 1.52, - "learning_rate": 7.256055415693377e-05, - "loss": 0.0077, + "epoch": 0.78, + "learning_rate": 0.00018314354517200173, + "loss": 0.0153, "step": 300540 }, { - "epoch": 1.52, - "learning_rate": 7.255298646391977e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018313965695563025, + "loss": 0.0184, "step": 300550 }, { - "epoch": 1.52, - "learning_rate": 7.254541877090575e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.0001831357687392588, + "loss": 0.0113, "step": 300560 }, { - "epoch": 1.52, - "learning_rate": 7.253785107789173e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.0001831318805228873, + "loss": 0.0172, "step": 300570 }, { - "epoch": 1.52, - "learning_rate": 7.253028338487772e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.00018312799230651587, + "loss": 0.0134, "step": 300580 }, { - "epoch": 1.52, - "learning_rate": 7.25227156918637e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018312410409014439, + "loss": 0.0145, "step": 300590 }, { - "epoch": 1.52, - "learning_rate": 7.25151479988497e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018312021587377293, + "loss": 0.0165, "step": 300600 }, { - "epoch": 1.52, - "learning_rate": 7.25075803058357e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018311632765740144, + "loss": 0.0163, "step": 300610 }, { - "epoch": 1.52, - "learning_rate": 7.250001261282168e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018311243944103, + "loss": 0.0149, "step": 300620 }, { - "epoch": 1.52, - "learning_rate": 7.249244491980767e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018310855122465855, + "loss": 0.0127, "step": 300630 }, { - "epoch": 1.52, - "learning_rate": 7.248487722679367e-05, - "loss": 0.0053, + "epoch": 0.78, + "learning_rate": 0.00018310466300828707, + "loss": 0.0148, "step": 300640 }, { - "epoch": 1.52, - "learning_rate": 7.247730953377965e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018310077479191558, + "loss": 0.0198, "step": 300650 }, { - "epoch": 1.52, - "learning_rate": 7.246974184076564e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018309688657554415, + "loss": 0.0156, "step": 300660 }, { - "epoch": 1.52, - "learning_rate": 7.246217414775164e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.0001830929983591727, + "loss": 0.0148, "step": 300670 }, { - "epoch": 1.52, - "learning_rate": 7.245460645473762e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.0001830891101428012, + "loss": 0.0172, "step": 300680 }, { - "epoch": 1.52, - "learning_rate": 7.244703876172361e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018308522192642975, + "loss": 0.0125, "step": 300690 }, { - "epoch": 1.52, - "learning_rate": 7.24394710687096e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.0001830813337100583, + "loss": 0.0153, "step": 300700 }, { - "epoch": 1.52, - "learning_rate": 7.243190337569559e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018307744549368683, + "loss": 0.0132, "step": 300710 }, { - "epoch": 1.52, - "learning_rate": 7.242433568268159e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018307355727731535, + "loss": 0.0112, "step": 300720 }, { - "epoch": 1.52, - "learning_rate": 7.241676798966757e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.0001830696690609439, + "loss": 0.0126, "step": 300730 }, { - "epoch": 1.52, - "learning_rate": 7.240920029665356e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.0001830657808445724, + "loss": 0.0125, "step": 300740 }, { - "epoch": 1.52, - "learning_rate": 7.240163260363956e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018306189262820097, + "loss": 0.0185, "step": 300750 }, { - "epoch": 1.52, - "learning_rate": 7.239406491062554e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018305800441182948, + "loss": 0.0126, "step": 300760 }, { - "epoch": 1.52, - "learning_rate": 7.238649721761153e-05, - "loss": 0.0049, + "epoch": 0.78, + "learning_rate": 0.00018305411619545803, + "loss": 0.0122, "step": 300770 }, { - "epoch": 1.52, - "learning_rate": 7.237892952459751e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018305022797908654, + "loss": 0.011, "step": 300780 }, { - "epoch": 1.52, - "learning_rate": 7.237136183158351e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001830463397627151, + "loss": 0.0148, "step": 300790 }, { - "epoch": 1.52, - "learning_rate": 7.23637941385695e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018304245154634365, + "loss": 0.0141, "step": 300800 }, { - "epoch": 1.52, - "learning_rate": 7.235622644555549e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018303856332997217, + "loss": 0.0113, "step": 300810 }, { - "epoch": 1.52, - "learning_rate": 7.234865875254148e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.00018303467511360068, + "loss": 0.0175, "step": 300820 }, { - "epoch": 1.52, - "learning_rate": 7.234109105952748e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018303078689722925, + "loss": 0.0139, "step": 300830 }, { - "epoch": 1.52, - "learning_rate": 7.233352336651346e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.0001830268986808578, + "loss": 0.0146, "step": 300840 }, { - "epoch": 1.52, - "learning_rate": 7.232595567349945e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001830230104644863, + "loss": 0.0119, "step": 300850 }, { - "epoch": 1.52, - "learning_rate": 7.231838798048543e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018301912224811485, + "loss": 0.0151, "step": 300860 }, { - "epoch": 1.52, - "learning_rate": 7.231082028747142e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001830152340317434, + "loss": 0.0149, "step": 300870 }, { - "epoch": 1.52, - "learning_rate": 7.230325259445741e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018301134581537193, + "loss": 0.0164, "step": 300880 }, { - "epoch": 1.52, - "learning_rate": 7.22956849014434e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018300745759900044, + "loss": 0.0133, "step": 300890 }, { - "epoch": 1.52, - "learning_rate": 7.228811720842939e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018300356938262899, + "loss": 0.0145, "step": 300900 }, { - "epoch": 1.52, - "learning_rate": 7.228054951541538e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018299968116625753, + "loss": 0.0155, "step": 300910 }, { - "epoch": 1.52, - "learning_rate": 7.227298182240138e-05, - "loss": 0.0077, + "epoch": 0.78, + "learning_rate": 0.00018299579294988607, + "loss": 0.0121, "step": 300920 }, { - "epoch": 1.52, - "learning_rate": 7.226541412938736e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018299190473351458, + "loss": 0.0109, "step": 300930 }, { - "epoch": 1.52, - "learning_rate": 7.225784643637335e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018298801651714313, + "loss": 0.0154, "step": 300940 }, { - "epoch": 1.52, - "learning_rate": 7.225027874335933e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.0001829841283007717, + "loss": 0.0164, "step": 300950 }, { - "epoch": 1.52, - "learning_rate": 7.224271105034533e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001829802400844002, + "loss": 0.0128, "step": 300960 }, { - "epoch": 1.52, - "learning_rate": 7.223514335733132e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018297635186802872, + "loss": 0.015, "step": 300970 }, { - "epoch": 1.52, - "learning_rate": 7.22275756643173e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018297246365165727, + "loss": 0.0087, "step": 300980 }, { - "epoch": 1.52, - "learning_rate": 7.22200079713033e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.00018296857543528578, + "loss": 0.0132, "step": 300990 }, { - "epoch": 1.52, - "learning_rate": 7.22124402782893e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018296468721891435, + "loss": 0.0151, "step": 301000 }, { - "epoch": 1.52, - "eval_cer": 0.9144430848116509, - "eval_loss": 0.00536463363096118, - "eval_runtime": 116.4459, - "eval_samples_per_second": 17.175, - "eval_steps_per_second": 4.294, + "epoch": 0.78, + "eval_cer": 0.8817250805141147, + "eval_loss": 0.009607135318219662, + "eval_runtime": 107.6603, + "eval_samples_per_second": 18.577, + "eval_steps_per_second": 4.644, "step": 301000 }, { - "epoch": 1.52, - "learning_rate": 7.220487258527528e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.0001829607990025429, + "loss": 0.0145, "step": 301010 }, { - "epoch": 1.52, - "learning_rate": 7.219730489226127e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.0001829569107861714, + "loss": 0.0154, "step": 301020 }, { - "epoch": 1.52, - "learning_rate": 7.218973719924725e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.00018295302256979995, + "loss": 0.0118, "step": 301030 }, { - "epoch": 1.52, - "learning_rate": 7.218216950623325e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.0001829491343534285, + "loss": 0.017, "step": 301040 }, { - "epoch": 1.52, - "learning_rate": 7.217460181321924e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018294524613705703, + "loss": 0.0143, "step": 301050 }, { - "epoch": 1.52, - "learning_rate": 7.216703412020523e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018294135792068554, + "loss": 0.0156, "step": 301060 }, { - "epoch": 1.52, - "learning_rate": 7.215946642719122e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.00018293746970431409, + "loss": 0.0151, "step": 301070 }, { - "epoch": 1.52, - "learning_rate": 7.215189873417722e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018293358148794263, + "loss": 0.0205, "step": 301080 }, { - "epoch": 1.52, - "learning_rate": 7.21443310411632e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018292969327157117, + "loss": 0.0089, "step": 301090 }, { - "epoch": 1.52, - "learning_rate": 7.213676334814919e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018292580505519968, + "loss": 0.0172, "step": 301100 }, { - "epoch": 1.52, - "learning_rate": 7.212919565513517e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018292191683882823, + "loss": 0.0151, "step": 301110 }, { - "epoch": 1.52, - "learning_rate": 7.212162796212117e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.0001829180286224568, + "loss": 0.0137, "step": 301120 }, { - "epoch": 1.52, - "learning_rate": 7.211406026910716e-05, - "loss": 0.0057, + "epoch": 0.78, + "learning_rate": 0.0001829141404060853, + "loss": 0.0162, "step": 301130 }, { - "epoch": 1.52, - "learning_rate": 7.210649257609314e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018291025218971382, + "loss": 0.0151, "step": 301140 }, { - "epoch": 1.52, - "learning_rate": 7.209892488307914e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018290636397334236, + "loss": 0.0165, "step": 301150 }, { - "epoch": 1.52, - "learning_rate": 7.209135719006513e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018290247575697093, + "loss": 0.0146, "step": 301160 }, { - "epoch": 1.52, - "learning_rate": 7.208378949705112e-05, - "loss": 0.0048, + "epoch": 0.78, + "learning_rate": 0.00018289858754059945, + "loss": 0.0128, "step": 301170 }, { - "epoch": 1.52, - "learning_rate": 7.207622180403711e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.000182894699324228, + "loss": 0.0138, "step": 301180 }, { - "epoch": 1.52, - "learning_rate": 7.206865411102309e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001828908111078565, + "loss": 0.0147, "step": 301190 }, { - "epoch": 1.52, - "learning_rate": 7.206108641800909e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018288692289148507, + "loss": 0.0123, "step": 301200 }, { - "epoch": 1.52, - "learning_rate": 7.205351872499507e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.0001828830346751136, + "loss": 0.0192, "step": 301210 }, { - "epoch": 1.52, - "learning_rate": 7.204595103198106e-05, - "loss": 0.0094, + "epoch": 0.78, + "learning_rate": 0.00018287914645874213, + "loss": 0.0131, "step": 301220 }, { - "epoch": 1.52, - "learning_rate": 7.203838333896705e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018287525824237064, + "loss": 0.018, "step": 301230 }, { - "epoch": 1.52, - "learning_rate": 7.203081564595304e-05, - "loss": 0.0104, + "epoch": 0.78, + "learning_rate": 0.00018287137002599919, + "loss": 0.0113, "step": 301240 }, { - "epoch": 1.52, - "learning_rate": 7.202324795293904e-05, - "loss": 0.0098, + "epoch": 0.78, + "learning_rate": 0.00018286748180962773, + "loss": 0.012, "step": 301250 }, { - "epoch": 1.52, - "learning_rate": 7.201568025992502e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018286359359325627, + "loss": 0.0143, "step": 301260 }, { - "epoch": 1.52, - "learning_rate": 7.200811256691101e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018285970537688478, + "loss": 0.0158, "step": 301270 }, { - "epoch": 1.52, - "learning_rate": 7.200054487389701e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018285581716051332, + "loss": 0.0156, "step": 301280 }, { - "epoch": 1.52, - "learning_rate": 7.199297718088299e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018285192894414187, + "loss": 0.018, "step": 301290 }, { - "epoch": 1.52, - "learning_rate": 7.198540948786898e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.0001828480407277704, + "loss": 0.0129, "step": 301300 }, { - "epoch": 1.52, - "learning_rate": 7.197784179485496e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018284415251139892, + "loss": 0.017, "step": 301310 }, { - "epoch": 1.52, - "learning_rate": 7.197027410184096e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018284026429502746, + "loss": 0.0133, "step": 301320 }, { - "epoch": 1.52, - "learning_rate": 7.196270640882695e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018283637607865603, + "loss": 0.0168, "step": 301330 }, { - "epoch": 1.52, - "learning_rate": 7.195513871581294e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018283248786228455, + "loss": 0.0146, "step": 301340 }, { - "epoch": 1.52, - "learning_rate": 7.194757102279893e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001828285996459131, + "loss": 0.0137, "step": 301350 }, { - "epoch": 1.52, - "learning_rate": 7.194000332978493e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.0001828247114295416, + "loss": 0.012, "step": 301360 }, { - "epoch": 1.52, - "learning_rate": 7.193243563677091e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018282082321317017, + "loss": 0.0137, "step": 301370 }, { - "epoch": 1.52, - "learning_rate": 7.19248679437569e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.0001828169349967987, + "loss": 0.0157, "step": 301380 }, { - "epoch": 1.52, - "learning_rate": 7.191730025074288e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018281304678042723, + "loss": 0.0151, "step": 301390 }, { - "epoch": 1.52, - "learning_rate": 7.190973255772888e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018280915856405574, + "loss": 0.0148, "step": 301400 }, { - "epoch": 1.52, - "learning_rate": 7.190216486471487e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.0001828052703476843, + "loss": 0.0141, "step": 301410 }, { - "epoch": 1.52, - "learning_rate": 7.189459717170086e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018280138213131283, + "loss": 0.016, "step": 301420 }, { - "epoch": 1.52, - "learning_rate": 7.188702947868685e-05, - "loss": 0.0055, + "epoch": 0.78, + "learning_rate": 0.00018279749391494137, + "loss": 0.014, "step": 301430 }, { - "epoch": 1.52, - "learning_rate": 7.187946178567285e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018279360569856988, + "loss": 0.0132, "step": 301440 }, { - "epoch": 1.52, - "learning_rate": 7.187189409265883e-05, - "loss": 0.0055, + "epoch": 0.78, + "learning_rate": 0.00018278971748219842, + "loss": 0.0139, "step": 301450 }, { - "epoch": 1.52, - "learning_rate": 7.186432639964482e-05, - "loss": 0.0052, + "epoch": 0.78, + "learning_rate": 0.00018278582926582697, + "loss": 0.0148, "step": 301460 }, { - "epoch": 1.52, - "learning_rate": 7.18567587066308e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001827819410494555, + "loss": 0.0139, "step": 301470 }, { - "epoch": 1.52, - "learning_rate": 7.18491910136168e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018277805283308402, + "loss": 0.0124, "step": 301480 }, { - "epoch": 1.52, - "learning_rate": 7.18416233206028e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018277416461671256, + "loss": 0.0138, "step": 301490 }, { - "epoch": 1.52, - "learning_rate": 7.183405562758877e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018277027640034113, + "loss": 0.0163, "step": 301500 }, { - "epoch": 1.52, - "learning_rate": 7.182648793457476e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018276638818396965, + "loss": 0.0128, "step": 301510 }, { - "epoch": 1.52, - "learning_rate": 7.181892024156075e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.0001827624999675982, + "loss": 0.0206, "step": 301520 }, { - "epoch": 1.52, - "learning_rate": 7.181135254854675e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.0001827586117512267, + "loss": 0.0175, "step": 301530 }, { - "epoch": 1.52, - "learning_rate": 7.180378485553273e-05, - "loss": 0.0088, + "epoch": 0.78, + "learning_rate": 0.00018275472353485527, + "loss": 0.0169, "step": 301540 }, { - "epoch": 1.52, - "learning_rate": 7.179621716251872e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018275083531848379, + "loss": 0.0148, "step": 301550 }, { - "epoch": 1.52, - "learning_rate": 7.17886494695047e-05, - "loss": 0.0098, + "epoch": 0.78, + "learning_rate": 0.00018274694710211233, + "loss": 0.0137, "step": 301560 }, { - "epoch": 1.52, - "learning_rate": 7.17810817764907e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.00018274305888574084, + "loss": 0.0161, "step": 301570 }, { - "epoch": 1.52, - "learning_rate": 7.17735140834767e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001827391706693694, + "loss": 0.0124, "step": 301580 }, { - "epoch": 1.52, - "learning_rate": 7.176594639046268e-05, - "loss": 0.0057, + "epoch": 0.78, + "learning_rate": 0.00018273528245299793, + "loss": 0.0129, "step": 301590 }, { - "epoch": 1.52, - "learning_rate": 7.175837869744867e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018273139423662647, + "loss": 0.0129, "step": 301600 }, { - "epoch": 1.52, - "learning_rate": 7.175081100443467e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018272750602025498, + "loss": 0.0129, "step": 301610 }, { - "epoch": 1.52, - "learning_rate": 7.174324331142065e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018272361780388355, + "loss": 0.0155, "step": 301620 }, { - "epoch": 1.52, - "learning_rate": 7.173567561840664e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018271972958751207, + "loss": 0.0161, "step": 301630 }, { - "epoch": 1.52, - "learning_rate": 7.172810792539264e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.0001827158413711406, + "loss": 0.0163, "step": 301640 }, { - "epoch": 1.52, - "learning_rate": 7.172054023237862e-05, - "loss": 0.0055, + "epoch": 0.78, + "learning_rate": 0.00018271195315476912, + "loss": 0.0138, "step": 301650 }, { - "epoch": 1.52, - "learning_rate": 7.171297253936461e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.0001827080649383977, + "loss": 0.0199, "step": 301660 }, { - "epoch": 1.52, - "learning_rate": 7.17054048463506e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018270417672202623, + "loss": 0.0168, "step": 301670 }, { - "epoch": 1.52, - "learning_rate": 7.169783715333659e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018270028850565475, + "loss": 0.0169, "step": 301680 }, { - "epoch": 1.52, - "learning_rate": 7.169026946032258e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018269640028928326, + "loss": 0.011, "step": 301690 }, { - "epoch": 1.52, - "learning_rate": 7.168270176730857e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.0001826925120729118, + "loss": 0.0166, "step": 301700 }, { - "epoch": 1.52, - "learning_rate": 7.167513407429456e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018268862385654037, + "loss": 0.0133, "step": 301710 }, { - "epoch": 1.52, - "learning_rate": 7.166756638128056e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018268473564016889, + "loss": 0.02, "step": 301720 }, { - "epoch": 1.52, - "learning_rate": 7.165999868826654e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018268084742379743, + "loss": 0.0133, "step": 301730 }, { - "epoch": 1.52, - "learning_rate": 7.165243099525253e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018267695920742594, + "loss": 0.0145, "step": 301740 }, { - "epoch": 1.52, - "learning_rate": 7.164486330223851e-05, - "loss": 0.01, + "epoch": 0.78, + "learning_rate": 0.0001826730709910545, + "loss": 0.0138, "step": 301750 }, { - "epoch": 1.52, - "learning_rate": 7.163729560922451e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018266918277468303, + "loss": 0.0198, "step": 301760 }, { - "epoch": 1.52, - "learning_rate": 7.16297279162105e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.00018266529455831157, + "loss": 0.0138, "step": 301770 }, { - "epoch": 1.52, - "learning_rate": 7.162216022319649e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018266140634194008, + "loss": 0.0128, "step": 301780 }, { - "epoch": 1.52, - "learning_rate": 7.161459253018248e-05, - "loss": 0.0057, + "epoch": 0.78, + "learning_rate": 0.00018265751812556865, + "loss": 0.0135, "step": 301790 }, { - "epoch": 1.52, - "learning_rate": 7.160702483716848e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018265362990919716, + "loss": 0.0134, "step": 301800 }, { - "epoch": 1.52, - "learning_rate": 7.159945714415446e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001826497416928257, + "loss": 0.0106, "step": 301810 }, { - "epoch": 1.52, - "learning_rate": 7.159188945114044e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018264585347645422, + "loss": 0.0134, "step": 301820 }, { - "epoch": 1.52, - "learning_rate": 7.158432175812643e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.0001826419652600828, + "loss": 0.013, "step": 301830 }, { - "epoch": 1.52, - "learning_rate": 7.157675406511242e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.0001826380770437113, + "loss": 0.0162, "step": 301840 }, { - "epoch": 1.52, - "learning_rate": 7.156918637209841e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018263418882733985, + "loss": 0.0133, "step": 301850 }, { - "epoch": 1.52, - "learning_rate": 7.15616186790844e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018263030061096836, + "loss": 0.0106, "step": 301860 }, { - "epoch": 1.52, - "learning_rate": 7.155405098607039e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018262641239459693, + "loss": 0.0152, "step": 301870 }, { - "epoch": 1.52, - "learning_rate": 7.154648329305638e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018262252417822547, + "loss": 0.0175, "step": 301880 }, { - "epoch": 1.52, - "learning_rate": 7.153891560004238e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.00018261863596185398, + "loss": 0.0144, "step": 301890 }, { - "epoch": 1.52, - "learning_rate": 7.153134790702836e-05, - "loss": 0.0084, + "epoch": 0.78, + "learning_rate": 0.00018261474774548253, + "loss": 0.0158, "step": 301900 }, { - "epoch": 1.52, - "learning_rate": 7.152378021401435e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018261085952911107, + "loss": 0.0177, "step": 301910 }, { - "epoch": 1.52, - "learning_rate": 7.151621252100033e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001826069713127396, + "loss": 0.0155, "step": 301920 }, { - "epoch": 1.52, - "learning_rate": 7.150864482798633e-05, - "loss": 0.0056, + "epoch": 0.78, + "learning_rate": 0.00018260308309636812, + "loss": 0.0136, "step": 301930 }, { - "epoch": 1.52, - "learning_rate": 7.150107713497232e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018259919487999667, + "loss": 0.014, "step": 301940 }, { - "epoch": 1.52, - "learning_rate": 7.14935094419583e-05, - "loss": 0.0057, + "epoch": 0.78, + "learning_rate": 0.00018259530666362518, + "loss": 0.0187, "step": 301950 }, { - "epoch": 1.52, - "learning_rate": 7.14859417489443e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.00018259141844725375, + "loss": 0.018, "step": 301960 }, { - "epoch": 1.52, - "learning_rate": 7.14783740559303e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018258753023088226, + "loss": 0.0118, "step": 301970 }, { - "epoch": 1.52, - "learning_rate": 7.147080636291628e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001825836420145108, + "loss": 0.0137, "step": 301980 }, { - "epoch": 1.52, - "learning_rate": 7.146323866990227e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018257975379813932, + "loss": 0.0131, "step": 301990 }, { - "epoch": 1.52, - "learning_rate": 7.145567097688825e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001825758655817679, + "loss": 0.0156, "step": 302000 }, { - "epoch": 1.52, - "eval_cer": 0.9144489071884033, - "eval_loss": 0.0054143439047038555, - "eval_runtime": 116.5206, - "eval_samples_per_second": 17.164, - "eval_steps_per_second": 4.291, + "epoch": 0.78, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.00945495255291462, + "eval_runtime": 107.8912, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, "step": 302000 }, { - "epoch": 1.52, - "learning_rate": 7.144810328387425e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001825719773653964, + "loss": 0.0123, "step": 302010 }, { - "epoch": 1.52, - "learning_rate": 7.144053559086024e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018256808914902494, + "loss": 0.0183, "step": 302020 }, { - "epoch": 1.52, - "learning_rate": 7.143296789784623e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018256420093265346, + "loss": 0.0139, "step": 302030 }, { - "epoch": 1.52, - "learning_rate": 7.142540020483222e-05, - "loss": 0.0069, + "epoch": 0.78, + "learning_rate": 0.00018256031271628203, + "loss": 0.0136, "step": 302040 }, { - "epoch": 1.52, - "learning_rate": 7.141783251181822e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018255642449991057, + "loss": 0.0134, "step": 302050 }, { - "epoch": 1.52, - "learning_rate": 7.14102648188042e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018255253628353908, + "loss": 0.0158, "step": 302060 }, { - "epoch": 1.52, - "learning_rate": 7.140269712579019e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018254864806716763, + "loss": 0.0107, "step": 302070 }, { - "epoch": 1.52, - "learning_rate": 7.139512943277617e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.00018254475985079617, + "loss": 0.0156, "step": 302080 }, { - "epoch": 1.52, - "learning_rate": 7.138756173976217e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001825408716344247, + "loss": 0.0134, "step": 302090 }, { - "epoch": 1.52, - "learning_rate": 7.137999404674816e-05, - "loss": 0.0092, + "epoch": 0.78, + "learning_rate": 0.00018253698341805322, + "loss": 0.0156, "step": 302100 }, { - "epoch": 1.52, - "learning_rate": 7.137242635373414e-05, - "loss": 0.0076, + "epoch": 0.78, + "learning_rate": 0.00018253309520168177, + "loss": 0.0145, "step": 302110 }, { - "epoch": 1.52, - "learning_rate": 7.136485866072014e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.0001825292069853103, + "loss": 0.0114, "step": 302120 }, { - "epoch": 1.52, - "learning_rate": 7.135729096770612e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018252531876893885, + "loss": 0.0144, "step": 302130 }, { - "epoch": 1.52, - "learning_rate": 7.134972327469212e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018252143055256736, + "loss": 0.0152, "step": 302140 }, { - "epoch": 1.52, - "learning_rate": 7.13421555816781e-05, - "loss": 0.0097, + "epoch": 0.78, + "learning_rate": 0.0001825175423361959, + "loss": 0.0168, "step": 302150 }, { - "epoch": 1.52, - "learning_rate": 7.133458788866409e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018251365411982445, + "loss": 0.0185, "step": 302160 }, { - "epoch": 1.52, - "learning_rate": 7.132702019565009e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.000182509765903453, + "loss": 0.0135, "step": 302170 }, { - "epoch": 1.52, - "learning_rate": 7.131945250263607e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001825058776870815, + "loss": 0.0146, "step": 302180 }, { - "epoch": 1.52, - "learning_rate": 7.131188480962206e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018250198947071004, + "loss": 0.0127, "step": 302190 }, { - "epoch": 1.52, - "learning_rate": 7.130431711660805e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018249810125433856, + "loss": 0.0104, "step": 302200 }, { - "epoch": 1.52, - "learning_rate": 7.129674942359404e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018249421303796713, + "loss": 0.0114, "step": 302210 }, { - "epoch": 1.52, - "learning_rate": 7.128918173058004e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018249032482159567, + "loss": 0.0132, "step": 302220 }, { - "epoch": 1.52, - "learning_rate": 7.128161403756602e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018248643660522418, + "loss": 0.0131, "step": 302230 }, { - "epoch": 1.52, - "learning_rate": 7.127404634455201e-05, - "loss": 0.0083, + "epoch": 0.78, + "learning_rate": 0.0001824825483888527, + "loss": 0.009, "step": 302240 }, { - "epoch": 1.52, - "learning_rate": 7.1266478651538e-05, - "loss": 0.0059, + "epoch": 0.78, + "learning_rate": 0.00018247866017248127, + "loss": 0.0142, "step": 302250 }, { - "epoch": 1.52, - "learning_rate": 7.125891095852399e-05, - "loss": 0.009, + "epoch": 0.78, + "learning_rate": 0.0001824747719561098, + "loss": 0.0137, "step": 302260 }, { - "epoch": 1.52, - "learning_rate": 7.125134326550998e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018247088373973832, + "loss": 0.0124, "step": 302270 }, { - "epoch": 1.53, - "learning_rate": 7.124377557249596e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.00018246699552336686, + "loss": 0.0204, "step": 302280 }, { - "epoch": 1.53, - "learning_rate": 7.123620787948196e-05, - "loss": 0.0075, + "epoch": 0.78, + "learning_rate": 0.0001824631073069954, + "loss": 0.014, "step": 302290 }, { - "epoch": 1.53, - "learning_rate": 7.122864018646795e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018245921909062395, + "loss": 0.0138, "step": 302300 }, { - "epoch": 1.53, - "learning_rate": 7.122107249345394e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018245533087425246, + "loss": 0.0157, "step": 302310 }, { - "epoch": 1.53, - "learning_rate": 7.121350480043993e-05, - "loss": 0.0095, + "epoch": 0.78, + "learning_rate": 0.000182451442657881, + "loss": 0.0184, "step": 302320 }, { - "epoch": 1.53, - "learning_rate": 7.120593710742593e-05, - "loss": 0.0054, + "epoch": 0.78, + "learning_rate": 0.00018244755444150955, + "loss": 0.0154, "step": 302330 }, { - "epoch": 1.53, - "learning_rate": 7.119836941441191e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.0001824436662251381, + "loss": 0.017, "step": 302340 }, { - "epoch": 1.53, - "learning_rate": 7.11908017213979e-05, - "loss": 0.0077, + "epoch": 0.78, + "learning_rate": 0.0001824397780087666, + "loss": 0.015, "step": 302350 }, { - "epoch": 1.53, - "learning_rate": 7.118323402838388e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.00018243588979239514, + "loss": 0.0126, "step": 302360 }, { - "epoch": 1.53, - "learning_rate": 7.117566633536988e-05, - "loss": 0.0071, + "epoch": 0.78, + "learning_rate": 0.0001824320015760237, + "loss": 0.0153, "step": 302370 }, { - "epoch": 1.53, - "learning_rate": 7.116809864235587e-05, - "loss": 0.0073, + "epoch": 0.78, + "learning_rate": 0.00018242811335965223, + "loss": 0.0099, "step": 302380 }, { - "epoch": 1.53, - "learning_rate": 7.116053094934186e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018242422514328077, + "loss": 0.0143, "step": 302390 }, { - "epoch": 1.53, - "learning_rate": 7.115296325632785e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018242033692690928, + "loss": 0.0139, "step": 302400 }, { - "epoch": 1.53, - "learning_rate": 7.114539556331385e-05, - "loss": 0.0082, + "epoch": 0.78, + "learning_rate": 0.00018241644871053785, + "loss": 0.0127, "step": 302410 }, { - "epoch": 1.53, - "learning_rate": 7.113782787029983e-05, - "loss": 0.0085, + "epoch": 0.78, + "learning_rate": 0.00018241256049416637, + "loss": 0.0146, "step": 302420 }, { - "epoch": 1.53, - "learning_rate": 7.113026017728582e-05, - "loss": 0.0088, + "epoch": 0.78, + "learning_rate": 0.0001824086722777949, + "loss": 0.0158, "step": 302430 }, { - "epoch": 1.53, - "learning_rate": 7.11226924842718e-05, - "loss": 0.0096, + "epoch": 0.78, + "learning_rate": 0.00018240478406142342, + "loss": 0.0138, "step": 302440 }, { - "epoch": 1.53, - "learning_rate": 7.111512479125778e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.00018240089584505196, + "loss": 0.0153, "step": 302450 }, { - "epoch": 1.53, - "learning_rate": 7.110755709824378e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.0001823970076286805, + "loss": 0.0134, "step": 302460 }, { - "epoch": 1.53, - "learning_rate": 7.109998940522977e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.00018239311941230905, + "loss": 0.0145, "step": 302470 }, { - "epoch": 1.53, - "learning_rate": 7.109242171221576e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018238923119593756, + "loss": 0.0147, "step": 302480 }, { - "epoch": 1.53, - "learning_rate": 7.108485401920175e-05, - "loss": 0.0101, + "epoch": 0.78, + "learning_rate": 0.0001823853429795661, + "loss": 0.0209, "step": 302490 }, { - "epoch": 1.53, - "learning_rate": 7.107728632618775e-05, - "loss": 0.0096, + "epoch": 0.78, + "learning_rate": 0.00018238145476319465, + "loss": 0.0152, "step": 302500 }, { - "epoch": 1.53, - "learning_rate": 7.106971863317373e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.0001823775665468232, + "loss": 0.0126, "step": 302510 }, { - "epoch": 1.53, - "learning_rate": 7.106215094015972e-05, - "loss": 0.0061, + "epoch": 0.78, + "learning_rate": 0.0001823736783304517, + "loss": 0.016, "step": 302520 }, { - "epoch": 1.53, - "learning_rate": 7.10545832471457e-05, - "loss": 0.0089, + "epoch": 0.78, + "learning_rate": 0.00018236979011408024, + "loss": 0.0144, "step": 302530 }, { - "epoch": 1.53, - "learning_rate": 7.10470155541317e-05, - "loss": 0.0049, + "epoch": 0.78, + "learning_rate": 0.0001823659018977088, + "loss": 0.0155, "step": 302540 }, { - "epoch": 1.53, - "learning_rate": 7.10394478611177e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018236201368133733, + "loss": 0.0167, "step": 302550 }, { - "epoch": 1.53, - "learning_rate": 7.103188016810368e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.00018235812546496584, + "loss": 0.0149, "step": 302560 }, { - "epoch": 1.53, - "learning_rate": 7.102431247508967e-05, - "loss": 0.0065, + "epoch": 0.78, + "learning_rate": 0.00018235423724859438, + "loss": 0.0144, "step": 302570 }, { - "epoch": 1.53, - "learning_rate": 7.101674478207567e-05, - "loss": 0.0072, + "epoch": 0.78, + "learning_rate": 0.00018235034903222295, + "loss": 0.0133, "step": 302580 }, { - "epoch": 1.53, - "learning_rate": 7.100917708906165e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018234646081585147, + "loss": 0.017, "step": 302590 }, { - "epoch": 1.53, - "learning_rate": 7.100160939604764e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.00018234257259948, + "loss": 0.0126, "step": 302600 }, { - "epoch": 1.53, - "learning_rate": 7.099404170303364e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018233868438310852, + "loss": 0.0149, "step": 302610 }, { - "epoch": 1.53, - "learning_rate": 7.098647401001962e-05, - "loss": 0.0062, + "epoch": 0.78, + "learning_rate": 0.0001823347961667371, + "loss": 0.0108, "step": 302620 }, { - "epoch": 1.53, - "learning_rate": 7.097890631700561e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.0001823309079503656, + "loss": 0.0155, "step": 302630 }, { - "epoch": 1.53, - "learning_rate": 7.09713386239916e-05, - "loss": 0.0081, + "epoch": 0.78, + "learning_rate": 0.00018232701973399415, + "loss": 0.0117, "step": 302640 }, { - "epoch": 1.53, - "learning_rate": 7.096377093097759e-05, - "loss": 0.0096, + "epoch": 0.78, + "learning_rate": 0.00018232313151762266, + "loss": 0.0164, "step": 302650 }, { - "epoch": 1.53, - "learning_rate": 7.095620323796358e-05, - "loss": 0.0079, + "epoch": 0.78, + "learning_rate": 0.00018231924330125123, + "loss": 0.0118, "step": 302660 }, { - "epoch": 1.53, - "learning_rate": 7.094863554494957e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.00018231535508487974, + "loss": 0.0164, "step": 302670 }, { - "epoch": 1.53, - "learning_rate": 7.094106785193556e-05, - "loss": 0.0068, + "epoch": 0.78, + "learning_rate": 0.0001823114668685083, + "loss": 0.0135, "step": 302680 }, { - "epoch": 1.53, - "learning_rate": 7.093350015892156e-05, - "loss": 0.006, + "epoch": 0.78, + "learning_rate": 0.0001823075786521368, + "loss": 0.0168, "step": 302690 }, { - "epoch": 1.53, - "learning_rate": 7.092593246590754e-05, - "loss": 0.0064, + "epoch": 0.78, + "learning_rate": 0.00018230369043576534, + "loss": 0.0157, "step": 302700 }, { - "epoch": 1.53, - "learning_rate": 7.091836477289353e-05, - "loss": 0.007, + "epoch": 0.78, + "learning_rate": 0.0001822998022193939, + "loss": 0.0107, "step": 302710 }, { - "epoch": 1.53, - "learning_rate": 7.091079707987951e-05, - "loss": 0.0063, + "epoch": 0.78, + "learning_rate": 0.00018229591400302243, + "loss": 0.0118, "step": 302720 }, { - "epoch": 1.53, - "learning_rate": 7.090322938686551e-05, - "loss": 0.0093, + "epoch": 0.78, + "learning_rate": 0.00018229202578665094, + "loss": 0.0149, "step": 302730 }, { - "epoch": 1.53, - "learning_rate": 7.08956616938515e-05, - "loss": 0.0096, + "epoch": 0.78, + "learning_rate": 0.00018228813757027948, + "loss": 0.0146, "step": 302740 }, { - "epoch": 1.53, - "learning_rate": 7.088809400083749e-05, - "loss": 0.0067, + "epoch": 0.78, + "learning_rate": 0.00018228424935390805, + "loss": 0.0132, "step": 302750 }, { - "epoch": 1.53, - "learning_rate": 7.088052630782347e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018228036113753657, + "loss": 0.0146, "step": 302760 }, { - "epoch": 1.53, - "learning_rate": 7.087295861480946e-05, - "loss": 0.0087, + "epoch": 0.78, + "learning_rate": 0.0001822764729211651, + "loss": 0.0128, "step": 302770 }, { - "epoch": 1.53, - "learning_rate": 7.086539092179546e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018227258470479362, + "loss": 0.0116, "step": 302780 }, { - "epoch": 1.53, - "learning_rate": 7.085782322878144e-05, - "loss": 0.0058, + "epoch": 0.78, + "learning_rate": 0.0001822686964884222, + "loss": 0.0141, "step": 302790 }, { - "epoch": 1.53, - "learning_rate": 7.085025553576743e-05, - "loss": 0.008, + "epoch": 0.78, + "learning_rate": 0.0001822648082720507, + "loss": 0.0198, "step": 302800 }, { - "epoch": 1.53, - "learning_rate": 7.084268784275341e-05, - "loss": 0.0074, + "epoch": 0.78, + "learning_rate": 0.00018226092005567925, + "loss": 0.0135, "step": 302810 }, { - "epoch": 1.53, - "learning_rate": 7.083512014973941e-05, - "loss": 0.0066, + "epoch": 0.78, + "learning_rate": 0.00018225703183930776, + "loss": 0.015, "step": 302820 }, { - "epoch": 1.53, - "learning_rate": 7.08275524567254e-05, - "loss": 0.0078, + "epoch": 0.78, + "learning_rate": 0.00018225314362293633, + "loss": 0.0163, "step": 302830 }, { - "epoch": 1.53, - "learning_rate": 7.081998476371139e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018224925540656484, + "loss": 0.0138, "step": 302840 }, { - "epoch": 1.53, - "learning_rate": 7.081241707069738e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018224536719019339, + "loss": 0.0137, "step": 302850 }, { - "epoch": 1.53, - "learning_rate": 7.080484937768338e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.0001822414789738219, + "loss": 0.0146, "step": 302860 }, { - "epoch": 1.53, - "learning_rate": 7.079728168466936e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018223759075745047, + "loss": 0.0145, "step": 302870 }, { - "epoch": 1.53, - "learning_rate": 7.078971399165535e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018223370254107898, + "loss": 0.0165, "step": 302880 }, { - "epoch": 1.53, - "learning_rate": 7.078214629864133e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018222981432470753, + "loss": 0.0151, "step": 302890 }, { - "epoch": 1.53, - "learning_rate": 7.077457860562733e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.00018222592610833604, + "loss": 0.0132, "step": 302900 }, { - "epoch": 1.53, - "learning_rate": 7.076701091261332e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001822220378919646, + "loss": 0.0166, "step": 302910 }, { - "epoch": 1.53, - "learning_rate": 7.07594432195993e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.00018221814967559315, + "loss": 0.0157, "step": 302920 }, { - "epoch": 1.53, - "learning_rate": 7.07518755265853e-05, - "loss": 0.0098, + "epoch": 0.79, + "learning_rate": 0.00018221426145922166, + "loss": 0.0162, "step": 302930 }, { - "epoch": 1.53, - "learning_rate": 7.07443078335713e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001822103732428502, + "loss": 0.0134, "step": 302940 }, { - "epoch": 1.53, - "learning_rate": 7.073674014055728e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018220648502647872, + "loss": 0.0169, "step": 302950 }, { - "epoch": 1.53, - "learning_rate": 7.072917244754327e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.0001822025968101073, + "loss": 0.0146, "step": 302960 }, { - "epoch": 1.53, - "learning_rate": 7.072160475452925e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.0001821987085937358, + "loss": 0.011, "step": 302970 }, { - "epoch": 1.53, - "learning_rate": 7.071403706151525e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018219482037736435, + "loss": 0.0181, "step": 302980 }, { - "epoch": 1.53, - "learning_rate": 7.070646936850124e-05, - "loss": 0.0093, + "epoch": 0.79, + "learning_rate": 0.00018219093216099286, + "loss": 0.0197, "step": 302990 }, { - "epoch": 1.53, - "learning_rate": 7.069890167548722e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018218704394462143, + "loss": 0.0104, "step": 303000 }, { - "epoch": 1.53, - "eval_cer": 0.9144556999612812, - "eval_loss": 0.00549934571608901, - "eval_runtime": 116.3379, - "eval_samples_per_second": 17.191, - "eval_steps_per_second": 4.298, + "epoch": 0.79, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.009238921105861664, + "eval_runtime": 107.8053, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, "step": 303000 }, { - "epoch": 1.53, - "learning_rate": 7.069133398247322e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.00018218315572824994, + "loss": 0.0163, "step": 303010 }, { - "epoch": 1.53, - "learning_rate": 7.068376628945921e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018217926751187849, + "loss": 0.0127, "step": 303020 }, { - "epoch": 1.53, - "learning_rate": 7.06761985964452e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.000182175379295507, + "loss": 0.0149, "step": 303030 }, { - "epoch": 1.53, - "learning_rate": 7.066863090343119e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018217149107913557, + "loss": 0.0146, "step": 303040 }, { - "epoch": 1.53, - "learning_rate": 7.066106321041717e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018216760286276408, + "loss": 0.0164, "step": 303050 }, { - "epoch": 1.53, - "learning_rate": 7.065349551740317e-05, - "loss": 0.0091, + "epoch": 0.79, + "learning_rate": 0.00018216371464639262, + "loss": 0.0179, "step": 303060 }, { - "epoch": 1.53, - "learning_rate": 7.064592782438915e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018215982643002114, + "loss": 0.0168, "step": 303070 }, { - "epoch": 1.53, - "learning_rate": 7.063836013137514e-05, - "loss": 0.0095, + "epoch": 0.79, + "learning_rate": 0.0001821559382136497, + "loss": 0.0148, "step": 303080 }, { - "epoch": 1.53, - "learning_rate": 7.063079243836113e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018215204999727825, + "loss": 0.0124, "step": 303090 }, { - "epoch": 1.53, - "learning_rate": 7.062322474534712e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018214816178090676, + "loss": 0.0131, "step": 303100 }, { - "epoch": 1.53, - "learning_rate": 7.061565705233312e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001821442735645353, + "loss": 0.009, "step": 303110 }, { - "epoch": 1.53, - "learning_rate": 7.06080893593191e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018214038534816385, + "loss": 0.0166, "step": 303120 }, { - "epoch": 1.53, - "learning_rate": 7.060052166630509e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001821364971317924, + "loss": 0.0147, "step": 303130 }, { - "epoch": 1.53, - "learning_rate": 7.059295397329109e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.0001821326089154209, + "loss": 0.0144, "step": 303140 }, { - "epoch": 1.53, - "learning_rate": 7.058538628027707e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018212872069904945, + "loss": 0.012, "step": 303150 }, { - "epoch": 1.53, - "learning_rate": 7.057781858726306e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.000182124832482678, + "loss": 0.013, "step": 303160 }, { - "epoch": 1.53, - "learning_rate": 7.057025089424904e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.00018212094426630653, + "loss": 0.0139, "step": 303170 }, { - "epoch": 1.53, - "learning_rate": 7.056268320123504e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018211705604993504, + "loss": 0.0144, "step": 303180 }, { - "epoch": 1.53, - "learning_rate": 7.055511550822103e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018211316783356358, + "loss": 0.0157, "step": 303190 }, { - "epoch": 1.53, - "learning_rate": 7.054754781520702e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.0001821092796171921, + "loss": 0.013, "step": 303200 }, { - "epoch": 1.53, - "learning_rate": 7.053998012219301e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018210539140082067, + "loss": 0.0168, "step": 303210 }, { - "epoch": 1.53, - "learning_rate": 7.0532412429179e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018210150318444918, + "loss": 0.0162, "step": 303220 }, { - "epoch": 1.53, - "learning_rate": 7.052484473616499e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018209761496807772, + "loss": 0.0129, "step": 303230 }, { - "epoch": 1.53, - "learning_rate": 7.051727704315098e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018209372675170624, + "loss": 0.0147, "step": 303240 }, { - "epoch": 1.53, - "learning_rate": 7.050970935013696e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001820898385353348, + "loss": 0.013, "step": 303250 }, { - "epoch": 1.53, - "learning_rate": 7.050214165712296e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018208595031896335, + "loss": 0.0123, "step": 303260 }, { - "epoch": 1.53, - "learning_rate": 7.049457396410895e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018208206210259186, + "loss": 0.0137, "step": 303270 }, { - "epoch": 1.53, - "learning_rate": 7.048700627109494e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018207817388622038, + "loss": 0.0142, "step": 303280 }, { - "epoch": 1.53, - "learning_rate": 7.047943857808093e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018207428566984895, + "loss": 0.0126, "step": 303290 }, { - "epoch": 1.53, - "learning_rate": 7.047187088506693e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.0001820703974534775, + "loss": 0.0144, "step": 303300 }, { - "epoch": 1.53, - "learning_rate": 7.046430319205291e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.000182066509237106, + "loss": 0.0156, "step": 303310 }, { - "epoch": 1.53, - "learning_rate": 7.04567354990389e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018206262102073454, + "loss": 0.0166, "step": 303320 }, { - "epoch": 1.53, - "learning_rate": 7.044916780602488e-05, - "loss": 0.0047, + "epoch": 0.79, + "learning_rate": 0.00018205873280436309, + "loss": 0.0091, "step": 303330 }, { - "epoch": 1.53, - "learning_rate": 7.044160011301088e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018205484458799163, + "loss": 0.0148, "step": 303340 }, { - "epoch": 1.53, - "learning_rate": 7.043403241999687e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018205095637162014, + "loss": 0.0154, "step": 303350 }, { - "epoch": 1.53, - "learning_rate": 7.042646472698285e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018204706815524868, + "loss": 0.0137, "step": 303360 }, { - "epoch": 1.53, - "learning_rate": 7.041889703396885e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018204317993887723, + "loss": 0.0173, "step": 303370 }, { - "epoch": 1.53, - "learning_rate": 7.041132934095484e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018203929172250577, + "loss": 0.0156, "step": 303380 }, { - "epoch": 1.53, - "learning_rate": 7.040376164794083e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018203540350613428, + "loss": 0.0158, "step": 303390 }, { - "epoch": 1.53, - "learning_rate": 7.039619395492681e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018203151528976282, + "loss": 0.0127, "step": 303400 }, { - "epoch": 1.53, - "learning_rate": 7.03886262619128e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001820276270733914, + "loss": 0.0161, "step": 303410 }, { - "epoch": 1.53, - "learning_rate": 7.038105856889878e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001820237388570199, + "loss": 0.0155, "step": 303420 }, { - "epoch": 1.53, - "learning_rate": 7.037349087588478e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018201985064064842, + "loss": 0.0124, "step": 303430 }, { - "epoch": 1.53, - "learning_rate": 7.036592318287077e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018201596242427696, + "loss": 0.0161, "step": 303440 }, { - "epoch": 1.53, - "learning_rate": 7.035835548985676e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018201207420790548, + "loss": 0.013, "step": 303450 }, { - "epoch": 1.53, - "learning_rate": 7.035078779684275e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018200818599153405, + "loss": 0.0147, "step": 303460 }, { - "epoch": 1.53, - "learning_rate": 7.034322010382875e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.0001820042977751626, + "loss": 0.0179, "step": 303470 }, { - "epoch": 1.53, - "learning_rate": 7.033565241081473e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.0001820004095587911, + "loss": 0.0127, "step": 303480 }, { - "epoch": 1.53, - "learning_rate": 7.032808471780072e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018199652134241964, + "loss": 0.0156, "step": 303490 }, { - "epoch": 1.53, - "learning_rate": 7.03205170247867e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018199263312604819, + "loss": 0.0137, "step": 303500 }, { - "epoch": 1.53, - "learning_rate": 7.03129493317727e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018198874490967673, + "loss": 0.0166, "step": 303510 }, { - "epoch": 1.53, - "learning_rate": 7.03053816387587e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018198485669330524, + "loss": 0.0127, "step": 303520 }, { - "epoch": 1.53, - "learning_rate": 7.029781394574467e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018198096847693378, + "loss": 0.0123, "step": 303530 }, { - "epoch": 1.53, - "learning_rate": 7.029024625273067e-05, - "loss": 0.011, + "epoch": 0.79, + "learning_rate": 0.00018197708026056233, + "loss": 0.0183, "step": 303540 }, { - "epoch": 1.53, - "learning_rate": 7.028267855971666e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018197319204419087, + "loss": 0.0148, "step": 303550 }, { - "epoch": 1.53, - "learning_rate": 7.027511086670265e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.00018196930382781938, + "loss": 0.0137, "step": 303560 }, { - "epoch": 1.53, - "learning_rate": 7.026754317368864e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018196541561144792, + "loss": 0.011, "step": 303570 }, { - "epoch": 1.53, - "learning_rate": 7.025997548067464e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.0001819615273950765, + "loss": 0.0115, "step": 303580 }, { - "epoch": 1.53, - "learning_rate": 7.025240778766062e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.000181957639178705, + "loss": 0.013, "step": 303590 }, { - "epoch": 1.53, - "learning_rate": 7.024484009464661e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018195375096233352, + "loss": 0.015, "step": 303600 }, { - "epoch": 1.53, - "learning_rate": 7.02372724016326e-05, - "loss": 0.0107, + "epoch": 0.79, + "learning_rate": 0.00018194986274596206, + "loss": 0.0121, "step": 303610 }, { - "epoch": 1.53, - "learning_rate": 7.022970470861859e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018194597452959063, + "loss": 0.0155, "step": 303620 }, { - "epoch": 1.53, - "learning_rate": 7.022213701560458e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018194208631321915, + "loss": 0.0119, "step": 303630 }, { - "epoch": 1.53, - "learning_rate": 7.021456932259057e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.0001819381980968477, + "loss": 0.0142, "step": 303640 }, { - "epoch": 1.53, - "learning_rate": 7.020700162957656e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.0001819343098804762, + "loss": 0.0122, "step": 303650 }, { - "epoch": 1.53, - "learning_rate": 7.019943393656256e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018193042166410477, + "loss": 0.0167, "step": 303660 }, { - "epoch": 1.53, - "learning_rate": 7.019186624354854e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018192653344773329, + "loss": 0.0146, "step": 303670 }, { - "epoch": 1.53, - "learning_rate": 7.018429855053453e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.00018192264523136183, + "loss": 0.0133, "step": 303680 }, { - "epoch": 1.53, - "learning_rate": 7.017673085752051e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018191875701499034, + "loss": 0.0117, "step": 303690 }, { - "epoch": 1.53, - "learning_rate": 7.01691631645065e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.00018191486879861888, + "loss": 0.0121, "step": 303700 }, { - "epoch": 1.53, - "learning_rate": 7.016159547149249e-05, - "loss": 0.0091, + "epoch": 0.79, + "learning_rate": 0.00018191098058224742, + "loss": 0.0132, "step": 303710 }, { - "epoch": 1.53, - "learning_rate": 7.015402777847848e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018190709236587597, + "loss": 0.015, "step": 303720 }, { - "epoch": 1.53, - "learning_rate": 7.014646008546447e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018190320414950448, + "loss": 0.0126, "step": 303730 }, { - "epoch": 1.53, - "learning_rate": 7.013889239245046e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018189931593313302, + "loss": 0.0136, "step": 303740 }, { - "epoch": 1.53, - "learning_rate": 7.013132469943646e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018189542771676156, + "loss": 0.0212, "step": 303750 }, { - "epoch": 1.53, - "learning_rate": 7.012375700642244e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.0001818915395003901, + "loss": 0.0184, "step": 303760 }, { - "epoch": 1.53, - "learning_rate": 7.011618931340843e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018188765128401862, + "loss": 0.014, "step": 303770 }, { - "epoch": 1.53, - "learning_rate": 7.010862162039441e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018188376306764716, + "loss": 0.0168, "step": 303780 }, { - "epoch": 1.53, - "learning_rate": 7.010105392738041e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018187987485127573, + "loss": 0.0132, "step": 303790 }, { - "epoch": 1.53, - "learning_rate": 7.00934862343664e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018187598663490425, + "loss": 0.0159, "step": 303800 }, { - "epoch": 1.53, - "learning_rate": 7.008591854135239e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.0001818720984185328, + "loss": 0.0135, "step": 303810 }, { - "epoch": 1.53, - "learning_rate": 7.007835084833838e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001818682102021613, + "loss": 0.0163, "step": 303820 }, { - "epoch": 1.53, - "learning_rate": 7.007078315532438e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018186432198578987, + "loss": 0.0184, "step": 303830 }, { - "epoch": 1.53, - "learning_rate": 7.006321546231036e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.00018186043376941838, + "loss": 0.0174, "step": 303840 }, { - "epoch": 1.53, - "learning_rate": 7.005564776929635e-05, - "loss": 0.004, + "epoch": 0.79, + "learning_rate": 0.00018185654555304693, + "loss": 0.0163, "step": 303850 }, { - "epoch": 1.53, - "learning_rate": 7.004808007628233e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018185265733667544, + "loss": 0.0153, "step": 303860 }, { - "epoch": 1.53, - "learning_rate": 7.004051238326833e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.000181848769120304, + "loss": 0.0164, "step": 303870 }, { - "epoch": 1.53, - "learning_rate": 7.003294469025432e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018184488090393252, + "loss": 0.0134, "step": 303880 }, { - "epoch": 1.53, - "learning_rate": 7.00253769972403e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018184099268756107, + "loss": 0.013, "step": 303890 }, { - "epoch": 1.53, - "learning_rate": 7.00178093042263e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018183710447118958, + "loss": 0.0128, "step": 303900 }, { - "epoch": 1.53, - "learning_rate": 7.00102416112123e-05, - "loss": 0.0087, + "epoch": 0.79, + "learning_rate": 0.00018183321625481815, + "loss": 0.0167, "step": 303910 }, { - "epoch": 1.53, - "learning_rate": 7.000267391819828e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018182932803844666, + "loss": 0.0149, "step": 303920 }, { - "epoch": 1.53, - "learning_rate": 6.999510622518427e-05, - "loss": 0.0092, + "epoch": 0.79, + "learning_rate": 0.0001818254398220752, + "loss": 0.014, "step": 303930 }, { - "epoch": 1.53, - "learning_rate": 6.998753853217025e-05, - "loss": 0.0053, + "epoch": 0.79, + "learning_rate": 0.00018182155160570372, + "loss": 0.0154, "step": 303940 }, { - "epoch": 1.53, - "learning_rate": 6.997997083915625e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018181766338933226, + "loss": 0.012, "step": 303950 }, { - "epoch": 1.53, - "learning_rate": 6.997240314614224e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018181377517296083, + "loss": 0.0172, "step": 303960 }, { - "epoch": 1.53, - "learning_rate": 6.996483545312822e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018180988695658934, + "loss": 0.0165, "step": 303970 }, { - "epoch": 1.53, - "learning_rate": 6.995726776011422e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018180599874021789, + "loss": 0.0175, "step": 303980 }, { - "epoch": 1.53, - "learning_rate": 6.994970006710021e-05, - "loss": 0.01, + "epoch": 0.79, + "learning_rate": 0.0001818021105238464, + "loss": 0.0159, "step": 303990 }, { - "epoch": 1.53, - "learning_rate": 6.99421323740862e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018179822230747497, + "loss": 0.0132, "step": 304000 }, { - "epoch": 1.53, - "eval_cer": 0.9144459960000272, - "eval_loss": 0.005344762932509184, - "eval_runtime": 116.3874, - "eval_samples_per_second": 17.184, - "eval_steps_per_second": 4.296, + "epoch": 0.79, + "eval_cer": 0.8817474747050615, + "eval_loss": 0.009092407301068306, + "eval_runtime": 107.6272, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 304000 }, { - "epoch": 1.53, - "learning_rate": 6.993456468107218e-05, - "loss": 0.0104, + "epoch": 0.79, + "learning_rate": 0.00018179433409110348, + "loss": 0.0175, "step": 304010 }, { - "epoch": 1.53, - "learning_rate": 6.992699698805817e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018179044587473203, + "loss": 0.0127, "step": 304020 }, { - "epoch": 1.53, - "learning_rate": 6.991942929504417e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018178655765836054, + "loss": 0.0161, "step": 304030 }, { - "epoch": 1.53, - "learning_rate": 6.991186160203015e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001817826694419891, + "loss": 0.0113, "step": 304040 }, { - "epoch": 1.53, - "learning_rate": 6.990429390901614e-05, - "loss": 0.0103, + "epoch": 0.79, + "learning_rate": 0.00018177878122561762, + "loss": 0.0164, "step": 304050 }, { - "epoch": 1.53, - "learning_rate": 6.989672621600212e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018177489300924617, + "loss": 0.0152, "step": 304060 }, { - "epoch": 1.53, - "learning_rate": 6.988915852298812e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.00018177100479287468, + "loss": 0.0178, "step": 304070 }, { - "epoch": 1.53, - "learning_rate": 6.988159082997411e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018176711657650325, + "loss": 0.0094, "step": 304080 }, { - "epoch": 1.53, - "learning_rate": 6.98740231369601e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.00018176322836013176, + "loss": 0.0136, "step": 304090 }, { - "epoch": 1.53, - "learning_rate": 6.986645544394609e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.0001817593401437603, + "loss": 0.015, "step": 304100 }, { - "epoch": 1.53, - "learning_rate": 6.985888775093209e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018175545192738882, + "loss": 0.0146, "step": 304110 }, { - "epoch": 1.53, - "learning_rate": 6.985132005791807e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.0001817515637110174, + "loss": 0.0126, "step": 304120 }, { - "epoch": 1.53, - "learning_rate": 6.984375236490406e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018174767549464593, + "loss": 0.0118, "step": 304130 }, { - "epoch": 1.53, - "learning_rate": 6.983618467189004e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018174378727827444, + "loss": 0.0147, "step": 304140 }, { - "epoch": 1.53, - "learning_rate": 6.982861697887604e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018173989906190296, + "loss": 0.0132, "step": 304150 }, { - "epoch": 1.53, - "learning_rate": 6.982104928586203e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018173601084553153, + "loss": 0.0132, "step": 304160 }, { - "epoch": 1.53, - "learning_rate": 6.981348159284802e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018173212262916007, + "loss": 0.0113, "step": 304170 }, { - "epoch": 1.53, - "learning_rate": 6.980591389983401e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.00018172823441278858, + "loss": 0.0127, "step": 304180 }, { - "epoch": 1.53, - "learning_rate": 6.979834620682e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.00018172434619641713, + "loss": 0.0113, "step": 304190 }, { - "epoch": 1.53, - "learning_rate": 6.979077851380599e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018172045798004564, + "loss": 0.0114, "step": 304200 }, { - "epoch": 1.53, - "learning_rate": 6.978321082079198e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.0001817165697636742, + "loss": 0.0138, "step": 304210 }, { - "epoch": 1.53, - "learning_rate": 6.977564312777796e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018171268154730272, + "loss": 0.0109, "step": 304220 }, { - "epoch": 1.53, - "learning_rate": 6.976807543476396e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018170879333093126, + "loss": 0.0122, "step": 304230 }, { - "epoch": 1.53, - "learning_rate": 6.976050774174995e-05, - "loss": 0.0091, + "epoch": 0.79, + "learning_rate": 0.00018170490511455978, + "loss": 0.0156, "step": 304240 }, { - "epoch": 1.53, - "learning_rate": 6.975294004873593e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018170101689818835, + "loss": 0.0136, "step": 304250 }, { - "epoch": 1.54, - "learning_rate": 6.974537235572193e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018169712868181686, + "loss": 0.0134, "step": 304260 }, { - "epoch": 1.54, - "learning_rate": 6.973780466270792e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.0001816932404654454, + "loss": 0.0152, "step": 304270 }, { - "epoch": 1.54, - "learning_rate": 6.97302369696939e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.00018168935224907392, + "loss": 0.0119, "step": 304280 }, { - "epoch": 1.54, - "learning_rate": 6.97226692766799e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.0001816854640327025, + "loss": 0.0139, "step": 304290 }, { - "epoch": 1.54, - "learning_rate": 6.971510158366588e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.000181681575816331, + "loss": 0.0116, "step": 304300 }, { - "epoch": 1.54, - "learning_rate": 6.970753389065188e-05, - "loss": 0.0093, + "epoch": 0.79, + "learning_rate": 0.00018167768759995954, + "loss": 0.0112, "step": 304310 }, { - "epoch": 1.54, - "learning_rate": 6.969996619763787e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018167379938358806, + "loss": 0.0134, "step": 304320 }, { - "epoch": 1.54, - "learning_rate": 6.969239850462385e-05, - "loss": 0.0098, + "epoch": 0.79, + "learning_rate": 0.00018166991116721663, + "loss": 0.0179, "step": 304330 }, { - "epoch": 1.54, - "learning_rate": 6.968483081160984e-05, - "loss": 0.01, + "epoch": 0.79, + "learning_rate": 0.00018166602295084517, + "loss": 0.0168, "step": 304340 }, { - "epoch": 1.54, - "learning_rate": 6.967726311859583e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018166213473447368, + "loss": 0.0135, "step": 304350 }, { - "epoch": 1.54, - "learning_rate": 6.966969542558183e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018165824651810222, + "loss": 0.0128, "step": 304360 }, { - "epoch": 1.54, - "learning_rate": 6.966212773256781e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018165435830173077, + "loss": 0.0168, "step": 304370 }, { - "epoch": 1.54, - "learning_rate": 6.96545600395538e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001816504700853593, + "loss": 0.0106, "step": 304380 }, { - "epoch": 1.54, - "learning_rate": 6.964699234653978e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018164658186898782, + "loss": 0.0132, "step": 304390 }, { - "epoch": 1.54, - "learning_rate": 6.963942465352578e-05, - "loss": 0.0048, + "epoch": 0.79, + "learning_rate": 0.00018164269365261636, + "loss": 0.0141, "step": 304400 }, { - "epoch": 1.54, - "learning_rate": 6.963185696051177e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.0001816388054362449, + "loss": 0.0161, "step": 304410 }, { - "epoch": 1.54, - "learning_rate": 6.962428926749775e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018163491721987345, + "loss": 0.0125, "step": 304420 }, { - "epoch": 1.54, - "learning_rate": 6.961672157448375e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018163102900350196, + "loss": 0.0134, "step": 304430 }, { - "epoch": 1.54, - "learning_rate": 6.960915388146974e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.0001816271407871305, + "loss": 0.0141, "step": 304440 }, { - "epoch": 1.54, - "learning_rate": 6.960158618845573e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018162325257075902, + "loss": 0.0151, "step": 304450 }, { - "epoch": 1.54, - "learning_rate": 6.959401849544172e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.0001816193643543876, + "loss": 0.0127, "step": 304460 }, { - "epoch": 1.54, - "learning_rate": 6.95864508024277e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001816154761380161, + "loss": 0.0148, "step": 304470 }, { - "epoch": 1.54, - "learning_rate": 6.95788831094137e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018161158792164464, + "loss": 0.0139, "step": 304480 }, { - "epoch": 1.54, - "learning_rate": 6.957131541639969e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018160769970527316, + "loss": 0.0147, "step": 304490 }, { - "epoch": 1.54, - "learning_rate": 6.956374772338567e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018160381148890173, + "loss": 0.0144, "step": 304500 }, { - "epoch": 1.54, - "learning_rate": 6.955618003037167e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018159992327253027, + "loss": 0.0183, "step": 304510 }, { - "epoch": 1.54, - "learning_rate": 6.954861233735766e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.00018159603505615878, + "loss": 0.0144, "step": 304520 }, { - "epoch": 1.54, - "learning_rate": 6.954104464434365e-05, - "loss": 0.0095, + "epoch": 0.79, + "learning_rate": 0.00018159214683978732, + "loss": 0.016, "step": 304530 }, { - "epoch": 1.54, - "learning_rate": 6.953347695132964e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.00018158825862341587, + "loss": 0.0166, "step": 304540 }, { - "epoch": 1.54, - "learning_rate": 6.952590925831564e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.0001815843704070444, + "loss": 0.0126, "step": 304550 }, { - "epoch": 1.54, - "learning_rate": 6.951834156530162e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018158048219067292, + "loss": 0.0153, "step": 304560 }, { - "epoch": 1.54, - "learning_rate": 6.951077387228761e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018157659397430146, + "loss": 0.0159, "step": 304570 }, { - "epoch": 1.54, - "learning_rate": 6.95032061792736e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018157270575793, + "loss": 0.0158, "step": 304580 }, { - "epoch": 1.54, - "learning_rate": 6.949563848625959e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.00018156881754155855, + "loss": 0.0122, "step": 304590 }, { - "epoch": 1.54, - "learning_rate": 6.948807079324558e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018156492932518706, + "loss": 0.0185, "step": 304600 }, { - "epoch": 1.54, - "learning_rate": 6.948050310023157e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.0001815610411088156, + "loss": 0.0152, "step": 304610 }, { - "epoch": 1.54, - "learning_rate": 6.947293540721756e-05, - "loss": 0.0096, + "epoch": 0.79, + "learning_rate": 0.00018155715289244414, + "loss": 0.0125, "step": 304620 }, { - "epoch": 1.54, - "learning_rate": 6.946536771420355e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018155326467607269, + "loss": 0.0146, "step": 304630 }, { - "epoch": 1.54, - "learning_rate": 6.945780002118954e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.0001815493764597012, + "loss": 0.0139, "step": 304640 }, { - "epoch": 1.54, - "learning_rate": 6.945023232817552e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018154548824332974, + "loss": 0.0148, "step": 304650 }, { - "epoch": 1.54, - "learning_rate": 6.944266463516151e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.0001815416000269583, + "loss": 0.0215, "step": 304660 }, { - "epoch": 1.54, - "learning_rate": 6.94350969421475e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018153771181058683, + "loss": 0.017, "step": 304670 }, { - "epoch": 1.54, - "learning_rate": 6.942752924913349e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018153382359421537, + "loss": 0.0136, "step": 304680 }, { - "epoch": 1.54, - "learning_rate": 6.941996155611948e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018152993537784388, + "loss": 0.0121, "step": 304690 }, { - "epoch": 1.54, - "learning_rate": 6.941239386310547e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018152604716147242, + "loss": 0.0401, "step": 304700 }, { - "epoch": 1.54, - "learning_rate": 6.940482617009146e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018152215894510097, + "loss": 0.0176, "step": 304710 }, { - "epoch": 1.54, - "learning_rate": 6.939725847707746e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.0001815182707287295, + "loss": 0.0147, "step": 304720 }, { - "epoch": 1.54, - "learning_rate": 6.938969078406344e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018151438251235802, + "loss": 0.0182, "step": 304730 }, { - "epoch": 1.54, - "learning_rate": 6.938212309104943e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018151049429598656, + "loss": 0.0182, "step": 304740 }, { - "epoch": 1.54, - "learning_rate": 6.937455539803541e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001815066060796151, + "loss": 0.0119, "step": 304750 }, { - "epoch": 1.54, - "learning_rate": 6.936698770502141e-05, - "loss": 0.0086, + "epoch": 0.79, + "learning_rate": 0.00018150271786324365, + "loss": 0.015, "step": 304760 }, { - "epoch": 1.54, - "learning_rate": 6.93594200120074e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018149882964687216, + "loss": 0.0157, "step": 304770 }, { - "epoch": 1.54, - "learning_rate": 6.935185231899339e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.0001814949414305007, + "loss": 0.0137, "step": 304780 }, { - "epoch": 1.54, - "learning_rate": 6.934428462597938e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018149105321412924, + "loss": 0.0156, "step": 304790 }, { - "epoch": 1.54, - "learning_rate": 6.933671693296538e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018148716499775779, + "loss": 0.0143, "step": 304800 }, { - "epoch": 1.54, - "learning_rate": 6.932914923995136e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.0001814832767813863, + "loss": 0.0152, "step": 304810 }, { - "epoch": 1.54, - "learning_rate": 6.932158154693735e-05, - "loss": 0.009, + "epoch": 0.79, + "learning_rate": 0.00018147938856501484, + "loss": 0.0166, "step": 304820 }, { - "epoch": 1.54, - "learning_rate": 6.931401385392333e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.0001814755003486434, + "loss": 0.0155, "step": 304830 }, { - "epoch": 1.54, - "learning_rate": 6.930644616090933e-05, - "loss": 0.005, + "epoch": 0.79, + "learning_rate": 0.00018147161213227192, + "loss": 0.0166, "step": 304840 }, { - "epoch": 1.54, - "learning_rate": 6.929887846789532e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018146772391590047, + "loss": 0.017, "step": 304850 }, { - "epoch": 1.54, - "learning_rate": 6.92913107748813e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018146383569952898, + "loss": 0.0154, "step": 304860 }, { - "epoch": 1.54, - "learning_rate": 6.92837430818673e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018145994748315755, + "loss": 0.012, "step": 304870 }, { - "epoch": 1.54, - "learning_rate": 6.92761753888533e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018145605926678606, + "loss": 0.0131, "step": 304880 }, { - "epoch": 1.54, - "learning_rate": 6.926860769583928e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.0001814521710504146, + "loss": 0.0215, "step": 304890 }, { - "epoch": 1.54, - "learning_rate": 6.926104000282527e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018144828283404312, + "loss": 0.0155, "step": 304900 }, { - "epoch": 1.54, - "learning_rate": 6.925347230981125e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001814443946176717, + "loss": 0.0147, "step": 304910 }, { - "epoch": 1.54, - "learning_rate": 6.924590461679725e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.0001814405064013002, + "loss": 0.0151, "step": 304920 }, { - "epoch": 1.54, - "learning_rate": 6.923833692378324e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018143661818492875, + "loss": 0.0134, "step": 304930 }, { - "epoch": 1.54, - "learning_rate": 6.923076923076922e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018143272996855726, + "loss": 0.0161, "step": 304940 }, { - "epoch": 1.54, - "learning_rate": 6.922320153775522e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.0001814288417521858, + "loss": 0.0133, "step": 304950 }, { - "epoch": 1.54, - "learning_rate": 6.92156338447412e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.00018142495353581434, + "loss": 0.0202, "step": 304960 }, { - "epoch": 1.54, - "learning_rate": 6.92080661517272e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018142106531944288, + "loss": 0.0178, "step": 304970 }, { - "epoch": 1.54, - "learning_rate": 6.920049845871318e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.0001814171771030714, + "loss": 0.0125, "step": 304980 }, { - "epoch": 1.54, - "learning_rate": 6.919293076569917e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.00018141328888669994, + "loss": 0.0128, "step": 304990 }, { - "epoch": 1.54, - "learning_rate": 6.918536307268517e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.0001814094006703285, + "loss": 0.0116, "step": 305000 }, { - "epoch": 1.54, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.0054320478811860085, - "eval_runtime": 116.39, - "eval_samples_per_second": 17.184, - "eval_steps_per_second": 4.296, + "epoch": 0.79, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.009619629941880703, + "eval_runtime": 107.6086, + "eval_samples_per_second": 18.586, + "eval_steps_per_second": 4.646, "step": 305000 }, { - "epoch": 1.54, - "learning_rate": 6.917779537967115e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018140551245395702, + "loss": 0.014, "step": 305010 }, { - "epoch": 1.54, - "learning_rate": 6.917022768665714e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018140162423758554, + "loss": 0.0148, "step": 305020 }, { - "epoch": 1.54, - "learning_rate": 6.916265999364312e-05, - "loss": 0.0113, + "epoch": 0.79, + "learning_rate": 0.00018139773602121408, + "loss": 0.0119, "step": 305030 }, { - "epoch": 1.54, - "learning_rate": 6.915509230062912e-05, - "loss": 0.0112, + "epoch": 0.79, + "learning_rate": 0.00018139384780484265, + "loss": 0.0167, "step": 305040 }, { - "epoch": 1.54, - "learning_rate": 6.914752460761511e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018138995958847116, + "loss": 0.0112, "step": 305050 }, { - "epoch": 1.54, - "learning_rate": 6.91399569146011e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001813860713720997, + "loss": 0.0158, "step": 305060 }, { - "epoch": 1.54, - "learning_rate": 6.913238922158709e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018138218315572822, + "loss": 0.0146, "step": 305070 }, { - "epoch": 1.54, - "learning_rate": 6.912482152857309e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001813782949393568, + "loss": 0.0179, "step": 305080 }, { - "epoch": 1.54, - "learning_rate": 6.911725383555907e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.0001813744067229853, + "loss": 0.0129, "step": 305090 }, { - "epoch": 1.54, - "learning_rate": 6.910968614254506e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018137051850661384, + "loss": 0.0169, "step": 305100 }, { - "epoch": 1.54, - "learning_rate": 6.910211844953104e-05, - "loss": 0.0052, - "step": 305110 + "epoch": 0.79, + "learning_rate": 0.00018136663029024236, + "loss": 0.0136, + "step": 305110 }, { - "epoch": 1.54, - "learning_rate": 6.909455075651704e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018136274207387093, + "loss": 0.0133, "step": 305120 }, { - "epoch": 1.54, - "learning_rate": 6.908698306350303e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018135885385749944, + "loss": 0.0155, "step": 305130 }, { - "epoch": 1.54, - "learning_rate": 6.907941537048902e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018135496564112798, + "loss": 0.0115, "step": 305140 }, { - "epoch": 1.54, - "learning_rate": 6.907184767747501e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.0001813510774247565, + "loss": 0.0192, "step": 305150 }, { - "epoch": 1.54, - "learning_rate": 6.9064279984461e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.00018134718920838507, + "loss": 0.0164, "step": 305160 }, { - "epoch": 1.54, - "learning_rate": 6.905671229144699e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.0001813433009920136, + "loss": 0.0158, "step": 305170 }, { - "epoch": 1.54, - "learning_rate": 6.904914459843298e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018133941277564212, + "loss": 0.0135, "step": 305180 }, { - "epoch": 1.54, - "learning_rate": 6.904157690541896e-05, - "loss": 0.0084, + "epoch": 0.79, + "learning_rate": 0.00018133552455927064, + "loss": 0.0132, "step": 305190 }, { - "epoch": 1.54, - "learning_rate": 6.903400921240496e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018133163634289918, + "loss": 0.014, "step": 305200 }, { - "epoch": 1.54, - "learning_rate": 6.902644151939095e-05, - "loss": 0.0077, + "epoch": 0.79, + "learning_rate": 0.00018132774812652775, + "loss": 0.0156, "step": 305210 }, { - "epoch": 1.54, - "learning_rate": 6.901887382637693e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018132385991015626, + "loss": 0.0158, "step": 305220 }, { - "epoch": 1.54, - "learning_rate": 6.901130613336293e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.0001813199716937848, + "loss": 0.0135, "step": 305230 }, { - "epoch": 1.54, - "learning_rate": 6.900373844034892e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018131608347741332, + "loss": 0.018, "step": 305240 }, { - "epoch": 1.54, - "learning_rate": 6.89961707473349e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.0001813121952610419, + "loss": 0.016, "step": 305250 }, { - "epoch": 1.54, - "learning_rate": 6.89886030543209e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.0001813083070446704, + "loss": 0.0138, "step": 305260 }, { - "epoch": 1.54, - "learning_rate": 6.898103536130688e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018130441882829894, + "loss": 0.0097, "step": 305270 }, { - "epoch": 1.54, - "learning_rate": 6.897346766829286e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018130053061192746, + "loss": 0.0142, "step": 305280 }, { - "epoch": 1.54, - "learning_rate": 6.896589997527886e-05, - "loss": 0.0125, + "epoch": 0.79, + "learning_rate": 0.00018129664239555603, + "loss": 0.0148, "step": 305290 }, { - "epoch": 1.54, - "learning_rate": 6.895833228226485e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018129275417918454, + "loss": 0.0124, "step": 305300 }, { - "epoch": 1.54, - "learning_rate": 6.895076458925084e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018128886596281308, + "loss": 0.0153, "step": 305310 }, { - "epoch": 1.54, - "learning_rate": 6.894319689623683e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.0001812849777464416, + "loss": 0.015, "step": 305320 }, { - "epoch": 1.54, - "learning_rate": 6.893562920322283e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.00018128108953007017, + "loss": 0.0147, "step": 305330 }, { - "epoch": 1.54, - "learning_rate": 6.89280615102088e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018127720131369868, + "loss": 0.0179, "step": 305340 }, { - "epoch": 1.54, - "learning_rate": 6.89204938171948e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018127331309732722, + "loss": 0.0132, "step": 305350 }, { - "epoch": 1.54, - "learning_rate": 6.891292612418078e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018126942488095574, + "loss": 0.0154, "step": 305360 }, { - "epoch": 1.54, - "learning_rate": 6.890535843116678e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.0001812655366645843, + "loss": 0.015, "step": 305370 }, { - "epoch": 1.54, - "learning_rate": 6.889779073815277e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018126164844821285, + "loss": 0.011, "step": 305380 }, { - "epoch": 1.54, - "learning_rate": 6.889022304513875e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018125776023184136, + "loss": 0.0134, "step": 305390 }, { - "epoch": 1.54, - "learning_rate": 6.888265535212475e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.0001812538720154699, + "loss": 0.013, "step": 305400 }, { - "epoch": 1.54, - "learning_rate": 6.887508765911074e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018124998379909845, + "loss": 0.0139, "step": 305410 }, { - "epoch": 1.54, - "learning_rate": 6.886751996609673e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.000181246095582727, + "loss": 0.0146, "step": 305420 }, { - "epoch": 1.54, - "learning_rate": 6.885995227308272e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.0001812422073663555, + "loss": 0.0156, "step": 305430 }, { - "epoch": 1.54, - "learning_rate": 6.88523845800687e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018123831914998404, + "loss": 0.0127, "step": 305440 }, { - "epoch": 1.54, - "learning_rate": 6.88448168870547e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.00018123443093361256, + "loss": 0.0163, "step": 305450 }, { - "epoch": 1.54, - "learning_rate": 6.883724919404069e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.00018123054271724113, + "loss": 0.0142, "step": 305460 }, { - "epoch": 1.54, - "learning_rate": 6.882968150102667e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018122665450086964, + "loss": 0.0155, "step": 305470 }, { - "epoch": 1.54, - "learning_rate": 6.882211380801267e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018122276628449818, + "loss": 0.0158, "step": 305480 }, { - "epoch": 1.54, - "learning_rate": 6.881454611499866e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.0001812188780681267, + "loss": 0.0181, "step": 305490 }, { - "epoch": 1.54, - "learning_rate": 6.880697842198465e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018121498985175527, + "loss": 0.0194, "step": 305500 }, { - "epoch": 1.54, - "learning_rate": 6.879941072897064e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.00018121110163538378, + "loss": 0.0168, "step": 305510 }, { - "epoch": 1.54, - "learning_rate": 6.879184303595664e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018120721341901232, + "loss": 0.0149, "step": 305520 }, { - "epoch": 1.54, - "learning_rate": 6.878427534294262e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018120332520264084, + "loss": 0.0121, "step": 305530 }, { - "epoch": 1.54, - "learning_rate": 6.877670764992861e-05, - "loss": 0.0087, + "epoch": 0.79, + "learning_rate": 0.0001811994369862694, + "loss": 0.0119, "step": 305540 }, { - "epoch": 1.54, - "learning_rate": 6.876913995691459e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018119554876989795, + "loss": 0.0122, "step": 305550 }, { - "epoch": 1.54, - "learning_rate": 6.876157226390059e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018119166055352646, + "loss": 0.0116, "step": 305560 }, { - "epoch": 1.54, - "learning_rate": 6.875400457088658e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.000181187772337155, + "loss": 0.0108, "step": 305570 }, { - "epoch": 1.54, - "learning_rate": 6.874643687787256e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018118388412078355, + "loss": 0.0154, "step": 305580 }, { - "epoch": 1.54, - "learning_rate": 6.873886918485855e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001811799959044121, + "loss": 0.0129, "step": 305590 }, { - "epoch": 1.54, - "learning_rate": 6.873130149184454e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001811761076880406, + "loss": 0.0128, "step": 305600 }, { - "epoch": 1.54, - "learning_rate": 6.872373379883054e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018117221947166914, + "loss": 0.0109, "step": 305610 }, { - "epoch": 1.54, - "learning_rate": 6.871616610581652e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018116833125529768, + "loss": 0.0117, "step": 305620 }, { - "epoch": 1.54, - "learning_rate": 6.870859841280251e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018116444303892623, + "loss": 0.0127, "step": 305630 }, { - "epoch": 1.54, - "learning_rate": 6.87010307197885e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018116055482255474, + "loss": 0.0129, "step": 305640 }, { - "epoch": 1.54, - "learning_rate": 6.869346302677449e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018115666660618328, + "loss": 0.0127, "step": 305650 }, { - "epoch": 1.54, - "learning_rate": 6.868589533376048e-05, - "loss": 0.0052, + "epoch": 0.79, + "learning_rate": 0.00018115277838981182, + "loss": 0.0118, "step": 305660 }, { - "epoch": 1.54, - "learning_rate": 6.867832764074647e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018114889017344037, + "loss": 0.0144, "step": 305670 }, { - "epoch": 1.54, - "learning_rate": 6.867075994773246e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.00018114500195706888, + "loss": 0.0179, "step": 305680 }, { - "epoch": 1.54, - "learning_rate": 6.866319225471846e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018114111374069742, + "loss": 0.015, "step": 305690 }, { - "epoch": 1.54, - "learning_rate": 6.865562456170444e-05, - "loss": 0.0098, + "epoch": 0.79, + "learning_rate": 0.00018113722552432594, + "loss": 0.0138, "step": 305700 }, { - "epoch": 1.54, - "learning_rate": 6.864805686869043e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.0001811333373079545, + "loss": 0.0157, "step": 305710 }, { - "epoch": 1.54, - "learning_rate": 6.864048917567641e-05, - "loss": 0.0078, + "epoch": 0.79, + "learning_rate": 0.00018112944909158305, + "loss": 0.0151, "step": 305720 }, { - "epoch": 1.54, - "learning_rate": 6.863292148266241e-05, - "loss": 0.0102, + "epoch": 0.79, + "learning_rate": 0.00018112556087521156, + "loss": 0.0118, "step": 305730 }, { - "epoch": 1.54, - "learning_rate": 6.86253537896484e-05, - "loss": 0.0075, + "epoch": 0.79, + "learning_rate": 0.00018112167265884008, + "loss": 0.0116, "step": 305740 }, { - "epoch": 1.54, - "learning_rate": 6.861778609663438e-05, - "loss": 0.01, + "epoch": 0.79, + "learning_rate": 0.00018111778444246864, + "loss": 0.0142, "step": 305750 }, { - "epoch": 1.54, - "learning_rate": 6.861021840362038e-05, - "loss": 0.0059, + "epoch": 0.79, + "learning_rate": 0.0001811138962260972, + "loss": 0.0112, "step": 305760 }, { - "epoch": 1.54, - "learning_rate": 6.860265071060637e-05, - "loss": 0.0093, + "epoch": 0.79, + "learning_rate": 0.0001811100080097257, + "loss": 0.0144, "step": 305770 }, { - "epoch": 1.54, - "learning_rate": 6.859508301759236e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018110611979335424, + "loss": 0.013, "step": 305780 }, { - "epoch": 1.54, - "learning_rate": 6.858751532457835e-05, - "loss": 0.0054, + "epoch": 0.79, + "learning_rate": 0.00018110223157698278, + "loss": 0.0138, "step": 305790 }, { - "epoch": 1.54, - "learning_rate": 6.857994763156433e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018109834336061133, + "loss": 0.0137, "step": 305800 }, { - "epoch": 1.54, - "learning_rate": 6.857237993855033e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018109445514423984, + "loss": 0.014, "step": 305810 }, { - "epoch": 1.54, - "learning_rate": 6.856481224553632e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018109056692786838, + "loss": 0.015, "step": 305820 }, { - "epoch": 1.54, - "learning_rate": 6.85572445525223e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.00018108667871149692, + "loss": 0.0133, "step": 305830 }, { - "epoch": 1.54, - "learning_rate": 6.85496768595083e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018108279049512547, + "loss": 0.0109, "step": 305840 }, { - "epoch": 1.54, - "learning_rate": 6.85421091664943e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018107890227875398, + "loss": 0.0149, "step": 305850 }, { - "epoch": 1.54, - "learning_rate": 6.853454147348028e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018107501406238252, + "loss": 0.0155, "step": 305860 }, { - "epoch": 1.54, - "learning_rate": 6.852697378046627e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.0001810711258460111, + "loss": 0.0155, "step": 305870 }, { - "epoch": 1.54, - "learning_rate": 6.851940608745225e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001810672376296396, + "loss": 0.0139, "step": 305880 }, { - "epoch": 1.54, - "learning_rate": 6.851183839443825e-05, - "loss": 0.0102, + "epoch": 0.79, + "learning_rate": 0.00018106334941326812, + "loss": 0.0142, "step": 305890 }, { - "epoch": 1.54, - "learning_rate": 6.850427070142423e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018105946119689666, + "loss": 0.0122, "step": 305900 }, { - "epoch": 1.54, - "learning_rate": 6.849670300841022e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018105557298052523, + "loss": 0.0179, "step": 305910 }, { - "epoch": 1.54, - "learning_rate": 6.84891353153962e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018105168476415374, + "loss": 0.016, "step": 305920 }, { - "epoch": 1.54, - "learning_rate": 6.84815676223822e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018104779654778229, + "loss": 0.0145, "step": 305930 }, { - "epoch": 1.54, - "learning_rate": 6.84739999293682e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001810439083314108, + "loss": 0.0161, "step": 305940 }, { - "epoch": 1.54, - "learning_rate": 6.846643223635418e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018104002011503934, + "loss": 0.0134, "step": 305950 }, { - "epoch": 1.54, - "learning_rate": 6.845886454334017e-05, - "loss": 0.0058, + "epoch": 0.79, + "learning_rate": 0.00018103613189866788, + "loss": 0.0138, "step": 305960 }, { - "epoch": 1.54, - "learning_rate": 6.845129685032617e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018103224368229643, + "loss": 0.0172, "step": 305970 }, { - "epoch": 1.54, - "learning_rate": 6.844372915731215e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018102835546592494, + "loss": 0.0113, "step": 305980 }, { - "epoch": 1.54, - "learning_rate": 6.843616146429814e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018102446724955348, + "loss": 0.0119, "step": 305990 }, { - "epoch": 1.54, - "learning_rate": 6.842859377128412e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018102057903318202, + "loss": 0.0146, "step": 306000 }, { - "epoch": 1.54, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.00540526770055294, - "eval_runtime": 116.2539, - "eval_samples_per_second": 17.204, - "eval_steps_per_second": 4.301, + "epoch": 0.79, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.009411798790097237, + "eval_runtime": 107.6226, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 306000 }, { - "epoch": 1.54, - "learning_rate": 6.842102607827012e-05, - "loss": 0.0125, + "epoch": 0.79, + "learning_rate": 0.00018101669081681056, + "loss": 0.0154, "step": 306010 }, { - "epoch": 1.54, - "learning_rate": 6.841345838525611e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.00018101280260043908, + "loss": 0.0155, "step": 306020 }, { - "epoch": 1.54, - "learning_rate": 6.84058906922421e-05, - "loss": 0.0085, + "epoch": 0.79, + "learning_rate": 0.00018100891438406762, + "loss": 0.018, "step": 306030 }, { - "epoch": 1.54, - "learning_rate": 6.839832299922809e-05, - "loss": 0.0083, + "epoch": 0.79, + "learning_rate": 0.0001810050261676962, + "loss": 0.0166, "step": 306040 }, { - "epoch": 1.54, - "learning_rate": 6.839075530621409e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.0001810011379513247, + "loss": 0.0132, "step": 306050 }, { - "epoch": 1.54, - "learning_rate": 6.838318761320007e-05, - "loss": 0.005, + "epoch": 0.79, + "learning_rate": 0.00018099724973495322, + "loss": 0.0116, "step": 306060 }, { - "epoch": 1.54, - "learning_rate": 6.837561992018606e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018099336151858176, + "loss": 0.0157, "step": 306070 }, { - "epoch": 1.54, - "learning_rate": 6.836805222717204e-05, - "loss": 0.0113, + "epoch": 0.79, + "learning_rate": 0.00018098947330221033, + "loss": 0.0142, "step": 306080 }, { - "epoch": 1.54, - "learning_rate": 6.836048453415804e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018098558508583884, + "loss": 0.0175, "step": 306090 }, { - "epoch": 1.54, - "learning_rate": 6.835291684114403e-05, - "loss": 0.0053, + "epoch": 0.79, + "learning_rate": 0.00018098169686946739, + "loss": 0.0121, "step": 306100 }, { - "epoch": 1.54, - "learning_rate": 6.834534914813001e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.0001809778086530959, + "loss": 0.0126, "step": 306110 }, { - "epoch": 1.54, - "learning_rate": 6.833778145511601e-05, - "loss": 0.0087, + "epoch": 0.79, + "learning_rate": 0.00018097392043672447, + "loss": 0.0154, "step": 306120 }, { - "epoch": 1.54, - "learning_rate": 6.8330213762102e-05, - "loss": 0.01, + "epoch": 0.79, + "learning_rate": 0.00018097003222035298, + "loss": 0.0162, "step": 306130 }, { - "epoch": 1.54, - "learning_rate": 6.832264606908799e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018096614400398152, + "loss": 0.0141, "step": 306140 }, { - "epoch": 1.54, - "learning_rate": 6.831507837607398e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018096225578761004, + "loss": 0.0143, "step": 306150 }, { - "epoch": 1.54, - "learning_rate": 6.830751068305996e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.0001809583675712386, + "loss": 0.0182, "step": 306160 }, { - "epoch": 1.54, - "learning_rate": 6.829994299004596e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018095447935486712, + "loss": 0.0172, "step": 306170 }, { - "epoch": 1.54, - "learning_rate": 6.829237529703195e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018095059113849566, + "loss": 0.0142, "step": 306180 }, { - "epoch": 1.54, - "learning_rate": 6.828480760401793e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018094670292212418, + "loss": 0.0125, "step": 306190 }, { - "epoch": 1.54, - "learning_rate": 6.827723991100393e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018094281470575272, + "loss": 0.0149, "step": 306200 }, { - "epoch": 1.54, - "learning_rate": 6.826967221798991e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018093892648938126, + "loss": 0.0155, "step": 306210 }, { - "epoch": 1.54, - "learning_rate": 6.82621045249759e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.0001809350382730098, + "loss": 0.0144, "step": 306220 }, { - "epoch": 1.54, - "learning_rate": 6.825453683196189e-05, - "loss": 0.0043, + "epoch": 0.79, + "learning_rate": 0.00018093115005663832, + "loss": 0.016, "step": 306230 }, { - "epoch": 1.55, - "learning_rate": 6.824696913894788e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018092726184026686, + "loss": 0.0128, "step": 306240 }, { - "epoch": 1.55, - "learning_rate": 6.823940144593386e-05, - "loss": 0.0071, + "epoch": 0.79, + "learning_rate": 0.00018092337362389543, + "loss": 0.0151, "step": 306250 }, { - "epoch": 1.55, - "learning_rate": 6.823183375291986e-05, - "loss": 0.0093, + "epoch": 0.79, + "learning_rate": 0.00018091948540752394, + "loss": 0.0169, "step": 306260 }, { - "epoch": 1.55, - "learning_rate": 6.822426605990585e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.00018091559719115248, + "loss": 0.0156, "step": 306270 }, { - "epoch": 1.55, - "learning_rate": 6.821669836689183e-05, - "loss": 0.008, + "epoch": 0.79, + "learning_rate": 0.000180911708974781, + "loss": 0.0123, "step": 306280 }, { - "epoch": 1.55, - "learning_rate": 6.820913067387783e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018090782075840957, + "loss": 0.0172, "step": 306290 }, { - "epoch": 1.55, - "learning_rate": 6.820156298086382e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018090393254203808, + "loss": 0.0144, "step": 306300 }, { - "epoch": 1.55, - "learning_rate": 6.81939952878498e-05, - "loss": 0.0055, + "epoch": 0.79, + "learning_rate": 0.00018090004432566662, + "loss": 0.0149, "step": 306310 }, { - "epoch": 1.55, - "learning_rate": 6.81864275948358e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.00018089615610929514, + "loss": 0.0157, "step": 306320 }, { - "epoch": 1.55, - "learning_rate": 6.817885990182178e-05, - "loss": 0.0097, + "epoch": 0.79, + "learning_rate": 0.0001808922678929237, + "loss": 0.0142, "step": 306330 }, { - "epoch": 1.55, - "learning_rate": 6.817129220880778e-05, - "loss": 0.007, + "epoch": 0.79, + "learning_rate": 0.00018088837967655222, + "loss": 0.0118, "step": 306340 }, { - "epoch": 1.55, - "learning_rate": 6.816372451579377e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018088449146018076, + "loss": 0.015, "step": 306350 }, { - "epoch": 1.55, - "learning_rate": 6.815615682277975e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018088060324380928, + "loss": 0.01, "step": 306360 }, { - "epoch": 1.55, - "learning_rate": 6.814858912976575e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018087671502743785, + "loss": 0.0163, "step": 306370 }, { - "epoch": 1.55, - "learning_rate": 6.814102143675174e-05, - "loss": 0.0065, + "epoch": 0.79, + "learning_rate": 0.00018087282681106636, + "loss": 0.0151, "step": 306380 }, { - "epoch": 1.55, - "learning_rate": 6.813345374373773e-05, - "loss": 0.0073, + "epoch": 0.79, + "learning_rate": 0.0001808689385946949, + "loss": 0.0156, "step": 306390 }, { - "epoch": 1.55, - "learning_rate": 6.812588605072372e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018086505037832342, + "loss": 0.0153, "step": 306400 }, { - "epoch": 1.55, - "learning_rate": 6.81183183577097e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018086116216195199, + "loss": 0.016, "step": 306410 }, { - "epoch": 1.55, - "learning_rate": 6.81107506646957e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018085727394558053, + "loss": 0.0142, "step": 306420 }, { - "epoch": 1.55, - "learning_rate": 6.810318297168169e-05, - "loss": 0.0062, + "epoch": 0.79, + "learning_rate": 0.00018085338572920904, + "loss": 0.0123, "step": 306430 }, { - "epoch": 1.55, - "learning_rate": 6.809561527866767e-05, - "loss": 0.0067, + "epoch": 0.79, + "learning_rate": 0.00018084949751283758, + "loss": 0.0162, "step": 306440 }, { - "epoch": 1.55, - "learning_rate": 6.808804758565367e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.0001808456092964661, + "loss": 0.0166, "step": 306450 }, { - "epoch": 1.55, - "learning_rate": 6.808047989263966e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018084172108009467, + "loss": 0.0124, "step": 306460 }, { - "epoch": 1.55, - "learning_rate": 6.807291219962564e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.00018083783286372318, + "loss": 0.0114, "step": 306470 }, { - "epoch": 1.55, - "learning_rate": 6.806534450661164e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018083394464735172, + "loss": 0.0104, "step": 306480 }, { - "epoch": 1.55, - "learning_rate": 6.805777681359763e-05, - "loss": 0.0072, + "epoch": 0.79, + "learning_rate": 0.00018083005643098024, + "loss": 0.0144, "step": 306490 }, { - "epoch": 1.55, - "learning_rate": 6.805020912058362e-05, - "loss": 0.0057, + "epoch": 0.79, + "learning_rate": 0.0001808261682146088, + "loss": 0.014, "step": 306500 }, { - "epoch": 1.55, - "learning_rate": 6.804264142756961e-05, - "loss": 0.0081, + "epoch": 0.79, + "learning_rate": 0.00018082227999823732, + "loss": 0.0126, "step": 306510 }, { - "epoch": 1.55, - "learning_rate": 6.803507373455559e-05, - "loss": 0.0069, + "epoch": 0.79, + "learning_rate": 0.00018081839178186586, + "loss": 0.0127, "step": 306520 }, { - "epoch": 1.55, - "learning_rate": 6.802750604154157e-05, - "loss": 0.0066, + "epoch": 0.79, + "learning_rate": 0.00018081450356549438, + "loss": 0.0146, "step": 306530 }, { - "epoch": 1.55, - "learning_rate": 6.801993834852757e-05, - "loss": 0.0049, + "epoch": 0.79, + "learning_rate": 0.00018081061534912295, + "loss": 0.0146, "step": 306540 }, { - "epoch": 1.55, - "learning_rate": 6.801237065551356e-05, - "loss": 0.0082, + "epoch": 0.79, + "learning_rate": 0.00018080672713275146, + "loss": 0.0148, "step": 306550 }, { - "epoch": 1.55, - "learning_rate": 6.800480296249955e-05, - "loss": 0.0088, + "epoch": 0.79, + "learning_rate": 0.00018080283891638, + "loss": 0.0111, "step": 306560 }, { - "epoch": 1.55, - "learning_rate": 6.799723526948554e-05, - "loss": 0.0056, + "epoch": 0.79, + "learning_rate": 0.00018079895070000852, + "loss": 0.0173, "step": 306570 }, { - "epoch": 1.55, - "learning_rate": 6.798966757647154e-05, - "loss": 0.0099, + "epoch": 0.79, + "learning_rate": 0.00018079506248363709, + "loss": 0.0146, "step": 306580 }, { - "epoch": 1.55, - "learning_rate": 6.798209988345752e-05, - "loss": 0.0051, + "epoch": 0.79, + "learning_rate": 0.00018079117426726563, + "loss": 0.0141, "step": 306590 }, { - "epoch": 1.55, - "learning_rate": 6.797453219044351e-05, - "loss": 0.0076, + "epoch": 0.79, + "learning_rate": 0.00018078728605089414, + "loss": 0.0152, "step": 306600 }, { - "epoch": 1.55, - "learning_rate": 6.79669644974295e-05, - "loss": 0.0061, + "epoch": 0.79, + "learning_rate": 0.00018078339783452266, + "loss": 0.0144, "step": 306610 }, { - "epoch": 1.55, - "learning_rate": 6.795939680441549e-05, - "loss": 0.0079, + "epoch": 0.79, + "learning_rate": 0.00018077950961815123, + "loss": 0.0173, "step": 306620 }, { - "epoch": 1.55, - "learning_rate": 6.795182911140148e-05, - "loss": 0.006, + "epoch": 0.79, + "learning_rate": 0.00018077562140177977, + "loss": 0.0113, "step": 306630 }, { - "epoch": 1.55, - "learning_rate": 6.794426141838746e-05, - "loss": 0.013, + "epoch": 0.79, + "learning_rate": 0.00018077173318540828, + "loss": 0.0123, "step": 306640 }, { - "epoch": 1.55, - "learning_rate": 6.793669372537346e-05, - "loss": 0.0068, + "epoch": 0.79, + "learning_rate": 0.00018076784496903682, + "loss": 0.016, "step": 306650 }, { - "epoch": 1.55, - "learning_rate": 6.792912603235945e-05, - "loss": 0.0089, + "epoch": 0.79, + "learning_rate": 0.00018076395675266534, + "loss": 0.0145, "step": 306660 }, { - "epoch": 1.55, - "learning_rate": 6.792155833934544e-05, - "loss": 0.0074, + "epoch": 0.79, + "learning_rate": 0.0001807600685362939, + "loss": 0.0116, "step": 306670 }, { - "epoch": 1.55, - "learning_rate": 6.791399064633143e-05, - "loss": 0.0064, + "epoch": 0.79, + "learning_rate": 0.00018075618031992242, + "loss": 0.0141, "step": 306680 }, { - "epoch": 1.55, - "learning_rate": 6.790642295331741e-05, - "loss": 0.0063, + "epoch": 0.79, + "learning_rate": 0.00018075229210355096, + "loss": 0.0168, "step": 306690 }, { - "epoch": 1.55, - "learning_rate": 6.789885526030341e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00018074840388717948, + "loss": 0.0148, "step": 306700 }, { - "epoch": 1.55, - "learning_rate": 6.78912875672894e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018074451567080805, + "loss": 0.0135, "step": 306710 }, { - "epoch": 1.55, - "learning_rate": 6.788371987427538e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018074062745443656, + "loss": 0.0132, "step": 306720 }, { - "epoch": 1.55, - "learning_rate": 6.787615218126138e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001807367392380651, + "loss": 0.0145, "step": 306730 }, { - "epoch": 1.55, - "learning_rate": 6.786858448824737e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018073285102169362, + "loss": 0.011, "step": 306740 }, { - "epoch": 1.55, - "learning_rate": 6.786101679523336e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018072896280532219, + "loss": 0.0115, "step": 306750 }, { - "epoch": 1.55, - "learning_rate": 6.785344910221935e-05, - "loss": 0.0094, + "epoch": 0.8, + "learning_rate": 0.00018072507458895073, + "loss": 0.0115, "step": 306760 }, { - "epoch": 1.55, - "learning_rate": 6.784588140920533e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018072118637257924, + "loss": 0.0151, "step": 306770 }, { - "epoch": 1.55, - "learning_rate": 6.783831371619133e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018071729815620776, + "loss": 0.013, "step": 306780 }, { - "epoch": 1.55, - "learning_rate": 6.783074602317732e-05, - "loss": 0.0094, + "epoch": 0.8, + "learning_rate": 0.00018071340993983632, + "loss": 0.0144, "step": 306790 }, { - "epoch": 1.55, - "learning_rate": 6.78231783301633e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018070952172346487, + "loss": 0.0129, "step": 306800 }, { - "epoch": 1.55, - "learning_rate": 6.78156106371493e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00018070563350709338, + "loss": 0.0166, "step": 306810 }, { - "epoch": 1.55, - "learning_rate": 6.78080429441353e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018070174529072192, + "loss": 0.0138, "step": 306820 }, { - "epoch": 1.55, - "learning_rate": 6.780047525112127e-05, - "loss": 0.0093, + "epoch": 0.8, + "learning_rate": 0.00018069785707435046, + "loss": 0.0137, "step": 306830 }, { - "epoch": 1.55, - "learning_rate": 6.779290755810726e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.000180693968857979, + "loss": 0.0111, "step": 306840 }, { - "epoch": 1.55, - "learning_rate": 6.778533986509325e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00018069008064160752, + "loss": 0.0124, "step": 306850 }, { - "epoch": 1.55, - "learning_rate": 6.777777217207923e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00018068619242523606, + "loss": 0.0156, "step": 306860 }, { - "epoch": 1.55, - "learning_rate": 6.777020447906523e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001806823042088646, + "loss": 0.0128, "step": 306870 }, { - "epoch": 1.55, - "learning_rate": 6.776263678605122e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018067841599249315, + "loss": 0.0155, "step": 306880 }, { - "epoch": 1.55, - "learning_rate": 6.77550690930372e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00018067452777612166, + "loss": 0.0128, "step": 306890 }, { - "epoch": 1.55, - "learning_rate": 6.77475014000232e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.0001806706395597502, + "loss": 0.0175, "step": 306900 }, { - "epoch": 1.55, - "learning_rate": 6.77399337070092e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00018066675134337872, + "loss": 0.0152, "step": 306910 }, { - "epoch": 1.55, - "learning_rate": 6.773236601399518e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018066286312700728, + "loss": 0.0157, "step": 306920 }, { - "epoch": 1.55, - "learning_rate": 6.772479832098117e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.0001806589749106358, + "loss": 0.0166, "step": 306930 }, { - "epoch": 1.55, - "learning_rate": 6.771723062796717e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018065508669426434, + "loss": 0.0152, "step": 306940 }, { - "epoch": 1.55, - "learning_rate": 6.770966293495315e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.00018065119847789286, + "loss": 0.0139, "step": 306950 }, { - "epoch": 1.55, - "learning_rate": 6.770209524193914e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00018064731026152142, + "loss": 0.0119, "step": 306960 }, { - "epoch": 1.55, - "learning_rate": 6.769452754892512e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.00018064342204514997, + "loss": 0.0138, "step": 306970 }, { - "epoch": 1.55, - "learning_rate": 6.768695985591112e-05, - "loss": 0.0095, + "epoch": 0.8, + "learning_rate": 0.00018063953382877848, + "loss": 0.0185, "step": 306980 }, { - "epoch": 1.55, - "learning_rate": 6.767939216289711e-05, - "loss": 0.0047, + "epoch": 0.8, + "learning_rate": 0.00018063564561240702, + "loss": 0.0133, "step": 306990 }, { - "epoch": 1.55, - "learning_rate": 6.76718244698831e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.00018063175739603556, + "loss": 0.0123, "step": 307000 }, { - "epoch": 1.55, - "eval_cer": 0.9144605519419082, - "eval_loss": 0.005416039377450943, - "eval_runtime": 116.4069, - "eval_samples_per_second": 17.181, - "eval_steps_per_second": 4.295, + "epoch": 0.8, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.00944979302585125, + "eval_runtime": 107.8315, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, "step": 307000 }, { - "epoch": 1.55, - "learning_rate": 6.766425677686909e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.0001806278691796641, + "loss": 0.0138, "step": 307010 }, { - "epoch": 1.55, - "learning_rate": 6.765668908385508e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018062398096329262, + "loss": 0.0126, "step": 307020 }, { - "epoch": 1.55, - "learning_rate": 6.764912139084107e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018062009274692116, + "loss": 0.0156, "step": 307030 }, { - "epoch": 1.55, - "learning_rate": 6.764155369782706e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.0001806162045305497, + "loss": 0.0137, "step": 307040 }, { - "epoch": 1.55, - "learning_rate": 6.763398600481304e-05, - "loss": 0.009, + "epoch": 0.8, + "learning_rate": 0.00018061231631417824, + "loss": 0.0168, "step": 307050 }, { - "epoch": 1.55, - "learning_rate": 6.762641831179904e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00018060842809780676, + "loss": 0.0258, "step": 307060 }, { - "epoch": 1.55, - "learning_rate": 6.761885061878503e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001806045398814353, + "loss": 0.0147, "step": 307070 }, { - "epoch": 1.55, - "learning_rate": 6.761128292577101e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00018060065166506384, + "loss": 0.0202, "step": 307080 }, { - "epoch": 1.55, - "learning_rate": 6.760371523275701e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00018059676344869238, + "loss": 0.0161, "step": 307090 }, { - "epoch": 1.55, - "learning_rate": 6.7596147539743e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001805928752323209, + "loss": 0.0198, "step": 307100 }, { - "epoch": 1.55, - "learning_rate": 6.758857984672899e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018058898701594944, + "loss": 0.0133, "step": 307110 }, { - "epoch": 1.55, - "learning_rate": 6.758101215371498e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.000180585098799578, + "loss": 0.0128, "step": 307120 }, { - "epoch": 1.55, - "learning_rate": 6.757344446070096e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018058121058320652, + "loss": 0.0154, "step": 307130 }, { - "epoch": 1.55, - "learning_rate": 6.756587676768696e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018057732236683507, + "loss": 0.0152, "step": 307140 }, { - "epoch": 1.55, - "learning_rate": 6.755830907467295e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018057343415046358, + "loss": 0.0107, "step": 307150 }, { - "epoch": 1.55, - "learning_rate": 6.755074138165893e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018056954593409212, + "loss": 0.0215, "step": 307160 }, { - "epoch": 1.55, - "learning_rate": 6.754317368864491e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00018056565771772066, + "loss": 0.0168, "step": 307170 }, { - "epoch": 1.55, - "learning_rate": 6.753560599563091e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001805617695013492, + "loss": 0.0147, "step": 307180 }, { - "epoch": 1.55, - "learning_rate": 6.75280383026169e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018055788128497772, + "loss": 0.015, "step": 307190 }, { - "epoch": 1.55, - "learning_rate": 6.752047060960289e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018055399306860626, + "loss": 0.0116, "step": 307200 }, { - "epoch": 1.55, - "learning_rate": 6.751290291658888e-05, - "loss": 0.0093, + "epoch": 0.8, + "learning_rate": 0.0001805501048522348, + "loss": 0.0153, "step": 307210 }, { - "epoch": 1.55, - "learning_rate": 6.750533522357486e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018054621663586334, + "loss": 0.0141, "step": 307220 }, { - "epoch": 1.55, - "learning_rate": 6.749776753056086e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018054232841949186, + "loss": 0.0099, "step": 307230 }, { - "epoch": 1.55, - "learning_rate": 6.749019983754685e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.0001805384402031204, + "loss": 0.0151, "step": 307240 }, { - "epoch": 1.55, - "learning_rate": 6.748263214453283e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018053455198674894, + "loss": 0.0129, "step": 307250 }, { - "epoch": 1.55, - "learning_rate": 6.747506445151883e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018053066377037748, + "loss": 0.0177, "step": 307260 }, { - "epoch": 1.55, - "learning_rate": 6.746749675850482e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.000180526775554006, + "loss": 0.0146, "step": 307270 }, { - "epoch": 1.55, - "learning_rate": 6.74599290654908e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018052288733763454, + "loss": 0.0175, "step": 307280 }, { - "epoch": 1.55, - "learning_rate": 6.74523613724768e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.0001805189991212631, + "loss": 0.0169, "step": 307290 }, { - "epoch": 1.55, - "learning_rate": 6.744479367946278e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018051511090489162, + "loss": 0.0156, "step": 307300 }, { - "epoch": 1.55, - "learning_rate": 6.743722598644878e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018051122268852016, + "loss": 0.0166, "step": 307310 }, { - "epoch": 1.55, - "learning_rate": 6.742965829343477e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00018050733447214868, + "loss": 0.0188, "step": 307320 }, { - "epoch": 1.55, - "learning_rate": 6.742209060042075e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018050344625577725, + "loss": 0.0149, "step": 307330 }, { - "epoch": 1.55, - "learning_rate": 6.741452290740675e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018049955803940576, + "loss": 0.0133, "step": 307340 }, { - "epoch": 1.55, - "learning_rate": 6.740695521439274e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001804956698230343, + "loss": 0.013, "step": 307350 }, { - "epoch": 1.55, - "learning_rate": 6.739938752137872e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018049178160666282, + "loss": 0.0127, "step": 307360 }, { - "epoch": 1.55, - "learning_rate": 6.739181982836472e-05, - "loss": 0.0045, + "epoch": 0.8, + "learning_rate": 0.0001804878933902914, + "loss": 0.0203, "step": 307370 }, { - "epoch": 1.55, - "learning_rate": 6.73842521353507e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.0001804840051739199, + "loss": 0.0157, "step": 307380 }, { - "epoch": 1.55, - "learning_rate": 6.73766844423367e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018048011695754844, + "loss": 0.0141, "step": 307390 }, { - "epoch": 1.55, - "learning_rate": 6.736911674932269e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00018047622874117696, + "loss": 0.0114, "step": 307400 }, { - "epoch": 1.55, - "learning_rate": 6.736154905630867e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.0001804723405248055, + "loss": 0.0139, "step": 307410 }, { - "epoch": 1.55, - "learning_rate": 6.735398136329467e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00018046845230843404, + "loss": 0.0165, "step": 307420 }, { - "epoch": 1.55, - "learning_rate": 6.734641367028066e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00018046456409206258, + "loss": 0.0127, "step": 307430 }, { - "epoch": 1.55, - "learning_rate": 6.733884597726664e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.0001804606758756911, + "loss": 0.0201, "step": 307440 }, { - "epoch": 1.55, - "learning_rate": 6.733127828425264e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018045678765931964, + "loss": 0.0157, "step": 307450 }, { - "epoch": 1.55, - "learning_rate": 6.732371059123863e-05, - "loss": 0.0144, + "epoch": 0.8, + "learning_rate": 0.0001804528994429482, + "loss": 0.0135, "step": 307460 }, { - "epoch": 1.55, - "learning_rate": 6.731614289822462e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018044901122657672, + "loss": 0.0176, "step": 307470 }, { - "epoch": 1.55, - "learning_rate": 6.73085752052106e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00018044512301020524, + "loss": 0.0131, "step": 307480 }, { - "epoch": 1.55, - "learning_rate": 6.730100751219659e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00018044123479383378, + "loss": 0.0162, "step": 307490 }, { - "epoch": 1.55, - "learning_rate": 6.729343981918257e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018043734657746235, + "loss": 0.0195, "step": 307500 }, { - "epoch": 1.55, - "learning_rate": 6.728587212616857e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00018043345836109086, + "loss": 0.0135, "step": 307510 }, { - "epoch": 1.55, - "learning_rate": 6.727830443315456e-05, - "loss": 0.0096, + "epoch": 0.8, + "learning_rate": 0.0001804295701447194, + "loss": 0.0137, "step": 307520 }, { - "epoch": 1.55, - "learning_rate": 6.727073674014055e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018042568192834792, + "loss": 0.015, "step": 307530 }, { - "epoch": 1.55, - "learning_rate": 6.726316904712654e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.0001804217937119765, + "loss": 0.0129, "step": 307540 }, { - "epoch": 1.55, - "learning_rate": 6.725560135411254e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.000180417905495605, + "loss": 0.0159, "step": 307550 }, { - "epoch": 1.55, - "learning_rate": 6.724803366109852e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018041401727923354, + "loss": 0.0129, "step": 307560 }, { - "epoch": 1.55, - "learning_rate": 6.724046596808451e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00018041012906286206, + "loss": 0.0129, "step": 307570 }, { - "epoch": 1.55, - "learning_rate": 6.723289827507049e-05, - "loss": 0.011, + "epoch": 0.8, + "learning_rate": 0.00018040624084649063, + "loss": 0.0125, "step": 307580 }, { - "epoch": 1.55, - "learning_rate": 6.722533058205649e-05, - "loss": 0.0045, + "epoch": 0.8, + "learning_rate": 0.00018040235263011914, + "loss": 0.0141, "step": 307590 }, { - "epoch": 1.55, - "learning_rate": 6.721776288904248e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018039846441374768, + "loss": 0.0177, "step": 307600 }, { - "epoch": 1.55, - "learning_rate": 6.721019519602846e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.0001803945761973762, + "loss": 0.0123, "step": 307610 }, { - "epoch": 1.55, - "learning_rate": 6.720262750301446e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00018039068798100477, + "loss": 0.0166, "step": 307620 }, { - "epoch": 1.55, - "learning_rate": 6.719505981000045e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001803867997646333, + "loss": 0.0128, "step": 307630 }, { - "epoch": 1.55, - "learning_rate": 6.718749211698644e-05, - "loss": 0.0046, + "epoch": 0.8, + "learning_rate": 0.00018038291154826182, + "loss": 0.0173, "step": 307640 }, { - "epoch": 1.55, - "learning_rate": 6.717992442397243e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00018037902333189034, + "loss": 0.0139, "step": 307650 }, { - "epoch": 1.55, - "learning_rate": 6.717235673095841e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018037513511551888, + "loss": 0.0132, "step": 307660 }, { - "epoch": 1.55, - "learning_rate": 6.716478903794441e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018037124689914745, + "loss": 0.0126, "step": 307670 }, { - "epoch": 1.55, - "learning_rate": 6.71572213449304e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018036735868277596, + "loss": 0.0138, "step": 307680 }, { - "epoch": 1.55, - "learning_rate": 6.714965365191638e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.0001803634704664045, + "loss": 0.0121, "step": 307690 }, { - "epoch": 1.55, - "learning_rate": 6.714208595890238e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018035958225003302, + "loss": 0.0158, "step": 307700 }, { - "epoch": 1.55, - "learning_rate": 6.713451826588837e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00018035569403366159, + "loss": 0.0143, "step": 307710 }, { - "epoch": 1.55, - "learning_rate": 6.712695057287436e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001803518058172901, + "loss": 0.0147, "step": 307720 }, { - "epoch": 1.55, - "learning_rate": 6.711938287986035e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018034791760091864, + "loss": 0.0174, "step": 307730 }, { - "epoch": 1.55, - "learning_rate": 6.711181518684633e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00018034402938454716, + "loss": 0.0147, "step": 307740 }, { - "epoch": 1.55, - "learning_rate": 6.710424749383233e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018034014116817573, + "loss": 0.0125, "step": 307750 }, { - "epoch": 1.55, - "learning_rate": 6.709667980081832e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018033625295180424, + "loss": 0.0139, "step": 307760 }, { - "epoch": 1.55, - "learning_rate": 6.70891121078043e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.00018033236473543278, + "loss": 0.0161, "step": 307770 }, { - "epoch": 1.55, - "learning_rate": 6.70815444147903e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.0001803284765190613, + "loss": 0.0146, "step": 307780 }, { - "epoch": 1.55, - "learning_rate": 6.707397672177628e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00018032458830268986, + "loss": 0.0153, "step": 307790 }, { - "epoch": 1.55, - "learning_rate": 6.706640902876227e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00018032070008631838, + "loss": 0.0109, "step": 307800 }, { - "epoch": 1.55, - "learning_rate": 6.705884133574826e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018031681186994692, + "loss": 0.0137, "step": 307810 }, { - "epoch": 1.55, - "learning_rate": 6.705127364273425e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018031292365357544, + "loss": 0.0142, "step": 307820 }, { - "epoch": 1.55, - "learning_rate": 6.704370594972023e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.000180309035437204, + "loss": 0.0157, "step": 307830 }, { - "epoch": 1.55, - "learning_rate": 6.703613825670623e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018030514722083255, + "loss": 0.0095, "step": 307840 }, { - "epoch": 1.55, - "learning_rate": 6.702857056369222e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018030125900446106, + "loss": 0.0138, "step": 307850 }, { - "epoch": 1.55, - "learning_rate": 6.70210028706782e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.0001802973707880896, + "loss": 0.0112, "step": 307860 }, { - "epoch": 1.55, - "learning_rate": 6.70134351776642e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00018029348257171814, + "loss": 0.0153, "step": 307870 }, { - "epoch": 1.55, - "learning_rate": 6.70058674846502e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018028959435534669, + "loss": 0.0121, "step": 307880 }, { - "epoch": 1.55, - "learning_rate": 6.699829979163618e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.0001802857061389752, + "loss": 0.0118, "step": 307890 }, { - "epoch": 1.55, - "learning_rate": 6.699073209862217e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00018028181792260374, + "loss": 0.0135, "step": 307900 }, { - "epoch": 1.55, - "learning_rate": 6.698316440560817e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018027792970623226, + "loss": 0.0109, "step": 307910 }, { - "epoch": 1.55, - "learning_rate": 6.697559671259415e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00018027404148986082, + "loss": 0.014, "step": 307920 }, { - "epoch": 1.55, - "learning_rate": 6.696802901958014e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018027015327348934, + "loss": 0.0157, "step": 307930 }, { - "epoch": 1.55, - "learning_rate": 6.696046132656612e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00018026626505711788, + "loss": 0.0174, "step": 307940 }, { - "epoch": 1.55, - "learning_rate": 6.695289363355212e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.0001802623768407464, + "loss": 0.0124, "step": 307950 }, { - "epoch": 1.55, - "learning_rate": 6.694532594053811e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018025848862437496, + "loss": 0.0143, "step": 307960 }, { - "epoch": 1.55, - "learning_rate": 6.69377582475241e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018025460040800348, + "loss": 0.0136, "step": 307970 }, { - "epoch": 1.55, - "learning_rate": 6.693019055451009e-05, - "loss": 0.0098, + "epoch": 0.8, + "learning_rate": 0.00018025071219163202, + "loss": 0.0161, "step": 307980 }, { - "epoch": 1.55, - "learning_rate": 6.692262286149608e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00018024682397526054, + "loss": 0.0131, "step": 307990 }, { - "epoch": 1.55, - "learning_rate": 6.691505516848207e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.0001802429357588891, + "loss": 0.0138, "step": 308000 }, { - "epoch": 1.55, - "eval_cer": 0.9144828710527925, - "eval_loss": 0.005395396146923304, - "eval_runtime": 116.4162, - "eval_samples_per_second": 17.18, - "eval_steps_per_second": 4.295, + "epoch": 0.8, + "eval_cer": 0.8817264801510488, + "eval_loss": 0.00954010896384716, + "eval_runtime": 107.7412, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, "step": 308000 }, { - "epoch": 1.55, - "learning_rate": 6.690748747546806e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018023904754251765, + "loss": 0.014, "step": 308010 }, { - "epoch": 1.55, - "learning_rate": 6.689991978245404e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00018023515932614616, + "loss": 0.0127, "step": 308020 }, { - "epoch": 1.55, - "learning_rate": 6.689235208944004e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.0001802312711097747, + "loss": 0.0163, "step": 308030 }, { - "epoch": 1.55, - "learning_rate": 6.688478439642603e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00018022738289340324, + "loss": 0.0429, "step": 308040 }, { - "epoch": 1.55, - "learning_rate": 6.687721670341201e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018022349467703178, + "loss": 0.0144, "step": 308050 }, { - "epoch": 1.55, - "learning_rate": 6.686964901039801e-05, - "loss": 0.0048, + "epoch": 0.8, + "learning_rate": 0.0001802196064606603, + "loss": 0.0119, "step": 308060 }, { - "epoch": 1.55, - "learning_rate": 6.6862081317384e-05, - "loss": 0.0096, + "epoch": 0.8, + "learning_rate": 0.00018021571824428884, + "loss": 0.02, "step": 308070 }, { - "epoch": 1.55, - "learning_rate": 6.685451362436999e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00018021183002791738, + "loss": 0.0129, "step": 308080 }, { - "epoch": 1.55, - "learning_rate": 6.684694593135598e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018020794181154592, + "loss": 0.0168, "step": 308090 }, { - "epoch": 1.55, - "learning_rate": 6.683937823834196e-05, - "loss": 0.0048, + "epoch": 0.8, + "learning_rate": 0.00018020405359517444, + "loss": 0.0161, "step": 308100 }, { - "epoch": 1.55, - "learning_rate": 6.683181054532794e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00018020016537880298, + "loss": 0.0186, "step": 308110 }, { - "epoch": 1.55, - "learning_rate": 6.682424285231394e-05, - "loss": 0.0091, + "epoch": 0.8, + "learning_rate": 0.00018019627716243152, + "loss": 0.0127, "step": 308120 }, { - "epoch": 1.55, - "learning_rate": 6.681667515929993e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018019238894606006, + "loss": 0.0112, "step": 308130 }, { - "epoch": 1.55, - "learning_rate": 6.680910746628591e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018018850072968858, + "loss": 0.0126, "step": 308140 }, { - "epoch": 1.55, - "learning_rate": 6.680153977327191e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018018461251331712, + "loss": 0.014, "step": 308150 }, { - "epoch": 1.55, - "learning_rate": 6.67939720802579e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00018018072429694563, + "loss": 0.0102, "step": 308160 }, { - "epoch": 1.55, - "learning_rate": 6.678640438724389e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001801768360805742, + "loss": 0.0149, "step": 308170 }, { - "epoch": 1.55, - "learning_rate": 6.677883669422988e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00018017294786420274, + "loss": 0.0143, "step": 308180 }, { - "epoch": 1.55, - "learning_rate": 6.677126900121586e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018016905964783126, + "loss": 0.0147, "step": 308190 }, { - "epoch": 1.55, - "learning_rate": 6.676370130820186e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018016517143145977, + "loss": 0.0155, "step": 308200 }, { - "epoch": 1.55, - "learning_rate": 6.675613361518785e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00018016128321508834, + "loss": 0.0156, "step": 308210 }, { - "epoch": 1.56, - "learning_rate": 6.674856592217383e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00018015739499871688, + "loss": 0.0155, "step": 308220 }, { - "epoch": 1.56, - "learning_rate": 6.674099822915983e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001801535067823454, + "loss": 0.0121, "step": 308230 }, { - "epoch": 1.56, - "learning_rate": 6.673343053614582e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00018014961856597394, + "loss": 0.0157, "step": 308240 }, { - "epoch": 1.56, - "learning_rate": 6.67258628431318e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018014573034960248, + "loss": 0.0165, "step": 308250 }, { - "epoch": 1.56, - "learning_rate": 6.67182951501178e-05, - "loss": 0.0096, + "epoch": 0.8, + "learning_rate": 0.00018014184213323102, + "loss": 0.0136, "step": 308260 }, { - "epoch": 1.56, - "learning_rate": 6.671072745710378e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00018013795391685954, + "loss": 0.0152, "step": 308270 }, { - "epoch": 1.56, - "learning_rate": 6.670315976408978e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00018013406570048808, + "loss": 0.012, "step": 308280 }, { - "epoch": 1.56, - "learning_rate": 6.669559207107577e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00018013017748411662, + "loss": 0.0122, "step": 308290 }, { - "epoch": 1.56, - "learning_rate": 6.668802437806175e-05, - "loss": 0.0092, + "epoch": 0.8, + "learning_rate": 0.00018012628926774516, + "loss": 0.0158, "step": 308300 }, { - "epoch": 1.56, - "learning_rate": 6.668045668504775e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018012240105137368, + "loss": 0.0171, "step": 308310 }, { - "epoch": 1.56, - "learning_rate": 6.667288899203374e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018011851283500222, + "loss": 0.015, "step": 308320 }, { - "epoch": 1.56, - "learning_rate": 6.666532129901972e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.0001801146246186308, + "loss": 0.0156, "step": 308330 }, { - "epoch": 1.56, - "learning_rate": 6.665775360600572e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.0001801107364022593, + "loss": 0.0137, "step": 308340 }, { - "epoch": 1.56, - "learning_rate": 6.66501859129917e-05, - "loss": 0.0076, + "epoch": 0.8, + "learning_rate": 0.00018010684818588784, + "loss": 0.0169, "step": 308350 }, { - "epoch": 1.56, - "learning_rate": 6.66426182199777e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018010295996951636, + "loss": 0.0121, "step": 308360 }, { - "epoch": 1.56, - "learning_rate": 6.663505052696369e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00018009907175314493, + "loss": 0.0202, "step": 308370 }, { - "epoch": 1.56, - "learning_rate": 6.662748283394967e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018009518353677344, + "loss": 0.0159, "step": 308380 }, { - "epoch": 1.56, - "learning_rate": 6.661991514093567e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00018009129532040198, + "loss": 0.0141, "step": 308390 }, { - "epoch": 1.56, - "learning_rate": 6.661234744792166e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.0001800874071040305, + "loss": 0.0113, "step": 308400 }, { - "epoch": 1.56, - "learning_rate": 6.660477975490764e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00018008351888765904, + "loss": 0.0119, "step": 308410 }, { - "epoch": 1.56, - "learning_rate": 6.659721206189363e-05, - "loss": 0.0106, + "epoch": 0.8, + "learning_rate": 0.00018007963067128758, + "loss": 0.0158, "step": 308420 }, { - "epoch": 1.56, - "learning_rate": 6.658964436887962e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00018007574245491612, + "loss": 0.0177, "step": 308430 }, { - "epoch": 1.56, - "learning_rate": 6.658207667586562e-05, - "loss": 0.0098, + "epoch": 0.8, + "learning_rate": 0.00018007185423854464, + "loss": 0.017, "step": 308440 }, { - "epoch": 1.56, - "learning_rate": 6.65745089828516e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00018006796602217318, + "loss": 0.0146, "step": 308450 }, { - "epoch": 1.56, - "learning_rate": 6.656694128983759e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00018006407780580172, + "loss": 0.013, "step": 308460 }, { - "epoch": 1.56, - "learning_rate": 6.655937359682357e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00018006018958943026, + "loss": 0.014, "step": 308470 }, { - "epoch": 1.56, - "learning_rate": 6.655180590380957e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00018005630137305878, + "loss": 0.012, "step": 308480 }, { - "epoch": 1.56, - "learning_rate": 6.654423821079556e-05, - "loss": 0.0051, + "epoch": 0.8, + "learning_rate": 0.00018005241315668732, + "loss": 0.013, "step": 308490 }, { - "epoch": 1.56, - "learning_rate": 6.653667051778154e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001800485249403159, + "loss": 0.0167, "step": 308500 }, { - "epoch": 1.56, - "learning_rate": 6.652910282476754e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.0001800446367239444, + "loss": 0.0112, "step": 308510 }, { - "epoch": 1.56, - "learning_rate": 6.652153513175353e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018004074850757292, + "loss": 0.0191, "step": 308520 }, { - "epoch": 1.56, - "learning_rate": 6.651396743873952e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00018003686029120146, + "loss": 0.0143, "step": 308530 }, { - "epoch": 1.56, - "learning_rate": 6.650639974572551e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00018003297207483003, + "loss": 0.0167, "step": 308540 }, { - "epoch": 1.56, - "learning_rate": 6.649883205271149e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00018002908385845854, + "loss": 0.0105, "step": 308550 }, { - "epoch": 1.56, - "learning_rate": 6.649126435969749e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00018002519564208708, + "loss": 0.0128, "step": 308560 }, { - "epoch": 1.56, - "learning_rate": 6.648369666668348e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.0001800213074257156, + "loss": 0.0149, "step": 308570 }, { - "epoch": 1.56, - "learning_rate": 6.647612897366946e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00018001741920934417, + "loss": 0.015, "step": 308580 }, { - "epoch": 1.56, - "learning_rate": 6.646856128065546e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00018001353099297268, + "loss": 0.0141, "step": 308590 }, { - "epoch": 1.56, - "learning_rate": 6.646099358764145e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00018000964277660122, + "loss": 0.012, "step": 308600 }, { - "epoch": 1.56, - "learning_rate": 6.645342589462744e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00018000575456022974, + "loss": 0.0171, "step": 308610 }, { - "epoch": 1.56, - "learning_rate": 6.644585820161343e-05, - "loss": 0.011, + "epoch": 0.8, + "learning_rate": 0.0001800018663438583, + "loss": 0.013, "step": 308620 }, { - "epoch": 1.56, - "learning_rate": 6.643829050859941e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017999797812748682, + "loss": 0.0135, "step": 308630 }, { - "epoch": 1.56, - "learning_rate": 6.64307228155854e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017999408991111536, + "loss": 0.0126, "step": 308640 }, { - "epoch": 1.56, - "learning_rate": 6.64231551225714e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017999020169474388, + "loss": 0.0163, "step": 308650 }, { - "epoch": 1.56, - "learning_rate": 6.641558742955738e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00017998631347837242, + "loss": 0.0138, "step": 308660 }, { - "epoch": 1.56, - "learning_rate": 6.640801973654338e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00017998242526200096, + "loss": 0.0151, "step": 308670 }, { - "epoch": 1.56, - "learning_rate": 6.640045204352937e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001799785370456295, + "loss": 0.0137, "step": 308680 }, { - "epoch": 1.56, - "learning_rate": 6.639288435051535e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017997464882925802, + "loss": 0.0149, "step": 308690 }, { - "epoch": 1.56, - "learning_rate": 6.638531665750135e-05, - "loss": 0.0081, + "epoch": 0.8, + "learning_rate": 0.00017997076061288656, + "loss": 0.0153, "step": 308700 }, { - "epoch": 1.56, - "learning_rate": 6.637774896448733e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017996687239651513, + "loss": 0.018, "step": 308710 }, { - "epoch": 1.56, - "learning_rate": 6.637018127147333e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017996298418014364, + "loss": 0.0136, "step": 308720 }, { - "epoch": 1.56, - "learning_rate": 6.636261357845931e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00017995909596377218, + "loss": 0.0123, "step": 308730 }, { - "epoch": 1.56, - "learning_rate": 6.63550458854453e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.0001799552077474007, + "loss": 0.0108, "step": 308740 }, { - "epoch": 1.56, - "learning_rate": 6.634747819243128e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017995131953102927, + "loss": 0.0188, "step": 308750 }, { - "epoch": 1.56, - "learning_rate": 6.633991049941728e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00017994743131465778, + "loss": 0.0106, "step": 308760 }, { - "epoch": 1.56, - "learning_rate": 6.633234280640327e-05, - "loss": 0.0095, + "epoch": 0.8, + "learning_rate": 0.00017994354309828632, + "loss": 0.0167, "step": 308770 }, { - "epoch": 1.56, - "learning_rate": 6.632477511338926e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00017993965488191484, + "loss": 0.0158, "step": 308780 }, { - "epoch": 1.56, - "learning_rate": 6.631720742037525e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.0001799357666655434, + "loss": 0.0143, "step": 308790 }, { - "epoch": 1.56, - "learning_rate": 6.630963972736123e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.00017993187844917192, + "loss": 0.014, "step": 308800 }, { - "epoch": 1.56, - "learning_rate": 6.630207203434723e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017992799023280046, + "loss": 0.0156, "step": 308810 }, { - "epoch": 1.56, - "learning_rate": 6.629450434133322e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017992410201642898, + "loss": 0.015, "step": 308820 }, { - "epoch": 1.56, - "learning_rate": 6.62869366483192e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017992021380005754, + "loss": 0.0128, "step": 308830 }, { - "epoch": 1.56, - "learning_rate": 6.62793689553052e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00017991632558368606, + "loss": 0.0157, "step": 308840 }, { - "epoch": 1.56, - "learning_rate": 6.627180126229119e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.0001799124373673146, + "loss": 0.0129, "step": 308850 }, { - "epoch": 1.56, - "learning_rate": 6.626423356927717e-05, - "loss": 0.0089, + "epoch": 0.8, + "learning_rate": 0.00017990854915094312, + "loss": 0.0153, "step": 308860 }, { - "epoch": 1.56, - "learning_rate": 6.625666587626317e-05, - "loss": 0.0047, + "epoch": 0.8, + "learning_rate": 0.00017990466093457168, + "loss": 0.0167, "step": 308870 }, { - "epoch": 1.56, - "learning_rate": 6.624909818324916e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.00017990077271820023, + "loss": 0.0117, "step": 308880 }, { - "epoch": 1.56, - "learning_rate": 6.624153049023515e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017989688450182874, + "loss": 0.0151, "step": 308890 }, { - "epoch": 1.56, - "learning_rate": 6.623396279722114e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00017989299628545728, + "loss": 0.0163, "step": 308900 }, { - "epoch": 1.56, - "learning_rate": 6.622639510420712e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.0001798891080690858, + "loss": 0.0129, "step": 308910 }, { - "epoch": 1.56, - "learning_rate": 6.621882741119312e-05, - "loss": 0.0094, + "epoch": 0.8, + "learning_rate": 0.00017988521985271437, + "loss": 0.0142, "step": 308920 }, { - "epoch": 1.56, - "learning_rate": 6.621125971817911e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017988133163634288, + "loss": 0.0163, "step": 308930 }, { - "epoch": 1.56, - "learning_rate": 6.62036920251651e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017987744341997142, + "loss": 0.0177, "step": 308940 }, { - "epoch": 1.56, - "learning_rate": 6.619612433215109e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017987355520359994, + "loss": 0.0156, "step": 308950 }, { - "epoch": 1.56, - "learning_rate": 6.618855663913708e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.0001798696669872285, + "loss": 0.0154, "step": 308960 }, { - "epoch": 1.56, - "learning_rate": 6.618098894612307e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017986577877085702, + "loss": 0.0104, "step": 308970 }, { - "epoch": 1.56, - "learning_rate": 6.617342125310906e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00017986189055448556, + "loss": 0.0151, "step": 308980 }, { - "epoch": 1.56, - "learning_rate": 6.616585356009504e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017985800233811408, + "loss": 0.0162, "step": 308990 }, { - "epoch": 1.56, - "learning_rate": 6.615828586708104e-05, - "loss": 0.0052, + "epoch": 0.8, + "learning_rate": 0.00017985411412174264, + "loss": 0.0138, "step": 309000 }, { - "epoch": 1.56, - "eval_cer": 0.9144654039225352, - "eval_loss": 0.005355709232389927, - "eval_runtime": 116.4345, - "eval_samples_per_second": 17.177, - "eval_steps_per_second": 4.294, + "epoch": 0.8, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.009455575607717037, + "eval_runtime": 107.8878, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.634, "step": 309000 }, { - "epoch": 1.56, - "learning_rate": 6.615071817406703e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00017985022590537116, + "loss": 0.0127, "step": 309010 }, { - "epoch": 1.56, - "learning_rate": 6.614315048105301e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.0001798463376889997, + "loss": 0.0138, "step": 309020 }, { - "epoch": 1.56, - "learning_rate": 6.613558278803901e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017984244947262821, + "loss": 0.0113, "step": 309030 }, { - "epoch": 1.56, - "learning_rate": 6.612801509502499e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017983856125625678, + "loss": 0.0121, "step": 309040 }, { - "epoch": 1.56, - "learning_rate": 6.612044740201098e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017983467303988533, + "loss": 0.0122, "step": 309050 }, { - "epoch": 1.56, - "learning_rate": 6.611287970899697e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017983078482351384, + "loss": 0.0171, "step": 309060 }, { - "epoch": 1.56, - "learning_rate": 6.610531201598296e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.00017982689660714235, + "loss": 0.0115, "step": 309070 }, { - "epoch": 1.56, - "learning_rate": 6.609774432296894e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.00017982300839077092, + "loss": 0.0125, "step": 309080 }, { - "epoch": 1.56, - "learning_rate": 6.609017662995494e-05, - "loss": 0.0081, + "epoch": 0.8, + "learning_rate": 0.00017981912017439946, + "loss": 0.015, "step": 309090 }, { - "epoch": 1.56, - "learning_rate": 6.608260893694093e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017981523195802798, + "loss": 0.0178, "step": 309100 }, { - "epoch": 1.56, - "learning_rate": 6.607504124392691e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00017981134374165652, + "loss": 0.0131, "step": 309110 }, { - "epoch": 1.56, - "learning_rate": 6.606747355091291e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00017980745552528506, + "loss": 0.0124, "step": 309120 }, { - "epoch": 1.56, - "learning_rate": 6.60599058578989e-05, - "loss": 0.0046, + "epoch": 0.8, + "learning_rate": 0.0001798035673089136, + "loss": 0.0106, "step": 309130 }, { - "epoch": 1.56, - "learning_rate": 6.605233816488489e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00017979967909254212, + "loss": 0.0177, "step": 309140 }, { - "epoch": 1.56, - "learning_rate": 6.604477047187088e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017979579087617066, + "loss": 0.011, "step": 309150 }, { - "epoch": 1.56, - "learning_rate": 6.603720277885686e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017979190265979917, + "loss": 0.0135, "step": 309160 }, { - "epoch": 1.56, - "learning_rate": 6.602963508584286e-05, - "loss": 0.0089, + "epoch": 0.8, + "learning_rate": 0.00017978801444342774, + "loss": 0.0143, "step": 309170 }, { - "epoch": 1.56, - "learning_rate": 6.602206739282885e-05, - "loss": 0.0094, + "epoch": 0.8, + "learning_rate": 0.00017978412622705626, + "loss": 0.0125, "step": 309180 }, { - "epoch": 1.56, - "learning_rate": 6.601449969981483e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001797802380106848, + "loss": 0.0152, "step": 309190 }, { - "epoch": 1.56, - "learning_rate": 6.600693200680083e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017977634979431331, + "loss": 0.0131, "step": 309200 }, { - "epoch": 1.56, - "learning_rate": 6.599936431378682e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00017977246157794188, + "loss": 0.0137, "step": 309210 }, { - "epoch": 1.56, - "learning_rate": 6.59917966207728e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00017976857336157042, + "loss": 0.0144, "step": 309220 }, { - "epoch": 1.56, - "learning_rate": 6.59842289277588e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017976468514519894, + "loss": 0.0156, "step": 309230 }, { - "epoch": 1.56, - "learning_rate": 6.597666123474478e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.00017976079692882745, + "loss": 0.012, "step": 309240 }, { - "epoch": 1.56, - "learning_rate": 6.596909354173078e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017975690871245602, + "loss": 0.0143, "step": 309250 }, { - "epoch": 1.56, - "learning_rate": 6.596152584871677e-05, - "loss": 0.0091, + "epoch": 0.8, + "learning_rate": 0.00017975302049608456, + "loss": 0.0133, "step": 309260 }, { - "epoch": 1.56, - "learning_rate": 6.595395815570275e-05, - "loss": 0.0084, + "epoch": 0.8, + "learning_rate": 0.00017974913227971308, + "loss": 0.0163, "step": 309270 }, { - "epoch": 1.56, - "learning_rate": 6.594639046268875e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017974524406334162, + "loss": 0.0144, "step": 309280 }, { - "epoch": 1.56, - "learning_rate": 6.593882276967474e-05, - "loss": 0.007, + "epoch": 0.8, + "learning_rate": 0.00017974135584697016, + "loss": 0.0172, "step": 309290 }, { - "epoch": 1.56, - "learning_rate": 6.593125507666072e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.0001797374676305987, + "loss": 0.0145, "step": 309300 }, { - "epoch": 1.56, - "learning_rate": 6.592368738364672e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017973357941422722, + "loss": 0.0139, "step": 309310 }, { - "epoch": 1.56, - "learning_rate": 6.59161196906327e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017972969119785576, + "loss": 0.013, "step": 309320 }, { - "epoch": 1.56, - "learning_rate": 6.59085519976187e-05, - "loss": 0.0055, + "epoch": 0.8, + "learning_rate": 0.0001797258029814843, + "loss": 0.0163, "step": 309330 }, { - "epoch": 1.56, - "learning_rate": 6.590098430460469e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017972191476511284, + "loss": 0.0139, "step": 309340 }, { - "epoch": 1.56, - "learning_rate": 6.589341661159067e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017971802654874136, + "loss": 0.0113, "step": 309350 }, { - "epoch": 1.56, - "learning_rate": 6.588584891857665e-05, - "loss": 0.0082, + "epoch": 0.8, + "learning_rate": 0.0001797141383323699, + "loss": 0.013, "step": 309360 }, { - "epoch": 1.56, - "learning_rate": 6.587828122556265e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017971025011599847, + "loss": 0.0142, "step": 309370 }, { - "epoch": 1.56, - "learning_rate": 6.587071353254864e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017970636189962698, + "loss": 0.0158, "step": 309380 }, { - "epoch": 1.56, - "learning_rate": 6.586314583953462e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.0001797024736832555, + "loss": 0.0128, "step": 309390 }, { - "epoch": 1.56, - "learning_rate": 6.585557814652062e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017969858546688404, + "loss": 0.0163, "step": 309400 }, { - "epoch": 1.56, - "learning_rate": 6.584801045350661e-05, - "loss": 0.0051, + "epoch": 0.8, + "learning_rate": 0.00017969469725051255, + "loss": 0.014, "step": 309410 }, { - "epoch": 1.56, - "learning_rate": 6.58404427604926e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017969080903414112, + "loss": 0.0145, "step": 309420 }, { - "epoch": 1.56, - "learning_rate": 6.583287506747859e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017968692081776966, + "loss": 0.0151, "step": 309430 }, { - "epoch": 1.56, - "learning_rate": 6.582530737446457e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017968303260139818, + "loss": 0.0132, "step": 309440 }, { - "epoch": 1.56, - "learning_rate": 6.581773968145057e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.00017967914438502672, + "loss": 0.0141, "step": 309450 }, { - "epoch": 1.56, - "learning_rate": 6.581017198843656e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017967525616865526, + "loss": 0.0152, "step": 309460 }, { - "epoch": 1.56, - "learning_rate": 6.580260429542254e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.0001796713679522838, + "loss": 0.015, "step": 309470 }, { - "epoch": 1.56, - "learning_rate": 6.579503660240854e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017966747973591232, + "loss": 0.015, "step": 309480 }, { - "epoch": 1.56, - "learning_rate": 6.578746890939453e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017966359151954086, + "loss": 0.0122, "step": 309490 }, { - "epoch": 1.56, - "learning_rate": 6.577990121638052e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001796597033031694, + "loss": 0.0137, "step": 309500 }, { - "epoch": 1.56, - "learning_rate": 6.577233352336651e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017965581508679794, + "loss": 0.0146, "step": 309510 }, { - "epoch": 1.56, - "learning_rate": 6.576476583035249e-05, - "loss": 0.0051, + "epoch": 0.8, + "learning_rate": 0.00017965192687042646, + "loss": 0.0144, "step": 309520 }, { - "epoch": 1.56, - "learning_rate": 6.575719813733849e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.000179648038654055, + "loss": 0.015, "step": 309530 }, { - "epoch": 1.56, - "learning_rate": 6.574963044432448e-05, - "loss": 0.0099, + "epoch": 0.8, + "learning_rate": 0.00017964415043768357, + "loss": 0.0117, "step": 309540 }, { - "epoch": 1.56, - "learning_rate": 6.574206275131046e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017964026222131208, + "loss": 0.0164, "step": 309550 }, { - "epoch": 1.56, - "learning_rate": 6.573449505829646e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.0001796363740049406, + "loss": 0.0156, "step": 309560 }, { - "epoch": 1.56, - "learning_rate": 6.572692736528245e-05, - "loss": 0.0096, + "epoch": 0.8, + "learning_rate": 0.00017963248578856914, + "loss": 0.01, "step": 309570 }, { - "epoch": 1.56, - "learning_rate": 6.571935967226843e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.0001796285975721977, + "loss": 0.014, "step": 309580 }, { - "epoch": 1.56, - "learning_rate": 6.571179197925443e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017962470935582622, + "loss": 0.0146, "step": 309590 }, { - "epoch": 1.56, - "learning_rate": 6.570422428624041e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00017962082113945476, + "loss": 0.0142, "step": 309600 }, { - "epoch": 1.56, - "learning_rate": 6.56966565932264e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017961693292308328, + "loss": 0.0139, "step": 309610 }, { - "epoch": 1.56, - "learning_rate": 6.56890889002124e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00017961304470671185, + "loss": 0.0123, "step": 309620 }, { - "epoch": 1.56, - "learning_rate": 6.568152120719838e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00017960915649034036, + "loss": 0.0196, "step": 309630 }, { - "epoch": 1.56, - "learning_rate": 6.567395351418438e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.0001796052682739689, + "loss": 0.0162, "step": 309640 }, { - "epoch": 1.56, - "learning_rate": 6.566638582117037e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017960138005759742, + "loss": 0.0141, "step": 309650 }, { - "epoch": 1.56, - "learning_rate": 6.565881812815635e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017959749184122596, + "loss": 0.0137, "step": 309660 }, { - "epoch": 1.56, - "learning_rate": 6.565125043514234e-05, - "loss": 0.0048, + "epoch": 0.8, + "learning_rate": 0.0001795936036248545, + "loss": 0.0133, "step": 309670 }, { - "epoch": 1.56, - "learning_rate": 6.564368274212833e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017958971540848304, + "loss": 0.0153, "step": 309680 }, { - "epoch": 1.56, - "learning_rate": 6.563611504911431e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017958582719211156, + "loss": 0.0172, "step": 309690 }, { - "epoch": 1.56, - "learning_rate": 6.562854735610031e-05, - "loss": 0.0038, + "epoch": 0.8, + "learning_rate": 0.0001795819389757401, + "loss": 0.015, "step": 309700 }, { - "epoch": 1.56, - "learning_rate": 6.56209796630863e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00017957805075936864, + "loss": 0.0166, "step": 309710 }, { - "epoch": 1.56, - "learning_rate": 6.561341197007228e-05, - "loss": 0.0047, + "epoch": 0.8, + "learning_rate": 0.00017957416254299718, + "loss": 0.0139, "step": 309720 }, { - "epoch": 1.56, - "learning_rate": 6.560584427705828e-05, - "loss": 0.0103, + "epoch": 0.8, + "learning_rate": 0.0001795702743266257, + "loss": 0.0136, "step": 309730 }, { - "epoch": 1.56, - "learning_rate": 6.559827658404427e-05, - "loss": 0.0058, + "epoch": 0.8, + "learning_rate": 0.00017956638611025424, + "loss": 0.0153, "step": 309740 }, { - "epoch": 1.56, - "learning_rate": 6.559070889103025e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.0001795624978938828, + "loss": 0.0158, "step": 309750 }, { - "epoch": 1.56, - "learning_rate": 6.558314119801625e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017955860967751132, + "loss": 0.0131, "step": 309760 }, { - "epoch": 1.56, - "learning_rate": 6.557557350500223e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017955472146113986, + "loss": 0.012, "step": 309770 }, { - "epoch": 1.56, - "learning_rate": 6.556800581198823e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017955083324476838, + "loss": 0.0154, "step": 309780 }, { - "epoch": 1.56, - "learning_rate": 6.556043811897422e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00017954694502839695, + "loss": 0.0115, "step": 309790 }, { - "epoch": 1.56, - "learning_rate": 6.55528704259602e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017954305681202546, + "loss": 0.0146, "step": 309800 }, { - "epoch": 1.56, - "learning_rate": 6.55453027329462e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.000179539168595654, + "loss": 0.0155, "step": 309810 }, { - "epoch": 1.56, - "learning_rate": 6.553773503993219e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017953528037928252, + "loss": 0.0202, "step": 309820 }, { - "epoch": 1.56, - "learning_rate": 6.553016734691817e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.00017953139216291109, + "loss": 0.0125, "step": 309830 }, { - "epoch": 1.56, - "learning_rate": 6.552259965390417e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.0001795275039465396, + "loss": 0.0182, "step": 309840 }, { - "epoch": 1.56, - "learning_rate": 6.551503196089016e-05, - "loss": 0.0057, + "epoch": 0.8, + "learning_rate": 0.00017952361573016814, + "loss": 0.0162, "step": 309850 }, { - "epoch": 1.56, - "learning_rate": 6.550746426787615e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017951972751379666, + "loss": 0.0166, "step": 309860 }, { - "epoch": 1.56, - "learning_rate": 6.549989657486214e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00017951583929742522, + "loss": 0.013, "step": 309870 }, { - "epoch": 1.56, - "learning_rate": 6.549232888184812e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017951195108105374, + "loss": 0.0134, "step": 309880 }, { - "epoch": 1.56, - "learning_rate": 6.548476118883412e-05, - "loss": 0.0066, + "epoch": 0.8, + "learning_rate": 0.00017950806286468228, + "loss": 0.0145, "step": 309890 }, { - "epoch": 1.56, - "learning_rate": 6.547719349582011e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.0001795041746483108, + "loss": 0.0132, "step": 309900 }, { - "epoch": 1.56, - "learning_rate": 6.54696258028061e-05, - "loss": 0.0085, + "epoch": 0.8, + "learning_rate": 0.00017950028643193934, + "loss": 0.0153, "step": 309910 }, { - "epoch": 1.56, - "learning_rate": 6.546205810979209e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.0001794963982155679, + "loss": 0.0146, "step": 309920 }, { - "epoch": 1.56, - "learning_rate": 6.545449041677808e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017949250999919642, + "loss": 0.0152, "step": 309930 }, { - "epoch": 1.56, - "learning_rate": 6.544692272376406e-05, - "loss": 0.0106, + "epoch": 0.8, + "learning_rate": 0.00017948862178282496, + "loss": 0.0114, "step": 309940 }, { - "epoch": 1.56, - "learning_rate": 6.543935503075006e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017948473356645348, + "loss": 0.0175, "step": 309950 }, { - "epoch": 1.56, - "learning_rate": 6.543178733773604e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017948084535008205, + "loss": 0.0154, "step": 309960 }, { - "epoch": 1.56, - "learning_rate": 6.542421964472204e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017947695713371056, + "loss": 0.0162, "step": 309970 }, { - "epoch": 1.56, - "learning_rate": 6.541665195170802e-05, - "loss": 0.0087, + "epoch": 0.8, + "learning_rate": 0.0001794730689173391, + "loss": 0.012, "step": 309980 }, { - "epoch": 1.56, - "learning_rate": 6.540908425869401e-05, - "loss": 0.009, + "epoch": 0.8, + "learning_rate": 0.00017946918070096762, + "loss": 0.0156, "step": 309990 }, { - "epoch": 1.56, - "learning_rate": 6.540151656568e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017946529248459618, + "loss": 0.0144, "step": 310000 }, { - "epoch": 1.56, - "eval_cer": 0.9144556999612812, - "eval_loss": 0.005289402790367603, - "eval_runtime": 116.4374, - "eval_samples_per_second": 17.177, - "eval_steps_per_second": 4.294, + "epoch": 0.8, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.009546291083097458, + "eval_runtime": 107.8383, + "eval_samples_per_second": 18.546, + "eval_steps_per_second": 4.637, "step": 310000 }, { - "epoch": 1.56, - "learning_rate": 6.539394887266599e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.0001794614042682247, + "loss": 0.0172, "step": 310010 }, { - "epoch": 1.56, - "learning_rate": 6.538638117965198e-05, - "loss": 0.0064, + "epoch": 0.8, + "learning_rate": 0.00017945751605185324, + "loss": 0.0134, "step": 310020 }, { - "epoch": 1.56, - "learning_rate": 6.537881348663797e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.00017945362783548176, + "loss": 0.0173, "step": 310030 }, { - "epoch": 1.56, - "learning_rate": 6.537124579362396e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00017944973961911032, + "loss": 0.0127, "step": 310040 }, { - "epoch": 1.56, - "learning_rate": 6.536367810060994e-05, - "loss": 0.0065, + "epoch": 0.8, + "learning_rate": 0.00017944585140273884, + "loss": 0.0145, "step": 310050 }, { - "epoch": 1.56, - "learning_rate": 6.535611040759594e-05, - "loss": 0.0053, + "epoch": 0.8, + "learning_rate": 0.00017944196318636738, + "loss": 0.0168, "step": 310060 }, { - "epoch": 1.56, - "learning_rate": 6.534854271458193e-05, - "loss": 0.0089, + "epoch": 0.8, + "learning_rate": 0.0001794380749699959, + "loss": 0.0138, "step": 310070 }, { - "epoch": 1.56, - "learning_rate": 6.534097502156791e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017943418675362446, + "loss": 0.0147, "step": 310080 }, { - "epoch": 1.56, - "learning_rate": 6.533340732855391e-05, - "loss": 0.008, + "epoch": 0.8, + "learning_rate": 0.000179430298537253, + "loss": 0.0104, "step": 310090 }, { - "epoch": 1.56, - "learning_rate": 6.53258396355399e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017942641032088152, + "loss": 0.0153, "step": 310100 }, { - "epoch": 1.56, - "learning_rate": 6.531827194252588e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00017942252210451003, + "loss": 0.0108, "step": 310110 }, { - "epoch": 1.56, - "learning_rate": 6.531070424951188e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.0001794186338881386, + "loss": 0.0158, "step": 310120 }, { - "epoch": 1.56, - "learning_rate": 6.530313655649786e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017941474567176714, + "loss": 0.0133, "step": 310130 }, { - "epoch": 1.56, - "learning_rate": 6.529556886348386e-05, - "loss": 0.0083, + "epoch": 0.8, + "learning_rate": 0.00017941085745539566, + "loss": 0.0132, "step": 310140 }, { - "epoch": 1.56, - "learning_rate": 6.528800117046985e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.0001794069692390242, + "loss": 0.0132, "step": 310150 }, { - "epoch": 1.56, - "learning_rate": 6.528043347745583e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017940308102265272, + "loss": 0.0095, "step": 310160 }, { - "epoch": 1.56, - "learning_rate": 6.527286578444183e-05, - "loss": 0.0054, + "epoch": 0.8, + "learning_rate": 0.00017939919280628128, + "loss": 0.0094, "step": 310170 }, { - "epoch": 1.56, - "learning_rate": 6.526529809142782e-05, - "loss": 0.006, + "epoch": 0.8, + "learning_rate": 0.0001793953045899098, + "loss": 0.0134, "step": 310180 }, { - "epoch": 1.56, - "learning_rate": 6.52577303984138e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017939141637353834, + "loss": 0.0139, "step": 310190 }, { - "epoch": 1.56, - "learning_rate": 6.52501627053998e-05, - "loss": 0.0058, - "step": 310200 + "epoch": 0.8, + "learning_rate": 0.00017938752815716685, + "loss": 0.0141, + "step": 310200 }, { - "epoch": 1.57, - "learning_rate": 6.524259501238578e-05, - "loss": 0.0086, + "epoch": 0.8, + "learning_rate": 0.00017938363994079542, + "loss": 0.0117, "step": 310210 }, { - "epoch": 1.57, - "learning_rate": 6.523502731937178e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017937975172442394, + "loss": 0.0119, "step": 310220 }, { - "epoch": 1.57, - "learning_rate": 6.522745962635777e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017937586350805248, + "loss": 0.0116, "step": 310230 }, { - "epoch": 1.57, - "learning_rate": 6.521989193334375e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.000179371975291681, + "loss": 0.0126, "step": 310240 }, { - "epoch": 1.57, - "learning_rate": 6.521232424032975e-05, - "loss": 0.0052, + "epoch": 0.8, + "learning_rate": 0.00017936808707530956, + "loss": 0.0155, "step": 310250 }, { - "epoch": 1.57, - "learning_rate": 6.520475654731574e-05, - "loss": 0.0063, + "epoch": 0.8, + "learning_rate": 0.00017936419885893808, + "loss": 0.0156, "step": 310260 }, { - "epoch": 1.57, - "learning_rate": 6.519718885430172e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017936031064256662, + "loss": 0.0145, "step": 310270 }, { - "epoch": 1.57, - "learning_rate": 6.518962116128772e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017935642242619513, + "loss": 0.0129, "step": 310280 }, { - "epoch": 1.57, - "learning_rate": 6.51820534682737e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.0001793525342098237, + "loss": 0.0136, "step": 310290 }, { - "epoch": 1.57, - "learning_rate": 6.51744857752597e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017934864599345224, + "loss": 0.0168, "step": 310300 }, { - "epoch": 1.57, - "learning_rate": 6.516691808224568e-05, - "loss": 0.0062, + "epoch": 0.8, + "learning_rate": 0.00017934475777708076, + "loss": 0.0134, "step": 310310 }, { - "epoch": 1.57, - "learning_rate": 6.515935038923167e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.0001793408695607093, + "loss": 0.014, "step": 310320 }, { - "epoch": 1.57, - "learning_rate": 6.515178269621765e-05, - "loss": 0.0091, + "epoch": 0.8, + "learning_rate": 0.00017933698134433784, + "loss": 0.0157, "step": 310330 }, { - "epoch": 1.57, - "learning_rate": 6.514421500320365e-05, - "loss": 0.0099, + "epoch": 0.8, + "learning_rate": 0.00017933309312796638, + "loss": 0.0157, "step": 310340 }, { - "epoch": 1.57, - "learning_rate": 6.513664731018964e-05, - "loss": 0.0092, + "epoch": 0.8, + "learning_rate": 0.0001793292049115949, + "loss": 0.0136, "step": 310350 }, { - "epoch": 1.57, - "learning_rate": 6.512907961717562e-05, - "loss": 0.0072, + "epoch": 0.8, + "learning_rate": 0.00017932531669522344, + "loss": 0.0109, "step": 310360 }, { - "epoch": 1.57, - "learning_rate": 6.512151192416162e-05, - "loss": 0.0095, + "epoch": 0.8, + "learning_rate": 0.00017932142847885198, + "loss": 0.0177, "step": 310370 }, { - "epoch": 1.57, - "learning_rate": 6.511394423114761e-05, - "loss": 0.0074, + "epoch": 0.8, + "learning_rate": 0.00017931754026248052, + "loss": 0.0178, "step": 310380 }, { - "epoch": 1.57, - "learning_rate": 6.51063765381336e-05, - "loss": 0.0071, + "epoch": 0.8, + "learning_rate": 0.00017931365204610904, + "loss": 0.0141, "step": 310390 }, { - "epoch": 1.57, - "learning_rate": 6.509880884511959e-05, - "loss": 0.0075, + "epoch": 0.8, + "learning_rate": 0.00017930976382973758, + "loss": 0.0152, "step": 310400 }, { - "epoch": 1.57, - "learning_rate": 6.509124115210557e-05, - "loss": 0.0095, + "epoch": 0.8, + "learning_rate": 0.0001793058756133661, + "loss": 0.0144, "step": 310410 }, { - "epoch": 1.57, - "learning_rate": 6.508367345909157e-05, - "loss": 0.0077, + "epoch": 0.8, + "learning_rate": 0.00017930198739699466, + "loss": 0.0165, "step": 310420 }, { - "epoch": 1.57, - "learning_rate": 6.507610576607756e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017929809918062318, + "loss": 0.014, "step": 310430 }, { - "epoch": 1.57, - "learning_rate": 6.506853807306354e-05, - "loss": 0.0061, + "epoch": 0.8, + "learning_rate": 0.00017929421096425172, + "loss": 0.0127, "step": 310440 }, { - "epoch": 1.57, - "learning_rate": 6.506097038004954e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017929032274788023, + "loss": 0.0163, "step": 310450 }, { - "epoch": 1.57, - "learning_rate": 6.505340268703553e-05, - "loss": 0.0079, + "epoch": 0.8, + "learning_rate": 0.0001792864345315088, + "loss": 0.0138, "step": 310460 }, { - "epoch": 1.57, - "learning_rate": 6.504583499402152e-05, - "loss": 0.005, + "epoch": 0.8, + "learning_rate": 0.00017928254631513734, + "loss": 0.0141, "step": 310470 }, { - "epoch": 1.57, - "learning_rate": 6.503826730100751e-05, - "loss": 0.0068, + "epoch": 0.8, + "learning_rate": 0.00017927865809876586, + "loss": 0.0146, "step": 310480 }, { - "epoch": 1.57, - "learning_rate": 6.503069960799349e-05, - "loss": 0.0088, + "epoch": 0.8, + "learning_rate": 0.0001792747698823944, + "loss": 0.0122, "step": 310490 }, { - "epoch": 1.57, - "learning_rate": 6.502313191497949e-05, - "loss": 0.0069, + "epoch": 0.8, + "learning_rate": 0.00017927088166602294, + "loss": 0.0152, "step": 310500 }, { - "epoch": 1.57, - "learning_rate": 6.501556422196548e-05, - "loss": 0.0059, + "epoch": 0.8, + "learning_rate": 0.00017926699344965148, + "loss": 0.0138, "step": 310510 }, { - "epoch": 1.57, - "learning_rate": 6.500799652895146e-05, - "loss": 0.0073, + "epoch": 0.8, + "learning_rate": 0.00017926310523328, + "loss": 0.0114, "step": 310520 }, { - "epoch": 1.57, - "learning_rate": 6.500042883593746e-05, - "loss": 0.0067, + "epoch": 0.8, + "learning_rate": 0.00017925921701690854, + "loss": 0.0115, "step": 310530 }, { - "epoch": 1.57, - "learning_rate": 6.499286114292345e-05, - "loss": 0.0078, + "epoch": 0.8, + "learning_rate": 0.00017925532880053708, + "loss": 0.0128, "step": 310540 }, { - "epoch": 1.57, - "learning_rate": 6.498529344990943e-05, - "loss": 0.0056, + "epoch": 0.8, + "learning_rate": 0.00017925144058416562, + "loss": 0.0135, "step": 310550 }, { - "epoch": 1.57, - "learning_rate": 6.497772575689543e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017924755236779414, + "loss": 0.013, "step": 310560 }, { - "epoch": 1.57, - "learning_rate": 6.497015806388141e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017924366415142268, + "loss": 0.0142, "step": 310570 }, { - "epoch": 1.57, - "learning_rate": 6.49625903708674e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017923977593505122, + "loss": 0.016, "step": 310580 }, { - "epoch": 1.57, - "learning_rate": 6.49550226778534e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017923588771867976, + "loss": 0.0126, "step": 310590 }, { - "epoch": 1.57, - "learning_rate": 6.494745498483938e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017923199950230828, + "loss": 0.0145, "step": 310600 }, { - "epoch": 1.57, - "learning_rate": 6.493988729182536e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017922811128593682, + "loss": 0.0155, "step": 310610 }, { - "epoch": 1.57, - "learning_rate": 6.493231959881136e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001792242230695654, + "loss": 0.0119, "step": 310620 }, { - "epoch": 1.57, - "learning_rate": 6.492475190579735e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.0001792203348531939, + "loss": 0.0151, "step": 310630 }, { - "epoch": 1.57, - "learning_rate": 6.491718421278334e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017921644663682244, + "loss": 0.0171, "step": 310640 }, { - "epoch": 1.57, - "learning_rate": 6.490961651976933e-05, - "loss": 0.0049, + "epoch": 0.81, + "learning_rate": 0.00017921255842045096, + "loss": 0.0145, "step": 310650 }, { - "epoch": 1.57, - "learning_rate": 6.490204882675531e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017920867020407947, + "loss": 0.0132, "step": 310660 }, { - "epoch": 1.57, - "learning_rate": 6.48944811337413e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.00017920478198770804, + "loss": 0.0144, "step": 310670 }, { - "epoch": 1.57, - "learning_rate": 6.48869134407273e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017920089377133658, + "loss": 0.0143, "step": 310680 }, { - "epoch": 1.57, - "learning_rate": 6.487934574771328e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.0001791970055549651, + "loss": 0.0096, "step": 310690 }, { - "epoch": 1.57, - "learning_rate": 6.487177805469928e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017919311733859364, + "loss": 0.0138, "step": 310700 }, { - "epoch": 1.57, - "learning_rate": 6.486421036168527e-05, - "loss": 0.0095, + "epoch": 0.81, + "learning_rate": 0.00017918922912222218, + "loss": 0.0125, "step": 310710 }, { - "epoch": 1.57, - "learning_rate": 6.485664266867125e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017918534090585072, + "loss": 0.0144, "step": 310720 }, { - "epoch": 1.57, - "learning_rate": 6.484907497565725e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017918145268947924, + "loss": 0.0109, "step": 310730 }, { - "epoch": 1.57, - "learning_rate": 6.484150728264323e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017917756447310778, + "loss": 0.0137, "step": 310740 }, { - "epoch": 1.57, - "learning_rate": 6.483393958962923e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017917367625673632, + "loss": 0.0167, "step": 310750 }, { - "epoch": 1.57, - "learning_rate": 6.482637189661522e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017916978804036486, + "loss": 0.0159, "step": 310760 }, { - "epoch": 1.57, - "learning_rate": 6.48188042036012e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017916589982399338, + "loss": 0.0134, "step": 310770 }, { - "epoch": 1.57, - "learning_rate": 6.48112365105872e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017916201160762192, + "loss": 0.0144, "step": 310780 }, { - "epoch": 1.57, - "learning_rate": 6.480366881757319e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017915812339125049, + "loss": 0.0163, "step": 310790 }, { - "epoch": 1.57, - "learning_rate": 6.479610112455917e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.000179154235174879, + "loss": 0.0112, "step": 310800 }, { - "epoch": 1.57, - "learning_rate": 6.478853343154517e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017915034695850754, + "loss": 0.0153, "step": 310810 }, { - "epoch": 1.57, - "learning_rate": 6.478096573853116e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017914645874213606, + "loss": 0.0124, "step": 310820 }, { - "epoch": 1.57, - "learning_rate": 6.477339804551715e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017914257052576463, + "loss": 0.013, "step": 310830 }, { - "epoch": 1.57, - "learning_rate": 6.476583035250314e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017913868230939314, + "loss": 0.0148, "step": 310840 }, { - "epoch": 1.57, - "learning_rate": 6.475826265948912e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017913479409302168, + "loss": 0.0102, "step": 310850 }, { - "epoch": 1.57, - "learning_rate": 6.475069496647512e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.0001791309058766502, + "loss": 0.0222, "step": 310860 }, { - "epoch": 1.57, - "learning_rate": 6.474312727346111e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017912701766027876, + "loss": 0.0163, "step": 310870 }, { - "epoch": 1.57, - "learning_rate": 6.473555958044709e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017912312944390728, + "loss": 0.0134, "step": 310880 }, { - "epoch": 1.57, - "learning_rate": 6.472799188743309e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017911924122753582, + "loss": 0.0115, "step": 310890 }, { - "epoch": 1.57, - "learning_rate": 6.472042419441908e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017911535301116434, + "loss": 0.0146, "step": 310900 }, { - "epoch": 1.57, - "learning_rate": 6.471285650140506e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017911146479479288, + "loss": 0.0154, "step": 310910 }, { - "epoch": 1.57, - "learning_rate": 6.470528880839106e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017910757657842142, + "loss": 0.012, "step": 310920 }, { - "epoch": 1.57, - "learning_rate": 6.469772111537704e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017910368836204996, + "loss": 0.015, "step": 310930 }, { - "epoch": 1.57, - "learning_rate": 6.469015342236302e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017909980014567848, + "loss": 0.0169, "step": 310940 }, { - "epoch": 1.57, - "learning_rate": 6.468258572934902e-05, - "loss": 0.0087, + "epoch": 0.81, + "learning_rate": 0.00017909591192930702, + "loss": 0.0122, "step": 310950 }, { - "epoch": 1.57, - "learning_rate": 6.467501803633501e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017909202371293559, + "loss": 0.013, "step": 310960 }, { - "epoch": 1.57, - "learning_rate": 6.4667450343321e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.0001790881354965641, + "loss": 0.0115, "step": 310970 }, { - "epoch": 1.57, - "learning_rate": 6.465988265030699e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017908424728019261, + "loss": 0.0124, "step": 310980 }, { - "epoch": 1.57, - "learning_rate": 6.465231495729298e-05, - "loss": 0.0088, + "epoch": 0.81, + "learning_rate": 0.00017908035906382116, + "loss": 0.013, "step": 310990 }, { - "epoch": 1.57, - "learning_rate": 6.464474726427897e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017907647084744972, + "loss": 0.0165, "step": 311000 }, { - "epoch": 1.57, - "eval_cer": 0.9144498775845288, - "eval_loss": 0.005227969028055668, - "eval_runtime": 116.309, - "eval_samples_per_second": 17.196, - "eval_steps_per_second": 4.299, + "epoch": 0.81, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.009462043642997742, + "eval_runtime": 107.7393, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, "step": 311000 }, { - "epoch": 1.57, - "learning_rate": 6.463717957126496e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017907258263107824, + "loss": 0.0137, "step": 311010 }, { - "epoch": 1.57, - "learning_rate": 6.462961187825094e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017906869441470678, + "loss": 0.0148, "step": 311020 }, { - "epoch": 1.57, - "learning_rate": 6.462204418523694e-05, - "loss": 0.0093, + "epoch": 0.81, + "learning_rate": 0.0001790648061983353, + "loss": 0.0125, "step": 311030 }, { - "epoch": 1.57, - "learning_rate": 6.461447649222293e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017906091798196386, + "loss": 0.0136, "step": 311040 }, { - "epoch": 1.57, - "learning_rate": 6.460690879920891e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017905702976559238, + "loss": 0.016, "step": 311050 }, { - "epoch": 1.57, - "learning_rate": 6.459934110619491e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017905314154922092, + "loss": 0.0151, "step": 311060 }, { - "epoch": 1.57, - "learning_rate": 6.45917734131809e-05, - "loss": 0.0049, + "epoch": 0.81, + "learning_rate": 0.00017904925333284944, + "loss": 0.0115, "step": 311070 }, { - "epoch": 1.57, - "learning_rate": 6.458420572016688e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.000179045365116478, + "loss": 0.0164, "step": 311080 }, { - "epoch": 1.57, - "learning_rate": 6.457663802715288e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017904147690010652, + "loss": 0.0128, "step": 311090 }, { - "epoch": 1.57, - "learning_rate": 6.456907033413886e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017903758868373506, + "loss": 0.0131, "step": 311100 }, { - "epoch": 1.57, - "learning_rate": 6.456150264112486e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017903370046736357, + "loss": 0.0192, "step": 311110 }, { - "epoch": 1.57, - "learning_rate": 6.455393494811085e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017902981225099214, + "loss": 0.0105, "step": 311120 }, { - "epoch": 1.57, - "learning_rate": 6.454636725509683e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017902592403462066, + "loss": 0.0138, "step": 311130 }, { - "epoch": 1.57, - "learning_rate": 6.453879956208283e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.0001790220358182492, + "loss": 0.0137, "step": 311140 }, { - "epoch": 1.57, - "learning_rate": 6.453123186906882e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017901814760187771, + "loss": 0.0123, "step": 311150 }, { - "epoch": 1.57, - "learning_rate": 6.45236641760548e-05, - "loss": 0.0082, + "epoch": 0.81, + "learning_rate": 0.00017901425938550626, + "loss": 0.0139, "step": 311160 }, { - "epoch": 1.57, - "learning_rate": 6.45160964830408e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017901037116913482, + "loss": 0.0151, "step": 311170 }, { - "epoch": 1.57, - "learning_rate": 6.450852879002678e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.00017900648295276334, + "loss": 0.0145, "step": 311180 }, { - "epoch": 1.57, - "learning_rate": 6.450096109701278e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017900259473639188, + "loss": 0.0126, "step": 311190 }, { - "epoch": 1.57, - "learning_rate": 6.449339340399877e-05, - "loss": 0.0094, + "epoch": 0.81, + "learning_rate": 0.0001789987065200204, + "loss": 0.0129, "step": 311200 }, { - "epoch": 1.57, - "learning_rate": 6.448582571098475e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017899481830364896, + "loss": 0.0157, "step": 311210 }, { - "epoch": 1.57, - "learning_rate": 6.447825801797075e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017899093008727748, + "loss": 0.0122, "step": 311220 }, { - "epoch": 1.57, - "learning_rate": 6.447069032495674e-05, - "loss": 0.0088, + "epoch": 0.81, + "learning_rate": 0.00017898704187090602, + "loss": 0.0116, "step": 311230 }, { - "epoch": 1.57, - "learning_rate": 6.446312263194272e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017898315365453453, + "loss": 0.0155, "step": 311240 }, { - "epoch": 1.57, - "learning_rate": 6.44555549389287e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.0001789792654381631, + "loss": 0.0138, "step": 311250 }, { - "epoch": 1.57, - "learning_rate": 6.44479872459147e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017897537722179162, + "loss": 0.0114, "step": 311260 }, { - "epoch": 1.57, - "learning_rate": 6.44404195529007e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017897148900542016, + "loss": 0.0113, "step": 311270 }, { - "epoch": 1.57, - "learning_rate": 6.443285185988668e-05, - "loss": 0.0093, + "epoch": 0.81, + "learning_rate": 0.00017896760078904867, + "loss": 0.0163, "step": 311280 }, { - "epoch": 1.57, - "learning_rate": 6.442528416687267e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017896371257267724, + "loss": 0.011, "step": 311290 }, { - "epoch": 1.57, - "learning_rate": 6.441771647385865e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017895982435630576, + "loss": 0.0136, "step": 311300 }, { - "epoch": 1.57, - "learning_rate": 6.441014878084465e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.0001789559361399343, + "loss": 0.0129, "step": 311310 }, { - "epoch": 1.57, - "learning_rate": 6.440258108783064e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.0001789520479235628, + "loss": 0.014, "step": 311320 }, { - "epoch": 1.57, - "learning_rate": 6.439501339481662e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017894815970719138, + "loss": 0.0137, "step": 311330 }, { - "epoch": 1.57, - "learning_rate": 6.438744570180262e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017894427149081992, + "loss": 0.0124, "step": 311340 }, { - "epoch": 1.57, - "learning_rate": 6.437987800878861e-05, - "loss": 0.0097, + "epoch": 0.81, + "learning_rate": 0.00017894038327444844, + "loss": 0.0129, "step": 311350 }, { - "epoch": 1.57, - "learning_rate": 6.43723103157746e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017893649505807698, + "loss": 0.0167, "step": 311360 }, { - "epoch": 1.57, - "learning_rate": 6.436474262276059e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017893260684170552, + "loss": 0.0136, "step": 311370 }, { - "epoch": 1.57, - "learning_rate": 6.435717492974657e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017892871862533406, + "loss": 0.0124, "step": 311380 }, { - "epoch": 1.57, - "learning_rate": 6.434960723673257e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017892483040896258, + "loss": 0.0124, "step": 311390 }, { - "epoch": 1.57, - "learning_rate": 6.434203954371856e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.00017892094219259112, + "loss": 0.0144, "step": 311400 }, { - "epoch": 1.57, - "learning_rate": 6.433447185070454e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017891705397621963, + "loss": 0.0123, "step": 311410 }, { - "epoch": 1.57, - "learning_rate": 6.432690415769054e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.0001789131657598482, + "loss": 0.0143, "step": 311420 }, { - "epoch": 1.57, - "learning_rate": 6.431933646467653e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017890927754347672, + "loss": 0.0136, "step": 311430 }, { - "epoch": 1.57, - "learning_rate": 6.431176877166251e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017890538932710526, + "loss": 0.017, "step": 311440 }, { - "epoch": 1.57, - "learning_rate": 6.430420107864851e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.00017890150111073377, + "loss": 0.0131, "step": 311450 }, { - "epoch": 1.57, - "learning_rate": 6.429663338563449e-05, - "loss": 0.0048, + "epoch": 0.81, + "learning_rate": 0.00017889761289436234, + "loss": 0.0148, "step": 311460 }, { - "epoch": 1.57, - "learning_rate": 6.428906569262049e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017889372467799086, + "loss": 0.0102, "step": 311470 }, { - "epoch": 1.57, - "learning_rate": 6.428149799960648e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.0001788898364616194, + "loss": 0.0168, "step": 311480 }, { - "epoch": 1.57, - "learning_rate": 6.427393030659246e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.0001788859482452479, + "loss": 0.0206, "step": 311490 }, { - "epoch": 1.57, - "learning_rate": 6.426636261357846e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017888206002887648, + "loss": 0.0153, "step": 311500 }, { - "epoch": 1.57, - "learning_rate": 6.425879492056445e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017887817181250502, + "loss": 0.0148, "step": 311510 }, { - "epoch": 1.57, - "learning_rate": 6.425122722755043e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017887428359613354, + "loss": 0.0141, "step": 311520 }, { - "epoch": 1.57, - "learning_rate": 6.424365953453643e-05, - "loss": 0.0047, + "epoch": 0.81, + "learning_rate": 0.00017887039537976208, + "loss": 0.0141, "step": 311530 }, { - "epoch": 1.57, - "learning_rate": 6.423609184152241e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017886650716339062, + "loss": 0.0143, "step": 311540 }, { - "epoch": 1.57, - "learning_rate": 6.42285241485084e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017886261894701916, + "loss": 0.0149, "step": 311550 }, { - "epoch": 1.57, - "learning_rate": 6.422095645549439e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017885873073064768, + "loss": 0.0122, "step": 311560 }, { - "epoch": 1.57, - "learning_rate": 6.421338876248038e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017885484251427622, + "loss": 0.0142, "step": 311570 }, { - "epoch": 1.57, - "learning_rate": 6.420582106946636e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017885095429790476, + "loss": 0.0128, "step": 311580 }, { - "epoch": 1.57, - "learning_rate": 6.419825337645236e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.0001788470660815333, + "loss": 0.015, "step": 311590 }, { - "epoch": 1.57, - "learning_rate": 6.419068568343835e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017884317786516182, + "loss": 0.0104, "step": 311600 }, { - "epoch": 1.57, - "learning_rate": 6.418311799042433e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.00017883928964879036, + "loss": 0.0142, "step": 311610 }, { - "epoch": 1.57, - "learning_rate": 6.417555029741033e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.0001788354014324189, + "loss": 0.0137, "step": 311620 }, { - "epoch": 1.57, - "learning_rate": 6.416798260439631e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017883151321604744, + "loss": 0.0152, "step": 311630 }, { - "epoch": 1.57, - "learning_rate": 6.41604149113823e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017882762499967596, + "loss": 0.0149, "step": 311640 }, { - "epoch": 1.57, - "learning_rate": 6.41528472183683e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.0001788237367833045, + "loss": 0.0152, "step": 311650 }, { - "epoch": 1.57, - "learning_rate": 6.414527952535428e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.000178819848566933, + "loss": 0.0115, "step": 311660 }, { - "epoch": 1.57, - "learning_rate": 6.413771183234028e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.00017881596035056158, + "loss": 0.0145, "step": 311670 }, { - "epoch": 1.57, - "learning_rate": 6.413014413932627e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017881207213419012, + "loss": 0.0156, "step": 311680 }, { - "epoch": 1.57, - "learning_rate": 6.412257644631225e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017880818391781864, + "loss": 0.0141, "step": 311690 }, { - "epoch": 1.57, - "learning_rate": 6.411500875329825e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017880429570144715, + "loss": 0.0081, "step": 311700 }, { - "epoch": 1.57, - "learning_rate": 6.410744106028423e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017880040748507572, + "loss": 0.0117, "step": 311710 }, { - "epoch": 1.57, - "learning_rate": 6.409987336727023e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017879651926870426, + "loss": 0.014, "step": 311720 }, { - "epoch": 1.57, - "learning_rate": 6.409230567425622e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.00017879263105233278, + "loss": 0.0122, "step": 311730 }, { - "epoch": 1.57, - "learning_rate": 6.40847379812422e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017878874283596132, + "loss": 0.0145, "step": 311740 }, { - "epoch": 1.57, - "learning_rate": 6.40771702882282e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017878485461958986, + "loss": 0.0166, "step": 311750 }, { - "epoch": 1.57, - "learning_rate": 6.406960259521419e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.0001787809664032184, + "loss": 0.0131, "step": 311760 }, { - "epoch": 1.57, - "learning_rate": 6.406203490220017e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017877707818684692, + "loss": 0.0146, "step": 311770 }, { - "epoch": 1.57, - "learning_rate": 6.405446720918617e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017877318997047546, + "loss": 0.0126, "step": 311780 }, { - "epoch": 1.57, - "learning_rate": 6.404689951617216e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.000178769301754104, + "loss": 0.0168, "step": 311790 }, { - "epoch": 1.57, - "learning_rate": 6.403933182315814e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017876541353773254, + "loss": 0.01, "step": 311800 }, { - "epoch": 1.57, - "learning_rate": 6.403176413014414e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017876152532136106, + "loss": 0.013, "step": 311810 }, { - "epoch": 1.57, - "learning_rate": 6.402419643713012e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.0001787576371049896, + "loss": 0.014, "step": 311820 }, { - "epoch": 1.57, - "learning_rate": 6.401662874411612e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017875374888861817, + "loss": 0.013, "step": 311830 }, { - "epoch": 1.57, - "learning_rate": 6.400906105110211e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.00017874986067224668, + "loss": 0.0154, "step": 311840 }, { - "epoch": 1.57, - "learning_rate": 6.400149335808809e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.0001787459724558752, + "loss": 0.011, "step": 311850 }, { - "epoch": 1.57, - "learning_rate": 6.399392566507409e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017874208423950374, + "loss": 0.0164, "step": 311860 }, { - "epoch": 1.57, - "learning_rate": 6.398635797206007e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.0001787381960231323, + "loss": 0.014, "step": 311870 }, { - "epoch": 1.57, - "learning_rate": 6.397879027904606e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017873430780676082, + "loss": 0.014, "step": 311880 }, { - "epoch": 1.57, - "learning_rate": 6.397122258603205e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017873041959038936, + "loss": 0.0163, "step": 311890 }, { - "epoch": 1.57, - "learning_rate": 6.396365489301804e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017872653137401788, + "loss": 0.0146, "step": 311900 }, { - "epoch": 1.57, - "learning_rate": 6.395608720000402e-05, - "loss": 0.0141, + "epoch": 0.81, + "learning_rate": 0.00017872264315764642, + "loss": 0.016, "step": 311910 }, { - "epoch": 1.57, - "learning_rate": 6.394851950699002e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017871875494127496, + "loss": 0.0168, "step": 311920 }, { - "epoch": 1.57, - "learning_rate": 6.394095181397601e-05, - "loss": 0.0048, + "epoch": 0.81, + "learning_rate": 0.0001787148667249035, + "loss": 0.0166, "step": 311930 }, { - "epoch": 1.57, - "learning_rate": 6.3933384120962e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017871097850853202, + "loss": 0.014, "step": 311940 }, { - "epoch": 1.57, - "learning_rate": 6.392581642794799e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017870709029216056, + "loss": 0.014, "step": 311950 }, { - "epoch": 1.57, - "learning_rate": 6.391824873493398e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.0001787032020757891, + "loss": 0.014, "step": 311960 }, { - "epoch": 1.57, - "learning_rate": 6.391068104191996e-05, - "loss": 0.0116, + "epoch": 0.81, + "learning_rate": 0.00017869931385941764, + "loss": 0.0134, "step": 311970 }, { - "epoch": 1.57, - "learning_rate": 6.390311334890596e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017869542564304615, + "loss": 0.0136, "step": 311980 }, { - "epoch": 1.57, - "learning_rate": 6.389554565589194e-05, - "loss": 0.0093, + "epoch": 0.81, + "learning_rate": 0.0001786915374266747, + "loss": 0.0118, "step": 311990 }, { - "epoch": 1.57, - "learning_rate": 6.388797796287794e-05, - "loss": 0.0116, + "epoch": 0.81, + "learning_rate": 0.00017868764921030327, + "loss": 0.0147, "step": 312000 }, { - "epoch": 1.57, - "eval_cer": 0.914462492734159, - "eval_loss": 0.005281941965222359, - "eval_runtime": 116.1751, - "eval_samples_per_second": 17.215, - "eval_steps_per_second": 4.304, + "epoch": 0.81, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.009489587508141994, + "eval_runtime": 107.733, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 312000 }, { - "epoch": 1.57, - "learning_rate": 6.388041026986393e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017868376099393178, + "loss": 0.0161, "step": 312010 }, { - "epoch": 1.57, - "learning_rate": 6.387284257684991e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.0001786798727775603, + "loss": 0.0142, "step": 312020 }, { - "epoch": 1.57, - "learning_rate": 6.386527488383591e-05, - "loss": 0.0098, + "epoch": 0.81, + "learning_rate": 0.00017867598456118884, + "loss": 0.0109, "step": 312030 }, { - "epoch": 1.57, - "learning_rate": 6.38577071908219e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.0001786720963448174, + "loss": 0.0124, "step": 312040 }, { - "epoch": 1.57, - "learning_rate": 6.385013949780788e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017866820812844592, + "loss": 0.0108, "step": 312050 }, { - "epoch": 1.57, - "learning_rate": 6.384257180479388e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017866431991207446, + "loss": 0.0146, "step": 312060 }, { - "epoch": 1.57, - "learning_rate": 6.383500411177986e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017866043169570298, + "loss": 0.0143, "step": 312070 }, { - "epoch": 1.57, - "learning_rate": 6.382743641876586e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017865654347933154, + "loss": 0.0172, "step": 312080 }, { - "epoch": 1.57, - "learning_rate": 6.381986872575185e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017865265526296006, + "loss": 0.0092, "step": 312090 }, { - "epoch": 1.57, - "learning_rate": 6.381230103273783e-05, - "loss": 0.0113, + "epoch": 0.81, + "learning_rate": 0.0001786487670465886, + "loss": 0.0143, "step": 312100 }, { - "epoch": 1.57, - "learning_rate": 6.380473333972383e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017864487883021711, + "loss": 0.0136, "step": 312110 }, { - "epoch": 1.57, - "learning_rate": 6.379716564670982e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017864099061384566, + "loss": 0.0165, "step": 312120 }, { - "epoch": 1.57, - "learning_rate": 6.37895979536958e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.0001786371023974742, + "loss": 0.015, "step": 312130 }, { - "epoch": 1.57, - "learning_rate": 6.37820302606818e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017863321418110274, + "loss": 0.0131, "step": 312140 }, { - "epoch": 1.57, - "learning_rate": 6.377446256766778e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017862932596473125, + "loss": 0.0149, "step": 312150 }, { - "epoch": 1.57, - "learning_rate": 6.376689487465377e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.0001786254377483598, + "loss": 0.0134, "step": 312160 }, { - "epoch": 1.57, - "learning_rate": 6.375932718163977e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.00017862154953198834, + "loss": 0.0214, "step": 312170 }, { - "epoch": 1.57, - "learning_rate": 6.375175948862575e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017861766131561688, + "loss": 0.0127, "step": 312180 }, { - "epoch": 1.58, - "learning_rate": 6.374419179561173e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.0001786137730992454, + "loss": 0.0136, "step": 312190 }, { - "epoch": 1.58, - "learning_rate": 6.373662410259773e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017860988488287394, + "loss": 0.013, "step": 312200 }, { - "epoch": 1.58, - "learning_rate": 6.372905640958372e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.0001786059966665025, + "loss": 0.0133, "step": 312210 }, { - "epoch": 1.58, - "learning_rate": 6.37214887165697e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017860210845013102, + "loss": 0.0132, "step": 312220 }, { - "epoch": 1.58, - "learning_rate": 6.37139210235557e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017859822023375956, + "loss": 0.0112, "step": 312230 }, { - "epoch": 1.58, - "learning_rate": 6.37063533305417e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017859433201738807, + "loss": 0.0108, "step": 312240 }, { - "epoch": 1.58, - "learning_rate": 6.369878563752768e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017859044380101664, + "loss": 0.0121, "step": 312250 }, { - "epoch": 1.58, - "learning_rate": 6.369121794451367e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017858655558464516, + "loss": 0.0154, "step": 312260 }, { - "epoch": 1.58, - "learning_rate": 6.368365025149965e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.0001785826673682737, + "loss": 0.0129, "step": 312270 }, { - "epoch": 1.58, - "learning_rate": 6.367608255848565e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017857877915190221, + "loss": 0.0159, "step": 312280 }, { - "epoch": 1.58, - "learning_rate": 6.366851486547164e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017857489093553078, + "loss": 0.0139, "step": 312290 }, { - "epoch": 1.58, - "learning_rate": 6.366094717245762e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.0001785710027191593, + "loss": 0.0109, "step": 312300 }, { - "epoch": 1.58, - "learning_rate": 6.365337947944362e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.00017856711450278784, + "loss": 0.0139, "step": 312310 }, { - "epoch": 1.58, - "learning_rate": 6.364581178642961e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017856322628641635, + "loss": 0.0115, "step": 312320 }, { - "epoch": 1.58, - "learning_rate": 6.36382440934156e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017855933807004492, + "loss": 0.0146, "step": 312330 }, { - "epoch": 1.58, - "learning_rate": 6.363067640040159e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017855544985367344, + "loss": 0.0151, "step": 312340 }, { - "epoch": 1.58, - "learning_rate": 6.362310870738757e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017855156163730198, + "loss": 0.0143, "step": 312350 }, { - "epoch": 1.58, - "learning_rate": 6.361554101437357e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.0001785476734209305, + "loss": 0.0158, "step": 312360 }, { - "epoch": 1.58, - "learning_rate": 6.360797332135956e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017854378520455903, + "loss": 0.0114, "step": 312370 }, { - "epoch": 1.58, - "learning_rate": 6.360040562834554e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.0001785398969881876, + "loss": 0.0125, "step": 312380 }, { - "epoch": 1.58, - "learning_rate": 6.359283793533154e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.00017853600877181612, + "loss": 0.0136, "step": 312390 }, { - "epoch": 1.58, - "learning_rate": 6.358527024231753e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017853212055544466, + "loss": 0.0143, "step": 312400 }, { - "epoch": 1.58, - "learning_rate": 6.357770254930351e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017852823233907317, + "loss": 0.0119, "step": 312410 }, { - "epoch": 1.58, - "learning_rate": 6.357013485628951e-05, - "loss": 0.0116, + "epoch": 0.81, + "learning_rate": 0.00017852434412270174, + "loss": 0.0155, "step": 312420 }, { - "epoch": 1.58, - "learning_rate": 6.356256716327549e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017852045590633026, + "loss": 0.0131, "step": 312430 }, { - "epoch": 1.58, - "learning_rate": 6.355499947026149e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.0001785165676899588, + "loss": 0.0112, "step": 312440 }, { - "epoch": 1.58, - "learning_rate": 6.354743177724748e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017851267947358731, + "loss": 0.0167, "step": 312450 }, { - "epoch": 1.58, - "learning_rate": 6.353986408423346e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017850879125721588, + "loss": 0.0172, "step": 312460 }, { - "epoch": 1.58, - "learning_rate": 6.353229639121946e-05, - "loss": 0.0099, + "epoch": 0.81, + "learning_rate": 0.0001785049030408444, + "loss": 0.0144, "step": 312470 }, { - "epoch": 1.58, - "learning_rate": 6.352472869820545e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017850101482447294, + "loss": 0.0129, "step": 312480 }, { - "epoch": 1.58, - "learning_rate": 6.351716100519143e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017849712660810145, + "loss": 0.0127, "step": 312490 }, { - "epoch": 1.58, - "learning_rate": 6.350959331217741e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017849323839173002, + "loss": 0.0128, "step": 312500 }, { - "epoch": 1.58, - "learning_rate": 6.350202561916341e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017848935017535854, + "loss": 0.0162, "step": 312510 }, { - "epoch": 1.58, - "learning_rate": 6.349445792614939e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017848546195898708, + "loss": 0.0174, "step": 312520 }, { - "epoch": 1.58, - "learning_rate": 6.348689023313539e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.0001784815737426156, + "loss": 0.0145, "step": 312530 }, { - "epoch": 1.58, - "learning_rate": 6.347932254012138e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017847768552624416, + "loss": 0.0143, "step": 312540 }, { - "epoch": 1.58, - "learning_rate": 6.347175484710736e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.0001784737973098727, + "loss": 0.0135, "step": 312550 }, { - "epoch": 1.58, - "learning_rate": 6.346418715409336e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017846990909350122, + "loss": 0.0176, "step": 312560 }, { - "epoch": 1.58, - "learning_rate": 6.345661946107935e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017846602087712973, + "loss": 0.0144, "step": 312570 }, { - "epoch": 1.58, - "learning_rate": 6.344905176806533e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.0001784621326607583, + "loss": 0.0121, "step": 312580 }, { - "epoch": 1.58, - "learning_rate": 6.344148407505133e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017845824444438684, + "loss": 0.0129, "step": 312590 }, { - "epoch": 1.58, - "learning_rate": 6.343391638203731e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.00017845435622801536, + "loss": 0.0146, "step": 312600 }, { - "epoch": 1.58, - "learning_rate": 6.34263486890233e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.0001784504680116439, + "loss": 0.0148, "step": 312610 }, { - "epoch": 1.58, - "learning_rate": 6.34187809960093e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.0001784465797952724, + "loss": 0.0111, "step": 312620 }, { - "epoch": 1.58, - "learning_rate": 6.341121330299528e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017844269157890098, + "loss": 0.0106, "step": 312630 }, { - "epoch": 1.58, - "learning_rate": 6.340364560998128e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.0001784388033625295, + "loss": 0.0143, "step": 312640 }, { - "epoch": 1.58, - "learning_rate": 6.339607791696727e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017843491514615804, + "loss": 0.0189, "step": 312650 }, { - "epoch": 1.58, - "learning_rate": 6.338851022395325e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017843102692978655, + "loss": 0.0149, "step": 312660 }, { - "epoch": 1.58, - "learning_rate": 6.338094253093925e-05, - "loss": 0.0091, + "epoch": 0.81, + "learning_rate": 0.00017842713871341512, + "loss": 0.0147, "step": 312670 }, { - "epoch": 1.58, - "learning_rate": 6.337337483792523e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017842325049704364, + "loss": 0.0133, "step": 312680 }, { - "epoch": 1.58, - "learning_rate": 6.336580714491122e-05, - "loss": 0.0082, + "epoch": 0.81, + "learning_rate": 0.00017841936228067218, + "loss": 0.0134, "step": 312690 }, { - "epoch": 1.58, - "learning_rate": 6.335823945189722e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.0001784154740643007, + "loss": 0.0131, "step": 312700 }, { - "epoch": 1.58, - "learning_rate": 6.33506717588832e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017841158584792926, + "loss": 0.0162, "step": 312710 }, { - "epoch": 1.58, - "learning_rate": 6.33431040658692e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017840769763155778, + "loss": 0.0159, "step": 312720 }, { - "epoch": 1.58, - "learning_rate": 6.333553637285519e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017840380941518632, + "loss": 0.0135, "step": 312730 }, { - "epoch": 1.58, - "learning_rate": 6.332796867984117e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017839992119881483, + "loss": 0.0172, "step": 312740 }, { - "epoch": 1.58, - "learning_rate": 6.332040098682717e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.0001783960329824434, + "loss": 0.0145, "step": 312750 }, { - "epoch": 1.58, - "learning_rate": 6.331283329381316e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017839214476607194, + "loss": 0.0158, "step": 312760 }, { - "epoch": 1.58, - "learning_rate": 6.330526560079914e-05, - "loss": 0.0092, + "epoch": 0.81, + "learning_rate": 0.00017838825654970046, + "loss": 0.0118, "step": 312770 }, { - "epoch": 1.58, - "learning_rate": 6.329769790778514e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.000178384368333329, + "loss": 0.0138, "step": 312780 }, { - "epoch": 1.58, - "learning_rate": 6.329013021477112e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017838048011695754, + "loss": 0.0159, "step": 312790 }, { - "epoch": 1.58, - "learning_rate": 6.328256252175712e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017837659190058608, + "loss": 0.0127, "step": 312800 }, { - "epoch": 1.58, - "learning_rate": 6.32749948287431e-05, - "loss": 0.0109, + "epoch": 0.81, + "learning_rate": 0.0001783727036842146, + "loss": 0.0187, "step": 312810 }, { - "epoch": 1.58, - "learning_rate": 6.326742713572909e-05, - "loss": 0.0049, + "epoch": 0.81, + "learning_rate": 0.00017836881546784314, + "loss": 0.013, "step": 312820 }, { - "epoch": 1.58, - "learning_rate": 6.325985944271507e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017836492725147168, + "loss": 0.0146, "step": 312830 }, { - "epoch": 1.58, - "learning_rate": 6.325229174970107e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017836103903510022, + "loss": 0.0147, "step": 312840 }, { - "epoch": 1.58, - "learning_rate": 6.324472405668706e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017835715081872874, + "loss": 0.0114, "step": 312850 }, { - "epoch": 1.58, - "learning_rate": 6.323715636367304e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017835326260235728, + "loss": 0.0157, "step": 312860 }, { - "epoch": 1.58, - "learning_rate": 6.322958867065904e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.0001783493743859858, + "loss": 0.0126, "step": 312870 }, { - "epoch": 1.58, - "learning_rate": 6.322202097764502e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.00017834548616961436, + "loss": 0.0136, "step": 312880 }, { - "epoch": 1.58, - "learning_rate": 6.321445328463102e-05, - "loss": 0.0087, + "epoch": 0.81, + "learning_rate": 0.00017834159795324287, + "loss": 0.0135, "step": 312890 }, { - "epoch": 1.58, - "learning_rate": 6.320688559161701e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017833770973687142, + "loss": 0.0138, "step": 312900 }, { - "epoch": 1.58, - "learning_rate": 6.319931789860299e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017833382152049993, + "loss": 0.0168, "step": 312910 }, { - "epoch": 1.58, - "learning_rate": 6.319175020558899e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.0001783299333041285, + "loss": 0.0139, "step": 312920 }, { - "epoch": 1.58, - "learning_rate": 6.318418251257498e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017832604508775704, + "loss": 0.0132, "step": 312930 }, { - "epoch": 1.58, - "learning_rate": 6.317661481956096e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017832215687138556, + "loss": 0.0131, "step": 312940 }, { - "epoch": 1.58, - "learning_rate": 6.316904712654696e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.0001783182686550141, + "loss": 0.0148, "step": 312950 }, { - "epoch": 1.58, - "learning_rate": 6.316147943353294e-05, - "loss": 0.0083, + "epoch": 0.81, + "learning_rate": 0.00017831438043864264, + "loss": 0.0151, "step": 312960 }, { - "epoch": 1.58, - "learning_rate": 6.315391174051894e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017831049222227118, + "loss": 0.0138, "step": 312970 }, { - "epoch": 1.58, - "learning_rate": 6.314634404750493e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.0001783066040058997, + "loss": 0.0103, "step": 312980 }, { - "epoch": 1.58, - "learning_rate": 6.313877635449091e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017830271578952824, + "loss": 0.0135, "step": 312990 }, { - "epoch": 1.58, - "learning_rate": 6.313120866147691e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017829882757315678, + "loss": 0.0127, "step": 313000 }, { - "epoch": 1.58, - "eval_cer": 0.914438232831024, - "eval_loss": 0.005189271178096533, - "eval_runtime": 116.2305, - "eval_samples_per_second": 17.207, - "eval_steps_per_second": 4.302, + "epoch": 0.81, + "eval_cer": 0.8817208816033121, + "eval_loss": 0.009489119984209538, + "eval_runtime": 107.6322, + "eval_samples_per_second": 18.582, + "eval_steps_per_second": 4.645, "step": 313000 }, { - "epoch": 1.58, - "learning_rate": 6.31236409684629e-05, - "loss": 0.0081, + "epoch": 0.81, + "learning_rate": 0.00017829493935678532, + "loss": 0.0174, "step": 313010 }, { - "epoch": 1.58, - "learning_rate": 6.311607327544888e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017829105114041383, + "loss": 0.0113, "step": 313020 }, { - "epoch": 1.58, - "learning_rate": 6.310850558243488e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017828716292404238, + "loss": 0.0159, "step": 313030 }, { - "epoch": 1.58, - "learning_rate": 6.310093788942086e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017828327470767092, + "loss": 0.0129, "step": 313040 }, { - "epoch": 1.58, - "learning_rate": 6.309337019640685e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017827938649129946, + "loss": 0.0109, "step": 313050 }, { - "epoch": 1.58, - "learning_rate": 6.308580250339285e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017827549827492797, + "loss": 0.0133, "step": 313060 }, { - "epoch": 1.58, - "learning_rate": 6.307823481037883e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017827161005855652, + "loss": 0.0138, "step": 313070 }, { - "epoch": 1.58, - "learning_rate": 6.307066711736483e-05, - "loss": 0.0082, + "epoch": 0.81, + "learning_rate": 0.00017826772184218508, + "loss": 0.0117, "step": 313080 }, { - "epoch": 1.58, - "learning_rate": 6.306309942435082e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.0001782638336258136, + "loss": 0.0126, "step": 313090 }, { - "epoch": 1.58, - "learning_rate": 6.30555317313368e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017825994540944214, + "loss": 0.0115, "step": 313100 }, { - "epoch": 1.58, - "learning_rate": 6.30479640383228e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017825605719307066, + "loss": 0.0152, "step": 313110 }, { - "epoch": 1.58, - "learning_rate": 6.304039634530878e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.0001782521689766992, + "loss": 0.0107, "step": 313120 }, { - "epoch": 1.58, - "learning_rate": 6.303282865229476e-05, - "loss": 0.0097, + "epoch": 0.81, + "learning_rate": 0.00017824828076032774, + "loss": 0.0191, "step": 313130 }, { - "epoch": 1.58, - "learning_rate": 6.302526095928076e-05, - "loss": 0.0082, + "epoch": 0.81, + "learning_rate": 0.00017824439254395628, + "loss": 0.0161, "step": 313140 }, { - "epoch": 1.58, - "learning_rate": 6.301769326626675e-05, - "loss": 0.0066, + "epoch": 0.81, + "learning_rate": 0.0001782405043275848, + "loss": 0.0103, "step": 313150 }, { - "epoch": 1.58, - "learning_rate": 6.301012557325273e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017823661611121334, + "loss": 0.0144, "step": 313160 }, { - "epoch": 1.58, - "learning_rate": 6.300255788023873e-05, - "loss": 0.0052, + "epoch": 0.81, + "learning_rate": 0.00017823272789484188, + "loss": 0.0161, "step": 313170 }, { - "epoch": 1.58, - "learning_rate": 6.299499018722472e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017822883967847042, + "loss": 0.0126, "step": 313180 }, { - "epoch": 1.58, - "learning_rate": 6.29874224942107e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017822495146209893, + "loss": 0.0112, "step": 313190 }, { - "epoch": 1.58, - "learning_rate": 6.29798548011967e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017822106324572748, + "loss": 0.0139, "step": 313200 }, { - "epoch": 1.58, - "learning_rate": 6.29722871081827e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017821717502935602, + "loss": 0.0139, "step": 313210 }, { - "epoch": 1.58, - "learning_rate": 6.296471941516867e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017821328681298456, + "loss": 0.0117, "step": 313220 }, { - "epoch": 1.58, - "learning_rate": 6.295715172215467e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017820939859661307, + "loss": 0.0154, "step": 313230 }, { - "epoch": 1.58, - "learning_rate": 6.294958402914065e-05, - "loss": 0.0084, + "epoch": 0.81, + "learning_rate": 0.00017820551038024162, + "loss": 0.0154, "step": 313240 }, { - "epoch": 1.58, - "learning_rate": 6.294201633612665e-05, - "loss": 0.005, + "epoch": 0.81, + "learning_rate": 0.00017820162216387018, + "loss": 0.0117, "step": 313250 }, { - "epoch": 1.58, - "learning_rate": 6.293444864311264e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.0001781977339474987, + "loss": 0.0138, "step": 313260 }, { - "epoch": 1.58, - "learning_rate": 6.292688095009862e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017819384573112724, + "loss": 0.0189, "step": 313270 }, { - "epoch": 1.58, - "learning_rate": 6.291931325708462e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017818995751475575, + "loss": 0.0158, "step": 313280 }, { - "epoch": 1.58, - "learning_rate": 6.291174556407061e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.00017818606929838432, + "loss": 0.0177, "step": 313290 }, { - "epoch": 1.58, - "learning_rate": 6.29041778710566e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.00017818218108201284, + "loss": 0.0127, "step": 313300 }, { - "epoch": 1.58, - "learning_rate": 6.289661017804259e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017817829286564138, + "loss": 0.0145, "step": 313310 }, { - "epoch": 1.58, - "learning_rate": 6.288904248502857e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.0001781744046492699, + "loss": 0.0184, "step": 313320 }, { - "epoch": 1.58, - "learning_rate": 6.288147479201457e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017817051643289846, + "loss": 0.0142, "step": 313330 }, { - "epoch": 1.58, - "learning_rate": 6.287390709900056e-05, - "loss": 0.0093, + "epoch": 0.81, + "learning_rate": 0.00017816662821652698, + "loss": 0.0136, "step": 313340 }, { - "epoch": 1.58, - "learning_rate": 6.286633940598654e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017816274000015552, + "loss": 0.014, "step": 313350 }, { - "epoch": 1.58, - "learning_rate": 6.285877171297254e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017815885178378403, + "loss": 0.0124, "step": 313360 }, { - "epoch": 1.58, - "learning_rate": 6.285120401995853e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017815496356741258, + "loss": 0.0108, "step": 313370 }, { - "epoch": 1.58, - "learning_rate": 6.284363632694451e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017815107535104112, + "loss": 0.0105, "step": 313380 }, { - "epoch": 1.58, - "learning_rate": 6.283606863393051e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017814718713466966, + "loss": 0.015, "step": 313390 }, { - "epoch": 1.58, - "learning_rate": 6.282850094091649e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017814329891829817, + "loss": 0.017, "step": 313400 }, { - "epoch": 1.58, - "learning_rate": 6.282093324790249e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017813941070192671, + "loss": 0.0134, "step": 313410 }, { - "epoch": 1.58, - "learning_rate": 6.281336555488848e-05, - "loss": 0.0071, + "epoch": 0.81, + "learning_rate": 0.00017813552248555528, + "loss": 0.0144, "step": 313420 }, { - "epoch": 1.58, - "learning_rate": 6.280579786187446e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.0001781316342691838, + "loss": 0.0182, "step": 313430 }, { - "epoch": 1.58, - "learning_rate": 6.279823016886044e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.0001781277460528123, + "loss": 0.0171, "step": 313440 }, { - "epoch": 1.58, - "learning_rate": 6.279066247584644e-05, - "loss": 0.0086, + "epoch": 0.81, + "learning_rate": 0.00017812385783644085, + "loss": 0.0147, "step": 313450 }, { - "epoch": 1.58, - "learning_rate": 6.278309478283243e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017811996962006942, + "loss": 0.0146, "step": 313460 }, { - "epoch": 1.58, - "learning_rate": 6.277552708981841e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017811608140369794, + "loss": 0.0122, "step": 313470 }, { - "epoch": 1.58, - "learning_rate": 6.276795939680441e-05, - "loss": 0.0092, + "epoch": 0.81, + "learning_rate": 0.00017811219318732648, + "loss": 0.0158, "step": 313480 }, { - "epoch": 1.58, - "learning_rate": 6.276039170379039e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.000178108304970955, + "loss": 0.0169, "step": 313490 }, { - "epoch": 1.58, - "learning_rate": 6.275282401077639e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017810441675458356, + "loss": 0.0125, "step": 313500 }, { - "epoch": 1.58, - "learning_rate": 6.274525631776238e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017810052853821208, + "loss": 0.0133, "step": 313510 }, { - "epoch": 1.58, - "learning_rate": 6.273768862474836e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017809664032184062, + "loss": 0.0178, "step": 313520 }, { - "epoch": 1.58, - "learning_rate": 6.273012093173436e-05, - "loss": 0.01, + "epoch": 0.81, + "learning_rate": 0.00017809275210546913, + "loss": 0.0139, "step": 313530 }, { - "epoch": 1.58, - "learning_rate": 6.272255323872035e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.0001780888638890977, + "loss": 0.0141, "step": 313540 }, { - "epoch": 1.58, - "learning_rate": 6.271498554570633e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017808497567272622, + "loss": 0.0156, "step": 313550 }, { - "epoch": 1.58, - "learning_rate": 6.270741785269233e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017808108745635476, + "loss": 0.0113, "step": 313560 }, { - "epoch": 1.58, - "learning_rate": 6.269985015967831e-05, - "loss": 0.0097, + "epoch": 0.81, + "learning_rate": 0.00017807719923998327, + "loss": 0.0129, "step": 313570 }, { - "epoch": 1.58, - "learning_rate": 6.26922824666643e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017807331102361184, + "loss": 0.0129, "step": 313580 }, { - "epoch": 1.58, - "learning_rate": 6.26847147736503e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017806942280724038, + "loss": 0.0131, "step": 313590 }, { - "epoch": 1.58, - "learning_rate": 6.267714708063628e-05, - "loss": 0.0096, + "epoch": 0.81, + "learning_rate": 0.0001780655345908689, + "loss": 0.0132, "step": 313600 }, { - "epoch": 1.58, - "learning_rate": 6.266957938762228e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.0001780616463744974, + "loss": 0.0166, "step": 313610 }, { - "epoch": 1.58, - "learning_rate": 6.266201169460827e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017805775815812595, + "loss": 0.0147, "step": 313620 }, { - "epoch": 1.58, - "learning_rate": 6.265444400159425e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017805386994175452, + "loss": 0.0172, "step": 313630 }, { - "epoch": 1.58, - "learning_rate": 6.264687630858025e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017804998172538304, + "loss": 0.0171, "step": 313640 }, { - "epoch": 1.58, - "learning_rate": 6.263930861556623e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017804609350901158, + "loss": 0.0148, "step": 313650 }, { - "epoch": 1.58, - "learning_rate": 6.263174092255222e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.0001780422052926401, + "loss": 0.0194, "step": 313660 }, { - "epoch": 1.58, - "learning_rate": 6.262417322953822e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.00017803831707626866, + "loss": 0.0142, "step": 313670 }, { - "epoch": 1.58, - "learning_rate": 6.26166055365242e-05, - "loss": 0.005, + "epoch": 0.81, + "learning_rate": 0.00017803442885989718, + "loss": 0.0141, "step": 313680 }, { - "epoch": 1.58, - "learning_rate": 6.26090378435102e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017803054064352572, + "loss": 0.014, "step": 313690 }, { - "epoch": 1.58, - "learning_rate": 6.260147015049619e-05, - "loss": 0.0051, + "epoch": 0.81, + "learning_rate": 0.00017802665242715423, + "loss": 0.0159, "step": 313700 }, { - "epoch": 1.58, - "learning_rate": 6.259390245748217e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.0001780227642107828, + "loss": 0.0111, "step": 313710 }, { - "epoch": 1.58, - "learning_rate": 6.258633476446817e-05, - "loss": 0.0058, + "epoch": 0.81, + "learning_rate": 0.00017801887599441132, + "loss": 0.0144, "step": 313720 }, { - "epoch": 1.58, - "learning_rate": 6.257876707145416e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017801498777803986, + "loss": 0.0159, "step": 313730 }, { - "epoch": 1.58, - "learning_rate": 6.257119937844014e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017801109956166837, + "loss": 0.0148, "step": 313740 }, { - "epoch": 1.58, - "learning_rate": 6.256363168542614e-05, - "loss": 0.0087, + "epoch": 0.81, + "learning_rate": 0.00017800721134529694, + "loss": 0.0129, "step": 313750 }, { - "epoch": 1.58, - "learning_rate": 6.255606399241212e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017800332312892546, + "loss": 0.0185, "step": 313760 }, { - "epoch": 1.58, - "learning_rate": 6.25484962993981e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.000177999434912554, + "loss": 0.0144, "step": 313770 }, { - "epoch": 1.58, - "learning_rate": 6.25409286063841e-05, - "loss": 0.0074, + "epoch": 0.81, + "learning_rate": 0.0001779955466961825, + "loss": 0.0131, "step": 313780 }, { - "epoch": 1.58, - "learning_rate": 6.253336091337009e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017799165847981108, + "loss": 0.0141, "step": 313790 }, { - "epoch": 1.58, - "learning_rate": 6.252579322035607e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017798777026343962, + "loss": 0.0131, "step": 313800 }, { - "epoch": 1.58, - "learning_rate": 6.251822552734207e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017798388204706814, + "loss": 0.0173, "step": 313810 }, { - "epoch": 1.58, - "learning_rate": 6.251065783432806e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017797999383069668, + "loss": 0.0157, "step": 313820 }, { - "epoch": 1.58, - "learning_rate": 6.250309014131404e-05, - "loss": 0.0069, + "epoch": 0.81, + "learning_rate": 0.00017797610561432522, + "loss": 0.0142, "step": 313830 }, { - "epoch": 1.58, - "learning_rate": 6.249552244830004e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017797221739795376, + "loss": 0.0146, "step": 313840 }, { - "epoch": 1.58, - "learning_rate": 6.248795475528602e-05, - "loss": 0.0075, + "epoch": 0.81, + "learning_rate": 0.00017796832918158228, + "loss": 0.0188, "step": 313850 }, { - "epoch": 1.58, - "learning_rate": 6.248038706227202e-05, - "loss": 0.0089, + "epoch": 0.81, + "learning_rate": 0.00017796444096521082, + "loss": 0.0187, "step": 313860 }, { - "epoch": 1.58, - "learning_rate": 6.247281936925801e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017796055274883933, + "loss": 0.0122, "step": 313870 }, { - "epoch": 1.58, - "learning_rate": 6.246525167624399e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.0001779566645324679, + "loss": 0.0124, "step": 313880 }, { - "epoch": 1.58, - "learning_rate": 6.245768398322999e-05, - "loss": 0.0064, + "epoch": 0.81, + "learning_rate": 0.00017795277631609642, + "loss": 0.0155, "step": 313890 }, { - "epoch": 1.58, - "learning_rate": 6.245011629021598e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.00017794888809972496, + "loss": 0.0122, "step": 313900 }, { - "epoch": 1.58, - "learning_rate": 6.244254859720196e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017794499988335347, + "loss": 0.0112, "step": 313910 }, { - "epoch": 1.58, - "learning_rate": 6.243498090418796e-05, - "loss": 0.0105, + "epoch": 0.81, + "learning_rate": 0.00017794111166698204, + "loss": 0.0132, "step": 313920 }, { - "epoch": 1.58, - "learning_rate": 6.242741321117394e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017793722345061055, + "loss": 0.0159, "step": 313930 }, { - "epoch": 1.58, - "learning_rate": 6.241984551815994e-05, - "loss": 0.007, + "epoch": 0.81, + "learning_rate": 0.0001779333352342391, + "loss": 0.0109, "step": 313940 }, { - "epoch": 1.58, - "learning_rate": 6.241227782514593e-05, - "loss": 0.0062, + "epoch": 0.81, + "learning_rate": 0.0001779294470178676, + "loss": 0.0126, "step": 313950 }, { - "epoch": 1.58, - "learning_rate": 6.240471013213191e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017792555880149618, + "loss": 0.0143, "step": 313960 }, { - "epoch": 1.58, - "learning_rate": 6.23971424391179e-05, - "loss": 0.0068, + "epoch": 0.81, + "learning_rate": 0.00017792167058512472, + "loss": 0.0152, "step": 313970 }, { - "epoch": 1.58, - "learning_rate": 6.23895747461039e-05, - "loss": 0.0085, + "epoch": 0.81, + "learning_rate": 0.00017791778236875324, + "loss": 0.0124, "step": 313980 }, { - "epoch": 1.58, - "learning_rate": 6.238200705308988e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017791389415238178, + "loss": 0.0134, "step": 313990 }, { - "epoch": 1.58, - "learning_rate": 6.237443936007588e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017791000593601032, + "loss": 0.0175, "step": 314000 }, { - "epoch": 1.58, - "eval_cer": 0.9144314400581461, - "eval_loss": 0.005062195006757975, - "eval_runtime": 116.4946, - "eval_samples_per_second": 17.168, - "eval_steps_per_second": 4.292, + "epoch": 0.81, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.00921955332159996, + "eval_runtime": 107.7056, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, "step": 314000 }, { - "epoch": 1.58, - "learning_rate": 6.236687166706186e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017790611771963886, + "loss": 0.0127, "step": 314010 }, { - "epoch": 1.58, - "learning_rate": 6.235930397404785e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017790222950326738, + "loss": 0.014, "step": 314020 }, { - "epoch": 1.58, - "learning_rate": 6.235173628103385e-05, - "loss": 0.0076, + "epoch": 0.81, + "learning_rate": 0.00017789834128689592, + "loss": 0.0157, "step": 314030 }, { - "epoch": 1.58, - "learning_rate": 6.234416858801983e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.00017789445307052446, + "loss": 0.0136, "step": 314040 }, { - "epoch": 1.58, - "learning_rate": 6.233660089500583e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.000177890564854153, + "loss": 0.0132, "step": 314050 }, { - "epoch": 1.58, - "learning_rate": 6.232903320199182e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017788667663778151, + "loss": 0.0131, "step": 314060 }, { - "epoch": 1.58, - "learning_rate": 6.23214655089778e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017788278842141006, + "loss": 0.0135, "step": 314070 }, { - "epoch": 1.58, - "learning_rate": 6.231389781596378e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.0001778789002050386, + "loss": 0.013, "step": 314080 }, { - "epoch": 1.58, - "learning_rate": 6.230633012294978e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017787501198866714, + "loss": 0.0132, "step": 314090 }, { - "epoch": 1.58, - "learning_rate": 6.229876242993576e-05, - "loss": 0.0063, + "epoch": 0.81, + "learning_rate": 0.00017787112377229565, + "loss": 0.0149, "step": 314100 }, { - "epoch": 1.58, - "learning_rate": 6.229119473692176e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.0001778672355559242, + "loss": 0.0144, "step": 314110 }, { - "epoch": 1.58, - "learning_rate": 6.228362704390775e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.0001778633473395527, + "loss": 0.018, "step": 314120 }, { - "epoch": 1.58, - "learning_rate": 6.227605935089373e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.00017785945912318128, + "loss": 0.013, "step": 314130 }, { - "epoch": 1.58, - "learning_rate": 6.226849165787973e-05, - "loss": 0.0108, + "epoch": 0.81, + "learning_rate": 0.00017785557090680982, + "loss": 0.0133, "step": 314140 }, { - "epoch": 1.58, - "learning_rate": 6.226092396486572e-05, - "loss": 0.0088, + "epoch": 0.81, + "learning_rate": 0.00017785168269043834, + "loss": 0.012, "step": 314150 }, { - "epoch": 1.58, - "learning_rate": 6.22533562718517e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017784779447406685, + "loss": 0.0148, "step": 314160 }, { - "epoch": 1.59, - "learning_rate": 6.22457885788377e-05, - "loss": 0.0061, + "epoch": 0.81, + "learning_rate": 0.00017784390625769542, + "loss": 0.0142, "step": 314170 }, { - "epoch": 1.59, - "learning_rate": 6.223822088582369e-05, - "loss": 0.0057, + "epoch": 0.81, + "learning_rate": 0.00017784001804132396, + "loss": 0.0119, "step": 314180 }, { - "epoch": 1.59, - "learning_rate": 6.223065319280967e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.00017783612982495247, + "loss": 0.016, "step": 314190 }, { - "epoch": 1.59, - "learning_rate": 6.222308549979567e-05, - "loss": 0.0079, + "epoch": 0.81, + "learning_rate": 0.00017783224160858102, + "loss": 0.0145, "step": 314200 }, { - "epoch": 1.59, - "learning_rate": 6.221551780678165e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.00017782835339220956, + "loss": 0.0144, "step": 314210 }, { - "epoch": 1.59, - "learning_rate": 6.220795011376765e-05, - "loss": 0.0054, + "epoch": 0.81, + "learning_rate": 0.0001778244651758381, + "loss": 0.0132, "step": 314220 }, { - "epoch": 1.59, - "learning_rate": 6.220038242075364e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.00017782057695946661, + "loss": 0.0138, "step": 314230 }, { - "epoch": 1.59, - "learning_rate": 6.219281472773962e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017781668874309516, + "loss": 0.0129, "step": 314240 }, { - "epoch": 1.59, - "learning_rate": 6.218524703472562e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.0001778128005267237, + "loss": 0.025, "step": 314250 }, { - "epoch": 1.59, - "learning_rate": 6.217767934171161e-05, - "loss": 0.0044, + "epoch": 0.81, + "learning_rate": 0.00017780891231035224, + "loss": 0.0131, "step": 314260 }, { - "epoch": 1.59, - "learning_rate": 6.21701116486976e-05, - "loss": 0.006, + "epoch": 0.81, + "learning_rate": 0.00017780502409398075, + "loss": 0.0158, "step": 314270 }, { - "epoch": 1.59, - "learning_rate": 6.216254395568359e-05, - "loss": 0.0055, + "epoch": 0.81, + "learning_rate": 0.0001778011358776093, + "loss": 0.0108, "step": 314280 }, { - "epoch": 1.59, - "learning_rate": 6.215497626266957e-05, - "loss": 0.0078, + "epoch": 0.81, + "learning_rate": 0.00017779724766123786, + "loss": 0.0142, "step": 314290 }, { - "epoch": 1.59, - "learning_rate": 6.214740856965557e-05, - "loss": 0.0053, + "epoch": 0.81, + "learning_rate": 0.00017779335944486638, + "loss": 0.0108, "step": 314300 }, { - "epoch": 1.59, - "learning_rate": 6.213984087664156e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.0001777894712284949, + "loss": 0.0107, "step": 314310 }, { - "epoch": 1.59, - "learning_rate": 6.213227318362754e-05, - "loss": 0.0065, + "epoch": 0.81, + "learning_rate": 0.00017778558301212343, + "loss": 0.0153, "step": 314320 }, { - "epoch": 1.59, - "learning_rate": 6.212470549061354e-05, - "loss": 0.0067, + "epoch": 0.81, + "learning_rate": 0.000177781694795752, + "loss": 0.0169, "step": 314330 }, { - "epoch": 1.59, - "learning_rate": 6.211713779759953e-05, - "loss": 0.0048, + "epoch": 0.81, + "learning_rate": 0.00017777780657938052, + "loss": 0.0137, "step": 314340 }, { - "epoch": 1.59, - "learning_rate": 6.210957010458551e-05, - "loss": 0.0059, + "epoch": 0.81, + "learning_rate": 0.00017777391836300906, + "loss": 0.0126, "step": 314350 }, { - "epoch": 1.59, - "learning_rate": 6.210200241157151e-05, - "loss": 0.0077, + "epoch": 0.81, + "learning_rate": 0.00017777003014663757, + "loss": 0.013, "step": 314360 }, { - "epoch": 1.59, - "learning_rate": 6.209443471855749e-05, - "loss": 0.0072, + "epoch": 0.81, + "learning_rate": 0.00017776614193026612, + "loss": 0.0134, "step": 314370 }, { - "epoch": 1.59, - "learning_rate": 6.208686702554347e-05, - "loss": 0.0073, + "epoch": 0.81, + "learning_rate": 0.00017776225371389466, + "loss": 0.0124, "step": 314380 }, { - "epoch": 1.59, - "learning_rate": 6.207929933252947e-05, - "loss": 0.008, + "epoch": 0.81, + "learning_rate": 0.0001777583654975232, + "loss": 0.0141, "step": 314390 }, { - "epoch": 1.59, - "learning_rate": 6.207173163951546e-05, - "loss": 0.009, + "epoch": 0.81, + "learning_rate": 0.0001777544772811517, + "loss": 0.0139, "step": 314400 }, { - "epoch": 1.59, - "learning_rate": 6.206416394650144e-05, - "loss": 0.0056, + "epoch": 0.81, + "learning_rate": 0.00017775058906478026, + "loss": 0.0116, "step": 314410 }, { - "epoch": 1.59, - "learning_rate": 6.205659625348744e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.0001777467008484088, + "loss": 0.0148, "step": 314420 }, { - "epoch": 1.59, - "learning_rate": 6.204902856047343e-05, - "loss": 0.009, + "epoch": 0.82, + "learning_rate": 0.00017774281263203734, + "loss": 0.0115, "step": 314430 }, { - "epoch": 1.59, - "learning_rate": 6.204146086745941e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017773892441566585, + "loss": 0.0142, "step": 314440 }, { - "epoch": 1.59, - "learning_rate": 6.203389317444541e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001777350361992944, + "loss": 0.0146, "step": 314450 }, { - "epoch": 1.59, - "learning_rate": 6.202632548143139e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017773114798292296, + "loss": 0.0131, "step": 314460 }, { - "epoch": 1.59, - "learning_rate": 6.201875778841739e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017772725976655148, + "loss": 0.0124, "step": 314470 }, { - "epoch": 1.59, - "learning_rate": 6.201119009540338e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017772337155018, + "loss": 0.0137, "step": 314480 }, { - "epoch": 1.59, - "learning_rate": 6.200362240238936e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.00017771948333380853, + "loss": 0.0206, "step": 314490 }, { - "epoch": 1.59, - "learning_rate": 6.199605470937536e-05, - "loss": 0.0047, + "epoch": 0.82, + "learning_rate": 0.0001777155951174371, + "loss": 0.0129, "step": 314500 }, { - "epoch": 1.59, - "learning_rate": 6.198848701636135e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.00017771170690106562, + "loss": 0.0146, "step": 314510 }, { - "epoch": 1.59, - "learning_rate": 6.198091932334733e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017770781868469416, + "loss": 0.0162, "step": 314520 }, { - "epoch": 1.59, - "learning_rate": 6.197335163033333e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017770393046832267, + "loss": 0.0152, "step": 314530 }, { - "epoch": 1.59, - "learning_rate": 6.196578393731931e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017770004225195124, + "loss": 0.0146, "step": 314540 }, { - "epoch": 1.59, - "learning_rate": 6.19582162443053e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017769615403557976, + "loss": 0.0103, "step": 314550 }, { - "epoch": 1.59, - "learning_rate": 6.19506485512913e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.0001776922658192083, + "loss": 0.0129, "step": 314560 }, { - "epoch": 1.59, - "learning_rate": 6.194308085827728e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001776883776028368, + "loss": 0.0132, "step": 314570 }, { - "epoch": 1.59, - "learning_rate": 6.193551316526328e-05, - "loss": 0.009, + "epoch": 0.82, + "learning_rate": 0.00017768448938646538, + "loss": 0.0188, "step": 314580 }, { - "epoch": 1.59, - "learning_rate": 6.192794547224927e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.0001776806011700939, + "loss": 0.0136, "step": 314590 }, { - "epoch": 1.59, - "learning_rate": 6.192037777923525e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.00017767671295372244, + "loss": 0.0155, "step": 314600 }, { - "epoch": 1.59, - "learning_rate": 6.191281008622125e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017767282473735095, + "loss": 0.0119, "step": 314610 }, { - "epoch": 1.59, - "learning_rate": 6.190524239320723e-05, - "loss": 0.0094, + "epoch": 0.82, + "learning_rate": 0.0001776689365209795, + "loss": 0.0161, "step": 314620 }, { - "epoch": 1.59, - "learning_rate": 6.189767470019322e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017766504830460804, + "loss": 0.0143, "step": 314630 }, { - "epoch": 1.59, - "learning_rate": 6.189010700717922e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017766116008823658, + "loss": 0.0131, "step": 314640 }, { - "epoch": 1.59, - "learning_rate": 6.18825393141652e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.0001776572718718651, + "loss": 0.0111, "step": 314650 }, { - "epoch": 1.59, - "learning_rate": 6.18749716211512e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017765338365549363, + "loss": 0.0124, "step": 314660 }, { - "epoch": 1.59, - "learning_rate": 6.186740392813719e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.0001776494954391222, + "loss": 0.0148, "step": 314670 }, { - "epoch": 1.59, - "learning_rate": 6.185983623512317e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017764560722275072, + "loss": 0.0159, "step": 314680 }, { - "epoch": 1.59, - "learning_rate": 6.185226854210917e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017764171900637926, + "loss": 0.0122, "step": 314690 }, { - "epoch": 1.59, - "learning_rate": 6.184470084909515e-05, - "loss": 0.0044, + "epoch": 0.82, + "learning_rate": 0.00017763783079000777, + "loss": 0.0144, "step": 314700 }, { - "epoch": 1.59, - "learning_rate": 6.183713315608114e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017763394257363634, + "loss": 0.0175, "step": 314710 }, { - "epoch": 1.59, - "learning_rate": 6.182956546306712e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017763005435726486, + "loss": 0.012, "step": 314720 }, { - "epoch": 1.59, - "learning_rate": 6.182199777005312e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.0001776261661408934, + "loss": 0.0138, "step": 314730 }, { - "epoch": 1.59, - "learning_rate": 6.18144300770391e-05, - "loss": 0.0115, + "epoch": 0.82, + "learning_rate": 0.0001776222779245219, + "loss": 0.0128, "step": 314740 }, { - "epoch": 1.59, - "learning_rate": 6.18068623840251e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017761838970815048, + "loss": 0.0121, "step": 314750 }, { - "epoch": 1.59, - "learning_rate": 6.179929469101109e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.000177614501491779, + "loss": 0.0136, "step": 314760 }, { - "epoch": 1.59, - "learning_rate": 6.179172699799707e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017761061327540754, + "loss": 0.0171, "step": 314770 }, { - "epoch": 1.59, - "learning_rate": 6.178415930498307e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017760672505903605, + "loss": 0.0142, "step": 314780 }, { - "epoch": 1.59, - "learning_rate": 6.177659161196906e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017760283684266462, + "loss": 0.0184, "step": 314790 }, { - "epoch": 1.59, - "learning_rate": 6.176902391895504e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017759894862629313, + "loss": 0.0168, "step": 314800 }, { - "epoch": 1.59, - "learning_rate": 6.176145622594104e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017759506040992168, + "loss": 0.0112, "step": 314810 }, { - "epoch": 1.59, - "learning_rate": 6.175388853292702e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001775911721935502, + "loss": 0.0152, "step": 314820 }, { - "epoch": 1.59, - "learning_rate": 6.174632083991302e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017758728397717876, + "loss": 0.0178, "step": 314830 }, { - "epoch": 1.59, - "learning_rate": 6.173875314689901e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.0001775833957608073, + "loss": 0.0131, "step": 314840 }, { - "epoch": 1.59, - "learning_rate": 6.173118545388499e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017757950754443582, + "loss": 0.0142, "step": 314850 }, { - "epoch": 1.59, - "learning_rate": 6.172361776087099e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017757561932806436, + "loss": 0.0104, "step": 314860 }, { - "epoch": 1.59, - "learning_rate": 6.171605006785698e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017757173111169287, + "loss": 0.0206, "step": 314870 }, { - "epoch": 1.59, - "learning_rate": 6.170848237484296e-05, - "loss": 0.0107, + "epoch": 0.82, + "learning_rate": 0.00017756784289532144, + "loss": 0.0137, "step": 314880 }, { - "epoch": 1.59, - "learning_rate": 6.170091468182896e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.00017756395467894996, + "loss": 0.0163, "step": 314890 }, { - "epoch": 1.59, - "learning_rate": 6.169334698881494e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.0001775600664625785, + "loss": 0.021, "step": 314900 }, { - "epoch": 1.59, - "learning_rate": 6.168577929580093e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.000177556178246207, + "loss": 0.0149, "step": 314910 }, { - "epoch": 1.59, - "learning_rate": 6.167821160278693e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.00017755229002983558, + "loss": 0.0164, "step": 314920 }, { - "epoch": 1.59, - "learning_rate": 6.167064390977291e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001775484018134641, + "loss": 0.0169, "step": 314930 }, { - "epoch": 1.59, - "learning_rate": 6.16630762167589e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017754451359709264, + "loss": 0.0123, "step": 314940 }, { - "epoch": 1.59, - "learning_rate": 6.16555085237449e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017754062538072115, + "loss": 0.0167, "step": 314950 }, { - "epoch": 1.59, - "learning_rate": 6.164794083073088e-05, - "loss": 0.0045, + "epoch": 0.82, + "learning_rate": 0.00017753673716434972, + "loss": 0.0131, "step": 314960 }, { - "epoch": 1.59, - "learning_rate": 6.164037313771688e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017753284894797823, + "loss": 0.0146, "step": 314970 }, { - "epoch": 1.59, - "learning_rate": 6.163280544470286e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017752896073160678, + "loss": 0.0137, "step": 314980 }, { - "epoch": 1.59, - "learning_rate": 6.162523775168885e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.0001775250725152353, + "loss": 0.013, "step": 314990 }, { - "epoch": 1.59, - "learning_rate": 6.161767005867485e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017752118429886386, + "loss": 0.0138, "step": 315000 }, { - "epoch": 1.59, - "eval_cer": 0.9144207657007667, - "eval_loss": 0.005126504693180323, - "eval_runtime": 116.2813, - "eval_samples_per_second": 17.2, - "eval_steps_per_second": 4.3, + "epoch": 0.82, + "eval_cer": 0.8817446754311932, + "eval_loss": 0.009523827582597733, + "eval_runtime": 107.5021, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, "step": 315000 }, { - "epoch": 1.59, - "learning_rate": 6.161010236566083e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001775172960824924, + "loss": 0.0146, "step": 315010 }, { - "epoch": 1.59, - "learning_rate": 6.160253467264681e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017751340786612092, + "loss": 0.0146, "step": 315020 }, { - "epoch": 1.59, - "learning_rate": 6.159496697963281e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.00017750951964974943, + "loss": 0.014, "step": 315030 }, { - "epoch": 1.59, - "learning_rate": 6.15873992866188e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.000177505631433378, + "loss": 0.0107, "step": 315040 }, { - "epoch": 1.59, - "learning_rate": 6.157983159360478e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.00017750174321700654, + "loss": 0.0157, "step": 315050 }, { - "epoch": 1.59, - "learning_rate": 6.157226390059078e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017749785500063505, + "loss": 0.0109, "step": 315060 }, { - "epoch": 1.59, - "learning_rate": 6.156469620757676e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.0001774939667842636, + "loss": 0.0139, "step": 315070 }, { - "epoch": 1.59, - "learning_rate": 6.155712851456275e-05, - "loss": 0.0095, + "epoch": 0.82, + "learning_rate": 0.00017749007856789214, + "loss": 0.0187, "step": 315080 }, { - "epoch": 1.59, - "learning_rate": 6.154956082154875e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017748619035152068, + "loss": 0.0137, "step": 315090 }, { - "epoch": 1.59, - "learning_rate": 6.154199312853473e-05, - "loss": 0.0104, + "epoch": 0.82, + "learning_rate": 0.0001774823021351492, + "loss": 0.0141, "step": 315100 }, { - "epoch": 1.59, - "learning_rate": 6.153442543552073e-05, - "loss": 0.0092, + "epoch": 0.82, + "learning_rate": 0.00017747841391877774, + "loss": 0.0158, "step": 315110 }, { - "epoch": 1.59, - "learning_rate": 6.152685774250672e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017747452570240625, + "loss": 0.0122, "step": 315120 }, { - "epoch": 1.59, - "learning_rate": 6.15192900494927e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017747063748603482, + "loss": 0.0124, "step": 315130 }, { - "epoch": 1.59, - "learning_rate": 6.15117223564787e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017746674926966333, + "loss": 0.0145, "step": 315140 }, { - "epoch": 1.59, - "learning_rate": 6.150415466346469e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017746286105329188, + "loss": 0.0146, "step": 315150 }, { - "epoch": 1.59, - "learning_rate": 6.149658697045067e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.0001774589728369204, + "loss": 0.0146, "step": 315160 }, { - "epoch": 1.59, - "learning_rate": 6.148901927743667e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017745508462054896, + "loss": 0.0124, "step": 315170 }, { - "epoch": 1.59, - "learning_rate": 6.148145158442265e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.0001774511964041775, + "loss": 0.0186, "step": 315180 }, { - "epoch": 1.59, - "learning_rate": 6.147388389140865e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017744730818780601, + "loss": 0.0166, "step": 315190 }, { - "epoch": 1.59, - "learning_rate": 6.146631619839464e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017744341997143453, + "loss": 0.0156, "step": 315200 }, { - "epoch": 1.59, - "learning_rate": 6.145874850538062e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.0001774395317550631, + "loss": 0.0143, "step": 315210 }, { - "epoch": 1.59, - "learning_rate": 6.145118081236662e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.00017743564353869164, + "loss": 0.0141, "step": 315220 }, { - "epoch": 1.59, - "learning_rate": 6.144361311935261e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017743175532232015, + "loss": 0.0122, "step": 315230 }, { - "epoch": 1.59, - "learning_rate": 6.14360454263386e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.0001774278671059487, + "loss": 0.0118, "step": 315240 }, { - "epoch": 1.59, - "learning_rate": 6.142847773332459e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017742397888957724, + "loss": 0.0119, "step": 315250 }, { - "epoch": 1.59, - "learning_rate": 6.142091004031057e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017742009067320578, + "loss": 0.0169, "step": 315260 }, { - "epoch": 1.59, - "learning_rate": 6.141334234729656e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001774162024568343, + "loss": 0.0136, "step": 315270 }, { - "epoch": 1.59, - "learning_rate": 6.140577465428256e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017741231424046284, + "loss": 0.0134, "step": 315280 }, { - "epoch": 1.59, - "learning_rate": 6.139820696126854e-05, - "loss": 0.006, - "step": 315290 + "epoch": 0.82, + "learning_rate": 0.00017740842602409138, + "loss": 0.0146, + "step": 315290 }, { - "epoch": 1.59, - "learning_rate": 6.139063926825454e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017740453780771992, + "loss": 0.0131, "step": 315300 }, { - "epoch": 1.59, - "learning_rate": 6.138307157524053e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017740064959134843, + "loss": 0.0158, "step": 315310 }, { - "epoch": 1.59, - "learning_rate": 6.137550388222651e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017739676137497697, + "loss": 0.0402, "step": 315320 }, { - "epoch": 1.59, - "learning_rate": 6.13679361892125e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017739287315860554, + "loss": 0.0161, "step": 315330 }, { - "epoch": 1.59, - "learning_rate": 6.136036849619849e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017738898494223406, + "loss": 0.0141, "step": 315340 }, { - "epoch": 1.59, - "learning_rate": 6.135280080318447e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017738509672586257, + "loss": 0.0138, "step": 315350 }, { - "epoch": 1.59, - "learning_rate": 6.134523311017047e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017738120850949111, + "loss": 0.0114, "step": 315360 }, { - "epoch": 1.59, - "learning_rate": 6.133766541715646e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017737732029311963, + "loss": 0.0159, "step": 315370 }, { - "epoch": 1.59, - "learning_rate": 6.133009772414244e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.0001773734320767482, + "loss": 0.0168, "step": 315380 }, { - "epoch": 1.59, - "learning_rate": 6.132253003112844e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017736954386037674, + "loss": 0.0099, "step": 315390 }, { - "epoch": 1.59, - "learning_rate": 6.131496233811443e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017736565564400525, + "loss": 0.0132, "step": 315400 }, { - "epoch": 1.59, - "learning_rate": 6.130739464510041e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.0001773617674276338, + "loss": 0.0151, "step": 315410 }, { - "epoch": 1.59, - "learning_rate": 6.129982695208641e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017735787921126234, + "loss": 0.0133, "step": 315420 }, { - "epoch": 1.59, - "learning_rate": 6.129225925907239e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017735399099489088, + "loss": 0.0198, "step": 315430 }, { - "epoch": 1.59, - "learning_rate": 6.128469156605838e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.0001773501027785194, + "loss": 0.0172, "step": 315440 }, { - "epoch": 1.59, - "learning_rate": 6.127712387304438e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017734621456214793, + "loss": 0.0158, "step": 315450 }, { - "epoch": 1.59, - "learning_rate": 6.126955618003036e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017734232634577648, + "loss": 0.0158, "step": 315460 }, { - "epoch": 1.59, - "learning_rate": 6.126198848701636e-05, - "loss": 0.0102, + "epoch": 0.82, + "learning_rate": 0.00017733843812940502, + "loss": 0.0146, "step": 315470 }, { - "epoch": 1.59, - "learning_rate": 6.125442079400235e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017733454991303353, + "loss": 0.0151, "step": 315480 }, { - "epoch": 1.59, - "learning_rate": 6.124685310098833e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017733066169666207, + "loss": 0.012, "step": 315490 }, { - "epoch": 1.59, - "learning_rate": 6.123928540797433e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017732677348029062, + "loss": 0.0114, "step": 315500 }, { - "epoch": 1.59, - "learning_rate": 6.123171771496031e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.00017732288526391916, + "loss": 0.0147, "step": 315510 }, { - "epoch": 1.59, - "learning_rate": 6.12241500219463e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017731899704754767, + "loss": 0.0123, "step": 315520 }, { - "epoch": 1.59, - "learning_rate": 6.12165823289323e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017731510883117621, + "loss": 0.0131, "step": 315530 }, { - "epoch": 1.59, - "learning_rate": 6.120901463591828e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017731122061480478, + "loss": 0.0135, "step": 315540 }, { - "epoch": 1.59, - "learning_rate": 6.120144694290428e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.0001773073323984333, + "loss": 0.015, "step": 315550 }, { - "epoch": 1.59, - "learning_rate": 6.119387924989027e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.00017730344418206184, + "loss": 0.0126, "step": 315560 }, { - "epoch": 1.59, - "learning_rate": 6.118631155687625e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.00017729955596569035, + "loss": 0.0169, "step": 315570 }, { - "epoch": 1.59, - "learning_rate": 6.117874386386225e-05, - "loss": 0.0081, + "epoch": 0.82, + "learning_rate": 0.00017729566774931892, + "loss": 0.0127, "step": 315580 }, { - "epoch": 1.59, - "learning_rate": 6.117117617084823e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017729177953294744, + "loss": 0.0125, "step": 315590 }, { - "epoch": 1.59, - "learning_rate": 6.116360847783422e-05, - "loss": 0.0094, + "epoch": 0.82, + "learning_rate": 0.00017728789131657598, + "loss": 0.0164, "step": 315600 }, { - "epoch": 1.59, - "learning_rate": 6.115604078482022e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.0001772840031002045, + "loss": 0.011, "step": 315610 }, { - "epoch": 1.59, - "learning_rate": 6.11484730918062e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017728011488383303, + "loss": 0.0146, "step": 315620 }, { - "epoch": 1.59, - "learning_rate": 6.11409053987922e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017727622666746158, + "loss": 0.0165, "step": 315630 }, { - "epoch": 1.59, - "learning_rate": 6.113333770577818e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017727233845109012, + "loss": 0.015, "step": 315640 }, { - "epoch": 1.59, - "learning_rate": 6.112577001276417e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017726845023471863, + "loss": 0.0125, "step": 315650 }, { - "epoch": 1.59, - "learning_rate": 6.111820231975015e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017726456201834717, + "loss": 0.0127, "step": 315660 }, { - "epoch": 1.59, - "learning_rate": 6.111063462673615e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017726067380197572, + "loss": 0.0113, "step": 315670 }, { - "epoch": 1.59, - "learning_rate": 6.110306693372214e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.00017725678558560426, + "loss": 0.0183, "step": 315680 }, { - "epoch": 1.59, - "learning_rate": 6.109549924070812e-05, - "loss": 0.0111, + "epoch": 0.82, + "learning_rate": 0.00017725289736923277, + "loss": 0.0128, "step": 315690 }, { - "epoch": 1.59, - "learning_rate": 6.108793154769412e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.0001772490091528613, + "loss": 0.0158, "step": 315700 }, { - "epoch": 1.59, - "learning_rate": 6.10803638546801e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017724512093648988, + "loss": 0.0151, "step": 315710 }, { - "epoch": 1.59, - "learning_rate": 6.10727961616661e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.0001772412327201184, + "loss": 0.0124, "step": 315720 }, { - "epoch": 1.59, - "learning_rate": 6.106522846865209e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017723734450374694, + "loss": 0.0124, "step": 315730 }, { - "epoch": 1.59, - "learning_rate": 6.105766077563807e-05, - "loss": 0.009, + "epoch": 0.82, + "learning_rate": 0.00017723345628737545, + "loss": 0.0137, "step": 315740 }, { - "epoch": 1.59, - "learning_rate": 6.105009308262407e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017722956807100402, + "loss": 0.0114, "step": 315750 }, { - "epoch": 1.59, - "learning_rate": 6.104252538961006e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017722567985463254, + "loss": 0.0131, "step": 315760 }, { - "epoch": 1.59, - "learning_rate": 6.1034957696596043e-05, - "loss": 0.0092, + "epoch": 0.82, + "learning_rate": 0.00017722179163826108, + "loss": 0.0138, "step": 315770 }, { - "epoch": 1.59, - "learning_rate": 6.102739000358204e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.0001772179034218896, + "loss": 0.0129, "step": 315780 }, { - "epoch": 1.59, - "learning_rate": 6.101982231056803e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017721401520551816, + "loss": 0.0123, "step": 315790 }, { - "epoch": 1.59, - "learning_rate": 6.1012254617554015e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017721012698914668, + "loss": 0.0128, "step": 315800 }, { - "epoch": 1.59, - "learning_rate": 6.100468692454e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017720623877277522, + "loss": 0.0152, "step": 315810 }, { - "epoch": 1.59, - "learning_rate": 6.0997119231526e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017720235055640373, + "loss": 0.017, "step": 315820 }, { - "epoch": 1.59, - "learning_rate": 6.0989551538511986e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.0001771984623400323, + "loss": 0.0126, "step": 315830 }, { - "epoch": 1.59, - "learning_rate": 6.0981983845497975e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017719457412366081, + "loss": 0.0146, "step": 315840 }, { - "epoch": 1.59, - "learning_rate": 6.097441615248396e-05, + "epoch": 0.82, + "learning_rate": 0.00017719068590728936, "loss": 0.012, "step": 315850 }, { - "epoch": 1.59, - "learning_rate": 6.096684845946996e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017718679769091787, + "loss": 0.0142, "step": 315860 }, { - "epoch": 1.59, - "learning_rate": 6.0959280766455946e-05, - "loss": 0.0114, + "epoch": 0.82, + "learning_rate": 0.0001771829094745464, + "loss": 0.011, "step": 315870 }, { - "epoch": 1.59, - "learning_rate": 6.0951713073441934e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017717902125817498, + "loss": 0.0167, "step": 315880 }, { - "epoch": 1.59, - "learning_rate": 6.094414538042792e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001771751330418035, + "loss": 0.0164, "step": 315890 }, { - "epoch": 1.59, - "learning_rate": 6.093657768741392e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.000177171244825432, + "loss": 0.0121, "step": 315900 }, { - "epoch": 1.59, - "learning_rate": 6.0929009994399906e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.00017716735660906055, + "loss": 0.0134, "step": 315910 }, { - "epoch": 1.59, - "learning_rate": 6.0921442301385894e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017716346839268912, + "loss": 0.0137, "step": 315920 }, { - "epoch": 1.59, - "learning_rate": 6.091387460837188e-05, - "loss": 0.0048, + "epoch": 0.82, + "learning_rate": 0.00017715958017631764, + "loss": 0.0136, "step": 315930 }, { - "epoch": 1.59, - "learning_rate": 6.090630691535788e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017715569195994618, + "loss": 0.0118, "step": 315940 }, { - "epoch": 1.59, - "learning_rate": 6.089873922234386e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.0001771518037435747, + "loss": 0.0123, "step": 315950 }, { - "epoch": 1.59, - "learning_rate": 6.089117152932985e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017714791552720326, + "loss": 0.0117, "step": 315960 }, { - "epoch": 1.59, - "learning_rate": 6.0883603836315835e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017714402731083177, + "loss": 0.0118, "step": 315970 }, { - "epoch": 1.59, - "learning_rate": 6.087603614330182e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017714013909446032, + "loss": 0.0132, "step": 315980 }, { - "epoch": 1.59, - "learning_rate": 6.086846845028782e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017713625087808883, + "loss": 0.0145, "step": 315990 }, { - "epoch": 1.59, - "learning_rate": 6.0860900757273806e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.0001771323626617174, + "loss": 0.0163, "step": 316000 }, { - "epoch": 1.59, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.005030008032917976, - "eval_runtime": 116.3264, - "eval_samples_per_second": 17.193, - "eval_steps_per_second": 4.298, + "epoch": 0.82, + "eval_cer": 0.8817068852339703, + "eval_loss": 0.00930152740329504, + "eval_runtime": 107.6124, + "eval_samples_per_second": 18.585, + "eval_steps_per_second": 4.646, "step": 316000 }, { - "epoch": 1.59, - "learning_rate": 6.0853333064259795e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017712847444534591, + "loss": 0.013, "step": 316010 }, { - "epoch": 1.59, - "learning_rate": 6.084576537124578e-05, - "loss": 0.0054, + "epoch": 0.82, + "learning_rate": 0.00017712458622897446, + "loss": 0.0178, "step": 316020 }, { - "epoch": 1.59, - "learning_rate": 6.083819767823178e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017712069801260297, + "loss": 0.0121, "step": 316030 }, { - "epoch": 1.59, - "learning_rate": 6.0830629985217766e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017711680979623154, + "loss": 0.0131, "step": 316040 }, { - "epoch": 1.59, - "learning_rate": 6.0823062292203754e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017711292157986008, + "loss": 0.0146, "step": 316050 }, { - "epoch": 1.59, - "learning_rate": 6.081549459918974e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.0001771090333634886, + "loss": 0.0149, "step": 316060 }, { - "epoch": 1.59, - "learning_rate": 6.080792690617574e-05, - "loss": 0.0049, + "epoch": 0.82, + "learning_rate": 0.0001771051451471171, + "loss": 0.0115, "step": 316070 }, { - "epoch": 1.59, - "learning_rate": 6.0800359213161726e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017710125693074568, + "loss": 0.015, "step": 316080 }, { - "epoch": 1.59, - "learning_rate": 6.0792791520147714e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017709736871437422, + "loss": 0.0108, "step": 316090 }, { - "epoch": 1.59, - "learning_rate": 6.078522382713371e-05, - "loss": 0.0048, + "epoch": 0.82, + "learning_rate": 0.00017709348049800273, + "loss": 0.0124, "step": 316100 }, { - "epoch": 1.59, - "learning_rate": 6.07776561341197e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017708959228163128, + "loss": 0.0129, "step": 316110 }, { - "epoch": 1.59, - "learning_rate": 6.0770088441105685e-05, - "loss": 0.0096, + "epoch": 0.82, + "learning_rate": 0.0001770857040652598, + "loss": 0.0163, "step": 316120 }, { - "epoch": 1.59, - "learning_rate": 6.0762520748091674e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017708181584888836, + "loss": 0.0168, "step": 316130 }, { - "epoch": 1.59, - "learning_rate": 6.075495305507767e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017707792763251687, + "loss": 0.012, "step": 316140 }, { - "epoch": 1.6, - "learning_rate": 6.074738536206366e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017707403941614542, + "loss": 0.0163, "step": 316150 }, { - "epoch": 1.6, - "learning_rate": 6.0739817669049645e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017707015119977393, + "loss": 0.0102, "step": 316160 }, { - "epoch": 1.6, - "learning_rate": 6.073224997603563e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001770662629834025, + "loss": 0.0148, "step": 316170 }, { - "epoch": 1.6, - "learning_rate": 6.072468228302163e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017706237476703101, + "loss": 0.0139, "step": 316180 }, { - "epoch": 1.6, - "learning_rate": 6.0717114590007616e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017705848655065956, + "loss": 0.0146, "step": 316190 }, { - "epoch": 1.6, - "learning_rate": 6.0709546896993605e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017705459833428807, + "loss": 0.0144, "step": 316200 }, { - "epoch": 1.6, - "learning_rate": 6.070197920397959e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017705071011791664, + "loss": 0.0163, "step": 316210 }, { - "epoch": 1.6, - "learning_rate": 6.069441151096559e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017704682190154515, + "loss": 0.0133, "step": 316220 }, { - "epoch": 1.6, - "learning_rate": 6.0686843817951576e-05, - "loss": 0.0047, + "epoch": 0.82, + "learning_rate": 0.0001770429336851737, + "loss": 0.0153, "step": 316230 }, { - "epoch": 1.6, - "learning_rate": 6.0679276124937564e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.0001770390454688022, + "loss": 0.0104, "step": 316240 }, { - "epoch": 1.6, - "learning_rate": 6.067170843192355e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017703515725243078, + "loss": 0.0142, "step": 316250 }, { - "epoch": 1.6, - "learning_rate": 6.066414073890955e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017703126903605932, + "loss": 0.0105, "step": 316260 }, { - "epoch": 1.6, - "learning_rate": 6.065657304589553e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017702738081968783, + "loss": 0.0126, "step": 316270 }, { - "epoch": 1.6, - "learning_rate": 6.064900535288152e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017702349260331638, + "loss": 0.0146, "step": 316280 }, { - "epoch": 1.6, - "learning_rate": 6.0641437659867505e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017701960438694492, + "loss": 0.0129, "step": 316290 }, { - "epoch": 1.6, - "learning_rate": 6.0633869966853494e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017701571617057346, + "loss": 0.0147, "step": 316300 }, { - "epoch": 1.6, - "learning_rate": 6.062630227383949e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017701182795420197, + "loss": 0.0139, "step": 316310 }, { - "epoch": 1.6, - "learning_rate": 6.061873458082548e-05, - "loss": 0.0085, + "epoch": 0.82, + "learning_rate": 0.00017700793973783052, + "loss": 0.012, "step": 316320 }, { - "epoch": 1.6, - "learning_rate": 6.0611166887811465e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017700405152145906, + "loss": 0.0151, "step": 316330 }, { - "epoch": 1.6, - "learning_rate": 6.060359919479745e-05, - "loss": 0.0051, + "epoch": 0.82, + "learning_rate": 0.0001770001633050876, + "loss": 0.0109, "step": 316340 }, { - "epoch": 1.6, - "learning_rate": 6.059603150178345e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.0001769962750887161, + "loss": 0.013, "step": 316350 }, { - "epoch": 1.6, - "learning_rate": 6.0588463808769436e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017699238687234465, + "loss": 0.0162, "step": 316360 }, { - "epoch": 1.6, - "learning_rate": 6.0580896115755425e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017698849865597317, + "loss": 0.0132, "step": 316370 }, { - "epoch": 1.6, - "learning_rate": 6.057332842274141e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017698461043960174, + "loss": 0.014, "step": 316380 }, { - "epoch": 1.6, - "learning_rate": 6.056576072972741e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017698072222323025, + "loss": 0.0139, "step": 316390 }, { - "epoch": 1.6, - "learning_rate": 6.0558193036713396e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.0001769768340068588, + "loss": 0.0173, "step": 316400 }, { - "epoch": 1.6, - "learning_rate": 6.0550625343699384e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001769729457904873, + "loss": 0.014, "step": 316410 }, { - "epoch": 1.6, - "learning_rate": 6.054305765068537e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017696905757411588, + "loss": 0.0132, "step": 316420 }, { - "epoch": 1.6, - "learning_rate": 6.053548995767137e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017696516935774442, + "loss": 0.0162, "step": 316430 }, { - "epoch": 1.6, - "learning_rate": 6.0527922264657356e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017696128114137293, + "loss": 0.0122, "step": 316440 }, { - "epoch": 1.6, - "learning_rate": 6.0520354571643344e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017695739292500148, + "loss": 0.0114, "step": 316450 }, { - "epoch": 1.6, - "learning_rate": 6.051278687862933e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017695350470863002, + "loss": 0.0143, "step": 316460 }, { - "epoch": 1.6, - "learning_rate": 6.050521918561533e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.00017694961649225856, + "loss": 0.0139, "step": 316470 }, { - "epoch": 1.6, - "learning_rate": 6.0497651492601315e-05, - "loss": 0.0085, + "epoch": 0.82, + "learning_rate": 0.00017694572827588707, + "loss": 0.0119, "step": 316480 }, { - "epoch": 1.6, - "learning_rate": 6.0490083799587304e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017694184005951561, + "loss": 0.0162, "step": 316490 }, { - "epoch": 1.6, - "learning_rate": 6.048251610657329e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017693795184314416, + "loss": 0.0138, "step": 316500 }, { - "epoch": 1.6, - "learning_rate": 6.047494841355929e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001769340636267727, + "loss": 0.0121, "step": 316510 }, { - "epoch": 1.6, - "learning_rate": 6.0467380720545275e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001769301754104012, + "loss": 0.0099, "step": 316520 }, { - "epoch": 1.6, - "learning_rate": 6.045981302753126e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017692628719402975, + "loss": 0.0122, "step": 316530 }, { - "epoch": 1.6, - "learning_rate": 6.045224533451725e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001769223989776583, + "loss": 0.0146, "step": 316540 }, { - "epoch": 1.6, - "learning_rate": 6.0444677641503247e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017691851076128684, + "loss": 0.0136, "step": 316550 }, { - "epoch": 1.6, - "learning_rate": 6.0437109948489235e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017691462254491535, + "loss": 0.0111, "step": 316560 }, { - "epoch": 1.6, - "learning_rate": 6.042954225547522e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.0001769107343285439, + "loss": 0.0143, "step": 316570 }, { - "epoch": 1.6, - "learning_rate": 6.0421974562461204e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017690684611217246, + "loss": 0.0165, "step": 316580 }, { - "epoch": 1.6, - "learning_rate": 6.04144068694472e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017690295789580098, + "loss": 0.0098, "step": 316590 }, { - "epoch": 1.6, - "learning_rate": 6.040683917643319e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017689906967942952, + "loss": 0.011, "step": 316600 }, { - "epoch": 1.6, - "learning_rate": 6.0399271483419176e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017689518146305803, + "loss": 0.0134, "step": 316610 }, { - "epoch": 1.6, - "learning_rate": 6.0391703790405164e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017689129324668655, + "loss": 0.0126, "step": 316620 }, { - "epoch": 1.6, - "learning_rate": 6.038413609739116e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017688740503031512, + "loss": 0.0166, "step": 316630 }, { - "epoch": 1.6, - "learning_rate": 6.037656840437715e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017688351681394366, + "loss": 0.0123, "step": 316640 }, { - "epoch": 1.6, - "learning_rate": 6.0369000711363135e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017687962859757217, + "loss": 0.0129, "step": 316650 }, { - "epoch": 1.6, - "learning_rate": 6.0361433018349124e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017687574038120071, + "loss": 0.0119, "step": 316660 }, { - "epoch": 1.6, - "learning_rate": 6.035386532533512e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017687185216482926, + "loss": 0.0126, "step": 316670 }, { - "epoch": 1.6, - "learning_rate": 6.034629763232111e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001768679639484578, + "loss": 0.0168, "step": 316680 }, { - "epoch": 1.6, - "learning_rate": 6.0338729939307095e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.0001768640757320863, + "loss": 0.0142, "step": 316690 }, { - "epoch": 1.6, - "learning_rate": 6.033116224629308e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017686018751571485, + "loss": 0.0145, "step": 316700 }, { - "epoch": 1.6, - "learning_rate": 6.032359455327908e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.0001768562992993434, + "loss": 0.0143, "step": 316710 }, { - "epoch": 1.6, - "learning_rate": 6.0316026860265067e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017685241108297194, + "loss": 0.0117, "step": 316720 }, { - "epoch": 1.6, - "learning_rate": 6.0308459167251055e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017684852286660045, + "loss": 0.0137, "step": 316730 }, { - "epoch": 1.6, - "learning_rate": 6.030089147423704e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.000176844634650229, + "loss": 0.0133, "step": 316740 }, { - "epoch": 1.6, - "learning_rate": 6.029332378122304e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017684074643385756, + "loss": 0.0137, "step": 316750 }, { - "epoch": 1.6, - "learning_rate": 6.0285756088209026e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017683685821748608, + "loss": 0.0153, "step": 316760 }, { - "epoch": 1.6, - "learning_rate": 6.0278188395195014e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017683297000111462, + "loss": 0.0179, "step": 316770 }, { - "epoch": 1.6, - "learning_rate": 6.0270620702181e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017682908178474313, + "loss": 0.017, "step": 316780 }, { - "epoch": 1.6, - "learning_rate": 6.0263053009167e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.0001768251935683717, + "loss": 0.0151, "step": 316790 }, { - "epoch": 1.6, - "learning_rate": 6.0255485316152986e-05, - "loss": 0.0097, + "epoch": 0.82, + "learning_rate": 0.00017682130535200022, + "loss": 0.0135, "step": 316800 }, { - "epoch": 1.6, - "learning_rate": 6.0247917623138974e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017681741713562876, + "loss": 0.0126, "step": 316810 }, { - "epoch": 1.6, - "learning_rate": 6.024034993012496e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017681352891925727, + "loss": 0.015, "step": 316820 }, { - "epoch": 1.6, - "learning_rate": 6.023278223711096e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017680964070288584, + "loss": 0.0132, "step": 316830 }, { - "epoch": 1.6, - "learning_rate": 6.0225214544096946e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017680575248651436, + "loss": 0.0125, "step": 316840 }, { - "epoch": 1.6, - "learning_rate": 6.0217646851082934e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.0001768018642701429, + "loss": 0.0121, "step": 316850 }, { - "epoch": 1.6, - "learning_rate": 6.021007915806892e-05, - "loss": 0.0082, + "epoch": 0.82, + "learning_rate": 0.0001767979760537714, + "loss": 0.0142, "step": 316860 }, { - "epoch": 1.6, - "learning_rate": 6.020251146505492e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017679408783739995, + "loss": 0.0163, "step": 316870 }, { - "epoch": 1.6, - "learning_rate": 6.0194943772040905e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001767901996210285, + "loss": 0.0156, "step": 316880 }, { - "epoch": 1.6, - "learning_rate": 6.018737607902689e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017678631140465704, + "loss": 0.0104, "step": 316890 }, { - "epoch": 1.6, - "learning_rate": 6.0179808386012875e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017678242318828555, + "loss": 0.0174, "step": 316900 }, { - "epoch": 1.6, - "learning_rate": 6.017224069299886e-05, - "loss": 0.0055, + "epoch": 0.82, + "learning_rate": 0.0001767785349719141, + "loss": 0.0136, "step": 316910 }, { - "epoch": 1.6, - "learning_rate": 6.016467299998486e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017677464675554266, + "loss": 0.0135, "step": 316920 }, { - "epoch": 1.6, - "learning_rate": 6.0157105306970846e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017677075853917118, + "loss": 0.0128, "step": 316930 }, { - "epoch": 1.6, - "learning_rate": 6.0149537613956834e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.0001767668703227997, + "loss": 0.0097, "step": 316940 }, { - "epoch": 1.6, - "learning_rate": 6.014196992094282e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017676298210642823, + "loss": 0.0147, "step": 316950 }, { - "epoch": 1.6, - "learning_rate": 6.013440222792882e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.0001767590938900568, + "loss": 0.0149, "step": 316960 }, { - "epoch": 1.6, - "learning_rate": 6.0126834534914806e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017675520567368532, + "loss": 0.0153, "step": 316970 }, { - "epoch": 1.6, - "learning_rate": 6.0119266841900794e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017675131745731386, + "loss": 0.0146, "step": 316980 }, { - "epoch": 1.6, - "learning_rate": 6.011169914888678e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017674742924094237, + "loss": 0.0154, "step": 316990 }, { - "epoch": 1.6, - "learning_rate": 6.010413145587278e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017674354102457094, + "loss": 0.0141, "step": 317000 }, { - "epoch": 1.6, - "eval_cer": 0.9144518183767796, - "eval_loss": 0.005164159927517176, - "eval_runtime": 116.3465, - "eval_samples_per_second": 17.19, - "eval_steps_per_second": 4.298, + "epoch": 0.82, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.01099375169724226, + "eval_runtime": 107.5512, + "eval_samples_per_second": 18.596, + "eval_steps_per_second": 4.649, "step": 317000 }, { - "epoch": 1.6, - "learning_rate": 6.0096563762858766e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017673965280819945, + "loss": 0.0143, "step": 317010 }, { - "epoch": 1.6, - "learning_rate": 6.0088996069844754e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.000176735764591828, + "loss": 0.018, "step": 317020 }, { - "epoch": 1.6, - "learning_rate": 6.008142837683074e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.0001767318763754565, + "loss": 0.0141, "step": 317030 }, { - "epoch": 1.6, - "learning_rate": 6.007386068381674e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.00017672798815908508, + "loss": 0.0152, "step": 317040 }, { - "epoch": 1.6, - "learning_rate": 6.0066292990802725e-05, - "loss": 0.0097, + "epoch": 0.82, + "learning_rate": 0.0001767240999427136, + "loss": 0.0138, "step": 317050 }, { - "epoch": 1.6, - "learning_rate": 6.0058725297788713e-05, - "loss": 0.0098, + "epoch": 0.82, + "learning_rate": 0.00017672021172634214, + "loss": 0.0121, "step": 317060 }, { - "epoch": 1.6, - "learning_rate": 6.005115760477471e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017671632350997065, + "loss": 0.0165, "step": 317070 }, { - "epoch": 1.6, - "learning_rate": 6.00435899117607e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.00017671243529359922, + "loss": 0.012, "step": 317080 }, { - "epoch": 1.6, - "learning_rate": 6.0036022218746685e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017670854707722773, + "loss": 0.0127, "step": 317090 }, { - "epoch": 1.6, - "learning_rate": 6.002845452573267e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.00017670465886085628, + "loss": 0.0193, "step": 317100 }, { - "epoch": 1.6, - "learning_rate": 6.002088683271867e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001767007706444848, + "loss": 0.0172, "step": 317110 }, { - "epoch": 1.6, - "learning_rate": 6.0013319139704656e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017669688242811333, + "loss": 0.0152, "step": 317120 }, { - "epoch": 1.6, - "learning_rate": 6.0005751446690645e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001766929942117419, + "loss": 0.0121, "step": 317130 }, { - "epoch": 1.6, - "learning_rate": 5.999818375367663e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017668910599537041, + "loss": 0.0119, "step": 317140 }, { - "epoch": 1.6, - "learning_rate": 5.999061606066263e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.00017668521777899896, + "loss": 0.0105, "step": 317150 }, { - "epoch": 1.6, - "learning_rate": 5.9983048367648616e-05, - "loss": 0.0064, + "epoch": 0.82, + "learning_rate": 0.00017668132956262747, + "loss": 0.0123, "step": 317160 }, { - "epoch": 1.6, - "learning_rate": 5.9975480674634604e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017667744134625604, + "loss": 0.0144, "step": 317170 }, { - "epoch": 1.6, - "learning_rate": 5.996791298162059e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017667355312988455, + "loss": 0.0126, "step": 317180 }, { - "epoch": 1.6, - "learning_rate": 5.996034528860659e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001766696649135131, + "loss": 0.013, "step": 317190 }, { - "epoch": 1.6, - "learning_rate": 5.9952777595592576e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.0001766657766971416, + "loss": 0.0163, "step": 317200 }, { - "epoch": 1.6, - "learning_rate": 5.994520990257856e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017666188848077018, + "loss": 0.0148, "step": 317210 }, { - "epoch": 1.6, - "learning_rate": 5.9937642209564545e-05, - "loss": 0.0053, + "epoch": 0.82, + "learning_rate": 0.0001766580002643987, + "loss": 0.0112, "step": 317220 }, { - "epoch": 1.6, - "learning_rate": 5.9930074516550533e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.00017665411204802724, + "loss": 0.0181, "step": 317230 }, { - "epoch": 1.6, - "learning_rate": 5.992250682353653e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017665022383165575, + "loss": 0.0109, "step": 317240 }, { - "epoch": 1.6, - "learning_rate": 5.991493913052252e-05, - "loss": 0.0077, + "epoch": 0.82, + "learning_rate": 0.00017664633561528432, + "loss": 0.014, "step": 317250 }, { - "epoch": 1.6, - "learning_rate": 5.9907371437508505e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.00017664244739891283, + "loss": 0.013, "step": 317260 }, { - "epoch": 1.6, - "learning_rate": 5.989980374449449e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017663855918254137, + "loss": 0.0206, "step": 317270 }, { - "epoch": 1.6, - "learning_rate": 5.989223605148049e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.0001766346709661699, + "loss": 0.0145, "step": 317280 }, { - "epoch": 1.6, - "learning_rate": 5.9884668358466476e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017663078274979846, + "loss": 0.0149, "step": 317290 }, { - "epoch": 1.6, - "learning_rate": 5.9877100665452465e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.000176626894533427, + "loss": 0.0112, "step": 317300 }, { - "epoch": 1.6, - "learning_rate": 5.986953297243845e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017662300631705551, + "loss": 0.0133, "step": 317310 }, { - "epoch": 1.6, - "learning_rate": 5.986196527942445e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017661911810068406, + "loss": 0.0176, "step": 317320 }, { - "epoch": 1.6, - "learning_rate": 5.9854397586410436e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017661522988431257, + "loss": 0.0102, "step": 317330 }, { - "epoch": 1.6, - "learning_rate": 5.9846829893396424e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017661134166794114, + "loss": 0.0123, "step": 317340 }, { - "epoch": 1.6, - "learning_rate": 5.983926220038241e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017660745345156965, + "loss": 0.0146, "step": 317350 }, { - "epoch": 1.6, - "learning_rate": 5.983169450736841e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001766035652351982, + "loss": 0.015, "step": 317360 }, { - "epoch": 1.6, - "learning_rate": 5.9824126814354396e-05, - "loss": 0.0066, + "epoch": 0.82, + "learning_rate": 0.0001765996770188267, + "loss": 0.0131, "step": 317370 }, { - "epoch": 1.6, - "learning_rate": 5.9816559121340384e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017659578880245528, + "loss": 0.0112, "step": 317380 }, { - "epoch": 1.6, - "learning_rate": 5.980899142832637e-05, - "loss": 0.0079, + "epoch": 0.82, + "learning_rate": 0.0001765919005860838, + "loss": 0.0133, "step": 317390 }, { - "epoch": 1.6, - "learning_rate": 5.980142373531237e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017658801236971233, + "loss": 0.0127, "step": 317400 }, { - "epoch": 1.6, - "learning_rate": 5.9793856042298355e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017658412415334085, + "loss": 0.014, "step": 317410 }, { - "epoch": 1.6, - "learning_rate": 5.9786288349284344e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017658023593696942, + "loss": 0.0114, "step": 317420 }, { - "epoch": 1.6, - "learning_rate": 5.977872065627033e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.00017657634772059793, + "loss": 0.0117, "step": 317430 }, { - "epoch": 1.6, - "learning_rate": 5.977115296325633e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017657245950422647, + "loss": 0.0116, "step": 317440 }, { - "epoch": 1.6, - "learning_rate": 5.9763585270242315e-05, - "loss": 0.0078, + "epoch": 0.82, + "learning_rate": 0.000176568571287855, + "loss": 0.0131, "step": 317450 }, { - "epoch": 1.6, - "learning_rate": 5.97560175772283e-05, - "loss": 0.0063, + "epoch": 0.82, + "learning_rate": 0.00017656468307148356, + "loss": 0.014, "step": 317460 }, { - "epoch": 1.6, - "learning_rate": 5.974844988421429e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001765607948551121, + "loss": 0.014, "step": 317470 }, { - "epoch": 1.6, - "learning_rate": 5.9740882191200286e-05, - "loss": 0.0093, + "epoch": 0.82, + "learning_rate": 0.0001765569066387406, + "loss": 0.0124, "step": 317480 }, { - "epoch": 1.6, - "learning_rate": 5.9733314498186275e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.00017655301842236913, + "loss": 0.0158, "step": 317490 }, { - "epoch": 1.6, - "learning_rate": 5.972574680517226e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001765491302059977, + "loss": 0.0144, "step": 317500 }, { - "epoch": 1.6, - "learning_rate": 5.971817911215825e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017654524198962624, + "loss": 0.0129, "step": 317510 }, { - "epoch": 1.6, - "learning_rate": 5.9710611419144246e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017654135377325475, + "loss": 0.0141, "step": 317520 }, { - "epoch": 1.6, - "learning_rate": 5.970304372613023e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.0001765374655568833, + "loss": 0.0133, "step": 317530 }, { - "epoch": 1.6, - "learning_rate": 5.9695476033116216e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017653357734051184, + "loss": 0.0134, "step": 317540 }, { - "epoch": 1.6, - "learning_rate": 5.9687908340102204e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017652968912414038, + "loss": 0.0126, "step": 317550 }, { - "epoch": 1.6, - "learning_rate": 5.96803406470882e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.0001765258009077689, + "loss": 0.0134, "step": 317560 }, { - "epoch": 1.6, - "learning_rate": 5.967277295407419e-05, - "loss": 0.0102, + "epoch": 0.82, + "learning_rate": 0.00017652191269139743, + "loss": 0.0165, "step": 317570 }, { - "epoch": 1.6, - "learning_rate": 5.9665205261060175e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.00017651802447502595, + "loss": 0.0109, "step": 317580 }, { - "epoch": 1.6, - "learning_rate": 5.9657637568046164e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017651413625865452, + "loss": 0.0116, "step": 317590 }, { - "epoch": 1.6, - "learning_rate": 5.965006987503216e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017651024804228303, + "loss": 0.0182, "step": 317600 }, { - "epoch": 1.6, - "learning_rate": 5.964250218201815e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017650635982591157, + "loss": 0.0141, "step": 317610 }, { - "epoch": 1.6, - "learning_rate": 5.9634934489004135e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.0001765024716095401, + "loss": 0.0139, "step": 317620 }, { - "epoch": 1.6, - "learning_rate": 5.962736679599012e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017649858339316866, + "loss": 0.0107, "step": 317630 }, { - "epoch": 1.6, - "learning_rate": 5.961979910297612e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001764946951767972, + "loss": 0.01, "step": 317640 }, { - "epoch": 1.6, - "learning_rate": 5.9612231409962106e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001764908069604257, + "loss": 0.0103, "step": 317650 }, { - "epoch": 1.6, - "learning_rate": 5.9604663716948095e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017648691874405423, + "loss": 0.0131, "step": 317660 }, { - "epoch": 1.6, - "learning_rate": 5.959709602393408e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.0001764830305276828, + "loss": 0.0152, "step": 317670 }, { - "epoch": 1.6, - "learning_rate": 5.958952833092008e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017647914231131134, + "loss": 0.0111, "step": 317680 }, { - "epoch": 1.6, - "learning_rate": 5.9581960637906066e-05, - "loss": 0.0072, + "epoch": 0.82, + "learning_rate": 0.00017647525409493985, + "loss": 0.0143, "step": 317690 }, { - "epoch": 1.6, - "learning_rate": 5.9574392944892054e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001764713658785684, + "loss": 0.0127, "step": 317700 }, { - "epoch": 1.6, - "learning_rate": 5.956682525187804e-05, - "loss": 0.0089, + "epoch": 0.82, + "learning_rate": 0.00017646747766219694, + "loss": 0.015, "step": 317710 }, { - "epoch": 1.6, - "learning_rate": 5.955925755886404e-05, - "loss": 0.0069, + "epoch": 0.82, + "learning_rate": 0.00017646358944582548, + "loss": 0.0153, "step": 317720 }, { - "epoch": 1.6, - "learning_rate": 5.9551689865850026e-05, - "loss": 0.008, + "epoch": 0.82, + "learning_rate": 0.000176459701229454, + "loss": 0.0129, "step": 317730 }, { - "epoch": 1.6, - "learning_rate": 5.9544122172836014e-05, - "loss": 0.0074, + "epoch": 0.82, + "learning_rate": 0.00017645581301308253, + "loss": 0.0121, "step": 317740 }, { - "epoch": 1.6, - "learning_rate": 5.9536554479822e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017645192479671107, + "loss": 0.018, "step": 317750 }, { - "epoch": 1.6, - "learning_rate": 5.9528986786808e-05, - "loss": 0.0089, + "epoch": 0.82, + "learning_rate": 0.00017644803658033962, + "loss": 0.014, "step": 317760 }, { - "epoch": 1.6, - "learning_rate": 5.9521419093793985e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.00017644414836396813, + "loss": 0.0106, "step": 317770 }, { - "epoch": 1.6, - "learning_rate": 5.9513851400779974e-05, - "loss": 0.009, + "epoch": 0.82, + "learning_rate": 0.00017644026014759667, + "loss": 0.0113, "step": 317780 }, { - "epoch": 1.6, - "learning_rate": 5.950628370776596e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017643637193122524, + "loss": 0.0113, "step": 317790 }, { - "epoch": 1.6, - "learning_rate": 5.949871601475196e-05, - "loss": 0.0056, + "epoch": 0.82, + "learning_rate": 0.00017643248371485376, + "loss": 0.014, "step": 317800 }, { - "epoch": 1.6, - "learning_rate": 5.9491148321737945e-05, - "loss": 0.007, + "epoch": 0.82, + "learning_rate": 0.00017642859549848227, + "loss": 0.014, "step": 317810 }, { - "epoch": 1.6, - "learning_rate": 5.948358062872393e-05, - "loss": 0.0084, + "epoch": 0.82, + "learning_rate": 0.0001764247072821108, + "loss": 0.0108, "step": 317820 }, { - "epoch": 1.6, - "learning_rate": 5.947601293570992e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017642081906573933, + "loss": 0.0164, "step": 317830 }, { - "epoch": 1.6, - "learning_rate": 5.94684452426959e-05, - "loss": 0.0069, - "step": 317840 + "epoch": 0.82, + "learning_rate": 0.0001764169308493679, + "loss": 0.0122, + "step": 317840 }, { - "epoch": 1.6, - "learning_rate": 5.94608775496819e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.00017641304263299644, + "loss": 0.0134, "step": 317850 }, { - "epoch": 1.6, - "learning_rate": 5.9453309856667886e-05, - "loss": 0.0088, + "epoch": 0.82, + "learning_rate": 0.00017640915441662495, + "loss": 0.0125, "step": 317860 }, { - "epoch": 1.6, - "learning_rate": 5.9445742163653874e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.0001764052662002535, + "loss": 0.0133, "step": 317870 }, { - "epoch": 1.6, - "learning_rate": 5.943817447063986e-05, - "loss": 0.005, + "epoch": 0.82, + "learning_rate": 0.00017640137798388203, + "loss": 0.0123, "step": 317880 }, { - "epoch": 1.6, - "learning_rate": 5.943060677762586e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017639748976751058, + "loss": 0.0142, "step": 317890 }, { - "epoch": 1.6, - "learning_rate": 5.9423039084611846e-05, - "loss": 0.0062, + "epoch": 0.82, + "learning_rate": 0.0001763936015511391, + "loss": 0.0137, "step": 317900 }, { - "epoch": 1.6, - "learning_rate": 5.9415471391597834e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017638971333476763, + "loss": 0.0142, "step": 317910 }, { - "epoch": 1.6, - "learning_rate": 5.940790369858382e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017638582511839617, + "loss": 0.0102, "step": 317920 }, { - "epoch": 1.6, - "learning_rate": 5.940033600556982e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017638193690202472, + "loss": 0.0125, "step": 317930 }, { - "epoch": 1.6, - "learning_rate": 5.9392768312555805e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017637804868565323, + "loss": 0.0113, "step": 317940 }, { - "epoch": 1.6, - "learning_rate": 5.9385200619541794e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017637416046928177, + "loss": 0.0129, "step": 317950 }, { - "epoch": 1.6, - "learning_rate": 5.937763292652778e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017637027225291034, + "loss": 0.0126, "step": 317960 }, { - "epoch": 1.6, - "learning_rate": 5.937006523351378e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.00017636638403653886, + "loss": 0.0128, "step": 317970 }, { - "epoch": 1.6, - "learning_rate": 5.9362497540499765e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017636249582016737, + "loss": 0.0114, "step": 317980 }, { - "epoch": 1.6, - "learning_rate": 5.935492984748575e-05, - "loss": 0.0076, + "epoch": 0.82, + "learning_rate": 0.0001763586076037959, + "loss": 0.0232, "step": 317990 }, { - "epoch": 1.6, - "learning_rate": 5.934736215447174e-05, - "loss": 0.0051, + "epoch": 0.82, + "learning_rate": 0.00017635471938742448, + "loss": 0.023, "step": 318000 }, { - "epoch": 1.6, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.005206539761275053, - "eval_runtime": 116.4709, - "eval_samples_per_second": 17.172, - "eval_steps_per_second": 4.293, + "epoch": 0.82, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.009950380772352219, + "eval_runtime": 107.6438, + "eval_samples_per_second": 18.58, + "eval_steps_per_second": 4.645, "step": 318000 }, { - "epoch": 1.6, - "learning_rate": 5.9339794461457737e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.000176350831171053, + "loss": 0.0163, "step": 318010 }, { - "epoch": 1.6, - "learning_rate": 5.9332226768443725e-05, - "loss": 0.0096, + "epoch": 0.82, + "learning_rate": 0.00017634694295468154, + "loss": 0.015, "step": 318020 }, { - "epoch": 1.6, - "learning_rate": 5.932465907542971e-05, - "loss": 0.0058, + "epoch": 0.82, + "learning_rate": 0.00017634305473831005, + "loss": 0.015, "step": 318030 }, { - "epoch": 1.6, - "learning_rate": 5.931709138241571e-05, - "loss": 0.0061, + "epoch": 0.82, + "learning_rate": 0.00017633916652193862, + "loss": 0.0161, "step": 318040 }, { - "epoch": 1.6, - "learning_rate": 5.9309523689401696e-05, - "loss": 0.0083, + "epoch": 0.82, + "learning_rate": 0.00017633527830556713, + "loss": 0.0122, "step": 318050 }, { - "epoch": 1.6, - "learning_rate": 5.9301955996387684e-05, - "loss": 0.006, + "epoch": 0.82, + "learning_rate": 0.00017633139008919568, + "loss": 0.0197, "step": 318060 }, { - "epoch": 1.6, - "learning_rate": 5.929438830337367e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001763275018728242, + "loss": 0.0125, "step": 318070 }, { - "epoch": 1.6, - "learning_rate": 5.928682061035967e-05, - "loss": 0.0052, + "epoch": 0.82, + "learning_rate": 0.00017632361365645273, + "loss": 0.0186, "step": 318080 }, { - "epoch": 1.6, - "learning_rate": 5.9279252917345656e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017631972544008127, + "loss": 0.0187, "step": 318090 }, { - "epoch": 1.6, - "learning_rate": 5.9271685224331644e-05, - "loss": 0.0057, + "epoch": 0.82, + "learning_rate": 0.00017631583722370982, + "loss": 0.0159, "step": 318100 }, { - "epoch": 1.6, - "learning_rate": 5.926411753131763e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017631194900733833, + "loss": 0.0142, "step": 318110 }, { - "epoch": 1.6, - "learning_rate": 5.925654983830363e-05, - "loss": 0.0067, + "epoch": 0.82, + "learning_rate": 0.00017630806079096687, + "loss": 0.0187, "step": 318120 }, { - "epoch": 1.6, - "learning_rate": 5.9248982145289615e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.0001763041725745954, + "loss": 0.0112, "step": 318130 }, { - "epoch": 1.61, - "learning_rate": 5.9241414452275604e-05, - "loss": 0.0093, + "epoch": 0.82, + "learning_rate": 0.00017630028435822395, + "loss": 0.0127, "step": 318140 }, { - "epoch": 1.61, - "learning_rate": 5.9233846759261585e-05, - "loss": 0.0101, + "epoch": 0.82, + "learning_rate": 0.00017629639614185247, + "loss": 0.0134, "step": 318150 }, { - "epoch": 1.61, - "learning_rate": 5.922627906624757e-05, - "loss": 0.0071, + "epoch": 0.82, + "learning_rate": 0.000176292507925481, + "loss": 0.01, "step": 318160 }, { - "epoch": 1.61, - "learning_rate": 5.921871137323357e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017628861970910958, + "loss": 0.0115, "step": 318170 }, { - "epoch": 1.61, - "learning_rate": 5.9211143680219557e-05, - "loss": 0.0075, + "epoch": 0.82, + "learning_rate": 0.0001762847314927381, + "loss": 0.0131, "step": 318180 }, { - "epoch": 1.61, - "learning_rate": 5.9203575987205545e-05, - "loss": 0.0091, + "epoch": 0.82, + "learning_rate": 0.00017628084327636664, + "loss": 0.0139, "step": 318190 }, { - "epoch": 1.61, - "learning_rate": 5.919600829419153e-05, - "loss": 0.0086, + "epoch": 0.82, + "learning_rate": 0.00017627695505999515, + "loss": 0.0145, "step": 318200 }, { - "epoch": 1.61, - "learning_rate": 5.918844060117753e-05, - "loss": 0.0073, + "epoch": 0.82, + "learning_rate": 0.00017627306684362372, + "loss": 0.0122, "step": 318210 }, { - "epoch": 1.61, - "learning_rate": 5.9180872908163516e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017626917862725223, + "loss": 0.0124, "step": 318220 }, { - "epoch": 1.61, - "learning_rate": 5.9173305215149504e-05, - "loss": 0.0087, + "epoch": 0.82, + "learning_rate": 0.00017626529041088078, + "loss": 0.0101, "step": 318230 }, { - "epoch": 1.61, - "learning_rate": 5.916573752213549e-05, - "loss": 0.0068, + "epoch": 0.82, + "learning_rate": 0.0001762614021945093, + "loss": 0.0112, "step": 318240 }, { - "epoch": 1.61, - "learning_rate": 5.915816982912149e-05, - "loss": 0.0059, + "epoch": 0.82, + "learning_rate": 0.00017625751397813786, + "loss": 0.0157, "step": 318250 }, { - "epoch": 1.61, - "learning_rate": 5.9150602136107476e-05, - "loss": 0.0065, + "epoch": 0.82, + "learning_rate": 0.00017625362576176637, + "loss": 0.0183, "step": 318260 }, { - "epoch": 1.61, - "learning_rate": 5.9143034443093464e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017624973754539491, + "loss": 0.0134, "step": 318270 }, { - "epoch": 1.61, - "learning_rate": 5.913546675007945e-05, - "loss": 0.005, + "epoch": 0.83, + "learning_rate": 0.00017624584932902343, + "loss": 0.0103, "step": 318280 }, { - "epoch": 1.61, - "learning_rate": 5.912789905706545e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.000176241961112652, + "loss": 0.0175, "step": 318290 }, { - "epoch": 1.61, - "learning_rate": 5.9120331364051436e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.0001762380728962805, + "loss": 0.0145, "step": 318300 }, { - "epoch": 1.61, - "learning_rate": 5.9112763671037424e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017623418467990905, + "loss": 0.0223, "step": 318310 }, { - "epoch": 1.61, - "learning_rate": 5.910519597802341e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017623029646353757, + "loss": 0.0132, "step": 318320 }, { - "epoch": 1.61, - "learning_rate": 5.909762828500941e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.0001762264082471661, + "loss": 0.0121, "step": 318330 }, { - "epoch": 1.61, - "learning_rate": 5.9090060591995395e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017622252003079468, + "loss": 0.0164, "step": 318340 }, { - "epoch": 1.61, - "learning_rate": 5.908249289898138e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001762186318144232, + "loss": 0.0151, "step": 318350 }, { - "epoch": 1.61, - "learning_rate": 5.907492520596737e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017621474359805174, + "loss": 0.0146, "step": 318360 }, { - "epoch": 1.61, - "learning_rate": 5.9067357512953367e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017621085538168025, + "loss": 0.0164, "step": 318370 }, { - "epoch": 1.61, - "learning_rate": 5.9059789819939355e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.00017620696716530882, + "loss": 0.0139, "step": 318380 }, { - "epoch": 1.61, - "learning_rate": 5.905222212692534e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017620307894893733, + "loss": 0.0172, "step": 318390 }, { - "epoch": 1.61, - "learning_rate": 5.904465443391133e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017619919073256587, + "loss": 0.0146, "step": 318400 }, { - "epoch": 1.61, - "learning_rate": 5.9037086740897326e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001761953025161944, + "loss": 0.0143, "step": 318410 }, { - "epoch": 1.61, - "learning_rate": 5.9029519047883314e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017619141429982296, + "loss": 0.0137, "step": 318420 }, { - "epoch": 1.61, - "learning_rate": 5.90219513548693e-05, - "loss": 0.0088, + "epoch": 0.83, + "learning_rate": 0.00017618752608345147, + "loss": 0.0153, "step": 318430 }, { - "epoch": 1.61, - "learning_rate": 5.901438366185529e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017618363786708001, + "loss": 0.0123, "step": 318440 }, { - "epoch": 1.61, - "learning_rate": 5.9006815968841286e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017617974965070853, + "loss": 0.0142, "step": 318450 }, { - "epoch": 1.61, - "learning_rate": 5.8999248275827274e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.0001761758614343371, + "loss": 0.0111, "step": 318460 }, { - "epoch": 1.61, - "learning_rate": 5.8991680582813256e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.0001761719732179656, + "loss": 0.0108, "step": 318470 }, { - "epoch": 1.61, - "learning_rate": 5.8984112889799244e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017616808500159415, + "loss": 0.0167, "step": 318480 }, { - "epoch": 1.61, - "learning_rate": 5.897654519678523e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017616419678522267, + "loss": 0.0114, "step": 318490 }, { - "epoch": 1.61, - "learning_rate": 5.896897750377123e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017616030856885124, + "loss": 0.0136, "step": 318500 }, { - "epoch": 1.61, - "learning_rate": 5.8961409810757215e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017615642035247978, + "loss": 0.0144, "step": 318510 }, { - "epoch": 1.61, - "learning_rate": 5.8953842117743203e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001761525321361083, + "loss": 0.0148, "step": 318520 }, { - "epoch": 1.61, - "learning_rate": 5.89462744247292e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001761486439197368, + "loss": 0.0124, "step": 318530 }, { - "epoch": 1.61, - "learning_rate": 5.893870673171519e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017614475570336538, + "loss": 0.0134, "step": 318540 }, { - "epoch": 1.61, - "learning_rate": 5.8931139038701175e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017614086748699392, + "loss": 0.0136, "step": 318550 }, { - "epoch": 1.61, - "learning_rate": 5.892357134568716e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017613697927062243, + "loss": 0.0149, "step": 318560 }, { - "epoch": 1.61, - "learning_rate": 5.891600365267316e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017613309105425097, + "loss": 0.015, "step": 318570 }, { - "epoch": 1.61, - "learning_rate": 5.8908435959659146e-05, - "loss": 0.0098, + "epoch": 0.83, + "learning_rate": 0.0001761292028378795, + "loss": 0.0127, "step": 318580 }, { - "epoch": 1.61, - "learning_rate": 5.8900868266645135e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017612531462150806, + "loss": 0.0163, "step": 318590 }, { - "epoch": 1.61, - "learning_rate": 5.889330057363112e-05, - "loss": 0.0039, + "epoch": 0.83, + "learning_rate": 0.00017612142640513657, + "loss": 0.0135, "step": 318600 }, { - "epoch": 1.61, - "learning_rate": 5.888573288061712e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017611753818876511, + "loss": 0.0157, "step": 318610 }, { - "epoch": 1.61, - "learning_rate": 5.8878165187603106e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017611364997239363, + "loss": 0.0131, "step": 318620 }, { - "epoch": 1.61, - "learning_rate": 5.8870597494589094e-05, - "loss": 0.0049, + "epoch": 0.83, + "learning_rate": 0.0001761097617560222, + "loss": 0.0132, "step": 318630 }, { - "epoch": 1.61, - "learning_rate": 5.886302980157508e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001761058735396507, + "loss": 0.0159, "step": 318640 }, { - "epoch": 1.61, - "learning_rate": 5.885546210856108e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017610198532327925, + "loss": 0.0137, "step": 318650 }, { - "epoch": 1.61, - "learning_rate": 5.8847894415547066e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017609809710690777, + "loss": 0.0133, "step": 318660 }, { - "epoch": 1.61, - "learning_rate": 5.8840326722533054e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017609420889053634, + "loss": 0.0124, "step": 318670 }, { - "epoch": 1.61, - "learning_rate": 5.883275902951904e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017609032067416485, + "loss": 0.0139, "step": 318680 }, { - "epoch": 1.61, - "learning_rate": 5.882519133650504e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.0001760864324577934, + "loss": 0.0115, "step": 318690 }, { - "epoch": 1.61, - "learning_rate": 5.8817623643491025e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.0001760825442414219, + "loss": 0.0119, "step": 318700 }, { - "epoch": 1.61, - "learning_rate": 5.8810055950477013e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017607865602505048, + "loss": 0.0116, "step": 318710 }, { - "epoch": 1.61, - "learning_rate": 5.8802488257463e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017607476780867902, + "loss": 0.0159, "step": 318720 }, { - "epoch": 1.61, - "learning_rate": 5.8794920564449e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017607087959230753, + "loss": 0.0117, "step": 318730 }, { - "epoch": 1.61, - "learning_rate": 5.8787352871434985e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017606699137593607, + "loss": 0.014, "step": 318740 }, { - "epoch": 1.61, - "learning_rate": 5.877978517842097e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017606310315956462, + "loss": 0.0121, "step": 318750 }, { - "epoch": 1.61, - "learning_rate": 5.877221748540696e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017605921494319316, + "loss": 0.0124, "step": 318760 }, { - "epoch": 1.61, - "learning_rate": 5.8764649792392956e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017605532672682167, + "loss": 0.0152, "step": 318770 }, { - "epoch": 1.61, - "learning_rate": 5.875708209937894e-05, - "loss": 0.0097, + "epoch": 0.83, + "learning_rate": 0.0001760514385104502, + "loss": 0.0142, "step": 318780 }, { - "epoch": 1.61, - "learning_rate": 5.8749514406364926e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017604755029407875, + "loss": 0.0179, "step": 318790 }, { - "epoch": 1.61, - "learning_rate": 5.8741946713350914e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.0001760436620777073, + "loss": 0.0161, "step": 318800 }, { - "epoch": 1.61, - "learning_rate": 5.87343790203369e-05, - "loss": 0.009, + "epoch": 0.83, + "learning_rate": 0.0001760397738613358, + "loss": 0.0131, "step": 318810 }, { - "epoch": 1.61, - "learning_rate": 5.87268113273229e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017603588564496435, + "loss": 0.0128, "step": 318820 }, { - "epoch": 1.61, - "learning_rate": 5.8719243634308886e-05, - "loss": 0.009, + "epoch": 0.83, + "learning_rate": 0.00017603199742859287, + "loss": 0.0218, "step": 318830 }, { - "epoch": 1.61, - "learning_rate": 5.8711675941294874e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017602810921222144, + "loss": 0.0155, "step": 318840 }, { - "epoch": 1.61, - "learning_rate": 5.870410824828086e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017602422099584995, + "loss": 0.0156, "step": 318850 }, { - "epoch": 1.61, - "learning_rate": 5.869654055526686e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.0001760203327794785, + "loss": 0.0132, "step": 318860 }, { - "epoch": 1.61, - "learning_rate": 5.8688972862252845e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.000176016444563107, + "loss": 0.0166, "step": 318870 }, { - "epoch": 1.61, - "learning_rate": 5.8681405169238834e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017601255634673558, + "loss": 0.0144, "step": 318880 }, { - "epoch": 1.61, - "learning_rate": 5.867383747622482e-05, - "loss": 0.0096, + "epoch": 0.83, + "learning_rate": 0.00017600866813036412, + "loss": 0.0134, "step": 318890 }, { - "epoch": 1.61, - "learning_rate": 5.866626978321082e-05, - "loss": 0.0101, + "epoch": 0.83, + "learning_rate": 0.00017600477991399263, + "loss": 0.0152, "step": 318900 }, { - "epoch": 1.61, - "learning_rate": 5.8658702090196805e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017600089169762117, + "loss": 0.0142, "step": 318910 }, { - "epoch": 1.61, - "learning_rate": 5.865113439718279e-05, - "loss": 0.004, + "epoch": 0.83, + "learning_rate": 0.00017599700348124971, + "loss": 0.0139, "step": 318920 }, { - "epoch": 1.61, - "learning_rate": 5.864356670416878e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017599311526487826, + "loss": 0.0161, "step": 318930 }, { - "epoch": 1.61, - "learning_rate": 5.8635999011154776e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017598922704850677, + "loss": 0.0141, "step": 318940 }, { - "epoch": 1.61, - "learning_rate": 5.8628431318140765e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001759853388321353, + "loss": 0.0158, "step": 318950 }, { - "epoch": 1.61, - "learning_rate": 5.862086362512675e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017598145061576385, + "loss": 0.0117, "step": 318960 }, { - "epoch": 1.61, - "learning_rate": 5.861329593211274e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.0001759775623993924, + "loss": 0.0119, "step": 318970 }, { - "epoch": 1.61, - "learning_rate": 5.8605728239098736e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.0001759736741830209, + "loss": 0.0127, "step": 318980 }, { - "epoch": 1.61, - "learning_rate": 5.8598160546084724e-05, - "loss": 0.0108, + "epoch": 0.83, + "learning_rate": 0.00017596978596664945, + "loss": 0.0135, "step": 318990 }, { - "epoch": 1.61, - "learning_rate": 5.859059285307071e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.000175965897750278, + "loss": 0.0133, "step": 319000 }, { - "epoch": 1.61, - "eval_cer": 0.9144294992658953, - "eval_loss": 0.00516105629503727, - "eval_runtime": 116.3084, - "eval_samples_per_second": 17.196, - "eval_steps_per_second": 4.299, + "epoch": 0.83, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.00930393859744072, + "eval_runtime": 107.7238, + "eval_samples_per_second": 18.566, + "eval_steps_per_second": 4.641, "step": 319000 }, { - "epoch": 1.61, - "learning_rate": 5.858302516005671e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017596200953390654, + "loss": 0.0146, "step": 319010 }, { - "epoch": 1.61, - "learning_rate": 5.8575457467042696e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017595812131753505, + "loss": 0.0205, "step": 319020 }, { - "epoch": 1.61, - "learning_rate": 5.8567889774028684e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.0001759542331011636, + "loss": 0.0136, "step": 319030 }, { - "epoch": 1.61, - "learning_rate": 5.856032208101467e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017595034488479216, + "loss": 0.0117, "step": 319040 }, { - "epoch": 1.61, - "learning_rate": 5.855275438800067e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017594645666842067, + "loss": 0.0155, "step": 319050 }, { - "epoch": 1.61, - "learning_rate": 5.8545186694986655e-05, - "loss": 0.0092, + "epoch": 0.83, + "learning_rate": 0.00017594256845204922, + "loss": 0.0166, "step": 319060 }, { - "epoch": 1.61, - "learning_rate": 5.8537619001972644e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017593868023567773, + "loss": 0.0159, "step": 319070 }, { - "epoch": 1.61, - "learning_rate": 5.853005130895863e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017593479201930625, + "loss": 0.0149, "step": 319080 }, { - "epoch": 1.61, - "learning_rate": 5.852248361594463e-05, - "loss": 0.0092, + "epoch": 0.83, + "learning_rate": 0.00017593090380293481, + "loss": 0.0163, "step": 319090 }, { - "epoch": 1.61, - "learning_rate": 5.851491592293061e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017592701558656336, + "loss": 0.0121, "step": 319100 }, { - "epoch": 1.61, - "learning_rate": 5.8507348229916596e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017592312737019187, + "loss": 0.0118, "step": 319110 }, { - "epoch": 1.61, - "learning_rate": 5.8499780536902585e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.0001759192391538204, + "loss": 0.0177, "step": 319120 }, { - "epoch": 1.61, - "learning_rate": 5.849221284388857e-05, - "loss": 0.0044, + "epoch": 0.83, + "learning_rate": 0.00017591535093744895, + "loss": 0.015, "step": 319130 }, { - "epoch": 1.61, - "learning_rate": 5.848464515087457e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.0001759114627210775, + "loss": 0.0112, "step": 319140 }, { - "epoch": 1.61, - "learning_rate": 5.8477077457860556e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.000175907574504706, + "loss": 0.0134, "step": 319150 }, { - "epoch": 1.61, - "learning_rate": 5.8469509764846544e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.00017590368628833455, + "loss": 0.0119, "step": 319160 }, { - "epoch": 1.61, - "learning_rate": 5.846194207183253e-05, - "loss": 0.0095, + "epoch": 0.83, + "learning_rate": 0.0001758997980719631, + "loss": 0.0115, "step": 319170 }, { - "epoch": 1.61, - "learning_rate": 5.845437437881853e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017589590985559163, + "loss": 0.0136, "step": 319180 }, { - "epoch": 1.61, - "learning_rate": 5.8446806685804516e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017589202163922015, + "loss": 0.0169, "step": 319190 }, { - "epoch": 1.61, - "learning_rate": 5.8439238992790504e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001758881334228487, + "loss": 0.0129, "step": 319200 }, { - "epoch": 1.61, - "learning_rate": 5.843167129977649e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017588424520647726, + "loss": 0.0168, "step": 319210 }, { - "epoch": 1.61, - "learning_rate": 5.842410360676249e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017588035699010577, + "loss": 0.0131, "step": 319220 }, { - "epoch": 1.61, - "learning_rate": 5.8416535913748475e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017587646877373432, + "loss": 0.0144, "step": 319230 }, { - "epoch": 1.61, - "learning_rate": 5.8408968220734464e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017587258055736283, + "loss": 0.0148, "step": 319240 }, { - "epoch": 1.61, - "learning_rate": 5.840140052772045e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.0001758686923409914, + "loss": 0.0159, "step": 319250 }, { - "epoch": 1.61, - "learning_rate": 5.839383283470645e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017586480412461991, + "loss": 0.0099, "step": 319260 }, { - "epoch": 1.61, - "learning_rate": 5.8386265141692435e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017586091590824846, + "loss": 0.0125, "step": 319270 }, { - "epoch": 1.61, - "learning_rate": 5.837869744867842e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017585702769187697, + "loss": 0.0147, "step": 319280 }, { - "epoch": 1.61, - "learning_rate": 5.837112975566441e-05, - "loss": 0.011, + "epoch": 0.83, + "learning_rate": 0.00017585313947550554, + "loss": 0.0126, "step": 319290 }, { - "epoch": 1.61, - "learning_rate": 5.8363562062650406e-05, - "loss": 0.0049, + "epoch": 0.83, + "learning_rate": 0.00017584925125913405, + "loss": 0.0157, "step": 319300 }, { - "epoch": 1.61, - "learning_rate": 5.8355994369636395e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001758453630427626, + "loss": 0.0167, "step": 319310 }, { - "epoch": 1.61, - "learning_rate": 5.834842667662238e-05, - "loss": 0.0052, + "epoch": 0.83, + "learning_rate": 0.0001758414748263911, + "loss": 0.0128, "step": 319320 }, { - "epoch": 1.61, - "learning_rate": 5.834085898360837e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017583758661001965, + "loss": 0.0199, "step": 319330 }, { - "epoch": 1.61, - "learning_rate": 5.8333291290594366e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.0001758336983936482, + "loss": 0.0162, "step": 319340 }, { - "epoch": 1.61, - "learning_rate": 5.8325723597580354e-05, - "loss": 0.009, + "epoch": 0.83, + "learning_rate": 0.00017582981017727673, + "loss": 0.0136, "step": 319350 }, { - "epoch": 1.61, - "learning_rate": 5.831815590456634e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017582592196090525, + "loss": 0.0108, "step": 319360 }, { - "epoch": 1.61, - "learning_rate": 5.831058821155233e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001758220337445338, + "loss": 0.0162, "step": 319370 }, { - "epoch": 1.61, - "learning_rate": 5.8303020518538326e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017581814552816236, + "loss": 0.0158, "step": 319380 }, { - "epoch": 1.61, - "learning_rate": 5.8295452825524314e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017581425731179087, + "loss": 0.0129, "step": 319390 }, { - "epoch": 1.61, - "learning_rate": 5.82878851325103e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.0001758103690954194, + "loss": 0.0128, "step": 319400 }, { - "epoch": 1.61, - "learning_rate": 5.8280317439496284e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017580648087904793, + "loss": 0.0127, "step": 319410 }, { - "epoch": 1.61, - "learning_rate": 5.827274974648227e-05, - "loss": 0.0091, + "epoch": 0.83, + "learning_rate": 0.0001758025926626765, + "loss": 0.011, "step": 319420 }, { - "epoch": 1.61, - "learning_rate": 5.826518205346827e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.000175798704446305, + "loss": 0.0126, "step": 319430 }, { - "epoch": 1.61, - "learning_rate": 5.8257614360454255e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017579481622993355, + "loss": 0.0105, "step": 319440 }, { - "epoch": 1.61, - "learning_rate": 5.825004666744024e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017579092801356207, + "loss": 0.0147, "step": 319450 }, { - "epoch": 1.61, - "learning_rate": 5.824247897442623e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017578703979719064, + "loss": 0.0139, "step": 319460 }, { - "epoch": 1.61, - "learning_rate": 5.8234911281412227e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017578315158081915, + "loss": 0.0113, "step": 319470 }, { - "epoch": 1.61, - "learning_rate": 5.8227343588398215e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.0001757792633644477, + "loss": 0.0197, "step": 319480 }, { - "epoch": 1.61, - "learning_rate": 5.82197758953842e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001757753751480762, + "loss": 0.014, "step": 319490 }, { - "epoch": 1.61, - "learning_rate": 5.82122082023702e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017577148693170478, + "loss": 0.0108, "step": 319500 }, { - "epoch": 1.61, - "learning_rate": 5.8204640509356186e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.0001757675987153333, + "loss": 0.0131, "step": 319510 }, { - "epoch": 1.61, - "learning_rate": 5.8197072816342174e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017576371049896183, + "loss": 0.0108, "step": 319520 }, { - "epoch": 1.61, - "learning_rate": 5.818950512332816e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017575982228259035, + "loss": 0.0146, "step": 319530 }, { - "epoch": 1.61, - "learning_rate": 5.818193743031416e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017575593406621892, + "loss": 0.0147, "step": 319540 }, { - "epoch": 1.61, - "learning_rate": 5.8174369737300146e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017575204584984743, + "loss": 0.0151, "step": 319550 }, { - "epoch": 1.61, - "learning_rate": 5.8166802044286134e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017574815763347597, + "loss": 0.0132, "step": 319560 }, { - "epoch": 1.61, - "learning_rate": 5.815923435127212e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001757442694171045, + "loss": 0.0137, "step": 319570 }, { - "epoch": 1.61, - "learning_rate": 5.815166665825812e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017574038120073303, + "loss": 0.0116, "step": 319580 }, { - "epoch": 1.61, - "learning_rate": 5.8144098965244105e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.0001757364929843616, + "loss": 0.0148, "step": 319590 }, { - "epoch": 1.61, - "learning_rate": 5.8136531272230094e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001757326047679901, + "loss": 0.0193, "step": 319600 }, { - "epoch": 1.61, - "learning_rate": 5.812896357921608e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017572871655161865, + "loss": 0.013, "step": 319610 }, { - "epoch": 1.61, - "learning_rate": 5.812139588620208e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017572482833524717, + "loss": 0.0124, "step": 319620 }, { - "epoch": 1.61, - "learning_rate": 5.8113828193188065e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017572094011887574, + "loss": 0.0104, "step": 319630 }, { - "epoch": 1.61, - "learning_rate": 5.810626050017405e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017571705190250425, + "loss": 0.0166, "step": 319640 }, { - "epoch": 1.61, - "learning_rate": 5.809869280716004e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001757131636861328, + "loss": 0.0149, "step": 319650 }, { - "epoch": 1.61, - "learning_rate": 5.8091125114146037e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.0001757092754697613, + "loss": 0.0123, "step": 319660 }, { - "epoch": 1.61, - "learning_rate": 5.8083557421132025e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017570538725338988, + "loss": 0.0156, "step": 319670 }, { - "epoch": 1.61, - "learning_rate": 5.807598972811801e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.0001757014990370184, + "loss": 0.0144, "step": 319680 }, { - "epoch": 1.61, - "learning_rate": 5.8068422035104e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017569761082064693, + "loss": 0.0122, "step": 319690 }, { - "epoch": 1.61, - "learning_rate": 5.8060854342089996e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017569372260427545, + "loss": 0.011, "step": 319700 }, { - "epoch": 1.61, - "learning_rate": 5.8053286649075984e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017568983438790402, + "loss": 0.0139, "step": 319710 }, { - "epoch": 1.61, - "learning_rate": 5.804571895606197e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017568594617153253, + "loss": 0.0105, "step": 319720 }, { - "epoch": 1.61, - "learning_rate": 5.8038151263047954e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017568205795516107, + "loss": 0.013, "step": 319730 }, { - "epoch": 1.61, - "learning_rate": 5.803058357003394e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001756781697387896, + "loss": 0.016, "step": 319740 }, { - "epoch": 1.61, - "learning_rate": 5.802301587701994e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017567428152241816, + "loss": 0.0131, "step": 319750 }, { - "epoch": 1.61, - "learning_rate": 5.8015448184005926e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.0001756703933060467, + "loss": 0.0144, "step": 319760 }, { - "epoch": 1.61, - "learning_rate": 5.8007880490991914e-05, - "loss": 0.0087, + "epoch": 0.83, + "learning_rate": 0.0001756665050896752, + "loss": 0.0129, "step": 319770 }, { - "epoch": 1.61, - "learning_rate": 5.80003127979779e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017566261687330375, + "loss": 0.0207, "step": 319780 }, { - "epoch": 1.61, - "learning_rate": 5.79927451049639e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.0001756587286569323, + "loss": 0.0124, "step": 319790 }, { - "epoch": 1.61, - "learning_rate": 5.7985177411949885e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017565484044056084, + "loss": 0.0164, "step": 319800 }, { - "epoch": 1.61, - "learning_rate": 5.7977609718935873e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017565095222418935, + "loss": 0.01, "step": 319810 }, { - "epoch": 1.61, - "learning_rate": 5.797004202592186e-05, - "loss": 0.0048, + "epoch": 0.83, + "learning_rate": 0.0001756470640078179, + "loss": 0.0173, "step": 319820 }, { - "epoch": 1.61, - "learning_rate": 5.7962474332907857e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.0001756431757914464, + "loss": 0.0167, "step": 319830 }, { - "epoch": 1.61, - "learning_rate": 5.7954906639893845e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017563928757507498, + "loss": 0.0124, "step": 319840 }, { - "epoch": 1.61, - "learning_rate": 5.794733894687983e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001756353993587035, + "loss": 0.0158, "step": 319850 }, { - "epoch": 1.61, - "learning_rate": 5.793977125386582e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017563151114233203, + "loss": 0.0146, "step": 319860 }, { - "epoch": 1.61, - "learning_rate": 5.7932203560851816e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.00017562762292596055, + "loss": 0.014, "step": 319870 }, { - "epoch": 1.61, - "learning_rate": 5.7924635867837804e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017562373470958912, + "loss": 0.0206, "step": 319880 }, { - "epoch": 1.61, - "learning_rate": 5.791706817482379e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017561984649321763, + "loss": 0.0133, "step": 319890 }, { - "epoch": 1.61, - "learning_rate": 5.790950048180978e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017561595827684617, + "loss": 0.0119, "step": 319900 }, { - "epoch": 1.61, - "learning_rate": 5.7901932788795776e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017561207006047469, + "loss": 0.0111, "step": 319910 }, { - "epoch": 1.61, - "learning_rate": 5.7894365095781764e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017560818184410326, + "loss": 0.0141, "step": 319920 }, { - "epoch": 1.61, - "learning_rate": 5.788679740276775e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001756042936277318, + "loss": 0.0159, "step": 319930 }, { - "epoch": 1.61, - "learning_rate": 5.787922970975374e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.0001756004054113603, + "loss": 0.013, "step": 319940 }, { - "epoch": 1.61, - "learning_rate": 5.7871662016739736e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017559651719498885, + "loss": 0.0123, "step": 319950 }, { - "epoch": 1.61, - "learning_rate": 5.7864094323725724e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.0001755926289786174, + "loss": 0.0135, "step": 319960 }, { - "epoch": 1.61, - "learning_rate": 5.785652663071171e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017558874076224594, + "loss": 0.0127, "step": 319970 }, { - "epoch": 1.61, - "learning_rate": 5.784895893769771e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017558485254587445, + "loss": 0.0161, "step": 319980 }, { - "epoch": 1.61, - "learning_rate": 5.7841391244683695e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.000175580964329503, + "loss": 0.0119, "step": 319990 }, { - "epoch": 1.61, - "learning_rate": 5.7833823551669683e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017557707611313153, + "loss": 0.0151, "step": 320000 }, { - "epoch": 1.61, - "eval_cer": 0.9144392032271493, - "eval_loss": 0.005123169161379337, - "eval_runtime": 116.2037, - "eval_samples_per_second": 17.211, - "eval_steps_per_second": 4.303, + "epoch": 0.83, + "eval_cer": 0.8816998870492994, + "eval_loss": 0.009145650081336498, + "eval_runtime": 107.5595, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 320000 }, { - "epoch": 1.61, - "learning_rate": 5.782625585865567e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017557318789676008, + "loss": 0.014, "step": 320010 }, { - "epoch": 1.61, - "learning_rate": 5.781868816564167e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.0001755692996803886, + "loss": 0.0102, "step": 320020 }, { - "epoch": 1.61, - "learning_rate": 5.7811120472627655e-05, - "loss": 0.0101, + "epoch": 0.83, + "learning_rate": 0.00017556541146401713, + "loss": 0.0166, "step": 320030 }, { - "epoch": 1.61, - "learning_rate": 5.7803552779613636e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017556152324764567, + "loss": 0.0124, "step": 320040 }, { - "epoch": 1.61, - "learning_rate": 5.7795985086599625e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017555763503127422, + "loss": 0.012, "step": 320050 }, { - "epoch": 1.61, - "learning_rate": 5.778841739358561e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017555374681490273, + "loss": 0.0132, "step": 320060 }, { - "epoch": 1.61, - "learning_rate": 5.778084970057161e-05, - "loss": 0.0097, + "epoch": 0.83, + "learning_rate": 0.00017554985859853127, + "loss": 0.0173, "step": 320070 }, { - "epoch": 1.61, - "learning_rate": 5.7773282007557596e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017554597038215979, + "loss": 0.0112, "step": 320080 }, { - "epoch": 1.61, - "learning_rate": 5.7765714314543584e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017554208216578835, + "loss": 0.0141, "step": 320090 }, { - "epoch": 1.61, - "learning_rate": 5.775814662152957e-05, - "loss": 0.0095, + "epoch": 0.83, + "learning_rate": 0.0001755381939494169, + "loss": 0.0148, "step": 320100 }, { - "epoch": 1.61, - "learning_rate": 5.775057892851557e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.0001755343057330454, + "loss": 0.0146, "step": 320110 }, { - "epoch": 1.62, - "learning_rate": 5.7743011235501556e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017553041751667393, + "loss": 0.0164, "step": 320120 }, { - "epoch": 1.62, - "learning_rate": 5.7735443542487544e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001755265293003025, + "loss": 0.0116, "step": 320130 }, { - "epoch": 1.62, - "learning_rate": 5.772787584947353e-05, - "loss": 0.0096, + "epoch": 0.83, + "learning_rate": 0.00017552264108393104, + "loss": 0.0162, "step": 320140 }, { - "epoch": 1.62, - "learning_rate": 5.772030815645953e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017551875286755955, + "loss": 0.0125, "step": 320150 }, { - "epoch": 1.62, - "learning_rate": 5.7712740463445515e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001755148646511881, + "loss": 0.0128, "step": 320160 }, { - "epoch": 1.62, - "learning_rate": 5.7705172770431503e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017551097643481663, + "loss": 0.012, "step": 320170 }, { - "epoch": 1.62, - "learning_rate": 5.769760507741749e-05, - "loss": 0.0079, + "epoch": 0.83, + "learning_rate": 0.00017550708821844518, + "loss": 0.0136, "step": 320180 }, { - "epoch": 1.62, - "learning_rate": 5.769003738440349e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.0001755032000020737, + "loss": 0.013, "step": 320190 }, { - "epoch": 1.62, - "learning_rate": 5.7682469691389475e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017549931178570223, + "loss": 0.0134, "step": 320200 }, { - "epoch": 1.62, - "learning_rate": 5.767490199837546e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017549542356933077, + "loss": 0.0124, "step": 320210 }, { - "epoch": 1.62, - "learning_rate": 5.766733430536145e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017549153535295931, + "loss": 0.0173, "step": 320220 }, { - "epoch": 1.62, - "learning_rate": 5.7659766612347446e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017548764713658783, + "loss": 0.0169, "step": 320230 }, { - "epoch": 1.62, - "learning_rate": 5.7652198919333435e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017548375892021637, + "loss": 0.0116, "step": 320240 }, { - "epoch": 1.62, - "learning_rate": 5.764463122631942e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.00017547987070384494, + "loss": 0.0156, "step": 320250 }, { - "epoch": 1.62, - "learning_rate": 5.763706353330541e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017547598248747345, + "loss": 0.0121, "step": 320260 }, { - "epoch": 1.62, - "learning_rate": 5.7629495840291406e-05, - "loss": 0.0111, + "epoch": 0.83, + "learning_rate": 0.00017547209427110197, + "loss": 0.0104, "step": 320270 }, { - "epoch": 1.62, - "learning_rate": 5.7621928147277394e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001754682060547305, + "loss": 0.0146, "step": 320280 }, { - "epoch": 1.62, - "learning_rate": 5.761436045426338e-05, - "loss": 0.0095, + "epoch": 0.83, + "learning_rate": 0.00017546431783835908, + "loss": 0.0134, "step": 320290 }, { - "epoch": 1.62, - "learning_rate": 5.760679276124937e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.0001754604296219876, + "loss": 0.0134, "step": 320300 }, { - "epoch": 1.62, - "learning_rate": 5.7599225068235366e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017545654140561614, + "loss": 0.0121, "step": 320310 }, { - "epoch": 1.62, - "learning_rate": 5.7591657375221354e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017545265318924465, + "loss": 0.0171, "step": 320320 }, { - "epoch": 1.62, - "learning_rate": 5.758408968220734e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.0001754487649728732, + "loss": 0.0172, "step": 320330 }, { - "epoch": 1.62, - "learning_rate": 5.757652198919333e-05, - "loss": 0.0091, + "epoch": 0.83, + "learning_rate": 0.00017544487675650173, + "loss": 0.0131, "step": 320340 }, { - "epoch": 1.62, - "learning_rate": 5.756895429617931e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017544098854013027, + "loss": 0.0133, "step": 320350 }, { - "epoch": 1.62, - "learning_rate": 5.756138660316531e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.0001754371003237588, + "loss": 0.0138, "step": 320360 }, { - "epoch": 1.62, - "learning_rate": 5.7553818910151295e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017543321210738733, + "loss": 0.0122, "step": 320370 }, { - "epoch": 1.62, - "learning_rate": 5.754625121713728e-05, - "loss": 0.0111, - "step": 320380 + "epoch": 0.83, + "learning_rate": 0.00017542932389101587, + "loss": 0.0143, + "step": 320380 }, { - "epoch": 1.62, - "learning_rate": 5.753868352412327e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017542543567464441, + "loss": 0.0183, "step": 320390 }, { - "epoch": 1.62, - "learning_rate": 5.7531115831109266e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.00017542154745827293, + "loss": 0.0126, "step": 320400 }, { - "epoch": 1.62, - "learning_rate": 5.7523548138095255e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017541765924190147, + "loss": 0.0166, "step": 320410 }, { - "epoch": 1.62, - "learning_rate": 5.751598044508124e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017541377102553004, + "loss": 0.0156, "step": 320420 }, { - "epoch": 1.62, - "learning_rate": 5.750841275206723e-05, - "loss": 0.0078, + "epoch": 0.83, + "learning_rate": 0.00017540988280915855, + "loss": 0.0106, "step": 320430 }, { - "epoch": 1.62, - "learning_rate": 5.7500845059053226e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017540599459278707, + "loss": 0.0136, "step": 320440 }, { - "epoch": 1.62, - "learning_rate": 5.7493277366039214e-05, - "loss": 0.0086, + "epoch": 0.83, + "learning_rate": 0.0001754021063764156, + "loss": 0.0122, "step": 320450 }, { - "epoch": 1.62, - "learning_rate": 5.74857096730252e-05, - "loss": 0.0121, + "epoch": 0.83, + "learning_rate": 0.00017539821816004418, + "loss": 0.0106, "step": 320460 }, { - "epoch": 1.62, - "learning_rate": 5.74781419800112e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.0001753943299436727, + "loss": 0.0145, "step": 320470 }, { - "epoch": 1.62, - "learning_rate": 5.7470574286997186e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017539044172730123, + "loss": 0.0152, "step": 320480 }, { - "epoch": 1.62, - "learning_rate": 5.7463006593983174e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017538655351092975, + "loss": 0.0129, "step": 320490 }, { - "epoch": 1.62, - "learning_rate": 5.745543890096916e-05, - "loss": 0.0085, + "epoch": 0.83, + "learning_rate": 0.00017538266529455832, + "loss": 0.0118, "step": 320500 }, { - "epoch": 1.62, - "learning_rate": 5.744787120795516e-05, - "loss": 0.0091, + "epoch": 0.83, + "learning_rate": 0.00017537877707818683, + "loss": 0.015, "step": 320510 }, { - "epoch": 1.62, - "learning_rate": 5.7440303514941145e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017537488886181537, + "loss": 0.0161, "step": 320520 }, { - "epoch": 1.62, - "learning_rate": 5.7432735821927134e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.0001753710006454439, + "loss": 0.0157, "step": 320530 }, { - "epoch": 1.62, - "learning_rate": 5.742516812891312e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017536711242907246, + "loss": 0.0187, "step": 320540 }, { - "epoch": 1.62, - "learning_rate": 5.741760043589912e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017536322421270097, + "loss": 0.0165, "step": 320550 }, { - "epoch": 1.62, - "learning_rate": 5.7410032742885105e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.0001753593359963295, + "loss": 0.0154, "step": 320560 }, { - "epoch": 1.62, - "learning_rate": 5.740246504987109e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017535544777995803, + "loss": 0.0126, "step": 320570 }, { - "epoch": 1.62, - "learning_rate": 5.739489735685708e-05, - "loss": 0.0097, + "epoch": 0.83, + "learning_rate": 0.00017535155956358657, + "loss": 0.0151, "step": 320580 }, { - "epoch": 1.62, - "learning_rate": 5.7387329663843076e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001753476713472151, + "loss": 0.0114, "step": 320590 }, { - "epoch": 1.62, - "learning_rate": 5.7379761970829065e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017534378313084365, + "loss": 0.0117, "step": 320600 }, { - "epoch": 1.62, - "learning_rate": 5.737219427781505e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017533989491447217, + "loss": 0.019, "step": 320610 }, { - "epoch": 1.62, - "learning_rate": 5.736462658480104e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001753360066981007, + "loss": 0.0184, "step": 320620 }, { - "epoch": 1.62, - "learning_rate": 5.7357058891787036e-05, - "loss": 0.0048, + "epoch": 0.83, + "learning_rate": 0.00017533211848172928, + "loss": 0.0134, "step": 320630 }, { - "epoch": 1.62, - "learning_rate": 5.7349491198773024e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.0001753282302653578, + "loss": 0.0127, "step": 320640 }, { - "epoch": 1.62, - "learning_rate": 5.734192350575901e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017532434204898633, + "loss": 0.0115, "step": 320650 }, { - "epoch": 1.62, - "learning_rate": 5.7334355812745e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017532045383261485, + "loss": 0.0096, "step": 320660 }, { - "epoch": 1.62, - "learning_rate": 5.732678811973098e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017531656561624342, + "loss": 0.0135, "step": 320670 }, { - "epoch": 1.62, - "learning_rate": 5.731922042671698e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017531267739987193, + "loss": 0.0112, "step": 320680 }, { - "epoch": 1.62, - "learning_rate": 5.7311652733702965e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017530878918350047, + "loss": 0.0159, "step": 320690 }, { - "epoch": 1.62, - "learning_rate": 5.7304085040688954e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.000175304900967129, + "loss": 0.013, "step": 320700 }, { - "epoch": 1.62, - "learning_rate": 5.729651734767494e-05, - "loss": 0.0056, + "epoch": 0.83, + "learning_rate": 0.00017530101275075756, + "loss": 0.021, "step": 320710 }, { - "epoch": 1.62, - "learning_rate": 5.728894965466094e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017529712453438607, + "loss": 0.0166, "step": 320720 }, { - "epoch": 1.62, - "learning_rate": 5.7281381961646925e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.0001752932363180146, + "loss": 0.0133, "step": 320730 }, { - "epoch": 1.62, - "learning_rate": 5.727381426863291e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017528934810164313, + "loss": 0.0129, "step": 320740 }, { - "epoch": 1.62, - "learning_rate": 5.72662465756189e-05, - "loss": 0.0093, + "epoch": 0.83, + "learning_rate": 0.0001752854598852717, + "loss": 0.0173, "step": 320750 }, { - "epoch": 1.62, - "learning_rate": 5.7258678882604896e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.0001752815716689002, + "loss": 0.0157, "step": 320760 }, { - "epoch": 1.62, - "learning_rate": 5.7251111189590885e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017527768345252875, + "loss": 0.0123, "step": 320770 }, { - "epoch": 1.62, - "learning_rate": 5.724354349657687e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017527379523615727, + "loss": 0.0144, "step": 320780 }, { - "epoch": 1.62, - "learning_rate": 5.723597580356286e-05, - "loss": 0.005, + "epoch": 0.83, + "learning_rate": 0.00017526990701978584, + "loss": 0.0136, "step": 320790 }, { - "epoch": 1.62, - "learning_rate": 5.7228408110548856e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017526601880341438, + "loss": 0.015, "step": 320800 }, { - "epoch": 1.62, - "learning_rate": 5.7220840417534844e-05, - "loss": 0.0106, + "epoch": 0.83, + "learning_rate": 0.0001752621305870429, + "loss": 0.0145, "step": 320810 }, { - "epoch": 1.62, - "learning_rate": 5.721327272452083e-05, - "loss": 0.0052, + "epoch": 0.83, + "learning_rate": 0.00017525824237067143, + "loss": 0.013, "step": 320820 }, { - "epoch": 1.62, - "learning_rate": 5.720570503150682e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017525435415429995, + "loss": 0.0154, "step": 320830 }, { - "epoch": 1.62, - "learning_rate": 5.7198137338492816e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017525046593792852, + "loss": 0.0176, "step": 320840 }, { - "epoch": 1.62, - "learning_rate": 5.7190569645478804e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017524657772155703, + "loss": 0.0174, "step": 320850 }, { - "epoch": 1.62, - "learning_rate": 5.718300195246479e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017524268950518557, + "loss": 0.0133, "step": 320860 }, { - "epoch": 1.62, - "learning_rate": 5.717543425945078e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001752388012888141, + "loss": 0.0142, "step": 320870 }, { - "epoch": 1.62, - "learning_rate": 5.7167866566436775e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017523491307244266, + "loss": 0.0146, "step": 320880 }, { - "epoch": 1.62, - "learning_rate": 5.7160298873422764e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.00017523102485607117, + "loss": 0.0136, "step": 320890 }, { - "epoch": 1.62, - "learning_rate": 5.715273118040875e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.0001752271366396997, + "loss": 0.0134, "step": 320900 }, { - "epoch": 1.62, - "learning_rate": 5.714516348739474e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.00017522324842332823, + "loss": 0.0134, "step": 320910 }, { - "epoch": 1.62, - "learning_rate": 5.7137595794380735e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.0001752193602069568, + "loss": 0.0109, "step": 320920 }, { - "epoch": 1.62, - "learning_rate": 5.713002810136672e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.0001752154719905853, + "loss": 0.0143, "step": 320930 }, { - "epoch": 1.62, - "learning_rate": 5.712246040835271e-05, - "loss": 0.0047, + "epoch": 0.83, + "learning_rate": 0.00017521158377421385, + "loss": 0.0123, "step": 320940 }, { - "epoch": 1.62, - "learning_rate": 5.7114892715338707e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017520769555784237, + "loss": 0.0152, "step": 320950 }, { - "epoch": 1.62, - "learning_rate": 5.7107325022324695e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017520380734147093, + "loss": 0.0146, "step": 320960 }, { - "epoch": 1.62, - "learning_rate": 5.709975732931068e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017519991912509948, + "loss": 0.0112, "step": 320970 }, { - "epoch": 1.62, - "learning_rate": 5.7092189636296664e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.000175196030908728, + "loss": 0.0145, "step": 320980 }, { - "epoch": 1.62, - "learning_rate": 5.708462194328265e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001751921426923565, + "loss": 0.0135, "step": 320990 }, { - "epoch": 1.62, - "learning_rate": 5.707705425026865e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.00017518825447598507, + "loss": 0.0112, "step": 321000 }, { - "epoch": 1.62, - "eval_cer": 0.9144275584736445, - "eval_loss": 0.005066942423582077, - "eval_runtime": 116.3307, - "eval_samples_per_second": 17.192, - "eval_steps_per_second": 4.298, + "epoch": 0.83, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.00950040016323328, + "eval_runtime": 107.7703, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.639, "step": 321000 }, { - "epoch": 1.62, - "learning_rate": 5.7069486557254636e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017518436625961362, + "loss": 0.0165, "step": 321010 }, { - "epoch": 1.62, - "learning_rate": 5.7061918864240624e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017518047804324213, + "loss": 0.0115, "step": 321020 }, { - "epoch": 1.62, - "learning_rate": 5.705435117122661e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017517658982687067, + "loss": 0.0124, "step": 321030 }, { - "epoch": 1.62, - "learning_rate": 5.704678347821261e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017517270161049921, + "loss": 0.0176, "step": 321040 }, { - "epoch": 1.62, - "learning_rate": 5.7039215785198595e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017516881339412776, + "loss": 0.0146, "step": 321050 }, { - "epoch": 1.62, - "learning_rate": 5.7031648092184584e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.00017516492517775627, + "loss": 0.0112, "step": 321060 }, { - "epoch": 1.62, - "learning_rate": 5.702408039917057e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.0001751610369613848, + "loss": 0.0129, "step": 321070 }, { - "epoch": 1.62, - "learning_rate": 5.701651270615657e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.00017515714874501333, + "loss": 0.0111, "step": 321080 }, { - "epoch": 1.62, - "learning_rate": 5.7008945013142555e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001751532605286419, + "loss": 0.0121, "step": 321090 }, { - "epoch": 1.62, - "learning_rate": 5.700137732012854e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.0001751493723122704, + "loss": 0.0152, "step": 321100 }, { - "epoch": 1.62, - "learning_rate": 5.699380962711453e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.00017514548409589895, + "loss": 0.0129, "step": 321110 }, { - "epoch": 1.62, - "learning_rate": 5.6986241934100527e-05, - "loss": 0.0048, + "epoch": 0.83, + "learning_rate": 0.00017514159587952747, + "loss": 0.0136, "step": 321120 }, { - "epoch": 1.62, - "learning_rate": 5.6978674241086515e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017513770766315603, + "loss": 0.0129, "step": 321130 }, { - "epoch": 1.62, - "learning_rate": 5.69711065480725e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017513381944678455, + "loss": 0.0133, "step": 321140 }, { - "epoch": 1.62, - "learning_rate": 5.696353885505849e-05, - "loss": 0.0049, + "epoch": 0.83, + "learning_rate": 0.0001751299312304131, + "loss": 0.0117, "step": 321150 }, { - "epoch": 1.62, - "learning_rate": 5.6955971162044486e-05, - "loss": 0.0075, + "epoch": 0.83, + "learning_rate": 0.0001751260430140416, + "loss": 0.0164, "step": 321160 }, { - "epoch": 1.62, - "learning_rate": 5.6948403469030474e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017512215479767017, + "loss": 0.0122, "step": 321170 }, { - "epoch": 1.62, - "learning_rate": 5.694083577601646e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.00017511826658129872, + "loss": 0.0097, "step": 321180 }, { - "epoch": 1.62, - "learning_rate": 5.693326808300245e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017511437836492723, + "loss": 0.0243, "step": 321190 }, { - "epoch": 1.62, - "learning_rate": 5.6925700389988446e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017511049014855577, + "loss": 0.015, "step": 321200 }, { - "epoch": 1.62, - "learning_rate": 5.6918132696974434e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.0001751066019321843, + "loss": 0.0127, "step": 321210 }, { - "epoch": 1.62, - "learning_rate": 5.691056500396042e-05, - "loss": 0.0091, + "epoch": 0.83, + "learning_rate": 0.00017510271371581285, + "loss": 0.0108, "step": 321220 }, { - "epoch": 1.62, - "learning_rate": 5.690299731094641e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017509882549944137, + "loss": 0.0119, "step": 321230 }, { - "epoch": 1.62, - "learning_rate": 5.6895429617932406e-05, - "loss": 0.0092, + "epoch": 0.83, + "learning_rate": 0.0001750949372830699, + "loss": 0.014, "step": 321240 }, { - "epoch": 1.62, - "learning_rate": 5.6887861924918394e-05, - "loss": 0.0049, + "epoch": 0.83, + "learning_rate": 0.00017509104906669845, + "loss": 0.0114, "step": 321250 }, { - "epoch": 1.62, - "learning_rate": 5.688029423190438e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.000175087160850327, + "loss": 0.0123, "step": 321260 }, { - "epoch": 1.62, - "learning_rate": 5.687272653889037e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.0001750832726339555, + "loss": 0.0142, "step": 321270 }, { - "epoch": 1.62, - "learning_rate": 5.6865158845876365e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017507938441758405, + "loss": 0.0121, "step": 321280 }, { - "epoch": 1.62, - "learning_rate": 5.685759115286235e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017507549620121262, + "loss": 0.0134, "step": 321290 }, { - "epoch": 1.62, - "learning_rate": 5.6850023459848335e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017507160798484113, + "loss": 0.0142, "step": 321300 }, { - "epoch": 1.62, - "learning_rate": 5.684245576683432e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017506771976846965, + "loss": 0.0114, "step": 321310 }, { - "epoch": 1.62, - "learning_rate": 5.683488807382031e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001750638315520982, + "loss": 0.0124, "step": 321320 }, { - "epoch": 1.62, - "learning_rate": 5.6827320380806306e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.0001750599433357267, + "loss": 0.0113, "step": 321330 }, { - "epoch": 1.62, - "learning_rate": 5.6819752687792294e-05, - "loss": 0.0072, + "epoch": 0.83, + "learning_rate": 0.00017505605511935527, + "loss": 0.0143, "step": 321340 }, { - "epoch": 1.62, - "learning_rate": 5.681218499477828e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017505216690298381, + "loss": 0.0131, "step": 321350 }, { - "epoch": 1.62, - "learning_rate": 5.680461730176427e-05, - "loss": 0.005, + "epoch": 0.83, + "learning_rate": 0.00017504827868661233, + "loss": 0.0127, "step": 321360 }, { - "epoch": 1.62, - "learning_rate": 5.6797049608750266e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017504439047024087, + "loss": 0.0171, "step": 321370 }, { - "epoch": 1.62, - "learning_rate": 5.6789481915736254e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001750405022538694, + "loss": 0.0136, "step": 321380 }, { - "epoch": 1.62, - "learning_rate": 5.678191422272224e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017503661403749795, + "loss": 0.0179, "step": 321390 }, { - "epoch": 1.62, - "learning_rate": 5.677434652970823e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017503272582112647, + "loss": 0.0112, "step": 321400 }, { - "epoch": 1.62, - "learning_rate": 5.6766778836694226e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.000175028837604755, + "loss": 0.0152, "step": 321410 }, { - "epoch": 1.62, - "learning_rate": 5.6759211143680214e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017502494938838355, + "loss": 0.0098, "step": 321420 }, { - "epoch": 1.62, - "learning_rate": 5.67516434506662e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.0001750210611720121, + "loss": 0.0146, "step": 321430 }, { - "epoch": 1.62, - "learning_rate": 5.67440757576522e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001750171729556406, + "loss": 0.0137, "step": 321440 }, { - "epoch": 1.62, - "learning_rate": 5.6736508064638185e-05, - "loss": 0.0048, + "epoch": 0.83, + "learning_rate": 0.00017501328473926915, + "loss": 0.0159, "step": 321450 }, { - "epoch": 1.62, - "learning_rate": 5.6728940371624173e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.0001750093965228977, + "loss": 0.0121, "step": 321460 }, { - "epoch": 1.62, - "learning_rate": 5.672137267861016e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017500550830652623, + "loss": 0.0169, "step": 321470 }, { - "epoch": 1.62, - "learning_rate": 5.671380498559616e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.00017500162009015475, + "loss": 0.0121, "step": 321480 }, { - "epoch": 1.62, - "learning_rate": 5.6706237292582145e-05, - "loss": 0.0063, + "epoch": 0.83, + "learning_rate": 0.0001749977318737833, + "loss": 0.0133, "step": 321490 }, { - "epoch": 1.62, - "learning_rate": 5.669866959956813e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017499384365741186, + "loss": 0.0158, "step": 321500 }, { - "epoch": 1.62, - "learning_rate": 5.669110190655412e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017498995544104037, + "loss": 0.0143, "step": 321510 }, { - "epoch": 1.62, - "learning_rate": 5.6683534213540116e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017498606722466891, + "loss": 0.0132, "step": 321520 }, { - "epoch": 1.62, - "learning_rate": 5.6675966520526105e-05, - "loss": 0.0071, + "epoch": 0.83, + "learning_rate": 0.00017498217900829743, + "loss": 0.0145, "step": 321530 }, { - "epoch": 1.62, - "learning_rate": 5.666839882751209e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.000174978290791926, + "loss": 0.0147, "step": 321540 }, { - "epoch": 1.62, - "learning_rate": 5.666083113449808e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001749744025755545, + "loss": 0.0144, "step": 321550 }, { - "epoch": 1.62, - "learning_rate": 5.6653263441484076e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.00017497051435918305, + "loss": 0.0168, "step": 321560 }, { - "epoch": 1.62, - "learning_rate": 5.6645695748470064e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017496662614281157, + "loss": 0.017, "step": 321570 }, { - "epoch": 1.62, - "learning_rate": 5.663812805545605e-05, - "loss": 0.0062, + "epoch": 0.83, + "learning_rate": 0.0001749627379264401, + "loss": 0.012, "step": 321580 }, { - "epoch": 1.62, - "learning_rate": 5.663056036244204e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017495884971006865, + "loss": 0.0112, "step": 321590 }, { - "epoch": 1.62, - "learning_rate": 5.6622992669428036e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001749549614936972, + "loss": 0.0193, "step": 321600 }, { - "epoch": 1.62, - "learning_rate": 5.661542497641402e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.0001749510732773257, + "loss": 0.012, "step": 321610 }, { - "epoch": 1.62, - "learning_rate": 5.6607857283400005e-05, - "loss": 0.0061, + "epoch": 0.83, + "learning_rate": 0.00017494718506095425, + "loss": 0.0178, "step": 321620 }, { - "epoch": 1.62, - "learning_rate": 5.6600289590385993e-05, - "loss": 0.0108, + "epoch": 0.83, + "learning_rate": 0.0001749432968445828, + "loss": 0.0129, "step": 321630 }, { - "epoch": 1.62, - "learning_rate": 5.659272189737198e-05, - "loss": 0.0069, + "epoch": 0.83, + "learning_rate": 0.00017493940862821133, + "loss": 0.0131, "step": 321640 }, { - "epoch": 1.62, - "learning_rate": 5.658515420435798e-05, - "loss": 0.0081, + "epoch": 0.83, + "learning_rate": 0.00017493552041183985, + "loss": 0.0186, "step": 321650 }, { - "epoch": 1.62, - "learning_rate": 5.6577586511343965e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.0001749316321954684, + "loss": 0.0121, "step": 321660 }, { - "epoch": 1.62, - "learning_rate": 5.657001881832995e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017492774397909696, + "loss": 0.0153, "step": 321670 }, { - "epoch": 1.62, - "learning_rate": 5.656245112531594e-05, - "loss": 0.0066, + "epoch": 0.83, + "learning_rate": 0.00017492385576272547, + "loss": 0.0136, "step": 321680 }, { - "epoch": 1.62, - "learning_rate": 5.6554883432301936e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017491996754635401, + "loss": 0.0129, "step": 321690 }, { - "epoch": 1.62, - "learning_rate": 5.6547315739287925e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017491607932998253, + "loss": 0.0138, "step": 321700 }, { - "epoch": 1.62, - "learning_rate": 5.653974804627391e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.0001749121911136111, + "loss": 0.016, "step": 321710 }, { - "epoch": 1.62, - "learning_rate": 5.65321803532599e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.0001749083028972396, + "loss": 0.0115, "step": 321720 }, { - "epoch": 1.62, - "learning_rate": 5.6524612660245896e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017490441468086815, + "loss": 0.0144, "step": 321730 }, { - "epoch": 1.62, - "learning_rate": 5.6517044967231884e-05, - "loss": 0.0067, + "epoch": 0.83, + "learning_rate": 0.00017490052646449667, + "loss": 0.0156, "step": 321740 }, { - "epoch": 1.62, - "learning_rate": 5.650947727421787e-05, - "loss": 0.0053, + "epoch": 0.83, + "learning_rate": 0.00017489663824812524, + "loss": 0.0135, "step": 321750 }, { - "epoch": 1.62, - "learning_rate": 5.650190958120386e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017489275003175375, + "loss": 0.0136, "step": 321760 }, { - "epoch": 1.62, - "learning_rate": 5.6494341888189856e-05, - "loss": 0.0054, + "epoch": 0.83, + "learning_rate": 0.0001748888618153823, + "loss": 0.0125, "step": 321770 }, { - "epoch": 1.62, - "learning_rate": 5.6486774195175844e-05, - "loss": 0.0094, + "epoch": 0.83, + "learning_rate": 0.0001748849735990108, + "loss": 0.0133, "step": 321780 }, { - "epoch": 1.62, - "learning_rate": 5.647920650216183e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.00017488108538263938, + "loss": 0.0137, "step": 321790 }, { - "epoch": 1.62, - "learning_rate": 5.647163880914782e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.0001748771971662679, + "loss": 0.0116, "step": 321800 }, { - "epoch": 1.62, - "learning_rate": 5.6464071116133815e-05, - "loss": 0.0068, + "epoch": 0.83, + "learning_rate": 0.00017487330894989643, + "loss": 0.0137, "step": 321810 }, { - "epoch": 1.62, - "learning_rate": 5.6456503423119804e-05, - "loss": 0.0084, + "epoch": 0.83, + "learning_rate": 0.00017486942073352495, + "loss": 0.0121, "step": 321820 }, { - "epoch": 1.62, - "learning_rate": 5.644893573010579e-05, - "loss": 0.0065, + "epoch": 0.83, + "learning_rate": 0.0001748655325171535, + "loss": 0.0122, "step": 321830 }, { - "epoch": 1.62, - "learning_rate": 5.644136803709178e-05, - "loss": 0.0083, + "epoch": 0.83, + "learning_rate": 0.00017486164430078206, + "loss": 0.0094, "step": 321840 }, { - "epoch": 1.62, - "learning_rate": 5.6433800344077775e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017485775608441057, + "loss": 0.0167, "step": 321850 }, { - "epoch": 1.62, - "learning_rate": 5.642623265106376e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017485386786803909, + "loss": 0.0129, "step": 321860 }, { - "epoch": 1.62, - "learning_rate": 5.641866495804975e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017484997965166763, + "loss": 0.0129, "step": 321870 }, { - "epoch": 1.62, - "learning_rate": 5.641109726503574e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.0001748460914352962, + "loss": 0.0107, "step": 321880 }, { - "epoch": 1.62, - "learning_rate": 5.6403529572021735e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001748422032189247, + "loss": 0.0138, "step": 321890 }, { - "epoch": 1.62, - "learning_rate": 5.639596187900772e-05, - "loss": 0.0055, + "epoch": 0.83, + "learning_rate": 0.00017483831500255325, + "loss": 0.0174, "step": 321900 }, { - "epoch": 1.62, - "learning_rate": 5.638839418599371e-05, - "loss": 0.0082, + "epoch": 0.83, + "learning_rate": 0.00017483442678618177, + "loss": 0.013, "step": 321910 }, { - "epoch": 1.62, - "learning_rate": 5.6380826492979706e-05, - "loss": 0.0059, + "epoch": 0.83, + "learning_rate": 0.00017483053856981034, + "loss": 0.0128, "step": 321920 }, { - "epoch": 1.62, - "learning_rate": 5.637325879996569e-05, - "loss": 0.008, + "epoch": 0.83, + "learning_rate": 0.00017482665035343885, + "loss": 0.0138, "step": 321930 }, { - "epoch": 1.62, - "learning_rate": 5.6365691106951676e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.0001748227621370674, + "loss": 0.0163, "step": 321940 }, { - "epoch": 1.62, - "learning_rate": 5.6358123413937664e-05, - "loss": 0.006, + "epoch": 0.83, + "learning_rate": 0.0001748188739206959, + "loss": 0.0124, "step": 321950 }, { - "epoch": 1.62, - "learning_rate": 5.635055572092365e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017481498570432448, + "loss": 0.015, "step": 321960 }, { - "epoch": 1.62, - "learning_rate": 5.634298802790965e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.000174811097487953, + "loss": 0.0147, "step": 321970 }, { - "epoch": 1.62, - "learning_rate": 5.6335420334895635e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017480720927158153, + "loss": 0.0116, "step": 321980 }, { - "epoch": 1.62, - "learning_rate": 5.6327852641881624e-05, - "loss": 0.0076, + "epoch": 0.83, + "learning_rate": 0.00017480332105521005, + "loss": 0.0123, "step": 321990 }, { - "epoch": 1.62, - "learning_rate": 5.632028494886761e-05, - "loss": 0.0095, + "epoch": 0.83, + "learning_rate": 0.00017479943283883861, + "loss": 0.0118, "step": 322000 }, { - "epoch": 1.62, - "eval_cer": 0.9144197953046413, - "eval_loss": 0.005024084821343422, - "eval_runtime": 116.2702, - "eval_samples_per_second": 17.201, - "eval_steps_per_second": 4.3, + "epoch": 0.83, + "eval_cer": 0.8817208816033121, + "eval_loss": 0.00928072165697813, + "eval_runtime": 107.7164, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, "step": 322000 }, { - "epoch": 1.62, - "learning_rate": 5.631271725585361e-05, - "loss": 0.0047, + "epoch": 0.83, + "learning_rate": 0.00017479554462246716, + "loss": 0.0122, "step": 322010 }, { - "epoch": 1.62, - "learning_rate": 5.6305149562839595e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017479165640609567, + "loss": 0.0135, "step": 322020 }, { - "epoch": 1.62, - "learning_rate": 5.629758186982558e-05, - "loss": 0.0073, + "epoch": 0.83, + "learning_rate": 0.00017478776818972419, + "loss": 0.0153, "step": 322030 }, { - "epoch": 1.62, - "learning_rate": 5.629001417681157e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.00017478387997335275, + "loss": 0.0143, "step": 322040 }, { - "epoch": 1.62, - "learning_rate": 5.6282446483797566e-05, - "loss": 0.0058, + "epoch": 0.83, + "learning_rate": 0.0001747799917569813, + "loss": 0.0099, "step": 322050 }, { - "epoch": 1.62, - "learning_rate": 5.6274878790783555e-05, - "loss": 0.0077, + "epoch": 0.83, + "learning_rate": 0.0001747761035406098, + "loss": 0.0157, "step": 322060 }, { - "epoch": 1.62, - "learning_rate": 5.626731109776954e-05, - "loss": 0.0051, + "epoch": 0.83, + "learning_rate": 0.00017477221532423835, + "loss": 0.0159, "step": 322070 }, { - "epoch": 1.62, - "learning_rate": 5.625974340475553e-05, - "loss": 0.007, + "epoch": 0.83, + "learning_rate": 0.00017476832710786687, + "loss": 0.0146, "step": 322080 }, { - "epoch": 1.62, - "learning_rate": 5.6252175711741526e-05, - "loss": 0.0064, + "epoch": 0.83, + "learning_rate": 0.00017476443889149544, + "loss": 0.0118, "step": 322090 }, { - "epoch": 1.63, - "learning_rate": 5.6244608018727514e-05, - "loss": 0.0057, + "epoch": 0.83, + "learning_rate": 0.00017476055067512395, + "loss": 0.0115, "step": 322100 }, { - "epoch": 1.63, - "learning_rate": 5.62370403257135e-05, - "loss": 0.0074, + "epoch": 0.83, + "learning_rate": 0.0001747566624587525, + "loss": 0.0104, "step": 322110 }, { - "epoch": 1.63, - "learning_rate": 5.622947263269949e-05, - "loss": 0.0089, + "epoch": 0.83, + "learning_rate": 0.000174752774242381, + "loss": 0.0151, "step": 322120 }, { - "epoch": 1.63, - "learning_rate": 5.6221904939685486e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017474888602600957, + "loss": 0.015, "step": 322130 }, { - "epoch": 1.63, - "learning_rate": 5.6214337246671474e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.0001747449978096381, + "loss": 0.0112, "step": 322140 }, { - "epoch": 1.63, - "learning_rate": 5.620676955365746e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.00017474110959326663, + "loss": 0.0136, "step": 322150 }, { - "epoch": 1.63, - "learning_rate": 5.619920186064345e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017473722137689515, + "loss": 0.0151, "step": 322160 }, { - "epoch": 1.63, - "learning_rate": 5.6191634167629445e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017473333316052371, + "loss": 0.0115, "step": 322170 }, { - "epoch": 1.63, - "learning_rate": 5.6184066474615434e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017472944494415223, + "loss": 0.0194, "step": 322180 }, { - "epoch": 1.63, - "learning_rate": 5.617649878160142e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017472555672778077, + "loss": 0.0121, "step": 322190 }, { - "epoch": 1.63, - "learning_rate": 5.616893108858741e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017472166851140928, + "loss": 0.016, "step": 322200 }, { - "epoch": 1.63, - "learning_rate": 5.6161363395573405e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017471778029503785, + "loss": 0.0105, "step": 322210 }, { - "epoch": 1.63, - "learning_rate": 5.615379570255939e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001747138920786664, + "loss": 0.0182, "step": 322220 }, { - "epoch": 1.63, - "learning_rate": 5.614622800954538e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001747100038622949, + "loss": 0.0121, "step": 322230 }, { - "epoch": 1.63, - "learning_rate": 5.613866031653136e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017470611564592345, + "loss": 0.0111, "step": 322240 }, { - "epoch": 1.63, - "learning_rate": 5.613109262351735e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.000174702227429552, + "loss": 0.0132, "step": 322250 }, { - "epoch": 1.63, - "learning_rate": 5.6123524930503346e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017469833921318053, + "loss": 0.0149, "step": 322260 }, { - "epoch": 1.63, - "learning_rate": 5.6115957237489334e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017469445099680905, + "loss": 0.0144, "step": 322270 }, { - "epoch": 1.63, - "learning_rate": 5.610838954447532e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.0001746905627804376, + "loss": 0.0158, "step": 322280 }, { - "epoch": 1.63, - "learning_rate": 5.610082185146131e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017468667456406613, + "loss": 0.0147, "step": 322290 }, { - "epoch": 1.63, - "learning_rate": 5.6093254158447306e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017468278634769467, + "loss": 0.0138, "step": 322300 }, { - "epoch": 1.63, - "learning_rate": 5.6085686465433294e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001746788981313232, + "loss": 0.0159, "step": 322310 }, { - "epoch": 1.63, - "learning_rate": 5.607811877241928e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017467500991495173, + "loss": 0.0129, "step": 322320 }, { - "epoch": 1.63, - "learning_rate": 5.607055107940527e-05, - "loss": 0.0098, + "epoch": 0.84, + "learning_rate": 0.00017467112169858024, + "loss": 0.015, "step": 322330 }, { - "epoch": 1.63, - "learning_rate": 5.6062983386391265e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001746672334822088, + "loss": 0.0162, "step": 322340 }, { - "epoch": 1.63, - "learning_rate": 5.6055415693377254e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017466334526583733, + "loss": 0.0154, "step": 322350 }, { - "epoch": 1.63, - "learning_rate": 5.604784800036324e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017465945704946587, + "loss": 0.0136, "step": 322360 }, { - "epoch": 1.63, - "learning_rate": 5.604028030734923e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017465556883309438, + "loss": 0.0136, "step": 322370 }, { - "epoch": 1.63, - "learning_rate": 5.6032712614335225e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017465168061672295, + "loss": 0.012, "step": 322380 }, { - "epoch": 1.63, - "learning_rate": 5.602514492132121e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001746477924003515, + "loss": 0.0147, "step": 322390 }, { - "epoch": 1.63, - "learning_rate": 5.60175772283072e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.00017464390418398, + "loss": 0.0113, "step": 322400 }, { - "epoch": 1.63, - "learning_rate": 5.6010009535293197e-05, - "loss": 0.0087, + "epoch": 0.84, + "learning_rate": 0.00017464001596760855, + "loss": 0.0125, "step": 322410 }, { - "epoch": 1.63, - "learning_rate": 5.6002441842279185e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001746361277512371, + "loss": 0.0144, "step": 322420 }, { - "epoch": 1.63, - "learning_rate": 5.599487414926517e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017463223953486563, + "loss": 0.0132, "step": 322430 }, { - "epoch": 1.63, - "learning_rate": 5.598730645625116e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017462835131849415, + "loss": 0.011, "step": 322440 }, { - "epoch": 1.63, - "learning_rate": 5.5979738763237156e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001746244631021227, + "loss": 0.0139, "step": 322450 }, { - "epoch": 1.63, - "learning_rate": 5.5972171070223144e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017462057488575123, + "loss": 0.016, "step": 322460 }, { - "epoch": 1.63, - "learning_rate": 5.596460337720913e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017461668666937977, + "loss": 0.0107, "step": 322470 }, { - "epoch": 1.63, - "learning_rate": 5.595703568419512e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.0001746127984530083, + "loss": 0.0147, "step": 322480 }, { - "epoch": 1.63, - "learning_rate": 5.5949467991181116e-05, - "loss": 0.0089, + "epoch": 0.84, + "learning_rate": 0.00017460891023663683, + "loss": 0.0152, "step": 322490 }, { - "epoch": 1.63, - "learning_rate": 5.5941900298167104e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.00017460502202026537, + "loss": 0.0144, "step": 322500 }, { - "epoch": 1.63, - "learning_rate": 5.593433260515309e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001746011338038939, + "loss": 0.0164, "step": 322510 }, { - "epoch": 1.63, - "learning_rate": 5.592676491213908e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017459724558752243, + "loss": 0.0129, "step": 322520 }, { - "epoch": 1.63, - "learning_rate": 5.5919197219125075e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017459335737115097, + "loss": 0.0168, "step": 322530 }, { - "epoch": 1.63, - "learning_rate": 5.5911629526111064e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017458946915477948, + "loss": 0.0122, "step": 322540 }, { - "epoch": 1.63, - "learning_rate": 5.5904061833097045e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017458558093840805, + "loss": 0.0138, "step": 322550 }, { - "epoch": 1.63, - "learning_rate": 5.589649414008303e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001745816927220366, + "loss": 0.0201, "step": 322560 }, { - "epoch": 1.63, - "learning_rate": 5.588892644706902e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001745778045056651, + "loss": 0.0128, "step": 322570 }, { - "epoch": 1.63, - "learning_rate": 5.5881358754055017e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017457391628929362, + "loss": 0.0134, "step": 322580 }, { - "epoch": 1.63, - "learning_rate": 5.5873791061041005e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.0001745700280729222, + "loss": 0.0211, "step": 322590 }, { - "epoch": 1.63, - "learning_rate": 5.586622336802699e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017456613985655073, + "loss": 0.0128, "step": 322600 }, { - "epoch": 1.63, - "learning_rate": 5.585865567501298e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017456225164017925, + "loss": 0.0128, "step": 322610 }, { - "epoch": 1.63, - "learning_rate": 5.5851087981998976e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001745583634238078, + "loss": 0.013, "step": 322620 }, { - "epoch": 1.63, - "learning_rate": 5.5843520288984964e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017455447520743633, + "loss": 0.0135, "step": 322630 }, { - "epoch": 1.63, - "learning_rate": 5.583595259597095e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017455058699106487, + "loss": 0.0131, "step": 322640 }, { - "epoch": 1.63, - "learning_rate": 5.582838490295694e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.0001745466987746934, + "loss": 0.0127, "step": 322650 }, { - "epoch": 1.63, - "learning_rate": 5.5820817209942936e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017454281055832193, + "loss": 0.014, "step": 322660 }, { - "epoch": 1.63, - "learning_rate": 5.5813249516928924e-05, - "loss": 0.0087, + "epoch": 0.84, + "learning_rate": 0.00017453892234195047, + "loss": 0.0122, "step": 322670 }, { - "epoch": 1.63, - "learning_rate": 5.580568182391491e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.000174535034125579, + "loss": 0.0131, "step": 322680 }, { - "epoch": 1.63, - "learning_rate": 5.57981141309009e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017453114590920753, + "loss": 0.0123, "step": 322690 }, { - "epoch": 1.63, - "learning_rate": 5.5790546437886896e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017452725769283607, + "loss": 0.0127, "step": 322700 }, { - "epoch": 1.63, - "learning_rate": 5.5782978744872884e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017452336947646464, + "loss": 0.0169, "step": 322710 }, { - "epoch": 1.63, - "learning_rate": 5.577541105185887e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.00017451948126009315, + "loss": 0.0102, "step": 322720 }, { - "epoch": 1.63, - "learning_rate": 5.576784335884486e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017451559304372167, + "loss": 0.0158, "step": 322730 }, { - "epoch": 1.63, - "learning_rate": 5.5760275665830855e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.0001745117048273502, + "loss": 0.0125, "step": 322740 }, { - "epoch": 1.63, - "learning_rate": 5.5752707972816843e-05, - "loss": 0.0042, + "epoch": 0.84, + "learning_rate": 0.00017450781661097878, + "loss": 0.0141, "step": 322750 }, { - "epoch": 1.63, - "learning_rate": 5.574514027980283e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.0001745039283946073, + "loss": 0.0144, "step": 322760 }, { - "epoch": 1.63, - "learning_rate": 5.573757258678882e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017450004017823583, + "loss": 0.0123, "step": 322770 }, { - "epoch": 1.63, - "learning_rate": 5.5730004893774815e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017449615196186435, + "loss": 0.0148, "step": 322780 }, { - "epoch": 1.63, - "learning_rate": 5.57224372007608e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.0001744922637454929, + "loss": 0.0154, "step": 322790 }, { - "epoch": 1.63, - "learning_rate": 5.571486950774679e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017448837552912143, + "loss": 0.02, "step": 322800 }, { - "epoch": 1.63, - "learning_rate": 5.570730181473278e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017448448731274997, + "loss": 0.0128, "step": 322810 }, { - "epoch": 1.63, - "learning_rate": 5.5699734121718774e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.0001744805990963785, + "loss": 0.0153, "step": 322820 }, { - "epoch": 1.63, - "learning_rate": 5.569216642870476e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017447671088000703, + "loss": 0.0132, "step": 322830 }, { - "epoch": 1.63, - "learning_rate": 5.568459873569075e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017447282266363557, + "loss": 0.0171, "step": 322840 }, { - "epoch": 1.63, - "learning_rate": 5.567703104267674e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001744689344472641, + "loss": 0.0138, "step": 322850 }, { - "epoch": 1.63, - "learning_rate": 5.5669463349662734e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017446504623089263, + "loss": 0.0185, "step": 322860 }, { - "epoch": 1.63, - "learning_rate": 5.5661895656648716e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017446115801452117, + "loss": 0.0149, "step": 322870 }, { - "epoch": 1.63, - "learning_rate": 5.5654327963634704e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017445726979814974, + "loss": 0.0169, "step": 322880 }, { - "epoch": 1.63, - "learning_rate": 5.564676027062069e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017445338158177825, + "loss": 0.0187, "step": 322890 }, { - "epoch": 1.63, - "learning_rate": 5.563919257760669e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017444949336540677, + "loss": 0.0146, "step": 322900 }, { - "epoch": 1.63, - "learning_rate": 5.5631624884592675e-05, - "loss": 0.0087, + "epoch": 0.84, + "learning_rate": 0.0001744456051490353, + "loss": 0.0148, "step": 322910 }, { - "epoch": 1.63, - "learning_rate": 5.5624057191578663e-05, - "loss": 0.0095, + "epoch": 0.84, + "learning_rate": 0.00017444171693266388, + "loss": 0.0144, "step": 322920 }, { - "epoch": 1.63, - "learning_rate": 5.561648949856465e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.0001744378287162924, + "loss": 0.0133, "step": 322930 }, { - "epoch": 1.63, - "learning_rate": 5.560892180555065e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017443394049992093, + "loss": 0.0114, "step": 322940 }, { - "epoch": 1.63, - "learning_rate": 5.5601354112536635e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017443005228354945, + "loss": 0.0131, "step": 322950 }, { - "epoch": 1.63, - "learning_rate": 5.559378641952262e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017442616406717802, + "loss": 0.0155, "step": 322960 }, { - "epoch": 1.63, - "learning_rate": 5.558621872650861e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017442227585080653, + "loss": 0.0125, "step": 322970 }, { - "epoch": 1.63, - "learning_rate": 5.5578651033494606e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.00017441838763443507, + "loss": 0.0104, "step": 322980 }, { - "epoch": 1.63, - "learning_rate": 5.5571083340480595e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017441449941806359, + "loss": 0.0131, "step": 322990 }, { - "epoch": 1.63, - "learning_rate": 5.556351564746658e-05, - "loss": 0.0101, + "epoch": 0.84, + "learning_rate": 0.00017441061120169216, + "loss": 0.0112, "step": 323000 }, { - "epoch": 1.63, - "eval_cer": 0.9144265880775191, - "eval_loss": 0.004934444557875395, - "eval_runtime": 116.3298, - "eval_samples_per_second": 17.192, - "eval_steps_per_second": 4.298, + "epoch": 0.84, + "eval_cer": 0.881688689953826, + "eval_loss": 0.009281335398554802, + "eval_runtime": 107.738, + "eval_samples_per_second": 18.564, + "eval_steps_per_second": 4.641, "step": 323000 }, { - "epoch": 1.63, - "learning_rate": 5.555594795445257e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017440672298532067, + "loss": 0.0108, "step": 323010 }, { - "epoch": 1.63, - "learning_rate": 5.5548380261438566e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001744028347689492, + "loss": 0.0152, "step": 323020 }, { - "epoch": 1.63, - "learning_rate": 5.5540812568424554e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017439894655257773, + "loss": 0.0139, "step": 323030 }, { - "epoch": 1.63, - "learning_rate": 5.553324487541054e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017439505833620627, + "loss": 0.0107, "step": 323040 }, { - "epoch": 1.63, - "learning_rate": 5.552567718239653e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001743911701198348, + "loss": 0.013, "step": 323050 }, { - "epoch": 1.63, - "learning_rate": 5.5518109489382526e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017438728190346335, + "loss": 0.0131, "step": 323060 }, { - "epoch": 1.63, - "learning_rate": 5.5510541796368514e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017438339368709187, + "loss": 0.0175, "step": 323070 }, { - "epoch": 1.63, - "learning_rate": 5.55029741033545e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.0001743795054707204, + "loss": 0.0148, "step": 323080 }, { - "epoch": 1.63, - "learning_rate": 5.549540641034049e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017437561725434898, + "loss": 0.0148, "step": 323090 }, { - "epoch": 1.63, - "learning_rate": 5.5487838717326485e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001743717290379775, + "loss": 0.0161, "step": 323100 }, { - "epoch": 1.63, - "learning_rate": 5.5480271024312473e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017436784082160603, + "loss": 0.0117, "step": 323110 }, { - "epoch": 1.63, - "learning_rate": 5.547270333129846e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017436395260523455, + "loss": 0.0179, "step": 323120 }, { - "epoch": 1.63, - "learning_rate": 5.546513563828445e-05, - "loss": 0.0091, + "epoch": 0.84, + "learning_rate": 0.00017436006438886312, + "loss": 0.0121, "step": 323130 }, { - "epoch": 1.63, - "learning_rate": 5.5457567945270445e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017435617617249163, + "loss": 0.0142, "step": 323140 }, { - "epoch": 1.63, - "learning_rate": 5.545000025225643e-05, - "loss": 0.0047, + "epoch": 0.84, + "learning_rate": 0.00017435228795612017, + "loss": 0.0124, "step": 323150 }, { - "epoch": 1.63, - "learning_rate": 5.544243255924242e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017434839973974869, + "loss": 0.017, "step": 323160 }, { - "epoch": 1.63, - "learning_rate": 5.543486486622841e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017434451152337725, + "loss": 0.0124, "step": 323170 }, { - "epoch": 1.63, - "learning_rate": 5.542729717321439e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017434062330700577, + "loss": 0.0122, "step": 323180 }, { - "epoch": 1.63, - "learning_rate": 5.5419729480200386e-05, - "loss": 0.0108, + "epoch": 0.84, + "learning_rate": 0.0001743367350906343, + "loss": 0.0147, "step": 323190 }, { - "epoch": 1.63, - "learning_rate": 5.5412161787186374e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017433284687426283, + "loss": 0.0142, "step": 323200 }, { - "epoch": 1.63, - "learning_rate": 5.540459409417236e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001743289586578914, + "loss": 0.0125, "step": 323210 }, { - "epoch": 1.63, - "learning_rate": 5.539702640115835e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.0001743250704415199, + "loss": 0.0248, "step": 323220 }, { - "epoch": 1.63, - "learning_rate": 5.5389458708144346e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017432118222514845, + "loss": 0.0136, "step": 323230 }, { - "epoch": 1.63, - "learning_rate": 5.5381891015130334e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017431729400877696, + "loss": 0.0155, "step": 323240 }, { - "epoch": 1.63, - "learning_rate": 5.537432332211632e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017431340579240553, + "loss": 0.0127, "step": 323250 }, { - "epoch": 1.63, - "learning_rate": 5.536675562910231e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017430951757603408, + "loss": 0.0136, "step": 323260 }, { - "epoch": 1.63, - "learning_rate": 5.5359187936088305e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001743056293596626, + "loss": 0.0149, "step": 323270 }, { - "epoch": 1.63, - "learning_rate": 5.5351620243074294e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017430174114329113, + "loss": 0.0153, "step": 323280 }, { - "epoch": 1.63, - "learning_rate": 5.534405255006028e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017429785292691965, + "loss": 0.0137, "step": 323290 }, { - "epoch": 1.63, - "learning_rate": 5.533648485704627e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017429396471054821, + "loss": 0.0155, "step": 323300 }, { - "epoch": 1.63, - "learning_rate": 5.5328917164032265e-05, - "loss": 0.0044, + "epoch": 0.84, + "learning_rate": 0.00017429007649417673, + "loss": 0.0127, "step": 323310 }, { - "epoch": 1.63, - "learning_rate": 5.532134947101825e-05, - "loss": 0.0085, + "epoch": 0.84, + "learning_rate": 0.00017428618827780527, + "loss": 0.0141, "step": 323320 }, { - "epoch": 1.63, - "learning_rate": 5.531378177800424e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017428230006143379, + "loss": 0.0111, "step": 323330 }, { - "epoch": 1.63, - "learning_rate": 5.530621408499023e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017427841184506235, + "loss": 0.0144, "step": 323340 }, { - "epoch": 1.63, - "learning_rate": 5.5298646391976225e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017427452362869087, + "loss": 0.011, "step": 323350 }, { - "epoch": 1.63, - "learning_rate": 5.529107869896221e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001742706354123194, + "loss": 0.0191, "step": 323360 }, { - "epoch": 1.63, - "learning_rate": 5.52835110059482e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017426674719594792, + "loss": 0.0117, "step": 323370 }, { - "epoch": 1.63, - "learning_rate": 5.5275943312934196e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001742628589795765, + "loss": 0.0133, "step": 323380 }, { - "epoch": 1.63, - "learning_rate": 5.5268375619920184e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.000174258970763205, + "loss": 0.0136, "step": 323390 }, { - "epoch": 1.63, - "learning_rate": 5.526080792690617e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017425508254683355, + "loss": 0.0099, "step": 323400 }, { - "epoch": 1.63, - "learning_rate": 5.525324023389216e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017425119433046206, + "loss": 0.0153, "step": 323410 }, { - "epoch": 1.63, - "learning_rate": 5.5245672540878156e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017424730611409063, + "loss": 0.0151, "step": 323420 }, { - "epoch": 1.63, - "learning_rate": 5.5238104847864144e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017424341789771917, + "loss": 0.0109, "step": 323430 }, { - "epoch": 1.63, - "learning_rate": 5.523053715485013e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001742395296813477, + "loss": 0.0155, "step": 323440 }, { - "epoch": 1.63, - "learning_rate": 5.522296946183612e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.0001742356414649762, + "loss": 0.0162, "step": 323450 }, { - "epoch": 1.63, - "learning_rate": 5.5215401768822115e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.00017423175324860477, + "loss": 0.0121, "step": 323460 }, { - "epoch": 1.63, - "learning_rate": 5.5207834075808104e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.00017422786503223331, + "loss": 0.017, "step": 323470 }, { - "epoch": 1.63, - "learning_rate": 5.520026638279409e-05, - "loss": 0.0045, + "epoch": 0.84, + "learning_rate": 0.00017422397681586183, + "loss": 0.0114, "step": 323480 }, { - "epoch": 1.63, - "learning_rate": 5.519269868978008e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017422008859949037, + "loss": 0.012, "step": 323490 }, { - "epoch": 1.63, - "learning_rate": 5.518513099676606e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.0001742162003831189, + "loss": 0.0138, "step": 323500 }, { - "epoch": 1.63, - "learning_rate": 5.5177563303752056e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017421231216674745, + "loss": 0.0147, "step": 323510 }, { - "epoch": 1.63, - "learning_rate": 5.5169995610738045e-05, - "loss": 0.0095, + "epoch": 0.84, + "learning_rate": 0.00017420842395037597, + "loss": 0.0158, "step": 323520 }, { - "epoch": 1.63, - "learning_rate": 5.516242791772403e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001742045357340045, + "loss": 0.012, "step": 323530 }, { - "epoch": 1.63, - "learning_rate": 5.515486022471002e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017420064751763302, + "loss": 0.0135, "step": 323540 }, { - "epoch": 1.63, - "learning_rate": 5.5147292531696016e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.0001741967593012616, + "loss": 0.0135, "step": 323550 }, { - "epoch": 1.63, - "learning_rate": 5.5139724838682004e-05, - "loss": 0.0095, + "epoch": 0.84, + "learning_rate": 0.0001741928710848901, + "loss": 0.0149, "step": 323560 }, { - "epoch": 1.63, - "learning_rate": 5.513215714566799e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017418898286851865, + "loss": 0.0098, "step": 323570 }, { - "epoch": 1.63, - "learning_rate": 5.512458945265398e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.00017418509465214716, + "loss": 0.0197, "step": 323580 }, { - "epoch": 1.63, - "learning_rate": 5.5117021759639976e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017418120643577573, + "loss": 0.0168, "step": 323590 }, { - "epoch": 1.63, - "learning_rate": 5.5109454066625964e-05, - "loss": 0.0049, + "epoch": 0.84, + "learning_rate": 0.00017417731821940427, + "loss": 0.0136, "step": 323600 }, { - "epoch": 1.63, - "learning_rate": 5.510188637361195e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001741734300030328, + "loss": 0.016, "step": 323610 }, { - "epoch": 1.63, - "learning_rate": 5.509431868059794e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001741695417866613, + "loss": 0.0125, "step": 323620 }, { - "epoch": 1.63, - "learning_rate": 5.5086750987583935e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.00017416565357028987, + "loss": 0.0137, "step": 323630 }, { - "epoch": 1.63, - "learning_rate": 5.5079183294569924e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.0001741617653539184, + "loss": 0.0139, "step": 323640 }, { - "epoch": 1.63, - "learning_rate": 5.507161560155591e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017415787713754693, + "loss": 0.0121, "step": 323650 }, { - "epoch": 1.63, - "learning_rate": 5.50640479085419e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017415398892117547, + "loss": 0.0143, "step": 323660 }, { - "epoch": 1.63, - "learning_rate": 5.5056480215527895e-05, - "loss": 0.0085, + "epoch": 0.84, + "learning_rate": 0.000174150100704804, + "loss": 0.0117, "step": 323670 }, { - "epoch": 1.63, - "learning_rate": 5.504891252251388e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017414621248843255, + "loss": 0.0148, "step": 323680 }, { - "epoch": 1.63, - "learning_rate": 5.504134482949987e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017414232427206107, + "loss": 0.0107, "step": 323690 }, { - "epoch": 1.63, - "learning_rate": 5.503377713648586e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001741384360556896, + "loss": 0.0157, "step": 323700 }, { - "epoch": 1.63, - "learning_rate": 5.5026209443471855e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017413454783931815, + "loss": 0.014, "step": 323710 }, { - "epoch": 1.63, - "learning_rate": 5.501864175045784e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001741306596229467, + "loss": 0.0163, "step": 323720 }, { - "epoch": 1.63, - "learning_rate": 5.501107405744383e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.0001741267714065752, + "loss": 0.0177, "step": 323730 }, { - "epoch": 1.63, - "learning_rate": 5.500350636442982e-05, - "loss": 0.0036, + "epoch": 0.84, + "learning_rate": 0.00017412288319020375, + "loss": 0.0145, "step": 323740 }, { - "epoch": 1.63, - "learning_rate": 5.4995938671415814e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017411899497383232, + "loss": 0.0175, "step": 323750 }, { - "epoch": 1.63, - "learning_rate": 5.49883709784018e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017411510675746083, + "loss": 0.0151, "step": 323760 }, { - "epoch": 1.63, - "learning_rate": 5.498080328538779e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017411121854108935, + "loss": 0.012, "step": 323770 }, { - "epoch": 1.63, - "learning_rate": 5.497323559237378e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001741073303247179, + "loss": 0.0118, "step": 323780 }, { - "epoch": 1.63, - "learning_rate": 5.4965667899359774e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.0001741034421083464, + "loss": 0.0178, "step": 323790 }, { - "epoch": 1.63, - "learning_rate": 5.495810020634576e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017409955389197497, + "loss": 0.0127, "step": 323800 }, { - "epoch": 1.63, - "learning_rate": 5.4950532513331744e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.0001740956656756035, + "loss": 0.0134, "step": 323810 }, { - "epoch": 1.63, - "learning_rate": 5.494296482031773e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.00017409177745923203, + "loss": 0.0158, "step": 323820 }, { - "epoch": 1.63, - "learning_rate": 5.493539712730373e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017408788924286057, + "loss": 0.0136, "step": 323830 }, { - "epoch": 1.63, - "learning_rate": 5.4927829434289715e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001740840010264891, + "loss": 0.0125, "step": 323840 }, { - "epoch": 1.63, - "learning_rate": 5.49202617412757e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017408011281011765, + "loss": 0.0152, "step": 323850 }, { - "epoch": 1.63, - "learning_rate": 5.491269404826169e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.00017407622459374617, + "loss": 0.017, "step": 323860 }, { - "epoch": 1.63, - "learning_rate": 5.4905126355247687e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.0001740723363773747, + "loss": 0.0127, "step": 323870 }, { - "epoch": 1.63, - "learning_rate": 5.4897558662233675e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017406844816100325, + "loss": 0.0123, "step": 323880 }, { - "epoch": 1.63, - "learning_rate": 5.488999096921966e-05, - "loss": 0.0103, + "epoch": 0.84, + "learning_rate": 0.0001740645599446318, + "loss": 0.013, "step": 323890 }, { - "epoch": 1.63, - "learning_rate": 5.488242327620565e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001740606717282603, + "loss": 0.0126, "step": 323900 }, { - "epoch": 1.63, - "learning_rate": 5.4874855583191646e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017405678351188885, + "loss": 0.0176, "step": 323910 }, { - "epoch": 1.63, - "learning_rate": 5.4867287890177634e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001740528952955174, + "loss": 0.0167, "step": 323920 }, { - "epoch": 1.63, - "learning_rate": 5.485972019716362e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.00017404900707914593, + "loss": 0.0138, "step": 323930 }, { - "epoch": 1.63, - "learning_rate": 5.485215250414961e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017404511886277445, + "loss": 0.0145, "step": 323940 }, { - "epoch": 1.63, - "learning_rate": 5.4844584811135606e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.000174041230646403, + "loss": 0.012, "step": 323950 }, { - "epoch": 1.63, - "learning_rate": 5.4837017118121594e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017403734243003156, + "loss": 0.012, "step": 323960 }, { - "epoch": 1.63, - "learning_rate": 5.482944942510758e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017403345421366007, + "loss": 0.0143, "step": 323970 }, { - "epoch": 1.63, - "learning_rate": 5.482188173209357e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.0001740295659972886, + "loss": 0.0126, "step": 323980 }, { - "epoch": 1.63, - "learning_rate": 5.4814314039079565e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.00017402567778091713, + "loss": 0.0123, "step": 323990 }, { - "epoch": 1.63, - "learning_rate": 5.4806746346065554e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.0001740217895645457, + "loss": 0.0106, "step": 324000 }, { - "epoch": 1.63, - "eval_cer": 0.9144275584736445, - "eval_loss": 0.0047448608092963696, - "eval_runtime": 116.3969, - "eval_samples_per_second": 17.183, - "eval_steps_per_second": 4.296, + "epoch": 0.84, + "eval_cer": 0.8816970877754311, + "eval_loss": 0.009332822635769844, + "eval_runtime": 107.8709, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, "step": 324000 }, { - "epoch": 1.63, - "learning_rate": 5.479917865305154e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.0001740179013481742, + "loss": 0.0139, "step": 324010 }, { - "epoch": 1.63, - "learning_rate": 5.479161096003753e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017401401313180275, + "loss": 0.0142, "step": 324020 }, { - "epoch": 1.63, - "learning_rate": 5.4784043267023525e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017401012491543127, + "loss": 0.0136, "step": 324030 }, { - "epoch": 1.63, - "learning_rate": 5.477647557400951e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.0001740062366990598, + "loss": 0.0186, "step": 324040 }, { - "epoch": 1.63, - "learning_rate": 5.47689078809955e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017400234848268835, + "loss": 0.016, "step": 324050 }, { - "epoch": 1.63, - "learning_rate": 5.476134018798149e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001739984602663169, + "loss": 0.0139, "step": 324060 }, { - "epoch": 1.63, - "learning_rate": 5.4753772494967485e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.0001739945720499454, + "loss": 0.0123, "step": 324070 }, { - "epoch": 1.64, - "learning_rate": 5.474620480195347e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017399068383357395, + "loss": 0.0155, "step": 324080 }, { - "epoch": 1.64, - "learning_rate": 5.473863710893946e-05, - "loss": 0.0093, + "epoch": 0.84, + "learning_rate": 0.0001739867956172025, + "loss": 0.0169, "step": 324090 }, { - "epoch": 1.64, - "learning_rate": 5.473106941592545e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017398290740083103, + "loss": 0.0153, "step": 324100 }, { - "epoch": 1.64, - "learning_rate": 5.4723501722911444e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017397901918445955, + "loss": 0.0137, "step": 324110 }, { - "epoch": 1.64, - "learning_rate": 5.4715934029897426e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.0001739751309680881, + "loss": 0.0138, "step": 324120 }, { - "epoch": 1.64, - "learning_rate": 5.4708366336883414e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017397124275171666, + "loss": 0.0137, "step": 324130 }, { - "epoch": 1.64, - "learning_rate": 5.47007986438694e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017396735453534517, + "loss": 0.0138, "step": 324140 }, { - "epoch": 1.64, - "learning_rate": 5.469323095085539e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001739634663189737, + "loss": 0.024, "step": 324150 }, { - "epoch": 1.64, - "learning_rate": 5.4685663257841386e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017395957810260223, + "loss": 0.0175, "step": 324160 }, { - "epoch": 1.64, - "learning_rate": 5.4678095564827374e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.0001739556898862308, + "loss": 0.0154, "step": 324170 }, { - "epoch": 1.64, - "learning_rate": 5.467052787181336e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.0001739518016698593, + "loss": 0.015, "step": 324180 }, { - "epoch": 1.64, - "learning_rate": 5.466296017879935e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017394791345348785, + "loss": 0.0152, "step": 324190 }, { - "epoch": 1.64, - "learning_rate": 5.4655392485785345e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017394402523711637, + "loss": 0.0136, "step": 324200 }, { - "epoch": 1.64, - "learning_rate": 5.4647824792771333e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017394013702074493, + "loss": 0.0199, "step": 324210 }, { - "epoch": 1.64, - "learning_rate": 5.464025709975732e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017393624880437345, + "loss": 0.0115, "step": 324220 }, { - "epoch": 1.64, - "learning_rate": 5.463268940674331e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.000173932360588002, + "loss": 0.0119, "step": 324230 }, { - "epoch": 1.64, - "learning_rate": 5.4625121713729305e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.0001739284723716305, + "loss": 0.0162, "step": 324240 }, { - "epoch": 1.64, - "learning_rate": 5.461755402071529e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017392458415525907, + "loss": 0.0118, "step": 324250 }, { - "epoch": 1.64, - "learning_rate": 5.460998632770128e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.0001739206959388876, + "loss": 0.0137, "step": 324260 }, { - "epoch": 1.64, - "learning_rate": 5.460241863468727e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017391680772251613, + "loss": 0.0122, "step": 324270 }, { - "epoch": 1.64, - "learning_rate": 5.4594850941673264e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017391291950614464, + "loss": 0.0193, "step": 324280 }, { - "epoch": 1.64, - "learning_rate": 5.458728324865925e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017390903128977319, + "loss": 0.0135, "step": 324290 }, { - "epoch": 1.64, - "learning_rate": 5.457971555564524e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017390514307340175, + "loss": 0.015, "step": 324300 }, { - "epoch": 1.64, - "learning_rate": 5.457214786263123e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017390125485703027, + "loss": 0.0144, "step": 324310 }, { - "epoch": 1.64, - "learning_rate": 5.4564580169617224e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017389736664065878, + "loss": 0.016, "step": 324320 }, { - "epoch": 1.64, - "learning_rate": 5.455701247660321e-05, - "loss": 0.0051, + "epoch": 0.84, + "learning_rate": 0.00017389347842428733, + "loss": 0.0142, "step": 324330 }, { - "epoch": 1.64, - "learning_rate": 5.45494447835892e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001738895902079159, + "loss": 0.0149, "step": 324340 }, { - "epoch": 1.64, - "learning_rate": 5.4541877090575196e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001738857019915444, + "loss": 0.0142, "step": 324350 }, { - "epoch": 1.64, - "learning_rate": 5.4534309397561184e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017388181377517295, + "loss": 0.0169, "step": 324360 }, { - "epoch": 1.64, - "learning_rate": 5.452674170454717e-05, - "loss": 0.0089, + "epoch": 0.84, + "learning_rate": 0.00017387792555880146, + "loss": 0.0154, "step": 324370 }, { - "epoch": 1.64, - "learning_rate": 5.451917401153316e-05, - "loss": 0.0091, + "epoch": 0.84, + "learning_rate": 0.00017387403734243003, + "loss": 0.0159, "step": 324380 }, { - "epoch": 1.64, - "learning_rate": 5.4511606318519155e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017387014912605855, + "loss": 0.012, "step": 324390 }, { - "epoch": 1.64, - "learning_rate": 5.4504038625505143e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001738662609096871, + "loss": 0.0116, "step": 324400 }, { - "epoch": 1.64, - "learning_rate": 5.449647093249113e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001738623726933156, + "loss": 0.0121, "step": 324410 }, { - "epoch": 1.64, - "learning_rate": 5.448890323947712e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017385848447694417, + "loss": 0.0126, "step": 324420 }, { - "epoch": 1.64, - "learning_rate": 5.4481335546463115e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.0001738545962605727, + "loss": 0.0138, "step": 324430 }, { - "epoch": 1.64, - "learning_rate": 5.4473767853449096e-05, - "loss": 0.0085, + "epoch": 0.84, + "learning_rate": 0.00017385070804420123, + "loss": 0.0112, "step": 324440 }, { - "epoch": 1.64, - "learning_rate": 5.4466200160435085e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017384681982782974, + "loss": 0.0159, "step": 324450 }, { - "epoch": 1.64, - "learning_rate": 5.445863246742107e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001738429316114583, + "loss": 0.0106, "step": 324460 }, { - "epoch": 1.64, - "learning_rate": 5.445106477440706e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017383904339508685, + "loss": 0.0132, "step": 324470 }, { - "epoch": 1.64, - "learning_rate": 5.4443497081393056e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017383515517871537, + "loss": 0.0139, "step": 324480 }, { - "epoch": 1.64, - "learning_rate": 5.4435929388379044e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017383126696234388, + "loss": 0.0132, "step": 324490 }, { - "epoch": 1.64, - "learning_rate": 5.442836169536503e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017382737874597245, + "loss": 0.0147, "step": 324500 }, { - "epoch": 1.64, - "learning_rate": 5.442079400235102e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.000173823490529601, + "loss": 0.0164, "step": 324510 }, { - "epoch": 1.64, - "learning_rate": 5.4413226309337016e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001738196023132295, + "loss": 0.0212, "step": 324520 }, { - "epoch": 1.64, - "learning_rate": 5.4405658616323004e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017381571409685805, + "loss": 0.012, "step": 324530 }, { - "epoch": 1.64, - "learning_rate": 5.439809092330899e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017381182588048656, + "loss": 0.012, "step": 324540 }, { - "epoch": 1.64, - "learning_rate": 5.439052323029498e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017380793766411513, + "loss": 0.0154, "step": 324550 }, { - "epoch": 1.64, - "learning_rate": 5.4382955537280975e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017380404944774365, + "loss": 0.0155, "step": 324560 }, { - "epoch": 1.64, - "learning_rate": 5.4375387844266963e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.0001738001612313722, + "loss": 0.014, "step": 324570 }, { - "epoch": 1.64, - "learning_rate": 5.436782015125295e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.0001737962730150007, + "loss": 0.0163, "step": 324580 }, { - "epoch": 1.64, - "learning_rate": 5.436025245823894e-05, - "loss": 0.0095, + "epoch": 0.84, + "learning_rate": 0.00017379238479862927, + "loss": 0.0153, "step": 324590 }, { - "epoch": 1.64, - "learning_rate": 5.4352684765224935e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001737884965822578, + "loss": 0.0173, "step": 324600 }, { - "epoch": 1.64, - "learning_rate": 5.434511707221092e-05, - "loss": 0.0049, + "epoch": 0.84, + "learning_rate": 0.00017378460836588633, + "loss": 0.0149, "step": 324610 }, { - "epoch": 1.64, - "learning_rate": 5.433754937919691e-05, - "loss": 0.01, + "epoch": 0.84, + "learning_rate": 0.00017378072014951484, + "loss": 0.0135, "step": 324620 }, { - "epoch": 1.64, - "learning_rate": 5.43299816861829e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.0001737768319331434, + "loss": 0.0151, "step": 324630 }, { - "epoch": 1.64, - "learning_rate": 5.4322413993168895e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017377294371677193, + "loss": 0.0136, "step": 324640 }, { - "epoch": 1.64, - "learning_rate": 5.431484630015488e-05, - "loss": 0.0045, + "epoch": 0.84, + "learning_rate": 0.00017376905550040047, + "loss": 0.0132, "step": 324650 }, { - "epoch": 1.64, - "learning_rate": 5.430727860714087e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017376516728402898, + "loss": 0.0134, "step": 324660 }, { - "epoch": 1.64, - "learning_rate": 5.429971091412686e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017376127906765755, + "loss": 0.0158, "step": 324670 }, { - "epoch": 1.64, - "learning_rate": 5.4292143221112854e-05, - "loss": 0.0091, + "epoch": 0.84, + "learning_rate": 0.0001737573908512861, + "loss": 0.0165, "step": 324680 }, { - "epoch": 1.64, - "learning_rate": 5.428457552809884e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001737535026349146, + "loss": 0.0124, "step": 324690 }, { - "epoch": 1.64, - "learning_rate": 5.427700783508483e-05, - "loss": 0.0126, + "epoch": 0.84, + "learning_rate": 0.00017374961441854315, + "loss": 0.0153, "step": 324700 }, { - "epoch": 1.64, - "learning_rate": 5.426944014207082e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.0001737457262021717, + "loss": 0.0127, "step": 324710 }, { - "epoch": 1.64, - "learning_rate": 5.4261872449056814e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017374183798580023, + "loss": 0.0131, "step": 324720 }, { - "epoch": 1.64, - "learning_rate": 5.42543047560428e-05, - "loss": 0.0106, + "epoch": 0.84, + "learning_rate": 0.00017373794976942875, + "loss": 0.0122, "step": 324730 }, { - "epoch": 1.64, - "learning_rate": 5.424673706302879e-05, - "loss": 0.0081, + "epoch": 0.84, + "learning_rate": 0.0001737340615530573, + "loss": 0.0122, "step": 324740 }, { - "epoch": 1.64, - "learning_rate": 5.423916937001477e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017373017333668583, + "loss": 0.0119, "step": 324750 }, { - "epoch": 1.64, - "learning_rate": 5.423160167700076e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017372628512031437, + "loss": 0.0162, "step": 324760 }, { - "epoch": 1.64, - "learning_rate": 5.4224033983986755e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.0001737223969039429, + "loss": 0.0172, "step": 324770 }, { - "epoch": 1.64, - "learning_rate": 5.421646629097274e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017371850868757143, + "loss": 0.0125, "step": 324780 }, { - "epoch": 1.64, - "learning_rate": 5.420889859795873e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017371462047119994, + "loss": 0.0112, "step": 324790 }, { - "epoch": 1.64, - "learning_rate": 5.4201330904944726e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.0001737107322548285, + "loss": 0.0153, "step": 324800 }, { - "epoch": 1.64, - "learning_rate": 5.4193763211930715e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017370684403845703, + "loss": 0.0123, "step": 324810 }, { - "epoch": 1.64, - "learning_rate": 5.41861955189167e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017370295582208557, + "loss": 0.0131, "step": 324820 }, { - "epoch": 1.64, - "learning_rate": 5.417862782590269e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017369906760571408, + "loss": 0.0126, "step": 324830 }, { - "epoch": 1.64, - "learning_rate": 5.4171060132888686e-05, - "loss": 0.0082, + "epoch": 0.84, + "learning_rate": 0.00017369517938934265, + "loss": 0.0129, "step": 324840 }, { - "epoch": 1.64, - "learning_rate": 5.4163492439874674e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.0001736912911729712, + "loss": 0.0111, "step": 324850 }, { - "epoch": 1.64, - "learning_rate": 5.415592474686066e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.0001736874029565997, + "loss": 0.0116, "step": 324860 }, { - "epoch": 1.64, - "learning_rate": 5.414835705384665e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017368351474022825, + "loss": 0.0139, "step": 324870 }, { - "epoch": 1.64, - "learning_rate": 5.4140789360832646e-05, - "loss": 0.0086, + "epoch": 0.84, + "learning_rate": 0.0001736796265238568, + "loss": 0.0158, "step": 324880 }, { - "epoch": 1.64, - "learning_rate": 5.4133221667818634e-05, - "loss": 0.0054, + "epoch": 0.84, + "learning_rate": 0.00017367573830748533, + "loss": 0.0141, "step": 324890 }, { - "epoch": 1.64, - "learning_rate": 5.412565397480462e-05, - "loss": 0.0055, + "epoch": 0.84, + "learning_rate": 0.00017367185009111385, + "loss": 0.0137, "step": 324900 }, { - "epoch": 1.64, - "learning_rate": 5.411808628179061e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001736679618747424, + "loss": 0.0133, "step": 324910 }, { - "epoch": 1.64, - "learning_rate": 5.4110518588776605e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017366407365837093, + "loss": 0.0132, "step": 324920 }, { - "epoch": 1.64, - "learning_rate": 5.4102950895762594e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.00017366018544199947, + "loss": 0.0145, "step": 324930 }, { - "epoch": 1.64, - "learning_rate": 5.409538320274858e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.00017365629722562799, + "loss": 0.012, "step": 324940 }, { - "epoch": 1.64, - "learning_rate": 5.408781550973457e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.00017365240900925653, + "loss": 0.0119, "step": 324950 }, { - "epoch": 1.64, - "learning_rate": 5.4080247816720565e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017364852079288507, + "loss": 0.0148, "step": 324960 }, { - "epoch": 1.64, - "learning_rate": 5.407268012370655e-05, - "loss": 0.008, + "epoch": 0.84, + "learning_rate": 0.0001736446325765136, + "loss": 0.0167, "step": 324970 }, { - "epoch": 1.64, - "learning_rate": 5.406511243069254e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017364074436014213, + "loss": 0.0147, "step": 324980 }, { - "epoch": 1.64, - "learning_rate": 5.405754473767853e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017363685614377067, + "loss": 0.0174, "step": 324990 }, { - "epoch": 1.64, - "learning_rate": 5.4049977044664525e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017363296792739924, + "loss": 0.011, "step": 325000 }, { - "epoch": 1.64, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.005062679760158062, - "eval_runtime": 116.3486, - "eval_samples_per_second": 17.19, - "eval_steps_per_second": 4.297, + "epoch": 0.84, + "eval_cer": 0.8817362776095881, + "eval_loss": 0.009082542732357979, + "eval_runtime": 107.6825, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, "step": 325000 }, { - "epoch": 1.64, - "learning_rate": 5.404240935165051e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.00017362907971102775, + "loss": 0.0131, "step": 325010 }, { - "epoch": 1.64, - "learning_rate": 5.40348416586365e-05, - "loss": 0.0077, + "epoch": 0.84, + "learning_rate": 0.0001736251914946563, + "loss": 0.0125, "step": 325020 }, { - "epoch": 1.64, - "learning_rate": 5.402727396562249e-05, - "loss": 0.0079, + "epoch": 0.84, + "learning_rate": 0.0001736213032782848, + "loss": 0.0129, "step": 325030 }, { - "epoch": 1.64, - "learning_rate": 5.4019706272608484e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017361741506191332, + "loss": 0.0109, "step": 325040 }, { - "epoch": 1.64, - "learning_rate": 5.401213857959447e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.0001736135268455419, + "loss": 0.0112, "step": 325050 }, { - "epoch": 1.64, - "learning_rate": 5.400457088658046e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017360963862917043, + "loss": 0.0129, "step": 325060 }, { - "epoch": 1.64, - "learning_rate": 5.399700319356644e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017360575041279895, + "loss": 0.0146, "step": 325070 }, { - "epoch": 1.64, - "learning_rate": 5.398943550055243e-05, - "loss": 0.007, + "epoch": 0.84, + "learning_rate": 0.0001736018621964275, + "loss": 0.0128, "step": 325080 }, { - "epoch": 1.64, - "learning_rate": 5.3981867807538425e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017359797398005603, + "loss": 0.0146, "step": 325090 }, { - "epoch": 1.64, - "learning_rate": 5.3974300114524414e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017359408576368457, + "loss": 0.0161, "step": 325100 }, { - "epoch": 1.64, - "learning_rate": 5.39667324215104e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.00017359019754731309, + "loss": 0.0147, "step": 325110 }, { - "epoch": 1.64, - "learning_rate": 5.395916472849639e-05, - "loss": 0.0091, + "epoch": 0.84, + "learning_rate": 0.00017358630933094163, + "loss": 0.0126, "step": 325120 }, { - "epoch": 1.64, - "learning_rate": 5.3951597035482385e-05, - "loss": 0.0125, + "epoch": 0.84, + "learning_rate": 0.00017358242111457017, + "loss": 0.0136, "step": 325130 }, { - "epoch": 1.64, - "learning_rate": 5.394402934246837e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.0001735785328981987, + "loss": 0.0147, "step": 325140 }, { - "epoch": 1.64, - "learning_rate": 5.393646164945436e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017357464468182722, + "loss": 0.0122, "step": 325150 }, { - "epoch": 1.64, - "learning_rate": 5.392889395644035e-05, - "loss": 0.0045, + "epoch": 0.84, + "learning_rate": 0.00017357075646545577, + "loss": 0.0103, "step": 325160 }, { - "epoch": 1.64, - "learning_rate": 5.3921326263426345e-05, - "loss": 0.0059, + "epoch": 0.84, + "learning_rate": 0.00017356686824908434, + "loss": 0.0122, "step": 325170 }, { - "epoch": 1.64, - "learning_rate": 5.391375857041233e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017356298003271285, + "loss": 0.0138, "step": 325180 }, { - "epoch": 1.64, - "learning_rate": 5.390619087739832e-05, - "loss": 0.0107, + "epoch": 0.84, + "learning_rate": 0.0001735590918163414, + "loss": 0.0163, "step": 325190 }, { - "epoch": 1.64, - "learning_rate": 5.389862318438431e-05, - "loss": 0.0068, + "epoch": 0.84, + "learning_rate": 0.0001735552035999699, + "loss": 0.0128, "step": 325200 }, { - "epoch": 1.64, - "learning_rate": 5.3891055491370304e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017355131538359847, + "loss": 0.0135, "step": 325210 }, { - "epoch": 1.64, - "learning_rate": 5.388348779835629e-05, - "loss": 0.0075, + "epoch": 0.84, + "learning_rate": 0.000173547427167227, + "loss": 0.0137, "step": 325220 }, { - "epoch": 1.64, - "learning_rate": 5.387592010534228e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017354353895085553, + "loss": 0.0132, "step": 325230 }, { - "epoch": 1.64, - "learning_rate": 5.386835241232827e-05, - "loss": 0.0049, + "epoch": 0.84, + "learning_rate": 0.00017353965073448405, + "loss": 0.0106, "step": 325240 }, { - "epoch": 1.64, - "learning_rate": 5.3860784719314264e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017353576251811261, + "loss": 0.013, "step": 325250 }, { - "epoch": 1.64, - "learning_rate": 5.385321702630025e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017353187430174113, + "loss": 0.0167, "step": 325260 }, { - "epoch": 1.64, - "learning_rate": 5.384564933328624e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017352798608536967, + "loss": 0.0109, "step": 325270 }, { - "epoch": 1.64, - "learning_rate": 5.383808164027223e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017352409786899818, + "loss": 0.0143, "step": 325280 }, { - "epoch": 1.64, - "learning_rate": 5.3830513947258224e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.00017352020965262673, + "loss": 0.0113, "step": 325290 }, { - "epoch": 1.64, - "learning_rate": 5.382294625424421e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017351632143625527, + "loss": 0.0185, "step": 325300 }, { - "epoch": 1.64, - "learning_rate": 5.38153785612302e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001735124332198838, + "loss": 0.0126, "step": 325310 }, { - "epoch": 1.64, - "learning_rate": 5.3807810868216195e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017350854500351232, + "loss": 0.0144, "step": 325320 }, { - "epoch": 1.64, - "learning_rate": 5.380024317520218e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017350465678714087, + "loss": 0.0136, "step": 325330 }, { - "epoch": 1.64, - "learning_rate": 5.379267548218817e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017350076857076943, + "loss": 0.0138, "step": 325340 }, { - "epoch": 1.64, - "learning_rate": 5.378510778917416e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017349688035439795, + "loss": 0.0147, "step": 325350 }, { - "epoch": 1.64, - "learning_rate": 5.3777540096160155e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017349299213802646, + "loss": 0.0146, "step": 325360 }, { - "epoch": 1.64, - "learning_rate": 5.376997240314614e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.000173489103921655, + "loss": 0.0116, "step": 325370 }, { - "epoch": 1.64, - "learning_rate": 5.3762404710132124e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017348521570528357, + "loss": 0.015, "step": 325380 }, { - "epoch": 1.64, - "learning_rate": 5.375483701711811e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.0001734813274889121, + "loss": 0.0153, "step": 325390 }, { - "epoch": 1.64, - "learning_rate": 5.37472693241041e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017347743927254063, + "loss": 0.0116, "step": 325400 }, { - "epoch": 1.64, - "learning_rate": 5.3739701631090096e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017347355105616914, + "loss": 0.0119, "step": 325410 }, { - "epoch": 1.64, - "learning_rate": 5.3732133938076084e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.0001734696628397977, + "loss": 0.0135, "step": 325420 }, { - "epoch": 1.64, - "learning_rate": 5.372456624506207e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017346577462342623, + "loss": 0.0143, "step": 325430 }, { - "epoch": 1.64, - "learning_rate": 5.371699855204806e-05, - "loss": 0.0065, + "epoch": 0.84, + "learning_rate": 0.00017346188640705477, + "loss": 0.0158, "step": 325440 }, { - "epoch": 1.64, - "learning_rate": 5.3709430859034055e-05, - "loss": 0.0085, + "epoch": 0.84, + "learning_rate": 0.00017345799819068328, + "loss": 0.0107, "step": 325450 }, { - "epoch": 1.64, - "learning_rate": 5.3701863166020044e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.00017345410997431185, + "loss": 0.0127, "step": 325460 }, { - "epoch": 1.64, - "learning_rate": 5.369429547300603e-05, - "loss": 0.0065, - "step": 325470 + "epoch": 0.84, + "learning_rate": 0.00017345022175794037, + "loss": 0.0125, + "step": 325470 }, { - "epoch": 1.64, - "learning_rate": 5.368672777999202e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.0001734463335415689, + "loss": 0.0132, "step": 325480 }, { - "epoch": 1.64, - "learning_rate": 5.3679160086978015e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017344244532519742, + "loss": 0.0108, "step": 325490 }, { - "epoch": 1.64, - "learning_rate": 5.3671592393964e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.000173438557108826, + "loss": 0.0166, "step": 325500 }, { - "epoch": 1.64, - "learning_rate": 5.366402470094999e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001734346688924545, + "loss": 0.012, "step": 325510 }, { - "epoch": 1.64, - "learning_rate": 5.365645700793598e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017343078067608305, + "loss": 0.012, "step": 325520 }, { - "epoch": 1.64, - "learning_rate": 5.3648889314921975e-05, - "loss": 0.0062, + "epoch": 0.84, + "learning_rate": 0.00017342689245971156, + "loss": 0.0189, "step": 325530 }, { - "epoch": 1.64, - "learning_rate": 5.364132162190796e-05, - "loss": 0.0098, + "epoch": 0.84, + "learning_rate": 0.0001734230042433401, + "loss": 0.0139, "step": 325540 }, { - "epoch": 1.64, - "learning_rate": 5.363375392889395e-05, - "loss": 0.005, + "epoch": 0.84, + "learning_rate": 0.00017341911602696867, + "loss": 0.0157, "step": 325550 }, { - "epoch": 1.64, - "learning_rate": 5.362618623587994e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.0001734152278105972, + "loss": 0.0164, "step": 325560 }, { - "epoch": 1.64, - "learning_rate": 5.3618618542865934e-05, - "loss": 0.0107, + "epoch": 0.84, + "learning_rate": 0.00017341133959422573, + "loss": 0.0141, "step": 325570 }, { - "epoch": 1.64, - "learning_rate": 5.361105084985192e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017340745137785424, + "loss": 0.0189, "step": 325580 }, { - "epoch": 1.64, - "learning_rate": 5.360348315683791e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.0001734035631614828, + "loss": 0.0135, "step": 325590 }, { - "epoch": 1.64, - "learning_rate": 5.35959154638239e-05, - "loss": 0.0061, + "epoch": 0.84, + "learning_rate": 0.00017339967494511133, + "loss": 0.0135, "step": 325600 }, { - "epoch": 1.64, - "learning_rate": 5.3588347770809894e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017339578672873987, + "loss": 0.0127, "step": 325610 }, { - "epoch": 1.64, - "learning_rate": 5.358078007779588e-05, - "loss": 0.0098, + "epoch": 0.84, + "learning_rate": 0.00017339189851236838, + "loss": 0.0144, "step": 325620 }, { - "epoch": 1.64, - "learning_rate": 5.357321238478187e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017338801029599695, + "loss": 0.0152, "step": 325630 }, { - "epoch": 1.64, - "learning_rate": 5.356564469176786e-05, - "loss": 0.0078, + "epoch": 0.84, + "learning_rate": 0.00017338412207962547, + "loss": 0.0132, "step": 325640 }, { - "epoch": 1.64, - "learning_rate": 5.3558076998753854e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.000173380233863254, + "loss": 0.0124, "step": 325650 }, { - "epoch": 1.64, - "learning_rate": 5.355050930573984e-05, - "loss": 0.0048, + "epoch": 0.84, + "learning_rate": 0.00017337634564688252, + "loss": 0.0134, "step": 325660 }, { - "epoch": 1.64, - "learning_rate": 5.354294161272583e-05, - "loss": 0.0049, + "epoch": 0.84, + "learning_rate": 0.0001733724574305111, + "loss": 0.0105, "step": 325670 }, { - "epoch": 1.64, - "learning_rate": 5.353537391971182e-05, - "loss": 0.0088, + "epoch": 0.84, + "learning_rate": 0.0001733685692141396, + "loss": 0.0144, "step": 325680 }, { - "epoch": 1.64, - "learning_rate": 5.3527806226697813e-05, - "loss": 0.0072, + "epoch": 0.84, + "learning_rate": 0.00017336468099776815, + "loss": 0.0121, "step": 325690 }, { - "epoch": 1.64, - "learning_rate": 5.3520238533683795e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.00017336079278139666, + "loss": 0.0144, "step": 325700 }, { - "epoch": 1.64, - "learning_rate": 5.351267084066978e-05, - "loss": 0.0052, + "epoch": 0.84, + "learning_rate": 0.00017335690456502523, + "loss": 0.0139, "step": 325710 }, { - "epoch": 1.64, - "learning_rate": 5.350510314765577e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017335301634865377, + "loss": 0.0112, "step": 325720 }, { - "epoch": 1.64, - "learning_rate": 5.349753545464176e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001733491281322823, + "loss": 0.0128, "step": 325730 }, { - "epoch": 1.64, - "learning_rate": 5.3489967761627754e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017334523991591083, + "loss": 0.0137, "step": 325740 }, { - "epoch": 1.64, - "learning_rate": 5.348240006861374e-05, - "loss": 0.0047, + "epoch": 0.84, + "learning_rate": 0.00017334135169953937, + "loss": 0.013, "step": 325750 }, { - "epoch": 1.64, - "learning_rate": 5.347483237559973e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.0001733374634831679, + "loss": 0.0137, "step": 325760 }, { - "epoch": 1.64, - "learning_rate": 5.3467264682585726e-05, - "loss": 0.0099, + "epoch": 0.84, + "learning_rate": 0.00017333357526679643, + "loss": 0.0154, "step": 325770 }, { - "epoch": 1.64, - "learning_rate": 5.3459696989571714e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.00017332968705042497, + "loss": 0.0176, "step": 325780 }, { - "epoch": 1.64, - "learning_rate": 5.34521292965577e-05, - "loss": 0.0064, + "epoch": 0.84, + "learning_rate": 0.00017332579883405348, + "loss": 0.0152, "step": 325790 }, { - "epoch": 1.64, - "learning_rate": 5.344456160354369e-05, - "loss": 0.006, + "epoch": 0.84, + "learning_rate": 0.00017332191061768205, + "loss": 0.011, "step": 325800 }, { - "epoch": 1.64, - "learning_rate": 5.3436993910529686e-05, - "loss": 0.0066, + "epoch": 0.84, + "learning_rate": 0.00017331802240131057, + "loss": 0.0107, "step": 325810 }, { - "epoch": 1.64, - "learning_rate": 5.3429426217515674e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.0001733141341849391, + "loss": 0.0131, "step": 325820 }, { - "epoch": 1.64, - "learning_rate": 5.342185852450166e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017331024596856762, + "loss": 0.0123, "step": 325830 }, { - "epoch": 1.64, - "learning_rate": 5.341429083148765e-05, - "loss": 0.0056, + "epoch": 0.84, + "learning_rate": 0.0001733063577521962, + "loss": 0.0123, "step": 325840 }, { - "epoch": 1.64, - "learning_rate": 5.3406723138473645e-05, - "loss": 0.0098, + "epoch": 0.84, + "learning_rate": 0.0001733024695358247, + "loss": 0.0185, "step": 325850 }, { - "epoch": 1.64, - "learning_rate": 5.3399155445459633e-05, - "loss": 0.0076, + "epoch": 0.84, + "learning_rate": 0.00017329858131945325, + "loss": 0.0146, "step": 325860 }, { - "epoch": 1.64, - "learning_rate": 5.339158775244562e-05, - "loss": 0.0083, + "epoch": 0.84, + "learning_rate": 0.00017329469310308176, + "loss": 0.0094, "step": 325870 }, { - "epoch": 1.64, - "learning_rate": 5.338402005943161e-05, - "loss": 0.0071, + "epoch": 0.84, + "learning_rate": 0.00017329080488671033, + "loss": 0.0111, "step": 325880 }, { - "epoch": 1.64, - "learning_rate": 5.3376452366417605e-05, - "loss": 0.0045, + "epoch": 0.84, + "learning_rate": 0.00017328691667033887, + "loss": 0.0133, "step": 325890 }, { - "epoch": 1.64, - "learning_rate": 5.336888467340359e-05, - "loss": 0.0074, + "epoch": 0.84, + "learning_rate": 0.0001732830284539674, + "loss": 0.0155, "step": 325900 }, { - "epoch": 1.64, - "learning_rate": 5.336131698038958e-05, - "loss": 0.0057, + "epoch": 0.84, + "learning_rate": 0.0001732791402375959, + "loss": 0.0174, "step": 325910 }, { - "epoch": 1.64, - "learning_rate": 5.335374928737557e-05, - "loss": 0.0084, + "epoch": 0.84, + "learning_rate": 0.00017327525202122447, + "loss": 0.0104, "step": 325920 }, { - "epoch": 1.64, - "learning_rate": 5.3346181594361565e-05, - "loss": 0.0069, + "epoch": 0.84, + "learning_rate": 0.000173271363804853, + "loss": 0.0121, "step": 325930 }, { - "epoch": 1.64, - "learning_rate": 5.333861390134755e-05, - "loss": 0.0058, + "epoch": 0.84, + "learning_rate": 0.00017326747558848153, + "loss": 0.0103, "step": 325940 }, { - "epoch": 1.64, - "learning_rate": 5.333104620833354e-05, - "loss": 0.0073, + "epoch": 0.84, + "learning_rate": 0.00017326358737211007, + "loss": 0.0096, "step": 325950 }, { - "epoch": 1.64, - "learning_rate": 5.332347851531953e-05, - "loss": 0.0063, + "epoch": 0.84, + "learning_rate": 0.0001732596991557386, + "loss": 0.0149, "step": 325960 }, { - "epoch": 1.64, - "learning_rate": 5.3315910822305524e-05, - "loss": 0.0053, + "epoch": 0.84, + "learning_rate": 0.00017325581093936715, + "loss": 0.0124, "step": 325970 }, { - "epoch": 1.64, - "learning_rate": 5.330834312929151e-05, - "loss": 0.0067, + "epoch": 0.84, + "learning_rate": 0.00017325192272299567, + "loss": 0.0149, "step": 325980 }, { - "epoch": 1.64, - "learning_rate": 5.33007754362775e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.0001732480345066242, + "loss": 0.0139, "step": 325990 }, { - "epoch": 1.64, - "learning_rate": 5.329320774326349e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017324414629025275, + "loss": 0.0144, "step": 326000 }, { - "epoch": 1.64, - "eval_cer": 0.914412032135638, - "eval_loss": 0.004975411109626293, - "eval_runtime": 116.3509, - "eval_samples_per_second": 17.189, - "eval_steps_per_second": 4.297, + "epoch": 0.85, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.008809900842607021, + "eval_runtime": 107.5599, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 326000 }, { - "epoch": 1.64, - "learning_rate": 5.328564005024947e-05, - "loss": 0.011, + "epoch": 0.85, + "learning_rate": 0.0001732402580738813, + "loss": 0.0124, "step": 326010 }, { - "epoch": 1.64, - "learning_rate": 5.3278072357235465e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.0001732363698575098, + "loss": 0.013, "step": 326020 }, { - "epoch": 1.64, - "learning_rate": 5.3270504664221453e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017323248164113835, + "loss": 0.0132, "step": 326030 }, { - "epoch": 1.64, - "learning_rate": 5.326293697120744e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017322859342476686, + "loss": 0.0117, "step": 326040 }, { - "epoch": 1.64, - "learning_rate": 5.325536927819343e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017322470520839543, + "loss": 0.0145, "step": 326050 }, { - "epoch": 1.65, - "learning_rate": 5.3247801585179425e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.00017322081699202397, + "loss": 0.0137, "step": 326060 }, { - "epoch": 1.65, - "learning_rate": 5.324023389216541e-05, - "loss": 0.0048, + "epoch": 0.85, + "learning_rate": 0.00017321692877565249, + "loss": 0.0132, "step": 326070 }, { - "epoch": 1.65, - "learning_rate": 5.32326661991514e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.000173213040559281, + "loss": 0.0152, "step": 326080 }, { - "epoch": 1.65, - "learning_rate": 5.322509850613739e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017320915234290957, + "loss": 0.0176, "step": 326090 }, { - "epoch": 1.65, - "learning_rate": 5.3217530813123385e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.0001732052641265381, + "loss": 0.0135, "step": 326100 }, { - "epoch": 1.65, - "learning_rate": 5.320996312010937e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017320137591016663, + "loss": 0.0144, "step": 326110 }, { - "epoch": 1.65, - "learning_rate": 5.320239542709536e-05, - "loss": 0.0097, + "epoch": 0.85, + "learning_rate": 0.00017319748769379517, + "loss": 0.0169, "step": 326120 }, { - "epoch": 1.65, - "learning_rate": 5.319482773408135e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.0001731935994774237, + "loss": 0.0103, "step": 326130 }, { - "epoch": 1.65, - "learning_rate": 5.3187260041067344e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017318971126105225, + "loss": 0.0097, "step": 326140 }, { - "epoch": 1.65, - "learning_rate": 5.317969234805333e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017318582304468077, + "loss": 0.0134, "step": 326150 }, { - "epoch": 1.65, - "learning_rate": 5.317212465503932e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.0001731819348283093, + "loss": 0.0115, "step": 326160 }, { - "epoch": 1.65, - "learning_rate": 5.316455696202531e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017317804661193785, + "loss": 0.0163, "step": 326170 }, { - "epoch": 1.65, - "learning_rate": 5.3156989269011304e-05, - "loss": 0.0106, + "epoch": 0.85, + "learning_rate": 0.0001731741583955664, + "loss": 0.0173, "step": 326180 }, { - "epoch": 1.65, - "learning_rate": 5.314942157599729e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.0001731702701791949, + "loss": 0.0125, "step": 326190 }, { - "epoch": 1.65, - "learning_rate": 5.314185388298328e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017316638196282345, + "loss": 0.0127, "step": 326200 }, { - "epoch": 1.65, - "learning_rate": 5.313428618996927e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.00017316249374645202, + "loss": 0.0123, "step": 326210 }, { - "epoch": 1.65, - "learning_rate": 5.3126718496955264e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017315860553008053, + "loss": 0.0154, "step": 326220 }, { - "epoch": 1.65, - "learning_rate": 5.311915080394125e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017315471731370904, + "loss": 0.0119, "step": 326230 }, { - "epoch": 1.65, - "learning_rate": 5.311158311092724e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017315082909733759, + "loss": 0.0107, "step": 326240 }, { - "epoch": 1.65, - "learning_rate": 5.310401541791323e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017314694088096615, + "loss": 0.0122, "step": 326250 }, { - "epoch": 1.65, - "learning_rate": 5.309644772489922e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017314305266459467, + "loss": 0.0174, "step": 326260 }, { - "epoch": 1.65, - "learning_rate": 5.308888003188521e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.0001731391644482232, + "loss": 0.0159, "step": 326270 }, { - "epoch": 1.65, - "learning_rate": 5.30813123388712e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017313527623185173, + "loss": 0.012, "step": 326280 }, { - "epoch": 1.65, - "learning_rate": 5.3073744645857195e-05, - "loss": 0.0104, + "epoch": 0.85, + "learning_rate": 0.00017313138801548027, + "loss": 0.0142, "step": 326290 }, { - "epoch": 1.65, - "learning_rate": 5.306617695284318e-05, - "loss": 0.0088, + "epoch": 0.85, + "learning_rate": 0.0001731274997991088, + "loss": 0.018, "step": 326300 }, { - "epoch": 1.65, - "learning_rate": 5.305860925982917e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017312361158273735, + "loss": 0.0135, "step": 326310 }, { - "epoch": 1.65, - "learning_rate": 5.305104156681515e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017311972336636586, + "loss": 0.0134, "step": 326320 }, { - "epoch": 1.65, - "learning_rate": 5.304347387380114e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.0001731158351499944, + "loss": 0.0156, "step": 326330 }, { - "epoch": 1.65, - "learning_rate": 5.3035906180787136e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017311194693362295, + "loss": 0.012, "step": 326340 }, { - "epoch": 1.65, - "learning_rate": 5.3028338487773124e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.0001731080587172515, + "loss": 0.0164, "step": 326350 }, { - "epoch": 1.65, - "learning_rate": 5.302077079475911e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017310417050088, + "loss": 0.0152, "step": 326360 }, { - "epoch": 1.65, - "learning_rate": 5.30132031017451e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017310028228450855, + "loss": 0.0173, "step": 326370 }, { - "epoch": 1.65, - "learning_rate": 5.3005635408731095e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001730963940681371, + "loss": 0.0126, "step": 326380 }, { - "epoch": 1.65, - "learning_rate": 5.2998067715717084e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017309250585176563, + "loss": 0.0111, "step": 326390 }, { - "epoch": 1.65, - "learning_rate": 5.299050002270307e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.00017308861763539414, + "loss": 0.016, "step": 326400 }, { - "epoch": 1.65, - "learning_rate": 5.298293232968906e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017308472941902269, + "loss": 0.0137, "step": 326410 }, { - "epoch": 1.65, - "learning_rate": 5.2975364636675055e-05, - "loss": 0.0047, + "epoch": 0.85, + "learning_rate": 0.00017308084120265125, + "loss": 0.0141, "step": 326420 }, { - "epoch": 1.65, - "learning_rate": 5.296779694366104e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.00017307695298627977, + "loss": 0.0136, "step": 326430 }, { - "epoch": 1.65, - "learning_rate": 5.296022925064703e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001730730647699083, + "loss": 0.0127, "step": 326440 }, { - "epoch": 1.65, - "learning_rate": 5.295266155763302e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.00017306917655353682, + "loss": 0.0123, "step": 326450 }, { - "epoch": 1.65, - "learning_rate": 5.2945093864619015e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.0001730652883371654, + "loss": 0.0133, "step": 326460 }, { - "epoch": 1.65, - "learning_rate": 5.2937526171605e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.0001730614001207939, + "loss": 0.0158, "step": 326470 }, { - "epoch": 1.65, - "learning_rate": 5.292995847859099e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.00017305751190442245, + "loss": 0.0134, "step": 326480 }, { - "epoch": 1.65, - "learning_rate": 5.292239078557698e-05, - "loss": 0.0087, + "epoch": 0.85, + "learning_rate": 0.00017305362368805096, + "loss": 0.0128, "step": 326490 }, { - "epoch": 1.65, - "learning_rate": 5.2914823092562974e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017304973547167953, + "loss": 0.0147, "step": 326500 }, { - "epoch": 1.65, - "learning_rate": 5.290725539954896e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017304584725530805, + "loss": 0.0161, "step": 326510 }, { - "epoch": 1.65, - "learning_rate": 5.289968770653495e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.0001730419590389366, + "loss": 0.0126, "step": 326520 }, { - "epoch": 1.65, - "learning_rate": 5.289212001352094e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.0001730380708225651, + "loss": 0.013, "step": 326530 }, { - "epoch": 1.65, - "learning_rate": 5.2884552320506934e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017303418260619365, + "loss": 0.017, "step": 326540 }, { - "epoch": 1.65, - "learning_rate": 5.287698462749292e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.0001730302943898222, + "loss": 0.0116, "step": 326550 }, { - "epoch": 1.65, - "learning_rate": 5.286941693447891e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017302640617345073, + "loss": 0.0158, "step": 326560 }, { - "epoch": 1.65, - "learning_rate": 5.28618492414649e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017302251795707924, + "loss": 0.0151, "step": 326570 }, { - "epoch": 1.65, - "learning_rate": 5.2854281548450894e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017301862974070778, + "loss": 0.0255, "step": 326580 }, { - "epoch": 1.65, - "learning_rate": 5.284671385543688e-05, - "loss": 0.0078, + "epoch": 0.85, + "learning_rate": 0.00017301474152433635, + "loss": 0.0153, "step": 326590 }, { - "epoch": 1.65, - "learning_rate": 5.283914616242287e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017301085330796487, + "loss": 0.0241, "step": 326600 }, { - "epoch": 1.65, - "learning_rate": 5.283157846940886e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.0001730069650915934, + "loss": 0.0177, "step": 326610 }, { - "epoch": 1.65, - "learning_rate": 5.282401077639485e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017300307687522192, + "loss": 0.0149, "step": 326620 }, { - "epoch": 1.65, - "learning_rate": 5.281644308338084e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001729991886588505, + "loss": 0.0123, "step": 326630 }, { - "epoch": 1.65, - "learning_rate": 5.280887539036682e-05, - "loss": 0.0094, + "epoch": 0.85, + "learning_rate": 0.000172995300442479, + "loss": 0.0143, "step": 326640 }, { - "epoch": 1.65, - "learning_rate": 5.280130769735281e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017299141222610755, + "loss": 0.0112, "step": 326650 }, { - "epoch": 1.65, - "learning_rate": 5.27937400043388e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017298752400973606, + "loss": 0.0106, "step": 326660 }, { - "epoch": 1.65, - "learning_rate": 5.2786172311324794e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017298363579336463, + "loss": 0.0153, "step": 326670 }, { - "epoch": 1.65, - "learning_rate": 5.277860461831078e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017297974757699315, + "loss": 0.0154, "step": 326680 }, { - "epoch": 1.65, - "learning_rate": 5.277103692529677e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.0001729758593606217, + "loss": 0.013, "step": 326690 }, { - "epoch": 1.65, - "learning_rate": 5.276346923228276e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.0001729719711442502, + "loss": 0.0172, "step": 326700 }, { - "epoch": 1.65, - "learning_rate": 5.2755901539268754e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017296808292787877, + "loss": 0.0094, "step": 326710 }, { - "epoch": 1.65, - "learning_rate": 5.274833384625474e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017296419471150729, + "loss": 0.0126, "step": 326720 }, { - "epoch": 1.65, - "learning_rate": 5.274076615324073e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017296030649513583, + "loss": 0.0175, "step": 326730 }, { - "epoch": 1.65, - "learning_rate": 5.2733198460226725e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017295641827876434, + "loss": 0.0164, "step": 326740 }, { - "epoch": 1.65, - "learning_rate": 5.2725630767212714e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.0001729525300623929, + "loss": 0.0105, "step": 326750 }, { - "epoch": 1.65, - "learning_rate": 5.27180630741987e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017294864184602145, + "loss": 0.0177, "step": 326760 }, { - "epoch": 1.65, - "learning_rate": 5.271049538118469e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.00017294475362964997, + "loss": 0.0155, "step": 326770 }, { - "epoch": 1.65, - "learning_rate": 5.2702927688170685e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.0001729408654132785, + "loss": 0.0135, "step": 326780 }, { - "epoch": 1.65, - "learning_rate": 5.269535999515667e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017293697719690702, + "loss": 0.0146, "step": 326790 }, { - "epoch": 1.65, - "learning_rate": 5.268779230214266e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.0001729330889805356, + "loss": 0.0142, "step": 326800 }, { - "epoch": 1.65, - "learning_rate": 5.268022460912865e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.0001729292007641641, + "loss": 0.0153, "step": 326810 }, { - "epoch": 1.65, - "learning_rate": 5.2672656916114645e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017292531254779265, + "loss": 0.0134, "step": 326820 }, { - "epoch": 1.65, - "learning_rate": 5.266508922310063e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017292142433142116, + "loss": 0.0146, "step": 326830 }, { - "epoch": 1.65, - "learning_rate": 5.265752153008662e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017291753611504973, + "loss": 0.011, "step": 326840 }, { - "epoch": 1.65, - "learning_rate": 5.264995383707261e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017291364789867825, + "loss": 0.0136, "step": 326850 }, { - "epoch": 1.65, - "learning_rate": 5.2642386144058604e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001729097596823068, + "loss": 0.0146, "step": 326860 }, { - "epoch": 1.65, - "learning_rate": 5.263481845104459e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.0001729058714659353, + "loss": 0.0143, "step": 326870 }, { - "epoch": 1.65, - "learning_rate": 5.262725075803058e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017290198324956387, + "loss": 0.013, "step": 326880 }, { - "epoch": 1.65, - "learning_rate": 5.261968306501657e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017289809503319239, + "loss": 0.0153, "step": 326890 }, { - "epoch": 1.65, - "learning_rate": 5.2612115372002564e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017289420681682093, + "loss": 0.012, "step": 326900 }, { - "epoch": 1.65, - "learning_rate": 5.260454767898855e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.00017289031860044944, + "loss": 0.0105, "step": 326910 }, { - "epoch": 1.65, - "learning_rate": 5.259697998597454e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.000172886430384078, + "loss": 0.0152, "step": 326920 }, { - "epoch": 1.65, - "learning_rate": 5.258941229296053e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017288254216770655, + "loss": 0.0158, "step": 326930 }, { - "epoch": 1.65, - "learning_rate": 5.2581844599946524e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017287865395133507, + "loss": 0.0092, "step": 326940 }, { - "epoch": 1.65, - "learning_rate": 5.2574276906932505e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017287476573496358, + "loss": 0.015, "step": 326950 }, { - "epoch": 1.65, - "learning_rate": 5.256670921391849e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017287087751859215, + "loss": 0.0156, "step": 326960 }, { - "epoch": 1.65, - "learning_rate": 5.255914152090448e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.0001728669893022207, + "loss": 0.0132, "step": 326970 }, { - "epoch": 1.65, - "learning_rate": 5.255157382789047e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.0001728631010858492, + "loss": 0.01, "step": 326980 }, { - "epoch": 1.65, - "learning_rate": 5.2544006134876465e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017285921286947775, + "loss": 0.0143, "step": 326990 }, { - "epoch": 1.65, - "learning_rate": 5.253643844186245e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.0001728553246531063, + "loss": 0.0128, "step": 327000 }, { - "epoch": 1.65, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.004966360051184893, - "eval_runtime": 116.3822, - "eval_samples_per_second": 17.185, - "eval_steps_per_second": 4.296, + "epoch": 0.85, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.009260199032723904, + "eval_runtime": 107.8033, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, "step": 327000 }, { - "epoch": 1.65, - "learning_rate": 5.252887074884844e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017285143643673483, + "loss": 0.0156, "step": 327010 }, { - "epoch": 1.65, - "learning_rate": 5.252130305583443e-05, - "loss": 0.0102, + "epoch": 0.85, + "learning_rate": 0.00017284754822036335, + "loss": 0.0143, "step": 327020 }, { - "epoch": 1.65, - "learning_rate": 5.2513735362820424e-05, - "loss": 0.0109, + "epoch": 0.85, + "learning_rate": 0.0001728436600039919, + "loss": 0.0125, "step": 327030 }, { - "epoch": 1.65, - "learning_rate": 5.250616766980641e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001728397717876204, + "loss": 0.013, "step": 327040 }, { - "epoch": 1.65, - "learning_rate": 5.24985999767924e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017283588357124897, + "loss": 0.0144, "step": 327050 }, { - "epoch": 1.65, - "learning_rate": 5.249103228377839e-05, - "loss": 0.0087, + "epoch": 0.85, + "learning_rate": 0.00017283199535487749, + "loss": 0.0126, "step": 327060 }, { - "epoch": 1.65, - "learning_rate": 5.2483464590764384e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017282810713850603, + "loss": 0.012, "step": 327070 }, { - "epoch": 1.65, - "learning_rate": 5.247589689775037e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017282421892213454, + "loss": 0.0119, "step": 327080 }, { - "epoch": 1.65, - "learning_rate": 5.246832920473636e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.0001728203307057631, + "loss": 0.0119, "step": 327090 }, { - "epoch": 1.65, - "learning_rate": 5.246076151172235e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017281644248939162, + "loss": 0.0142, "step": 327100 }, { - "epoch": 1.65, - "learning_rate": 5.2453193818708344e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017281255427302017, + "loss": 0.014, "step": 327110 }, { - "epoch": 1.65, - "learning_rate": 5.244562612569433e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017280866605664868, + "loss": 0.0134, "step": 327120 }, { - "epoch": 1.65, - "learning_rate": 5.243805843268032e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017280477784027725, + "loss": 0.0143, "step": 327130 }, { - "epoch": 1.65, - "learning_rate": 5.243049073966631e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.0001728008896239058, + "loss": 0.0145, "step": 327140 }, { - "epoch": 1.65, - "learning_rate": 5.2422923046652303e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.0001727970014075343, + "loss": 0.0165, "step": 327150 }, { - "epoch": 1.65, - "learning_rate": 5.241535535363829e-05, - "loss": 0.0039, + "epoch": 0.85, + "learning_rate": 0.00017279311319116285, + "loss": 0.0146, "step": 327160 }, { - "epoch": 1.65, - "learning_rate": 5.240778766062428e-05, - "loss": 0.009, + "epoch": 0.85, + "learning_rate": 0.0001727892249747914, + "loss": 0.0154, "step": 327170 }, { - "epoch": 1.65, - "learning_rate": 5.240021996761027e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017278533675841993, + "loss": 0.0145, "step": 327180 }, { - "epoch": 1.65, - "learning_rate": 5.239265227459626e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017278144854204844, + "loss": 0.012, "step": 327190 }, { - "epoch": 1.65, - "learning_rate": 5.238508458158225e-05, - "loss": 0.0177, + "epoch": 0.85, + "learning_rate": 0.000172777560325677, + "loss": 0.0127, "step": 327200 }, { - "epoch": 1.65, - "learning_rate": 5.237751688856824e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017277367210930553, + "loss": 0.0164, "step": 327210 }, { - "epoch": 1.65, - "learning_rate": 5.236994919555423e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017276978389293407, + "loss": 0.0122, "step": 327220 }, { - "epoch": 1.65, - "learning_rate": 5.236238150254022e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017276589567656258, + "loss": 0.0095, "step": 327230 }, { - "epoch": 1.65, - "learning_rate": 5.235481380952621e-05, - "loss": 0.0094, + "epoch": 0.85, + "learning_rate": 0.00017276200746019113, + "loss": 0.0136, "step": 327240 }, { - "epoch": 1.65, - "learning_rate": 5.23472461165122e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.0001727581192438197, + "loss": 0.0163, "step": 327250 }, { - "epoch": 1.65, - "learning_rate": 5.2339678423498194e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.0001727542310274482, + "loss": 0.0161, "step": 327260 }, { - "epoch": 1.65, - "learning_rate": 5.2332110730484176e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017275034281107672, + "loss": 0.0143, "step": 327270 }, { - "epoch": 1.65, - "learning_rate": 5.2324543037470164e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.00017274645459470527, + "loss": 0.0131, "step": 327280 }, { - "epoch": 1.65, - "learning_rate": 5.231697534445615e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.00017274256637833378, + "loss": 0.0152, "step": 327290 }, { - "epoch": 1.65, - "learning_rate": 5.230940765144214e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017273867816196235, + "loss": 0.0116, "step": 327300 }, { - "epoch": 1.65, - "learning_rate": 5.2301839958428135e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.0001727347899455909, + "loss": 0.0112, "step": 327310 }, { - "epoch": 1.65, - "learning_rate": 5.2294272265414123e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.0001727309017292194, + "loss": 0.0134, "step": 327320 }, { - "epoch": 1.65, - "learning_rate": 5.228670457240011e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017272701351284795, + "loss": 0.0095, "step": 327330 }, { - "epoch": 1.65, - "learning_rate": 5.22791368793861e-05, - "loss": 0.0045, + "epoch": 0.85, + "learning_rate": 0.0001727231252964765, + "loss": 0.0125, "step": 327340 }, { - "epoch": 1.65, - "learning_rate": 5.2271569186372095e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017271923708010503, + "loss": 0.0136, "step": 327350 }, { - "epoch": 1.65, - "learning_rate": 5.226400149335808e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017271534886373354, + "loss": 0.0156, "step": 327360 }, { - "epoch": 1.65, - "learning_rate": 5.225643380034407e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017271146064736209, + "loss": 0.0133, "step": 327370 }, { - "epoch": 1.65, - "learning_rate": 5.224886610733006e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017270757243099063, + "loss": 0.0124, "step": 327380 }, { - "epoch": 1.65, - "learning_rate": 5.2241298414316055e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017270368421461917, + "loss": 0.0127, "step": 327390 }, { - "epoch": 1.65, - "learning_rate": 5.223373072130204e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017269979599824768, + "loss": 0.0136, "step": 327400 }, { - "epoch": 1.65, - "learning_rate": 5.222616302828803e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017269590778187623, + "loss": 0.0113, "step": 327410 }, { - "epoch": 1.65, - "learning_rate": 5.221859533527402e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017269201956550477, + "loss": 0.0122, "step": 327420 }, { - "epoch": 1.65, - "learning_rate": 5.2211027642260014e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001726881313491333, + "loss": 0.021, "step": 327430 }, { - "epoch": 1.65, - "learning_rate": 5.2203459949246e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017268424313276182, + "loss": 0.013, "step": 327440 }, { - "epoch": 1.65, - "learning_rate": 5.219589225623199e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017268035491639036, + "loss": 0.0138, "step": 327450 }, { - "epoch": 1.65, - "learning_rate": 5.218832456321798e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017267646670001893, + "loss": 0.0163, "step": 327460 }, { - "epoch": 1.65, - "learning_rate": 5.2180756870203974e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.00017267257848364745, + "loss": 0.0135, "step": 327470 }, { - "epoch": 1.65, - "learning_rate": 5.217318917718996e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.000172668690267276, + "loss": 0.0129, "step": 327480 }, { - "epoch": 1.65, - "learning_rate": 5.216562148417595e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001726648020509045, + "loss": 0.0132, "step": 327490 }, { - "epoch": 1.65, - "learning_rate": 5.215805379116194e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017266091383453307, + "loss": 0.0116, "step": 327500 }, { - "epoch": 1.65, - "learning_rate": 5.2150486098147933e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.0001726570256181616, + "loss": 0.0148, "step": 327510 }, { - "epoch": 1.65, - "learning_rate": 5.214291840513392e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017265313740179013, + "loss": 0.0173, "step": 327520 }, { - "epoch": 1.65, - "learning_rate": 5.213535071211991e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017264924918541864, + "loss": 0.015, "step": 327530 }, { - "epoch": 1.65, - "learning_rate": 5.21277830191059e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017264536096904719, + "loss": 0.014, "step": 327540 }, { - "epoch": 1.65, - "learning_rate": 5.212021532609189e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017264147275267573, + "loss": 0.0128, "step": 327550 }, { - "epoch": 1.65, - "learning_rate": 5.211264763307788e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.00017263758453630427, + "loss": 0.0129, "step": 327560 }, { - "epoch": 1.65, - "learning_rate": 5.210507994006387e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017263369631993278, + "loss": 0.0136, "step": 327570 }, { - "epoch": 1.65, - "learning_rate": 5.209751224704985e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017262980810356132, + "loss": 0.011, "step": 327580 }, { - "epoch": 1.65, - "learning_rate": 5.208994455403584e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017262591988718987, + "loss": 0.0154, "step": 327590 }, { - "epoch": 1.65, - "learning_rate": 5.2082376861021834e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.0001726220316708184, + "loss": 0.0112, "step": 327600 }, { - "epoch": 1.65, - "learning_rate": 5.207480916800782e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017261814345444692, + "loss": 0.0116, "step": 327610 }, { - "epoch": 1.65, - "learning_rate": 5.206724147499381e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017261425523807546, + "loss": 0.0167, "step": 327620 }, { - "epoch": 1.65, - "learning_rate": 5.20596737819798e-05, - "loss": 0.0087, + "epoch": 0.85, + "learning_rate": 0.00017261036702170403, + "loss": 0.0145, "step": 327630 }, { - "epoch": 1.65, - "learning_rate": 5.2052106088965794e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017260647880533255, + "loss": 0.0113, "step": 327640 }, { - "epoch": 1.65, - "learning_rate": 5.204453839595178e-05, - "loss": 0.009, + "epoch": 0.85, + "learning_rate": 0.0001726025905889611, + "loss": 0.0141, "step": 327650 }, { - "epoch": 1.65, - "learning_rate": 5.203697070293777e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.0001725987023725896, + "loss": 0.0116, "step": 327660 }, { - "epoch": 1.65, - "learning_rate": 5.202940300992376e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017259481415621817, + "loss": 0.0152, "step": 327670 }, { - "epoch": 1.65, - "learning_rate": 5.2021835316909754e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.0001725909259398467, + "loss": 0.0147, "step": 327680 }, { - "epoch": 1.65, - "learning_rate": 5.201426762389574e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017258703772347523, + "loss": 0.0197, "step": 327690 }, { - "epoch": 1.65, - "learning_rate": 5.200669993088173e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.00017258314950710374, + "loss": 0.0149, "step": 327700 }, { - "epoch": 1.65, - "learning_rate": 5.1999132237867725e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.0001725792612907323, + "loss": 0.012, "step": 327710 }, { - "epoch": 1.65, - "learning_rate": 5.199156454485371e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017257537307436083, + "loss": 0.0142, "step": 327720 }, { - "epoch": 1.65, - "learning_rate": 5.19839968518397e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017257148485798937, + "loss": 0.0154, "step": 327730 }, { - "epoch": 1.65, - "learning_rate": 5.197642915882569e-05, - "loss": 0.0112, + "epoch": 0.85, + "learning_rate": 0.00017256759664161788, + "loss": 0.0113, "step": 327740 }, { - "epoch": 1.65, - "learning_rate": 5.1968861465811685e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017256370842524642, + "loss": 0.0161, "step": 327750 }, { - "epoch": 1.65, - "learning_rate": 5.196129377279767e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017255982020887497, + "loss": 0.0141, "step": 327760 }, { - "epoch": 1.65, - "learning_rate": 5.195372607978366e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001725559319925035, + "loss": 0.0132, "step": 327770 }, { - "epoch": 1.65, - "learning_rate": 5.194615838676965e-05, - "loss": 0.0113, + "epoch": 0.85, + "learning_rate": 0.00017255204377613202, + "loss": 0.0115, "step": 327780 }, { - "epoch": 1.65, - "learning_rate": 5.1938590693755644e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.00017254815555976056, + "loss": 0.0173, "step": 327790 }, { - "epoch": 1.65, - "learning_rate": 5.193102300074163e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017254426734338913, + "loss": 0.0208, "step": 327800 }, { - "epoch": 1.65, - "learning_rate": 5.192345530772762e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017254037912701765, + "loss": 0.0145, "step": 327810 }, { - "epoch": 1.65, - "learning_rate": 5.191588761471361e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017253649091064616, + "loss": 0.0137, "step": 327820 }, { - "epoch": 1.65, - "learning_rate": 5.1908319921699604e-05, - "loss": 0.0099, + "epoch": 0.85, + "learning_rate": 0.0001725326026942747, + "loss": 0.0146, "step": 327830 }, { - "epoch": 1.65, - "learning_rate": 5.190075222868559e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017252871447790327, + "loss": 0.0122, "step": 327840 }, { - "epoch": 1.65, - "learning_rate": 5.189318453567158e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.0001725248262615318, + "loss": 0.0123, "step": 327850 }, { - "epoch": 1.65, - "learning_rate": 5.188561684265757e-05, - "loss": 0.0043, + "epoch": 0.85, + "learning_rate": 0.00017252093804516033, + "loss": 0.015, "step": 327860 }, { - "epoch": 1.65, - "learning_rate": 5.1878049149643564e-05, - "loss": 0.0089, + "epoch": 0.85, + "learning_rate": 0.00017251704982878884, + "loss": 0.0129, "step": 327870 }, { - "epoch": 1.65, - "learning_rate": 5.187048145662955e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.0001725131616124174, + "loss": 0.0125, "step": 327880 }, { - "epoch": 1.65, - "learning_rate": 5.186291376361554e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017250927339604593, + "loss": 0.0143, "step": 327890 }, { - "epoch": 1.65, - "learning_rate": 5.185534607060152e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017250538517967447, + "loss": 0.0116, "step": 327900 }, { - "epoch": 1.65, - "learning_rate": 5.184777837758751e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017250149696330298, + "loss": 0.0186, "step": 327910 }, { - "epoch": 1.65, - "learning_rate": 5.1840210684573505e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017249760874693155, + "loss": 0.015, "step": 327920 }, { - "epoch": 1.65, - "learning_rate": 5.183264299155949e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017249372053056007, + "loss": 0.016, "step": 327930 }, { - "epoch": 1.65, - "learning_rate": 5.182507529854548e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.0001724898323141886, + "loss": 0.0113, "step": 327940 }, { - "epoch": 1.65, - "learning_rate": 5.181750760553147e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017248594409781712, + "loss": 0.0156, "step": 327950 }, { - "epoch": 1.65, - "learning_rate": 5.1809939912517464e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.0001724820558814457, + "loss": 0.0145, "step": 327960 }, { - "epoch": 1.65, - "learning_rate": 5.180237221950345e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.0001724781676650742, + "loss": 0.0138, "step": 327970 }, { - "epoch": 1.65, - "learning_rate": 5.179480452648944e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017247427944870275, + "loss": 0.013, "step": 327980 }, { - "epoch": 1.65, - "learning_rate": 5.178723683347543e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017247039123233126, + "loss": 0.0133, "step": 327990 }, { - "epoch": 1.65, - "learning_rate": 5.1779669140461424e-05, - "loss": 0.0089, + "epoch": 0.85, + "learning_rate": 0.0001724665030159598, + "loss": 0.0127, "step": 328000 }, { - "epoch": 1.65, - "eval_cer": 0.9144556999612812, - "eval_loss": 0.0049345288425683975, - "eval_runtime": 116.3068, - "eval_samples_per_second": 17.196, - "eval_steps_per_second": 4.299, + "epoch": 0.85, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.009132904931902885, + "eval_runtime": 107.5638, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.648, "step": 328000 }, { - "epoch": 1.65, - "learning_rate": 5.177210144744741e-05, - "loss": 0.0068, - "step": 328010 + "epoch": 0.85, + "learning_rate": 0.00017246261479958837, + "loss": 0.0146, + "step": 328010 }, { - "epoch": 1.65, - "learning_rate": 5.17645337544334e-05, - "loss": 0.0093, + "epoch": 0.85, + "learning_rate": 0.00017245872658321689, + "loss": 0.0105, "step": 328020 }, { - "epoch": 1.65, - "learning_rate": 5.175696606141939e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017245483836684543, + "loss": 0.0131, "step": 328030 }, { - "epoch": 1.65, - "learning_rate": 5.1749398368405384e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017245095015047394, + "loss": 0.0128, "step": 328040 }, { - "epoch": 1.66, - "learning_rate": 5.174183067539137e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.0001724470619341025, + "loss": 0.0125, "step": 328050 }, { - "epoch": 1.66, - "learning_rate": 5.173426298237736e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017244317371773103, + "loss": 0.0126, "step": 328060 }, { - "epoch": 1.66, - "learning_rate": 5.172669528936335e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017243928550135957, + "loss": 0.014, "step": 328070 }, { - "epoch": 1.66, - "learning_rate": 5.171912759634934e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017243539728498808, + "loss": 0.0143, "step": 328080 }, { - "epoch": 1.66, - "learning_rate": 5.171155990333533e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017243150906861665, + "loss": 0.0197, "step": 328090 }, { - "epoch": 1.66, - "learning_rate": 5.170399221032132e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017242762085224516, + "loss": 0.0125, "step": 328100 }, { - "epoch": 1.66, - "learning_rate": 5.169642451730731e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.0001724237326358737, + "loss": 0.0164, "step": 328110 }, { - "epoch": 1.66, - "learning_rate": 5.16888568242933e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017241984441950222, + "loss": 0.0135, "step": 328120 }, { - "epoch": 1.66, - "learning_rate": 5.168128913127929e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.0001724159562031308, + "loss": 0.0141, "step": 328130 }, { - "epoch": 1.66, - "learning_rate": 5.167372143826528e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.0001724120679867593, + "loss": 0.0173, "step": 328140 }, { - "epoch": 1.66, - "learning_rate": 5.166615374525127e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017240817977038785, + "loss": 0.014, "step": 328150 }, { - "epoch": 1.66, - "learning_rate": 5.165858605223726e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017240429155401636, + "loss": 0.0158, "step": 328160 }, { - "epoch": 1.66, - "learning_rate": 5.165101835922325e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017240040333764493, + "loss": 0.0153, "step": 328170 }, { - "epoch": 1.66, - "learning_rate": 5.164345066620924e-05, - "loss": 0.0042, + "epoch": 0.85, + "learning_rate": 0.00017239651512127347, + "loss": 0.0166, "step": 328180 }, { - "epoch": 1.66, - "learning_rate": 5.163588297319523e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017239262690490199, + "loss": 0.0129, "step": 328190 }, { - "epoch": 1.66, - "learning_rate": 5.162831528018122e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017238873868853053, + "loss": 0.0146, "step": 328200 }, { - "epoch": 1.66, - "learning_rate": 5.1620747587167204e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017238485047215907, + "loss": 0.0145, "step": 328210 }, { - "epoch": 1.66, - "learning_rate": 5.161317989415319e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.0001723809622557876, + "loss": 0.0157, "step": 328220 }, { - "epoch": 1.66, - "learning_rate": 5.160561220113918e-05, - "loss": 0.0044, + "epoch": 0.85, + "learning_rate": 0.00017237707403941612, + "loss": 0.013, "step": 328230 }, { - "epoch": 1.66, - "learning_rate": 5.1598044508125175e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017237318582304467, + "loss": 0.0132, "step": 328240 }, { - "epoch": 1.66, - "learning_rate": 5.159047681511116e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017236929760667318, + "loss": 0.0153, "step": 328250 }, { - "epoch": 1.66, - "learning_rate": 5.158290912209715e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017236540939030175, + "loss": 0.013, "step": 328260 }, { - "epoch": 1.66, - "learning_rate": 5.157534142908314e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017236152117393026, + "loss": 0.0165, "step": 328270 }, { - "epoch": 1.66, - "learning_rate": 5.1567773736069135e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.0001723576329575588, + "loss": 0.0118, "step": 328280 }, { - "epoch": 1.66, - "learning_rate": 5.156020604305512e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017235374474118732, + "loss": 0.0171, "step": 328290 }, { - "epoch": 1.66, - "learning_rate": 5.155263835004111e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.0001723498565248159, + "loss": 0.0106, "step": 328300 }, { - "epoch": 1.66, - "learning_rate": 5.15450706570271e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.0001723459683084444, + "loss": 0.0137, "step": 328310 }, { - "epoch": 1.66, - "learning_rate": 5.1537502964013094e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017234208009207295, + "loss": 0.0141, "step": 328320 }, { - "epoch": 1.66, - "learning_rate": 5.152993527099908e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017233819187570146, + "loss": 0.0147, "step": 328330 }, { - "epoch": 1.66, - "learning_rate": 5.152236757798507e-05, - "loss": 0.0094, + "epoch": 0.85, + "learning_rate": 0.00017233430365933003, + "loss": 0.0175, "step": 328340 }, { - "epoch": 1.66, - "learning_rate": 5.151479988497106e-05, - "loss": 0.0084, + "epoch": 0.85, + "learning_rate": 0.00017233041544295857, + "loss": 0.014, "step": 328350 }, { - "epoch": 1.66, - "learning_rate": 5.1507232191957054e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017232652722658708, + "loss": 0.0171, "step": 328360 }, { - "epoch": 1.66, - "learning_rate": 5.149966449894304e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017232263901021563, + "loss": 0.0157, "step": 328370 }, { - "epoch": 1.66, - "learning_rate": 5.149209680592903e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017231875079384417, + "loss": 0.0172, "step": 328380 }, { - "epoch": 1.66, - "learning_rate": 5.148452911291502e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.0001723148625774727, + "loss": 0.013, "step": 328390 }, { - "epoch": 1.66, - "learning_rate": 5.1476961419901014e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017231097436110122, + "loss": 0.0124, "step": 328400 }, { - "epoch": 1.66, - "learning_rate": 5.1469393726887e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017230708614472977, + "loss": 0.0129, "step": 328410 }, { - "epoch": 1.66, - "learning_rate": 5.146182603387299e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.0001723031979283583, + "loss": 0.0138, "step": 328420 }, { - "epoch": 1.66, - "learning_rate": 5.145425834085898e-05, - "loss": 0.0066, + "epoch": 0.85, + "learning_rate": 0.00017229930971198685, + "loss": 0.0142, "step": 328430 }, { - "epoch": 1.66, - "learning_rate": 5.144669064784497e-05, - "loss": 0.0048, + "epoch": 0.85, + "learning_rate": 0.00017229542149561536, + "loss": 0.0128, "step": 328440 }, { - "epoch": 1.66, - "learning_rate": 5.143912295483096e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.0001722915332792439, + "loss": 0.014, "step": 328450 }, { - "epoch": 1.66, - "learning_rate": 5.143155526181695e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017228764506287245, + "loss": 0.0135, "step": 328460 }, { - "epoch": 1.66, - "learning_rate": 5.142398756880294e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.000172283756846501, + "loss": 0.0111, "step": 328470 }, { - "epoch": 1.66, - "learning_rate": 5.141641987578893e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.0001722798686301295, + "loss": 0.0349, "step": 328480 }, { - "epoch": 1.66, - "learning_rate": 5.140885218277492e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017227598041375804, + "loss": 0.0137, "step": 328490 }, { - "epoch": 1.66, - "learning_rate": 5.140128448976091e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017227209219738656, + "loss": 0.0122, "step": 328500 }, { - "epoch": 1.66, - "learning_rate": 5.13937167967469e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017226820398101513, + "loss": 0.0211, "step": 328510 }, { - "epoch": 1.66, - "learning_rate": 5.138614910373288e-05, - "loss": 0.0043, + "epoch": 0.85, + "learning_rate": 0.00017226431576464367, + "loss": 0.011, "step": 328520 }, { - "epoch": 1.66, - "learning_rate": 5.1378581410718874e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.00017226042754827218, + "loss": 0.011, "step": 328530 }, { - "epoch": 1.66, - "learning_rate": 5.137101371770486e-05, - "loss": 0.0091, + "epoch": 0.85, + "learning_rate": 0.0001722565393319007, + "loss": 0.0129, "step": 328540 }, { - "epoch": 1.66, - "learning_rate": 5.136344602469085e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017225265111552927, + "loss": 0.0204, "step": 328550 }, { - "epoch": 1.66, - "learning_rate": 5.135587833167684e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.0001722487628991578, + "loss": 0.0129, "step": 328560 }, { - "epoch": 1.66, - "learning_rate": 5.1348310638662834e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.00017224487468278632, + "loss": 0.0115, "step": 328570 }, { - "epoch": 1.66, - "learning_rate": 5.134074294564882e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017224098646641487, + "loss": 0.0104, "step": 328580 }, { - "epoch": 1.66, - "learning_rate": 5.133317525263481e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.0001722370982500434, + "loss": 0.0133, "step": 328590 }, { - "epoch": 1.66, - "learning_rate": 5.13256075596208e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017223321003367195, + "loss": 0.0137, "step": 328600 }, { - "epoch": 1.66, - "learning_rate": 5.1318039866606793e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017222932181730046, + "loss": 0.0165, "step": 328610 }, { - "epoch": 1.66, - "learning_rate": 5.131047217359278e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.000172225433600929, + "loss": 0.0169, "step": 328620 }, { - "epoch": 1.66, - "learning_rate": 5.130290448057877e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017222154538455755, + "loss": 0.0118, "step": 328630 }, { - "epoch": 1.66, - "learning_rate": 5.129533678756476e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001722176571681861, + "loss": 0.0143, "step": 328640 }, { - "epoch": 1.66, - "learning_rate": 5.128776909455075e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.0001722137689518146, + "loss": 0.0121, "step": 328650 }, { - "epoch": 1.66, - "learning_rate": 5.128020140153674e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.00017220988073544314, + "loss": 0.0165, "step": 328660 }, { - "epoch": 1.66, - "learning_rate": 5.127263370852273e-05, - "loss": 0.0089, + "epoch": 0.85, + "learning_rate": 0.0001722059925190717, + "loss": 0.012, "step": 328670 }, { - "epoch": 1.66, - "learning_rate": 5.1265066015508724e-05, - "loss": 0.0107, + "epoch": 0.85, + "learning_rate": 0.00017220210430270023, + "loss": 0.0139, "step": 328680 }, { - "epoch": 1.66, - "learning_rate": 5.125749832249471e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017219821608632874, + "loss": 0.0109, "step": 328690 }, { - "epoch": 1.66, - "learning_rate": 5.12499306294807e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.00017219432786995728, + "loss": 0.0138, "step": 328700 }, { - "epoch": 1.66, - "learning_rate": 5.124236293646669e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017219043965358585, + "loss": 0.0128, "step": 328710 }, { - "epoch": 1.66, - "learning_rate": 5.1234795243452684e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017218655143721437, + "loss": 0.0142, "step": 328720 }, { - "epoch": 1.66, - "learning_rate": 5.122722755043867e-05, - "loss": 0.0046, + "epoch": 0.85, + "learning_rate": 0.0001721826632208429, + "loss": 0.0129, "step": 328730 }, { - "epoch": 1.66, - "learning_rate": 5.121965985742466e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017217877500447142, + "loss": 0.0131, "step": 328740 }, { - "epoch": 1.66, - "learning_rate": 5.121209216441065e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017217488678809996, + "loss": 0.011, "step": 328750 }, { - "epoch": 1.66, - "learning_rate": 5.1204524471396644e-05, - "loss": 0.0053, + "epoch": 0.85, + "learning_rate": 0.0001721709985717285, + "loss": 0.013, "step": 328760 }, { - "epoch": 1.66, - "learning_rate": 5.119695677838263e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.00017216711035535705, + "loss": 0.0145, "step": 328770 }, { - "epoch": 1.66, - "learning_rate": 5.118938908536862e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017216322213898556, + "loss": 0.0171, "step": 328780 }, { - "epoch": 1.66, - "learning_rate": 5.118182139235461e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.0001721593339226141, + "loss": 0.0098, "step": 328790 }, { - "epoch": 1.66, - "learning_rate": 5.1174253699340603e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017215544570624265, + "loss": 0.0114, "step": 328800 }, { - "epoch": 1.66, - "learning_rate": 5.116668600632659e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.0001721515574898712, + "loss": 0.0123, "step": 328810 }, { - "epoch": 1.66, - "learning_rate": 5.115911831331258e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.0001721476692734997, + "loss": 0.0252, "step": 328820 }, { - "epoch": 1.66, - "learning_rate": 5.115155062029857e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017214378105712824, + "loss": 0.0145, "step": 328830 }, { - "epoch": 1.66, - "learning_rate": 5.114398292728455e-05, - "loss": 0.005, + "epoch": 0.85, + "learning_rate": 0.0001721398928407568, + "loss": 0.0156, "step": 328840 }, { - "epoch": 1.66, - "learning_rate": 5.1136415234270545e-05, - "loss": 0.0048, + "epoch": 0.85, + "learning_rate": 0.00017213600462438533, + "loss": 0.015, "step": 328850 }, { - "epoch": 1.66, - "learning_rate": 5.112884754125653e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017213211640801384, + "loss": 0.0142, "step": 328860 }, { - "epoch": 1.66, - "learning_rate": 5.112127984824252e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017212822819164238, + "loss": 0.0127, "step": 328870 }, { - "epoch": 1.66, - "learning_rate": 5.111371215522851e-05, - "loss": 0.0086, + "epoch": 0.85, + "learning_rate": 0.00017212433997527095, + "loss": 0.0112, "step": 328880 }, { - "epoch": 1.66, - "learning_rate": 5.1106144462214504e-05, - "loss": 0.0037, + "epoch": 0.85, + "learning_rate": 0.00017212045175889947, + "loss": 0.0196, "step": 328890 }, { - "epoch": 1.66, - "learning_rate": 5.109857676920049e-05, - "loss": 0.0052, + "epoch": 0.85, + "learning_rate": 0.000172116563542528, + "loss": 0.015, "step": 328900 }, { - "epoch": 1.66, - "learning_rate": 5.109100907618648e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017211267532615652, + "loss": 0.0139, "step": 328910 }, { - "epoch": 1.66, - "learning_rate": 5.108344138317247e-05, - "loss": 0.0055, + "epoch": 0.85, + "learning_rate": 0.0001721087871097851, + "loss": 0.0185, "step": 328920 }, { - "epoch": 1.66, - "learning_rate": 5.1075873690158464e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.0001721048988934136, + "loss": 0.0116, "step": 328930 }, { - "epoch": 1.66, - "learning_rate": 5.106830599714445e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017210101067704215, + "loss": 0.0124, "step": 328940 }, { - "epoch": 1.66, - "learning_rate": 5.106073830413044e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017209712246067066, + "loss": 0.0144, "step": 328950 }, { - "epoch": 1.66, - "learning_rate": 5.105317061111643e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017209323424429923, + "loss": 0.0115, "step": 328960 }, { - "epoch": 1.66, - "learning_rate": 5.1045602918102423e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.00017208934602792775, + "loss": 0.0127, "step": 328970 }, { - "epoch": 1.66, - "learning_rate": 5.103803522508841e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.0001720854578115563, + "loss": 0.0117, "step": 328980 }, { - "epoch": 1.66, - "learning_rate": 5.10304675320744e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.0001720815695951848, + "loss": 0.0105, "step": 328990 }, { - "epoch": 1.66, - "learning_rate": 5.102289983906039e-05, - "loss": 0.0058, + "epoch": 0.85, + "learning_rate": 0.00017207768137881334, + "loss": 0.013, "step": 329000 }, { - "epoch": 1.66, - "eval_cer": 0.914447936792278, - "eval_loss": 0.004932132083922625, - "eval_runtime": 116.3131, - "eval_samples_per_second": 17.195, - "eval_steps_per_second": 4.299, + "epoch": 0.85, + "eval_cer": 0.8817348779726539, + "eval_loss": 0.009153938852250576, + "eval_runtime": 107.5607, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 329000 }, { - "epoch": 1.66, - "learning_rate": 5.101533214604638e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017207379316244188, + "loss": 0.0126, "step": 329010 }, { - "epoch": 1.66, - "learning_rate": 5.100776445303237e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017206990494607043, + "loss": 0.0101, "step": 329020 }, { - "epoch": 1.66, - "learning_rate": 5.100019676001836e-05, - "loss": 0.0103, + "epoch": 0.85, + "learning_rate": 0.00017206601672969894, + "loss": 0.0113, "step": 329030 }, { - "epoch": 1.66, - "learning_rate": 5.099262906700435e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017206212851332748, + "loss": 0.0129, "step": 329040 }, { - "epoch": 1.66, - "learning_rate": 5.098506137399034e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017205824029695605, + "loss": 0.0165, "step": 329050 }, { - "epoch": 1.66, - "learning_rate": 5.097749368097633e-05, - "loss": 0.0049, + "epoch": 0.85, + "learning_rate": 0.00017205435208058457, + "loss": 0.0136, "step": 329060 }, { - "epoch": 1.66, - "learning_rate": 5.096992598796232e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.0001720504638642131, + "loss": 0.015, "step": 329070 }, { - "epoch": 1.66, - "learning_rate": 5.096235829494831e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017204657564784162, + "loss": 0.0145, "step": 329080 }, { - "epoch": 1.66, - "learning_rate": 5.09547906019343e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.0001720426874314702, + "loss": 0.0143, "step": 329090 }, { - "epoch": 1.66, - "learning_rate": 5.094722290892029e-05, - "loss": 0.0097, + "epoch": 0.85, + "learning_rate": 0.0001720387992150987, + "loss": 0.013, "step": 329100 }, { - "epoch": 1.66, - "learning_rate": 5.093965521590628e-05, - "loss": 0.0046, + "epoch": 0.85, + "learning_rate": 0.00017203491099872725, + "loss": 0.0144, "step": 329110 }, { - "epoch": 1.66, - "learning_rate": 5.093208752289227e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.00017203102278235576, + "loss": 0.0118, "step": 329120 }, { - "epoch": 1.66, - "learning_rate": 5.092451982987826e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017202713456598433, + "loss": 0.0129, "step": 329130 }, { - "epoch": 1.66, - "learning_rate": 5.091695213686425e-05, - "loss": 0.0056, + "epoch": 0.85, + "learning_rate": 0.00017202324634961284, + "loss": 0.0175, "step": 329140 }, { - "epoch": 1.66, - "learning_rate": 5.090938444385023e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017201935813324139, + "loss": 0.0116, "step": 329150 }, { - "epoch": 1.66, - "learning_rate": 5.090181675083622e-05, - "loss": 0.0051, + "epoch": 0.85, + "learning_rate": 0.0001720154699168699, + "loss": 0.0123, "step": 329160 }, { - "epoch": 1.66, - "learning_rate": 5.0894249057822215e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017201158170049847, + "loss": 0.0142, "step": 329170 }, { - "epoch": 1.66, - "learning_rate": 5.08866813648082e-05, - "loss": 0.0091, + "epoch": 0.85, + "learning_rate": 0.00017200769348412698, + "loss": 0.015, "step": 329180 }, { - "epoch": 1.66, - "learning_rate": 5.087911367179419e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017200380526775553, + "loss": 0.0116, "step": 329190 }, { - "epoch": 1.66, - "learning_rate": 5.087154597878018e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.00017199991705138404, + "loss": 0.0145, "step": 329200 }, { - "epoch": 1.66, - "learning_rate": 5.0863978285766175e-05, - "loss": 0.0081, + "epoch": 0.85, + "learning_rate": 0.0001719960288350126, + "loss": 0.0157, "step": 329210 }, { - "epoch": 1.66, - "learning_rate": 5.085641059275216e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017199214061864115, + "loss": 0.0109, "step": 329220 }, { - "epoch": 1.66, - "learning_rate": 5.084884289973815e-05, - "loss": 0.0092, + "epoch": 0.85, + "learning_rate": 0.00017198825240226967, + "loss": 0.0126, "step": 329230 }, { - "epoch": 1.66, - "learning_rate": 5.084127520672414e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.0001719843641858982, + "loss": 0.0102, "step": 329240 }, { - "epoch": 1.66, - "learning_rate": 5.0833707513710134e-05, - "loss": 0.0042, + "epoch": 0.85, + "learning_rate": 0.00017198047596952672, + "loss": 0.0148, "step": 329250 }, { - "epoch": 1.66, - "learning_rate": 5.082613982069612e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.0001719765877531553, + "loss": 0.0178, "step": 329260 }, { - "epoch": 1.66, - "learning_rate": 5.081857212768211e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.0001719726995367838, + "loss": 0.0133, "step": 329270 }, { - "epoch": 1.66, - "learning_rate": 5.08110044346681e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.00017196881132041235, + "loss": 0.012, "step": 329280 }, { - "epoch": 1.66, - "learning_rate": 5.0803436741654094e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017196492310404086, + "loss": 0.013, "step": 329290 }, { - "epoch": 1.66, - "learning_rate": 5.079586904864008e-05, - "loss": 0.0045, + "epoch": 0.85, + "learning_rate": 0.00017196103488766943, + "loss": 0.0154, "step": 329300 }, { - "epoch": 1.66, - "learning_rate": 5.078830135562607e-05, - "loss": 0.0063, + "epoch": 0.85, + "learning_rate": 0.00017195714667129794, + "loss": 0.0109, "step": 329310 }, { - "epoch": 1.66, - "learning_rate": 5.078073366261206e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017195325845492649, + "loss": 0.0142, "step": 329320 }, { - "epoch": 1.66, - "learning_rate": 5.0773165969598054e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.000171949370238555, + "loss": 0.0132, "step": 329330 }, { - "epoch": 1.66, - "learning_rate": 5.076559827658404e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.00017194548202218357, + "loss": 0.0151, "step": 329340 }, { - "epoch": 1.66, - "learning_rate": 5.075803058357003e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017194159380581208, + "loss": 0.0124, "step": 329350 }, { - "epoch": 1.66, - "learning_rate": 5.075046289055602e-05, - "loss": 0.0078, + "epoch": 0.85, + "learning_rate": 0.00017193770558944063, + "loss": 0.0231, "step": 329360 }, { - "epoch": 1.66, - "learning_rate": 5.074289519754201e-05, - "loss": 0.0059, + "epoch": 0.85, + "learning_rate": 0.00017193381737306914, + "loss": 0.0133, "step": 329370 }, { - "epoch": 1.66, - "learning_rate": 5.0735327504528e-05, - "loss": 0.0109, + "epoch": 0.85, + "learning_rate": 0.0001719299291566977, + "loss": 0.0112, "step": 329380 }, { - "epoch": 1.66, - "learning_rate": 5.072775981151399e-05, - "loss": 0.0044, + "epoch": 0.85, + "learning_rate": 0.00017192604094032625, + "loss": 0.0149, "step": 329390 }, { - "epoch": 1.66, - "learning_rate": 5.072019211849998e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017192215272395476, + "loss": 0.0142, "step": 329400 }, { - "epoch": 1.66, - "learning_rate": 5.071262442548597e-05, - "loss": 0.0076, + "epoch": 0.85, + "learning_rate": 0.00017191826450758328, + "loss": 0.0253, "step": 329410 }, { - "epoch": 1.66, - "learning_rate": 5.070505673247196e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017191437629121185, + "loss": 0.0118, "step": 329420 }, { - "epoch": 1.66, - "learning_rate": 5.069748903945795e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.0001719104880748404, + "loss": 0.0094, "step": 329430 }, { - "epoch": 1.66, - "learning_rate": 5.068992134644394e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.0001719065998584689, + "loss": 0.016, "step": 329440 }, { - "epoch": 1.66, - "learning_rate": 5.068235365342993e-05, - "loss": 0.0077, + "epoch": 0.85, + "learning_rate": 0.00017190271164209745, + "loss": 0.0149, "step": 329450 }, { - "epoch": 1.66, - "learning_rate": 5.067478596041592e-05, - "loss": 0.008, + "epoch": 0.85, + "learning_rate": 0.000171898823425726, + "loss": 0.0165, "step": 329460 }, { - "epoch": 1.66, - "learning_rate": 5.06672182674019e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017189493520935453, + "loss": 0.0103, "step": 329470 }, { - "epoch": 1.66, - "learning_rate": 5.065965057438789e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017189104699298304, + "loss": 0.0106, "step": 329480 }, { - "epoch": 1.66, - "learning_rate": 5.065208288137388e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017188715877661159, + "loss": 0.013, "step": 329490 }, { - "epoch": 1.66, - "learning_rate": 5.0644515188359874e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.0001718832705602401, + "loss": 0.0111, "step": 329500 }, { - "epoch": 1.66, - "learning_rate": 5.063694749534586e-05, - "loss": 0.0047, + "epoch": 0.85, + "learning_rate": 0.00017187938234386867, + "loss": 0.0145, "step": 329510 }, { - "epoch": 1.66, - "learning_rate": 5.062937980233185e-05, - "loss": 0.0085, + "epoch": 0.85, + "learning_rate": 0.00017187549412749718, + "loss": 0.0162, "step": 329520 }, { - "epoch": 1.66, - "learning_rate": 5.062181210931784e-05, - "loss": 0.007, + "epoch": 0.85, + "learning_rate": 0.00017187160591112572, + "loss": 0.0129, "step": 329530 }, { - "epoch": 1.66, - "learning_rate": 5.061424441630383e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017186771769475424, + "loss": 0.0222, "step": 329540 }, { - "epoch": 1.66, - "learning_rate": 5.060667672328982e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.0001718638294783828, + "loss": 0.0121, "step": 329550 }, { - "epoch": 1.66, - "learning_rate": 5.059910903027581e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017185994126201132, + "loss": 0.0138, "step": 329560 }, { - "epoch": 1.66, - "learning_rate": 5.05915413372618e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.00017185605304563986, + "loss": 0.0118, "step": 329570 }, { - "epoch": 1.66, - "learning_rate": 5.058397364424779e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017185216482926838, + "loss": 0.0111, "step": 329580 }, { - "epoch": 1.66, - "learning_rate": 5.057640595123378e-05, - "loss": 0.0068, + "epoch": 0.85, + "learning_rate": 0.00017184827661289695, + "loss": 0.0156, "step": 329590 }, { - "epoch": 1.66, - "learning_rate": 5.056883825821977e-05, - "loss": 0.0047, + "epoch": 0.85, + "learning_rate": 0.0001718443883965255, + "loss": 0.0132, "step": 329600 }, { - "epoch": 1.66, - "learning_rate": 5.056127056520576e-05, - "loss": 0.006, + "epoch": 0.85, + "learning_rate": 0.000171840500180154, + "loss": 0.0138, "step": 329610 }, { - "epoch": 1.66, - "learning_rate": 5.055370287219175e-05, - "loss": 0.0069, + "epoch": 0.85, + "learning_rate": 0.00017183661196378255, + "loss": 0.0125, "step": 329620 }, { - "epoch": 1.66, - "learning_rate": 5.054613517917774e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.0001718327237474111, + "loss": 0.0167, "step": 329630 }, { - "epoch": 1.66, - "learning_rate": 5.053856748616373e-05, - "loss": 0.0065, + "epoch": 0.85, + "learning_rate": 0.00017182883553103963, + "loss": 0.0159, "step": 329640 }, { - "epoch": 1.66, - "learning_rate": 5.0530999793149724e-05, - "loss": 0.0072, + "epoch": 0.85, + "learning_rate": 0.00017182494731466814, + "loss": 0.0127, "step": 329650 }, { - "epoch": 1.66, - "learning_rate": 5.052343210013571e-05, - "loss": 0.0083, + "epoch": 0.85, + "learning_rate": 0.00017182105909829668, + "loss": 0.0129, "step": 329660 }, { - "epoch": 1.66, - "learning_rate": 5.05158644071217e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017181717088192523, + "loss": 0.0138, "step": 329670 }, { - "epoch": 1.66, - "learning_rate": 5.050829671410769e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017181328266555377, + "loss": 0.0125, "step": 329680 }, { - "epoch": 1.66, - "learning_rate": 5.0500729021093684e-05, - "loss": 0.0079, + "epoch": 0.85, + "learning_rate": 0.00017180939444918228, + "loss": 0.0113, "step": 329690 }, { - "epoch": 1.66, - "learning_rate": 5.049316132807967e-05, - "loss": 0.0057, + "epoch": 0.85, + "learning_rate": 0.00017180550623281082, + "loss": 0.0139, "step": 329700 }, { - "epoch": 1.66, - "learning_rate": 5.048559363506566e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.0001718016180164394, + "loss": 0.0163, "step": 329710 }, { - "epoch": 1.66, - "learning_rate": 5.047802594205165e-05, - "loss": 0.0071, + "epoch": 0.85, + "learning_rate": 0.0001717977298000679, + "loss": 0.0123, "step": 329720 }, { - "epoch": 1.66, - "learning_rate": 5.047045824903764e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017179384158369642, + "loss": 0.0134, "step": 329730 }, { - "epoch": 1.66, - "learning_rate": 5.046289055602363e-05, - "loss": 0.0075, + "epoch": 0.85, + "learning_rate": 0.00017178995336732496, + "loss": 0.0121, "step": 329740 }, { - "epoch": 1.66, - "learning_rate": 5.045532286300962e-05, - "loss": 0.0062, + "epoch": 0.85, + "learning_rate": 0.00017178606515095348, + "loss": 0.0131, "step": 329750 }, { - "epoch": 1.66, - "learning_rate": 5.044775516999561e-05, - "loss": 0.0061, + "epoch": 0.85, + "learning_rate": 0.00017178217693458205, + "loss": 0.016, "step": 329760 }, { - "epoch": 1.66, - "learning_rate": 5.04401874769816e-05, - "loss": 0.0073, + "epoch": 0.85, + "learning_rate": 0.0001717782887182106, + "loss": 0.0152, "step": 329770 }, { - "epoch": 1.66, - "learning_rate": 5.0432619783967584e-05, - "loss": 0.0082, + "epoch": 0.85, + "learning_rate": 0.0001717744005018391, + "loss": 0.0106, "step": 329780 }, { - "epoch": 1.66, - "learning_rate": 5.042505209095357e-05, - "loss": 0.0096, + "epoch": 0.85, + "learning_rate": 0.00017177051228546764, + "loss": 0.0146, "step": 329790 }, { - "epoch": 1.66, - "learning_rate": 5.041748439793956e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017176662406909619, + "loss": 0.015, "step": 329800 }, { - "epoch": 1.66, - "learning_rate": 5.040991670492555e-05, - "loss": 0.0064, + "epoch": 0.85, + "learning_rate": 0.00017176273585272473, + "loss": 0.0155, "step": 329810 }, { - "epoch": 1.66, - "learning_rate": 5.0402349011911544e-05, - "loss": 0.0067, + "epoch": 0.85, + "learning_rate": 0.00017175884763635324, + "loss": 0.0131, "step": 329820 }, { - "epoch": 1.66, - "learning_rate": 5.039478131889753e-05, - "loss": 0.0074, + "epoch": 0.85, + "learning_rate": 0.00017175495941998178, + "loss": 0.0152, "step": 329830 }, { - "epoch": 1.66, - "learning_rate": 5.038721362588352e-05, - "loss": 0.0054, + "epoch": 0.85, + "learning_rate": 0.00017175107120361033, + "loss": 0.0122, "step": 329840 }, { - "epoch": 1.66, - "learning_rate": 5.037964593286951e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017174718298723887, + "loss": 0.0153, "step": 329850 }, { - "epoch": 1.66, - "learning_rate": 5.0372078239855504e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.00017174329477086738, + "loss": 0.0179, "step": 329860 }, { - "epoch": 1.66, - "learning_rate": 5.036451054684149e-05, - "loss": 0.0104, + "epoch": 0.86, + "learning_rate": 0.00017173940655449592, + "loss": 0.013, "step": 329870 }, { - "epoch": 1.66, - "learning_rate": 5.035694285382748e-05, - "loss": 0.0092, + "epoch": 0.86, + "learning_rate": 0.00017173551833812447, + "loss": 0.0115, "step": 329880 }, { - "epoch": 1.66, - "learning_rate": 5.034937516081347e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.000171731630121753, + "loss": 0.0168, "step": 329890 }, { - "epoch": 1.66, - "learning_rate": 5.034180746779946e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017172774190538152, + "loss": 0.0148, "step": 329900 }, { - "epoch": 1.66, - "learning_rate": 5.033423977478545e-05, - "loss": 0.0043, + "epoch": 0.86, + "learning_rate": 0.00017172385368901006, + "loss": 0.0208, "step": 329910 }, { - "epoch": 1.66, - "learning_rate": 5.032667208177144e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017171996547263863, + "loss": 0.0132, "step": 329920 }, { - "epoch": 1.66, - "learning_rate": 5.031910438875743e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017171607725626715, + "loss": 0.0151, "step": 329930 }, { - "epoch": 1.66, - "learning_rate": 5.031153669574342e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.0001717121890398957, + "loss": 0.0174, "step": 329940 }, { - "epoch": 1.66, - "learning_rate": 5.030396900272941e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001717083008235242, + "loss": 0.0138, "step": 329950 }, { - "epoch": 1.66, - "learning_rate": 5.02964013097154e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017170441260715277, + "loss": 0.0126, "step": 329960 }, { - "epoch": 1.66, - "learning_rate": 5.028883361670139e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017170052439078129, + "loss": 0.0125, "step": 329970 }, { - "epoch": 1.66, - "learning_rate": 5.028126592368738e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017169663617440983, + "loss": 0.0162, "step": 329980 }, { - "epoch": 1.66, - "learning_rate": 5.027369823067337e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017169274795803834, + "loss": 0.0123, "step": 329990 }, { - "epoch": 1.66, - "learning_rate": 5.026613053765936e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017168885974166688, + "loss": 0.0171, "step": 330000 }, { - "epoch": 1.66, - "eval_cer": 0.9144411440194001, - "eval_loss": 0.0048608663491904736, - "eval_runtime": 116.3415, - "eval_samples_per_second": 17.191, - "eval_steps_per_second": 4.298, + "epoch": 0.86, + "eval_cer": 0.881719481966378, + "eval_loss": 0.008729472756385803, + "eval_runtime": 107.757, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, "step": 330000 }, { - "epoch": 1.66, - "learning_rate": 5.025856284464535e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017168497152529543, + "loss": 0.0129, "step": 330010 }, { - "epoch": 1.66, - "learning_rate": 5.025099515163134e-05, - "loss": 0.0089, + "epoch": 0.86, + "learning_rate": 0.00017168108330892397, + "loss": 0.0154, "step": 330020 }, { - "epoch": 1.67, - "learning_rate": 5.024342745861733e-05, - "loss": 0.0044, + "epoch": 0.86, + "learning_rate": 0.00017167719509255248, + "loss": 0.0135, "step": 330030 }, { - "epoch": 1.67, - "learning_rate": 5.023585976560332e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017167330687618102, + "loss": 0.0169, "step": 330040 }, { - "epoch": 1.67, - "learning_rate": 5.022829207258931e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017166941865980956, + "loss": 0.0126, "step": 330050 }, { - "epoch": 1.67, - "learning_rate": 5.02207243795753e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001716655304434381, + "loss": 0.0143, "step": 330060 }, { - "epoch": 1.67, - "learning_rate": 5.021315668656129e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017166164222706662, + "loss": 0.0127, "step": 330070 }, { - "epoch": 1.67, - "learning_rate": 5.020558899354728e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.00017165775401069516, + "loss": 0.011, "step": 330080 }, { - "epoch": 1.67, - "learning_rate": 5.019802130053326e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017165386579432373, + "loss": 0.0126, "step": 330090 }, { - "epoch": 1.67, - "learning_rate": 5.0190453607519255e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017164997757795225, + "loss": 0.0132, "step": 330100 }, { - "epoch": 1.67, - "learning_rate": 5.018288591450524e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001716460893615808, + "loss": 0.0159, "step": 330110 }, { - "epoch": 1.67, - "learning_rate": 5.017531822149123e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001716422011452093, + "loss": 0.0141, "step": 330120 }, { - "epoch": 1.67, - "learning_rate": 5.016775052847722e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017163831292883787, + "loss": 0.0119, "step": 330130 }, { - "epoch": 1.67, - "learning_rate": 5.0160182835463214e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017163442471246638, + "loss": 0.0111, "step": 330140 }, { - "epoch": 1.67, - "learning_rate": 5.01526151424492e-05, - "loss": 0.01, + "epoch": 0.86, + "learning_rate": 0.00017163053649609493, + "loss": 0.0141, "step": 330150 }, { - "epoch": 1.67, - "learning_rate": 5.014504744943519e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017162664827972344, + "loss": 0.0101, "step": 330160 }, { - "epoch": 1.67, - "learning_rate": 5.013747975642118e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.000171622760063352, + "loss": 0.0165, "step": 330170 }, { - "epoch": 1.67, - "learning_rate": 5.0129912063407174e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017161887184698052, + "loss": 0.0127, "step": 330180 }, { - "epoch": 1.67, - "learning_rate": 5.012234437039316e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017161498363060907, + "loss": 0.0128, "step": 330190 }, { - "epoch": 1.67, - "learning_rate": 5.011477667737915e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017161109541423758, + "loss": 0.0119, "step": 330200 }, { - "epoch": 1.67, - "learning_rate": 5.010720898436514e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017160720719786615, + "loss": 0.0122, "step": 330210 }, { - "epoch": 1.67, - "learning_rate": 5.0099641291351134e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017160331898149466, + "loss": 0.0122, "step": 330220 }, { - "epoch": 1.67, - "learning_rate": 5.009207359833712e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.0001715994307651232, + "loss": 0.0159, "step": 330230 }, { - "epoch": 1.67, - "learning_rate": 5.008450590532311e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017159554254875172, + "loss": 0.0131, "step": 330240 }, { - "epoch": 1.67, - "learning_rate": 5.00769382123091e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017159165433238026, + "loss": 0.0141, "step": 330250 }, { - "epoch": 1.67, - "learning_rate": 5.0069370519295093e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017158776611600883, + "loss": 0.0148, "step": 330260 }, { - "epoch": 1.67, - "learning_rate": 5.006180282628108e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017158387789963734, + "loss": 0.0136, "step": 330270 }, { - "epoch": 1.67, - "learning_rate": 5.005423513326707e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017157998968326586, + "loss": 0.016, "step": 330280 }, { - "epoch": 1.67, - "learning_rate": 5.004666744025306e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.0001715761014668944, + "loss": 0.0119, "step": 330290 }, { - "epoch": 1.67, - "learning_rate": 5.003909974723905e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017157221325052297, + "loss": 0.0149, "step": 330300 }, { - "epoch": 1.67, - "learning_rate": 5.003153205422504e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017156832503415148, + "loss": 0.012, "step": 330310 }, { - "epoch": 1.67, - "learning_rate": 5.002396436121103e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017156443681778003, + "loss": 0.0102, "step": 330320 }, { - "epoch": 1.67, - "learning_rate": 5.001639666819702e-05, - "loss": 0.0099, + "epoch": 0.86, + "learning_rate": 0.00017156054860140854, + "loss": 0.0113, "step": 330330 }, { - "epoch": 1.67, - "learning_rate": 5.000882897518301e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001715566603850371, + "loss": 0.0127, "step": 330340 }, { - "epoch": 1.67, - "learning_rate": 5.0001261282169e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017155277216866562, + "loss": 0.0156, "step": 330350 }, { - "epoch": 1.67, - "learning_rate": 4.999369358915499e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017154888395229417, + "loss": 0.0149, "step": 330360 }, { - "epoch": 1.67, - "learning_rate": 4.998612589614098e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017154499573592268, + "loss": 0.0176, "step": 330370 }, { - "epoch": 1.67, - "learning_rate": 4.997855820312697e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017154110751955125, + "loss": 0.0153, "step": 330380 }, { - "epoch": 1.67, - "learning_rate": 4.997099051011296e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017153721930317976, + "loss": 0.0135, "step": 330390 }, { - "epoch": 1.67, - "learning_rate": 4.996342281709895e-05, - "loss": 0.0042, + "epoch": 0.86, + "learning_rate": 0.0001715333310868083, + "loss": 0.0135, "step": 330400 }, { - "epoch": 1.67, - "learning_rate": 4.995585512408493e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017152944287043682, + "loss": 0.0138, "step": 330410 }, { - "epoch": 1.67, - "learning_rate": 4.994828743107092e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.0001715255546540654, + "loss": 0.0133, "step": 330420 }, { - "epoch": 1.67, - "learning_rate": 4.9940719738056913e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017152166643769393, + "loss": 0.014, "step": 330430 }, { - "epoch": 1.67, - "learning_rate": 4.99331520450429e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017151777822132244, + "loss": 0.0143, "step": 330440 }, { - "epoch": 1.67, - "learning_rate": 4.992558435202889e-05, - "loss": 0.0114, + "epoch": 0.86, + "learning_rate": 0.00017151389000495096, + "loss": 0.0118, "step": 330450 }, { - "epoch": 1.67, - "learning_rate": 4.991801665901488e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017151000178857953, + "loss": 0.0109, "step": 330460 }, { - "epoch": 1.67, - "learning_rate": 4.991044896600087e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.00017150611357220807, + "loss": 0.0138, "step": 330470 }, { - "epoch": 1.67, - "learning_rate": 4.990288127298686e-05, - "loss": 0.0147, + "epoch": 0.86, + "learning_rate": 0.00017150222535583658, + "loss": 0.0124, "step": 330480 }, { - "epoch": 1.67, - "learning_rate": 4.989531357997285e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017149833713946513, + "loss": 0.0115, "step": 330490 }, { - "epoch": 1.67, - "learning_rate": 4.988774588695884e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.00017149444892309364, + "loss": 0.018, "step": 330500 }, { - "epoch": 1.67, - "learning_rate": 4.988017819394483e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.0001714905607067222, + "loss": 0.0112, "step": 330510 }, { - "epoch": 1.67, - "learning_rate": 4.987261050093082e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017148667249035072, + "loss": 0.0116, "step": 330520 }, { - "epoch": 1.67, - "learning_rate": 4.986504280791681e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017148278427397926, + "loss": 0.0113, "step": 330530 }, { - "epoch": 1.67, - "learning_rate": 4.98574751149028e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017147889605760778, + "loss": 0.0144, "step": 330540 }, { - "epoch": 1.67, - "learning_rate": 4.984990742188879e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017147500784123635, + "loss": 0.0136, "step": 330550 }, { - "epoch": 1.67, - "learning_rate": 4.984233972887478e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017147111962486486, + "loss": 0.0137, "step": 330560 }, { - "epoch": 1.67, - "learning_rate": 4.983477203586077e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001714672314084934, + "loss": 0.0128, "step": 330570 }, { - "epoch": 1.67, - "learning_rate": 4.982720434284676e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017146334319212192, + "loss": 0.0134, "step": 330580 }, { - "epoch": 1.67, - "learning_rate": 4.981963664983275e-05, - "loss": 0.0046, + "epoch": 0.86, + "learning_rate": 0.0001714594549757505, + "loss": 0.0225, "step": 330590 }, { - "epoch": 1.67, - "learning_rate": 4.981206895681874e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.000171455566759379, + "loss": 0.0123, "step": 330600 }, { - "epoch": 1.67, - "learning_rate": 4.980450126380473e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017145167854300754, + "loss": 0.017, "step": 330610 }, { - "epoch": 1.67, - "learning_rate": 4.9796933570790724e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017144779032663606, + "loss": 0.0155, "step": 330620 }, { - "epoch": 1.67, - "learning_rate": 4.978936587777671e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017144390211026463, + "loss": 0.0159, "step": 330630 }, { - "epoch": 1.67, - "learning_rate": 4.97817981847627e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017144001389389317, + "loss": 0.013, "step": 330640 }, { - "epoch": 1.67, - "learning_rate": 4.977423049174869e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017143612567752168, + "loss": 0.0136, "step": 330650 }, { - "epoch": 1.67, - "learning_rate": 4.976666279873468e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017143223746115022, + "loss": 0.0144, "step": 330660 }, { - "epoch": 1.67, - "learning_rate": 4.975909510572067e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017142834924477877, + "loss": 0.0139, "step": 330670 }, { - "epoch": 1.67, - "learning_rate": 4.975152741270666e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.0001714244610284073, + "loss": 0.0201, "step": 330680 }, { - "epoch": 1.67, - "learning_rate": 4.974395971969265e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017142057281203582, + "loss": 0.0151, "step": 330690 }, { - "epoch": 1.67, - "learning_rate": 4.973639202667864e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017141668459566436, + "loss": 0.0164, "step": 330700 }, { - "epoch": 1.67, - "learning_rate": 4.972882433366463e-05, - "loss": 0.0089, + "epoch": 0.86, + "learning_rate": 0.0001714127963792929, + "loss": 0.0154, "step": 330710 }, { - "epoch": 1.67, - "learning_rate": 4.972125664065061e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017140890816292145, + "loss": 0.0152, "step": 330720 }, { - "epoch": 1.67, - "learning_rate": 4.97136889476366e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017140501994654996, + "loss": 0.0147, "step": 330730 }, { - "epoch": 1.67, - "learning_rate": 4.970612125462259e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.0001714011317301785, + "loss": 0.0122, "step": 330740 }, { - "epoch": 1.67, - "learning_rate": 4.9698553561608584e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017139724351380702, + "loss": 0.0146, "step": 330750 }, { - "epoch": 1.67, - "learning_rate": 4.969098586859457e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.0001713933552974356, + "loss": 0.0129, "step": 330760 }, { - "epoch": 1.67, - "learning_rate": 4.968341817558056e-05, - "loss": 0.0039, + "epoch": 0.86, + "learning_rate": 0.0001713894670810641, + "loss": 0.0182, "step": 330770 }, { - "epoch": 1.67, - "learning_rate": 4.967585048256655e-05, - "loss": 0.0102, + "epoch": 0.86, + "learning_rate": 0.00017138557886469264, + "loss": 0.019, "step": 330780 }, { - "epoch": 1.67, - "learning_rate": 4.9668282789552544e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017138169064832116, + "loss": 0.0162, "step": 330790 }, { - "epoch": 1.67, - "learning_rate": 4.966071509653853e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017137780243194973, + "loss": 0.0137, "step": 330800 }, { - "epoch": 1.67, - "learning_rate": 4.965314740352452e-05, - "loss": 0.0046, + "epoch": 0.86, + "learning_rate": 0.00017137391421557827, + "loss": 0.0141, "step": 330810 }, { - "epoch": 1.67, - "learning_rate": 4.964557971051051e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.00017137002599920678, + "loss": 0.0165, "step": 330820 }, { - "epoch": 1.67, - "learning_rate": 4.96380120174965e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017136613778283532, + "loss": 0.0161, "step": 330830 }, { - "epoch": 1.67, - "learning_rate": 4.963044432448249e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017136224956646387, + "loss": 0.0141, "step": 330840 }, { - "epoch": 1.67, - "learning_rate": 4.962287663146848e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001713583613500924, + "loss": 0.0126, "step": 330850 }, { - "epoch": 1.67, - "learning_rate": 4.961530893845447e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017135447313372092, + "loss": 0.0146, "step": 330860 }, { - "epoch": 1.67, - "learning_rate": 4.960774124544046e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017135058491734946, + "loss": 0.0105, "step": 330870 }, { - "epoch": 1.67, - "learning_rate": 4.960017355242645e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.000171346696700978, + "loss": 0.014, "step": 330880 }, { - "epoch": 1.67, - "learning_rate": 4.959260585941244e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017134280848460655, + "loss": 0.0153, "step": 330890 }, { - "epoch": 1.67, - "learning_rate": 4.958503816639843e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017133892026823506, + "loss": 0.013, "step": 330900 }, { - "epoch": 1.67, - "learning_rate": 4.957747047338442e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.0001713350320518636, + "loss": 0.0146, "step": 330910 }, { - "epoch": 1.67, - "learning_rate": 4.956990278037041e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017133114383549214, + "loss": 0.0178, "step": 330920 }, { - "epoch": 1.67, - "learning_rate": 4.95623350873564e-05, - "loss": 0.0081, + "epoch": 0.86, + "learning_rate": 0.0001713272556191207, + "loss": 0.0146, "step": 330930 }, { - "epoch": 1.67, - "learning_rate": 4.955476739434239e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.0001713233674027492, + "loss": 0.0125, "step": 330940 }, { - "epoch": 1.67, - "learning_rate": 4.954719970132838e-05, - "loss": 0.0089, + "epoch": 0.86, + "learning_rate": 0.00017131947918637774, + "loss": 0.0151, "step": 330950 }, { - "epoch": 1.67, - "learning_rate": 4.953963200831437e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.0001713155909700063, + "loss": 0.0131, "step": 330960 }, { - "epoch": 1.67, - "learning_rate": 4.953206431530036e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017131170275363483, + "loss": 0.0151, "step": 330970 }, { - "epoch": 1.67, - "learning_rate": 4.952449662228635e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017130781453726337, + "loss": 0.0112, "step": 330980 }, { - "epoch": 1.67, - "learning_rate": 4.951692892927234e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017130392632089188, + "loss": 0.0154, "step": 330990 }, { - "epoch": 1.67, - "learning_rate": 4.950936123625833e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.0001713000381045204, + "loss": 0.0131, "step": 331000 }, { - "epoch": 1.67, - "eval_cer": 0.9144440552077764, - "eval_loss": 0.004910916555672884, - "eval_runtime": 116.3705, - "eval_samples_per_second": 17.186, - "eval_steps_per_second": 4.297, + "epoch": 0.86, + "eval_cer": 0.881751673615864, + "eval_loss": 0.008923850953578949, + "eval_runtime": 107.6261, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 331000 }, { - "epoch": 1.67, - "learning_rate": 4.950179354324432e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017129614988814897, + "loss": 0.0114, "step": 331010 }, { - "epoch": 1.67, - "learning_rate": 4.9494225850230306e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.0001712922616717775, + "loss": 0.0155, "step": 331020 }, { - "epoch": 1.67, - "learning_rate": 4.94866581572163e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017128837345540602, + "loss": 0.0134, "step": 331030 }, { - "epoch": 1.67, - "learning_rate": 4.947909046420228e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017128448523903456, + "loss": 0.0115, "step": 331040 }, { - "epoch": 1.67, - "learning_rate": 4.947152277118827e-05, - "loss": 0.0093, + "epoch": 0.86, + "learning_rate": 0.0001712805970226631, + "loss": 0.012, "step": 331050 }, { - "epoch": 1.67, - "learning_rate": 4.946395507817426e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017127670880629165, + "loss": 0.0119, "step": 331060 }, { - "epoch": 1.67, - "learning_rate": 4.9456387385160254e-05, - "loss": 0.0041, + "epoch": 0.86, + "learning_rate": 0.00017127282058992016, + "loss": 0.0099, "step": 331070 }, { - "epoch": 1.67, - "learning_rate": 4.944881969214624e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.0001712689323735487, + "loss": 0.0112, "step": 331080 }, { - "epoch": 1.67, - "learning_rate": 4.944125199913223e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017126504415717724, + "loss": 0.0124, "step": 331090 }, { - "epoch": 1.67, - "learning_rate": 4.943368430611822e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017126115594080579, + "loss": 0.0145, "step": 331100 }, { - "epoch": 1.67, - "learning_rate": 4.9426116613104214e-05, - "loss": 0.0081, + "epoch": 0.86, + "learning_rate": 0.0001712572677244343, + "loss": 0.0109, "step": 331110 }, { - "epoch": 1.67, - "learning_rate": 4.94185489200902e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017125337950806284, + "loss": 0.0146, "step": 331120 }, { - "epoch": 1.67, - "learning_rate": 4.941098122707619e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001712494912916914, + "loss": 0.0133, "step": 331130 }, { - "epoch": 1.67, - "learning_rate": 4.940341353406218e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017124560307531993, + "loss": 0.0123, "step": 331140 }, { - "epoch": 1.67, - "learning_rate": 4.9395845841048174e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017124171485894844, + "loss": 0.0105, "step": 331150 }, { - "epoch": 1.67, - "learning_rate": 4.938827814803416e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017123782664257698, + "loss": 0.0137, "step": 331160 }, { - "epoch": 1.67, - "learning_rate": 4.938071045502015e-05, - "loss": 0.0091, + "epoch": 0.86, + "learning_rate": 0.00017123393842620555, + "loss": 0.0087, "step": 331170 }, { - "epoch": 1.67, - "learning_rate": 4.937314276200614e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017123005020983406, + "loss": 0.014, "step": 331180 }, { - "epoch": 1.67, - "learning_rate": 4.936557506899213e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.0001712261619934626, + "loss": 0.0133, "step": 331190 }, { - "epoch": 1.67, - "learning_rate": 4.935800737597812e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017122227377709112, + "loss": 0.0117, "step": 331200 }, { - "epoch": 1.67, - "learning_rate": 4.935043968296411e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.0001712183855607197, + "loss": 0.0222, "step": 331210 }, { - "epoch": 1.67, - "learning_rate": 4.93428719899501e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.0001712144973443482, + "loss": 0.0128, "step": 331220 }, { - "epoch": 1.67, - "learning_rate": 4.933530429693609e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.00017121060912797675, + "loss": 0.0151, "step": 331230 }, { - "epoch": 1.67, - "learning_rate": 4.932773660392208e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017120672091160526, + "loss": 0.0166, "step": 331240 }, { - "epoch": 1.67, - "learning_rate": 4.932016891090807e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001712028326952338, + "loss": 0.0176, "step": 331250 }, { - "epoch": 1.67, - "learning_rate": 4.931260121789406e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017119894447886234, + "loss": 0.0131, "step": 331260 }, { - "epoch": 1.67, - "learning_rate": 4.930503352488005e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017119505626249089, + "loss": 0.0138, "step": 331270 }, { - "epoch": 1.67, - "learning_rate": 4.929746583186604e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001711911680461194, + "loss": 0.0142, "step": 331280 }, { - "epoch": 1.67, - "learning_rate": 4.928989813885203e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017118727982974794, + "loss": 0.0138, "step": 331290 }, { - "epoch": 1.67, - "learning_rate": 4.928233044583802e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.0001711833916133765, + "loss": 0.0156, "step": 331300 }, { - "epoch": 1.67, - "learning_rate": 4.927476275282401e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017117950339700502, + "loss": 0.0109, "step": 331310 }, { - "epoch": 1.67, - "learning_rate": 4.926719505981e-05, - "loss": 0.0098, + "epoch": 0.86, + "learning_rate": 0.00017117561518063354, + "loss": 0.0128, "step": 331320 }, { - "epoch": 1.67, - "learning_rate": 4.925962736679599e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.00017117172696426208, + "loss": 0.0102, "step": 331330 }, { - "epoch": 1.67, - "learning_rate": 4.925205967378198e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017116783874789065, + "loss": 0.0139, "step": 331340 }, { - "epoch": 1.67, - "learning_rate": 4.924449198076796e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017116395053151916, + "loss": 0.0145, "step": 331350 }, { - "epoch": 1.67, - "learning_rate": 4.923692428775395e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.0001711600623151477, + "loss": 0.017, "step": 331360 }, { - "epoch": 1.67, - "learning_rate": 4.922935659473994e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017115617409877622, + "loss": 0.0148, "step": 331370 }, { - "epoch": 1.67, - "learning_rate": 4.922178890172593e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.0001711522858824048, + "loss": 0.0167, "step": 331380 }, { - "epoch": 1.67, - "learning_rate": 4.921422120871192e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.0001711483976660333, + "loss": 0.0107, "step": 331390 }, { - "epoch": 1.67, - "learning_rate": 4.920665351569791e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017114450944966185, + "loss": 0.0157, "step": 331400 }, { - "epoch": 1.67, - "learning_rate": 4.91990858226839e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017114062123329036, + "loss": 0.0146, "step": 331410 }, { - "epoch": 1.67, - "learning_rate": 4.919151812966989e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017113673301691893, + "loss": 0.0148, "step": 331420 }, { - "epoch": 1.67, - "learning_rate": 4.918395043665588e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017113284480054744, + "loss": 0.0122, "step": 331430 }, { - "epoch": 1.67, - "learning_rate": 4.917638274364187e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017112895658417598, + "loss": 0.0095, "step": 331440 }, { - "epoch": 1.67, - "learning_rate": 4.916881505062786e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.0001711250683678045, + "loss": 0.0139, "step": 331450 }, { - "epoch": 1.67, - "learning_rate": 4.916124735761385e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017112118015143307, + "loss": 0.0113, "step": 331460 }, { - "epoch": 1.67, - "learning_rate": 4.915367966459984e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017111729193506158, + "loss": 0.0146, "step": 331470 }, { - "epoch": 1.67, - "learning_rate": 4.914611197158583e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017111340371869012, + "loss": 0.0152, "step": 331480 }, { - "epoch": 1.67, - "learning_rate": 4.913854427857182e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017110951550231864, + "loss": 0.0145, "step": 331490 }, { - "epoch": 1.67, - "learning_rate": 4.913097658555781e-05, - "loss": 0.0074, + "epoch": 0.86, + "learning_rate": 0.00017110562728594718, + "loss": 0.0123, "step": 331500 }, { - "epoch": 1.67, - "learning_rate": 4.91234088925438e-05, - "loss": 0.0082, + "epoch": 0.86, + "learning_rate": 0.00017110173906957575, + "loss": 0.0177, "step": 331510 }, { - "epoch": 1.67, - "learning_rate": 4.911584119952979e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017109785085320426, + "loss": 0.0129, "step": 331520 }, { - "epoch": 1.67, - "learning_rate": 4.910827350651578e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001710939626368328, + "loss": 0.0123, "step": 331530 }, { - "epoch": 1.67, - "learning_rate": 4.910070581350177e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017109007442046132, + "loss": 0.0134, "step": 331540 }, { - "epoch": 1.67, - "learning_rate": 4.909313812048776e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.0001710861862040899, + "loss": 0.0136, "step": 331550 }, { - "epoch": 1.67, - "learning_rate": 4.908557042747375e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.0001710822979877184, + "loss": 0.015, "step": 331560 }, { - "epoch": 1.67, - "learning_rate": 4.907800273445974e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017107840977134694, + "loss": 0.0148, "step": 331570 }, { - "epoch": 1.67, - "learning_rate": 4.907043504144573e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017107452155497546, + "loss": 0.013, "step": 331580 }, { - "epoch": 1.67, - "learning_rate": 4.906286734843172e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017107063333860403, + "loss": 0.0106, "step": 331590 }, { - "epoch": 1.67, - "learning_rate": 4.905529965541771e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017106674512223254, + "loss": 0.0158, "step": 331600 }, { - "epoch": 1.67, - "learning_rate": 4.90477319624037e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017106285690586108, + "loss": 0.0109, "step": 331610 }, { - "epoch": 1.67, - "learning_rate": 4.904016426938969e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.0001710589686894896, + "loss": 0.0098, "step": 331620 }, { - "epoch": 1.67, - "learning_rate": 4.903259657637568e-05, - "loss": 0.0098, + "epoch": 0.86, + "learning_rate": 0.00017105508047311817, + "loss": 0.0135, "step": 331630 }, { - "epoch": 1.67, - "learning_rate": 4.902502888336167e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017105119225674668, + "loss": 0.0149, "step": 331640 }, { - "epoch": 1.67, - "learning_rate": 4.901746119034766e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017104730404037522, + "loss": 0.014, "step": 331650 }, { - "epoch": 1.67, - "learning_rate": 4.900989349733365e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017104341582400374, + "loss": 0.0132, "step": 331660 }, { - "epoch": 1.67, - "learning_rate": 4.900232580431963e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.0001710395276076323, + "loss": 0.0137, "step": 331670 }, { - "epoch": 1.67, - "learning_rate": 4.8994758111305624e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017103563939126085, + "loss": 0.0146, "step": 331680 }, { - "epoch": 1.67, - "learning_rate": 4.898719041829161e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017103175117488936, + "loss": 0.0137, "step": 331690 }, { - "epoch": 1.67, - "learning_rate": 4.89796227252776e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001710278629585179, + "loss": 0.0107, "step": 331700 }, { - "epoch": 1.67, - "learning_rate": 4.897205503226359e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017102397474214645, + "loss": 0.0133, "step": 331710 }, { - "epoch": 1.67, - "learning_rate": 4.8964487339249583e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.000171020086525775, + "loss": 0.0117, "step": 331720 }, { - "epoch": 1.67, - "learning_rate": 4.895691964623557e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.0001710161983094035, + "loss": 0.0121, "step": 331730 }, { - "epoch": 1.67, - "learning_rate": 4.894935195322156e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017101231009303204, + "loss": 0.0108, "step": 331740 }, { - "epoch": 1.67, - "learning_rate": 4.894178426020755e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017100842187666056, + "loss": 0.0139, "step": 331750 }, { - "epoch": 1.67, - "learning_rate": 4.893421656719354e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017100453366028913, + "loss": 0.0117, "step": 331760 }, { - "epoch": 1.67, - "learning_rate": 4.892664887417953e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017100064544391764, + "loss": 0.0131, "step": 331770 }, { - "epoch": 1.67, - "learning_rate": 4.891908118116552e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017099675722754618, + "loss": 0.013, "step": 331780 }, { - "epoch": 1.67, - "learning_rate": 4.891151348815151e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.0001709928690111747, + "loss": 0.0102, "step": 331790 }, { - "epoch": 1.67, - "learning_rate": 4.89039457951375e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017098898079480327, + "loss": 0.0127, "step": 331800 }, { - "epoch": 1.67, - "learning_rate": 4.889637810212349e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017098509257843178, + "loss": 0.0174, "step": 331810 }, { - "epoch": 1.67, - "learning_rate": 4.888881040910948e-05, - "loss": 0.0093, + "epoch": 0.86, + "learning_rate": 0.00017098120436206032, + "loss": 0.0113, "step": 331820 }, { - "epoch": 1.67, - "learning_rate": 4.888124271609547e-05, - "loss": 0.0111, + "epoch": 0.86, + "learning_rate": 0.00017097731614568884, + "loss": 0.0113, "step": 331830 }, { - "epoch": 1.67, - "learning_rate": 4.887367502308146e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001709734279293174, + "loss": 0.0131, "step": 331840 }, { - "epoch": 1.67, - "learning_rate": 4.886610733006745e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017096953971294595, + "loss": 0.0127, "step": 331850 }, { - "epoch": 1.67, - "learning_rate": 4.885853963705344e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017096565149657446, + "loss": 0.0098, "step": 331860 }, { - "epoch": 1.67, - "learning_rate": 4.885097194403943e-05, - "loss": 0.008, + "epoch": 0.86, + "learning_rate": 0.00017096176328020298, + "loss": 0.0137, "step": 331870 }, { - "epoch": 1.67, - "learning_rate": 4.884340425102542e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017095787506383155, + "loss": 0.0098, "step": 331880 }, { - "epoch": 1.67, - "learning_rate": 4.883583655801141e-05, - "loss": 0.0046, + "epoch": 0.86, + "learning_rate": 0.0001709539868474601, + "loss": 0.0137, "step": 331890 }, { - "epoch": 1.67, - "learning_rate": 4.88282688649974e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001709500986310886, + "loss": 0.0197, "step": 331900 }, { - "epoch": 1.67, - "learning_rate": 4.882070117198339e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017094621041471714, + "loss": 0.0109, "step": 331910 }, { - "epoch": 1.67, - "learning_rate": 4.881313347896938e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017094232219834569, + "loss": 0.0142, "step": 331920 }, { - "epoch": 1.67, - "learning_rate": 4.880556578595537e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017093843398197423, + "loss": 0.0144, "step": 331930 }, { - "epoch": 1.67, - "learning_rate": 4.879799809294136e-05, - "loss": 0.0088, + "epoch": 0.86, + "learning_rate": 0.00017093454576560274, + "loss": 0.0135, "step": 331940 }, { - "epoch": 1.67, - "learning_rate": 4.8790430399927346e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017093065754923128, + "loss": 0.0132, "step": 331950 }, { - "epoch": 1.67, - "learning_rate": 4.878286270691334e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.00017092676933285982, + "loss": 0.0142, "step": 331960 }, { - "epoch": 1.67, - "learning_rate": 4.877529501389933e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017092288111648837, + "loss": 0.0137, "step": 331970 }, { - "epoch": 1.67, - "learning_rate": 4.876772732088531e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017091899290011688, + "loss": 0.0121, "step": 331980 }, { - "epoch": 1.67, - "learning_rate": 4.87601596278713e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017091510468374542, + "loss": 0.015, "step": 331990 }, { - "epoch": 1.67, - "learning_rate": 4.875259193485729e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017091121646737394, + "loss": 0.0125, "step": 332000 }, { - "epoch": 1.67, - "eval_cer": 0.9144421144155256, - "eval_loss": 0.004793255589902401, - "eval_runtime": 116.2412, - "eval_samples_per_second": 17.206, - "eval_steps_per_second": 4.301, + "epoch": 0.86, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.008775945752859116, + "eval_runtime": 107.8889, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.634, "step": 332000 }, { - "epoch": 1.68, - "learning_rate": 4.874502424184328e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.0001709073282510025, + "loss": 0.015, "step": 332010 }, { - "epoch": 1.68, - "learning_rate": 4.873745654882927e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017090344003463105, + "loss": 0.0138, "step": 332020 }, { - "epoch": 1.68, - "learning_rate": 4.872988885581526e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017089955181825956, + "loss": 0.017, "step": 332030 }, { - "epoch": 1.68, - "learning_rate": 4.8722321162801254e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017089566360188808, + "loss": 0.0146, "step": 332040 }, { - "epoch": 1.68, - "learning_rate": 4.871475346978724e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017089177538551665, + "loss": 0.0199, "step": 332050 }, { - "epoch": 1.68, - "learning_rate": 4.870718577677323e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.0001708878871691452, + "loss": 0.0132, "step": 332060 }, { - "epoch": 1.68, - "learning_rate": 4.869961808375922e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.0001708839989527737, + "loss": 0.0123, "step": 332070 }, { - "epoch": 1.68, - "learning_rate": 4.8692050390745214e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017088011073640224, + "loss": 0.0106, "step": 332080 }, { - "epoch": 1.68, - "learning_rate": 4.86844826977312e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017087622252003078, + "loss": 0.0132, "step": 332090 }, { - "epoch": 1.68, - "learning_rate": 4.867691500471719e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017087233430365933, + "loss": 0.0136, "step": 332100 }, { - "epoch": 1.68, - "learning_rate": 4.866934731170318e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017086844608728784, + "loss": 0.0139, "step": 332110 }, { - "epoch": 1.68, - "learning_rate": 4.866177961868917e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017086455787091638, + "loss": 0.0131, "step": 332120 }, { - "epoch": 1.68, - "learning_rate": 4.865421192567516e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017086066965454492, + "loss": 0.0116, "step": 332130 }, { - "epoch": 1.68, - "learning_rate": 4.864664423266115e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017085678143817347, + "loss": 0.0118, "step": 332140 }, { - "epoch": 1.68, - "learning_rate": 4.863907653964714e-05, - "loss": 0.0051, + "epoch": 0.86, + "learning_rate": 0.00017085289322180198, + "loss": 0.0178, "step": 332150 }, { - "epoch": 1.68, - "learning_rate": 4.863150884663313e-05, - "loss": 0.0096, + "epoch": 0.86, + "learning_rate": 0.00017084900500543052, + "loss": 0.0125, "step": 332160 }, { - "epoch": 1.68, - "learning_rate": 4.862394115361912e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.0001708451167890591, + "loss": 0.0115, "step": 332170 }, { - "epoch": 1.68, - "learning_rate": 4.861637346060511e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.0001708412285726876, + "loss": 0.0173, "step": 332180 }, { - "epoch": 1.68, - "learning_rate": 4.86088057675911e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017083734035631612, + "loss": 0.01, "step": 332190 }, { - "epoch": 1.68, - "learning_rate": 4.860123807457709e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017083345213994466, + "loss": 0.0127, "step": 332200 }, { - "epoch": 1.68, - "learning_rate": 4.859367038156308e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017082956392357323, + "loss": 0.0217, "step": 332210 }, { - "epoch": 1.68, - "learning_rate": 4.858610268854907e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017082567570720174, + "loss": 0.0123, "step": 332220 }, { - "epoch": 1.68, - "learning_rate": 4.857853499553506e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017082178749083029, + "loss": 0.024, "step": 332230 }, { - "epoch": 1.68, - "learning_rate": 4.857096730252105e-05, - "loss": 0.0128, + "epoch": 0.86, + "learning_rate": 0.0001708178992744588, + "loss": 0.0116, "step": 332240 }, { - "epoch": 1.68, - "learning_rate": 4.856339960950704e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017081401105808734, + "loss": 0.0123, "step": 332250 }, { - "epoch": 1.68, - "learning_rate": 4.855583191649303e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017081012284171588, + "loss": 0.0166, "step": 332260 }, { - "epoch": 1.68, - "learning_rate": 4.854826422347902e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.00017080623462534443, + "loss": 0.0113, "step": 332270 }, { - "epoch": 1.68, - "learning_rate": 4.854069653046501e-05, - "loss": 0.0041, + "epoch": 0.86, + "learning_rate": 0.00017080234640897294, + "loss": 0.0109, "step": 332280 }, { - "epoch": 1.68, - "learning_rate": 4.853312883745099e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017079845819260148, + "loss": 0.0148, "step": 332290 }, { - "epoch": 1.68, - "learning_rate": 4.852556114443698e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017079456997623002, + "loss": 0.0157, "step": 332300 }, { - "epoch": 1.68, - "learning_rate": 4.851799345142297e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017079068175985857, + "loss": 0.012, "step": 332310 }, { - "epoch": 1.68, - "learning_rate": 4.851042575840896e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017078679354348708, + "loss": 0.0125, "step": 332320 }, { - "epoch": 1.68, - "learning_rate": 4.850285806539495e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017078290532711562, + "loss": 0.0242, "step": 332330 }, { - "epoch": 1.68, - "learning_rate": 4.849529037238094e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017077901711074416, + "loss": 0.0101, "step": 332340 }, { - "epoch": 1.68, - "learning_rate": 4.848772267936693e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001707751288943727, + "loss": 0.017, "step": 332350 }, { - "epoch": 1.68, - "learning_rate": 4.848015498635292e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.00017077124067800122, + "loss": 0.0117, "step": 332360 }, { - "epoch": 1.68, - "learning_rate": 4.847258729333891e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017076735246162976, + "loss": 0.0156, "step": 332370 }, { - "epoch": 1.68, - "learning_rate": 4.84650196003249e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017076346424525833, + "loss": 0.0124, "step": 332380 }, { - "epoch": 1.68, - "learning_rate": 4.845745190731089e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017075957602888684, + "loss": 0.0128, "step": 332390 }, { - "epoch": 1.68, - "learning_rate": 4.844988421429688e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017075568781251539, + "loss": 0.0131, "step": 332400 }, { - "epoch": 1.68, - "learning_rate": 4.844231652128287e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.0001707517995961439, + "loss": 0.0149, "step": 332410 }, { - "epoch": 1.68, - "learning_rate": 4.843474882826886e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017074791137977247, + "loss": 0.011, "step": 332420 }, { - "epoch": 1.68, - "learning_rate": 4.842718113525485e-05, - "loss": 0.0082, + "epoch": 0.86, + "learning_rate": 0.00017074402316340098, + "loss": 0.0156, "step": 332430 }, { - "epoch": 1.68, - "learning_rate": 4.841961344224084e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017074013494702953, + "loss": 0.0137, "step": 332440 }, { - "epoch": 1.68, - "learning_rate": 4.841204574922683e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017073624673065804, + "loss": 0.0189, "step": 332450 }, { - "epoch": 1.68, - "learning_rate": 4.840447805621282e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.0001707323585142866, + "loss": 0.016, "step": 332460 }, { - "epoch": 1.68, - "learning_rate": 4.839691036319881e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017072847029791512, + "loss": 0.016, "step": 332470 }, { - "epoch": 1.68, - "learning_rate": 4.8389342670184797e-05, - "loss": 0.0048, + "epoch": 0.86, + "learning_rate": 0.00017072458208154366, + "loss": 0.0127, "step": 332480 }, { - "epoch": 1.68, - "learning_rate": 4.838177497717079e-05, - "loss": 0.0069, + "epoch": 0.86, + "learning_rate": 0.00017072069386517218, + "loss": 0.0099, "step": 332490 }, { - "epoch": 1.68, - "learning_rate": 4.837420728415678e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.00017071680564880072, + "loss": 0.0143, "step": 332500 }, { - "epoch": 1.68, - "learning_rate": 4.836663959114277e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017071291743242926, + "loss": 0.0144, "step": 332510 }, { - "epoch": 1.68, - "learning_rate": 4.8359071898128756e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001707090292160578, + "loss": 0.0136, "step": 332520 }, { - "epoch": 1.68, - "learning_rate": 4.835150420511475e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017070514099968632, + "loss": 0.0109, "step": 332530 }, { - "epoch": 1.68, - "learning_rate": 4.834393651210074e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017070125278331486, + "loss": 0.0157, "step": 332540 }, { - "epoch": 1.68, - "learning_rate": 4.833636881908673e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017069736456694343, + "loss": 0.0183, "step": 332550 }, { - "epoch": 1.68, - "learning_rate": 4.832880112607272e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.00017069347635057194, + "loss": 0.0135, "step": 332560 }, { - "epoch": 1.68, - "learning_rate": 4.832123343305871e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017068958813420049, + "loss": 0.0117, "step": 332570 }, { - "epoch": 1.68, - "learning_rate": 4.83136657400447e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.000170685699917829, + "loss": 0.0142, "step": 332580 }, { - "epoch": 1.68, - "learning_rate": 4.830609804703069e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017068181170145757, + "loss": 0.014, "step": 332590 }, { - "epoch": 1.68, - "learning_rate": 4.829853035401668e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017067792348508608, + "loss": 0.0137, "step": 332600 }, { - "epoch": 1.68, - "learning_rate": 4.8290962661002664e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017067403526871462, + "loss": 0.0156, "step": 332610 }, { - "epoch": 1.68, - "learning_rate": 4.828339496798865e-05, - "loss": 0.0087, + "epoch": 0.86, + "learning_rate": 0.00017067014705234314, + "loss": 0.0187, "step": 332620 }, { - "epoch": 1.68, - "learning_rate": 4.827582727497464e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001706662588359717, + "loss": 0.016, "step": 332630 }, { - "epoch": 1.68, - "learning_rate": 4.826825958196063e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017066237061960022, + "loss": 0.0123, "step": 332640 }, { - "epoch": 1.68, - "learning_rate": 4.826069188894662e-05, - "loss": 0.0103, + "epoch": 0.86, + "learning_rate": 0.00017065848240322876, + "loss": 0.0118, "step": 332650 }, { - "epoch": 1.68, - "learning_rate": 4.825312419593261e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017065459418685728, + "loss": 0.0126, "step": 332660 }, { - "epoch": 1.68, - "learning_rate": 4.82455565029186e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017065070597048585, + "loss": 0.011, "step": 332670 }, { - "epoch": 1.68, - "learning_rate": 4.823798880990459e-05, - "loss": 0.0103, + "epoch": 0.86, + "learning_rate": 0.00017064681775411436, + "loss": 0.0171, "step": 332680 }, { - "epoch": 1.68, - "learning_rate": 4.823042111689058e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.0001706429295377429, + "loss": 0.0108, "step": 332690 }, { - "epoch": 1.68, - "learning_rate": 4.822285342387657e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017063904132137142, + "loss": 0.0155, "step": 332700 }, { - "epoch": 1.68, - "learning_rate": 4.821528573086256e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.000170635153105, + "loss": 0.0129, "step": 332710 }, { - "epoch": 1.68, - "learning_rate": 4.820771803784855e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017063126488862853, + "loss": 0.0119, "step": 332720 }, { - "epoch": 1.68, - "learning_rate": 4.820015034483454e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017062737667225704, + "loss": 0.0148, "step": 332730 }, { - "epoch": 1.68, - "learning_rate": 4.819258265182053e-05, - "loss": 0.0092, + "epoch": 0.86, + "learning_rate": 0.00017062348845588556, + "loss": 0.0152, "step": 332740 }, { - "epoch": 1.68, - "learning_rate": 4.818501495880652e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.0001706196002395141, + "loss": 0.0131, "step": 332750 }, { - "epoch": 1.68, - "learning_rate": 4.817744726579251e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017061571202314267, + "loss": 0.0103, "step": 332760 }, { - "epoch": 1.68, - "learning_rate": 4.81698795727785e-05, - "loss": 0.0045, + "epoch": 0.86, + "learning_rate": 0.00017061182380677118, + "loss": 0.013, "step": 332770 }, { - "epoch": 1.68, - "learning_rate": 4.816231187976449e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017060793559039972, + "loss": 0.0127, "step": 332780 }, { - "epoch": 1.68, - "learning_rate": 4.815474418675048e-05, - "loss": 0.0082, + "epoch": 0.86, + "learning_rate": 0.00017060404737402824, + "loss": 0.0133, "step": 332790 }, { - "epoch": 1.68, - "learning_rate": 4.814717649373647e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.0001706001591576568, + "loss": 0.0165, "step": 332800 }, { - "epoch": 1.68, - "learning_rate": 4.813960880072246e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017059627094128532, + "loss": 0.0134, "step": 332810 }, { - "epoch": 1.68, - "learning_rate": 4.813204110770845e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017059238272491386, + "loss": 0.016, "step": 332820 }, { - "epoch": 1.68, - "learning_rate": 4.812447341469444e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017058849450854238, + "loss": 0.0113, "step": 332830 }, { - "epoch": 1.68, - "learning_rate": 4.8116905721680427e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017058460629217095, + "loss": 0.0147, "step": 332840 }, { - "epoch": 1.68, - "learning_rate": 4.810933802866642e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017058071807579946, + "loss": 0.0153, "step": 332850 }, { - "epoch": 1.68, - "learning_rate": 4.810177033565241e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.000170576829859428, + "loss": 0.0107, "step": 332860 }, { - "epoch": 1.68, - "learning_rate": 4.80942026426384e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017057294164305652, + "loss": 0.0156, "step": 332870 }, { - "epoch": 1.68, - "learning_rate": 4.8086634949624386e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017056905342668509, + "loss": 0.0128, "step": 332880 }, { - "epoch": 1.68, - "learning_rate": 4.807906725661038e-05, - "loss": 0.0077, + "epoch": 0.86, + "learning_rate": 0.00017056516521031363, + "loss": 0.0112, "step": 332890 }, { - "epoch": 1.68, - "learning_rate": 4.807149956359637e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017056127699394214, + "loss": 0.0139, "step": 332900 }, { - "epoch": 1.68, - "learning_rate": 4.806393187058236e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017055738877757066, + "loss": 0.0098, "step": 332910 }, { - "epoch": 1.68, - "learning_rate": 4.805636417756834e-05, - "loss": 0.0043, + "epoch": 0.86, + "learning_rate": 0.00017055350056119923, + "loss": 0.0166, "step": 332920 }, { - "epoch": 1.68, - "learning_rate": 4.804879648455433e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.00017054961234482777, + "loss": 0.0125, "step": 332930 }, { - "epoch": 1.68, - "learning_rate": 4.804122879154032e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017054572412845628, + "loss": 0.017, "step": 332940 }, { - "epoch": 1.68, - "learning_rate": 4.803366109852631e-05, - "loss": 0.0102, + "epoch": 0.86, + "learning_rate": 0.00017054183591208482, + "loss": 0.0117, "step": 332950 }, { - "epoch": 1.68, - "learning_rate": 4.80260934055123e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017053794769571334, + "loss": 0.0127, "step": 332960 }, { - "epoch": 1.68, - "learning_rate": 4.801852571249829e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.0001705340594793419, + "loss": 0.0141, "step": 332970 }, { - "epoch": 1.68, - "learning_rate": 4.801095801948428e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017053017126297042, + "loss": 0.0121, "step": 332980 }, { - "epoch": 1.68, - "learning_rate": 4.800339032647027e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017052628304659896, + "loss": 0.0117, "step": 332990 }, { - "epoch": 1.68, - "learning_rate": 4.799582263345626e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.00017052239483022748, + "loss": 0.0094, "step": 333000 }, { - "epoch": 1.68, - "eval_cer": 0.9144343512465224, - "eval_loss": 0.004823221359401941, - "eval_runtime": 116.4518, - "eval_samples_per_second": 17.174, - "eval_steps_per_second": 4.294, + "epoch": 0.86, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.009038124233484268, + "eval_runtime": 107.8356, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, "step": 333000 }, { - "epoch": 1.68, - "learning_rate": 4.7988254940442253e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017051850661385605, + "loss": 0.0133, "step": 333010 }, { - "epoch": 1.68, - "learning_rate": 4.798068724742824e-05, - "loss": 0.0085, + "epoch": 0.86, + "learning_rate": 0.00017051461839748456, + "loss": 0.0106, "step": 333020 }, { - "epoch": 1.68, - "learning_rate": 4.797311955441423e-05, - "loss": 0.0098, + "epoch": 0.86, + "learning_rate": 0.0001705107301811131, + "loss": 0.0144, "step": 333030 }, { - "epoch": 1.68, - "learning_rate": 4.796555186140022e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017050684196474162, + "loss": 0.018, "step": 333040 }, { - "epoch": 1.68, - "learning_rate": 4.795798416838621e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017050295374837019, + "loss": 0.0132, "step": 333050 }, { - "epoch": 1.68, - "learning_rate": 4.79504164753722e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.0001704990655319987, + "loss": 0.0163, "step": 333060 }, { - "epoch": 1.68, - "learning_rate": 4.794284878235819e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017049517731562724, + "loss": 0.0099, "step": 333070 }, { - "epoch": 1.68, - "learning_rate": 4.793528108934418e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017049128909925576, + "loss": 0.0146, "step": 333080 }, { - "epoch": 1.68, - "learning_rate": 4.792771339633017e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017048740088288432, + "loss": 0.0134, "step": 333090 }, { - "epoch": 1.68, - "learning_rate": 4.792014570331616e-05, - "loss": 0.0067, - "step": 333100 + "epoch": 0.86, + "learning_rate": 0.00017048351266651287, + "loss": 0.0133, + "step": 333100 }, { - "epoch": 1.68, - "learning_rate": 4.791257801030215e-05, - "loss": 0.0078, + "epoch": 0.86, + "learning_rate": 0.00017047962445014138, + "loss": 0.0141, "step": 333110 }, { - "epoch": 1.68, - "learning_rate": 4.790501031728814e-05, - "loss": 0.0058, + "epoch": 0.86, + "learning_rate": 0.00017047573623376992, + "loss": 0.0133, "step": 333120 }, { - "epoch": 1.68, - "learning_rate": 4.789744262427413e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017047184801739846, + "loss": 0.0126, "step": 333130 }, { - "epoch": 1.68, - "learning_rate": 4.788987493126012e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.000170467959801027, + "loss": 0.0124, "step": 333140 }, { - "epoch": 1.68, - "learning_rate": 4.788230723824611e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017046407158465552, + "loss": 0.0158, "step": 333150 }, { - "epoch": 1.68, - "learning_rate": 4.78747395452321e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017046018336828406, + "loss": 0.0114, "step": 333160 }, { - "epoch": 1.68, - "learning_rate": 4.786717185221809e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.0001704562951519126, + "loss": 0.013, "step": 333170 }, { - "epoch": 1.68, - "learning_rate": 4.785960415920408e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017045240693554115, + "loss": 0.0127, "step": 333180 }, { - "epoch": 1.68, - "learning_rate": 4.785203646619007e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.00017044851871916966, + "loss": 0.0138, "step": 333190 }, { - "epoch": 1.68, - "learning_rate": 4.784446877317606e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.0001704446305027982, + "loss": 0.0122, "step": 333200 }, { - "epoch": 1.68, - "learning_rate": 4.783690108016205e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017044074228642672, + "loss": 0.0177, "step": 333210 }, { - "epoch": 1.68, - "learning_rate": 4.782933338714804e-05, - "loss": 0.0055, + "epoch": 0.86, + "learning_rate": 0.00017043685407005528, + "loss": 0.0155, "step": 333220 }, { - "epoch": 1.68, - "learning_rate": 4.782176569413403e-05, - "loss": 0.009, + "epoch": 0.86, + "learning_rate": 0.0001704329658536838, + "loss": 0.0159, "step": 333230 }, { - "epoch": 1.68, - "learning_rate": 4.781419800112001e-05, - "loss": 0.0056, + "epoch": 0.86, + "learning_rate": 0.00017042907763731234, + "loss": 0.0158, "step": 333240 }, { - "epoch": 1.68, - "learning_rate": 4.7806630308106e-05, - "loss": 0.0065, + "epoch": 0.86, + "learning_rate": 0.00017042518942094086, + "loss": 0.0141, "step": 333250 }, { - "epoch": 1.68, - "learning_rate": 4.779906261509199e-05, - "loss": 0.0059, + "epoch": 0.86, + "learning_rate": 0.00017042130120456942, + "loss": 0.0108, "step": 333260 }, { - "epoch": 1.68, - "learning_rate": 4.779149492207798e-05, - "loss": 0.0052, + "epoch": 0.86, + "learning_rate": 0.00017041741298819797, + "loss": 0.0146, "step": 333270 }, { - "epoch": 1.68, - "learning_rate": 4.778392722906397e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017041352477182648, + "loss": 0.0165, "step": 333280 }, { - "epoch": 1.68, - "learning_rate": 4.777635953604996e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017040963655545502, + "loss": 0.0111, "step": 333290 }, { - "epoch": 1.68, - "learning_rate": 4.776879184303595e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017040574833908356, + "loss": 0.0141, "step": 333300 }, { - "epoch": 1.68, - "learning_rate": 4.776122415002194e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.0001704018601227121, + "loss": 0.0136, "step": 333310 }, { - "epoch": 1.68, - "learning_rate": 4.775365645700793e-05, - "loss": 0.0088, + "epoch": 0.86, + "learning_rate": 0.00017039797190634062, + "loss": 0.0144, "step": 333320 }, { - "epoch": 1.68, - "learning_rate": 4.774608876399392e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017039408368996916, + "loss": 0.013, "step": 333330 }, { - "epoch": 1.68, - "learning_rate": 4.773852107097991e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.0001703901954735977, + "loss": 0.0131, "step": 333340 }, { - "epoch": 1.68, - "learning_rate": 4.77309533779659e-05, - "loss": 0.0057, + "epoch": 0.86, + "learning_rate": 0.00017038630725722624, + "loss": 0.0133, "step": 333350 }, { - "epoch": 1.68, - "learning_rate": 4.772338568495189e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017038241904085476, + "loss": 0.0116, "step": 333360 }, { - "epoch": 1.68, - "learning_rate": 4.771581799193788e-05, - "loss": 0.0083, + "epoch": 0.86, + "learning_rate": 0.0001703785308244833, + "loss": 0.0102, "step": 333370 }, { - "epoch": 1.68, - "learning_rate": 4.770825029892387e-05, - "loss": 0.0071, + "epoch": 0.86, + "learning_rate": 0.00017037464260811184, + "loss": 0.0123, "step": 333380 }, { - "epoch": 1.68, - "learning_rate": 4.770068260590986e-05, - "loss": 0.007, + "epoch": 0.86, + "learning_rate": 0.00017037075439174038, + "loss": 0.0139, "step": 333390 }, { - "epoch": 1.68, - "learning_rate": 4.769311491289585e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.0001703668661753689, + "loss": 0.0153, "step": 333400 }, { - "epoch": 1.68, - "learning_rate": 4.7685547219881836e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017036297795899744, + "loss": 0.0127, "step": 333410 }, { - "epoch": 1.68, - "learning_rate": 4.767797952686783e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.000170359089742626, + "loss": 0.0135, "step": 333420 }, { - "epoch": 1.68, - "learning_rate": 4.767041183385382e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017035520152625452, + "loss": 0.0097, "step": 333430 }, { - "epoch": 1.68, - "learning_rate": 4.766284414083981e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017035131330988307, + "loss": 0.0096, "step": 333440 }, { - "epoch": 1.68, - "learning_rate": 4.7655276447825796e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017034742509351158, + "loss": 0.0144, "step": 333450 }, { - "epoch": 1.68, - "learning_rate": 4.764770875481179e-05, - "loss": 0.0062, + "epoch": 0.86, + "learning_rate": 0.0001703435368771401, + "loss": 0.0133, "step": 333460 }, { - "epoch": 1.68, - "learning_rate": 4.764014106179778e-05, - "loss": 0.0041, + "epoch": 0.86, + "learning_rate": 0.00017033964866076866, + "loss": 0.014, "step": 333470 }, { - "epoch": 1.68, - "learning_rate": 4.763257336878377e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001703357604443972, + "loss": 0.015, "step": 333480 }, { - "epoch": 1.68, - "learning_rate": 4.7625005675769756e-05, - "loss": 0.0047, + "epoch": 0.86, + "learning_rate": 0.00017033187222802572, + "loss": 0.0113, "step": 333490 }, { - "epoch": 1.68, - "learning_rate": 4.761743798275575e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017032798401165426, + "loss": 0.0123, "step": 333500 }, { - "epoch": 1.68, - "learning_rate": 4.760987028974174e-05, - "loss": 0.0066, + "epoch": 0.86, + "learning_rate": 0.0001703240957952828, + "loss": 0.0098, "step": 333510 }, { - "epoch": 1.68, - "learning_rate": 4.760230259672773e-05, - "loss": 0.0079, + "epoch": 0.86, + "learning_rate": 0.00017032020757891134, + "loss": 0.0142, "step": 333520 }, { - "epoch": 1.68, - "learning_rate": 4.759473490371372e-05, - "loss": 0.0053, + "epoch": 0.86, + "learning_rate": 0.00017031631936253986, + "loss": 0.0116, "step": 333530 }, { - "epoch": 1.68, - "learning_rate": 4.758716721069971e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001703124311461684, + "loss": 0.0156, "step": 333540 }, { - "epoch": 1.68, - "learning_rate": 4.757959951768569e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017030854292979694, + "loss": 0.0153, "step": 333550 }, { - "epoch": 1.68, - "learning_rate": 4.757203182467168e-05, - "loss": 0.0064, + "epoch": 0.86, + "learning_rate": 0.00017030465471342548, + "loss": 0.0145, "step": 333560 }, { - "epoch": 1.68, - "learning_rate": 4.756446413165767e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.000170300766497054, + "loss": 0.0108, "step": 333570 }, { - "epoch": 1.68, - "learning_rate": 4.755689643864366e-05, - "loss": 0.0075, + "epoch": 0.86, + "learning_rate": 0.00017029687828068254, + "loss": 0.017, "step": 333580 }, { - "epoch": 1.68, - "learning_rate": 4.754932874562965e-05, - "loss": 0.0073, + "epoch": 0.86, + "learning_rate": 0.0001702929900643111, + "loss": 0.0138, "step": 333590 }, { - "epoch": 1.68, - "learning_rate": 4.754176105261564e-05, - "loss": 0.005, + "epoch": 0.86, + "learning_rate": 0.00017028910184793962, + "loss": 0.0129, "step": 333600 }, { - "epoch": 1.68, - "learning_rate": 4.753419335960163e-05, - "loss": 0.0054, + "epoch": 0.86, + "learning_rate": 0.00017028521363156816, + "loss": 0.0126, "step": 333610 }, { - "epoch": 1.68, - "learning_rate": 4.752662566658762e-05, - "loss": 0.0049, + "epoch": 0.86, + "learning_rate": 0.00017028132541519668, + "loss": 0.0093, "step": 333620 }, { - "epoch": 1.68, - "learning_rate": 4.751905797357361e-05, - "loss": 0.0068, + "epoch": 0.86, + "learning_rate": 0.00017027743719882525, + "loss": 0.0149, "step": 333630 }, { - "epoch": 1.68, - "learning_rate": 4.75114902805596e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.00017027354898245376, + "loss": 0.0108, "step": 333640 }, { - "epoch": 1.68, - "learning_rate": 4.750392258754559e-05, - "loss": 0.0063, + "epoch": 0.86, + "learning_rate": 0.0001702696607660823, + "loss": 0.0145, "step": 333650 }, { - "epoch": 1.68, - "learning_rate": 4.749635489453158e-05, - "loss": 0.006, + "epoch": 0.86, + "learning_rate": 0.00017026577254971082, + "loss": 0.0123, "step": 333660 }, { - "epoch": 1.68, - "learning_rate": 4.748878720151757e-05, - "loss": 0.0072, + "epoch": 0.86, + "learning_rate": 0.0001702618843333394, + "loss": 0.0113, "step": 333670 }, { - "epoch": 1.68, - "learning_rate": 4.748121950850356e-05, - "loss": 0.0076, + "epoch": 0.86, + "learning_rate": 0.0001702579961169679, + "loss": 0.0119, "step": 333680 }, { - "epoch": 1.68, - "learning_rate": 4.747365181548955e-05, - "loss": 0.0061, + "epoch": 0.86, + "learning_rate": 0.00017025410790059644, + "loss": 0.0107, "step": 333690 }, { - "epoch": 1.68, - "learning_rate": 4.746608412247554e-05, - "loss": 0.0067, + "epoch": 0.86, + "learning_rate": 0.00017025021968422496, + "loss": 0.0176, "step": 333700 }, { - "epoch": 1.68, - "learning_rate": 4.745851642946153e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001702463314678535, + "loss": 0.0151, "step": 333710 }, { - "epoch": 1.68, - "learning_rate": 4.745094873644752e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00017024244325148204, + "loss": 0.0241, "step": 333720 }, { - "epoch": 1.68, - "learning_rate": 4.744338104343351e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00017023855503511058, + "loss": 0.0129, "step": 333730 }, { - "epoch": 1.68, - "learning_rate": 4.74358133504195e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.0001702346668187391, + "loss": 0.0136, "step": 333740 }, { - "epoch": 1.68, - "learning_rate": 4.742824565740549e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00017023077860236764, + "loss": 0.0139, "step": 333750 }, { - "epoch": 1.68, - "learning_rate": 4.742067796439148e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.0001702268903859962, + "loss": 0.0134, "step": 333760 }, { - "epoch": 1.68, - "learning_rate": 4.7413110271377466e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00017022300216962472, + "loss": 0.0107, "step": 333770 }, { - "epoch": 1.68, - "learning_rate": 4.740554257836346e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00017021911395325324, + "loss": 0.0168, "step": 333780 }, { - "epoch": 1.68, - "learning_rate": 4.739797488534945e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00017021522573688178, + "loss": 0.0126, "step": 333790 }, { - "epoch": 1.68, - "learning_rate": 4.739040719233544e-05, - "loss": 0.0045, + "epoch": 0.87, + "learning_rate": 0.00017021133752051035, + "loss": 0.013, "step": 333800 }, { - "epoch": 1.68, - "learning_rate": 4.7382839499321426e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00017020744930413886, + "loss": 0.0137, "step": 333810 }, { - "epoch": 1.68, - "learning_rate": 4.737527180630742e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001702035610877674, + "loss": 0.0125, "step": 333820 }, { - "epoch": 1.68, - "learning_rate": 4.736770411329341e-05, - "loss": 0.0084, + "epoch": 0.87, + "learning_rate": 0.00017019967287139592, + "loss": 0.0251, "step": 333830 }, { - "epoch": 1.68, - "learning_rate": 4.73601364202794e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.0001701957846550245, + "loss": 0.0148, "step": 333840 }, { - "epoch": 1.68, - "learning_rate": 4.7352568727265386e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.000170191896438653, + "loss": 0.0147, "step": 333850 }, { - "epoch": 1.68, - "learning_rate": 4.734500103425138e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00017018800822228154, + "loss": 0.0138, "step": 333860 }, { - "epoch": 1.68, - "learning_rate": 4.733743334123736e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00017018412000591006, + "loss": 0.0183, "step": 333870 }, { - "epoch": 1.68, - "learning_rate": 4.732986564822335e-05, - "loss": 0.0082, + "epoch": 0.87, + "learning_rate": 0.00017018023178953863, + "loss": 0.0129, "step": 333880 }, { - "epoch": 1.68, - "learning_rate": 4.732229795520934e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00017017634357316714, + "loss": 0.0138, "step": 333890 }, { - "epoch": 1.68, - "learning_rate": 4.731473026219533e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00017017245535679568, + "loss": 0.0117, "step": 333900 }, { - "epoch": 1.68, - "learning_rate": 4.730716256918132e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.0001701685671404242, + "loss": 0.012, "step": 333910 }, { - "epoch": 1.68, - "learning_rate": 4.729959487616731e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00017016467892405277, + "loss": 0.0099, "step": 333920 }, { - "epoch": 1.68, - "learning_rate": 4.72920271831533e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00017016079070768128, + "loss": 0.0159, "step": 333930 }, { - "epoch": 1.68, - "learning_rate": 4.7284459490139287e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00017015690249130982, + "loss": 0.0135, "step": 333940 }, { - "epoch": 1.68, - "learning_rate": 4.727689179712528e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00017015301427493834, + "loss": 0.0145, "step": 333950 }, { - "epoch": 1.68, - "learning_rate": 4.726932410411127e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00017014912605856688, + "loss": 0.0103, "step": 333960 }, { - "epoch": 1.68, - "learning_rate": 4.726175641109726e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00017014523784219545, + "loss": 0.0151, "step": 333970 }, { - "epoch": 1.68, - "learning_rate": 4.725418871808325e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00017014134962582396, + "loss": 0.013, "step": 333980 }, { - "epoch": 1.69, - "learning_rate": 4.724662102506924e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.0001701374614094525, + "loss": 0.0148, "step": 333990 }, { - "epoch": 1.69, - "learning_rate": 4.723905333205523e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00017013357319308102, + "loss": 0.0121, "step": 334000 }, { - "epoch": 1.69, - "eval_cer": 0.9144139729278888, - "eval_loss": 0.004758420865982771, - "eval_runtime": 116.3871, - "eval_samples_per_second": 17.184, - "eval_steps_per_second": 4.296, + "epoch": 0.87, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.009081809781491756, + "eval_runtime": 107.8501, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, "step": 334000 }, { - "epoch": 1.69, - "learning_rate": 4.723148563904122e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.0001701296849767096, + "loss": 0.0123, "step": 334010 }, { - "epoch": 1.69, - "learning_rate": 4.722391794602721e-05, - "loss": 0.0079, + "epoch": 0.87, + "learning_rate": 0.0001701257967603381, + "loss": 0.0134, "step": 334020 }, { - "epoch": 1.69, - "learning_rate": 4.72163502530132e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00017012190854396664, + "loss": 0.0162, "step": 334030 }, { - "epoch": 1.69, - "learning_rate": 4.720878255999919e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00017011802032759516, + "loss": 0.0145, "step": 334040 }, { - "epoch": 1.69, - "learning_rate": 4.720121486698518e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00017011413211122373, + "loss": 0.0147, "step": 334050 }, { - "epoch": 1.69, - "learning_rate": 4.719364717397117e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00017011024389485224, + "loss": 0.0129, "step": 334060 }, { - "epoch": 1.69, - "learning_rate": 4.718607948095716e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00017010635567848078, + "loss": 0.0114, "step": 334070 }, { - "epoch": 1.69, - "learning_rate": 4.717851178794315e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.0001701024674621093, + "loss": 0.0134, "step": 334080 }, { - "epoch": 1.69, - "learning_rate": 4.717094409492914e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00017009857924573787, + "loss": 0.0109, "step": 334090 }, { - "epoch": 1.69, - "learning_rate": 4.716337640191513e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00017009469102936638, + "loss": 0.0136, "step": 334100 }, { - "epoch": 1.69, - "learning_rate": 4.715580870890112e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00017009080281299492, + "loss": 0.0125, "step": 334110 }, { - "epoch": 1.69, - "learning_rate": 4.714824101588711e-05, - "loss": 0.0084, + "epoch": 0.87, + "learning_rate": 0.00017008691459662344, + "loss": 0.0112, "step": 334120 }, { - "epoch": 1.69, - "learning_rate": 4.7140673322873097e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.000170083026380252, + "loss": 0.015, "step": 334130 }, { - "epoch": 1.69, - "learning_rate": 4.713310562985909e-05, - "loss": 0.0079, + "epoch": 0.87, + "learning_rate": 0.00017007913816388055, + "loss": 0.0137, "step": 334140 }, { - "epoch": 1.69, - "learning_rate": 4.712553793684508e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00017007524994750906, + "loss": 0.0119, "step": 334150 }, { - "epoch": 1.69, - "learning_rate": 4.711797024383107e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.0001700713617311376, + "loss": 0.0108, "step": 334160 }, { - "epoch": 1.69, - "learning_rate": 4.7110402550817056e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00017006747351476614, + "loss": 0.012, "step": 334170 }, { - "epoch": 1.69, - "learning_rate": 4.710283485780304e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00017006358529839469, + "loss": 0.015, "step": 334180 }, { - "epoch": 1.69, - "learning_rate": 4.709526716478903e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.0001700596970820232, + "loss": 0.0124, "step": 334190 }, { - "epoch": 1.69, - "learning_rate": 4.708769947177502e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00017005580886565174, + "loss": 0.0119, "step": 334200 }, { - "epoch": 1.69, - "learning_rate": 4.708013177876101e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00017005192064928026, + "loss": 0.0177, "step": 334210 }, { - "epoch": 1.69, - "learning_rate": 4.7072564085747e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00017004803243290883, + "loss": 0.0119, "step": 334220 }, { - "epoch": 1.69, - "learning_rate": 4.706499639273299e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00017004414421653734, + "loss": 0.0169, "step": 334230 }, { - "epoch": 1.69, - "learning_rate": 4.705742869971898e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00017004025600016588, + "loss": 0.0137, "step": 334240 }, { - "epoch": 1.69, - "learning_rate": 4.704986100670497e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.0001700363677837944, + "loss": 0.0145, "step": 334250 }, { - "epoch": 1.69, - "learning_rate": 4.704229331369096e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00017003247956742296, + "loss": 0.0116, "step": 334260 }, { - "epoch": 1.69, - "learning_rate": 4.703472562067695e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00017002859135105148, + "loss": 0.013, "step": 334270 }, { - "epoch": 1.69, - "learning_rate": 4.702715792766294e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00017002470313468002, + "loss": 0.0133, "step": 334280 }, { - "epoch": 1.69, - "learning_rate": 4.701959023464893e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00017002081491830854, + "loss": 0.0153, "step": 334290 }, { - "epoch": 1.69, - "learning_rate": 4.7012022541634917e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.0001700169267019371, + "loss": 0.0138, "step": 334300 }, { - "epoch": 1.69, - "learning_rate": 4.700445484862091e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00017001303848556565, + "loss": 0.0154, "step": 334310 }, { - "epoch": 1.69, - "learning_rate": 4.69968871556069e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00017000915026919416, + "loss": 0.0131, "step": 334320 }, { - "epoch": 1.69, - "learning_rate": 4.698931946259289e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00017000526205282267, + "loss": 0.0167, "step": 334330 }, { - "epoch": 1.69, - "learning_rate": 4.6981751769578876e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00017000137383645124, + "loss": 0.0142, "step": 334340 }, { - "epoch": 1.69, - "learning_rate": 4.697418407656487e-05, - "loss": 0.0092, + "epoch": 0.87, + "learning_rate": 0.00016999748562007979, + "loss": 0.0128, "step": 334350 }, { - "epoch": 1.69, - "learning_rate": 4.696661638355086e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001699935974037083, + "loss": 0.0144, "step": 334360 }, { - "epoch": 1.69, - "learning_rate": 4.695904869053685e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016998970918733684, + "loss": 0.0137, "step": 334370 }, { - "epoch": 1.69, - "learning_rate": 4.6951480997522836e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016998582097096538, + "loss": 0.0127, "step": 334380 }, { - "epoch": 1.69, - "learning_rate": 4.694391330450883e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016998193275459392, + "loss": 0.013, "step": 334390 }, { - "epoch": 1.69, - "learning_rate": 4.693634561149482e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016997804453822244, + "loss": 0.0138, "step": 334400 }, { - "epoch": 1.69, - "learning_rate": 4.692877791848081e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016997415632185098, + "loss": 0.0111, "step": 334410 }, { - "epoch": 1.69, - "learning_rate": 4.6921210225466796e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016997026810547952, + "loss": 0.0158, "step": 334420 }, { - "epoch": 1.69, - "learning_rate": 4.691364253245279e-05, - "loss": 0.0092, + "epoch": 0.87, + "learning_rate": 0.00016996637988910806, + "loss": 0.017, "step": 334430 }, { - "epoch": 1.69, - "learning_rate": 4.690607483943878e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016996249167273658, + "loss": 0.0131, "step": 334440 }, { - "epoch": 1.69, - "learning_rate": 4.689850714642477e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016995860345636512, + "loss": 0.0144, "step": 334450 }, { - "epoch": 1.69, - "learning_rate": 4.6890939453410755e-05, - "loss": 0.008, + "epoch": 0.87, + "learning_rate": 0.00016995471523999363, + "loss": 0.0169, "step": 334460 }, { - "epoch": 1.69, - "learning_rate": 4.688337176039675e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.0001699508270236222, + "loss": 0.0133, "step": 334470 }, { - "epoch": 1.69, - "learning_rate": 4.687580406738274e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016994693880725075, + "loss": 0.0108, "step": 334480 }, { - "epoch": 1.69, - "learning_rate": 4.686823637436872e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016994305059087926, + "loss": 0.0106, "step": 334490 }, { - "epoch": 1.69, - "learning_rate": 4.686066868135471e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016993916237450777, + "loss": 0.0195, "step": 334500 }, { - "epoch": 1.69, - "learning_rate": 4.68531009883407e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016993527415813634, + "loss": 0.0179, "step": 334510 }, { - "epoch": 1.69, - "learning_rate": 4.684553329532669e-05, - "loss": 0.0083, + "epoch": 0.87, + "learning_rate": 0.00016993138594176488, + "loss": 0.0149, "step": 334520 }, { - "epoch": 1.69, - "learning_rate": 4.683796560231268e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.0001699274977253934, + "loss": 0.0128, "step": 334530 }, { - "epoch": 1.69, - "learning_rate": 4.683039790929867e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016992360950902194, + "loss": 0.0127, "step": 334540 }, { - "epoch": 1.69, - "learning_rate": 4.682283021628466e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016991972129265048, + "loss": 0.0146, "step": 334550 }, { - "epoch": 1.69, - "learning_rate": 4.681526252327065e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016991583307627902, + "loss": 0.014, "step": 334560 }, { - "epoch": 1.69, - "learning_rate": 4.680769483025664e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016991194485990754, + "loss": 0.016, "step": 334570 }, { - "epoch": 1.69, - "learning_rate": 4.680012713724263e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016990805664353608, + "loss": 0.0115, "step": 334580 }, { - "epoch": 1.69, - "learning_rate": 4.679255944422862e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016990416842716462, + "loss": 0.0148, "step": 334590 }, { - "epoch": 1.69, - "learning_rate": 4.678499175121461e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016990028021079316, + "loss": 0.0139, "step": 334600 }, { - "epoch": 1.69, - "learning_rate": 4.67774240582006e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016989639199442168, + "loss": 0.0129, "step": 334610 }, { - "epoch": 1.69, - "learning_rate": 4.676985636518659e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016989250377805022, + "loss": 0.0167, "step": 334620 }, { - "epoch": 1.69, - "learning_rate": 4.676228867217258e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.0001698886155616788, + "loss": 0.0154, "step": 334630 }, { - "epoch": 1.69, - "learning_rate": 4.675472097915857e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.0001698847273453073, + "loss": 0.0113, "step": 334640 }, { - "epoch": 1.69, - "learning_rate": 4.674715328614456e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016988083912893582, + "loss": 0.0175, "step": 334650 }, { - "epoch": 1.69, - "learning_rate": 4.673958559313055e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016987695091256436, + "loss": 0.0112, "step": 334660 }, { - "epoch": 1.69, - "learning_rate": 4.673201790011654e-05, - "loss": 0.0085, + "epoch": 0.87, + "learning_rate": 0.00016987306269619293, + "loss": 0.0154, "step": 334670 }, { - "epoch": 1.69, - "learning_rate": 4.672445020710253e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016986917447982144, + "loss": 0.0136, "step": 334680 }, { - "epoch": 1.69, - "learning_rate": 4.671688251408852e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016986528626344998, + "loss": 0.0128, "step": 334690 }, { - "epoch": 1.69, - "learning_rate": 4.6709314821074506e-05, - "loss": 0.0103, + "epoch": 0.87, + "learning_rate": 0.0001698613980470785, + "loss": 0.0126, "step": 334700 }, { - "epoch": 1.69, - "learning_rate": 4.67017471280605e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016985750983070704, + "loss": 0.0154, "step": 334710 }, { - "epoch": 1.69, - "learning_rate": 4.669417943504649e-05, - "loss": 0.0038, + "epoch": 0.87, + "learning_rate": 0.00016985362161433558, + "loss": 0.019, "step": 334720 }, { - "epoch": 1.69, - "learning_rate": 4.668661174203248e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016984973339796412, + "loss": 0.0125, "step": 334730 }, { - "epoch": 1.69, - "learning_rate": 4.6679044049018466e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016984584518159264, + "loss": 0.0103, "step": 334740 }, { - "epoch": 1.69, - "learning_rate": 4.667147635600446e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016984195696522118, + "loss": 0.0126, "step": 334750 }, { - "epoch": 1.69, - "learning_rate": 4.666390866299045e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016983806874884972, + "loss": 0.014, "step": 334760 }, { - "epoch": 1.69, - "learning_rate": 4.665634096997644e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016983418053247826, + "loss": 0.0183, "step": 334770 }, { - "epoch": 1.69, - "learning_rate": 4.6648773276962426e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016983029231610678, + "loss": 0.0165, "step": 334780 }, { - "epoch": 1.69, - "learning_rate": 4.664120558394842e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016982640409973532, + "loss": 0.0127, "step": 334790 }, { - "epoch": 1.69, - "learning_rate": 4.663363789093441e-05, - "loss": 0.0046, + "epoch": 0.87, + "learning_rate": 0.00016982251588336386, + "loss": 0.0123, "step": 334800 }, { - "epoch": 1.69, - "learning_rate": 4.662607019792039e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.0001698186276669924, + "loss": 0.0142, "step": 334810 }, { - "epoch": 1.69, - "learning_rate": 4.661850250490638e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00016981473945062092, + "loss": 0.0123, "step": 334820 }, { - "epoch": 1.69, - "learning_rate": 4.661093481189237e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016981085123424946, + "loss": 0.0141, "step": 334830 }, { - "epoch": 1.69, - "learning_rate": 4.660336711887836e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016980696301787803, + "loss": 0.0122, "step": 334840 }, { - "epoch": 1.69, - "learning_rate": 4.659579942586435e-05, - "loss": 0.008, + "epoch": 0.87, + "learning_rate": 0.00016980307480150654, + "loss": 0.0134, "step": 334850 }, { - "epoch": 1.69, - "learning_rate": 4.658823173285034e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016979918658513508, + "loss": 0.0135, "step": 334860 }, { - "epoch": 1.69, - "learning_rate": 4.6580664039836326e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001697952983687636, + "loss": 0.0117, "step": 334870 }, { - "epoch": 1.69, - "learning_rate": 4.657309634682232e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016979141015239217, + "loss": 0.0146, "step": 334880 }, { - "epoch": 1.69, - "learning_rate": 4.656552865380831e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016978752193602068, + "loss": 0.0121, "step": 334890 }, { - "epoch": 1.69, - "learning_rate": 4.65579609607943e-05, - "loss": 0.0082, + "epoch": 0.87, + "learning_rate": 0.00016978363371964922, + "loss": 0.0152, "step": 334900 }, { - "epoch": 1.69, - "learning_rate": 4.6550393267780286e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016977974550327774, + "loss": 0.0138, "step": 334910 }, { - "epoch": 1.69, - "learning_rate": 4.654282557476628e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.0001697758572869063, + "loss": 0.0119, "step": 334920 }, { - "epoch": 1.69, - "learning_rate": 4.653525788175227e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016977196907053482, + "loss": 0.0113, "step": 334930 }, { - "epoch": 1.69, - "learning_rate": 4.652769018873826e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016976808085416336, + "loss": 0.0137, "step": 334940 }, { - "epoch": 1.69, - "learning_rate": 4.652012249572425e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016976419263779188, + "loss": 0.0122, "step": 334950 }, { - "epoch": 1.69, - "learning_rate": 4.651255480271024e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016976030442142042, + "loss": 0.01, "step": 334960 }, { - "epoch": 1.69, - "learning_rate": 4.650498710969623e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016975641620504896, + "loss": 0.0201, "step": 334970 }, { - "epoch": 1.69, - "learning_rate": 4.649741941668222e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.0001697525279886775, + "loss": 0.0162, "step": 334980 }, { - "epoch": 1.69, - "learning_rate": 4.648985172366821e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00016974863977230602, + "loss": 0.0127, "step": 334990 }, { - "epoch": 1.69, - "learning_rate": 4.64822840306542e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016974475155593456, + "loss": 0.0106, "step": 335000 }, { - "epoch": 1.69, - "eval_cer": 0.914412032135638, - "eval_loss": 0.004865641705691814, - "eval_runtime": 116.3195, - "eval_samples_per_second": 17.194, - "eval_steps_per_second": 4.299, + "epoch": 0.87, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.009029078297317028, + "eval_runtime": 107.7187, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, "step": 335000 }, { - "epoch": 1.69, - "learning_rate": 4.647471633764019e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016974086333956313, + "loss": 0.0122, "step": 335010 }, { - "epoch": 1.69, - "learning_rate": 4.646714864462618e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016973697512319164, + "loss": 0.0172, "step": 335020 }, { - "epoch": 1.69, - "learning_rate": 4.645958095161217e-05, - "loss": 0.0082, + "epoch": 0.87, + "learning_rate": 0.00016973308690682018, + "loss": 0.0143, "step": 335030 }, { - "epoch": 1.69, - "learning_rate": 4.645201325859816e-05, - "loss": 0.0048, + "epoch": 0.87, + "learning_rate": 0.0001697291986904487, + "loss": 0.014, "step": 335040 }, { - "epoch": 1.69, - "learning_rate": 4.644444556558415e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016972531047407727, + "loss": 0.0146, "step": 335050 }, { - "epoch": 1.69, - "learning_rate": 4.6436877872570136e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016972142225770578, + "loss": 0.0117, "step": 335060 }, { - "epoch": 1.69, - "learning_rate": 4.642931017955613e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016971753404133432, + "loss": 0.0148, "step": 335070 }, { - "epoch": 1.69, - "learning_rate": 4.642174248654212e-05, - "loss": 0.0091, + "epoch": 0.87, + "learning_rate": 0.00016971364582496284, + "loss": 0.0178, "step": 335080 }, { - "epoch": 1.69, - "learning_rate": 4.641417479352811e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001697097576085914, + "loss": 0.0139, "step": 335090 }, { - "epoch": 1.69, - "learning_rate": 4.6406607100514096e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016970586939221992, + "loss": 0.0149, "step": 335100 }, { - "epoch": 1.69, - "learning_rate": 4.639903940750009e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.00016970198117584846, + "loss": 0.0109, "step": 335110 }, { - "epoch": 1.69, - "learning_rate": 4.639147171448607e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016969809295947698, + "loss": 0.0137, "step": 335120 }, { - "epoch": 1.69, - "learning_rate": 4.638390402147206e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016969420474310555, + "loss": 0.0112, "step": 335130 }, { - "epoch": 1.69, - "learning_rate": 4.637633632845805e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016969031652673406, + "loss": 0.0111, "step": 335140 }, { - "epoch": 1.69, - "learning_rate": 4.636876863544404e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.0001696864283103626, + "loss": 0.018, "step": 335150 }, { - "epoch": 1.69, - "learning_rate": 4.636120094243003e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.00016968254009399112, + "loss": 0.0171, "step": 335160 }, { - "epoch": 1.69, - "learning_rate": 4.635363324941602e-05, - "loss": 0.0045, + "epoch": 0.87, + "learning_rate": 0.00016967865187761968, + "loss": 0.0136, "step": 335170 }, { - "epoch": 1.69, - "learning_rate": 4.634606555640201e-05, - "loss": 0.0079, + "epoch": 0.87, + "learning_rate": 0.00016967476366124823, + "loss": 0.0133, "step": 335180 }, { - "epoch": 1.69, - "learning_rate": 4.6338497863388e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016967087544487674, + "loss": 0.0116, "step": 335190 }, { - "epoch": 1.69, - "learning_rate": 4.633093017037399e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016966698722850528, + "loss": 0.0151, "step": 335200 }, { - "epoch": 1.69, - "learning_rate": 4.632336247735998e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.0001696630990121338, + "loss": 0.0116, "step": 335210 }, { - "epoch": 1.69, - "learning_rate": 4.631579478434597e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00016965921079576237, + "loss": 0.0176, "step": 335220 }, { - "epoch": 1.69, - "learning_rate": 4.6308227091331956e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016965532257939088, + "loss": 0.016, "step": 335230 }, { - "epoch": 1.69, - "learning_rate": 4.630065939831795e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016965143436301942, + "loss": 0.0141, "step": 335240 }, { - "epoch": 1.69, - "learning_rate": 4.629309170530394e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016964754614664794, + "loss": 0.0115, "step": 335250 }, { - "epoch": 1.69, - "learning_rate": 4.628552401228993e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001696436579302765, + "loss": 0.0154, "step": 335260 }, { - "epoch": 1.69, - "learning_rate": 4.6277956319275916e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016963976971390502, + "loss": 0.0137, "step": 335270 }, { - "epoch": 1.69, - "learning_rate": 4.627038862626191e-05, - "loss": 0.0042, + "epoch": 0.87, + "learning_rate": 0.00016963588149753356, + "loss": 0.0129, "step": 335280 }, { - "epoch": 1.69, - "learning_rate": 4.62628209332479e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016963199328116208, + "loss": 0.0148, "step": 335290 }, { - "epoch": 1.69, - "learning_rate": 4.625525324023389e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016962810506479064, + "loss": 0.0131, "step": 335300 }, { - "epoch": 1.69, - "learning_rate": 4.6247685547219876e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016962421684841916, + "loss": 0.0106, "step": 335310 }, { - "epoch": 1.69, - "learning_rate": 4.624011785420587e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.0001696203286320477, + "loss": 0.0152, "step": 335320 }, { - "epoch": 1.69, - "learning_rate": 4.623255016119186e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016961644041567622, + "loss": 0.0147, "step": 335330 }, { - "epoch": 1.69, - "learning_rate": 4.622498246817785e-05, - "loss": 0.0044, + "epoch": 0.87, + "learning_rate": 0.00016961255219930478, + "loss": 0.0137, "step": 335340 }, { - "epoch": 1.69, - "learning_rate": 4.6217414775163835e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016960866398293333, + "loss": 0.0093, "step": 335350 }, { - "epoch": 1.69, - "learning_rate": 4.620984708214983e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016960477576656184, + "loss": 0.0126, "step": 335360 }, { - "epoch": 1.69, - "learning_rate": 4.620227938913582e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016960088755019035, + "loss": 0.014, "step": 335370 }, { - "epoch": 1.69, - "learning_rate": 4.619471169612181e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016959699933381892, + "loss": 0.0115, "step": 335380 }, { - "epoch": 1.69, - "learning_rate": 4.6187144003107795e-05, - "loss": 0.0086, + "epoch": 0.87, + "learning_rate": 0.00016959311111744747, + "loss": 0.0151, "step": 335390 }, { - "epoch": 1.69, - "learning_rate": 4.617957631009379e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016958922290107598, + "loss": 0.0114, "step": 335400 }, { - "epoch": 1.69, - "learning_rate": 4.617200861707978e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00016958533468470452, + "loss": 0.0173, "step": 335410 }, { - "epoch": 1.69, - "learning_rate": 4.6164440924065767e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016958144646833306, + "loss": 0.0158, "step": 335420 }, { - "epoch": 1.69, - "learning_rate": 4.6156873231051755e-05, - "loss": 0.0082, + "epoch": 0.87, + "learning_rate": 0.0001695775582519616, + "loss": 0.0136, "step": 335430 }, { - "epoch": 1.69, - "learning_rate": 4.614930553803774e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016957367003559012, + "loss": 0.014, "step": 335440 }, { - "epoch": 1.69, - "learning_rate": 4.614173784502373e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016956978181921866, + "loss": 0.0158, "step": 335450 }, { - "epoch": 1.69, - "learning_rate": 4.613417015200972e-05, - "loss": 0.0082, + "epoch": 0.87, + "learning_rate": 0.00016956589360284718, + "loss": 0.0112, "step": 335460 }, { - "epoch": 1.69, - "learning_rate": 4.612660245899571e-05, - "loss": 0.0087, + "epoch": 0.87, + "learning_rate": 0.00016956200538647574, + "loss": 0.0131, "step": 335470 }, { - "epoch": 1.69, - "learning_rate": 4.61190347659817e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016955811717010426, + "loss": 0.017, "step": 335480 }, { - "epoch": 1.69, - "learning_rate": 4.611146707296769e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.0001695542289537328, + "loss": 0.0126, "step": 335490 }, { - "epoch": 1.69, - "learning_rate": 4.610389937995368e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016955034073736131, + "loss": 0.013, "step": 335500 }, { - "epoch": 1.69, - "learning_rate": 4.609633168693967e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016954645252098988, + "loss": 0.016, "step": 335510 }, { - "epoch": 1.69, - "learning_rate": 4.608876399392566e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.0001695425643046184, + "loss": 0.0175, "step": 335520 }, { - "epoch": 1.69, - "learning_rate": 4.608119630091165e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016953867608824694, + "loss": 0.0118, "step": 335530 }, { - "epoch": 1.69, - "learning_rate": 4.607362860789764e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016953478787187545, + "loss": 0.0119, "step": 335540 }, { - "epoch": 1.69, - "learning_rate": 4.606606091488363e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016953089965550402, + "loss": 0.0171, "step": 335550 }, { - "epoch": 1.69, - "learning_rate": 4.605849322186962e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016952701143913256, + "loss": 0.0142, "step": 335560 }, { - "epoch": 1.69, - "learning_rate": 4.605092552885561e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016952312322276108, + "loss": 0.0125, "step": 335570 }, { - "epoch": 1.69, - "learning_rate": 4.60433578358416e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016951923500638962, + "loss": 0.0184, "step": 335580 }, { - "epoch": 1.69, - "learning_rate": 4.6035790142827587e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016951534679001816, + "loss": 0.0169, "step": 335590 }, { - "epoch": 1.69, - "learning_rate": 4.602822244981358e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.0001695114585736467, + "loss": 0.0125, "step": 335600 }, { - "epoch": 1.69, - "learning_rate": 4.602065475679957e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016950757035727522, + "loss": 0.0271, "step": 335610 }, { - "epoch": 1.69, - "learning_rate": 4.601308706378556e-05, - "loss": 0.005, + "epoch": 0.87, + "learning_rate": 0.00016950368214090376, + "loss": 0.0148, "step": 335620 }, { - "epoch": 1.69, - "learning_rate": 4.6005519370771546e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.0001694997939245323, + "loss": 0.0122, "step": 335630 }, { - "epoch": 1.69, - "learning_rate": 4.599795167775754e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016949590570816084, + "loss": 0.0142, "step": 335640 }, { - "epoch": 1.69, - "learning_rate": 4.599038398474353e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016949201749178936, + "loss": 0.0114, "step": 335650 }, { - "epoch": 1.69, - "learning_rate": 4.598281629172952e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.0001694881292754179, + "loss": 0.0167, "step": 335660 }, { - "epoch": 1.69, - "learning_rate": 4.5975248598715506e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016948424105904647, + "loss": 0.0159, "step": 335670 }, { - "epoch": 1.69, - "learning_rate": 4.59676809057015e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016948035284267498, + "loss": 0.0157, "step": 335680 }, { - "epoch": 1.69, - "learning_rate": 4.596011321268749e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.0001694764646263035, + "loss": 0.0142, "step": 335690 }, { - "epoch": 1.69, - "learning_rate": 4.595254551967348e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016947257640993204, + "loss": 0.0134, "step": 335700 }, { - "epoch": 1.69, - "learning_rate": 4.5944977826659466e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016946868819356055, + "loss": 0.0126, "step": 335710 }, { - "epoch": 1.69, - "learning_rate": 4.593741013364546e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016946479997718912, + "loss": 0.0118, "step": 335720 }, { - "epoch": 1.69, - "learning_rate": 4.592984244063145e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016946091176081766, + "loss": 0.0133, "step": 335730 }, { - "epoch": 1.69, - "learning_rate": 4.592227474761744e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016945702354444618, + "loss": 0.0116, "step": 335740 }, { - "epoch": 1.69, - "learning_rate": 4.591470705460342e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016945313532807472, + "loss": 0.0204, "step": 335750 }, { - "epoch": 1.69, - "learning_rate": 4.5907139361589407e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016944924711170326, + "loss": 0.0156, "step": 335760 }, { - "epoch": 1.69, - "learning_rate": 4.58995716685754e-05, - "loss": 0.0083, + "epoch": 0.87, + "learning_rate": 0.0001694453588953318, + "loss": 0.0134, "step": 335770 }, { - "epoch": 1.69, - "learning_rate": 4.589200397556139e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016944147067896032, + "loss": 0.0114, "step": 335780 }, { - "epoch": 1.69, - "learning_rate": 4.588443628254738e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016943758246258886, + "loss": 0.0142, "step": 335790 }, { - "epoch": 1.69, - "learning_rate": 4.5876868589533366e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.0001694336942462174, + "loss": 0.0139, "step": 335800 }, { - "epoch": 1.69, - "learning_rate": 4.586930089651936e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016942980602984594, + "loss": 0.0269, "step": 335810 }, { - "epoch": 1.69, - "learning_rate": 4.586173320350535e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016942591781347446, + "loss": 0.0674, "step": 335820 }, { - "epoch": 1.69, - "learning_rate": 4.585416551049134e-05, - "loss": 0.0105, + "epoch": 0.87, + "learning_rate": 0.000169422029597103, + "loss": 0.03, "step": 335830 }, { - "epoch": 1.69, - "learning_rate": 4.5846597817477326e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016941814138073154, + "loss": 0.0132, "step": 335840 }, { - "epoch": 1.69, - "learning_rate": 4.583903012446332e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016941425316436008, + "loss": 0.0179, "step": 335850 }, { - "epoch": 1.69, - "learning_rate": 4.583146243144931e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.0001694103649479886, + "loss": 0.0124, "step": 335860 }, { - "epoch": 1.69, - "learning_rate": 4.58238947384353e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016940647673161714, + "loss": 0.015, "step": 335870 }, { - "epoch": 1.69, - "learning_rate": 4.5816327045421286e-05, - "loss": 0.0083, + "epoch": 0.87, + "learning_rate": 0.0001694025885152457, + "loss": 0.0158, "step": 335880 }, { - "epoch": 1.69, - "learning_rate": 4.580875935240728e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016939870029887422, + "loss": 0.0123, "step": 335890 }, { - "epoch": 1.69, - "learning_rate": 4.580119165939327e-05, - "loss": 0.0049, + "epoch": 0.87, + "learning_rate": 0.00016939481208250276, + "loss": 0.0197, "step": 335900 }, { - "epoch": 1.69, - "learning_rate": 4.579362396637926e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016939092386613128, + "loss": 0.0125, "step": 335910 }, { - "epoch": 1.69, - "learning_rate": 4.578605627336525e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016938703564975985, + "loss": 0.0161, "step": 335920 }, { - "epoch": 1.69, - "learning_rate": 4.577848858035124e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016938314743338836, + "loss": 0.0158, "step": 335930 }, { - "epoch": 1.69, - "learning_rate": 4.577092088733723e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.0001693792592170169, + "loss": 0.0125, "step": 335940 }, { - "epoch": 1.69, - "learning_rate": 4.576335319432322e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016937537100064542, + "loss": 0.0094, "step": 335950 }, { - "epoch": 1.69, - "learning_rate": 4.575578550130921e-05, - "loss": 0.0079, + "epoch": 0.87, + "learning_rate": 0.00016937148278427396, + "loss": 0.0152, "step": 335960 }, { - "epoch": 1.7, - "learning_rate": 4.57482178082952e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001693675945679025, + "loss": 0.0121, "step": 335970 }, { - "epoch": 1.7, - "learning_rate": 4.574065011528119e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016936370635153104, + "loss": 0.0127, "step": 335980 }, { - "epoch": 1.7, - "learning_rate": 4.5733082422267176e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016935981813515956, + "loss": 0.0159, "step": 335990 }, { - "epoch": 1.7, - "learning_rate": 4.572551472925317e-05, - "loss": 0.0091, + "epoch": 0.87, + "learning_rate": 0.0001693559299187881, + "loss": 0.0134, "step": 336000 }, { - "epoch": 1.7, - "eval_cer": 0.9144372624348985, - "eval_loss": 0.004783105570822954, - "eval_runtime": 116.4347, - "eval_samples_per_second": 17.177, - "eval_steps_per_second": 4.294, + "epoch": 0.87, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.009199898689985275, + "eval_runtime": 107.6047, + "eval_samples_per_second": 18.587, + "eval_steps_per_second": 4.647, "step": 336000 }, { - "epoch": 1.7, - "learning_rate": 4.571794703623916e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016935204170241664, + "loss": 0.0142, "step": 336010 }, { - "epoch": 1.7, - "learning_rate": 4.571037934322515e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016934815348604518, + "loss": 0.0123, "step": 336020 }, { - "epoch": 1.7, - "learning_rate": 4.5702811650211136e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.0001693442652696737, + "loss": 0.018, "step": 336030 }, { - "epoch": 1.7, - "learning_rate": 4.569524395719713e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.00016934037705330224, + "loss": 0.0124, "step": 336040 }, { - "epoch": 1.7, - "learning_rate": 4.568767626418312e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.0001693364888369308, + "loss": 0.0155, "step": 336050 }, { - "epoch": 1.7, - "learning_rate": 4.568010857116911e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016933260062055932, + "loss": 0.0152, "step": 336060 }, { - "epoch": 1.7, - "learning_rate": 4.567254087815509e-05, - "loss": 0.0045, + "epoch": 0.87, + "learning_rate": 0.00016932871240418786, + "loss": 0.0168, "step": 336070 }, { - "epoch": 1.7, - "learning_rate": 4.566497318514108e-05, - "loss": 0.0095, + "epoch": 0.87, + "learning_rate": 0.00016932482418781638, + "loss": 0.0123, "step": 336080 }, { - "epoch": 1.7, - "learning_rate": 4.565740549212707e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016932093597144495, + "loss": 0.0152, "step": 336090 }, { - "epoch": 1.7, - "learning_rate": 4.564983779911306e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016931704775507346, + "loss": 0.0143, "step": 336100 }, { - "epoch": 1.7, - "learning_rate": 4.564227010609905e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.000169313159538702, + "loss": 0.014, "step": 336110 }, { - "epoch": 1.7, - "learning_rate": 4.563470241308504e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016930927132233052, + "loss": 0.0166, "step": 336120 }, { - "epoch": 1.7, - "learning_rate": 4.562713472007103e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016930538310595909, + "loss": 0.0142, "step": 336130 }, { - "epoch": 1.7, - "learning_rate": 4.561956702705702e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.0001693014948895876, + "loss": 0.0114, "step": 336140 }, { - "epoch": 1.7, - "learning_rate": 4.561199933404301e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016929760667321614, + "loss": 0.0127, "step": 336150 }, { - "epoch": 1.7, - "learning_rate": 4.5604431641028996e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016929371845684466, + "loss": 0.0106, "step": 336160 }, { - "epoch": 1.7, - "learning_rate": 4.559686394801499e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016928983024047322, + "loss": 0.0186, "step": 336170 }, { - "epoch": 1.7, - "learning_rate": 4.558929625500098e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016928594202410174, + "loss": 0.0118, "step": 336180 }, { - "epoch": 1.7, - "learning_rate": 4.558172856198697e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016928205380773028, + "loss": 0.0139, "step": 336190 }, { - "epoch": 1.7, - "learning_rate": 4.5574160868972956e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.0001692781655913588, + "loss": 0.0175, "step": 336200 }, { - "epoch": 1.7, - "learning_rate": 4.556659317595895e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016927427737498734, + "loss": 0.0109, "step": 336210 }, { - "epoch": 1.7, - "learning_rate": 4.555902548294494e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001692703891586159, + "loss": 0.014, "step": 336220 }, { - "epoch": 1.7, - "learning_rate": 4.555145778993093e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016926650094224442, + "loss": 0.0124, "step": 336230 }, { - "epoch": 1.7, - "learning_rate": 4.5543890096916916e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016926261272587294, + "loss": 0.0119, "step": 336240 }, { - "epoch": 1.7, - "learning_rate": 4.553632240390291e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016925872450950148, + "loss": 0.014, "step": 336250 }, { - "epoch": 1.7, - "learning_rate": 4.55287547108889e-05, - "loss": 0.008, + "epoch": 0.87, + "learning_rate": 0.00016925483629313005, + "loss": 0.0122, "step": 336260 }, { - "epoch": 1.7, - "learning_rate": 4.552118701787489e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016925094807675856, + "loss": 0.0126, "step": 336270 }, { - "epoch": 1.7, - "learning_rate": 4.5513619324860875e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.0001692470598603871, + "loss": 0.0124, "step": 336280 }, { - "epoch": 1.7, - "learning_rate": 4.550605163184687e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016924317164401562, + "loss": 0.015, "step": 336290 }, { - "epoch": 1.7, - "learning_rate": 4.549848393883286e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016923928342764418, + "loss": 0.0099, "step": 336300 }, { - "epoch": 1.7, - "learning_rate": 4.549091624581885e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.0001692353952112727, + "loss": 0.0144, "step": 336310 }, { - "epoch": 1.7, - "learning_rate": 4.5483348552804835e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016923150699490124, + "loss": 0.0116, "step": 336320 }, { - "epoch": 1.7, - "learning_rate": 4.547578085979083e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016922761877852976, + "loss": 0.0138, "step": 336330 }, { - "epoch": 1.7, - "learning_rate": 4.546821316677682e-05, - "loss": 0.0046, + "epoch": 0.87, + "learning_rate": 0.00016922373056215832, + "loss": 0.0175, "step": 336340 }, { - "epoch": 1.7, - "learning_rate": 4.5460645473762806e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016921984234578684, + "loss": 0.0147, "step": 336350 }, { - "epoch": 1.7, - "learning_rate": 4.5453077780748795e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016921595412941538, + "loss": 0.0128, "step": 336360 }, { - "epoch": 1.7, - "learning_rate": 4.544551008773479e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.0001692120659130439, + "loss": 0.0141, "step": 336370 }, { - "epoch": 1.7, - "learning_rate": 4.543794239472077e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00016920817769667246, + "loss": 0.0129, "step": 336380 }, { - "epoch": 1.7, - "learning_rate": 4.543037470170676e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016920428948030098, + "loss": 0.0127, "step": 336390 }, { - "epoch": 1.7, - "learning_rate": 4.542280700869275e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016920040126392952, + "loss": 0.0126, "step": 336400 }, { - "epoch": 1.7, - "learning_rate": 4.541523931567874e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00016919651304755803, + "loss": 0.0174, "step": 336410 }, { - "epoch": 1.7, - "learning_rate": 4.540767162266473e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.0001691926248311866, + "loss": 0.0125, "step": 336420 }, { - "epoch": 1.7, - "learning_rate": 4.540010392965072e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016918873661481514, + "loss": 0.0125, "step": 336430 }, { - "epoch": 1.7, - "learning_rate": 4.539253623663671e-05, - "loss": 0.0083, + "epoch": 0.87, + "learning_rate": 0.00016918484839844366, + "loss": 0.0119, "step": 336440 }, { - "epoch": 1.7, - "learning_rate": 4.53849685436227e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.0001691809601820722, + "loss": 0.0158, "step": 336450 }, { - "epoch": 1.7, - "learning_rate": 4.537740085060869e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016917707196570072, + "loss": 0.0149, "step": 336460 }, { - "epoch": 1.7, - "learning_rate": 4.536983315759468e-05, - "loss": 0.0101, + "epoch": 0.87, + "learning_rate": 0.00016917318374932928, + "loss": 0.0139, "step": 336470 }, { - "epoch": 1.7, - "learning_rate": 4.536226546458067e-05, - "loss": 0.0045, + "epoch": 0.87, + "learning_rate": 0.0001691692955329578, + "loss": 0.0187, "step": 336480 }, { - "epoch": 1.7, - "learning_rate": 4.535469777156666e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016916540731658634, + "loss": 0.014, "step": 336490 }, { - "epoch": 1.7, - "learning_rate": 4.534713007855265e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016916151910021486, + "loss": 0.0126, "step": 336500 }, { - "epoch": 1.7, - "learning_rate": 4.533956238553864e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016915763088384342, + "loss": 0.0191, "step": 336510 }, { - "epoch": 1.7, - "learning_rate": 4.5331994692524626e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016915374266747194, + "loss": 0.0118, "step": 336520 }, { - "epoch": 1.7, - "learning_rate": 4.532442699951062e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016914985445110048, + "loss": 0.0095, "step": 336530 }, { - "epoch": 1.7, - "learning_rate": 4.531685930649661e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.000169145966234729, + "loss": 0.015, "step": 336540 }, { - "epoch": 1.7, - "learning_rate": 4.53092916134826e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016914207801835756, + "loss": 0.0162, "step": 336550 }, { - "epoch": 1.7, - "learning_rate": 4.5301723920468586e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016913818980198608, + "loss": 0.0183, "step": 336560 }, { - "epoch": 1.7, - "learning_rate": 4.529415622745458e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016913430158561462, + "loss": 0.0146, "step": 336570 }, { - "epoch": 1.7, - "learning_rate": 4.528658853444057e-05, - "loss": 0.008, + "epoch": 0.87, + "learning_rate": 0.00016913041336924313, + "loss": 0.0143, "step": 336580 }, { - "epoch": 1.7, - "learning_rate": 4.527902084142656e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.0001691265251528717, + "loss": 0.0137, "step": 336590 }, { - "epoch": 1.7, - "learning_rate": 4.5271453148412546e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.00016912263693650024, + "loss": 0.0157, "step": 336600 }, { - "epoch": 1.7, - "learning_rate": 4.526388545539854e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016911874872012876, + "loss": 0.0289, "step": 336610 }, { - "epoch": 1.7, - "learning_rate": 4.525631776238453e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001691148605037573, + "loss": 0.0142, "step": 336620 }, { - "epoch": 1.7, - "learning_rate": 4.524875006937052e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016911097228738584, + "loss": 0.0146, "step": 336630 }, { - "epoch": 1.7, - "learning_rate": 4.5241182376356505e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016910708407101438, + "loss": 0.0155, "step": 336640 }, { - "epoch": 1.7, - "learning_rate": 4.52336146833425e-05, - "loss": 0.0074, + "epoch": 0.87, + "learning_rate": 0.0001691031958546429, + "loss": 0.0117, "step": 336650 }, { - "epoch": 1.7, - "learning_rate": 4.522604699032849e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016909930763827144, + "loss": 0.0148, "step": 336660 }, { - "epoch": 1.7, - "learning_rate": 4.521847929731448e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016909541942189998, + "loss": 0.0117, "step": 336670 }, { - "epoch": 1.7, - "learning_rate": 4.5210911604300465e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016909153120552852, + "loss": 0.0151, "step": 336680 }, { - "epoch": 1.7, - "learning_rate": 4.5203343911286446e-05, - "loss": 0.0101, + "epoch": 0.87, + "learning_rate": 0.00016908764298915704, + "loss": 0.0113, "step": 336690 }, { - "epoch": 1.7, - "learning_rate": 4.519577621827244e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016908375477278558, + "loss": 0.0104, "step": 336700 }, { - "epoch": 1.7, - "learning_rate": 4.518820852525843e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.0001690798665564141, + "loss": 0.0133, "step": 336710 }, { - "epoch": 1.7, - "learning_rate": 4.518064083224442e-05, - "loss": 0.0092, + "epoch": 0.87, + "learning_rate": 0.00016907597834004266, + "loss": 0.0142, "step": 336720 }, { - "epoch": 1.7, - "learning_rate": 4.5173073139230406e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016907209012367118, + "loss": 0.0124, "step": 336730 }, { - "epoch": 1.7, - "learning_rate": 4.51655054462164e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016906820190729972, + "loss": 0.0141, "step": 336740 }, { - "epoch": 1.7, - "learning_rate": 4.515793775320239e-05, - "loss": 0.0131, + "epoch": 0.87, + "learning_rate": 0.00016906431369092823, + "loss": 0.0134, "step": 336750 }, { - "epoch": 1.7, - "learning_rate": 4.515037006018838e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.0001690604254745568, + "loss": 0.0144, "step": 336760 }, { - "epoch": 1.7, - "learning_rate": 4.5142802367174366e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016905653725818534, + "loss": 0.0156, "step": 336770 }, { - "epoch": 1.7, - "learning_rate": 4.513523467416036e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.00016905264904181386, + "loss": 0.0123, "step": 336780 }, { - "epoch": 1.7, - "learning_rate": 4.512766698114635e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.0001690487608254424, + "loss": 0.0115, "step": 336790 }, { - "epoch": 1.7, - "learning_rate": 4.512009928813234e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016904487260907094, + "loss": 0.0143, "step": 336800 }, { - "epoch": 1.7, - "learning_rate": 4.5112531595118325e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016904098439269948, + "loss": 0.0121, "step": 336810 }, { - "epoch": 1.7, - "learning_rate": 4.510496390210432e-05, - "loss": 0.0057, + "epoch": 0.87, + "learning_rate": 0.000169037096176328, + "loss": 0.017, "step": 336820 }, { - "epoch": 1.7, - "learning_rate": 4.509739620909031e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.00016903320795995654, + "loss": 0.0148, "step": 336830 }, { - "epoch": 1.7, - "learning_rate": 4.50898285160763e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016902931974358508, + "loss": 0.0157, "step": 336840 }, { - "epoch": 1.7, - "learning_rate": 4.5082260823062285e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016902543152721362, + "loss": 0.0113, "step": 336850 }, { - "epoch": 1.7, - "learning_rate": 4.507469313004828e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016902154331084214, + "loss": 0.0103, "step": 336860 }, { - "epoch": 1.7, - "learning_rate": 4.506712543703427e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016901765509447068, + "loss": 0.0145, "step": 336870 }, { - "epoch": 1.7, - "learning_rate": 4.5059557744020257e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016901376687809922, + "loss": 0.0136, "step": 336880 }, { - "epoch": 1.7, - "learning_rate": 4.505199005100625e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016900987866172776, + "loss": 0.0149, "step": 336890 }, { - "epoch": 1.7, - "learning_rate": 4.504442235799224e-05, - "loss": 0.0053, + "epoch": 0.87, + "learning_rate": 0.00016900599044535628, + "loss": 0.0147, "step": 336900 }, { - "epoch": 1.7, - "learning_rate": 4.503685466497823e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00016900210222898482, + "loss": 0.0129, "step": 336910 }, { - "epoch": 1.7, - "learning_rate": 4.5029286971964216e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.0001689982140126134, + "loss": 0.0135, "step": 336920 }, { - "epoch": 1.7, - "learning_rate": 4.502171927895021e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001689943257962419, + "loss": 0.013, "step": 336930 }, { - "epoch": 1.7, - "learning_rate": 4.50141515859362e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016899043757987044, + "loss": 0.0145, "step": 336940 }, { - "epoch": 1.7, - "learning_rate": 4.500658389292219e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016898654936349896, + "loss": 0.013, "step": 336950 }, { - "epoch": 1.7, - "learning_rate": 4.4999016199908176e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016898266114712747, + "loss": 0.0149, "step": 336960 }, { - "epoch": 1.7, - "learning_rate": 4.499144850689417e-05, - "loss": 0.0073, + "epoch": 0.87, + "learning_rate": 0.00016897877293075604, + "loss": 0.0118, "step": 336970 }, { - "epoch": 1.7, - "learning_rate": 4.498388081388016e-05, - "loss": 0.0079, + "epoch": 0.87, + "learning_rate": 0.00016897488471438458, + "loss": 0.0139, "step": 336980 }, { - "epoch": 1.7, - "learning_rate": 4.497631312086615e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.0001689709964980131, + "loss": 0.0136, "step": 336990 }, { - "epoch": 1.7, - "learning_rate": 4.4968745427852135e-05, - "loss": 0.0093, + "epoch": 0.87, + "learning_rate": 0.00016896710828164164, + "loss": 0.0113, "step": 337000 }, { - "epoch": 1.7, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.004760997835546732, - "eval_runtime": 116.4296, - "eval_samples_per_second": 17.178, - "eval_steps_per_second": 4.294, + "epoch": 0.87, + "eval_cer": 0.8817166826925096, + "eval_loss": 0.008749060332775116, + "eval_runtime": 107.716, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, "step": 337000 }, { - "epoch": 1.7, - "learning_rate": 4.496117773483812e-05, - "loss": 0.0047, + "epoch": 0.87, + "learning_rate": 0.00016896322006527018, + "loss": 0.0128, "step": 337010 }, { - "epoch": 1.7, - "learning_rate": 4.495361004182411e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016895933184889872, + "loss": 0.0141, "step": 337020 }, { - "epoch": 1.7, - "learning_rate": 4.49460423488101e-05, - "loss": 0.0046, + "epoch": 0.87, + "learning_rate": 0.00016895544363252724, + "loss": 0.0114, "step": 337030 }, { - "epoch": 1.7, - "learning_rate": 4.493847465579609e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016895155541615578, + "loss": 0.0135, "step": 337040 }, { - "epoch": 1.7, - "learning_rate": 4.4930906962782077e-05, - "loss": 0.0099, + "epoch": 0.87, + "learning_rate": 0.00016894766719978432, + "loss": 0.0151, "step": 337050 }, { - "epoch": 1.7, - "learning_rate": 4.492333926976807e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016894377898341286, + "loss": 0.0122, "step": 337060 }, { - "epoch": 1.7, - "learning_rate": 4.491577157675406e-05, - "loss": 0.0062, + "epoch": 0.87, + "learning_rate": 0.00016893989076704138, + "loss": 0.014, "step": 337070 }, { - "epoch": 1.7, - "learning_rate": 4.490820388374005e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016893600255066992, + "loss": 0.0106, "step": 337080 }, { - "epoch": 1.7, - "learning_rate": 4.4900636190726036e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016893211433429849, + "loss": 0.0099, "step": 337090 }, { - "epoch": 1.7, - "learning_rate": 4.489306849771203e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.000168928226117927, + "loss": 0.0103, "step": 337100 }, { - "epoch": 1.7, - "learning_rate": 4.488550080469802e-05, - "loss": 0.0065, + "epoch": 0.87, + "learning_rate": 0.00016892433790155552, + "loss": 0.0129, "step": 337110 }, { - "epoch": 1.7, - "learning_rate": 4.487793311168401e-05, - "loss": 0.0054, + "epoch": 0.87, + "learning_rate": 0.00016892044968518406, + "loss": 0.0112, "step": 337120 }, { - "epoch": 1.7, - "learning_rate": 4.4870365418669996e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016891656146881263, + "loss": 0.0147, "step": 337130 }, { - "epoch": 1.7, - "learning_rate": 4.486279772565599e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016891267325244114, + "loss": 0.0141, "step": 337140 }, { - "epoch": 1.7, - "learning_rate": 4.485523003264198e-05, - "loss": 0.007, + "epoch": 0.87, + "learning_rate": 0.00016890878503606968, + "loss": 0.0125, "step": 337150 }, { - "epoch": 1.7, - "learning_rate": 4.484766233962797e-05, - "loss": 0.0076, + "epoch": 0.87, + "learning_rate": 0.0001689048968196982, + "loss": 0.0137, "step": 337160 }, { - "epoch": 1.7, - "learning_rate": 4.4840094646613956e-05, - "loss": 0.0063, + "epoch": 0.87, + "learning_rate": 0.00016890100860332677, + "loss": 0.0105, "step": 337170 }, { - "epoch": 1.7, - "learning_rate": 4.483252695359995e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.00016889712038695528, + "loss": 0.0139, "step": 337180 }, { - "epoch": 1.7, - "learning_rate": 4.482495926058594e-05, - "loss": 0.0086, + "epoch": 0.87, + "learning_rate": 0.00016889323217058382, + "loss": 0.0141, "step": 337190 }, { - "epoch": 1.7, - "learning_rate": 4.481739156757193e-05, - "loss": 0.0061, + "epoch": 0.87, + "learning_rate": 0.00016888934395421234, + "loss": 0.0123, "step": 337200 }, { - "epoch": 1.7, - "learning_rate": 4.4809823874557915e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.00016888545573784088, + "loss": 0.0134, "step": 337210 }, { - "epoch": 1.7, - "learning_rate": 4.480225618154391e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016888156752146942, + "loss": 0.0149, "step": 337220 }, { - "epoch": 1.7, - "learning_rate": 4.47946884885299e-05, - "loss": 0.004, + "epoch": 0.87, + "learning_rate": 0.00016887767930509796, + "loss": 0.0142, "step": 337230 }, { - "epoch": 1.7, - "learning_rate": 4.4787120795515887e-05, - "loss": 0.0083, + "epoch": 0.87, + "learning_rate": 0.00016887379108872648, + "loss": 0.0121, "step": 337240 }, { - "epoch": 1.7, - "learning_rate": 4.4779553102501875e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016886990287235502, + "loss": 0.0133, "step": 337250 }, { - "epoch": 1.7, - "learning_rate": 4.477198540948787e-05, - "loss": 0.0072, + "epoch": 0.87, + "learning_rate": 0.00016886601465598359, + "loss": 0.0126, "step": 337260 }, { - "epoch": 1.7, - "learning_rate": 4.476441771647386e-05, - "loss": 0.0081, + "epoch": 0.87, + "learning_rate": 0.0001688621264396121, + "loss": 0.0168, "step": 337270 }, { - "epoch": 1.7, - "learning_rate": 4.4756850023459846e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016885823822324061, + "loss": 0.0154, "step": 337280 }, { - "epoch": 1.7, - "learning_rate": 4.4749282330445834e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016885435000686916, + "loss": 0.0134, "step": 337290 }, { - "epoch": 1.7, - "learning_rate": 4.474171463743183e-05, - "loss": 0.0052, + "epoch": 0.87, + "learning_rate": 0.00016885046179049773, + "loss": 0.0104, "step": 337300 }, { - "epoch": 1.7, - "learning_rate": 4.473414694441782e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016884657357412624, + "loss": 0.0119, "step": 337310 }, { - "epoch": 1.7, - "learning_rate": 4.47265792514038e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016884268535775478, + "loss": 0.0167, "step": 337320 }, { - "epoch": 1.7, - "learning_rate": 4.471901155838979e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.0001688387971413833, + "loss": 0.0156, "step": 337330 }, { - "epoch": 1.7, - "learning_rate": 4.4711443865375776e-05, - "loss": 0.0058, + "epoch": 0.87, + "learning_rate": 0.00016883490892501186, + "loss": 0.0113, "step": 337340 }, { - "epoch": 1.7, - "learning_rate": 4.470387617236177e-05, - "loss": 0.0075, + "epoch": 0.87, + "learning_rate": 0.00016883102070864038, + "loss": 0.0109, "step": 337350 }, { - "epoch": 1.7, - "learning_rate": 4.469630847934776e-05, - "loss": 0.0071, + "epoch": 0.87, + "learning_rate": 0.00016882713249226892, + "loss": 0.0122, "step": 337360 }, { - "epoch": 1.7, - "learning_rate": 4.468874078633375e-05, - "loss": 0.0091, + "epoch": 0.87, + "learning_rate": 0.00016882324427589744, + "loss": 0.0105, "step": 337370 }, { - "epoch": 1.7, - "learning_rate": 4.468117309331974e-05, - "loss": 0.0056, + "epoch": 0.87, + "learning_rate": 0.000168819356059526, + "loss": 0.0139, "step": 337380 }, { - "epoch": 1.7, - "learning_rate": 4.467360540030573e-05, - "loss": 0.0069, + "epoch": 0.87, + "learning_rate": 0.00016881546784315452, + "loss": 0.0128, "step": 337390 }, { - "epoch": 1.7, - "learning_rate": 4.466603770729172e-05, - "loss": 0.0068, + "epoch": 0.87, + "learning_rate": 0.00016881157962678306, + "loss": 0.0147, "step": 337400 }, { - "epoch": 1.7, - "learning_rate": 4.465847001427771e-05, - "loss": 0.0066, + "epoch": 0.87, + "learning_rate": 0.00016880769141041157, + "loss": 0.0135, "step": 337410 }, { - "epoch": 1.7, - "learning_rate": 4.46509023212637e-05, - "loss": 0.0051, + "epoch": 0.87, + "learning_rate": 0.00016880380319404014, + "loss": 0.012, "step": 337420 }, { - "epoch": 1.7, - "learning_rate": 4.464333462824969e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016879991497766866, + "loss": 0.0123, "step": 337430 }, { - "epoch": 1.7, - "learning_rate": 4.463576693523568e-05, - "loss": 0.0064, + "epoch": 0.87, + "learning_rate": 0.0001687960267612972, + "loss": 0.0123, "step": 337440 }, { - "epoch": 1.7, - "learning_rate": 4.4628199242221666e-05, - "loss": 0.0078, + "epoch": 0.87, + "learning_rate": 0.00016879213854492571, + "loss": 0.0133, "step": 337450 }, { - "epoch": 1.7, - "learning_rate": 4.462063154920766e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016878825032855426, + "loss": 0.0127, "step": 337460 }, { - "epoch": 1.7, - "learning_rate": 4.461306385619365e-05, - "loss": 0.0077, + "epoch": 0.87, + "learning_rate": 0.00016878436211218282, + "loss": 0.0116, "step": 337470 }, { - "epoch": 1.7, - "learning_rate": 4.460549616317964e-05, - "loss": 0.0059, + "epoch": 0.87, + "learning_rate": 0.00016878047389581134, + "loss": 0.0157, "step": 337480 }, { - "epoch": 1.7, - "learning_rate": 4.4597928470165626e-05, - "loss": 0.0067, + "epoch": 0.87, + "learning_rate": 0.00016877658567943988, + "loss": 0.0121, "step": 337490 }, { - "epoch": 1.7, - "learning_rate": 4.459036077715162e-05, - "loss": 0.0036, + "epoch": 0.87, + "learning_rate": 0.0001687726974630684, + "loss": 0.0178, "step": 337500 }, { - "epoch": 1.7, - "learning_rate": 4.458279308413761e-05, - "loss": 0.0088, + "epoch": 0.87, + "learning_rate": 0.00016876880924669696, + "loss": 0.0099, "step": 337510 }, { - "epoch": 1.7, - "learning_rate": 4.45752253911236e-05, - "loss": 0.0046, + "epoch": 0.87, + "learning_rate": 0.00016876492103032548, + "loss": 0.012, "step": 337520 }, { - "epoch": 1.7, - "learning_rate": 4.4567657698109586e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.00016876103281395402, + "loss": 0.0188, "step": 337530 }, { - "epoch": 1.7, - "learning_rate": 4.456009000509558e-05, - "loss": 0.0055, + "epoch": 0.87, + "learning_rate": 0.00016875714459758253, + "loss": 0.0174, "step": 337540 }, { - "epoch": 1.7, - "learning_rate": 4.455252231208157e-05, - "loss": 0.006, + "epoch": 0.87, + "learning_rate": 0.0001687532563812111, + "loss": 0.0129, "step": 337550 }, { - "epoch": 1.7, - "learning_rate": 4.454495461906756e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016874936816483962, + "loss": 0.0254, "step": 337560 }, { - "epoch": 1.7, - "learning_rate": 4.4537386926053545e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016874547994846816, + "loss": 0.0116, "step": 337570 }, { - "epoch": 1.7, - "learning_rate": 4.452981923303954e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016874159173209667, + "loss": 0.0124, "step": 337580 }, { - "epoch": 1.7, - "learning_rate": 4.452225154002553e-05, - "loss": 0.0047, + "epoch": 0.88, + "learning_rate": 0.00016873770351572524, + "loss": 0.0121, "step": 337590 }, { - "epoch": 1.7, - "learning_rate": 4.451468384701152e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016873381529935376, + "loss": 0.0141, "step": 337600 }, { - "epoch": 1.7, - "learning_rate": 4.4507116153997505e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.0001687299270829823, + "loss": 0.0132, "step": 337610 }, { - "epoch": 1.7, - "learning_rate": 4.44995484609835e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016872603886661081, + "loss": 0.0148, "step": 337620 }, { - "epoch": 1.7, - "learning_rate": 4.449198076796949e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016872215065023938, + "loss": 0.0093, "step": 337630 }, { - "epoch": 1.7, - "learning_rate": 4.448441307495547e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016871826243386792, + "loss": 0.0147, "step": 337640 }, { - "epoch": 1.7, - "learning_rate": 4.447684538194146e-05, - "loss": 0.0088, + "epoch": 0.88, + "learning_rate": 0.00016871437421749644, + "loss": 0.0124, "step": 337650 }, { - "epoch": 1.7, - "learning_rate": 4.4469277688927446e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.00016871048600112498, + "loss": 0.0108, "step": 337660 }, { - "epoch": 1.7, - "learning_rate": 4.446170999591344e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016870659778475352, + "loss": 0.0128, "step": 337670 }, { - "epoch": 1.7, - "learning_rate": 4.445414230289943e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016870270956838206, + "loss": 0.0128, "step": 337680 }, { - "epoch": 1.7, - "learning_rate": 4.444657460988542e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016869882135201058, + "loss": 0.0141, "step": 337690 }, { - "epoch": 1.7, - "learning_rate": 4.4439006916871406e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016869493313563912, + "loss": 0.0128, "step": 337700 }, { - "epoch": 1.7, - "learning_rate": 4.44314392238574e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016869104491926763, + "loss": 0.0115, "step": 337710 }, { - "epoch": 1.7, - "learning_rate": 4.442387153084339e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.0001686871567028962, + "loss": 0.0115, "step": 337720 }, { - "epoch": 1.7, - "learning_rate": 4.441630383782938e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016868326848652472, + "loss": 0.012, "step": 337730 }, { - "epoch": 1.7, - "learning_rate": 4.4408736144815365e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016867938027015326, + "loss": 0.0118, "step": 337740 }, { - "epoch": 1.7, - "learning_rate": 4.440116845180136e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016867549205378177, + "loss": 0.0113, "step": 337750 }, { - "epoch": 1.7, - "learning_rate": 4.439360075878735e-05, - "loss": 0.0089, + "epoch": 0.88, + "learning_rate": 0.00016867160383741034, + "loss": 0.0128, "step": 337760 }, { - "epoch": 1.7, - "learning_rate": 4.438603306577334e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016866771562103886, + "loss": 0.0105, "step": 337770 }, { - "epoch": 1.7, - "learning_rate": 4.4378465372759325e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.0001686638274046674, + "loss": 0.015, "step": 337780 }, { - "epoch": 1.7, - "learning_rate": 4.437089767974532e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.0001686599391882959, + "loss": 0.0137, "step": 337790 }, { - "epoch": 1.7, - "learning_rate": 4.436332998673131e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016865605097192448, + "loss": 0.0147, "step": 337800 }, { - "epoch": 1.7, - "learning_rate": 4.4355762293717296e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016865216275555302, + "loss": 0.0119, "step": 337810 }, { - "epoch": 1.7, - "learning_rate": 4.4348194600703285e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016864827453918154, + "loss": 0.0132, "step": 337820 }, { - "epoch": 1.7, - "learning_rate": 4.434062690768928e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016864438632281005, + "loss": 0.0195, "step": 337830 }, { - "epoch": 1.7, - "learning_rate": 4.433305921467527e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016864049810643862, + "loss": 0.0134, "step": 337840 }, { - "epoch": 1.7, - "learning_rate": 4.4325491521661256e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016863660989006716, + "loss": 0.0162, "step": 337850 }, { - "epoch": 1.7, - "learning_rate": 4.431792382864725e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016863272167369568, + "loss": 0.0128, "step": 337860 }, { - "epoch": 1.7, - "learning_rate": 4.431035613563324e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016862883345732422, + "loss": 0.0129, "step": 337870 }, { - "epoch": 1.7, - "learning_rate": 4.430278844261923e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016862494524095276, + "loss": 0.0143, "step": 337880 }, { - "epoch": 1.7, - "learning_rate": 4.4295220749605216e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.0001686210570245813, + "loss": 0.0091, "step": 337890 }, { - "epoch": 1.7, - "learning_rate": 4.428765305659121e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016861716880820982, + "loss": 0.0391, "step": 337900 }, { - "epoch": 1.7, - "learning_rate": 4.42800853635772e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016861328059183836, + "loss": 0.0178, "step": 337910 }, { - "epoch": 1.7, - "learning_rate": 4.427251767056319e-05, - "loss": 0.0091, + "epoch": 0.88, + "learning_rate": 0.0001686093923754669, + "loss": 0.0135, "step": 337920 }, { - "epoch": 1.7, - "learning_rate": 4.4264949977549175e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016860550415909544, + "loss": 0.0155, "step": 337930 }, { - "epoch": 1.7, - "learning_rate": 4.425738228453517e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016860161594272396, + "loss": 0.0129, "step": 337940 }, { - "epoch": 1.7, - "learning_rate": 4.424981459152115e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001685977277263525, + "loss": 0.013, "step": 337950 }, { - "epoch": 1.71, - "learning_rate": 4.424224689850714e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.000168593839509981, + "loss": 0.0118, "step": 337960 }, { - "epoch": 1.71, - "learning_rate": 4.423467920549313e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016858995129360958, + "loss": 0.0176, "step": 337970 }, { - "epoch": 1.71, - "learning_rate": 4.4227111512479116e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.0001685860630772381, + "loss": 0.0116, "step": 337980 }, { - "epoch": 1.71, - "learning_rate": 4.421954381946511e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.00016858217486086664, + "loss": 0.0145, "step": 337990 }, { - "epoch": 1.71, - "learning_rate": 4.42119761264511e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016857828664449515, + "loss": 0.0145, "step": 338000 }, { - "epoch": 1.71, - "eval_cer": 0.9144197953046413, - "eval_loss": 0.004835808649659157, - "eval_runtime": 116.338, - "eval_samples_per_second": 17.191, - "eval_steps_per_second": 4.298, + "epoch": 0.88, + "eval_cer": 0.8817600714374692, + "eval_loss": 0.00871712900698185, + "eval_runtime": 107.6623, + "eval_samples_per_second": 18.577, + "eval_steps_per_second": 4.644, "step": 338000 }, { - "epoch": 1.71, - "learning_rate": 4.420440843343709e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016857439842812372, + "loss": 0.0126, "step": 338010 }, { - "epoch": 1.71, - "learning_rate": 4.4196840740423076e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016857051021175226, + "loss": 0.0117, "step": 338020 }, { - "epoch": 1.71, - "learning_rate": 4.418927304740907e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016856662199538078, + "loss": 0.0143, "step": 338030 }, { - "epoch": 1.71, - "learning_rate": 4.418170535439506e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016856273377900932, + "loss": 0.0136, "step": 338040 }, { - "epoch": 1.71, - "learning_rate": 4.417413766138105e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016855884556263786, + "loss": 0.0121, "step": 338050 }, { - "epoch": 1.71, - "learning_rate": 4.4166569968367036e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.0001685549573462664, + "loss": 0.0123, "step": 338060 }, { - "epoch": 1.71, - "learning_rate": 4.415900227535303e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016855106912989492, + "loss": 0.0137, "step": 338070 }, { - "epoch": 1.71, - "learning_rate": 4.415143458233902e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016854718091352346, + "loss": 0.0165, "step": 338080 }, { - "epoch": 1.71, - "learning_rate": 4.414386688932501e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.000168543292697152, + "loss": 0.0132, "step": 338090 }, { - "epoch": 1.71, - "learning_rate": 4.4136299196310995e-05, - "loss": 0.0043, + "epoch": 0.88, + "learning_rate": 0.00016853940448078054, + "loss": 0.0137, "step": 338100 }, { - "epoch": 1.71, - "learning_rate": 4.412873150329699e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016853551626440906, + "loss": 0.0127, "step": 338110 }, { - "epoch": 1.71, - "learning_rate": 4.412116381028298e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.0001685316280480376, + "loss": 0.0104, "step": 338120 }, { - "epoch": 1.71, - "learning_rate": 4.411359611726897e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016852773983166617, + "loss": 0.0123, "step": 338130 }, { - "epoch": 1.71, - "learning_rate": 4.4106028424254955e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016852385161529468, + "loss": 0.0105, "step": 338140 }, { - "epoch": 1.71, - "learning_rate": 4.409846073124095e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.0001685199633989232, + "loss": 0.0148, "step": 338150 }, { - "epoch": 1.71, - "learning_rate": 4.409089303822694e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016851607518255174, + "loss": 0.0122, "step": 338160 }, { - "epoch": 1.71, - "learning_rate": 4.4083325345212926e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016851218696618025, + "loss": 0.0113, "step": 338170 }, { - "epoch": 1.71, - "learning_rate": 4.4075757652198915e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016850829874980882, + "loss": 0.0119, "step": 338180 }, { - "epoch": 1.71, - "learning_rate": 4.406818995918491e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016850441053343736, + "loss": 0.0136, "step": 338190 }, { - "epoch": 1.71, - "learning_rate": 4.40606222661709e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016850052231706588, + "loss": 0.0108, "step": 338200 }, { - "epoch": 1.71, - "learning_rate": 4.4053054573156886e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016849663410069442, + "loss": 0.0174, "step": 338210 }, { - "epoch": 1.71, - "learning_rate": 4.4045486880142874e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016849274588432296, + "loss": 0.0125, "step": 338220 }, { - "epoch": 1.71, - "learning_rate": 4.403791918712887e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.0001684888576679515, + "loss": 0.0109, "step": 338230 }, { - "epoch": 1.71, - "learning_rate": 4.403035149411486e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016848496945158002, + "loss": 0.0103, "step": 338240 }, { - "epoch": 1.71, - "learning_rate": 4.4022783801100846e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016848108123520856, + "loss": 0.0116, "step": 338250 }, { - "epoch": 1.71, - "learning_rate": 4.401521610808683e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.0001684771930188371, + "loss": 0.0112, "step": 338260 }, { - "epoch": 1.71, - "learning_rate": 4.4007648415072815e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016847330480246564, + "loss": 0.0156, "step": 338270 }, { - "epoch": 1.71, - "learning_rate": 4.400008072205881e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016846941658609416, + "loss": 0.0199, "step": 338280 }, { - "epoch": 1.71, - "learning_rate": 4.39925130290448e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001684655283697227, + "loss": 0.0133, "step": 338290 }, { - "epoch": 1.71, - "learning_rate": 4.398494533603079e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016846164015335124, + "loss": 0.0134, "step": 338300 }, { - "epoch": 1.71, - "learning_rate": 4.3977377643016775e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016845775193697978, + "loss": 0.0154, "step": 338310 }, { - "epoch": 1.71, - "learning_rate": 4.396980995000277e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.0001684538637206083, + "loss": 0.0149, "step": 338320 }, { - "epoch": 1.71, - "learning_rate": 4.396224225698876e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016844997550423684, + "loss": 0.0161, "step": 338330 }, { - "epoch": 1.71, - "learning_rate": 4.3954674563974747e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.0001684460872878654, + "loss": 0.0123, "step": 338340 }, { - "epoch": 1.71, - "learning_rate": 4.394710687096074e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016844219907149392, + "loss": 0.0175, "step": 338350 }, { - "epoch": 1.71, - "learning_rate": 4.393953917794673e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016843831085512246, + "loss": 0.0191, "step": 338360 }, { - "epoch": 1.71, - "learning_rate": 4.393197148493272e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016843442263875098, + "loss": 0.0143, "step": 338370 }, { - "epoch": 1.71, - "learning_rate": 4.3924403791918706e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016843053442237954, + "loss": 0.0113, "step": 338380 }, { - "epoch": 1.71, - "learning_rate": 4.39168360989047e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016842664620600806, + "loss": 0.0159, "step": 338390 }, { - "epoch": 1.71, - "learning_rate": 4.390926840589069e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.0001684227579896366, + "loss": 0.0132, "step": 338400 }, { - "epoch": 1.71, - "learning_rate": 4.390170071287668e-05, - "loss": 0.0039, + "epoch": 0.88, + "learning_rate": 0.00016841886977326512, + "loss": 0.0114, "step": 338410 }, { - "epoch": 1.71, - "learning_rate": 4.3894133019862666e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016841498155689366, + "loss": 0.0134, "step": 338420 }, { - "epoch": 1.71, - "learning_rate": 4.388656532684866e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001684110933405222, + "loss": 0.0244, "step": 338430 }, { - "epoch": 1.71, - "learning_rate": 4.387899763383465e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016840720512415074, + "loss": 0.0144, "step": 338440 }, { - "epoch": 1.71, - "learning_rate": 4.387142994082064e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016840331690777925, + "loss": 0.0116, "step": 338450 }, { - "epoch": 1.71, - "learning_rate": 4.3863862247806625e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.0001683994286914078, + "loss": 0.0403, "step": 338460 }, { - "epoch": 1.71, - "learning_rate": 4.385629455479262e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016839554047503634, + "loss": 0.0135, "step": 338470 }, { - "epoch": 1.71, - "learning_rate": 4.384872686177861e-05, - "loss": 0.0044, + "epoch": 0.88, + "learning_rate": 0.00016839165225866488, + "loss": 0.0094, "step": 338480 }, { - "epoch": 1.71, - "learning_rate": 4.38411591687646e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.0001683877640422934, + "loss": 0.0159, "step": 338490 }, { - "epoch": 1.71, - "learning_rate": 4.3833591475750585e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016838387582592194, + "loss": 0.0123, "step": 338500 }, { - "epoch": 1.71, - "learning_rate": 4.382602378273658e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001683799876095505, + "loss": 0.0136, "step": 338510 }, { - "epoch": 1.71, - "learning_rate": 4.381845608972257e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016837609939317902, + "loss": 0.0154, "step": 338520 }, { - "epoch": 1.71, - "learning_rate": 4.3810888396708557e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016837221117680756, + "loss": 0.0108, "step": 338530 }, { - "epoch": 1.71, - "learning_rate": 4.3803320703694545e-05, - "loss": 0.0097, + "epoch": 0.88, + "learning_rate": 0.00016836832296043608, + "loss": 0.0128, "step": 338540 }, { - "epoch": 1.71, - "learning_rate": 4.379575301068054e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016836443474406464, + "loss": 0.0156, "step": 338550 }, { - "epoch": 1.71, - "learning_rate": 4.378818531766653e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016836054652769316, + "loss": 0.0102, "step": 338560 }, { - "epoch": 1.71, - "learning_rate": 4.3780617624652516e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.0001683566583113217, + "loss": 0.0188, "step": 338570 }, { - "epoch": 1.71, - "learning_rate": 4.37730499316385e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016835277009495021, + "loss": 0.0097, "step": 338580 }, { - "epoch": 1.71, - "learning_rate": 4.3765482238624486e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016834888187857878, + "loss": 0.0168, "step": 338590 }, { - "epoch": 1.71, - "learning_rate": 4.375791454561048e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.0001683449936622073, + "loss": 0.0142, "step": 338600 }, { - "epoch": 1.71, - "learning_rate": 4.375034685259647e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016834110544583584, + "loss": 0.01, "step": 338610 }, { - "epoch": 1.71, - "learning_rate": 4.374277915958246e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016833721722946435, + "loss": 0.0145, "step": 338620 }, { - "epoch": 1.71, - "learning_rate": 4.3735211466568446e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016833332901309292, + "loss": 0.0147, "step": 338630 }, { - "epoch": 1.71, - "learning_rate": 4.372764377355444e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016832944079672144, + "loss": 0.014, "step": 338640 }, { - "epoch": 1.71, - "learning_rate": 4.372007608054043e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016832555258034998, + "loss": 0.015, "step": 338650 }, { - "epoch": 1.71, - "learning_rate": 4.371250838752642e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.0001683216643639785, + "loss": 0.0115, "step": 338660 }, { - "epoch": 1.71, - "learning_rate": 4.3704940694512405e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016831777614760704, + "loss": 0.0112, "step": 338670 }, { - "epoch": 1.71, - "learning_rate": 4.36973730014984e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001683138879312356, + "loss": 0.0134, "step": 338680 }, { - "epoch": 1.71, - "learning_rate": 4.368980530848439e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016830999971486412, + "loss": 0.0139, "step": 338690 }, { - "epoch": 1.71, - "learning_rate": 4.3682237615470377e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.00016830611149849263, + "loss": 0.0137, "step": 338700 }, { - "epoch": 1.71, - "learning_rate": 4.3674669922456365e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016830222328212117, + "loss": 0.0137, "step": 338710 }, { - "epoch": 1.71, - "learning_rate": 4.366710222944236e-05, - "loss": 0.0097, + "epoch": 0.88, + "learning_rate": 0.00016829833506574974, + "loss": 0.0138, "step": 338720 }, { - "epoch": 1.71, - "learning_rate": 4.365953453642835e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016829444684937826, + "loss": 0.0158, "step": 338730 }, { - "epoch": 1.71, - "learning_rate": 4.3651966843414336e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.0001682905586330068, + "loss": 0.0127, "step": 338740 }, { - "epoch": 1.71, - "learning_rate": 4.3644399150400324e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016828667041663531, + "loss": 0.0173, "step": 338750 }, { - "epoch": 1.71, - "learning_rate": 4.363683145738632e-05, - "loss": 0.0098, + "epoch": 0.88, + "learning_rate": 0.00016828278220026388, + "loss": 0.0105, "step": 338760 }, { - "epoch": 1.71, - "learning_rate": 4.362926376437231e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.0001682788939838924, + "loss": 0.0141, "step": 338770 }, { - "epoch": 1.71, - "learning_rate": 4.3621696071358296e-05, - "loss": 0.0088, + "epoch": 0.88, + "learning_rate": 0.00016827500576752094, + "loss": 0.013, "step": 338780 }, { - "epoch": 1.71, - "learning_rate": 4.3614128378344284e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016827111755114945, + "loss": 0.0128, "step": 338790 }, { - "epoch": 1.71, - "learning_rate": 4.360656068533028e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016826722933477802, + "loss": 0.0158, "step": 338800 }, { - "epoch": 1.71, - "learning_rate": 4.359899299231627e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016826334111840654, + "loss": 0.0131, "step": 338810 }, { - "epoch": 1.71, - "learning_rate": 4.3591425299302256e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.00016825945290203508, + "loss": 0.0111, "step": 338820 }, { - "epoch": 1.71, - "learning_rate": 4.358385760628825e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.0001682555646856636, + "loss": 0.0155, "step": 338830 }, { - "epoch": 1.71, - "learning_rate": 4.357628991327424e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016825167646929216, + "loss": 0.0162, "step": 338840 }, { - "epoch": 1.71, - "learning_rate": 4.356872222026023e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.0001682477882529207, + "loss": 0.0136, "step": 338850 }, { - "epoch": 1.71, - "learning_rate": 4.3561154527246215e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016824390003654922, + "loss": 0.0141, "step": 338860 }, { - "epoch": 1.71, - "learning_rate": 4.355358683423221e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016824001182017773, + "loss": 0.0158, "step": 338870 }, { - "epoch": 1.71, - "learning_rate": 4.35460191412182e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.0001682361236038063, + "loss": 0.0141, "step": 338880 }, { - "epoch": 1.71, - "learning_rate": 4.353845144820418e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016823223538743484, + "loss": 0.0138, "step": 338890 }, { - "epoch": 1.71, - "learning_rate": 4.353088375519017e-05, - "loss": 0.0038, + "epoch": 0.88, + "learning_rate": 0.00016822834717106336, + "loss": 0.0143, "step": 338900 }, { - "epoch": 1.71, - "learning_rate": 4.3523316062176156e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001682244589546919, + "loss": 0.0147, "step": 338910 }, { - "epoch": 1.71, - "learning_rate": 4.351574836916215e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.0001682205707383204, + "loss": 0.0146, "step": 338920 }, { - "epoch": 1.71, - "learning_rate": 4.350818067614814e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016821668252194898, + "loss": 0.0159, "step": 338930 }, { - "epoch": 1.71, - "learning_rate": 4.350061298313413e-05, - "loss": 0.0044, + "epoch": 0.88, + "learning_rate": 0.0001682127943055775, + "loss": 0.0146, "step": 338940 }, { - "epoch": 1.71, - "learning_rate": 4.3493045290120116e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016820890608920604, + "loss": 0.0192, "step": 338950 }, { - "epoch": 1.71, - "learning_rate": 4.348547759710611e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016820501787283455, + "loss": 0.0107, "step": 338960 }, { - "epoch": 1.71, - "learning_rate": 4.34779099040921e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016820112965646312, + "loss": 0.0151, "step": 338970 }, { - "epoch": 1.71, - "learning_rate": 4.347034221107809e-05, - "loss": 0.0043, + "epoch": 0.88, + "learning_rate": 0.00016819724144009164, + "loss": 0.0132, "step": 338980 }, { - "epoch": 1.71, - "learning_rate": 4.3462774518064076e-05, - "loss": 0.0088, + "epoch": 0.88, + "learning_rate": 0.00016819335322372018, + "loss": 0.0148, "step": 338990 }, { - "epoch": 1.71, - "learning_rate": 4.345520682505007e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.0001681894650073487, + "loss": 0.0153, "step": 339000 }, { - "epoch": 1.71, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.0047121611423790455, - "eval_runtime": 116.4797, - "eval_samples_per_second": 17.17, - "eval_steps_per_second": 4.293, + "epoch": 0.88, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.008869285695254803, + "eval_runtime": 107.8634, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, "step": 339000 }, { - "epoch": 1.71, - "learning_rate": 4.344763913203606e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.00016818557679097726, + "loss": 0.0173, "step": 339010 }, { - "epoch": 1.71, - "learning_rate": 4.344007143902205e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016818168857460578, + "loss": 0.0122, "step": 339020 }, { - "epoch": 1.71, - "learning_rate": 4.3432503746008035e-05, - "loss": 0.0096, + "epoch": 0.88, + "learning_rate": 0.00016817780035823432, + "loss": 0.0158, "step": 339030 }, { - "epoch": 1.71, - "learning_rate": 4.342493605299403e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016817391214186283, + "loss": 0.0123, "step": 339040 }, { - "epoch": 1.71, - "learning_rate": 4.341736835998002e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.0001681700239254914, + "loss": 0.015, "step": 339050 }, { - "epoch": 1.71, - "learning_rate": 4.340980066696601e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016816613570911994, + "loss": 0.0122, "step": 339060 }, { - "epoch": 1.71, - "learning_rate": 4.3402232973951995e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016816224749274846, + "loss": 0.0133, "step": 339070 }, { - "epoch": 1.71, - "learning_rate": 4.339466528093799e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.000168158359276377, + "loss": 0.012, "step": 339080 }, { - "epoch": 1.71, - "learning_rate": 4.338709758792398e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016815447106000554, + "loss": 0.0116, "step": 339090 }, { - "epoch": 1.71, - "learning_rate": 4.3379529894909966e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016815058284363408, + "loss": 0.0104, "step": 339100 }, { - "epoch": 1.71, - "learning_rate": 4.3371962201895955e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001681466946272626, + "loss": 0.0137, "step": 339110 }, { - "epoch": 1.71, - "learning_rate": 4.336439450888195e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016814280641089114, + "loss": 0.0111, "step": 339120 }, { - "epoch": 1.71, - "learning_rate": 4.335682681586794e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016813891819451968, + "loss": 0.0151, "step": 339130 }, { - "epoch": 1.71, - "learning_rate": 4.3349259122853926e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016813502997814822, + "loss": 0.0188, "step": 339140 }, { - "epoch": 1.71, - "learning_rate": 4.3341691429839914e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016813114176177674, + "loss": 0.0175, "step": 339150 }, { - "epoch": 1.71, - "learning_rate": 4.333412373682591e-05, - "loss": 0.0088, + "epoch": 0.88, + "learning_rate": 0.00016812725354540528, + "loss": 0.011, "step": 339160 }, { - "epoch": 1.71, - "learning_rate": 4.33265560438119e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.0001681233653290338, + "loss": 0.0112, "step": 339170 }, { - "epoch": 1.71, - "learning_rate": 4.3318988350797886e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016811947711266236, + "loss": 0.0142, "step": 339180 }, { - "epoch": 1.71, - "learning_rate": 4.3311420657783874e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016811558889629088, + "loss": 0.0147, "step": 339190 }, { - "epoch": 1.71, - "learning_rate": 4.330385296476987e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016811170067991942, + "loss": 0.0174, "step": 339200 }, { - "epoch": 1.71, - "learning_rate": 4.329628527175585e-05, - "loss": 0.0048, + "epoch": 0.88, + "learning_rate": 0.00016810781246354793, + "loss": 0.0137, "step": 339210 }, { - "epoch": 1.71, - "learning_rate": 4.328871757874184e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.0001681039242471765, + "loss": 0.013, "step": 339220 }, { - "epoch": 1.71, - "learning_rate": 4.328114988572783e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016810003603080504, + "loss": 0.0112, "step": 339230 }, { - "epoch": 1.71, - "learning_rate": 4.3273582192713815e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016809614781443356, + "loss": 0.0129, "step": 339240 }, { - "epoch": 1.71, - "learning_rate": 4.326601449969981e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001680922595980621, + "loss": 0.0143, "step": 339250 }, { - "epoch": 1.71, - "learning_rate": 4.32584468066858e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016808837138169064, + "loss": 0.0131, "step": 339260 }, { - "epoch": 1.71, - "learning_rate": 4.3250879113671786e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016808448316531918, + "loss": 0.0147, "step": 339270 }, { - "epoch": 1.71, - "learning_rate": 4.3243311420657775e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.0001680805949489477, + "loss": 0.0148, "step": 339280 }, { - "epoch": 1.71, - "learning_rate": 4.323574372764377e-05, - "loss": 0.0035, + "epoch": 0.88, + "learning_rate": 0.00016807670673257624, + "loss": 0.0166, "step": 339290 }, { - "epoch": 1.71, - "learning_rate": 4.322817603462976e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016807281851620478, + "loss": 0.0118, "step": 339300 }, { - "epoch": 1.71, - "learning_rate": 4.3220608341615746e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016806893029983332, + "loss": 0.0125, "step": 339310 }, { - "epoch": 1.71, - "learning_rate": 4.321304064860174e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016806504208346184, + "loss": 0.0122, "step": 339320 }, { - "epoch": 1.71, - "learning_rate": 4.320547295558773e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016806115386709038, + "loss": 0.0158, "step": 339330 }, { - "epoch": 1.71, - "learning_rate": 4.319790526257372e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016805726565071892, + "loss": 0.0173, "step": 339340 }, { - "epoch": 1.71, - "learning_rate": 4.3190337569559706e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016805337743434746, + "loss": 0.012, "step": 339350 }, { - "epoch": 1.71, - "learning_rate": 4.31827698765457e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016804948921797597, + "loss": 0.0126, "step": 339360 }, { - "epoch": 1.71, - "learning_rate": 4.317520218353169e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016804560100160452, + "loss": 0.0156, "step": 339370 }, { - "epoch": 1.71, - "learning_rate": 4.316763449051768e-05, - "loss": 0.0047, + "epoch": 0.88, + "learning_rate": 0.00016804171278523308, + "loss": 0.0125, "step": 339380 }, { - "epoch": 1.71, - "learning_rate": 4.3160066797503665e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.0001680378245688616, + "loss": 0.0121, "step": 339390 }, { - "epoch": 1.71, - "learning_rate": 4.315249910448966e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016803393635249014, + "loss": 0.0102, "step": 339400 }, { - "epoch": 1.71, - "learning_rate": 4.314493141147565e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.00016803004813611866, + "loss": 0.0105, "step": 339410 }, { - "epoch": 1.71, - "learning_rate": 4.313736371846164e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016802615991974717, + "loss": 0.011, "step": 339420 }, { - "epoch": 1.71, - "learning_rate": 4.3129796025447625e-05, - "loss": 0.0042, + "epoch": 0.88, + "learning_rate": 0.00016802227170337574, + "loss": 0.012, "step": 339430 }, { - "epoch": 1.71, - "learning_rate": 4.312222833243362e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016801838348700428, + "loss": 0.0117, "step": 339440 }, { - "epoch": 1.71, - "learning_rate": 4.311466063941961e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.0001680144952706328, + "loss": 0.014, "step": 339450 }, { - "epoch": 1.71, - "learning_rate": 4.3107092946405596e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016801060705426134, + "loss": 0.0115, "step": 339460 }, { - "epoch": 1.71, - "learning_rate": 4.3099525253391585e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016800671883788988, + "loss": 0.0125, "step": 339470 }, { - "epoch": 1.71, - "learning_rate": 4.309195756037758e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016800283062151842, + "loss": 0.0148, "step": 339480 }, { - "epoch": 1.71, - "learning_rate": 4.308438986736357e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.00016799894240514693, + "loss": 0.014, "step": 339490 }, { - "epoch": 1.71, - "learning_rate": 4.3076822174349556e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016799505418877548, + "loss": 0.0135, "step": 339500 }, { - "epoch": 1.71, - "learning_rate": 4.3069254481335544e-05, - "loss": 0.0092, + "epoch": 0.88, + "learning_rate": 0.00016799116597240402, + "loss": 0.0175, "step": 339510 }, { - "epoch": 1.71, - "learning_rate": 4.3061686788321526e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016798727775603256, + "loss": 0.0127, "step": 339520 }, { - "epoch": 1.71, - "learning_rate": 4.305411909530752e-05, - "loss": 0.0074, + "epoch": 0.88, + "learning_rate": 0.00016798338953966107, + "loss": 0.0119, "step": 339530 }, { - "epoch": 1.71, - "learning_rate": 4.304655140229351e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016797950132328962, + "loss": 0.0182, "step": 339540 }, { - "epoch": 1.71, - "learning_rate": 4.30389837092795e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.00016797561310691818, + "loss": 0.0123, "step": 339550 }, { - "epoch": 1.71, - "learning_rate": 4.3031416016265485e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.0001679717248905467, + "loss": 0.0097, "step": 339560 }, { - "epoch": 1.71, - "learning_rate": 4.302384832325148e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.0001679678366741752, + "loss": 0.0162, "step": 339570 }, { - "epoch": 1.71, - "learning_rate": 4.301628063023747e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016796394845780376, + "loss": 0.015, "step": 339580 }, { - "epoch": 1.71, - "learning_rate": 4.300871293722346e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016796006024143232, + "loss": 0.0108, "step": 339590 }, { - "epoch": 1.71, - "learning_rate": 4.3001145244209445e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016795617202506084, + "loss": 0.0134, "step": 339600 }, { - "epoch": 1.71, - "learning_rate": 4.299357755119544e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016795228380868938, + "loss": 0.018, "step": 339610 }, { - "epoch": 1.71, - "learning_rate": 4.298600985818143e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.0001679483955923179, + "loss": 0.0109, "step": 339620 }, { - "epoch": 1.71, - "learning_rate": 4.2978442165167416e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.00016794450737594646, + "loss": 0.0114, "step": 339630 }, { - "epoch": 1.71, - "learning_rate": 4.2970874472153405e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016794061915957498, + "loss": 0.0148, "step": 339640 }, { - "epoch": 1.71, - "learning_rate": 4.29633067791394e-05, - "loss": 0.0093, + "epoch": 0.88, + "learning_rate": 0.00016793673094320352, + "loss": 0.0118, "step": 339650 }, { - "epoch": 1.71, - "learning_rate": 4.295573908612539e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016793284272683203, + "loss": 0.014, "step": 339660 }, { - "epoch": 1.71, - "learning_rate": 4.2948171393111376e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016792895451046058, + "loss": 0.0155, "step": 339670 }, { - "epoch": 1.71, - "learning_rate": 4.2940603700097364e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016792506629408912, + "loss": 0.0146, "step": 339680 }, { - "epoch": 1.71, - "learning_rate": 4.293303600708336e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016792117807771766, + "loss": 0.0127, "step": 339690 }, { - "epoch": 1.71, - "learning_rate": 4.292546831406935e-05, - "loss": 0.0089, + "epoch": 0.88, + "learning_rate": 0.00016791728986134617, + "loss": 0.0124, "step": 339700 }, { - "epoch": 1.71, - "learning_rate": 4.2917900621055336e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016791340164497472, + "loss": 0.0116, "step": 339710 }, { - "epoch": 1.71, - "learning_rate": 4.2910332928041324e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016790951342860328, + "loss": 0.0137, "step": 339720 }, { - "epoch": 1.71, - "learning_rate": 4.290276523502732e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.0001679056252122318, + "loss": 0.015, "step": 339730 }, { - "epoch": 1.71, - "learning_rate": 4.289519754201331e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.0001679017369958603, + "loss": 0.0117, "step": 339740 }, { - "epoch": 1.71, - "learning_rate": 4.2887629848999295e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016789784877948885, + "loss": 0.013, "step": 339750 }, { - "epoch": 1.71, - "learning_rate": 4.2880062155985284e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016789396056311742, + "loss": 0.0139, "step": 339760 }, { - "epoch": 1.71, - "learning_rate": 4.287249446297128e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016789007234674594, + "loss": 0.0106, "step": 339770 }, { - "epoch": 1.71, - "learning_rate": 4.286492676995727e-05, - "loss": 0.0077, + "epoch": 0.88, + "learning_rate": 0.00016788618413037448, + "loss": 0.0144, "step": 339780 }, { - "epoch": 1.71, - "learning_rate": 4.2857359076943255e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.000167882295914003, + "loss": 0.0125, "step": 339790 }, { - "epoch": 1.71, - "learning_rate": 4.284979138392925e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016787840769763156, + "loss": 0.0155, "step": 339800 }, { - "epoch": 1.71, - "learning_rate": 4.284222369091524e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.00016787451948126008, + "loss": 0.0164, "step": 339810 }, { - "epoch": 1.71, - "learning_rate": 4.2834655997901227e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016787063126488862, + "loss": 0.0131, "step": 339820 }, { - "epoch": 1.71, - "learning_rate": 4.2827088304887215e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016786674304851713, + "loss": 0.0143, "step": 339830 }, { - "epoch": 1.71, - "learning_rate": 4.2819520611873196e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.0001678628548321457, + "loss": 0.0135, "step": 339840 }, { - "epoch": 1.71, - "learning_rate": 4.281195291885919e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016785896661577422, + "loss": 0.0142, "step": 339850 }, { - "epoch": 1.71, - "learning_rate": 4.280438522584518e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016785507839940276, + "loss": 0.0104, "step": 339860 }, { - "epoch": 1.71, - "learning_rate": 4.279681753283117e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016785119018303127, + "loss": 0.0136, "step": 339870 }, { - "epoch": 1.71, - "learning_rate": 4.2789249839817156e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016784730196665984, + "loss": 0.0192, "step": 339880 }, { - "epoch": 1.71, - "learning_rate": 4.278168214680315e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016784341375028836, + "loss": 0.0146, "step": 339890 }, { - "epoch": 1.71, - "learning_rate": 4.277411445378914e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.0001678395255339169, + "loss": 0.0134, "step": 339900 }, { - "epoch": 1.71, - "learning_rate": 4.276654676077513e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.0001678356373175454, + "loss": 0.0129, "step": 339910 }, { - "epoch": 1.71, - "learning_rate": 4.2758979067761115e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016783174910117395, + "loss": 0.0176, "step": 339920 }, { - "epoch": 1.71, - "learning_rate": 4.275141137474711e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016782786088480252, + "loss": 0.0114, "step": 339930 }, { - "epoch": 1.72, - "learning_rate": 4.27438436817331e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016782397266843104, + "loss": 0.0148, "step": 339940 }, { - "epoch": 1.72, - "learning_rate": 4.273627598871909e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.00016782008445205958, + "loss": 0.0123, "step": 339950 }, { - "epoch": 1.72, - "learning_rate": 4.2728708295705075e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.0001678161962356881, + "loss": 0.0111, "step": 339960 }, { - "epoch": 1.72, - "learning_rate": 4.272114060269107e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016781230801931666, + "loss": 0.0134, "step": 339970 }, { - "epoch": 1.72, - "learning_rate": 4.271357290967706e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016780841980294518, + "loss": 0.0164, "step": 339980 }, { - "epoch": 1.72, - "learning_rate": 4.2706005216663047e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016780453158657372, + "loss": 0.0138, "step": 339990 }, { - "epoch": 1.72, - "learning_rate": 4.2698437523649035e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016780064337020223, + "loss": 0.0115, "step": 340000 }, { - "epoch": 1.72, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004758994095027447, - "eval_runtime": 116.784, - "eval_samples_per_second": 17.126, - "eval_steps_per_second": 4.281, + "epoch": 0.88, + "eval_cer": 0.881751673615864, + "eval_loss": 0.008945505134761333, + "eval_runtime": 107.8028, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, "step": 340000 }, { - "epoch": 1.72, - "learning_rate": 4.269086983063503e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.0001677967551538308, + "loss": 0.0123, "step": 340010 }, { - "epoch": 1.72, - "learning_rate": 4.268330213762102e-05, - "loss": 0.009, + "epoch": 0.88, + "learning_rate": 0.00016779286693745932, + "loss": 0.0096, "step": 340020 }, { - "epoch": 1.72, - "learning_rate": 4.2675734444607006e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016778897872108786, + "loss": 0.0126, "step": 340030 }, { - "epoch": 1.72, - "learning_rate": 4.2668166751592994e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016778509050471637, + "loss": 0.0152, "step": 340040 }, { - "epoch": 1.72, - "learning_rate": 4.266059905857899e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016778120228834494, + "loss": 0.0208, "step": 340050 }, { - "epoch": 1.72, - "learning_rate": 4.265303136556498e-05, - "loss": 0.0078, + "epoch": 0.88, + "learning_rate": 0.00016777731407197346, + "loss": 0.0112, "step": 340060 }, { - "epoch": 1.72, - "learning_rate": 4.2645463672550966e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.000167773425855602, + "loss": 0.0157, "step": 340070 }, { - "epoch": 1.72, - "learning_rate": 4.2637895979536954e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.0001677695376392305, + "loss": 0.0103, "step": 340080 }, { - "epoch": 1.72, - "learning_rate": 4.263032828652295e-05, - "loss": 0.0083, + "epoch": 0.88, + "learning_rate": 0.00016776564942285908, + "loss": 0.0134, "step": 340090 }, { - "epoch": 1.72, - "learning_rate": 4.262276059350894e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016776176120648762, + "loss": 0.0144, "step": 340100 }, { - "epoch": 1.72, - "learning_rate": 4.2615192900494926e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016775787299011614, + "loss": 0.01, "step": 340110 }, { - "epoch": 1.72, - "learning_rate": 4.2607625207480914e-05, - "loss": 0.0039, + "epoch": 0.88, + "learning_rate": 0.00016775398477374468, + "loss": 0.0135, "step": 340120 }, { - "epoch": 1.72, - "learning_rate": 4.260005751446691e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016775009655737322, + "loss": 0.0104, "step": 340130 }, { - "epoch": 1.72, - "learning_rate": 4.25924898214529e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016774620834100176, + "loss": 0.0187, "step": 340140 }, { - "epoch": 1.72, - "learning_rate": 4.258492212843888e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016774232012463028, + "loss": 0.0113, "step": 340150 }, { - "epoch": 1.72, - "learning_rate": 4.2577354435424867e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.00016773843190825882, + "loss": 0.0129, "step": 340160 }, { - "epoch": 1.72, - "learning_rate": 4.2569786742410855e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016773454369188733, + "loss": 0.0095, "step": 340170 }, { - "epoch": 1.72, - "learning_rate": 4.256221904939685e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.0001677306554755159, + "loss": 0.0221, "step": 340180 }, { - "epoch": 1.72, - "learning_rate": 4.255465135638284e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016772676725914442, + "loss": 0.0124, "step": 340190 }, { - "epoch": 1.72, - "learning_rate": 4.2547083663368826e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016772287904277296, + "loss": 0.0126, "step": 340200 }, { - "epoch": 1.72, - "learning_rate": 4.2539515970354814e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016771899082640147, + "loss": 0.0146, "step": 340210 }, { - "epoch": 1.72, - "learning_rate": 4.253194827734081e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016771510261003004, + "loss": 0.0145, "step": 340220 }, { - "epoch": 1.72, - "learning_rate": 4.25243805843268e-05, - "loss": 0.0036, + "epoch": 0.88, + "learning_rate": 0.00016771121439365855, + "loss": 0.0169, "step": 340230 }, { - "epoch": 1.72, - "learning_rate": 4.2516812891312786e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.0001677073261772871, + "loss": 0.0127, "step": 340240 }, { - "epoch": 1.72, - "learning_rate": 4.2509245198298774e-05, - "loss": 0.0046, + "epoch": 0.88, + "learning_rate": 0.0001677034379609156, + "loss": 0.0161, "step": 340250 }, { - "epoch": 1.72, - "learning_rate": 4.250167750528477e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016769954974454418, + "loss": 0.0192, "step": 340260 }, { - "epoch": 1.72, - "learning_rate": 4.249410981227076e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.00016769566152817272, + "loss": 0.0125, "step": 340270 }, { - "epoch": 1.72, - "learning_rate": 4.2486542119256746e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016769177331180124, + "loss": 0.0142, "step": 340280 }, { - "epoch": 1.72, - "learning_rate": 4.247897442624274e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.00016768788509542975, + "loss": 0.0125, "step": 340290 }, { - "epoch": 1.72, - "learning_rate": 4.247140673322873e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016768399687905832, + "loss": 0.0126, "step": 340300 }, { - "epoch": 1.72, - "learning_rate": 4.246383904021472e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016768010866268686, + "loss": 0.0102, "step": 340310 }, { - "epoch": 1.72, - "learning_rate": 4.2456271347200705e-05, - "loss": 0.009, + "epoch": 0.88, + "learning_rate": 0.00016767622044631538, + "loss": 0.0128, "step": 340320 }, { - "epoch": 1.72, - "learning_rate": 4.24487036541867e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016767233222994392, + "loss": 0.0194, "step": 340330 }, { - "epoch": 1.72, - "learning_rate": 4.244113596117269e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016766844401357246, + "loss": 0.0162, "step": 340340 }, { - "epoch": 1.72, - "learning_rate": 4.243356826815868e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.000167664555797201, + "loss": 0.0135, "step": 340350 }, { - "epoch": 1.72, - "learning_rate": 4.2426000575144665e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016766066758082951, + "loss": 0.016, "step": 340360 }, { - "epoch": 1.72, - "learning_rate": 4.241843288213066e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016765677936445806, + "loss": 0.0121, "step": 340370 }, { - "epoch": 1.72, - "learning_rate": 4.241086518911665e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.0001676528911480866, + "loss": 0.0127, "step": 340380 }, { - "epoch": 1.72, - "learning_rate": 4.2403297496102636e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016764900293171514, + "loss": 0.0129, "step": 340390 }, { - "epoch": 1.72, - "learning_rate": 4.2395729803088625e-05, - "loss": 0.0073, + "epoch": 0.88, + "learning_rate": 0.00016764511471534365, + "loss": 0.0128, "step": 340400 }, { - "epoch": 1.72, - "learning_rate": 4.238816211007462e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.0001676412264989722, + "loss": 0.0102, "step": 340410 }, { - "epoch": 1.72, - "learning_rate": 4.238059441706061e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.0001676373382826007, + "loss": 0.0095, "step": 340420 }, { - "epoch": 1.72, - "learning_rate": 4.2373026724046596e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016763345006622928, + "loss": 0.0123, "step": 340430 }, { - "epoch": 1.72, - "learning_rate": 4.2365459031032584e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016762956184985782, + "loss": 0.0109, "step": 340440 }, { - "epoch": 1.72, - "learning_rate": 4.235789133801858e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016762567363348634, + "loss": 0.0127, "step": 340450 }, { - "epoch": 1.72, - "learning_rate": 4.235032364500456e-05, - "loss": 0.0092, + "epoch": 0.88, + "learning_rate": 0.00016762178541711485, + "loss": 0.0108, "step": 340460 }, { - "epoch": 1.72, - "learning_rate": 4.234275595199055e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016761789720074342, + "loss": 0.0093, "step": 340470 }, { - "epoch": 1.72, - "learning_rate": 4.233518825897654e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016761400898437196, + "loss": 0.0131, "step": 340480 }, { - "epoch": 1.72, - "learning_rate": 4.2327620565962525e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016761012076800047, + "loss": 0.0119, "step": 340490 }, { - "epoch": 1.72, - "learning_rate": 4.232005287294852e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016760623255162902, + "loss": 0.0135, "step": 340500 }, { - "epoch": 1.72, - "learning_rate": 4.231248517993451e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.00016760234433525756, + "loss": 0.0154, "step": 340510 }, { - "epoch": 1.72, - "learning_rate": 4.23049174869205e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.0001675984561188861, + "loss": 0.0131, "step": 340520 }, { - "epoch": 1.72, - "learning_rate": 4.2297349793906485e-05, - "loss": 0.0049, + "epoch": 0.88, + "learning_rate": 0.00016759456790251461, + "loss": 0.0174, "step": 340530 }, { - "epoch": 1.72, - "learning_rate": 4.228978210089248e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016759067968614316, + "loss": 0.0139, "step": 340540 }, { - "epoch": 1.72, - "learning_rate": 4.228221440787847e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.0001675867914697717, + "loss": 0.0132, "step": 340550 }, { - "epoch": 1.72, - "learning_rate": 4.2274646714864456e-05, - "loss": 0.0096, + "epoch": 0.88, + "learning_rate": 0.00016758290325340024, + "loss": 0.0132, "step": 340560 }, { - "epoch": 1.72, - "learning_rate": 4.2267079021850445e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016757901503702875, + "loss": 0.0117, "step": 340570 }, { - "epoch": 1.72, - "learning_rate": 4.225951132883644e-05, - "loss": 0.0084, + "epoch": 0.88, + "learning_rate": 0.0001675751268206573, + "loss": 0.0138, "step": 340580 }, { - "epoch": 1.72, - "learning_rate": 4.225194363582243e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016757123860428586, + "loss": 0.0165, "step": 340590 }, { - "epoch": 1.72, - "learning_rate": 4.2244375942808416e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.00016756735038791438, + "loss": 0.0148, "step": 340600 }, { - "epoch": 1.72, - "learning_rate": 4.2236808249794404e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.0001675634621715429, + "loss": 0.0164, "step": 340610 }, { - "epoch": 1.72, - "learning_rate": 4.22292405567804e-05, - "loss": 0.0078, + "epoch": 0.88, + "learning_rate": 0.00016755957395517143, + "loss": 0.014, "step": 340620 }, { - "epoch": 1.72, - "learning_rate": 4.222167286376639e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.0001675556857388, + "loss": 0.0123, "step": 340630 }, { - "epoch": 1.72, - "learning_rate": 4.2214105170752376e-05, - "loss": 0.0128, + "epoch": 0.88, + "learning_rate": 0.00016755179752242852, + "loss": 0.014, "step": 340640 }, { - "epoch": 1.72, - "learning_rate": 4.2206537477738364e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016754790930605706, + "loss": 0.0105, "step": 340650 }, { - "epoch": 1.72, - "learning_rate": 4.219896978472436e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016754402108968557, + "loss": 0.0137, "step": 340660 }, { - "epoch": 1.72, - "learning_rate": 4.219140209171035e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016754013287331412, + "loss": 0.0141, "step": 340670 }, { - "epoch": 1.72, - "learning_rate": 4.2183834398696335e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016753624465694266, + "loss": 0.011, "step": 340680 }, { - "epoch": 1.72, - "learning_rate": 4.2176266705682324e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.0001675323564405712, + "loss": 0.011, "step": 340690 }, { - "epoch": 1.72, - "learning_rate": 4.216869901266832e-05, - "loss": 0.0078, + "epoch": 0.88, + "learning_rate": 0.00016752846822419971, + "loss": 0.0161, "step": 340700 }, { - "epoch": 1.72, - "learning_rate": 4.216113131965431e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.00016752458000782826, + "loss": 0.013, "step": 340710 }, { - "epoch": 1.72, - "learning_rate": 4.2153563626640295e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.0001675206917914568, + "loss": 0.0136, "step": 340720 }, { - "epoch": 1.72, - "learning_rate": 4.214599593362628e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016751680357508534, + "loss": 0.0128, "step": 340730 }, { - "epoch": 1.72, - "learning_rate": 4.213842824061228e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016751291535871385, + "loss": 0.0148, "step": 340740 }, { - "epoch": 1.72, - "learning_rate": 4.2130860547598266e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.0001675090271423424, + "loss": 0.0117, "step": 340750 }, { - "epoch": 1.72, - "learning_rate": 4.2123292854584255e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016750513892597094, + "loss": 0.016, "step": 340760 }, { - "epoch": 1.72, - "learning_rate": 4.211572516157025e-05, - "loss": 0.0065, + "epoch": 0.88, + "learning_rate": 0.00016750125070959948, + "loss": 0.0173, "step": 340770 }, { - "epoch": 1.72, - "learning_rate": 4.210815746855623e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.000167497362493228, + "loss": 0.0119, "step": 340780 }, { - "epoch": 1.72, - "learning_rate": 4.210058977554222e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.00016749347427685653, + "loss": 0.0142, "step": 340790 }, { - "epoch": 1.72, - "learning_rate": 4.209302208252821e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.0001674895860604851, + "loss": 0.0191, "step": 340800 }, { - "epoch": 1.72, - "learning_rate": 4.2085454389514196e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016748569784411362, + "loss": 0.0115, "step": 340810 }, { - "epoch": 1.72, - "learning_rate": 4.207788669650019e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016748180962774216, + "loss": 0.0136, "step": 340820 }, { - "epoch": 1.72, - "learning_rate": 4.207031900348618e-05, - "loss": 0.0097, + "epoch": 0.88, + "learning_rate": 0.00016747792141137067, + "loss": 0.0126, "step": 340830 }, { - "epoch": 1.72, - "learning_rate": 4.206275131047217e-05, - "loss": 0.0082, + "epoch": 0.88, + "learning_rate": 0.00016747403319499924, + "loss": 0.0148, "step": 340840 }, { - "epoch": 1.72, - "learning_rate": 4.2055183617458155e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016747014497862776, + "loss": 0.0132, "step": 340850 }, { - "epoch": 1.72, - "learning_rate": 4.204761592444415e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.0001674662567622563, + "loss": 0.0107, "step": 340860 }, { - "epoch": 1.72, - "learning_rate": 4.204004823143014e-05, - "loss": 0.0086, + "epoch": 0.88, + "learning_rate": 0.0001674623685458848, + "loss": 0.0155, "step": 340870 }, { - "epoch": 1.72, - "learning_rate": 4.203248053841613e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016745848032951338, + "loss": 0.0147, "step": 340880 }, { - "epoch": 1.72, - "learning_rate": 4.2024912845402115e-05, - "loss": 0.0048, + "epoch": 0.88, + "learning_rate": 0.0001674545921131419, + "loss": 0.0156, "step": 340890 }, { - "epoch": 1.72, - "learning_rate": 4.201734515238811e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016745070389677044, + "loss": 0.0136, "step": 340900 }, { - "epoch": 1.72, - "learning_rate": 4.20097774593741e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016744681568039895, + "loss": 0.011, "step": 340910 }, { - "epoch": 1.72, - "learning_rate": 4.2002209766360086e-05, - "loss": 0.0048, + "epoch": 0.88, + "learning_rate": 0.0001674429274640275, + "loss": 0.0162, "step": 340920 }, { - "epoch": 1.72, - "learning_rate": 4.1994642073346075e-05, - "loss": 0.0056, + "epoch": 0.88, + "learning_rate": 0.00016743903924765604, + "loss": 0.012, "step": 340930 }, { - "epoch": 1.72, - "learning_rate": 4.198707438033207e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.00016743515103128458, + "loss": 0.0107, "step": 340940 }, { - "epoch": 1.72, - "learning_rate": 4.197950668731806e-05, - "loss": 0.0076, + "epoch": 0.88, + "learning_rate": 0.0001674312628149131, + "loss": 0.014, "step": 340950 }, { - "epoch": 1.72, - "learning_rate": 4.1971938994304046e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016742737459854163, + "loss": 0.0131, "step": 340960 }, { - "epoch": 1.72, - "learning_rate": 4.1964371301290034e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.0001674234863821702, + "loss": 0.0127, "step": 340970 }, { - "epoch": 1.72, - "learning_rate": 4.195680360827603e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.00016741959816579872, + "loss": 0.0146, "step": 340980 }, { - "epoch": 1.72, - "learning_rate": 4.194923591526202e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016741570994942726, + "loss": 0.0129, "step": 340990 }, { - "epoch": 1.72, - "learning_rate": 4.1941668222248006e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016741182173305577, + "loss": 0.0123, "step": 341000 }, { - "epoch": 1.72, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.00470845028758049, - "eval_runtime": 116.8214, - "eval_samples_per_second": 17.12, - "eval_steps_per_second": 4.28, + "epoch": 0.88, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.008974668569862843, + "eval_runtime": 107.5548, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, "step": 341000 }, { - "epoch": 1.72, - "learning_rate": 4.1934100529233994e-05, - "loss": 0.0051, + "epoch": 0.88, + "learning_rate": 0.00016740793351668434, + "loss": 0.0118, "step": 341010 }, { - "epoch": 1.72, - "learning_rate": 4.192653283621999e-05, - "loss": 0.0075, + "epoch": 0.88, + "learning_rate": 0.00016740404530031286, + "loss": 0.0127, "step": 341020 }, { - "epoch": 1.72, - "learning_rate": 4.191896514320598e-05, - "loss": 0.0072, + "epoch": 0.88, + "learning_rate": 0.0001674001570839414, + "loss": 0.016, "step": 341030 }, { - "epoch": 1.72, - "learning_rate": 4.1911397450191965e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.0001673962688675699, + "loss": 0.0158, "step": 341040 }, { - "epoch": 1.72, - "learning_rate": 4.1903829757177954e-05, - "loss": 0.0043, + "epoch": 0.88, + "learning_rate": 0.00016739238065119848, + "loss": 0.0118, "step": 341050 }, { - "epoch": 1.72, - "learning_rate": 4.189626206416395e-05, - "loss": 0.0071, + "epoch": 0.88, + "learning_rate": 0.000167388492434827, + "loss": 0.0117, "step": 341060 }, { - "epoch": 1.72, - "learning_rate": 4.188869437114994e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.00016738460421845554, + "loss": 0.0131, "step": 341070 }, { - "epoch": 1.72, - "learning_rate": 4.1881126678135925e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016738071600208405, + "loss": 0.0138, "step": 341080 }, { - "epoch": 1.72, - "learning_rate": 4.1873558985121906e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016737682778571262, + "loss": 0.0142, "step": 341090 }, { - "epoch": 1.72, - "learning_rate": 4.1865991292107895e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.00016737293956934114, + "loss": 0.0137, "step": 341100 }, { - "epoch": 1.72, - "learning_rate": 4.185842359909389e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.00016736905135296968, + "loss": 0.0156, "step": 341110 }, { - "epoch": 1.72, - "learning_rate": 4.185085590607988e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.0001673651631365982, + "loss": 0.014, "step": 341120 }, { - "epoch": 1.72, - "learning_rate": 4.1843288213065866e-05, - "loss": 0.0063, + "epoch": 0.88, + "learning_rate": 0.00016736127492022676, + "loss": 0.0131, "step": 341130 }, { - "epoch": 1.72, - "learning_rate": 4.1835720520051854e-05, - "loss": 0.0068, + "epoch": 0.88, + "learning_rate": 0.0001673573867038553, + "loss": 0.0148, "step": 341140 }, { - "epoch": 1.72, - "learning_rate": 4.182815282703785e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016735349848748382, + "loss": 0.0136, "step": 341150 }, { - "epoch": 1.72, - "learning_rate": 4.182058513402384e-05, - "loss": 0.0113, + "epoch": 0.88, + "learning_rate": 0.00016734961027111233, + "loss": 0.0134, "step": 341160 }, { - "epoch": 1.72, - "learning_rate": 4.1813017441009826e-05, - "loss": 0.0062, + "epoch": 0.88, + "learning_rate": 0.00016734572205474087, + "loss": 0.0115, "step": 341170 }, { - "epoch": 1.72, - "learning_rate": 4.1805449747995814e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.00016734183383836944, + "loss": 0.0128, "step": 341180 }, { - "epoch": 1.72, - "learning_rate": 4.179788205498181e-05, - "loss": 0.0057, + "epoch": 0.88, + "learning_rate": 0.00016733794562199796, + "loss": 0.0136, "step": 341190 }, { - "epoch": 1.72, - "learning_rate": 4.17903143619678e-05, - "loss": 0.007, + "epoch": 0.88, + "learning_rate": 0.0001673340574056265, + "loss": 0.0127, "step": 341200 }, { - "epoch": 1.72, - "learning_rate": 4.1782746668953785e-05, - "loss": 0.0044, + "epoch": 0.88, + "learning_rate": 0.000167330169189255, + "loss": 0.0115, "step": 341210 }, { - "epoch": 1.72, - "learning_rate": 4.1775178975939774e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016732628097288358, + "loss": 0.0161, "step": 341220 }, { - "epoch": 1.72, - "learning_rate": 4.176761128292577e-05, - "loss": 0.0066, + "epoch": 0.88, + "learning_rate": 0.0001673223927565121, + "loss": 0.0141, "step": 341230 }, { - "epoch": 1.72, - "learning_rate": 4.176004358991176e-05, - "loss": 0.0058, + "epoch": 0.88, + "learning_rate": 0.00016731850454014064, + "loss": 0.0151, "step": 341240 }, { - "epoch": 1.72, - "learning_rate": 4.1752475896897745e-05, - "loss": 0.006, + "epoch": 0.88, + "learning_rate": 0.00016731461632376915, + "loss": 0.0119, "step": 341250 }, { - "epoch": 1.72, - "learning_rate": 4.174490820388374e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016731072810739772, + "loss": 0.0166, "step": 341260 }, { - "epoch": 1.72, - "learning_rate": 4.173734051086973e-05, - "loss": 0.0061, + "epoch": 0.88, + "learning_rate": 0.00016730683989102623, + "loss": 0.0127, "step": 341270 }, { - "epoch": 1.72, - "learning_rate": 4.1729772817855717e-05, - "loss": 0.0052, + "epoch": 0.88, + "learning_rate": 0.00016730295167465478, + "loss": 0.0129, "step": 341280 }, { - "epoch": 1.72, - "learning_rate": 4.1722205124841705e-05, - "loss": 0.005, + "epoch": 0.88, + "learning_rate": 0.0001672990634582833, + "loss": 0.0142, "step": 341290 }, { - "epoch": 1.72, - "learning_rate": 4.17146374318277e-05, - "loss": 0.008, + "epoch": 0.88, + "learning_rate": 0.00016729517524191186, + "loss": 0.0127, "step": 341300 }, { - "epoch": 1.72, - "learning_rate": 4.170706973881369e-05, - "loss": 0.0053, + "epoch": 0.88, + "learning_rate": 0.0001672912870255404, + "loss": 0.0134, "step": 341310 }, { - "epoch": 1.72, - "learning_rate": 4.1699502045799676e-05, - "loss": 0.0055, + "epoch": 0.88, + "learning_rate": 0.00016728739880916892, + "loss": 0.0099, "step": 341320 }, { - "epoch": 1.72, - "learning_rate": 4.1691934352785664e-05, - "loss": 0.0079, + "epoch": 0.88, + "learning_rate": 0.00016728351059279743, + "loss": 0.0123, "step": 341330 }, { - "epoch": 1.72, - "learning_rate": 4.168436665977166e-05, - "loss": 0.0067, + "epoch": 0.88, + "learning_rate": 0.000167279622376426, + "loss": 0.0138, "step": 341340 }, { - "epoch": 1.72, - "learning_rate": 4.167679896675765e-05, - "loss": 0.0054, + "epoch": 0.88, + "learning_rate": 0.00016727573416005454, + "loss": 0.0128, "step": 341350 }, { - "epoch": 1.72, - "learning_rate": 4.1669231273743636e-05, - "loss": 0.0045, + "epoch": 0.88, + "learning_rate": 0.00016727184594368306, + "loss": 0.0115, "step": 341360 }, { - "epoch": 1.72, - "learning_rate": 4.1661663580729624e-05, - "loss": 0.0064, + "epoch": 0.88, + "learning_rate": 0.0001672679577273116, + "loss": 0.0126, "step": 341370 }, { - "epoch": 1.72, - "learning_rate": 4.165409588771562e-05, - "loss": 0.0085, + "epoch": 0.88, + "learning_rate": 0.00016726406951094014, + "loss": 0.0136, "step": 341380 }, { - "epoch": 1.72, - "learning_rate": 4.164652819470161e-05, - "loss": 0.0081, + "epoch": 0.88, + "learning_rate": 0.00016726018129456868, + "loss": 0.0136, "step": 341390 }, { - "epoch": 1.72, - "learning_rate": 4.1638960501687595e-05, - "loss": 0.0069, + "epoch": 0.88, + "learning_rate": 0.0001672562930781972, + "loss": 0.0134, "step": 341400 }, { - "epoch": 1.72, - "learning_rate": 4.163139280867358e-05, - "loss": 0.0059, + "epoch": 0.88, + "learning_rate": 0.00016725240486182574, + "loss": 0.0121, "step": 341410 }, { - "epoch": 1.72, - "learning_rate": 4.1623825115659565e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016724851664545425, + "loss": 0.0161, "step": 341420 }, { - "epoch": 1.72, - "learning_rate": 4.161625742264556e-05, - "loss": 0.0084, + "epoch": 0.89, + "learning_rate": 0.00016724462842908282, + "loss": 0.013, "step": 341430 }, { - "epoch": 1.72, - "learning_rate": 4.160868972963155e-05, - "loss": 0.0103, + "epoch": 0.89, + "learning_rate": 0.00016724074021271133, + "loss": 0.0121, "step": 341440 }, { - "epoch": 1.72, - "learning_rate": 4.1601122036617537e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016723685199633988, + "loss": 0.0156, "step": 341450 }, { - "epoch": 1.72, - "learning_rate": 4.1593554343603525e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.0001672329637799684, + "loss": 0.0139, "step": 341460 }, { - "epoch": 1.72, - "learning_rate": 4.158598665058952e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016722907556359696, + "loss": 0.0136, "step": 341470 }, { - "epoch": 1.72, - "learning_rate": 4.157841895757551e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016722518734722547, + "loss": 0.0151, "step": 341480 }, { - "epoch": 1.72, - "learning_rate": 4.1570851264561496e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016722129913085402, + "loss": 0.0135, "step": 341490 }, { - "epoch": 1.72, - "learning_rate": 4.1563283571547484e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016721741091448253, + "loss": 0.0112, "step": 341500 }, { - "epoch": 1.72, - "learning_rate": 4.155571587853348e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.0001672135226981111, + "loss": 0.0129, "step": 341510 }, { - "epoch": 1.72, - "learning_rate": 4.154814818551947e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016720963448173964, + "loss": 0.0108, "step": 341520 }, { - "epoch": 1.72, - "learning_rate": 4.1540580492505456e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016720574626536815, + "loss": 0.0137, "step": 341530 }, { - "epoch": 1.72, - "learning_rate": 4.1533012799491444e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.0001672018580489967, + "loss": 0.0122, "step": 341540 }, { - "epoch": 1.72, - "learning_rate": 4.152544510647744e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016719796983262524, + "loss": 0.0138, "step": 341550 }, { - "epoch": 1.72, - "learning_rate": 4.151787741346343e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016719408161625378, + "loss": 0.0118, "step": 341560 }, { - "epoch": 1.72, - "learning_rate": 4.1510309720449416e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.0001671901933998823, + "loss": 0.013, "step": 341570 }, { - "epoch": 1.72, - "learning_rate": 4.1502742027435404e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016718630518351084, + "loss": 0.0131, "step": 341580 }, { - "epoch": 1.72, - "learning_rate": 4.14951743344214e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016718241696713938, + "loss": 0.0127, "step": 341590 }, { - "epoch": 1.72, - "learning_rate": 4.148760664140739e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016717852875076792, + "loss": 0.013, "step": 341600 }, { - "epoch": 1.72, - "learning_rate": 4.1480038948393375e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016717464053439643, + "loss": 0.0122, "step": 341610 }, { - "epoch": 1.72, - "learning_rate": 4.1472471255379363e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.00016717075231802498, + "loss": 0.0115, "step": 341620 }, { - "epoch": 1.72, - "learning_rate": 4.146490356236536e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016716686410165352, + "loss": 0.0112, "step": 341630 }, { - "epoch": 1.72, - "learning_rate": 4.1457335869351347e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016716297588528206, + "loss": 0.0114, "step": 341640 }, { - "epoch": 1.72, - "learning_rate": 4.1449768176337335e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016715908766891057, + "loss": 0.0142, "step": 341650 }, { - "epoch": 1.72, - "learning_rate": 4.144220048332332e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.00016715519945253911, + "loss": 0.0132, "step": 341660 }, { - "epoch": 1.72, - "learning_rate": 4.143463279030932e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016715131123616763, + "loss": 0.0159, "step": 341670 }, { - "epoch": 1.72, - "learning_rate": 4.1427065097295306e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.0001671474230197962, + "loss": 0.0133, "step": 341680 }, { - "epoch": 1.72, - "learning_rate": 4.1419497404281294e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.00016714353480342474, + "loss": 0.0125, "step": 341690 }, { - "epoch": 1.72, - "learning_rate": 4.141192971126728e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016713964658705325, + "loss": 0.0172, "step": 341700 }, { - "epoch": 1.72, - "learning_rate": 4.140436201825328e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001671357583706818, + "loss": 0.0124, "step": 341710 }, { - "epoch": 1.72, - "learning_rate": 4.139679432523926e-05, - "loss": 0.0105, + "epoch": 0.89, + "learning_rate": 0.00016713187015431034, + "loss": 0.0143, "step": 341720 }, { - "epoch": 1.72, - "learning_rate": 4.138922663222525e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016712798193793888, + "loss": 0.0119, "step": 341730 }, { - "epoch": 1.72, - "learning_rate": 4.1381658939211236e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.0001671240937215674, + "loss": 0.0107, "step": 341740 }, { - "epoch": 1.72, - "learning_rate": 4.137409124619723e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016712020550519594, + "loss": 0.0126, "step": 341750 }, { - "epoch": 1.72, - "learning_rate": 4.136652355318322e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016711631728882448, + "loss": 0.0111, "step": 341760 }, { - "epoch": 1.72, - "learning_rate": 4.135895586016921e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016711242907245302, + "loss": 0.0113, "step": 341770 }, { - "epoch": 1.72, - "learning_rate": 4.1351388167155195e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016710854085608153, + "loss": 0.0136, "step": 341780 }, { - "epoch": 1.72, - "learning_rate": 4.134382047414119e-05, - "loss": 0.0088, + "epoch": 0.89, + "learning_rate": 0.00016710465263971007, + "loss": 0.0163, "step": 341790 }, { - "epoch": 1.72, - "learning_rate": 4.133625278112718e-05, - "loss": 0.0043, + "epoch": 0.89, + "learning_rate": 0.00016710076442333862, + "loss": 0.0141, "step": 341800 }, { - "epoch": 1.72, - "learning_rate": 4.132868508811317e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016709687620696716, + "loss": 0.016, "step": 341810 }, { - "epoch": 1.72, - "learning_rate": 4.1321117395099155e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016709298799059567, + "loss": 0.012, "step": 341820 }, { - "epoch": 1.72, - "learning_rate": 4.131354970208515e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016708909977422421, + "loss": 0.0155, "step": 341830 }, { - "epoch": 1.72, - "learning_rate": 4.130598200907114e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016708521155785278, + "loss": 0.013, "step": 341840 }, { - "epoch": 1.72, - "learning_rate": 4.1298414316057126e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.0001670813233414813, + "loss": 0.0161, "step": 341850 }, { - "epoch": 1.72, - "learning_rate": 4.1290846623043115e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016707743512510984, + "loss": 0.0122, "step": 341860 }, { - "epoch": 1.72, - "learning_rate": 4.128327893002911e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016707354690873835, + "loss": 0.0152, "step": 341870 }, { - "epoch": 1.72, - "learning_rate": 4.12757112370151e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016706965869236692, + "loss": 0.012, "step": 341880 }, { - "epoch": 1.72, - "learning_rate": 4.1268143544001086e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.00016706577047599544, + "loss": 0.014, "step": 341890 }, { - "epoch": 1.72, - "learning_rate": 4.1260575850987074e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016706188225962398, + "loss": 0.0113, "step": 341900 }, { - "epoch": 1.72, - "learning_rate": 4.125300815797307e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.0001670579940432525, + "loss": 0.0122, "step": 341910 }, { - "epoch": 1.73, - "learning_rate": 4.124544046495906e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016705410582688103, + "loss": 0.0114, "step": 341920 }, { - "epoch": 1.73, - "learning_rate": 4.1237872771945046e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016705021761050958, + "loss": 0.0144, "step": 341930 }, { - "epoch": 1.73, - "learning_rate": 4.1230305078931034e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.00016704632939413812, + "loss": 0.0178, "step": 341940 }, { - "epoch": 1.73, - "learning_rate": 4.122273738591703e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016704244117776663, + "loss": 0.0128, "step": 341950 }, { - "epoch": 1.73, - "learning_rate": 4.121516969290302e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016703855296139517, + "loss": 0.0138, "step": 341960 }, { - "epoch": 1.73, - "learning_rate": 4.1207601999889005e-05, - "loss": 0.0088, + "epoch": 0.89, + "learning_rate": 0.00016703466474502372, + "loss": 0.0122, "step": 341970 }, { - "epoch": 1.73, - "learning_rate": 4.1200034306874993e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016703077652865226, + "loss": 0.0133, "step": 341980 }, { - "epoch": 1.73, - "learning_rate": 4.119246661386099e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016702688831228077, + "loss": 0.0149, "step": 341990 }, { - "epoch": 1.73, - "learning_rate": 4.118489892084698e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.0001670230000959093, + "loss": 0.0081, "step": 342000 }, { - "epoch": 1.73, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004726854152977467, - "eval_runtime": 116.8239, - "eval_samples_per_second": 17.12, - "eval_steps_per_second": 4.28, + "epoch": 0.89, + "eval_cer": 0.8817460750681273, + "eval_loss": 0.009189891628921032, + "eval_runtime": 107.711, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, "step": 342000 }, { - "epoch": 1.73, - "learning_rate": 4.1177331227832965e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016701911187953788, + "loss": 0.0144, "step": 342010 }, { - "epoch": 1.73, - "learning_rate": 4.116976353481895e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.0001670152236631664, + "loss": 0.0166, "step": 342020 }, { - "epoch": 1.73, - "learning_rate": 4.116219584180495e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.00016701133544679494, + "loss": 0.0131, "step": 342030 }, { - "epoch": 1.73, - "learning_rate": 4.115462814879093e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016700744723042345, + "loss": 0.011, "step": 342040 }, { - "epoch": 1.73, - "learning_rate": 4.114706045577692e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016700355901405202, + "loss": 0.0102, "step": 342050 }, { - "epoch": 1.73, - "learning_rate": 4.1139492762762906e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016699967079768054, + "loss": 0.0101, "step": 342060 }, { - "epoch": 1.73, - "learning_rate": 4.1131925069748894e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016699578258130908, + "loss": 0.0155, "step": 342070 }, { - "epoch": 1.73, - "learning_rate": 4.112435737673489e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.0001669918943649376, + "loss": 0.0123, "step": 342080 }, { - "epoch": 1.73, - "learning_rate": 4.111678968372088e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016698800614856616, + "loss": 0.0113, "step": 342090 }, { - "epoch": 1.73, - "learning_rate": 4.1109221990706866e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016698411793219468, + "loss": 0.0123, "step": 342100 }, { - "epoch": 1.73, - "learning_rate": 4.1101654297692854e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016698022971582322, + "loss": 0.0125, "step": 342110 }, { - "epoch": 1.73, - "learning_rate": 4.109408660467885e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016697634149945173, + "loss": 0.0108, "step": 342120 }, { - "epoch": 1.73, - "learning_rate": 4.108651891166484e-05, - "loss": 0.0045, + "epoch": 0.89, + "learning_rate": 0.0001669724532830803, + "loss": 0.0156, "step": 342130 }, { - "epoch": 1.73, - "learning_rate": 4.1078951218650825e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016696856506670882, + "loss": 0.0122, "step": 342140 }, { - "epoch": 1.73, - "learning_rate": 4.1071383525636814e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016696467685033736, + "loss": 0.0146, "step": 342150 }, { - "epoch": 1.73, - "learning_rate": 4.106381583262281e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016696078863396587, + "loss": 0.0134, "step": 342160 }, { - "epoch": 1.73, - "learning_rate": 4.10562481396088e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001669569004175944, + "loss": 0.0173, "step": 342170 }, { - "epoch": 1.73, - "learning_rate": 4.1048680446594785e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016695301220122298, + "loss": 0.0162, "step": 342180 }, { - "epoch": 1.73, - "learning_rate": 4.104111275358077e-05, - "loss": 0.0098, + "epoch": 0.89, + "learning_rate": 0.0001669491239848515, + "loss": 0.0183, "step": 342190 }, { - "epoch": 1.73, - "learning_rate": 4.103354506056677e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016694523576848, + "loss": 0.0132, "step": 342200 }, { - "epoch": 1.73, - "learning_rate": 4.1025977367552756e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016694134755210855, + "loss": 0.0133, "step": 342210 }, { - "epoch": 1.73, - "learning_rate": 4.1018409674538745e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.00016693745933573712, + "loss": 0.0129, "step": 342220 }, { - "epoch": 1.73, - "learning_rate": 4.101084198152474e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016693357111936564, + "loss": 0.0158, "step": 342230 }, { - "epoch": 1.73, - "learning_rate": 4.100327428851073e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016692968290299418, + "loss": 0.0148, "step": 342240 }, { - "epoch": 1.73, - "learning_rate": 4.0995706595496716e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.0001669257946866227, + "loss": 0.0172, "step": 342250 }, { - "epoch": 1.73, - "learning_rate": 4.0988138902482704e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016692190647025126, + "loss": 0.0175, "step": 342260 }, { - "epoch": 1.73, - "learning_rate": 4.09805712094687e-05, - "loss": 0.0084, + "epoch": 0.89, + "learning_rate": 0.00016691801825387978, + "loss": 0.0118, "step": 342270 }, { - "epoch": 1.73, - "learning_rate": 4.097300351645469e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016691413003750832, + "loss": 0.0102, "step": 342280 }, { - "epoch": 1.73, - "learning_rate": 4.0965435823440676e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016691024182113683, + "loss": 0.0136, "step": 342290 }, { - "epoch": 1.73, - "learning_rate": 4.0957868130426664e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.0001669063536047654, + "loss": 0.0132, "step": 342300 }, { - "epoch": 1.73, - "learning_rate": 4.095030043741266e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016690246538839391, + "loss": 0.0131, "step": 342310 }, { - "epoch": 1.73, - "learning_rate": 4.094273274439865e-05, - "loss": 0.0089, + "epoch": 0.89, + "learning_rate": 0.00016689857717202246, + "loss": 0.0132, "step": 342320 }, { - "epoch": 1.73, - "learning_rate": 4.0935165051384635e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016689468895565097, + "loss": 0.0139, "step": 342330 }, { - "epoch": 1.73, - "learning_rate": 4.0927597358370624e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016689080073927954, + "loss": 0.0142, "step": 342340 }, { - "epoch": 1.73, - "learning_rate": 4.0920029665356605e-05, - "loss": 0.0095, + "epoch": 0.89, + "learning_rate": 0.00016688691252290805, + "loss": 0.015, "step": 342350 }, { - "epoch": 1.73, - "learning_rate": 4.09124619723426e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001668830243065366, + "loss": 0.0122, "step": 342360 }, { - "epoch": 1.73, - "learning_rate": 4.090489427932859e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.0001668791360901651, + "loss": 0.0131, "step": 342370 }, { - "epoch": 1.73, - "learning_rate": 4.0897326586314576e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016687524787379368, + "loss": 0.0146, "step": 342380 }, { - "epoch": 1.73, - "learning_rate": 4.0889758893300565e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016687135965742222, + "loss": 0.0142, "step": 342390 }, { - "epoch": 1.73, - "learning_rate": 4.088219120028656e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016686747144105074, + "loss": 0.0123, "step": 342400 }, { - "epoch": 1.73, - "learning_rate": 4.087462350727255e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016686358322467928, + "loss": 0.0158, "step": 342410 }, { - "epoch": 1.73, - "learning_rate": 4.0867055814258536e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.0001668596950083078, + "loss": 0.0197, "step": 342420 }, { - "epoch": 1.73, - "learning_rate": 4.0859488121244524e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016685580679193636, + "loss": 0.0134, "step": 342430 }, { - "epoch": 1.73, - "learning_rate": 4.085192042823052e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016685191857556487, + "loss": 0.0137, "step": 342440 }, { - "epoch": 1.73, - "learning_rate": 4.084435273521651e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016684803035919342, + "loss": 0.0164, "step": 342450 }, { - "epoch": 1.73, - "learning_rate": 4.0836785042202496e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016684414214282193, + "loss": 0.0123, "step": 342460 }, { - "epoch": 1.73, - "learning_rate": 4.0829217349188484e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.0001668402539264505, + "loss": 0.0144, "step": 342470 }, { - "epoch": 1.73, - "learning_rate": 4.082164965617448e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016683636571007901, + "loss": 0.0118, "step": 342480 }, { - "epoch": 1.73, - "learning_rate": 4.081408196316047e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016683247749370756, + "loss": 0.0159, "step": 342490 }, { - "epoch": 1.73, - "learning_rate": 4.0806514270146455e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016682858927733607, + "loss": 0.0127, "step": 342500 }, { - "epoch": 1.73, - "learning_rate": 4.0798946577132444e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016682470106096464, + "loss": 0.0129, "step": 342510 }, { - "epoch": 1.73, - "learning_rate": 4.079137888411844e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016682081284459315, + "loss": 0.0152, "step": 342520 }, { - "epoch": 1.73, - "learning_rate": 4.078381119110443e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.0001668169246282217, + "loss": 0.0128, "step": 342530 }, { - "epoch": 1.73, - "learning_rate": 4.0776243498090415e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.0001668130364118502, + "loss": 0.0092, "step": 342540 }, { - "epoch": 1.73, - "learning_rate": 4.07686758050764e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016680914819547878, + "loss": 0.0122, "step": 342550 }, { - "epoch": 1.73, - "learning_rate": 4.07611081120624e-05, - "loss": 0.0103, + "epoch": 0.89, + "learning_rate": 0.00016680525997910732, + "loss": 0.0145, "step": 342560 }, { - "epoch": 1.73, - "learning_rate": 4.0753540419048386e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016680137176273583, + "loss": 0.0172, "step": 342570 }, { - "epoch": 1.73, - "learning_rate": 4.0745972726034375e-05, - "loss": 0.0115, + "epoch": 0.89, + "learning_rate": 0.00016679748354636438, + "loss": 0.0217, "step": 342580 }, { - "epoch": 1.73, - "learning_rate": 4.073840503302036e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016679359532999292, + "loss": 0.0114, "step": 342590 }, { - "epoch": 1.73, - "learning_rate": 4.073083734000636e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016678970711362146, + "loss": 0.0138, "step": 342600 }, { - "epoch": 1.73, - "learning_rate": 4.0723269646992346e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016678581889724997, + "loss": 0.0136, "step": 342610 }, { - "epoch": 1.73, - "learning_rate": 4.0715701953978334e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016678193068087852, + "loss": 0.0118, "step": 342620 }, { - "epoch": 1.73, - "learning_rate": 4.070813426096432e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016677804246450706, + "loss": 0.0156, "step": 342630 }, { - "epoch": 1.73, - "learning_rate": 4.070056656795032e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.0001667741542481356, + "loss": 0.0119, "step": 342640 }, { - "epoch": 1.73, - "learning_rate": 4.0692998874936306e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.0001667702660317641, + "loss": 0.0152, "step": 342650 }, { - "epoch": 1.73, - "learning_rate": 4.068543118192229e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016676637781539266, + "loss": 0.0161, "step": 342660 }, { - "epoch": 1.73, - "learning_rate": 4.0677863488908275e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016676248959902117, + "loss": 0.0119, "step": 342670 }, { - "epoch": 1.73, - "learning_rate": 4.067029579589427e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016675860138264974, + "loss": 0.0187, "step": 342680 }, { - "epoch": 1.73, - "learning_rate": 4.066272810288026e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016675471316627825, + "loss": 0.0139, "step": 342690 }, { - "epoch": 1.73, - "learning_rate": 4.065516040986625e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.0001667508249499068, + "loss": 0.0142, "step": 342700 }, { - "epoch": 1.73, - "learning_rate": 4.0647592716852235e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.0001667469367335353, + "loss": 0.0162, "step": 342710 }, { - "epoch": 1.73, - "learning_rate": 4.064002502383823e-05, - "loss": 0.009, + "epoch": 0.89, + "learning_rate": 0.00016674304851716388, + "loss": 0.0103, "step": 342720 }, { - "epoch": 1.73, - "learning_rate": 4.063245733082422e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016673916030079242, + "loss": 0.0113, "step": 342730 }, { - "epoch": 1.73, - "learning_rate": 4.0624889637810207e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016673527208442093, + "loss": 0.014, "step": 342740 }, { - "epoch": 1.73, - "learning_rate": 4.0617321944796195e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016673138386804945, + "loss": 0.0127, "step": 342750 }, { - "epoch": 1.73, - "learning_rate": 4.060975425178219e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016672749565167802, + "loss": 0.0125, "step": 342760 }, { - "epoch": 1.73, - "learning_rate": 4.060218655876818e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016672360743530656, + "loss": 0.015, "step": 342770 }, { - "epoch": 1.73, - "learning_rate": 4.0594618865754166e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.00016671971921893507, + "loss": 0.0122, "step": 342780 }, { - "epoch": 1.73, - "learning_rate": 4.0587051172740154e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016671583100256361, + "loss": 0.0184, "step": 342790 }, { - "epoch": 1.73, - "learning_rate": 4.057948347972615e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016671194278619216, + "loss": 0.0146, "step": 342800 }, { - "epoch": 1.73, - "learning_rate": 4.057191578671214e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001667080545698207, + "loss": 0.0142, "step": 342810 }, { - "epoch": 1.73, - "learning_rate": 4.0564348093698126e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.0001667041663534492, + "loss": 0.0133, "step": 342820 }, { - "epoch": 1.73, - "learning_rate": 4.0556780400684114e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016670027813707775, + "loss": 0.0117, "step": 342830 }, { - "epoch": 1.73, - "learning_rate": 4.054921270767011e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.0001666963899207063, + "loss": 0.015, "step": 342840 }, { - "epoch": 1.73, - "learning_rate": 4.05416450146561e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016669250170433484, + "loss": 0.0124, "step": 342850 }, { - "epoch": 1.73, - "learning_rate": 4.0534077321642085e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016668861348796335, + "loss": 0.0143, "step": 342860 }, { - "epoch": 1.73, - "learning_rate": 4.0526509628628074e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.0001666847252715919, + "loss": 0.0116, "step": 342870 }, { - "epoch": 1.73, - "learning_rate": 4.051894193561407e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016668083705522046, + "loss": 0.0129, "step": 342880 }, { - "epoch": 1.73, - "learning_rate": 4.051137424260006e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016667694883884898, + "loss": 0.0119, "step": 342890 }, { - "epoch": 1.73, - "learning_rate": 4.0503806549586045e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016667306062247752, + "loss": 0.0146, "step": 342900 }, { - "epoch": 1.73, - "learning_rate": 4.049623885657203e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016666917240610603, + "loss": 0.0182, "step": 342910 }, { - "epoch": 1.73, - "learning_rate": 4.048867116355803e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016666528418973455, + "loss": 0.0131, "step": 342920 }, { - "epoch": 1.73, - "learning_rate": 4.0481103470544017e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016666139597336312, + "loss": 0.0143, "step": 342930 }, { - "epoch": 1.73, - "learning_rate": 4.0473535777530005e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016665750775699166, + "loss": 0.0136, "step": 342940 }, { - "epoch": 1.73, - "learning_rate": 4.046596808451599e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016665361954062017, + "loss": 0.0146, "step": 342950 }, { - "epoch": 1.73, - "learning_rate": 4.045840039150199e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016664973132424871, + "loss": 0.0244, "step": 342960 }, { - "epoch": 1.73, - "learning_rate": 4.0450832698487976e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016664584310787726, + "loss": 0.0123, "step": 342970 }, { - "epoch": 1.73, - "learning_rate": 4.044326500547396e-05, - "loss": 0.0084, + "epoch": 0.89, + "learning_rate": 0.0001666419548915058, + "loss": 0.0138, "step": 342980 }, { - "epoch": 1.73, - "learning_rate": 4.0435697312459946e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001666380666751343, + "loss": 0.0117, "step": 342990 }, { - "epoch": 1.73, - "learning_rate": 4.0428129619445934e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.00016663417845876285, + "loss": 0.0133, "step": 343000 }, { - "epoch": 1.73, - "eval_cer": 0.9144333808503969, - "eval_loss": 0.00461353175342083, - "eval_runtime": 116.7176, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.89, + "eval_cer": 0.8817236808771804, + "eval_loss": 0.008914493024349213, + "eval_runtime": 107.4576, + "eval_samples_per_second": 18.612, + "eval_steps_per_second": 4.653, "step": 343000 }, { - "epoch": 1.73, - "learning_rate": 4.042056192643193e-05, - "loss": 0.0097, + "epoch": 0.89, + "learning_rate": 0.0001666302902423914, + "loss": 0.0131, "step": 343010 }, { - "epoch": 1.73, - "learning_rate": 4.041299423341792e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016662640202601994, + "loss": 0.0119, "step": 343020 }, { - "epoch": 1.73, - "learning_rate": 4.0405426540403906e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016662251380964845, + "loss": 0.0125, "step": 343030 }, { - "epoch": 1.73, - "learning_rate": 4.0397858847389894e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.000166618625593277, + "loss": 0.0132, "step": 343040 }, { - "epoch": 1.73, - "learning_rate": 4.039029115437589e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016661473737690556, + "loss": 0.0138, "step": 343050 }, { - "epoch": 1.73, - "learning_rate": 4.038272346136188e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016661084916053408, + "loss": 0.0157, "step": 343060 }, { - "epoch": 1.73, - "learning_rate": 4.0375155768347865e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.0001666069609441626, + "loss": 0.0111, "step": 343070 }, { - "epoch": 1.73, - "learning_rate": 4.0367588075333853e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016660307272779113, + "loss": 0.0123, "step": 343080 }, { - "epoch": 1.73, - "learning_rate": 4.036002038231985e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.0001665991845114197, + "loss": 0.0132, "step": 343090 }, { - "epoch": 1.73, - "learning_rate": 4.0352452689305837e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016659529629504822, + "loss": 0.0129, "step": 343100 }, { - "epoch": 1.73, - "learning_rate": 4.0344884996291825e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016659140807867676, + "loss": 0.0158, "step": 343110 }, { - "epoch": 1.73, - "learning_rate": 4.033731730327781e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016658751986230527, + "loss": 0.0149, "step": 343120 }, { - "epoch": 1.73, - "learning_rate": 4.032974961026381e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016658363164593384, + "loss": 0.0138, "step": 343130 }, { - "epoch": 1.73, - "learning_rate": 4.0322181917249796e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016657974342956236, + "loss": 0.0142, "step": 343140 }, { - "epoch": 1.73, - "learning_rate": 4.0314614224235784e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.0001665758552131909, + "loss": 0.0115, "step": 343150 }, { - "epoch": 1.73, - "learning_rate": 4.030704653122177e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.0001665719669968194, + "loss": 0.0123, "step": 343160 }, { - "epoch": 1.73, - "learning_rate": 4.029947883820777e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016656807878044795, + "loss": 0.0126, "step": 343170 }, { - "epoch": 1.73, - "learning_rate": 4.0291911145193756e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.0001665641905640765, + "loss": 0.0125, "step": 343180 }, { - "epoch": 1.73, - "learning_rate": 4.0284343452179744e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016656030234770504, + "loss": 0.0137, "step": 343190 }, { - "epoch": 1.73, - "learning_rate": 4.027677575916574e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.00016655641413133355, + "loss": 0.0146, "step": 343200 }, { - "epoch": 1.73, - "learning_rate": 4.026920806615173e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.0001665525259149621, + "loss": 0.0119, "step": 343210 }, { - "epoch": 1.73, - "learning_rate": 4.0261640373137716e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016654863769859063, + "loss": 0.0141, "step": 343220 }, { - "epoch": 1.73, - "learning_rate": 4.0254072680123704e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016654474948221918, + "loss": 0.0134, "step": 343230 }, { - "epoch": 1.73, - "learning_rate": 4.02465049871097e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.0001665408612658477, + "loss": 0.0162, "step": 343240 }, { - "epoch": 1.73, - "learning_rate": 4.023893729409569e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016653697304947623, + "loss": 0.0165, "step": 343250 }, { - "epoch": 1.73, - "learning_rate": 4.0231369601081675e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.0001665330848331048, + "loss": 0.013, "step": 343260 }, { - "epoch": 1.73, - "learning_rate": 4.0223801908067663e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016652919661673332, + "loss": 0.0117, "step": 343270 }, { - "epoch": 1.73, - "learning_rate": 4.021623421505366e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016652530840036186, + "loss": 0.0138, "step": 343280 }, { - "epoch": 1.73, - "learning_rate": 4.020866652203964e-05, - "loss": 0.0077, - "step": 343290 + "epoch": 0.89, + "learning_rate": 0.00016652142018399037, + "loss": 0.011, + "step": 343290 }, { - "epoch": 1.73, - "learning_rate": 4.020109882902563e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016651753196761894, + "loss": 0.0132, "step": 343300 }, { - "epoch": 1.73, - "learning_rate": 4.0193531136011616e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016651364375124745, + "loss": 0.0144, "step": 343310 }, { - "epoch": 1.73, - "learning_rate": 4.0185963442997605e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.000166509755534876, + "loss": 0.0126, "step": 343320 }, { - "epoch": 1.73, - "learning_rate": 4.01783957499836e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.0001665058673185045, + "loss": 0.0141, "step": 343330 }, { - "epoch": 1.73, - "learning_rate": 4.017082805696959e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016650197910213308, + "loss": 0.0154, "step": 343340 }, { - "epoch": 1.73, - "learning_rate": 4.0163260363955576e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.0001664980908857616, + "loss": 0.0129, "step": 343350 }, { - "epoch": 1.73, - "learning_rate": 4.0155692670941564e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016649420266939014, + "loss": 0.0155, "step": 343360 }, { - "epoch": 1.73, - "learning_rate": 4.014812497792756e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016649031445301865, + "loss": 0.0124, "step": 343370 }, { - "epoch": 1.73, - "learning_rate": 4.014055728491355e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.0001664864262366472, + "loss": 0.0192, "step": 343380 }, { - "epoch": 1.73, - "learning_rate": 4.0132989591899536e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016648253802027573, + "loss": 0.0142, "step": 343390 }, { - "epoch": 1.73, - "learning_rate": 4.0125421898885524e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016647864980390428, + "loss": 0.0151, "step": 343400 }, { - "epoch": 1.73, - "learning_rate": 4.011785420587152e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.0001664747615875328, + "loss": 0.0146, "step": 343410 }, { - "epoch": 1.73, - "learning_rate": 4.011028651285751e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016647087337116133, + "loss": 0.0139, "step": 343420 }, { - "epoch": 1.73, - "learning_rate": 4.0102718819843495e-05, - "loss": 0.0094, + "epoch": 0.89, + "learning_rate": 0.0001664669851547899, + "loss": 0.0144, "step": 343430 }, { - "epoch": 1.73, - "learning_rate": 4.0095151126829483e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016646309693841841, + "loss": 0.0155, "step": 343440 }, { - "epoch": 1.73, - "learning_rate": 4.008758343381548e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016645920872204696, + "loss": 0.0141, "step": 343450 }, { - "epoch": 1.73, - "learning_rate": 4.008001574080147e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016645532050567547, + "loss": 0.0107, "step": 343460 }, { - "epoch": 1.73, - "learning_rate": 4.0072448047787455e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.00016645143228930404, + "loss": 0.0141, "step": 343470 }, { - "epoch": 1.73, - "learning_rate": 4.006488035477344e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016644754407293255, + "loss": 0.011, "step": 343480 }, { - "epoch": 1.73, - "learning_rate": 4.005731266175944e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.0001664436558565611, + "loss": 0.0375, "step": 343490 }, { - "epoch": 1.73, - "learning_rate": 4.0049744968745426e-05, - "loss": 0.0045, + "epoch": 0.89, + "learning_rate": 0.0001664397676401896, + "loss": 0.0137, "step": 343500 }, { - "epoch": 1.73, - "learning_rate": 4.0042177275731415e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016643587942381818, + "loss": 0.015, "step": 343510 }, { - "epoch": 1.73, - "learning_rate": 4.00346095827174e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001664319912074467, + "loss": 0.0165, "step": 343520 }, { - "epoch": 1.73, - "learning_rate": 4.00270418897034e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.00016642810299107524, + "loss": 0.014, "step": 343530 }, { - "epoch": 1.73, - "learning_rate": 4.0019474196689386e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016642421477470375, + "loss": 0.0119, "step": 343540 }, { - "epoch": 1.73, - "learning_rate": 4.0011906503675374e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016642032655833232, + "loss": 0.0126, "step": 343550 }, { - "epoch": 1.73, - "learning_rate": 4.000433881066136e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016641643834196083, + "loss": 0.0126, "step": 343560 }, { - "epoch": 1.73, - "learning_rate": 3.999677111764736e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016641255012558937, + "loss": 0.0119, "step": 343570 }, { - "epoch": 1.73, - "learning_rate": 3.9989203424633346e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.0001664086619092179, + "loss": 0.0123, "step": 343580 }, { - "epoch": 1.73, - "learning_rate": 3.9981635731619334e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016640477369284646, + "loss": 0.0155, "step": 343590 }, { - "epoch": 1.73, - "learning_rate": 3.997406803860532e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.000166400885476475, + "loss": 0.0156, "step": 343600 }, { - "epoch": 1.73, - "learning_rate": 3.9966500345591304e-05, - "loss": 0.009, + "epoch": 0.89, + "learning_rate": 0.00016639699726010351, + "loss": 0.014, "step": 343610 }, { - "epoch": 1.73, - "learning_rate": 3.99589326525773e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016639310904373206, + "loss": 0.0166, "step": 343620 }, { - "epoch": 1.73, - "learning_rate": 3.995136495956329e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.00016638922082736057, + "loss": 0.0133, "step": 343630 }, { - "epoch": 1.73, - "learning_rate": 3.9943797266549275e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016638533261098914, + "loss": 0.0157, "step": 343640 }, { - "epoch": 1.73, - "learning_rate": 3.993622957353527e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.00016638144439461765, + "loss": 0.0121, "step": 343650 }, { - "epoch": 1.73, - "learning_rate": 3.992866188052126e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.0001663775561782462, + "loss": 0.0144, "step": 343660 }, { - "epoch": 1.73, - "learning_rate": 3.9921094187507246e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.0001663736679618747, + "loss": 0.0157, "step": 343670 }, { - "epoch": 1.73, - "learning_rate": 3.9913526494493235e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016636977974550328, + "loss": 0.0139, "step": 343680 }, { - "epoch": 1.73, - "learning_rate": 3.990595880147923e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.0001663658915291318, + "loss": 0.015, "step": 343690 }, { - "epoch": 1.73, - "learning_rate": 3.989839110846522e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016636200331276033, + "loss": 0.0123, "step": 343700 }, { - "epoch": 1.73, - "learning_rate": 3.9890823415451206e-05, - "loss": 0.004, + "epoch": 0.89, + "learning_rate": 0.00016635811509638885, + "loss": 0.0126, "step": 343710 }, { - "epoch": 1.73, - "learning_rate": 3.9883255722437194e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016635422688001742, + "loss": 0.0148, "step": 343720 }, { - "epoch": 1.73, - "learning_rate": 3.987568802942319e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016635033866364593, + "loss": 0.0116, "step": 343730 }, { - "epoch": 1.73, - "learning_rate": 3.986812033640918e-05, - "loss": 0.009, + "epoch": 0.89, + "learning_rate": 0.00016634645044727447, + "loss": 0.0122, "step": 343740 }, { - "epoch": 1.73, - "learning_rate": 3.9860552643395166e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.000166342562230903, + "loss": 0.0156, "step": 343750 }, { - "epoch": 1.73, - "learning_rate": 3.9852984950381154e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016633867401453156, + "loss": 0.0145, "step": 343760 }, { - "epoch": 1.73, - "learning_rate": 3.984541725736715e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.0001663347857981601, + "loss": 0.0122, "step": 343770 }, { - "epoch": 1.73, - "learning_rate": 3.983784956435314e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016633089758178861, + "loss": 0.0135, "step": 343780 }, { - "epoch": 1.73, - "learning_rate": 3.9830281871339125e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016632700936541713, + "loss": 0.0128, "step": 343790 }, { - "epoch": 1.73, - "learning_rate": 3.9822714178325114e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001663231211490457, + "loss": 0.0111, "step": 343800 }, { - "epoch": 1.73, - "learning_rate": 3.981514648531111e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016631923293267424, + "loss": 0.013, "step": 343810 }, { - "epoch": 1.73, - "learning_rate": 3.98075787922971e-05, - "loss": 0.0097, + "epoch": 0.89, + "learning_rate": 0.00016631534471630275, + "loss": 0.0147, "step": 343820 }, { - "epoch": 1.73, - "learning_rate": 3.9800011099283085e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.0001663114564999313, + "loss": 0.0145, "step": 343830 }, { - "epoch": 1.73, - "learning_rate": 3.979244340626907e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016630756828355984, + "loss": 0.021, "step": 343840 }, { - "epoch": 1.73, - "learning_rate": 3.978487571325507e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.00016630368006718838, + "loss": 0.0127, "step": 343850 }, { - "epoch": 1.73, - "learning_rate": 3.9777308020241056e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.0001662997918508169, + "loss": 0.0138, "step": 343860 }, { - "epoch": 1.73, - "learning_rate": 3.9769740327227045e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.00016629590363444543, + "loss": 0.0135, "step": 343870 }, { - "epoch": 1.73, - "learning_rate": 3.976217263421303e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016629201541807395, + "loss": 0.0134, "step": 343880 }, { - "epoch": 1.73, - "learning_rate": 3.975460494119903e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016628812720170252, + "loss": 0.0136, "step": 343890 }, { - "epoch": 1.74, - "learning_rate": 3.9747037248185016e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016628423898533103, + "loss": 0.0112, "step": 343900 }, { - "epoch": 1.74, - "learning_rate": 3.9739469555171004e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016628035076895957, + "loss": 0.0129, "step": 343910 }, { - "epoch": 1.74, - "learning_rate": 3.9731901862156986e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.0001662764625525881, + "loss": 0.0139, "step": 343920 }, { - "epoch": 1.74, - "learning_rate": 3.9724334169142974e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.00016627257433621666, + "loss": 0.0159, "step": 343930 }, { - "epoch": 1.74, - "learning_rate": 3.971676647612897e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016626868611984517, + "loss": 0.0127, "step": 343940 }, { - "epoch": 1.74, - "learning_rate": 3.970919878311496e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.0001662647979034737, + "loss": 0.0126, "step": 343950 }, { - "epoch": 1.74, - "learning_rate": 3.9701631090100945e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016626090968710223, + "loss": 0.0138, "step": 343960 }, { - "epoch": 1.74, - "learning_rate": 3.9694063397086934e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.0001662570214707308, + "loss": 0.0129, "step": 343970 }, { - "epoch": 1.74, - "learning_rate": 3.968649570407293e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016625313325435934, + "loss": 0.0105, "step": 343980 }, { - "epoch": 1.74, - "learning_rate": 3.967892801105892e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.00016624924503798785, + "loss": 0.0122, "step": 343990 }, { - "epoch": 1.74, - "learning_rate": 3.9671360318044905e-05, - "loss": 0.004, + "epoch": 0.89, + "learning_rate": 0.0001662453568216164, + "loss": 0.0123, "step": 344000 }, { - "epoch": 1.74, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004634759854525328, - "eval_runtime": 116.8176, - "eval_samples_per_second": 17.121, - "eval_steps_per_second": 4.28, + "epoch": 0.89, + "eval_cer": 0.8817558725266665, + "eval_loss": 0.008971183560788631, + "eval_runtime": 107.4319, + "eval_samples_per_second": 18.616, + "eval_steps_per_second": 4.654, "step": 344000 }, { - "epoch": 1.74, - "learning_rate": 3.966379262503089e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016624146860524494, + "loss": 0.0164, "step": 344010 }, { - "epoch": 1.74, - "learning_rate": 3.965622493201689e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016623758038887348, + "loss": 0.0116, "step": 344020 }, { - "epoch": 1.74, - "learning_rate": 3.9648657239002876e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.000166233692172502, + "loss": 0.0129, "step": 344030 }, { - "epoch": 1.74, - "learning_rate": 3.9641089545988865e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016622980395613053, + "loss": 0.0159, "step": 344040 }, { - "epoch": 1.74, - "learning_rate": 3.963352185297485e-05, - "loss": 0.0043, + "epoch": 0.89, + "learning_rate": 0.00016622591573975908, + "loss": 0.0154, "step": 344050 }, { - "epoch": 1.74, - "learning_rate": 3.962595415996085e-05, - "loss": 0.0085, + "epoch": 0.89, + "learning_rate": 0.00016622202752338762, + "loss": 0.0135, "step": 344060 }, { - "epoch": 1.74, - "learning_rate": 3.9618386466946836e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016621813930701613, + "loss": 0.0168, "step": 344070 }, { - "epoch": 1.74, - "learning_rate": 3.9610818773932824e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016621425109064467, + "loss": 0.0153, "step": 344080 }, { - "epoch": 1.74, - "learning_rate": 3.960325108091881e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016621036287427324, + "loss": 0.0157, "step": 344090 }, { - "epoch": 1.74, - "learning_rate": 3.959568338790481e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016620647465790176, + "loss": 0.0122, "step": 344100 }, { - "epoch": 1.74, - "learning_rate": 3.9588115694890796e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016620258644153027, + "loss": 0.0131, "step": 344110 }, { - "epoch": 1.74, - "learning_rate": 3.9580548001876784e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001661986982251588, + "loss": 0.0125, "step": 344120 }, { - "epoch": 1.74, - "learning_rate": 3.957298030886277e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016619481000878733, + "loss": 0.0126, "step": 344130 }, { - "epoch": 1.74, - "learning_rate": 3.956541261584877e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001661909217924159, + "loss": 0.0161, "step": 344140 }, { - "epoch": 1.74, - "learning_rate": 3.9557844922834755e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016618703357604444, + "loss": 0.0122, "step": 344150 }, { - "epoch": 1.74, - "learning_rate": 3.9550277229820744e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016618314535967295, + "loss": 0.0129, "step": 344160 }, { - "epoch": 1.74, - "learning_rate": 3.954270953680674e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.0001661792571433015, + "loss": 0.014, "step": 344170 }, { - "epoch": 1.74, - "learning_rate": 3.953514184379273e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016617536892693004, + "loss": 0.0111, "step": 344180 }, { - "epoch": 1.74, - "learning_rate": 3.9527574150778715e-05, - "loss": 0.0086, + "epoch": 0.89, + "learning_rate": 0.00016617148071055858, + "loss": 0.0113, "step": 344190 }, { - "epoch": 1.74, - "learning_rate": 3.95200064577647e-05, - "loss": 0.0051, + "epoch": 0.89, + "learning_rate": 0.0001661675924941871, + "loss": 0.0129, "step": 344200 }, { - "epoch": 1.74, - "learning_rate": 3.95124387647507e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016616370427781563, + "loss": 0.015, "step": 344210 }, { - "epoch": 1.74, - "learning_rate": 3.9504871071736687e-05, - "loss": 0.008, + "epoch": 0.89, + "learning_rate": 0.00016615981606144417, + "loss": 0.0127, "step": 344220 }, { - "epoch": 1.74, - "learning_rate": 3.949730337872267e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.00016615592784507272, + "loss": 0.0164, "step": 344230 }, { - "epoch": 1.74, - "learning_rate": 3.9489735685708656e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016615203962870123, + "loss": 0.0125, "step": 344240 }, { - "epoch": 1.74, - "learning_rate": 3.9482167992694644e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016614815141232977, + "loss": 0.0152, "step": 344250 }, { - "epoch": 1.74, - "learning_rate": 3.947460029968064e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016614426319595831, + "loss": 0.0128, "step": 344260 }, { - "epoch": 1.74, - "learning_rate": 3.946703260666663e-05, - "loss": 0.0042, + "epoch": 0.89, + "learning_rate": 0.00016614037497958686, + "loss": 0.0135, "step": 344270 }, { - "epoch": 1.74, - "learning_rate": 3.9459464913652616e-05, - "loss": 0.0044, + "epoch": 0.89, + "learning_rate": 0.00016613648676321537, + "loss": 0.0165, "step": 344280 }, { - "epoch": 1.74, - "learning_rate": 3.9451897220638604e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.0001661325985468439, + "loss": 0.0133, "step": 344290 }, { - "epoch": 1.74, - "learning_rate": 3.94443295276246e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016612871033047248, + "loss": 0.0114, "step": 344300 }, { - "epoch": 1.74, - "learning_rate": 3.943676183461059e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.000166124822114101, + "loss": 0.0117, "step": 344310 }, { - "epoch": 1.74, - "learning_rate": 3.9429194141596575e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016612093389772954, + "loss": 0.0177, "step": 344320 }, { - "epoch": 1.74, - "learning_rate": 3.9421626448582564e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.00016611704568135805, + "loss": 0.0098, "step": 344330 }, { - "epoch": 1.74, - "learning_rate": 3.941405875556856e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016611315746498662, + "loss": 0.0145, "step": 344340 }, { - "epoch": 1.74, - "learning_rate": 3.940649106255455e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016610926924861513, + "loss": 0.0118, "step": 344350 }, { - "epoch": 1.74, - "learning_rate": 3.9398923369540535e-05, - "loss": 0.0073, + "epoch": 0.89, + "learning_rate": 0.00016610538103224368, + "loss": 0.0138, "step": 344360 }, { - "epoch": 1.74, - "learning_rate": 3.939135567652652e-05, - "loss": 0.0046, + "epoch": 0.89, + "learning_rate": 0.0001661014928158722, + "loss": 0.0106, "step": 344370 }, { - "epoch": 1.74, - "learning_rate": 3.938378798351252e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016609760459950073, + "loss": 0.0166, "step": 344380 }, { - "epoch": 1.74, - "learning_rate": 3.9376220290498507e-05, - "loss": 0.0047, + "epoch": 0.89, + "learning_rate": 0.00016609371638312927, + "loss": 0.0107, "step": 344390 }, { - "epoch": 1.74, - "learning_rate": 3.9368652597484495e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.00016608982816675782, + "loss": 0.0129, "step": 344400 }, { - "epoch": 1.74, - "learning_rate": 3.936108490447048e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016608593995038633, + "loss": 0.0181, "step": 344410 }, { - "epoch": 1.74, - "learning_rate": 3.935351721145648e-05, - "loss": 0.0087, + "epoch": 0.89, + "learning_rate": 0.00016608205173401487, + "loss": 0.0173, "step": 344420 }, { - "epoch": 1.74, - "learning_rate": 3.9345949518442466e-05, - "loss": 0.0074, + "epoch": 0.89, + "learning_rate": 0.00016607816351764341, + "loss": 0.013, "step": 344430 }, { - "epoch": 1.74, - "learning_rate": 3.9338381825428454e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.00016607427530127196, + "loss": 0.0113, "step": 344440 }, { - "epoch": 1.74, - "learning_rate": 3.933081413241444e-05, - "loss": 0.004, + "epoch": 0.89, + "learning_rate": 0.00016607038708490047, + "loss": 0.0113, "step": 344450 }, { - "epoch": 1.74, - "learning_rate": 3.932324643940044e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.000166066498868529, + "loss": 0.0146, "step": 344460 }, { - "epoch": 1.74, - "learning_rate": 3.9315678746386426e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016606261065215758, + "loss": 0.0147, "step": 344470 }, { - "epoch": 1.74, - "learning_rate": 3.9308111053372414e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.0001660587224357861, + "loss": 0.009, "step": 344480 }, { - "epoch": 1.74, - "learning_rate": 3.93005433603584e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016605483421941464, + "loss": 0.0136, "step": 344490 }, { - "epoch": 1.74, - "learning_rate": 3.92929756673444e-05, - "loss": 0.0089, + "epoch": 0.89, + "learning_rate": 0.00016605094600304315, + "loss": 0.0106, "step": 344500 }, { - "epoch": 1.74, - "learning_rate": 3.9285407974330386e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016604705778667172, + "loss": 0.0121, "step": 344510 }, { - "epoch": 1.74, - "learning_rate": 3.9277840281316374e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016604316957030023, + "loss": 0.0122, "step": 344520 }, { - "epoch": 1.74, - "learning_rate": 3.927027258830236e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.00016603928135392878, + "loss": 0.012, "step": 344530 }, { - "epoch": 1.74, - "learning_rate": 3.926270489528836e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.0001660353931375573, + "loss": 0.015, "step": 344540 }, { - "epoch": 1.74, - "learning_rate": 3.925513720227434e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016603150492118586, + "loss": 0.0116, "step": 344550 }, { - "epoch": 1.74, - "learning_rate": 3.924756950926033e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016602761670481437, + "loss": 0.0134, "step": 344560 }, { - "epoch": 1.74, - "learning_rate": 3.9240001816246315e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016602372848844292, + "loss": 0.0169, "step": 344570 }, { - "epoch": 1.74, - "learning_rate": 3.92324341232323e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016601984027207143, + "loss": 0.0136, "step": 344580 }, { - "epoch": 1.74, - "learning_rate": 3.92248664302183e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.0001660159520557, + "loss": 0.0126, "step": 344590 }, { - "epoch": 1.74, - "learning_rate": 3.9217298737204286e-05, - "loss": 0.0055, + "epoch": 0.89, + "learning_rate": 0.0001660120638393285, + "loss": 0.0116, "step": 344600 }, { - "epoch": 1.74, - "learning_rate": 3.9209731044190274e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016600817562295705, + "loss": 0.0099, "step": 344610 }, { - "epoch": 1.74, - "learning_rate": 3.920216335117627e-05, - "loss": 0.0039, + "epoch": 0.89, + "learning_rate": 0.00016600428740658557, + "loss": 0.016, "step": 344620 }, { - "epoch": 1.74, - "learning_rate": 3.919459565816226e-05, - "loss": 0.0081, + "epoch": 0.89, + "learning_rate": 0.0001660003991902141, + "loss": 0.0132, "step": 344630 }, { - "epoch": 1.74, - "learning_rate": 3.9187027965148246e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016599651097384268, + "loss": 0.0176, "step": 344640 }, { - "epoch": 1.74, - "learning_rate": 3.9179460272134234e-05, - "loss": 0.0084, + "epoch": 0.89, + "learning_rate": 0.0001659926227574712, + "loss": 0.0157, "step": 344650 }, { - "epoch": 1.74, - "learning_rate": 3.917189257912023e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.0001659887345410997, + "loss": 0.0119, "step": 344660 }, { - "epoch": 1.74, - "learning_rate": 3.916432488610622e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.00016598484632472825, + "loss": 0.0138, "step": 344670 }, { - "epoch": 1.74, - "learning_rate": 3.9156757193092206e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016598095810835682, + "loss": 0.0123, "step": 344680 }, { - "epoch": 1.74, - "learning_rate": 3.9149189500078194e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016597706989198533, + "loss": 0.0128, "step": 344690 }, { - "epoch": 1.74, - "learning_rate": 3.914162180706419e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016597318167561388, + "loss": 0.0151, "step": 344700 }, { - "epoch": 1.74, - "learning_rate": 3.913405411405018e-05, - "loss": 0.0134, + "epoch": 0.89, + "learning_rate": 0.0001659692934592424, + "loss": 0.0135, "step": 344710 }, { - "epoch": 1.74, - "learning_rate": 3.9126486421036165e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016596540524287096, + "loss": 0.0134, "step": 344720 }, { - "epoch": 1.74, - "learning_rate": 3.9118918728022153e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016596151702649947, + "loss": 0.0149, "step": 344730 }, { - "epoch": 1.74, - "learning_rate": 3.911135103500815e-05, - "loss": 0.0071, + "epoch": 0.89, + "learning_rate": 0.00016595762881012801, + "loss": 0.0135, "step": 344740 }, { - "epoch": 1.74, - "learning_rate": 3.910378334199414e-05, - "loss": 0.006, + "epoch": 0.89, + "learning_rate": 0.00016595374059375653, + "loss": 0.0131, "step": 344750 }, { - "epoch": 1.74, - "learning_rate": 3.9096215648980125e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.0001659498523773851, + "loss": 0.016, "step": 344760 }, { - "epoch": 1.74, - "learning_rate": 3.908864795596611e-05, - "loss": 0.0044, + "epoch": 0.89, + "learning_rate": 0.0001659459641610136, + "loss": 0.0144, "step": 344770 }, { - "epoch": 1.74, - "learning_rate": 3.908108026295211e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016594207594464215, + "loss": 0.0156, "step": 344780 }, { - "epoch": 1.74, - "learning_rate": 3.9073512569938096e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016593818772827067, + "loss": 0.0146, "step": 344790 }, { - "epoch": 1.74, - "learning_rate": 3.9065944876924085e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016593429951189924, + "loss": 0.0115, "step": 344800 }, { - "epoch": 1.74, - "learning_rate": 3.905837718391007e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016593041129552775, + "loss": 0.0121, "step": 344810 }, { - "epoch": 1.74, - "learning_rate": 3.905080949089607e-05, - "loss": 0.007, + "epoch": 0.89, + "learning_rate": 0.0001659265230791563, + "loss": 0.0147, "step": 344820 }, { - "epoch": 1.74, - "learning_rate": 3.9043241797882056e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001659226348627848, + "loss": 0.0099, "step": 344830 }, { - "epoch": 1.74, - "learning_rate": 3.9035674104868044e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016591874664641338, + "loss": 0.0123, "step": 344840 }, { - "epoch": 1.74, - "learning_rate": 3.902810641185403e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016591485843004192, + "loss": 0.0141, "step": 344850 }, { - "epoch": 1.74, - "learning_rate": 3.9020538718840014e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.00016591097021367043, + "loss": 0.014, "step": 344860 }, { - "epoch": 1.74, - "learning_rate": 3.901297102582601e-05, - "loss": 0.0072, + "epoch": 0.89, + "learning_rate": 0.00016590708199729897, + "loss": 0.0118, "step": 344870 }, { - "epoch": 1.74, - "learning_rate": 3.9005403332812e-05, - "loss": 0.0099, + "epoch": 0.89, + "learning_rate": 0.0001659031937809275, + "loss": 0.0122, "step": 344880 }, { - "epoch": 1.74, - "learning_rate": 3.8997835639797985e-05, - "loss": 0.0063, + "epoch": 0.89, + "learning_rate": 0.00016589930556455606, + "loss": 0.0132, "step": 344890 }, { - "epoch": 1.74, - "learning_rate": 3.8990267946783973e-05, - "loss": 0.0065, + "epoch": 0.89, + "learning_rate": 0.00016589541734818457, + "loss": 0.0173, "step": 344900 }, { - "epoch": 1.74, - "learning_rate": 3.898270025376997e-05, - "loss": 0.0067, + "epoch": 0.89, + "learning_rate": 0.00016589152913181311, + "loss": 0.0134, "step": 344910 }, { - "epoch": 1.74, - "learning_rate": 3.897513256075596e-05, - "loss": 0.0049, + "epoch": 0.89, + "learning_rate": 0.00016588764091544163, + "loss": 0.0098, "step": 344920 }, { - "epoch": 1.74, - "learning_rate": 3.8967564867741945e-05, - "loss": 0.0058, + "epoch": 0.89, + "learning_rate": 0.0001658837526990702, + "loss": 0.0164, "step": 344930 }, { - "epoch": 1.74, - "learning_rate": 3.895999717472793e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.0001658798644826987, + "loss": 0.0148, "step": 344940 }, { - "epoch": 1.74, - "learning_rate": 3.895242948171393e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.00016587597626632725, + "loss": 0.0154, "step": 344950 }, { - "epoch": 1.74, - "learning_rate": 3.8944861788699916e-05, - "loss": 0.0059, + "epoch": 0.89, + "learning_rate": 0.00016587208804995577, + "loss": 0.0124, "step": 344960 }, { - "epoch": 1.74, - "learning_rate": 3.8937294095685905e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.00016586819983358434, + "loss": 0.0142, "step": 344970 }, { - "epoch": 1.74, - "learning_rate": 3.892972640267189e-05, - "loss": 0.0096, + "epoch": 0.89, + "learning_rate": 0.00016586431161721285, + "loss": 0.0119, "step": 344980 }, { - "epoch": 1.74, - "learning_rate": 3.892215870965789e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.0001658604234008414, + "loss": 0.0159, "step": 344990 }, { - "epoch": 1.74, - "learning_rate": 3.8914591016643876e-05, - "loss": 0.0079, + "epoch": 0.89, + "learning_rate": 0.0001658565351844699, + "loss": 0.0155, "step": 345000 }, { - "epoch": 1.74, - "eval_cer": 0.9144159137201398, - "eval_loss": 0.004668357782065868, - "eval_runtime": 116.7577, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.89, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.008910181932151318, + "eval_runtime": 107.3178, + "eval_samples_per_second": 18.636, + "eval_steps_per_second": 4.659, "step": 345000 }, { - "epoch": 1.74, - "learning_rate": 3.8907023323629864e-05, - "loss": 0.0054, + "epoch": 0.89, + "learning_rate": 0.00016585264696809848, + "loss": 0.0124, "step": 345010 }, { - "epoch": 1.74, - "learning_rate": 3.889945563061585e-05, - "loss": 0.0093, + "epoch": 0.89, + "learning_rate": 0.00016584875875172702, + "loss": 0.0131, "step": 345020 }, { - "epoch": 1.74, - "learning_rate": 3.889188793760185e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016584487053535553, + "loss": 0.0139, "step": 345030 }, { - "epoch": 1.74, - "learning_rate": 3.8884320244587836e-05, - "loss": 0.0052, + "epoch": 0.89, + "learning_rate": 0.00016584098231898407, + "loss": 0.0161, "step": 345040 }, { - "epoch": 1.74, - "learning_rate": 3.8876752551573824e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016583709410261262, + "loss": 0.0104, "step": 345050 }, { - "epoch": 1.74, - "learning_rate": 3.886918485855981e-05, - "loss": 0.0091, + "epoch": 0.89, + "learning_rate": 0.00016583320588624116, + "loss": 0.0153, "step": 345060 }, { - "epoch": 1.74, - "learning_rate": 3.886161716554581e-05, - "loss": 0.0057, + "epoch": 0.89, + "learning_rate": 0.00016582931766986967, + "loss": 0.014, "step": 345070 }, { - "epoch": 1.74, - "learning_rate": 3.8854049472531795e-05, - "loss": 0.0076, + "epoch": 0.89, + "learning_rate": 0.0001658254294534982, + "loss": 0.0122, "step": 345080 }, { - "epoch": 1.74, - "learning_rate": 3.8846481779517784e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.00016582154123712676, + "loss": 0.0118, "step": 345090 }, { - "epoch": 1.74, - "learning_rate": 3.883891408650377e-05, - "loss": 0.005, + "epoch": 0.89, + "learning_rate": 0.0001658176530207553, + "loss": 0.0125, "step": 345100 }, { - "epoch": 1.74, - "learning_rate": 3.883134639348977e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.0001658137648043838, + "loss": 0.0127, "step": 345110 }, { - "epoch": 1.74, - "learning_rate": 3.8823778700475755e-05, - "loss": 0.0042, + "epoch": 0.89, + "learning_rate": 0.00016580987658801235, + "loss": 0.0117, "step": 345120 }, { - "epoch": 1.74, - "learning_rate": 3.881621100746174e-05, - "loss": 0.0061, + "epoch": 0.89, + "learning_rate": 0.00016580598837164087, + "loss": 0.0117, "step": 345130 }, { - "epoch": 1.74, - "learning_rate": 3.880864331444774e-05, - "loss": 0.0062, + "epoch": 0.89, + "learning_rate": 0.00016580210015526944, + "loss": 0.0131, "step": 345140 }, { - "epoch": 1.74, - "learning_rate": 3.8801075621433726e-05, - "loss": 0.0064, + "epoch": 0.89, + "learning_rate": 0.00016579821193889795, + "loss": 0.0098, "step": 345150 }, { - "epoch": 1.74, - "learning_rate": 3.8793507928419715e-05, - "loss": 0.0068, + "epoch": 0.89, + "learning_rate": 0.0001657943237225265, + "loss": 0.0097, "step": 345160 }, { - "epoch": 1.74, - "learning_rate": 3.87859402354057e-05, - "loss": 0.0053, + "epoch": 0.89, + "learning_rate": 0.000165790435506155, + "loss": 0.0099, "step": 345170 }, { - "epoch": 1.74, - "learning_rate": 3.8778372542391684e-05, - "loss": 0.0078, + "epoch": 0.89, + "learning_rate": 0.00016578654728978358, + "loss": 0.0137, "step": 345180 }, { - "epoch": 1.74, - "learning_rate": 3.877080484937768e-05, - "loss": 0.0056, + "epoch": 0.89, + "learning_rate": 0.00016578265907341212, + "loss": 0.014, "step": 345190 }, { - "epoch": 1.74, - "learning_rate": 3.876323715636367e-05, - "loss": 0.0088, + "epoch": 0.89, + "learning_rate": 0.00016577877085704063, + "loss": 0.0123, "step": 345200 }, { - "epoch": 1.74, - "learning_rate": 3.8755669463349656e-05, - "loss": 0.0048, + "epoch": 0.89, + "learning_rate": 0.00016577488264066917, + "loss": 0.0132, "step": 345210 }, { - "epoch": 1.74, - "learning_rate": 3.8748101770335644e-05, - "loss": 0.0066, + "epoch": 0.89, + "learning_rate": 0.00016577099442429772, + "loss": 0.0149, "step": 345220 }, { - "epoch": 1.74, - "learning_rate": 3.874053407732164e-05, - "loss": 0.0075, + "epoch": 0.89, + "learning_rate": 0.00016576710620792626, + "loss": 0.0116, "step": 345230 }, { - "epoch": 1.74, - "learning_rate": 3.873296638430763e-05, - "loss": 0.0082, + "epoch": 0.89, + "learning_rate": 0.00016576321799155477, + "loss": 0.0116, "step": 345240 }, { - "epoch": 1.74, - "learning_rate": 3.8725398691293615e-05, - "loss": 0.0077, + "epoch": 0.89, + "learning_rate": 0.0001657593297751833, + "loss": 0.0151, "step": 345250 }, { - "epoch": 1.74, - "learning_rate": 3.8717830998279604e-05, - "loss": 0.0069, + "epoch": 0.89, + "learning_rate": 0.00016575544155881185, + "loss": 0.0142, "step": 345260 }, { - "epoch": 1.74, - "learning_rate": 3.87102633052656e-05, - "loss": 0.0043, + "epoch": 0.89, + "learning_rate": 0.0001657515533424404, + "loss": 0.0114, "step": 345270 }, { - "epoch": 1.74, - "learning_rate": 3.870269561225159e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.0001657476651260689, + "loss": 0.0158, "step": 345280 }, { - "epoch": 1.74, - "learning_rate": 3.8695127919237575e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016574377690969745, + "loss": 0.0112, "step": 345290 }, { - "epoch": 1.74, - "learning_rate": 3.868756022622356e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.000165739888693326, + "loss": 0.0123, "step": 345300 }, { - "epoch": 1.74, - "learning_rate": 3.867999253320956e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016573600047695454, + "loss": 0.0125, "step": 345310 }, { - "epoch": 1.74, - "learning_rate": 3.8672424840195546e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016573211226058305, + "loss": 0.0151, "step": 345320 }, { - "epoch": 1.74, - "learning_rate": 3.8664857147181535e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.0001657282240442116, + "loss": 0.009, "step": 345330 }, { - "epoch": 1.74, - "learning_rate": 3.865728945416752e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016572433582784016, + "loss": 0.0111, "step": 345340 }, { - "epoch": 1.74, - "learning_rate": 3.864972176115352e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016572044761146868, + "loss": 0.014, "step": 345350 }, { - "epoch": 1.74, - "learning_rate": 3.8642154068139506e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016571655939509722, + "loss": 0.0127, "step": 345360 }, { - "epoch": 1.74, - "learning_rate": 3.8634586375125494e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016571267117872573, + "loss": 0.0132, "step": 345370 }, { - "epoch": 1.74, - "learning_rate": 3.862701868211148e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016570878296235425, + "loss": 0.0117, "step": 345380 }, { - "epoch": 1.74, - "learning_rate": 3.861945098909748e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016570489474598281, + "loss": 0.017, "step": 345390 }, { - "epoch": 1.74, - "learning_rate": 3.8611883296083466e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016570100652961136, + "loss": 0.011, "step": 345400 }, { - "epoch": 1.74, - "learning_rate": 3.8604315603069454e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016569711831323987, + "loss": 0.0146, "step": 345410 }, { - "epoch": 1.74, - "learning_rate": 3.859674791005544e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.0001656932300968684, + "loss": 0.0144, "step": 345420 }, { - "epoch": 1.74, - "learning_rate": 3.858918021704144e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016568934188049695, + "loss": 0.0122, "step": 345430 }, { - "epoch": 1.74, - "learning_rate": 3.8581612524027425e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.0001656854536641255, + "loss": 0.0127, "step": 345440 }, { - "epoch": 1.74, - "learning_rate": 3.8574044831013414e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.000165681565447754, + "loss": 0.0153, "step": 345450 }, { - "epoch": 1.74, - "learning_rate": 3.85664771379994e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016567767723138255, + "loss": 0.0102, "step": 345460 }, { - "epoch": 1.74, - "learning_rate": 3.85589094449854e-05, - "loss": 0.0077, + "epoch": 0.9, + "learning_rate": 0.0001656737890150111, + "loss": 0.0142, "step": 345470 }, { - "epoch": 1.74, - "learning_rate": 3.8551341751971385e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016566990079863964, + "loss": 0.0122, "step": 345480 }, { - "epoch": 1.74, - "learning_rate": 3.8543774058957366e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016566601258226815, + "loss": 0.0124, "step": 345490 }, { - "epoch": 1.74, - "learning_rate": 3.8536206365943355e-05, - "loss": 0.0095, + "epoch": 0.9, + "learning_rate": 0.0001656621243658967, + "loss": 0.0133, "step": 345500 }, { - "epoch": 1.74, - "learning_rate": 3.852863867292934e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016565823614952526, + "loss": 0.0144, "step": 345510 }, { - "epoch": 1.74, - "learning_rate": 3.852107097991534e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016565434793315377, + "loss": 0.012, "step": 345520 }, { - "epoch": 1.74, - "learning_rate": 3.8513503286901326e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001656504597167823, + "loss": 0.016, "step": 345530 }, { - "epoch": 1.74, - "learning_rate": 3.8505935593887314e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016564657150041083, + "loss": 0.0095, "step": 345540 }, { - "epoch": 1.74, - "learning_rate": 3.84983679008733e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001656426832840394, + "loss": 0.016, "step": 345550 }, { - "epoch": 1.74, - "learning_rate": 3.84908002078593e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016563879506766791, + "loss": 0.0109, "step": 345560 }, { - "epoch": 1.74, - "learning_rate": 3.8483232514845286e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016563490685129646, + "loss": 0.012, "step": 345570 }, { - "epoch": 1.74, - "learning_rate": 3.8475664821831274e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016563101863492497, + "loss": 0.0143, "step": 345580 }, { - "epoch": 1.74, - "learning_rate": 3.846809712881727e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016562713041855354, + "loss": 0.0126, "step": 345590 }, { - "epoch": 1.74, - "learning_rate": 3.846052943580326e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016562324220218205, + "loss": 0.0127, "step": 345600 }, { - "epoch": 1.74, - "learning_rate": 3.8452961742789245e-05, - "loss": 0.0085, + "epoch": 0.9, + "learning_rate": 0.0001656193539858106, + "loss": 0.0127, "step": 345610 }, { - "epoch": 1.74, - "learning_rate": 3.8445394049775234e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.0001656154657694391, + "loss": 0.0147, "step": 345620 }, { - "epoch": 1.74, - "learning_rate": 3.843782635676123e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016561157755306765, + "loss": 0.0119, "step": 345630 }, { - "epoch": 1.74, - "learning_rate": 3.843025866374722e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001656076893366962, + "loss": 0.0141, "step": 345640 }, { - "epoch": 1.74, - "learning_rate": 3.8422690970733205e-05, - "loss": 0.0087, + "epoch": 0.9, + "learning_rate": 0.00016560380112032473, + "loss": 0.0111, "step": 345650 }, { - "epoch": 1.74, - "learning_rate": 3.841512327771919e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016559991290395325, + "loss": 0.0155, "step": 345660 }, { - "epoch": 1.74, - "learning_rate": 3.840755558470519e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.0001655960246875818, + "loss": 0.0118, "step": 345670 }, { - "epoch": 1.74, - "learning_rate": 3.8399987891691177e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016559213647121036, + "loss": 0.0127, "step": 345680 }, { - "epoch": 1.74, - "learning_rate": 3.8392420198677165e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016558824825483887, + "loss": 0.015, "step": 345690 }, { - "epoch": 1.74, - "learning_rate": 3.838485250566315e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001655843600384674, + "loss": 0.02, "step": 345700 }, { - "epoch": 1.74, - "learning_rate": 3.837728481264915e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016558047182209593, + "loss": 0.0156, "step": 345710 }, { - "epoch": 1.74, - "learning_rate": 3.8369717119635136e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.0001655765836057245, + "loss": 0.0143, "step": 345720 }, { - "epoch": 1.74, - "learning_rate": 3.8362149426621124e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.000165572695389353, + "loss": 0.0139, "step": 345730 }, { - "epoch": 1.74, - "learning_rate": 3.835458173360711e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016556880717298155, + "loss": 0.0159, "step": 345740 }, { - "epoch": 1.74, - "learning_rate": 3.834701404059311e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016556491895661007, + "loss": 0.0102, "step": 345750 }, { - "epoch": 1.74, - "learning_rate": 3.8339446347579096e-05, - "loss": 0.0095, + "epoch": 0.9, + "learning_rate": 0.00016556103074023864, + "loss": 0.016, "step": 345760 }, { - "epoch": 1.74, - "learning_rate": 3.8331878654565084e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016555714252386715, + "loss": 0.0115, "step": 345770 }, { - "epoch": 1.74, - "learning_rate": 3.832431096155107e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.0001655532543074957, + "loss": 0.0118, "step": 345780 }, { - "epoch": 1.74, - "learning_rate": 3.831674326853707e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.0001655493660911242, + "loss": 0.0145, "step": 345790 }, { - "epoch": 1.74, - "learning_rate": 3.8309175575523055e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016554547787475278, + "loss": 0.0114, "step": 345800 }, { - "epoch": 1.74, - "learning_rate": 3.830160788250904e-05, - "loss": 0.0085, + "epoch": 0.9, + "learning_rate": 0.0001655415896583813, + "loss": 0.0136, "step": 345810 }, { - "epoch": 1.74, - "learning_rate": 3.8294040189495025e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016553770144200983, + "loss": 0.0104, "step": 345820 }, { - "epoch": 1.74, - "learning_rate": 3.828647249648101e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016553381322563835, + "loss": 0.0095, "step": 345830 }, { - "epoch": 1.74, - "learning_rate": 3.827890480346701e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016552992500926692, + "loss": 0.0136, "step": 345840 }, { - "epoch": 1.74, - "learning_rate": 3.8271337110452997e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016552603679289543, + "loss": 0.012, "step": 345850 }, { - "epoch": 1.74, - "learning_rate": 3.8263769417438985e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.00016552214857652397, + "loss": 0.014, "step": 345860 }, { - "epoch": 1.74, - "learning_rate": 3.825620172442497e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.0001655182603601525, + "loss": 0.0181, "step": 345870 }, { - "epoch": 1.75, - "learning_rate": 3.824863403141097e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016551437214378103, + "loss": 0.0154, "step": 345880 }, { - "epoch": 1.75, - "learning_rate": 3.8241066338396956e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.0001655104839274096, + "loss": 0.0124, "step": 345890 }, { - "epoch": 1.75, - "learning_rate": 3.8233498645382944e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.0001655065957110381, + "loss": 0.0139, "step": 345900 }, { - "epoch": 1.75, - "learning_rate": 3.822593095236893e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016550270749466665, + "loss": 0.0173, "step": 345910 }, { - "epoch": 1.75, - "learning_rate": 3.821836325935493e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.00016549881927829517, + "loss": 0.0129, "step": 345920 }, { - "epoch": 1.75, - "learning_rate": 3.8210795566340916e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016549493106192374, + "loss": 0.0116, "step": 345930 }, { - "epoch": 1.75, - "learning_rate": 3.8203227873326904e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016549104284555225, + "loss": 0.012, "step": 345940 }, { - "epoch": 1.75, - "learning_rate": 3.819566018031289e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.0001654871546291808, + "loss": 0.0157, "step": 345950 }, { - "epoch": 1.75, - "learning_rate": 3.818809248729889e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.0001654832664128093, + "loss": 0.0132, "step": 345960 }, { - "epoch": 1.75, - "learning_rate": 3.8180524794284876e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016547937819643788, + "loss": 0.0107, "step": 345970 }, { - "epoch": 1.75, - "learning_rate": 3.8172957101270864e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.0001654754899800664, + "loss": 0.0149, "step": 345980 }, { - "epoch": 1.75, - "learning_rate": 3.816538940825685e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016547160176369493, + "loss": 0.016, "step": 345990 }, { - "epoch": 1.75, - "learning_rate": 3.815782171524285e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016546771354732345, + "loss": 0.0109, "step": 346000 }, { - "epoch": 1.75, - "eval_cer": 0.9144227064930175, - "eval_loss": 0.004535060841590166, - "eval_runtime": 116.7184, - "eval_samples_per_second": 17.135, - "eval_steps_per_second": 4.284, + "epoch": 0.9, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.009006353095173836, + "eval_runtime": 107.5267, + "eval_samples_per_second": 18.6, + "eval_steps_per_second": 4.65, "step": 346000 }, { - "epoch": 1.75, - "learning_rate": 3.8150254022228835e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016546382533095202, + "loss": 0.0119, "step": 346010 }, { - "epoch": 1.75, - "learning_rate": 3.8142686329214823e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016545993711458053, + "loss": 0.0151, "step": 346020 }, { - "epoch": 1.75, - "learning_rate": 3.813511863620081e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016545604889820907, + "loss": 0.0149, "step": 346030 }, { - "epoch": 1.75, - "learning_rate": 3.812755094318681e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001654521606818376, + "loss": 0.0154, "step": 346040 }, { - "epoch": 1.75, - "learning_rate": 3.8119983250172795e-05, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.00016544827246546616, + "loss": 0.0135, "step": 346050 }, { - "epoch": 1.75, - "learning_rate": 3.811241555715878e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001654443842490947, + "loss": 0.0141, "step": 346060 }, { - "epoch": 1.75, - "learning_rate": 3.810484786414477e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001654404960327232, + "loss": 0.0135, "step": 346070 }, { - "epoch": 1.75, - "learning_rate": 3.8097280171130766e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016543660781635175, + "loss": 0.0131, "step": 346080 }, { - "epoch": 1.75, - "learning_rate": 3.8089712478116754e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001654327195999803, + "loss": 0.0121, "step": 346090 }, { - "epoch": 1.75, - "learning_rate": 3.808214478510274e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016542883138360884, + "loss": 0.0105, "step": 346100 }, { - "epoch": 1.75, - "learning_rate": 3.807457709208874e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016542494316723735, + "loss": 0.0104, "step": 346110 }, { - "epoch": 1.75, - "learning_rate": 3.806700939907472e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001654210549508659, + "loss": 0.0111, "step": 346120 }, { - "epoch": 1.75, - "learning_rate": 3.805944170606071e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001654171667344944, + "loss": 0.0129, "step": 346130 }, { - "epoch": 1.75, - "learning_rate": 3.8051874013046696e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016541327851812298, + "loss": 0.0113, "step": 346140 }, { - "epoch": 1.75, - "learning_rate": 3.8044306320032684e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.0001654093903017515, + "loss": 0.0124, "step": 346150 }, { - "epoch": 1.75, - "learning_rate": 3.803673862701868e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016540550208538003, + "loss": 0.0128, "step": 346160 }, { - "epoch": 1.75, - "learning_rate": 3.802917093400467e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016540161386900855, + "loss": 0.0161, "step": 346170 }, { - "epoch": 1.75, - "learning_rate": 3.8021603240990655e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016539772565263712, + "loss": 0.0098, "step": 346180 }, { - "epoch": 1.75, - "learning_rate": 3.8014035547976643e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016539383743626563, + "loss": 0.0117, "step": 346190 }, { - "epoch": 1.75, - "learning_rate": 3.800646785496264e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016538994921989417, + "loss": 0.0131, "step": 346200 }, { - "epoch": 1.75, - "learning_rate": 3.799890016194863e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.0001653860610035227, + "loss": 0.0142, "step": 346210 }, { - "epoch": 1.75, - "learning_rate": 3.7991332468934615e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016538217278715126, + "loss": 0.0135, "step": 346220 }, { - "epoch": 1.75, - "learning_rate": 3.79837647759206e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001653782845707798, + "loss": 0.0116, "step": 346230 }, { - "epoch": 1.75, - "learning_rate": 3.79761970829066e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001653743963544083, + "loss": 0.0122, "step": 346240 }, { - "epoch": 1.75, - "learning_rate": 3.7968629389892586e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016537050813803683, + "loss": 0.0144, "step": 346250 }, { - "epoch": 1.75, - "learning_rate": 3.7961061696878575e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.0001653666199216654, + "loss": 0.0105, "step": 346260 }, { - "epoch": 1.75, - "learning_rate": 3.795349400386456e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016536273170529394, + "loss": 0.0156, "step": 346270 }, { - "epoch": 1.75, - "learning_rate": 3.794592631085056e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016535884348892245, + "loss": 0.0114, "step": 346280 }, { - "epoch": 1.75, - "learning_rate": 3.7938358617836546e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.000165354955272551, + "loss": 0.0158, "step": 346290 }, { - "epoch": 1.75, - "learning_rate": 3.7930790924822534e-05, - "loss": 0.0079, + "epoch": 0.9, + "learning_rate": 0.00016535106705617953, + "loss": 0.0121, "step": 346300 }, { - "epoch": 1.75, - "learning_rate": 3.792322323180852e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016534717883980808, + "loss": 0.0112, "step": 346310 }, { - "epoch": 1.75, - "learning_rate": 3.791565553879452e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.0001653432906234366, + "loss": 0.011, "step": 346320 }, { - "epoch": 1.75, - "learning_rate": 3.7908087845780506e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016533940240706513, + "loss": 0.0126, "step": 346330 }, { - "epoch": 1.75, - "learning_rate": 3.7900520152766494e-05, - "loss": 0.0086, + "epoch": 0.9, + "learning_rate": 0.00016533551419069367, + "loss": 0.0154, "step": 346340 }, { - "epoch": 1.75, - "learning_rate": 3.789295245975248e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016533162597432222, + "loss": 0.0129, "step": 346350 }, { - "epoch": 1.75, - "learning_rate": 3.788538476673848e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016532773775795073, + "loss": 0.0111, "step": 346360 }, { - "epoch": 1.75, - "learning_rate": 3.7877817073724465e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016532384954157927, + "loss": 0.0144, "step": 346370 }, { - "epoch": 1.75, - "learning_rate": 3.7870249380710453e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016531996132520779, + "loss": 0.0199, "step": 346380 }, { - "epoch": 1.75, - "learning_rate": 3.786268168769644e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016531607310883635, + "loss": 0.012, "step": 346390 }, { - "epoch": 1.75, - "learning_rate": 3.785511399468244e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016531218489246487, + "loss": 0.0123, "step": 346400 }, { - "epoch": 1.75, - "learning_rate": 3.7847546301668425e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001653082966760934, + "loss": 0.012, "step": 346410 }, { - "epoch": 1.75, - "learning_rate": 3.783997860865441e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016530440845972193, + "loss": 0.0117, "step": 346420 }, { - "epoch": 1.75, - "learning_rate": 3.7832410915640395e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.0001653005202433505, + "loss": 0.0122, "step": 346430 }, { - "epoch": 1.75, - "learning_rate": 3.782484322262638e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016529663202697904, + "loss": 0.0123, "step": 346440 }, { - "epoch": 1.75, - "learning_rate": 3.781727552961238e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016529274381060755, + "loss": 0.0131, "step": 346450 }, { - "epoch": 1.75, - "learning_rate": 3.7809707836598366e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.0001652888555942361, + "loss": 0.0104, "step": 346460 }, { - "epoch": 1.75, - "learning_rate": 3.7802140143584354e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016528496737786463, + "loss": 0.0162, "step": 346470 }, { - "epoch": 1.75, - "learning_rate": 3.779457245057034e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016528107916149318, + "loss": 0.0115, "step": 346480 }, { - "epoch": 1.75, - "learning_rate": 3.778700475755634e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001652771909451217, + "loss": 0.0155, "step": 346490 }, { - "epoch": 1.75, - "learning_rate": 3.7779437064542326e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016527330272875023, + "loss": 0.023, "step": 346500 }, { - "epoch": 1.75, - "learning_rate": 3.7771869371528314e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016526941451237877, + "loss": 0.0155, "step": 346510 }, { - "epoch": 1.75, - "learning_rate": 3.77643016785143e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016526552629600731, + "loss": 0.0136, "step": 346520 }, { - "epoch": 1.75, - "learning_rate": 3.77567339855003e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.00016526163807963583, + "loss": 0.0166, "step": 346530 }, { - "epoch": 1.75, - "learning_rate": 3.7749166292486285e-05, - "loss": 0.0076, + "epoch": 0.9, + "learning_rate": 0.00016525774986326437, + "loss": 0.0118, "step": 346540 }, { - "epoch": 1.75, - "learning_rate": 3.7741598599472274e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.00016525386164689294, + "loss": 0.0147, "step": 346550 }, { - "epoch": 1.75, - "learning_rate": 3.773403090645827e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016524997343052145, + "loss": 0.0153, "step": 346560 }, { - "epoch": 1.75, - "learning_rate": 3.772646321344426e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016524608521414997, + "loss": 0.0144, "step": 346570 }, { - "epoch": 1.75, - "learning_rate": 3.7718895520430245e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001652421969977785, + "loss": 0.011, "step": 346580 }, { - "epoch": 1.75, - "learning_rate": 3.771132782741623e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016523830878140708, + "loss": 0.0158, "step": 346590 }, { - "epoch": 1.75, - "learning_rate": 3.770376013440223e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.0001652344205650356, + "loss": 0.0137, "step": 346600 }, { - "epoch": 1.75, - "learning_rate": 3.7696192441388216e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016523053234866414, + "loss": 0.0112, "step": 346610 }, { - "epoch": 1.75, - "learning_rate": 3.7688624748374205e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016522664413229265, + "loss": 0.0162, "step": 346620 }, { - "epoch": 1.75, - "learning_rate": 3.768105705536019e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.0001652227559159212, + "loss": 0.0116, "step": 346630 }, { - "epoch": 1.75, - "learning_rate": 3.767348936234619e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.00016521886769954973, + "loss": 0.0121, "step": 346640 }, { - "epoch": 1.75, - "learning_rate": 3.7665921669332176e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016521497948317827, + "loss": 0.0181, "step": 346650 }, { - "epoch": 1.75, - "learning_rate": 3.7658353976318164e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001652110912668068, + "loss": 0.0168, "step": 346660 }, { - "epoch": 1.75, - "learning_rate": 3.765078628330415e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016520720305043533, + "loss": 0.0132, "step": 346670 }, { - "epoch": 1.75, - "learning_rate": 3.764321859029015e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016520331483406387, + "loss": 0.019, "step": 346680 }, { - "epoch": 1.75, - "learning_rate": 3.7635650897276136e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016519942661769241, + "loss": 0.0142, "step": 346690 }, { - "epoch": 1.75, - "learning_rate": 3.7628083204262124e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016519553840132093, + "loss": 0.0146, "step": 346700 }, { - "epoch": 1.75, - "learning_rate": 3.762051551124811e-05, - "loss": 0.0077, + "epoch": 0.9, + "learning_rate": 0.00016519165018494947, + "loss": 0.0148, "step": 346710 }, { - "epoch": 1.75, - "learning_rate": 3.761294781823411e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.000165187761968578, + "loss": 0.0113, "step": 346720 }, { - "epoch": 1.75, - "learning_rate": 3.7605380125220095e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016518387375220655, + "loss": 0.0116, "step": 346730 }, { - "epoch": 1.75, - "learning_rate": 3.7597812432206084e-05, - "loss": 0.009, + "epoch": 0.9, + "learning_rate": 0.00016517998553583507, + "loss": 0.0152, "step": 346740 }, { - "epoch": 1.75, - "learning_rate": 3.7590244739192065e-05, - "loss": 0.009, + "epoch": 0.9, + "learning_rate": 0.0001651760973194636, + "loss": 0.0121, "step": 346750 }, { - "epoch": 1.75, - "learning_rate": 3.758267704617805e-05, - "loss": 0.0087, + "epoch": 0.9, + "learning_rate": 0.00016517220910309218, + "loss": 0.0128, "step": 346760 }, { - "epoch": 1.75, - "learning_rate": 3.757510935316405e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001651683208867207, + "loss": 0.0149, "step": 346770 }, { - "epoch": 1.75, - "learning_rate": 3.7567541660150036e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016516443267034923, + "loss": 0.0122, "step": 346780 }, { - "epoch": 1.75, - "learning_rate": 3.7559973967136025e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016516054445397775, + "loss": 0.0138, "step": 346790 }, { - "epoch": 1.75, - "learning_rate": 3.755240627412201e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016515665623760632, + "loss": 0.0097, "step": 346800 }, { - "epoch": 1.75, - "learning_rate": 3.754483858110801e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016515276802123483, + "loss": 0.0112, "step": 346810 }, { - "epoch": 1.75, - "learning_rate": 3.7537270888093996e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016514887980486337, + "loss": 0.0131, "step": 346820 }, { - "epoch": 1.75, - "learning_rate": 3.7529703195079984e-05, - "loss": 0.0088, + "epoch": 0.9, + "learning_rate": 0.0001651449915884919, + "loss": 0.0143, "step": 346830 }, { - "epoch": 1.75, - "learning_rate": 3.752213550206597e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016514110337212046, + "loss": 0.0144, "step": 346840 }, { - "epoch": 1.75, - "learning_rate": 3.751456780905197e-05, - "loss": 0.0047, + "epoch": 0.9, + "learning_rate": 0.00016513721515574897, + "loss": 0.011, "step": 346850 }, { - "epoch": 1.75, - "learning_rate": 3.7507000116037956e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016513332693937751, + "loss": 0.0136, "step": 346860 }, { - "epoch": 1.75, - "learning_rate": 3.7499432423023944e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016512943872300603, + "loss": 0.0106, "step": 346870 }, { - "epoch": 1.75, - "learning_rate": 3.749186473000993e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016512555050663457, + "loss": 0.0141, "step": 346880 }, { - "epoch": 1.75, - "learning_rate": 3.748429703699593e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.0001651216622902631, + "loss": 0.0177, "step": 346890 }, { - "epoch": 1.75, - "learning_rate": 3.7476729343981915e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.00016511777407389165, + "loss": 0.0099, "step": 346900 }, { - "epoch": 1.75, - "learning_rate": 3.7469161650967904e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016511388585752017, + "loss": 0.0143, "step": 346910 }, { - "epoch": 1.75, - "learning_rate": 3.746159395795389e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.0001651099976411487, + "loss": 0.0098, "step": 346920 }, { - "epoch": 1.75, - "learning_rate": 3.745402626493989e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016510610942477728, + "loss": 0.0123, "step": 346930 }, { - "epoch": 1.75, - "learning_rate": 3.7446458571925875e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.0001651022212084058, + "loss": 0.0121, "step": 346940 }, { - "epoch": 1.75, - "learning_rate": 3.743889087891186e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016509833299203433, + "loss": 0.0139, "step": 346950 }, { - "epoch": 1.75, - "learning_rate": 3.743132318589785e-05, - "loss": 0.0113, + "epoch": 0.9, + "learning_rate": 0.00016509444477566285, + "loss": 0.0119, "step": 346960 }, { - "epoch": 1.75, - "learning_rate": 3.7423755492883846e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016509055655929142, + "loss": 0.012, "step": 346970 }, { - "epoch": 1.75, - "learning_rate": 3.741618779986983e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016508666834291993, + "loss": 0.0124, "step": 346980 }, { - "epoch": 1.75, - "learning_rate": 3.740862010685582e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.00016508278012654847, + "loss": 0.0125, "step": 346990 }, { - "epoch": 1.75, - "learning_rate": 3.740105241384181e-05, - "loss": 0.0079, + "epoch": 0.9, + "learning_rate": 0.000165078891910177, + "loss": 0.0137, "step": 347000 }, { - "epoch": 1.75, - "eval_cer": 0.9144304696620207, - "eval_loss": 0.004600143525749445, - "eval_runtime": 116.8017, - "eval_samples_per_second": 17.123, - "eval_steps_per_second": 4.281, + "epoch": 0.9, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.008850464597344398, + "eval_runtime": 107.5314, + "eval_samples_per_second": 18.599, + "eval_steps_per_second": 4.65, "step": 347000 }, { - "epoch": 1.75, - "learning_rate": 3.73934847208278e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016507500369380556, + "loss": 0.0101, "step": 347010 }, { - "epoch": 1.75, - "learning_rate": 3.738591702781379e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016507111547743407, + "loss": 0.0126, "step": 347020 }, { - "epoch": 1.75, - "learning_rate": 3.737834933479978e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.0001650672272610626, + "loss": 0.0119, "step": 347030 }, { - "epoch": 1.75, - "learning_rate": 3.737078164178577e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016506333904469113, + "loss": 0.0134, "step": 347040 }, { - "epoch": 1.75, - "learning_rate": 3.736321394877176e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.0001650594508283197, + "loss": 0.0122, "step": 347050 }, { - "epoch": 1.75, - "learning_rate": 3.735564625575775e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.0001650555626119482, + "loss": 0.0151, "step": 347060 }, { - "epoch": 1.75, - "learning_rate": 3.734807856274374e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016505167439557675, + "loss": 0.0135, "step": 347070 }, { - "epoch": 1.75, - "learning_rate": 3.734051086972973e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016504778617920527, + "loss": 0.0137, "step": 347080 }, { - "epoch": 1.75, - "learning_rate": 3.733294317671572e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016504389796283384, + "loss": 0.0135, "step": 347090 }, { - "epoch": 1.75, - "learning_rate": 3.732537548370171e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016504000974646238, + "loss": 0.0152, "step": 347100 }, { - "epoch": 1.75, - "learning_rate": 3.73178077906877e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001650361215300909, + "loss": 0.0132, "step": 347110 }, { - "epoch": 1.75, - "learning_rate": 3.731024009767369e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.0001650322333137194, + "loss": 0.0164, "step": 347120 }, { - "epoch": 1.75, - "learning_rate": 3.730267240465968e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016502834509734795, + "loss": 0.0106, "step": 347130 }, { - "epoch": 1.75, - "learning_rate": 3.7295104711645667e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016502445688097652, + "loss": 0.0113, "step": 347140 }, { - "epoch": 1.75, - "learning_rate": 3.7287537018631655e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016502056866460503, + "loss": 0.0131, "step": 347150 }, { - "epoch": 1.75, - "learning_rate": 3.727996932561764e-05, - "loss": 0.0094, + "epoch": 0.9, + "learning_rate": 0.00016501668044823357, + "loss": 0.014, "step": 347160 }, { - "epoch": 1.75, - "learning_rate": 3.727240163260364e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.0001650127922318621, + "loss": 0.0119, "step": 347170 }, { - "epoch": 1.75, - "learning_rate": 3.7264833939589626e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016500890401549066, + "loss": 0.012, "step": 347180 }, { - "epoch": 1.75, - "learning_rate": 3.7257266246575614e-05, - "loss": 0.0047, + "epoch": 0.9, + "learning_rate": 0.00016500501579911917, + "loss": 0.013, "step": 347190 }, { - "epoch": 1.75, - "learning_rate": 3.72496985535616e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001650011275827477, + "loss": 0.0139, "step": 347200 }, { - "epoch": 1.75, - "learning_rate": 3.72421308605476e-05, - "loss": 0.0105, + "epoch": 0.9, + "learning_rate": 0.00016499723936637623, + "loss": 0.0121, "step": 347210 }, { - "epoch": 1.75, - "learning_rate": 3.7234563167533586e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001649933511500048, + "loss": 0.0149, "step": 347220 }, { - "epoch": 1.75, - "learning_rate": 3.7226995474519574e-05, - "loss": 0.0101, + "epoch": 0.9, + "learning_rate": 0.0001649894629336333, + "loss": 0.0143, "step": 347230 }, { - "epoch": 1.75, - "learning_rate": 3.721942778150556e-05, - "loss": 0.0075, + "epoch": 0.9, + "learning_rate": 0.00016498557471726185, + "loss": 0.0126, "step": 347240 }, { - "epoch": 1.75, - "learning_rate": 3.721186008849156e-05, - "loss": 0.0086, + "epoch": 0.9, + "learning_rate": 0.00016498168650089037, + "loss": 0.0132, "step": 347250 }, { - "epoch": 1.75, - "learning_rate": 3.7204292395477545e-05, - "loss": 0.0041, + "epoch": 0.9, + "learning_rate": 0.00016497779828451894, + "loss": 0.0135, "step": 347260 }, { - "epoch": 1.75, - "learning_rate": 3.7196724702463534e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016497391006814748, + "loss": 0.0116, "step": 347270 }, { - "epoch": 1.75, - "learning_rate": 3.718915700944952e-05, - "loss": 0.0081, + "epoch": 0.9, + "learning_rate": 0.000164970021851776, + "loss": 0.0151, "step": 347280 }, { - "epoch": 1.75, - "learning_rate": 3.718158931643552e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.0001649661336354045, + "loss": 0.0146, "step": 347290 }, { - "epoch": 1.75, - "learning_rate": 3.71740216234215e-05, - "loss": 0.0076, + "epoch": 0.9, + "learning_rate": 0.00016496224541903307, + "loss": 0.0148, "step": 347300 }, { - "epoch": 1.75, - "learning_rate": 3.716645393040749e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.00016495835720266162, + "loss": 0.0118, "step": 347310 }, { - "epoch": 1.75, - "learning_rate": 3.715888623739348e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016495446898629013, + "loss": 0.0141, "step": 347320 }, { - "epoch": 1.75, - "learning_rate": 3.715131854437947e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016495058076991867, + "loss": 0.013, "step": 347330 }, { - "epoch": 1.75, - "learning_rate": 3.714375085136546e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016494669255354721, + "loss": 0.0125, "step": 347340 }, { - "epoch": 1.75, - "learning_rate": 3.713618315835145e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.00016494280433717576, + "loss": 0.0125, "step": 347350 }, { - "epoch": 1.75, - "learning_rate": 3.712861546533744e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016493891612080427, + "loss": 0.0131, "step": 347360 }, { - "epoch": 1.75, - "learning_rate": 3.712104777232343e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001649350279044328, + "loss": 0.013, "step": 347370 }, { - "epoch": 1.75, - "learning_rate": 3.711348007930942e-05, - "loss": 0.012, + "epoch": 0.9, + "learning_rate": 0.00016493113968806133, + "loss": 0.0102, "step": 347380 }, { - "epoch": 1.75, - "learning_rate": 3.710591238629541e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.0001649272514716899, + "loss": 0.013, "step": 347390 }, { - "epoch": 1.75, - "learning_rate": 3.70983446932814e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001649233632553184, + "loss": 0.0156, "step": 347400 }, { - "epoch": 1.75, - "learning_rate": 3.709077700026739e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016491947503894695, + "loss": 0.0186, "step": 347410 }, { - "epoch": 1.75, - "learning_rate": 3.708320930725338e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016491558682257547, + "loss": 0.0128, "step": 347420 }, { - "epoch": 1.75, - "learning_rate": 3.707564161423937e-05, - "loss": 0.0039, + "epoch": 0.9, + "learning_rate": 0.00016491169860620403, + "loss": 0.0155, "step": 347430 }, { - "epoch": 1.75, - "learning_rate": 3.706807392122536e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016490781038983255, + "loss": 0.0093, "step": 347440 }, { - "epoch": 1.75, - "learning_rate": 3.706050622821135e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.0001649039221734611, + "loss": 0.0131, "step": 347450 }, { - "epoch": 1.75, - "learning_rate": 3.705293853519734e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.0001649000339570896, + "loss": 0.0137, "step": 347460 }, { - "epoch": 1.75, - "learning_rate": 3.7045370842183325e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016489614574071817, + "loss": 0.0133, "step": 347470 }, { - "epoch": 1.75, - "learning_rate": 3.7037803149169313e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016489225752434672, + "loss": 0.0124, "step": 347480 }, { - "epoch": 1.75, - "learning_rate": 3.70302354561553e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016488836930797523, + "loss": 0.0121, "step": 347490 }, { - "epoch": 1.75, - "learning_rate": 3.70226677631413e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016488448109160377, + "loss": 0.0096, "step": 347500 }, { - "epoch": 1.75, - "learning_rate": 3.7015100070127285e-05, - "loss": 0.0087, + "epoch": 0.9, + "learning_rate": 0.00016488059287523231, + "loss": 0.0109, "step": 347510 }, { - "epoch": 1.75, - "learning_rate": 3.700753237711327e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016487670465886086, + "loss": 0.0146, "step": 347520 }, { - "epoch": 1.75, - "learning_rate": 3.699996468409927e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016487281644248937, + "loss": 0.0161, "step": 347530 }, { - "epoch": 1.75, - "learning_rate": 3.6992396991085256e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.0001648689282261179, + "loss": 0.0157, "step": 347540 }, { - "epoch": 1.75, - "learning_rate": 3.6984829298071244e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016486504000974645, + "loss": 0.0142, "step": 347550 }, { - "epoch": 1.75, - "learning_rate": 3.697726160505723e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.000164861151793375, + "loss": 0.0145, "step": 347560 }, { - "epoch": 1.75, - "learning_rate": 3.696969391204323e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001648572635770035, + "loss": 0.0129, "step": 347570 }, { - "epoch": 1.75, - "learning_rate": 3.6962126219029216e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016485337536063205, + "loss": 0.0098, "step": 347580 }, { - "epoch": 1.75, - "learning_rate": 3.6954558526015204e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001648494871442606, + "loss": 0.0123, "step": 347590 }, { - "epoch": 1.75, - "learning_rate": 3.694699083300119e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016484559892788913, + "loss": 0.0122, "step": 347600 }, { - "epoch": 1.75, - "learning_rate": 3.693942313998718e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016484171071151765, + "loss": 0.0137, "step": 347610 }, { - "epoch": 1.75, - "learning_rate": 3.693185544697317e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001648378224951462, + "loss": 0.0152, "step": 347620 }, { - "epoch": 1.75, - "learning_rate": 3.692428775395916e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001648339342787747, + "loss": 0.0113, "step": 347630 }, { - "epoch": 1.75, - "learning_rate": 3.691672006094515e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016483004606240327, + "loss": 0.013, "step": 347640 }, { - "epoch": 1.75, - "learning_rate": 3.690915236793114e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016482615784603182, + "loss": 0.0173, "step": 347650 }, { - "epoch": 1.75, - "learning_rate": 3.690158467491713e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016482226962966033, + "loss": 0.0154, "step": 347660 }, { - "epoch": 1.75, - "learning_rate": 3.689401698190312e-05, - "loss": 0.0087, + "epoch": 0.9, + "learning_rate": 0.00016481838141328887, + "loss": 0.0139, "step": 347670 }, { - "epoch": 1.75, - "learning_rate": 3.688644928888911e-05, - "loss": 0.0101, + "epoch": 0.9, + "learning_rate": 0.0001648144931969174, + "loss": 0.0116, "step": 347680 }, { - "epoch": 1.75, - "learning_rate": 3.68788815958751e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016481060498054595, + "loss": 0.0119, "step": 347690 }, { - "epoch": 1.75, - "learning_rate": 3.687131390286109e-05, - "loss": 0.0083, + "epoch": 0.9, + "learning_rate": 0.00016480671676417447, + "loss": 0.0114, "step": 347700 }, { - "epoch": 1.75, - "learning_rate": 3.6863746209847076e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.000164802828547803, + "loss": 0.0106, "step": 347710 }, { - "epoch": 1.75, - "learning_rate": 3.685617851683307e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016479894033143155, + "loss": 0.0145, "step": 347720 }, { - "epoch": 1.75, - "learning_rate": 3.684861082381906e-05, - "loss": 0.0087, + "epoch": 0.9, + "learning_rate": 0.0001647950521150601, + "loss": 0.0117, "step": 347730 }, { - "epoch": 1.75, - "learning_rate": 3.684104313080505e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.0001647911638986886, + "loss": 0.0116, "step": 347740 }, { - "epoch": 1.75, - "learning_rate": 3.6833475437791036e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016478727568231715, + "loss": 0.0158, "step": 347750 }, { - "epoch": 1.75, - "learning_rate": 3.682590774477703e-05, - "loss": 0.0091, + "epoch": 0.9, + "learning_rate": 0.0001647833874659457, + "loss": 0.0101, "step": 347760 }, { - "epoch": 1.75, - "learning_rate": 3.681834005176301e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016477949924957423, + "loss": 0.0162, "step": 347770 }, { - "epoch": 1.75, - "learning_rate": 3.681077235874901e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016477561103320275, + "loss": 0.0146, "step": 347780 }, { - "epoch": 1.75, - "learning_rate": 3.6803204665734996e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001647717228168313, + "loss": 0.0114, "step": 347790 }, { - "epoch": 1.75, - "learning_rate": 3.6795636972720984e-05, - "loss": 0.0047, + "epoch": 0.9, + "learning_rate": 0.00016476783460045986, + "loss": 0.0159, "step": 347800 }, { - "epoch": 1.75, - "learning_rate": 3.678806927970697e-05, - "loss": 0.0043, + "epoch": 0.9, + "learning_rate": 0.00016476394638408837, + "loss": 0.0127, "step": 347810 }, { - "epoch": 1.75, - "learning_rate": 3.678050158669297e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016476005816771691, + "loss": 0.0135, "step": 347820 }, { - "epoch": 1.75, - "learning_rate": 3.6772933893678955e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016475616995134543, + "loss": 0.0143, "step": 347830 }, { - "epoch": 1.75, - "learning_rate": 3.6765366200664943e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.000164752281734974, + "loss": 0.0113, "step": 347840 }, { - "epoch": 1.75, - "learning_rate": 3.675779850765093e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.0001647483935186025, + "loss": 0.0147, "step": 347850 }, { - "epoch": 1.75, - "learning_rate": 3.675023081463693e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016474450530223105, + "loss": 0.0156, "step": 347860 }, { - "epoch": 1.76, - "learning_rate": 3.6742663121622915e-05, - "loss": 0.0044, + "epoch": 0.9, + "learning_rate": 0.00016474061708585957, + "loss": 0.014, "step": 347870 }, { - "epoch": 1.76, - "learning_rate": 3.67350954286089e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001647367288694881, + "loss": 0.0128, "step": 347880 }, { - "epoch": 1.76, - "learning_rate": 3.672752773559489e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016473284065311665, + "loss": 0.0129, "step": 347890 }, { - "epoch": 1.76, - "learning_rate": 3.6719960042580886e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.0001647289524367452, + "loss": 0.0142, "step": 347900 }, { - "epoch": 1.76, - "learning_rate": 3.6712392349566875e-05, - "loss": 0.007, + "epoch": 0.9, + "learning_rate": 0.0001647250642203737, + "loss": 0.0138, "step": 347910 }, { - "epoch": 1.76, - "learning_rate": 3.670482465655286e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016472117600400225, + "loss": 0.0132, "step": 347920 }, { - "epoch": 1.76, - "learning_rate": 3.669725696353885e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.0001647172877876308, + "loss": 0.0129, "step": 347930 }, { - "epoch": 1.76, - "learning_rate": 3.668968927052484e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.00016471339957125933, + "loss": 0.0103, "step": 347940 }, { - "epoch": 1.76, - "learning_rate": 3.668212157751083e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.00016470951135488785, + "loss": 0.0137, "step": 347950 }, { - "epoch": 1.76, - "learning_rate": 3.667455388449682e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.0001647056231385164, + "loss": 0.012, "step": 347960 }, { - "epoch": 1.76, - "learning_rate": 3.666698619148281e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016470173492214496, + "loss": 0.0122, "step": 347970 }, { - "epoch": 1.76, - "learning_rate": 3.66594184984688e-05, - "loss": 0.0037, + "epoch": 0.9, + "learning_rate": 0.00016469784670577347, + "loss": 0.0124, "step": 347980 }, { - "epoch": 1.76, - "learning_rate": 3.665185080545479e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.000164693958489402, + "loss": 0.0188, "step": 347990 }, { - "epoch": 1.76, - "learning_rate": 3.664428311244078e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.00016469007027303053, + "loss": 0.0143, "step": 348000 }, { - "epoch": 1.76, - "eval_cer": 0.9144324104542716, - "eval_loss": 0.004651382099837065, - "eval_runtime": 116.6456, - "eval_samples_per_second": 17.146, - "eval_steps_per_second": 4.286, + "epoch": 0.9, + "eval_cer": 0.8817348779726539, + "eval_loss": 0.008867635391652584, + "eval_runtime": 107.6298, + "eval_samples_per_second": 18.582, + "eval_steps_per_second": 4.646, "step": 348000 }, { - "epoch": 1.76, - "learning_rate": 3.663671541942677e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.0001646861820566591, + "loss": 0.0167, "step": 348010 }, { - "epoch": 1.76, - "learning_rate": 3.662914772641276e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.0001646822938402876, + "loss": 0.0128, "step": 348020 }, { - "epoch": 1.76, - "learning_rate": 3.662158003339875e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016467840562391615, + "loss": 0.0151, "step": 348030 }, { - "epoch": 1.76, - "learning_rate": 3.661401234038474e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016467451740754467, + "loss": 0.0115, "step": 348040 }, { - "epoch": 1.76, - "learning_rate": 3.660644464737073e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016467062919117324, + "loss": 0.0119, "step": 348050 }, { - "epoch": 1.76, - "learning_rate": 3.659887695435672e-05, - "loss": 0.0084, + "epoch": 0.9, + "learning_rate": 0.00016466674097480175, + "loss": 0.0138, "step": 348060 }, { - "epoch": 1.76, - "learning_rate": 3.6591309261342706e-05, - "loss": 0.0073, + "epoch": 0.9, + "learning_rate": 0.0001646628527584303, + "loss": 0.0143, "step": 348070 }, { - "epoch": 1.76, - "learning_rate": 3.6583741568328695e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.0001646589645420588, + "loss": 0.0135, "step": 348080 }, { - "epoch": 1.76, - "learning_rate": 3.657617387531468e-05, - "loss": 0.0076, + "epoch": 0.9, + "learning_rate": 0.00016465507632568738, + "loss": 0.011, "step": 348090 }, { - "epoch": 1.76, - "learning_rate": 3.656860618230068e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.0001646511881093159, + "loss": 0.0147, "step": 348100 }, { - "epoch": 1.76, - "learning_rate": 3.6561038489286666e-05, - "loss": 0.0061, + "epoch": 0.9, + "learning_rate": 0.00016464729989294443, + "loss": 0.0108, "step": 348110 }, { - "epoch": 1.76, - "learning_rate": 3.6553470796272654e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016464341167657295, + "loss": 0.0142, "step": 348120 }, { - "epoch": 1.76, - "learning_rate": 3.654590310325864e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.0001646395234602015, + "loss": 0.0134, "step": 348130 }, { - "epoch": 1.76, - "learning_rate": 3.653833541024464e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016463563524383006, + "loss": 0.0122, "step": 348140 }, { - "epoch": 1.76, - "learning_rate": 3.6530767717230626e-05, - "loss": 0.0071, + "epoch": 0.9, + "learning_rate": 0.00016463174702745857, + "loss": 0.0142, "step": 348150 }, { - "epoch": 1.76, - "learning_rate": 3.6523200024216614e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016462785881108709, + "loss": 0.0129, "step": 348160 }, { - "epoch": 1.76, - "learning_rate": 3.65156323312026e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.00016462397059471563, + "loss": 0.012, "step": 348170 }, { - "epoch": 1.76, - "learning_rate": 3.65080646381886e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.0001646200823783442, + "loss": 0.0122, "step": 348180 }, { - "epoch": 1.76, - "learning_rate": 3.6500496945174585e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.0001646161941619727, + "loss": 0.0145, "step": 348190 }, { - "epoch": 1.76, - "learning_rate": 3.6492929252160574e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016461230594560125, + "loss": 0.0142, "step": 348200 }, { - "epoch": 1.76, - "learning_rate": 3.648536155914656e-05, - "loss": 0.0047, + "epoch": 0.9, + "learning_rate": 0.00016460841772922977, + "loss": 0.0154, "step": 348210 }, { - "epoch": 1.76, - "learning_rate": 3.647779386613256e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016460452951285834, + "loss": 0.0123, "step": 348220 }, { - "epoch": 1.76, - "learning_rate": 3.6470226173118545e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.00016460064129648685, + "loss": 0.0141, "step": 348230 }, { - "epoch": 1.76, - "learning_rate": 3.646265848010453e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.0001645967530801154, + "loss": 0.0105, "step": 348240 }, { - "epoch": 1.76, - "learning_rate": 3.645509078709052e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.0001645928648637439, + "loss": 0.0125, "step": 348250 }, { - "epoch": 1.76, - "learning_rate": 3.644752309407651e-05, - "loss": 0.0088, + "epoch": 0.9, + "learning_rate": 0.00016458897664737248, + "loss": 0.0108, "step": 348260 }, { - "epoch": 1.76, - "learning_rate": 3.64399554010625e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.000164585088431001, + "loss": 0.0129, "step": 348270 }, { - "epoch": 1.76, - "learning_rate": 3.643238770804849e-05, - "loss": 0.0068, + "epoch": 0.9, + "learning_rate": 0.00016458120021462953, + "loss": 0.0101, "step": 348280 }, { - "epoch": 1.76, - "learning_rate": 3.642482001503448e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016457731199825805, + "loss": 0.0114, "step": 348290 }, { - "epoch": 1.76, - "learning_rate": 3.641725232202047e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016457342378188662, + "loss": 0.0116, "step": 348300 }, { - "epoch": 1.76, - "learning_rate": 3.640968462900646e-05, - "loss": 0.0052, + "epoch": 0.9, + "learning_rate": 0.00016456953556551513, + "loss": 0.012, "step": 348310 }, { - "epoch": 1.76, - "learning_rate": 3.640211693599245e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016456564734914367, + "loss": 0.0145, "step": 348320 }, { - "epoch": 1.76, - "learning_rate": 3.639454924297844e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016456175913277219, + "loss": 0.0148, "step": 348330 }, { - "epoch": 1.76, - "learning_rate": 3.638698154996443e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.00016455787091640075, + "loss": 0.0147, "step": 348340 }, { - "epoch": 1.76, - "learning_rate": 3.637941385695042e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.0001645539827000293, + "loss": 0.0128, "step": 348350 }, { - "epoch": 1.76, - "learning_rate": 3.637184616393641e-05, - "loss": 0.0066, + "epoch": 0.9, + "learning_rate": 0.0001645500944836578, + "loss": 0.0114, "step": 348360 }, { - "epoch": 1.76, - "learning_rate": 3.63642784709224e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016454620626728635, + "loss": 0.0243, "step": 348370 }, { - "epoch": 1.76, - "learning_rate": 3.635671077790839e-05, - "loss": 0.0044, - "step": 348380 + "epoch": 0.9, + "learning_rate": 0.00016454231805091487, + "loss": 0.0173, + "step": 348380 }, { - "epoch": 1.76, - "learning_rate": 3.634914308489438e-05, - "loss": 0.0041, + "epoch": 0.9, + "learning_rate": 0.00016453842983454344, + "loss": 0.0131, "step": 348390 }, { - "epoch": 1.76, - "learning_rate": 3.6341575391880365e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016453454161817195, + "loss": 0.0115, "step": 348400 }, { - "epoch": 1.76, - "learning_rate": 3.633400769886635e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.0001645306534018005, + "loss": 0.0152, "step": 348410 }, { - "epoch": 1.76, - "learning_rate": 3.632644000585234e-05, - "loss": 0.0091, + "epoch": 0.9, + "learning_rate": 0.000164526765185429, + "loss": 0.0168, "step": 348420 }, { - "epoch": 1.76, - "learning_rate": 3.6318872312838336e-05, - "loss": 0.0045, + "epoch": 0.9, + "learning_rate": 0.00016452287696905758, + "loss": 0.0132, "step": 348430 }, { - "epoch": 1.76, - "learning_rate": 3.6311304619824325e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001645189887526861, + "loss": 0.0112, "step": 348440 }, { - "epoch": 1.76, - "learning_rate": 3.630373692681031e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016451510053631463, + "loss": 0.015, "step": 348450 }, { - "epoch": 1.76, - "learning_rate": 3.62961692337963e-05, - "loss": 0.0113, + "epoch": 0.9, + "learning_rate": 0.00016451121231994315, + "loss": 0.0117, "step": 348460 }, { - "epoch": 1.76, - "learning_rate": 3.6288601540782296e-05, - "loss": 0.008, + "epoch": 0.9, + "learning_rate": 0.00016450732410357171, + "loss": 0.0195, "step": 348470 }, { - "epoch": 1.76, - "learning_rate": 3.6281033847768284e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016450343588720023, + "loss": 0.0145, "step": 348480 }, { - "epoch": 1.76, - "learning_rate": 3.627346615475427e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016449954767082877, + "loss": 0.0144, "step": 348490 }, { - "epoch": 1.76, - "learning_rate": 3.626589846174027e-05, - "loss": 0.0041, + "epoch": 0.9, + "learning_rate": 0.00016449565945445729, + "loss": 0.0135, "step": 348500 }, { - "epoch": 1.76, - "learning_rate": 3.6258330768726256e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016449177123808585, + "loss": 0.0146, "step": 348510 }, { - "epoch": 1.76, - "learning_rate": 3.6250763075712244e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.0001644878830217144, + "loss": 0.0157, "step": 348520 }, { - "epoch": 1.76, - "learning_rate": 3.624319538269823e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001644839948053429, + "loss": 0.0113, "step": 348530 }, { - "epoch": 1.76, - "learning_rate": 3.623562768968423e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016448010658897145, + "loss": 0.0135, "step": 348540 }, { - "epoch": 1.76, - "learning_rate": 3.6228059996670215e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001644762183726, + "loss": 0.0125, "step": 348550 }, { - "epoch": 1.76, - "learning_rate": 3.62204923036562e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016447233015622854, + "loss": 0.0158, "step": 348560 }, { - "epoch": 1.76, - "learning_rate": 3.621292461064219e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016446844193985705, + "loss": 0.0123, "step": 348570 }, { - "epoch": 1.76, - "learning_rate": 3.620535691762818e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.0001644645537234856, + "loss": 0.0139, "step": 348580 }, { - "epoch": 1.76, - "learning_rate": 3.619778922461417e-05, - "loss": 0.0042, + "epoch": 0.9, + "learning_rate": 0.0001644606655071141, + "loss": 0.0158, "step": 348590 }, { - "epoch": 1.76, - "learning_rate": 3.6190221531600157e-05, - "loss": 0.0101, + "epoch": 0.9, + "learning_rate": 0.00016445677729074267, + "loss": 0.0097, "step": 348600 }, { - "epoch": 1.76, - "learning_rate": 3.618265383858615e-05, - "loss": 0.0049, + "epoch": 0.9, + "learning_rate": 0.0001644528890743712, + "loss": 0.0121, "step": 348610 }, { - "epoch": 1.76, - "learning_rate": 3.617508614557214e-05, - "loss": 0.0036, + "epoch": 0.9, + "learning_rate": 0.00016444900085799973, + "loss": 0.0161, "step": 348620 }, { - "epoch": 1.76, - "learning_rate": 3.616751845255813e-05, - "loss": 0.0084, + "epoch": 0.9, + "learning_rate": 0.00016444511264162825, + "loss": 0.012, "step": 348630 }, { - "epoch": 1.76, - "learning_rate": 3.6159950759544116e-05, - "loss": 0.0058, + "epoch": 0.9, + "learning_rate": 0.00016444122442525681, + "loss": 0.0139, "step": 348640 }, { - "epoch": 1.76, - "learning_rate": 3.615238306653011e-05, - "loss": 0.0055, + "epoch": 0.9, + "learning_rate": 0.00016443733620888533, + "loss": 0.0119, "step": 348650 }, { - "epoch": 1.76, - "learning_rate": 3.61448153735161e-05, - "loss": 0.0067, + "epoch": 0.9, + "learning_rate": 0.00016443344799251387, + "loss": 0.0154, "step": 348660 }, { - "epoch": 1.76, - "learning_rate": 3.613724768050209e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016442955977614238, + "loss": 0.0119, "step": 348670 }, { - "epoch": 1.76, - "learning_rate": 3.6129679987488076e-05, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.00016442567155977095, + "loss": 0.0135, "step": 348680 }, { - "epoch": 1.76, - "learning_rate": 3.612211229447407e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.0001644217833433995, + "loss": 0.0134, "step": 348690 }, { - "epoch": 1.76, - "learning_rate": 3.611454460146006e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.000164417895127028, + "loss": 0.0123, "step": 348700 }, { - "epoch": 1.76, - "learning_rate": 3.610697690844605e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016441400691065652, + "loss": 0.0174, "step": 348710 }, { - "epoch": 1.76, - "learning_rate": 3.6099409215432035e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001644101186942851, + "loss": 0.0152, "step": 348720 }, { - "epoch": 1.76, - "learning_rate": 3.6091841522418024e-05, - "loss": 0.0083, + "epoch": 0.9, + "learning_rate": 0.00016440623047791363, + "loss": 0.0117, "step": 348730 }, { - "epoch": 1.76, - "learning_rate": 3.608427382940401e-05, - "loss": 0.0051, + "epoch": 0.9, + "learning_rate": 0.00016440234226154215, + "loss": 0.0113, "step": 348740 }, { - "epoch": 1.76, - "learning_rate": 3.607670613639001e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.0001643984540451707, + "loss": 0.0118, "step": 348750 }, { - "epoch": 1.76, - "learning_rate": 3.6069138443375995e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.00016439456582879923, + "loss": 0.0146, "step": 348760 }, { - "epoch": 1.76, - "learning_rate": 3.606157075036198e-05, - "loss": 0.0064, + "epoch": 0.9, + "learning_rate": 0.00016439067761242777, + "loss": 0.0108, "step": 348770 }, { - "epoch": 1.76, - "learning_rate": 3.605400305734797e-05, - "loss": 0.0091, + "epoch": 0.9, + "learning_rate": 0.0001643867893960563, + "loss": 0.0125, "step": 348780 }, { - "epoch": 1.76, - "learning_rate": 3.6046435364333967e-05, - "loss": 0.0059, + "epoch": 0.9, + "learning_rate": 0.00016438290117968483, + "loss": 0.0132, "step": 348790 }, { - "epoch": 1.76, - "learning_rate": 3.6038867671319955e-05, - "loss": 0.0053, + "epoch": 0.9, + "learning_rate": 0.00016437901296331337, + "loss": 0.011, "step": 348800 }, { - "epoch": 1.76, - "learning_rate": 3.603129997830594e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001643751247469419, + "loss": 0.0157, "step": 348810 }, { - "epoch": 1.76, - "learning_rate": 3.602373228529193e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016437123653057043, + "loss": 0.0137, "step": 348820 }, { - "epoch": 1.76, - "learning_rate": 3.6016164592277926e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.00016436734831419897, + "loss": 0.016, "step": 348830 }, { - "epoch": 1.76, - "learning_rate": 3.6008596899263914e-05, - "loss": 0.005, + "epoch": 0.9, + "learning_rate": 0.00016436346009782748, + "loss": 0.0116, "step": 348840 }, { - "epoch": 1.76, - "learning_rate": 3.60010292062499e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016435957188145605, + "loss": 0.0136, "step": 348850 }, { - "epoch": 1.76, - "learning_rate": 3.599346151323589e-05, - "loss": 0.0082, + "epoch": 0.9, + "learning_rate": 0.0001643556836650846, + "loss": 0.0117, "step": 348860 }, { - "epoch": 1.76, - "learning_rate": 3.598589382022188e-05, - "loss": 0.0085, + "epoch": 0.9, + "learning_rate": 0.0001643517954487131, + "loss": 0.0156, "step": 348870 }, { - "epoch": 1.76, - "learning_rate": 3.597832612720787e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016434790723234162, + "loss": 0.0107, "step": 348880 }, { - "epoch": 1.76, - "learning_rate": 3.597075843419386e-05, - "loss": 0.0048, + "epoch": 0.9, + "learning_rate": 0.0001643440190159702, + "loss": 0.0119, "step": 348890 }, { - "epoch": 1.76, - "learning_rate": 3.596319074117985e-05, - "loss": 0.0046, + "epoch": 0.9, + "learning_rate": 0.00016434013079959873, + "loss": 0.0107, "step": 348900 }, { - "epoch": 1.76, - "learning_rate": 3.595562304816584e-05, - "loss": 0.0062, + "epoch": 0.9, + "learning_rate": 0.00016433624258322725, + "loss": 0.011, "step": 348910 }, { - "epoch": 1.76, - "learning_rate": 3.594805535515183e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.0001643323543668558, + "loss": 0.0144, "step": 348920 }, { - "epoch": 1.76, - "learning_rate": 3.594048766213782e-05, - "loss": 0.0078, + "epoch": 0.9, + "learning_rate": 0.00016432846615048433, + "loss": 0.0112, "step": 348930 }, { - "epoch": 1.76, - "learning_rate": 3.593291996912381e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.00016432457793411287, + "loss": 0.0128, "step": 348940 }, { - "epoch": 1.76, - "learning_rate": 3.59253522761098e-05, - "loss": 0.0057, + "epoch": 0.9, + "learning_rate": 0.0001643206897177414, + "loss": 0.0113, "step": 348950 }, { - "epoch": 1.76, - "learning_rate": 3.591778458309579e-05, - "loss": 0.0079, + "epoch": 0.9, + "learning_rate": 0.00016431680150136993, + "loss": 0.0149, "step": 348960 }, { - "epoch": 1.76, - "learning_rate": 3.591021689008178e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016431291328499847, + "loss": 0.0147, "step": 348970 }, { - "epoch": 1.76, - "learning_rate": 3.590264919706777e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.000164309025068627, + "loss": 0.0102, "step": 348980 }, { - "epoch": 1.76, - "learning_rate": 3.589508150405376e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016430513685225553, + "loss": 0.0127, "step": 348990 }, { - "epoch": 1.76, - "learning_rate": 3.5887513811039746e-05, - "loss": 0.0054, + "epoch": 0.9, + "learning_rate": 0.00016430124863588407, + "loss": 0.0116, "step": 349000 }, { - "epoch": 1.76, - "eval_cer": 0.9144188249085159, - "eval_loss": 0.004665224812924862, - "eval_runtime": 116.662, - "eval_samples_per_second": 17.144, - "eval_steps_per_second": 4.286, + "epoch": 0.9, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.008726708590984344, + "eval_runtime": 107.6491, + "eval_samples_per_second": 18.579, + "eval_steps_per_second": 4.645, "step": 349000 }, { - "epoch": 1.76, - "learning_rate": 3.587994611802574e-05, - "loss": 0.0094, + "epoch": 0.9, + "learning_rate": 0.00016429736041951264, + "loss": 0.0118, "step": 349010 }, { - "epoch": 1.76, - "learning_rate": 3.587237842501173e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016429347220314115, + "loss": 0.0138, "step": 349020 }, { - "epoch": 1.76, - "learning_rate": 3.586481073199772e-05, - "loss": 0.006, + "epoch": 0.9, + "learning_rate": 0.00016428958398676967, + "loss": 0.0177, "step": 349030 }, { - "epoch": 1.76, - "learning_rate": 3.5857243038983706e-05, - "loss": 0.0056, + "epoch": 0.9, + "learning_rate": 0.0001642856957703982, + "loss": 0.0132, "step": 349040 }, { - "epoch": 1.76, - "learning_rate": 3.5849675345969694e-05, - "loss": 0.0042, + "epoch": 0.9, + "learning_rate": 0.00016428180755402678, + "loss": 0.0132, "step": 349050 }, { - "epoch": 1.76, - "learning_rate": 3.584210765295568e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.0001642779193376553, + "loss": 0.0135, "step": 349060 }, { - "epoch": 1.76, - "learning_rate": 3.583453995994168e-05, - "loss": 0.0063, + "epoch": 0.9, + "learning_rate": 0.00016427403112128383, + "loss": 0.0124, "step": 349070 }, { - "epoch": 1.76, - "learning_rate": 3.5826972266927666e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.00016427014290491235, + "loss": 0.0185, "step": 349080 }, { - "epoch": 1.76, - "learning_rate": 3.5819404573913654e-05, - "loss": 0.0065, + "epoch": 0.9, + "learning_rate": 0.0001642662546885409, + "loss": 0.01, "step": 349090 }, { - "epoch": 1.76, - "learning_rate": 3.581183688089964e-05, - "loss": 0.0072, + "epoch": 0.9, + "learning_rate": 0.00016426236647216943, + "loss": 0.0203, "step": 349100 }, { - "epoch": 1.76, - "learning_rate": 3.580426918788564e-05, - "loss": 0.0069, + "epoch": 0.9, + "learning_rate": 0.00016425847825579797, + "loss": 0.0124, "step": 349110 }, { - "epoch": 1.76, - "learning_rate": 3.5796701494871625e-05, - "loss": 0.0074, + "epoch": 0.9, + "learning_rate": 0.0001642545900394265, + "loss": 0.011, "step": 349120 }, { - "epoch": 1.76, - "learning_rate": 3.5789133801857613e-05, - "loss": 0.011, + "epoch": 0.9, + "learning_rate": 0.00016425070182305503, + "loss": 0.0103, "step": 349130 }, { - "epoch": 1.76, - "learning_rate": 3.57815661088436e-05, - "loss": 0.0094, + "epoch": 0.91, + "learning_rate": 0.00016424681360668357, + "loss": 0.0121, "step": 349140 }, { - "epoch": 1.76, - "learning_rate": 3.57739984158296e-05, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.0001642429253903121, + "loss": 0.0131, "step": 349150 }, { - "epoch": 1.76, - "learning_rate": 3.5766430722815585e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016423903717394063, + "loss": 0.0139, "step": 349160 }, { - "epoch": 1.76, - "learning_rate": 3.575886302980157e-05, - "loss": 0.0089, + "epoch": 0.91, + "learning_rate": 0.00016423514895756917, + "loss": 0.0152, "step": 349170 }, { - "epoch": 1.76, - "learning_rate": 3.575129533678756e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.0001642312607411977, + "loss": 0.0168, "step": 349180 }, { - "epoch": 1.76, - "learning_rate": 3.574372764377355e-05, - "loss": 0.0079, + "epoch": 0.91, + "learning_rate": 0.00016422737252482625, + "loss": 0.014, "step": 349190 }, { - "epoch": 1.76, - "learning_rate": 3.573615995075954e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016422348430845477, + "loss": 0.0147, "step": 349200 }, { - "epoch": 1.76, - "learning_rate": 3.572859225774553e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001642195960920833, + "loss": 0.0113, "step": 349210 }, { - "epoch": 1.76, - "learning_rate": 3.572102456473152e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016421570787571188, + "loss": 0.0148, "step": 349220 }, { - "epoch": 1.76, - "learning_rate": 3.571345687171751e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.0001642118196593404, + "loss": 0.0131, "step": 349230 }, { - "epoch": 1.76, - "learning_rate": 3.57058891787035e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016420793144296893, + "loss": 0.014, "step": 349240 }, { - "epoch": 1.76, - "learning_rate": 3.569832148568949e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016420404322659745, + "loss": 0.0117, "step": 349250 }, { - "epoch": 1.76, - "learning_rate": 3.569075379267548e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016420015501022602, + "loss": 0.0406, "step": 349260 }, { - "epoch": 1.76, - "learning_rate": 3.568318609966147e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016419626679385453, + "loss": 0.0141, "step": 349270 }, { - "epoch": 1.76, - "learning_rate": 3.567561840664746e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016419237857748307, + "loss": 0.0128, "step": 349280 }, { - "epoch": 1.76, - "learning_rate": 3.566805071363345e-05, - "loss": 0.0164, + "epoch": 0.91, + "learning_rate": 0.0001641884903611116, + "loss": 0.0136, "step": 349290 }, { - "epoch": 1.76, - "learning_rate": 3.566048302061944e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016418460214474016, + "loss": 0.0176, "step": 349300 }, { - "epoch": 1.76, - "learning_rate": 3.565291532760543e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016418071392836867, + "loss": 0.0188, "step": 349310 }, { - "epoch": 1.76, - "learning_rate": 3.564534763459142e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.0001641768257119972, + "loss": 0.0127, "step": 349320 }, { - "epoch": 1.76, - "learning_rate": 3.563777994157741e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016417293749562573, + "loss": 0.011, "step": 349330 }, { - "epoch": 1.76, - "learning_rate": 3.563021224856339e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016416904927925427, + "loss": 0.0132, "step": 349340 }, { - "epoch": 1.76, - "learning_rate": 3.562264455554938e-05, - "loss": 0.0037, + "epoch": 0.91, + "learning_rate": 0.0001641651610628828, + "loss": 0.0142, "step": 349350 }, { - "epoch": 1.76, - "learning_rate": 3.5615076862535376e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016416127284651135, + "loss": 0.0126, "step": 349360 }, { - "epoch": 1.76, - "learning_rate": 3.5607509169521365e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016415738463013987, + "loss": 0.0136, "step": 349370 }, { - "epoch": 1.76, - "learning_rate": 3.559994147650735e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.0001641534964137684, + "loss": 0.0141, "step": 349380 }, { - "epoch": 1.76, - "learning_rate": 3.559237378349334e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016414960819739698, + "loss": 0.0141, "step": 349390 }, { - "epoch": 1.76, - "learning_rate": 3.5584806090479336e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001641457199810255, + "loss": 0.0135, "step": 349400 }, { - "epoch": 1.76, - "learning_rate": 3.5577238397465324e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016414183176465403, + "loss": 0.0153, "step": 349410 }, { - "epoch": 1.76, - "learning_rate": 3.556967070445131e-05, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016413794354828255, + "loss": 0.0134, "step": 349420 }, { - "epoch": 1.76, - "learning_rate": 3.55621030114373e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016413405533191112, + "loss": 0.0113, "step": 349430 }, { - "epoch": 1.76, - "learning_rate": 3.5554535318423296e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016413016711553963, + "loss": 0.0134, "step": 349440 }, { - "epoch": 1.76, - "learning_rate": 3.5546967625409284e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016412627889916817, + "loss": 0.0139, "step": 349450 }, { - "epoch": 1.76, - "learning_rate": 3.553939993239527e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016412239068279669, + "loss": 0.0123, "step": 349460 }, { - "epoch": 1.76, - "learning_rate": 3.553183223938127e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016411850246642525, + "loss": 0.0134, "step": 349470 }, { - "epoch": 1.76, - "learning_rate": 3.5524264546367255e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016411461425005377, + "loss": 0.0162, "step": 349480 }, { - "epoch": 1.76, - "learning_rate": 3.5516696853353244e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.0001641107260336823, + "loss": 0.0122, "step": 349490 }, { - "epoch": 1.76, - "learning_rate": 3.550912916033923e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016410683781731083, + "loss": 0.0105, "step": 349500 }, { - "epoch": 1.76, - "learning_rate": 3.550156146732522e-05, - "loss": 0.0088, + "epoch": 0.91, + "learning_rate": 0.0001641029496009394, + "loss": 0.0136, "step": 349510 }, { - "epoch": 1.76, - "learning_rate": 3.549399377431121e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001640990613845679, + "loss": 0.0118, "step": 349520 }, { - "epoch": 1.76, - "learning_rate": 3.5486426081297196e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016409517316819645, + "loss": 0.0144, "step": 349530 }, { - "epoch": 1.76, - "learning_rate": 3.547885838828319e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016409128495182496, + "loss": 0.0138, "step": 349540 }, { - "epoch": 1.76, - "learning_rate": 3.547129069526918e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016408739673545353, + "loss": 0.0134, "step": 349550 }, { - "epoch": 1.76, - "learning_rate": 3.546372300225517e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016408350851908208, + "loss": 0.0185, "step": 349560 }, { - "epoch": 1.76, - "learning_rate": 3.5456155309241156e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.0001640796203027106, + "loss": 0.0143, "step": 349570 }, { - "epoch": 1.76, - "learning_rate": 3.544858761622715e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001640757320863391, + "loss": 0.0143, "step": 349580 }, { - "epoch": 1.76, - "learning_rate": 3.544101992321314e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016407184386996765, + "loss": 0.0133, "step": 349590 }, { - "epoch": 1.76, - "learning_rate": 3.543345223019913e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016406795565359621, + "loss": 0.0158, "step": 349600 }, { - "epoch": 1.76, - "learning_rate": 3.5425884537185116e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016406406743722473, + "loss": 0.0138, "step": 349610 }, { - "epoch": 1.76, - "learning_rate": 3.541831684417111e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016406017922085327, + "loss": 0.0126, "step": 349620 }, { - "epoch": 1.76, - "learning_rate": 3.54107491511571e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016405629100448179, + "loss": 0.0125, "step": 349630 }, { - "epoch": 1.76, - "learning_rate": 3.540318145814309e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016405240278811035, + "loss": 0.0145, "step": 349640 }, { - "epoch": 1.76, - "learning_rate": 3.5395613765129075e-05, - "loss": 0.0084, + "epoch": 0.91, + "learning_rate": 0.00016404851457173887, + "loss": 0.0154, "step": 349650 }, { - "epoch": 1.76, - "learning_rate": 3.5388046072115064e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001640446263553674, + "loss": 0.0104, "step": 349660 }, { - "epoch": 1.76, - "learning_rate": 3.538047837910105e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016404073813899592, + "loss": 0.0117, "step": 349670 }, { - "epoch": 1.76, - "learning_rate": 3.537291068608705e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.0001640368499226245, + "loss": 0.0122, "step": 349680 }, { - "epoch": 1.76, - "learning_rate": 3.5365342993073035e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.000164032961706253, + "loss": 0.0208, "step": 349690 }, { - "epoch": 1.76, - "learning_rate": 3.535777530005902e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016402907348988155, + "loss": 0.0155, "step": 349700 }, { - "epoch": 1.76, - "learning_rate": 3.535020760704501e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016402518527351006, + "loss": 0.0122, "step": 349710 }, { - "epoch": 1.76, - "learning_rate": 3.5342639914031006e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.00016402129705713863, + "loss": 0.0125, "step": 349720 }, { - "epoch": 1.76, - "learning_rate": 3.5335072221016995e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016401740884076717, + "loss": 0.0133, "step": 349730 }, { - "epoch": 1.76, - "learning_rate": 3.532750452800298e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001640135206243957, + "loss": 0.0129, "step": 349740 }, { - "epoch": 1.76, - "learning_rate": 3.531993683498897e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001640096324080242, + "loss": 0.0144, "step": 349750 }, { - "epoch": 1.76, - "learning_rate": 3.5312369141974966e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016400574419165277, + "loss": 0.0139, "step": 349760 }, { - "epoch": 1.76, - "learning_rate": 3.5304801448960954e-05, - "loss": 0.0109, + "epoch": 0.91, + "learning_rate": 0.00016400185597528131, + "loss": 0.0143, "step": 349770 }, { - "epoch": 1.76, - "learning_rate": 3.529723375594694e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016399796775890983, + "loss": 0.013, "step": 349780 }, { - "epoch": 1.76, - "learning_rate": 3.528966606293293e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016399407954253837, + "loss": 0.0119, "step": 349790 }, { - "epoch": 1.76, - "learning_rate": 3.5282098369918926e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001639901913261669, + "loss": 0.0149, "step": 349800 }, { - "epoch": 1.76, - "learning_rate": 3.527453067690491e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016398630310979545, + "loss": 0.014, "step": 349810 }, { - "epoch": 1.76, - "learning_rate": 3.52669629838909e-05, - "loss": 0.0091, + "epoch": 0.91, + "learning_rate": 0.00016398241489342397, + "loss": 0.0124, "step": 349820 }, { - "epoch": 1.76, - "learning_rate": 3.525939529087689e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.0001639785266770525, + "loss": 0.0146, "step": 349830 }, { - "epoch": 1.76, - "learning_rate": 3.525182759786288e-05, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016397463846068102, + "loss": 0.015, "step": 349840 }, { - "epoch": 1.77, - "learning_rate": 3.524425990484887e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001639707502443096, + "loss": 0.0127, "step": 349850 }, { - "epoch": 1.77, - "learning_rate": 3.523669221183486e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001639668620279381, + "loss": 0.0147, "step": 349860 }, { - "epoch": 1.77, - "learning_rate": 3.522912451882085e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016396297381156665, + "loss": 0.0128, "step": 349870 }, { - "epoch": 1.77, - "learning_rate": 3.522155682580684e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016395908559519516, + "loss": 0.0131, "step": 349880 }, { - "epoch": 1.77, - "learning_rate": 3.5213989132792826e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016395519737882373, + "loss": 0.0131, "step": 349890 }, { - "epoch": 1.77, - "learning_rate": 3.520642143977882e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016395130916245225, + "loss": 0.0104, "step": 349900 }, { - "epoch": 1.77, - "learning_rate": 3.519885374676481e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.0001639474209460808, + "loss": 0.0133, "step": 349910 }, { - "epoch": 1.77, - "learning_rate": 3.51912860537508e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.0001639435327297093, + "loss": 0.0108, "step": 349920 }, { - "epoch": 1.77, - "learning_rate": 3.5183718360736786e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016393964451333787, + "loss": 0.0117, "step": 349930 }, { - "epoch": 1.77, - "learning_rate": 3.517615066772278e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016393575629696641, + "loss": 0.0096, "step": 349940 }, { - "epoch": 1.77, - "learning_rate": 3.516858297470877e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.00016393186808059493, + "loss": 0.0107, "step": 349950 }, { - "epoch": 1.77, - "learning_rate": 3.516101528169476e-05, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.00016392797986422347, + "loss": 0.0125, "step": 349960 }, { - "epoch": 1.77, - "learning_rate": 3.5153447588680746e-05, - "loss": 0.0096, + "epoch": 0.91, + "learning_rate": 0.000163924091647852, + "loss": 0.0206, "step": 349970 }, { - "epoch": 1.77, - "learning_rate": 3.5145879895666734e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016392020343148055, + "loss": 0.0126, "step": 349980 }, { - "epoch": 1.77, - "learning_rate": 3.513831220265272e-05, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016391631521510907, + "loss": 0.0113, "step": 349990 }, { - "epoch": 1.77, - "learning_rate": 3.513074450963872e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.0001639124269987376, + "loss": 0.0143, "step": 350000 }, { - "epoch": 1.77, - "eval_cer": 0.9144498775845288, - "eval_loss": 0.004672383423894644, - "eval_runtime": 116.7279, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.283, + "epoch": 0.91, + "eval_cer": 0.8817964619977577, + "eval_loss": 0.009117286652326584, + "eval_runtime": 107.4916, + "eval_samples_per_second": 18.606, + "eval_steps_per_second": 4.652, "step": 350000 }, { - "epoch": 1.77, - "learning_rate": 3.5123176816624705e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.00016390853878236615, + "loss": 0.0109, "step": 350010 }, { - "epoch": 1.77, - "learning_rate": 3.5115609123610694e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.0001639046505659947, + "loss": 0.0111, "step": 350020 }, { - "epoch": 1.77, - "learning_rate": 3.510804143059668e-05, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.0001639007623496232, + "loss": 0.0124, "step": 350030 }, { - "epoch": 1.77, - "learning_rate": 3.510047373758268e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016389687413325175, + "loss": 0.0134, "step": 350040 }, { - "epoch": 1.77, - "learning_rate": 3.5092906044568665e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.0001638929859168803, + "loss": 0.0132, "step": 350050 }, { - "epoch": 1.77, - "learning_rate": 3.508533835155465e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016388909770050883, + "loss": 0.0153, "step": 350060 }, { - "epoch": 1.77, - "learning_rate": 3.507777065854064e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016388520948413735, + "loss": 0.0119, "step": 350070 }, { - "epoch": 1.77, - "learning_rate": 3.5070202965526637e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.0001638813212677659, + "loss": 0.0129, "step": 350080 }, { - "epoch": 1.77, - "learning_rate": 3.5062635272512625e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.0001638774330513944, + "loss": 0.0117, "step": 350090 }, { - "epoch": 1.77, - "learning_rate": 3.505506757949861e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016387354483502297, + "loss": 0.0161, "step": 350100 }, { - "epoch": 1.77, - "learning_rate": 3.50474998864846e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001638696566186515, + "loss": 0.0127, "step": 350110 }, { - "epoch": 1.77, - "learning_rate": 3.5039932193470596e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016386576840228003, + "loss": 0.0149, "step": 350120 }, { - "epoch": 1.77, - "learning_rate": 3.503236450045658e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016386188018590857, + "loss": 0.0114, "step": 350130 }, { - "epoch": 1.77, - "learning_rate": 3.5024796807442566e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.0001638579919695371, + "loss": 0.0116, "step": 350140 }, { - "epoch": 1.77, - "learning_rate": 3.501722911442856e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016385410375316565, + "loss": 0.0122, "step": 350150 }, { - "epoch": 1.77, - "learning_rate": 3.500966142141455e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016385021553679417, + "loss": 0.012, "step": 350160 }, { - "epoch": 1.77, - "learning_rate": 3.500209372840054e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.0001638463273204227, + "loss": 0.0095, "step": 350170 }, { - "epoch": 1.77, - "learning_rate": 3.499452603538653e-05, - "loss": 0.0094, + "epoch": 0.91, + "learning_rate": 0.00016384243910405125, + "loss": 0.0144, "step": 350180 }, { - "epoch": 1.77, - "learning_rate": 3.498695834237252e-05, - "loss": 0.0097, + "epoch": 0.91, + "learning_rate": 0.0001638385508876798, + "loss": 0.0141, "step": 350190 }, { - "epoch": 1.77, - "learning_rate": 3.497939064935851e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.0001638346626713083, + "loss": 0.0125, "step": 350200 }, { - "epoch": 1.77, - "learning_rate": 3.49718229563445e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016383077445493685, + "loss": 0.0124, "step": 350210 }, { - "epoch": 1.77, - "learning_rate": 3.496425526333049e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.0001638268862385654, + "loss": 0.0157, "step": 350220 }, { - "epoch": 1.77, - "learning_rate": 3.495668757031648e-05, - "loss": 0.0089, + "epoch": 0.91, + "learning_rate": 0.00016382299802219393, + "loss": 0.0155, "step": 350230 }, { - "epoch": 1.77, - "learning_rate": 3.494911987730247e-05, - "loss": 0.0043, + "epoch": 0.91, + "learning_rate": 0.00016381910980582245, + "loss": 0.0142, "step": 350240 }, { - "epoch": 1.77, - "learning_rate": 3.4941552184288457e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.000163815221589451, + "loss": 0.0116, "step": 350250 }, { - "epoch": 1.77, - "learning_rate": 3.493398449127445e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.00016381133337307956, + "loss": 0.0128, "step": 350260 }, { - "epoch": 1.77, - "learning_rate": 3.492641679826044e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016380744515670807, + "loss": 0.0124, "step": 350270 }, { - "epoch": 1.77, - "learning_rate": 3.491884910524642e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.0001638035569403366, + "loss": 0.0143, "step": 350280 }, { - "epoch": 1.77, - "learning_rate": 3.4911281412232416e-05, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.00016379966872396513, + "loss": 0.0124, "step": 350290 }, { - "epoch": 1.77, - "learning_rate": 3.4903713719218404e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.0001637957805075937, + "loss": 0.0131, "step": 350300 }, { - "epoch": 1.77, - "learning_rate": 3.489614602620439e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.0001637918922912222, + "loss": 0.0128, "step": 350310 }, { - "epoch": 1.77, - "learning_rate": 3.488857833319038e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016378800407485075, + "loss": 0.0096, "step": 350320 }, { - "epoch": 1.77, - "learning_rate": 3.4881010640176376e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016378411585847927, + "loss": 0.016, "step": 350330 }, { - "epoch": 1.77, - "learning_rate": 3.4873442947162364e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.0001637802276421078, + "loss": 0.013, "step": 350340 }, { - "epoch": 1.77, - "learning_rate": 3.486587525414835e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016377633942573635, + "loss": 0.0111, "step": 350350 }, { - "epoch": 1.77, - "learning_rate": 3.485830756113434e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001637724512093649, + "loss": 0.018, "step": 350360 }, { - "epoch": 1.77, - "learning_rate": 3.4850739868120336e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001637685629929934, + "loss": 0.0113, "step": 350370 }, { - "epoch": 1.77, - "learning_rate": 3.4843172175106324e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016376467477662195, + "loss": 0.0139, "step": 350380 }, { - "epoch": 1.77, - "learning_rate": 3.483560448209231e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.0001637607865602505, + "loss": 0.0108, "step": 350390 }, { - "epoch": 1.77, - "learning_rate": 3.48280367890783e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016375689834387903, + "loss": 0.0117, "step": 350400 }, { - "epoch": 1.77, - "learning_rate": 3.4820469096064295e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016375301012750755, + "loss": 0.0103, "step": 350410 }, { - "epoch": 1.77, - "learning_rate": 3.4812901403050283e-05, - "loss": 0.0108, + "epoch": 0.91, + "learning_rate": 0.0001637491219111361, + "loss": 0.0115, "step": 350420 }, { - "epoch": 1.77, - "learning_rate": 3.480533371003627e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016374523369476466, + "loss": 0.0116, "step": 350430 }, { - "epoch": 1.77, - "learning_rate": 3.479776601702226e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016374134547839317, + "loss": 0.0126, "step": 350440 }, { - "epoch": 1.77, - "learning_rate": 3.479019832400825e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.0001637374572620217, + "loss": 0.0092, "step": 350450 }, { - "epoch": 1.77, - "learning_rate": 3.4782630630994236e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016373356904565023, + "loss": 0.0099, "step": 350460 }, { - "epoch": 1.77, - "learning_rate": 3.477506293798023e-05, - "loss": 0.008, + "epoch": 0.91, + "learning_rate": 0.0001637296808292788, + "loss": 0.0144, "step": 350470 }, { - "epoch": 1.77, - "learning_rate": 3.476749524496622e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.0001637257926129073, + "loss": 0.0123, "step": 350480 }, { - "epoch": 1.77, - "learning_rate": 3.475992755195221e-05, - "loss": 0.0091, + "epoch": 0.91, + "learning_rate": 0.00016372190439653585, + "loss": 0.0134, "step": 350490 }, { - "epoch": 1.77, - "learning_rate": 3.4752359858938196e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.00016371801618016437, + "loss": 0.0135, "step": 350500 }, { - "epoch": 1.77, - "learning_rate": 3.474479216592419e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016371412796379293, + "loss": 0.0138, "step": 350510 }, { - "epoch": 1.77, - "learning_rate": 3.473722447291018e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016371023974742145, + "loss": 0.0128, "step": 350520 }, { - "epoch": 1.77, - "learning_rate": 3.472965677989617e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016370635153105, + "loss": 0.013, "step": 350530 }, { - "epoch": 1.77, - "learning_rate": 3.4722089086882156e-05, - "loss": 0.0045, + "epoch": 0.91, + "learning_rate": 0.0001637024633146785, + "loss": 0.0111, "step": 350540 }, { - "epoch": 1.77, - "learning_rate": 3.471452139386815e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016369857509830707, + "loss": 0.0141, "step": 350550 }, { - "epoch": 1.77, - "learning_rate": 3.470695370085414e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001636946868819356, + "loss": 0.0136, "step": 350560 }, { - "epoch": 1.77, - "learning_rate": 3.469938600784013e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016369079866556413, + "loss": 0.0135, "step": 350570 }, { - "epoch": 1.77, - "learning_rate": 3.4691818314826115e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016368691044919264, + "loss": 0.012, "step": 350580 }, { - "epoch": 1.77, - "learning_rate": 3.468425062181211e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016368302223282119, + "loss": 0.0107, "step": 350590 }, { - "epoch": 1.77, - "learning_rate": 3.467668292879809e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016367913401644976, + "loss": 0.0114, "step": 350600 }, { - "epoch": 1.77, - "learning_rate": 3.466911523578409e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016367524580007827, + "loss": 0.0119, "step": 350610 }, { - "epoch": 1.77, - "learning_rate": 3.4661547542770075e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016367135758370678, + "loss": 0.0121, "step": 350620 }, { - "epoch": 1.77, - "learning_rate": 3.465397984975606e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016366746936733533, + "loss": 0.0125, "step": 350630 }, { - "epoch": 1.77, - "learning_rate": 3.464641215674205e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.0001636635811509639, + "loss": 0.0106, "step": 350640 }, { - "epoch": 1.77, - "learning_rate": 3.4638844463728046e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001636596929345924, + "loss": 0.0132, "step": 350650 }, { - "epoch": 1.77, - "learning_rate": 3.4631276770714035e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016365580471822095, + "loss": 0.0125, "step": 350660 }, { - "epoch": 1.77, - "learning_rate": 3.462370907770002e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016365191650184947, + "loss": 0.0118, "step": 350670 }, { - "epoch": 1.77, - "learning_rate": 3.461614138468601e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016364802828547803, + "loss": 0.017, "step": 350680 }, { - "epoch": 1.77, - "learning_rate": 3.4608573691672006e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016364414006910655, + "loss": 0.0116, "step": 350690 }, { - "epoch": 1.77, - "learning_rate": 3.4601005998657994e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.0001636402518527351, + "loss": 0.014, "step": 350700 }, { - "epoch": 1.77, - "learning_rate": 3.459343830564398e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.0001636363636363636, + "loss": 0.0146, "step": 350710 }, { - "epoch": 1.77, - "learning_rate": 3.458587061262997e-05, - "loss": 0.0088, + "epoch": 0.91, + "learning_rate": 0.00016363247541999217, + "loss": 0.0113, "step": 350720 }, { - "epoch": 1.77, - "learning_rate": 3.4578302919615966e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001636285872036207, + "loss": 0.0128, "step": 350730 }, { - "epoch": 1.77, - "learning_rate": 3.4570735226601954e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016362469898724923, + "loss": 0.0098, "step": 350740 }, { - "epoch": 1.77, - "learning_rate": 3.456316753358794e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016362081077087774, + "loss": 0.0096, "step": 350750 }, { - "epoch": 1.77, - "learning_rate": 3.455559984057393e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.0001636169225545063, + "loss": 0.0134, "step": 350760 }, { - "epoch": 1.77, - "learning_rate": 3.454803214755992e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016361303433813483, + "loss": 0.0125, "step": 350770 }, { - "epoch": 1.77, - "learning_rate": 3.454046445454591e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016360914612176337, + "loss": 0.0131, "step": 350780 }, { - "epoch": 1.77, - "learning_rate": 3.45328967615319e-05, - "loss": 0.0097, + "epoch": 0.91, + "learning_rate": 0.00016360525790539188, + "loss": 0.0128, "step": 350790 }, { - "epoch": 1.77, - "learning_rate": 3.452532906851789e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016360136968902045, + "loss": 0.011, "step": 350800 }, { - "epoch": 1.77, - "learning_rate": 3.451776137550388e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.000163597481472649, + "loss": 0.0118, "step": 350810 }, { - "epoch": 1.77, - "learning_rate": 3.4510193682489866e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001635935932562775, + "loss": 0.0099, "step": 350820 }, { - "epoch": 1.77, - "learning_rate": 3.450262598947586e-05, - "loss": 0.0097, + "epoch": 0.91, + "learning_rate": 0.00016358970503990605, + "loss": 0.0111, "step": 350830 }, { - "epoch": 1.77, - "learning_rate": 3.449505829646185e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016358581682353456, + "loss": 0.0152, "step": 350840 }, { - "epoch": 1.77, - "learning_rate": 3.448749060344784e-05, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016358192860716313, + "loss": 0.0135, "step": 350850 }, { - "epoch": 1.77, - "learning_rate": 3.4479922910433826e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016357804039079165, + "loss": 0.0089, "step": 350860 }, { - "epoch": 1.77, - "learning_rate": 3.447235521741982e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001635741521744202, + "loss": 0.0091, "step": 350870 }, { - "epoch": 1.77, - "learning_rate": 3.446478752440581e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001635702639580487, + "loss": 0.0184, "step": 350880 }, { - "epoch": 1.77, - "learning_rate": 3.44572198313918e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016356637574167727, + "loss": 0.0126, "step": 350890 }, { - "epoch": 1.77, - "learning_rate": 3.4449652138377786e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001635624875253058, + "loss": 0.0121, "step": 350900 }, { - "epoch": 1.77, - "learning_rate": 3.4442084445363774e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016355859930893433, + "loss": 0.0116, "step": 350910 }, { - "epoch": 1.77, - "learning_rate": 3.443451675234976e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016355471109256284, + "loss": 0.0189, "step": 350920 }, { - "epoch": 1.77, - "learning_rate": 3.442694905933576e-05, - "loss": 0.0079, + "epoch": 0.91, + "learning_rate": 0.0001635508228761914, + "loss": 0.0141, "step": 350930 }, { - "epoch": 1.77, - "learning_rate": 3.4419381366321745e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016354693465981993, + "loss": 0.0128, "step": 350940 }, { - "epoch": 1.77, - "learning_rate": 3.4411813673307734e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016354304644344847, + "loss": 0.0159, "step": 350950 }, { - "epoch": 1.77, - "learning_rate": 3.440424598029372e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.00016353915822707698, + "loss": 0.0128, "step": 350960 }, { - "epoch": 1.77, - "learning_rate": 3.439667828727972e-05, - "loss": 0.0089, + "epoch": 0.91, + "learning_rate": 0.00016353527001070555, + "loss": 0.0105, "step": 350970 }, { - "epoch": 1.77, - "learning_rate": 3.4389110594265705e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001635313817943341, + "loss": 0.0127, "step": 350980 }, { - "epoch": 1.77, - "learning_rate": 3.438154290125169e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001635274935779626, + "loss": 0.0146, "step": 350990 }, { - "epoch": 1.77, - "learning_rate": 3.437397520823768e-05, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016352360536159115, + "loss": 0.0124, "step": 351000 }, { - "epoch": 1.77, - "eval_cer": 0.9144362920387732, - "eval_loss": 0.004640540108084679, - "eval_runtime": 116.6521, - "eval_samples_per_second": 17.145, - "eval_steps_per_second": 4.286, + "epoch": 0.91, + "eval_cer": 0.8817642703482717, + "eval_loss": 0.008518124930560589, + "eval_runtime": 107.3251, + "eval_samples_per_second": 18.635, + "eval_steps_per_second": 4.659, "step": 351000 }, { - "epoch": 1.77, - "learning_rate": 3.4366407515223676e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.0001635197171452197, + "loss": 0.0127, "step": 351010 }, { - "epoch": 1.77, - "learning_rate": 3.4358839822209665e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016351582892884823, + "loss": 0.0115, "step": 351020 }, { - "epoch": 1.77, - "learning_rate": 3.435127212919565e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016351194071247675, + "loss": 0.0132, "step": 351030 }, { - "epoch": 1.77, - "learning_rate": 3.434370443618164e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.0001635080524961053, + "loss": 0.0143, "step": 351040 }, { - "epoch": 1.77, - "learning_rate": 3.4336136743167636e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016350416427973383, + "loss": 0.0125, "step": 351050 }, { - "epoch": 1.77, - "learning_rate": 3.4328569050153624e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016350027606336237, + "loss": 0.0161, "step": 351060 }, { - "epoch": 1.77, - "learning_rate": 3.4321001357139606e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001634963878469909, + "loss": 0.0105, "step": 351070 }, { - "epoch": 1.77, - "learning_rate": 3.43134336641256e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016349249963061943, + "loss": 0.0174, "step": 351080 }, { - "epoch": 1.77, - "learning_rate": 3.430586597111159e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016348861141424794, + "loss": 0.0135, "step": 351090 }, { - "epoch": 1.77, - "learning_rate": 3.429829827809758e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001634847231978765, + "loss": 0.0136, "step": 351100 }, { - "epoch": 1.77, - "learning_rate": 3.4290730585083565e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016348083498150503, + "loss": 0.0092, "step": 351110 }, { - "epoch": 1.77, - "learning_rate": 3.428316289206956e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016347694676513357, + "loss": 0.0122, "step": 351120 }, { - "epoch": 1.77, - "learning_rate": 3.427559519905555e-05, - "loss": 0.0045, + "epoch": 0.91, + "learning_rate": 0.00016347305854876208, + "loss": 0.0107, "step": 351130 }, { - "epoch": 1.77, - "learning_rate": 3.426802750604154e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016346917033239065, + "loss": 0.0139, "step": 351140 }, { - "epoch": 1.77, - "learning_rate": 3.426045981302753e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.0001634652821160192, + "loss": 0.0136, "step": 351150 }, { - "epoch": 1.77, - "learning_rate": 3.425289212001352e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001634613938996477, + "loss": 0.0133, "step": 351160 }, { - "epoch": 1.77, - "learning_rate": 3.424532442699951e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016345750568327622, + "loss": 0.0122, "step": 351170 }, { - "epoch": 1.77, - "learning_rate": 3.4237756733985496e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.0001634536174669048, + "loss": 0.0113, "step": 351180 }, { - "epoch": 1.77, - "learning_rate": 3.423018904097149e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016344972925053333, + "loss": 0.009, "step": 351190 }, { - "epoch": 1.77, - "learning_rate": 3.422262134795748e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016344584103416185, + "loss": 0.0126, "step": 351200 }, { - "epoch": 1.77, - "learning_rate": 3.421505365494347e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.0001634419528177904, + "loss": 0.0131, "step": 351210 }, { - "epoch": 1.77, - "learning_rate": 3.4207485961929456e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016343806460141893, + "loss": 0.0143, "step": 351220 }, { - "epoch": 1.77, - "learning_rate": 3.4199918268915444e-05, - "loss": 0.0091, + "epoch": 0.91, + "learning_rate": 0.00016343417638504747, + "loss": 0.0113, "step": 351230 }, { - "epoch": 1.77, - "learning_rate": 3.419235057590143e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016343028816867599, + "loss": 0.014, "step": 351240 }, { - "epoch": 1.77, - "learning_rate": 3.418478288288742e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016342639995230453, + "loss": 0.015, "step": 351250 }, { - "epoch": 1.77, - "learning_rate": 3.4177215189873416e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016342251173593307, + "loss": 0.0125, "step": 351260 }, { - "epoch": 1.77, - "learning_rate": 3.4169647496859404e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.0001634186235195616, + "loss": 0.014, "step": 351270 }, { - "epoch": 1.77, - "learning_rate": 3.416207980384539e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016341473530319013, + "loss": 0.0112, "step": 351280 }, { - "epoch": 1.77, - "learning_rate": 3.415451211083138e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016341084708681867, + "loss": 0.0118, "step": 351290 }, { - "epoch": 1.77, - "learning_rate": 3.4146944417817375e-05, - "loss": 0.0039, + "epoch": 0.91, + "learning_rate": 0.00016340695887044724, + "loss": 0.0156, "step": 351300 }, { - "epoch": 1.77, - "learning_rate": 3.4139376724803364e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016340307065407575, + "loss": 0.0121, "step": 351310 }, { - "epoch": 1.77, - "learning_rate": 3.413180903178935e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001633991824377043, + "loss": 0.0134, "step": 351320 }, { - "epoch": 1.77, - "learning_rate": 3.412424133877534e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.0001633952942213328, + "loss": 0.0112, "step": 351330 }, { - "epoch": 1.77, - "learning_rate": 3.4116673645761335e-05, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016339140600496132, + "loss": 0.0121, "step": 351340 }, { - "epoch": 1.77, - "learning_rate": 3.410910595274732e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.0001633875177885899, + "loss": 0.0149, "step": 351350 }, { - "epoch": 1.77, - "learning_rate": 3.410153825973331e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016338362957221843, + "loss": 0.0119, "step": 351360 }, { - "epoch": 1.77, - "learning_rate": 3.40939705667193e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016337974135584695, + "loss": 0.0145, "step": 351370 }, { - "epoch": 1.77, - "learning_rate": 3.408640287370529e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001633758531394755, + "loss": 0.015, "step": 351380 }, { - "epoch": 1.77, - "learning_rate": 3.4078835180691276e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016337196492310403, + "loss": 0.0144, "step": 351390 }, { - "epoch": 1.77, - "learning_rate": 3.407126748767727e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016336807670673257, + "loss": 0.0185, "step": 351400 }, { - "epoch": 1.77, - "learning_rate": 3.406369979466326e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016336418849036109, + "loss": 0.0153, "step": 351410 }, { - "epoch": 1.77, - "learning_rate": 3.405613210164925e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016336030027398963, + "loss": 0.0142, "step": 351420 }, { - "epoch": 1.77, - "learning_rate": 3.4048564408635236e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016335641205761817, + "loss": 0.0121, "step": 351430 }, { - "epoch": 1.77, - "learning_rate": 3.404099671562123e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.0001633525238412467, + "loss": 0.0119, "step": 351440 }, { - "epoch": 1.77, - "learning_rate": 3.403342902260722e-05, - "loss": 0.0073, + "epoch": 0.91, + "learning_rate": 0.00016334863562487523, + "loss": 0.0145, "step": 351450 }, { - "epoch": 1.77, - "learning_rate": 3.402586132959321e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016334474740850377, + "loss": 0.0116, "step": 351460 }, { - "epoch": 1.77, - "learning_rate": 3.4018293636579195e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016334085919213234, + "loss": 0.0109, "step": 351470 }, { - "epoch": 1.77, - "learning_rate": 3.401072594356519e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016333697097576085, + "loss": 0.0127, "step": 351480 }, { - "epoch": 1.77, - "learning_rate": 3.400315825055118e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016333308275938936, + "loss": 0.0134, "step": 351490 }, { - "epoch": 1.77, - "learning_rate": 3.399559055753717e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.0001633291945430179, + "loss": 0.017, "step": 351500 }, { - "epoch": 1.77, - "learning_rate": 3.3988022864523155e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016332530632664648, + "loss": 0.0179, "step": 351510 }, { - "epoch": 1.77, - "learning_rate": 3.398045517150915e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.000163321418110275, + "loss": 0.0139, "step": 351520 }, { - "epoch": 1.77, - "learning_rate": 3.397288747849514e-05, - "loss": 0.0158, + "epoch": 0.91, + "learning_rate": 0.00016331752989390353, + "loss": 0.0122, "step": 351530 }, { - "epoch": 1.77, - "learning_rate": 3.3965319785481127e-05, - "loss": 0.0091, + "epoch": 0.91, + "learning_rate": 0.00016331364167753205, + "loss": 0.0161, "step": 351540 }, { - "epoch": 1.77, - "learning_rate": 3.3957752092467115e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016330975346116061, + "loss": 0.0144, "step": 351550 }, { - "epoch": 1.77, - "learning_rate": 3.39501843994531e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.00016330586524478913, + "loss": 0.0132, "step": 351560 }, { - "epoch": 1.77, - "learning_rate": 3.394261670643909e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016330197702841767, + "loss": 0.0205, "step": 351570 }, { - "epoch": 1.77, - "learning_rate": 3.3935049013425086e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016329808881204619, + "loss": 0.0097, "step": 351580 }, { - "epoch": 1.77, - "learning_rate": 3.3927481320411074e-05, - "loss": 0.0045, + "epoch": 0.91, + "learning_rate": 0.00016329420059567473, + "loss": 0.0136, "step": 351590 }, { - "epoch": 1.77, - "learning_rate": 3.391991362739706e-05, - "loss": 0.0081, + "epoch": 0.91, + "learning_rate": 0.00016329031237930327, + "loss": 0.0124, "step": 351600 }, { - "epoch": 1.77, - "learning_rate": 3.391234593438305e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.0001632864241629318, + "loss": 0.0119, "step": 351610 }, { - "epoch": 1.77, - "learning_rate": 3.3904778241369046e-05, - "loss": 0.0045, + "epoch": 0.91, + "learning_rate": 0.00016328253594656032, + "loss": 0.0121, "step": 351620 }, { - "epoch": 1.77, - "learning_rate": 3.3897210548355034e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016327864773018887, + "loss": 0.0168, "step": 351630 }, { - "epoch": 1.77, - "learning_rate": 3.388964285534102e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.0001632747595138174, + "loss": 0.0091, "step": 351640 }, { - "epoch": 1.77, - "learning_rate": 3.388207516232701e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016327087129744595, + "loss": 0.0129, "step": 351650 }, { - "epoch": 1.77, - "learning_rate": 3.3874507469313005e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016326698308107446, + "loss": 0.0132, "step": 351660 }, { - "epoch": 1.77, - "learning_rate": 3.3866939776298994e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.000163263094864703, + "loss": 0.0146, "step": 351670 }, { - "epoch": 1.77, - "learning_rate": 3.385937208328498e-05, - "loss": 0.0084, + "epoch": 0.91, + "learning_rate": 0.00016325920664833157, + "loss": 0.0091, "step": 351680 }, { - "epoch": 1.77, - "learning_rate": 3.385180439027097e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001632553184319601, + "loss": 0.0137, "step": 351690 }, { - "epoch": 1.77, - "learning_rate": 3.384423669725696e-05, - "loss": 0.0038, + "epoch": 0.91, + "learning_rate": 0.00016325143021558863, + "loss": 0.0103, "step": 351700 }, { - "epoch": 1.77, - "learning_rate": 3.3836669004242947e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016324754199921715, + "loss": 0.0163, "step": 351710 }, { - "epoch": 1.77, - "learning_rate": 3.382910131122894e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016324365378284571, + "loss": 0.0184, "step": 351720 }, { - "epoch": 1.77, - "learning_rate": 3.382153361821493e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016323976556647423, + "loss": 0.0109, "step": 351730 }, { - "epoch": 1.77, - "learning_rate": 3.381396592520092e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016323587735010277, + "loss": 0.0109, "step": 351740 }, { - "epoch": 1.77, - "learning_rate": 3.3806398232186906e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016323198913373128, + "loss": 0.0147, "step": 351750 }, { - "epoch": 1.77, - "learning_rate": 3.37988305391729e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016322810091735985, + "loss": 0.0119, "step": 351760 }, { - "epoch": 1.77, - "learning_rate": 3.379126284615889e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016322421270098837, + "loss": 0.0124, "step": 351770 }, { - "epoch": 1.77, - "learning_rate": 3.378369515314488e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.0001632203244846169, + "loss": 0.0114, "step": 351780 }, { - "epoch": 1.77, - "learning_rate": 3.3776127460130866e-05, - "loss": 0.0088, + "epoch": 0.91, + "learning_rate": 0.00016321643626824542, + "loss": 0.013, "step": 351790 }, { - "epoch": 1.77, - "learning_rate": 3.376855976711686e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.000163212548051874, + "loss": 0.012, "step": 351800 }, { - "epoch": 1.77, - "learning_rate": 3.376099207410285e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.0001632086598355025, + "loss": 0.0169, "step": 351810 }, { - "epoch": 1.77, - "learning_rate": 3.375342438108884e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016320477161913105, + "loss": 0.0133, "step": 351820 }, { - "epoch": 1.78, - "learning_rate": 3.3745856688074826e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016320088340275956, + "loss": 0.0118, "step": 351830 }, { - "epoch": 1.78, - "learning_rate": 3.373828899506082e-05, - "loss": 0.004, + "epoch": 0.91, + "learning_rate": 0.0001631969951863881, + "loss": 0.0153, "step": 351840 }, { - "epoch": 1.78, - "learning_rate": 3.37307213020468e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016319310697001667, + "loss": 0.0149, "step": 351850 }, { - "epoch": 1.78, - "learning_rate": 3.37231536090328e-05, - "loss": 0.0081, + "epoch": 0.91, + "learning_rate": 0.0001631892187536452, + "loss": 0.0129, "step": 351860 }, { - "epoch": 1.78, - "learning_rate": 3.3715585916018785e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.00016318533053727373, + "loss": 0.0214, "step": 351870 }, { - "epoch": 1.78, - "learning_rate": 3.3708018223004773e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.00016318144232090224, + "loss": 0.0118, "step": 351880 }, { - "epoch": 1.78, - "learning_rate": 3.370045052999076e-05, - "loss": 0.0107, + "epoch": 0.91, + "learning_rate": 0.0001631775541045308, + "loss": 0.0176, "step": 351890 }, { - "epoch": 1.78, - "learning_rate": 3.369288283697676e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016317366588815933, + "loss": 0.0122, "step": 351900 }, { - "epoch": 1.78, - "learning_rate": 3.3685315143962745e-05, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016316977767178787, + "loss": 0.0121, "step": 351910 }, { - "epoch": 1.78, - "learning_rate": 3.367774745094873e-05, - "loss": 0.0042, + "epoch": 0.91, + "learning_rate": 0.00016316588945541638, + "loss": 0.0122, "step": 351920 }, { - "epoch": 1.78, - "learning_rate": 3.367017975793472e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.00016316200123904495, + "loss": 0.0124, "step": 351930 }, { - "epoch": 1.78, - "learning_rate": 3.3662612064920716e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016315811302267347, + "loss": 0.0119, "step": 351940 }, { - "epoch": 1.78, - "learning_rate": 3.3655044371906704e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.000163154224806302, + "loss": 0.0143, "step": 351950 }, { - "epoch": 1.78, - "learning_rate": 3.364747667889269e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016315033658993052, + "loss": 0.0129, "step": 351960 }, { - "epoch": 1.78, - "learning_rate": 3.363990898587868e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.0001631464483735591, + "loss": 0.0099, "step": 351970 }, { - "epoch": 1.78, - "learning_rate": 3.3632341292864676e-05, - "loss": 0.0082, + "epoch": 0.91, + "learning_rate": 0.0001631425601571876, + "loss": 0.0154, "step": 351980 }, { - "epoch": 1.78, - "learning_rate": 3.3624773599850664e-05, - "loss": 0.0066, + "epoch": 0.91, + "learning_rate": 0.00016313867194081615, + "loss": 0.0148, "step": 351990 }, { - "epoch": 1.78, - "learning_rate": 3.361720590683665e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016313478372444466, + "loss": 0.0144, "step": 352000 }, { - "epoch": 1.78, - "eval_cer": 0.9144343512465224, - "eval_loss": 0.0045296261087059975, - "eval_runtime": 116.5512, - "eval_samples_per_second": 17.16, - "eval_steps_per_second": 4.29, + "epoch": 0.91, + "eval_cer": 0.8817558725266665, + "eval_loss": 0.00876292772591114, + "eval_runtime": 107.5104, + "eval_samples_per_second": 18.603, + "eval_steps_per_second": 4.651, "step": 352000 }, { - "epoch": 1.78, - "learning_rate": 3.360963821382264e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016313089550807323, + "loss": 0.0124, "step": 352010 }, { - "epoch": 1.78, - "learning_rate": 3.360207052080863e-05, - "loss": 0.0078, + "epoch": 0.91, + "learning_rate": 0.00016312700729170177, + "loss": 0.0125, "step": 352020 }, { - "epoch": 1.78, - "learning_rate": 3.359450282779462e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.0001631231190753303, + "loss": 0.0131, "step": 352030 }, { - "epoch": 1.78, - "learning_rate": 3.3586935134780605e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016311923085895883, + "loss": 0.0111, "step": 352040 }, { - "epoch": 1.78, - "learning_rate": 3.35793674417666e-05, - "loss": 0.0039, + "epoch": 0.91, + "learning_rate": 0.00016311534264258737, + "loss": 0.0144, "step": 352050 }, { - "epoch": 1.78, - "learning_rate": 3.357179974875259e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.0001631114544262159, + "loss": 0.0144, "step": 352060 }, { - "epoch": 1.78, - "learning_rate": 3.356423205573858e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016310756620984443, + "loss": 0.0121, "step": 352070 }, { - "epoch": 1.78, - "learning_rate": 3.3556664362724565e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016310367799347297, + "loss": 0.0152, "step": 352080 }, { - "epoch": 1.78, - "learning_rate": 3.354909666971056e-05, - "loss": 0.0095, + "epoch": 0.91, + "learning_rate": 0.00016309978977710148, + "loss": 0.0124, "step": 352090 }, { - "epoch": 1.78, - "learning_rate": 3.354152897669655e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016309590156073005, + "loss": 0.0125, "step": 352100 }, { - "epoch": 1.78, - "learning_rate": 3.3533961283682536e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016309201334435857, + "loss": 0.0114, "step": 352110 }, { - "epoch": 1.78, - "learning_rate": 3.352639359066853e-05, - "loss": 0.0076, + "epoch": 0.91, + "learning_rate": 0.0001630881251279871, + "loss": 0.0166, "step": 352120 }, { - "epoch": 1.78, - "learning_rate": 3.351882589765452e-05, - "loss": 0.0042, + "epoch": 0.91, + "learning_rate": 0.00016308423691161562, + "loss": 0.0121, "step": 352130 }, { - "epoch": 1.78, - "learning_rate": 3.351125820464051e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.0001630803486952442, + "loss": 0.0124, "step": 352140 }, { - "epoch": 1.78, - "learning_rate": 3.3503690511626496e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.0001630764604788727, + "loss": 0.0103, "step": 352150 }, { - "epoch": 1.78, - "learning_rate": 3.349612281861249e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016307257226250125, + "loss": 0.0108, "step": 352160 }, { - "epoch": 1.78, - "learning_rate": 3.348855512559847e-05, - "loss": 0.0071, + "epoch": 0.91, + "learning_rate": 0.00016306868404612976, + "loss": 0.0117, "step": 352170 }, { - "epoch": 1.78, - "learning_rate": 3.348098743258446e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016306479582975833, + "loss": 0.0162, "step": 352180 }, { - "epoch": 1.78, - "learning_rate": 3.3473419739570456e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016306090761338687, + "loss": 0.0114, "step": 352190 }, { - "epoch": 1.78, - "learning_rate": 3.3465852046556444e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.0001630570193970154, + "loss": 0.0122, "step": 352200 }, { - "epoch": 1.78, - "learning_rate": 3.345828435354243e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001630531311806439, + "loss": 0.0139, "step": 352210 }, { - "epoch": 1.78, - "learning_rate": 3.345071666052842e-05, - "loss": 0.0077, + "epoch": 0.91, + "learning_rate": 0.00016304924296427247, + "loss": 0.0115, "step": 352220 }, { - "epoch": 1.78, - "learning_rate": 3.3443148967514415e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.000163045354747901, + "loss": 0.0121, "step": 352230 }, { - "epoch": 1.78, - "learning_rate": 3.3435581274500403e-05, - "loss": 0.0054, + "epoch": 0.91, + "learning_rate": 0.00016304146653152953, + "loss": 0.0167, "step": 352240 }, { - "epoch": 1.78, - "learning_rate": 3.342801358148639e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016303757831515807, + "loss": 0.0131, "step": 352250 }, { - "epoch": 1.78, - "learning_rate": 3.342044588847238e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.0001630336900987866, + "loss": 0.0127, "step": 352260 }, { - "epoch": 1.78, - "learning_rate": 3.3412878195458375e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.00016302980188241515, + "loss": 0.0141, "step": 352270 }, { - "epoch": 1.78, - "learning_rate": 3.340531050244436e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016302591366604367, + "loss": 0.0156, "step": 352280 }, { - "epoch": 1.78, - "learning_rate": 3.339774280943035e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.0001630220254496722, + "loss": 0.0114, "step": 352290 }, { - "epoch": 1.78, - "learning_rate": 3.339017511641634e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016301813723330075, + "loss": 0.0125, "step": 352300 }, { - "epoch": 1.78, - "learning_rate": 3.3382607423402335e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001630142490169293, + "loss": 0.0097, "step": 352310 }, { - "epoch": 1.78, - "learning_rate": 3.337503973038832e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.0001630103608005578, + "loss": 0.0132, "step": 352320 }, { - "epoch": 1.78, - "learning_rate": 3.336747203737431e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.00016300647258418635, + "loss": 0.0143, "step": 352330 }, { - "epoch": 1.78, - "learning_rate": 3.33599043443603e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016300258436781486, + "loss": 0.0107, "step": 352340 }, { - "epoch": 1.78, - "learning_rate": 3.335233665134629e-05, - "loss": 0.0044, + "epoch": 0.91, + "learning_rate": 0.00016299869615144343, + "loss": 0.0151, "step": 352350 }, { - "epoch": 1.78, - "learning_rate": 3.3344768958332276e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016299480793507195, + "loss": 0.0128, "step": 352360 }, { - "epoch": 1.78, - "learning_rate": 3.333720126531827e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.0001629909197187005, + "loss": 0.0159, "step": 352370 }, { - "epoch": 1.78, - "learning_rate": 3.332963357230426e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.000162987031502329, + "loss": 0.0097, "step": 352380 }, { - "epoch": 1.78, - "learning_rate": 3.332206587929025e-05, - "loss": 0.0093, + "epoch": 0.91, + "learning_rate": 0.00016298314328595757, + "loss": 0.0144, "step": 352390 }, { - "epoch": 1.78, - "learning_rate": 3.3314498186276235e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001629792550695861, + "loss": 0.0133, "step": 352400 }, { - "epoch": 1.78, - "learning_rate": 3.330693049326223e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016297536685321463, + "loss": 0.0147, "step": 352410 }, { - "epoch": 1.78, - "learning_rate": 3.329936280024822e-05, - "loss": 0.0084, + "epoch": 0.91, + "learning_rate": 0.00016297147863684317, + "loss": 0.0148, "step": 352420 }, { - "epoch": 1.78, - "learning_rate": 3.329179510723421e-05, - "loss": 0.0045, + "epoch": 0.91, + "learning_rate": 0.0001629675904204717, + "loss": 0.0107, "step": 352430 }, { - "epoch": 1.78, - "learning_rate": 3.3284227414220195e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016296370220410025, + "loss": 0.0123, "step": 352440 }, { - "epoch": 1.78, - "learning_rate": 3.327665972120619e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016295981398772877, + "loss": 0.0131, "step": 352450 }, { - "epoch": 1.78, - "learning_rate": 3.326909202819218e-05, - "loss": 0.0075, + "epoch": 0.91, + "learning_rate": 0.0001629559257713573, + "loss": 0.0133, "step": 352460 }, { - "epoch": 1.78, - "learning_rate": 3.3261524335178166e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016295203755498585, + "loss": 0.0141, "step": 352470 }, { - "epoch": 1.78, - "learning_rate": 3.3253956642164155e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.0001629481493386144, + "loss": 0.0149, "step": 352480 }, { - "epoch": 1.78, - "learning_rate": 3.324638894915014e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001629442611222429, + "loss": 0.0158, "step": 352490 }, { - "epoch": 1.78, - "learning_rate": 3.323882125613613e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016294037290587145, + "loss": 0.0139, "step": 352500 }, { - "epoch": 1.78, - "learning_rate": 3.3231253563122126e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016293648468950002, + "loss": 0.0128, "step": 352510 }, { - "epoch": 1.78, - "learning_rate": 3.3223685870108114e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016293259647312853, + "loss": 0.0172, "step": 352520 }, { - "epoch": 1.78, - "learning_rate": 3.32161181770941e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016292870825675704, + "loss": 0.0123, "step": 352530 }, { - "epoch": 1.78, - "learning_rate": 3.320855048408009e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.00016292482004038559, + "loss": 0.0138, "step": 352540 }, { - "epoch": 1.78, - "learning_rate": 3.3200982791066086e-05, - "loss": 0.0095, + "epoch": 0.91, + "learning_rate": 0.00016292093182401415, + "loss": 0.0185, "step": 352550 }, { - "epoch": 1.78, - "learning_rate": 3.3193415098052074e-05, - "loss": 0.0056, + "epoch": 0.91, + "learning_rate": 0.00016291704360764267, + "loss": 0.0181, "step": 352560 }, { - "epoch": 1.78, - "learning_rate": 3.318584740503806e-05, - "loss": 0.0069, + "epoch": 0.91, + "learning_rate": 0.0001629131553912712, + "loss": 0.0125, "step": 352570 }, { - "epoch": 1.78, - "learning_rate": 3.317827971202405e-05, - "loss": 0.0063, + "epoch": 0.91, + "learning_rate": 0.00016290926717489973, + "loss": 0.017, "step": 352580 }, { - "epoch": 1.78, - "learning_rate": 3.3170712019010045e-05, - "loss": 0.0052, + "epoch": 0.91, + "learning_rate": 0.00016290537895852827, + "loss": 0.0189, "step": 352590 }, { - "epoch": 1.78, - "learning_rate": 3.3163144325996034e-05, - "loss": 0.008, + "epoch": 0.91, + "learning_rate": 0.0001629014907421568, + "loss": 0.015, "step": 352600 }, { - "epoch": 1.78, - "learning_rate": 3.315557663298202e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016289760252578535, + "loss": 0.016, "step": 352610 }, { - "epoch": 1.78, - "learning_rate": 3.314800893996801e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016289371430941386, + "loss": 0.011, "step": 352620 }, { - "epoch": 1.78, - "learning_rate": 3.3140441246954005e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001628898260930424, + "loss": 0.0144, "step": 352630 }, { - "epoch": 1.78, - "learning_rate": 3.3132873553939986e-05, - "loss": 0.007, + "epoch": 0.91, + "learning_rate": 0.00016288593787667095, + "loss": 0.0095, "step": 352640 }, { - "epoch": 1.78, - "learning_rate": 3.312530586092598e-05, - "loss": 0.0043, + "epoch": 0.91, + "learning_rate": 0.0001628820496602995, + "loss": 0.0119, "step": 352650 }, { - "epoch": 1.78, - "learning_rate": 3.311773816791197e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.000162878161443928, + "loss": 0.0111, "step": 352660 }, { - "epoch": 1.78, - "learning_rate": 3.311017047489796e-05, - "loss": 0.0048, + "epoch": 0.91, + "learning_rate": 0.00016287427322755655, + "loss": 0.0159, "step": 352670 }, { - "epoch": 1.78, - "learning_rate": 3.3102602781883946e-05, - "loss": 0.0068, + "epoch": 0.91, + "learning_rate": 0.0001628703850111851, + "loss": 0.0138, "step": 352680 }, { - "epoch": 1.78, - "learning_rate": 3.309503508886994e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016286649679481363, + "loss": 0.0142, "step": 352690 }, { - "epoch": 1.78, - "learning_rate": 3.308746739585593e-05, - "loss": 0.0065, + "epoch": 0.91, + "learning_rate": 0.00016286260857844214, + "loss": 0.0124, "step": 352700 }, { - "epoch": 1.78, - "learning_rate": 3.307989970284192e-05, - "loss": 0.0067, + "epoch": 0.91, + "learning_rate": 0.00016285872036207069, + "loss": 0.0107, "step": 352710 }, { - "epoch": 1.78, - "learning_rate": 3.3072332009827906e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016285483214569925, + "loss": 0.0121, "step": 352720 }, { - "epoch": 1.78, - "learning_rate": 3.30647643168139e-05, - "loss": 0.005, + "epoch": 0.91, + "learning_rate": 0.00016285094392932777, + "loss": 0.0152, "step": 352730 }, { - "epoch": 1.78, - "learning_rate": 3.305719662379989e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.0001628470557129563, + "loss": 0.0126, "step": 352740 }, { - "epoch": 1.78, - "learning_rate": 3.304962893078588e-05, - "loss": 0.0055, + "epoch": 0.91, + "learning_rate": 0.00016284316749658482, + "loss": 0.0114, "step": 352750 }, { - "epoch": 1.78, - "learning_rate": 3.3042061237771865e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.0001628392792802134, + "loss": 0.0123, "step": 352760 }, { - "epoch": 1.78, - "learning_rate": 3.303449354475786e-05, - "loss": 0.0051, + "epoch": 0.91, + "learning_rate": 0.0001628353910638419, + "loss": 0.0154, "step": 352770 }, { - "epoch": 1.78, - "learning_rate": 3.302692585174385e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016283150284747045, + "loss": 0.0162, "step": 352780 }, { - "epoch": 1.78, - "learning_rate": 3.301935815872984e-05, - "loss": 0.0053, + "epoch": 0.91, + "learning_rate": 0.00016282761463109896, + "loss": 0.0139, "step": 352790 }, { - "epoch": 1.78, - "learning_rate": 3.3011790465715825e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016282372641472753, + "loss": 0.0112, "step": 352800 }, { - "epoch": 1.78, - "learning_rate": 3.300422277270181e-05, - "loss": 0.0094, + "epoch": 0.91, + "learning_rate": 0.00016281983819835605, + "loss": 0.014, "step": 352810 }, { - "epoch": 1.78, - "learning_rate": 3.29966550796878e-05, - "loss": 0.0074, + "epoch": 0.91, + "learning_rate": 0.0001628159499819846, + "loss": 0.0126, "step": 352820 }, { - "epoch": 1.78, - "learning_rate": 3.2989087386673796e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.0001628120617656131, + "loss": 0.0196, "step": 352830 }, { - "epoch": 1.78, - "learning_rate": 3.2981519693659785e-05, - "loss": 0.0058, + "epoch": 0.91, + "learning_rate": 0.00016280817354924165, + "loss": 0.0138, "step": 352840 }, { - "epoch": 1.78, - "learning_rate": 3.297395200064577e-05, - "loss": 0.0072, + "epoch": 0.91, + "learning_rate": 0.0001628042853328702, + "loss": 0.0122, "step": 352850 }, { - "epoch": 1.78, - "learning_rate": 3.296638430763176e-05, - "loss": 0.0064, + "epoch": 0.91, + "learning_rate": 0.00016280039711649873, + "loss": 0.015, "step": 352860 }, { - "epoch": 1.78, - "learning_rate": 3.2958816614617756e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016279650890012724, + "loss": 0.0129, "step": 352870 }, { - "epoch": 1.78, - "learning_rate": 3.2951248921603744e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016279262068375578, + "loss": 0.0111, "step": 352880 }, { - "epoch": 1.78, - "learning_rate": 3.294368122858973e-05, - "loss": 0.0049, + "epoch": 0.91, + "learning_rate": 0.00016278873246738435, + "loss": 0.0173, "step": 352890 }, { - "epoch": 1.78, - "learning_rate": 3.293611353557572e-05, - "loss": 0.0062, + "epoch": 0.91, + "learning_rate": 0.00016278484425101287, + "loss": 0.014, "step": 352900 }, { - "epoch": 1.78, - "learning_rate": 3.2928545842561716e-05, - "loss": 0.0092, + "epoch": 0.91, + "learning_rate": 0.0001627809560346414, + "loss": 0.0137, "step": 352910 }, { - "epoch": 1.78, - "learning_rate": 3.2920978149547704e-05, - "loss": 0.0059, + "epoch": 0.91, + "learning_rate": 0.00016277706781826992, + "loss": 0.0107, "step": 352920 }, { - "epoch": 1.78, - "learning_rate": 3.291341045653369e-05, - "loss": 0.0047, + "epoch": 0.91, + "learning_rate": 0.0001627731796018985, + "loss": 0.0155, "step": 352930 }, { - "epoch": 1.78, - "learning_rate": 3.290584276351968e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.000162769291385527, + "loss": 0.0101, "step": 352940 }, { - "epoch": 1.78, - "learning_rate": 3.289827507050567e-05, - "loss": 0.006, + "epoch": 0.91, + "learning_rate": 0.00016276540316915555, + "loss": 0.0157, "step": 352950 }, { - "epoch": 1.78, - "learning_rate": 3.289070737749166e-05, - "loss": 0.0046, + "epoch": 0.91, + "learning_rate": 0.00016276151495278406, + "loss": 0.0117, "step": 352960 }, { - "epoch": 1.78, - "learning_rate": 3.2883139684477645e-05, - "loss": 0.0061, + "epoch": 0.91, + "learning_rate": 0.00016275762673641263, + "loss": 0.0151, "step": 352970 }, { - "epoch": 1.78, - "learning_rate": 3.287557199146364e-05, - "loss": 0.0057, + "epoch": 0.91, + "learning_rate": 0.00016275373852004115, + "loss": 0.0148, "step": 352980 }, { - "epoch": 1.78, - "learning_rate": 3.286800429844963e-05, - "loss": 0.0086, + "epoch": 0.92, + "learning_rate": 0.0001627498503036697, + "loss": 0.0178, "step": 352990 }, { - "epoch": 1.78, - "learning_rate": 3.2860436605435617e-05, - "loss": 0.0081, + "epoch": 0.92, + "learning_rate": 0.0001627459620872982, + "loss": 0.0131, "step": 353000 }, { - "epoch": 1.78, - "eval_cer": 0.9144139729278888, - "eval_loss": 0.0045607974752783775, - "eval_runtime": 116.7751, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.92, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.008378801867365837, + "eval_runtime": 107.4189, + "eval_samples_per_second": 18.619, + "eval_steps_per_second": 4.655, "step": 353000 }, { - "epoch": 1.78, - "learning_rate": 3.2852868912421605e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016274207387092677, + "loss": 0.013, "step": 353010 }, { - "epoch": 1.78, - "learning_rate": 3.28453012194076e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.0001627381856545553, + "loss": 0.0122, "step": 353020 }, { - "epoch": 1.78, - "learning_rate": 3.283773352639359e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016273429743818383, + "loss": 0.0135, "step": 353030 }, { - "epoch": 1.78, - "learning_rate": 3.2830165833379576e-05, - "loss": 0.009, + "epoch": 0.92, + "learning_rate": 0.00016273040922181234, + "loss": 0.0148, "step": 353040 }, { - "epoch": 1.78, - "learning_rate": 3.2822598140365564e-05, - "loss": 0.0079, + "epoch": 0.92, + "learning_rate": 0.0001627265210054409, + "loss": 0.0135, "step": 353050 }, { - "epoch": 1.78, - "learning_rate": 3.281503044735156e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016272263278906945, + "loss": 0.0146, "step": 353060 }, { - "epoch": 1.78, - "learning_rate": 3.280746275433755e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016271874457269797, + "loss": 0.0148, "step": 353070 }, { - "epoch": 1.78, - "learning_rate": 3.2799895061323536e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016271485635632648, + "loss": 0.0171, "step": 353080 }, { - "epoch": 1.78, - "learning_rate": 3.279232736830953e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016271096813995502, + "loss": 0.0113, "step": 353090 }, { - "epoch": 1.78, - "learning_rate": 3.278475967529552e-05, - "loss": 0.0043, + "epoch": 0.92, + "learning_rate": 0.0001627070799235836, + "loss": 0.0168, "step": 353100 }, { - "epoch": 1.78, - "learning_rate": 3.27771919822815e-05, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.0001627031917072121, + "loss": 0.0115, "step": 353110 }, { - "epoch": 1.78, - "learning_rate": 3.2769624289267496e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016269930349084065, + "loss": 0.0141, "step": 353120 }, { - "epoch": 1.78, - "learning_rate": 3.2762056596253484e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016269541527446916, + "loss": 0.0156, "step": 353130 }, { - "epoch": 1.78, - "learning_rate": 3.275448890323947e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016269152705809773, + "loss": 0.0131, "step": 353140 }, { - "epoch": 1.78, - "learning_rate": 3.274692121022546e-05, - "loss": 0.0079, + "epoch": 0.92, + "learning_rate": 0.00016268763884172625, + "loss": 0.0107, "step": 353150 }, { - "epoch": 1.78, - "learning_rate": 3.2739353517211455e-05, - "loss": 0.0156, + "epoch": 0.92, + "learning_rate": 0.0001626837506253548, + "loss": 0.0136, "step": 353160 }, { - "epoch": 1.78, - "learning_rate": 3.273178582419744e-05, - "loss": 0.0114, + "epoch": 0.92, + "learning_rate": 0.0001626798624089833, + "loss": 0.0134, "step": 353170 }, { - "epoch": 1.78, - "learning_rate": 3.272421813118343e-05, - "loss": 0.0084, + "epoch": 0.92, + "learning_rate": 0.00016267597419261187, + "loss": 0.009, "step": 353180 }, { - "epoch": 1.78, - "learning_rate": 3.271665043816942e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.00016267208597624039, + "loss": 0.0111, "step": 353190 }, { - "epoch": 1.78, - "learning_rate": 3.2709082745155415e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016266819775986893, + "loss": 0.0157, "step": 353200 }, { - "epoch": 1.78, - "learning_rate": 3.27015150521414e-05, - "loss": 0.0043, + "epoch": 0.92, + "learning_rate": 0.00016266430954349744, + "loss": 0.0124, "step": 353210 }, { - "epoch": 1.78, - "learning_rate": 3.269394735912739e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.000162660421327126, + "loss": 0.0112, "step": 353220 }, { - "epoch": 1.78, - "learning_rate": 3.268637966611338e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016265653311075453, + "loss": 0.0127, "step": 353230 }, { - "epoch": 1.78, - "learning_rate": 3.2678811973099374e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016265264489438307, + "loss": 0.0172, "step": 353240 }, { - "epoch": 1.78, - "learning_rate": 3.267124428008536e-05, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016264875667801158, + "loss": 0.0131, "step": 353250 }, { - "epoch": 1.78, - "learning_rate": 3.266367658707135e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016264486846164015, + "loss": 0.011, "step": 353260 }, { - "epoch": 1.78, - "learning_rate": 3.265610889405734e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.0001626409802452687, + "loss": 0.0141, "step": 353270 }, { - "epoch": 1.78, - "learning_rate": 3.264854120104333e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.0001626370920288972, + "loss": 0.014, "step": 353280 }, { - "epoch": 1.78, - "learning_rate": 3.2640973508029316e-05, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016263320381252575, + "loss": 0.0171, "step": 353290 }, { - "epoch": 1.78, - "learning_rate": 3.263340581501531e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.0001626293155961543, + "loss": 0.0115, "step": 353300 }, { - "epoch": 1.78, - "learning_rate": 3.26258381220013e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016262542737978283, + "loss": 0.0106, "step": 353310 }, { - "epoch": 1.78, - "learning_rate": 3.261827042898729e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016262153916341135, + "loss": 0.0134, "step": 353320 }, { - "epoch": 1.78, - "learning_rate": 3.2610702735973275e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.0001626176509470399, + "loss": 0.0164, "step": 353330 }, { - "epoch": 1.78, - "learning_rate": 3.260313504295927e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.0001626137627306684, + "loss": 0.0148, "step": 353340 }, { - "epoch": 1.78, - "learning_rate": 3.259556734994526e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016260987451429697, + "loss": 0.0106, "step": 353350 }, { - "epoch": 1.78, - "learning_rate": 3.258799965693125e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016260598629792549, + "loss": 0.014, "step": 353360 }, { - "epoch": 1.78, - "learning_rate": 3.2580431963917235e-05, - "loss": 0.0087, + "epoch": 0.92, + "learning_rate": 0.00016260209808155403, + "loss": 0.0132, "step": 353370 }, { - "epoch": 1.78, - "learning_rate": 3.257286427090323e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016259820986518254, + "loss": 0.0107, "step": 353380 }, { - "epoch": 1.78, - "learning_rate": 3.256529657788922e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001625943216488111, + "loss": 0.017, "step": 353390 }, { - "epoch": 1.78, - "learning_rate": 3.2557728884875206e-05, - "loss": 0.0041, + "epoch": 0.92, + "learning_rate": 0.00016259043343243962, + "loss": 0.0173, "step": 353400 }, { - "epoch": 1.78, - "learning_rate": 3.2550161191861195e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016258654521606817, + "loss": 0.0128, "step": 353410 }, { - "epoch": 1.78, - "learning_rate": 3.254259349884719e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016258265699969668, + "loss": 0.0138, "step": 353420 }, { - "epoch": 1.78, - "learning_rate": 3.253502580583317e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016257876878332525, + "loss": 0.0146, "step": 353430 }, { - "epoch": 1.78, - "learning_rate": 3.2527458112819166e-05, - "loss": 0.0035, + "epoch": 0.92, + "learning_rate": 0.0001625748805669538, + "loss": 0.016, "step": 353440 }, { - "epoch": 1.78, - "learning_rate": 3.2519890419805154e-05, - "loss": 0.0087, + "epoch": 0.92, + "learning_rate": 0.0001625709923505823, + "loss": 0.0113, "step": 353450 }, { - "epoch": 1.78, - "learning_rate": 3.251232272679114e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016256710413421085, + "loss": 0.0134, "step": 353460 }, { - "epoch": 1.78, - "learning_rate": 3.250475503377713e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.0001625632159178394, + "loss": 0.0123, "step": 353470 }, { - "epoch": 1.78, - "learning_rate": 3.2497187340763126e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016255932770146793, + "loss": 0.0156, "step": 353480 }, { - "epoch": 1.78, - "learning_rate": 3.2489619647749114e-05, - "loss": 0.0078, + "epoch": 0.92, + "learning_rate": 0.00016255543948509645, + "loss": 0.0127, "step": 353490 }, { - "epoch": 1.78, - "learning_rate": 3.24820519547351e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.000162551551268725, + "loss": 0.0143, "step": 353500 }, { - "epoch": 1.78, - "learning_rate": 3.247448426172109e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.00016254766305235353, + "loss": 0.0148, "step": 353510 }, { - "epoch": 1.78, - "learning_rate": 3.2466916568707085e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016254377483598207, + "loss": 0.0143, "step": 353520 }, { - "epoch": 1.78, - "learning_rate": 3.2459348875693073e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016253988661961058, + "loss": 0.0136, "step": 353530 }, { - "epoch": 1.78, - "learning_rate": 3.245178118267906e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016253599840323913, + "loss": 0.0148, "step": 353540 }, { - "epoch": 1.78, - "learning_rate": 3.244421348966505e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016253211018686767, + "loss": 0.0122, "step": 353550 }, { - "epoch": 1.78, - "learning_rate": 3.2436645796651045e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.0001625282219704962, + "loss": 0.0133, "step": 353560 }, { - "epoch": 1.78, - "learning_rate": 3.242907810363703e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016252433375412472, + "loss": 0.0122, "step": 353570 }, { - "epoch": 1.78, - "learning_rate": 3.242151041062302e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016252044553775327, + "loss": 0.0129, "step": 353580 }, { - "epoch": 1.78, - "learning_rate": 3.241394271760901e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016251655732138178, + "loss": 0.014, "step": 353590 }, { - "epoch": 1.78, - "learning_rate": 3.2406375024595e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016251266910501035, + "loss": 0.0157, "step": 353600 }, { - "epoch": 1.78, - "learning_rate": 3.2398807331580986e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001625087808886389, + "loss": 0.0113, "step": 353610 }, { - "epoch": 1.78, - "learning_rate": 3.239123963856698e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001625048926722674, + "loss": 0.0153, "step": 353620 }, { - "epoch": 1.78, - "learning_rate": 3.238367194555297e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016250100445589595, + "loss": 0.0147, "step": 353630 }, { - "epoch": 1.78, - "learning_rate": 3.237610425253896e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.0001624971162395245, + "loss": 0.0154, "step": 353640 }, { - "epoch": 1.78, - "learning_rate": 3.2368536559524946e-05, - "loss": 0.0085, + "epoch": 0.92, + "learning_rate": 0.00016249322802315303, + "loss": 0.0154, "step": 353650 }, { - "epoch": 1.78, - "learning_rate": 3.236096886651094e-05, - "loss": 0.0094, + "epoch": 0.92, + "learning_rate": 0.00016248933980678154, + "loss": 0.0105, "step": 353660 }, { - "epoch": 1.78, - "learning_rate": 3.235340117349693e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016248545159041009, + "loss": 0.012, "step": 353670 }, { - "epoch": 1.78, - "learning_rate": 3.234583348048292e-05, - "loss": 0.0042, + "epoch": 0.92, + "learning_rate": 0.00016248156337403863, + "loss": 0.0156, "step": 353680 }, { - "epoch": 1.78, - "learning_rate": 3.2338265787468905e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016247767515766717, + "loss": 0.0128, "step": 353690 }, { - "epoch": 1.78, - "learning_rate": 3.23306980944549e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016247378694129568, + "loss": 0.0139, "step": 353700 }, { - "epoch": 1.78, - "learning_rate": 3.232313040144089e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016246989872492423, + "loss": 0.0119, "step": 353710 }, { - "epoch": 1.78, - "learning_rate": 3.231556270842688e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016246601050855277, + "loss": 0.0174, "step": 353720 }, { - "epoch": 1.78, - "learning_rate": 3.2307995015412865e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.0001624621222921813, + "loss": 0.0117, "step": 353730 }, { - "epoch": 1.78, - "learning_rate": 3.230042732239885e-05, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016245823407580982, + "loss": 0.012, "step": 353740 }, { - "epoch": 1.78, - "learning_rate": 3.229285962938484e-05, - "loss": 0.0079, + "epoch": 0.92, + "learning_rate": 0.00016245434585943837, + "loss": 0.0131, "step": 353750 }, { - "epoch": 1.78, - "learning_rate": 3.228529193637083e-05, - "loss": 0.0043, + "epoch": 0.92, + "learning_rate": 0.00016245045764306693, + "loss": 0.0145, "step": 353760 }, { - "epoch": 1.78, - "learning_rate": 3.2277724243356825e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016244656942669545, + "loss": 0.01, "step": 353770 }, { - "epoch": 1.78, - "learning_rate": 3.227015655034281e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.000162442681210324, + "loss": 0.0111, "step": 353780 }, { - "epoch": 1.78, - "learning_rate": 3.22625888573288e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001624387929939525, + "loss": 0.0151, "step": 353790 }, { - "epoch": 1.78, - "learning_rate": 3.2255021164314796e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016243490477758107, + "loss": 0.0142, "step": 353800 }, { - "epoch": 1.79, - "learning_rate": 3.2247453471300784e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.0001624310165612096, + "loss": 0.0167, "step": 353810 }, { - "epoch": 1.79, - "learning_rate": 3.223988577828677e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016242712834483813, + "loss": 0.0112, "step": 353820 }, { - "epoch": 1.79, - "learning_rate": 3.223231808527276e-05, - "loss": 0.0085, + "epoch": 0.92, + "learning_rate": 0.00016242324012846664, + "loss": 0.0156, "step": 353830 }, { - "epoch": 1.79, - "learning_rate": 3.2224750392258756e-05, - "loss": 0.0033, + "epoch": 0.92, + "learning_rate": 0.00016241935191209519, + "loss": 0.013, "step": 353840 }, { - "epoch": 1.79, - "learning_rate": 3.2217182699244744e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016241546369572373, + "loss": 0.0118, "step": 353850 }, { - "epoch": 1.79, - "learning_rate": 3.220961500623073e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016241157547935227, + "loss": 0.0149, "step": 353860 }, { - "epoch": 1.79, - "learning_rate": 3.220204731321672e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016240768726298078, + "loss": 0.0106, "step": 353870 }, { - "epoch": 1.79, - "learning_rate": 3.2194479620202715e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.00016240379904660933, + "loss": 0.0146, "step": 353880 }, { - "epoch": 1.79, - "learning_rate": 3.2186911927188704e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016239991083023787, + "loss": 0.0116, "step": 353890 }, { - "epoch": 1.79, - "learning_rate": 3.2179344234174685e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001623960226138664, + "loss": 0.0115, "step": 353900 }, { - "epoch": 1.79, - "learning_rate": 3.217177654116068e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016239213439749492, + "loss": 0.0154, "step": 353910 }, { - "epoch": 1.79, - "learning_rate": 3.216420884814667e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016238824618112346, + "loss": 0.0144, "step": 353920 }, { - "epoch": 1.79, - "learning_rate": 3.2156641155132656e-05, - "loss": 0.0081, + "epoch": 0.92, + "learning_rate": 0.00016238435796475203, + "loss": 0.0148, "step": 353930 }, { - "epoch": 1.79, - "learning_rate": 3.2149073462118645e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016238046974838055, + "loss": 0.0112, "step": 353940 }, { - "epoch": 1.79, - "learning_rate": 3.214150576910464e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016237658153200906, + "loss": 0.0122, "step": 353950 }, { - "epoch": 1.79, - "learning_rate": 3.213393807609063e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001623726933156376, + "loss": 0.0114, "step": 353960 }, { - "epoch": 1.79, - "learning_rate": 3.2126370383076616e-05, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016236880509926617, + "loss": 0.0136, "step": 353970 }, { - "epoch": 1.79, - "learning_rate": 3.2118802690062604e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.0001623649168828947, + "loss": 0.0154, "step": 353980 }, { - "epoch": 1.79, - "learning_rate": 3.21112349970486e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.00016236102866652323, + "loss": 0.0127, "step": 353990 }, { - "epoch": 1.79, - "learning_rate": 3.210366730403459e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016235714045015174, + "loss": 0.0125, "step": 354000 }, { - "epoch": 1.79, - "eval_cer": 0.9144197953046413, - "eval_loss": 0.004529756028205156, - "eval_runtime": 116.782, - "eval_samples_per_second": 17.126, - "eval_steps_per_second": 4.281, + "epoch": 0.92, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.008665827102959156, + "eval_runtime": 107.3976, + "eval_samples_per_second": 18.622, + "eval_steps_per_second": 4.656, "step": 354000 }, { - "epoch": 1.79, - "learning_rate": 3.2096099611020576e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.0001623532522337803, + "loss": 0.0149, "step": 354010 }, { - "epoch": 1.79, - "learning_rate": 3.2088531918006564e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016234936401740883, + "loss": 0.0122, "step": 354020 }, { - "epoch": 1.79, - "learning_rate": 3.208096422499256e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016234547580103737, + "loss": 0.0127, "step": 354030 }, { - "epoch": 1.79, - "learning_rate": 3.207339653197855e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016234158758466588, + "loss": 0.014, "step": 354040 }, { - "epoch": 1.79, - "learning_rate": 3.2065828838964535e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016233769936829442, + "loss": 0.0109, "step": 354050 }, { - "epoch": 1.79, - "learning_rate": 3.2058261145950524e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016233381115192297, + "loss": 0.016, "step": 354060 }, { - "epoch": 1.79, - "learning_rate": 3.205069345293651e-05, - "loss": 0.0078, + "epoch": 0.92, + "learning_rate": 0.0001623299229355515, + "loss": 0.011, "step": 354070 }, { - "epoch": 1.79, - "learning_rate": 3.20431257599225e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016232603471918002, + "loss": 0.0137, "step": 354080 }, { - "epoch": 1.79, - "learning_rate": 3.2035558066908495e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016232214650280856, + "loss": 0.0117, "step": 354090 }, { - "epoch": 1.79, - "learning_rate": 3.202799037389448e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016231825828643713, + "loss": 0.0103, "step": 354100 }, { - "epoch": 1.79, - "learning_rate": 3.202042268088047e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016231437007006565, + "loss": 0.0125, "step": 354110 }, { - "epoch": 1.79, - "learning_rate": 3.201285498786646e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016231048185369416, + "loss": 0.0132, "step": 354120 }, { - "epoch": 1.79, - "learning_rate": 3.2005287294852455e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.0001623065936373227, + "loss": 0.0113, "step": 354130 }, { - "epoch": 1.79, - "learning_rate": 3.199771960183844e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016230270542095127, + "loss": 0.014, "step": 354140 }, { - "epoch": 1.79, - "learning_rate": 3.199015190882443e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001622988172045798, + "loss": 0.0105, "step": 354150 }, { - "epoch": 1.79, - "learning_rate": 3.198258421581042e-05, - "loss": 0.0113, + "epoch": 0.92, + "learning_rate": 0.00016229492898820833, + "loss": 0.0103, "step": 354160 }, { - "epoch": 1.79, - "learning_rate": 3.1975016522796414e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016229104077183684, + "loss": 0.0125, "step": 354170 }, { - "epoch": 1.79, - "learning_rate": 3.19674488297824e-05, - "loss": 0.0082, + "epoch": 0.92, + "learning_rate": 0.0001622871525554654, + "loss": 0.011, "step": 354180 }, { - "epoch": 1.79, - "learning_rate": 3.195988113676839e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016228326433909393, + "loss": 0.0128, "step": 354190 }, { - "epoch": 1.79, - "learning_rate": 3.195231344375438e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016227937612272247, + "loss": 0.014, "step": 354200 }, { - "epoch": 1.79, - "learning_rate": 3.194474575074037e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016227548790635098, + "loss": 0.0125, "step": 354210 }, { - "epoch": 1.79, - "learning_rate": 3.1937178057726355e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016227159968997955, + "loss": 0.0143, "step": 354220 }, { - "epoch": 1.79, - "learning_rate": 3.192961036471235e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016226771147360807, + "loss": 0.0128, "step": 354230 }, { - "epoch": 1.79, - "learning_rate": 3.192204267169834e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.0001622638232572366, + "loss": 0.0104, "step": 354240 }, { - "epoch": 1.79, - "learning_rate": 3.191447497868433e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016225993504086512, + "loss": 0.011, "step": 354250 }, { - "epoch": 1.79, - "learning_rate": 3.1906907285670315e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001622560468244937, + "loss": 0.0111, "step": 354260 }, { - "epoch": 1.79, - "learning_rate": 3.189933959265631e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.0001622521586081222, + "loss": 0.0128, "step": 354270 }, { - "epoch": 1.79, - "learning_rate": 3.18917718996423e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016224827039175075, + "loss": 0.013, "step": 354280 }, { - "epoch": 1.79, - "learning_rate": 3.1884204206628287e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016224438217537926, + "loss": 0.0156, "step": 354290 }, { - "epoch": 1.79, - "learning_rate": 3.1876636513614275e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.0001622404939590078, + "loss": 0.0145, "step": 354300 }, { - "epoch": 1.79, - "learning_rate": 3.186906882060027e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016223660574263637, + "loss": 0.0128, "step": 354310 }, { - "epoch": 1.79, - "learning_rate": 3.186150112758626e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016223271752626489, + "loss": 0.0131, "step": 354320 }, { - "epoch": 1.79, - "learning_rate": 3.1853933434572246e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016222882930989343, + "loss": 0.0111, "step": 354330 }, { - "epoch": 1.79, - "learning_rate": 3.1846365741558234e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016222494109352194, + "loss": 0.0137, "step": 354340 }, { - "epoch": 1.79, - "learning_rate": 3.183879804854423e-05, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.0001622210528771505, + "loss": 0.016, "step": 354350 }, { - "epoch": 1.79, - "learning_rate": 3.183123035553022e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016221716466077903, + "loss": 0.012, "step": 354360 }, { - "epoch": 1.79, - "learning_rate": 3.1823662662516206e-05, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016221327644440757, + "loss": 0.012, "step": 354370 }, { - "epoch": 1.79, - "learning_rate": 3.1816094969502194e-05, - "loss": 0.0086, + "epoch": 0.92, + "learning_rate": 0.00016220938822803608, + "loss": 0.0124, "step": 354380 }, { - "epoch": 1.79, - "learning_rate": 3.180852727648818e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016220550001166465, + "loss": 0.0101, "step": 354390 }, { - "epoch": 1.79, - "learning_rate": 3.180095958347417e-05, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016220161179529317, + "loss": 0.012, "step": 354400 }, { - "epoch": 1.79, - "learning_rate": 3.1793391890460165e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.0001621977235789217, + "loss": 0.0133, "step": 354410 }, { - "epoch": 1.79, - "learning_rate": 3.1785824197446154e-05, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.00016219383536255022, + "loss": 0.0108, "step": 354420 }, { - "epoch": 1.79, - "learning_rate": 3.177825650443214e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.0001621899471461788, + "loss": 0.0124, "step": 354430 }, { - "epoch": 1.79, - "learning_rate": 3.177068881141813e-05, - "loss": 0.0068, + "epoch": 0.92, + "learning_rate": 0.0001621860589298073, + "loss": 0.0134, "step": 354440 }, { - "epoch": 1.79, - "learning_rate": 3.1763121118404125e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016218217071343585, + "loss": 0.0121, "step": 354450 }, { - "epoch": 1.79, - "learning_rate": 3.175555342539011e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016217828249706436, + "loss": 0.0106, "step": 354460 }, { - "epoch": 1.79, - "learning_rate": 3.17479857323761e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016217439428069293, + "loss": 0.0139, "step": 354470 }, { - "epoch": 1.79, - "learning_rate": 3.174041803936209e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016217050606432147, + "loss": 0.0178, "step": 354480 }, { - "epoch": 1.79, - "learning_rate": 3.1732850346348085e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016216661784794999, + "loss": 0.0159, "step": 354490 }, { - "epoch": 1.79, - "learning_rate": 3.172528265333407e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016216272963157853, + "loss": 0.0123, "step": 354500 }, { - "epoch": 1.79, - "learning_rate": 3.171771496032006e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016215884141520707, + "loss": 0.0156, "step": 354510 }, { - "epoch": 1.79, - "learning_rate": 3.171014726730605e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.0001621549531988356, + "loss": 0.0145, "step": 354520 }, { - "epoch": 1.79, - "learning_rate": 3.170257957429204e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016215106498246413, + "loss": 0.0115, "step": 354530 }, { - "epoch": 1.79, - "learning_rate": 3.1695011881278026e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016214717676609267, + "loss": 0.0113, "step": 354540 }, { - "epoch": 1.79, - "learning_rate": 3.168744418826402e-05, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.00016214328854972118, + "loss": 0.0106, "step": 354550 }, { - "epoch": 1.79, - "learning_rate": 3.167987649525001e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016213940033334975, + "loss": 0.0155, "step": 354560 }, { - "epoch": 1.79, - "learning_rate": 3.1672308802236e-05, - "loss": 0.004, + "epoch": 0.92, + "learning_rate": 0.00016213551211697826, + "loss": 0.0129, "step": 354570 }, { - "epoch": 1.79, - "learning_rate": 3.1664741109221986e-05, - "loss": 0.0068, + "epoch": 0.92, + "learning_rate": 0.0001621316239006068, + "loss": 0.014, "step": 354580 }, { - "epoch": 1.79, - "learning_rate": 3.165717341620798e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016212773568423532, + "loss": 0.0099, "step": 354590 }, { - "epoch": 1.79, - "learning_rate": 3.164960572319397e-05, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.0001621238474678639, + "loss": 0.018, "step": 354600 }, { - "epoch": 1.79, - "learning_rate": 3.164203803017996e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.0001621199592514924, + "loss": 0.0125, "step": 354610 }, { - "epoch": 1.79, - "learning_rate": 3.1634470337165945e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016211607103512095, + "loss": 0.0151, "step": 354620 }, { - "epoch": 1.79, - "learning_rate": 3.162690264415194e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016211218281874946, + "loss": 0.0129, "step": 354630 }, { - "epoch": 1.79, - "learning_rate": 3.161933495113793e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016210829460237803, + "loss": 0.0156, "step": 354640 }, { - "epoch": 1.79, - "learning_rate": 3.1611767258123917e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016210440638600657, + "loss": 0.0119, "step": 354650 }, { - "epoch": 1.79, - "learning_rate": 3.1604199565109905e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016210051816963509, + "loss": 0.014, "step": 354660 }, { - "epoch": 1.79, - "learning_rate": 3.15966318720959e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.0001620966299532636, + "loss": 0.0199, "step": 354670 }, { - "epoch": 1.79, - "learning_rate": 3.158906417908188e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016209274173689217, + "loss": 0.0124, "step": 354680 }, { - "epoch": 1.79, - "learning_rate": 3.158149648606787e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.0001620888535205207, + "loss": 0.0132, "step": 354690 }, { - "epoch": 1.79, - "learning_rate": 3.1573928793053864e-05, - "loss": 0.0069, + "epoch": 0.92, + "learning_rate": 0.00016208496530414922, + "loss": 0.0135, "step": 354700 }, { - "epoch": 1.79, - "learning_rate": 3.156636110003985e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016208107708777777, + "loss": 0.0136, "step": 354710 }, { - "epoch": 1.79, - "learning_rate": 3.155879340702584e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.0001620771888714063, + "loss": 0.0111, "step": 354720 }, { - "epoch": 1.79, - "learning_rate": 3.155122571401183e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016207330065503485, + "loss": 0.0119, "step": 354730 }, { - "epoch": 1.79, - "learning_rate": 3.1543658020997824e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016206941243866336, + "loss": 0.0146, "step": 354740 }, { - "epoch": 1.79, - "learning_rate": 3.153609032798381e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.0001620655242222919, + "loss": 0.0138, "step": 354750 }, { - "epoch": 1.79, - "learning_rate": 3.15285226349698e-05, - "loss": 0.0087, + "epoch": 0.92, + "learning_rate": 0.00016206163600592045, + "loss": 0.0143, "step": 354760 }, { - "epoch": 1.79, - "learning_rate": 3.1520954941955796e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.000162057747789549, + "loss": 0.0127, "step": 354770 }, { - "epoch": 1.79, - "learning_rate": 3.1513387248941784e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.0001620538595731775, + "loss": 0.0126, "step": 354780 }, { - "epoch": 1.79, - "learning_rate": 3.150581955592777e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.00016204997135680605, + "loss": 0.0139, "step": 354790 }, { - "epoch": 1.79, - "learning_rate": 3.149825186291376e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016204608314043456, + "loss": 0.0114, "step": 354800 }, { - "epoch": 1.79, - "learning_rate": 3.1490684169899755e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016204219492406313, + "loss": 0.0151, "step": 354810 }, { - "epoch": 1.79, - "learning_rate": 3.1483116476885743e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016203830670769164, + "loss": 0.0123, "step": 354820 }, { - "epoch": 1.79, - "learning_rate": 3.147554878387173e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016203441849132018, + "loss": 0.0137, "step": 354830 }, { - "epoch": 1.79, - "learning_rate": 3.146798109085772e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.0001620305302749487, + "loss": 0.0121, "step": 354840 }, { - "epoch": 1.79, - "learning_rate": 3.146041339784371e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016202664205857727, + "loss": 0.0167, "step": 354850 }, { - "epoch": 1.79, - "learning_rate": 3.1452845704829696e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.0001620227538422058, + "loss": 0.0114, "step": 354860 }, { - "epoch": 1.79, - "learning_rate": 3.1445278011815685e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016201886562583432, + "loss": 0.0126, "step": 354870 }, { - "epoch": 1.79, - "learning_rate": 3.143771031880168e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016201497740946287, + "loss": 0.0157, "step": 354880 }, { - "epoch": 1.79, - "learning_rate": 3.143014262578767e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.0001620110891930914, + "loss": 0.0117, "step": 354890 }, { - "epoch": 1.79, - "learning_rate": 3.1422574932773656e-05, - "loss": 0.008, + "epoch": 0.92, + "learning_rate": 0.00016200720097671995, + "loss": 0.0128, "step": 354900 }, { - "epoch": 1.79, - "learning_rate": 3.1415007239759644e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016200331276034846, + "loss": 0.0117, "step": 354910 }, { - "epoch": 1.79, - "learning_rate": 3.140743954674564e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.000161999424543977, + "loss": 0.0104, "step": 354920 }, { - "epoch": 1.79, - "learning_rate": 3.139987185373163e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016199553632760555, + "loss": 0.0147, "step": 354930 }, { - "epoch": 1.79, - "learning_rate": 3.1392304160717616e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001619916481112341, + "loss": 0.0124, "step": 354940 }, { - "epoch": 1.79, - "learning_rate": 3.1384736467703604e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.0001619877598948626, + "loss": 0.0166, "step": 354950 }, { - "epoch": 1.79, - "learning_rate": 3.13771687746896e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016198387167849114, + "loss": 0.009, "step": 354960 }, { - "epoch": 1.79, - "learning_rate": 3.136960108167559e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.0001619799834621197, + "loss": 0.0144, "step": 354970 }, { - "epoch": 1.79, - "learning_rate": 3.1362033388661575e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016197609524574823, + "loss": 0.0111, "step": 354980 }, { - "epoch": 1.79, - "learning_rate": 3.1354465695647563e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016197220702937674, + "loss": 0.0142, "step": 354990 }, { - "epoch": 1.79, - "learning_rate": 3.134689800263355e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016196831881300528, + "loss": 0.009, "step": 355000 }, { - "epoch": 1.79, - "eval_cer": 0.9144265880775191, - "eval_loss": 0.004483331926167011, - "eval_runtime": 116.7694, - "eval_samples_per_second": 17.128, - "eval_steps_per_second": 4.282, + "epoch": 0.92, + "eval_cer": 0.8817362776095881, + "eval_loss": 0.008503294549882412, + "eval_runtime": 107.342, + "eval_samples_per_second": 18.632, + "eval_steps_per_second": 4.658, "step": 355000 }, { - "epoch": 1.79, - "learning_rate": 3.133933030961954e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016196443059663385, + "loss": 0.0141, "step": 355010 }, { - "epoch": 1.79, - "learning_rate": 3.1331762616605535e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016196054238026237, + "loss": 0.0128, "step": 355020 }, { - "epoch": 1.79, - "learning_rate": 3.132419492359152e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.0001619566541638909, + "loss": 0.0149, "step": 355030 }, { - "epoch": 1.79, - "learning_rate": 3.131662723057751e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.00016195276594751942, + "loss": 0.0188, "step": 355040 }, { - "epoch": 1.79, - "learning_rate": 3.13090595375635e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016194887773114797, + "loss": 0.016, "step": 355050 }, { - "epoch": 1.79, - "learning_rate": 3.1301491844549495e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.0001619449895147765, + "loss": 0.0166, "step": 355060 }, { - "epoch": 1.79, - "learning_rate": 3.129392415153548e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016194110129840505, + "loss": 0.0111, "step": 355070 }, { - "epoch": 1.79, - "learning_rate": 3.128635645852147e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016193721308203356, + "loss": 0.0151, "step": 355080 }, { - "epoch": 1.79, - "learning_rate": 3.127878876550746e-05, - "loss": 0.0088, + "epoch": 0.92, + "learning_rate": 0.0001619333248656621, + "loss": 0.0161, "step": 355090 }, { - "epoch": 1.79, - "learning_rate": 3.1271221072493454e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016192943664929065, + "loss": 0.0102, "step": 355100 }, { - "epoch": 1.79, - "learning_rate": 3.126365337947944e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.0001619255484329192, + "loss": 0.0149, "step": 355110 }, { - "epoch": 1.79, - "learning_rate": 3.125608568646543e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.0001619216602165477, + "loss": 0.0139, "step": 355120 }, { - "epoch": 1.79, - "learning_rate": 3.124851799345142e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016191777200017624, + "loss": 0.0128, "step": 355130 }, { - "epoch": 1.79, - "learning_rate": 3.1240950300437414e-05, - "loss": 0.0042, + "epoch": 0.92, + "learning_rate": 0.00016191388378380479, + "loss": 0.0138, "step": 355140 }, { - "epoch": 1.79, - "learning_rate": 3.1233382607423395e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016190999556743333, + "loss": 0.0144, "step": 355150 }, { - "epoch": 1.79, - "learning_rate": 3.122581491440939e-05, - "loss": 0.0043, + "epoch": 0.92, + "learning_rate": 0.00016190610735106184, + "loss": 0.0154, "step": 355160 }, { - "epoch": 1.79, - "learning_rate": 3.121824722139538e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016190221913469038, + "loss": 0.0107, "step": 355170 }, { - "epoch": 1.79, - "learning_rate": 3.121067952838137e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.00016189833091831895, + "loss": 0.0125, "step": 355180 }, { - "epoch": 1.79, - "learning_rate": 3.1203111835367355e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016189444270194747, + "loss": 0.0169, "step": 355190 }, { - "epoch": 1.79, - "learning_rate": 3.119554414235335e-05, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.000161890554485576, + "loss": 0.017, "step": 355200 }, { - "epoch": 1.79, - "learning_rate": 3.118797644933934e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016188666626920452, + "loss": 0.012, "step": 355210 }, { - "epoch": 1.79, - "learning_rate": 3.1180408756325326e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.0001618827780528331, + "loss": 0.0109, "step": 355220 }, { - "epoch": 1.79, - "learning_rate": 3.1172841063311315e-05, - "loss": 0.0076, + "epoch": 0.92, + "learning_rate": 0.0001618788898364616, + "loss": 0.0107, "step": 355230 }, { - "epoch": 1.79, - "learning_rate": 3.116527337029731e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016187500162009015, + "loss": 0.0145, "step": 355240 }, { - "epoch": 1.79, - "learning_rate": 3.11577056772833e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016187111340371866, + "loss": 0.0137, "step": 355250 }, { - "epoch": 1.79, - "learning_rate": 3.1150137984269286e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016186722518734723, + "loss": 0.0119, "step": 355260 }, { - "epoch": 1.79, - "learning_rate": 3.1142570291255274e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016186333697097575, + "loss": 0.0117, "step": 355270 }, { - "epoch": 1.79, - "learning_rate": 3.113500259824127e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.0001618594487546043, + "loss": 0.0153, "step": 355280 }, { - "epoch": 1.79, - "learning_rate": 3.112743490522726e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001618555605382328, + "loss": 0.0158, "step": 355290 }, { - "epoch": 1.79, - "learning_rate": 3.1119867212213246e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.00016185167232186134, + "loss": 0.0111, "step": 355300 }, { - "epoch": 1.79, - "learning_rate": 3.1112299519199234e-05, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.00016184778410548989, + "loss": 0.0133, "step": 355310 }, { - "epoch": 1.79, - "learning_rate": 3.110473182618522e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016184389588911843, + "loss": 0.0114, "step": 355320 }, { - "epoch": 1.79, - "learning_rate": 3.109716413317121e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016184000767274694, + "loss": 0.0124, "step": 355330 }, { - "epoch": 1.79, - "learning_rate": 3.1089596440157205e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016183611945637548, + "loss": 0.0182, "step": 355340 }, { - "epoch": 1.79, - "learning_rate": 3.1082028747143194e-05, - "loss": 0.0032, + "epoch": 0.92, + "learning_rate": 0.00016183223124000405, + "loss": 0.0121, "step": 355350 }, { - "epoch": 1.79, - "learning_rate": 3.107446105412918e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016182834302363257, + "loss": 0.0144, "step": 355360 }, { - "epoch": 1.79, - "learning_rate": 3.106689336111517e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.0001618244548072611, + "loss": 0.0114, "step": 355370 }, { - "epoch": 1.79, - "learning_rate": 3.1059325668101165e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016182056659088962, + "loss": 0.0119, "step": 355380 }, { - "epoch": 1.79, - "learning_rate": 3.105175797508715e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.0001618166783745182, + "loss": 0.0098, "step": 355390 }, { - "epoch": 1.79, - "learning_rate": 3.104419028207314e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.0001618127901581467, + "loss": 0.0154, "step": 355400 }, { - "epoch": 1.79, - "learning_rate": 3.103662258905913e-05, - "loss": 0.009, + "epoch": 0.92, + "learning_rate": 0.00016180890194177525, + "loss": 0.0128, "step": 355410 }, { - "epoch": 1.79, - "learning_rate": 3.1029054896045125e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016180501372540376, + "loss": 0.0148, "step": 355420 }, { - "epoch": 1.79, - "learning_rate": 3.102148720303111e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016180112550903233, + "loss": 0.0137, "step": 355430 }, { - "epoch": 1.79, - "learning_rate": 3.10139195100171e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016179723729266084, + "loss": 0.0139, "step": 355440 }, { - "epoch": 1.79, - "learning_rate": 3.100635181700309e-05, - "loss": 0.0083, + "epoch": 0.92, + "learning_rate": 0.0001617933490762894, + "loss": 0.0124, "step": 355450 }, { - "epoch": 1.79, - "learning_rate": 3.0998784123989084e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.0001617894608599179, + "loss": 0.0155, "step": 355460 }, { - "epoch": 1.79, - "learning_rate": 3.0991216430975066e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016178557264354647, + "loss": 0.0142, "step": 355470 }, { - "epoch": 1.79, - "learning_rate": 3.098364873796106e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.00016178168442717498, + "loss": 0.015, "step": 355480 }, { - "epoch": 1.79, - "learning_rate": 3.097608104494705e-05, - "loss": 0.0093, + "epoch": 0.92, + "learning_rate": 0.00016177779621080353, + "loss": 0.0158, "step": 355490 }, { - "epoch": 1.79, - "learning_rate": 3.096851335193304e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016177390799443204, + "loss": 0.0152, "step": 355500 }, { - "epoch": 1.79, - "learning_rate": 3.0960945658919025e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001617700197780606, + "loss": 0.0135, "step": 355510 }, { - "epoch": 1.79, - "learning_rate": 3.095337796590502e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016176613156168915, + "loss": 0.0104, "step": 355520 }, { - "epoch": 1.79, - "learning_rate": 3.094581027289101e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016176224334531767, + "loss": 0.0118, "step": 355530 }, { - "epoch": 1.79, - "learning_rate": 3.0938242579877e-05, - "loss": 0.0074, + "epoch": 0.92, + "learning_rate": 0.00016175835512894618, + "loss": 0.0156, "step": 355540 }, { - "epoch": 1.79, - "learning_rate": 3.0930674886862985e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016175446691257472, + "loss": 0.0143, "step": 355550 }, { - "epoch": 1.79, - "learning_rate": 3.092310719384898e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.0001617505786962033, + "loss": 0.0153, "step": 355560 }, { - "epoch": 1.79, - "learning_rate": 3.091553950083497e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.0001617466904798318, + "loss": 0.0164, "step": 355570 }, { - "epoch": 1.79, - "learning_rate": 3.0907971807820956e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.00016174280226346035, + "loss": 0.0132, "step": 355580 }, { - "epoch": 1.79, - "learning_rate": 3.0900404114806945e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016173891404708886, + "loss": 0.0148, "step": 355590 }, { - "epoch": 1.79, - "learning_rate": 3.089283642179294e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016173502583071743, + "loss": 0.0115, "step": 355600 }, { - "epoch": 1.79, - "learning_rate": 3.088526872877893e-05, - "loss": 0.009, + "epoch": 0.92, + "learning_rate": 0.00016173113761434594, + "loss": 0.0105, "step": 355610 }, { - "epoch": 1.79, - "learning_rate": 3.0877701035764916e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016172724939797449, + "loss": 0.0128, "step": 355620 }, { - "epoch": 1.79, - "learning_rate": 3.0870133342750904e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.000161723361181603, + "loss": 0.0136, "step": 355630 }, { - "epoch": 1.79, - "learning_rate": 3.086256564973689e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016171947296523157, + "loss": 0.013, "step": 355640 }, { - "epoch": 1.79, - "learning_rate": 3.085499795672288e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016171558474886008, + "loss": 0.0126, "step": 355650 }, { - "epoch": 1.79, - "learning_rate": 3.084743026370887e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016171169653248863, + "loss": 0.0146, "step": 355660 }, { - "epoch": 1.79, - "learning_rate": 3.0839862570694864e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016170780831611714, + "loss": 0.0101, "step": 355670 }, { - "epoch": 1.79, - "learning_rate": 3.083229487768085e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001617039200997457, + "loss": 0.0146, "step": 355680 }, { - "epoch": 1.79, - "learning_rate": 3.082472718466684e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016170003188337425, + "loss": 0.0143, "step": 355690 }, { - "epoch": 1.79, - "learning_rate": 3.081715949165283e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016169614366700276, + "loss": 0.014, "step": 355700 }, { - "epoch": 1.79, - "learning_rate": 3.0809591798638824e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016169225545063128, + "loss": 0.0133, "step": 355710 }, { - "epoch": 1.79, - "learning_rate": 3.080202410562481e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016168836723425985, + "loss": 0.0122, "step": 355720 }, { - "epoch": 1.79, - "learning_rate": 3.07944564126108e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.0001616844790178884, + "loss": 0.0131, "step": 355730 }, { - "epoch": 1.79, - "learning_rate": 3.0786888719596795e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.0001616805908015169, + "loss": 0.0109, "step": 355740 }, { - "epoch": 1.79, - "learning_rate": 3.077932102658278e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016167670258514545, + "loss": 0.0131, "step": 355750 }, { - "epoch": 1.79, - "learning_rate": 3.077175333356877e-05, - "loss": 0.007, + "epoch": 0.92, + "learning_rate": 0.000161672814368774, + "loss": 0.0121, "step": 355760 }, { - "epoch": 1.79, - "learning_rate": 3.076418564055476e-05, - "loss": 0.0086, + "epoch": 0.92, + "learning_rate": 0.00016166892615240253, + "loss": 0.0123, "step": 355770 }, { - "epoch": 1.79, - "learning_rate": 3.075661794754075e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016166503793603104, + "loss": 0.0149, "step": 355780 }, { - "epoch": 1.79, - "learning_rate": 3.0749050254526736e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016166114971965959, + "loss": 0.0147, "step": 355790 }, { - "epoch": 1.8, - "learning_rate": 3.0741482561512724e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.0001616572615032881, + "loss": 0.0123, "step": 355800 }, { - "epoch": 1.8, - "learning_rate": 3.073391486849872e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016165337328691667, + "loss": 0.0111, "step": 355810 }, { - "epoch": 1.8, - "learning_rate": 3.072634717548471e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016164948507054518, + "loss": 0.012, "step": 355820 }, { - "epoch": 1.8, - "learning_rate": 3.0718779482470696e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016164559685417372, + "loss": 0.0122, "step": 355830 }, { - "epoch": 1.8, - "learning_rate": 3.0711211789456684e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016164170863780224, + "loss": 0.0148, "step": 355840 }, { - "epoch": 1.8, - "learning_rate": 3.070364409644268e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.0001616378204214308, + "loss": 0.0149, "step": 355850 }, { - "epoch": 1.8, - "learning_rate": 3.069607640342867e-05, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.00016163393220505932, + "loss": 0.011, "step": 355860 }, { - "epoch": 1.8, - "learning_rate": 3.0688508710414655e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016163004398868786, + "loss": 0.0142, "step": 355870 }, { - "epoch": 1.8, - "learning_rate": 3.0680941017400644e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016162615577231638, + "loss": 0.0138, "step": 355880 }, { - "epoch": 1.8, - "learning_rate": 3.067337332438664e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016162226755594495, + "loss": 0.0164, "step": 355890 }, { - "epoch": 1.8, - "learning_rate": 3.066580563137263e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.0001616183793395735, + "loss": 0.0146, "step": 355900 }, { - "epoch": 1.8, - "learning_rate": 3.0658237938358615e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.000161614491123202, + "loss": 0.0126, "step": 355910 }, { - "epoch": 1.8, - "learning_rate": 3.06506702453446e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016161060290683055, + "loss": 0.0131, "step": 355920 }, { - "epoch": 1.8, - "learning_rate": 3.06431025523306e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001616067146904591, + "loss": 0.0144, "step": 355930 }, { - "epoch": 1.8, - "learning_rate": 3.063553485931658e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016160282647408763, + "loss": 0.0118, "step": 355940 }, { - "epoch": 1.8, - "learning_rate": 3.0627967166302575e-05, - "loss": 0.0045, + "epoch": 0.92, + "learning_rate": 0.00016159893825771614, + "loss": 0.0135, "step": 355950 }, { - "epoch": 1.8, - "learning_rate": 3.062039947328856e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016159505004134468, + "loss": 0.0165, "step": 355960 }, { - "epoch": 1.8, - "learning_rate": 3.061283178027455e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016159116182497323, + "loss": 0.0143, "step": 355970 }, { - "epoch": 1.8, - "learning_rate": 3.060526408726054e-05, - "loss": 0.0086, + "epoch": 0.92, + "learning_rate": 0.00016158727360860177, + "loss": 0.0174, "step": 355980 }, { - "epoch": 1.8, - "learning_rate": 3.0597696394246534e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016158338539223028, + "loss": 0.0144, "step": 355990 }, { - "epoch": 1.8, - "learning_rate": 3.059012870123252e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016157949717585882, + "loss": 0.0134, "step": 356000 }, { - "epoch": 1.8, - "eval_cer": 0.9144130025317635, - "eval_loss": 0.0044956691563129425, - "eval_runtime": 116.7755, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.92, + "eval_cer": 0.8817866645392185, + "eval_loss": 0.008485401049256325, + "eval_runtime": 107.1956, + "eval_samples_per_second": 18.657, + "eval_steps_per_second": 4.664, "step": 356000 }, { - "epoch": 1.8, - "learning_rate": 3.058256100821851e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.00016157560895948737, + "loss": 0.0088, "step": 356010 }, { - "epoch": 1.8, - "learning_rate": 3.05749933152045e-05, - "loss": 0.0055, - "step": 356020 + "epoch": 0.92, + "learning_rate": 0.0001615717207431159, + "loss": 0.0102, + "step": 356020 }, { - "epoch": 1.8, - "learning_rate": 3.0567425622190494e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016156783252674442, + "loss": 0.0121, "step": 356030 }, { - "epoch": 1.8, - "learning_rate": 3.055985792917648e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016156394431037296, + "loss": 0.0107, "step": 356040 }, { - "epoch": 1.8, - "learning_rate": 3.055229023616247e-05, - "loss": 0.0087, + "epoch": 0.92, + "learning_rate": 0.00016156005609400148, + "loss": 0.014, "step": 356050 }, { - "epoch": 1.8, - "learning_rate": 3.054472254314846e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016155616787763005, + "loss": 0.0128, "step": 356060 }, { - "epoch": 1.8, - "learning_rate": 3.0537154850134454e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.0001615522796612586, + "loss": 0.0145, "step": 356070 }, { - "epoch": 1.8, - "learning_rate": 3.052958715712044e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.0001615483914448871, + "loss": 0.0113, "step": 356080 }, { - "epoch": 1.8, - "learning_rate": 3.052201946410643e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016154450322851564, + "loss": 0.0111, "step": 356090 }, { - "epoch": 1.8, - "learning_rate": 3.051445177109242e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001615406150121442, + "loss": 0.0108, "step": 356100 }, { - "epoch": 1.8, - "learning_rate": 3.0506884078078407e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016153672679577273, + "loss": 0.0139, "step": 356110 }, { - "epoch": 1.8, - "learning_rate": 3.0499316385064398e-05, - "loss": 0.0046, + "epoch": 0.92, + "learning_rate": 0.00016153283857940124, + "loss": 0.013, "step": 356120 }, { - "epoch": 1.8, - "learning_rate": 3.0491748692050386e-05, - "loss": 0.0079, + "epoch": 0.92, + "learning_rate": 0.00016152895036302978, + "loss": 0.0129, "step": 356130 }, { - "epoch": 1.8, - "learning_rate": 3.0484180999036378e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016152506214665833, + "loss": 0.014, "step": 356140 }, { - "epoch": 1.8, - "learning_rate": 3.0476613306022366e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016152117393028687, + "loss": 0.0145, "step": 356150 }, { - "epoch": 1.8, - "learning_rate": 3.0469045613008358e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016151728571391538, + "loss": 0.0112, "step": 356160 }, { - "epoch": 1.8, - "learning_rate": 3.0461477919994346e-05, - "loss": 0.0083, + "epoch": 0.92, + "learning_rate": 0.00016151339749754392, + "loss": 0.0135, "step": 356170 }, { - "epoch": 1.8, - "learning_rate": 3.0453910226980338e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016150950928117247, + "loss": 0.0147, "step": 356180 }, { - "epoch": 1.8, - "learning_rate": 3.0446342533966326e-05, - "loss": 0.004, + "epoch": 0.92, + "learning_rate": 0.000161505621064801, + "loss": 0.0162, "step": 356190 }, { - "epoch": 1.8, - "learning_rate": 3.0438774840952318e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016150173284842952, + "loss": 0.0141, "step": 356200 }, { - "epoch": 1.8, - "learning_rate": 3.0431207147938306e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016149784463205806, + "loss": 0.0155, "step": 356210 }, { - "epoch": 1.8, - "learning_rate": 3.0423639454924297e-05, - "loss": 0.0064, + "epoch": 0.92, + "learning_rate": 0.00016149395641568663, + "loss": 0.0152, "step": 356220 }, { - "epoch": 1.8, - "learning_rate": 3.0416071761910286e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016149006819931515, + "loss": 0.0137, "step": 356230 }, { - "epoch": 1.8, - "learning_rate": 3.0408504068896277e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.0001614861799829437, + "loss": 0.0111, "step": 356240 }, { - "epoch": 1.8, - "learning_rate": 3.0400936375882262e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.0001614822917665722, + "loss": 0.0192, "step": 356250 }, { - "epoch": 1.8, - "learning_rate": 3.0393368682868254e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016147840355020077, + "loss": 0.0119, "step": 356260 }, { - "epoch": 1.8, - "learning_rate": 3.0385800989854242e-05, - "loss": 0.0048, + "epoch": 0.92, + "learning_rate": 0.00016147451533382929, + "loss": 0.0128, "step": 356270 }, { - "epoch": 1.8, - "learning_rate": 3.0378233296840233e-05, + "epoch": 0.92, + "learning_rate": 0.00016147062711745783, "loss": 0.0092, "step": 356280 }, { - "epoch": 1.8, - "learning_rate": 3.037066560382622e-05, - "loss": 0.0062, + "epoch": 0.92, + "learning_rate": 0.00016146673890108634, + "loss": 0.0122, "step": 356290 }, { - "epoch": 1.8, - "learning_rate": 3.0363097910812213e-05, - "loss": 0.0042, + "epoch": 0.92, + "learning_rate": 0.00016146285068471488, + "loss": 0.0162, "step": 356300 }, { - "epoch": 1.8, - "learning_rate": 3.03555302177982e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016145896246834343, + "loss": 0.0155, "step": 356310 }, { - "epoch": 1.8, - "learning_rate": 3.0347962524784193e-05, - "loss": 0.0077, + "epoch": 0.92, + "learning_rate": 0.00016145507425197197, + "loss": 0.0152, "step": 356320 }, { - "epoch": 1.8, - "learning_rate": 3.034039483177018e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016145118603560048, + "loss": 0.011, "step": 356330 }, { - "epoch": 1.8, - "learning_rate": 3.0332827138756173e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016144729781922902, + "loss": 0.0124, "step": 356340 }, { - "epoch": 1.8, - "learning_rate": 3.032525944574216e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016144340960285756, + "loss": 0.0136, "step": 356350 }, { - "epoch": 1.8, - "learning_rate": 3.0317691752728153e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.0001614395213864861, + "loss": 0.0117, "step": 356360 }, { - "epoch": 1.8, - "learning_rate": 3.031012405971414e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016143563317011462, + "loss": 0.0131, "step": 356370 }, { - "epoch": 1.8, - "learning_rate": 3.0302556366700133e-05, - "loss": 0.0091, + "epoch": 0.92, + "learning_rate": 0.00016143174495374316, + "loss": 0.0122, "step": 356380 }, { - "epoch": 1.8, - "learning_rate": 3.029498867368612e-05, - "loss": 0.0079, + "epoch": 0.92, + "learning_rate": 0.00016142785673737173, + "loss": 0.0122, "step": 356390 }, { - "epoch": 1.8, - "learning_rate": 3.0287420980672112e-05, - "loss": 0.0073, + "epoch": 0.92, + "learning_rate": 0.00016142396852100025, + "loss": 0.0112, "step": 356400 }, { - "epoch": 1.8, - "learning_rate": 3.0279853287658097e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016142008030462876, + "loss": 0.0181, "step": 356410 }, { - "epoch": 1.8, - "learning_rate": 3.0272285594644085e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.0001614161920882573, + "loss": 0.011, "step": 356420 }, { - "epoch": 1.8, - "learning_rate": 3.0264717901630077e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016141230387188587, + "loss": 0.0125, "step": 356430 }, { - "epoch": 1.8, - "learning_rate": 3.0257150208616065e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016140841565551439, + "loss": 0.0095, "step": 356440 }, { - "epoch": 1.8, - "learning_rate": 3.0249582515602057e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016140452743914293, + "loss": 0.014, "step": 356450 }, { - "epoch": 1.8, - "learning_rate": 3.024201482258805e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016140063922277144, + "loss": 0.0138, "step": 356460 }, { - "epoch": 1.8, - "learning_rate": 3.0234447129574037e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.0001613967510064, + "loss": 0.0123, "step": 356470 }, { - "epoch": 1.8, - "learning_rate": 3.0226879436560028e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016139286279002852, + "loss": 0.0144, "step": 356480 }, { - "epoch": 1.8, - "learning_rate": 3.0219311743546017e-05, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.00016138897457365707, + "loss": 0.013, "step": 356490 }, { - "epoch": 1.8, - "learning_rate": 3.0211744050532008e-05, - "loss": 0.004, + "epoch": 0.92, + "learning_rate": 0.00016138508635728558, + "loss": 0.0127, "step": 356500 }, { - "epoch": 1.8, - "learning_rate": 3.0204176357517996e-05, - "loss": 0.0067, + "epoch": 0.92, + "learning_rate": 0.00016138119814091415, + "loss": 0.0125, "step": 356510 }, { - "epoch": 1.8, - "learning_rate": 3.0196608664503988e-05, - "loss": 0.0055, + "epoch": 0.92, + "learning_rate": 0.00016137730992454266, + "loss": 0.0116, "step": 356520 }, { - "epoch": 1.8, - "learning_rate": 3.0189040971489976e-05, - "loss": 0.0104, + "epoch": 0.92, + "learning_rate": 0.0001613734217081712, + "loss": 0.014, "step": 356530 }, { - "epoch": 1.8, - "learning_rate": 3.0181473278475968e-05, - "loss": 0.0058, + "epoch": 0.92, + "learning_rate": 0.00016136953349179972, + "loss": 0.0114, "step": 356540 }, { - "epoch": 1.8, - "learning_rate": 3.0173905585461956e-05, - "loss": 0.0038, + "epoch": 0.92, + "learning_rate": 0.00016136564527542826, + "loss": 0.0116, "step": 356550 }, { - "epoch": 1.8, - "learning_rate": 3.0166337892447948e-05, - "loss": 0.0057, + "epoch": 0.92, + "learning_rate": 0.00016136175705905683, + "loss": 0.0134, "step": 356560 }, { - "epoch": 1.8, - "learning_rate": 3.0158770199433932e-05, - "loss": 0.0031, + "epoch": 0.92, + "learning_rate": 0.00016135786884268535, + "loss": 0.0133, "step": 356570 }, { - "epoch": 1.8, - "learning_rate": 3.015120250641992e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016135398062631386, + "loss": 0.0159, "step": 356580 }, { - "epoch": 1.8, - "learning_rate": 3.0143634813405912e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.0001613500924099424, + "loss": 0.0167, "step": 356590 }, { - "epoch": 1.8, - "learning_rate": 3.01360671203919e-05, - "loss": 0.0049, + "epoch": 0.92, + "learning_rate": 0.00016134620419357097, + "loss": 0.011, "step": 356600 }, { - "epoch": 1.8, - "learning_rate": 3.0128499427377892e-05, - "loss": 0.0063, + "epoch": 0.92, + "learning_rate": 0.00016134231597719948, + "loss": 0.0139, "step": 356610 }, { - "epoch": 1.8, - "learning_rate": 3.012093173436388e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016133842776082803, + "loss": 0.0125, "step": 356620 }, { - "epoch": 1.8, - "learning_rate": 3.0113364041349872e-05, - "loss": 0.006, + "epoch": 0.92, + "learning_rate": 0.00016133453954445654, + "loss": 0.0137, "step": 356630 }, { - "epoch": 1.8, - "learning_rate": 3.010579634833586e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.0001613306513280851, + "loss": 0.0111, "step": 356640 }, { - "epoch": 1.8, - "learning_rate": 3.0098228655321852e-05, - "loss": 0.0052, + "epoch": 0.92, + "learning_rate": 0.00016132676311171362, + "loss": 0.0158, "step": 356650 }, { - "epoch": 1.8, - "learning_rate": 3.009066096230784e-05, - "loss": 0.0044, + "epoch": 0.92, + "learning_rate": 0.00016132287489534217, + "loss": 0.0134, "step": 356660 }, { - "epoch": 1.8, - "learning_rate": 3.008309326929383e-05, - "loss": 0.0072, + "epoch": 0.92, + "learning_rate": 0.00016131898667897068, + "loss": 0.0137, "step": 356670 }, { - "epoch": 1.8, - "learning_rate": 3.007552557627982e-05, - "loss": 0.0056, + "epoch": 0.92, + "learning_rate": 0.00016131509846259925, + "loss": 0.0145, "step": 356680 }, { - "epoch": 1.8, - "learning_rate": 3.006795788326581e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.00016131121024622776, + "loss": 0.0143, "step": 356690 }, { - "epoch": 1.8, - "learning_rate": 3.00603901902518e-05, - "loss": 0.0054, + "epoch": 0.92, + "learning_rate": 0.0001613073220298563, + "loss": 0.0128, "step": 356700 }, { - "epoch": 1.8, - "learning_rate": 3.005282249723779e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.00016130343381348482, + "loss": 0.0098, "step": 356710 }, { - "epoch": 1.8, - "learning_rate": 3.0045254804223783e-05, - "loss": 0.0075, + "epoch": 0.92, + "learning_rate": 0.0001612995455971134, + "loss": 0.01, "step": 356720 }, { - "epoch": 1.8, - "learning_rate": 3.0037687111209768e-05, - "loss": 0.0047, + "epoch": 0.92, + "learning_rate": 0.0001612956573807419, + "loss": 0.014, "step": 356730 }, { - "epoch": 1.8, - "learning_rate": 3.0030119418195756e-05, - "loss": 0.0061, + "epoch": 0.92, + "learning_rate": 0.00016129176916437044, + "loss": 0.0142, "step": 356740 }, { - "epoch": 1.8, - "learning_rate": 3.0022551725181747e-05, - "loss": 0.0066, + "epoch": 0.92, + "learning_rate": 0.00016128788094799896, + "loss": 0.0126, "step": 356750 }, { - "epoch": 1.8, - "learning_rate": 3.0014984032167736e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016128399273162753, + "loss": 0.0134, "step": 356760 }, { - "epoch": 1.8, - "learning_rate": 3.0007416339153727e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016128010451525607, + "loss": 0.0101, "step": 356770 }, { - "epoch": 1.8, - "learning_rate": 2.9999848646139716e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016127621629888458, + "loss": 0.0123, "step": 356780 }, { - "epoch": 1.8, - "learning_rate": 2.9992280953125707e-05, - "loss": 0.0065, + "epoch": 0.92, + "learning_rate": 0.00016127232808251313, + "loss": 0.0186, "step": 356790 }, { - "epoch": 1.8, - "learning_rate": 2.9984713260111695e-05, - "loss": 0.005, + "epoch": 0.92, + "learning_rate": 0.00016126843986614164, + "loss": 0.0096, "step": 356800 }, { - "epoch": 1.8, - "learning_rate": 2.9977145567097687e-05, - "loss": 0.0071, + "epoch": 0.92, + "learning_rate": 0.0001612645516497702, + "loss": 0.0115, "step": 356810 }, { - "epoch": 1.8, - "learning_rate": 2.9969577874083675e-05, - "loss": 0.0053, + "epoch": 0.92, + "learning_rate": 0.00016126066343339872, + "loss": 0.0134, "step": 356820 }, { - "epoch": 1.8, - "learning_rate": 2.9962010181069667e-05, - "loss": 0.0059, + "epoch": 0.92, + "learning_rate": 0.00016125677521702727, + "loss": 0.0126, "step": 356830 }, { - "epoch": 1.8, - "learning_rate": 2.9954442488055655e-05, - "loss": 0.0051, + "epoch": 0.92, + "learning_rate": 0.00016125288700065578, + "loss": 0.0112, "step": 356840 }, { - "epoch": 1.8, - "learning_rate": 2.9946874795041647e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016124899878428435, + "loss": 0.0135, "step": 356850 }, { - "epoch": 1.8, - "learning_rate": 2.9939307102027635e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016124511056791286, + "loss": 0.013, "step": 356860 }, { - "epoch": 1.8, - "learning_rate": 2.9931739409013626e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.0001612412223515414, + "loss": 0.0126, "step": 356870 }, { - "epoch": 1.8, - "learning_rate": 2.992417171599961e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016123733413516992, + "loss": 0.0109, "step": 356880 }, { - "epoch": 1.8, - "learning_rate": 2.9916604022985603e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.0001612334459187985, + "loss": 0.0139, "step": 356890 }, { - "epoch": 1.8, - "learning_rate": 2.990903632997159e-05, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.000161229557702427, + "loss": 0.0138, "step": 356900 }, { - "epoch": 1.8, - "learning_rate": 2.9901468636957583e-05, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016122566948605554, + "loss": 0.0122, "step": 356910 }, { - "epoch": 1.8, - "learning_rate": 2.989390094394357e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016122178126968406, + "loss": 0.0124, "step": 356920 }, { - "epoch": 1.8, - "learning_rate": 2.9886333250929563e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016121789305331263, + "loss": 0.0132, "step": 356930 }, { - "epoch": 1.8, - "learning_rate": 2.987876555791555e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016121400483694117, + "loss": 0.0147, "step": 356940 }, { - "epoch": 1.8, - "learning_rate": 2.9871197864901542e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016121011662056968, + "loss": 0.0121, "step": 356950 }, { - "epoch": 1.8, - "learning_rate": 2.986363017188753e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.00016120622840419823, + "loss": 0.0113, "step": 356960 }, { - "epoch": 1.8, - "learning_rate": 2.9856062478873522e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016120234018782677, + "loss": 0.0105, "step": 356970 }, { - "epoch": 1.8, - "learning_rate": 2.984849478585951e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.0001611984519714553, + "loss": 0.0153, "step": 356980 }, { - "epoch": 1.8, - "learning_rate": 2.9840927092845502e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016119456375508382, + "loss": 0.0111, "step": 356990 }, { - "epoch": 1.8, - "learning_rate": 2.983335939983149e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016119067553871236, + "loss": 0.0144, "step": 357000 }, { - "epoch": 1.8, - "eval_cer": 0.9144139729278888, - "eval_loss": 0.004504029173403978, - "eval_runtime": 116.8007, - "eval_samples_per_second": 17.123, - "eval_steps_per_second": 4.281, + "epoch": 0.93, + "eval_cer": 0.8817502739789299, + "eval_loss": 0.00885064247995615, + "eval_runtime": 107.1821, + "eval_samples_per_second": 18.66, + "eval_steps_per_second": 4.665, "step": 357000 }, { - "epoch": 1.8, - "learning_rate": 2.9825791706817482e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.0001611867873223409, + "loss": 0.015, "step": 357010 }, { - "epoch": 1.8, - "learning_rate": 2.981822401380347e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016118289910596945, + "loss": 0.0115, "step": 357020 }, { - "epoch": 1.8, - "learning_rate": 2.981065632078946e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016117901088959796, + "loss": 0.0103, "step": 357030 }, { - "epoch": 1.8, - "learning_rate": 2.9803088627775446e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.0001611751226732265, + "loss": 0.0141, "step": 357040 }, { - "epoch": 1.8, - "learning_rate": 2.9795520934761438e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016117123445685502, + "loss": 0.0122, "step": 357050 }, { - "epoch": 1.8, - "learning_rate": 2.9787953241747426e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.0001611673462404836, + "loss": 0.0134, "step": 357060 }, { - "epoch": 1.8, - "learning_rate": 2.9780385548733418e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.0001611634580241121, + "loss": 0.0108, "step": 357070 }, { - "epoch": 1.8, - "learning_rate": 2.9772817855719406e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016115956980774064, + "loss": 0.0118, "step": 357080 }, { - "epoch": 1.8, - "learning_rate": 2.9765250162705398e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016115568159136916, + "loss": 0.015, "step": 357090 }, { - "epoch": 1.8, - "learning_rate": 2.9757682469691386e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016115179337499773, + "loss": 0.0163, "step": 357100 }, { - "epoch": 1.8, - "learning_rate": 2.9750114776677378e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016114790515862627, + "loss": 0.0101, "step": 357110 }, { - "epoch": 1.8, - "learning_rate": 2.9742547083663366e-05, - "loss": 0.0031, + "epoch": 0.93, + "learning_rate": 0.00016114401694225478, + "loss": 0.0138, "step": 357120 }, { - "epoch": 1.8, - "learning_rate": 2.9734979390649357e-05, - "loss": 0.0046, + "epoch": 0.93, + "learning_rate": 0.0001611401287258833, + "loss": 0.0149, "step": 357130 }, { - "epoch": 1.8, - "learning_rate": 2.9727411697635346e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016113624050951187, + "loss": 0.013, "step": 357140 }, { - "epoch": 1.8, - "learning_rate": 2.9719844004621337e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.0001611323522931404, + "loss": 0.0141, "step": 357150 }, { - "epoch": 1.8, - "learning_rate": 2.9712276311607325e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.00016112846407676892, + "loss": 0.0136, "step": 357160 }, { - "epoch": 1.8, - "learning_rate": 2.9704708618593317e-05, - "loss": 0.0084, + "epoch": 0.93, + "learning_rate": 0.00016112457586039746, + "loss": 0.0116, "step": 357170 }, { - "epoch": 1.8, - "learning_rate": 2.9697140925579305e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.000161120687644026, + "loss": 0.0158, "step": 357180 }, { - "epoch": 1.8, - "learning_rate": 2.9689573232565297e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016111679942765455, + "loss": 0.0154, "step": 357190 }, { - "epoch": 1.8, - "learning_rate": 2.968200553955128e-05, - "loss": 0.011, + "epoch": 0.93, + "learning_rate": 0.00016111291121128306, + "loss": 0.012, "step": 357200 }, { - "epoch": 1.8, - "learning_rate": 2.9674437846537273e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.0001611090229949116, + "loss": 0.0133, "step": 357210 }, { - "epoch": 1.8, - "learning_rate": 2.966687015352326e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.00016110513477854015, + "loss": 0.0161, "step": 357220 }, { - "epoch": 1.8, - "learning_rate": 2.9659302460509253e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.0001611012465621687, + "loss": 0.0135, "step": 357230 }, { - "epoch": 1.8, - "learning_rate": 2.965173476749524e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.0001610973583457972, + "loss": 0.0123, "step": 357240 }, { - "epoch": 1.8, - "learning_rate": 2.9644167074481233e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016109347012942574, + "loss": 0.0135, "step": 357250 }, { - "epoch": 1.8, - "learning_rate": 2.963659938146722e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.0001610895819130543, + "loss": 0.0166, "step": 357260 }, { - "epoch": 1.8, - "learning_rate": 2.9629031688453213e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.00016108569369668283, + "loss": 0.0126, "step": 357270 }, { - "epoch": 1.8, - "learning_rate": 2.96214639954392e-05, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016108180548031137, + "loss": 0.0111, "step": 357280 }, { - "epoch": 1.8, - "learning_rate": 2.9613896302425193e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016107791726393988, + "loss": 0.0132, "step": 357290 }, { - "epoch": 1.8, - "learning_rate": 2.960632860941118e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.0001610740290475684, + "loss": 0.0121, "step": 357300 }, { - "epoch": 1.8, - "learning_rate": 2.9598760916397172e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016107014083119697, + "loss": 0.0116, "step": 357310 }, { - "epoch": 1.8, - "learning_rate": 2.959119322338316e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.0001610662526148255, + "loss": 0.0136, "step": 357320 }, { - "epoch": 1.8, - "learning_rate": 2.9583625530369152e-05, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00016106236439845402, + "loss": 0.0142, "step": 357330 }, { - "epoch": 1.8, - "learning_rate": 2.957605783735514e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016105847618208256, + "loss": 0.0142, "step": 357340 }, { - "epoch": 1.8, - "learning_rate": 2.9568490144341125e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001610545879657111, + "loss": 0.0157, "step": 357350 }, { - "epoch": 1.8, - "learning_rate": 2.9560922451327117e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016105069974933965, + "loss": 0.0148, "step": 357360 }, { - "epoch": 1.8, - "learning_rate": 2.9553354758313105e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016104681153296816, + "loss": 0.0173, "step": 357370 }, { - "epoch": 1.8, - "learning_rate": 2.9545787065299097e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.0001610429233165967, + "loss": 0.0139, "step": 357380 }, { - "epoch": 1.8, - "learning_rate": 2.9538219372285085e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016103903510022524, + "loss": 0.0114, "step": 357390 }, { - "epoch": 1.8, - "learning_rate": 2.9530651679271077e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016103514688385379, + "loss": 0.014, "step": 357400 }, { - "epoch": 1.8, - "learning_rate": 2.9523083986257065e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.0001610312586674823, + "loss": 0.0187, "step": 357410 }, { - "epoch": 1.8, - "learning_rate": 2.9515516293243056e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016102737045111084, + "loss": 0.015, "step": 357420 }, { - "epoch": 1.8, - "learning_rate": 2.9507948600229048e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.0001610234822347394, + "loss": 0.0138, "step": 357430 }, { - "epoch": 1.8, - "learning_rate": 2.9500380907215036e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016101959401836793, + "loss": 0.0131, "step": 357440 }, { - "epoch": 1.8, - "learning_rate": 2.9492813214201028e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016101570580199644, + "loss": 0.0116, "step": 357450 }, { - "epoch": 1.8, - "learning_rate": 2.9485245521187016e-05, - "loss": 0.0084, + "epoch": 0.93, + "learning_rate": 0.00016101181758562498, + "loss": 0.0134, "step": 357460 }, { - "epoch": 1.8, - "learning_rate": 2.9477677828173008e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016100792936925355, + "loss": 0.0096, "step": 357470 }, { - "epoch": 1.8, - "learning_rate": 2.9470110135158996e-05, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016100404115288207, + "loss": 0.0132, "step": 357480 }, { - "epoch": 1.8, - "learning_rate": 2.9462542442144987e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.0001610001529365106, + "loss": 0.0159, "step": 357490 }, { - "epoch": 1.8, - "learning_rate": 2.9454974749130976e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016099626472013912, + "loss": 0.0127, "step": 357500 }, { - "epoch": 1.8, - "learning_rate": 2.944740705611696e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001609923765037677, + "loss": 0.0107, "step": 357510 }, { - "epoch": 1.8, - "learning_rate": 2.9439839363102952e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.0001609884882873962, + "loss": 0.0101, "step": 357520 }, { - "epoch": 1.8, - "learning_rate": 2.943227167008894e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016098460007102475, + "loss": 0.0113, "step": 357530 }, { - "epoch": 1.8, - "learning_rate": 2.9424703977074932e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016098071185465326, + "loss": 0.0164, "step": 357540 }, { - "epoch": 1.8, - "learning_rate": 2.941713628406092e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001609768236382818, + "loss": 0.0089, "step": 357550 }, { - "epoch": 1.8, - "learning_rate": 2.9409568591046912e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016097293542191034, + "loss": 0.012, "step": 357560 }, { - "epoch": 1.8, - "learning_rate": 2.94020008980329e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016096904720553889, + "loss": 0.0131, "step": 357570 }, { - "epoch": 1.8, - "learning_rate": 2.939443320501889e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.0001609651589891674, + "loss": 0.0111, "step": 357580 }, { - "epoch": 1.8, - "learning_rate": 2.938686551200488e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016096127077279594, + "loss": 0.0162, "step": 357590 }, { - "epoch": 1.8, - "learning_rate": 2.937929781899087e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016095738255642448, + "loss": 0.0109, "step": 357600 }, { - "epoch": 1.8, - "learning_rate": 2.937173012597686e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016095349434005303, + "loss": 0.0124, "step": 357610 }, { - "epoch": 1.8, - "learning_rate": 2.936416243296285e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016094960612368154, + "loss": 0.0131, "step": 357620 }, { - "epoch": 1.8, - "learning_rate": 2.935659473994884e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016094571790731008, + "loss": 0.0114, "step": 357630 }, { - "epoch": 1.8, - "learning_rate": 2.934902704693483e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016094182969093865, + "loss": 0.0118, "step": 357640 }, { - "epoch": 1.8, - "learning_rate": 2.934145935392082e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016093794147456716, + "loss": 0.0127, "step": 357650 }, { - "epoch": 1.8, - "learning_rate": 2.933389166090681e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001609340532581957, + "loss": 0.0105, "step": 357660 }, { - "epoch": 1.8, - "learning_rate": 2.9326323967892796e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016093016504182422, + "loss": 0.0109, "step": 357670 }, { - "epoch": 1.8, - "learning_rate": 2.9318756274878787e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.0001609262768254528, + "loss": 0.0103, "step": 357680 }, { - "epoch": 1.8, - "learning_rate": 2.9311188581864776e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001609223886090813, + "loss": 0.0132, "step": 357690 }, { - "epoch": 1.8, - "learning_rate": 2.9303620888850767e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016091850039270985, + "loss": 0.0135, "step": 357700 }, { - "epoch": 1.8, - "learning_rate": 2.9296053195836755e-05, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016091461217633836, + "loss": 0.0124, "step": 357710 }, { - "epoch": 1.8, - "learning_rate": 2.9288485502822747e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016091072395996693, + "loss": 0.0121, "step": 357720 }, { - "epoch": 1.8, - "learning_rate": 2.9280917809808735e-05, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016090683574359544, + "loss": 0.0166, "step": 357730 }, { - "epoch": 1.8, - "learning_rate": 2.9273350116794727e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016090294752722399, + "loss": 0.0168, "step": 357740 }, { - "epoch": 1.8, - "learning_rate": 2.9265782423780715e-05, - "loss": 0.0097, + "epoch": 0.93, + "learning_rate": 0.0001608990593108525, + "loss": 0.0114, "step": 357750 }, { - "epoch": 1.8, - "learning_rate": 2.9258214730766707e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016089517109448107, + "loss": 0.014, "step": 357760 }, { - "epoch": 1.8, - "learning_rate": 2.9250647037752695e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016089128287810958, + "loss": 0.0179, "step": 357770 }, { - "epoch": 1.81, - "learning_rate": 2.9243079344738686e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016088739466173812, + "loss": 0.0119, "step": 357780 }, { - "epoch": 1.81, - "learning_rate": 2.9235511651724675e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016088350644536664, + "loss": 0.013, "step": 357790 }, { - "epoch": 1.81, - "learning_rate": 2.9227943958710666e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016087961822899518, + "loss": 0.0103, "step": 357800 }, { - "epoch": 1.81, - "learning_rate": 2.9220376265696655e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016087573001262375, + "loss": 0.0162, "step": 357810 }, { - "epoch": 1.81, - "learning_rate": 2.9212808572682643e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016087184179625226, + "loss": 0.0127, "step": 357820 }, { - "epoch": 1.81, - "learning_rate": 2.920524087966863e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.0001608679535798808, + "loss": 0.0128, "step": 357830 }, { - "epoch": 1.81, - "learning_rate": 2.9197673186654623e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016086406536350932, + "loss": 0.0129, "step": 357840 }, { - "epoch": 1.81, - "learning_rate": 2.919010549364061e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.0001608601771471379, + "loss": 0.0133, "step": 357850 }, { - "epoch": 1.81, - "learning_rate": 2.9182537800626602e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.0001608562889307664, + "loss": 0.0147, "step": 357860 }, { - "epoch": 1.81, - "learning_rate": 2.917497010761259e-05, - "loss": 0.0075, + "epoch": 0.93, + "learning_rate": 0.00016085240071439495, + "loss": 0.0126, "step": 357870 }, { - "epoch": 1.81, - "learning_rate": 2.9167402414598582e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016084851249802346, + "loss": 0.0151, "step": 357880 }, { - "epoch": 1.81, - "learning_rate": 2.915983472158457e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016084462428165203, + "loss": 0.0101, "step": 357890 }, { - "epoch": 1.81, - "learning_rate": 2.9152267028570562e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016084073606528054, + "loss": 0.0136, "step": 357900 }, { - "epoch": 1.81, - "learning_rate": 2.914469933555655e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016083684784890908, + "loss": 0.0187, "step": 357910 }, { - "epoch": 1.81, - "learning_rate": 2.9137131642542542e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001608329596325376, + "loss": 0.0147, "step": 357920 }, { - "epoch": 1.81, - "learning_rate": 2.912956394952853e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016082907141616617, + "loss": 0.0147, "step": 357930 }, { - "epoch": 1.81, - "learning_rate": 2.912199625651452e-05, - "loss": 0.0075, + "epoch": 0.93, + "learning_rate": 0.00016082518319979468, + "loss": 0.0133, "step": 357940 }, { - "epoch": 1.81, - "learning_rate": 2.911442856350051e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016082129498342322, + "loss": 0.0143, "step": 357950 }, { - "epoch": 1.81, - "learning_rate": 2.91068608704865e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016081740676705174, + "loss": 0.0129, "step": 357960 }, { - "epoch": 1.81, - "learning_rate": 2.909929317747249e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.0001608135185506803, + "loss": 0.0101, "step": 357970 }, { - "epoch": 1.81, - "learning_rate": 2.9091725484458478e-05, - "loss": 0.0036, + "epoch": 0.93, + "learning_rate": 0.00016080963033430885, + "loss": 0.0133, "step": 357980 }, { - "epoch": 1.81, - "learning_rate": 2.9084157791444466e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016080574211793736, + "loss": 0.012, "step": 357990 }, { - "epoch": 1.81, - "learning_rate": 2.9076590098430458e-05, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016080185390156588, + "loss": 0.0095, "step": 358000 }, { - "epoch": 1.81, - "eval_cer": 0.9144353216426477, - "eval_loss": 0.004471032880246639, - "eval_runtime": 116.5217, - "eval_samples_per_second": 17.164, - "eval_steps_per_second": 4.291, + "epoch": 0.93, + "eval_cer": 0.8817642703482717, + "eval_loss": 0.008927177637815475, + "eval_runtime": 107.5563, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, "step": 358000 }, { - "epoch": 1.81, - "learning_rate": 2.9069022405416446e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016079796568519445, + "loss": 0.0095, "step": 358010 }, { - "epoch": 1.81, - "learning_rate": 2.9061454712402438e-05, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.000160794077468823, + "loss": 0.0112, "step": 358020 }, { - "epoch": 1.81, - "learning_rate": 2.9053887019388426e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.0001607901892524515, + "loss": 0.01, "step": 358030 }, { - "epoch": 1.81, - "learning_rate": 2.9046319326374417e-05, - "loss": 0.0092, + "epoch": 0.93, + "learning_rate": 0.00016078630103608004, + "loss": 0.0125, "step": 358040 }, { - "epoch": 1.81, - "learning_rate": 2.9038751633360406e-05, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.00016078241281970856, + "loss": 0.0134, "step": 358050 }, { - "epoch": 1.81, - "learning_rate": 2.9031183940346397e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016077852460333713, + "loss": 0.015, "step": 358060 }, { - "epoch": 1.81, - "learning_rate": 2.9023616247332385e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016077463638696564, + "loss": 0.0113, "step": 358070 }, { - "epoch": 1.81, - "learning_rate": 2.9016048554318377e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016077074817059418, + "loss": 0.013, "step": 358080 }, { - "epoch": 1.81, - "learning_rate": 2.9008480861304365e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.0001607668599542227, + "loss": 0.0105, "step": 358090 }, { - "epoch": 1.81, - "learning_rate": 2.9000913168290357e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016076297173785127, + "loss": 0.012, "step": 358100 }, { - "epoch": 1.81, - "learning_rate": 2.8993345475276345e-05, - "loss": 0.0092, + "epoch": 0.93, + "learning_rate": 0.00016075908352147978, + "loss": 0.0129, "step": 358110 }, { - "epoch": 1.81, - "learning_rate": 2.8985777782262337e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016075519530510832, + "loss": 0.0113, "step": 358120 }, { - "epoch": 1.81, - "learning_rate": 2.8978210089248325e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016075130708873684, + "loss": 0.0114, "step": 358130 }, { - "epoch": 1.81, - "learning_rate": 2.8970642396234313e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.0001607474188723654, + "loss": 0.0146, "step": 358140 }, { - "epoch": 1.81, - "learning_rate": 2.89630747032203e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016074353065599395, + "loss": 0.0135, "step": 358150 }, { - "epoch": 1.81, - "learning_rate": 2.8955507010206293e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.00016073964243962246, + "loss": 0.0132, "step": 358160 }, { - "epoch": 1.81, - "learning_rate": 2.894793931719228e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016073575422325098, + "loss": 0.0162, "step": 358170 }, { - "epoch": 1.81, - "learning_rate": 2.8940371624178273e-05, - "loss": 0.0078, + "epoch": 0.93, + "learning_rate": 0.00016073186600687955, + "loss": 0.0136, "step": 358180 }, { - "epoch": 1.81, - "learning_rate": 2.893280393116426e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.0001607279777905081, + "loss": 0.0139, "step": 358190 }, { - "epoch": 1.81, - "learning_rate": 2.8925236238150253e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001607240895741366, + "loss": 0.0115, "step": 358200 }, { - "epoch": 1.81, - "learning_rate": 2.891766854513624e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016072020135776514, + "loss": 0.0126, "step": 358210 }, { - "epoch": 1.81, - "learning_rate": 2.8910100852122232e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016071631314139369, + "loss": 0.0143, "step": 358220 }, { - "epoch": 1.81, - "learning_rate": 2.890253315910822e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016071242492502223, + "loss": 0.0112, "step": 358230 }, { - "epoch": 1.81, - "learning_rate": 2.8894965466094212e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016070853670865074, + "loss": 0.0115, "step": 358240 }, { - "epoch": 1.81, - "learning_rate": 2.88873977730802e-05, - "loss": 0.0075, + "epoch": 0.93, + "learning_rate": 0.00016070464849227928, + "loss": 0.0125, "step": 358250 }, { - "epoch": 1.81, - "learning_rate": 2.8879830080066192e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016070076027590783, + "loss": 0.0158, "step": 358260 }, { - "epoch": 1.81, - "learning_rate": 2.887226238705218e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016069687205953637, + "loss": 0.0132, "step": 358270 }, { - "epoch": 1.81, - "learning_rate": 2.8864694694038172e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016069298384316488, + "loss": 0.0114, "step": 358280 }, { - "epoch": 1.81, - "learning_rate": 2.885712700102416e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016068909562679342, + "loss": 0.0124, "step": 358290 }, { - "epoch": 1.81, - "learning_rate": 2.8849559308010145e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016068520741042194, + "loss": 0.0133, "step": 358300 }, { - "epoch": 1.81, - "learning_rate": 2.8841991614996137e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.0001606813191940505, + "loss": 0.0114, "step": 358310 }, { - "epoch": 1.81, - "learning_rate": 2.8834423921982125e-05, - "loss": 0.0038, + "epoch": 0.93, + "learning_rate": 0.00016067743097767902, + "loss": 0.0123, "step": 358320 }, { - "epoch": 1.81, - "learning_rate": 2.8826856228968116e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016067354276130756, + "loss": 0.0141, "step": 358330 }, { - "epoch": 1.81, - "learning_rate": 2.8819288535954105e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016066965454493608, + "loss": 0.0102, "step": 358340 }, { - "epoch": 1.81, - "learning_rate": 2.8811720842940096e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016066576632856465, + "loss": 0.0156, "step": 358350 }, { - "epoch": 1.81, - "learning_rate": 2.8804153149926084e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.0001606618781121932, + "loss": 0.013, "step": 358360 }, { - "epoch": 1.81, - "learning_rate": 2.8796585456912076e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001606579898958217, + "loss": 0.0217, "step": 358370 }, { - "epoch": 1.81, - "learning_rate": 2.8789017763898064e-05, - "loss": 0.0081, + "epoch": 0.93, + "learning_rate": 0.00016065410167945024, + "loss": 0.0167, "step": 358380 }, { - "epoch": 1.81, - "learning_rate": 2.8781450070884056e-05, - "loss": 0.0075, + "epoch": 0.93, + "learning_rate": 0.00016065021346307878, + "loss": 0.0123, "step": 358390 }, { - "epoch": 1.81, - "learning_rate": 2.8773882377870048e-05, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016064632524670733, + "loss": 0.0099, "step": 358400 }, { - "epoch": 1.81, - "learning_rate": 2.8766314684856036e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016064243703033584, + "loss": 0.0133, "step": 358410 }, { - "epoch": 1.81, - "learning_rate": 2.8758746991842027e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016063854881396438, + "loss": 0.0134, "step": 358420 }, { - "epoch": 1.81, - "learning_rate": 2.8751179298828016e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016063466059759292, + "loss": 0.0125, "step": 358430 }, { - "epoch": 1.81, - "learning_rate": 2.8743611605814007e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016063077238122147, + "loss": 0.0113, "step": 358440 }, { - "epoch": 1.81, - "learning_rate": 2.8736043912799992e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016062688416484998, + "loss": 0.0135, "step": 358450 }, { - "epoch": 1.81, - "learning_rate": 2.872847621978598e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016062299594847852, + "loss": 0.0128, "step": 358460 }, { - "epoch": 1.81, - "learning_rate": 2.8720908526771972e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016061910773210706, + "loss": 0.0109, "step": 358470 }, { - "epoch": 1.81, - "learning_rate": 2.871334083375796e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001606152195157356, + "loss": 0.0161, "step": 358480 }, { - "epoch": 1.81, - "learning_rate": 2.870577314074395e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016061133129936412, + "loss": 0.0134, "step": 358490 }, { - "epoch": 1.81, - "learning_rate": 2.869820544772994e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00016060744308299266, + "loss": 0.0147, "step": 358500 }, { - "epoch": 1.81, - "learning_rate": 2.869063775471593e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016060355486662123, + "loss": 0.0138, "step": 358510 }, { - "epoch": 1.81, - "learning_rate": 2.868307006170192e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00016059966665024974, + "loss": 0.0176, "step": 358520 }, { - "epoch": 1.81, - "learning_rate": 2.867550236868791e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.0001605957784338783, + "loss": 0.0138, "step": 358530 }, { - "epoch": 1.81, - "learning_rate": 2.86679346756739e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.0001605918902175068, + "loss": 0.0121, "step": 358540 }, { - "epoch": 1.81, - "learning_rate": 2.866036698265989e-05, - "loss": 0.0046, + "epoch": 0.93, + "learning_rate": 0.00016058800200113534, + "loss": 0.0113, "step": 358550 }, { - "epoch": 1.81, - "learning_rate": 2.865279928964588e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016058411378476388, + "loss": 0.0141, "step": 358560 }, { - "epoch": 1.81, - "learning_rate": 2.864523159663187e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016058022556839243, + "loss": 0.011, "step": 358570 }, { - "epoch": 1.81, - "learning_rate": 2.863766390361786e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016057633735202094, + "loss": 0.0112, "step": 358580 }, { - "epoch": 1.81, - "learning_rate": 2.863009621060385e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016057244913564948, + "loss": 0.0109, "step": 358590 }, { - "epoch": 1.81, - "learning_rate": 2.862252851758984e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016056856091927802, + "loss": 0.0105, "step": 358600 }, { - "epoch": 1.81, - "learning_rate": 2.8614960824575827e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.00016056467270290657, + "loss": 0.0111, "step": 358610 }, { - "epoch": 1.81, - "learning_rate": 2.8607393131561815e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00016056078448653508, + "loss": 0.0109, "step": 358620 }, { - "epoch": 1.81, - "learning_rate": 2.8599825438547807e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.00016055689627016362, + "loss": 0.0127, "step": 358630 }, { - "epoch": 1.81, - "learning_rate": 2.8592257745533795e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016055300805379216, + "loss": 0.0119, "step": 358640 }, { - "epoch": 1.81, - "learning_rate": 2.8584690052519787e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.0001605491198374207, + "loss": 0.0124, "step": 358650 }, { - "epoch": 1.81, - "learning_rate": 2.8577122359505775e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016054523162104922, + "loss": 0.0147, "step": 358660 }, { - "epoch": 1.81, - "learning_rate": 2.8569554666491767e-05, - "loss": 0.0071, + "epoch": 0.93, + "learning_rate": 0.00016054134340467776, + "loss": 0.0149, "step": 358670 }, { - "epoch": 1.81, - "learning_rate": 2.8561986973477755e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.00016053745518830633, + "loss": 0.0146, "step": 358680 }, { - "epoch": 1.81, - "learning_rate": 2.8554419280463747e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016053356697193484, + "loss": 0.0145, "step": 358690 }, { - "epoch": 1.81, - "learning_rate": 2.8546851587449735e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016052967875556339, + "loss": 0.0137, "step": 358700 }, { - "epoch": 1.81, - "learning_rate": 2.8539283894435726e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.0001605257905391919, + "loss": 0.0142, "step": 358710 }, { - "epoch": 1.81, - "learning_rate": 2.8531716201421715e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016052190232282047, + "loss": 0.0129, "step": 358720 }, { - "epoch": 1.81, - "learning_rate": 2.8524148508407706e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016051801410644898, + "loss": 0.0149, "step": 358730 }, { - "epoch": 1.81, - "learning_rate": 2.8516580815393694e-05, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.00016051412589007753, + "loss": 0.0145, "step": 358740 }, { - "epoch": 1.81, - "learning_rate": 2.8509013122379686e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016051023767370604, + "loss": 0.0132, "step": 358750 }, { - "epoch": 1.81, - "learning_rate": 2.8501445429365674e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.0001605063494573346, + "loss": 0.0153, "step": 358760 }, { - "epoch": 1.81, - "learning_rate": 2.8493877736351662e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016050246124096312, + "loss": 0.0158, "step": 358770 }, { - "epoch": 1.81, - "learning_rate": 2.848631004333765e-05, - "loss": 0.0092, + "epoch": 0.93, + "learning_rate": 0.00016049857302459166, + "loss": 0.0142, "step": 358780 }, { - "epoch": 1.81, - "learning_rate": 2.8478742350323642e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.00016049468480822018, + "loss": 0.0132, "step": 358790 }, { - "epoch": 1.81, - "learning_rate": 2.847117465730963e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016049079659184872, + "loss": 0.0148, "step": 358800 }, { - "epoch": 1.81, - "learning_rate": 2.8463606964295622e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016048690837547726, + "loss": 0.0127, "step": 358810 }, { - "epoch": 1.81, - "learning_rate": 2.845603927128161e-05, - "loss": 0.0046, + "epoch": 0.93, + "learning_rate": 0.0001604830201591058, + "loss": 0.0158, "step": 358820 }, { - "epoch": 1.81, - "learning_rate": 2.8448471578267602e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00016047913194273432, + "loss": 0.0189, "step": 358830 }, { - "epoch": 1.81, - "learning_rate": 2.844090388525359e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016047524372636286, + "loss": 0.013, "step": 358840 }, { - "epoch": 1.81, - "learning_rate": 2.8433336192239582e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016047135550999143, + "loss": 0.0151, "step": 358850 }, { - "epoch": 1.81, - "learning_rate": 2.842576849922557e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016046746729361994, + "loss": 0.0143, "step": 358860 }, { - "epoch": 1.81, - "learning_rate": 2.841820080621156e-05, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016046357907724849, + "loss": 0.0141, "step": 358870 }, { - "epoch": 1.81, - "learning_rate": 2.841063311319755e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.000160459690860877, + "loss": 0.0097, "step": 358880 }, { - "epoch": 1.81, - "learning_rate": 2.840306542018354e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016045580264450557, + "loss": 0.0156, "step": 358890 }, { - "epoch": 1.81, - "learning_rate": 2.839549772716953e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016045191442813408, + "loss": 0.0127, "step": 358900 }, { - "epoch": 1.81, - "learning_rate": 2.838793003415552e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016044802621176262, + "loss": 0.0123, "step": 358910 }, { - "epoch": 1.81, - "learning_rate": 2.8380362341141506e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016044413799539114, + "loss": 0.0147, "step": 358920 }, { - "epoch": 1.81, - "learning_rate": 2.8372794648127498e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.0001604402497790197, + "loss": 0.0091, "step": 358930 }, { - "epoch": 1.81, - "learning_rate": 2.8365226955113486e-05, - "loss": 0.0073, + "epoch": 0.93, + "learning_rate": 0.00016043636156264822, + "loss": 0.0116, "step": 358940 }, { - "epoch": 1.81, - "learning_rate": 2.8357659262099477e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016043247334627676, + "loss": 0.013, "step": 358950 }, { - "epoch": 1.81, - "learning_rate": 2.8350091569085466e-05, - "loss": 0.0046, + "epoch": 0.93, + "learning_rate": 0.00016042858512990528, + "loss": 0.0114, "step": 358960 }, { - "epoch": 1.81, - "learning_rate": 2.8342523876071457e-05, - "loss": 0.004, + "epoch": 0.93, + "learning_rate": 0.00016042469691353385, + "loss": 0.0163, "step": 358970 }, { - "epoch": 1.81, - "learning_rate": 2.8334956183057446e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016042080869716236, + "loss": 0.0154, "step": 358980 }, { - "epoch": 1.81, - "learning_rate": 2.8327388490043437e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.0001604169204807909, + "loss": 0.0131, "step": 358990 }, { - "epoch": 1.81, - "learning_rate": 2.8319820797029425e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016041303226441942, + "loss": 0.0134, "step": 359000 }, { - "epoch": 1.81, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004385951440781355, - "eval_runtime": 116.7254, - "eval_samples_per_second": 17.134, - "eval_steps_per_second": 4.284, + "epoch": 0.93, + "eval_cer": 0.8817712685329425, + "eval_loss": 0.008768617175519466, + "eval_runtime": 107.5531, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, "step": 359000 }, { - "epoch": 1.81, - "learning_rate": 2.8312253104015417e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.000160409144048048, + "loss": 0.0086, "step": 359010 }, { - "epoch": 1.81, - "learning_rate": 2.8304685411001405e-05, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.00016040525583167653, + "loss": 0.0117, "step": 359020 }, { - "epoch": 1.81, - "learning_rate": 2.8297117717987397e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016040136761530504, + "loss": 0.0163, "step": 359030 }, { - "epoch": 1.81, - "learning_rate": 2.8289550024973385e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016039747939893356, + "loss": 0.0169, "step": 359040 }, { - "epoch": 1.81, - "learning_rate": 2.8281982331959377e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.0001603935911825621, + "loss": 0.0128, "step": 359050 }, { - "epoch": 1.81, - "learning_rate": 2.8274414638945365e-05, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.00016038970296619067, + "loss": 0.0112, "step": 359060 }, { - "epoch": 1.81, - "learning_rate": 2.8266846945931356e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016038581474981918, + "loss": 0.0138, "step": 359070 }, { - "epoch": 1.81, - "learning_rate": 2.825927925291734e-05, - "loss": 0.0071, + "epoch": 0.93, + "learning_rate": 0.00016038192653344772, + "loss": 0.0135, "step": 359080 }, { - "epoch": 1.81, - "learning_rate": 2.825171155990333e-05, - "loss": 0.0071, + "epoch": 0.93, + "learning_rate": 0.00016037803831707624, + "loss": 0.0168, "step": 359090 }, { - "epoch": 1.81, - "learning_rate": 2.824414386688932e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.0001603741501007048, + "loss": 0.0115, "step": 359100 }, { - "epoch": 1.81, - "learning_rate": 2.8236576173875313e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016037026188433332, + "loss": 0.0121, "step": 359110 }, { - "epoch": 1.81, - "learning_rate": 2.82290084808613e-05, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.00016036637366796186, + "loss": 0.0126, "step": 359120 }, { - "epoch": 1.81, - "learning_rate": 2.8221440787847293e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016036248545159038, + "loss": 0.0159, "step": 359130 }, { - "epoch": 1.81, - "learning_rate": 2.821387309483328e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016035859723521895, + "loss": 0.0105, "step": 359140 }, { - "epoch": 1.81, - "learning_rate": 2.8206305401819272e-05, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00016035470901884746, + "loss": 0.0132, "step": 359150 }, { - "epoch": 1.81, - "learning_rate": 2.819873770880526e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.000160350820802476, + "loss": 0.0112, "step": 359160 }, { - "epoch": 1.81, - "learning_rate": 2.8191170015791252e-05, - "loss": 0.004, + "epoch": 0.93, + "learning_rate": 0.00016034693258610452, + "loss": 0.0152, "step": 359170 }, { - "epoch": 1.81, - "learning_rate": 2.818360232277724e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.0001603430443697331, + "loss": 0.0108, "step": 359180 }, { - "epoch": 1.81, - "learning_rate": 2.8176034629763232e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.0001603391561533616, + "loss": 0.0147, "step": 359190 }, { - "epoch": 1.81, - "learning_rate": 2.816846693674922e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016033526793699014, + "loss": 0.0144, "step": 359200 }, { - "epoch": 1.81, - "learning_rate": 2.8160899243735212e-05, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.00016033137972061866, + "loss": 0.0138, "step": 359210 }, { - "epoch": 1.81, - "learning_rate": 2.81533315507212e-05, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.00016032749150424723, + "loss": 0.0132, "step": 359220 }, { - "epoch": 1.81, - "learning_rate": 2.814576385770719e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016032360328787577, + "loss": 0.0143, "step": 359230 }, { - "epoch": 1.81, - "learning_rate": 2.8138196164693176e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016031971507150428, + "loss": 0.0111, "step": 359240 }, { - "epoch": 1.81, - "learning_rate": 2.8130628471679165e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016031582685513282, + "loss": 0.0115, "step": 359250 }, { - "epoch": 1.81, - "learning_rate": 2.8123060778665156e-05, - "loss": 0.0081, + "epoch": 0.93, + "learning_rate": 0.00016031193863876134, + "loss": 0.0138, "step": 359260 }, { - "epoch": 1.81, - "learning_rate": 2.8115493085651145e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.0001603080504223899, + "loss": 0.0098, "step": 359270 }, { - "epoch": 1.81, - "learning_rate": 2.8107925392637136e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016030416220601842, + "loss": 0.016, "step": 359280 }, { - "epoch": 1.81, - "learning_rate": 2.8100357699623124e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00016030027398964696, + "loss": 0.0127, "step": 359290 }, { - "epoch": 1.81, - "learning_rate": 2.8092790006609116e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.00016029638577327548, + "loss": 0.0146, "step": 359300 }, { - "epoch": 1.81, - "learning_rate": 2.8085222313595104e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016029249755690405, + "loss": 0.012, "step": 359310 }, { - "epoch": 1.81, - "learning_rate": 2.8077654620581096e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016028860934053256, + "loss": 0.0138, "step": 359320 }, { - "epoch": 1.81, - "learning_rate": 2.8070086927567084e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.0001602847211241611, + "loss": 0.0133, "step": 359330 }, { - "epoch": 1.81, - "learning_rate": 2.8062519234553076e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.00016028083290778962, + "loss": 0.0113, "step": 359340 }, { - "epoch": 1.81, - "learning_rate": 2.8054951541539064e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016027694469141819, + "loss": 0.0126, "step": 359350 }, { - "epoch": 1.81, - "learning_rate": 2.8047383848525055e-05, - "loss": 0.0081, + "epoch": 0.93, + "learning_rate": 0.0001602730564750467, + "loss": 0.0162, "step": 359360 }, { - "epoch": 1.81, - "learning_rate": 2.8039816155511047e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016026916825867524, + "loss": 0.0111, "step": 359370 }, { - "epoch": 1.81, - "learning_rate": 2.8032248462497035e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016026528004230376, + "loss": 0.0103, "step": 359380 }, { - "epoch": 1.81, - "learning_rate": 2.8024680769483027e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016026139182593233, + "loss": 0.0122, "step": 359390 }, { - "epoch": 1.81, - "learning_rate": 2.801711307646901e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00016025750360956087, + "loss": 0.0135, "step": 359400 }, { - "epoch": 1.81, - "learning_rate": 2.8009545383455e-05, - "loss": 0.0101, + "epoch": 0.93, + "learning_rate": 0.00016025361539318938, + "loss": 0.0085, "step": 359410 }, { - "epoch": 1.81, - "learning_rate": 2.800197769044099e-05, - "loss": 0.0105, + "epoch": 0.93, + "learning_rate": 0.00016024972717681792, + "loss": 0.0125, "step": 359420 }, { - "epoch": 1.81, - "learning_rate": 2.799440999742698e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016024583896044646, + "loss": 0.0138, "step": 359430 }, { - "epoch": 1.81, - "learning_rate": 2.798684230441297e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.000160241950744075, + "loss": 0.0145, "step": 359440 }, { - "epoch": 1.81, - "learning_rate": 2.797927461139896e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016023806252770352, + "loss": 0.0144, "step": 359450 }, { - "epoch": 1.81, - "learning_rate": 2.797170691838495e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016023417431133206, + "loss": 0.0141, "step": 359460 }, { - "epoch": 1.81, - "learning_rate": 2.796413922537094e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.0001602302860949606, + "loss": 0.0143, "step": 359470 }, { - "epoch": 1.81, - "learning_rate": 2.795657153235693e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016022639787858915, + "loss": 0.0118, "step": 359480 }, { - "epoch": 1.81, - "learning_rate": 2.794900383934292e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016022250966221766, + "loss": 0.0134, "step": 359490 }, { - "epoch": 1.81, - "learning_rate": 2.794143614632891e-05, - "loss": 0.0044, + "epoch": 0.93, + "learning_rate": 0.0001602186214458462, + "loss": 0.0191, "step": 359500 }, { - "epoch": 1.81, - "learning_rate": 2.79338684533149e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00016021473322947472, + "loss": 0.0104, "step": 359510 }, { - "epoch": 1.81, - "learning_rate": 2.792630076030089e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016021084501310329, + "loss": 0.0169, "step": 359520 }, { - "epoch": 1.81, - "learning_rate": 2.791873306728688e-05, - "loss": 0.0046, + "epoch": 0.93, + "learning_rate": 0.0001602069567967318, + "loss": 0.0113, "step": 359530 }, { - "epoch": 1.81, - "learning_rate": 2.791116537427287e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016020306858036034, + "loss": 0.016, "step": 359540 }, { - "epoch": 1.81, - "learning_rate": 2.7903597681258855e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016019918036398886, + "loss": 0.0147, "step": 359550 }, { - "epoch": 1.81, - "learning_rate": 2.7896029988244847e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00016019529214761742, + "loss": 0.0137, "step": 359560 }, { - "epoch": 1.81, - "learning_rate": 2.7888462295230835e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016019140393124597, + "loss": 0.0127, "step": 359570 }, { - "epoch": 1.81, - "learning_rate": 2.7880894602216827e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00016018751571487448, + "loss": 0.0131, "step": 359580 }, { - "epoch": 1.81, - "learning_rate": 2.7873326909202815e-05, - "loss": 0.0102, + "epoch": 0.93, + "learning_rate": 0.000160183627498503, + "loss": 0.0141, "step": 359590 }, { - "epoch": 1.81, - "learning_rate": 2.7865759216188807e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016017973928213156, + "loss": 0.0126, "step": 359600 }, { - "epoch": 1.81, - "learning_rate": 2.7858191523174795e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.0001601758510657601, + "loss": 0.0126, "step": 359610 }, { - "epoch": 1.81, - "learning_rate": 2.7850623830160786e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016017196284938862, + "loss": 0.0131, "step": 359620 }, { - "epoch": 1.81, - "learning_rate": 2.7843056137146775e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016016807463301716, + "loss": 0.0117, "step": 359630 }, { - "epoch": 1.81, - "learning_rate": 2.7835488444132766e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.0001601641864166457, + "loss": 0.0142, "step": 359640 }, { - "epoch": 1.81, - "learning_rate": 2.7827920751118754e-05, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00016016029820027425, + "loss": 0.0129, "step": 359650 }, { - "epoch": 1.81, - "learning_rate": 2.7820353058104746e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00016015640998390276, + "loss": 0.015, "step": 359660 }, { - "epoch": 1.81, - "learning_rate": 2.7812785365090734e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.0001601525217675313, + "loss": 0.0111, "step": 359670 }, { - "epoch": 1.81, - "learning_rate": 2.7805217672076726e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016014863355115984, + "loss": 0.0137, "step": 359680 }, { - "epoch": 1.81, - "learning_rate": 2.7797649979062714e-05, - "loss": 0.0077, + "epoch": 0.93, + "learning_rate": 0.00016014474533478838, + "loss": 0.0121, "step": 359690 }, { - "epoch": 1.81, - "learning_rate": 2.7790082286048706e-05, - "loss": 0.0082, + "epoch": 0.93, + "learning_rate": 0.0001601408571184169, + "loss": 0.0129, "step": 359700 }, { - "epoch": 1.81, - "learning_rate": 2.778251459303469e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00016013696890204544, + "loss": 0.0158, "step": 359710 }, { - "epoch": 1.81, - "learning_rate": 2.7774946900020682e-05, - "loss": 0.0069, + "epoch": 0.93, + "learning_rate": 0.000160133080685674, + "loss": 0.011, "step": 359720 }, { - "epoch": 1.81, - "learning_rate": 2.776737920700667e-05, - "loss": 0.0083, + "epoch": 0.93, + "learning_rate": 0.00016012919246930252, + "loss": 0.0132, "step": 359730 }, { - "epoch": 1.81, - "learning_rate": 2.7759811513992662e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00016012530425293107, + "loss": 0.0177, "step": 359740 }, { - "epoch": 1.81, - "learning_rate": 2.775224382097865e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016012141603655958, + "loss": 0.0135, "step": 359750 }, { - "epoch": 1.82, - "learning_rate": 2.7744676127964642e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.0001601175278201881, + "loss": 0.0094, "step": 359760 }, { - "epoch": 1.82, - "learning_rate": 2.773710843495063e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016011363960381666, + "loss": 0.0127, "step": 359770 }, { - "epoch": 1.82, - "learning_rate": 2.772954074193662e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001601097513874452, + "loss": 0.0162, "step": 359780 }, { - "epoch": 1.82, - "learning_rate": 2.772197304892261e-05, - "loss": 0.0043, + "epoch": 0.93, + "learning_rate": 0.00016010586317107372, + "loss": 0.0127, "step": 359790 }, { - "epoch": 1.82, - "learning_rate": 2.77144053559086e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00016010197495470226, + "loss": 0.0151, "step": 359800 }, { - "epoch": 1.82, - "learning_rate": 2.770683766289459e-05, - "loss": 0.0079, + "epoch": 0.93, + "learning_rate": 0.0001600980867383308, + "loss": 0.0119, "step": 359810 }, { - "epoch": 1.82, - "learning_rate": 2.769926996988058e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00016009419852195934, + "loss": 0.0114, "step": 359820 }, { - "epoch": 1.82, - "learning_rate": 2.769170227686657e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016009031030558786, + "loss": 0.013, "step": 359830 }, { - "epoch": 1.82, - "learning_rate": 2.768413458385256e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.0001600864220892164, + "loss": 0.013, "step": 359840 }, { - "epoch": 1.82, - "learning_rate": 2.767656689083855e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016008253387284494, + "loss": 0.0156, "step": 359850 }, { - "epoch": 1.82, - "learning_rate": 2.766899919782454e-05, - "loss": 0.0091, + "epoch": 0.93, + "learning_rate": 0.00016007864565647348, + "loss": 0.0135, "step": 359860 }, { - "epoch": 1.82, - "learning_rate": 2.7661431504810526e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.000160074757440102, + "loss": 0.0142, "step": 359870 }, { - "epoch": 1.82, - "learning_rate": 2.7653863811796517e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016007086922373054, + "loss": 0.0114, "step": 359880 }, { - "epoch": 1.82, - "learning_rate": 2.7646296118782506e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.0001600669810073591, + "loss": 0.0125, "step": 359890 }, { - "epoch": 1.82, - "learning_rate": 2.7638728425768497e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00016006309279098762, + "loss": 0.0099, "step": 359900 }, { - "epoch": 1.82, - "learning_rate": 2.7631160732754485e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00016005920457461614, + "loss": 0.0142, "step": 359910 }, { - "epoch": 1.82, - "learning_rate": 2.7623593039740477e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00016005531635824468, + "loss": 0.0102, "step": 359920 }, { - "epoch": 1.82, - "learning_rate": 2.7616025346726465e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00016005142814187325, + "loss": 0.0121, "step": 359930 }, { - "epoch": 1.82, - "learning_rate": 2.7608457653712457e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00016004753992550176, + "loss": 0.0126, "step": 359940 }, { - "epoch": 1.82, - "learning_rate": 2.7600889960698445e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.0001600436517091303, + "loss": 0.0094, "step": 359950 }, { - "epoch": 1.82, - "learning_rate": 2.7593322267684437e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00016003976349275882, + "loss": 0.0125, "step": 359960 }, { - "epoch": 1.82, - "learning_rate": 2.7585754574670425e-05, - "loss": 0.007, + "epoch": 0.93, + "learning_rate": 0.0001600358752763874, + "loss": 0.0146, "step": 359970 }, { - "epoch": 1.82, - "learning_rate": 2.7578186881656416e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.0001600319870600159, + "loss": 0.0106, "step": 359980 }, { - "epoch": 1.82, - "learning_rate": 2.7570619188642405e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00016002809884364444, + "loss": 0.0128, "step": 359990 }, { - "epoch": 1.82, - "learning_rate": 2.7563051495628396e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00016002421062727296, + "loss": 0.0148, "step": 360000 }, { - "epoch": 1.82, - "eval_cer": 0.9144062097588856, - "eval_loss": 0.0043929265812039375, - "eval_runtime": 116.599, - "eval_samples_per_second": 17.153, - "eval_steps_per_second": 4.288, + "epoch": 0.93, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.008698065765202045, + "eval_runtime": 107.5328, + "eval_samples_per_second": 18.599, + "eval_steps_per_second": 4.65, "step": 360000 }, { - "epoch": 1.82, - "learning_rate": 2.7555483802614385e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.0001600203224109015, + "loss": 0.0115, "step": 360010 }, { - "epoch": 1.82, - "learning_rate": 2.754791610960037e-05, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00016001643419453004, + "loss": 0.0101, "step": 360020 }, { - "epoch": 1.82, - "learning_rate": 2.754034841658636e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00016001254597815858, + "loss": 0.0103, "step": 360030 }, { - "epoch": 1.82, - "learning_rate": 2.753278072357235e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.0001600086577617871, + "loss": 0.0123, "step": 360040 }, { - "epoch": 1.82, - "learning_rate": 2.752521303055834e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016000476954541564, + "loss": 0.0157, "step": 360050 }, { - "epoch": 1.82, - "learning_rate": 2.751764533754433e-05, - "loss": 0.0068, + "epoch": 0.93, + "learning_rate": 0.00016000088132904418, + "loss": 0.0127, "step": 360060 }, { - "epoch": 1.82, - "learning_rate": 2.751007764453032e-05, - "loss": 0.0061, + "epoch": 0.93, + "learning_rate": 0.00015999699311267272, + "loss": 0.0107, "step": 360070 }, { - "epoch": 1.82, - "learning_rate": 2.7502509951516312e-05, - "loss": 0.0055, + "epoch": 0.93, + "learning_rate": 0.00015999310489630124, + "loss": 0.0111, "step": 360080 }, { - "epoch": 1.82, - "learning_rate": 2.74949422585023e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00015998921667992978, + "loss": 0.0135, "step": 360090 }, { - "epoch": 1.82, - "learning_rate": 2.7487374565488292e-05, - "loss": 0.0057, + "epoch": 0.93, + "learning_rate": 0.00015998532846355835, + "loss": 0.0136, "step": 360100 }, { - "epoch": 1.82, - "learning_rate": 2.747980687247428e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00015998144024718686, + "loss": 0.0134, "step": 360110 }, { - "epoch": 1.82, - "learning_rate": 2.7472239179460272e-05, - "loss": 0.0076, + "epoch": 0.93, + "learning_rate": 0.0001599775520308154, + "loss": 0.0121, "step": 360120 }, { - "epoch": 1.82, - "learning_rate": 2.746467148644626e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00015997366381444392, + "loss": 0.012, "step": 360130 }, { - "epoch": 1.82, - "learning_rate": 2.745710379343225e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.0001599697755980725, + "loss": 0.0121, "step": 360140 }, { - "epoch": 1.82, - "learning_rate": 2.744953610041824e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.000159965887381701, + "loss": 0.013, "step": 360150 }, { - "epoch": 1.82, - "learning_rate": 2.744196840740423e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00015996199916532954, + "loss": 0.0121, "step": 360160 }, { - "epoch": 1.82, - "learning_rate": 2.743440071439022e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00015995811094895806, + "loss": 0.0156, "step": 360170 }, { - "epoch": 1.82, - "learning_rate": 2.7426833021376205e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00015995422273258663, + "loss": 0.0136, "step": 360180 }, { - "epoch": 1.82, - "learning_rate": 2.7419265328362196e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00015995033451621514, + "loss": 0.0121, "step": 360190 }, { - "epoch": 1.82, - "learning_rate": 2.7411697635348184e-05, - "loss": 0.0065, + "epoch": 0.93, + "learning_rate": 0.00015994644629984368, + "loss": 0.0149, "step": 360200 }, { - "epoch": 1.82, - "learning_rate": 2.7404129942334176e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.0001599425580834722, + "loss": 0.012, "step": 360210 }, { - "epoch": 1.82, - "learning_rate": 2.7396562249320164e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00015993866986710077, + "loss": 0.013, "step": 360220 }, { - "epoch": 1.82, - "learning_rate": 2.7388994556306156e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00015993478165072928, + "loss": 0.0138, "step": 360230 }, { - "epoch": 1.82, - "learning_rate": 2.7381426863292144e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00015993089343435782, + "loss": 0.0113, "step": 360240 }, { - "epoch": 1.82, - "learning_rate": 2.7373859170278136e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.00015992700521798634, + "loss": 0.0152, "step": 360250 }, { - "epoch": 1.82, - "learning_rate": 2.7366291477264124e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.00015992311700161488, + "loss": 0.0129, "step": 360260 }, { - "epoch": 1.82, - "learning_rate": 2.7358723784250115e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00015991922878524345, + "loss": 0.0111, "step": 360270 }, { - "epoch": 1.82, - "learning_rate": 2.7351156091236104e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00015991534056887196, + "loss": 0.0115, "step": 360280 }, { - "epoch": 1.82, - "learning_rate": 2.7343588398222095e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.0001599114523525005, + "loss": 0.0126, "step": 360290 }, { - "epoch": 1.82, - "learning_rate": 2.7336020705208084e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00015990756413612902, + "loss": 0.0202, "step": 360300 }, { - "epoch": 1.82, - "learning_rate": 2.7328453012194075e-05, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.0001599036759197576, + "loss": 0.0111, "step": 360310 }, { - "epoch": 1.82, - "learning_rate": 2.7320885319180063e-05, - "loss": 0.0113, + "epoch": 0.93, + "learning_rate": 0.0001598997877033861, + "loss": 0.011, "step": 360320 }, { - "epoch": 1.82, - "learning_rate": 2.7313317626166055e-05, - "loss": 0.0082, + "epoch": 0.93, + "learning_rate": 0.00015989589948701464, + "loss": 0.0114, "step": 360330 }, { - "epoch": 1.82, - "learning_rate": 2.730574993315204e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00015989201127064316, + "loss": 0.0138, "step": 360340 }, { - "epoch": 1.82, - "learning_rate": 2.729818224013803e-05, - "loss": 0.006, + "epoch": 0.93, + "learning_rate": 0.00015988812305427173, + "loss": 0.0149, "step": 360350 }, { - "epoch": 1.82, - "learning_rate": 2.729061454712402e-05, - "loss": 0.0074, + "epoch": 0.93, + "learning_rate": 0.00015988423483790024, + "loss": 0.0124, "step": 360360 }, { - "epoch": 1.82, - "learning_rate": 2.728304685411001e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00015988034662152878, + "loss": 0.0113, "step": 360370 }, { - "epoch": 1.82, - "learning_rate": 2.7275479161096e-05, - "loss": 0.0054, + "epoch": 0.93, + "learning_rate": 0.0001598764584051573, + "loss": 0.0105, "step": 360380 }, { - "epoch": 1.82, - "learning_rate": 2.726791146808199e-05, - "loss": 0.0063, + "epoch": 0.93, + "learning_rate": 0.00015987257018878587, + "loss": 0.0119, "step": 360390 }, { - "epoch": 1.82, - "learning_rate": 2.726034377506798e-05, - "loss": 0.0048, + "epoch": 0.93, + "learning_rate": 0.00015986868197241438, + "loss": 0.0131, "step": 360400 }, { - "epoch": 1.82, - "learning_rate": 2.725277608205397e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00015986479375604292, + "loss": 0.0105, "step": 360410 }, { - "epoch": 1.82, - "learning_rate": 2.724520838903996e-05, - "loss": 0.0049, + "epoch": 0.93, + "learning_rate": 0.00015986090553967144, + "loss": 0.0129, "step": 360420 }, { - "epoch": 1.82, - "learning_rate": 2.723764069602595e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.0001598570173233, + "loss": 0.0139, "step": 360430 }, { - "epoch": 1.82, - "learning_rate": 2.723007300301194e-05, - "loss": 0.0106, + "epoch": 0.93, + "learning_rate": 0.00015985312910692855, + "loss": 0.0125, "step": 360440 }, { - "epoch": 1.82, - "learning_rate": 2.722250530999793e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00015984924089055706, + "loss": 0.0118, "step": 360450 }, { - "epoch": 1.82, - "learning_rate": 2.721493761698392e-05, - "loss": 0.0059, + "epoch": 0.93, + "learning_rate": 0.0001598453526741856, + "loss": 0.0135, "step": 360460 }, { - "epoch": 1.82, - "learning_rate": 2.720736992396991e-05, - "loss": 0.008, + "epoch": 0.93, + "learning_rate": 0.00015984146445781414, + "loss": 0.0103, "step": 360470 }, { - "epoch": 1.82, - "learning_rate": 2.71998022309559e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00015983757624144269, + "loss": 0.0165, "step": 360480 }, { - "epoch": 1.82, - "learning_rate": 2.719223453794189e-05, - "loss": 0.0041, + "epoch": 0.93, + "learning_rate": 0.0001598336880250712, + "loss": 0.0146, "step": 360490 }, { - "epoch": 1.82, - "learning_rate": 2.7184666844927875e-05, - "loss": 0.0056, + "epoch": 0.93, + "learning_rate": 0.00015982979980869974, + "loss": 0.0145, "step": 360500 }, { - "epoch": 1.82, - "learning_rate": 2.7177099151913867e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.00015982591159232826, + "loss": 0.0116, "step": 360510 }, { - "epoch": 1.82, - "learning_rate": 2.7169531458899855e-05, - "loss": 0.0053, + "epoch": 0.93, + "learning_rate": 0.00015982202337595683, + "loss": 0.0124, "step": 360520 }, { - "epoch": 1.82, - "learning_rate": 2.7161963765885846e-05, - "loss": 0.0062, + "epoch": 0.93, + "learning_rate": 0.00015981813515958534, + "loss": 0.0104, "step": 360530 }, { - "epoch": 1.82, - "learning_rate": 2.7154396072871835e-05, - "loss": 0.0051, + "epoch": 0.93, + "learning_rate": 0.00015981424694321388, + "loss": 0.0133, "step": 360540 }, { - "epoch": 1.82, - "learning_rate": 2.7146828379857826e-05, - "loss": 0.0052, + "epoch": 0.93, + "learning_rate": 0.0001598103587268424, + "loss": 0.0116, "step": 360550 }, { - "epoch": 1.82, - "learning_rate": 2.7139260686843814e-05, - "loss": 0.0064, + "epoch": 0.93, + "learning_rate": 0.00015980647051047097, + "loss": 0.0145, "step": 360560 }, { - "epoch": 1.82, - "learning_rate": 2.7131692993829806e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00015980258229409948, + "loss": 0.0152, "step": 360570 }, { - "epoch": 1.82, - "learning_rate": 2.7124125300815794e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.00015979869407772802, + "loss": 0.0123, "step": 360580 }, { - "epoch": 1.82, - "learning_rate": 2.7116557607801786e-05, - "loss": 0.0045, + "epoch": 0.93, + "learning_rate": 0.00015979480586135654, + "loss": 0.0109, "step": 360590 }, { - "epoch": 1.82, - "learning_rate": 2.7108989914787774e-05, - "loss": 0.0078, + "epoch": 0.93, + "learning_rate": 0.0001597909176449851, + "loss": 0.0169, "step": 360600 }, { - "epoch": 1.82, - "learning_rate": 2.7101422221773766e-05, - "loss": 0.0072, + "epoch": 0.93, + "learning_rate": 0.00015978702942861365, + "loss": 0.0157, "step": 360610 }, { - "epoch": 1.82, - "learning_rate": 2.7093854528759754e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00015978314121224216, + "loss": 0.0116, "step": 360620 }, { - "epoch": 1.82, - "learning_rate": 2.7086286835745746e-05, - "loss": 0.0043, + "epoch": 0.93, + "learning_rate": 0.00015977925299587068, + "loss": 0.015, "step": 360630 }, { - "epoch": 1.82, - "learning_rate": 2.7078719142731734e-05, - "loss": 0.0078, + "epoch": 0.93, + "learning_rate": 0.00015977536477949924, + "loss": 0.0118, "step": 360640 }, { - "epoch": 1.82, - "learning_rate": 2.7071151449717722e-05, - "loss": 0.0047, + "epoch": 0.93, + "learning_rate": 0.00015977147656312779, + "loss": 0.0117, "step": 360650 }, { - "epoch": 1.82, - "learning_rate": 2.706358375670371e-05, - "loss": 0.0066, + "epoch": 0.93, + "learning_rate": 0.0001597675883467563, + "loss": 0.0111, "step": 360660 }, { - "epoch": 1.82, - "learning_rate": 2.7056016063689702e-05, - "loss": 0.0058, + "epoch": 0.93, + "learning_rate": 0.00015976370013038484, + "loss": 0.0145, "step": 360670 }, { - "epoch": 1.82, - "learning_rate": 2.704844837067569e-05, - "loss": 0.005, + "epoch": 0.93, + "learning_rate": 0.00015975981191401338, + "loss": 0.0114, "step": 360680 }, { - "epoch": 1.82, - "learning_rate": 2.704088067766168e-05, - "loss": 0.0067, + "epoch": 0.93, + "learning_rate": 0.00015975592369764193, + "loss": 0.0132, "step": 360690 }, { - "epoch": 1.82, - "learning_rate": 2.703331298464767e-05, - "loss": 0.0082, + "epoch": 0.93, + "learning_rate": 0.00015975203548127044, + "loss": 0.0154, "step": 360700 }, { - "epoch": 1.82, - "learning_rate": 2.702574529163366e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015974814726489898, + "loss": 0.0133, "step": 360710 }, { - "epoch": 1.82, - "learning_rate": 2.701817759861965e-05, - "loss": 0.013, + "epoch": 0.94, + "learning_rate": 0.00015974425904852752, + "loss": 0.0099, "step": 360720 }, { - "epoch": 1.82, - "learning_rate": 2.701060990560564e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015974037083215606, + "loss": 0.0105, "step": 360730 }, { - "epoch": 1.82, - "learning_rate": 2.700304221259163e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015973648261578458, + "loss": 0.0126, "step": 360740 }, { - "epoch": 1.82, - "learning_rate": 2.699547451957762e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015973259439941312, + "loss": 0.0118, "step": 360750 }, { - "epoch": 1.82, - "learning_rate": 2.698790682656361e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015972870618304164, + "loss": 0.0133, "step": 360760 }, { - "epoch": 1.82, - "learning_rate": 2.69803391335496e-05, - "loss": 0.0029, + "epoch": 0.94, + "learning_rate": 0.0001597248179666702, + "loss": 0.0124, "step": 360770 }, { - "epoch": 1.82, - "learning_rate": 2.697277144053559e-05, - "loss": 0.0085, + "epoch": 0.94, + "learning_rate": 0.00015972092975029872, + "loss": 0.0143, "step": 360780 }, { - "epoch": 1.82, - "learning_rate": 2.696520374752158e-05, - "loss": 0.0093, + "epoch": 0.94, + "learning_rate": 0.00015971704153392726, + "loss": 0.0123, "step": 360790 }, { - "epoch": 1.82, - "learning_rate": 2.695763605450757e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015971315331755577, + "loss": 0.0141, "step": 360800 }, { - "epoch": 1.82, - "learning_rate": 2.6950068361493557e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015970926510118434, + "loss": 0.0123, "step": 360810 }, { - "epoch": 1.82, - "learning_rate": 2.6942500668479545e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015970537688481289, + "loss": 0.0116, "step": 360820 }, { - "epoch": 1.82, - "learning_rate": 2.6934932975465537e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.0001597014886684414, + "loss": 0.0172, "step": 360830 }, { - "epoch": 1.82, - "learning_rate": 2.6927365282451525e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015969760045206994, + "loss": 0.0137, "step": 360840 }, { - "epoch": 1.82, - "learning_rate": 2.6919797589437517e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015969371223569848, + "loss": 0.011, "step": 360850 }, { - "epoch": 1.82, - "learning_rate": 2.6912229896423505e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015968982401932702, + "loss": 0.011, "step": 360860 }, { - "epoch": 1.82, - "learning_rate": 2.6904662203409497e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015968593580295554, + "loss": 0.0122, "step": 360870 }, { - "epoch": 1.82, - "learning_rate": 2.6897094510395485e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015968204758658408, + "loss": 0.0148, "step": 360880 }, { - "epoch": 1.82, - "learning_rate": 2.6889526817381477e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015967815937021262, + "loss": 0.0117, "step": 360890 }, { - "epoch": 1.82, - "learning_rate": 2.6881959124367465e-05, - "loss": 0.0093, + "epoch": 0.94, + "learning_rate": 0.00015967427115384116, + "loss": 0.0145, "step": 360900 }, { - "epoch": 1.82, - "learning_rate": 2.6874391431353456e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015967038293746968, + "loss": 0.0107, "step": 360910 }, { - "epoch": 1.82, - "learning_rate": 2.6866823738339445e-05, - "loss": 0.0088, + "epoch": 0.94, + "learning_rate": 0.00015966649472109822, + "loss": 0.0125, "step": 360920 }, { - "epoch": 1.82, - "learning_rate": 2.6859256045325436e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.0001596626065047268, + "loss": 0.0224, "step": 360930 }, { - "epoch": 1.82, - "learning_rate": 2.6851688352311424e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.0001596587182883553, + "loss": 0.0142, "step": 360940 }, { - "epoch": 1.82, - "learning_rate": 2.6844120659297416e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015965483007198382, + "loss": 0.011, "step": 360950 }, { - "epoch": 1.82, - "learning_rate": 2.6836552966283404e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015965094185561236, + "loss": 0.0114, "step": 360960 }, { - "epoch": 1.82, - "learning_rate": 2.682898527326939e-05, - "loss": 0.0042, + "epoch": 0.94, + "learning_rate": 0.00015964705363924093, + "loss": 0.013, "step": 360970 }, { - "epoch": 1.82, - "learning_rate": 2.682141758025538e-05, - "loss": 0.0071, + "epoch": 0.94, + "learning_rate": 0.00015964316542286944, + "loss": 0.0128, "step": 360980 }, { - "epoch": 1.82, - "learning_rate": 2.681384988724137e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015963927720649798, + "loss": 0.0114, "step": 360990 }, { - "epoch": 1.82, - "learning_rate": 2.680628219422736e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.0001596353889901265, + "loss": 0.0139, "step": 361000 }, { - "epoch": 1.82, - "eval_cer": 0.9144256176813937, - "eval_loss": 0.004407630767673254, - "eval_runtime": 116.7425, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.94, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.008725974708795547, + "eval_runtime": 107.3705, + "eval_samples_per_second": 18.627, + "eval_steps_per_second": 4.657, "step": 361000 }, { - "epoch": 1.82, - "learning_rate": 2.679871450121335e-05, - "loss": 0.0085, + "epoch": 0.94, + "learning_rate": 0.00015963150077375504, + "loss": 0.0134, "step": 361010 }, { - "epoch": 1.82, - "learning_rate": 2.679114680819934e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015962761255738358, + "loss": 0.0112, "step": 361020 }, { - "epoch": 1.82, - "learning_rate": 2.678357911518533e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015962372434101212, + "loss": 0.0154, "step": 361030 }, { - "epoch": 1.82, - "learning_rate": 2.677601142217132e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015961983612464064, + "loss": 0.0118, "step": 361040 }, { - "epoch": 1.82, - "learning_rate": 2.6768443729157312e-05, - "loss": 0.0075, + "epoch": 0.94, + "learning_rate": 0.00015961594790826918, + "loss": 0.0129, "step": 361050 }, { - "epoch": 1.82, - "learning_rate": 2.67608760361433e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015961205969189772, + "loss": 0.0142, "step": 361060 }, { - "epoch": 1.82, - "learning_rate": 2.675330834312929e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015960817147552626, + "loss": 0.0106, "step": 361070 }, { - "epoch": 1.82, - "learning_rate": 2.674574065011528e-05, - "loss": 0.0078, + "epoch": 0.94, + "learning_rate": 0.00015960428325915478, + "loss": 0.0147, "step": 361080 }, { - "epoch": 1.82, - "learning_rate": 2.673817295710127e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015960039504278332, + "loss": 0.0121, "step": 361090 }, { - "epoch": 1.82, - "learning_rate": 2.673060526408726e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015959650682641186, + "loss": 0.0117, "step": 361100 }, { - "epoch": 1.82, - "learning_rate": 2.672303757107325e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.0001595926186100404, + "loss": 0.0121, "step": 361110 }, { - "epoch": 1.82, - "learning_rate": 2.6715469878059236e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015958873039366892, + "loss": 0.0118, "step": 361120 }, { - "epoch": 1.82, - "learning_rate": 2.6707902185045224e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015958484217729746, + "loss": 0.0151, "step": 361130 }, { - "epoch": 1.82, - "learning_rate": 2.6700334492031216e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015958095396092603, + "loss": 0.0166, "step": 361140 }, { - "epoch": 1.82, - "learning_rate": 2.6692766799017204e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015957706574455454, + "loss": 0.0121, "step": 361150 }, { - "epoch": 1.82, - "learning_rate": 2.6685199106003196e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015957317752818308, + "loss": 0.0113, "step": 361160 }, { - "epoch": 1.82, - "learning_rate": 2.6677631412989184e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.0001595692893118116, + "loss": 0.0127, "step": 361170 }, { - "epoch": 1.82, - "learning_rate": 2.6670063719975176e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015956540109544017, + "loss": 0.0136, "step": 361180 }, { - "epoch": 1.82, - "learning_rate": 2.6662496026961164e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015956151287906868, + "loss": 0.0157, "step": 361190 }, { - "epoch": 1.82, - "learning_rate": 2.6654928333947155e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015955762466269722, + "loss": 0.0115, "step": 361200 }, { - "epoch": 1.82, - "learning_rate": 2.6647360640933144e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.00015955373644632574, + "loss": 0.0131, "step": 361210 }, { - "epoch": 1.82, - "learning_rate": 2.6639792947919135e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.0001595498482299543, + "loss": 0.0122, "step": 361220 }, { - "epoch": 1.82, - "learning_rate": 2.6632225254905123e-05, - "loss": 0.0072, + "epoch": 0.94, + "learning_rate": 0.00015954596001358282, + "loss": 0.0102, "step": 361230 }, { - "epoch": 1.82, - "learning_rate": 2.6624657561891115e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015954207179721136, + "loss": 0.0125, "step": 361240 }, { - "epoch": 1.82, - "learning_rate": 2.6617089868877103e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015953818358083988, + "loss": 0.0111, "step": 361250 }, { - "epoch": 1.82, - "learning_rate": 2.6609522175863095e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015953429536446842, + "loss": 0.0135, "step": 361260 }, { - "epoch": 1.82, - "learning_rate": 2.6601954482849083e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015953040714809696, + "loss": 0.014, "step": 361270 }, { - "epoch": 1.82, - "learning_rate": 2.659438678983507e-05, - "loss": 0.0081, + "epoch": 0.94, + "learning_rate": 0.0001595265189317255, + "loss": 0.0144, "step": 361280 }, { - "epoch": 1.82, - "learning_rate": 2.658681909682106e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015952263071535402, + "loss": 0.0116, "step": 361290 }, { - "epoch": 1.82, - "learning_rate": 2.657925140380705e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015951874249898256, + "loss": 0.0103, "step": 361300 }, { - "epoch": 1.82, - "learning_rate": 2.657168371079304e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015951485428261113, + "loss": 0.0137, "step": 361310 }, { - "epoch": 1.82, - "learning_rate": 2.656411601777903e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015951096606623964, + "loss": 0.0135, "step": 361320 }, { - "epoch": 1.82, - "learning_rate": 2.655654832476502e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015950707784986818, + "loss": 0.015, "step": 361330 }, { - "epoch": 1.82, - "learning_rate": 2.654898063175101e-05, - "loss": 0.0043, + "epoch": 0.94, + "learning_rate": 0.0001595031896334967, + "loss": 0.0127, "step": 361340 }, { - "epoch": 1.82, - "learning_rate": 2.6541412938737e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015949930141712527, + "loss": 0.0122, "step": 361350 }, { - "epoch": 1.82, - "learning_rate": 2.653384524572299e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015949541320075378, + "loss": 0.0117, "step": 361360 }, { - "epoch": 1.82, - "learning_rate": 2.652627755270898e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015949152498438232, + "loss": 0.0123, "step": 361370 }, { - "epoch": 1.82, - "learning_rate": 2.651870985969497e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015948763676801084, + "loss": 0.0145, "step": 361380 }, { - "epoch": 1.82, - "learning_rate": 2.651114216668096e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.0001594837485516394, + "loss": 0.0131, "step": 361390 }, { - "epoch": 1.82, - "learning_rate": 2.650357447366695e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015947986033526792, + "loss": 0.0143, "step": 361400 }, { - "epoch": 1.82, - "learning_rate": 2.649600678065294e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015947597211889646, + "loss": 0.013, "step": 361410 }, { - "epoch": 1.82, - "learning_rate": 2.648843908763893e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015947208390252498, + "loss": 0.0134, "step": 361420 }, { - "epoch": 1.82, - "learning_rate": 2.6480871394624918e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015946819568615355, + "loss": 0.0121, "step": 361430 }, { - "epoch": 1.82, - "learning_rate": 2.6473303701610906e-05, - "loss": 0.0084, + "epoch": 0.94, + "learning_rate": 0.00015946430746978206, + "loss": 0.0126, "step": 361440 }, { - "epoch": 1.82, - "learning_rate": 2.6465736008596895e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.0001594604192534106, + "loss": 0.0109, "step": 361450 }, { - "epoch": 1.82, - "learning_rate": 2.6458168315582886e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015945653103703912, + "loss": 0.0178, "step": 361460 }, { - "epoch": 1.82, - "learning_rate": 2.6450600622568875e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015945264282066768, + "loss": 0.0153, "step": 361470 }, { - "epoch": 1.82, - "learning_rate": 2.6443032929554866e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015944875460429623, + "loss": 0.0141, "step": 361480 }, { - "epoch": 1.82, - "learning_rate": 2.6435465236540854e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015944486638792474, + "loss": 0.0117, "step": 361490 }, { - "epoch": 1.82, - "learning_rate": 2.6427897543526846e-05, - "loss": 0.0072, + "epoch": 0.94, + "learning_rate": 0.00015944097817155326, + "loss": 0.0167, "step": 361500 }, { - "epoch": 1.82, - "learning_rate": 2.6420329850512834e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.0001594370899551818, + "loss": 0.0142, "step": 361510 }, { - "epoch": 1.82, - "learning_rate": 2.6412762157498826e-05, - "loss": 0.0039, + "epoch": 0.94, + "learning_rate": 0.00015943320173881037, + "loss": 0.0175, "step": 361520 }, { - "epoch": 1.82, - "learning_rate": 2.6405194464484814e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015942931352243888, + "loss": 0.0173, "step": 361530 }, { - "epoch": 1.82, - "learning_rate": 2.6397626771470806e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015942542530606742, + "loss": 0.0142, "step": 361540 }, { - "epoch": 1.82, - "learning_rate": 2.6390059078456794e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015942153708969594, + "loss": 0.0167, "step": 361550 }, { - "epoch": 1.82, - "learning_rate": 2.6382491385442785e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.0001594176488733245, + "loss": 0.0093, "step": 361560 }, { - "epoch": 1.82, - "learning_rate": 2.6374923692428774e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015941376065695302, + "loss": 0.0129, "step": 361570 }, { - "epoch": 1.82, - "learning_rate": 2.6367355999414765e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015940987244058156, + "loss": 0.0193, "step": 361580 }, { - "epoch": 1.82, - "learning_rate": 2.6359788306400753e-05, - "loss": 0.0038, + "epoch": 0.94, + "learning_rate": 0.00015940598422421008, + "loss": 0.0115, "step": 361590 }, { - "epoch": 1.82, - "learning_rate": 2.635222061338674e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015940209600783864, + "loss": 0.0109, "step": 361600 }, { - "epoch": 1.82, - "learning_rate": 2.634465292037273e-05, - "loss": 0.008, + "epoch": 0.94, + "learning_rate": 0.00015939820779146716, + "loss": 0.0133, "step": 361610 }, { - "epoch": 1.82, - "learning_rate": 2.633708522735872e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.0001593943195750957, + "loss": 0.012, "step": 361620 }, { - "epoch": 1.82, - "learning_rate": 2.632951753434471e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015939043135872422, + "loss": 0.0143, "step": 361630 }, { - "epoch": 1.82, - "learning_rate": 2.63219498413307e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.00015938654314235278, + "loss": 0.0141, "step": 361640 }, { - "epoch": 1.82, - "learning_rate": 2.631438214831669e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.0001593826549259813, + "loss": 0.0119, "step": 361650 }, { - "epoch": 1.82, - "learning_rate": 2.630681445530268e-05, - "loss": 0.0042, + "epoch": 0.94, + "learning_rate": 0.00015937876670960984, + "loss": 0.0106, "step": 361660 }, { - "epoch": 1.82, - "learning_rate": 2.629924676228867e-05, - "loss": 0.007, + "epoch": 0.94, + "learning_rate": 0.00015937487849323836, + "loss": 0.0124, "step": 361670 }, { - "epoch": 1.82, - "learning_rate": 2.629167906927466e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015937099027686692, + "loss": 0.0144, "step": 361680 }, { - "epoch": 1.82, - "learning_rate": 2.628411137626065e-05, - "loss": 0.0044, + "epoch": 0.94, + "learning_rate": 0.00015936710206049547, + "loss": 0.0135, "step": 361690 }, { - "epoch": 1.82, - "learning_rate": 2.627654368324664e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015936321384412398, + "loss": 0.0105, "step": 361700 }, { - "epoch": 1.82, - "learning_rate": 2.626897599023263e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015935932562775252, + "loss": 0.0117, "step": 361710 }, { - "epoch": 1.82, - "learning_rate": 2.626140829721862e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015935543741138106, + "loss": 0.0122, "step": 361720 }, { - "epoch": 1.82, - "learning_rate": 2.625384060420461e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.0001593515491950096, + "loss": 0.0123, "step": 361730 }, { - "epoch": 1.83, - "learning_rate": 2.62462729111906e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015934766097863812, + "loss": 0.0149, "step": 361740 }, { - "epoch": 1.83, - "learning_rate": 2.6238705218176585e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015934377276226666, + "loss": 0.0173, "step": 361750 }, { - "epoch": 1.83, - "learning_rate": 2.6231137525162577e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015933988454589518, + "loss": 0.0126, "step": 361760 }, { - "epoch": 1.83, - "learning_rate": 2.6223569832148565e-05, - "loss": 0.0039, + "epoch": 0.94, + "learning_rate": 0.00015933599632952374, + "loss": 0.0141, "step": 361770 }, { - "epoch": 1.83, - "learning_rate": 2.6216002139134557e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015933210811315226, + "loss": 0.0154, "step": 361780 }, { - "epoch": 1.83, - "learning_rate": 2.6208434446120545e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.0001593282198967808, + "loss": 0.0133, "step": 361790 }, { - "epoch": 1.83, - "learning_rate": 2.6200866753106537e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015932433168040932, + "loss": 0.0185, "step": 361800 }, { - "epoch": 1.83, - "learning_rate": 2.6193299060092525e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015932044346403788, + "loss": 0.0112, "step": 361810 }, { - "epoch": 1.83, - "learning_rate": 2.6185731367078516e-05, - "loss": 0.0093, + "epoch": 0.94, + "learning_rate": 0.0001593165552476664, + "loss": 0.014, "step": 361820 }, { - "epoch": 1.83, - "learning_rate": 2.6178163674064505e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015931266703129494, + "loss": 0.0165, "step": 361830 }, { - "epoch": 1.83, - "learning_rate": 2.6170595981050496e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015930877881492345, + "loss": 0.0127, "step": 361840 }, { - "epoch": 1.83, - "learning_rate": 2.6163028288036484e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015930489059855202, + "loss": 0.0131, "step": 361850 }, { - "epoch": 1.83, - "learning_rate": 2.6155460595022476e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015930100238218056, + "loss": 0.0122, "step": 361860 }, { - "epoch": 1.83, - "learning_rate": 2.6147892902008464e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015929711416580908, + "loss": 0.0119, "step": 361870 }, { - "epoch": 1.83, - "learning_rate": 2.6140325208994456e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015929322594943762, + "loss": 0.0131, "step": 361880 }, { - "epoch": 1.83, - "learning_rate": 2.6132757515980444e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015928933773306616, + "loss": 0.0136, "step": 361890 }, { - "epoch": 1.83, - "learning_rate": 2.6125189822966436e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.0001592854495166947, + "loss": 0.0116, "step": 361900 }, { - "epoch": 1.83, - "learning_rate": 2.611762212995242e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015928156130032322, + "loss": 0.0135, "step": 361910 }, { - "epoch": 1.83, - "learning_rate": 2.611005443693841e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015927767308395176, + "loss": 0.0118, "step": 361920 }, { - "epoch": 1.83, - "learning_rate": 2.61024867439244e-05, - "loss": 0.0044, + "epoch": 0.94, + "learning_rate": 0.0001592737848675803, + "loss": 0.0112, "step": 361930 }, { - "epoch": 1.83, - "learning_rate": 2.609491905091039e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015926989665120884, + "loss": 0.0126, "step": 361940 }, { - "epoch": 1.83, - "learning_rate": 2.608735135789638e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015926600843483736, + "loss": 0.0137, "step": 361950 }, { - "epoch": 1.83, - "learning_rate": 2.607978366488237e-05, - "loss": 0.0086, + "epoch": 0.94, + "learning_rate": 0.0001592621202184659, + "loss": 0.0148, "step": 361960 }, { - "epoch": 1.83, - "learning_rate": 2.607221597186836e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015925823200209444, + "loss": 0.0137, "step": 361970 }, { - "epoch": 1.83, - "learning_rate": 2.6064648278854348e-05, - "loss": 0.0078, + "epoch": 0.94, + "learning_rate": 0.00015925434378572298, + "loss": 0.0119, "step": 361980 }, { - "epoch": 1.83, - "learning_rate": 2.605708058584034e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.0001592504555693515, + "loss": 0.014, "step": 361990 }, { - "epoch": 1.83, - "learning_rate": 2.6049512892826328e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015924656735298004, + "loss": 0.0136, "step": 362000 }, { - "epoch": 1.83, - "eval_cer": 0.9144314400581461, - "eval_loss": 0.004417457617819309, - "eval_runtime": 116.6172, - "eval_samples_per_second": 17.15, - "eval_steps_per_second": 4.288, + "epoch": 0.94, + "eval_cer": 0.8817222812402463, + "eval_loss": 0.008736135438084602, + "eval_runtime": 107.4655, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, "step": 362000 }, { - "epoch": 1.83, - "learning_rate": 2.604194519981232e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.00015924267913660855, + "loss": 0.015, "step": 362010 }, { - "epoch": 1.83, - "learning_rate": 2.603437750679831e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015923879092023712, + "loss": 0.0129, "step": 362020 }, { - "epoch": 1.83, - "learning_rate": 2.60268098137843e-05, - "loss": 0.0086, + "epoch": 0.94, + "learning_rate": 0.00015923490270386566, + "loss": 0.0126, "step": 362030 }, { - "epoch": 1.83, - "learning_rate": 2.601924212077029e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015923101448749418, + "loss": 0.0117, "step": 362040 }, { - "epoch": 1.83, - "learning_rate": 2.601167442775628e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.0001592271262711227, + "loss": 0.0145, "step": 362050 }, { - "epoch": 1.83, - "learning_rate": 2.600410673474227e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015922323805475126, + "loss": 0.0107, "step": 362060 }, { - "epoch": 1.83, - "learning_rate": 2.5996539041728256e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.0001592193498383798, + "loss": 0.0174, "step": 362070 }, { - "epoch": 1.83, - "learning_rate": 2.5988971348714244e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015921546162200832, + "loss": 0.0141, "step": 362080 }, { - "epoch": 1.83, - "learning_rate": 2.5981403655700236e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015921157340563686, + "loss": 0.0119, "step": 362090 }, { - "epoch": 1.83, - "learning_rate": 2.5973835962686224e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.0001592076851892654, + "loss": 0.0133, "step": 362100 }, { - "epoch": 1.83, - "learning_rate": 2.5966268269672215e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015920379697289394, + "loss": 0.0136, "step": 362110 }, { - "epoch": 1.83, - "learning_rate": 2.5958700576658204e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015919990875652246, + "loss": 0.0127, "step": 362120 }, { - "epoch": 1.83, - "learning_rate": 2.5951132883644195e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.000159196020540151, + "loss": 0.0144, "step": 362130 }, { - "epoch": 1.83, - "learning_rate": 2.5943565190630183e-05, - "loss": 0.0043, + "epoch": 0.94, + "learning_rate": 0.00015919213232377954, + "loss": 0.0098, "step": 362140 }, { - "epoch": 1.83, - "learning_rate": 2.5935997497616175e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015918824410740808, + "loss": 0.0125, "step": 362150 }, { - "epoch": 1.83, - "learning_rate": 2.5928429804602163e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.0001591843558910366, + "loss": 0.0099, "step": 362160 }, { - "epoch": 1.83, - "learning_rate": 2.5920862111588155e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015918046767466514, + "loss": 0.0137, "step": 362170 }, { - "epoch": 1.83, - "learning_rate": 2.5913294418574143e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.0001591765794582937, + "loss": 0.0127, "step": 362180 }, { - "epoch": 1.83, - "learning_rate": 2.5905726725560135e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015917269124192222, + "loss": 0.0126, "step": 362190 }, { - "epoch": 1.83, - "learning_rate": 2.5898159032546123e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015916880302555076, + "loss": 0.0145, "step": 362200 }, { - "epoch": 1.83, - "learning_rate": 2.5890591339532115e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015916491480917928, + "loss": 0.0122, "step": 362210 }, { - "epoch": 1.83, - "learning_rate": 2.58830236465181e-05, - "loss": 0.0072, + "epoch": 0.94, + "learning_rate": 0.00015916102659280785, + "loss": 0.0114, "step": 362220 }, { - "epoch": 1.83, - "learning_rate": 2.587545595350409e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015915713837643636, + "loss": 0.0109, "step": 362230 }, { - "epoch": 1.83, - "learning_rate": 2.586788826049008e-05, - "loss": 0.0078, + "epoch": 0.94, + "learning_rate": 0.0001591532501600649, + "loss": 0.0094, "step": 362240 }, { - "epoch": 1.83, - "learning_rate": 2.586032056747607e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015914936194369342, + "loss": 0.0146, "step": 362250 }, { - "epoch": 1.83, - "learning_rate": 2.585275287446206e-05, - "loss": 0.0075, + "epoch": 0.94, + "learning_rate": 0.00015914547372732196, + "loss": 0.0128, "step": 362260 }, { - "epoch": 1.83, - "learning_rate": 2.584518518144805e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.0001591415855109505, + "loss": 0.0148, "step": 362270 }, { - "epoch": 1.83, - "learning_rate": 2.583761748843404e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015913769729457904, + "loss": 0.0115, "step": 362280 }, { - "epoch": 1.83, - "learning_rate": 2.583004979542003e-05, - "loss": 0.0042, + "epoch": 0.94, + "learning_rate": 0.00015913380907820756, + "loss": 0.0114, "step": 362290 }, { - "epoch": 1.83, - "learning_rate": 2.582248210240602e-05, - "loss": 0.0082, + "epoch": 0.94, + "learning_rate": 0.0001591299208618361, + "loss": 0.0135, "step": 362300 }, { - "epoch": 1.83, - "learning_rate": 2.581491440939201e-05, - "loss": 0.0085, + "epoch": 0.94, + "learning_rate": 0.00015912603264546464, + "loss": 0.0094, "step": 362310 }, { - "epoch": 1.83, - "learning_rate": 2.5807346716378e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015912214442909318, + "loss": 0.0096, "step": 362320 }, { - "epoch": 1.83, - "learning_rate": 2.579977902336399e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.0001591182562127217, + "loss": 0.0124, "step": 362330 }, { - "epoch": 1.83, - "learning_rate": 2.5792211330349978e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015911436799635024, + "loss": 0.0118, "step": 362340 }, { - "epoch": 1.83, - "learning_rate": 2.578464363733597e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.0001591104797799788, + "loss": 0.0109, "step": 362350 }, { - "epoch": 1.83, - "learning_rate": 2.5777075944321958e-05, - "loss": 0.0079, + "epoch": 0.94, + "learning_rate": 0.00015910659156360732, + "loss": 0.0144, "step": 362360 }, { - "epoch": 1.83, - "learning_rate": 2.576950825130795e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015910270334723584, + "loss": 0.0117, "step": 362370 }, { - "epoch": 1.83, - "learning_rate": 2.5761940558293935e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015909881513086438, + "loss": 0.0111, "step": 362380 }, { - "epoch": 1.83, - "learning_rate": 2.5754372865279926e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015909492691449295, + "loss": 0.0111, "step": 362390 }, { - "epoch": 1.83, - "learning_rate": 2.5746805172265914e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015909103869812146, + "loss": 0.0148, "step": 362400 }, { - "epoch": 1.83, - "learning_rate": 2.5739237479251906e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015908715048175, + "loss": 0.0124, "step": 362410 }, { - "epoch": 1.83, - "learning_rate": 2.5731669786237894e-05, - "loss": 0.0094, + "epoch": 0.94, + "learning_rate": 0.00015908326226537852, + "loss": 0.0111, "step": 362420 }, { - "epoch": 1.83, - "learning_rate": 2.5724102093223886e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015907937404900709, + "loss": 0.0138, "step": 362430 }, { - "epoch": 1.83, - "learning_rate": 2.5716534400209874e-05, - "loss": 0.0073, + "epoch": 0.94, + "learning_rate": 0.0001590754858326356, + "loss": 0.0138, "step": 362440 }, { - "epoch": 1.83, - "learning_rate": 2.5708966707195866e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015907159761626414, + "loss": 0.0155, "step": 362450 }, { - "epoch": 1.83, - "learning_rate": 2.5701399014181854e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015906770939989266, + "loss": 0.0118, "step": 362460 }, { - "epoch": 1.83, - "learning_rate": 2.5693831321167845e-05, - "loss": 0.0073, + "epoch": 0.94, + "learning_rate": 0.00015906382118352123, + "loss": 0.0146, "step": 362470 }, { - "epoch": 1.83, - "learning_rate": 2.5686263628153834e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015905993296714974, + "loss": 0.0118, "step": 362480 }, { - "epoch": 1.83, - "learning_rate": 2.5678695935139825e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015905604475077828, + "loss": 0.0132, "step": 362490 }, { - "epoch": 1.83, - "learning_rate": 2.5671128242125814e-05, - "loss": 0.0088, + "epoch": 0.94, + "learning_rate": 0.0001590521565344068, + "loss": 0.0119, "step": 362500 }, { - "epoch": 1.83, - "learning_rate": 2.5663560549111805e-05, - "loss": 0.0039, + "epoch": 0.94, + "learning_rate": 0.00015904826831803534, + "loss": 0.0091, "step": 362510 }, { - "epoch": 1.83, - "learning_rate": 2.5655992856097793e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.0001590443801016639, + "loss": 0.0134, "step": 362520 }, { - "epoch": 1.83, - "learning_rate": 2.5648425163083785e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015904049188529242, + "loss": 0.0164, "step": 362530 }, { - "epoch": 1.83, - "learning_rate": 2.564085747006977e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015903660366892094, + "loss": 0.0147, "step": 362540 }, { - "epoch": 1.83, - "learning_rate": 2.563328977705576e-05, - "loss": 0.0036, + "epoch": 0.94, + "learning_rate": 0.00015903271545254948, + "loss": 0.0124, "step": 362550 }, { - "epoch": 1.83, - "learning_rate": 2.562572208404175e-05, - "loss": 0.0071, + "epoch": 0.94, + "learning_rate": 0.00015902882723617805, + "loss": 0.0105, "step": 362560 }, { - "epoch": 1.83, - "learning_rate": 2.561815439102774e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015902493901980656, + "loss": 0.0139, "step": 362570 }, { - "epoch": 1.83, - "learning_rate": 2.561058669801373e-05, - "loss": 0.004, + "epoch": 0.94, + "learning_rate": 0.0001590210508034351, + "loss": 0.0118, "step": 362580 }, { - "epoch": 1.83, - "learning_rate": 2.560301900499972e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015901716258706362, + "loss": 0.0175, "step": 362590 }, { - "epoch": 1.83, - "learning_rate": 2.559545131198571e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015901327437069219, + "loss": 0.0129, "step": 362600 }, { - "epoch": 1.83, - "learning_rate": 2.55878836189717e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.0001590093861543207, + "loss": 0.0138, "step": 362610 }, { - "epoch": 1.83, - "learning_rate": 2.558031592595769e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015900549793794924, + "loss": 0.0156, "step": 362620 }, { - "epoch": 1.83, - "learning_rate": 2.557274823294368e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015900160972157776, + "loss": 0.0151, "step": 362630 }, { - "epoch": 1.83, - "learning_rate": 2.556518053992967e-05, - "loss": 0.0076, + "epoch": 0.94, + "learning_rate": 0.00015899772150520632, + "loss": 0.0137, "step": 362640 }, { - "epoch": 1.83, - "learning_rate": 2.555761284691566e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015899383328883484, + "loss": 0.0149, "step": 362650 }, { - "epoch": 1.83, - "learning_rate": 2.555004515390165e-05, - "loss": 0.0034, + "epoch": 0.94, + "learning_rate": 0.00015898994507246338, + "loss": 0.0114, "step": 362660 }, { - "epoch": 1.83, - "learning_rate": 2.554247746088764e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.0001589860568560919, + "loss": 0.0122, "step": 362670 }, { - "epoch": 1.83, - "learning_rate": 2.553490976787363e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015898216863972046, + "loss": 0.0152, "step": 362680 }, { - "epoch": 1.83, - "learning_rate": 2.552734207485962e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015897828042334898, + "loss": 0.0124, "step": 362690 }, { - "epoch": 1.83, - "learning_rate": 2.5519774381845605e-05, - "loss": 0.0078, + "epoch": 0.94, + "learning_rate": 0.00015897439220697752, + "loss": 0.0154, "step": 362700 }, { - "epoch": 1.83, - "learning_rate": 2.5512206688831593e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015897050399060603, + "loss": 0.0145, "step": 362710 }, { - "epoch": 1.83, - "learning_rate": 2.5504638995817585e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.0001589666157742346, + "loss": 0.0117, "step": 362720 }, { - "epoch": 1.83, - "learning_rate": 2.5497071302803576e-05, - "loss": 0.0041, + "epoch": 0.94, + "learning_rate": 0.00015896272755786315, + "loss": 0.0139, "step": 362730 }, { - "epoch": 1.83, - "learning_rate": 2.5489503609789565e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015895883934149166, + "loss": 0.0116, "step": 362740 }, { - "epoch": 1.83, - "learning_rate": 2.5481935916775556e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.0001589549511251202, + "loss": 0.0123, "step": 362750 }, { - "epoch": 1.83, - "learning_rate": 2.5474368223761544e-05, - "loss": 0.0077, + "epoch": 0.94, + "learning_rate": 0.00015895106290874872, + "loss": 0.0117, "step": 362760 }, { - "epoch": 1.83, - "learning_rate": 2.5466800530747536e-05, - "loss": 0.0075, + "epoch": 0.94, + "learning_rate": 0.00015894717469237728, + "loss": 0.012, "step": 362770 }, { - "epoch": 1.83, - "learning_rate": 2.5459232837733524e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.0001589432864760058, + "loss": 0.011, "step": 362780 }, { - "epoch": 1.83, - "learning_rate": 2.5451665144719516e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.00015893939825963434, + "loss": 0.0121, "step": 362790 }, { - "epoch": 1.83, - "learning_rate": 2.5444097451705504e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015893551004326286, + "loss": 0.0111, "step": 362800 }, { - "epoch": 1.83, - "learning_rate": 2.5436529758691496e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015893162182689142, + "loss": 0.0098, "step": 362810 }, { - "epoch": 1.83, - "learning_rate": 2.5428962065677484e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.00015892773361051994, + "loss": 0.012, "step": 362820 }, { - "epoch": 1.83, - "learning_rate": 2.5421394372663476e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015892384539414848, + "loss": 0.0155, "step": 362830 }, { - "epoch": 1.83, - "learning_rate": 2.5413826679649464e-05, - "loss": 0.0092, + "epoch": 0.94, + "learning_rate": 0.000158919957177777, + "loss": 0.0104, "step": 362840 }, { - "epoch": 1.83, - "learning_rate": 2.540625898663545e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015891606896140556, + "loss": 0.0116, "step": 362850 }, { - "epoch": 1.83, - "learning_rate": 2.539869129362144e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015891218074503408, + "loss": 0.0104, "step": 362860 }, { - "epoch": 1.83, - "learning_rate": 2.539112360060743e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015890829252866262, + "loss": 0.0124, "step": 362870 }, { - "epoch": 1.83, - "learning_rate": 2.538355590759342e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015890440431229113, + "loss": 0.015, "step": 362880 }, { - "epoch": 1.83, - "learning_rate": 2.5375988214579408e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.0001589005160959197, + "loss": 0.0136, "step": 362890 }, { - "epoch": 1.83, - "learning_rate": 2.53684205215654e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015889662787954824, + "loss": 0.0132, "step": 362900 }, { - "epoch": 1.83, - "learning_rate": 2.5360852828551388e-05, - "loss": 0.0081, + "epoch": 0.94, + "learning_rate": 0.00015889273966317676, + "loss": 0.0133, "step": 362910 }, { - "epoch": 1.83, - "learning_rate": 2.535328513553738e-05, - "loss": 0.0071, + "epoch": 0.94, + "learning_rate": 0.0001588888514468053, + "loss": 0.0101, "step": 362920 }, { - "epoch": 1.83, - "learning_rate": 2.5345717442523368e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015888496323043384, + "loss": 0.0116, "step": 362930 }, { - "epoch": 1.83, - "learning_rate": 2.533814974950936e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015888107501406238, + "loss": 0.0119, "step": 362940 }, { - "epoch": 1.83, - "learning_rate": 2.5330582056495348e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.0001588771867976909, + "loss": 0.0133, "step": 362950 }, { - "epoch": 1.83, - "learning_rate": 2.532301436348134e-05, - "loss": 0.004, + "epoch": 0.94, + "learning_rate": 0.00015887329858131944, + "loss": 0.0133, "step": 362960 }, { - "epoch": 1.83, - "learning_rate": 2.5315446670467328e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015886941036494798, + "loss": 0.0127, "step": 362970 }, { - "epoch": 1.83, - "learning_rate": 2.530787897745332e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015886552214857652, + "loss": 0.011, "step": 362980 }, { - "epoch": 1.83, - "learning_rate": 2.530031128443931e-05, - "loss": 0.0088, + "epoch": 0.94, + "learning_rate": 0.00015886163393220504, + "loss": 0.013, "step": 362990 }, { - "epoch": 1.83, - "learning_rate": 2.52927435914253e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015885774571583358, + "loss": 0.0122, "step": 363000 }, { - "epoch": 1.83, - "eval_cer": 0.9144324104542716, - "eval_loss": 0.004368518013507128, - "eval_runtime": 116.7968, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.94, + "eval_cer": 0.8817474747050615, + "eval_loss": 0.0086388373747468, + "eval_runtime": 107.5493, + "eval_samples_per_second": 18.596, + "eval_steps_per_second": 4.649, "step": 363000 }, { - "epoch": 1.83, - "learning_rate": 2.5285175898411284e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.0001588538574994621, + "loss": 0.0145, "step": 363010 }, { - "epoch": 1.83, - "learning_rate": 2.5277608205397275e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015884996928309066, + "loss": 0.0131, "step": 363020 }, { - "epoch": 1.83, - "learning_rate": 2.5270040512383264e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015884608106671918, + "loss": 0.0121, "step": 363030 }, { - "epoch": 1.83, - "learning_rate": 2.5262472819369255e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.00015884219285034772, + "loss": 0.0131, "step": 363040 }, { - "epoch": 1.83, - "learning_rate": 2.5254905126355243e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015883830463397623, + "loss": 0.0086, "step": 363050 }, { - "epoch": 1.83, - "learning_rate": 2.5247337433341235e-05, - "loss": 0.0072, + "epoch": 0.94, + "learning_rate": 0.0001588344164176048, + "loss": 0.0095, "step": 363060 }, { - "epoch": 1.83, - "learning_rate": 2.5239769740327223e-05, - "loss": 0.0071, + "epoch": 0.94, + "learning_rate": 0.00015883052820123334, + "loss": 0.0112, "step": 363070 }, { - "epoch": 1.83, - "learning_rate": 2.5232202047313215e-05, - "loss": 0.0081, + "epoch": 0.94, + "learning_rate": 0.00015882663998486186, + "loss": 0.0121, "step": 363080 }, { - "epoch": 1.83, - "learning_rate": 2.5224634354299203e-05, - "loss": 0.0079, + "epoch": 0.94, + "learning_rate": 0.00015882275176849037, + "loss": 0.0126, "step": 363090 }, { - "epoch": 1.83, - "learning_rate": 2.5217066661285195e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015881886355211894, + "loss": 0.0112, "step": 363100 }, { - "epoch": 1.83, - "learning_rate": 2.5209498968271183e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015881497533574748, + "loss": 0.0168, "step": 363110 }, { - "epoch": 1.83, - "learning_rate": 2.5201931275257175e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.000158811087119376, + "loss": 0.0109, "step": 363120 }, { - "epoch": 1.83, - "learning_rate": 2.5194363582243163e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015880719890300454, + "loss": 0.013, "step": 363130 }, { - "epoch": 1.83, - "learning_rate": 2.5186795889229154e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015880331068663308, + "loss": 0.0115, "step": 363140 }, { - "epoch": 1.83, - "learning_rate": 2.5179228196215143e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015879942247026162, + "loss": 0.0121, "step": 363150 }, { - "epoch": 1.83, - "learning_rate": 2.5171660503201134e-05, - "loss": 0.0087, + "epoch": 0.94, + "learning_rate": 0.00015879553425389014, + "loss": 0.0118, "step": 363160 }, { - "epoch": 1.83, - "learning_rate": 2.516409281018712e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015879164603751868, + "loss": 0.0141, "step": 363170 }, { - "epoch": 1.83, - "learning_rate": 2.515652511717311e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015878775782114722, + "loss": 0.012, "step": 363180 }, { - "epoch": 1.83, - "learning_rate": 2.51489574241591e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.00015878386960477576, + "loss": 0.0159, "step": 363190 }, { - "epoch": 1.83, - "learning_rate": 2.514138973114509e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015877998138840428, + "loss": 0.0123, "step": 363200 }, { - "epoch": 1.83, - "learning_rate": 2.513382203813108e-05, - "loss": 0.0076, + "epoch": 0.94, + "learning_rate": 0.00015877609317203282, + "loss": 0.0135, "step": 363210 }, { - "epoch": 1.83, - "learning_rate": 2.512625434511707e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.0001587722049556614, + "loss": 0.0132, "step": 363220 }, { - "epoch": 1.83, - "learning_rate": 2.511868665210306e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.0001587683167392899, + "loss": 0.0097, "step": 363230 }, { - "epoch": 1.83, - "learning_rate": 2.511111895908905e-05, - "loss": 0.0041, + "epoch": 0.94, + "learning_rate": 0.00015876442852291842, + "loss": 0.015, "step": 363240 }, { - "epoch": 1.83, - "learning_rate": 2.510355126607504e-05, - "loss": 0.0079, + "epoch": 0.94, + "learning_rate": 0.00015876054030654696, + "loss": 0.012, "step": 363250 }, { - "epoch": 1.83, - "learning_rate": 2.509598357306103e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015875665209017547, + "loss": 0.0118, "step": 363260 }, { - "epoch": 1.83, - "learning_rate": 2.5088415880047018e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015875276387380404, + "loss": 0.0115, "step": 363270 }, { - "epoch": 1.83, - "learning_rate": 2.508084818703301e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015874887565743258, + "loss": 0.0138, "step": 363280 }, { - "epoch": 1.83, - "learning_rate": 2.5073280494018998e-05, - "loss": 0.0076, + "epoch": 0.94, + "learning_rate": 0.0001587449874410611, + "loss": 0.0133, "step": 363290 }, { - "epoch": 1.83, - "learning_rate": 2.506571280100499e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015874109922468964, + "loss": 0.0108, "step": 363300 }, { - "epoch": 1.83, - "learning_rate": 2.5058145107990978e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015873721100831818, + "loss": 0.0124, "step": 363310 }, { - "epoch": 1.83, - "learning_rate": 2.5050577414976966e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015873332279194672, + "loss": 0.0097, "step": 363320 }, { - "epoch": 1.83, - "learning_rate": 2.5043009721962954e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015872943457557524, + "loss": 0.0149, "step": 363330 }, { - "epoch": 1.83, - "learning_rate": 2.5035442028948946e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015872554635920378, + "loss": 0.0127, "step": 363340 }, { - "epoch": 1.83, - "learning_rate": 2.5027874335934934e-05, - "loss": 0.007, + "epoch": 0.94, + "learning_rate": 0.00015872165814283232, + "loss": 0.0113, "step": 363350 }, { - "epoch": 1.83, - "learning_rate": 2.5020306642920926e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015871776992646086, + "loss": 0.0136, "step": 363360 }, { - "epoch": 1.83, - "learning_rate": 2.5012738949906914e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.00015871388171008938, + "loss": 0.0136, "step": 363370 }, { - "epoch": 1.83, - "learning_rate": 2.5005171256892906e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015870999349371792, + "loss": 0.0182, "step": 363380 }, { - "epoch": 1.83, - "learning_rate": 2.4997603563878894e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.0001587061052773465, + "loss": 0.0109, "step": 363390 }, { - "epoch": 1.83, - "learning_rate": 2.4990035870864885e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.000158702217060975, + "loss": 0.0159, "step": 363400 }, { - "epoch": 1.83, - "learning_rate": 2.4982468177850874e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015869832884460352, + "loss": 0.0135, "step": 363410 }, { - "epoch": 1.83, - "learning_rate": 2.4974900484836865e-05, - "loss": 0.0041, + "epoch": 0.94, + "learning_rate": 0.00015869444062823206, + "loss": 0.0141, "step": 363420 }, { - "epoch": 1.83, - "learning_rate": 2.4967332791822853e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015869055241186063, + "loss": 0.0139, "step": 363430 }, { - "epoch": 1.83, - "learning_rate": 2.4959765098808845e-05, - "loss": 0.0078, + "epoch": 0.94, + "learning_rate": 0.00015868666419548914, + "loss": 0.0145, "step": 363440 }, { - "epoch": 1.83, - "learning_rate": 2.4952197405794833e-05, - "loss": 0.008, + "epoch": 0.94, + "learning_rate": 0.00015868277597911768, + "loss": 0.0106, "step": 363450 }, { - "epoch": 1.83, - "learning_rate": 2.4944629712780825e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.0001586788877627462, + "loss": 0.0131, "step": 363460 }, { - "epoch": 1.83, - "learning_rate": 2.4937062019766813e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015867499954637477, + "loss": 0.0146, "step": 363470 }, { - "epoch": 1.83, - "learning_rate": 2.49294943267528e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015867111133000328, + "loss": 0.0118, "step": 363480 }, { - "epoch": 1.83, - "learning_rate": 2.492192663373879e-05, - "loss": 0.0044, + "epoch": 0.94, + "learning_rate": 0.00015866722311363182, + "loss": 0.0123, "step": 363490 }, { - "epoch": 1.83, - "learning_rate": 2.491435894072478e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015866333489726034, + "loss": 0.0122, "step": 363500 }, { - "epoch": 1.83, - "learning_rate": 2.490679124771077e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015865944668088888, + "loss": 0.0149, "step": 363510 }, { - "epoch": 1.83, - "learning_rate": 2.489922355469676e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015865555846451742, + "loss": 0.0134, "step": 363520 }, { - "epoch": 1.83, - "learning_rate": 2.489165586168275e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015865167024814596, + "loss": 0.0111, "step": 363530 }, { - "epoch": 1.83, - "learning_rate": 2.488408816866874e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015864778203177448, + "loss": 0.0146, "step": 363540 }, { - "epoch": 1.83, - "learning_rate": 2.487652047565473e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015864389381540302, + "loss": 0.0123, "step": 363550 }, { - "epoch": 1.83, - "learning_rate": 2.486895278264072e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015864000559903156, + "loss": 0.0135, "step": 363560 }, { - "epoch": 1.83, - "learning_rate": 2.486138508962671e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.0001586361173826601, + "loss": 0.0136, "step": 363570 }, { - "epoch": 1.83, - "learning_rate": 2.48538173966127e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015863222916628862, + "loss": 0.0161, "step": 363580 }, { - "epoch": 1.83, - "learning_rate": 2.484624970359869e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.00015862834094991716, + "loss": 0.0128, "step": 363590 }, { - "epoch": 1.83, - "learning_rate": 2.483868201058468e-05, - "loss": 0.0092, + "epoch": 0.94, + "learning_rate": 0.00015862445273354573, + "loss": 0.0127, "step": 363600 }, { - "epoch": 1.83, - "learning_rate": 2.483111431757067e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015862056451717424, + "loss": 0.0133, "step": 363610 }, { - "epoch": 1.83, - "learning_rate": 2.482354662455666e-05, - "loss": 0.0083, + "epoch": 0.94, + "learning_rate": 0.00015861667630080278, + "loss": 0.0115, "step": 363620 }, { - "epoch": 1.83, - "learning_rate": 2.4815978931542648e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.0001586127880844313, + "loss": 0.0114, "step": 363630 }, { - "epoch": 1.83, - "learning_rate": 2.4808411238528633e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015860889986805987, + "loss": 0.013, "step": 363640 }, { - "epoch": 1.83, - "learning_rate": 2.4800843545514625e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015860501165168838, + "loss": 0.0132, "step": 363650 }, { - "epoch": 1.83, - "learning_rate": 2.4793275852500613e-05, - "loss": 0.0042, + "epoch": 0.94, + "learning_rate": 0.00015860112343531692, + "loss": 0.0145, "step": 363660 }, { - "epoch": 1.83, - "learning_rate": 2.4785708159486605e-05, - "loss": 0.0044, + "epoch": 0.94, + "learning_rate": 0.00015859723521894544, + "loss": 0.0127, "step": 363670 }, { - "epoch": 1.83, - "learning_rate": 2.4778140466472593e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.000158593347002574, + "loss": 0.0114, "step": 363680 }, { - "epoch": 1.83, - "learning_rate": 2.4770572773458584e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015858945878620252, + "loss": 0.0111, "step": 363690 }, { - "epoch": 1.83, - "learning_rate": 2.4763005080444576e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015858557056983106, + "loss": 0.0115, "step": 363700 }, { - "epoch": 1.83, - "learning_rate": 2.4755437387430564e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015858168235345958, + "loss": 0.0125, "step": 363710 }, { - "epoch": 1.84, - "learning_rate": 2.4747869694416556e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015857779413708814, + "loss": 0.011, "step": 363720 }, { - "epoch": 1.84, - "learning_rate": 2.4740302001402544e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015857390592071666, + "loss": 0.0123, "step": 363730 }, { - "epoch": 1.84, - "learning_rate": 2.4732734308388536e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.0001585700177043452, + "loss": 0.0121, "step": 363740 }, { - "epoch": 1.84, - "learning_rate": 2.4725166615374524e-05, - "loss": 0.0059, + "epoch": 0.94, + "learning_rate": 0.00015856612948797371, + "loss": 0.0125, "step": 363750 }, { - "epoch": 1.84, - "learning_rate": 2.4717598922360515e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015856224127160226, + "loss": 0.0112, "step": 363760 }, { - "epoch": 1.84, - "learning_rate": 2.4710031229346504e-05, - "loss": 0.0037, + "epoch": 0.94, + "learning_rate": 0.00015855835305523083, + "loss": 0.0126, "step": 363770 }, { - "epoch": 1.84, - "learning_rate": 2.4702463536332495e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.00015855446483885934, + "loss": 0.0143, "step": 363780 }, { - "epoch": 1.84, - "learning_rate": 2.4694895843318483e-05, - "loss": 0.007, + "epoch": 0.94, + "learning_rate": 0.00015855057662248788, + "loss": 0.0117, "step": 363790 }, { - "epoch": 1.84, - "learning_rate": 2.468732815030447e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.0001585466884061164, + "loss": 0.0087, "step": 363800 }, { - "epoch": 1.84, - "learning_rate": 2.467976045729046e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015854280018974496, + "loss": 0.0133, "step": 363810 }, { - "epoch": 1.84, - "learning_rate": 2.4672192764276448e-05, - "loss": 0.004, + "epoch": 0.94, + "learning_rate": 0.00015853891197337348, + "loss": 0.0143, "step": 363820 }, { - "epoch": 1.84, - "learning_rate": 2.466462507126244e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015853502375700202, + "loss": 0.0123, "step": 363830 }, { - "epoch": 1.84, - "learning_rate": 2.4657057378248428e-05, - "loss": 0.007, + "epoch": 0.94, + "learning_rate": 0.00015853113554063054, + "loss": 0.0116, "step": 363840 }, { - "epoch": 1.84, - "learning_rate": 2.464948968523442e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.0001585272473242591, + "loss": 0.0192, "step": 363850 }, { - "epoch": 1.84, - "learning_rate": 2.4641921992220408e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015852335910788762, + "loss": 0.0112, "step": 363860 }, { - "epoch": 1.84, - "learning_rate": 2.46343542992064e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015851947089151616, + "loss": 0.0122, "step": 363870 }, { - "epoch": 1.84, - "learning_rate": 2.4626786606192388e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015851558267514467, + "loss": 0.0163, "step": 363880 }, { - "epoch": 1.84, - "learning_rate": 2.461921891317838e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015851169445877324, + "loss": 0.0123, "step": 363890 }, { - "epoch": 1.84, - "learning_rate": 2.4611651220164367e-05, - "loss": 0.0072, + "epoch": 0.94, + "learning_rate": 0.00015850780624240176, + "loss": 0.0123, "step": 363900 }, { - "epoch": 1.84, - "learning_rate": 2.460408352715036e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.0001585039180260303, + "loss": 0.0201, "step": 363910 }, { - "epoch": 1.84, - "learning_rate": 2.4596515834136347e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015850002980965881, + "loss": 0.0125, "step": 363920 }, { - "epoch": 1.84, - "learning_rate": 2.458894814112234e-05, - "loss": 0.0069, + "epoch": 0.94, + "learning_rate": 0.00015849614159328738, + "loss": 0.0125, "step": 363930 }, { - "epoch": 1.84, - "learning_rate": 2.4581380448108327e-05, - "loss": 0.0073, + "epoch": 0.94, + "learning_rate": 0.00015849225337691592, + "loss": 0.0118, "step": 363940 }, { - "epoch": 1.84, - "learning_rate": 2.4573812755094315e-05, - "loss": 0.0068, + "epoch": 0.94, + "learning_rate": 0.00015848836516054444, + "loss": 0.0157, "step": 363950 }, { - "epoch": 1.84, - "learning_rate": 2.4566245062080304e-05, - "loss": 0.0043, + "epoch": 0.94, + "learning_rate": 0.00015848447694417295, + "loss": 0.0152, "step": 363960 }, { - "epoch": 1.84, - "learning_rate": 2.4558677369066295e-05, - "loss": 0.004, + "epoch": 0.94, + "learning_rate": 0.00015848058872780152, + "loss": 0.012, "step": 363970 }, { - "epoch": 1.84, - "learning_rate": 2.4551109676052283e-05, - "loss": 0.0039, + "epoch": 0.94, + "learning_rate": 0.00015847670051143006, + "loss": 0.0112, "step": 363980 }, { - "epoch": 1.84, - "learning_rate": 2.4543541983038275e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015847281229505858, + "loss": 0.0134, "step": 363990 }, { - "epoch": 1.84, - "learning_rate": 2.4535974290024263e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015846892407868712, + "loss": 0.0142, "step": 364000 }, { - "epoch": 1.84, - "eval_cer": 0.9144071801550111, - "eval_loss": 0.004426935221999884, - "eval_runtime": 116.6371, - "eval_samples_per_second": 17.147, - "eval_steps_per_second": 4.287, + "epoch": 0.94, + "eval_cer": 0.8817432757942589, + "eval_loss": 0.008785239420831203, + "eval_runtime": 107.5582, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, "step": 364000 }, { - "epoch": 1.84, - "learning_rate": 2.4528406597010255e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.00015846503586231563, + "loss": 0.0128, "step": 364010 }, { - "epoch": 1.84, - "learning_rate": 2.4520838903996243e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.0001584611476459442, + "loss": 0.0163, "step": 364020 }, { - "epoch": 1.84, - "learning_rate": 2.4513271210982235e-05, - "loss": 0.0074, + "epoch": 0.94, + "learning_rate": 0.00015845725942957272, + "loss": 0.0146, "step": 364030 }, { - "epoch": 1.84, - "learning_rate": 2.4505703517968223e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015845337121320126, + "loss": 0.0107, "step": 364040 }, { - "epoch": 1.84, - "learning_rate": 2.4498135824954214e-05, - "loss": 0.0067, + "epoch": 0.94, + "learning_rate": 0.00015844948299682977, + "loss": 0.0112, "step": 364050 }, { - "epoch": 1.84, - "learning_rate": 2.4490568131940203e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.00015844559478045834, + "loss": 0.011, "step": 364060 }, { - "epoch": 1.84, - "learning_rate": 2.4483000438926194e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015844170656408686, + "loss": 0.0107, "step": 364070 }, { - "epoch": 1.84, - "learning_rate": 2.4475432745912182e-05, - "loss": 0.007, + "epoch": 0.94, + "learning_rate": 0.0001584378183477154, + "loss": 0.011, "step": 364080 }, { - "epoch": 1.84, - "learning_rate": 2.4467865052898174e-05, - "loss": 0.0066, + "epoch": 0.94, + "learning_rate": 0.0001584339301313439, + "loss": 0.0123, "step": 364090 }, { - "epoch": 1.84, - "learning_rate": 2.4460297359884162e-05, - "loss": 0.0058, + "epoch": 0.94, + "learning_rate": 0.00015843004191497248, + "loss": 0.0117, "step": 364100 }, { - "epoch": 1.84, - "learning_rate": 2.445272966687015e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015842615369860102, + "loss": 0.0155, "step": 364110 }, { - "epoch": 1.84, - "learning_rate": 2.444516197385614e-05, - "loss": 0.0044, + "epoch": 0.94, + "learning_rate": 0.00015842226548222954, + "loss": 0.0136, "step": 364120 }, { - "epoch": 1.84, - "learning_rate": 2.443759428084213e-05, - "loss": 0.0064, + "epoch": 0.94, + "learning_rate": 0.00015841837726585805, + "loss": 0.0153, "step": 364130 }, { - "epoch": 1.84, - "learning_rate": 2.443002658782812e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015841448904948662, + "loss": 0.0112, "step": 364140 }, { - "epoch": 1.84, - "learning_rate": 2.442245889481411e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.00015841060083311516, + "loss": 0.0133, "step": 364150 }, { - "epoch": 1.84, - "learning_rate": 2.44148912018001e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015840671261674368, + "loss": 0.0132, "step": 364160 }, { - "epoch": 1.84, - "learning_rate": 2.440732350878609e-05, - "loss": 0.0049, + "epoch": 0.94, + "learning_rate": 0.00015840282440037222, + "loss": 0.0103, "step": 364170 }, { - "epoch": 1.84, - "learning_rate": 2.4399755815772078e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015839893618400076, + "loss": 0.011, "step": 364180 }, { - "epoch": 1.84, - "learning_rate": 2.439218812275807e-05, - "loss": 0.0054, + "epoch": 0.94, + "learning_rate": 0.0001583950479676293, + "loss": 0.0128, "step": 364190 }, { - "epoch": 1.84, - "learning_rate": 2.4384620429744058e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015839115975125782, + "loss": 0.011, "step": 364200 }, { - "epoch": 1.84, - "learning_rate": 2.437705273673005e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.00015838727153488636, + "loss": 0.0096, "step": 364210 }, { - "epoch": 1.84, - "learning_rate": 2.4369485043716038e-05, - "loss": 0.0083, + "epoch": 0.94, + "learning_rate": 0.0001583833833185149, + "loss": 0.011, "step": 364220 }, { - "epoch": 1.84, - "learning_rate": 2.436191735070203e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015837949510214344, + "loss": 0.0136, "step": 364230 }, { - "epoch": 1.84, - "learning_rate": 2.4354349657688018e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.00015837560688577196, + "loss": 0.0127, "step": 364240 }, { - "epoch": 1.84, - "learning_rate": 2.434678196467401e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.0001583717186694005, + "loss": 0.0155, "step": 364250 }, { - "epoch": 1.84, - "learning_rate": 2.4339214271659998e-05, - "loss": 0.006, + "epoch": 0.94, + "learning_rate": 0.000158367830453029, + "loss": 0.0122, "step": 364260 }, { - "epoch": 1.84, - "learning_rate": 2.4331646578645986e-05, - "loss": 0.0062, + "epoch": 0.94, + "learning_rate": 0.00015836394223665758, + "loss": 0.0134, "step": 364270 }, { - "epoch": 1.84, - "learning_rate": 2.4324078885631974e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.0001583600540202861, + "loss": 0.0135, "step": 364280 }, { - "epoch": 1.84, - "learning_rate": 2.4316511192617966e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015835616580391464, + "loss": 0.0128, "step": 364290 }, { - "epoch": 1.84, - "learning_rate": 2.4308943499603954e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015835227758754315, + "loss": 0.0161, "step": 364300 }, { - "epoch": 1.84, - "learning_rate": 2.4301375806589945e-05, - "loss": 0.0085, + "epoch": 0.94, + "learning_rate": 0.00015834838937117172, + "loss": 0.0138, "step": 364310 }, { - "epoch": 1.84, - "learning_rate": 2.4293808113575934e-05, - "loss": 0.0096, + "epoch": 0.94, + "learning_rate": 0.00015834450115480026, + "loss": 0.0131, "step": 364320 }, { - "epoch": 1.84, - "learning_rate": 2.4286240420561925e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015834061293842878, + "loss": 0.0127, "step": 364330 }, { - "epoch": 1.84, - "learning_rate": 2.4278672727547913e-05, - "loss": 0.0081, + "epoch": 0.94, + "learning_rate": 0.00015833672472205732, + "loss": 0.0155, "step": 364340 }, { - "epoch": 1.84, - "learning_rate": 2.4271105034533905e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015833283650568586, + "loss": 0.0108, "step": 364350 }, { - "epoch": 1.84, - "learning_rate": 2.4263537341519893e-05, - "loss": 0.0052, + "epoch": 0.94, + "learning_rate": 0.0001583289482893144, + "loss": 0.0105, "step": 364360 }, { - "epoch": 1.84, - "learning_rate": 2.4255969648505885e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015832506007294292, + "loss": 0.0121, "step": 364370 }, { - "epoch": 1.84, - "learning_rate": 2.4248401955491873e-05, - "loss": 0.0046, + "epoch": 0.94, + "learning_rate": 0.00015832117185657146, + "loss": 0.0128, "step": 364380 }, { - "epoch": 1.84, - "learning_rate": 2.4240834262477865e-05, - "loss": 0.0079, + "epoch": 0.94, + "learning_rate": 0.0001583172836402, + "loss": 0.0109, "step": 364390 }, { - "epoch": 1.84, - "learning_rate": 2.4233266569463853e-05, - "loss": 0.0051, + "epoch": 0.94, + "learning_rate": 0.00015831339542382854, + "loss": 0.0108, "step": 364400 }, { - "epoch": 1.84, - "learning_rate": 2.4225698876449845e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015830950720745706, + "loss": 0.0111, "step": 364410 }, { - "epoch": 1.84, - "learning_rate": 2.421813118343583e-05, - "loss": 0.0053, + "epoch": 0.94, + "learning_rate": 0.0001583056189910856, + "loss": 0.0138, "step": 364420 }, { - "epoch": 1.84, - "learning_rate": 2.421056349042182e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015830173077471414, + "loss": 0.0124, "step": 364430 }, { - "epoch": 1.84, - "learning_rate": 2.420299579740781e-05, - "loss": 0.0057, + "epoch": 0.94, + "learning_rate": 0.00015829784255834268, + "loss": 0.0118, "step": 364440 }, { - "epoch": 1.84, - "learning_rate": 2.41954281043938e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.0001582939543419712, + "loss": 0.0134, "step": 364450 }, { - "epoch": 1.84, - "learning_rate": 2.418786041137979e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015829006612559974, + "loss": 0.0124, "step": 364460 }, { - "epoch": 1.84, - "learning_rate": 2.418029271836578e-05, - "loss": 0.0061, + "epoch": 0.94, + "learning_rate": 0.00015828617790922825, + "loss": 0.0131, "step": 364470 }, { - "epoch": 1.84, - "learning_rate": 2.417272502535177e-05, - "loss": 0.0056, + "epoch": 0.94, + "learning_rate": 0.00015828228969285682, + "loss": 0.0201, "step": 364480 }, { - "epoch": 1.84, - "learning_rate": 2.416515733233776e-05, - "loss": 0.0045, + "epoch": 0.94, + "learning_rate": 0.00015827840147648536, + "loss": 0.0129, "step": 364490 }, { - "epoch": 1.84, - "learning_rate": 2.415758963932375e-05, - "loss": 0.005, + "epoch": 0.94, + "learning_rate": 0.00015827451326011388, + "loss": 0.0136, "step": 364500 }, { - "epoch": 1.84, - "learning_rate": 2.415002194630974e-05, - "loss": 0.0048, + "epoch": 0.94, + "learning_rate": 0.00015827062504374242, + "loss": 0.0112, "step": 364510 }, { - "epoch": 1.84, - "learning_rate": 2.414245425329573e-05, - "loss": 0.0047, + "epoch": 0.94, + "learning_rate": 0.00015826673682737096, + "loss": 0.0121, "step": 364520 }, { - "epoch": 1.84, - "learning_rate": 2.413488656028172e-05, - "loss": 0.0063, + "epoch": 0.94, + "learning_rate": 0.0001582628486109995, + "loss": 0.0131, "step": 364530 }, { - "epoch": 1.84, - "learning_rate": 2.412731886726771e-05, - "loss": 0.0065, + "epoch": 0.94, + "learning_rate": 0.00015825896039462802, + "loss": 0.0122, "step": 364540 }, { - "epoch": 1.84, - "learning_rate": 2.41197511742537e-05, - "loss": 0.0071, + "epoch": 0.94, + "learning_rate": 0.00015825507217825656, + "loss": 0.013, "step": 364550 }, { - "epoch": 1.84, - "learning_rate": 2.4112183481239688e-05, - "loss": 0.0055, + "epoch": 0.94, + "learning_rate": 0.0001582511839618851, + "loss": 0.01, "step": 364560 }, { - "epoch": 1.84, - "learning_rate": 2.410461578822568e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015824729574551364, + "loss": 0.0108, "step": 364570 }, { - "epoch": 1.84, - "learning_rate": 2.4097048095211665e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015824340752914216, + "loss": 0.0126, "step": 364580 }, { - "epoch": 1.84, - "learning_rate": 2.4089480402197653e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.0001582395193127707, + "loss": 0.0126, "step": 364590 }, { - "epoch": 1.84, - "learning_rate": 2.4081912709183644e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015823563109639924, + "loss": 0.0131, "step": 364600 }, { - "epoch": 1.84, - "learning_rate": 2.4074345016169633e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015823174288002778, + "loss": 0.0113, "step": 364610 }, { - "epoch": 1.84, - "learning_rate": 2.4066777323155624e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.0001582278546636563, + "loss": 0.012, "step": 364620 }, { - "epoch": 1.84, - "learning_rate": 2.4059209630141612e-05, - "loss": 0.0077, + "epoch": 0.95, + "learning_rate": 0.00015822396644728484, + "loss": 0.0121, "step": 364630 }, { - "epoch": 1.84, - "learning_rate": 2.4051641937127604e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.0001582200782309134, + "loss": 0.0156, "step": 364640 }, { - "epoch": 1.84, - "learning_rate": 2.4044074244113592e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015821619001454192, + "loss": 0.0114, "step": 364650 }, { - "epoch": 1.84, - "learning_rate": 2.4036506551099584e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015821230179817046, + "loss": 0.0119, "step": 364660 }, { - "epoch": 1.84, - "learning_rate": 2.4028938858085575e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.00015820841358179898, + "loss": 0.0111, "step": 364670 }, { - "epoch": 1.84, - "learning_rate": 2.4021371165071564e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015820452536542754, + "loss": 0.0137, "step": 364680 }, { - "epoch": 1.84, - "learning_rate": 2.4013803472057555e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015820063714905606, + "loss": 0.0117, "step": 364690 }, { - "epoch": 1.84, - "learning_rate": 2.4006235779043544e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.0001581967489326846, + "loss": 0.0169, "step": 364700 }, { - "epoch": 1.84, - "learning_rate": 2.3998668086029535e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015819286071631312, + "loss": 0.0123, "step": 364710 }, { - "epoch": 1.84, - "learning_rate": 2.3991100393015523e-05, - "loss": 0.0043, + "epoch": 0.95, + "learning_rate": 0.00015818897249994166, + "loss": 0.011, "step": 364720 }, { - "epoch": 1.84, - "learning_rate": 2.3983532700001515e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.0001581850842835702, + "loss": 0.0152, "step": 364730 }, { - "epoch": 1.84, - "learning_rate": 2.39759650069875e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015818119606719874, + "loss": 0.0102, "step": 364740 }, { - "epoch": 1.84, - "learning_rate": 2.3968397313973488e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015817730785082726, + "loss": 0.0143, "step": 364750 }, { - "epoch": 1.84, - "learning_rate": 2.396082962095948e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.0001581734196344558, + "loss": 0.0115, "step": 364760 }, { - "epoch": 1.84, - "learning_rate": 2.3953261927945468e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015816953141808434, + "loss": 0.0142, "step": 364770 }, { - "epoch": 1.84, - "learning_rate": 2.394569423493146e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015816564320171288, + "loss": 0.0155, "step": 364780 }, { - "epoch": 1.84, - "learning_rate": 2.3938126541917448e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.0001581617549853414, + "loss": 0.0096, "step": 364790 }, { - "epoch": 1.84, - "learning_rate": 2.393055884890344e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015815786676896994, + "loss": 0.0182, "step": 364800 }, { - "epoch": 1.84, - "learning_rate": 2.3922991155889427e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.0001581539785525985, + "loss": 0.0151, "step": 364810 }, { - "epoch": 1.84, - "learning_rate": 2.391542346287542e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015815009033622702, + "loss": 0.0138, "step": 364820 }, { - "epoch": 1.84, - "learning_rate": 2.3907855769861407e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015814620211985553, + "loss": 0.011, "step": 364830 }, { - "epoch": 1.84, - "learning_rate": 2.39002880768474e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015814231390348408, + "loss": 0.0131, "step": 364840 }, { - "epoch": 1.84, - "learning_rate": 2.3892720383833387e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015813842568711264, + "loss": 0.0166, "step": 364850 }, { - "epoch": 1.84, - "learning_rate": 2.388515269081938e-05, - "loss": 0.0039, + "epoch": 0.95, + "learning_rate": 0.00015813453747074116, + "loss": 0.0128, "step": 364860 }, { - "epoch": 1.84, - "learning_rate": 2.3877584997805367e-05, - "loss": 0.0083, + "epoch": 0.95, + "learning_rate": 0.0001581306492543697, + "loss": 0.0161, "step": 364870 }, { - "epoch": 1.84, - "learning_rate": 2.387001730479136e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015812676103799822, + "loss": 0.0142, "step": 364880 }, { - "epoch": 1.84, - "learning_rate": 2.3862449611777343e-05, - "loss": 0.0097, + "epoch": 0.95, + "learning_rate": 0.00015812287282162678, + "loss": 0.0135, "step": 364890 }, { - "epoch": 1.84, - "learning_rate": 2.3854881918763335e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.0001581189846052553, + "loss": 0.0122, "step": 364900 }, { - "epoch": 1.84, - "learning_rate": 2.3847314225749323e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015811509638888384, + "loss": 0.0134, "step": 364910 }, { - "epoch": 1.84, - "learning_rate": 2.3839746532735315e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.00015811120817251235, + "loss": 0.0122, "step": 364920 }, { - "epoch": 1.84, - "learning_rate": 2.3832178839721303e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015810731995614092, + "loss": 0.0122, "step": 364930 }, { - "epoch": 1.84, - "learning_rate": 2.3824611146707295e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015810343173976944, + "loss": 0.0146, "step": 364940 }, { - "epoch": 1.84, - "learning_rate": 2.3817043453693283e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015809954352339798, + "loss": 0.0108, "step": 364950 }, { - "epoch": 1.84, - "learning_rate": 2.3809475760679274e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.0001580956553070265, + "loss": 0.0119, "step": 364960 }, { - "epoch": 1.84, - "learning_rate": 2.3801908067665263e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015809176709065504, + "loss": 0.0125, "step": 364970 }, { - "epoch": 1.84, - "learning_rate": 2.3794340374651254e-05, - "loss": 0.004, + "epoch": 0.95, + "learning_rate": 0.0001580878788742836, + "loss": 0.0171, "step": 364980 }, { - "epoch": 1.84, - "learning_rate": 2.3786772681637243e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015808399065791212, + "loss": 0.0142, "step": 364990 }, { - "epoch": 1.84, - "learning_rate": 2.3779204988623234e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015808010244154063, + "loss": 0.0161, "step": 365000 }, { - "epoch": 1.84, - "eval_cer": 0.9144207657007667, - "eval_loss": 0.0044406414963305, - "eval_runtime": 116.6279, - "eval_samples_per_second": 17.149, - "eval_steps_per_second": 4.287, + "epoch": 0.95, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.00836771447211504, + "eval_runtime": 107.6249, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, "step": 365000 }, { - "epoch": 1.84, - "learning_rate": 2.3771637295609222e-05, - "loss": 0.004, + "epoch": 0.95, + "learning_rate": 0.00015807621422516918, + "loss": 0.0127, "step": 365010 }, { - "epoch": 1.84, - "learning_rate": 2.3764069602595214e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015807232600879774, + "loss": 0.0161, "step": 365020 }, { - "epoch": 1.84, - "learning_rate": 2.3756501909581202e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015806843779242626, + "loss": 0.0155, "step": 365030 }, { - "epoch": 1.84, - "learning_rate": 2.3748934216567194e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.0001580645495760548, + "loss": 0.0113, "step": 365040 }, { - "epoch": 1.84, - "learning_rate": 2.374136652355318e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015806066135968331, + "loss": 0.0109, "step": 365050 }, { - "epoch": 1.84, - "learning_rate": 2.373379883053917e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015805677314331188, + "loss": 0.0157, "step": 365060 }, { - "epoch": 1.84, - "learning_rate": 2.372623113752516e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.0001580528849269404, + "loss": 0.0126, "step": 365070 }, { - "epoch": 1.84, - "learning_rate": 2.371866344451115e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015804899671056894, + "loss": 0.0158, "step": 365080 }, { - "epoch": 1.84, - "learning_rate": 2.3711095751497138e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015804510849419745, + "loss": 0.0119, "step": 365090 }, { - "epoch": 1.84, - "learning_rate": 2.370352805848313e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015804122027782602, + "loss": 0.0125, "step": 365100 }, { - "epoch": 1.84, - "learning_rate": 2.3695960365469118e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015803733206145454, + "loss": 0.0133, "step": 365110 }, { - "epoch": 1.84, - "learning_rate": 2.368839267245511e-05, - "loss": 0.0032, + "epoch": 0.95, + "learning_rate": 0.00015803344384508308, + "loss": 0.0173, "step": 365120 }, { - "epoch": 1.84, - "learning_rate": 2.3680824979441098e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.0001580295556287116, + "loss": 0.0111, "step": 365130 }, { - "epoch": 1.84, - "learning_rate": 2.367325728642709e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015802566741234016, + "loss": 0.0141, "step": 365140 }, { - "epoch": 1.84, - "learning_rate": 2.3665689593413078e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015802177919596868, + "loss": 0.0127, "step": 365150 }, { - "epoch": 1.84, - "learning_rate": 2.365812190039907e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015801789097959722, + "loss": 0.0134, "step": 365160 }, { - "epoch": 1.84, - "learning_rate": 2.3650554207385058e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015801400276322573, + "loss": 0.014, "step": 365170 }, { - "epoch": 1.84, - "learning_rate": 2.364298651437105e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.0001580101145468543, + "loss": 0.0137, "step": 365180 }, { - "epoch": 1.84, - "learning_rate": 2.3635418821357037e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015800622633048284, + "loss": 0.0131, "step": 365190 }, { - "epoch": 1.84, - "learning_rate": 2.362785112834303e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015800233811411136, + "loss": 0.013, "step": 365200 }, { - "epoch": 1.84, - "learning_rate": 2.3620283435329014e-05, - "loss": 0.0072, + "epoch": 0.95, + "learning_rate": 0.0001579984498977399, + "loss": 0.0183, "step": 365210 }, { - "epoch": 1.84, - "learning_rate": 2.3612715742315005e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015799456168136841, + "loss": 0.0131, "step": 365220 }, { - "epoch": 1.84, - "learning_rate": 2.3605148049300994e-05, - "loss": 0.0073, + "epoch": 0.95, + "learning_rate": 0.00015799067346499698, + "loss": 0.0136, "step": 365230 }, { - "epoch": 1.84, - "learning_rate": 2.3597580356286985e-05, - "loss": 0.0079, + "epoch": 0.95, + "learning_rate": 0.0001579867852486255, + "loss": 0.0105, "step": 365240 }, { - "epoch": 1.84, - "learning_rate": 2.3590012663272973e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015798289703225404, + "loss": 0.0113, "step": 365250 }, { - "epoch": 1.84, - "learning_rate": 2.3582444970258965e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015797900881588255, + "loss": 0.0132, "step": 365260 }, { - "epoch": 1.84, - "learning_rate": 2.3574877277244953e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015797512059951112, + "loss": 0.0137, "step": 365270 }, { - "epoch": 1.84, - "learning_rate": 2.3567309584230945e-05, - "loss": 0.0083, + "epoch": 0.95, + "learning_rate": 0.00015797123238313964, + "loss": 0.0128, "step": 365280 }, { - "epoch": 1.84, - "learning_rate": 2.3559741891216933e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015796734416676818, + "loss": 0.0167, "step": 365290 }, { - "epoch": 1.84, - "learning_rate": 2.3552174198202925e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.0001579634559503967, + "loss": 0.0105, "step": 365300 }, { - "epoch": 1.84, - "learning_rate": 2.3544606505188913e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015795956773402526, + "loss": 0.0169, "step": 365310 }, { - "epoch": 1.84, - "learning_rate": 2.3537038812174905e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015795567951765378, + "loss": 0.0115, "step": 365320 }, { - "epoch": 1.84, - "learning_rate": 2.3529471119160893e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015795179130128232, + "loss": 0.0142, "step": 365330 }, { - "epoch": 1.84, - "learning_rate": 2.3521903426146884e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015794790308491083, + "loss": 0.0102, "step": 365340 }, { - "epoch": 1.84, - "learning_rate": 2.3514335733132873e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.0001579440148685394, + "loss": 0.014, "step": 365350 }, { - "epoch": 1.84, - "learning_rate": 2.3506768040118864e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015794012665216794, + "loss": 0.0111, "step": 365360 }, { - "epoch": 1.84, - "learning_rate": 2.349920034710485e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015793623843579646, + "loss": 0.0121, "step": 365370 }, { - "epoch": 1.84, - "learning_rate": 2.3491632654090837e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.000157932350219425, + "loss": 0.0131, "step": 365380 }, { - "epoch": 1.84, - "learning_rate": 2.348406496107683e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015792846200305354, + "loss": 0.0132, "step": 365390 }, { - "epoch": 1.84, - "learning_rate": 2.347649726806282e-05, - "loss": 0.0071, + "epoch": 0.95, + "learning_rate": 0.00015792457378668208, + "loss": 0.0149, "step": 365400 }, { - "epoch": 1.84, - "learning_rate": 2.346892957504881e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.0001579206855703106, + "loss": 0.0112, "step": 365410 }, { - "epoch": 1.84, - "learning_rate": 2.34613618820348e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015791679735393914, + "loss": 0.01, "step": 365420 }, { - "epoch": 1.84, - "learning_rate": 2.345379418902079e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015791290913756768, + "loss": 0.0138, "step": 365430 }, { - "epoch": 1.84, - "learning_rate": 2.344622649600678e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015790902092119622, + "loss": 0.0119, "step": 365440 }, { - "epoch": 1.84, - "learning_rate": 2.343865880299277e-05, - "loss": 0.0073, + "epoch": 0.95, + "learning_rate": 0.00015790513270482474, + "loss": 0.0145, "step": 365450 }, { - "epoch": 1.84, - "learning_rate": 2.343109110997876e-05, - "loss": 0.0074, + "epoch": 0.95, + "learning_rate": 0.00015790124448845328, + "loss": 0.0131, "step": 365460 }, { - "epoch": 1.84, - "learning_rate": 2.3423523416964748e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.0001578973562720818, + "loss": 0.0139, "step": 365470 }, { - "epoch": 1.84, - "learning_rate": 2.341595572395074e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015789346805571036, + "loss": 0.0166, "step": 365480 }, { - "epoch": 1.84, - "learning_rate": 2.3408388030936728e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015788957983933888, + "loss": 0.0136, "step": 365490 }, { - "epoch": 1.84, - "learning_rate": 2.340082033792272e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015788569162296742, + "loss": 0.0165, "step": 365500 }, { - "epoch": 1.84, - "learning_rate": 2.3393252644908708e-05, - "loss": 0.0069, + "epoch": 0.95, + "learning_rate": 0.00015788180340659593, + "loss": 0.01, "step": 365510 }, { - "epoch": 1.84, - "learning_rate": 2.3385684951894693e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.0001578779151902245, + "loss": 0.016, "step": 365520 }, { - "epoch": 1.84, - "learning_rate": 2.3378117258880684e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015787402697385304, + "loss": 0.0177, "step": 365530 }, { - "epoch": 1.84, - "learning_rate": 2.3370549565866672e-05, - "loss": 0.0039, + "epoch": 0.95, + "learning_rate": 0.00015787013875748156, + "loss": 0.0111, "step": 365540 }, { - "epoch": 1.84, - "learning_rate": 2.3362981872852664e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015786625054111007, + "loss": 0.0104, "step": 365550 }, { - "epoch": 1.84, - "learning_rate": 2.3355414179838652e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015786236232473864, + "loss": 0.0152, "step": 365560 }, { - "epoch": 1.84, - "learning_rate": 2.3347846486824644e-05, - "loss": 0.0081, + "epoch": 0.95, + "learning_rate": 0.00015785847410836718, + "loss": 0.0144, "step": 365570 }, { - "epoch": 1.84, - "learning_rate": 2.3340278793810632e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.0001578545858919957, + "loss": 0.0123, "step": 365580 }, { - "epoch": 1.84, - "learning_rate": 2.3332711100796624e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015785069767562424, + "loss": 0.0124, "step": 365590 }, { - "epoch": 1.84, - "learning_rate": 2.3325143407782612e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015784680945925278, + "loss": 0.0153, "step": 365600 }, { - "epoch": 1.84, - "learning_rate": 2.3317575714768604e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015784292124288132, + "loss": 0.0093, "step": 365610 }, { - "epoch": 1.84, - "learning_rate": 2.3310008021754592e-05, - "loss": 0.0037, + "epoch": 0.95, + "learning_rate": 0.00015783903302650984, + "loss": 0.0114, "step": 365620 }, { - "epoch": 1.84, - "learning_rate": 2.3302440328740583e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015783514481013838, + "loss": 0.0128, "step": 365630 }, { - "epoch": 1.84, - "learning_rate": 2.3294872635726575e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015783125659376692, + "loss": 0.0145, "step": 365640 }, { - "epoch": 1.84, - "learning_rate": 2.3287304942712563e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.00015782736837739546, + "loss": 0.0123, "step": 365650 }, { - "epoch": 1.84, - "learning_rate": 2.3279737249698555e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015782348016102397, + "loss": 0.011, "step": 365660 }, { - "epoch": 1.84, - "learning_rate": 2.3272169556684543e-05, - "loss": 0.0039, + "epoch": 0.95, + "learning_rate": 0.00015781959194465252, + "loss": 0.0114, "step": 365670 }, { - "epoch": 1.84, - "learning_rate": 2.3264601863670528e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015781570372828109, + "loss": 0.0123, "step": 365680 }, { - "epoch": 1.84, - "learning_rate": 2.325703417065652e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.0001578118155119096, + "loss": 0.0111, "step": 365690 }, { - "epoch": 1.84, - "learning_rate": 2.3249466477642508e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015780792729553814, + "loss": 0.0125, "step": 365700 }, { - "epoch": 1.85, - "learning_rate": 2.32418987846285e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015780403907916666, + "loss": 0.0148, "step": 365710 }, { - "epoch": 1.85, - "learning_rate": 2.3234331091614488e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015780015086279517, + "loss": 0.0125, "step": 365720 }, { - "epoch": 1.85, - "learning_rate": 2.322676339860048e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.00015779626264642374, + "loss": 0.0103, "step": 365730 }, { - "epoch": 1.85, - "learning_rate": 2.3219195705586467e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015779237443005228, + "loss": 0.0139, "step": 365740 }, { - "epoch": 1.85, - "learning_rate": 2.321162801257246e-05, - "loss": 0.0074, + "epoch": 0.95, + "learning_rate": 0.0001577884862136808, + "loss": 0.0128, "step": 365750 }, { - "epoch": 1.85, - "learning_rate": 2.3204060319558447e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015778459799730934, + "loss": 0.0125, "step": 365760 }, { - "epoch": 1.85, - "learning_rate": 2.319649262654444e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015778070978093788, + "loss": 0.0134, "step": 365770 }, { - "epoch": 1.85, - "learning_rate": 2.3188924933530427e-05, - "loss": 0.0105, + "epoch": 0.95, + "learning_rate": 0.00015777682156456642, + "loss": 0.013, "step": 365780 }, { - "epoch": 1.85, - "learning_rate": 2.318135724051642e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015777293334819493, + "loss": 0.0161, "step": 365790 }, { - "epoch": 1.85, - "learning_rate": 2.3173789547502407e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015776904513182348, + "loss": 0.0126, "step": 365800 }, { - "epoch": 1.85, - "learning_rate": 2.31662218544884e-05, - "loss": 0.0075, + "epoch": 0.95, + "learning_rate": 0.00015776515691545202, + "loss": 0.0132, "step": 365810 }, { - "epoch": 1.85, - "learning_rate": 2.3158654161474387e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015776126869908056, + "loss": 0.0151, "step": 365820 }, { - "epoch": 1.85, - "learning_rate": 2.3151086468460378e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015775738048270907, + "loss": 0.0133, "step": 365830 }, { - "epoch": 1.85, - "learning_rate": 2.3143518775446363e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015775349226633762, + "loss": 0.0109, "step": 365840 }, { - "epoch": 1.85, - "learning_rate": 2.3135951082432355e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015774960404996618, + "loss": 0.0122, "step": 365850 }, { - "epoch": 1.85, - "learning_rate": 2.3128383389418343e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.0001577457158335947, + "loss": 0.0146, "step": 365860 }, { - "epoch": 1.85, - "learning_rate": 2.3120815696404335e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015774182761722321, + "loss": 0.0159, "step": 365870 }, { - "epoch": 1.85, - "learning_rate": 2.3113248003390323e-05, - "loss": 0.0041, + "epoch": 0.95, + "learning_rate": 0.00015773793940085176, + "loss": 0.016, "step": 365880 }, { - "epoch": 1.85, - "learning_rate": 2.3105680310376314e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015773405118448032, + "loss": 0.0157, "step": 365890 }, { - "epoch": 1.85, - "learning_rate": 2.3098112617362303e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015773016296810884, + "loss": 0.0116, "step": 365900 }, { - "epoch": 1.85, - "learning_rate": 2.3090544924348294e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015772627475173738, + "loss": 0.0125, "step": 365910 }, { - "epoch": 1.85, - "learning_rate": 2.3082977231334282e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.0001577223865353659, + "loss": 0.0119, "step": 365920 }, { - "epoch": 1.85, - "learning_rate": 2.3075409538320274e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015771849831899446, + "loss": 0.0105, "step": 365930 }, { - "epoch": 1.85, - "learning_rate": 2.3067841845306262e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015771461010262298, + "loss": 0.0115, "step": 365940 }, { - "epoch": 1.85, - "learning_rate": 2.3060274152292254e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015771072188625152, + "loss": 0.0116, "step": 365950 }, { - "epoch": 1.85, - "learning_rate": 2.3052706459278242e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015770683366988003, + "loss": 0.0128, "step": 365960 }, { - "epoch": 1.85, - "learning_rate": 2.3045138766264234e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015770294545350858, + "loss": 0.0179, "step": 365970 }, { - "epoch": 1.85, - "learning_rate": 2.3037571073250222e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015769905723713712, + "loss": 0.0106, "step": 365980 }, { - "epoch": 1.85, - "learning_rate": 2.303000338023621e-05, - "loss": 0.0091, + "epoch": 0.95, + "learning_rate": 0.00015769516902076566, + "loss": 0.0158, "step": 365990 }, { - "epoch": 1.85, - "learning_rate": 2.30224356872222e-05, - "loss": 0.0038, + "epoch": 0.95, + "learning_rate": 0.00015769128080439417, + "loss": 0.0128, "step": 366000 }, { - "epoch": 1.85, - "eval_cer": 0.914423676889143, - "eval_loss": 0.004396693781018257, - "eval_runtime": 116.8468, - "eval_samples_per_second": 17.116, - "eval_steps_per_second": 4.279, + "epoch": 0.95, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.008484454825520515, + "eval_runtime": 107.5251, + "eval_samples_per_second": 18.6, + "eval_steps_per_second": 4.65, "step": 366000 }, { - "epoch": 1.85, - "learning_rate": 2.301486799420819e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015768739258802272, + "loss": 0.0139, "step": 366010 }, { - "epoch": 1.85, - "learning_rate": 2.3007300301194178e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015768350437165126, + "loss": 0.0125, "step": 366020 }, { - "epoch": 1.85, - "learning_rate": 2.299973260818017e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.0001576796161552798, + "loss": 0.011, "step": 366030 }, { - "epoch": 1.85, - "learning_rate": 2.2992164915166158e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.0001576757279389083, + "loss": 0.0134, "step": 366040 }, { - "epoch": 1.85, - "learning_rate": 2.298459722215215e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015767183972253685, + "loss": 0.0152, "step": 366050 }, { - "epoch": 1.85, - "learning_rate": 2.2977029529138138e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015766795150616542, + "loss": 0.0149, "step": 366060 }, { - "epoch": 1.85, - "learning_rate": 2.296946183612413e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015766406328979394, + "loss": 0.017, "step": 366070 }, { - "epoch": 1.85, - "learning_rate": 2.2961894143110118e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015766017507342248, + "loss": 0.0127, "step": 366080 }, { - "epoch": 1.85, - "learning_rate": 2.295432645009611e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.000157656286857051, + "loss": 0.0116, "step": 366090 }, { - "epoch": 1.85, - "learning_rate": 2.2946758757082097e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015765239864067956, + "loss": 0.019, "step": 366100 }, { - "epoch": 1.85, - "learning_rate": 2.293919106406809e-05, - "loss": 0.0087, + "epoch": 0.95, + "learning_rate": 0.00015764851042430808, + "loss": 0.0129, "step": 366110 }, { - "epoch": 1.85, - "learning_rate": 2.2931623371054077e-05, - "loss": 0.0076, + "epoch": 0.95, + "learning_rate": 0.00015764462220793662, + "loss": 0.01, "step": 366120 }, { - "epoch": 1.85, - "learning_rate": 2.292405567804007e-05, - "loss": 0.0091, + "epoch": 0.95, + "learning_rate": 0.00015764073399156513, + "loss": 0.0132, "step": 366130 }, { - "epoch": 1.85, - "learning_rate": 2.2916487985026057e-05, - "loss": 0.0043, + "epoch": 0.95, + "learning_rate": 0.0001576368457751937, + "loss": 0.0142, "step": 366140 }, { - "epoch": 1.85, - "learning_rate": 2.2908920292012045e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015763295755882222, + "loss": 0.0114, "step": 366150 }, { - "epoch": 1.85, - "learning_rate": 2.2901352598998034e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015762906934245076, + "loss": 0.0135, "step": 366160 }, { - "epoch": 1.85, - "learning_rate": 2.2893784905984025e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015762518112607927, + "loss": 0.0112, "step": 366170 }, { - "epoch": 1.85, - "learning_rate": 2.2886217212970013e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015762129290970784, + "loss": 0.0103, "step": 366180 }, { - "epoch": 1.85, - "learning_rate": 2.2878649519956005e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015761740469333636, + "loss": 0.0116, "step": 366190 }, { - "epoch": 1.85, - "learning_rate": 2.2871081826941993e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.0001576135164769649, + "loss": 0.0112, "step": 366200 }, { - "epoch": 1.85, - "learning_rate": 2.2863514133927985e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.0001576096282605934, + "loss": 0.011, "step": 366210 }, { - "epoch": 1.85, - "learning_rate": 2.2855946440913973e-05, - "loss": 0.007, - "step": 366220 + "epoch": 0.95, + "learning_rate": 0.00015760574004422195, + "loss": 0.0129, + "step": 366220 }, { - "epoch": 1.85, - "learning_rate": 2.2848378747899965e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015760185182785052, + "loss": 0.014, "step": 366230 }, { - "epoch": 1.85, - "learning_rate": 2.2840811054885953e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015759796361147904, + "loss": 0.0135, "step": 366240 }, { - "epoch": 1.85, - "learning_rate": 2.2833243361871944e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015759407539510758, + "loss": 0.0151, "step": 366250 }, { - "epoch": 1.85, - "learning_rate": 2.2825675668857933e-05, - "loss": 0.0073, + "epoch": 0.95, + "learning_rate": 0.0001575901871787361, + "loss": 0.0119, "step": 366260 }, { - "epoch": 1.85, - "learning_rate": 2.2818107975843924e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015758629896236466, + "loss": 0.0202, "step": 366270 }, { - "epoch": 1.85, - "learning_rate": 2.2810540282829912e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015758241074599318, + "loss": 0.0128, "step": 366280 }, { - "epoch": 1.85, - "learning_rate": 2.2802972589815904e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015757852252962172, + "loss": 0.0131, "step": 366290 }, { - "epoch": 1.85, - "learning_rate": 2.2795404896801892e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015757463431325023, + "loss": 0.0136, "step": 366300 }, { - "epoch": 1.85, - "learning_rate": 2.2787837203787877e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.0001575707460968788, + "loss": 0.0124, "step": 366310 }, { - "epoch": 1.85, - "learning_rate": 2.278026951077387e-05, - "loss": 0.0084, + "epoch": 0.95, + "learning_rate": 0.00015756685788050732, + "loss": 0.0111, "step": 366320 }, { - "epoch": 1.85, - "learning_rate": 2.2772701817759857e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015756296966413586, + "loss": 0.0154, "step": 366330 }, { - "epoch": 1.85, - "learning_rate": 2.276513412474585e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015755908144776437, + "loss": 0.0136, "step": 366340 }, { - "epoch": 1.85, - "learning_rate": 2.2757566431731837e-05, - "loss": 0.0077, + "epoch": 0.95, + "learning_rate": 0.00015755519323139294, + "loss": 0.0142, "step": 366350 }, { - "epoch": 1.85, - "learning_rate": 2.274999873871783e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015755130501502146, + "loss": 0.0153, "step": 366360 }, { - "epoch": 1.85, - "learning_rate": 2.274243104570382e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015754741679865, + "loss": 0.0134, "step": 366370 }, { - "epoch": 1.85, - "learning_rate": 2.2734863352689808e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.0001575435285822785, + "loss": 0.013, "step": 366380 }, { - "epoch": 1.85, - "learning_rate": 2.27272956596758e-05, - "loss": 0.0069, + "epoch": 0.95, + "learning_rate": 0.00015753964036590708, + "loss": 0.0105, "step": 366390 }, { - "epoch": 1.85, - "learning_rate": 2.2719727966661788e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015753575214953562, + "loss": 0.0109, "step": 366400 }, { - "epoch": 1.85, - "learning_rate": 2.271216027364778e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015753186393316414, + "loss": 0.0125, "step": 366410 }, { - "epoch": 1.85, - "learning_rate": 2.2704592580633768e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015752797571679265, + "loss": 0.0101, "step": 366420 }, { - "epoch": 1.85, - "learning_rate": 2.269702488761976e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015752408750042122, + "loss": 0.0145, "step": 366430 }, { - "epoch": 1.85, - "learning_rate": 2.2689457194605748e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015752019928404976, + "loss": 0.0132, "step": 366440 }, { - "epoch": 1.85, - "learning_rate": 2.268188950159174e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015751631106767828, + "loss": 0.0136, "step": 366450 }, { - "epoch": 1.85, - "learning_rate": 2.2674321808577728e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015751242285130682, + "loss": 0.0129, "step": 366460 }, { - "epoch": 1.85, - "learning_rate": 2.2666754115563712e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015750853463493533, + "loss": 0.0144, "step": 366470 }, { - "epoch": 1.85, - "learning_rate": 2.2659186422549704e-05, - "loss": 0.0086, + "epoch": 0.95, + "learning_rate": 0.0001575046464185639, + "loss": 0.0127, "step": 366480 }, { - "epoch": 1.85, - "learning_rate": 2.2651618729535692e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015750075820219242, + "loss": 0.0125, "step": 366490 }, { - "epoch": 1.85, - "learning_rate": 2.2644051036521684e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015749686998582096, + "loss": 0.0094, "step": 366500 }, { - "epoch": 1.85, - "learning_rate": 2.2636483343507672e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015749298176944947, + "loss": 0.0148, "step": 366510 }, { - "epoch": 1.85, - "learning_rate": 2.2628915650493664e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015748909355307804, + "loss": 0.0128, "step": 366520 }, { - "epoch": 1.85, - "learning_rate": 2.2621347957479652e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015748520533670656, + "loss": 0.014, "step": 366530 }, { - "epoch": 1.85, - "learning_rate": 2.2613780264465643e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.0001574813171203351, + "loss": 0.0129, "step": 366540 }, { - "epoch": 1.85, - "learning_rate": 2.260621257145163e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.0001574774289039636, + "loss": 0.0174, "step": 366550 }, { - "epoch": 1.85, - "learning_rate": 2.2598644878437623e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015747354068759218, + "loss": 0.0118, "step": 366560 }, { - "epoch": 1.85, - "learning_rate": 2.259107718542361e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015746965247122072, + "loss": 0.0158, "step": 366570 }, { - "epoch": 1.85, - "learning_rate": 2.2583509492409603e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015746576425484924, + "loss": 0.0168, "step": 366580 }, { - "epoch": 1.85, - "learning_rate": 2.257594179939559e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015746187603847775, + "loss": 0.011, "step": 366590 }, { - "epoch": 1.85, - "learning_rate": 2.2568374106381583e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015745798782210632, + "loss": 0.0124, "step": 366600 }, { - "epoch": 1.85, - "learning_rate": 2.256080641336757e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015745409960573486, + "loss": 0.0135, "step": 366610 }, { - "epoch": 1.85, - "learning_rate": 2.255323872035356e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.00015745021138936338, + "loss": 0.0133, "step": 366620 }, { - "epoch": 1.85, - "learning_rate": 2.2545671027339548e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015744632317299192, + "loss": 0.0131, "step": 366630 }, { - "epoch": 1.85, - "learning_rate": 2.253810333432554e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015744243495662046, + "loss": 0.0125, "step": 366640 }, { - "epoch": 1.85, - "learning_rate": 2.2530535641311527e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.000157438546740249, + "loss": 0.012, "step": 366650 }, { - "epoch": 1.85, - "learning_rate": 2.252296794829752e-05, - "loss": 0.008, + "epoch": 0.95, + "learning_rate": 0.00015743465852387752, + "loss": 0.0133, "step": 366660 }, { - "epoch": 1.85, - "learning_rate": 2.2515400255283507e-05, - "loss": 0.0044, + "epoch": 0.95, + "learning_rate": 0.00015743077030750606, + "loss": 0.0106, "step": 366670 }, { - "epoch": 1.85, - "learning_rate": 2.25078325622695e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.0001574268820911346, + "loss": 0.0126, "step": 366680 }, { - "epoch": 1.85, - "learning_rate": 2.2500264869255487e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015742299387476314, + "loss": 0.0142, "step": 366690 }, { - "epoch": 1.85, - "learning_rate": 2.249269717624148e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015741910565839165, + "loss": 0.0125, "step": 366700 }, { - "epoch": 1.85, - "learning_rate": 2.2485129483227467e-05, - "loss": 0.0041, + "epoch": 0.95, + "learning_rate": 0.0001574152174420202, + "loss": 0.0118, "step": 366710 }, { - "epoch": 1.85, - "learning_rate": 2.247756179021346e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.0001574113292256487, + "loss": 0.0141, "step": 366720 }, { - "epoch": 1.85, - "learning_rate": 2.2469994097199447e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.00015740744100927728, + "loss": 0.016, "step": 366730 }, { - "epoch": 1.85, - "learning_rate": 2.246242640418544e-05, - "loss": 0.0075, + "epoch": 0.95, + "learning_rate": 0.0001574035527929058, + "loss": 0.0133, "step": 366740 }, { - "epoch": 1.85, - "learning_rate": 2.2454858711171427e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.00015739966457653434, + "loss": 0.0115, "step": 366750 }, { - "epoch": 1.85, - "learning_rate": 2.2447291018157418e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015739577636016285, + "loss": 0.0119, "step": 366760 }, { - "epoch": 1.85, - "learning_rate": 2.2439723325143406e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.00015739188814379142, + "loss": 0.0122, "step": 366770 }, { - "epoch": 1.85, - "learning_rate": 2.2432155632129395e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015738799992741996, + "loss": 0.011, "step": 366780 }, { - "epoch": 1.85, - "learning_rate": 2.2424587939115383e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015738411171104848, + "loss": 0.0119, "step": 366790 }, { - "epoch": 1.85, - "learning_rate": 2.2417020246101374e-05, - "loss": 0.0092, + "epoch": 0.95, + "learning_rate": 0.00015738022349467702, + "loss": 0.0129, "step": 366800 }, { - "epoch": 1.85, - "learning_rate": 2.2409452553087363e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015737633527830556, + "loss": 0.0121, "step": 366810 }, { - "epoch": 1.85, - "learning_rate": 2.2401884860073354e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.0001573724470619341, + "loss": 0.0124, "step": 366820 }, { - "epoch": 1.85, - "learning_rate": 2.2394317167059342e-05, - "loss": 0.0085, + "epoch": 0.95, + "learning_rate": 0.00015736855884556261, + "loss": 0.0108, "step": 366830 }, { - "epoch": 1.85, - "learning_rate": 2.2386749474045334e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015736467062919116, + "loss": 0.0199, "step": 366840 }, { - "epoch": 1.85, - "learning_rate": 2.2379181781031322e-05, - "loss": 0.0069, + "epoch": 0.95, + "learning_rate": 0.0001573607824128197, + "loss": 0.0222, "step": 366850 }, { - "epoch": 1.85, - "learning_rate": 2.2371614088017314e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.00015735689419644824, + "loss": 0.0108, "step": 366860 }, { - "epoch": 1.85, - "learning_rate": 2.2364046395003302e-05, - "loss": 0.0075, + "epoch": 0.95, + "learning_rate": 0.00015735300598007675, + "loss": 0.0178, "step": 366870 }, { - "epoch": 1.85, - "learning_rate": 2.2356478701989294e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.0001573491177637053, + "loss": 0.011, "step": 366880 }, { - "epoch": 1.85, - "learning_rate": 2.2348911008975282e-05, - "loss": 0.0076, + "epoch": 0.95, + "learning_rate": 0.00015734522954733384, + "loss": 0.0134, "step": 366890 }, { - "epoch": 1.85, - "learning_rate": 2.2341343315961274e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015734134133096238, + "loss": 0.0227, "step": 366900 }, { - "epoch": 1.85, - "learning_rate": 2.2333775622947262e-05, - "loss": 0.0082, + "epoch": 0.95, + "learning_rate": 0.0001573374531145909, + "loss": 0.0129, "step": 366910 }, { - "epoch": 1.85, - "learning_rate": 2.2326207929933253e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015733356489821944, + "loss": 0.012, "step": 366920 }, { - "epoch": 1.85, - "learning_rate": 2.231864023691924e-05, - "loss": 0.0041, + "epoch": 0.95, + "learning_rate": 0.000157329676681848, + "loss": 0.0125, "step": 366930 }, { - "epoch": 1.85, - "learning_rate": 2.231107254390523e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015732578846547652, + "loss": 0.0112, "step": 366940 }, { - "epoch": 1.85, - "learning_rate": 2.2303504850891218e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015732190024910506, + "loss": 0.0134, "step": 366950 }, { - "epoch": 1.85, - "learning_rate": 2.229593715787721e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015731801203273357, + "loss": 0.0135, "step": 366960 }, { - "epoch": 1.85, - "learning_rate": 2.2288369464863198e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015731412381636212, + "loss": 0.013, "step": 366970 }, { - "epoch": 1.85, - "learning_rate": 2.228080177184919e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015731023559999066, + "loss": 0.012, "step": 366980 }, { - "epoch": 1.85, - "learning_rate": 2.2273234078835178e-05, - "loss": 0.0079, + "epoch": 0.95, + "learning_rate": 0.0001573063473836192, + "loss": 0.0154, "step": 366990 }, { - "epoch": 1.85, - "learning_rate": 2.226566638582117e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015730245916724771, + "loss": 0.0138, "step": 367000 }, { - "epoch": 1.85, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004412375390529633, - "eval_runtime": 116.7639, - "eval_samples_per_second": 17.129, - "eval_steps_per_second": 4.282, + "epoch": 0.95, + "eval_cer": 0.8817208816033121, + "eval_loss": 0.008482192642986774, + "eval_runtime": 107.6733, + "eval_samples_per_second": 18.575, + "eval_steps_per_second": 4.644, "step": 367000 }, { - "epoch": 1.85, - "learning_rate": 2.2258098692807157e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015729857095087626, + "loss": 0.0093, "step": 367010 }, { - "epoch": 1.85, - "learning_rate": 2.225053099979315e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.0001572946827345048, + "loss": 0.012, "step": 367020 }, { - "epoch": 1.85, - "learning_rate": 2.2242963306779137e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015729079451813334, + "loss": 0.0121, "step": 367030 }, { - "epoch": 1.85, - "learning_rate": 2.223539561376513e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015728690630176185, + "loss": 0.0134, "step": 367040 }, { - "epoch": 1.85, - "learning_rate": 2.2227827920751117e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.0001572830180853904, + "loss": 0.0134, "step": 367050 }, { - "epoch": 1.85, - "learning_rate": 2.222026022773711e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015727912986901894, + "loss": 0.0115, "step": 367060 }, { - "epoch": 1.85, - "learning_rate": 2.2212692534723097e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015727524165264748, + "loss": 0.0131, "step": 367070 }, { - "epoch": 1.85, - "learning_rate": 2.220512484170909e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.000157271353436276, + "loss": 0.0137, "step": 367080 }, { - "epoch": 1.85, - "learning_rate": 2.2197557148695073e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015726746521990453, + "loss": 0.0131, "step": 367090 }, { - "epoch": 1.85, - "learning_rate": 2.2189989455681065e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.0001572635770035331, + "loss": 0.0096, "step": 367100 }, { - "epoch": 1.85, - "learning_rate": 2.2182421762667053e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015725968878716162, + "loss": 0.0143, "step": 367110 }, { - "epoch": 1.85, - "learning_rate": 2.2174854069653045e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.00015725580057079016, + "loss": 0.017, "step": 367120 }, { - "epoch": 1.85, - "learning_rate": 2.2167286376639033e-05, - "loss": 0.0026, + "epoch": 0.95, + "learning_rate": 0.00015725191235441867, + "loss": 0.0112, "step": 367130 }, { - "epoch": 1.85, - "learning_rate": 2.2159718683625025e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015724802413804724, + "loss": 0.0099, "step": 367140 }, { - "epoch": 1.85, - "learning_rate": 2.2152150990611013e-05, - "loss": 0.007, + "epoch": 0.95, + "learning_rate": 0.00015724413592167576, + "loss": 0.0125, "step": 367150 }, { - "epoch": 1.85, - "learning_rate": 2.2144583297597004e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.0001572402477053043, + "loss": 0.0136, "step": 367160 }, { - "epoch": 1.85, - "learning_rate": 2.2137015604582993e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.0001572363594889328, + "loss": 0.0151, "step": 367170 }, { - "epoch": 1.85, - "learning_rate": 2.2129447911568984e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.00015723247127256138, + "loss": 0.0136, "step": 367180 }, { - "epoch": 1.85, - "learning_rate": 2.2121880218554973e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.0001572285830561899, + "loss": 0.0114, "step": 367190 }, { - "epoch": 1.85, - "learning_rate": 2.2114312525540964e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015722469483981844, + "loss": 0.0123, "step": 367200 }, { - "epoch": 1.85, - "learning_rate": 2.2106744832526952e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015722080662344695, + "loss": 0.0154, "step": 367210 }, { - "epoch": 1.85, - "learning_rate": 2.2099177139512944e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.0001572169184070755, + "loss": 0.013, "step": 367220 }, { - "epoch": 1.85, - "learning_rate": 2.2091609446498932e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015721303019070404, + "loss": 0.011, "step": 367230 }, { - "epoch": 1.85, - "learning_rate": 2.2084041753484924e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015720914197433258, + "loss": 0.0125, "step": 367240 }, { - "epoch": 1.85, - "learning_rate": 2.207647406047091e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.0001572052537579611, + "loss": 0.013, "step": 367250 }, { - "epoch": 1.85, - "learning_rate": 2.2068906367456897e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015720136554158963, + "loss": 0.0112, "step": 367260 }, { - "epoch": 1.85, - "learning_rate": 2.206133867444289e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.0001571974773252182, + "loss": 0.0085, "step": 367270 }, { - "epoch": 1.85, - "learning_rate": 2.2053770981428877e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015719358910884672, + "loss": 0.0173, "step": 367280 }, { - "epoch": 1.85, - "learning_rate": 2.2046203288414868e-05, - "loss": 0.0075, + "epoch": 0.95, + "learning_rate": 0.00015718970089247526, + "loss": 0.009, "step": 367290 }, { - "epoch": 1.85, - "learning_rate": 2.2038635595400856e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015718581267610377, + "loss": 0.014, "step": 367300 }, { - "epoch": 1.85, - "learning_rate": 2.2031067902386848e-05, - "loss": 0.0074, + "epoch": 0.95, + "learning_rate": 0.00015718192445973234, + "loss": 0.0123, "step": 367310 }, { - "epoch": 1.85, - "learning_rate": 2.2023500209372836e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.00015717803624336086, + "loss": 0.0125, "step": 367320 }, { - "epoch": 1.85, - "learning_rate": 2.2015932516358828e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.0001571741480269894, + "loss": 0.0147, "step": 367330 }, { - "epoch": 1.85, - "learning_rate": 2.200836482334482e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.0001571702598106179, + "loss": 0.0163, "step": 367340 }, { - "epoch": 1.85, - "learning_rate": 2.2000797130330808e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015716637159424648, + "loss": 0.0136, "step": 367350 }, { - "epoch": 1.85, - "learning_rate": 2.19932294373168e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.000157162483377875, + "loss": 0.0101, "step": 367360 }, { - "epoch": 1.85, - "learning_rate": 2.1985661744302788e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015715859516150354, + "loss": 0.0123, "step": 367370 }, { - "epoch": 1.85, - "learning_rate": 2.197809405128878e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015715470694513205, + "loss": 0.0134, "step": 367380 }, { - "epoch": 1.85, - "learning_rate": 2.1970526358274767e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.00015715081872876062, + "loss": 0.0124, "step": 367390 }, { - "epoch": 1.85, - "learning_rate": 2.196295866526076e-05, - "loss": 0.0064, + "epoch": 0.95, + "learning_rate": 0.00015714693051238914, + "loss": 0.013, "step": 367400 }, { - "epoch": 1.85, - "learning_rate": 2.1955390972246744e-05, - "loss": 0.0073, + "epoch": 0.95, + "learning_rate": 0.00015714304229601768, + "loss": 0.0145, "step": 367410 }, { - "epoch": 1.85, - "learning_rate": 2.1947823279232732e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.0001571391540796462, + "loss": 0.0131, "step": 367420 }, { - "epoch": 1.85, - "learning_rate": 2.1940255586218724e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015713526586327476, + "loss": 0.0172, "step": 367430 }, { - "epoch": 1.85, - "learning_rate": 2.1932687893204712e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.0001571313776469033, + "loss": 0.0144, "step": 367440 }, { - "epoch": 1.85, - "learning_rate": 2.1925120200190703e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.00015712748943053182, + "loss": 0.0124, "step": 367450 }, { - "epoch": 1.85, - "learning_rate": 2.1917552507176692e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015712360121416033, + "loss": 0.0143, "step": 367460 }, { - "epoch": 1.85, - "learning_rate": 2.1909984814162683e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015711971299778887, + "loss": 0.0163, "step": 367470 }, { - "epoch": 1.85, - "learning_rate": 2.190241712114867e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015711582478141744, + "loss": 0.0144, "step": 367480 }, { - "epoch": 1.85, - "learning_rate": 2.1894849428134663e-05, - "loss": 0.0086, + "epoch": 0.95, + "learning_rate": 0.00015711193656504596, + "loss": 0.0106, "step": 367490 }, { - "epoch": 1.85, - "learning_rate": 2.188728173512065e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.0001571080483486745, + "loss": 0.0113, "step": 367500 }, { - "epoch": 1.85, - "learning_rate": 2.1879714042106643e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.000157104160132303, + "loss": 0.0105, "step": 367510 }, { - "epoch": 1.85, - "learning_rate": 2.187214634909263e-05, - "loss": 0.0032, + "epoch": 0.95, + "learning_rate": 0.00015710027191593158, + "loss": 0.0121, "step": 367520 }, { - "epoch": 1.85, - "learning_rate": 2.1864578656078623e-05, - "loss": 0.0067, + "epoch": 0.95, + "learning_rate": 0.0001570963836995601, + "loss": 0.0117, "step": 367530 }, { - "epoch": 1.85, - "learning_rate": 2.185701096306461e-05, - "loss": 0.0082, + "epoch": 0.95, + "learning_rate": 0.00015709249548318864, + "loss": 0.0142, "step": 367540 }, { - "epoch": 1.85, - "learning_rate": 2.1849443270050603e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015708860726681715, + "loss": 0.0126, "step": 367550 }, { - "epoch": 1.85, - "learning_rate": 2.184187557703659e-05, - "loss": 0.0056, + "epoch": 0.95, + "learning_rate": 0.00015708471905044572, + "loss": 0.011, "step": 367560 }, { - "epoch": 1.85, - "learning_rate": 2.183430788402258e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015708083083407424, + "loss": 0.012, "step": 367570 }, { - "epoch": 1.85, - "learning_rate": 2.1826740191008567e-05, - "loss": 0.0051, + "epoch": 0.95, + "learning_rate": 0.00015707694261770278, + "loss": 0.0122, "step": 367580 }, { - "epoch": 1.85, - "learning_rate": 2.181917249799456e-05, - "loss": 0.0055, + "epoch": 0.95, + "learning_rate": 0.0001570730544013313, + "loss": 0.0106, "step": 367590 }, { - "epoch": 1.85, - "learning_rate": 2.1811604804980547e-05, - "loss": 0.0038, + "epoch": 0.95, + "learning_rate": 0.00015706916618495986, + "loss": 0.0146, "step": 367600 }, { - "epoch": 1.85, - "learning_rate": 2.180403711196654e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015706527796858837, + "loss": 0.0173, "step": 367610 }, { - "epoch": 1.85, - "learning_rate": 2.1796469418952527e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015706138975221692, + "loss": 0.013, "step": 367620 }, { - "epoch": 1.85, - "learning_rate": 2.178890172593852e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.00015705750153584543, + "loss": 0.0131, "step": 367630 }, { - "epoch": 1.85, - "learning_rate": 2.1781334032924507e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.000157053613319474, + "loss": 0.013, "step": 367640 }, { - "epoch": 1.85, - "learning_rate": 2.17737663399105e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015704972510310254, + "loss": 0.0131, "step": 367650 }, { - "epoch": 1.85, - "learning_rate": 2.1766198646896487e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015704583688673106, + "loss": 0.0126, "step": 367660 }, { - "epoch": 1.85, - "learning_rate": 2.1758630953882478e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.0001570419486703596, + "loss": 0.0123, "step": 367670 }, { - "epoch": 1.85, - "learning_rate": 2.1751063260868466e-05, - "loss": 0.0075, + "epoch": 0.95, + "learning_rate": 0.00015703806045398814, + "loss": 0.0141, "step": 367680 }, { - "epoch": 1.86, - "learning_rate": 2.1743495567854458e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015703417223761668, + "loss": 0.0133, "step": 367690 }, { - "epoch": 1.86, - "learning_rate": 2.1735927874840446e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.0001570302840212452, + "loss": 0.015, "step": 367700 }, { - "epoch": 1.86, - "learning_rate": 2.1728360181826438e-05, - "loss": 0.0069, + "epoch": 0.95, + "learning_rate": 0.00015702639580487374, + "loss": 0.0155, "step": 367710 }, { - "epoch": 1.86, - "learning_rate": 2.1720792488812423e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015702250758850225, + "loss": 0.0132, "step": 367720 }, { - "epoch": 1.86, - "learning_rate": 2.1713224795798414e-05, - "loss": 0.0086, + "epoch": 0.95, + "learning_rate": 0.00015701861937213082, + "loss": 0.0108, "step": 367730 }, { - "epoch": 1.86, - "learning_rate": 2.1705657102784402e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015701473115575933, + "loss": 0.0116, "step": 367740 }, { - "epoch": 1.86, - "learning_rate": 2.1698089409770394e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015701084293938788, + "loss": 0.0166, "step": 367750 }, { - "epoch": 1.86, - "learning_rate": 2.1690521716756382e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.0001570069547230164, + "loss": 0.0116, "step": 367760 }, { - "epoch": 1.86, - "learning_rate": 2.1682954023742374e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015700306650664496, + "loss": 0.0138, "step": 367770 }, { - "epoch": 1.86, - "learning_rate": 2.1675386330728362e-05, - "loss": 0.0077, + "epoch": 0.95, + "learning_rate": 0.00015699917829027347, + "loss": 0.0117, "step": 367780 }, { - "epoch": 1.86, - "learning_rate": 2.1667818637714354e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015699529007390202, + "loss": 0.012, "step": 367790 }, { - "epoch": 1.86, - "learning_rate": 2.1660250944700342e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015699140185753053, + "loss": 0.011, "step": 367800 }, { - "epoch": 1.86, - "learning_rate": 2.1652683251686334e-05, - "loss": 0.0085, + "epoch": 0.95, + "learning_rate": 0.0001569875136411591, + "loss": 0.0166, "step": 367810 }, { - "epoch": 1.86, - "learning_rate": 2.1645115558672322e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015698362542478764, + "loss": 0.0114, "step": 367820 }, { - "epoch": 1.86, - "learning_rate": 2.1637547865658313e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.00015697973720841616, + "loss": 0.0138, "step": 367830 }, { - "epoch": 1.86, - "learning_rate": 2.16299801726443e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.0001569758489920447, + "loss": 0.013, "step": 367840 }, { - "epoch": 1.86, - "learning_rate": 2.1622412479630293e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015697196077567324, + "loss": 0.018, "step": 367850 }, { - "epoch": 1.86, - "learning_rate": 2.161484478661628e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015696807255930178, + "loss": 0.0122, "step": 367860 }, { - "epoch": 1.86, - "learning_rate": 2.1607277093602273e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.0001569641843429303, + "loss": 0.0115, "step": 367870 }, { - "epoch": 1.86, - "learning_rate": 2.1599709400588258e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015696029612655884, + "loss": 0.0108, "step": 367880 }, { - "epoch": 1.86, - "learning_rate": 2.159214170757425e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015695640791018738, + "loss": 0.0157, "step": 367890 }, { - "epoch": 1.86, - "learning_rate": 2.1584574014560238e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015695251969381592, + "loss": 0.0152, "step": 367900 }, { - "epoch": 1.86, - "learning_rate": 2.157700632154623e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015694863147744443, + "loss": 0.0105, "step": 367910 }, { - "epoch": 1.86, - "learning_rate": 2.1569438628532218e-05, - "loss": 0.0072, + "epoch": 0.95, + "learning_rate": 0.00015694474326107298, + "loss": 0.009, "step": 367920 }, { - "epoch": 1.86, - "learning_rate": 2.156187093551821e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015694085504470152, + "loss": 0.0132, "step": 367930 }, { - "epoch": 1.86, - "learning_rate": 2.1554303242504197e-05, - "loss": 0.0066, + "epoch": 0.95, + "learning_rate": 0.00015693696682833006, + "loss": 0.0121, "step": 367940 }, { - "epoch": 1.86, - "learning_rate": 2.154673554949019e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015693307861195857, + "loss": 0.013, "step": 367950 }, { - "epoch": 1.86, - "learning_rate": 2.1539167856476177e-05, - "loss": 0.0076, + "epoch": 0.95, + "learning_rate": 0.00015692919039558712, + "loss": 0.0131, "step": 367960 }, { - "epoch": 1.86, - "learning_rate": 2.153160016346217e-05, - "loss": 0.0077, + "epoch": 0.95, + "learning_rate": 0.00015692530217921563, + "loss": 0.013, "step": 367970 }, { - "epoch": 1.86, - "learning_rate": 2.1524032470448157e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.0001569214139628442, + "loss": 0.0135, "step": 367980 }, { - "epoch": 1.86, - "learning_rate": 2.151646477743415e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015691752574647274, + "loss": 0.0118, "step": 367990 }, { - "epoch": 1.86, - "learning_rate": 2.1508897084420137e-05, - "loss": 0.0072, + "epoch": 0.95, + "learning_rate": 0.00015691363753010125, + "loss": 0.0121, "step": 368000 }, { - "epoch": 1.86, - "eval_cer": 0.9144285288697699, - "eval_loss": 0.004368205089122057, - "eval_runtime": 116.793, - "eval_samples_per_second": 17.124, - "eval_steps_per_second": 4.281, + "epoch": 0.95, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.008444735780358315, + "eval_runtime": 107.6844, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, "step": 368000 }, { - "epoch": 1.86, - "learning_rate": 2.150132939140613e-05, - "loss": 0.0076, + "epoch": 0.95, + "learning_rate": 0.00015690974931372977, + "loss": 0.0152, "step": 368010 }, { - "epoch": 1.86, - "learning_rate": 2.1493761698392117e-05, - "loss": 0.0044, + "epoch": 0.95, + "learning_rate": 0.00015690586109735834, + "loss": 0.011, "step": 368020 }, { - "epoch": 1.86, - "learning_rate": 2.1486194005378108e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015690197288098688, + "loss": 0.0137, "step": 368030 }, { - "epoch": 1.86, - "learning_rate": 2.1478626312364093e-05, - "loss": 0.0048, + "epoch": 0.95, + "learning_rate": 0.0001568980846646154, + "loss": 0.0153, "step": 368040 }, { - "epoch": 1.86, - "learning_rate": 2.1471058619350085e-05, - "loss": 0.0039, + "epoch": 0.95, + "learning_rate": 0.00015689419644824394, + "loss": 0.0169, "step": 368050 }, { - "epoch": 1.86, - "learning_rate": 2.1463490926336073e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015689030823187248, + "loss": 0.0136, "step": 368060 }, { - "epoch": 1.86, - "learning_rate": 2.1455923233322065e-05, - "loss": 0.0038, + "epoch": 0.95, + "learning_rate": 0.00015688642001550102, + "loss": 0.0134, "step": 368070 }, { - "epoch": 1.86, - "learning_rate": 2.1448355540308053e-05, - "loss": 0.0057, + "epoch": 0.95, + "learning_rate": 0.00015688253179912953, + "loss": 0.0142, "step": 368080 }, { - "epoch": 1.86, - "learning_rate": 2.1440787847294044e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015687864358275807, + "loss": 0.017, "step": 368090 }, { - "epoch": 1.86, - "learning_rate": 2.1433220154280033e-05, - "loss": 0.0078, + "epoch": 0.95, + "learning_rate": 0.00015687475536638662, + "loss": 0.0106, "step": 368100 }, { - "epoch": 1.86, - "learning_rate": 2.1425652461266024e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015687086715001516, + "loss": 0.0112, "step": 368110 }, { - "epoch": 1.86, - "learning_rate": 2.1418084768252012e-05, - "loss": 0.0062, + "epoch": 0.95, + "learning_rate": 0.00015686697893364367, + "loss": 0.0127, "step": 368120 }, { - "epoch": 1.86, - "learning_rate": 2.1410517075238004e-05, - "loss": 0.0109, + "epoch": 0.95, + "learning_rate": 0.00015686309071727221, + "loss": 0.014, "step": 368130 }, { - "epoch": 1.86, - "learning_rate": 2.1402949382223992e-05, - "loss": 0.0045, + "epoch": 0.95, + "learning_rate": 0.00015685920250090078, + "loss": 0.016, "step": 368140 }, { - "epoch": 1.86, - "learning_rate": 2.1395381689209984e-05, - "loss": 0.0061, + "epoch": 0.95, + "learning_rate": 0.0001568553142845293, + "loss": 0.0114, "step": 368150 }, { - "epoch": 1.86, - "learning_rate": 2.1387813996195972e-05, - "loss": 0.006, + "epoch": 0.95, + "learning_rate": 0.00015685142606815784, + "loss": 0.0104, "step": 368160 }, { - "epoch": 1.86, - "learning_rate": 2.1380246303181964e-05, - "loss": 0.0053, + "epoch": 0.95, + "learning_rate": 0.00015684753785178635, + "loss": 0.0134, "step": 368170 }, { - "epoch": 1.86, - "learning_rate": 2.1372678610167952e-05, - "loss": 0.0046, + "epoch": 0.95, + "learning_rate": 0.00015684364963541492, + "loss": 0.0114, "step": 368180 }, { - "epoch": 1.86, - "learning_rate": 2.1365110917153937e-05, - "loss": 0.0041, + "epoch": 0.95, + "learning_rate": 0.00015683976141904344, + "loss": 0.0121, "step": 368190 }, { - "epoch": 1.86, - "learning_rate": 2.135754322413993e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015683587320267198, + "loss": 0.0184, "step": 368200 }, { - "epoch": 1.86, - "learning_rate": 2.1349975531125917e-05, - "loss": 0.005, + "epoch": 0.95, + "learning_rate": 0.0001568319849863005, + "loss": 0.0149, "step": 368210 }, { - "epoch": 1.86, - "learning_rate": 2.1342407838111908e-05, - "loss": 0.0082, + "epoch": 0.95, + "learning_rate": 0.00015682809676992903, + "loss": 0.0108, "step": 368220 }, { - "epoch": 1.86, - "learning_rate": 2.1334840145097896e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015682420855355758, + "loss": 0.01, "step": 368230 }, { - "epoch": 1.86, - "learning_rate": 2.1327272452083888e-05, - "loss": 0.0047, + "epoch": 0.95, + "learning_rate": 0.00015682032033718612, + "loss": 0.0112, "step": 368240 }, { - "epoch": 1.86, - "learning_rate": 2.1319704759069876e-05, - "loss": 0.0059, + "epoch": 0.95, + "learning_rate": 0.00015681643212081463, + "loss": 0.0127, "step": 368250 }, { - "epoch": 1.86, - "learning_rate": 2.1312137066055868e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015681254390444317, + "loss": 0.0112, "step": 368260 }, { - "epoch": 1.86, - "learning_rate": 2.1304569373041856e-05, - "loss": 0.0102, + "epoch": 0.95, + "learning_rate": 0.00015680865568807172, + "loss": 0.0113, "step": 368270 }, { - "epoch": 1.86, - "learning_rate": 2.1297001680027848e-05, - "loss": 0.0049, + "epoch": 0.95, + "learning_rate": 0.00015680476747170026, + "loss": 0.0116, "step": 368280 }, { - "epoch": 1.86, - "learning_rate": 2.1289433987013836e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015680087925532877, + "loss": 0.0133, "step": 368290 }, { - "epoch": 1.86, - "learning_rate": 2.1281866293999827e-05, - "loss": 0.0052, + "epoch": 0.95, + "learning_rate": 0.00015679699103895731, + "loss": 0.0142, "step": 368300 }, { - "epoch": 1.86, - "learning_rate": 2.127429860098582e-05, - "loss": 0.0069, + "epoch": 0.95, + "learning_rate": 0.00015679310282258588, + "loss": 0.0137, "step": 368310 }, { - "epoch": 1.86, - "learning_rate": 2.1266730907971807e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.0001567892146062144, + "loss": 0.0129, "step": 368320 }, { - "epoch": 1.86, - "learning_rate": 2.12591632149578e-05, - "loss": 0.0044, + "epoch": 0.95, + "learning_rate": 0.0001567853263898429, + "loss": 0.0109, "step": 368330 }, { - "epoch": 1.86, - "learning_rate": 2.1251595521943787e-05, - "loss": 0.0074, + "epoch": 0.95, + "learning_rate": 0.00015678143817347145, + "loss": 0.0151, "step": 368340 }, { - "epoch": 1.86, - "learning_rate": 2.1244027828929772e-05, - "loss": 0.0058, + "epoch": 0.95, + "learning_rate": 0.00015677754995710002, + "loss": 0.0118, "step": 368350 }, { - "epoch": 1.86, - "learning_rate": 2.1236460135915764e-05, - "loss": 0.0065, + "epoch": 0.95, + "learning_rate": 0.00015677366174072854, + "loss": 0.0125, "step": 368360 }, { - "epoch": 1.86, - "learning_rate": 2.1228892442901752e-05, - "loss": 0.0042, + "epoch": 0.95, + "learning_rate": 0.00015676977352435708, + "loss": 0.0179, "step": 368370 }, { - "epoch": 1.86, - "learning_rate": 2.1221324749887743e-05, - "loss": 0.0044, + "epoch": 0.95, + "learning_rate": 0.0001567658853079856, + "loss": 0.0137, "step": 368380 }, { - "epoch": 1.86, - "learning_rate": 2.121375705687373e-05, - "loss": 0.0063, + "epoch": 0.95, + "learning_rate": 0.00015676199709161416, + "loss": 0.0139, "step": 368390 }, { - "epoch": 1.86, - "learning_rate": 2.1206189363859723e-05, - "loss": 0.0054, + "epoch": 0.95, + "learning_rate": 0.00015675810887524268, + "loss": 0.0139, "step": 368400 }, { - "epoch": 1.86, - "learning_rate": 2.119862167084571e-05, - "loss": 0.0068, + "epoch": 0.95, + "learning_rate": 0.00015675422065887122, + "loss": 0.0119, "step": 368410 }, { - "epoch": 1.86, - "learning_rate": 2.1191053977831703e-05, - "loss": 0.008, + "epoch": 0.95, + "learning_rate": 0.00015675033244249973, + "loss": 0.0145, "step": 368420 }, { - "epoch": 1.86, - "learning_rate": 2.118348628481769e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001567464442261283, + "loss": 0.0121, "step": 368430 }, { - "epoch": 1.86, - "learning_rate": 2.1175918591803683e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015674255600975682, + "loss": 0.0121, "step": 368440 }, { - "epoch": 1.86, - "learning_rate": 2.116835089878967e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015673866779338536, + "loss": 0.0116, "step": 368450 }, { - "epoch": 1.86, - "learning_rate": 2.1160783205775663e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015673477957701387, + "loss": 0.0111, "step": 368460 }, { - "epoch": 1.86, - "learning_rate": 2.115321551276165e-05, - "loss": 0.0037, + "epoch": 0.96, + "learning_rate": 0.0001567308913606424, + "loss": 0.0148, "step": 368470 }, { - "epoch": 1.86, - "learning_rate": 2.1145647819747642e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015672700314427095, + "loss": 0.0102, "step": 368480 }, { - "epoch": 1.86, - "learning_rate": 2.113808012673363e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.0001567231149278995, + "loss": 0.012, "step": 368490 }, { - "epoch": 1.86, - "learning_rate": 2.1130512433719622e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.000156719226711528, + "loss": 0.0133, "step": 368500 }, { - "epoch": 1.86, - "learning_rate": 2.1122944740705607e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015671533849515655, + "loss": 0.0098, "step": 368510 }, { - "epoch": 1.86, - "learning_rate": 2.11153770476916e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015671145027878512, + "loss": 0.0144, "step": 368520 }, { - "epoch": 1.86, - "learning_rate": 2.1107809354677587e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015670756206241364, + "loss": 0.0192, "step": 368530 }, { - "epoch": 1.86, - "learning_rate": 2.110024166166358e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015670367384604218, + "loss": 0.0124, "step": 368540 }, { - "epoch": 1.86, - "learning_rate": 2.1092673968649567e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.0001566997856296707, + "loss": 0.0115, "step": 368550 }, { - "epoch": 1.86, - "learning_rate": 2.108510627563556e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015669589741329926, + "loss": 0.0131, "step": 368560 }, { - "epoch": 1.86, - "learning_rate": 2.1077538582621547e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015669200919692778, + "loss": 0.0135, "step": 368570 }, { - "epoch": 1.86, - "learning_rate": 2.1069970889607538e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015668812098055632, + "loss": 0.0136, "step": 368580 }, { - "epoch": 1.86, - "learning_rate": 2.1062403196593526e-05, - "loss": 0.0073, + "epoch": 0.96, + "learning_rate": 0.00015668423276418483, + "loss": 0.0131, "step": 368590 }, { - "epoch": 1.86, - "learning_rate": 2.1054835503579518e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.0001566803445478134, + "loss": 0.0147, "step": 368600 }, { - "epoch": 1.86, - "learning_rate": 2.1047267810565506e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015667645633144191, + "loss": 0.0126, "step": 368610 }, { - "epoch": 1.86, - "learning_rate": 2.1039700117551498e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015667256811507046, + "loss": 0.0145, "step": 368620 }, { - "epoch": 1.86, - "learning_rate": 2.1032132424537486e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.00015666867989869897, + "loss": 0.0136, "step": 368630 }, { - "epoch": 1.86, - "learning_rate": 2.1024564731523478e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015666479168232754, + "loss": 0.0144, "step": 368640 }, { - "epoch": 1.86, - "learning_rate": 2.1016997038509466e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015666090346595605, + "loss": 0.0126, "step": 368650 }, { - "epoch": 1.86, - "learning_rate": 2.1009429345495458e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.0001566570152495846, + "loss": 0.0132, "step": 368660 }, { - "epoch": 1.86, - "learning_rate": 2.1001861652481442e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.0001566531270332131, + "loss": 0.0153, "step": 368670 }, { - "epoch": 1.86, - "learning_rate": 2.0994293959467434e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015664923881684168, + "loss": 0.0128, "step": 368680 }, { - "epoch": 1.86, - "learning_rate": 2.0986726266453422e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015664535060047022, + "loss": 0.0126, "step": 368690 }, { - "epoch": 1.86, - "learning_rate": 2.0979158573439414e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015664146238409874, + "loss": 0.0157, "step": 368700 }, { - "epoch": 1.86, - "learning_rate": 2.0971590880425402e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015663757416772728, + "loss": 0.0208, "step": 368710 }, { - "epoch": 1.86, - "learning_rate": 2.0964023187411394e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.0001566336859513558, + "loss": 0.0129, "step": 368720 }, { - "epoch": 1.86, - "learning_rate": 2.0956455494397382e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015662979773498436, + "loss": 0.0136, "step": 368730 }, { - "epoch": 1.86, - "learning_rate": 2.0948887801383373e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015662590951861287, + "loss": 0.0147, "step": 368740 }, { - "epoch": 1.86, - "learning_rate": 2.094132010836936e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015662202130224142, + "loss": 0.0129, "step": 368750 }, { - "epoch": 1.86, - "learning_rate": 2.0933752415355353e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015661813308586993, + "loss": 0.0131, "step": 368760 }, { - "epoch": 1.86, - "learning_rate": 2.092618472234134e-05, - "loss": 0.0068, - "step": 368770 + "epoch": 0.96, + "learning_rate": 0.0001566142448694985, + "loss": 0.0126, + "step": 368770 }, { - "epoch": 1.86, - "learning_rate": 2.0918617029327333e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015661035665312701, + "loss": 0.0162, "step": 368780 }, { - "epoch": 1.86, - "learning_rate": 2.091104933631332e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015660646843675556, + "loss": 0.0142, "step": 368790 }, { - "epoch": 1.86, - "learning_rate": 2.0903481643299313e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015660258022038407, + "loss": 0.0139, "step": 368800 }, { - "epoch": 1.86, - "learning_rate": 2.08959139502853e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015659869200401264, + "loss": 0.012, "step": 368810 }, { - "epoch": 1.86, - "learning_rate": 2.088834625727129e-05, - "loss": 0.0043, + "epoch": 0.96, + "learning_rate": 0.00015659480378764115, + "loss": 0.0116, "step": 368820 }, { - "epoch": 1.86, - "learning_rate": 2.0880778564257278e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.0001565909155712697, + "loss": 0.0114, "step": 368830 }, { - "epoch": 1.86, - "learning_rate": 2.087321087124327e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.0001565870273548982, + "loss": 0.0126, "step": 368840 }, { - "epoch": 1.86, - "learning_rate": 2.0865643178229257e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015658313913852678, + "loss": 0.0115, "step": 368850 }, { - "epoch": 1.86, - "learning_rate": 2.085807548521525e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015657925092215532, + "loss": 0.0101, "step": 368860 }, { - "epoch": 1.86, - "learning_rate": 2.0850507792201237e-05, - "loss": 0.0077, + "epoch": 0.96, + "learning_rate": 0.00015657536270578383, + "loss": 0.0121, "step": 368870 }, { - "epoch": 1.86, - "learning_rate": 2.084294009918723e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015657147448941238, + "loss": 0.0133, "step": 368880 }, { - "epoch": 1.86, - "learning_rate": 2.0835372406173217e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015656758627304092, + "loss": 0.0158, "step": 368890 }, { - "epoch": 1.86, - "learning_rate": 2.082780471315921e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015656369805666946, + "loss": 0.0166, "step": 368900 }, { - "epoch": 1.86, - "learning_rate": 2.0820237020145197e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.00015655980984029797, + "loss": 0.0139, "step": 368910 }, { - "epoch": 1.86, - "learning_rate": 2.081266932713119e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015655592162392652, + "loss": 0.0141, "step": 368920 }, { - "epoch": 1.86, - "learning_rate": 2.0805101634117177e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015655203340755506, + "loss": 0.0123, "step": 368930 }, { - "epoch": 1.86, - "learning_rate": 2.079753394110317e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.0001565481451911836, + "loss": 0.0167, "step": 368940 }, { - "epoch": 1.86, - "learning_rate": 2.0789966248089157e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015654425697481211, + "loss": 0.0147, "step": 368950 }, { - "epoch": 1.86, - "learning_rate": 2.0782398555075148e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.00015654036875844066, + "loss": 0.009, "step": 368960 }, { - "epoch": 1.86, - "learning_rate": 2.0774830862061136e-05, - "loss": 0.0043, + "epoch": 0.96, + "learning_rate": 0.00015653648054206917, + "loss": 0.0138, "step": 368970 }, { - "epoch": 1.86, - "learning_rate": 2.076726316904712e-05, - "loss": 0.0084, + "epoch": 0.96, + "learning_rate": 0.00015653259232569774, + "loss": 0.0155, "step": 368980 }, { - "epoch": 1.86, - "learning_rate": 2.0759695476033113e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015652870410932625, + "loss": 0.0165, "step": 368990 }, { - "epoch": 1.86, - "learning_rate": 2.07521277830191e-05, - "loss": 0.008, + "epoch": 0.96, + "learning_rate": 0.0001565248158929548, + "loss": 0.0112, "step": 369000 }, { - "epoch": 1.86, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.0044240448623895645, - "eval_runtime": 116.7122, - "eval_samples_per_second": 17.136, - "eval_steps_per_second": 4.284, + "epoch": 0.96, + "eval_cer": 0.8817586718005349, + "eval_loss": 0.008379627019166946, + "eval_runtime": 107.6158, + "eval_samples_per_second": 18.585, + "eval_steps_per_second": 4.646, "step": 369000 }, { - "epoch": 1.86, - "learning_rate": 2.0744560090005093e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.0001565209276765833, + "loss": 0.0113, "step": 369010 }, { - "epoch": 1.86, - "learning_rate": 2.0736992396991084e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015651703946021188, + "loss": 0.0141, "step": 369020 }, { - "epoch": 1.86, - "learning_rate": 2.0729424703977072e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015651315124384042, + "loss": 0.0177, "step": 369030 }, { - "epoch": 1.86, - "learning_rate": 2.0721857010963064e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015650926302746893, + "loss": 0.0142, "step": 369040 }, { - "epoch": 1.86, - "learning_rate": 2.0714289317949052e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015650537481109745, + "loss": 0.0106, "step": 369050 }, { - "epoch": 1.86, - "learning_rate": 2.0706721624935044e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015650148659472602, + "loss": 0.0175, "step": 369060 }, { - "epoch": 1.86, - "learning_rate": 2.0699153931921032e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.00015649759837835456, + "loss": 0.0104, "step": 369070 }, { - "epoch": 1.86, - "learning_rate": 2.0691586238907024e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.00015649371016198307, + "loss": 0.0124, "step": 369080 }, { - "epoch": 1.86, - "learning_rate": 2.0684018545893012e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015648982194561162, + "loss": 0.0149, "step": 369090 }, { - "epoch": 1.86, - "learning_rate": 2.0676450852879004e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015648593372924016, + "loss": 0.0161, "step": 369100 }, { - "epoch": 1.86, - "learning_rate": 2.0668883159864992e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.0001564820455128687, + "loss": 0.0134, "step": 369110 }, { - "epoch": 1.86, - "learning_rate": 2.0661315466850983e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.0001564781572964972, + "loss": 0.014, "step": 369120 }, { - "epoch": 1.86, - "learning_rate": 2.065374777383697e-05, - "loss": 0.0104, + "epoch": 0.96, + "learning_rate": 0.00015647426908012575, + "loss": 0.0105, "step": 369130 }, { - "epoch": 1.86, - "learning_rate": 2.0646180080822956e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.0001564703808637543, + "loss": 0.0171, "step": 369140 }, { - "epoch": 1.86, - "learning_rate": 2.0638612387808948e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015646649264738284, + "loss": 0.0131, "step": 369150 }, { - "epoch": 1.86, - "learning_rate": 2.0631044694794936e-05, - "loss": 0.0112, + "epoch": 0.96, + "learning_rate": 0.00015646260443101135, + "loss": 0.0129, "step": 369160 }, { - "epoch": 1.86, - "learning_rate": 2.0623477001780928e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.0001564587162146399, + "loss": 0.0159, "step": 369170 }, { - "epoch": 1.86, - "learning_rate": 2.0615909308766916e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015645482799826846, + "loss": 0.0107, "step": 369180 }, { - "epoch": 1.86, - "learning_rate": 2.0608341615752908e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015645093978189698, + "loss": 0.0132, "step": 369190 }, { - "epoch": 1.86, - "learning_rate": 2.0600773922738896e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001564470515655255, + "loss": 0.0127, "step": 369200 }, { - "epoch": 1.86, - "learning_rate": 2.0593206229724887e-05, - "loss": 0.0113, + "epoch": 0.96, + "learning_rate": 0.00015644316334915403, + "loss": 0.0127, "step": 369210 }, { - "epoch": 1.86, - "learning_rate": 2.0585638536710876e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015643927513278255, + "loss": 0.0115, "step": 369220 }, { - "epoch": 1.86, - "learning_rate": 2.0578070843696867e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015643538691641112, + "loss": 0.0172, "step": 369230 }, { - "epoch": 1.86, - "learning_rate": 2.0570503150682856e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.00015643149870003966, + "loss": 0.0142, "step": 369240 }, { - "epoch": 1.86, - "learning_rate": 2.0562935457668847e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015642761048366817, + "loss": 0.0169, "step": 369250 }, { - "epoch": 1.86, - "learning_rate": 2.0555367764654835e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015642372226729671, + "loss": 0.0149, "step": 369260 }, { - "epoch": 1.86, - "learning_rate": 2.0547800071640827e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015641983405092526, + "loss": 0.0144, "step": 369270 }, { - "epoch": 1.86, - "learning_rate": 2.054023237862682e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.0001564159458345538, + "loss": 0.0125, "step": 369280 }, { - "epoch": 1.86, - "learning_rate": 2.0532664685612803e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.0001564120576181823, + "loss": 0.0122, "step": 369290 }, { - "epoch": 1.86, - "learning_rate": 2.052509699259879e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015640816940181085, + "loss": 0.0103, "step": 369300 }, { - "epoch": 1.86, - "learning_rate": 2.0517529299584783e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.0001564042811854394, + "loss": 0.0167, "step": 369310 }, { - "epoch": 1.86, - "learning_rate": 2.050996160657077e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015640039296906794, + "loss": 0.0126, "step": 369320 }, { - "epoch": 1.86, - "learning_rate": 2.0502393913556763e-05, - "loss": 0.0086, + "epoch": 0.96, + "learning_rate": 0.00015639650475269645, + "loss": 0.0131, "step": 369330 }, { - "epoch": 1.86, - "learning_rate": 2.049482622054275e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.000156392616536325, + "loss": 0.0123, "step": 369340 }, { - "epoch": 1.86, - "learning_rate": 2.0487258527528743e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015638872831995356, + "loss": 0.0124, "step": 369350 }, { - "epoch": 1.86, - "learning_rate": 2.047969083451473e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015638484010358208, + "loss": 0.0148, "step": 369360 }, { - "epoch": 1.86, - "learning_rate": 2.0472123141500723e-05, - "loss": 0.0133, + "epoch": 0.96, + "learning_rate": 0.0001563809518872106, + "loss": 0.0124, "step": 369370 }, { - "epoch": 1.86, - "learning_rate": 2.046455544848671e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015637706367083913, + "loss": 0.0095, "step": 369380 }, { - "epoch": 1.86, - "learning_rate": 2.0456987755472703e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.0001563731754544677, + "loss": 0.0108, "step": 369390 }, { - "epoch": 1.86, - "learning_rate": 2.044942006245869e-05, - "loss": 0.008, + "epoch": 0.96, + "learning_rate": 0.00015636928723809622, + "loss": 0.0135, "step": 369400 }, { - "epoch": 1.86, - "learning_rate": 2.0441852369444682e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015636539902172476, + "loss": 0.0179, "step": 369410 }, { - "epoch": 1.86, - "learning_rate": 2.043428467643067e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015636151080535327, + "loss": 0.0124, "step": 369420 }, { - "epoch": 1.86, - "learning_rate": 2.0426716983416662e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015635762258898184, + "loss": 0.0136, "step": 369430 }, { - "epoch": 1.86, - "learning_rate": 2.041914929040265e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015635373437261036, + "loss": 0.0146, "step": 369440 }, { - "epoch": 1.86, - "learning_rate": 2.041158159738864e-05, - "loss": 0.0033, + "epoch": 0.96, + "learning_rate": 0.0001563498461562389, + "loss": 0.0118, "step": 369450 }, { - "epoch": 1.86, - "learning_rate": 2.0404013904374627e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.0001563459579398674, + "loss": 0.0148, "step": 369460 }, { - "epoch": 1.86, - "learning_rate": 2.039644621136062e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015634206972349595, + "loss": 0.0166, "step": 369470 }, { - "epoch": 1.86, - "learning_rate": 2.0388878518346607e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.0001563381815071245, + "loss": 0.011, "step": 369480 }, { - "epoch": 1.86, - "learning_rate": 2.0381310825332598e-05, - "loss": 0.0075, + "epoch": 0.96, + "learning_rate": 0.00015633429329075304, + "loss": 0.0158, "step": 369490 }, { - "epoch": 1.86, - "learning_rate": 2.0373743132318586e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015633040507438155, + "loss": 0.0097, "step": 369500 }, { - "epoch": 1.86, - "learning_rate": 2.0366175439304578e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.0001563265168580101, + "loss": 0.0144, "step": 369510 }, { - "epoch": 1.86, - "learning_rate": 2.0358607746290566e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015632262864163863, + "loss": 0.0107, "step": 369520 }, { - "epoch": 1.86, - "learning_rate": 2.0351040053276558e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015631874042526718, + "loss": 0.0185, "step": 369530 }, { - "epoch": 1.86, - "learning_rate": 2.0343472360262546e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.0001563148522088957, + "loss": 0.0116, "step": 369540 }, { - "epoch": 1.86, - "learning_rate": 2.0335904667248538e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015631096399252423, + "loss": 0.0129, "step": 369550 }, { - "epoch": 1.86, - "learning_rate": 2.0328336974234526e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001563070757761528, + "loss": 0.0141, "step": 369560 }, { - "epoch": 1.86, - "learning_rate": 2.0320769281220518e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015630318755978132, + "loss": 0.0103, "step": 369570 }, { - "epoch": 1.86, - "learning_rate": 2.0313201588206506e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015629929934340986, + "loss": 0.0135, "step": 369580 }, { - "epoch": 1.86, - "learning_rate": 2.0305633895192497e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015629541112703837, + "loss": 0.0105, "step": 369590 }, { - "epoch": 1.86, - "learning_rate": 2.0298066202178486e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015629152291066694, + "loss": 0.0168, "step": 369600 }, { - "epoch": 1.86, - "learning_rate": 2.0290498509164474e-05, - "loss": 0.0043, + "epoch": 0.96, + "learning_rate": 0.00015628763469429546, + "loss": 0.0118, "step": 369610 }, { - "epoch": 1.86, - "learning_rate": 2.0282930816150462e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.000156283746477924, + "loss": 0.0108, "step": 369620 }, { - "epoch": 1.86, - "learning_rate": 2.0275363123136454e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001562798582615525, + "loss": 0.0119, "step": 369630 }, { - "epoch": 1.86, - "learning_rate": 2.0267795430122442e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015627597004518108, + "loss": 0.0121, "step": 369640 }, { - "epoch": 1.86, - "learning_rate": 2.0260227737108433e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.0001562720818288096, + "loss": 0.0124, "step": 369650 }, { - "epoch": 1.86, - "learning_rate": 2.0252660044094422e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015626819361243814, + "loss": 0.0108, "step": 369660 }, { - "epoch": 1.87, - "learning_rate": 2.0245092351080413e-05, - "loss": 0.0085, + "epoch": 0.96, + "learning_rate": 0.00015626430539606665, + "loss": 0.0112, "step": 369670 }, { - "epoch": 1.87, - "learning_rate": 2.02375246580664e-05, - "loss": 0.0072, + "epoch": 0.96, + "learning_rate": 0.0001562604171796952, + "loss": 0.0137, "step": 369680 }, { - "epoch": 1.87, - "learning_rate": 2.0229956965052393e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015625652896332373, + "loss": 0.0107, "step": 369690 }, { - "epoch": 1.87, - "learning_rate": 2.022238927203838e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015625264074695228, + "loss": 0.0126, "step": 369700 }, { - "epoch": 1.87, - "learning_rate": 2.0214821579024373e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001562487525305808, + "loss": 0.014, "step": 369710 }, { - "epoch": 1.87, - "learning_rate": 2.020725388601036e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.00015624486431420933, + "loss": 0.0146, "step": 369720 }, { - "epoch": 1.87, - "learning_rate": 2.0199686192996353e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.0001562409760978379, + "loss": 0.0136, "step": 369730 }, { - "epoch": 1.87, - "learning_rate": 2.019211849998234e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015623708788146642, + "loss": 0.0146, "step": 369740 }, { - "epoch": 1.87, - "learning_rate": 2.0184550806968333e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015623319966509496, + "loss": 0.016, "step": 369750 }, { - "epoch": 1.87, - "learning_rate": 2.017698311395432e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015622931144872347, + "loss": 0.0135, "step": 369760 }, { - "epoch": 1.87, - "learning_rate": 2.016941542094031e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015622542323235204, + "loss": 0.0119, "step": 369770 }, { - "epoch": 1.87, - "learning_rate": 2.0161847727926297e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015622153501598055, + "loss": 0.0137, "step": 369780 }, { - "epoch": 1.87, - "learning_rate": 2.015428003491229e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.0001562176467996091, + "loss": 0.0165, "step": 369790 }, { - "epoch": 1.87, - "learning_rate": 2.0146712341898277e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.0001562137585832376, + "loss": 0.0159, "step": 369800 }, { - "epoch": 1.87, - "learning_rate": 2.013914464888427e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015620987036686618, + "loss": 0.0116, "step": 369810 }, { - "epoch": 1.87, - "learning_rate": 2.0131576955870257e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.0001562059821504947, + "loss": 0.012, "step": 369820 }, { - "epoch": 1.87, - "learning_rate": 2.012400926285625e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015620209393412324, + "loss": 0.0105, "step": 369830 }, { - "epoch": 1.87, - "learning_rate": 2.0116441569842237e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.00015619820571775175, + "loss": 0.0132, "step": 369840 }, { - "epoch": 1.87, - "learning_rate": 2.010887387682823e-05, - "loss": 0.0043, + "epoch": 0.96, + "learning_rate": 0.00015619431750138032, + "loss": 0.0099, "step": 369850 }, { - "epoch": 1.87, - "learning_rate": 2.0101306183814217e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015619042928500883, + "loss": 0.0116, "step": 369860 }, { - "epoch": 1.87, - "learning_rate": 2.0093738490800208e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015618654106863738, + "loss": 0.0221, "step": 369870 }, { - "epoch": 1.87, - "learning_rate": 2.0086170797786196e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.0001561826528522659, + "loss": 0.0167, "step": 369880 }, { - "epoch": 1.87, - "learning_rate": 2.0078603104772188e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015617876463589446, + "loss": 0.011, "step": 369890 }, { - "epoch": 1.87, - "learning_rate": 2.0071035411758176e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.000156174876419523, + "loss": 0.0134, "step": 369900 }, { - "epoch": 1.87, - "learning_rate": 2.0063467718744168e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015617098820315151, + "loss": 0.011, "step": 369910 }, { - "epoch": 1.87, - "learning_rate": 2.0055900025730153e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.00015616709998678003, + "loss": 0.012, "step": 369920 }, { - "epoch": 1.87, - "learning_rate": 2.004833233271614e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015616321177040857, + "loss": 0.0131, "step": 369930 }, { - "epoch": 1.87, - "learning_rate": 2.0040764639702132e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015615932355403714, + "loss": 0.0112, "step": 369940 }, { - "epoch": 1.87, - "learning_rate": 2.003319694668812e-05, - "loss": 0.0042, + "epoch": 0.96, + "learning_rate": 0.00015615543533766565, + "loss": 0.0145, "step": 369950 }, { - "epoch": 1.87, - "learning_rate": 2.0025629253674112e-05, - "loss": 0.0084, + "epoch": 0.96, + "learning_rate": 0.0001561515471212942, + "loss": 0.0178, "step": 369960 }, { - "epoch": 1.87, - "learning_rate": 2.00180615606601e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.0001561476589049227, + "loss": 0.016, "step": 369970 }, { - "epoch": 1.87, - "learning_rate": 2.0010493867646092e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015614377068855128, + "loss": 0.0095, "step": 369980 }, { - "epoch": 1.87, - "learning_rate": 2.0002926174632084e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.0001561398824721798, + "loss": 0.0164, "step": 369990 }, { - "epoch": 1.87, - "learning_rate": 1.9995358481618072e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015613599425580834, + "loss": 0.0116, "step": 370000 }, { - "epoch": 1.87, - "eval_cer": 0.9144246472852683, - "eval_loss": 0.004436591174453497, - "eval_runtime": 116.7427, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.96, + "eval_cer": 0.8817068852339703, + "eval_loss": 0.008635921403765678, + "eval_runtime": 107.4637, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, "step": 370000 }, { - "epoch": 1.87, - "learning_rate": 1.9987790788604064e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015613210603943685, + "loss": 0.0141, "step": 370010 }, { - "epoch": 1.87, - "learning_rate": 1.9980223095590052e-05, - "loss": 0.0077, + "epoch": 0.96, + "learning_rate": 0.00015612821782306542, + "loss": 0.0127, "step": 370020 }, { - "epoch": 1.87, - "learning_rate": 1.9972655402576043e-05, - "loss": 0.0039, + "epoch": 0.96, + "learning_rate": 0.00015612432960669393, + "loss": 0.0136, "step": 370030 }, { - "epoch": 1.87, - "learning_rate": 1.996508770956203e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015612044139032247, + "loss": 0.022, "step": 370040 }, { - "epoch": 1.87, - "learning_rate": 1.9957520016548023e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.000156116553173951, + "loss": 0.0175, "step": 370050 }, { - "epoch": 1.87, - "learning_rate": 1.994995232353401e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015611266495757956, + "loss": 0.0168, "step": 370060 }, { - "epoch": 1.87, - "learning_rate": 1.9942384630520003e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015610877674120807, + "loss": 0.0143, "step": 370070 }, { - "epoch": 1.87, - "learning_rate": 1.9934816937505988e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015610488852483661, + "loss": 0.0107, "step": 370080 }, { - "epoch": 1.87, - "learning_rate": 1.9927249244491976e-05, - "loss": 0.0043, + "epoch": 0.96, + "learning_rate": 0.00015610100030846513, + "loss": 0.0133, "step": 370090 }, { - "epoch": 1.87, - "learning_rate": 1.9919681551477968e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.0001560971120920937, + "loss": 0.0125, "step": 370100 }, { - "epoch": 1.87, - "learning_rate": 1.9912113858463956e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015609322387572224, + "loss": 0.0106, "step": 370110 }, { - "epoch": 1.87, - "learning_rate": 1.9904546165449948e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015608933565935075, + "loss": 0.0127, "step": 370120 }, { - "epoch": 1.87, - "learning_rate": 1.9896978472435936e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.0001560854474429793, + "loss": 0.0148, "step": 370130 }, { - "epoch": 1.87, - "learning_rate": 1.9889410779421927e-05, - "loss": 0.0073, + "epoch": 0.96, + "learning_rate": 0.00015608155922660784, + "loss": 0.016, "step": 370140 }, { - "epoch": 1.87, - "learning_rate": 1.9881843086407916e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015607767101023638, + "loss": 0.0108, "step": 370150 }, { - "epoch": 1.87, - "learning_rate": 1.9874275393393907e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.0001560737827938649, + "loss": 0.0151, "step": 370160 }, { - "epoch": 1.87, - "learning_rate": 1.9866707700379895e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015606989457749343, + "loss": 0.0139, "step": 370170 }, { - "epoch": 1.87, - "learning_rate": 1.9859140007365887e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015606600636112195, + "loss": 0.0118, "step": 370180 }, { - "epoch": 1.87, - "learning_rate": 1.9851572314351875e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015606211814475052, + "loss": 0.01, "step": 370190 }, { - "epoch": 1.87, - "learning_rate": 1.9844004621337867e-05, - "loss": 0.0072, + "epoch": 0.96, + "learning_rate": 0.00015605822992837903, + "loss": 0.0124, "step": 370200 }, { - "epoch": 1.87, - "learning_rate": 1.9836436928323855e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015605434171200757, + "loss": 0.0147, "step": 370210 }, { - "epoch": 1.87, - "learning_rate": 1.9828869235309847e-05, - "loss": 0.0041, + "epoch": 0.96, + "learning_rate": 0.0001560504534956361, + "loss": 0.0128, "step": 370220 }, { - "epoch": 1.87, - "learning_rate": 1.9821301542295835e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015604656527926466, + "loss": 0.014, "step": 370230 }, { - "epoch": 1.87, - "learning_rate": 1.9813733849281823e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015604267706289317, + "loss": 0.0142, "step": 370240 }, { - "epoch": 1.87, - "learning_rate": 1.980616615626781e-05, - "loss": 0.0079, + "epoch": 0.96, + "learning_rate": 0.0001560387888465217, + "loss": 0.0151, "step": 370250 }, { - "epoch": 1.87, - "learning_rate": 1.9798598463253803e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015603490063015023, + "loss": 0.013, "step": 370260 }, { - "epoch": 1.87, - "learning_rate": 1.979103077023979e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.0001560310124137788, + "loss": 0.0136, "step": 370270 }, { - "epoch": 1.87, - "learning_rate": 1.9783463077225783e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015602712419740734, + "loss": 0.0138, "step": 370280 }, { - "epoch": 1.87, - "learning_rate": 1.977589538421177e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015602323598103585, + "loss": 0.0122, "step": 370290 }, { - "epoch": 1.87, - "learning_rate": 1.9768327691197763e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.0001560193477646644, + "loss": 0.0121, "step": 370300 }, { - "epoch": 1.87, - "learning_rate": 1.976075999818375e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015601545954829294, + "loss": 0.0105, "step": 370310 }, { - "epoch": 1.87, - "learning_rate": 1.9753192305169742e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015601157133192148, + "loss": 0.0118, "step": 370320 }, { - "epoch": 1.87, - "learning_rate": 1.974562461215573e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015600768311555, + "loss": 0.01, "step": 370330 }, { - "epoch": 1.87, - "learning_rate": 1.9738056919141722e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015600379489917853, + "loss": 0.0125, "step": 370340 }, { - "epoch": 1.87, - "learning_rate": 1.973048922612771e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015599990668280708, + "loss": 0.0124, "step": 370350 }, { - "epoch": 1.87, - "learning_rate": 1.9722921533113702e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.00015599601846643562, + "loss": 0.0186, "step": 370360 }, { - "epoch": 1.87, - "learning_rate": 1.971535384009969e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015599213025006413, + "loss": 0.0143, "step": 370370 }, { - "epoch": 1.87, - "learning_rate": 1.9707786147085682e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015598824203369267, + "loss": 0.0147, "step": 370380 }, { - "epoch": 1.87, - "learning_rate": 1.9700218454071667e-05, - "loss": 0.0077, + "epoch": 0.96, + "learning_rate": 0.00015598435381732122, + "loss": 0.0132, "step": 370390 }, { - "epoch": 1.87, - "learning_rate": 1.969265076105766e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015598046560094976, + "loss": 0.0121, "step": 370400 }, { - "epoch": 1.87, - "learning_rate": 1.9685083068043647e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015597657738457827, + "loss": 0.0148, "step": 370410 }, { - "epoch": 1.87, - "learning_rate": 1.9677515375029638e-05, - "loss": 0.0039, + "epoch": 0.96, + "learning_rate": 0.0001559726891682068, + "loss": 0.0118, "step": 370420 }, { - "epoch": 1.87, - "learning_rate": 1.9669947682015626e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015596880095183533, + "loss": 0.0116, "step": 370430 }, { - "epoch": 1.87, - "learning_rate": 1.9662379989001618e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.0001559649127354639, + "loss": 0.0141, "step": 370440 }, { - "epoch": 1.87, - "learning_rate": 1.9654812295987606e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015596102451909244, + "loss": 0.0126, "step": 370450 }, { - "epoch": 1.87, - "learning_rate": 1.9647244602973598e-05, - "loss": 0.0086, + "epoch": 0.96, + "learning_rate": 0.00015595713630272095, + "loss": 0.0165, "step": 370460 }, { - "epoch": 1.87, - "learning_rate": 1.9639676909959586e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015595324808634947, + "loss": 0.0137, "step": 370470 }, { - "epoch": 1.87, - "learning_rate": 1.9632109216945578e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015594935986997804, + "loss": 0.0163, "step": 370480 }, { - "epoch": 1.87, - "learning_rate": 1.9624541523931566e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015594547165360658, + "loss": 0.0136, "step": 370490 }, { - "epoch": 1.87, - "learning_rate": 1.9616973830917557e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.0001559415834372351, + "loss": 0.0137, "step": 370500 }, { - "epoch": 1.87, - "learning_rate": 1.9609406137903546e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015593769522086363, + "loss": 0.0135, "step": 370510 }, { - "epoch": 1.87, - "learning_rate": 1.9601838444889537e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015593380700449218, + "loss": 0.0157, "step": 370520 }, { - "epoch": 1.87, - "learning_rate": 1.9594270751875525e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015592991878812072, + "loss": 0.0127, "step": 370530 }, { - "epoch": 1.87, - "learning_rate": 1.9586703058861517e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015592603057174923, + "loss": 0.0112, "step": 370540 }, { - "epoch": 1.87, - "learning_rate": 1.9579135365847502e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015592214235537777, + "loss": 0.0131, "step": 370550 }, { - "epoch": 1.87, - "learning_rate": 1.9571567672833494e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015591825413900631, + "loss": 0.0109, "step": 370560 }, { - "epoch": 1.87, - "learning_rate": 1.9563999979819482e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015591436592263486, + "loss": 0.0155, "step": 370570 }, { - "epoch": 1.87, - "learning_rate": 1.9556432286805473e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015591047770626337, + "loss": 0.0222, "step": 370580 }, { - "epoch": 1.87, - "learning_rate": 1.954886459379146e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.0001559065894898919, + "loss": 0.0089, "step": 370590 }, { - "epoch": 1.87, - "learning_rate": 1.9541296900777453e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015590270127352048, + "loss": 0.0125, "step": 370600 }, { - "epoch": 1.87, - "learning_rate": 1.953372920776344e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.000155898813057149, + "loss": 0.0112, "step": 370610 }, { - "epoch": 1.87, - "learning_rate": 1.9526161514749433e-05, - "loss": 0.004, + "epoch": 0.96, + "learning_rate": 0.00015589492484077754, + "loss": 0.019, "step": 370620 }, { - "epoch": 1.87, - "learning_rate": 1.951859382173542e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015589103662440605, + "loss": 0.0109, "step": 370630 }, { - "epoch": 1.87, - "learning_rate": 1.9511026128721413e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015588714840803462, + "loss": 0.0174, "step": 370640 }, { - "epoch": 1.87, - "learning_rate": 1.95034584357074e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015588326019166314, + "loss": 0.0131, "step": 370650 }, { - "epoch": 1.87, - "learning_rate": 1.9495890742693393e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015587937197529168, + "loss": 0.0113, "step": 370660 }, { - "epoch": 1.87, - "learning_rate": 1.948832304967938e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.0001558754837589202, + "loss": 0.0103, "step": 370670 }, { - "epoch": 1.87, - "learning_rate": 1.9480755356665372e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015587159554254873, + "loss": 0.0134, "step": 370680 }, { - "epoch": 1.87, - "learning_rate": 1.947318766365136e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015586770732617727, + "loss": 0.0128, "step": 370690 }, { - "epoch": 1.87, - "learning_rate": 1.9465619970637352e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015586381910980582, + "loss": 0.0109, "step": 370700 }, { - "epoch": 1.87, - "learning_rate": 1.9458052277623337e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015585993089343433, + "loss": 0.0124, "step": 370710 }, { - "epoch": 1.87, - "learning_rate": 1.945048458460933e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.00015585604267706287, + "loss": 0.0112, "step": 370720 }, { - "epoch": 1.87, - "learning_rate": 1.9442916891595317e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015585215446069141, + "loss": 0.015, "step": 370730 }, { - "epoch": 1.87, - "learning_rate": 1.943534919858131e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015584826624431996, + "loss": 0.0136, "step": 370740 }, { - "epoch": 1.87, - "learning_rate": 1.9427781505567297e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015584437802794847, + "loss": 0.012, "step": 370750 }, { - "epoch": 1.87, - "learning_rate": 1.942021381255329e-05, - "loss": 0.0067, + "epoch": 0.96, + "learning_rate": 0.000155840489811577, + "loss": 0.0135, "step": 370760 }, { - "epoch": 1.87, - "learning_rate": 1.9412646119539277e-05, - "loss": 0.0039, + "epoch": 0.96, + "learning_rate": 0.00015583660159520558, + "loss": 0.0088, "step": 370770 }, { - "epoch": 1.87, - "learning_rate": 1.9405078426525268e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.0001558327133788341, + "loss": 0.0152, "step": 370780 }, { - "epoch": 1.87, - "learning_rate": 1.9397510733511256e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.0001558288251624626, + "loss": 0.0113, "step": 370790 }, { - "epoch": 1.87, - "learning_rate": 1.9389943040497248e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015582493694609115, + "loss": 0.0159, "step": 370800 }, { - "epoch": 1.87, - "learning_rate": 1.9382375347483236e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015582104872971972, + "loss": 0.012, "step": 370810 }, { - "epoch": 1.87, - "learning_rate": 1.9374807654469228e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015581716051334823, + "loss": 0.0088, "step": 370820 }, { - "epoch": 1.87, - "learning_rate": 1.9367239961455216e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015581327229697678, + "loss": 0.015, "step": 370830 }, { - "epoch": 1.87, - "learning_rate": 1.9359672268441208e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.0001558093840806053, + "loss": 0.0109, "step": 370840 }, { - "epoch": 1.87, - "learning_rate": 1.9352104575427196e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015580549586423386, + "loss": 0.0105, "step": 370850 }, { - "epoch": 1.87, - "learning_rate": 1.9344536882413188e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015580160764786237, + "loss": 0.0121, "step": 370860 }, { - "epoch": 1.87, - "learning_rate": 1.9336969189399172e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015579771943149092, + "loss": 0.0137, "step": 370870 }, { - "epoch": 1.87, - "learning_rate": 1.932940149638516e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.00015579383121511943, + "loss": 0.0118, "step": 370880 }, { - "epoch": 1.87, - "learning_rate": 1.9321833803371152e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.000155789942998748, + "loss": 0.0135, "step": 370890 }, { - "epoch": 1.87, - "learning_rate": 1.931426611035714e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.0001557860547823765, + "loss": 0.0135, "step": 370900 }, { - "epoch": 1.87, - "learning_rate": 1.9306698417343132e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015578216656600506, + "loss": 0.0163, "step": 370910 }, { - "epoch": 1.87, - "learning_rate": 1.929913072432912e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015577827834963357, + "loss": 0.0118, "step": 370920 }, { - "epoch": 1.87, - "learning_rate": 1.9291563031315112e-05, - "loss": 0.0099, + "epoch": 0.96, + "learning_rate": 0.0001557743901332621, + "loss": 0.0141, "step": 370930 }, { - "epoch": 1.87, - "learning_rate": 1.92839953383011e-05, - "loss": 0.0077, + "epoch": 0.96, + "learning_rate": 0.00015577050191689068, + "loss": 0.01, "step": 370940 }, { - "epoch": 1.87, - "learning_rate": 1.927642764528709e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.0001557666137005192, + "loss": 0.0098, "step": 370950 }, { - "epoch": 1.87, - "learning_rate": 1.9268859952273083e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.0001557627254841477, + "loss": 0.0195, "step": 370960 }, { - "epoch": 1.87, - "learning_rate": 1.926129225925907e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015575883726777625, + "loss": 0.0135, "step": 370970 }, { - "epoch": 1.87, - "learning_rate": 1.9253724566245063e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015575494905140482, + "loss": 0.0137, "step": 370980 }, { - "epoch": 1.87, - "learning_rate": 1.924615687323105e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015575106083503333, + "loss": 0.0114, "step": 370990 }, { - "epoch": 1.87, - "learning_rate": 1.9238589180217043e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015574717261866188, + "loss": 0.0123, "step": 371000 }, { - "epoch": 1.87, - "eval_cer": 0.9144450256039017, - "eval_loss": 0.004348627291619778, - "eval_runtime": 116.6791, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.96, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.008374325931072235, + "eval_runtime": 107.4524, + "eval_samples_per_second": 18.613, + "eval_steps_per_second": 4.653, "step": 371000 }, { - "epoch": 1.87, - "learning_rate": 1.923102148720303e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.0001557432844022904, + "loss": 0.0131, "step": 371010 }, { - "epoch": 1.87, - "learning_rate": 1.9223453794189016e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015573939618591896, + "loss": 0.0143, "step": 371020 }, { - "epoch": 1.87, - "learning_rate": 1.9215886101175008e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015573550796954747, + "loss": 0.0111, "step": 371030 }, { - "epoch": 1.87, - "learning_rate": 1.9208318408160996e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015573161975317601, + "loss": 0.0133, "step": 371040 }, { - "epoch": 1.87, - "learning_rate": 1.9200750715146987e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015572773153680453, + "loss": 0.0104, "step": 371050 }, { - "epoch": 1.87, - "learning_rate": 1.9193183022132976e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.0001557238433204331, + "loss": 0.0139, "step": 371060 }, { - "epoch": 1.87, - "learning_rate": 1.9185615329118967e-05, - "loss": 0.0032, + "epoch": 0.96, + "learning_rate": 0.0001557199551040616, + "loss": 0.0118, "step": 371070 }, { - "epoch": 1.87, - "learning_rate": 1.9178047636104955e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015571606688769015, + "loss": 0.009, "step": 371080 }, { - "epoch": 1.87, - "learning_rate": 1.9170479943090947e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015571217867131867, + "loss": 0.0123, "step": 371090 }, { - "epoch": 1.87, - "learning_rate": 1.9162912250076935e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015570829045494724, + "loss": 0.0111, "step": 371100 }, { - "epoch": 1.87, - "learning_rate": 1.9155344557062927e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015570440223857575, + "loss": 0.0137, "step": 371110 }, { - "epoch": 1.87, - "learning_rate": 1.9147776864048915e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001557005140222043, + "loss": 0.0112, "step": 371120 }, { - "epoch": 1.87, - "learning_rate": 1.9140209171034907e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.0001556966258058328, + "loss": 0.0116, "step": 371130 }, { - "epoch": 1.87, - "learning_rate": 1.9132641478020895e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015569273758946138, + "loss": 0.0115, "step": 371140 }, { - "epoch": 1.87, - "learning_rate": 1.9125073785006887e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015568884937308992, + "loss": 0.012, "step": 371150 }, { - "epoch": 1.87, - "learning_rate": 1.9117506091992875e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015568496115671843, + "loss": 0.011, "step": 371160 }, { - "epoch": 1.87, - "learning_rate": 1.9109938398978866e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015568107294034697, + "loss": 0.0147, "step": 371170 }, { - "epoch": 1.87, - "learning_rate": 1.910237070596485e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.0001556771847239755, + "loss": 0.0117, "step": 371180 }, { - "epoch": 1.87, - "learning_rate": 1.9094803012950843e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.00015567329650760406, + "loss": 0.0126, "step": 371190 }, { - "epoch": 1.87, - "learning_rate": 1.908723531993683e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.00015566940829123257, + "loss": 0.0131, "step": 371200 }, { - "epoch": 1.87, - "learning_rate": 1.9079667626922823e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.00015566552007486111, + "loss": 0.0119, "step": 371210 }, { - "epoch": 1.87, - "learning_rate": 1.907209993390881e-05, - "loss": 0.0048, + "epoch": 0.96, + "learning_rate": 0.00015566163185848963, + "loss": 0.014, "step": 371220 }, { - "epoch": 1.87, - "learning_rate": 1.9064532240894802e-05, - "loss": 0.0073, + "epoch": 0.96, + "learning_rate": 0.0001556577436421182, + "loss": 0.013, "step": 371230 }, { - "epoch": 1.87, - "learning_rate": 1.905696454788079e-05, - "loss": 0.0074, + "epoch": 0.96, + "learning_rate": 0.0001556538554257467, + "loss": 0.0109, "step": 371240 }, { - "epoch": 1.87, - "learning_rate": 1.9049396854866782e-05, - "loss": 0.0087, + "epoch": 0.96, + "learning_rate": 0.00015564996720937525, + "loss": 0.0112, "step": 371250 }, { - "epoch": 1.87, - "learning_rate": 1.904182916185277e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015564607899300377, + "loss": 0.0114, "step": 371260 }, { - "epoch": 1.87, - "learning_rate": 1.9034261468838762e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.00015564219077663234, + "loss": 0.0133, "step": 371270 }, { - "epoch": 1.87, - "learning_rate": 1.902669377582475e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015563830256026085, + "loss": 0.0137, "step": 371280 }, { - "epoch": 1.87, - "learning_rate": 1.9019126082810742e-05, - "loss": 0.0033, + "epoch": 0.96, + "learning_rate": 0.0001556344143438894, + "loss": 0.0126, "step": 371290 }, { - "epoch": 1.87, - "learning_rate": 1.901155838979673e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.0001556305261275179, + "loss": 0.0149, "step": 371300 }, { - "epoch": 1.87, - "learning_rate": 1.9003990696782722e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.00015562663791114648, + "loss": 0.012, "step": 371310 }, { - "epoch": 1.87, - "learning_rate": 1.899642300376871e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015562274969477502, + "loss": 0.0111, "step": 371320 }, { - "epoch": 1.87, - "learning_rate": 1.89888553107547e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015561886147840353, + "loss": 0.0093, "step": 371330 }, { - "epoch": 1.87, - "learning_rate": 1.8981287617740686e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015561497326203207, + "loss": 0.0108, "step": 371340 }, { - "epoch": 1.87, - "learning_rate": 1.8973719924726678e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015561108504566062, + "loss": 0.0114, "step": 371350 }, { - "epoch": 1.87, - "learning_rate": 1.8966152231712666e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015560719682928916, + "loss": 0.0153, "step": 371360 }, { - "epoch": 1.87, - "learning_rate": 1.8958584538698658e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015560330861291767, + "loss": 0.0117, "step": 371370 }, { - "epoch": 1.87, - "learning_rate": 1.8951016845684646e-05, - "loss": 0.0064, + "epoch": 0.96, + "learning_rate": 0.00015559942039654621, + "loss": 0.0105, "step": 371380 }, { - "epoch": 1.87, - "learning_rate": 1.8943449152670638e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015559553218017476, + "loss": 0.0112, "step": 371390 }, { - "epoch": 1.87, - "learning_rate": 1.8935881459656626e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.0001555916439638033, + "loss": 0.0185, "step": 371400 }, { - "epoch": 1.87, - "learning_rate": 1.8928313766642617e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.0001555877557474318, + "loss": 0.0159, "step": 371410 }, { - "epoch": 1.87, - "learning_rate": 1.8920746073628606e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015558386753106035, + "loss": 0.0163, "step": 371420 }, { - "epoch": 1.87, - "learning_rate": 1.8913178380614597e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015557997931468887, + "loss": 0.0114, "step": 371430 }, { - "epoch": 1.87, - "learning_rate": 1.8905610687600586e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015557609109831744, + "loss": 0.0111, "step": 371440 }, { - "epoch": 1.87, - "learning_rate": 1.8898042994586577e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.00015557220288194595, + "loss": 0.0092, "step": 371450 }, { - "epoch": 1.87, - "learning_rate": 1.8890475301572565e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.0001555683146655745, + "loss": 0.0092, "step": 371460 }, { - "epoch": 1.87, - "learning_rate": 1.8882907608558557e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.000155564426449203, + "loss": 0.0127, "step": 371470 }, { - "epoch": 1.87, - "learning_rate": 1.8875339915544545e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015556053823283158, + "loss": 0.0191, "step": 371480 }, { - "epoch": 1.87, - "learning_rate": 1.8867772222530533e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015555665001646012, + "loss": 0.0147, "step": 371490 }, { - "epoch": 1.87, - "learning_rate": 1.886020452951652e-05, - "loss": 0.0094, + "epoch": 0.96, + "learning_rate": 0.00015555276180008863, + "loss": 0.0108, "step": 371500 }, { - "epoch": 1.87, - "learning_rate": 1.8852636836502513e-05, - "loss": 0.0107, + "epoch": 0.96, + "learning_rate": 0.00015554887358371715, + "loss": 0.0105, "step": 371510 }, { - "epoch": 1.87, - "learning_rate": 1.88450691434885e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015554498536734572, + "loss": 0.0124, "step": 371520 }, { - "epoch": 1.87, - "learning_rate": 1.8837501450474493e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015554109715097426, + "loss": 0.0117, "step": 371530 }, { - "epoch": 1.87, - "learning_rate": 1.882993375746048e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.00015553720893460277, + "loss": 0.0121, "step": 371540 }, { - "epoch": 1.87, - "learning_rate": 1.8822366064446473e-05, - "loss": 0.0079, + "epoch": 0.96, + "learning_rate": 0.0001555333207182313, + "loss": 0.0124, "step": 371550 }, { - "epoch": 1.87, - "learning_rate": 1.881479837143246e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015552943250185985, + "loss": 0.0102, "step": 371560 }, { - "epoch": 1.87, - "learning_rate": 1.8807230678418453e-05, - "loss": 0.0041, + "epoch": 0.96, + "learning_rate": 0.0001555255442854884, + "loss": 0.0099, "step": 371570 }, { - "epoch": 1.87, - "learning_rate": 1.879966298540444e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.0001555216560691169, + "loss": 0.0121, "step": 371580 }, { - "epoch": 1.87, - "learning_rate": 1.8792095292390433e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015551776785274545, + "loss": 0.017, "step": 371590 }, { - "epoch": 1.87, - "learning_rate": 1.878452759937642e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.000155513879636374, + "loss": 0.0101, "step": 371600 }, { - "epoch": 1.87, - "learning_rate": 1.8776959906362412e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015550999142000254, + "loss": 0.013, "step": 371610 }, { - "epoch": 1.87, - "learning_rate": 1.87693922133484e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015550610320363105, + "loss": 0.0121, "step": 371620 }, { - "epoch": 1.87, - "learning_rate": 1.8761824520334392e-05, - "loss": 0.0049, + "epoch": 0.96, + "learning_rate": 0.0001555022149872596, + "loss": 0.0134, "step": 371630 }, { - "epoch": 1.87, - "learning_rate": 1.875425682732038e-05, - "loss": 0.0071, + "epoch": 0.96, + "learning_rate": 0.00015549832677088816, + "loss": 0.0094, "step": 371640 }, { - "epoch": 1.88, - "learning_rate": 1.874668913430637e-05, - "loss": 0.0051, + "epoch": 0.96, + "learning_rate": 0.00015549443855451668, + "loss": 0.0104, "step": 371650 }, { - "epoch": 1.88, - "learning_rate": 1.873912144129236e-05, - "loss": 0.004, + "epoch": 0.96, + "learning_rate": 0.0001554905503381452, + "loss": 0.0133, "step": 371660 }, { - "epoch": 1.88, - "learning_rate": 1.873155374827835e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015548666212177373, + "loss": 0.0118, "step": 371670 }, { - "epoch": 1.88, - "learning_rate": 1.872398605526434e-05, - "loss": 0.0059, + "epoch": 0.96, + "learning_rate": 0.00015548277390540225, + "loss": 0.0117, "step": 371680 }, { - "epoch": 1.88, - "learning_rate": 1.8716418362250328e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015547888568903081, + "loss": 0.009, "step": 371690 }, { - "epoch": 1.88, - "learning_rate": 1.8708850669236316e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015547499747265936, + "loss": 0.0106, "step": 371700 }, { - "epoch": 1.88, - "learning_rate": 1.8701282976222308e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015547110925628787, + "loss": 0.0104, "step": 371710 }, { - "epoch": 1.88, - "learning_rate": 1.8693715283208296e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001554672210399164, + "loss": 0.0135, "step": 371720 }, { - "epoch": 1.88, - "learning_rate": 1.8686147590194288e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015546333282354495, + "loss": 0.0126, "step": 371730 }, { - "epoch": 1.88, - "learning_rate": 1.8678579897180276e-05, - "loss": 0.0061, + "epoch": 0.96, + "learning_rate": 0.0001554594446071735, + "loss": 0.0108, "step": 371740 }, { - "epoch": 1.88, - "learning_rate": 1.8671012204166268e-05, - "loss": 0.0054, + "epoch": 0.96, + "learning_rate": 0.000155455556390802, + "loss": 0.0111, "step": 371750 }, { - "epoch": 1.88, - "learning_rate": 1.8663444511152256e-05, - "loss": 0.0063, + "epoch": 0.96, + "learning_rate": 0.00015545166817443055, + "loss": 0.0108, "step": 371760 }, { - "epoch": 1.88, - "learning_rate": 1.8655876818138244e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.0001554477799580591, + "loss": 0.0169, "step": 371770 }, { - "epoch": 1.88, - "learning_rate": 1.8648309125124232e-05, - "loss": 0.009, + "epoch": 0.96, + "learning_rate": 0.00015544389174168764, + "loss": 0.0128, "step": 371780 }, { - "epoch": 1.88, - "learning_rate": 1.8640741432110224e-05, - "loss": 0.0083, + "epoch": 0.96, + "learning_rate": 0.00015544000352531615, + "loss": 0.0123, "step": 371790 }, { - "epoch": 1.88, - "learning_rate": 1.8633173739096216e-05, - "loss": 0.0165, + "epoch": 0.96, + "learning_rate": 0.0001554361153089447, + "loss": 0.0141, "step": 371800 }, { - "epoch": 1.88, - "learning_rate": 1.8625606046082204e-05, - "loss": 0.004, + "epoch": 0.96, + "learning_rate": 0.00015543222709257326, + "loss": 0.0115, "step": 371810 }, { - "epoch": 1.88, - "learning_rate": 1.8618038353068195e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015542833887620177, + "loss": 0.0115, "step": 371820 }, { - "epoch": 1.88, - "learning_rate": 1.8610470660054184e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.0001554244506598303, + "loss": 0.0102, "step": 371830 }, { - "epoch": 1.88, - "learning_rate": 1.8602902967040175e-05, - "loss": 0.0069, + "epoch": 0.96, + "learning_rate": 0.00015542056244345883, + "loss": 0.0122, "step": 371840 }, { - "epoch": 1.88, - "learning_rate": 1.859533527402616e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.0001554166742270874, + "loss": 0.0125, "step": 371850 }, { - "epoch": 1.88, - "learning_rate": 1.8587767581012152e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015541278601071591, + "loss": 0.0121, "step": 371860 }, { - "epoch": 1.88, - "learning_rate": 1.858019988799814e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.00015540889779434446, + "loss": 0.0137, "step": 371870 }, { - "epoch": 1.88, - "learning_rate": 1.857263219498413e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.00015540500957797297, + "loss": 0.0142, "step": 371880 }, { - "epoch": 1.88, - "learning_rate": 1.856506450197012e-05, - "loss": 0.0041, + "epoch": 0.96, + "learning_rate": 0.00015540112136160154, + "loss": 0.0121, "step": 371890 }, { - "epoch": 1.88, - "learning_rate": 1.855749680895611e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015539723314523005, + "loss": 0.0119, "step": 371900 }, { - "epoch": 1.88, - "learning_rate": 1.85499291159421e-05, - "loss": 0.0091, + "epoch": 0.96, + "learning_rate": 0.0001553933449288586, + "loss": 0.0118, "step": 371910 }, { - "epoch": 1.88, - "learning_rate": 1.854236142292809e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.0001553894567124871, + "loss": 0.0097, "step": 371920 }, { - "epoch": 1.88, - "learning_rate": 1.853479372991408e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015538556849611565, + "loss": 0.0102, "step": 371930 }, { - "epoch": 1.88, - "learning_rate": 1.8527226036900068e-05, - "loss": 0.007, + "epoch": 0.96, + "learning_rate": 0.0001553816802797442, + "loss": 0.0122, "step": 371940 }, { - "epoch": 1.88, - "learning_rate": 1.851965834388606e-05, - "loss": 0.0053, + "epoch": 0.96, + "learning_rate": 0.00015537779206337273, + "loss": 0.0124, "step": 371950 }, { - "epoch": 1.88, - "learning_rate": 1.8512090650872047e-05, - "loss": 0.0066, + "epoch": 0.96, + "learning_rate": 0.00015537390384700125, + "loss": 0.0101, "step": 371960 }, { - "epoch": 1.88, - "learning_rate": 1.850452295785804e-05, - "loss": 0.0068, + "epoch": 0.96, + "learning_rate": 0.0001553700156306298, + "loss": 0.0119, "step": 371970 }, { - "epoch": 1.88, - "learning_rate": 1.8496955264844027e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.00015536612741425833, + "loss": 0.0113, "step": 371980 }, { - "epoch": 1.88, - "learning_rate": 1.848938757183002e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015536223919788687, + "loss": 0.0101, "step": 371990 }, { - "epoch": 1.88, - "learning_rate": 1.8481819878816007e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.0001553583509815154, + "loss": 0.0149, "step": 372000 }, { - "epoch": 1.88, - "eval_cer": 0.914423676889143, - "eval_loss": 0.004319104366004467, - "eval_runtime": 116.6762, - "eval_samples_per_second": 17.141, - "eval_steps_per_second": 4.285, + "epoch": 0.96, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.008426784537732601, + "eval_runtime": 107.8013, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, "step": 372000 }, { - "epoch": 1.88, - "learning_rate": 1.8474252185801995e-05, - "loss": 0.0082, + "epoch": 0.96, + "learning_rate": 0.00015535446276514393, + "loss": 0.0121, "step": 372010 }, { - "epoch": 1.88, - "learning_rate": 1.8466684492787987e-05, - "loss": 0.0047, + "epoch": 0.96, + "learning_rate": 0.0001553505745487725, + "loss": 0.013, "step": 372020 }, { - "epoch": 1.88, - "learning_rate": 1.8459116799773975e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.00015534668633240101, + "loss": 0.0123, "step": 372030 }, { - "epoch": 1.88, - "learning_rate": 1.8451549106759967e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015534279811602956, + "loss": 0.0123, "step": 372040 }, { - "epoch": 1.88, - "learning_rate": 1.8443981413745955e-05, - "loss": 0.005, + "epoch": 0.96, + "learning_rate": 0.00015533890989965807, + "loss": 0.0132, "step": 372050 }, { - "epoch": 1.88, - "learning_rate": 1.8436413720731947e-05, - "loss": 0.0072, + "epoch": 0.96, + "learning_rate": 0.00015533502168328664, + "loss": 0.0104, "step": 372060 }, { - "epoch": 1.88, - "learning_rate": 1.8428846027717935e-05, - "loss": 0.0044, + "epoch": 0.96, + "learning_rate": 0.00015533113346691515, + "loss": 0.0121, "step": 372070 }, { - "epoch": 1.88, - "learning_rate": 1.8421278334703923e-05, - "loss": 0.0104, + "epoch": 0.96, + "learning_rate": 0.0001553272452505437, + "loss": 0.0129, "step": 372080 }, { - "epoch": 1.88, - "learning_rate": 1.8413710641689915e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.0001553233570341722, + "loss": 0.0188, "step": 372090 }, { - "epoch": 1.88, - "learning_rate": 1.8406142948675903e-05, - "loss": 0.0161, + "epoch": 0.96, + "learning_rate": 0.00015531946881780078, + "loss": 0.0122, "step": 372100 }, { - "epoch": 1.88, - "learning_rate": 1.8398575255661894e-05, - "loss": 0.0056, + "epoch": 0.96, + "learning_rate": 0.0001553155806014293, + "loss": 0.0147, "step": 372110 }, { - "epoch": 1.88, - "learning_rate": 1.8391007562647883e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.00015531169238505783, + "loss": 0.0094, "step": 372120 }, { - "epoch": 1.88, - "learning_rate": 1.8383439869633874e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.00015530780416868635, + "loss": 0.0135, "step": 372130 }, { - "epoch": 1.88, - "learning_rate": 1.8375872176619862e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015530391595231492, + "loss": 0.015, "step": 372140 }, { - "epoch": 1.88, - "learning_rate": 1.8368304483605854e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015530002773594343, + "loss": 0.0149, "step": 372150 }, { - "epoch": 1.88, - "learning_rate": 1.8360736790591842e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015529613951957197, + "loss": 0.0103, "step": 372160 }, { - "epoch": 1.88, - "learning_rate": 1.835316909757783e-05, - "loss": 0.0046, + "epoch": 0.96, + "learning_rate": 0.0001552922513032005, + "loss": 0.0164, "step": 372170 }, { - "epoch": 1.88, - "learning_rate": 1.8345601404563822e-05, - "loss": 0.006, + "epoch": 0.96, + "learning_rate": 0.00015528836308682903, + "loss": 0.0117, "step": 372180 }, { - "epoch": 1.88, - "learning_rate": 1.833803371154981e-05, - "loss": 0.0073, + "epoch": 0.96, + "learning_rate": 0.0001552844748704576, + "loss": 0.0114, "step": 372190 }, { - "epoch": 1.88, - "learning_rate": 1.8330466018535802e-05, - "loss": 0.0065, + "epoch": 0.96, + "learning_rate": 0.0001552805866540861, + "loss": 0.0126, "step": 372200 }, { - "epoch": 1.88, - "learning_rate": 1.832289832552179e-05, - "loss": 0.0045, + "epoch": 0.96, + "learning_rate": 0.00015527669843771465, + "loss": 0.0109, "step": 372210 }, { - "epoch": 1.88, - "learning_rate": 1.8315330632507782e-05, - "loss": 0.0055, + "epoch": 0.96, + "learning_rate": 0.00015527281022134317, + "loss": 0.0091, "step": 372220 }, { - "epoch": 1.88, - "learning_rate": 1.830776293949377e-05, - "loss": 0.0057, + "epoch": 0.96, + "learning_rate": 0.00015526892200497174, + "loss": 0.0144, "step": 372230 }, { - "epoch": 1.88, - "learning_rate": 1.8300195246479758e-05, - "loss": 0.0072, + "epoch": 0.96, + "learning_rate": 0.00015526503378860025, + "loss": 0.0109, "step": 372240 }, { - "epoch": 1.88, - "learning_rate": 1.829262755346575e-05, - "loss": 0.0058, + "epoch": 0.96, + "learning_rate": 0.0001552611455722288, + "loss": 0.0176, "step": 372250 }, { - "epoch": 1.88, - "learning_rate": 1.8285059860451738e-05, - "loss": 0.0052, + "epoch": 0.96, + "learning_rate": 0.0001552572573558573, + "loss": 0.0149, "step": 372260 }, { - "epoch": 1.88, - "learning_rate": 1.827749216743773e-05, - "loss": 0.0062, + "epoch": 0.96, + "learning_rate": 0.00015525336913948588, + "loss": 0.0098, "step": 372270 }, { - "epoch": 1.88, - "learning_rate": 1.8269924474423718e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.0001552494809231144, + "loss": 0.0143, "step": 372280 }, { - "epoch": 1.88, - "learning_rate": 1.826235678140971e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015524559270674293, + "loss": 0.0132, "step": 372290 }, { - "epoch": 1.88, - "learning_rate": 1.8254789088395698e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015524170449037145, + "loss": 0.0114, "step": 372300 }, { - "epoch": 1.88, - "learning_rate": 1.824722139538169e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015523781627400002, + "loss": 0.0099, "step": 372310 }, { - "epoch": 1.88, - "learning_rate": 1.8239653702367678e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015523392805762853, + "loss": 0.0128, "step": 372320 }, { - "epoch": 1.88, - "learning_rate": 1.8232086009353666e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.00015523003984125707, + "loss": 0.0148, "step": 372330 }, { - "epoch": 1.88, - "learning_rate": 1.8224518316339657e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.0001552261516248856, + "loss": 0.0115, "step": 372340 }, { - "epoch": 1.88, - "learning_rate": 1.8216950623325646e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015522226340851416, + "loss": 0.0149, "step": 372350 }, { - "epoch": 1.88, - "learning_rate": 1.8209382930311637e-05, - "loss": 0.0089, + "epoch": 0.97, + "learning_rate": 0.0001552183751921427, + "loss": 0.0117, "step": 372360 }, { - "epoch": 1.88, - "learning_rate": 1.8201815237297625e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001552144869757712, + "loss": 0.0106, "step": 372370 }, { - "epoch": 1.88, - "learning_rate": 1.8194247544283617e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015521059875939973, + "loss": 0.0119, "step": 372380 }, { - "epoch": 1.88, - "learning_rate": 1.8186679851269605e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.0001552067105430283, + "loss": 0.0129, "step": 372390 }, { - "epoch": 1.88, - "learning_rate": 1.8179112158255593e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.00015520282232665684, + "loss": 0.0125, "step": 372400 }, { - "epoch": 1.88, - "learning_rate": 1.8171544465241585e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.00015519893411028535, + "loss": 0.013, "step": 372410 }, { - "epoch": 1.88, - "learning_rate": 1.8163976772227573e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.0001551950458939139, + "loss": 0.0112, "step": 372420 }, { - "epoch": 1.88, - "learning_rate": 1.8156409079213565e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.0001551911576775424, + "loss": 0.0143, "step": 372430 }, { - "epoch": 1.88, - "learning_rate": 1.8148841386199553e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015518726946117098, + "loss": 0.0122, "step": 372440 }, { - "epoch": 1.88, - "learning_rate": 1.8141273693185545e-05, - "loss": 0.0075, + "epoch": 0.97, + "learning_rate": 0.0001551833812447995, + "loss": 0.0163, "step": 372450 }, { - "epoch": 1.88, - "learning_rate": 1.8133706000171533e-05, - "loss": 0.0039, + "epoch": 0.97, + "learning_rate": 0.00015517949302842803, + "loss": 0.0164, "step": 372460 }, { - "epoch": 1.88, - "learning_rate": 1.8126138307157525e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.00015517560481205655, + "loss": 0.0123, "step": 372470 }, { - "epoch": 1.88, - "learning_rate": 1.8118570614143513e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.00015517171659568512, + "loss": 0.0201, "step": 372480 }, { - "epoch": 1.88, - "learning_rate": 1.81110029211295e-05, - "loss": 0.0045, + "epoch": 0.97, + "learning_rate": 0.00015516782837931363, + "loss": 0.0112, "step": 372490 }, { - "epoch": 1.88, - "learning_rate": 1.8103435228115493e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015516394016294217, + "loss": 0.0115, "step": 372500 }, { - "epoch": 1.88, - "learning_rate": 1.809586753510148e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.0001551600519465707, + "loss": 0.0132, "step": 372510 }, { - "epoch": 1.88, - "learning_rate": 1.8088299842087472e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015515616373019926, + "loss": 0.0164, "step": 372520 }, { - "epoch": 1.88, - "learning_rate": 1.808073214907346e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.0001551522755138278, + "loss": 0.0155, "step": 372530 }, { - "epoch": 1.88, - "learning_rate": 1.8073164456059452e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.0001551483872974563, + "loss": 0.0113, "step": 372540 }, { - "epoch": 1.88, - "learning_rate": 1.806559676304544e-05, - "loss": 0.0078, + "epoch": 0.97, + "learning_rate": 0.00015514449908108483, + "loss": 0.0156, "step": 372550 }, { - "epoch": 1.88, - "learning_rate": 1.805802907003143e-05, - "loss": 0.0081, + "epoch": 0.97, + "learning_rate": 0.0001551406108647134, + "loss": 0.0124, "step": 372560 }, { - "epoch": 1.88, - "learning_rate": 1.805046137701742e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015513672264834194, + "loss": 0.0134, "step": 372570 }, { - "epoch": 1.88, - "learning_rate": 1.804289368400341e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015513283443197045, + "loss": 0.011, "step": 372580 }, { - "epoch": 1.88, - "learning_rate": 1.80353259909894e-05, - "loss": 0.0039, + "epoch": 0.97, + "learning_rate": 0.000155128946215599, + "loss": 0.0116, "step": 372590 }, { - "epoch": 1.88, - "learning_rate": 1.802775829797539e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015512505799922753, + "loss": 0.0124, "step": 372600 }, { - "epoch": 1.88, - "learning_rate": 1.802019060496138e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015512116978285608, + "loss": 0.0139, "step": 372610 }, { - "epoch": 1.88, - "learning_rate": 1.8012622911947368e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001551172815664846, + "loss": 0.0144, "step": 372620 }, { - "epoch": 1.88, - "learning_rate": 1.8005055218933356e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.00015511339335011313, + "loss": 0.0111, "step": 372630 }, { - "epoch": 1.88, - "learning_rate": 1.7997487525919348e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.00015510950513374167, + "loss": 0.0107, "step": 372640 }, { - "epoch": 1.88, - "learning_rate": 1.7989919832905336e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015510561691737022, + "loss": 0.013, "step": 372650 }, { - "epoch": 1.88, - "learning_rate": 1.7982352139891328e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.00015510172870099873, + "loss": 0.01, "step": 372660 }, { - "epoch": 1.88, - "learning_rate": 1.7974784446877316e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015509784048462727, + "loss": 0.0097, "step": 372670 }, { - "epoch": 1.88, - "learning_rate": 1.7967216753863308e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.0001550939522682558, + "loss": 0.0112, "step": 372680 }, { - "epoch": 1.88, - "learning_rate": 1.7959649060849296e-05, - "loss": 0.0037, + "epoch": 0.97, + "learning_rate": 0.00015509006405188436, + "loss": 0.0158, "step": 372690 }, { - "epoch": 1.88, - "learning_rate": 1.7952081367835287e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015508617583551287, + "loss": 0.0109, "step": 372700 }, { - "epoch": 1.88, - "learning_rate": 1.7944513674821272e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.0001550822876191414, + "loss": 0.0121, "step": 372710 }, { - "epoch": 1.88, - "learning_rate": 1.7936945981807264e-05, - "loss": 0.0043, + "epoch": 0.97, + "learning_rate": 0.00015507839940276993, + "loss": 0.011, "step": 372720 }, { - "epoch": 1.88, - "learning_rate": 1.7929378288793252e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.0001550745111863985, + "loss": 0.0135, "step": 372730 }, { - "epoch": 1.88, - "learning_rate": 1.7921810595779244e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.00015507062297002704, + "loss": 0.012, "step": 372740 }, { - "epoch": 1.88, - "learning_rate": 1.7914242902765232e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015506673475365555, + "loss": 0.0118, "step": 372750 }, { - "epoch": 1.88, - "learning_rate": 1.7906675209751224e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.0001550628465372841, + "loss": 0.0151, "step": 372760 }, { - "epoch": 1.88, - "learning_rate": 1.7899107516737215e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015505895832091263, + "loss": 0.0128, "step": 372770 }, { - "epoch": 1.88, - "learning_rate": 1.7891539823723203e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015505507010454118, + "loss": 0.0126, "step": 372780 }, { - "epoch": 1.88, - "learning_rate": 1.788397213070919e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.0001550511818881697, + "loss": 0.013, "step": 372790 }, { - "epoch": 1.88, - "learning_rate": 1.787640443769518e-05, - "loss": 0.0042, + "epoch": 0.97, + "learning_rate": 0.00015504729367179823, + "loss": 0.0117, "step": 372800 }, { - "epoch": 1.88, - "learning_rate": 1.786883674468117e-05, - "loss": 0.0075, + "epoch": 0.97, + "learning_rate": 0.00015504340545542677, + "loss": 0.0136, "step": 372810 }, { - "epoch": 1.88, - "learning_rate": 1.786126905166716e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.00015503951723905532, + "loss": 0.0126, "step": 372820 }, { - "epoch": 1.88, - "learning_rate": 1.785370135865315e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.00015503562902268383, + "loss": 0.0097, "step": 372830 }, { - "epoch": 1.88, - "learning_rate": 1.784613366563914e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015503174080631237, + "loss": 0.0134, "step": 372840 }, { - "epoch": 1.88, - "learning_rate": 1.783856597262513e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.0001550278525899409, + "loss": 0.0243, "step": 372850 }, { - "epoch": 1.88, - "learning_rate": 1.783099827961112e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015502396437356945, + "loss": 0.0162, "step": 372860 }, { - "epoch": 1.88, - "learning_rate": 1.7823430586597108e-05, - "loss": 0.0045, + "epoch": 0.97, + "learning_rate": 0.00015502007615719797, + "loss": 0.0105, "step": 372870 }, { - "epoch": 1.88, - "learning_rate": 1.78158628935831e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.0001550161879408265, + "loss": 0.012, "step": 372880 }, { - "epoch": 1.88, - "learning_rate": 1.7808295200569087e-05, - "loss": 0.0073, + "epoch": 0.97, + "learning_rate": 0.00015501229972445508, + "loss": 0.0103, "step": 372890 }, { - "epoch": 1.88, - "learning_rate": 1.780072750755508e-05, - "loss": 0.0043, + "epoch": 0.97, + "learning_rate": 0.0001550084115080836, + "loss": 0.0131, "step": 372900 }, { - "epoch": 1.88, - "learning_rate": 1.7793159814541067e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015500452329171214, + "loss": 0.0152, "step": 372910 }, { - "epoch": 1.88, - "learning_rate": 1.778559212152706e-05, - "loss": 0.0074, + "epoch": 0.97, + "learning_rate": 0.00015500063507534065, + "loss": 0.0154, "step": 372920 }, { - "epoch": 1.88, - "learning_rate": 1.7778024428513047e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.0001549967468589692, + "loss": 0.012, "step": 372930 }, { - "epoch": 1.88, - "learning_rate": 1.777045673549904e-05, - "loss": 0.0078, + "epoch": 0.97, + "learning_rate": 0.00015499285864259773, + "loss": 0.0127, "step": 372940 }, { - "epoch": 1.88, - "learning_rate": 1.7762889042485027e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015498897042622628, + "loss": 0.0118, "step": 372950 }, { - "epoch": 1.88, - "learning_rate": 1.7755321349471015e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.0001549850822098548, + "loss": 0.0107, "step": 372960 }, { - "epoch": 1.88, - "learning_rate": 1.7747753656457007e-05, - "loss": 0.0078, + "epoch": 0.97, + "learning_rate": 0.00015498119399348333, + "loss": 0.0119, "step": 372970 }, { - "epoch": 1.88, - "learning_rate": 1.7740185963442995e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015497730577711187, + "loss": 0.0118, "step": 372980 }, { - "epoch": 1.88, - "learning_rate": 1.7732618270428986e-05, - "loss": 0.0034, + "epoch": 0.97, + "learning_rate": 0.00015497341756074041, + "loss": 0.0132, "step": 372990 }, { - "epoch": 1.88, - "learning_rate": 1.7725050577414975e-05, - "loss": 0.0082, + "epoch": 0.97, + "learning_rate": 0.00015496952934436893, + "loss": 0.0096, "step": 373000 }, { - "epoch": 1.88, - "eval_cer": 0.9144353216426477, - "eval_loss": 0.00432598264887929, - "eval_runtime": 116.7735, - "eval_samples_per_second": 17.127, - "eval_steps_per_second": 4.282, + "epoch": 0.97, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.00843864493072033, + "eval_runtime": 107.4926, + "eval_samples_per_second": 18.606, + "eval_steps_per_second": 4.651, "step": 373000 }, { - "epoch": 1.88, - "learning_rate": 1.7717482884400966e-05, - "loss": 0.009, + "epoch": 0.97, + "learning_rate": 0.00015496564112799747, + "loss": 0.0131, "step": 373010 }, { - "epoch": 1.88, - "learning_rate": 1.7709915191386954e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.000154961752911626, + "loss": 0.0161, "step": 373020 }, { - "epoch": 1.88, - "learning_rate": 1.7702347498372943e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015495786469525455, + "loss": 0.0118, "step": 373030 }, { - "epoch": 1.88, - "learning_rate": 1.7694779805358934e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015495397647888307, + "loss": 0.0147, "step": 373040 }, { - "epoch": 1.88, - "learning_rate": 1.7687212112344923e-05, - "loss": 0.01, + "epoch": 0.97, + "learning_rate": 0.0001549500882625116, + "loss": 0.0164, "step": 373050 }, { - "epoch": 1.88, - "learning_rate": 1.7679644419330914e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015494620004614018, + "loss": 0.0155, "step": 373060 }, { - "epoch": 1.88, - "learning_rate": 1.7672076726316902e-05, - "loss": 0.0077, + "epoch": 0.97, + "learning_rate": 0.0001549423118297687, + "loss": 0.0131, "step": 373070 }, { - "epoch": 1.88, - "learning_rate": 1.7664509033302894e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015493842361339724, + "loss": 0.0121, "step": 373080 }, { - "epoch": 1.88, - "learning_rate": 1.7656941340288882e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015493453539702575, + "loss": 0.0155, "step": 373090 }, { - "epoch": 1.88, - "learning_rate": 1.764937364727487e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015493064718065432, + "loss": 0.0112, "step": 373100 }, { - "epoch": 1.88, - "learning_rate": 1.7641805954260862e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015492675896428283, + "loss": 0.0123, "step": 373110 }, { - "epoch": 1.88, - "learning_rate": 1.763423826124685e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015492287074791137, + "loss": 0.0128, "step": 373120 }, { - "epoch": 1.88, - "learning_rate": 1.7626670568232842e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001549189825315399, + "loss": 0.0091, "step": 373130 }, { - "epoch": 1.88, - "learning_rate": 1.761910287521883e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.00015491509431516846, + "loss": 0.0115, "step": 373140 }, { - "epoch": 1.88, - "learning_rate": 1.761153518220482e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.00015491120609879697, + "loss": 0.0123, "step": 373150 }, { - "epoch": 1.88, - "learning_rate": 1.760396748919081e-05, - "loss": 0.0076, + "epoch": 0.97, + "learning_rate": 0.00015490731788242551, + "loss": 0.0099, "step": 373160 }, { - "epoch": 1.88, - "learning_rate": 1.75963997961768e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015490342966605403, + "loss": 0.012, "step": 373170 }, { - "epoch": 1.88, - "learning_rate": 1.758883210316279e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015489954144968257, + "loss": 0.0122, "step": 373180 }, { - "epoch": 1.88, - "learning_rate": 1.7581264410148778e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.0001548956532333111, + "loss": 0.0122, "step": 373190 }, { - "epoch": 1.88, - "learning_rate": 1.757369671713477e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015489176501693965, + "loss": 0.0132, "step": 373200 }, { - "epoch": 1.88, - "learning_rate": 1.7566129024120758e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015488787680056817, + "loss": 0.0137, "step": 373210 }, { - "epoch": 1.88, - "learning_rate": 1.755856133110675e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.0001548839885841967, + "loss": 0.0127, "step": 373220 }, { - "epoch": 1.88, - "learning_rate": 1.7550993638092738e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015488010036782528, + "loss": 0.0118, "step": 373230 }, { - "epoch": 1.88, - "learning_rate": 1.754342594507873e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.0001548762121514538, + "loss": 0.0123, "step": 373240 }, { - "epoch": 1.88, - "learning_rate": 1.7535858252064717e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001548723239350823, + "loss": 0.0101, "step": 373250 }, { - "epoch": 1.88, - "learning_rate": 1.7528290559050706e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015486843571871085, + "loss": 0.0136, "step": 373260 }, { - "epoch": 1.88, - "learning_rate": 1.7520722866036697e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015486454750233942, + "loss": 0.0115, "step": 373270 }, { - "epoch": 1.88, - "learning_rate": 1.7513155173022685e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015486065928596793, + "loss": 0.0128, "step": 373280 }, { - "epoch": 1.88, - "learning_rate": 1.7505587480008677e-05, - "loss": 0.0078, + "epoch": 0.97, + "learning_rate": 0.00015485677106959647, + "loss": 0.0151, "step": 373290 }, { - "epoch": 1.88, - "learning_rate": 1.7498019786994665e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.000154852882853225, + "loss": 0.0104, "step": 373300 }, { - "epoch": 1.88, - "learning_rate": 1.7490452093980657e-05, - "loss": 0.0074, + "epoch": 0.97, + "learning_rate": 0.00015484899463685356, + "loss": 0.0116, "step": 373310 }, { - "epoch": 1.88, - "learning_rate": 1.7482884400966645e-05, - "loss": 0.0038, + "epoch": 0.97, + "learning_rate": 0.00015484510642048207, + "loss": 0.0115, "step": 373320 }, { - "epoch": 1.88, - "learning_rate": 1.7475316707952637e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001548412182041106, + "loss": 0.0153, "step": 373330 }, { - "epoch": 1.88, - "learning_rate": 1.7467749014938625e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015483732998773913, + "loss": 0.0112, "step": 373340 }, { - "epoch": 1.88, - "learning_rate": 1.7460181321924613e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001548334417713677, + "loss": 0.0146, "step": 373350 }, { - "epoch": 1.88, - "learning_rate": 1.7452613628910605e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.0001548295535549962, + "loss": 0.0123, "step": 373360 }, { - "epoch": 1.88, - "learning_rate": 1.7445045935896593e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.00015482566533862475, + "loss": 0.0098, "step": 373370 }, { - "epoch": 1.88, - "learning_rate": 1.7437478242882585e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015482177712225327, + "loss": 0.0102, "step": 373380 }, { - "epoch": 1.88, - "learning_rate": 1.7429910549868573e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015481788890588184, + "loss": 0.0136, "step": 373390 }, { - "epoch": 1.88, - "learning_rate": 1.7422342856854564e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015481400068951038, + "loss": 0.0119, "step": 373400 }, { - "epoch": 1.88, - "learning_rate": 1.7414775163840553e-05, - "loss": 0.0069, + "epoch": 0.97, + "learning_rate": 0.0001548101124731389, + "loss": 0.009, "step": 373410 }, { - "epoch": 1.88, - "learning_rate": 1.740720747082654e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001548062242567674, + "loss": 0.0105, "step": 373420 }, { - "epoch": 1.88, - "learning_rate": 1.7399639777812532e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.00015480233604039595, + "loss": 0.0096, "step": 373430 }, { - "epoch": 1.88, - "learning_rate": 1.739207208479852e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015479844782402452, + "loss": 0.0152, "step": 373440 }, { - "epoch": 1.88, - "learning_rate": 1.7384504391784512e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015479455960765303, + "loss": 0.0124, "step": 373450 }, { - "epoch": 1.88, - "learning_rate": 1.73769366987705e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015479067139128157, + "loss": 0.0105, "step": 373460 }, { - "epoch": 1.88, - "learning_rate": 1.7369369005756492e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.0001547867831749101, + "loss": 0.01, "step": 373470 }, { - "epoch": 1.88, - "learning_rate": 1.736180131274248e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015478289495853866, + "loss": 0.0129, "step": 373480 }, { - "epoch": 1.88, - "learning_rate": 1.7354233619728472e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015477900674216717, + "loss": 0.0141, "step": 373490 }, { - "epoch": 1.88, - "learning_rate": 1.734666592671446e-05, - "loss": 0.0041, + "epoch": 0.97, + "learning_rate": 0.0001547751185257957, + "loss": 0.0122, "step": 373500 }, { - "epoch": 1.88, - "learning_rate": 1.733909823370045e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015477123030942423, + "loss": 0.0144, "step": 373510 }, { - "epoch": 1.88, - "learning_rate": 1.733153054068644e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001547673420930528, + "loss": 0.0136, "step": 373520 }, { - "epoch": 1.88, - "learning_rate": 1.7323962847672428e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.0001547634538766813, + "loss": 0.0121, "step": 373530 }, { - "epoch": 1.88, - "learning_rate": 1.731639515465842e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015475956566030985, + "loss": 0.0209, "step": 373540 }, { - "epoch": 1.88, - "learning_rate": 1.7308827461644408e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015475567744393837, + "loss": 0.0131, "step": 373550 }, { - "epoch": 1.88, - "learning_rate": 1.73012597686304e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015475178922756694, + "loss": 0.014, "step": 373560 }, { - "epoch": 1.88, - "learning_rate": 1.7293692075616388e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015474790101119545, + "loss": 0.011, "step": 373570 }, { - "epoch": 1.88, - "learning_rate": 1.7286124382602376e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.000154744012794824, + "loss": 0.0137, "step": 373580 }, { - "epoch": 1.88, - "learning_rate": 1.7278556689588364e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001547401245784525, + "loss": 0.0133, "step": 373590 }, { - "epoch": 1.88, - "learning_rate": 1.7270988996574356e-05, - "loss": 0.0078, + "epoch": 0.97, + "learning_rate": 0.00015473623636208108, + "loss": 0.0128, "step": 373600 }, { - "epoch": 1.88, - "learning_rate": 1.7263421303560347e-05, - "loss": 0.0081, + "epoch": 0.97, + "learning_rate": 0.00015473234814570962, + "loss": 0.0141, "step": 373610 }, { - "epoch": 1.88, - "learning_rate": 1.7255853610546336e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015472845992933813, + "loss": 0.0121, "step": 373620 }, { - "epoch": 1.89, - "learning_rate": 1.7248285917532327e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015472457171296667, + "loss": 0.0111, "step": 373630 }, { - "epoch": 1.89, - "learning_rate": 1.7240718224518316e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.00015472068349659521, + "loss": 0.0136, "step": 373640 }, { - "epoch": 1.89, - "learning_rate": 1.7233150531504304e-05, - "loss": 0.0077, + "epoch": 0.97, + "learning_rate": 0.00015471679528022376, + "loss": 0.012, "step": 373650 }, { - "epoch": 1.89, - "learning_rate": 1.7225582838490292e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015471290706385227, + "loss": 0.0145, "step": 373660 }, { - "epoch": 1.89, - "learning_rate": 1.7218015145476284e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.0001547090188474808, + "loss": 0.0117, "step": 373670 }, { - "epoch": 1.89, - "learning_rate": 1.7210447452462272e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015470513063110933, + "loss": 0.0133, "step": 373680 }, { - "epoch": 1.89, - "learning_rate": 1.7202879759448263e-05, - "loss": 0.0076, + "epoch": 0.97, + "learning_rate": 0.0001547012424147379, + "loss": 0.0121, "step": 373690 }, { - "epoch": 1.89, - "learning_rate": 1.719531206643425e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.0001546973541983664, + "loss": 0.0139, "step": 373700 }, { - "epoch": 1.89, - "learning_rate": 1.7187744373420243e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015469346598199495, + "loss": 0.0119, "step": 373710 }, { - "epoch": 1.89, - "learning_rate": 1.718017668040623e-05, - "loss": 0.0082, + "epoch": 0.97, + "learning_rate": 0.00015468957776562347, + "loss": 0.0119, "step": 373720 }, { - "epoch": 1.89, - "learning_rate": 1.717260898739222e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015468568954925204, + "loss": 0.0095, "step": 373730 }, { - "epoch": 1.89, - "learning_rate": 1.716504129437821e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015468180133288055, + "loss": 0.0121, "step": 373740 }, { - "epoch": 1.89, - "learning_rate": 1.71574736013642e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.0001546779131165091, + "loss": 0.0375, "step": 373750 }, { - "epoch": 1.89, - "learning_rate": 1.714990590835019e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.0001546740249001376, + "loss": 0.0106, "step": 373760 }, { - "epoch": 1.89, - "learning_rate": 1.714233821533618e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015467013668376617, + "loss": 0.0124, "step": 373770 }, { - "epoch": 1.89, - "learning_rate": 1.713477052232217e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015466624846739472, + "loss": 0.0335, "step": 373780 }, { - "epoch": 1.89, - "learning_rate": 1.712720282930816e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015466236025102323, + "loss": 0.0131, "step": 373790 }, { - "epoch": 1.89, - "learning_rate": 1.711963513629415e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.00015465847203465177, + "loss": 0.0119, "step": 373800 }, { - "epoch": 1.89, - "learning_rate": 1.711206744328014e-05, - "loss": 0.0082, + "epoch": 0.97, + "learning_rate": 0.00015465458381828031, + "loss": 0.0126, "step": 373810 }, { - "epoch": 1.89, - "learning_rate": 1.7104499750266127e-05, - "loss": 0.0077, + "epoch": 0.97, + "learning_rate": 0.00015465069560190886, + "loss": 0.0152, "step": 373820 }, { - "epoch": 1.89, - "learning_rate": 1.709693205725212e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015464680738553737, + "loss": 0.0144, "step": 373830 }, { - "epoch": 1.89, - "learning_rate": 1.7089364364238107e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001546429191691659, + "loss": 0.0127, "step": 373840 }, { - "epoch": 1.89, - "learning_rate": 1.70817966712241e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015463903095279445, + "loss": 0.0101, "step": 373850 }, { - "epoch": 1.89, - "learning_rate": 1.7074228978210087e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.000154635142736423, + "loss": 0.0117, "step": 373860 }, { - "epoch": 1.89, - "learning_rate": 1.706666128519608e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.0001546312545200515, + "loss": 0.015, "step": 373870 }, { - "epoch": 1.89, - "learning_rate": 1.7059093592182067e-05, - "loss": 0.0073, + "epoch": 0.97, + "learning_rate": 0.00015462736630368005, + "loss": 0.0143, "step": 373880 }, { - "epoch": 1.89, - "learning_rate": 1.7051525899168055e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001546234780873086, + "loss": 0.0178, "step": 373890 }, { - "epoch": 1.89, - "learning_rate": 1.7043958206154047e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.00015461958987093713, + "loss": 0.0122, "step": 373900 }, { - "epoch": 1.89, - "learning_rate": 1.7036390513140035e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015461570165456565, + "loss": 0.012, "step": 373910 }, { - "epoch": 1.89, - "learning_rate": 1.7028822820126026e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.0001546118134381942, + "loss": 0.0124, "step": 373920 }, { - "epoch": 1.89, - "learning_rate": 1.7021255127112015e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001546079252218227, + "loss": 0.0177, "step": 373930 }, { - "epoch": 1.89, - "learning_rate": 1.7013687434098006e-05, - "loss": 0.0069, + "epoch": 0.97, + "learning_rate": 0.00015460403700545127, + "loss": 0.0123, "step": 373940 }, { - "epoch": 1.89, - "learning_rate": 1.7006119741083994e-05, - "loss": 0.0076, + "epoch": 0.97, + "learning_rate": 0.00015460014878907982, + "loss": 0.0124, "step": 373950 }, { - "epoch": 1.89, - "learning_rate": 1.6998552048069986e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015459626057270833, + "loss": 0.0116, "step": 373960 }, { - "epoch": 1.89, - "learning_rate": 1.6990984355055974e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015459237235633684, + "loss": 0.0106, "step": 373970 }, { - "epoch": 1.89, - "learning_rate": 1.6983416662041962e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.0001545884841399654, + "loss": 0.0225, "step": 373980 }, { - "epoch": 1.89, - "learning_rate": 1.6975848969027954e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015458459592359395, + "loss": 0.0136, "step": 373990 }, { - "epoch": 1.89, - "learning_rate": 1.6968281276013942e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015458070770722247, + "loss": 0.0093, "step": 374000 }, { - "epoch": 1.89, - "eval_cer": 0.9144294992658953, - "eval_loss": 0.004294942133128643, - "eval_runtime": 116.742, - "eval_samples_per_second": 17.132, - "eval_steps_per_second": 4.283, + "epoch": 0.97, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.00830517616122961, + "eval_runtime": 107.6382, + "eval_samples_per_second": 18.581, + "eval_steps_per_second": 4.645, "step": 374000 }, { - "epoch": 1.89, - "learning_rate": 1.6960713582999934e-05, - "loss": 0.0042, + "epoch": 0.97, + "learning_rate": 0.000154576819490851, + "loss": 0.0149, "step": 374010 }, { - "epoch": 1.89, - "learning_rate": 1.6953145889985922e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015457293127447955, + "loss": 0.0112, "step": 374020 }, { - "epoch": 1.89, - "learning_rate": 1.6945578196971914e-05, - "loss": 0.0079, + "epoch": 0.97, + "learning_rate": 0.0001545690430581081, + "loss": 0.0113, "step": 374030 }, { - "epoch": 1.89, - "learning_rate": 1.6938010503957902e-05, - "loss": 0.0031, + "epoch": 0.97, + "learning_rate": 0.0001545651548417366, + "loss": 0.011, "step": 374040 }, { - "epoch": 1.89, - "learning_rate": 1.693044281094389e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015456126662536515, + "loss": 0.0121, "step": 374050 }, { - "epoch": 1.89, - "learning_rate": 1.6922875117929882e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.0001545573784089937, + "loss": 0.0136, "step": 374060 }, { - "epoch": 1.89, - "learning_rate": 1.691530742491587e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015455349019262223, + "loss": 0.0113, "step": 374070 }, { - "epoch": 1.89, - "learning_rate": 1.690773973190186e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015454960197625075, + "loss": 0.0106, "step": 374080 }, { - "epoch": 1.89, - "learning_rate": 1.690017203888785e-05, - "loss": 0.0043, + "epoch": 0.97, + "learning_rate": 0.0001545457137598793, + "loss": 0.0127, "step": 374090 }, { - "epoch": 1.89, - "learning_rate": 1.689260434587384e-05, - "loss": 0.0077, + "epoch": 0.97, + "learning_rate": 0.00015454182554350786, + "loss": 0.0128, "step": 374100 }, { - "epoch": 1.89, - "learning_rate": 1.688503665285983e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015453793732713637, + "loss": 0.0105, "step": 374110 }, { - "epoch": 1.89, - "learning_rate": 1.687746895984582e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015453404911076491, + "loss": 0.0117, "step": 374120 }, { - "epoch": 1.89, - "learning_rate": 1.686990126683181e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015453016089439343, + "loss": 0.0128, "step": 374130 }, { - "epoch": 1.89, - "learning_rate": 1.6862333573817798e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.000154526272678022, + "loss": 0.0095, "step": 374140 }, { - "epoch": 1.89, - "learning_rate": 1.685476588080379e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001545223844616505, + "loss": 0.0117, "step": 374150 }, { - "epoch": 1.89, - "learning_rate": 1.6847198187789777e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015451849624527905, + "loss": 0.0129, "step": 374160 }, { - "epoch": 1.89, - "learning_rate": 1.683963049477577e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015451460802890757, + "loss": 0.0164, "step": 374170 }, { - "epoch": 1.89, - "learning_rate": 1.6832062801761757e-05, - "loss": 0.0045, + "epoch": 0.97, + "learning_rate": 0.0001545107198125361, + "loss": 0.0122, "step": 374180 }, { - "epoch": 1.89, - "learning_rate": 1.682449510874775e-05, - "loss": 0.0035, + "epoch": 0.97, + "learning_rate": 0.00015450683159616465, + "loss": 0.0124, "step": 374190 }, { - "epoch": 1.89, - "learning_rate": 1.6816927415733737e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.0001545029433797932, + "loss": 0.0113, "step": 374200 }, { - "epoch": 1.89, - "learning_rate": 1.6809359722719725e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.0001544990551634217, + "loss": 0.0121, "step": 374210 }, { - "epoch": 1.89, - "learning_rate": 1.6801792029705717e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015449516694705025, + "loss": 0.0144, "step": 374220 }, { - "epoch": 1.89, - "learning_rate": 1.6794224336691705e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.0001544912787306788, + "loss": 0.0105, "step": 374230 }, { - "epoch": 1.89, - "learning_rate": 1.6786656643677697e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015448739051430733, + "loss": 0.012, "step": 374240 }, { - "epoch": 1.89, - "learning_rate": 1.6779088950663685e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.00015448350229793585, + "loss": 0.0113, "step": 374250 }, { - "epoch": 1.89, - "learning_rate": 1.6771521257649677e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001544796140815644, + "loss": 0.0101, "step": 374260 }, { - "epoch": 1.89, - "learning_rate": 1.6763953564635665e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015447572586519296, + "loss": 0.0124, "step": 374270 }, { - "epoch": 1.89, - "learning_rate": 1.6756385871621653e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015447183764882147, + "loss": 0.0119, "step": 374280 }, { - "epoch": 1.89, - "learning_rate": 1.6748818178607645e-05, - "loss": 0.0045, + "epoch": 0.97, + "learning_rate": 0.00015446794943245, + "loss": 0.0113, "step": 374290 }, { - "epoch": 1.89, - "learning_rate": 1.6741250485593633e-05, - "loss": 0.0076, + "epoch": 0.97, + "learning_rate": 0.00015446406121607853, + "loss": 0.0136, "step": 374300 }, { - "epoch": 1.89, - "learning_rate": 1.6733682792579624e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.0001544601729997071, + "loss": 0.0129, "step": 374310 }, { - "epoch": 1.89, - "learning_rate": 1.6726115099565613e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.0001544562847833356, + "loss": 0.0132, "step": 374320 }, { - "epoch": 1.89, - "learning_rate": 1.6718547406551604e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015445239656696415, + "loss": 0.0102, "step": 374330 }, { - "epoch": 1.89, - "learning_rate": 1.6710979713537593e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015444850835059267, + "loss": 0.0136, "step": 374340 }, { - "epoch": 1.89, - "learning_rate": 1.6703412020523584e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015444462013422124, + "loss": 0.0133, "step": 374350 }, { - "epoch": 1.89, - "learning_rate": 1.6695844327509572e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015444073191784975, + "loss": 0.0124, "step": 374360 }, { - "epoch": 1.89, - "learning_rate": 1.668827663449556e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.0001544368437014783, + "loss": 0.0125, "step": 374370 }, { - "epoch": 1.89, - "learning_rate": 1.6680708941481552e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.0001544329554851068, + "loss": 0.0131, "step": 374380 }, { - "epoch": 1.89, - "learning_rate": 1.667314124846754e-05, - "loss": 0.0083, + "epoch": 0.97, + "learning_rate": 0.00015442906726873538, + "loss": 0.0148, "step": 374390 }, { - "epoch": 1.89, - "learning_rate": 1.6665573555453532e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.0001544251790523639, + "loss": 0.0112, "step": 374400 }, { - "epoch": 1.89, - "learning_rate": 1.665800586243952e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015442129083599243, + "loss": 0.0128, "step": 374410 }, { - "epoch": 1.89, - "learning_rate": 1.6650438169425512e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015441740261962095, + "loss": 0.0117, "step": 374420 }, { - "epoch": 1.89, - "learning_rate": 1.66428704764115e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001544135144032495, + "loss": 0.0117, "step": 374430 }, { - "epoch": 1.89, - "learning_rate": 1.6635302783397488e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015440962618687803, + "loss": 0.0116, "step": 374440 }, { - "epoch": 1.89, - "learning_rate": 1.6627735090383476e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015440573797050657, + "loss": 0.0103, "step": 374450 }, { - "epoch": 1.89, - "learning_rate": 1.6620167397369468e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001544018497541351, + "loss": 0.0122, "step": 374460 }, { - "epoch": 1.89, - "learning_rate": 1.661259970435546e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015439796153776363, + "loss": 0.0107, "step": 374470 }, { - "epoch": 1.89, - "learning_rate": 1.6605032011341448e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.0001543940733213922, + "loss": 0.0156, "step": 374480 }, { - "epoch": 1.89, - "learning_rate": 1.659746431832744e-05, - "loss": 0.0079, + "epoch": 0.97, + "learning_rate": 0.0001543901851050207, + "loss": 0.0129, "step": 374490 }, { - "epoch": 1.89, - "learning_rate": 1.6589896625313428e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015438629688864925, + "loss": 0.0138, "step": 374500 }, { - "epoch": 1.89, - "learning_rate": 1.658232893229942e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015438240867227777, + "loss": 0.0105, "step": 374510 }, { - "epoch": 1.89, - "learning_rate": 1.6574761239285404e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015437852045590634, + "loss": 0.018, "step": 374520 }, { - "epoch": 1.89, - "learning_rate": 1.6567193546271396e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015437463223953485, + "loss": 0.011, "step": 374530 }, { - "epoch": 1.89, - "learning_rate": 1.6559625853257384e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.0001543707440231634, + "loss": 0.0123, "step": 374540 }, { - "epoch": 1.89, - "learning_rate": 1.6552058160243376e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.0001543668558067919, + "loss": 0.0084, "step": 374550 }, { - "epoch": 1.89, - "learning_rate": 1.6544490467229364e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015436296759042048, + "loss": 0.0109, "step": 374560 }, { - "epoch": 1.89, - "learning_rate": 1.6536922774215355e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.000154359079374049, + "loss": 0.0099, "step": 374570 }, { - "epoch": 1.89, - "learning_rate": 1.6529355081201347e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015435519115767753, + "loss": 0.01, "step": 374580 }, { - "epoch": 1.89, - "learning_rate": 1.6521787388187335e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015435130294130605, + "loss": 0.0104, "step": 374590 }, { - "epoch": 1.89, - "learning_rate": 1.6514219695173323e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015434741472493462, + "loss": 0.0114, "step": 374600 }, { - "epoch": 1.89, - "learning_rate": 1.650665200215931e-05, - "loss": 0.0079, + "epoch": 0.97, + "learning_rate": 0.00015434352650856313, + "loss": 0.0107, "step": 374610 }, { - "epoch": 1.89, - "learning_rate": 1.6499084309145303e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.00015433963829219167, + "loss": 0.0104, "step": 374620 }, { - "epoch": 1.89, - "learning_rate": 1.649151661613129e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015433575007582019, + "loss": 0.0132, "step": 374630 }, { - "epoch": 1.89, - "learning_rate": 1.6483948923117283e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015433186185944875, + "loss": 0.0109, "step": 374640 }, { - "epoch": 1.89, - "learning_rate": 1.647638123010327e-05, - "loss": 0.0079, + "epoch": 0.97, + "learning_rate": 0.0001543279736430773, + "loss": 0.0116, "step": 374650 }, { - "epoch": 1.89, - "learning_rate": 1.6468813537089263e-05, - "loss": 0.0065, + "epoch": 0.97, + "learning_rate": 0.0001543240854267058, + "loss": 0.0136, "step": 374660 }, { - "epoch": 1.89, - "learning_rate": 1.646124584407525e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015432019721033435, + "loss": 0.0124, "step": 374670 }, { - "epoch": 1.89, - "learning_rate": 1.645367815106124e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015431630899396287, + "loss": 0.0108, "step": 374680 }, { - "epoch": 1.89, - "learning_rate": 1.644611045804723e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015431242077759144, + "loss": 0.0153, "step": 374690 }, { - "epoch": 1.89, - "learning_rate": 1.643854276503322e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015430853256121995, + "loss": 0.0108, "step": 374700 }, { - "epoch": 1.89, - "learning_rate": 1.643097507201921e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.0001543046443448485, + "loss": 0.0102, "step": 374710 }, { - "epoch": 1.89, - "learning_rate": 1.64234073790052e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.000154300756128477, + "loss": 0.0133, "step": 374720 }, { - "epoch": 1.89, - "learning_rate": 1.641583968599119e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015429686791210558, + "loss": 0.0158, "step": 374730 }, { - "epoch": 1.89, - "learning_rate": 1.640827199297718e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.0001542929796957341, + "loss": 0.0147, "step": 374740 }, { - "epoch": 1.89, - "learning_rate": 1.6400704299963167e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015428909147936263, + "loss": 0.0155, "step": 374750 }, { - "epoch": 1.89, - "learning_rate": 1.639313660694916e-05, - "loss": 0.0041, + "epoch": 0.97, + "learning_rate": 0.00015428520326299115, + "loss": 0.0162, "step": 374760 }, { - "epoch": 1.89, - "learning_rate": 1.6385568913935147e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015428131504661971, + "loss": 0.0135, "step": 374770 }, { - "epoch": 1.89, - "learning_rate": 1.637800122092114e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015427742683024823, + "loss": 0.0142, "step": 374780 }, { - "epoch": 1.89, - "learning_rate": 1.6370433527907127e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015427353861387677, + "loss": 0.0167, "step": 374790 }, { - "epoch": 1.89, - "learning_rate": 1.636286583489312e-05, - "loss": 0.0075, + "epoch": 0.97, + "learning_rate": 0.00015426965039750529, + "loss": 0.0111, "step": 374800 }, { - "epoch": 1.89, - "learning_rate": 1.6355298141879107e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015426576218113385, + "loss": 0.0144, "step": 374810 }, { - "epoch": 1.89, - "learning_rate": 1.6347730448865098e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.0001542618739647624, + "loss": 0.0119, "step": 374820 }, { - "epoch": 1.89, - "learning_rate": 1.6340162755851086e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001542579857483909, + "loss": 0.0121, "step": 374830 }, { - "epoch": 1.89, - "learning_rate": 1.6332595062837075e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015425409753201942, + "loss": 0.0109, "step": 374840 }, { - "epoch": 1.89, - "learning_rate": 1.6325027369823066e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.000154250209315648, + "loss": 0.0141, "step": 374850 }, { - "epoch": 1.89, - "learning_rate": 1.6317459676809054e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015424632109927654, + "loss": 0.0165, "step": 374860 }, { - "epoch": 1.89, - "learning_rate": 1.6309891983795046e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015424243288290505, + "loss": 0.0116, "step": 374870 }, { - "epoch": 1.89, - "learning_rate": 1.6302324290781034e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001542385446665336, + "loss": 0.0142, "step": 374880 }, { - "epoch": 1.89, - "learning_rate": 1.6294756597767026e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.0001542346564501621, + "loss": 0.0122, "step": 374890 }, { - "epoch": 1.89, - "learning_rate": 1.6287188904753014e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015423076823379067, + "loss": 0.0128, "step": 374900 }, { - "epoch": 1.89, - "learning_rate": 1.6279621211739002e-05, - "loss": 0.0075, + "epoch": 0.97, + "learning_rate": 0.0001542268800174192, + "loss": 0.0132, "step": 374910 }, { - "epoch": 1.89, - "learning_rate": 1.6272053518724994e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015422299180104773, + "loss": 0.012, "step": 374920 }, { - "epoch": 1.89, - "learning_rate": 1.6264485825710982e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015421910358467625, + "loss": 0.0115, "step": 374930 }, { - "epoch": 1.89, - "learning_rate": 1.6256918132696974e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015421521536830481, + "loss": 0.0129, "step": 374940 }, { - "epoch": 1.89, - "learning_rate": 1.6249350439682962e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015421132715193333, + "loss": 0.0138, "step": 374950 }, { - "epoch": 1.89, - "learning_rate": 1.6241782746668954e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015420743893556187, + "loss": 0.0132, "step": 374960 }, { - "epoch": 1.89, - "learning_rate": 1.6234215053654942e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015420355071919038, + "loss": 0.0121, "step": 374970 }, { - "epoch": 1.89, - "learning_rate": 1.6226647360640933e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015419966250281895, + "loss": 0.01, "step": 374980 }, { - "epoch": 1.89, - "learning_rate": 1.621907966762692e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.0001541957742864475, + "loss": 0.0172, "step": 374990 }, { - "epoch": 1.89, - "learning_rate": 1.621151197461291e-05, - "loss": 0.0035, + "epoch": 0.97, + "learning_rate": 0.000154191886070076, + "loss": 0.0126, "step": 375000 }, { - "epoch": 1.89, - "eval_cer": 0.9144246472852683, - "eval_loss": 0.004302851855754852, - "eval_runtime": 116.6099, - "eval_samples_per_second": 17.151, - "eval_steps_per_second": 4.288, + "epoch": 0.97, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.008427051827311516, + "eval_runtime": 107.5685, + "eval_samples_per_second": 18.593, + "eval_steps_per_second": 4.648, "step": 375000 }, { - "epoch": 1.89, - "learning_rate": 1.62039442815989e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015418799785370452, + "loss": 0.012, "step": 375010 }, { - "epoch": 1.89, - "learning_rate": 1.619637658858489e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.0001541841096373331, + "loss": 0.0136, "step": 375020 }, { - "epoch": 1.89, - "learning_rate": 1.618880889557088e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015418022142096163, + "loss": 0.0121, "step": 375030 }, { - "epoch": 1.89, - "learning_rate": 1.618124120255687e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015417633320459015, + "loss": 0.0115, "step": 375040 }, { - "epoch": 1.89, - "learning_rate": 1.617367350954286e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001541724449882187, + "loss": 0.0122, "step": 375050 }, { - "epoch": 1.89, - "learning_rate": 1.616610581652885e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015416855677184723, + "loss": 0.0134, "step": 375060 }, { - "epoch": 1.89, - "learning_rate": 1.6158538123514838e-05, - "loss": 0.0039, + "epoch": 0.97, + "learning_rate": 0.00015416466855547577, + "loss": 0.0157, "step": 375070 }, { - "epoch": 1.89, - "learning_rate": 1.615097043050083e-05, - "loss": 0.0069, + "epoch": 0.97, + "learning_rate": 0.0001541607803391043, + "loss": 0.0129, "step": 375080 }, { - "epoch": 1.89, - "learning_rate": 1.6143402737486817e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.00015415689212273283, + "loss": 0.0113, "step": 375090 }, { - "epoch": 1.89, - "learning_rate": 1.613583504447281e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015415300390636137, + "loss": 0.0138, "step": 375100 }, { - "epoch": 1.89, - "learning_rate": 1.6128267351458797e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015414911568998991, + "loss": 0.0128, "step": 375110 }, { - "epoch": 1.89, - "learning_rate": 1.612069965844479e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015414522747361843, + "loss": 0.0138, "step": 375120 }, { - "epoch": 1.89, - "learning_rate": 1.6113131965430777e-05, - "loss": 0.0069, + "epoch": 0.97, + "learning_rate": 0.00015414133925724697, + "loss": 0.0142, "step": 375130 }, { - "epoch": 1.89, - "learning_rate": 1.610556427241677e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015413745104087548, + "loss": 0.0141, "step": 375140 }, { - "epoch": 1.89, - "learning_rate": 1.6097996579402757e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015413356282450405, + "loss": 0.0139, "step": 375150 }, { - "epoch": 1.89, - "learning_rate": 1.6090428886388745e-05, - "loss": 0.0045, + "epoch": 0.97, + "learning_rate": 0.00015412967460813257, + "loss": 0.0134, "step": 375160 }, { - "epoch": 1.89, - "learning_rate": 1.6082861193374737e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.0001541257863917611, + "loss": 0.0132, "step": 375170 }, { - "epoch": 1.89, - "learning_rate": 1.6075293500360725e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015412189817538962, + "loss": 0.0132, "step": 375180 }, { - "epoch": 1.89, - "learning_rate": 1.6067725807346716e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.0001541180099590182, + "loss": 0.0134, "step": 375190 }, { - "epoch": 1.89, - "learning_rate": 1.6060158114332705e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.00015411412174264673, + "loss": 0.0126, "step": 375200 }, { - "epoch": 1.89, - "learning_rate": 1.6052590421318696e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015411023352627525, + "loss": 0.0144, "step": 375210 }, { - "epoch": 1.89, - "learning_rate": 1.6045022728304685e-05, - "loss": 0.0041, + "epoch": 0.97, + "learning_rate": 0.0001541063453099038, + "loss": 0.0116, "step": 375220 }, { - "epoch": 1.89, - "learning_rate": 1.6037455035290673e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015410245709353233, + "loss": 0.0129, "step": 375230 }, { - "epoch": 1.89, - "learning_rate": 1.6029887342276664e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015409856887716087, + "loss": 0.0108, "step": 375240 }, { - "epoch": 1.89, - "learning_rate": 1.6022319649262653e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.0001540946806607894, + "loss": 0.0103, "step": 375250 }, { - "epoch": 1.89, - "learning_rate": 1.6014751956248644e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015409079244441793, + "loss": 0.012, "step": 375260 }, { - "epoch": 1.89, - "learning_rate": 1.6007184263234632e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015408690422804647, + "loss": 0.012, "step": 375270 }, { - "epoch": 1.89, - "learning_rate": 1.5999616570220624e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.000154083016011675, + "loss": 0.0162, "step": 375280 }, { - "epoch": 1.89, - "learning_rate": 1.5992048877206612e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015407912779530353, + "loss": 0.0113, "step": 375290 }, { - "epoch": 1.89, - "learning_rate": 1.59844811841926e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015407523957893207, + "loss": 0.012, "step": 375300 }, { - "epoch": 1.89, - "learning_rate": 1.5976913491178592e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001540713513625606, + "loss": 0.0138, "step": 375310 }, { - "epoch": 1.89, - "learning_rate": 1.596934579816458e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015406746314618915, + "loss": 0.0123, "step": 375320 }, { - "epoch": 1.89, - "learning_rate": 1.5961778105150572e-05, - "loss": 0.006, + "epoch": 0.97, + "learning_rate": 0.00015406357492981767, + "loss": 0.0154, "step": 375330 }, { - "epoch": 1.89, - "learning_rate": 1.595421041213656e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.0001540596867134462, + "loss": 0.0112, "step": 375340 }, { - "epoch": 1.89, - "learning_rate": 1.594664271912255e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015405579849707478, + "loss": 0.0159, "step": 375350 }, { - "epoch": 1.89, - "learning_rate": 1.593907502610854e-05, - "loss": 0.0079, + "epoch": 0.97, + "learning_rate": 0.0001540519102807033, + "loss": 0.0166, "step": 375360 }, { - "epoch": 1.89, - "learning_rate": 1.593150733309453e-05, - "loss": 0.0071, + "epoch": 0.97, + "learning_rate": 0.00015404802206433183, + "loss": 0.013, "step": 375370 }, { - "epoch": 1.89, - "learning_rate": 1.5923939640080516e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015404413384796035, + "loss": 0.0176, "step": 375380 }, { - "epoch": 1.89, - "learning_rate": 1.5916371947066508e-05, - "loss": 0.0042, + "epoch": 0.97, + "learning_rate": 0.0001540402456315889, + "loss": 0.012, "step": 375390 }, { - "epoch": 1.89, - "learning_rate": 1.5908804254052496e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015403635741521743, + "loss": 0.0134, "step": 375400 }, { - "epoch": 1.89, - "learning_rate": 1.5901236561038488e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015403246919884597, + "loss": 0.0095, "step": 375410 }, { - "epoch": 1.89, - "learning_rate": 1.5893668868024476e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.0001540285809824745, + "loss": 0.0134, "step": 375420 }, { - "epoch": 1.89, - "learning_rate": 1.5886101175010468e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015402469276610303, + "loss": 0.0123, "step": 375430 }, { - "epoch": 1.89, - "learning_rate": 1.587853348199646e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015402080454973157, + "loss": 0.0093, "step": 375440 }, { - "epoch": 1.89, - "learning_rate": 1.5870965788982447e-05, - "loss": 0.0041, + "epoch": 0.97, + "learning_rate": 0.0001540169163333601, + "loss": 0.0111, "step": 375450 }, { - "epoch": 1.89, - "learning_rate": 1.5863398095968436e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015401302811698863, + "loss": 0.0144, "step": 375460 }, { - "epoch": 1.89, - "learning_rate": 1.5855830402954424e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.00015400913990061717, + "loss": 0.0089, "step": 375470 }, { - "epoch": 1.89, - "learning_rate": 1.5848262709940415e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.0001540052516842457, + "loss": 0.0119, "step": 375480 }, { - "epoch": 1.89, - "learning_rate": 1.5840695016926404e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015400136346787425, + "loss": 0.0127, "step": 375490 }, { - "epoch": 1.89, - "learning_rate": 1.5833127323912395e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.00015399747525150277, + "loss": 0.0097, "step": 375500 }, { - "epoch": 1.89, - "learning_rate": 1.5825559630898384e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.0001539935870351313, + "loss": 0.0121, "step": 375510 }, { - "epoch": 1.89, - "learning_rate": 1.5817991937884375e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015398969881875988, + "loss": 0.0147, "step": 375520 }, { - "epoch": 1.89, - "learning_rate": 1.5810424244870363e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.0001539858106023884, + "loss": 0.0114, "step": 375530 }, { - "epoch": 1.89, - "learning_rate": 1.580285655185635e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015398192238601693, + "loss": 0.0141, "step": 375540 }, { - "epoch": 1.89, - "learning_rate": 1.5795288858842343e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015397803416964545, + "loss": 0.013, "step": 375550 }, { - "epoch": 1.89, - "learning_rate": 1.578772116582833e-05, - "loss": 0.0073, + "epoch": 0.97, + "learning_rate": 0.00015397414595327402, + "loss": 0.0153, "step": 375560 }, { - "epoch": 1.89, - "learning_rate": 1.5780153472814323e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015397025773690253, + "loss": 0.016, "step": 375570 }, { - "epoch": 1.89, - "learning_rate": 1.577258577980031e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015396636952053107, + "loss": 0.0156, "step": 375580 }, { - "epoch": 1.89, - "learning_rate": 1.5765018086786303e-05, - "loss": 0.004, + "epoch": 0.97, + "learning_rate": 0.0001539624813041596, + "loss": 0.0181, "step": 375590 }, { - "epoch": 1.89, - "learning_rate": 1.575745039377229e-05, - "loss": 0.0067, + "epoch": 0.97, + "learning_rate": 0.00015395859308778816, + "loss": 0.0137, "step": 375600 }, { - "epoch": 1.89, - "learning_rate": 1.5749882700758283e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015395470487141667, + "loss": 0.019, "step": 375610 }, { - "epoch": 1.9, - "learning_rate": 1.574231500774427e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.0001539508166550452, + "loss": 0.0165, "step": 375620 }, { - "epoch": 1.9, - "learning_rate": 1.573474731473026e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015394692843867373, + "loss": 0.0128, "step": 375630 }, { - "epoch": 1.9, - "learning_rate": 1.572717962171625e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015394304022230227, + "loss": 0.0121, "step": 375640 }, { - "epoch": 1.9, - "learning_rate": 1.571961192870224e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001539391520059308, + "loss": 0.0133, "step": 375650 }, { - "epoch": 1.9, - "learning_rate": 1.571204423568823e-05, - "loss": 0.0058, + "epoch": 0.97, + "learning_rate": 0.00015393526378955935, + "loss": 0.0156, "step": 375660 }, { - "epoch": 1.9, - "learning_rate": 1.570447654267422e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015393137557318787, + "loss": 0.0127, "step": 375670 }, { - "epoch": 1.9, - "learning_rate": 1.569690884966021e-05, - "loss": 0.0066, + "epoch": 0.97, + "learning_rate": 0.0001539274873568164, + "loss": 0.0118, "step": 375680 }, { - "epoch": 1.9, - "learning_rate": 1.56893411566462e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015392359914044498, + "loss": 0.022, "step": 375690 }, { - "epoch": 1.9, - "learning_rate": 1.5681773463632187e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.0001539197109240735, + "loss": 0.0113, "step": 375700 }, { - "epoch": 1.9, - "learning_rate": 1.567420577061818e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015391582270770203, + "loss": 0.0122, "step": 375710 }, { - "epoch": 1.9, - "learning_rate": 1.5666638077604167e-05, - "loss": 0.0035, + "epoch": 0.97, + "learning_rate": 0.00015391193449133055, + "loss": 0.0158, "step": 375720 }, { - "epoch": 1.9, - "learning_rate": 1.5659070384590158e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015390804627495912, + "loss": 0.0138, "step": 375730 }, { - "epoch": 1.9, - "learning_rate": 1.5651502691576146e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015390415805858763, + "loss": 0.0114, "step": 375740 }, { - "epoch": 1.9, - "learning_rate": 1.5643934998562138e-05, - "loss": 0.0076, + "epoch": 0.97, + "learning_rate": 0.00015390026984221617, + "loss": 0.014, "step": 375750 }, { - "epoch": 1.9, - "learning_rate": 1.5636367305548126e-05, - "loss": 0.0041, + "epoch": 0.97, + "learning_rate": 0.0001538963816258447, + "loss": 0.0115, "step": 375760 }, { - "epoch": 1.9, - "learning_rate": 1.5628799612534114e-05, - "loss": 0.0043, + "epoch": 0.97, + "learning_rate": 0.00015389249340947326, + "loss": 0.009, "step": 375770 }, { - "epoch": 1.9, - "learning_rate": 1.5621231919520106e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015388860519310177, + "loss": 0.0104, "step": 375780 }, { - "epoch": 1.9, - "learning_rate": 1.5613664226506094e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.0001538847169767303, + "loss": 0.0113, "step": 375790 }, { - "epoch": 1.9, - "learning_rate": 1.5606096533492086e-05, - "loss": 0.0054, + "epoch": 0.97, + "learning_rate": 0.00015388082876035883, + "loss": 0.0145, "step": 375800 }, { - "epoch": 1.9, - "learning_rate": 1.5598528840478074e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001538769405439874, + "loss": 0.012, "step": 375810 }, { - "epoch": 1.9, - "learning_rate": 1.5590961147464066e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.0001538730523276159, + "loss": 0.0172, "step": 375820 }, { - "epoch": 1.9, - "learning_rate": 1.5583393454450054e-05, - "loss": 0.0072, + "epoch": 0.97, + "learning_rate": 0.00015386916411124445, + "loss": 0.011, "step": 375830 }, { - "epoch": 1.9, - "learning_rate": 1.5575825761436046e-05, - "loss": 0.0037, + "epoch": 0.97, + "learning_rate": 0.00015386527589487297, + "loss": 0.015, "step": 375840 }, { - "epoch": 1.9, - "learning_rate": 1.5568258068422034e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.00015386138767850153, + "loss": 0.0109, "step": 375850 }, { - "epoch": 1.9, - "learning_rate": 1.5560690375408022e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.00015385749946213008, + "loss": 0.013, "step": 375860 }, { - "epoch": 1.9, - "learning_rate": 1.5553122682394014e-05, - "loss": 0.0048, + "epoch": 0.97, + "learning_rate": 0.0001538536112457586, + "loss": 0.0108, "step": 375870 }, { - "epoch": 1.9, - "learning_rate": 1.5545554989380002e-05, - "loss": 0.0044, + "epoch": 0.97, + "learning_rate": 0.0001538497230293871, + "loss": 0.0117, "step": 375880 }, { - "epoch": 1.9, - "learning_rate": 1.5537987296365993e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015384583481301565, + "loss": 0.0118, "step": 375890 }, { - "epoch": 1.9, - "learning_rate": 1.553041960335198e-05, - "loss": 0.0047, + "epoch": 0.97, + "learning_rate": 0.00015384194659664422, + "loss": 0.0131, "step": 375900 }, { - "epoch": 1.9, - "learning_rate": 1.5522851910337973e-05, - "loss": 0.0063, + "epoch": 0.97, + "learning_rate": 0.00015383805838027273, + "loss": 0.0132, "step": 375910 }, { - "epoch": 1.9, - "learning_rate": 1.551528421732396e-05, - "loss": 0.0056, + "epoch": 0.97, + "learning_rate": 0.00015383417016390127, + "loss": 0.0114, "step": 375920 }, { - "epoch": 1.9, - "learning_rate": 1.550771652430995e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.00015383028194752979, + "loss": 0.0118, "step": 375930 }, { - "epoch": 1.9, - "learning_rate": 1.550014883129594e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.00015382639373115835, + "loss": 0.0125, "step": 375940 }, { - "epoch": 1.9, - "learning_rate": 1.549258113828193e-05, - "loss": 0.0049, + "epoch": 0.97, + "learning_rate": 0.00015382250551478687, + "loss": 0.0095, "step": 375950 }, { - "epoch": 1.9, - "learning_rate": 1.548501344526792e-05, - "loss": 0.005, + "epoch": 0.97, + "learning_rate": 0.0001538186172984154, + "loss": 0.0148, "step": 375960 }, { - "epoch": 1.9, - "learning_rate": 1.547744575225391e-05, - "loss": 0.0057, + "epoch": 0.97, + "learning_rate": 0.00015381472908204393, + "loss": 0.0193, "step": 375970 }, { - "epoch": 1.9, - "learning_rate": 1.54698780592399e-05, - "loss": 0.0068, + "epoch": 0.97, + "learning_rate": 0.0001538108408656725, + "loss": 0.0105, "step": 375980 }, { - "epoch": 1.9, - "learning_rate": 1.546231036622589e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.000153806952649301, + "loss": 0.0117, "step": 375990 }, { - "epoch": 1.9, - "learning_rate": 1.545474267321188e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015380306443292955, + "loss": 0.0167, "step": 376000 }, { - "epoch": 1.9, - "eval_cer": 0.9144372624348985, - "eval_loss": 0.00426588486880064, - "eval_runtime": 116.7025, - "eval_samples_per_second": 17.138, - "eval_steps_per_second": 4.284, + "epoch": 0.97, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.008328206837177277, + "eval_runtime": 107.5837, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.648, "step": 376000 }, { - "epoch": 1.9, - "learning_rate": 1.544717498019787e-05, - "loss": 0.0051, + "epoch": 0.97, + "learning_rate": 0.00015379917621655806, + "loss": 0.0117, "step": 376010 }, { - "epoch": 1.9, - "learning_rate": 1.5439607287183857e-05, - "loss": 0.0062, + "epoch": 0.97, + "learning_rate": 0.00015379528800018663, + "loss": 0.0131, "step": 376020 }, { - "epoch": 1.9, - "learning_rate": 1.543203959416985e-05, - "loss": 0.007, + "epoch": 0.97, + "learning_rate": 0.00015379139978381515, + "loss": 0.0111, "step": 376030 }, { - "epoch": 1.9, - "learning_rate": 1.5424471901155837e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.0001537875115674437, + "loss": 0.0131, "step": 376040 }, { - "epoch": 1.9, - "learning_rate": 1.541690420814183e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.0001537836233510722, + "loss": 0.0131, "step": 376050 }, { - "epoch": 1.9, - "learning_rate": 1.5409336515127817e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015377973513470077, + "loss": 0.0114, "step": 376060 }, { - "epoch": 1.9, - "learning_rate": 1.540176882211381e-05, - "loss": 0.0059, + "epoch": 0.97, + "learning_rate": 0.00015377584691832931, + "loss": 0.0101, "step": 376070 }, { - "epoch": 1.9, - "learning_rate": 1.5394201129099797e-05, - "loss": 0.0055, + "epoch": 0.97, + "learning_rate": 0.00015377195870195783, + "loss": 0.0125, "step": 376080 }, { - "epoch": 1.9, - "learning_rate": 1.5386633436085785e-05, - "loss": 0.0061, + "epoch": 0.97, + "learning_rate": 0.00015376807048558637, + "loss": 0.0163, "step": 376090 }, { - "epoch": 1.9, - "learning_rate": 1.5379065743071777e-05, - "loss": 0.0052, + "epoch": 0.97, + "learning_rate": 0.0001537641822692149, + "loss": 0.0117, "step": 376100 }, { - "epoch": 1.9, - "learning_rate": 1.5371498050057765e-05, - "loss": 0.0053, + "epoch": 0.97, + "learning_rate": 0.00015376029405284345, + "loss": 0.0099, "step": 376110 }, { - "epoch": 1.9, - "learning_rate": 1.5363930357043756e-05, - "loss": 0.0046, + "epoch": 0.97, + "learning_rate": 0.00015375640583647197, + "loss": 0.0119, "step": 376120 }, { - "epoch": 1.9, - "learning_rate": 1.5356362664029745e-05, - "loss": 0.0064, + "epoch": 0.97, + "learning_rate": 0.0001537525176201005, + "loss": 0.0125, "step": 376130 }, { - "epoch": 1.9, - "learning_rate": 1.5348794971015736e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.00015374862940372902, + "loss": 0.0134, "step": 376140 }, { - "epoch": 1.9, - "learning_rate": 1.5341227278001724e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.0001537447411873576, + "loss": 0.0094, "step": 376150 }, { - "epoch": 1.9, - "learning_rate": 1.5333659584987716e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.0001537408529709861, + "loss": 0.0121, "step": 376160 }, { - "epoch": 1.9, - "learning_rate": 1.5326091891973704e-05, - "loss": 0.0039, + "epoch": 0.98, + "learning_rate": 0.00015373696475461465, + "loss": 0.0121, "step": 376170 }, { - "epoch": 1.9, - "learning_rate": 1.5318524198959692e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015373307653824316, + "loss": 0.0144, "step": 376180 }, { - "epoch": 1.9, - "learning_rate": 1.5310956505945684e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015372918832187173, + "loss": 0.0118, "step": 376190 }, { - "epoch": 1.9, - "learning_rate": 1.5303388812931672e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.00015372530010550025, + "loss": 0.0126, "step": 376200 }, { - "epoch": 1.9, - "learning_rate": 1.5295821119917664e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.0001537214118891288, + "loss": 0.0116, "step": 376210 }, { - "epoch": 1.9, - "learning_rate": 1.5288253426903652e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.0001537175236727573, + "loss": 0.0099, "step": 376220 }, { - "epoch": 1.9, - "learning_rate": 1.5280685733889644e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015371363545638587, + "loss": 0.0126, "step": 376230 }, { - "epoch": 1.9, - "learning_rate": 1.5273118040875632e-05, - "loss": 0.0102, + "epoch": 0.98, + "learning_rate": 0.00015370974724001441, + "loss": 0.0149, "step": 376240 }, { - "epoch": 1.9, - "learning_rate": 1.526555034786162e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015370585902364293, + "loss": 0.0143, "step": 376250 }, { - "epoch": 1.9, - "learning_rate": 1.525798265484761e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015370197080727147, + "loss": 0.0122, "step": 376260 }, { - "epoch": 1.9, - "learning_rate": 1.52504149618336e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.0001536980825909, + "loss": 0.0151, "step": 376270 }, { - "epoch": 1.9, - "learning_rate": 1.524284726881959e-05, - "loss": 0.0069, + "epoch": 0.98, + "learning_rate": 0.00015369419437452855, + "loss": 0.0107, "step": 376280 }, { - "epoch": 1.9, - "learning_rate": 1.523527957580558e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015369030615815707, + "loss": 0.0111, "step": 376290 }, { - "epoch": 1.9, - "learning_rate": 1.522771188279157e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.0001536864179417856, + "loss": 0.0106, "step": 376300 }, { - "epoch": 1.9, - "learning_rate": 1.522014418977756e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015368252972541415, + "loss": 0.0125, "step": 376310 }, { - "epoch": 1.9, - "learning_rate": 1.5212576496763548e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001536786415090427, + "loss": 0.0105, "step": 376320 }, { - "epoch": 1.9, - "learning_rate": 1.5205008803749538e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001536747532926712, + "loss": 0.0126, "step": 376330 }, { - "epoch": 1.9, - "learning_rate": 1.5197441110735528e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015367086507629975, + "loss": 0.012, "step": 376340 }, { - "epoch": 1.9, - "learning_rate": 1.5189873417721518e-05, - "loss": 0.0096, + "epoch": 0.98, + "learning_rate": 0.0001536669768599283, + "loss": 0.0126, "step": 376350 }, { - "epoch": 1.9, - "learning_rate": 1.5182305724707507e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015366308864355683, + "loss": 0.0164, "step": 376360 }, { - "epoch": 1.9, - "learning_rate": 1.5174738031693497e-05, - "loss": 0.0077, + "epoch": 0.98, + "learning_rate": 0.00015365920042718535, + "loss": 0.0115, "step": 376370 }, { - "epoch": 1.9, - "learning_rate": 1.5167170338679487e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.0001536553122108139, + "loss": 0.0146, "step": 376380 }, { - "epoch": 1.9, - "learning_rate": 1.5159602645665477e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001536514239944424, + "loss": 0.0122, "step": 376390 }, { - "epoch": 1.9, - "learning_rate": 1.5152034952651465e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015364753577807097, + "loss": 0.0119, "step": 376400 }, { - "epoch": 1.9, - "learning_rate": 1.5144467259637455e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.0001536436475616995, + "loss": 0.0133, "step": 376410 }, { - "epoch": 1.9, - "learning_rate": 1.5136899566623445e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015363975934532803, + "loss": 0.0097, "step": 376420 }, { - "epoch": 1.9, - "learning_rate": 1.5129331873609435e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015363587112895654, + "loss": 0.0119, "step": 376430 }, { - "epoch": 1.9, - "learning_rate": 1.5121764180595425e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.0001536319829125851, + "loss": 0.011, "step": 376440 }, { - "epoch": 1.9, - "learning_rate": 1.5114196487581415e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015362809469621365, + "loss": 0.0143, "step": 376450 }, { - "epoch": 1.9, - "learning_rate": 1.5106628794567405e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015362420647984217, + "loss": 0.0145, "step": 376460 }, { - "epoch": 1.9, - "learning_rate": 1.5099061101553395e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.0001536203182634707, + "loss": 0.0138, "step": 376470 }, { - "epoch": 1.9, - "learning_rate": 1.5091493408539383e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015361643004709925, + "loss": 0.0131, "step": 376480 }, { - "epoch": 1.9, - "learning_rate": 1.5083925715525373e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.0001536125418307278, + "loss": 0.0128, "step": 376490 }, { - "epoch": 1.9, - "learning_rate": 1.5076358022511363e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.0001536086536143563, + "loss": 0.0168, "step": 376500 }, { - "epoch": 1.9, - "learning_rate": 1.5068790329497353e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015360476539798485, + "loss": 0.0113, "step": 376510 }, { - "epoch": 1.9, - "learning_rate": 1.5061222636483343e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.0001536008771816134, + "loss": 0.0134, "step": 376520 }, { - "epoch": 1.9, - "learning_rate": 1.5053654943469333e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015359698896524193, + "loss": 0.0103, "step": 376530 }, { - "epoch": 1.9, - "learning_rate": 1.5046087250455323e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015359310074887045, + "loss": 0.0116, "step": 376540 }, { - "epoch": 1.9, - "learning_rate": 1.5038519557441312e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.000153589212532499, + "loss": 0.0098, "step": 376550 }, { - "epoch": 1.9, - "learning_rate": 1.50309518644273e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015358532431612756, + "loss": 0.0138, "step": 376560 }, { - "epoch": 1.9, - "learning_rate": 1.502338417141329e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015358143609975607, + "loss": 0.015, "step": 376570 }, { - "epoch": 1.9, - "learning_rate": 1.501581647839928e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.0001535775478833846, + "loss": 0.02, "step": 376580 }, { - "epoch": 1.9, - "learning_rate": 1.500824878538527e-05, - "loss": 0.004, + "epoch": 0.98, + "learning_rate": 0.00015357365966701313, + "loss": 0.0111, "step": 376590 }, { - "epoch": 1.9, - "learning_rate": 1.500068109237126e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001535697714506417, + "loss": 0.0141, "step": 376600 }, { - "epoch": 1.9, - "learning_rate": 1.499311339935725e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.0001535658832342702, + "loss": 0.0106, "step": 376610 }, { - "epoch": 1.9, - "learning_rate": 1.498554570634324e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015356199501789875, + "loss": 0.0111, "step": 376620 }, { - "epoch": 1.9, - "learning_rate": 1.497797801332923e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015355810680152727, + "loss": 0.0108, "step": 376630 }, { - "epoch": 1.9, - "learning_rate": 1.4970410320315218e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.0001535542185851558, + "loss": 0.0119, "step": 376640 }, { - "epoch": 1.9, - "learning_rate": 1.4962842627301208e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015355033036878435, + "loss": 0.0127, "step": 376650 }, { - "epoch": 1.9, - "learning_rate": 1.4955274934287198e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001535464421524129, + "loss": 0.012, "step": 376660 }, { - "epoch": 1.9, - "learning_rate": 1.4947707241273188e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.0001535425539360414, + "loss": 0.0129, "step": 376670 }, { - "epoch": 1.9, - "learning_rate": 1.4940139548259178e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015353866571966995, + "loss": 0.0101, "step": 376680 }, { - "epoch": 1.9, - "learning_rate": 1.4932571855245168e-05, - "loss": 0.0069, + "epoch": 0.98, + "learning_rate": 0.0001535347775032985, + "loss": 0.0116, "step": 376690 }, { - "epoch": 1.9, - "learning_rate": 1.4925004162231158e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.00015353088928692703, + "loss": 0.0155, "step": 376700 }, { - "epoch": 1.9, - "learning_rate": 1.4917436469217148e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015352700107055555, + "loss": 0.0125, "step": 376710 }, { - "epoch": 1.9, - "learning_rate": 1.4909868776203134e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001535231128541841, + "loss": 0.0108, "step": 376720 }, { - "epoch": 1.9, - "learning_rate": 1.4902301083189124e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015351922463781266, + "loss": 0.0146, "step": 376730 }, { - "epoch": 1.9, - "learning_rate": 1.4894733390175114e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015351533642144117, + "loss": 0.0108, "step": 376740 }, { - "epoch": 1.9, - "learning_rate": 1.4887165697161104e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015351144820506969, + "loss": 0.011, "step": 376750 }, { - "epoch": 1.9, - "learning_rate": 1.4879598004147096e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015350755998869823, + "loss": 0.0123, "step": 376760 }, { - "epoch": 1.9, - "learning_rate": 1.4872030311133085e-05, - "loss": 0.0076, + "epoch": 0.98, + "learning_rate": 0.0001535036717723268, + "loss": 0.0093, "step": 376770 }, { - "epoch": 1.9, - "learning_rate": 1.4864462618119075e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001534997835559553, + "loss": 0.0158, "step": 376780 }, { - "epoch": 1.9, - "learning_rate": 1.4856894925105065e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015349589533958385, + "loss": 0.0162, "step": 376790 }, { - "epoch": 1.9, - "learning_rate": 1.4849327232091052e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015349200712321237, + "loss": 0.0099, "step": 376800 }, { - "epoch": 1.9, - "learning_rate": 1.4841759539077042e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015348811890684094, + "loss": 0.0122, "step": 376810 }, { - "epoch": 1.9, - "learning_rate": 1.4834191846063032e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015348423069046945, + "loss": 0.0103, "step": 376820 }, { - "epoch": 1.9, - "learning_rate": 1.4826624153049022e-05, - "loss": 0.008, + "epoch": 0.98, + "learning_rate": 0.000153480342474098, + "loss": 0.0084, "step": 376830 }, { - "epoch": 1.9, - "learning_rate": 1.4819056460035011e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001534764542577265, + "loss": 0.0109, "step": 376840 }, { - "epoch": 1.9, - "learning_rate": 1.4811488767021001e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015347256604135507, + "loss": 0.0149, "step": 376850 }, { - "epoch": 1.9, - "learning_rate": 1.4803921074006991e-05, - "loss": 0.0083, + "epoch": 0.98, + "learning_rate": 0.0001534686778249836, + "loss": 0.0115, "step": 376860 }, { - "epoch": 1.9, - "learning_rate": 1.479635338099298e-05, - "loss": 0.0069, + "epoch": 0.98, + "learning_rate": 0.00015346478960861213, + "loss": 0.0099, "step": 376870 }, { - "epoch": 1.9, - "learning_rate": 1.478878568797897e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015346090139224065, + "loss": 0.0134, "step": 376880 }, { - "epoch": 1.9, - "learning_rate": 1.478121799496496e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.0001534570131758692, + "loss": 0.0121, "step": 376890 }, { - "epoch": 1.9, - "learning_rate": 1.477365030195095e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.00015345312495949773, + "loss": 0.0126, "step": 376900 }, { - "epoch": 1.9, - "learning_rate": 1.4766082608936939e-05, - "loss": 0.0079, + "epoch": 0.98, + "learning_rate": 0.00015344923674312627, + "loss": 0.0098, "step": 376910 }, { - "epoch": 1.9, - "learning_rate": 1.4758514915922929e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.00015344534852675478, + "loss": 0.01, "step": 376920 }, { - "epoch": 1.9, - "learning_rate": 1.4750947222908919e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015344146031038333, + "loss": 0.0118, "step": 376930 }, { - "epoch": 1.9, - "learning_rate": 1.4743379529894909e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.0001534375720940119, + "loss": 0.0104, "step": 376940 }, { - "epoch": 1.9, - "learning_rate": 1.4735811836880897e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.0001534336838776404, + "loss": 0.0127, "step": 376950 }, { - "epoch": 1.9, - "learning_rate": 1.4728244143866887e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015342979566126895, + "loss": 0.0136, "step": 376960 }, { - "epoch": 1.9, - "learning_rate": 1.4720676450852877e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015342590744489747, + "loss": 0.0106, "step": 376970 }, { - "epoch": 1.9, - "learning_rate": 1.4713108757838867e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015342201922852603, + "loss": 0.0127, "step": 376980 }, { - "epoch": 1.9, - "learning_rate": 1.4705541064824857e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015341813101215455, + "loss": 0.012, "step": 376990 }, { - "epoch": 1.9, - "learning_rate": 1.4697973371810847e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.0001534142427957831, + "loss": 0.0122, "step": 377000 }, { - "epoch": 1.9, - "eval_cer": 0.914438232831024, - "eval_loss": 0.004278304520994425, - "eval_runtime": 116.1202, - "eval_samples_per_second": 17.224, - "eval_steps_per_second": 4.306, + "epoch": 0.98, + "eval_cer": 0.8817376772465223, + "eval_loss": 0.008020076900720596, + "eval_runtime": 107.5591, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 377000 }, { - "epoch": 1.9, - "learning_rate": 1.4690405678796837e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001534103545794116, + "loss": 0.0136, "step": 377010 }, { - "epoch": 1.9, - "learning_rate": 1.4682837985782826e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.00015340646636304017, + "loss": 0.013, "step": 377020 }, { - "epoch": 1.9, - "learning_rate": 1.4675270292768815e-05, - "loss": 0.0035, + "epoch": 0.98, + "learning_rate": 0.0001534025781466687, + "loss": 0.0139, "step": 377030 }, { - "epoch": 1.9, - "learning_rate": 1.4667702599754805e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.00015339868993029723, + "loss": 0.0122, "step": 377040 }, { - "epoch": 1.9, - "learning_rate": 1.4660134906740795e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015339480171392574, + "loss": 0.0121, "step": 377050 }, { - "epoch": 1.9, - "learning_rate": 1.4652567213726784e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.0001533909134975543, + "loss": 0.0132, "step": 377060 }, { - "epoch": 1.9, - "learning_rate": 1.4644999520712774e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015338702528118283, + "loss": 0.0164, "step": 377070 }, { - "epoch": 1.9, - "learning_rate": 1.4637431827698764e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015338313706481137, + "loss": 0.0148, "step": 377080 }, { - "epoch": 1.9, - "learning_rate": 1.4629864134684754e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015337924884843988, + "loss": 0.0108, "step": 377090 }, { - "epoch": 1.9, - "learning_rate": 1.4622296441670744e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.00015337536063206845, + "loss": 0.0115, "step": 377100 }, { - "epoch": 1.9, - "learning_rate": 1.4614728748656732e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.000153371472415697, + "loss": 0.0153, "step": 377110 }, { - "epoch": 1.9, - "learning_rate": 1.4607161055642722e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001533675841993255, + "loss": 0.0136, "step": 377120 }, { - "epoch": 1.9, - "learning_rate": 1.4599593362628712e-05, - "loss": 0.0084, + "epoch": 0.98, + "learning_rate": 0.00015336369598295405, + "loss": 0.0125, "step": 377130 }, { - "epoch": 1.9, - "learning_rate": 1.4592025669614702e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015335980776658257, + "loss": 0.0153, "step": 377140 }, { - "epoch": 1.9, - "learning_rate": 1.4584457976600692e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015335591955021113, + "loss": 0.0119, "step": 377150 }, { - "epoch": 1.9, - "learning_rate": 1.4576890283586682e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015335203133383965, + "loss": 0.0117, "step": 377160 }, { - "epoch": 1.9, - "learning_rate": 1.4569322590572672e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.0001533481431174682, + "loss": 0.0142, "step": 377170 }, { - "epoch": 1.9, - "learning_rate": 1.4561754897558662e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.0001533442549010967, + "loss": 0.0155, "step": 377180 }, { - "epoch": 1.9, - "learning_rate": 1.455418720454465e-05, - "loss": 0.0083, + "epoch": 0.98, + "learning_rate": 0.00015334036668472527, + "loss": 0.013, "step": 377190 }, { - "epoch": 1.9, - "learning_rate": 1.454661951153064e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.0001533364784683538, + "loss": 0.014, "step": 377200 }, { - "epoch": 1.9, - "learning_rate": 1.453905181851663e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015333259025198233, + "loss": 0.0097, "step": 377210 }, { - "epoch": 1.9, - "learning_rate": 1.453148412550262e-05, - "loss": 0.0081, + "epoch": 0.98, + "learning_rate": 0.00015332870203561084, + "loss": 0.0111, "step": 377220 }, { - "epoch": 1.9, - "learning_rate": 1.452391643248861e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.0001533248138192394, + "loss": 0.0103, "step": 377230 }, { - "epoch": 1.9, - "learning_rate": 1.45163487394746e-05, - "loss": 0.0076, + "epoch": 0.98, + "learning_rate": 0.00015332092560286793, + "loss": 0.0173, "step": 377240 }, { - "epoch": 1.9, - "learning_rate": 1.450878104646059e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.00015331703738649647, + "loss": 0.0107, "step": 377250 }, { - "epoch": 1.9, - "learning_rate": 1.450121335344658e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.00015331314917012498, + "loss": 0.0136, "step": 377260 }, { - "epoch": 1.9, - "learning_rate": 1.4493645660432568e-05, - "loss": 0.0073, + "epoch": 0.98, + "learning_rate": 0.00015330926095375355, + "loss": 0.0142, "step": 377270 }, { - "epoch": 1.9, - "learning_rate": 1.4486077967418557e-05, - "loss": 0.0083, + "epoch": 0.98, + "learning_rate": 0.0001533053727373821, + "loss": 0.0126, "step": 377280 }, { - "epoch": 1.9, - "learning_rate": 1.4478510274404547e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.0001533014845210106, + "loss": 0.0124, "step": 377290 }, { - "epoch": 1.9, - "learning_rate": 1.4470942581390537e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015329759630463912, + "loss": 0.0116, "step": 377300 }, { - "epoch": 1.9, - "learning_rate": 1.4463374888376527e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.0001532937080882677, + "loss": 0.0132, "step": 377310 }, { - "epoch": 1.9, - "learning_rate": 1.4455807195362517e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.00015328981987189623, + "loss": 0.0159, "step": 377320 }, { - "epoch": 1.9, - "learning_rate": 1.4448239502348507e-05, - "loss": 0.0077, + "epoch": 0.98, + "learning_rate": 0.00015328593165552475, + "loss": 0.0113, "step": 377330 }, { - "epoch": 1.9, - "learning_rate": 1.4440671809334497e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.0001532820434391533, + "loss": 0.0164, "step": 377340 }, { - "epoch": 1.9, - "learning_rate": 1.4433104116320485e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.00015327815522278183, + "loss": 0.0129, "step": 377350 }, { - "epoch": 1.9, - "learning_rate": 1.4425536423306475e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015327426700641037, + "loss": 0.0112, "step": 377360 }, { - "epoch": 1.9, - "learning_rate": 1.4417968730292465e-05, - "loss": 0.0038, + "epoch": 0.98, + "learning_rate": 0.0001532703787900389, + "loss": 0.0139, "step": 377370 }, { - "epoch": 1.9, - "learning_rate": 1.4410401037278455e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015326649057366743, + "loss": 0.0149, "step": 377380 }, { - "epoch": 1.9, - "learning_rate": 1.4402833344264445e-05, - "loss": 0.0039, + "epoch": 0.98, + "learning_rate": 0.00015326260235729594, + "loss": 0.0128, "step": 377390 }, { - "epoch": 1.9, - "learning_rate": 1.4395265651250435e-05, - "loss": 0.0038, + "epoch": 0.98, + "learning_rate": 0.0001532587141409245, + "loss": 0.0113, "step": 377400 }, { - "epoch": 1.9, - "learning_rate": 1.4387697958236425e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015325482592455303, + "loss": 0.0165, "step": 377410 }, { - "epoch": 1.9, - "learning_rate": 1.4380130265222413e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.00015325093770818157, + "loss": 0.014, "step": 377420 }, { - "epoch": 1.9, - "learning_rate": 1.4372562572208403e-05, - "loss": 0.0039, + "epoch": 0.98, + "learning_rate": 0.00015324704949181008, + "loss": 0.0112, "step": 377430 }, { - "epoch": 1.9, - "learning_rate": 1.4364994879194393e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015324316127543865, + "loss": 0.011, "step": 377440 }, { - "epoch": 1.9, - "learning_rate": 1.4357427186180383e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.0001532392730590672, + "loss": 0.0126, "step": 377450 }, { - "epoch": 1.9, - "learning_rate": 1.4349859493166372e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.0001532353848426957, + "loss": 0.0112, "step": 377460 }, { - "epoch": 1.9, - "learning_rate": 1.4342291800152362e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015323149662632422, + "loss": 0.0141, "step": 377470 }, { - "epoch": 1.9, - "learning_rate": 1.4334724107138352e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.0001532276084099528, + "loss": 0.0146, "step": 377480 }, { - "epoch": 1.9, - "learning_rate": 1.4327156414124342e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.00015322372019358133, + "loss": 0.0167, "step": 377490 }, { - "epoch": 1.9, - "learning_rate": 1.431958872111033e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015321983197720985, + "loss": 0.0122, "step": 377500 }, { - "epoch": 1.9, - "learning_rate": 1.431202102809632e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.0001532159437608384, + "loss": 0.0103, "step": 377510 }, { - "epoch": 1.9, - "learning_rate": 1.430445333508231e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015321205554446693, + "loss": 0.0164, "step": 377520 }, { - "epoch": 1.9, - "learning_rate": 1.42968856420683e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015320816732809547, + "loss": 0.0119, "step": 377530 }, { - "epoch": 1.9, - "learning_rate": 1.428931794905429e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.000153204279111724, + "loss": 0.0133, "step": 377540 }, { - "epoch": 1.9, - "learning_rate": 1.428175025604028e-05, - "loss": 0.0036, + "epoch": 0.98, + "learning_rate": 0.00015320039089535253, + "loss": 0.0155, "step": 377550 }, { - "epoch": 1.9, - "learning_rate": 1.427418256302627e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.00015319650267898107, + "loss": 0.0158, "step": 377560 }, { - "epoch": 1.9, - "learning_rate": 1.426661487001226e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.0001531926144626096, + "loss": 0.0127, "step": 377570 }, { - "epoch": 1.9, - "learning_rate": 1.4259047176998246e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.00015318872624623813, + "loss": 0.0121, "step": 377580 }, { - "epoch": 1.9, - "learning_rate": 1.4251479483984236e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015318483802986667, + "loss": 0.0123, "step": 377590 }, { - "epoch": 1.91, - "learning_rate": 1.4243911790970228e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015318094981349524, + "loss": 0.0129, "step": 377600 }, { - "epoch": 1.91, - "learning_rate": 1.4236344097956218e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015317706159712375, + "loss": 0.0137, "step": 377610 }, { - "epoch": 1.91, - "learning_rate": 1.4228776404942208e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015317317338075227, + "loss": 0.0115, "step": 377620 }, { - "epoch": 1.91, - "learning_rate": 1.4221208711928198e-05, - "loss": 0.0073, + "epoch": 0.98, + "learning_rate": 0.0001531692851643808, + "loss": 0.0162, "step": 377630 }, { - "epoch": 1.91, - "learning_rate": 1.4213641018914188e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015316539694800932, + "loss": 0.012, "step": 377640 }, { - "epoch": 1.91, - "learning_rate": 1.4206073325900177e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.0001531615087316379, + "loss": 0.016, "step": 377650 }, { - "epoch": 1.91, - "learning_rate": 1.4198505632886164e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015315762051526643, + "loss": 0.0138, "step": 377660 }, { - "epoch": 1.91, - "learning_rate": 1.4190937939872154e-05, - "loss": 0.0076, + "epoch": 0.98, + "learning_rate": 0.00015315373229889495, + "loss": 0.0119, "step": 377670 }, { - "epoch": 1.91, - "learning_rate": 1.4183370246858144e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.0001531498440825235, + "loss": 0.0092, "step": 377680 }, { - "epoch": 1.91, - "learning_rate": 1.4175802553844134e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015314595586615203, + "loss": 0.0142, "step": 377690 }, { - "epoch": 1.91, - "learning_rate": 1.4168234860830124e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015314206764978057, + "loss": 0.0119, "step": 377700 }, { - "epoch": 1.91, - "learning_rate": 1.4160667167816114e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015313817943340909, + "loss": 0.0115, "step": 377710 }, { - "epoch": 1.91, - "learning_rate": 1.4153099474802103e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015313429121703763, + "loss": 0.0131, "step": 377720 }, { - "epoch": 1.91, - "learning_rate": 1.4145531781788095e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015313040300066617, + "loss": 0.0123, "step": 377730 }, { - "epoch": 1.91, - "learning_rate": 1.4137964088774082e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.0001531265147842947, + "loss": 0.015, "step": 377740 }, { - "epoch": 1.91, - "learning_rate": 1.4130396395760071e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.00015312262656792323, + "loss": 0.0177, "step": 377750 }, { - "epoch": 1.91, - "learning_rate": 1.4122828702746061e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015311873835155177, + "loss": 0.0122, "step": 377760 }, { - "epoch": 1.91, - "learning_rate": 1.4115261009732051e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015311485013518034, + "loss": 0.0168, "step": 377770 }, { - "epoch": 1.91, - "learning_rate": 1.4107693316718041e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015311096191880885, + "loss": 0.0161, "step": 377780 }, { - "epoch": 1.91, - "learning_rate": 1.4100125623704031e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015310707370243736, + "loss": 0.0113, "step": 377790 }, { - "epoch": 1.91, - "learning_rate": 1.4092557930690021e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.0001531031854860659, + "loss": 0.0118, "step": 377800 }, { - "epoch": 1.91, - "learning_rate": 1.4084990237676011e-05, - "loss": 0.0038, + "epoch": 0.98, + "learning_rate": 0.00015309929726969448, + "loss": 0.0152, "step": 377810 }, { - "epoch": 1.91, - "learning_rate": 1.4077422544662e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.000153095409053323, + "loss": 0.0119, "step": 377820 }, { - "epoch": 1.91, - "learning_rate": 1.4069854851647989e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015309152083695153, + "loss": 0.0119, "step": 377830 }, { - "epoch": 1.91, - "learning_rate": 1.4062287158633979e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015308763262058005, + "loss": 0.0152, "step": 377840 }, { - "epoch": 1.91, - "learning_rate": 1.4054719465619969e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.00015308374440420861, + "loss": 0.0141, "step": 377850 }, { - "epoch": 1.91, - "learning_rate": 1.4047151772605959e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015307985618783713, + "loss": 0.0201, "step": 377860 }, { - "epoch": 1.91, - "learning_rate": 1.4039584079591949e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015307596797146567, + "loss": 0.0134, "step": 377870 }, { - "epoch": 1.91, - "learning_rate": 1.4032016386577939e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015307207975509419, + "loss": 0.0149, "step": 377880 }, { - "epoch": 1.91, - "learning_rate": 1.4024448693563929e-05, - "loss": 0.0071, + "epoch": 0.98, + "learning_rate": 0.00015306819153872273, + "loss": 0.0148, "step": 377890 }, { - "epoch": 1.91, - "learning_rate": 1.4016881000549917e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015306430332235127, + "loss": 0.0097, "step": 377900 }, { - "epoch": 1.91, - "learning_rate": 1.4009313307535907e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.0001530604151059798, + "loss": 0.017, "step": 377910 }, { - "epoch": 1.91, - "learning_rate": 1.4001745614521897e-05, - "loss": 0.0038, + "epoch": 0.98, + "learning_rate": 0.00015305652688960832, + "loss": 0.0128, "step": 377920 }, { - "epoch": 1.91, - "learning_rate": 1.3994177921507887e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015305263867323687, + "loss": 0.0106, "step": 377930 }, { - "epoch": 1.91, - "learning_rate": 1.3986610228493876e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001530487504568654, + "loss": 0.015, "step": 377940 }, { - "epoch": 1.91, - "learning_rate": 1.3979042535479866e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015304486224049395, + "loss": 0.0151, "step": 377950 }, { - "epoch": 1.91, - "learning_rate": 1.3971474842465856e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.00015304097402412246, + "loss": 0.0135, "step": 377960 }, { - "epoch": 1.91, - "learning_rate": 1.3963907149451844e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.000153037085807751, + "loss": 0.0145, "step": 377970 }, { - "epoch": 1.91, - "learning_rate": 1.3956339456437834e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.00015303319759137957, + "loss": 0.0121, "step": 377980 }, { - "epoch": 1.91, - "learning_rate": 1.3948771763423824e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.0001530293093750081, + "loss": 0.0123, "step": 377990 }, { - "epoch": 1.91, - "learning_rate": 1.3941204070409814e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015302542115863663, + "loss": 0.0192, "step": 378000 }, { - "epoch": 1.91, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004249492194503546, - "eval_runtime": 116.3497, - "eval_samples_per_second": 17.19, - "eval_steps_per_second": 4.297, + "epoch": 0.98, + "eval_cer": 0.8817712685329425, + "eval_loss": 0.008189625106751919, + "eval_runtime": 107.5946, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 378000 }, { - "epoch": 1.91, - "learning_rate": 1.3933636377395804e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.00015302153294226515, + "loss": 0.0133, "step": 378010 }, { - "epoch": 1.91, - "learning_rate": 1.3926068684381794e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.00015301764472589371, + "loss": 0.0129, "step": 378020 }, { - "epoch": 1.91, - "learning_rate": 1.3918500991367784e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015301375650952223, + "loss": 0.0125, "step": 378030 }, { - "epoch": 1.91, - "learning_rate": 1.3910933298353774e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015300986829315077, + "loss": 0.0116, "step": 378040 }, { - "epoch": 1.91, - "learning_rate": 1.3903365605339762e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015300598007677928, + "loss": 0.0158, "step": 378050 }, { - "epoch": 1.91, - "learning_rate": 1.3895797912325752e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015300209186040785, + "loss": 0.0118, "step": 378060 }, { - "epoch": 1.91, - "learning_rate": 1.3888230219311742e-05, - "loss": 0.0091, + "epoch": 0.98, + "learning_rate": 0.00015299820364403637, + "loss": 0.011, "step": 378070 }, { - "epoch": 1.91, - "learning_rate": 1.3880662526297732e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001529943154276649, + "loss": 0.0133, "step": 378080 }, { - "epoch": 1.91, - "learning_rate": 1.3873094833283722e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015299042721129342, + "loss": 0.0109, "step": 378090 }, { - "epoch": 1.91, - "learning_rate": 1.3865527140269712e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.000152986538994922, + "loss": 0.0133, "step": 378100 }, { - "epoch": 1.91, - "learning_rate": 1.3857959447255702e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.0001529826507785505, + "loss": 0.0132, "step": 378110 }, { - "epoch": 1.91, - "learning_rate": 1.3850391754241691e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015297876256217905, + "loss": 0.009, "step": 378120 }, { - "epoch": 1.91, - "learning_rate": 1.384282406122768e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015297487434580756, + "loss": 0.0114, "step": 378130 }, { - "epoch": 1.91, - "learning_rate": 1.383525636821367e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.0001529709861294361, + "loss": 0.0119, "step": 378140 }, { - "epoch": 1.91, - "learning_rate": 1.382768867519966e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015296709791306467, + "loss": 0.0121, "step": 378150 }, { - "epoch": 1.91, - "learning_rate": 1.382012098218565e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.0001529632096966932, + "loss": 0.0115, "step": 378160 }, { - "epoch": 1.91, - "learning_rate": 1.381255328917164e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015295932148032173, + "loss": 0.0106, "step": 378170 }, { - "epoch": 1.91, - "learning_rate": 1.380498559615763e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015295543326395024, + "loss": 0.0128, "step": 378180 }, { - "epoch": 1.91, - "learning_rate": 1.379741790314362e-05, - "loss": 0.0079, + "epoch": 0.98, + "learning_rate": 0.00015295154504757881, + "loss": 0.013, "step": 378190 }, { - "epoch": 1.91, - "learning_rate": 1.3789850210129609e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015294765683120733, + "loss": 0.0101, "step": 378200 }, { - "epoch": 1.91, - "learning_rate": 1.3782282517115597e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015294376861483587, + "loss": 0.0101, "step": 378210 }, { - "epoch": 1.91, - "learning_rate": 1.3774714824101587e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015293988039846438, + "loss": 0.0133, "step": 378220 }, { - "epoch": 1.91, - "learning_rate": 1.3767147131087577e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015293599218209295, + "loss": 0.0182, "step": 378230 }, { - "epoch": 1.91, - "learning_rate": 1.3759579438073567e-05, - "loss": 0.0072, + "epoch": 0.98, + "learning_rate": 0.00015293210396572147, + "loss": 0.0135, "step": 378240 }, { - "epoch": 1.91, - "learning_rate": 1.3752011745059557e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.00015292821574935, + "loss": 0.0099, "step": 378250 }, { - "epoch": 1.91, - "learning_rate": 1.3744444052045547e-05, - "loss": 0.0071, + "epoch": 0.98, + "learning_rate": 0.00015292432753297852, + "loss": 0.0126, "step": 378260 }, { - "epoch": 1.91, - "learning_rate": 1.3736876359031537e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.0001529204393166071, + "loss": 0.0152, "step": 378270 }, { - "epoch": 1.91, - "learning_rate": 1.3729308666017527e-05, - "loss": 0.0069, + "epoch": 0.98, + "learning_rate": 0.0001529165511002356, + "loss": 0.0152, "step": 378280 }, { - "epoch": 1.91, - "learning_rate": 1.3721740973003515e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015291266288386415, + "loss": 0.0116, "step": 378290 }, { - "epoch": 1.91, - "learning_rate": 1.3714173279989505e-05, - "loss": 0.0077, + "epoch": 0.98, + "learning_rate": 0.00015290877466749266, + "loss": 0.0096, "step": 378300 }, { - "epoch": 1.91, - "learning_rate": 1.3706605586975495e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015290488645112123, + "loss": 0.0143, "step": 378310 }, { - "epoch": 1.91, - "learning_rate": 1.3699037893961485e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015290099823474977, + "loss": 0.0135, "step": 378320 }, { - "epoch": 1.91, - "learning_rate": 1.3691470200947475e-05, - "loss": 0.0078, + "epoch": 0.98, + "learning_rate": 0.0001528971100183783, + "loss": 0.0113, "step": 378330 }, { - "epoch": 1.91, - "learning_rate": 1.3683902507933464e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001528932218020068, + "loss": 0.0145, "step": 378340 }, { - "epoch": 1.91, - "learning_rate": 1.3676334814919454e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015288933358563537, + "loss": 0.0112, "step": 378350 }, { - "epoch": 1.91, - "learning_rate": 1.3668767121905444e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.0001528854453692639, + "loss": 0.0123, "step": 378360 }, { - "epoch": 1.91, - "learning_rate": 1.3661199428891433e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015288155715289243, + "loss": 0.0118, "step": 378370 }, { - "epoch": 1.91, - "learning_rate": 1.3653631735877422e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015287766893652097, + "loss": 0.0152, "step": 378380 }, { - "epoch": 1.91, - "learning_rate": 1.3646064042863412e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015287378072014948, + "loss": 0.0138, "step": 378390 }, { - "epoch": 1.91, - "learning_rate": 1.3638496349849402e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015286989250377805, + "loss": 0.0114, "step": 378400 }, { - "epoch": 1.91, - "learning_rate": 1.3630928656835392e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015286600428740657, + "loss": 0.0131, "step": 378410 }, { - "epoch": 1.91, - "learning_rate": 1.3623360963821382e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001528621160710351, + "loss": 0.014, "step": 378420 }, { - "epoch": 1.91, - "learning_rate": 1.3615793270807372e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015285822785466362, + "loss": 0.0155, "step": 378430 }, { - "epoch": 1.91, - "learning_rate": 1.3608225577793362e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001528543396382922, + "loss": 0.0135, "step": 378440 }, { - "epoch": 1.91, - "learning_rate": 1.360065788477935e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.0001528504514219207, + "loss": 0.0117, "step": 378450 }, { - "epoch": 1.91, - "learning_rate": 1.359309019176534e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015284656320554925, + "loss": 0.0115, "step": 378460 }, { - "epoch": 1.91, - "learning_rate": 1.358552249875133e-05, - "loss": 0.0037, + "epoch": 0.98, + "learning_rate": 0.00015284267498917776, + "loss": 0.0112, "step": 378470 }, { - "epoch": 1.91, - "learning_rate": 1.357795480573732e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015283878677280633, + "loss": 0.014, "step": 378480 }, { - "epoch": 1.91, - "learning_rate": 1.357038711272331e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.00015283489855643485, + "loss": 0.0117, "step": 378490 }, { - "epoch": 1.91, - "learning_rate": 1.35628194197093e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.0001528310103400634, + "loss": 0.0149, "step": 378500 }, { - "epoch": 1.91, - "learning_rate": 1.355525172669529e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001528271221236919, + "loss": 0.0124, "step": 378510 }, { - "epoch": 1.91, - "learning_rate": 1.3547684033681276e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015282323390732047, + "loss": 0.0122, "step": 378520 }, { - "epoch": 1.91, - "learning_rate": 1.3540116340667266e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.000152819345690949, + "loss": 0.0106, "step": 378530 }, { - "epoch": 1.91, - "learning_rate": 1.3532548647653256e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.00015281545747457753, + "loss": 0.0119, "step": 378540 }, { - "epoch": 1.91, - "learning_rate": 1.3524980954639246e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015281156925820607, + "loss": 0.0136, "step": 378550 }, { - "epoch": 1.91, - "learning_rate": 1.3517413261625236e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.0001528076810418346, + "loss": 0.0128, "step": 378560 }, { - "epoch": 1.91, - "learning_rate": 1.3509845568611227e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.00015280379282546315, + "loss": 0.0156, "step": 378570 }, { - "epoch": 1.91, - "learning_rate": 1.3502277875597217e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015279990460909167, + "loss": 0.0131, "step": 378580 }, { - "epoch": 1.91, - "learning_rate": 1.3494710182583207e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.0001527960163927202, + "loss": 0.0132, "step": 378590 }, { - "epoch": 1.91, - "learning_rate": 1.3487142489569194e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015279212817634875, + "loss": 0.0234, "step": 378600 }, { - "epoch": 1.91, - "learning_rate": 1.3479574796555184e-05, - "loss": 0.0071, + "epoch": 0.98, + "learning_rate": 0.0001527882399599773, + "loss": 0.0157, "step": 378610 }, { - "epoch": 1.91, - "learning_rate": 1.3472007103541174e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001527843517436058, + "loss": 0.0112, "step": 378620 }, { - "epoch": 1.91, - "learning_rate": 1.3464439410527163e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015278046352723435, + "loss": 0.0135, "step": 378630 }, { - "epoch": 1.91, - "learning_rate": 1.3456871717513153e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015277657531086286, + "loss": 0.0121, "step": 378640 }, { - "epoch": 1.91, - "learning_rate": 1.3449304024499143e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015277268709449143, + "loss": 0.0107, "step": 378650 }, { - "epoch": 1.91, - "learning_rate": 1.3441736331485133e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015276879887811995, + "loss": 0.0113, "step": 378660 }, { - "epoch": 1.91, - "learning_rate": 1.3434168638471123e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001527649106617485, + "loss": 0.0127, "step": 378670 }, { - "epoch": 1.91, - "learning_rate": 1.3426600945457111e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.000152761022445377, + "loss": 0.01, "step": 378680 }, { - "epoch": 1.91, - "learning_rate": 1.3419033252443101e-05, - "loss": 0.008, + "epoch": 0.98, + "learning_rate": 0.00015275713422900557, + "loss": 0.0106, "step": 378690 }, { - "epoch": 1.91, - "learning_rate": 1.3411465559429091e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.0001527532460126341, + "loss": 0.0124, "step": 378700 }, { - "epoch": 1.91, - "learning_rate": 1.3403897866415081e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015274935779626263, + "loss": 0.009, "step": 378710 }, { - "epoch": 1.91, - "learning_rate": 1.3396330173401071e-05, - "loss": 0.0079, + "epoch": 0.98, + "learning_rate": 0.00015274546957989117, + "loss": 0.0128, "step": 378720 }, { - "epoch": 1.91, - "learning_rate": 1.3388762480387061e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.0001527415813635197, + "loss": 0.012, "step": 378730 }, { - "epoch": 1.91, - "learning_rate": 1.338119478737305e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015273769314714825, + "loss": 0.0131, "step": 378740 }, { - "epoch": 1.91, - "learning_rate": 1.337362709435904e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015273380493077677, + "loss": 0.0093, "step": 378750 }, { - "epoch": 1.91, - "learning_rate": 1.3366059401345029e-05, - "loss": 0.0071, + "epoch": 0.98, + "learning_rate": 0.0001527299167144053, + "loss": 0.0124, "step": 378760 }, { - "epoch": 1.91, - "learning_rate": 1.3358491708331019e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015272602849803385, + "loss": 0.0117, "step": 378770 }, { - "epoch": 1.91, - "learning_rate": 1.3350924015317009e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.0001527221402816624, + "loss": 0.012, "step": 378780 }, { - "epoch": 1.91, - "learning_rate": 1.3343356322302999e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.0001527182520652909, + "loss": 0.0092, "step": 378790 }, { - "epoch": 1.91, - "learning_rate": 1.3335788629288989e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.00015271436384891945, + "loss": 0.0117, "step": 378800 }, { - "epoch": 1.91, - "learning_rate": 1.3328220936274979e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.000152710475632548, + "loss": 0.0111, "step": 378810 }, { - "epoch": 1.91, - "learning_rate": 1.3320653243260968e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015270658741617653, + "loss": 0.0131, "step": 378820 }, { - "epoch": 1.91, - "learning_rate": 1.3313085550246958e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015270269919980504, + "loss": 0.0147, "step": 378830 }, { - "epoch": 1.91, - "learning_rate": 1.3305517857232947e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015269881098343359, + "loss": 0.0123, "step": 378840 }, { - "epoch": 1.91, - "learning_rate": 1.3297950164218936e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015269492276706216, + "loss": 0.0133, "step": 378850 }, { - "epoch": 1.91, - "learning_rate": 1.3290382471204926e-05, - "loss": 0.0037, + "epoch": 0.98, + "learning_rate": 0.00015269103455069067, + "loss": 0.0118, "step": 378860 }, { - "epoch": 1.91, - "learning_rate": 1.3282814778190916e-05, - "loss": 0.0055, + "epoch": 0.98, + "learning_rate": 0.0001526871463343192, + "loss": 0.0107, "step": 378870 }, { - "epoch": 1.91, - "learning_rate": 1.3275247085176906e-05, - "loss": 0.0085, + "epoch": 0.98, + "learning_rate": 0.00015268325811794773, + "loss": 0.0139, "step": 378880 }, { - "epoch": 1.91, - "learning_rate": 1.3267679392162896e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015267936990157624, + "loss": 0.0118, "step": 378890 }, { - "epoch": 1.91, - "learning_rate": 1.3260111699148886e-05, - "loss": 0.0074, + "epoch": 0.98, + "learning_rate": 0.0001526754816852048, + "loss": 0.0159, "step": 378900 }, { - "epoch": 1.91, - "learning_rate": 1.3252544006134876e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015267159346883335, + "loss": 0.0155, "step": 378910 }, { - "epoch": 1.91, - "learning_rate": 1.3244976313120864e-05, - "loss": 0.007, + "epoch": 0.98, + "learning_rate": 0.00015266770525246187, + "loss": 0.0126, "step": 378920 }, { - "epoch": 1.91, - "learning_rate": 1.3237408620106854e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.0001526638170360904, + "loss": 0.0132, "step": 378930 }, { - "epoch": 1.91, - "learning_rate": 1.3229840927092844e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015265992881971895, + "loss": 0.0153, "step": 378940 }, { - "epoch": 1.91, - "learning_rate": 1.3222273234078834e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001526560406033475, + "loss": 0.0165, "step": 378950 }, { - "epoch": 1.91, - "learning_rate": 1.3214705541064824e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.000152652152386976, + "loss": 0.0099, "step": 378960 }, { - "epoch": 1.91, - "learning_rate": 1.3207137848050814e-05, - "loss": 0.005, - "step": 378970 + "epoch": 0.98, + "learning_rate": 0.00015264826417060455, + "loss": 0.0103, + "step": 378970 }, { - "epoch": 1.91, - "learning_rate": 1.3199570155036804e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.0001526443759542331, + "loss": 0.0103, "step": 378980 }, { - "epoch": 1.91, - "learning_rate": 1.3192002462022794e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015264048773786163, + "loss": 0.0134, "step": 378990 }, { - "epoch": 1.91, - "learning_rate": 1.3184434769008782e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015263659952149014, + "loss": 0.0152, "step": 379000 }, { - "epoch": 1.91, - "eval_cer": 0.9144149433240143, - "eval_loss": 0.00423853425309062, - "eval_runtime": 116.3136, - "eval_samples_per_second": 17.195, - "eval_steps_per_second": 4.299, + "epoch": 0.98, + "eval_cer": 0.8817432757942589, + "eval_loss": 0.008436217904090881, + "eval_runtime": 107.5614, + "eval_samples_per_second": 18.594, + "eval_steps_per_second": 4.649, "step": 379000 }, { - "epoch": 1.91, - "learning_rate": 1.3176867075994772e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.00015263271130511869, + "loss": 0.0142, "step": 379010 }, { - "epoch": 1.91, - "learning_rate": 1.3169299382980762e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015262882308874725, + "loss": 0.0159, "step": 379020 }, { - "epoch": 1.91, - "learning_rate": 1.3161731689966752e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015262493487237577, + "loss": 0.0169, "step": 379030 }, { - "epoch": 1.91, - "learning_rate": 1.3154163996952741e-05, - "loss": 0.0069, + "epoch": 0.98, + "learning_rate": 0.0001526210466560043, + "loss": 0.0121, "step": 379040 }, { - "epoch": 1.91, - "learning_rate": 1.3146596303938731e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015261715843963283, + "loss": 0.0127, "step": 379050 }, { - "epoch": 1.91, - "learning_rate": 1.3139028610924721e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001526132702232614, + "loss": 0.0139, "step": 379060 }, { - "epoch": 1.91, - "learning_rate": 1.313146091791071e-05, - "loss": 0.0038, + "epoch": 0.98, + "learning_rate": 0.0001526093820068899, + "loss": 0.0124, "step": 379070 }, { - "epoch": 1.91, - "learning_rate": 1.31238932248967e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.00015260549379051845, + "loss": 0.0136, "step": 379080 }, { - "epoch": 1.91, - "learning_rate": 1.311632553188269e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.00015260160557414696, + "loss": 0.0137, "step": 379090 }, { - "epoch": 1.91, - "learning_rate": 1.310875783886868e-05, - "loss": 0.0079, + "epoch": 0.98, + "learning_rate": 0.00015259771735777553, + "loss": 0.013, "step": 379100 }, { - "epoch": 1.91, - "learning_rate": 1.3101190145854669e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.00015259382914140405, + "loss": 0.0141, "step": 379110 }, { - "epoch": 1.91, - "learning_rate": 1.3093622452840659e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.0001525899409250326, + "loss": 0.011, "step": 379120 }, { - "epoch": 1.91, - "learning_rate": 1.3086054759826649e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001525860527086611, + "loss": 0.0134, "step": 379130 }, { - "epoch": 1.91, - "learning_rate": 1.3078487066812639e-05, - "loss": 0.0039, + "epoch": 0.98, + "learning_rate": 0.00015258216449228965, + "loss": 0.0133, "step": 379140 }, { - "epoch": 1.91, - "learning_rate": 1.3070919373798627e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.0001525782762759182, + "loss": 0.0157, "step": 379150 }, { - "epoch": 1.91, - "learning_rate": 1.3063351680784617e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015257438805954673, + "loss": 0.0118, "step": 379160 }, { - "epoch": 1.91, - "learning_rate": 1.3055783987770607e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015257049984317524, + "loss": 0.0135, "step": 379170 }, { - "epoch": 1.91, - "learning_rate": 1.3048216294756597e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015256661162680379, + "loss": 0.0144, "step": 379180 }, { - "epoch": 1.91, - "learning_rate": 1.3040648601742587e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015256272341043235, + "loss": 0.0123, "step": 379190 }, { - "epoch": 1.91, - "learning_rate": 1.3033080908728577e-05, - "loss": 0.0042, + "epoch": 0.98, + "learning_rate": 0.00015255883519406087, + "loss": 0.0118, "step": 379200 }, { - "epoch": 1.91, - "learning_rate": 1.3025513215714567e-05, - "loss": 0.0041, + "epoch": 0.98, + "learning_rate": 0.00015255494697768938, + "loss": 0.0103, "step": 379210 }, { - "epoch": 1.91, - "learning_rate": 1.3017945522700556e-05, - "loss": 0.0074, + "epoch": 0.98, + "learning_rate": 0.00015255105876131792, + "loss": 0.0136, "step": 379220 }, { - "epoch": 1.91, - "learning_rate": 1.3010377829686545e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.0001525471705449465, + "loss": 0.0159, "step": 379230 }, { - "epoch": 1.91, - "learning_rate": 1.3002810136672535e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.000152543282328575, + "loss": 0.0114, "step": 379240 }, { - "epoch": 1.91, - "learning_rate": 1.2995242443658525e-05, - "loss": 0.0044, + "epoch": 0.98, + "learning_rate": 0.00015253939411220355, + "loss": 0.0131, "step": 379250 }, { - "epoch": 1.91, - "learning_rate": 1.2987674750644514e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015253550589583206, + "loss": 0.0119, "step": 379260 }, { - "epoch": 1.91, - "learning_rate": 1.2980107057630504e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015253161767946063, + "loss": 0.0119, "step": 379270 }, { - "epoch": 1.91, - "learning_rate": 1.2972539364616494e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015252772946308915, + "loss": 0.012, "step": 379280 }, { - "epoch": 1.91, - "learning_rate": 1.2964971671602484e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001525238412467177, + "loss": 0.0116, "step": 379290 }, { - "epoch": 1.91, - "learning_rate": 1.2957403978588474e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.0001525199530303462, + "loss": 0.0136, "step": 379300 }, { - "epoch": 1.91, - "learning_rate": 1.2949836285574462e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015251606481397477, + "loss": 0.0107, "step": 379310 }, { - "epoch": 1.91, - "learning_rate": 1.2942268592560452e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.0001525121765976033, + "loss": 0.0143, "step": 379320 }, { - "epoch": 1.91, - "learning_rate": 1.2934700899546442e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.00015250828838123183, + "loss": 0.0122, "step": 379330 }, { - "epoch": 1.91, - "learning_rate": 1.2927133206532432e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015250440016486034, + "loss": 0.0172, "step": 379340 }, { - "epoch": 1.91, - "learning_rate": 1.2919565513518422e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.0001525005119484889, + "loss": 0.0158, "step": 379350 }, { - "epoch": 1.91, - "learning_rate": 1.2911997820504412e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015249662373211745, + "loss": 0.0136, "step": 379360 }, { - "epoch": 1.91, - "learning_rate": 1.2904430127490402e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015249273551574597, + "loss": 0.0141, "step": 379370 }, { - "epoch": 1.91, - "learning_rate": 1.2896862434476392e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015248884729937448, + "loss": 0.0129, "step": 379380 }, { - "epoch": 1.91, - "learning_rate": 1.2889294741462378e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.00015248495908300302, + "loss": 0.0153, "step": 379390 }, { - "epoch": 1.91, - "learning_rate": 1.2881727048448368e-05, - "loss": 0.0068, + "epoch": 0.98, + "learning_rate": 0.0001524810708666316, + "loss": 0.012, "step": 379400 }, { - "epoch": 1.91, - "learning_rate": 1.287415935543436e-05, - "loss": 0.008, + "epoch": 0.98, + "learning_rate": 0.0001524771826502601, + "loss": 0.0138, "step": 379410 }, { - "epoch": 1.91, - "learning_rate": 1.286659166242035e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.00015247329443388865, + "loss": 0.0127, "step": 379420 }, { - "epoch": 1.91, - "learning_rate": 1.285902396940634e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015246940621751716, + "loss": 0.0124, "step": 379430 }, { - "epoch": 1.91, - "learning_rate": 1.285145627639233e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015246551800114573, + "loss": 0.0133, "step": 379440 }, { - "epoch": 1.91, - "learning_rate": 1.284388858337832e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015246162978477425, + "loss": 0.0141, "step": 379450 }, { - "epoch": 1.91, - "learning_rate": 1.283632089036431e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.0001524577415684028, + "loss": 0.0106, "step": 379460 }, { - "epoch": 1.91, - "learning_rate": 1.2828753197350296e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.0001524538533520313, + "loss": 0.0176, "step": 379470 }, { - "epoch": 1.91, - "learning_rate": 1.2821185504336286e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015244996513565987, + "loss": 0.0124, "step": 379480 }, { - "epoch": 1.91, - "learning_rate": 1.2813617811322276e-05, - "loss": 0.0056, + "epoch": 0.98, + "learning_rate": 0.00015244607691928839, + "loss": 0.0117, "step": 379490 }, { - "epoch": 1.91, - "learning_rate": 1.2806050118308266e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015244218870291693, + "loss": 0.0177, "step": 379500 }, { - "epoch": 1.91, - "learning_rate": 1.2798482425294255e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015243830048654544, + "loss": 0.0122, "step": 379510 }, { - "epoch": 1.91, - "learning_rate": 1.2790914732280245e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.000152434412270174, + "loss": 0.0128, "step": 379520 }, { - "epoch": 1.91, - "learning_rate": 1.2783347039266235e-05, - "loss": 0.005, + "epoch": 0.98, + "learning_rate": 0.00015243052405380253, + "loss": 0.0124, "step": 379530 }, { - "epoch": 1.91, - "learning_rate": 1.2775779346252227e-05, - "loss": 0.0083, + "epoch": 0.98, + "learning_rate": 0.00015242663583743107, + "loss": 0.0531, "step": 379540 }, { - "epoch": 1.91, - "learning_rate": 1.2768211653238213e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.00015242274762105958, + "loss": 0.011, "step": 379550 }, { - "epoch": 1.91, - "learning_rate": 1.2760643960224203e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015241885940468815, + "loss": 0.0169, "step": 379560 }, { - "epoch": 1.91, - "learning_rate": 1.2753076267210193e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001524149711883167, + "loss": 0.0119, "step": 379570 }, { - "epoch": 1.92, - "learning_rate": 1.2745508574196183e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.0001524110829719452, + "loss": 0.0111, "step": 379580 }, { - "epoch": 1.92, - "learning_rate": 1.2737940881182173e-05, - "loss": 0.0065, + "epoch": 0.98, + "learning_rate": 0.00015240719475557375, + "loss": 0.0139, "step": 379590 }, { - "epoch": 1.92, - "learning_rate": 1.2730373188168163e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001524033065392023, + "loss": 0.0128, "step": 379600 }, { - "epoch": 1.92, - "learning_rate": 1.2722805495154153e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015239941832283083, + "loss": 0.0119, "step": 379610 }, { - "epoch": 1.92, - "learning_rate": 1.2715237802140141e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015239553010645935, + "loss": 0.012, "step": 379620 }, { - "epoch": 1.92, - "learning_rate": 1.2707670109126131e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.0001523916418900879, + "loss": 0.0178, "step": 379630 }, { - "epoch": 1.92, - "learning_rate": 1.2700102416112121e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.0001523877536737164, + "loss": 0.0135, "step": 379640 }, { - "epoch": 1.92, - "learning_rate": 1.2692534723098111e-05, - "loss": 0.0046, + "epoch": 0.98, + "learning_rate": 0.00015238386545734497, + "loss": 0.0147, "step": 379650 }, { - "epoch": 1.92, - "learning_rate": 1.26849670300841e-05, - "loss": 0.004, + "epoch": 0.98, + "learning_rate": 0.00015237997724097349, + "loss": 0.0127, "step": 379660 }, { - "epoch": 1.92, - "learning_rate": 1.267739933707009e-05, - "loss": 0.0048, + "epoch": 0.98, + "learning_rate": 0.00015237608902460203, + "loss": 0.0166, "step": 379670 }, { - "epoch": 1.92, - "learning_rate": 1.266983164405608e-05, - "loss": 0.0051, + "epoch": 0.98, + "learning_rate": 0.00015237220080823054, + "loss": 0.0101, "step": 379680 }, { - "epoch": 1.92, - "learning_rate": 1.266226395104207e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001523683125918591, + "loss": 0.0114, "step": 379690 }, { - "epoch": 1.92, - "learning_rate": 1.2654696258028059e-05, - "loss": 0.0077, + "epoch": 0.98, + "learning_rate": 0.00015236442437548763, + "loss": 0.018, "step": 379700 }, { - "epoch": 1.92, - "learning_rate": 1.2647128565014049e-05, - "loss": 0.0076, + "epoch": 0.98, + "learning_rate": 0.00015236053615911617, + "loss": 0.0195, "step": 379710 }, { - "epoch": 1.92, - "learning_rate": 1.2639560872000039e-05, - "loss": 0.0045, + "epoch": 0.98, + "learning_rate": 0.00015235664794274468, + "loss": 0.0137, "step": 379720 }, { - "epoch": 1.92, - "learning_rate": 1.2631993178986028e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015235275972637325, + "loss": 0.0106, "step": 379730 }, { - "epoch": 1.92, - "learning_rate": 1.2624425485972018e-05, - "loss": 0.006, + "epoch": 0.98, + "learning_rate": 0.0001523488715100018, + "loss": 0.0117, "step": 379740 }, { - "epoch": 1.92, - "learning_rate": 1.2616857792958008e-05, - "loss": 0.0077, + "epoch": 0.98, + "learning_rate": 0.0001523449832936303, + "loss": 0.0154, "step": 379750 }, { - "epoch": 1.92, - "learning_rate": 1.2609290099943998e-05, - "loss": 0.0067, + "epoch": 0.98, + "learning_rate": 0.00015234109507725885, + "loss": 0.0145, "step": 379760 }, { - "epoch": 1.92, - "learning_rate": 1.2601722406929988e-05, - "loss": 0.0066, + "epoch": 0.98, + "learning_rate": 0.0001523372068608874, + "loss": 0.0129, "step": 379770 }, { - "epoch": 1.92, - "learning_rate": 1.2594154713915976e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.00015233331864451593, + "loss": 0.0152, "step": 379780 }, { - "epoch": 1.92, - "learning_rate": 1.2586587020901966e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015232943042814445, + "loss": 0.015, "step": 379790 }, { - "epoch": 1.92, - "learning_rate": 1.2579019327887956e-05, - "loss": 0.0064, + "epoch": 0.98, + "learning_rate": 0.000152325542211773, + "loss": 0.0106, "step": 379800 }, { - "epoch": 1.92, - "learning_rate": 1.2571451634873946e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015232165399540153, + "loss": 0.0131, "step": 379810 }, { - "epoch": 1.92, - "learning_rate": 1.2563883941859936e-05, - "loss": 0.0072, + "epoch": 0.98, + "learning_rate": 0.00015231776577903007, + "loss": 0.0174, "step": 379820 }, { - "epoch": 1.92, - "learning_rate": 1.2556316248845926e-05, - "loss": 0.0061, + "epoch": 0.98, + "learning_rate": 0.00015231387756265859, + "loss": 0.0095, "step": 379830 }, { - "epoch": 1.92, - "learning_rate": 1.2548748555831916e-05, - "loss": 0.0057, + "epoch": 0.98, + "learning_rate": 0.00015230998934628713, + "loss": 0.012, "step": 379840 }, { - "epoch": 1.92, - "learning_rate": 1.2541180862817906e-05, - "loss": 0.0062, + "epoch": 0.98, + "learning_rate": 0.00015230610112991567, + "loss": 0.0114, "step": 379850 }, { - "epoch": 1.92, - "learning_rate": 1.2533613169803894e-05, - "loss": 0.0075, + "epoch": 0.98, + "learning_rate": 0.0001523022129135442, + "loss": 0.012, "step": 379860 }, { - "epoch": 1.92, - "learning_rate": 1.2526045476789884e-05, - "loss": 0.0047, + "epoch": 0.98, + "learning_rate": 0.00015229832469717272, + "loss": 0.0139, "step": 379870 }, { - "epoch": 1.92, - "learning_rate": 1.2518477783775874e-05, - "loss": 0.0049, + "epoch": 0.98, + "learning_rate": 0.00015229443648080127, + "loss": 0.0125, "step": 379880 }, { - "epoch": 1.92, - "learning_rate": 1.2510910090761864e-05, - "loss": 0.0059, + "epoch": 0.98, + "learning_rate": 0.00015229054826442978, + "loss": 0.0141, "step": 379890 }, { - "epoch": 1.92, - "learning_rate": 1.2503342397747854e-05, - "loss": 0.0085, + "epoch": 0.98, + "learning_rate": 0.00015228666004805835, + "loss": 0.0105, "step": 379900 }, { - "epoch": 1.92, - "learning_rate": 1.2495774704733844e-05, - "loss": 0.0054, + "epoch": 0.98, + "learning_rate": 0.0001522827718316869, + "loss": 0.013, "step": 379910 }, { - "epoch": 1.92, - "learning_rate": 1.2488207011719833e-05, - "loss": 0.0053, + "epoch": 0.98, + "learning_rate": 0.0001522788836153154, + "loss": 0.0107, "step": 379920 }, { - "epoch": 1.92, - "learning_rate": 1.2480639318705823e-05, - "loss": 0.0058, + "epoch": 0.98, + "learning_rate": 0.00015227499539894392, + "loss": 0.0138, "step": 379930 }, { - "epoch": 1.92, - "learning_rate": 1.2473071625691812e-05, - "loss": 0.0087, + "epoch": 0.98, + "learning_rate": 0.0001522711071825725, + "loss": 0.0159, "step": 379940 }, { - "epoch": 1.92, - "learning_rate": 1.2465503932677801e-05, - "loss": 0.0052, + "epoch": 0.98, + "learning_rate": 0.00015226721896620103, + "loss": 0.0123, "step": 379950 }, { - "epoch": 1.92, - "learning_rate": 1.2457936239663791e-05, - "loss": 0.0074, + "epoch": 0.98, + "learning_rate": 0.00015226333074982955, + "loss": 0.0093, "step": 379960 }, { - "epoch": 1.92, - "learning_rate": 1.2450368546649781e-05, - "loss": 0.0063, + "epoch": 0.98, + "learning_rate": 0.0001522594425334581, + "loss": 0.0145, "step": 379970 }, { - "epoch": 1.92, - "learning_rate": 1.2442800853635771e-05, - "loss": 0.0072, + "epoch": 0.98, + "learning_rate": 0.00015225555431708663, + "loss": 0.0125, "step": 379980 }, { - "epoch": 1.92, - "learning_rate": 1.2435233160621761e-05, - "loss": 0.0043, + "epoch": 0.98, + "learning_rate": 0.00015225166610071517, + "loss": 0.01, "step": 379990 }, { - "epoch": 1.92, - "learning_rate": 1.2427665467607751e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015224777788434368, + "loss": 0.0122, "step": 380000 }, { - "epoch": 1.92, - "eval_cer": 0.9144217360968921, - "eval_loss": 0.004196519032120705, - "eval_runtime": 116.3652, - "eval_samples_per_second": 17.187, - "eval_steps_per_second": 4.297, + "epoch": 0.99, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.008343157358467579, + "eval_runtime": 107.6029, + "eval_samples_per_second": 18.587, + "eval_steps_per_second": 4.647, "step": 380000 }, { - "epoch": 1.92, - "learning_rate": 1.2420097774593741e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015224388966797223, + "loss": 0.0107, "step": 380010 }, { - "epoch": 1.92, - "learning_rate": 1.241253008157973e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015224000145160077, + "loss": 0.0127, "step": 380020 }, { - "epoch": 1.92, - "learning_rate": 1.2404962388565719e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.0001522361132352293, + "loss": 0.0132, "step": 380030 }, { - "epoch": 1.92, - "learning_rate": 1.2397394695551709e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015223222501885782, + "loss": 0.0113, "step": 380040 }, { - "epoch": 1.92, - "learning_rate": 1.2389827002537699e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015222833680248637, + "loss": 0.0179, "step": 380050 }, { - "epoch": 1.92, - "learning_rate": 1.2382259309523689e-05, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.00015222444858611493, + "loss": 0.0115, "step": 380060 }, { - "epoch": 1.92, - "learning_rate": 1.2374691616509679e-05, - "loss": 0.0038, + "epoch": 0.99, + "learning_rate": 0.00015222056036974345, + "loss": 0.0135, "step": 380070 }, { - "epoch": 1.92, - "learning_rate": 1.2367123923495669e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015221667215337196, + "loss": 0.0119, "step": 380080 }, { - "epoch": 1.92, - "learning_rate": 1.2359556230481659e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.0001522127839370005, + "loss": 0.0118, "step": 380090 }, { - "epoch": 1.92, - "learning_rate": 1.2351988537467647e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015220889572062902, + "loss": 0.0354, "step": 380100 }, { - "epoch": 1.92, - "learning_rate": 1.2344420844453637e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.0001522050075042576, + "loss": 0.0109, "step": 380110 }, { - "epoch": 1.92, - "learning_rate": 1.2336853151439627e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015220111928788613, + "loss": 0.0158, "step": 380120 }, { - "epoch": 1.92, - "learning_rate": 1.2329285458425617e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015219723107151464, + "loss": 0.0141, "step": 380130 }, { - "epoch": 1.92, - "learning_rate": 1.2321717765411606e-05, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015219334285514319, + "loss": 0.0127, "step": 380140 }, { - "epoch": 1.92, - "learning_rate": 1.2314150072397596e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015218945463877173, + "loss": 0.0107, "step": 380150 }, { - "epoch": 1.92, - "learning_rate": 1.2306582379383586e-05, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.00015218556642240027, + "loss": 0.0131, "step": 380160 }, { - "epoch": 1.92, - "learning_rate": 1.2299014686369574e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015218167820602878, + "loss": 0.0113, "step": 380170 }, { - "epoch": 1.92, - "learning_rate": 1.2291446993355564e-05, - "loss": 0.007, + "epoch": 0.99, + "learning_rate": 0.00015217778998965733, + "loss": 0.0141, "step": 380180 }, { - "epoch": 1.92, - "learning_rate": 1.2283879300341554e-05, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015217390177328587, + "loss": 0.0135, "step": 380190 }, { - "epoch": 1.92, - "learning_rate": 1.2276311607327544e-05, - "loss": 0.0032, + "epoch": 0.99, + "learning_rate": 0.0001521700135569144, + "loss": 0.014, "step": 380200 }, { - "epoch": 1.92, - "learning_rate": 1.2268743914313534e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015216612534054292, + "loss": 0.0153, "step": 380210 }, { - "epoch": 1.92, - "learning_rate": 1.2261176221299524e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015216223712417147, + "loss": 0.0172, "step": 380220 }, { - "epoch": 1.92, - "learning_rate": 1.2253608528285514e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015215834890780003, + "loss": 0.0097, "step": 380230 }, { - "epoch": 1.92, - "learning_rate": 1.2246040835271504e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015215446069142855, + "loss": 0.0116, "step": 380240 }, { - "epoch": 1.92, - "learning_rate": 1.223847314225749e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015215057247505706, + "loss": 0.0098, "step": 380250 }, { - "epoch": 1.92, - "learning_rate": 1.2230905449243482e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.0001521466842586856, + "loss": 0.0101, "step": 380260 }, { - "epoch": 1.92, - "learning_rate": 1.2223337756229472e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015214279604231417, + "loss": 0.0151, "step": 380270 }, { - "epoch": 1.92, - "learning_rate": 1.2215770063215462e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.0001521389078259427, + "loss": 0.0119, "step": 380280 }, { - "epoch": 1.92, - "learning_rate": 1.2208202370201452e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015213501960957123, + "loss": 0.0105, "step": 380290 }, { - "epoch": 1.92, - "learning_rate": 1.2200634677187442e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015213113139319974, + "loss": 0.0116, "step": 380300 }, { - "epoch": 1.92, - "learning_rate": 1.2193066984173432e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.0001521272431768283, + "loss": 0.0124, "step": 380310 }, { - "epoch": 1.92, - "learning_rate": 1.2185499291159421e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015212335496045683, + "loss": 0.012, "step": 380320 }, { - "epoch": 1.92, - "learning_rate": 1.2177931598145408e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015211946674408537, + "loss": 0.0147, "step": 380330 }, { - "epoch": 1.92, - "learning_rate": 1.2170363905131398e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015211557852771388, + "loss": 0.0135, "step": 380340 }, { - "epoch": 1.92, - "learning_rate": 1.2162796212117388e-05, - "loss": 0.0082, + "epoch": 0.99, + "learning_rate": 0.00015211169031134243, + "loss": 0.0107, "step": 380350 }, { - "epoch": 1.92, - "learning_rate": 1.2155228519103378e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015210780209497097, + "loss": 0.0114, "step": 380360 }, { - "epoch": 1.92, - "learning_rate": 1.2147660826089368e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.0001521039138785995, + "loss": 0.012, "step": 380370 }, { - "epoch": 1.92, - "learning_rate": 1.214009313307536e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015210002566222802, + "loss": 0.0156, "step": 380380 }, { - "epoch": 1.92, - "learning_rate": 1.213252544006135e-05, - "loss": 0.0072, + "epoch": 0.99, + "learning_rate": 0.00015209613744585656, + "loss": 0.0202, "step": 380390 }, { - "epoch": 1.92, - "learning_rate": 1.2124957747047339e-05, - "loss": 0.0092, + "epoch": 0.99, + "learning_rate": 0.0001520922492294851, + "loss": 0.0149, "step": 380400 }, { - "epoch": 1.92, - "learning_rate": 1.2117390054033326e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015208836101311365, + "loss": 0.0109, "step": 380410 }, { - "epoch": 1.92, - "learning_rate": 1.2109822361019316e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015208447279674216, + "loss": 0.0132, "step": 380420 }, { - "epoch": 1.92, - "learning_rate": 1.2102254668005305e-05, - "loss": 0.0075, + "epoch": 0.99, + "learning_rate": 0.0001520805845803707, + "loss": 0.0109, "step": 380430 }, { - "epoch": 1.92, - "learning_rate": 1.2094686974991295e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015207669636399927, + "loss": 0.0134, "step": 380440 }, { - "epoch": 1.92, - "learning_rate": 1.2087119281977285e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001520728081476278, + "loss": 0.0116, "step": 380450 }, { - "epoch": 1.92, - "learning_rate": 1.2079551588963275e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.00015206891993125633, + "loss": 0.0168, "step": 380460 }, { - "epoch": 1.92, - "learning_rate": 1.2071983895949265e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.00015206503171488484, + "loss": 0.0127, "step": 380470 }, { - "epoch": 1.92, - "learning_rate": 1.2064416202935255e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.0001520611434985134, + "loss": 0.0132, "step": 380480 }, { - "epoch": 1.92, - "learning_rate": 1.2056848509921243e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015205725528214193, + "loss": 0.0201, "step": 380490 }, { - "epoch": 1.92, - "learning_rate": 1.2049280816907233e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015205336706577047, + "loss": 0.0149, "step": 380500 }, { - "epoch": 1.92, - "learning_rate": 1.2041713123893223e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015204947884939898, + "loss": 0.0108, "step": 380510 }, { - "epoch": 1.92, - "learning_rate": 1.2034145430879213e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.00015204559063302755, + "loss": 0.0124, "step": 380520 }, { - "epoch": 1.92, - "learning_rate": 1.2026577737865203e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.00015204170241665607, + "loss": 0.0134, "step": 380530 }, { - "epoch": 1.92, - "learning_rate": 1.2019010044851193e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.0001520378142002846, + "loss": 0.0103, "step": 380540 }, { - "epoch": 1.92, - "learning_rate": 1.2011442351837183e-05, - "loss": 0.0095, + "epoch": 0.99, + "learning_rate": 0.00015203392598391312, + "loss": 0.0113, "step": 380550 }, { - "epoch": 1.92, - "learning_rate": 1.2003874658823173e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.0001520300377675417, + "loss": 0.0163, "step": 380560 }, { - "epoch": 1.92, - "learning_rate": 1.199630696580916e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001520261495511702, + "loss": 0.0144, "step": 380570 }, { - "epoch": 1.92, - "learning_rate": 1.198873927279515e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015202226133479875, + "loss": 0.0203, "step": 380580 }, { - "epoch": 1.92, - "learning_rate": 1.198117157978114e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015201837311842726, + "loss": 0.0163, "step": 380590 }, { - "epoch": 1.92, - "learning_rate": 1.197360388676713e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.0001520144849020558, + "loss": 0.0153, "step": 380600 }, { - "epoch": 1.92, - "learning_rate": 1.196603619375312e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.00015201059668568437, + "loss": 0.0158, "step": 380610 }, { - "epoch": 1.92, - "learning_rate": 1.195846850073911e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.0001520067084693129, + "loss": 0.0106, "step": 380620 }, { - "epoch": 1.92, - "learning_rate": 1.19509008077251e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015200282025294143, + "loss": 0.0145, "step": 380630 }, { - "epoch": 1.92, - "learning_rate": 1.194333311471109e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015199893203656994, + "loss": 0.0122, "step": 380640 }, { - "epoch": 1.92, - "learning_rate": 1.1935765421697078e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.0001519950438201985, + "loss": 0.0108, "step": 380650 }, { - "epoch": 1.92, - "learning_rate": 1.1928197728683068e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015199115560382703, + "loss": 0.011, "step": 380660 }, { - "epoch": 1.92, - "learning_rate": 1.1920630035669058e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015198726738745557, + "loss": 0.0112, "step": 380670 }, { - "epoch": 1.92, - "learning_rate": 1.1913062342655048e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015198337917108408, + "loss": 0.0137, "step": 380680 }, { - "epoch": 1.92, - "learning_rate": 1.1905494649641038e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015197949095471265, + "loss": 0.0129, "step": 380690 }, { - "epoch": 1.92, - "learning_rate": 1.1897926956627028e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015197560273834117, + "loss": 0.0111, "step": 380700 }, { - "epoch": 1.92, - "learning_rate": 1.1890359263613018e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001519717145219697, + "loss": 0.0136, "step": 380710 }, { - "epoch": 1.92, - "learning_rate": 1.1882791570599006e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015196782630559822, + "loss": 0.0135, "step": 380720 }, { - "epoch": 1.92, - "learning_rate": 1.1875223877584996e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.0001519639380892268, + "loss": 0.01, "step": 380730 }, { - "epoch": 1.92, - "learning_rate": 1.1867656184570986e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.0001519600498728553, + "loss": 0.0142, "step": 380740 }, { - "epoch": 1.92, - "learning_rate": 1.1860088491556976e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015195616165648385, + "loss": 0.0107, "step": 380750 }, { - "epoch": 1.92, - "learning_rate": 1.1852520798542966e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015195227344011236, + "loss": 0.0132, "step": 380760 }, { - "epoch": 1.92, - "learning_rate": 1.1844953105528956e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015194838522374093, + "loss": 0.0103, "step": 380770 }, { - "epoch": 1.92, - "learning_rate": 1.1837385412514946e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015194449700736947, + "loss": 0.0116, "step": 380780 }, { - "epoch": 1.92, - "learning_rate": 1.1829817719500936e-05, - "loss": 0.0032, + "epoch": 0.99, + "learning_rate": 0.00015194060879099799, + "loss": 0.0109, "step": 380790 }, { - "epoch": 1.92, - "learning_rate": 1.1822250026486924e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.0001519367205746265, + "loss": 0.0139, "step": 380800 }, { - "epoch": 1.92, - "learning_rate": 1.1814682333472914e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015193283235825507, + "loss": 0.0137, "step": 380810 }, { - "epoch": 1.92, - "learning_rate": 1.1807114640458904e-05, - "loss": 0.0082, + "epoch": 0.99, + "learning_rate": 0.0001519289441418836, + "loss": 0.0128, "step": 380820 }, { - "epoch": 1.92, - "learning_rate": 1.1799546947444893e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015192505592551213, + "loss": 0.0114, "step": 380830 }, { - "epoch": 1.92, - "learning_rate": 1.1791979254430883e-05, - "loss": 0.0036, + "epoch": 0.99, + "learning_rate": 0.00015192116770914067, + "loss": 0.0118, "step": 380840 }, { - "epoch": 1.92, - "learning_rate": 1.1784411561416873e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015191727949276918, + "loss": 0.0211, "step": 380850 }, { - "epoch": 1.92, - "learning_rate": 1.1776843868402863e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015191339127639775, + "loss": 0.0106, "step": 380860 }, { - "epoch": 1.92, - "learning_rate": 1.1769276175388853e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015190950306002626, + "loss": 0.0115, "step": 380870 }, { - "epoch": 1.92, - "learning_rate": 1.1761708482374841e-05, - "loss": 0.004, + "epoch": 0.99, + "learning_rate": 0.0001519056148436548, + "loss": 0.0112, "step": 380880 }, { - "epoch": 1.92, - "learning_rate": 1.1754140789360831e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015190172662728332, + "loss": 0.0152, "step": 380890 }, { - "epoch": 1.92, - "learning_rate": 1.1746573096346821e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.0001518978384109119, + "loss": 0.0142, "step": 380900 }, { - "epoch": 1.92, - "learning_rate": 1.1739005403332811e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.0001518939501945404, + "loss": 0.015, "step": 380910 }, { - "epoch": 1.92, - "learning_rate": 1.1731437710318801e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015189006197816895, + "loss": 0.0113, "step": 380920 }, { - "epoch": 1.92, - "learning_rate": 1.1723870017304791e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015188617376179746, + "loss": 0.0137, "step": 380930 }, { - "epoch": 1.92, - "learning_rate": 1.171630232429078e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015188228554542603, + "loss": 0.0128, "step": 380940 }, { - "epoch": 1.92, - "learning_rate": 1.170873463127677e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015187839732905457, + "loss": 0.0112, "step": 380950 }, { - "epoch": 1.92, - "learning_rate": 1.1701166938262759e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015187450911268309, + "loss": 0.0132, "step": 380960 }, { - "epoch": 1.92, - "learning_rate": 1.1693599245248749e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.0001518706208963116, + "loss": 0.0118, "step": 380970 }, { - "epoch": 1.92, - "learning_rate": 1.1686031552234739e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015186673267994017, + "loss": 0.0097, "step": 380980 }, { - "epoch": 1.92, - "learning_rate": 1.1678463859220729e-05, - "loss": 0.0086, + "epoch": 0.99, + "learning_rate": 0.0001518628444635687, + "loss": 0.0103, "step": 380990 }, { - "epoch": 1.92, - "learning_rate": 1.1670896166206719e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015185895624719722, + "loss": 0.0135, "step": 381000 }, { - "epoch": 1.92, - "eval_cer": 0.9144256176813937, - "eval_loss": 0.004235303029417992, - "eval_runtime": 116.578, - "eval_samples_per_second": 17.156, - "eval_steps_per_second": 4.289, + "epoch": 0.99, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.008428123779594898, + "eval_runtime": 107.512, + "eval_samples_per_second": 18.603, + "eval_steps_per_second": 4.651, "step": 381000 }, { - "epoch": 1.92, - "learning_rate": 1.1663328473192709e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015185506803082577, + "loss": 0.0122, "step": 381010 }, { - "epoch": 1.92, - "learning_rate": 1.1655760780178698e-05, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.0001518511798144543, + "loss": 0.0099, "step": 381020 }, { - "epoch": 1.92, - "learning_rate": 1.1648193087164688e-05, - "loss": 0.0102, + "epoch": 0.99, + "learning_rate": 0.00015184729159808285, + "loss": 0.0101, "step": 381030 }, { - "epoch": 1.92, - "learning_rate": 1.1640625394150677e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015184340338171136, + "loss": 0.0148, "step": 381040 }, { - "epoch": 1.92, - "learning_rate": 1.1633057701136666e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.0001518395151653399, + "loss": 0.014, "step": 381050 }, { - "epoch": 1.92, - "learning_rate": 1.1625490008122656e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015183562694896845, + "loss": 0.0107, "step": 381060 }, { - "epoch": 1.92, - "learning_rate": 1.1617922315108646e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.000151831738732597, + "loss": 0.0107, "step": 381070 }, { - "epoch": 1.92, - "learning_rate": 1.1610354622094636e-05, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.0001518278505162255, + "loss": 0.0106, "step": 381080 }, { - "epoch": 1.92, - "learning_rate": 1.1602786929080626e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015182396229985405, + "loss": 0.0124, "step": 381090 }, { - "epoch": 1.92, - "learning_rate": 1.1595219236066616e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015182007408348256, + "loss": 0.014, "step": 381100 }, { - "epoch": 1.92, - "learning_rate": 1.1587651543052606e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015181618586711113, + "loss": 0.0136, "step": 381110 }, { - "epoch": 1.92, - "learning_rate": 1.1580083850038594e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.00015181229765073964, + "loss": 0.0117, "step": 381120 }, { - "epoch": 1.92, - "learning_rate": 1.1572516157024584e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015180840943436818, + "loss": 0.0137, "step": 381130 }, { - "epoch": 1.92, - "learning_rate": 1.1564948464010574e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.0001518045212179967, + "loss": 0.0155, "step": 381140 }, { - "epoch": 1.92, - "learning_rate": 1.1557380770996564e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015180063300162527, + "loss": 0.0138, "step": 381150 }, { - "epoch": 1.92, - "learning_rate": 1.1549813077982554e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.0001517967447852538, + "loss": 0.0118, "step": 381160 }, { - "epoch": 1.92, - "learning_rate": 1.1542245384968544e-05, - "loss": 0.0069, + "epoch": 0.99, + "learning_rate": 0.00015179285656888232, + "loss": 0.0119, "step": 381170 }, { - "epoch": 1.92, - "learning_rate": 1.1534677691954534e-05, - "loss": 0.0074, + "epoch": 0.99, + "learning_rate": 0.00015178896835251087, + "loss": 0.0118, "step": 381180 }, { - "epoch": 1.92, - "learning_rate": 1.1527109998940524e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.0001517850801361394, + "loss": 0.0117, "step": 381190 }, { - "epoch": 1.92, - "learning_rate": 1.151954230592651e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015178119191976795, + "loss": 0.0182, "step": 381200 }, { - "epoch": 1.92, - "learning_rate": 1.15119746129125e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015177730370339646, + "loss": 0.0133, "step": 381210 }, { - "epoch": 1.92, - "learning_rate": 1.150440691989849e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.000151773415487025, + "loss": 0.0117, "step": 381220 }, { - "epoch": 1.92, - "learning_rate": 1.1496839226884482e-05, - "loss": 0.004, + "epoch": 0.99, + "learning_rate": 0.00015176952727065355, + "loss": 0.0121, "step": 381230 }, { - "epoch": 1.92, - "learning_rate": 1.1489271533870471e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.0001517656390542821, + "loss": 0.015, "step": 381240 }, { - "epoch": 1.92, - "learning_rate": 1.1481703840856461e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.0001517617508379106, + "loss": 0.0132, "step": 381250 }, { - "epoch": 1.92, - "learning_rate": 1.1474136147842451e-05, - "loss": 0.004, + "epoch": 0.99, + "learning_rate": 0.00015175786262153914, + "loss": 0.0129, "step": 381260 }, { - "epoch": 1.92, - "learning_rate": 1.1466568454828438e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.0001517539744051677, + "loss": 0.0094, "step": 381270 }, { - "epoch": 1.92, - "learning_rate": 1.1459000761814428e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015175008618879623, + "loss": 0.0117, "step": 381280 }, { - "epoch": 1.92, - "learning_rate": 1.1451433068800418e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015174619797242474, + "loss": 0.0126, "step": 381290 }, { - "epoch": 1.92, - "learning_rate": 1.1443865375786408e-05, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.00015174230975605328, + "loss": 0.018, "step": 381300 }, { - "epoch": 1.92, - "learning_rate": 1.1436297682772397e-05, - "loss": 0.0074, + "epoch": 0.99, + "learning_rate": 0.00015173842153968185, + "loss": 0.015, "step": 381310 }, { - "epoch": 1.92, - "learning_rate": 1.1428729989758387e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015173453332331037, + "loss": 0.0124, "step": 381320 }, { - "epoch": 1.92, - "learning_rate": 1.1421162296744377e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.0001517306451069389, + "loss": 0.011, "step": 381330 }, { - "epoch": 1.92, - "learning_rate": 1.1413594603730367e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015172675689056742, + "loss": 0.0156, "step": 381340 }, { - "epoch": 1.92, - "learning_rate": 1.1406026910716355e-05, - "loss": 0.0086, + "epoch": 0.99, + "learning_rate": 0.00015172286867419597, + "loss": 0.0114, "step": 381350 }, { - "epoch": 1.92, - "learning_rate": 1.1398459217702345e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.0001517189804578245, + "loss": 0.0096, "step": 381360 }, { - "epoch": 1.92, - "learning_rate": 1.1390891524688335e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015171509224145305, + "loss": 0.0113, "step": 381370 }, { - "epoch": 1.92, - "learning_rate": 1.1383323831674325e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015171120402508156, + "loss": 0.0154, "step": 381380 }, { - "epoch": 1.92, - "learning_rate": 1.1375756138660315e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.0001517073158087101, + "loss": 0.0107, "step": 381390 }, { - "epoch": 1.92, - "learning_rate": 1.1368188445646305e-05, - "loss": 0.0072, + "epoch": 0.99, + "learning_rate": 0.00015170342759233865, + "loss": 0.0149, "step": 381400 }, { - "epoch": 1.92, - "learning_rate": 1.1360620752632295e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.0001516995393759672, + "loss": 0.0132, "step": 381410 }, { - "epoch": 1.92, - "learning_rate": 1.1353053059618285e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.0001516956511595957, + "loss": 0.0119, "step": 381420 }, { - "epoch": 1.92, - "learning_rate": 1.1345485366604273e-05, - "loss": 0.0069, + "epoch": 0.99, + "learning_rate": 0.00015169176294322424, + "loss": 0.0112, "step": 381430 }, { - "epoch": 1.92, - "learning_rate": 1.1337917673590263e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015168787472685279, + "loss": 0.0109, "step": 381440 }, { - "epoch": 1.92, - "learning_rate": 1.1330349980576253e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015168398651048133, + "loss": 0.0154, "step": 381450 }, { - "epoch": 1.92, - "learning_rate": 1.1322782287562243e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015168009829410984, + "loss": 0.0125, "step": 381460 }, { - "epoch": 1.92, - "learning_rate": 1.1315214594548233e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015167621007773838, + "loss": 0.0131, "step": 381470 }, { - "epoch": 1.92, - "learning_rate": 1.1307646901534223e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015167232186136695, + "loss": 0.0155, "step": 381480 }, { - "epoch": 1.92, - "learning_rate": 1.1300079208520212e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.00015166843364499547, + "loss": 0.0145, "step": 381490 }, { - "epoch": 1.92, - "learning_rate": 1.1292511515506202e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.000151664545428624, + "loss": 0.0147, "step": 381500 }, { - "epoch": 1.92, - "learning_rate": 1.128494382249219e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015166065721225252, + "loss": 0.0137, "step": 381510 }, { - "epoch": 1.92, - "learning_rate": 1.127737612947818e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.0001516567689958811, + "loss": 0.0105, "step": 381520 }, { - "epoch": 1.92, - "learning_rate": 1.126980843646417e-05, - "loss": 0.008, + "epoch": 0.99, + "learning_rate": 0.0001516528807795096, + "loss": 0.0133, "step": 381530 }, { - "epoch": 1.92, - "learning_rate": 1.126224074345016e-05, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015164899256313815, + "loss": 0.0159, "step": 381540 }, { - "epoch": 1.92, - "learning_rate": 1.125467305043615e-05, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.00015164510434676666, + "loss": 0.0101, "step": 381550 }, { - "epoch": 1.93, - "learning_rate": 1.124710535742214e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015164121613039523, + "loss": 0.0163, "step": 381560 }, { - "epoch": 1.93, - "learning_rate": 1.123953766440813e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.00015163732791402375, + "loss": 0.0135, "step": 381570 }, { - "epoch": 1.93, - "learning_rate": 1.123196997139412e-05, - "loss": 0.0074, + "epoch": 0.99, + "learning_rate": 0.0001516334396976523, + "loss": 0.0112, "step": 381580 }, { - "epoch": 1.93, - "learning_rate": 1.1224402278380108e-05, - "loss": 0.0081, + "epoch": 0.99, + "learning_rate": 0.0001516295514812808, + "loss": 0.0139, "step": 381590 }, { - "epoch": 1.93, - "learning_rate": 1.1216834585366098e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015162566326490934, + "loss": 0.0126, "step": 381600 }, { - "epoch": 1.93, - "learning_rate": 1.1209266892352088e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015162177504853789, + "loss": 0.0123, "step": 381610 }, { - "epoch": 1.93, - "learning_rate": 1.1201699199338078e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015161788683216643, + "loss": 0.0105, "step": 381620 }, { - "epoch": 1.93, - "learning_rate": 1.1194131506324068e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015161399861579494, + "loss": 0.0114, "step": 381630 }, { - "epoch": 1.93, - "learning_rate": 1.1186563813310058e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015161011039942348, + "loss": 0.011, "step": 381640 }, { - "epoch": 1.93, - "learning_rate": 1.1178996120296048e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015160622218305205, + "loss": 0.01, "step": 381650 }, { - "epoch": 1.93, - "learning_rate": 1.1171428427282038e-05, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.00015160233396668057, + "loss": 0.0154, "step": 381660 }, { - "epoch": 1.93, - "learning_rate": 1.1163860734268026e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015159844575030908, + "loss": 0.0119, "step": 381670 }, { - "epoch": 1.93, - "learning_rate": 1.1156293041254016e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015159455753393762, + "loss": 0.0108, "step": 381680 }, { - "epoch": 1.93, - "learning_rate": 1.1148725348240006e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001515906693175662, + "loss": 0.0121, "step": 381690 }, { - "epoch": 1.93, - "learning_rate": 1.1141157655225996e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.0001515867811011947, + "loss": 0.013, "step": 381700 }, { - "epoch": 1.93, - "learning_rate": 1.1133589962211985e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015158289288482325, + "loss": 0.012, "step": 381710 }, { - "epoch": 1.93, - "learning_rate": 1.1126022269197975e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015157900466845176, + "loss": 0.014, "step": 381720 }, { - "epoch": 1.93, - "learning_rate": 1.1118454576183965e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015157511645208033, + "loss": 0.0117, "step": 381730 }, { - "epoch": 1.93, - "learning_rate": 1.1110886883169954e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.00015157122823570885, + "loss": 0.0113, "step": 381740 }, { - "epoch": 1.93, - "learning_rate": 1.1103319190155943e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.0001515673400193374, + "loss": 0.0156, "step": 381750 }, { - "epoch": 1.93, - "learning_rate": 1.1095751497141933e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.0001515634518029659, + "loss": 0.0116, "step": 381760 }, { - "epoch": 1.93, - "learning_rate": 1.1088183804127923e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015155956358659447, + "loss": 0.0136, "step": 381770 }, { - "epoch": 1.93, - "learning_rate": 1.1080616111113913e-05, - "loss": 0.0073, + "epoch": 0.99, + "learning_rate": 0.00015155567537022298, + "loss": 0.0135, "step": 381780 }, { - "epoch": 1.93, - "learning_rate": 1.1073048418099903e-05, - "loss": 0.0073, + "epoch": 0.99, + "learning_rate": 0.00015155178715385153, + "loss": 0.0127, "step": 381790 }, { - "epoch": 1.93, - "learning_rate": 1.1065480725085893e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015154789893748004, + "loss": 0.0098, "step": 381800 }, { - "epoch": 1.93, - "learning_rate": 1.1057913032071883e-05, - "loss": 0.0096, + "epoch": 0.99, + "learning_rate": 0.0001515440107211086, + "loss": 0.014, "step": 381810 }, { - "epoch": 1.93, - "learning_rate": 1.1050345339057871e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015154012250473715, + "loss": 0.0108, "step": 381820 }, { - "epoch": 1.93, - "learning_rate": 1.1042777646043861e-05, - "loss": 0.0041, + "epoch": 0.99, + "learning_rate": 0.00015153623428836567, + "loss": 0.0135, "step": 381830 }, { - "epoch": 1.93, - "learning_rate": 1.1035209953029851e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015153234607199418, + "loss": 0.0129, "step": 381840 }, { - "epoch": 1.93, - "learning_rate": 1.1027642260015841e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.00015152845785562272, + "loss": 0.0138, "step": 381850 }, { - "epoch": 1.93, - "learning_rate": 1.102007456700183e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.0001515245696392513, + "loss": 0.0115, "step": 381860 }, { - "epoch": 1.93, - "learning_rate": 1.101250687398782e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.0001515206814228798, + "loss": 0.0108, "step": 381870 }, { - "epoch": 1.93, - "learning_rate": 1.100493918097381e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015151679320650835, + "loss": 0.0127, "step": 381880 }, { - "epoch": 1.93, - "learning_rate": 1.09973714879598e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015151290499013686, + "loss": 0.0096, "step": 381890 }, { - "epoch": 1.93, - "learning_rate": 1.0989803794945789e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015150901677376543, + "loss": 0.013, "step": 381900 }, { - "epoch": 1.93, - "learning_rate": 1.0982236101931779e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015150512855739394, + "loss": 0.0121, "step": 381910 }, { - "epoch": 1.93, - "learning_rate": 1.0974668408917769e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015150124034102249, + "loss": 0.0158, "step": 381920 }, { - "epoch": 1.93, - "learning_rate": 1.0967100715903758e-05, - "loss": 0.008, + "epoch": 0.99, + "learning_rate": 0.000151497352124651, + "loss": 0.0129, "step": 381930 }, { - "epoch": 1.93, - "learning_rate": 1.0959533022889748e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015149346390827957, + "loss": 0.0119, "step": 381940 }, { - "epoch": 1.93, - "learning_rate": 1.0951965329875738e-05, - "loss": 0.0038, + "epoch": 0.99, + "learning_rate": 0.00015148957569190808, + "loss": 0.0108, "step": 381950 }, { - "epoch": 1.93, - "learning_rate": 1.0944397636861728e-05, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015148568747553663, + "loss": 0.0136, "step": 381960 }, { - "epoch": 1.93, - "learning_rate": 1.0936829943847718e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015148179925916514, + "loss": 0.0141, "step": 381970 }, { - "epoch": 1.93, - "learning_rate": 1.0929262250833706e-05, - "loss": 0.0086, + "epoch": 0.99, + "learning_rate": 0.0001514779110427937, + "loss": 0.0107, "step": 381980 }, { - "epoch": 1.93, - "learning_rate": 1.0921694557819696e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015147402282642222, + "loss": 0.0168, "step": 381990 }, { - "epoch": 1.93, - "learning_rate": 1.0914126864805686e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.00015147013461005077, + "loss": 0.0126, "step": 382000 }, { - "epoch": 1.93, - "eval_cer": 0.9144032985705095, - "eval_loss": 0.004233332350850105, - "eval_runtime": 116.331, - "eval_samples_per_second": 17.192, - "eval_steps_per_second": 4.298, + "epoch": 0.99, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.007775302045047283, + "eval_runtime": 107.5939, + "eval_samples_per_second": 18.588, + "eval_steps_per_second": 4.647, "step": 382000 }, { - "epoch": 1.93, - "learning_rate": 1.0906559171791676e-05, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.00015146624639367928, + "loss": 0.0112, "step": 382010 }, { - "epoch": 1.93, - "learning_rate": 1.0898991478777666e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.00015146235817730785, + "loss": 0.0113, "step": 382020 }, { - "epoch": 1.93, - "learning_rate": 1.0891423785763656e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.0001514584699609364, + "loss": 0.0106, "step": 382030 }, { - "epoch": 1.93, - "learning_rate": 1.0883856092749646e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.0001514545817445649, + "loss": 0.0124, "step": 382040 }, { - "epoch": 1.93, - "learning_rate": 1.0876288399735636e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015145069352819345, + "loss": 0.013, "step": 382050 }, { - "epoch": 1.93, - "learning_rate": 1.0868720706721622e-05, - "loss": 0.0075, + "epoch": 0.99, + "learning_rate": 0.000151446805311822, + "loss": 0.0092, "step": 382060 }, { - "epoch": 1.93, - "learning_rate": 1.0861153013707614e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.00015144291709545053, + "loss": 0.0116, "step": 382070 }, { - "epoch": 1.93, - "learning_rate": 1.0853585320693604e-05, - "loss": 0.0072, + "epoch": 0.99, + "learning_rate": 0.00015143902887907904, + "loss": 0.0183, "step": 382080 }, { - "epoch": 1.93, - "learning_rate": 1.0846017627679594e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015143514066270759, + "loss": 0.0138, "step": 382090 }, { - "epoch": 1.93, - "learning_rate": 1.0838449934665584e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.0001514312524463361, + "loss": 0.0116, "step": 382100 }, { - "epoch": 1.93, - "learning_rate": 1.0830882241651574e-05, - "loss": 0.0085, + "epoch": 0.99, + "learning_rate": 0.00015142736422996467, + "loss": 0.011, "step": 382110 }, { - "epoch": 1.93, - "learning_rate": 1.0823314548637563e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015142347601359318, + "loss": 0.0172, "step": 382120 }, { - "epoch": 1.93, - "learning_rate": 1.0815746855623553e-05, - "loss": 0.0041, + "epoch": 0.99, + "learning_rate": 0.00015141958779722173, + "loss": 0.0115, "step": 382130 }, { - "epoch": 1.93, - "learning_rate": 1.080817916260954e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015141569958085024, + "loss": 0.0123, "step": 382140 }, { - "epoch": 1.93, - "learning_rate": 1.080061146959553e-05, - "loss": 0.0035, + "epoch": 0.99, + "learning_rate": 0.0001514118113644788, + "loss": 0.0118, "step": 382150 }, { - "epoch": 1.93, - "learning_rate": 1.079304377658152e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015140792314810732, + "loss": 0.0119, "step": 382160 }, { - "epoch": 1.93, - "learning_rate": 1.078547608356751e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015140403493173586, + "loss": 0.0161, "step": 382170 }, { - "epoch": 1.93, - "learning_rate": 1.07779083905535e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015140014671536438, + "loss": 0.0135, "step": 382180 }, { - "epoch": 1.93, - "learning_rate": 1.077034069753949e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015139625849899295, + "loss": 0.0136, "step": 382190 }, { - "epoch": 1.93, - "learning_rate": 1.0762773004525481e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.0001513923702826215, + "loss": 0.0135, "step": 382200 }, { - "epoch": 1.93, - "learning_rate": 1.0755205311511471e-05, - "loss": 0.0072, + "epoch": 0.99, + "learning_rate": 0.00015138848206625, + "loss": 0.0123, "step": 382210 }, { - "epoch": 1.93, - "learning_rate": 1.0747637618497457e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015138459384987855, + "loss": 0.0135, "step": 382220 }, { - "epoch": 1.93, - "learning_rate": 1.0740069925483447e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.0001513807056335071, + "loss": 0.0103, "step": 382230 }, { - "epoch": 1.93, - "learning_rate": 1.0732502232469437e-05, - "loss": 0.0099, + "epoch": 0.99, + "learning_rate": 0.00015137681741713563, + "loss": 0.0134, "step": 382240 }, { - "epoch": 1.93, - "learning_rate": 1.0724934539455427e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.00015137292920076414, + "loss": 0.0134, "step": 382250 }, { - "epoch": 1.93, - "learning_rate": 1.0717366846441417e-05, - "loss": 0.0069, + "epoch": 0.99, + "learning_rate": 0.00015136904098439269, + "loss": 0.0129, "step": 382260 }, { - "epoch": 1.93, - "learning_rate": 1.0709799153427407e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015136515276802123, + "loss": 0.0148, "step": 382270 }, { - "epoch": 1.93, - "learning_rate": 1.0702231460413397e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015136126455164977, + "loss": 0.0167, "step": 382280 }, { - "epoch": 1.93, - "learning_rate": 1.0694663767399385e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015135737633527828, + "loss": 0.0138, "step": 382290 }, { - "epoch": 1.93, - "learning_rate": 1.0687096074385375e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.00015135348811890682, + "loss": 0.0125, "step": 382300 }, { - "epoch": 1.93, - "learning_rate": 1.0679528381371365e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015134959990253537, + "loss": 0.0104, "step": 382310 }, { - "epoch": 1.93, - "learning_rate": 1.0671960688357355e-05, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.0001513457116861639, + "loss": 0.0109, "step": 382320 }, { - "epoch": 1.93, - "learning_rate": 1.0664392995343345e-05, - "loss": 0.0076, + "epoch": 0.99, + "learning_rate": 0.00015134182346979242, + "loss": 0.0138, "step": 382330 }, { - "epoch": 1.93, - "learning_rate": 1.0656825302329335e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015133793525342096, + "loss": 0.0171, "step": 382340 }, { - "epoch": 1.93, - "learning_rate": 1.0649257609315325e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015133404703704948, + "loss": 0.0103, "step": 382350 }, { - "epoch": 1.93, - "learning_rate": 1.0641689916301315e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015133015882067805, + "loss": 0.0125, "step": 382360 }, { - "epoch": 1.93, - "learning_rate": 1.0634122223287303e-05, - "loss": 0.0074, + "epoch": 0.99, + "learning_rate": 0.0001513262706043066, + "loss": 0.0146, "step": 382370 }, { - "epoch": 1.93, - "learning_rate": 1.0626554530273293e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.0001513223823879351, + "loss": 0.0116, "step": 382380 }, { - "epoch": 1.93, - "learning_rate": 1.0618986837259283e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015131849417156362, + "loss": 0.0127, "step": 382390 }, { - "epoch": 1.93, - "learning_rate": 1.0611419144245273e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.0001513146059551922, + "loss": 0.0118, "step": 382400 }, { - "epoch": 1.93, - "learning_rate": 1.0603851451231262e-05, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015131071773882073, + "loss": 0.0138, "step": 382410 }, { - "epoch": 1.93, - "learning_rate": 1.0596283758217252e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015130682952244924, + "loss": 0.0132, "step": 382420 }, { - "epoch": 1.93, - "learning_rate": 1.0588716065203242e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015130294130607778, + "loss": 0.014, "step": 382430 }, { - "epoch": 1.93, - "learning_rate": 1.0581148372189232e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015129905308970633, + "loss": 0.0127, "step": 382440 }, { - "epoch": 1.93, - "learning_rate": 1.057358067917522e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015129516487333487, + "loss": 0.01, "step": 382450 }, { - "epoch": 1.93, - "learning_rate": 1.056601298616121e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015129127665696338, + "loss": 0.015, "step": 382460 }, { - "epoch": 1.93, - "learning_rate": 1.05584452931472e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015128738844059192, + "loss": 0.0118, "step": 382470 }, { - "epoch": 1.93, - "learning_rate": 1.055087760013319e-05, - "loss": 0.0035, + "epoch": 0.99, + "learning_rate": 0.00015128350022422047, + "loss": 0.0185, "step": 382480 }, { - "epoch": 1.93, - "learning_rate": 1.054330990711918e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.000151279612007849, + "loss": 0.0154, "step": 382490 }, { - "epoch": 1.93, - "learning_rate": 1.053574221410517e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015127572379147752, + "loss": 0.0121, "step": 382500 }, { - "epoch": 1.93, - "learning_rate": 1.052817452109116e-05, - "loss": 0.007, + "epoch": 0.99, + "learning_rate": 0.00015127183557510606, + "loss": 0.0139, "step": 382510 }, { - "epoch": 1.93, - "learning_rate": 1.052060682807715e-05, - "loss": 0.0069, + "epoch": 0.99, + "learning_rate": 0.00015126794735873463, + "loss": 0.0131, "step": 382520 }, { - "epoch": 1.93, - "learning_rate": 1.0513039135063138e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015126405914236315, + "loss": 0.0136, "step": 382530 }, { - "epoch": 1.93, - "learning_rate": 1.0505471442049128e-05, - "loss": 0.0041, + "epoch": 0.99, + "learning_rate": 0.0001512601709259917, + "loss": 0.0116, "step": 382540 }, { - "epoch": 1.93, - "learning_rate": 1.0497903749035118e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.0001512562827096202, + "loss": 0.017, "step": 382550 }, { - "epoch": 1.93, - "learning_rate": 1.0490336056021108e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015125239449324877, + "loss": 0.014, "step": 382560 }, { - "epoch": 1.93, - "learning_rate": 1.0482768363007098e-05, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.00015124850627687729, + "loss": 0.0135, "step": 382570 }, { - "epoch": 1.93, - "learning_rate": 1.0475200669993088e-05, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.00015124461806050583, + "loss": 0.0113, "step": 382580 }, { - "epoch": 1.93, - "learning_rate": 1.0467632976979077e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015124072984413434, + "loss": 0.01, "step": 382590 }, { - "epoch": 1.93, - "learning_rate": 1.0460065283965067e-05, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015123684162776288, + "loss": 0.013, "step": 382600 }, { - "epoch": 1.93, - "learning_rate": 1.0452497590951056e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015123295341139143, + "loss": 0.0124, "step": 382610 }, { - "epoch": 1.93, - "learning_rate": 1.0444929897937046e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015122906519501997, + "loss": 0.0131, "step": 382620 }, { - "epoch": 1.93, - "learning_rate": 1.0437362204923035e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015122517697864848, + "loss": 0.01, "step": 382630 }, { - "epoch": 1.93, - "learning_rate": 1.0429794511909025e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015122128876227702, + "loss": 0.0113, "step": 382640 }, { - "epoch": 1.93, - "learning_rate": 1.0422226818895015e-05, - "loss": 0.0076, + "epoch": 0.99, + "learning_rate": 0.00015121740054590557, + "loss": 0.0106, "step": 382650 }, { - "epoch": 1.93, - "learning_rate": 1.0414659125881005e-05, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.0001512135123295341, + "loss": 0.0105, "step": 382660 }, { - "epoch": 1.93, - "learning_rate": 1.0407091432866995e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015120962411316262, + "loss": 0.0126, "step": 382670 }, { - "epoch": 1.93, - "learning_rate": 1.0399523739852985e-05, - "loss": 0.0087, + "epoch": 0.99, + "learning_rate": 0.00015120573589679116, + "loss": 0.0108, "step": 382680 }, { - "epoch": 1.93, - "learning_rate": 1.0391956046838973e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015120184768041973, + "loss": 0.0115, "step": 382690 }, { - "epoch": 1.93, - "learning_rate": 1.0384388353824963e-05, - "loss": 0.0098, + "epoch": 0.99, + "learning_rate": 0.00015119795946404825, + "loss": 0.0132, "step": 382700 }, { - "epoch": 1.93, - "learning_rate": 1.0376820660810953e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015119407124767676, + "loss": 0.0128, "step": 382710 }, { - "epoch": 1.93, - "learning_rate": 1.0369252967796943e-05, - "loss": 0.0084, + "epoch": 0.99, + "learning_rate": 0.0001511901830313053, + "loss": 0.0108, "step": 382720 }, { - "epoch": 1.93, - "learning_rate": 1.0361685274782933e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015118629481493387, + "loss": 0.0126, "step": 382730 }, { - "epoch": 1.93, - "learning_rate": 1.0354117581768923e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015118240659856239, + "loss": 0.0094, "step": 382740 }, { - "epoch": 1.93, - "learning_rate": 1.0346549888754913e-05, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.00015117851838219093, + "loss": 0.0116, "step": 382750 }, { - "epoch": 1.93, - "learning_rate": 1.0338982195740903e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015117463016581944, + "loss": 0.0106, "step": 382760 }, { - "epoch": 1.93, - "learning_rate": 1.033141450272689e-05, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.000151170741949448, + "loss": 0.0123, "step": 382770 }, { - "epoch": 1.93, - "learning_rate": 1.032384680971288e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015116685373307653, + "loss": 0.0114, "step": 382780 }, { - "epoch": 1.93, - "learning_rate": 1.031627911669887e-05, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015116296551670507, + "loss": 0.0107, "step": 382790 }, { - "epoch": 1.93, - "learning_rate": 1.030871142368486e-05, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015115907730033358, + "loss": 0.014, "step": 382800 }, { - "epoch": 1.93, - "learning_rate": 1.030114373067085e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015115518908396215, + "loss": 0.0137, "step": 382810 }, { - "epoch": 1.93, - "learning_rate": 1.029357603765684e-05, - "loss": 0.0041, + "epoch": 0.99, + "learning_rate": 0.00015115130086759066, + "loss": 0.0116, "step": 382820 }, { - "epoch": 1.93, - "learning_rate": 1.028600834464283e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001511474126512192, + "loss": 0.0133, "step": 382830 }, { - "epoch": 1.93, - "learning_rate": 1.0278440651628819e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015114352443484772, + "loss": 0.0133, "step": 382840 }, { - "epoch": 1.93, - "learning_rate": 1.0270872958614808e-05, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.00015113963621847626, + "loss": 0.0109, "step": 382850 }, { - "epoch": 1.93, - "learning_rate": 1.0263305265600798e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.0001511357480021048, + "loss": 0.0122, "step": 382860 }, { - "epoch": 1.93, - "learning_rate": 1.0255737572586788e-05, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015113185978573335, + "loss": 0.0142, "step": 382870 }, { - "epoch": 1.93, - "learning_rate": 1.0248169879572778e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015112797156936186, + "loss": 0.0115, "step": 382880 }, { - "epoch": 1.93, - "learning_rate": 1.0240602186558768e-05, - "loss": 0.0076, + "epoch": 0.99, + "learning_rate": 0.0001511240833529904, + "loss": 0.0164, "step": 382890 }, { - "epoch": 1.93, - "learning_rate": 1.0233034493544758e-05, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015112019513661897, + "loss": 0.012, "step": 382900 }, { - "epoch": 1.93, - "learning_rate": 1.0225466800530748e-05, - "loss": 0.0076, + "epoch": 0.99, + "learning_rate": 0.00015111630692024749, + "loss": 0.0116, "step": 382910 }, { - "epoch": 1.93, - "learning_rate": 1.0217899107516736e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015111241870387603, + "loss": 0.0138, "step": 382920 }, { - "epoch": 1.93, - "learning_rate": 1.0210331414502726e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015110853048750454, + "loss": 0.0124, "step": 382930 }, { - "epoch": 1.93, - "learning_rate": 1.0202763721488716e-05, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.0001511046422711331, + "loss": 0.0149, "step": 382940 }, { - "epoch": 1.93, - "learning_rate": 1.0195196028474706e-05, - "loss": 0.0077, + "epoch": 0.99, + "learning_rate": 0.00015110075405476162, + "loss": 0.0135, "step": 382950 }, { - "epoch": 1.93, - "learning_rate": 1.0187628335460696e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.00015109686583839017, + "loss": 0.0111, "step": 382960 }, { - "epoch": 1.93, - "learning_rate": 1.0180060642446686e-05, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015109297762201868, + "loss": 0.0147, "step": 382970 }, { - "epoch": 1.93, - "learning_rate": 1.0172492949432676e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015108908940564725, + "loss": 0.0155, "step": 382980 }, { - "epoch": 1.93, - "learning_rate": 1.0164925256418666e-05, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015108520118927576, + "loss": 0.0117, "step": 382990 }, { - "epoch": 1.93, - "learning_rate": 1.0157357563404652e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.0001510813129729043, + "loss": 0.0117, "step": 383000 }, { - "epoch": 1.93, - "eval_cer": 0.9144265880775191, - "eval_loss": 0.004191742278635502, - "eval_runtime": 116.3481, - "eval_samples_per_second": 17.19, - "eval_steps_per_second": 4.297, + "epoch": 0.99, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.007927495054900646, + "eval_runtime": 107.7064, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, "step": 383000 }, { - "epoch": 1.93, - "learning_rate": 1.0149789870390642e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.00015107742475653282, + "loss": 0.0139, "step": 383010 }, { - "epoch": 1.93, - "learning_rate": 1.0142222177376632e-05, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.0001510735365401614, + "loss": 0.0155, "step": 383020 }, { - "epoch": 1.93, - "learning_rate": 1.0134654484362622e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.0001510696483237899, + "loss": 0.0108, "step": 383030 }, { - "epoch": 1.93, - "learning_rate": 1.0127086791348613e-05, - "loss": 0.0064, + "epoch": 0.99, + "learning_rate": 0.00015106576010741845, + "loss": 0.0092, "step": 383040 }, { - "epoch": 1.93, - "learning_rate": 1.0119519098334603e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015106187189104696, + "loss": 0.0114, "step": 383050 }, { - "epoch": 1.93, - "learning_rate": 1.0111951405320593e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.00015105798367467553, + "loss": 0.0119, "step": 383060 }, { - "epoch": 1.93, - "learning_rate": 1.0104383712306583e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015105409545830407, + "loss": 0.0147, "step": 383070 }, { - "epoch": 1.93, - "learning_rate": 1.009681601929257e-05, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.00015105020724193258, + "loss": 0.0122, "step": 383080 }, { - "epoch": 1.93, - "learning_rate": 1.008924832627856e-05, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.00015104631902556113, + "loss": 0.0143, "step": 383090 }, { - "epoch": 1.93, - "learning_rate": 1.008168063326455e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015104243080918964, + "loss": 0.0155, "step": 383100 }, { - "epoch": 1.93, - "learning_rate": 1.007411294025054e-05, - "loss": 0.0048, + "epoch": 0.99, + "learning_rate": 0.0001510385425928182, + "loss": 0.0108, "step": 383110 }, { - "epoch": 1.93, - "learning_rate": 1.006654524723653e-05, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015103465437644672, + "loss": 0.0242, "step": 383120 }, { - "epoch": 1.93, - "learning_rate": 1.005897755422252e-05, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015103076616007527, + "loss": 0.0108, "step": 383130 }, { - "epoch": 1.93, - "learning_rate": 1.0051409861208509e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015102687794370378, + "loss": 0.0117, "step": 383140 }, { - "epoch": 1.93, - "learning_rate": 1.0043842168194499e-05, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015102298972733235, + "loss": 0.0103, "step": 383150 }, { - "epoch": 1.93, - "learning_rate": 1.0036274475180487e-05, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015101910151096086, + "loss": 0.0116, "step": 383160 }, { - "epoch": 1.93, - "learning_rate": 1.0028706782166477e-05, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.0001510152132945894, + "loss": 0.0157, "step": 383170 }, { - "epoch": 1.93, - "learning_rate": 1.0021139089152467e-05, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015101132507821792, + "loss": 0.0145, "step": 383180 }, { - "epoch": 1.93, - "learning_rate": 1.0013571396138457e-05, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.0001510074368618465, + "loss": 0.0142, "step": 383190 }, { - "epoch": 1.93, - "learning_rate": 1.0006003703124447e-05, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.000151003548645475, + "loss": 0.0126, "step": 383200 }, { - "epoch": 1.93, - "learning_rate": 9.998436010110437e-06, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015099966042910354, + "loss": 0.0128, "step": 383210 }, { - "epoch": 1.93, - "learning_rate": 9.990868317096427e-06, - "loss": 0.0083, + "epoch": 0.99, + "learning_rate": 0.00015099577221273206, + "loss": 0.0142, "step": 383220 }, { - "epoch": 1.93, - "learning_rate": 9.983300624082417e-06, - "loss": 0.004, + "epoch": 0.99, + "learning_rate": 0.00015099188399636063, + "loss": 0.0126, "step": 383230 }, { - "epoch": 1.93, - "learning_rate": 9.975732931068405e-06, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015098799577998917, + "loss": 0.0134, "step": 383240 }, { - "epoch": 1.93, - "learning_rate": 9.968165238054395e-06, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015098410756361768, + "loss": 0.0111, "step": 383250 }, { - "epoch": 1.93, - "learning_rate": 9.960597545040385e-06, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.0001509802193472462, + "loss": 0.0126, "step": 383260 }, { - "epoch": 1.93, - "learning_rate": 9.953029852026375e-06, - "loss": 0.0071, + "epoch": 0.99, + "learning_rate": 0.00015097633113087477, + "loss": 0.0134, "step": 383270 }, { - "epoch": 1.93, - "learning_rate": 9.945462159012365e-06, - "loss": 0.0075, + "epoch": 0.99, + "learning_rate": 0.0001509724429145033, + "loss": 0.0146, "step": 383280 }, { - "epoch": 1.93, - "learning_rate": 9.937894465998354e-06, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015096855469813182, + "loss": 0.0133, "step": 383290 }, { - "epoch": 1.93, - "learning_rate": 9.930326772984344e-06, - "loss": 0.0062, + "epoch": 0.99, + "learning_rate": 0.00015096466648176037, + "loss": 0.009, "step": 383300 }, { - "epoch": 1.93, - "learning_rate": 9.922759079970334e-06, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.0001509607782653889, + "loss": 0.0138, "step": 383310 }, { - "epoch": 1.93, - "learning_rate": 9.915191386956322e-06, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015095689004901745, + "loss": 0.0114, "step": 383320 }, { - "epoch": 1.93, - "learning_rate": 9.907623693942312e-06, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015095300183264596, + "loss": 0.0128, "step": 383330 }, { - "epoch": 1.93, - "learning_rate": 9.900056000928302e-06, - "loss": 0.0058, + "epoch": 0.99, + "learning_rate": 0.0001509491136162745, + "loss": 0.0102, "step": 383340 }, { - "epoch": 1.93, - "learning_rate": 9.892488307914292e-06, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015094522539990302, + "loss": 0.0133, "step": 383350 }, { - "epoch": 1.93, - "learning_rate": 9.884920614900282e-06, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.0001509413371835316, + "loss": 0.014, "step": 383360 }, { - "epoch": 1.93, - "learning_rate": 9.877352921886272e-06, - "loss": 0.0066, + "epoch": 0.99, + "learning_rate": 0.0001509374489671601, + "loss": 0.0157, "step": 383370 }, { - "epoch": 1.93, - "learning_rate": 9.869785228872262e-06, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015093356075078864, + "loss": 0.0139, "step": 383380 }, { - "epoch": 1.93, - "learning_rate": 9.86221753585825e-06, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015092967253441716, + "loss": 0.0178, "step": 383390 }, { - "epoch": 1.93, - "learning_rate": 9.85464984284424e-06, - "loss": 0.0039, + "epoch": 0.99, + "learning_rate": 0.00015092578431804573, + "loss": 0.0184, "step": 383400 }, { - "epoch": 1.93, - "learning_rate": 9.84708214983023e-06, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.00015092189610167427, + "loss": 0.0112, "step": 383410 }, { - "epoch": 1.93, - "learning_rate": 9.83951445681622e-06, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.00015091800788530278, + "loss": 0.0135, "step": 383420 }, { - "epoch": 1.93, - "learning_rate": 9.83194676380221e-06, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.0001509141196689313, + "loss": 0.0116, "step": 383430 }, { - "epoch": 1.93, - "learning_rate": 9.8243790707882e-06, - "loss": 0.004, + "epoch": 0.99, + "learning_rate": 0.00015091023145255987, + "loss": 0.0149, "step": 383440 }, { - "epoch": 1.93, - "learning_rate": 9.81681137777419e-06, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.0001509063432361884, + "loss": 0.0173, "step": 383450 }, { - "epoch": 1.93, - "learning_rate": 9.80924368476018e-06, - "loss": 0.0041, + "epoch": 0.99, + "learning_rate": 0.00015090245501981692, + "loss": 0.0138, "step": 383460 }, { - "epoch": 1.93, - "learning_rate": 9.801675991746168e-06, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015089856680344546, + "loss": 0.0106, "step": 383470 }, { - "epoch": 1.93, - "learning_rate": 9.794108298732158e-06, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.000150894678587074, + "loss": 0.0126, "step": 383480 }, { - "epoch": 1.93, - "learning_rate": 9.786540605718148e-06, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.00015089079037070255, + "loss": 0.0106, "step": 383490 }, { - "epoch": 1.93, - "learning_rate": 9.778972912704138e-06, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.00015088690215433106, + "loss": 0.0113, "step": 383500 }, { - "epoch": 1.93, - "learning_rate": 9.771405219690127e-06, - "loss": 0.0079, + "epoch": 0.99, + "learning_rate": 0.0001508830139379596, + "loss": 0.0112, "step": 383510 }, { - "epoch": 1.93, - "learning_rate": 9.763837526676117e-06, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.00015087912572158815, + "loss": 0.0123, "step": 383520 }, { - "epoch": 1.93, - "learning_rate": 9.756269833662107e-06, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.0001508752375052167, + "loss": 0.0125, "step": 383530 }, { - "epoch": 1.94, - "learning_rate": 9.748702140648097e-06, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.0001508713492888452, + "loss": 0.0095, "step": 383540 }, { - "epoch": 1.94, - "learning_rate": 9.741134447634085e-06, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015086746107247374, + "loss": 0.0099, "step": 383550 }, { - "epoch": 1.94, - "learning_rate": 9.733566754620075e-06, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.0001508635728561023, + "loss": 0.0119, "step": 383560 }, { - "epoch": 1.94, - "learning_rate": 9.725999061606065e-06, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.00015085968463973083, + "loss": 0.0121, "step": 383570 }, { - "epoch": 1.94, - "learning_rate": 9.718431368592055e-06, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015085579642335934, + "loss": 0.013, "step": 383580 }, { - "epoch": 1.94, - "learning_rate": 9.710863675578045e-06, - "loss": 0.0067, + "epoch": 0.99, + "learning_rate": 0.00015085190820698788, + "loss": 0.0144, "step": 383590 }, { - "epoch": 1.94, - "learning_rate": 9.703295982564035e-06, - "loss": 0.0065, + "epoch": 0.99, + "learning_rate": 0.0001508480199906164, + "loss": 0.0091, "step": 383600 }, { - "epoch": 1.94, - "learning_rate": 9.695728289550025e-06, - "loss": 0.0047, + "epoch": 0.99, + "learning_rate": 0.00015084413177424497, + "loss": 0.0111, "step": 383610 }, { - "epoch": 1.94, - "learning_rate": 9.688160596536015e-06, - "loss": 0.0043, + "epoch": 0.99, + "learning_rate": 0.0001508402435578735, + "loss": 0.0099, "step": 383620 }, { - "epoch": 1.94, - "learning_rate": 9.680592903522003e-06, - "loss": 0.005, + "epoch": 0.99, + "learning_rate": 0.00015083635534150202, + "loss": 0.0111, "step": 383630 }, { - "epoch": 1.94, - "learning_rate": 9.673025210507993e-06, - "loss": 0.0059, + "epoch": 0.99, + "learning_rate": 0.00015083246712513056, + "loss": 0.0098, "step": 383640 }, { - "epoch": 1.94, - "learning_rate": 9.665457517493983e-06, - "loss": 0.0063, + "epoch": 0.99, + "learning_rate": 0.0001508285789087591, + "loss": 0.0119, "step": 383650 }, { - "epoch": 1.94, - "learning_rate": 9.657889824479973e-06, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015082469069238765, + "loss": 0.01, "step": 383660 }, { - "epoch": 1.94, - "learning_rate": 9.650322131465963e-06, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015082080247601616, + "loss": 0.0126, "step": 383670 }, { - "epoch": 1.94, - "learning_rate": 9.642754438451953e-06, - "loss": 0.0049, + "epoch": 0.99, + "learning_rate": 0.0001508169142596447, + "loss": 0.015, "step": 383680 }, { - "epoch": 1.94, - "learning_rate": 9.635186745437942e-06, - "loss": 0.0068, + "epoch": 0.99, + "learning_rate": 0.00015081302604327324, + "loss": 0.0209, "step": 383690 }, { - "epoch": 1.94, - "learning_rate": 9.627619052423932e-06, - "loss": 0.0036, + "epoch": 0.99, + "learning_rate": 0.0001508091378269018, + "loss": 0.0127, "step": 383700 }, { - "epoch": 1.94, - "learning_rate": 9.62005135940992e-06, - "loss": 0.0044, + "epoch": 0.99, + "learning_rate": 0.0001508052496105303, + "loss": 0.0144, "step": 383710 }, { - "epoch": 1.94, - "learning_rate": 9.61248366639591e-06, - "loss": 0.0053, + "epoch": 0.99, + "learning_rate": 0.00015080136139415884, + "loss": 0.0173, "step": 383720 }, { - "epoch": 1.94, - "learning_rate": 9.6049159733819e-06, - "loss": 0.0055, + "epoch": 0.99, + "learning_rate": 0.00015079747317778738, + "loss": 0.0117, "step": 383730 }, { - "epoch": 1.94, - "learning_rate": 9.59734828036789e-06, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015079358496141593, + "loss": 0.0108, "step": 383740 }, { - "epoch": 1.94, - "learning_rate": 9.58978058735388e-06, - "loss": 0.0042, + "epoch": 0.99, + "learning_rate": 0.00015078969674504444, + "loss": 0.0114, "step": 383750 }, { - "epoch": 1.94, - "learning_rate": 9.58221289433987e-06, - "loss": 0.0057, + "epoch": 0.99, + "learning_rate": 0.00015078580852867298, + "loss": 0.0105, "step": 383760 }, { - "epoch": 1.94, - "learning_rate": 9.57464520132586e-06, - "loss": 0.0045, + "epoch": 0.99, + "learning_rate": 0.00015078192031230155, + "loss": 0.0156, "step": 383770 }, { - "epoch": 1.94, - "learning_rate": 9.56707750831185e-06, - "loss": 0.0056, + "epoch": 0.99, + "learning_rate": 0.00015077803209593007, + "loss": 0.0161, "step": 383780 }, { - "epoch": 1.94, - "learning_rate": 9.559509815297838e-06, - "loss": 0.0051, + "epoch": 0.99, + "learning_rate": 0.0001507741438795586, + "loss": 0.0138, "step": 383790 }, { - "epoch": 1.94, - "learning_rate": 9.551942122283828e-06, - "loss": 0.006, + "epoch": 0.99, + "learning_rate": 0.00015077025566318712, + "loss": 0.0151, "step": 383800 }, { - "epoch": 1.94, - "learning_rate": 9.544374429269818e-06, - "loss": 0.0075, + "epoch": 0.99, + "learning_rate": 0.0001507663674468157, + "loss": 0.0129, "step": 383810 }, { - "epoch": 1.94, - "learning_rate": 9.536806736255808e-06, - "loss": 0.0054, + "epoch": 0.99, + "learning_rate": 0.0001507624792304442, + "loss": 0.0121, "step": 383820 }, { - "epoch": 1.94, - "learning_rate": 9.529239043241798e-06, - "loss": 0.0052, + "epoch": 0.99, + "learning_rate": 0.00015075859101407275, + "loss": 0.0115, "step": 383830 }, { - "epoch": 1.94, - "learning_rate": 9.521671350227788e-06, - "loss": 0.0061, + "epoch": 0.99, + "learning_rate": 0.00015075470279770126, + "loss": 0.0112, "step": 383840 }, { - "epoch": 1.94, - "learning_rate": 9.514103657213778e-06, - "loss": 0.0046, + "epoch": 0.99, + "learning_rate": 0.0001507508145813298, + "loss": 0.0095, "step": 383850 }, { - "epoch": 1.94, - "learning_rate": 9.506535964199768e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00015074692636495834, + "loss": 0.0146, "step": 383860 }, { - "epoch": 1.94, - "learning_rate": 9.498968271185754e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00015074303814858689, + "loss": 0.012, "step": 383870 }, { - "epoch": 1.94, - "learning_rate": 9.491400578171746e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.0001507391499322154, + "loss": 0.0118, "step": 383880 }, { - "epoch": 1.94, - "learning_rate": 9.483832885157736e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015073526171584394, + "loss": 0.0104, "step": 383890 }, { - "epoch": 1.94, - "learning_rate": 9.476265192143726e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00015073137349947248, + "loss": 0.0106, "step": 383900 }, { - "epoch": 1.94, - "learning_rate": 9.468697499129715e-06, - "loss": 0.009, + "epoch": 1.0, + "learning_rate": 0.00015072748528310103, + "loss": 0.0099, "step": 383910 }, { - "epoch": 1.94, - "learning_rate": 9.461129806115705e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015072359706672954, + "loss": 0.0112, "step": 383920 }, { - "epoch": 1.94, - "learning_rate": 9.453562113101695e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00015071970885035808, + "loss": 0.0108, "step": 383930 }, { - "epoch": 1.94, - "learning_rate": 9.445994420087682e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00015071582063398665, + "loss": 0.0096, "step": 383940 }, { - "epoch": 1.94, - "learning_rate": 9.438426727073672e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00015071193241761516, + "loss": 0.0128, "step": 383950 }, { - "epoch": 1.94, - "learning_rate": 9.430859034059662e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.0001507080442012437, + "loss": 0.0121, "step": 383960 }, { - "epoch": 1.94, - "learning_rate": 9.423291341045652e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015070415598487222, + "loss": 0.0115, "step": 383970 }, { - "epoch": 1.94, - "learning_rate": 9.415723648031641e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.0001507002677685008, + "loss": 0.0121, "step": 383980 }, { - "epoch": 1.94, - "learning_rate": 9.408155955017631e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001506963795521293, + "loss": 0.0113, "step": 383990 }, { - "epoch": 1.94, - "learning_rate": 9.400588262003621e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015069249133575785, + "loss": 0.0105, "step": 384000 }, { - "epoch": 1.94, - "eval_cer": 0.9144159137201398, - "eval_loss": 0.004220431204885244, - "eval_runtime": 116.4383, - "eval_samples_per_second": 17.176, - "eval_steps_per_second": 4.294, + "epoch": 1.0, + "eval_cer": 0.8817054855970361, + "eval_loss": 0.007804430089890957, + "eval_runtime": 107.5434, + "eval_samples_per_second": 18.597, + "eval_steps_per_second": 4.649, "step": 384000 }, { - "epoch": 1.94, - "learning_rate": 9.393020568989613e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00015068860311938636, + "loss": 0.0113, "step": 384010 }, { - "epoch": 1.94, - "learning_rate": 9.3854528759756e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015068471490301493, + "loss": 0.0136, "step": 384020 }, { - "epoch": 1.94, - "learning_rate": 9.37788518296159e-06, - "loss": 0.0034, + "epoch": 1.0, + "learning_rate": 0.00015068082668664344, + "loss": 0.0141, "step": 384030 }, { - "epoch": 1.94, - "learning_rate": 9.37031748994758e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015067693847027199, + "loss": 0.0123, "step": 384040 }, { - "epoch": 1.94, - "learning_rate": 9.36274979693357e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.0001506730502539005, + "loss": 0.0147, "step": 384050 }, { - "epoch": 1.94, - "learning_rate": 9.355182103919559e-06, - "loss": 0.0035, + "epoch": 1.0, + "learning_rate": 0.00015066916203752907, + "loss": 0.0108, "step": 384060 }, { - "epoch": 1.94, - "learning_rate": 9.347614410905549e-06, - "loss": 0.0055, - "step": 384070 + "epoch": 1.0, + "learning_rate": 0.00015066527382115758, + "loss": 0.0143, + "step": 384070 }, { - "epoch": 1.94, - "learning_rate": 9.340046717891539e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.00015066138560478612, + "loss": 0.0113, "step": 384080 }, { - "epoch": 1.94, - "learning_rate": 9.332479024877529e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00015065749738841464, + "loss": 0.0119, "step": 384090 }, { - "epoch": 1.94, - "learning_rate": 9.324911331863519e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00015065360917204318, + "loss": 0.0123, "step": 384100 }, { - "epoch": 1.94, - "learning_rate": 9.317343638849509e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00015064972095567175, + "loss": 0.0116, "step": 384110 }, { - "epoch": 1.94, - "learning_rate": 9.309775945835497e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00015064583273930026, + "loss": 0.01, "step": 384120 }, { - "epoch": 1.94, - "learning_rate": 9.302208252821487e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001506419445229288, + "loss": 0.0107, "step": 384130 }, { - "epoch": 1.94, - "learning_rate": 9.294640559807477e-06, - "loss": 0.0073, + "epoch": 1.0, + "learning_rate": 0.00015063805630655732, + "loss": 0.0083, "step": 384140 }, { - "epoch": 1.94, - "learning_rate": 9.287072866793467e-06, - "loss": 0.0071, + "epoch": 1.0, + "learning_rate": 0.0001506341680901859, + "loss": 0.0102, "step": 384150 }, { - "epoch": 1.94, - "learning_rate": 9.279505173779457e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.0001506302798738144, + "loss": 0.0103, "step": 384160 }, { - "epoch": 1.94, - "learning_rate": 9.271937480765446e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015062639165744295, + "loss": 0.0144, "step": 384170 }, { - "epoch": 1.94, - "learning_rate": 9.264369787751436e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00015062250344107146, + "loss": 0.0112, "step": 384180 }, { - "epoch": 1.94, - "learning_rate": 9.256802094737426e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015061861522470003, + "loss": 0.0129, "step": 384190 }, { - "epoch": 1.94, - "learning_rate": 9.249234401723414e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00015061472700832854, + "loss": 0.0132, "step": 384200 }, { - "epoch": 1.94, - "learning_rate": 9.241666708709404e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015061083879195708, + "loss": 0.01, "step": 384210 }, { - "epoch": 1.94, - "learning_rate": 9.234099015695394e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.0001506069505755856, + "loss": 0.0116, "step": 384220 }, { - "epoch": 1.94, - "learning_rate": 9.226531322681384e-06, - "loss": 0.0039, + "epoch": 1.0, + "learning_rate": 0.00015060306235921417, + "loss": 0.0119, "step": 384230 }, { - "epoch": 1.94, - "learning_rate": 9.218963629667374e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015059917414284268, + "loss": 0.0107, "step": 384240 }, { - "epoch": 1.94, - "learning_rate": 9.211395936653364e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015059528592647122, + "loss": 0.0119, "step": 384250 }, { - "epoch": 1.94, - "learning_rate": 9.203828243639354e-06, - "loss": 0.0073, + "epoch": 1.0, + "learning_rate": 0.00015059139771009974, + "loss": 0.0129, "step": 384260 }, { - "epoch": 1.94, - "learning_rate": 9.196260550625344e-06, - "loss": 0.0076, + "epoch": 1.0, + "learning_rate": 0.0001505875094937283, + "loss": 0.014, "step": 384270 }, { - "epoch": 1.94, - "learning_rate": 9.188692857611332e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00015058362127735685, + "loss": 0.011, "step": 384280 }, { - "epoch": 1.94, - "learning_rate": 9.181125164597322e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00015057973306098536, + "loss": 0.0124, "step": 384290 }, { - "epoch": 1.94, - "learning_rate": 9.173557471583312e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00015057584484461388, + "loss": 0.0145, "step": 384300 }, { - "epoch": 1.94, - "learning_rate": 9.165989778569302e-06, - "loss": 0.004, + "epoch": 1.0, + "learning_rate": 0.00015057195662824245, + "loss": 0.0105, "step": 384310 }, { - "epoch": 1.94, - "learning_rate": 9.158422085555292e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.000150568068411871, + "loss": 0.0187, "step": 384320 }, { - "epoch": 1.94, - "learning_rate": 9.150854392541282e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.0001505641801954995, + "loss": 0.0113, "step": 384330 }, { - "epoch": 1.94, - "learning_rate": 9.143286699527272e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015056029197912804, + "loss": 0.0134, "step": 384340 }, { - "epoch": 1.94, - "learning_rate": 9.135719006513261e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00015055640376275656, + "loss": 0.012, "step": 384350 }, { - "epoch": 1.94, - "learning_rate": 9.12815131349925e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00015055251554638513, + "loss": 0.0111, "step": 384360 }, { - "epoch": 1.94, - "learning_rate": 9.12058362048524e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00015054862733001364, + "loss": 0.0099, "step": 384370 }, { - "epoch": 1.94, - "learning_rate": 9.11301592747123e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015054473911364218, + "loss": 0.0109, "step": 384380 }, { - "epoch": 1.94, - "learning_rate": 9.10544823445722e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.0001505408508972707, + "loss": 0.0145, "step": 384390 }, { - "epoch": 1.94, - "learning_rate": 9.097880541443208e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.00015053696268089927, + "loss": 0.0145, "step": 384400 }, { - "epoch": 1.94, - "learning_rate": 9.090312848429198e-06, - "loss": 0.004, + "epoch": 1.0, + "learning_rate": 0.00015053307446452778, + "loss": 0.0165, "step": 384410 }, { - "epoch": 1.94, - "learning_rate": 9.082745155415187e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015052918624815632, + "loss": 0.0141, "step": 384420 }, { - "epoch": 1.94, - "learning_rate": 9.075177462401179e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00015052529803178484, + "loss": 0.013, "step": 384430 }, { - "epoch": 1.94, - "learning_rate": 9.067609769387167e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.0001505214098154134, + "loss": 0.0132, "step": 384440 }, { - "epoch": 1.94, - "learning_rate": 9.060042076373157e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.00015051752159904192, + "loss": 0.0123, "step": 384450 }, { - "epoch": 1.94, - "learning_rate": 9.052474383359147e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00015051363338267046, + "loss": 0.0123, "step": 384460 }, { - "epoch": 1.94, - "learning_rate": 9.044906690345135e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.00015050974516629898, + "loss": 0.0157, "step": 384470 }, { - "epoch": 1.94, - "learning_rate": 9.037338997331125e-06, - "loss": 0.0043, + "epoch": 1.0, + "learning_rate": 0.00015050585694992755, + "loss": 0.014, "step": 384480 }, { - "epoch": 1.94, - "learning_rate": 9.029771304317115e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.0001505019687335561, + "loss": 0.0114, "step": 384490 }, { - "epoch": 1.94, - "learning_rate": 9.022203611303105e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001504980805171846, + "loss": 0.0138, "step": 384500 }, { - "epoch": 1.94, - "learning_rate": 9.014635918289095e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015049419230081314, + "loss": 0.0127, "step": 384510 }, { - "epoch": 1.94, - "learning_rate": 9.007068225275085e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00015049030408444169, + "loss": 0.0106, "step": 384520 }, { - "epoch": 1.94, - "learning_rate": 8.999500532261075e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00015048641586807023, + "loss": 0.0103, "step": 384530 }, { - "epoch": 1.94, - "learning_rate": 8.991932839247065e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015048252765169874, + "loss": 0.0133, "step": 384540 }, { - "epoch": 1.94, - "learning_rate": 8.984365146233053e-06, - "loss": 0.0083, + "epoch": 1.0, + "learning_rate": 0.00015047863943532728, + "loss": 0.0101, "step": 384550 }, { - "epoch": 1.94, - "learning_rate": 8.976797453219043e-06, - "loss": 0.0074, + "epoch": 1.0, + "learning_rate": 0.00015047475121895583, + "loss": 0.0129, "step": 384560 }, { - "epoch": 1.94, - "learning_rate": 8.969229760205033e-06, - "loss": 0.004, + "epoch": 1.0, + "learning_rate": 0.00015047086300258437, + "loss": 0.011, "step": 384570 }, { - "epoch": 1.94, - "learning_rate": 8.961662067191023e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015046697478621288, + "loss": 0.0148, "step": 384580 }, { - "epoch": 1.94, - "learning_rate": 8.954094374177013e-06, - "loss": 0.0074, + "epoch": 1.0, + "learning_rate": 0.00015046308656984142, + "loss": 0.014, "step": 384590 }, { - "epoch": 1.94, - "learning_rate": 8.946526681163003e-06, - "loss": 0.0044, + "epoch": 1.0, + "learning_rate": 0.00015045919835346994, + "loss": 0.0102, "step": 384600 }, { - "epoch": 1.94, - "learning_rate": 8.938958988148992e-06, - "loss": 0.0072, + "epoch": 1.0, + "learning_rate": 0.0001504553101370985, + "loss": 0.0137, "step": 384610 }, { - "epoch": 1.94, - "learning_rate": 8.931391295134982e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015045142192072702, + "loss": 0.0123, "step": 384620 }, { - "epoch": 1.94, - "learning_rate": 8.92382360212097e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00015044753370435556, + "loss": 0.0105, "step": 384630 }, { - "epoch": 1.94, - "learning_rate": 8.91625590910696e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00015044364548798408, + "loss": 0.0161, "step": 384640 }, { - "epoch": 1.94, - "learning_rate": 8.90868821609295e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015043975727161265, + "loss": 0.0134, "step": 384650 }, { - "epoch": 1.94, - "learning_rate": 8.90112052307894e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.0001504358690552412, + "loss": 0.0097, "step": 384660 }, { - "epoch": 1.94, - "learning_rate": 8.89355283006493e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.0001504319808388697, + "loss": 0.0136, "step": 384670 }, { - "epoch": 1.94, - "learning_rate": 8.88598513705092e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00015042809262249824, + "loss": 0.013, "step": 384680 }, { - "epoch": 1.94, - "learning_rate": 8.87841744403691e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015042420440612679, + "loss": 0.0129, "step": 384690 }, { - "epoch": 1.94, - "learning_rate": 8.8708497510229e-06, - "loss": 0.0072, + "epoch": 1.0, + "learning_rate": 0.00015042031618975533, + "loss": 0.0158, "step": 384700 }, { - "epoch": 1.94, - "learning_rate": 8.863282058008888e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015041642797338384, + "loss": 0.0154, "step": 384710 }, { - "epoch": 1.94, - "learning_rate": 8.855714364994878e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00015041253975701238, + "loss": 0.0128, "step": 384720 }, { - "epoch": 1.94, - "learning_rate": 8.848146671980868e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00015040865154064092, + "loss": 0.0132, "step": 384730 }, { - "epoch": 1.94, - "learning_rate": 8.840578978966858e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00015040476332426947, + "loss": 0.0127, "step": 384740 }, { - "epoch": 1.94, - "learning_rate": 8.833011285952848e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015040087510789798, + "loss": 0.0137, "step": 384750 }, { - "epoch": 1.94, - "learning_rate": 8.825443592938838e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00015039698689152652, + "loss": 0.011, "step": 384760 }, { - "epoch": 1.94, - "learning_rate": 8.817875899924828e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00015039309867515506, + "loss": 0.013, "step": 384770 }, { - "epoch": 1.94, - "learning_rate": 8.810308206910818e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.0001503892104587836, + "loss": 0.0136, "step": 384780 }, { - "epoch": 1.94, - "learning_rate": 8.802740513896806e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015038532224241212, + "loss": 0.013, "step": 384790 }, { - "epoch": 1.94, - "learning_rate": 8.795172820882796e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015038143402604066, + "loss": 0.0152, "step": 384800 }, { - "epoch": 1.94, - "learning_rate": 8.787605127868786e-06, - "loss": 0.0076, + "epoch": 1.0, + "learning_rate": 0.00015037754580966923, + "loss": 0.0136, "step": 384810 }, { - "epoch": 1.94, - "learning_rate": 8.780037434854776e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.00015037365759329775, + "loss": 0.0135, "step": 384820 }, { - "epoch": 1.94, - "learning_rate": 8.772469741840764e-06, - "loss": 0.0071, + "epoch": 1.0, + "learning_rate": 0.0001503697693769263, + "loss": 0.0113, "step": 384830 }, { - "epoch": 1.94, - "learning_rate": 8.764902048826754e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.0001503658811605548, + "loss": 0.0111, "step": 384840 }, { - "epoch": 1.94, - "learning_rate": 8.757334355812745e-06, - "loss": 0.0088, + "epoch": 1.0, + "learning_rate": 0.00015036199294418332, + "loss": 0.0124, "step": 384850 }, { - "epoch": 1.94, - "learning_rate": 8.749766662798735e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015035810472781188, + "loss": 0.0149, "step": 384860 }, { - "epoch": 1.94, - "learning_rate": 8.742198969784723e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015035421651144043, + "loss": 0.0117, "step": 384870 }, { - "epoch": 1.94, - "learning_rate": 8.734631276770713e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00015035032829506894, + "loss": 0.0097, "step": 384880 }, { - "epoch": 1.94, - "learning_rate": 8.727063583756703e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015034644007869748, + "loss": 0.0115, "step": 384890 }, { - "epoch": 1.94, - "learning_rate": 8.719495890742693e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015034255186232602, + "loss": 0.0122, "step": 384900 }, { - "epoch": 1.94, - "learning_rate": 8.711928197728681e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015033866364595457, + "loss": 0.0114, "step": 384910 }, { - "epoch": 1.94, - "learning_rate": 8.704360504714671e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015033477542958308, + "loss": 0.0139, "step": 384920 }, { - "epoch": 1.94, - "learning_rate": 8.696792811700661e-06, - "loss": 0.0088, + "epoch": 1.0, + "learning_rate": 0.00015033088721321162, + "loss": 0.0123, "step": 384930 }, { - "epoch": 1.94, - "learning_rate": 8.689225118686651e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015032699899684016, + "loss": 0.0112, "step": 384940 }, { - "epoch": 1.94, - "learning_rate": 8.681657425672641e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.0001503231107804687, + "loss": 0.0172, "step": 384950 }, { - "epoch": 1.94, - "learning_rate": 8.674089732658631e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00015031922256409722, + "loss": 0.0141, "step": 384960 }, { - "epoch": 1.94, - "learning_rate": 8.66652203964462e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015031533434772576, + "loss": 0.0112, "step": 384970 }, { - "epoch": 1.94, - "learning_rate": 8.65895434663061e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00015031144613135433, + "loss": 0.0193, "step": 384980 }, { - "epoch": 1.94, - "learning_rate": 8.651386653616599e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00015030755791498284, + "loss": 0.0177, "step": 384990 }, { - "epoch": 1.94, - "learning_rate": 8.643818960602589e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00015030366969861139, + "loss": 0.0152, "step": 385000 }, { - "epoch": 1.94, - "eval_cer": 0.914423676889143, - "eval_loss": 0.0041769566014409065, - "eval_runtime": 116.103, - "eval_samples_per_second": 17.226, - "eval_steps_per_second": 4.307, + "epoch": 1.0, + "eval_cer": 0.8817684692590742, + "eval_loss": 0.00825272686779499, + "eval_runtime": 107.6549, + "eval_samples_per_second": 18.578, + "eval_steps_per_second": 4.644, "step": 385000 }, { - "epoch": 1.94, - "learning_rate": 8.636251267588579e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.0001502997814822399, + "loss": 0.0123, "step": 385010 }, { - "epoch": 1.94, - "learning_rate": 8.628683574574569e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00015029589326586847, + "loss": 0.0152, "step": 385020 }, { - "epoch": 1.94, - "learning_rate": 8.621115881560559e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015029200504949698, + "loss": 0.0131, "step": 385030 }, { - "epoch": 1.94, - "learning_rate": 8.613548188546549e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00015028811683312553, + "loss": 0.0146, "step": 385040 }, { - "epoch": 1.94, - "learning_rate": 8.605980495532538e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015028422861675404, + "loss": 0.0111, "step": 385050 }, { - "epoch": 1.94, - "learning_rate": 8.598412802518527e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.0001502803404003826, + "loss": 0.0283, "step": 385060 }, { - "epoch": 1.94, - "learning_rate": 8.590845109504517e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00015027645218401112, + "loss": 0.0101, "step": 385070 }, { - "epoch": 1.94, - "learning_rate": 8.583277416490506e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00015027256396763967, + "loss": 0.0164, "step": 385080 }, { - "epoch": 1.94, - "learning_rate": 8.575709723476496e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015026867575126818, + "loss": 0.0117, "step": 385090 }, { - "epoch": 1.94, - "learning_rate": 8.568142030462486e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00015026478753489672, + "loss": 0.0097, "step": 385100 }, { - "epoch": 1.94, - "learning_rate": 8.560574337448476e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015026089931852526, + "loss": 0.0122, "step": 385110 }, { - "epoch": 1.94, - "learning_rate": 8.553006644434466e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.0001502570111021538, + "loss": 0.0146, "step": 385120 }, { - "epoch": 1.94, - "learning_rate": 8.545438951420456e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00015025312288578232, + "loss": 0.0125, "step": 385130 }, { - "epoch": 1.94, - "learning_rate": 8.537871258406444e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00015024923466941086, + "loss": 0.0106, "step": 385140 }, { - "epoch": 1.94, - "learning_rate": 8.530303565392434e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00015024534645303943, + "loss": 0.0127, "step": 385150 }, { - "epoch": 1.94, - "learning_rate": 8.522735872378424e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00015024145823666794, + "loss": 0.0134, "step": 385160 }, { - "epoch": 1.94, - "learning_rate": 8.515168179364414e-06, - "loss": 0.0073, + "epoch": 1.0, + "learning_rate": 0.00015023757002029646, + "loss": 0.0124, "step": 385170 }, { - "epoch": 1.94, - "learning_rate": 8.507600486350404e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.000150233681803925, + "loss": 0.01, "step": 385180 }, { - "epoch": 1.94, - "learning_rate": 8.500032793336394e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015022979358755357, + "loss": 0.0133, "step": 385190 }, { - "epoch": 1.94, - "learning_rate": 8.492465100322384e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00015022590537118208, + "loss": 0.0118, "step": 385200 }, { - "epoch": 1.94, - "learning_rate": 8.484897407308374e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015022201715481063, + "loss": 0.0146, "step": 385210 }, { - "epoch": 1.94, - "learning_rate": 8.477329714294362e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00015021812893843914, + "loss": 0.0123, "step": 385220 }, { - "epoch": 1.94, - "learning_rate": 8.469762021280352e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.0001502142407220677, + "loss": 0.0109, "step": 385230 }, { - "epoch": 1.94, - "learning_rate": 8.462194328266342e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00015021035250569622, + "loss": 0.0147, "step": 385240 }, { - "epoch": 1.94, - "learning_rate": 8.454626635252332e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00015020646428932476, + "loss": 0.0116, "step": 385250 }, { - "epoch": 1.94, - "learning_rate": 8.44705894223832e-06, - "loss": 0.0072, + "epoch": 1.0, + "learning_rate": 0.00015020257607295328, + "loss": 0.0148, "step": 385260 }, { - "epoch": 1.94, - "learning_rate": 8.439491249224311e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015019868785658185, + "loss": 0.0129, "step": 385270 }, { - "epoch": 1.94, - "learning_rate": 8.431923556210301e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015019479964021036, + "loss": 0.0109, "step": 385280 }, { - "epoch": 1.94, - "learning_rate": 8.424355863196291e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.0001501909114238389, + "loss": 0.0143, "step": 385290 }, { - "epoch": 1.94, - "learning_rate": 8.41678817018228e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00015018702320746742, + "loss": 0.0145, "step": 385300 }, { - "epoch": 1.94, - "learning_rate": 8.40922047716827e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015018313499109596, + "loss": 0.0175, "step": 385310 }, { - "epoch": 1.94, - "learning_rate": 8.40165278415426e-06, - "loss": 0.0039, + "epoch": 1.0, + "learning_rate": 0.0001501792467747245, + "loss": 0.0132, "step": 385320 }, { - "epoch": 1.94, - "learning_rate": 8.39408509114025e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.00015017535855835304, + "loss": 0.0113, "step": 385330 }, { - "epoch": 1.94, - "learning_rate": 8.386517398126237e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00015017147034198156, + "loss": 0.0115, "step": 385340 }, { - "epoch": 1.94, - "learning_rate": 8.378949705112227e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.0001501675821256101, + "loss": 0.0132, "step": 385350 }, { - "epoch": 1.94, - "learning_rate": 8.371382012098217e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00015016369390923867, + "loss": 0.0101, "step": 385360 }, { - "epoch": 1.94, - "learning_rate": 8.363814319084207e-06, - "loss": 0.0114, + "epoch": 1.0, + "learning_rate": 0.00015015980569286718, + "loss": 0.0134, "step": 385370 }, { - "epoch": 1.94, - "learning_rate": 8.356246626070197e-06, - "loss": 0.0044, + "epoch": 1.0, + "learning_rate": 0.00015015591747649572, + "loss": 0.0125, "step": 385380 }, { - "epoch": 1.94, - "learning_rate": 8.348678933056187e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00015015202926012424, + "loss": 0.0112, "step": 385390 }, { - "epoch": 1.94, - "learning_rate": 8.341111240042177e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.0001501481410437528, + "loss": 0.0132, "step": 385400 }, { - "epoch": 1.94, - "learning_rate": 8.333543547028167e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015014425282738132, + "loss": 0.0116, "step": 385410 }, { - "epoch": 1.94, - "learning_rate": 8.325975854014155e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015014036461100986, + "loss": 0.013, "step": 385420 }, { - "epoch": 1.94, - "learning_rate": 8.318408161000145e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015013647639463838, + "loss": 0.0124, "step": 385430 }, { - "epoch": 1.94, - "learning_rate": 8.310840467986135e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015013258817826695, + "loss": 0.0119, "step": 385440 }, { - "epoch": 1.94, - "learning_rate": 8.303272774972125e-06, - "loss": 0.0039, + "epoch": 1.0, + "learning_rate": 0.00015012869996189546, + "loss": 0.0138, "step": 385450 }, { - "epoch": 1.94, - "learning_rate": 8.295705081958115e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.000150124811745524, + "loss": 0.0112, "step": 385460 }, { - "epoch": 1.94, - "learning_rate": 8.288137388944105e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00015012092352915252, + "loss": 0.0169, "step": 385470 }, { - "epoch": 1.94, - "learning_rate": 8.280569695930095e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.0001501170353127811, + "loss": 0.0123, "step": 385480 }, { - "epoch": 1.94, - "learning_rate": 8.273002002916084e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.0001501131470964096, + "loss": 0.0102, "step": 385490 }, { - "epoch": 1.94, - "learning_rate": 8.265434309902073e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00015010925888003814, + "loss": 0.014, "step": 385500 }, { - "epoch": 1.94, - "learning_rate": 8.257866616888063e-06, - "loss": 0.0079, + "epoch": 1.0, + "learning_rate": 0.00015010537066366666, + "loss": 0.0085, "step": 385510 }, { - "epoch": 1.94, - "learning_rate": 8.250298923874052e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00015010148244729523, + "loss": 0.0164, "step": 385520 }, { - "epoch": 1.95, - "learning_rate": 8.242731230860042e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015009759423092377, + "loss": 0.0149, "step": 385530 }, { - "epoch": 1.95, - "learning_rate": 8.235163537846032e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.00015009370601455228, + "loss": 0.0147, "step": 385540 }, { - "epoch": 1.95, - "learning_rate": 8.227595844832022e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00015008981779818082, + "loss": 0.0134, "step": 385550 }, { - "epoch": 1.95, - "learning_rate": 8.220028151818012e-06, - "loss": 0.0094, + "epoch": 1.0, + "learning_rate": 0.00015008592958180934, + "loss": 0.0155, "step": 385560 }, { - "epoch": 1.95, - "learning_rate": 8.212460458804e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.0001500820413654379, + "loss": 0.0123, "step": 385570 }, { - "epoch": 1.95, - "learning_rate": 8.20489276578999e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00015007815314906642, + "loss": 0.0111, "step": 385580 }, { - "epoch": 1.95, - "learning_rate": 8.19732507277598e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015007426493269496, + "loss": 0.01, "step": 385590 }, { - "epoch": 1.95, - "learning_rate": 8.18975737976197e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015007037671632348, + "loss": 0.0141, "step": 385600 }, { - "epoch": 1.95, - "learning_rate": 8.18218968674796e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00015006648849995205, + "loss": 0.0108, "step": 385610 }, { - "epoch": 1.95, - "learning_rate": 8.17462199373395e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00015006260028358056, + "loss": 0.0098, "step": 385620 }, { - "epoch": 1.95, - "learning_rate": 8.16705430071994e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.0001500587120672091, + "loss": 0.014, "step": 385630 }, { - "epoch": 1.95, - "learning_rate": 8.15948660770593e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00015005482385083762, + "loss": 0.0129, "step": 385640 }, { - "epoch": 1.95, - "learning_rate": 8.151918914691918e-06, - "loss": 0.0042, + "epoch": 1.0, + "learning_rate": 0.00015005093563446619, + "loss": 0.0148, "step": 385650 }, { - "epoch": 1.95, - "learning_rate": 8.144351221677908e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001500470474180947, + "loss": 0.014, "step": 385660 }, { - "epoch": 1.95, - "learning_rate": 8.136783528663898e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015004315920172324, + "loss": 0.0143, "step": 385670 }, { - "epoch": 1.95, - "learning_rate": 8.129215835649888e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00015003927098535176, + "loss": 0.0189, "step": 385680 }, { - "epoch": 1.95, - "learning_rate": 8.121648142635878e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00015003538276898033, + "loss": 0.0143, "step": 385690 }, { - "epoch": 1.95, - "learning_rate": 8.114080449621868e-06, - "loss": 0.0077, + "epoch": 1.0, + "learning_rate": 0.00015003149455260887, + "loss": 0.0148, "step": 385700 }, { - "epoch": 1.95, - "learning_rate": 8.106512756607857e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00015002760633623738, + "loss": 0.0109, "step": 385710 }, { - "epoch": 1.95, - "learning_rate": 8.098945063593847e-06, - "loss": 0.0086, + "epoch": 1.0, + "learning_rate": 0.0001500237181198659, + "loss": 0.0114, "step": 385720 }, { - "epoch": 1.95, - "learning_rate": 8.091377370579836e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015001982990349447, + "loss": 0.0103, "step": 385730 }, { - "epoch": 1.95, - "learning_rate": 8.083809677565825e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.000150015941687123, + "loss": 0.0139, "step": 385740 }, { - "epoch": 1.95, - "learning_rate": 8.076241984551815e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00015001205347075152, + "loss": 0.0154, "step": 385750 }, { - "epoch": 1.95, - "learning_rate": 8.068674291537805e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00015000816525438006, + "loss": 0.0091, "step": 385760 }, { - "epoch": 1.95, - "learning_rate": 8.061106598523794e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.0001500042770380086, + "loss": 0.0138, "step": 385770 }, { - "epoch": 1.95, - "learning_rate": 8.053538905509783e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00015000038882163715, + "loss": 0.0131, "step": 385780 }, { - "epoch": 1.95, - "learning_rate": 8.045971212495773e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014999650060526566, + "loss": 0.0111, "step": 385790 }, { - "epoch": 1.95, - "learning_rate": 8.038403519481763e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.0001499926123888942, + "loss": 0.0114, "step": 385800 }, { - "epoch": 1.95, - "learning_rate": 8.030835826467753e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014998872417252274, + "loss": 0.0098, "step": 385810 }, { - "epoch": 1.95, - "learning_rate": 8.023268133453743e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014998483595615126, + "loss": 0.0126, "step": 385820 }, { - "epoch": 1.95, - "learning_rate": 8.015700440439733e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.0001499809477397798, + "loss": 0.0163, "step": 385830 }, { - "epoch": 1.95, - "learning_rate": 8.008132747425723e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014997705952340834, + "loss": 0.0095, "step": 385840 }, { - "epoch": 1.95, - "learning_rate": 8.000565054411711e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00014997317130703688, + "loss": 0.0119, "step": 385850 }, { - "epoch": 1.95, - "learning_rate": 7.992997361397701e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.0001499692830906654, + "loss": 0.0107, "step": 385860 }, { - "epoch": 1.95, - "learning_rate": 7.985429668383691e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014996539487429397, + "loss": 0.0109, "step": 385870 }, { - "epoch": 1.95, - "learning_rate": 7.977861975369681e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014996150665792248, + "loss": 0.0148, "step": 385880 }, { - "epoch": 1.95, - "learning_rate": 7.97029428235567e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00014995761844155102, + "loss": 0.0087, "step": 385890 }, { - "epoch": 1.95, - "learning_rate": 7.96272658934166e-06, - "loss": 0.0068, + "epoch": 1.0, + "learning_rate": 0.00014995373022517956, + "loss": 0.0119, "step": 385900 }, { - "epoch": 1.95, - "learning_rate": 7.95515889632765e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.0001499498420088081, + "loss": 0.0113, "step": 385910 }, { - "epoch": 1.95, - "learning_rate": 7.94759120331364e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014994595379243662, + "loss": 0.0124, "step": 385920 }, { - "epoch": 1.95, - "learning_rate": 7.940023510299629e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00014994206557606516, + "loss": 0.0123, "step": 385930 }, { - "epoch": 1.95, - "learning_rate": 7.932455817285619e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.0001499381773596937, + "loss": 0.0094, "step": 385940 }, { - "epoch": 1.95, - "learning_rate": 7.924888124271609e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00014993428914332225, + "loss": 0.0124, "step": 385950 }, { - "epoch": 1.95, - "learning_rate": 7.917320431257598e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00014993040092695076, + "loss": 0.0124, "step": 385960 }, { - "epoch": 1.95, - "learning_rate": 7.909752738243588e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.0001499265127105793, + "loss": 0.0127, "step": 385970 }, { - "epoch": 1.95, - "learning_rate": 7.902185045229578e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00014992262449420784, + "loss": 0.0145, "step": 385980 }, { - "epoch": 1.95, - "learning_rate": 7.894617352215568e-06, - "loss": 0.0071, + "epoch": 1.0, + "learning_rate": 0.00014991873627783639, + "loss": 0.0126, "step": 385990 }, { - "epoch": 1.95, - "learning_rate": 7.887049659201558e-06, - "loss": 0.0072, + "epoch": 1.0, + "learning_rate": 0.0001499148480614649, + "loss": 0.0114, "step": 386000 }, { - "epoch": 1.95, - "eval_cer": 0.9144178545123905, - "eval_loss": 0.0041864411905407906, - "eval_runtime": 116.4755, - "eval_samples_per_second": 17.171, - "eval_steps_per_second": 4.293, + "epoch": 1.0, + "eval_cer": 0.8817152830555753, + "eval_loss": 0.008142529986798763, + "eval_runtime": 108.5328, + "eval_samples_per_second": 18.428, + "eval_steps_per_second": 4.607, "step": 386000 }, { - "epoch": 1.95, - "learning_rate": 7.879481966187546e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014991095984509344, + "loss": 0.0097, "step": 386010 }, { - "epoch": 1.95, - "learning_rate": 7.871914273173536e-06, - "loss": 0.0031, + "epoch": 1.0, + "learning_rate": 0.00014990707162872198, + "loss": 0.0101, "step": 386020 }, { - "epoch": 1.95, - "learning_rate": 7.864346580159526e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014990318341235052, + "loss": 0.0224, "step": 386030 }, { - "epoch": 1.95, - "learning_rate": 7.856778887145516e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00014989929519597904, + "loss": 0.011, "step": 386040 }, { - "epoch": 1.95, - "learning_rate": 7.849211194131506e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.0001498954069796076, + "loss": 0.009, "step": 386050 }, { - "epoch": 1.95, - "learning_rate": 7.841643501117496e-06, - "loss": 0.0035, + "epoch": 1.0, + "learning_rate": 0.00014989151876323612, + "loss": 0.0136, "step": 386060 }, { - "epoch": 1.95, - "learning_rate": 7.834075808103486e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00014988763054686466, + "loss": 0.0163, "step": 386070 }, { - "epoch": 1.95, - "learning_rate": 7.826508115089476e-06, - "loss": 0.0037, + "epoch": 1.0, + "learning_rate": 0.0001498837423304932, + "loss": 0.0121, "step": 386080 }, { - "epoch": 1.95, - "learning_rate": 7.818940422075464e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00014987985411412172, + "loss": 0.0124, "step": 386090 }, { - "epoch": 1.95, - "learning_rate": 7.811372729061454e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00014987596589775026, + "loss": 0.0129, "step": 386100 }, { - "epoch": 1.95, - "learning_rate": 7.803805036047444e-06, - "loss": 0.0043, + "epoch": 1.0, + "learning_rate": 0.0001498720776813788, + "loss": 0.01, "step": 386110 }, { - "epoch": 1.95, - "learning_rate": 7.796237343033434e-06, - "loss": 0.0041, + "epoch": 1.0, + "learning_rate": 0.00014986818946500735, + "loss": 0.0123, "step": 386120 }, { - "epoch": 1.95, - "learning_rate": 7.788669650019424e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014986430124863586, + "loss": 0.0117, "step": 386130 }, { - "epoch": 1.95, - "learning_rate": 7.781101957005414e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.0001498604130322644, + "loss": 0.0137, "step": 386140 }, { - "epoch": 1.95, - "learning_rate": 7.773534263991403e-06, - "loss": 0.0076, + "epoch": 1.0, + "learning_rate": 0.00014985652481589294, + "loss": 0.0128, "step": 386150 }, { - "epoch": 1.95, - "learning_rate": 7.765966570977392e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014985263659952148, + "loss": 0.0109, "step": 386160 }, { - "epoch": 1.95, - "learning_rate": 7.758398877963382e-06, - "loss": 0.0044, + "epoch": 1.0, + "learning_rate": 0.00014984874838315, + "loss": 0.0151, "step": 386170 }, { - "epoch": 1.95, - "learning_rate": 7.750831184949371e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00014984486016677854, + "loss": 0.0159, "step": 386180 }, { - "epoch": 1.95, - "learning_rate": 7.743263491935361e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00014984097195040708, + "loss": 0.0119, "step": 386190 }, { - "epoch": 1.95, - "learning_rate": 7.73569579892135e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014983708373403562, + "loss": 0.0076, "step": 386200 }, { - "epoch": 1.95, - "learning_rate": 7.72812810590734e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00014983319551766414, + "loss": 0.0124, "step": 386210 }, { - "epoch": 1.95, - "learning_rate": 7.72056041289333e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.0001498293073012927, + "loss": 0.0112, "step": 386220 }, { - "epoch": 1.95, - "learning_rate": 7.71299271987932e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014982541908492122, + "loss": 0.0115, "step": 386230 }, { - "epoch": 1.95, - "learning_rate": 7.70542502686531e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00014982153086854976, + "loss": 0.0139, "step": 386240 }, { - "epoch": 1.95, - "learning_rate": 7.6978573338513e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.0001498176426521783, + "loss": 0.0147, "step": 386250 }, { - "epoch": 1.95, - "learning_rate": 7.690289640837289e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014981375443580685, + "loss": 0.0116, "step": 386260 }, { - "epoch": 1.95, - "learning_rate": 7.682721947823279e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014980986621943536, + "loss": 0.0134, "step": 386270 }, { - "epoch": 1.95, - "learning_rate": 7.675154254809267e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.0001498059780030639, + "loss": 0.0308, "step": 386280 }, { - "epoch": 1.95, - "learning_rate": 7.667586561795257e-06, - "loss": 0.004, + "epoch": 1.0, + "learning_rate": 0.00014980208978669244, + "loss": 0.0141, "step": 386290 }, { - "epoch": 1.95, - "learning_rate": 7.660018868781247e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014979820157032099, + "loss": 0.104, "step": 386300 }, { - "epoch": 1.95, - "learning_rate": 7.652451175767237e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.0001497943133539495, + "loss": 0.5434, "step": 386310 }, { - "epoch": 1.95, - "learning_rate": 7.644883482753227e-06, - "loss": 0.0043, + "epoch": 1.0, + "learning_rate": 0.00014979042513757804, + "loss": 1.8435, "step": 386320 }, { - "epoch": 1.95, - "learning_rate": 7.637315789739217e-06, - "loss": 0.0044, + "epoch": 1.0, + "learning_rate": 0.00014978653692120658, + "loss": 2.0344, "step": 386330 }, { - "epoch": 1.95, - "learning_rate": 7.629748096725207e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.0001497826487048351, + "loss": 0.1523, "step": 386340 }, { - "epoch": 1.95, - "learning_rate": 7.622180403711197e-06, - "loss": 0.0067, + "epoch": 1.0, + "learning_rate": 0.00014977876048846364, + "loss": 0.0122, "step": 386350 }, { - "epoch": 1.95, - "learning_rate": 7.614612710697186e-06, - "loss": 0.0038, + "epoch": 1.0, + "learning_rate": 0.00014977487227209218, + "loss": 0.014, "step": 386360 }, { - "epoch": 1.95, - "learning_rate": 7.607045017683176e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00014977098405572072, + "loss": 0.0085, "step": 386370 }, { - "epoch": 1.95, - "learning_rate": 7.5994773246691655e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00014976709583934924, + "loss": 0.0128, "step": 386380 }, { - "epoch": 1.95, - "learning_rate": 7.591909631655155e-06, - "loss": 0.0039, + "epoch": 1.0, + "learning_rate": 0.0001497632076229778, + "loss": 0.0133, "step": 386390 }, { - "epoch": 1.95, - "learning_rate": 7.584341938641144e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014975931940660632, + "loss": 0.0289, "step": 386400 }, { - "epoch": 1.95, - "learning_rate": 7.5767742456271335e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014975543119023486, + "loss": 0.0107, "step": 386410 }, { - "epoch": 1.95, - "learning_rate": 7.569206552613124e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.0001497515429738634, + "loss": 0.0279, "step": 386420 }, { - "epoch": 1.95, - "learning_rate": 7.561638859599114e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014974765475749195, + "loss": 0.0266, "step": 386430 }, { - "epoch": 1.95, - "learning_rate": 7.5540711665851024e-06, - "loss": 0.0077, + "epoch": 1.0, + "learning_rate": 0.00014974376654112046, + "loss": 0.0116, "step": 386440 }, { - "epoch": 1.95, - "learning_rate": 7.546503473571092e-06, - "loss": 0.0068, + "epoch": 1.0, + "learning_rate": 0.000149739878324749, + "loss": 0.0258, "step": 386450 }, { - "epoch": 1.95, - "learning_rate": 7.538935780557082e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00014973599010837754, + "loss": 0.0115, "step": 386460 }, { - "epoch": 1.95, - "learning_rate": 7.531368087543072e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00014973210189200609, + "loss": 0.0249, "step": 386470 }, { - "epoch": 1.95, - "learning_rate": 7.523800394529061e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.0001497282136756346, + "loss": 0.0266, "step": 386480 }, { - "epoch": 1.95, - "learning_rate": 7.516232701515051e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014972432545926314, + "loss": 0.0361, "step": 386490 }, { - "epoch": 1.95, - "learning_rate": 7.508665008501041e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014972043724289168, + "loss": 0.0119, "step": 386500 }, { - "epoch": 1.95, - "learning_rate": 7.501097315487031e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014971654902652023, + "loss": 0.0286, "step": 386510 }, { - "epoch": 1.95, - "learning_rate": 7.49352962247302e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014971266081014874, + "loss": 0.0329, "step": 386520 }, { - "epoch": 1.95, - "learning_rate": 7.48596192945901e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014970877259377728, + "loss": 0.0098, "step": 386530 }, { - "epoch": 1.95, - "learning_rate": 7.478394236445e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00014970488437740582, + "loss": 0.0288, "step": 386540 }, { - "epoch": 1.95, - "learning_rate": 7.47082654343099e-06, - "loss": 0.0085, + "epoch": 1.0, + "learning_rate": 0.00014970099616103436, + "loss": 0.013, "step": 386550 }, { - "epoch": 1.95, - "learning_rate": 7.463258850416979e-06, - "loss": 0.0081, + "epoch": 1.0, + "learning_rate": 0.00014969710794466288, + "loss": 0.0258, "step": 386560 }, { - "epoch": 1.95, - "learning_rate": 7.455691157402969e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00014969321972829142, + "loss": 0.0126, "step": 386570 }, { - "epoch": 1.95, - "learning_rate": 7.448123464388959e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00014968933151191996, + "loss": 0.0116, "step": 386580 }, { - "epoch": 1.95, - "learning_rate": 7.440555771374949e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.0001496854432955485, + "loss": 0.012, "step": 386590 }, { - "epoch": 1.95, - "learning_rate": 7.432988078360938e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00014968155507917705, + "loss": 0.0145, "step": 386600 }, { - "epoch": 1.95, - "learning_rate": 7.4254203853469276e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00014967766686280556, + "loss": 0.0123, "step": 386610 }, { - "epoch": 1.95, - "learning_rate": 7.4178526923329175e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.0001496737786464341, + "loss": 0.01, "step": 386620 }, { - "epoch": 1.95, - "learning_rate": 7.410284999318907e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014966989043006264, + "loss": 0.0102, "step": 386630 }, { - "epoch": 1.95, - "learning_rate": 7.4027173063048965e-06, - "loss": 0.0071, + "epoch": 1.0, + "learning_rate": 0.00014966600221369118, + "loss": 0.0129, "step": 386640 }, { - "epoch": 1.95, - "learning_rate": 7.395149613290886e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001496621139973197, + "loss": 0.0136, "step": 386650 }, { - "epoch": 1.95, - "learning_rate": 7.387581920276876e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014965822578094824, + "loss": 0.01, "step": 386660 }, { - "epoch": 1.95, - "learning_rate": 7.380014227262865e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014965433756457678, + "loss": 0.0135, "step": 386670 }, { - "epoch": 1.95, - "learning_rate": 7.372446534248855e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014965044934820532, + "loss": 0.012, "step": 386680 }, { - "epoch": 1.95, - "learning_rate": 7.364878841234845e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00014964656113183384, + "loss": 0.0095, "step": 386690 }, { - "epoch": 1.95, - "learning_rate": 7.357311148220835e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014964267291546238, + "loss": 0.0127, "step": 386700 }, { - "epoch": 1.95, - "learning_rate": 7.349743455206824e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00014963878469909092, + "loss": 0.012, "step": 386710 }, { - "epoch": 1.95, - "learning_rate": 7.342175762192814e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014963489648271946, + "loss": 0.0108, "step": 386720 }, { - "epoch": 1.95, - "learning_rate": 7.334608069178804e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00014963100826634798, + "loss": 0.01, "step": 386730 }, { - "epoch": 1.95, - "learning_rate": 7.327040376164794e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00014962712004997655, + "loss": 0.0122, "step": 386740 }, { - "epoch": 1.95, - "learning_rate": 7.319472683150783e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014962323183360506, + "loss": 0.0106, "step": 386750 }, { - "epoch": 1.95, - "learning_rate": 7.311904990136773e-06, - "loss": 0.0085, + "epoch": 1.0, + "learning_rate": 0.0001496193436172336, + "loss": 0.0119, "step": 386760 }, { - "epoch": 1.95, - "learning_rate": 7.304337297122763e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00014961545540086214, + "loss": 0.0141, "step": 386770 }, { - "epoch": 1.95, - "learning_rate": 7.296769604108753e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.0001496115671844907, + "loss": 0.0131, "step": 386780 }, { - "epoch": 1.95, - "learning_rate": 7.289201911094742e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.0001496076789681192, + "loss": 0.0109, "step": 386790 }, { - "epoch": 1.95, - "learning_rate": 7.281634218080732e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00014960379075174774, + "loss": 0.0148, "step": 386800 }, { - "epoch": 1.95, - "learning_rate": 7.274066525066722e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00014959990253537628, + "loss": 0.0126, "step": 386810 }, { - "epoch": 1.95, - "learning_rate": 7.2664988320527115e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.0001495960143190048, + "loss": 0.0102, "step": 386820 }, { - "epoch": 1.95, - "learning_rate": 7.2589311390387e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014959212610263334, + "loss": 0.0091, "step": 386830 }, { - "epoch": 1.95, - "learning_rate": 7.2513634460246905e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014958823788626188, + "loss": 0.0117, "step": 386840 }, { - "epoch": 1.95, - "learning_rate": 7.24379575301068e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00014958434966989042, + "loss": 0.0137, "step": 386850 }, { - "epoch": 1.95, - "learning_rate": 7.23622805999667e-06, - "loss": 0.0035, + "epoch": 1.0, + "learning_rate": 0.00014958046145351894, + "loss": 0.0133, "step": 386860 }, { - "epoch": 1.95, - "learning_rate": 7.2286603669826585e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00014957657323714748, + "loss": 0.01, "step": 386870 }, { - "epoch": 1.95, - "learning_rate": 7.2210926739686484e-06, - "loss": 0.0049, + "epoch": 1.0, + "learning_rate": 0.00014957268502077602, + "loss": 0.0159, "step": 386880 }, { - "epoch": 1.95, - "learning_rate": 7.213524980954638e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00014956879680440456, + "loss": 0.0113, "step": 386890 }, { - "epoch": 1.95, - "learning_rate": 7.205957287940628e-06, - "loss": 0.0032, + "epoch": 1.0, + "learning_rate": 0.00014956490858803308, + "loss": 0.0119, "step": 386900 }, { - "epoch": 1.95, - "learning_rate": 7.198389594926617e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00014956102037166162, + "loss": 0.0114, "step": 386910 }, { - "epoch": 1.95, - "learning_rate": 7.190821901912607e-06, - "loss": 0.0089, + "epoch": 1.0, + "learning_rate": 0.00014955713215529016, + "loss": 0.0117, "step": 386920 }, { - "epoch": 1.95, - "learning_rate": 7.183254208898597e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.0001495532439389187, + "loss": 0.0106, "step": 386930 }, { - "epoch": 1.95, - "learning_rate": 7.175686515884587e-06, - "loss": 0.0066, + "epoch": 1.0, + "learning_rate": 0.00014954935572254724, + "loss": 0.0142, "step": 386940 }, { - "epoch": 1.95, - "learning_rate": 7.168118822870576e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014954546750617579, + "loss": 0.0123, "step": 386950 }, { - "epoch": 1.95, - "learning_rate": 7.160551129856566e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.0001495415792898043, + "loss": 0.0103, "step": 386960 }, { - "epoch": 1.95, - "learning_rate": 7.152983436842556e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00014953769107343284, + "loss": 0.0124, "step": 386970 }, { - "epoch": 1.95, - "learning_rate": 7.145415743828546e-06, - "loss": 0.0072, + "epoch": 1.0, + "learning_rate": 0.00014953380285706138, + "loss": 0.0139, "step": 386980 }, { - "epoch": 1.95, - "learning_rate": 7.137848050814535e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014952991464068993, + "loss": 0.0107, "step": 386990 }, { - "epoch": 1.95, - "learning_rate": 7.130280357800525e-06, - "loss": 0.0078, + "epoch": 1.0, + "learning_rate": 0.00014952602642431844, + "loss": 0.0135, "step": 387000 }, { - "epoch": 1.95, - "eval_cer": 0.9144052393627603, - "eval_loss": 0.004187974147498608, - "eval_runtime": 116.3794, - "eval_samples_per_second": 17.185, - "eval_steps_per_second": 4.296, + "epoch": 1.0, + "eval_cer": 0.8817306790618513, + "eval_loss": 0.014083863236010075, + "eval_runtime": 108.3195, + "eval_samples_per_second": 18.464, + "eval_steps_per_second": 4.616, "step": 387000 }, { - "epoch": 1.95, - "learning_rate": 7.122712664786515e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014952213820794698, + "loss": 0.013, "step": 387010 }, { - "epoch": 1.95, - "learning_rate": 7.115144971772505e-06, - "loss": 0.009, + "epoch": 1.0, + "learning_rate": 0.00014951824999157552, + "loss": 0.0124, "step": 387020 }, { - "epoch": 1.95, - "learning_rate": 7.107577278758494e-06, + "epoch": 1.0, + "learning_rate": 0.00014951436177520406, "loss": 0.0104, "step": 387030 }, { - "epoch": 1.95, - "learning_rate": 7.100009585744484e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014951047355883258, + "loss": 0.0103, "step": 387040 }, { - "epoch": 1.95, - "learning_rate": 7.0924418927304736e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00014950658534246112, + "loss": 0.0104, "step": 387050 }, { - "epoch": 1.95, - "learning_rate": 7.0848741997164635e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00014950269712608966, + "loss": 0.0115, "step": 387060 }, { - "epoch": 1.95, - "learning_rate": 7.0773065067024526e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00014949880890971818, + "loss": 0.0115, "step": 387070 }, { - "epoch": 1.95, - "learning_rate": 7.0697388136884425e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00014949492069334672, + "loss": 0.015, "step": 387080 }, { - "epoch": 1.95, - "learning_rate": 7.062171120674432e-06, - "loss": 0.0062, + "epoch": 1.0, + "learning_rate": 0.00014949103247697526, + "loss": 0.0103, "step": 387090 }, { - "epoch": 1.95, - "learning_rate": 7.054603427660422e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.0001494871442606038, + "loss": 0.0179, "step": 387100 }, { - "epoch": 1.95, - "learning_rate": 7.047035734646411e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014948325604423232, + "loss": 0.0102, "step": 387110 }, { - "epoch": 1.95, - "learning_rate": 7.039468041632401e-06, - "loss": 0.0077, + "epoch": 1.0, + "learning_rate": 0.00014947936782786089, + "loss": 0.0106, "step": 387120 }, { - "epoch": 1.95, - "learning_rate": 7.031900348618391e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.0001494754796114894, + "loss": 0.0114, "step": 387130 }, { - "epoch": 1.95, - "learning_rate": 7.024332655604381e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.00014947159139511794, + "loss": 0.0096, "step": 387140 }, { - "epoch": 1.95, - "learning_rate": 7.01676496259037e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014946770317874648, + "loss": 0.0101, "step": 387150 }, { - "epoch": 1.95, - "learning_rate": 7.00919726957636e-06, - "loss": 0.0102, + "epoch": 1.0, + "learning_rate": 0.00014946381496237502, + "loss": 0.0119, "step": 387160 }, { - "epoch": 1.95, - "learning_rate": 7.00162957656235e-06, - "loss": 0.0043, + "epoch": 1.0, + "learning_rate": 0.00014945992674600354, + "loss": 0.0115, "step": 387170 }, { - "epoch": 1.95, - "learning_rate": 6.994061883548339e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00014945603852963208, + "loss": 0.0091, "step": 387180 }, { - "epoch": 1.95, - "learning_rate": 6.986494190534329e-06, - "loss": 0.0056, + "epoch": 1.0, + "learning_rate": 0.00014945215031326062, + "loss": 0.0087, "step": 387190 }, { - "epoch": 1.95, - "learning_rate": 6.978926497520319e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.00014944826209688916, + "loss": 0.0128, "step": 387200 }, { - "epoch": 1.95, - "learning_rate": 6.971358804506309e-06, - "loss": 0.0069, + "epoch": 1.0, + "learning_rate": 0.00014944437388051768, + "loss": 0.0106, "step": 387210 }, { - "epoch": 1.95, - "learning_rate": 6.963791111492298e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014944048566414622, + "loss": 0.0131, "step": 387220 }, { - "epoch": 1.95, - "learning_rate": 6.956223418478288e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014943659744777476, + "loss": 0.0108, "step": 387230 }, { - "epoch": 1.95, - "learning_rate": 6.948655725464278e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.0001494327092314033, + "loss": 0.012, "step": 387240 }, { - "epoch": 1.95, - "learning_rate": 6.941088032450268e-06, - "loss": 0.0044, + "epoch": 1.0, + "learning_rate": 0.00014942882101503182, + "loss": 0.0115, "step": 387250 }, { - "epoch": 1.95, - "learning_rate": 6.933520339436256e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.0001494249327986604, + "loss": 0.011, "step": 387260 }, { - "epoch": 1.95, - "learning_rate": 6.9259526464222466e-06, - "loss": 0.008, + "epoch": 1.0, + "learning_rate": 0.0001494210445822889, + "loss": 0.0116, "step": 387270 }, { - "epoch": 1.95, - "learning_rate": 6.9183849534082365e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014941715636591744, + "loss": 0.0101, "step": 387280 }, { - "epoch": 1.95, - "learning_rate": 6.910817260394226e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00014941326814954598, + "loss": 0.014, "step": 387290 }, { - "epoch": 1.95, - "learning_rate": 6.903249567380215e-06, - "loss": 0.0086, + "epoch": 1.0, + "learning_rate": 0.0001494093799331745, + "loss": 0.0124, "step": 387300 }, { - "epoch": 1.95, - "learning_rate": 6.8956818743662045e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00014940549171680304, + "loss": 0.009, "step": 387310 }, { - "epoch": 1.95, - "learning_rate": 6.8881141813521944e-06, - "loss": 0.0047, + "epoch": 1.0, + "learning_rate": 0.00014940160350043158, + "loss": 0.0124, "step": 387320 }, { - "epoch": 1.95, - "learning_rate": 6.880546488338185e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014939771528406012, + "loss": 0.0157, "step": 387330 }, { - "epoch": 1.95, - "learning_rate": 6.872978795324173e-06, - "loss": 0.0135, + "epoch": 1.0, + "learning_rate": 0.00014939382706768864, + "loss": 0.0123, "step": 387340 }, { - "epoch": 1.95, - "learning_rate": 6.865411102310163e-06, - "loss": 0.0059, + "epoch": 1.0, + "learning_rate": 0.00014938993885131718, + "loss": 0.0132, "step": 387350 }, { - "epoch": 1.95, - "learning_rate": 6.857843409296153e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00014938605063494572, + "loss": 0.0107, "step": 387360 }, { - "epoch": 1.95, - "learning_rate": 6.850275716282143e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00014938216241857426, + "loss": 0.0137, "step": 387370 }, { - "epoch": 1.95, - "learning_rate": 6.842708023268132e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00014937827420220278, + "loss": 0.011, "step": 387380 }, { - "epoch": 1.95, - "learning_rate": 6.835140330254122e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014937438598583132, + "loss": 0.0107, "step": 387390 }, { - "epoch": 1.95, - "learning_rate": 6.827572637240112e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014937049776945986, + "loss": 0.0099, "step": 387400 }, { - "epoch": 1.95, - "learning_rate": 6.820004944226102e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.0001493666095530884, + "loss": 0.0099, "step": 387410 }, { - "epoch": 1.95, - "learning_rate": 6.812437251212091e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00014936272133671692, + "loss": 0.0086, "step": 387420 }, { - "epoch": 1.95, - "learning_rate": 6.804869558198081e-06, - "loss": 0.0048, + "epoch": 1.0, + "learning_rate": 0.00014935883312034546, + "loss": 0.0257, "step": 387430 }, { - "epoch": 1.95, - "learning_rate": 6.797301865184071e-06, - "loss": 0.007, + "epoch": 1.0, + "learning_rate": 0.000149354944903974, + "loss": 0.0138, "step": 387440 }, { - "epoch": 1.95, - "learning_rate": 6.789734172170061e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014935105668760254, + "loss": 0.0133, "step": 387450 }, { - "epoch": 1.95, - "learning_rate": 6.78216647915605e-06, - "loss": 0.0055, + "epoch": 1.0, + "learning_rate": 0.00014934716847123108, + "loss": 0.0129, "step": 387460 }, { - "epoch": 1.95, - "learning_rate": 6.77459878614204e-06, - "loss": 0.0051, + "epoch": 1.0, + "learning_rate": 0.00014934328025485963, + "loss": 0.0101, "step": 387470 }, { - "epoch": 1.95, - "learning_rate": 6.76703109312803e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014933939203848814, + "loss": 0.0114, "step": 387480 }, { - "epoch": 1.95, - "learning_rate": 6.7594634001140196e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00014933550382211668, + "loss": 0.0112, "step": 387490 }, { - "epoch": 1.95, - "learning_rate": 6.751895707100009e-06, - "loss": 0.0068, + "epoch": 1.0, + "learning_rate": 0.00014933161560574522, + "loss": 0.0142, "step": 387500 }, { - "epoch": 1.96, - "learning_rate": 6.7443280140859986e-06, - "loss": 0.0063, + "epoch": 1.0, + "learning_rate": 0.00014932772738937377, + "loss": 0.0098, "step": 387510 }, { - "epoch": 1.96, - "learning_rate": 6.7367603210719885e-06, - "loss": 0.0071, + "epoch": 1.0, + "learning_rate": 0.00014932383917300228, + "loss": 0.0132, "step": 387520 }, { - "epoch": 1.96, - "learning_rate": 6.729192628057978e-06, - "loss": 0.0046, + "epoch": 1.0, + "learning_rate": 0.00014931995095663082, + "loss": 0.0101, "step": 387530 }, { - "epoch": 1.96, - "learning_rate": 6.7216249350439674e-06, - "loss": 0.0058, + "epoch": 1.0, + "learning_rate": 0.00014931606274025936, + "loss": 0.0148, "step": 387540 }, { - "epoch": 1.96, - "learning_rate": 6.714057242029957e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014931217452388788, + "loss": 0.0112, "step": 387550 }, { - "epoch": 1.96, - "learning_rate": 6.706489549015947e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00014930828630751642, + "loss": 0.0127, "step": 387560 }, { - "epoch": 1.96, - "learning_rate": 6.698921856001937e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00014930439809114496, + "loss": 0.0124, "step": 387570 }, { - "epoch": 1.96, - "learning_rate": 6.691354162987926e-06, - "loss": 0.0098, + "epoch": 1.0, + "learning_rate": 0.0001493005098747735, + "loss": 0.0127, "step": 387580 }, { - "epoch": 1.96, - "learning_rate": 6.683786469973916e-06, - "loss": 0.0052, + "epoch": 1.0, + "learning_rate": 0.00014929662165840202, + "loss": 0.0103, "step": 387590 }, { - "epoch": 1.96, - "learning_rate": 6.676218776959906e-06, - "loss": 0.0053, + "epoch": 1.0, + "learning_rate": 0.00014929273344203056, + "loss": 0.0132, "step": 387600 }, { - "epoch": 1.96, - "learning_rate": 6.668651083945896e-06, - "loss": 0.005, + "epoch": 1.0, + "learning_rate": 0.0001492888452256591, + "loss": 0.0127, "step": 387610 }, { - "epoch": 1.96, - "learning_rate": 6.661083390931885e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014928495700928764, + "loss": 0.0114, "step": 387620 }, { - "epoch": 1.96, - "learning_rate": 6.653515697917875e-06, - "loss": 0.0075, + "epoch": 1.0, + "learning_rate": 0.00014928106879291616, + "loss": 0.011, "step": 387630 }, { - "epoch": 1.96, - "learning_rate": 6.645948004903865e-06, - "loss": 0.0061, + "epoch": 1.0, + "learning_rate": 0.00014927718057654473, + "loss": 0.0114, "step": 387640 }, { - "epoch": 1.96, - "learning_rate": 6.638380311889855e-06, - "loss": 0.006, + "epoch": 1.0, + "learning_rate": 0.00014927329236017324, + "loss": 0.013, "step": 387650 }, { - "epoch": 1.96, - "learning_rate": 6.630812618875844e-06, - "loss": 0.0057, + "epoch": 1.0, + "learning_rate": 0.00014926940414380178, + "loss": 0.0103, "step": 387660 }, { - "epoch": 1.96, - "learning_rate": 6.623244925861834e-06, - "loss": 0.0054, + "epoch": 1.0, + "learning_rate": 0.00014926551592743032, + "loss": 0.0124, "step": 387670 }, { - "epoch": 1.96, - "learning_rate": 6.615677232847824e-06, - "loss": 0.0065, + "epoch": 1.0, + "learning_rate": 0.00014926162771105886, + "loss": 0.0225, "step": 387680 }, { - "epoch": 1.96, - "learning_rate": 6.608109539833814e-06, - "loss": 0.0045, + "epoch": 1.0, + "learning_rate": 0.00014925773949468738, + "loss": 0.0105, "step": 387690 }, { - "epoch": 1.96, - "learning_rate": 6.600541846819803e-06, - "loss": 0.0087, + "epoch": 1.0, + "learning_rate": 0.00014925385127831592, + "loss": 0.0121, "step": 387700 }, { - "epoch": 1.96, - "learning_rate": 6.5929741538057926e-06, - "loss": 0.0064, + "epoch": 1.0, + "learning_rate": 0.00014924996306194446, + "loss": 0.0313, "step": 387710 }, { - "epoch": 1.96, - "learning_rate": 6.5854064607917825e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.000149246074845573, + "loss": 0.0196, "step": 387720 }, { - "epoch": 1.96, - "learning_rate": 6.577838767777771e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014924218662920152, + "loss": 0.0139, "step": 387730 }, { - "epoch": 1.96, - "learning_rate": 6.570271074763761e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014923829841283006, + "loss": 0.0138, "step": 387740 }, { - "epoch": 1.96, - "learning_rate": 6.562703381749751e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.0001492344101964586, + "loss": 0.0087, "step": 387750 }, { - "epoch": 1.96, - "learning_rate": 6.555135688735741e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014923052198008714, + "loss": 0.0147, "step": 387760 }, { - "epoch": 1.96, - "learning_rate": 6.5475679957217295e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014922663376371566, + "loss": 0.0103, "step": 387770 }, { - "epoch": 1.96, - "learning_rate": 6.540000302707719e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014922274554734423, + "loss": 0.0121, "step": 387780 }, { - "epoch": 1.96, - "learning_rate": 6.532432609693709e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014921885733097274, + "loss": 0.01, "step": 387790 }, { - "epoch": 1.96, - "learning_rate": 6.524864916679699e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014921496911460126, + "loss": 0.01, "step": 387800 }, { - "epoch": 1.96, - "learning_rate": 6.517297223665688e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014921108089822982, + "loss": 0.0122, "step": 387810 }, { - "epoch": 1.96, - "learning_rate": 6.509729530651678e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014920719268185834, + "loss": 0.0101, "step": 387820 }, { - "epoch": 1.96, - "learning_rate": 6.502161837637668e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014920330446548688, + "loss": 0.0162, "step": 387830 }, { - "epoch": 1.96, - "learning_rate": 6.494594144623658e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014919941624911542, + "loss": 0.011, "step": 387840 }, { - "epoch": 1.96, - "learning_rate": 6.487026451609647e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014919552803274396, + "loss": 0.0137, "step": 387850 }, { - "epoch": 1.96, - "learning_rate": 6.479458758595637e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014919163981637248, + "loss": 0.0105, "step": 387860 }, { - "epoch": 1.96, - "learning_rate": 6.471891065581627e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014918775160000102, + "loss": 0.0105, "step": 387870 }, { - "epoch": 1.96, - "learning_rate": 6.464323372567617e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014918386338362956, + "loss": 0.0127, "step": 387880 }, { - "epoch": 1.96, - "learning_rate": 6.456755679553606e-06, - "loss": 0.0037, + "epoch": 1.01, + "learning_rate": 0.0001491799751672581, + "loss": 0.0102, "step": 387890 }, { - "epoch": 1.96, - "learning_rate": 6.449187986539596e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014917608695088662, + "loss": 0.0103, "step": 387900 }, { - "epoch": 1.96, - "learning_rate": 6.441620293525586e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014917219873451516, + "loss": 0.009, "step": 387910 }, { - "epoch": 1.96, - "learning_rate": 6.434052600511576e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.0001491683105181437, + "loss": 0.0108, "step": 387920 }, { - "epoch": 1.96, - "learning_rate": 6.426484907497565e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014916442230177224, + "loss": 0.0123, "step": 387930 }, { - "epoch": 1.96, - "learning_rate": 6.418917214483555e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014916053408540076, + "loss": 0.0152, "step": 387940 }, { - "epoch": 1.96, - "learning_rate": 6.4113495214695446e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.0001491566458690293, + "loss": 0.0122, "step": 387950 }, { - "epoch": 1.96, - "learning_rate": 6.4037818284555345e-06, - "loss": 0.007, + "epoch": 1.01, + "learning_rate": 0.00014915275765265784, + "loss": 0.0121, "step": 387960 }, { - "epoch": 1.96, - "learning_rate": 6.3962141354415235e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014914886943628638, + "loss": 0.0137, "step": 387970 }, { - "epoch": 1.96, - "learning_rate": 6.3886464424275134e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014914498121991492, + "loss": 0.0114, "step": 387980 }, { - "epoch": 1.96, - "learning_rate": 6.381078749413503e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014914109300354347, + "loss": 0.0109, "step": 387990 }, { - "epoch": 1.96, - "learning_rate": 6.373511056399493e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014913720478717198, + "loss": 0.0137, "step": 388000 }, { - "epoch": 1.96, - "eval_cer": 0.9144062097588856, - "eval_loss": 0.004157001152634621, - "eval_runtime": 116.3242, - "eval_samples_per_second": 17.193, - "eval_steps_per_second": 4.298, + "epoch": 1.01, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.007554326672106981, + "eval_runtime": 108.2118, + "eval_samples_per_second": 18.482, + "eval_steps_per_second": 4.621, "step": 388000 }, { - "epoch": 1.96, - "learning_rate": 6.365943363385482e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014913331657080052, + "loss": 0.0097, "step": 388010 }, { - "epoch": 1.96, - "learning_rate": 6.358375670371472e-06, - "loss": 0.0044, + "epoch": 1.01, + "learning_rate": 0.00014912942835442906, + "loss": 0.0101, "step": 388020 }, { - "epoch": 1.96, - "learning_rate": 6.350807977357462e-06, - "loss": 0.0038, + "epoch": 1.01, + "learning_rate": 0.0001491255401380576, + "loss": 0.0137, "step": 388030 }, { - "epoch": 1.96, - "learning_rate": 6.343240284343452e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014912165192168612, + "loss": 0.0115, "step": 388040 }, { - "epoch": 1.96, - "learning_rate": 6.335672591329441e-06, - "loss": 0.0068, + "epoch": 1.01, + "learning_rate": 0.00014911776370531466, + "loss": 0.011, "step": 388050 }, { - "epoch": 1.96, - "learning_rate": 6.328104898315431e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.0001491138754889432, + "loss": 0.0092, "step": 388060 }, { - "epoch": 1.96, - "learning_rate": 6.320537205301421e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014910998727257172, + "loss": 0.012, "step": 388070 }, { - "epoch": 1.96, - "learning_rate": 6.312969512287411e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014910609905620026, + "loss": 0.0107, "step": 388080 }, { - "epoch": 1.96, - "learning_rate": 6.3054018192734e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.0001491022108398288, + "loss": 0.0106, "step": 388090 }, { - "epoch": 1.96, - "learning_rate": 6.29783412625939e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014909832262345734, + "loss": 0.0107, "step": 388100 }, { - "epoch": 1.96, - "learning_rate": 6.29026643324538e-06, - "loss": 0.0087, + "epoch": 1.01, + "learning_rate": 0.00014909443440708586, + "loss": 0.0155, "step": 388110 }, { - "epoch": 1.96, - "learning_rate": 6.28269874023137e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.0001490905461907144, + "loss": 0.0098, "step": 388120 }, { - "epoch": 1.96, - "learning_rate": 6.275131047217359e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.00014908665797434294, + "loss": 0.0119, "step": 388130 }, { - "epoch": 1.96, - "learning_rate": 6.267563354203349e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014908276975797148, + "loss": 0.0136, "step": 388140 }, { - "epoch": 1.96, - "learning_rate": 6.2599956611893386e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.0001490788815416, + "loss": 0.0097, "step": 388150 }, { - "epoch": 1.96, - "learning_rate": 6.2524279681753285e-06, - "loss": 0.0044, + "epoch": 1.01, + "learning_rate": 0.00014907499332522857, + "loss": 0.0116, "step": 388160 }, { - "epoch": 1.96, - "learning_rate": 6.2448602751613176e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014907110510885708, + "loss": 0.014, "step": 388170 }, { - "epoch": 1.96, - "learning_rate": 6.2372925821473075e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014906721689248562, + "loss": 0.0131, "step": 388180 }, { - "epoch": 1.96, - "learning_rate": 6.229724889133297e-06, - "loss": 0.0066, + "epoch": 1.01, + "learning_rate": 0.00014906332867611416, + "loss": 0.0127, "step": 388190 }, { - "epoch": 1.96, - "learning_rate": 6.222157196119287e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.0001490594404597427, + "loss": 0.0127, "step": 388200 }, { - "epoch": 1.96, - "learning_rate": 6.2145895031052755e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.00014905555224337122, + "loss": 0.0119, "step": 388210 }, { - "epoch": 1.96, - "learning_rate": 6.207021810091265e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014905166402699976, + "loss": 0.0108, "step": 388220 }, { - "epoch": 1.96, - "learning_rate": 6.199454117077255e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.0001490477758106283, + "loss": 0.0102, "step": 388230 }, { - "epoch": 1.96, - "learning_rate": 6.191886424063246e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014904388759425684, + "loss": 0.0095, "step": 388240 }, { - "epoch": 1.96, - "learning_rate": 6.184318731049234e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014903999937788536, + "loss": 0.0106, "step": 388250 }, { - "epoch": 1.96, - "learning_rate": 6.176751038035224e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.0001490361111615139, + "loss": 0.0107, "step": 388260 }, { - "epoch": 1.96, - "learning_rate": 6.169183345021214e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014903222294514244, + "loss": 0.0113, "step": 388270 }, { - "epoch": 1.96, - "learning_rate": 6.161615652007203e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014902833472877098, + "loss": 0.0101, "step": 388280 }, { - "epoch": 1.96, - "learning_rate": 6.154047958993193e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.0001490244465123995, + "loss": 0.0142, "step": 388290 }, { - "epoch": 1.96, - "learning_rate": 6.146480265979183e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014902055829602804, + "loss": 0.0094, "step": 388300 }, { - "epoch": 1.96, - "learning_rate": 6.138912572965173e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014901667007965658, + "loss": 0.0149, "step": 388310 }, { - "epoch": 1.96, - "learning_rate": 6.131344879951162e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.0001490127818632851, + "loss": 0.0128, "step": 388320 }, { - "epoch": 1.96, - "learning_rate": 6.123777186937152e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014900889364691366, + "loss": 0.0113, "step": 388330 }, { - "epoch": 1.96, - "learning_rate": 6.116209493923142e-06, - "loss": 0.0073, + "epoch": 1.01, + "learning_rate": 0.00014900500543054218, + "loss": 0.0132, "step": 388340 }, { - "epoch": 1.96, - "learning_rate": 6.108641800909132e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014900111721417072, + "loss": 0.0152, "step": 388350 }, { - "epoch": 1.96, - "learning_rate": 6.101074107895121e-06, - "loss": 0.0083, + "epoch": 1.01, + "learning_rate": 0.00014899722899779926, + "loss": 0.0104, "step": 388360 }, { - "epoch": 1.96, - "learning_rate": 6.093506414881111e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.0001489933407814278, + "loss": 0.0152, "step": 388370 }, { - "epoch": 1.96, - "learning_rate": 6.085938721867101e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014898945256505632, + "loss": 0.0119, "step": 388380 }, { - "epoch": 1.96, - "learning_rate": 6.0783710288530906e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014898556434868486, + "loss": 0.009, "step": 388390 }, { - "epoch": 1.96, - "learning_rate": 6.07080333583908e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.0001489816761323134, + "loss": 0.0109, "step": 388400 }, { - "epoch": 1.96, - "learning_rate": 6.0632356428250695e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014897778791594194, + "loss": 0.0134, "step": 388410 }, { - "epoch": 1.96, - "learning_rate": 6.0556679498110594e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014897389969957046, + "loss": 0.0115, "step": 388420 }, { - "epoch": 1.96, - "learning_rate": 6.048100256797049e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.000148970011483199, + "loss": 0.0106, "step": 388430 }, { - "epoch": 1.96, - "learning_rate": 6.040532563783038e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014896612326682754, + "loss": 0.0144, "step": 388440 }, { - "epoch": 1.96, - "learning_rate": 6.032964870769028e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014896223505045608, + "loss": 0.0134, "step": 388450 }, { - "epoch": 1.96, - "learning_rate": 6.025397177755018e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.0001489583468340846, + "loss": 0.0132, "step": 388460 }, { - "epoch": 1.96, - "learning_rate": 6.017829484741008e-06, - "loss": 0.0081, + "epoch": 1.01, + "learning_rate": 0.00014895445861771314, + "loss": 0.014, "step": 388470 }, { - "epoch": 1.96, - "learning_rate": 6.010261791726997e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014895057040134168, + "loss": 0.0119, "step": 388480 }, { - "epoch": 1.96, - "learning_rate": 6.002694098712987e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014894668218497022, + "loss": 0.0128, "step": 388490 }, { - "epoch": 1.96, - "learning_rate": 5.995126405698977e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014894279396859874, + "loss": 0.0178, "step": 388500 }, { - "epoch": 1.96, - "learning_rate": 5.987558712684967e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.0001489389057522273, + "loss": 0.0116, "step": 388510 }, { - "epoch": 1.96, - "learning_rate": 5.979991019670956e-06, - "loss": 0.0066, + "epoch": 1.01, + "learning_rate": 0.00014893501753585582, + "loss": 0.01, "step": 388520 }, { - "epoch": 1.96, - "learning_rate": 5.972423326656946e-06, - "loss": 0.0069, + "epoch": 1.01, + "learning_rate": 0.00014893112931948436, + "loss": 0.0124, "step": 388530 }, { - "epoch": 1.96, - "learning_rate": 5.964855633642936e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.0001489272411031129, + "loss": 0.0109, "step": 388540 }, { - "epoch": 1.96, - "learning_rate": 5.957287940628926e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014892335288674142, + "loss": 0.0137, "step": 388550 }, { - "epoch": 1.96, - "learning_rate": 5.949720247614915e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014891946467036996, + "loss": 0.0104, "step": 388560 }, { - "epoch": 1.96, - "learning_rate": 5.942152554600905e-06, - "loss": 0.0074, + "epoch": 1.01, + "learning_rate": 0.0001489155764539985, + "loss": 0.0116, "step": 388570 }, { - "epoch": 1.96, - "learning_rate": 5.934584861586895e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014891168823762704, + "loss": 0.015, "step": 388580 }, { - "epoch": 1.96, - "learning_rate": 5.9270171685728846e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014890780002125556, + "loss": 0.0117, "step": 388590 }, { - "epoch": 1.96, - "learning_rate": 5.919449475558874e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.0001489039118048841, + "loss": 0.0105, "step": 388600 }, { - "epoch": 1.96, - "learning_rate": 5.9118817825448636e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014890002358851264, + "loss": 0.0126, "step": 388610 }, { - "epoch": 1.96, - "learning_rate": 5.9043140895308535e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014889613537214118, + "loss": 0.013, "step": 388620 }, { - "epoch": 1.96, - "learning_rate": 5.896746396516843e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.0001488922471557697, + "loss": 0.0116, "step": 388630 }, { - "epoch": 1.96, - "learning_rate": 5.889178703502832e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014888835893939824, + "loss": 0.0127, "step": 388640 }, { - "epoch": 1.96, - "learning_rate": 5.8816110104888215e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014888447072302678, + "loss": 0.0129, "step": 388650 }, { - "epoch": 1.96, - "learning_rate": 5.874043317474812e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014888058250665532, + "loss": 0.0146, "step": 388660 }, { - "epoch": 1.96, - "learning_rate": 5.866475624460802e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014887669429028384, + "loss": 0.009, "step": 388670 }, { - "epoch": 1.96, - "learning_rate": 5.85890793144679e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.0001488728060739124, + "loss": 0.0081, "step": 388680 }, { - "epoch": 1.96, - "learning_rate": 5.85134023843278e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014886891785754092, + "loss": 0.0132, "step": 388690 }, { - "epoch": 1.96, - "learning_rate": 5.84377254541877e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014886502964116946, + "loss": 0.0134, "step": 388700 }, { - "epoch": 1.96, - "learning_rate": 5.83620485240476e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.000148861141424798, + "loss": 0.0104, "step": 388710 }, { - "epoch": 1.96, - "learning_rate": 5.828637159390749e-06, - "loss": 0.0065, + "epoch": 1.01, + "learning_rate": 0.00014885725320842654, + "loss": 0.0098, "step": 388720 }, { - "epoch": 1.96, - "learning_rate": 5.821069466376739e-06, - "loss": 0.0069, + "epoch": 1.01, + "learning_rate": 0.00014885336499205506, + "loss": 0.0113, "step": 388730 }, { - "epoch": 1.96, - "learning_rate": 5.813501773362729e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.0001488494767756836, + "loss": 0.0135, "step": 388740 }, { - "epoch": 1.96, - "learning_rate": 5.805934080348719e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014884558855931214, + "loss": 0.0136, "step": 388750 }, { - "epoch": 1.96, - "learning_rate": 5.798366387334708e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014884170034294068, + "loss": 0.0081, "step": 388760 }, { - "epoch": 1.96, - "learning_rate": 5.790798694320698e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.0001488378121265692, + "loss": 0.0119, "step": 388770 }, { - "epoch": 1.96, - "learning_rate": 5.783231001306688e-06, - "loss": 0.0072, + "epoch": 1.01, + "learning_rate": 0.00014883392391019774, + "loss": 0.0111, "step": 388780 }, { - "epoch": 1.96, - "learning_rate": 5.775663308292678e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014883003569382628, + "loss": 0.0094, "step": 388790 }, { - "epoch": 1.96, - "learning_rate": 5.768095615278667e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.0001488261474774548, + "loss": 0.0135, "step": 388800 }, { - "epoch": 1.96, - "learning_rate": 5.760527922264657e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014882225926108334, + "loss": 0.0102, "step": 388810 }, { - "epoch": 1.96, - "learning_rate": 5.752960229250647e-06, - "loss": 0.0069, + "epoch": 1.01, + "learning_rate": 0.00014881837104471188, + "loss": 0.0171, "step": 388820 }, { - "epoch": 1.96, - "learning_rate": 5.745392536236636e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014881448282834042, + "loss": 0.012, "step": 388830 }, { - "epoch": 1.96, - "learning_rate": 5.737824843222626e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014881059461196894, + "loss": 0.0164, "step": 388840 }, { - "epoch": 1.96, - "learning_rate": 5.7302571502086155e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.0001488067063955975, + "loss": 0.0118, "step": 388850 }, { - "epoch": 1.96, - "learning_rate": 5.7226894571946054e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014880281817922602, + "loss": 0.0116, "step": 388860 }, { - "epoch": 1.96, - "learning_rate": 5.7151217641805945e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014879892996285456, + "loss": 0.0102, "step": 388870 }, { - "epoch": 1.96, - "learning_rate": 5.7075540711665844e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.0001487950417464831, + "loss": 0.013, "step": 388880 }, { - "epoch": 1.96, - "learning_rate": 5.699986378152574e-06, - "loss": 0.007, + "epoch": 1.01, + "learning_rate": 0.00014879115353011164, + "loss": 0.0085, "step": 388890 }, { - "epoch": 1.96, - "learning_rate": 5.692418685138564e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014878726531374016, + "loss": 0.0115, "step": 388900 }, { - "epoch": 1.96, - "learning_rate": 5.684850992124553e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.0001487833770973687, + "loss": 0.011, "step": 388910 }, { - "epoch": 1.96, - "learning_rate": 5.677283299110543e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014877948888099724, + "loss": 0.011, "step": 388920 }, { - "epoch": 1.96, - "learning_rate": 5.669715606096533e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014877560066462578, + "loss": 0.0099, "step": 388930 }, { - "epoch": 1.96, - "learning_rate": 5.662147913082523e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.0001487717124482543, + "loss": 0.0103, "step": 388940 }, { - "epoch": 1.96, - "learning_rate": 5.654580220068512e-06, - "loss": 0.0066, + "epoch": 1.01, + "learning_rate": 0.00014876782423188284, + "loss": 0.012, "step": 388950 }, { - "epoch": 1.96, - "learning_rate": 5.647012527054502e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.00014876393601551138, + "loss": 0.0124, "step": 388960 }, { - "epoch": 1.96, - "learning_rate": 5.639444834040492e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014876004779913992, + "loss": 0.0081, "step": 388970 }, { - "epoch": 1.96, - "learning_rate": 5.631877141026482e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014875615958276844, + "loss": 0.0137, "step": 388980 }, { - "epoch": 1.96, - "learning_rate": 5.624309448012471e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014875227136639698, + "loss": 0.0123, "step": 388990 }, { - "epoch": 1.96, - "learning_rate": 5.616741754998461e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014874838315002552, + "loss": 0.0107, "step": 389000 }, { - "epoch": 1.96, - "eval_cer": 0.9143994169860079, - "eval_loss": 0.004172166809439659, - "eval_runtime": 116.4331, - "eval_samples_per_second": 17.177, - "eval_steps_per_second": 4.294, + "epoch": 1.01, + "eval_cer": 0.881704085960102, + "eval_loss": 0.007840441539883614, + "eval_runtime": 107.9934, + "eval_samples_per_second": 18.52, + "eval_steps_per_second": 4.63, "step": 389000 }, { - "epoch": 1.96, - "learning_rate": 5.609174061984451e-06, - "loss": 0.0074, + "epoch": 1.01, + "learning_rate": 0.00014874449493365406, + "loss": 0.0104, "step": 389010 }, { - "epoch": 1.96, - "learning_rate": 5.601606368970441e-06, - "loss": 0.009, + "epoch": 1.01, + "learning_rate": 0.00014874060671728258, + "loss": 0.0126, "step": 389020 }, { - "epoch": 1.96, - "learning_rate": 5.59403867595643e-06, - "loss": 0.0077, + "epoch": 1.01, + "learning_rate": 0.00014873671850091115, + "loss": 0.0098, "step": 389030 }, { - "epoch": 1.96, - "learning_rate": 5.58647098294242e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014873283028453966, + "loss": 0.0095, "step": 389040 }, { - "epoch": 1.96, - "learning_rate": 5.5789032899284096e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.0001487289420681682, + "loss": 0.0121, "step": 389050 }, { - "epoch": 1.96, - "learning_rate": 5.5713355969143995e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.00014872505385179674, + "loss": 0.0113, "step": 389060 }, { - "epoch": 1.96, - "learning_rate": 5.563767903900388e-06, - "loss": 0.0034, + "epoch": 1.01, + "learning_rate": 0.00014872116563542526, + "loss": 0.0087, "step": 389070 }, { - "epoch": 1.96, - "learning_rate": 5.5562002108863784e-06, - "loss": 0.0074, + "epoch": 1.01, + "learning_rate": 0.0001487172774190538, + "loss": 0.0094, "step": 389080 }, { - "epoch": 1.96, - "learning_rate": 5.548632517872368e-06, - "loss": 0.0076, + "epoch": 1.01, + "learning_rate": 0.00014871338920268234, + "loss": 0.0111, "step": 389090 }, { - "epoch": 1.96, - "learning_rate": 5.541064824858358e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014870950098631088, + "loss": 0.0113, "step": 389100 }, { - "epoch": 1.96, - "learning_rate": 5.5334971318443465e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.0001487056127699394, + "loss": 0.0121, "step": 389110 }, { - "epoch": 1.96, - "learning_rate": 5.525929438830336e-06, - "loss": 0.0073, + "epoch": 1.01, + "learning_rate": 0.00014870172455356794, + "loss": 0.0146, "step": 389120 }, { - "epoch": 1.96, - "learning_rate": 5.518361745816326e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014869783633719648, + "loss": 0.0106, "step": 389130 }, { - "epoch": 1.96, - "learning_rate": 5.510794052802317e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014869394812082502, + "loss": 0.0091, "step": 389140 }, { - "epoch": 1.96, - "learning_rate": 5.503226359788305e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014869005990445354, + "loss": 0.011, "step": 389150 }, { - "epoch": 1.96, - "learning_rate": 5.495658666774295e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014868617168808208, + "loss": 0.0174, "step": 389160 }, { - "epoch": 1.96, - "learning_rate": 5.488090973760285e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014868228347171062, + "loss": 0.0187, "step": 389170 }, { - "epoch": 1.96, - "learning_rate": 5.480523280746275e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014867839525533916, + "loss": 0.0113, "step": 389180 }, { - "epoch": 1.96, - "learning_rate": 5.472955587732264e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014867450703896768, + "loss": 0.0106, "step": 389190 }, { - "epoch": 1.96, - "learning_rate": 5.465387894718254e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014867061882259625, + "loss": 0.0121, "step": 389200 }, { - "epoch": 1.96, - "learning_rate": 5.457820201704244e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014866673060622476, + "loss": 0.011, "step": 389210 }, { - "epoch": 1.96, - "learning_rate": 5.450252508690234e-06, - "loss": 0.0065, + "epoch": 1.01, + "learning_rate": 0.0001486628423898533, + "loss": 0.0111, "step": 389220 }, { - "epoch": 1.96, - "learning_rate": 5.442684815676223e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014865895417348184, + "loss": 0.01, "step": 389230 }, { - "epoch": 1.96, - "learning_rate": 5.435117122662213e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014865506595711038, + "loss": 0.0126, "step": 389240 }, { - "epoch": 1.96, - "learning_rate": 5.427549429648203e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.0001486511777407389, + "loss": 0.0152, "step": 389250 }, { - "epoch": 1.96, - "learning_rate": 5.419981736634193e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014864728952436744, + "loss": 0.0134, "step": 389260 }, { - "epoch": 1.96, - "learning_rate": 5.412414043620182e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014864340130799598, + "loss": 0.0141, "step": 389270 }, { - "epoch": 1.96, - "learning_rate": 5.404846350606172e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.0001486395130916245, + "loss": 0.0128, "step": 389280 }, { - "epoch": 1.96, - "learning_rate": 5.3972786575921615e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014863562487525304, + "loss": 0.0124, "step": 389290 }, { - "epoch": 1.96, - "learning_rate": 5.3897109645781514e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014863173665888158, + "loss": 0.0092, "step": 389300 }, { - "epoch": 1.96, - "learning_rate": 5.3821432715641405e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014862784844251012, + "loss": 0.0097, "step": 389310 }, { - "epoch": 1.96, - "learning_rate": 5.3745755785501304e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014862396022613864, + "loss": 0.0109, "step": 389320 }, { - "epoch": 1.96, - "learning_rate": 5.36700788553612e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014862007200976718, + "loss": 0.0117, "step": 389330 }, { - "epoch": 1.96, - "learning_rate": 5.35944019252211e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014861618379339572, + "loss": 0.0109, "step": 389340 }, { - "epoch": 1.96, - "learning_rate": 5.351872499508099e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014861229557702426, + "loss": 0.0118, "step": 389350 }, { - "epoch": 1.96, - "learning_rate": 5.344304806494089e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014860840736065278, + "loss": 0.0107, "step": 389360 }, { - "epoch": 1.96, - "learning_rate": 5.336737113480079e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014860451914428134, + "loss": 0.0113, "step": 389370 }, { - "epoch": 1.96, - "learning_rate": 5.329169420466068e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014860063092790986, + "loss": 0.0111, "step": 389380 }, { - "epoch": 1.96, - "learning_rate": 5.321601727452058e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.0001485967427115384, + "loss": 0.0149, "step": 389390 }, { - "epoch": 1.96, - "learning_rate": 5.314034034438048e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014859285449516694, + "loss": 0.0123, "step": 389400 }, { - "epoch": 1.96, - "learning_rate": 5.306466341424038e-06, - "loss": 0.0088, + "epoch": 1.01, + "learning_rate": 0.00014858896627879548, + "loss": 0.0097, "step": 389410 }, { - "epoch": 1.96, - "learning_rate": 5.298898648410027e-06, - "loss": 0.004, + "epoch": 1.01, + "learning_rate": 0.000148585078062424, + "loss": 0.0129, "step": 389420 }, { - "epoch": 1.96, - "learning_rate": 5.291330955396017e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014858118984605254, + "loss": 0.0109, "step": 389430 }, { - "epoch": 1.96, - "learning_rate": 5.283763262382007e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014857730162968108, + "loss": 0.0096, "step": 389440 }, { - "epoch": 1.96, - "learning_rate": 5.276195569367997e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014857341341330962, + "loss": 0.0105, "step": 389450 }, { - "epoch": 1.96, - "learning_rate": 5.268627876353986e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014856952519693814, + "loss": 0.0145, "step": 389460 }, { - "epoch": 1.96, - "learning_rate": 5.261060183339976e-06, - "loss": 0.0039, + "epoch": 1.01, + "learning_rate": 0.00014856563698056668, + "loss": 0.0097, "step": 389470 }, { - "epoch": 1.96, - "learning_rate": 5.253492490325966e-06, - "loss": 0.0092, + "epoch": 1.01, + "learning_rate": 0.00014856174876419522, + "loss": 0.0118, "step": 389480 }, { - "epoch": 1.97, - "learning_rate": 5.2459247973119556e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014855786054782376, + "loss": 0.0118, "step": 389490 }, { - "epoch": 1.97, - "learning_rate": 5.238357104297945e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014855397233145228, + "loss": 0.0103, "step": 389500 }, { - "epoch": 1.97, - "learning_rate": 5.2307894112839345e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014855008411508082, + "loss": 0.0093, "step": 389510 }, { - "epoch": 1.97, - "learning_rate": 5.2232217182699244e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014854619589870936, + "loss": 0.0096, "step": 389520 }, { - "epoch": 1.97, - "learning_rate": 5.215654025255914e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014854230768233788, + "loss": 0.009, "step": 389530 }, { - "epoch": 1.97, - "learning_rate": 5.208086332241903e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014853841946596642, + "loss": 0.0148, "step": 389540 }, { - "epoch": 1.97, - "learning_rate": 5.2005186392278925e-06, - "loss": 0.0027, + "epoch": 1.01, + "learning_rate": 0.00014853453124959496, + "loss": 0.0245, "step": 389550 }, { - "epoch": 1.97, - "learning_rate": 5.192950946213883e-06, - "loss": 0.0036, + "epoch": 1.01, + "learning_rate": 0.0001485306430332235, + "loss": 0.0094, "step": 389560 }, { - "epoch": 1.97, - "learning_rate": 5.185383253199873e-06, - "loss": 0.0067, + "epoch": 1.01, + "learning_rate": 0.00014852675481685204, + "loss": 0.0091, "step": 389570 }, { - "epoch": 1.97, - "learning_rate": 5.177815560185861e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014852286660048058, + "loss": 0.014, "step": 389580 }, { - "epoch": 1.97, - "learning_rate": 5.170247867171851e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.0001485189783841091, + "loss": 0.0085, "step": 389590 }, { - "epoch": 1.97, - "learning_rate": 5.162680174157841e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014851509016773764, + "loss": 0.0123, "step": 389600 }, { - "epoch": 1.97, - "learning_rate": 5.155112481143831e-06, - "loss": 0.0068, + "epoch": 1.01, + "learning_rate": 0.00014851120195136618, + "loss": 0.011, "step": 389610 }, { - "epoch": 1.97, - "learning_rate": 5.14754478812982e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014850731373499472, + "loss": 0.0122, "step": 389620 }, { - "epoch": 1.97, - "learning_rate": 5.13997709511581e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014850342551862324, + "loss": 0.0122, "step": 389630 }, { - "epoch": 1.97, - "learning_rate": 5.1324094021018e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014849953730225178, + "loss": 0.0093, "step": 389640 }, { - "epoch": 1.97, - "learning_rate": 5.12484170908779e-06, - "loss": 0.0073, + "epoch": 1.01, + "learning_rate": 0.00014849564908588032, + "loss": 0.0111, "step": 389650 }, { - "epoch": 1.97, - "learning_rate": 5.117274016073779e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014849176086950886, + "loss": 0.0107, "step": 389660 }, { - "epoch": 1.97, - "learning_rate": 5.109706323059769e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014848787265313738, + "loss": 0.0123, "step": 389670 }, { - "epoch": 1.97, - "learning_rate": 5.102138630045759e-06, - "loss": 0.0029, + "epoch": 1.01, + "learning_rate": 0.00014848398443676592, + "loss": 0.0135, "step": 389680 }, { - "epoch": 1.97, - "learning_rate": 5.094570937031749e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014848009622039446, + "loss": 0.013, "step": 389690 }, { - "epoch": 1.97, - "learning_rate": 5.087003244017738e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.000148476208004023, + "loss": 0.0095, "step": 389700 }, { - "epoch": 1.97, - "learning_rate": 5.079435551003728e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014847231978765152, + "loss": 0.0109, "step": 389710 }, { - "epoch": 1.97, - "learning_rate": 5.071867857989718e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014846843157128008, + "loss": 0.0103, "step": 389720 }, { - "epoch": 1.97, - "learning_rate": 5.0643001649757075e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.0001484645433549086, + "loss": 0.0114, "step": 389730 }, { - "epoch": 1.97, - "learning_rate": 5.056732471961697e-06, - "loss": 0.0072, + "epoch": 1.01, + "learning_rate": 0.00014846065513853714, + "loss": 0.0145, "step": 389740 }, { - "epoch": 1.97, - "learning_rate": 5.0491647789476865e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014845676692216568, + "loss": 0.01, "step": 389750 }, { - "epoch": 1.97, - "learning_rate": 5.0415970859336764e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014845287870579422, + "loss": 0.0105, "step": 389760 }, { - "epoch": 1.97, - "learning_rate": 5.034029392919666e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014844899048942274, + "loss": 0.0113, "step": 389770 }, { - "epoch": 1.97, - "learning_rate": 5.026461699905655e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014844510227305128, + "loss": 0.0142, "step": 389780 }, { - "epoch": 1.97, - "learning_rate": 5.018894006891645e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014844121405667982, + "loss": 0.0134, "step": 389790 }, { - "epoch": 1.97, - "learning_rate": 5.011326313877635e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014843732584030834, + "loss": 0.0134, "step": 389800 }, { - "epoch": 1.97, - "learning_rate": 5.003758620863625e-06, - "loss": 0.007, + "epoch": 1.01, + "learning_rate": 0.00014843343762393688, + "loss": 0.0116, "step": 389810 }, { - "epoch": 1.97, - "learning_rate": 4.996190927849614e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014842954940756542, + "loss": 0.0123, "step": 389820 }, { - "epoch": 1.97, - "learning_rate": 4.988623234835604e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014842566119119396, + "loss": 0.0091, "step": 389830 }, { - "epoch": 1.97, - "learning_rate": 4.981055541821594e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014842177297482248, + "loss": 0.0104, "step": 389840 }, { - "epoch": 1.97, - "learning_rate": 4.973487848807584e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014841788475845102, + "loss": 0.0129, "step": 389850 }, { - "epoch": 1.97, - "learning_rate": 4.965920155793573e-06, - "loss": 0.0072, + "epoch": 1.01, + "learning_rate": 0.00014841399654207956, + "loss": 0.0098, "step": 389860 }, { - "epoch": 1.97, - "learning_rate": 4.958352462779563e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.0001484101083257081, + "loss": 0.0104, "step": 389870 }, { - "epoch": 1.97, - "learning_rate": 4.950784769765553e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014840622010933662, + "loss": 0.0115, "step": 389880 }, { - "epoch": 1.97, - "learning_rate": 4.943217076751543e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014840233189296516, + "loss": 0.0106, "step": 389890 }, { - "epoch": 1.97, - "learning_rate": 4.935649383737532e-06, - "loss": 0.0076, + "epoch": 1.01, + "learning_rate": 0.0001483984436765937, + "loss": 0.0156, "step": 389900 }, { - "epoch": 1.97, - "learning_rate": 4.928081690723522e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014839455546022224, + "loss": 0.0115, "step": 389910 }, { - "epoch": 1.97, - "learning_rate": 4.920513997709512e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014839066724385078, + "loss": 0.0123, "step": 389920 }, { - "epoch": 1.97, - "learning_rate": 4.912946304695501e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014838677902747932, + "loss": 0.0114, "step": 389930 }, { - "epoch": 1.97, - "learning_rate": 4.905378611681491e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014838289081110784, + "loss": 0.0116, "step": 389940 }, { - "epoch": 1.97, - "learning_rate": 4.8978109186674805e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014837900259473638, + "loss": 0.0085, "step": 389950 }, { - "epoch": 1.97, - "learning_rate": 4.8902432256534704e-06, - "loss": 0.0066, + "epoch": 1.01, + "learning_rate": 0.00014837511437836492, + "loss": 0.0116, "step": 389960 }, { - "epoch": 1.97, - "learning_rate": 4.882675532639459e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014837122616199346, + "loss": 0.0108, "step": 389970 }, { - "epoch": 1.97, - "learning_rate": 4.875107839625449e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014836733794562198, + "loss": 0.0116, "step": 389980 }, { - "epoch": 1.97, - "learning_rate": 4.867540146611439e-06, - "loss": 0.0068, + "epoch": 1.01, + "learning_rate": 0.00014836344972925052, + "loss": 0.0161, "step": 389990 }, { - "epoch": 1.97, - "learning_rate": 4.859972453597429e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014835956151287906, + "loss": 0.0119, "step": 390000 }, { - "epoch": 1.97, - "eval_cer": 0.9143955354015062, - "eval_loss": 0.004140438511967659, - "eval_runtime": 116.3675, - "eval_samples_per_second": 17.187, - "eval_steps_per_second": 4.297, + "epoch": 1.01, + "eval_cer": 0.881719481966378, + "eval_loss": 0.007798693608492613, + "eval_runtime": 108.0106, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, "step": 390000 }, { - "epoch": 1.97, - "learning_rate": 4.8524047605834175e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.0001483556732965076, + "loss": 0.0131, "step": 390010 }, { - "epoch": 1.97, - "learning_rate": 4.844837067569407e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014835178508013612, + "loss": 0.0174, "step": 390020 }, { - "epoch": 1.97, - "learning_rate": 4.837269374555397e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014834789686376466, + "loss": 0.0146, "step": 390030 }, { - "epoch": 1.97, - "learning_rate": 4.829701681541387e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.0001483440086473932, + "loss": 0.0092, "step": 390040 }, { - "epoch": 1.97, - "learning_rate": 4.822133988527376e-06, - "loss": 0.0044, + "epoch": 1.01, + "learning_rate": 0.00014834012043102172, + "loss": 0.0126, "step": 390050 }, { - "epoch": 1.97, - "learning_rate": 4.814566295513366e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014833623221465026, + "loss": 0.0122, "step": 390060 }, { - "epoch": 1.97, - "learning_rate": 4.806998602499356e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.0001483323439982788, + "loss": 0.0126, "step": 390070 }, { - "epoch": 1.97, - "learning_rate": 4.799430909485346e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014832845578190734, + "loss": 0.0113, "step": 390080 }, { - "epoch": 1.97, - "learning_rate": 4.791863216471335e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014832456756553585, + "loss": 0.0101, "step": 390090 }, { - "epoch": 1.97, - "learning_rate": 4.784295523457325e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014832067934916442, + "loss": 0.0135, "step": 390100 }, { - "epoch": 1.97, - "learning_rate": 4.776727830443315e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014831679113279294, + "loss": 0.0095, "step": 390110 }, { - "epoch": 1.97, - "learning_rate": 4.769160137429305e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014831290291642148, + "loss": 0.0114, "step": 390120 }, { - "epoch": 1.97, - "learning_rate": 4.761592444415294e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014830901470005002, + "loss": 0.0109, "step": 390130 }, { - "epoch": 1.97, - "learning_rate": 4.754024751401284e-06, - "loss": 0.0033, + "epoch": 1.01, + "learning_rate": 0.00014830512648367856, + "loss": 0.0191, "step": 390140 }, { - "epoch": 1.97, - "learning_rate": 4.746457058387274e-06, - "loss": 0.0094, + "epoch": 1.01, + "learning_rate": 0.00014830123826730708, + "loss": 0.0103, "step": 390150 }, { - "epoch": 1.97, - "learning_rate": 4.738889365373264e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014829735005093562, + "loss": 0.014, "step": 390160 }, { - "epoch": 1.97, - "learning_rate": 4.731321672359253e-06, - "loss": 0.0068, + "epoch": 1.01, + "learning_rate": 0.00014829346183456416, + "loss": 0.0111, "step": 390170 }, { - "epoch": 1.97, - "learning_rate": 4.723753979345243e-06, - "loss": 0.0084, + "epoch": 1.01, + "learning_rate": 0.0001482895736181927, + "loss": 0.0127, "step": 390180 }, { - "epoch": 1.97, - "learning_rate": 4.7161862863312325e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014828568540182122, + "loss": 0.013, "step": 390190 }, { - "epoch": 1.97, - "learning_rate": 4.7086185933172224e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014828179718544976, + "loss": 0.01, "step": 390200 }, { - "epoch": 1.97, - "learning_rate": 4.7010509003032115e-06, - "loss": 0.0095, + "epoch": 1.01, + "learning_rate": 0.0001482779089690783, + "loss": 0.0118, "step": 390210 }, { - "epoch": 1.97, - "learning_rate": 4.693483207289201e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.00014827402075270684, + "loss": 0.0097, "step": 390220 }, { - "epoch": 1.97, - "learning_rate": 4.685915514275191e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014827013253633536, + "loss": 0.0139, "step": 390230 }, { - "epoch": 1.97, - "learning_rate": 4.67834782126118e-06, - "loss": 0.0035, + "epoch": 1.01, + "learning_rate": 0.00014826624431996392, + "loss": 0.016, "step": 390240 }, { - "epoch": 1.97, - "learning_rate": 4.67078012824717e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014826235610359244, + "loss": 0.0108, "step": 390250 }, { - "epoch": 1.97, - "learning_rate": 4.66321243523316e-06, - "loss": 0.0071, + "epoch": 1.01, + "learning_rate": 0.00014825846788722098, + "loss": 0.0102, "step": 390260 }, { - "epoch": 1.97, - "learning_rate": 4.65564474221915e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014825457967084952, + "loss": 0.0128, "step": 390270 }, { - "epoch": 1.97, - "learning_rate": 4.648077049205139e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014825069145447804, + "loss": 0.0108, "step": 390280 }, { - "epoch": 1.97, - "learning_rate": 4.640509356191129e-06, - "loss": 0.0044, + "epoch": 1.01, + "learning_rate": 0.00014824680323810658, + "loss": 0.0084, "step": 390290 }, { - "epoch": 1.97, - "learning_rate": 4.632941663177119e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014824291502173512, + "loss": 0.0126, "step": 390300 }, { - "epoch": 1.97, - "learning_rate": 4.625373970163109e-06, - "loss": 0.0066, + "epoch": 1.01, + "learning_rate": 0.00014823902680536366, + "loss": 0.013, "step": 390310 }, { - "epoch": 1.97, - "learning_rate": 4.617806277149098e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014823513858899218, + "loss": 0.0167, "step": 390320 }, { - "epoch": 1.97, - "learning_rate": 4.610238584135088e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014823125037262072, + "loss": 0.0093, "step": 390330 }, { - "epoch": 1.97, - "learning_rate": 4.602670891121078e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014822736215624926, + "loss": 0.0114, "step": 390340 }, { - "epoch": 1.97, - "learning_rate": 4.595103198107068e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.0001482234739398778, + "loss": 0.0099, "step": 390350 }, { - "epoch": 1.97, - "learning_rate": 4.587535505093057e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014821958572350632, + "loss": 0.0126, "step": 390360 }, { - "epoch": 1.97, - "learning_rate": 4.579967812079047e-06, - "loss": 0.0065, + "epoch": 1.01, + "learning_rate": 0.00014821569750713486, + "loss": 0.0093, "step": 390370 }, { - "epoch": 1.97, - "learning_rate": 4.572400119065037e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.0001482118092907634, + "loss": 0.0137, "step": 390380 }, { - "epoch": 1.97, - "learning_rate": 4.5648324260510265e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014820792107439194, + "loss": 0.0093, "step": 390390 }, { - "epoch": 1.97, - "learning_rate": 4.557264733037016e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014820403285802046, + "loss": 0.0138, "step": 390400 }, { - "epoch": 1.97, - "learning_rate": 4.5496970400230055e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.000148200144641649, + "loss": 0.0111, "step": 390410 }, { - "epoch": 1.97, - "learning_rate": 4.5421293470089954e-06, - "loss": 0.0079, + "epoch": 1.01, + "learning_rate": 0.00014819625642527754, + "loss": 0.0102, "step": 390420 }, { - "epoch": 1.97, - "learning_rate": 4.534561653994985e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014819236820890608, + "loss": 0.0131, "step": 390430 }, { - "epoch": 1.97, - "learning_rate": 4.526993960980974e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.00014818847999253462, + "loss": 0.0123, "step": 390440 }, { - "epoch": 1.97, - "learning_rate": 4.5194262679669635e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014818459177616316, + "loss": 0.009, "step": 390450 }, { - "epoch": 1.97, - "learning_rate": 4.511858574952953e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014818070355979168, + "loss": 0.0148, "step": 390460 }, { - "epoch": 1.97, - "learning_rate": 4.504290881938943e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014817681534342022, + "loss": 0.0096, "step": 390470 }, { - "epoch": 1.97, - "learning_rate": 4.496723188924933e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014817292712704876, + "loss": 0.0123, "step": 390480 }, { - "epoch": 1.97, - "learning_rate": 4.489155495910922e-06, + "epoch": 1.01, + "learning_rate": 0.0001481690389106773, "loss": 0.0099, "step": 390490 }, { - "epoch": 1.97, - "learning_rate": 4.481587802896912e-06, - "loss": 0.0068, + "epoch": 1.01, + "learning_rate": 0.00014816515069430582, + "loss": 0.0109, "step": 390500 }, { - "epoch": 1.97, - "learning_rate": 4.474020109882902e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014816126247793436, + "loss": 0.0145, "step": 390510 }, { - "epoch": 1.97, - "learning_rate": 4.466452416868892e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.0001481573742615629, + "loss": 0.0112, "step": 390520 }, { - "epoch": 1.97, - "learning_rate": 4.458884723854881e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014815348604519142, + "loss": 0.0111, "step": 390530 }, { - "epoch": 1.97, - "learning_rate": 4.451317030840871e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014814959782881996, + "loss": 0.0128, "step": 390540 }, { - "epoch": 1.97, - "learning_rate": 4.443749337826861e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.0001481457096124485, + "loss": 0.0111, "step": 390550 }, { - "epoch": 1.97, - "learning_rate": 4.436181644812851e-06, - "loss": 0.0071, + "epoch": 1.01, + "learning_rate": 0.00014814182139607704, + "loss": 0.0118, "step": 390560 }, { - "epoch": 1.97, - "learning_rate": 4.42861395179884e-06, - "loss": 0.0071, + "epoch": 1.01, + "learning_rate": 0.00014813793317970555, + "loss": 0.0096, "step": 390570 }, { - "epoch": 1.97, - "learning_rate": 4.42104625878483e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.0001481340449633341, + "loss": 0.0112, "step": 390580 }, { - "epoch": 1.97, - "learning_rate": 4.41347856577082e-06, - "loss": 0.0036, + "epoch": 1.01, + "learning_rate": 0.00014813015674696264, + "loss": 0.01, "step": 390590 }, { - "epoch": 1.97, - "learning_rate": 4.40591087275681e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014812626853059118, + "loss": 0.0121, "step": 390600 }, { - "epoch": 1.97, - "learning_rate": 4.398343179742799e-06, - "loss": 0.004, + "epoch": 1.01, + "learning_rate": 0.0001481223803142197, + "loss": 0.0123, "step": 390610 }, { - "epoch": 1.97, - "learning_rate": 4.390775486728789e-06, - "loss": 0.0074, + "epoch": 1.01, + "learning_rate": 0.00014811849209784826, + "loss": 0.0135, "step": 390620 }, { - "epoch": 1.97, - "learning_rate": 4.3832077937147785e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014811460388147678, + "loss": 0.0098, "step": 390630 }, { - "epoch": 1.97, - "learning_rate": 4.3756401007007684e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014811071566510532, + "loss": 0.0134, "step": 390640 }, { - "epoch": 1.97, - "learning_rate": 4.3680724076867575e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014810682744873386, + "loss": 0.0132, "step": 390650 }, { - "epoch": 1.97, - "learning_rate": 4.360504714672747e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.0001481029392323624, + "loss": 0.0094, "step": 390660 }, { - "epoch": 1.97, - "learning_rate": 4.3529370216587365e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014809905101599092, + "loss": 0.0112, "step": 390670 }, { - "epoch": 1.97, - "learning_rate": 4.345369328644727e-06, - "loss": 0.0043, + "epoch": 1.01, + "learning_rate": 0.00014809516279961946, + "loss": 0.0132, "step": 390680 }, { - "epoch": 1.97, - "learning_rate": 4.337801635630716e-06, - "loss": 0.0089, + "epoch": 1.01, + "learning_rate": 0.000148091274583248, + "loss": 0.0109, "step": 390690 }, { - "epoch": 1.97, - "learning_rate": 4.330233942616706e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014808738636687654, + "loss": 0.012, "step": 390700 }, { - "epoch": 1.97, - "learning_rate": 4.322666249602695e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.00014808349815050506, + "loss": 0.0114, "step": 390710 }, { - "epoch": 1.97, - "learning_rate": 4.315098556588685e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.0001480796099341336, + "loss": 0.0126, "step": 390720 }, { - "epoch": 1.97, - "learning_rate": 4.307530863574675e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014807572171776214, + "loss": 0.01, "step": 390730 }, { - "epoch": 1.97, - "learning_rate": 4.299963170560665e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014807183350139068, + "loss": 0.0121, "step": 390740 }, { - "epoch": 1.97, - "learning_rate": 4.292395477546654e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.0001480679452850192, + "loss": 0.0122, "step": 390750 }, { - "epoch": 1.97, - "learning_rate": 4.284827784532644e-06, - "loss": 0.0071, + "epoch": 1.01, + "learning_rate": 0.00014806405706864774, + "loss": 0.0088, "step": 390760 }, { - "epoch": 1.97, - "learning_rate": 4.277260091518634e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014806016885227628, + "loss": 0.023, "step": 390770 }, { - "epoch": 1.97, - "learning_rate": 4.269692398504624e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.0001480562806359048, + "loss": 0.0168, "step": 390780 }, { - "epoch": 1.97, - "learning_rate": 4.262124705490613e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014805239241953336, + "loss": 0.0145, "step": 390790 }, { - "epoch": 1.97, - "learning_rate": 4.254557012476603e-06, - "loss": 0.0088, + "epoch": 1.01, + "learning_rate": 0.00014804850420316188, + "loss": 0.0112, "step": 390800 }, { - "epoch": 1.97, - "learning_rate": 4.246989319462593e-06, - "loss": 0.0038, + "epoch": 1.01, + "learning_rate": 0.00014804461598679042, + "loss": 0.0115, "step": 390810 }, { - "epoch": 1.97, - "learning_rate": 4.239421626448583e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014804072777041896, + "loss": 0.0087, "step": 390820 }, { - "epoch": 1.97, - "learning_rate": 4.231853933434572e-06, - "loss": 0.0093, + "epoch": 1.01, + "learning_rate": 0.0001480368395540475, + "loss": 0.0147, "step": 390830 }, { - "epoch": 1.97, - "learning_rate": 4.224286240420562e-06, - "loss": 0.0093, + "epoch": 1.01, + "learning_rate": 0.00014803295133767602, + "loss": 0.0113, "step": 390840 }, { - "epoch": 1.97, - "learning_rate": 4.2167185474065515e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.00014802906312130456, + "loss": 0.0101, "step": 390850 }, { - "epoch": 1.97, - "learning_rate": 4.2091508543925414e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.0001480251749049331, + "loss": 0.0158, "step": 390860 }, { - "epoch": 1.97, - "learning_rate": 4.2015831613785305e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014802128668856164, + "loss": 0.0167, "step": 390870 }, { - "epoch": 1.97, - "learning_rate": 4.19401546836452e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014801739847219016, + "loss": 0.0087, "step": 390880 }, { - "epoch": 1.97, - "learning_rate": 4.18644777535051e-06, - "loss": 0.0059, + "epoch": 1.01, + "learning_rate": 0.0001480135102558187, + "loss": 0.0177, "step": 390890 }, { - "epoch": 1.97, - "learning_rate": 4.1788800823365e-06, - "loss": 0.007, + "epoch": 1.01, + "learning_rate": 0.00014800962203944724, + "loss": 0.0098, "step": 390900 }, { - "epoch": 1.97, - "learning_rate": 4.171312389322489e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.00014800573382307578, + "loss": 0.0129, "step": 390910 }, { - "epoch": 1.97, - "learning_rate": 4.163744696308479e-06, - "loss": 0.0055, + "epoch": 1.01, + "learning_rate": 0.0001480018456067043, + "loss": 0.0116, "step": 390920 }, { - "epoch": 1.97, - "learning_rate": 4.156177003294468e-06, - "loss": 0.0071, + "epoch": 1.01, + "learning_rate": 0.00014799795739033284, + "loss": 0.0112, "step": 390930 }, { - "epoch": 1.97, - "learning_rate": 4.148609310280458e-06, - "loss": 0.0044, + "epoch": 1.01, + "learning_rate": 0.00014799406917396138, + "loss": 0.013, "step": 390940 }, { - "epoch": 1.97, - "learning_rate": 4.141041617266448e-06, - "loss": 0.007, + "epoch": 1.01, + "learning_rate": 0.00014799018095758992, + "loss": 0.0128, "step": 390950 }, { - "epoch": 1.97, - "learning_rate": 4.133473924252438e-06, - "loss": 0.0038, + "epoch": 1.01, + "learning_rate": 0.00014798629274121846, + "loss": 0.0115, "step": 390960 }, { - "epoch": 1.97, - "learning_rate": 4.125906231238427e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.000147982404524847, + "loss": 0.0106, "step": 390970 }, { - "epoch": 1.97, - "learning_rate": 4.118338538224417e-06, - "loss": 0.005, + "epoch": 1.01, + "learning_rate": 0.00014797851630847552, + "loss": 0.0117, "step": 390980 }, { - "epoch": 1.97, - "learning_rate": 4.110770845210407e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014797462809210406, + "loss": 0.0098, "step": 390990 }, { - "epoch": 1.97, - "learning_rate": 4.103203152196396e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.0001479707398757326, + "loss": 0.0121, "step": 391000 }, { - "epoch": 1.97, - "eval_cer": 0.9144003873821333, - "eval_loss": 0.00414480222389102, - "eval_runtime": 116.2164, - "eval_samples_per_second": 17.209, - "eval_steps_per_second": 4.302, + "epoch": 1.01, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.007885308936238289, + "eval_runtime": 107.5773, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, "step": 391000 }, { - "epoch": 1.97, - "learning_rate": 4.095635459182386e-06, - "loss": 0.0084, + "epoch": 1.01, + "learning_rate": 0.00014796685165936114, + "loss": 0.011, "step": 391010 }, { - "epoch": 1.97, - "learning_rate": 4.088067766168376e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014796296344298966, + "loss": 0.0124, "step": 391020 }, { - "epoch": 1.97, - "learning_rate": 4.080500073154366e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.0001479590752266182, + "loss": 0.0118, "step": 391030 }, { - "epoch": 1.97, - "learning_rate": 4.072932380140355e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.00014795518701024674, + "loss": 0.0129, "step": 391040 }, { - "epoch": 1.97, - "learning_rate": 4.065364687126345e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014795129879387526, + "loss": 0.0124, "step": 391050 }, { - "epoch": 1.97, - "learning_rate": 4.057796994112335e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.0001479474105775038, + "loss": 0.0151, "step": 391060 }, { - "epoch": 1.97, - "learning_rate": 4.0502293010983245e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014794352236113234, + "loss": 0.0108, "step": 391070 }, { - "epoch": 1.97, - "learning_rate": 4.042661608084314e-06, - "loss": 0.004, + "epoch": 1.01, + "learning_rate": 0.00014793963414476088, + "loss": 0.0123, "step": 391080 }, { - "epoch": 1.97, - "learning_rate": 4.0350939150703035e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.0001479357459283894, + "loss": 0.0134, "step": 391090 }, { - "epoch": 1.97, - "learning_rate": 4.027526222056293e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014793185771201794, + "loss": 0.0142, "step": 391100 }, { - "epoch": 1.97, - "learning_rate": 4.019958529042283e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.00014792796949564648, + "loss": 0.0101, "step": 391110 }, { - "epoch": 1.97, - "learning_rate": 4.012390836028272e-06, - "loss": 0.0045, + "epoch": 1.01, + "learning_rate": 0.00014792408127927502, + "loss": 0.016, "step": 391120 }, { - "epoch": 1.97, - "learning_rate": 4.004823143014262e-06, - "loss": 0.0058, + "epoch": 1.01, + "learning_rate": 0.00014792019306290353, + "loss": 0.0117, "step": 391130 }, { - "epoch": 1.97, - "learning_rate": 3.997255450000251e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.0001479163048465321, + "loss": 0.0134, "step": 391140 }, { - "epoch": 1.97, - "learning_rate": 3.989687756986241e-06, - "loss": 0.0035, + "epoch": 1.01, + "learning_rate": 0.00014791241663016062, + "loss": 0.0094, "step": 391150 }, { - "epoch": 1.97, - "learning_rate": 3.982120063972231e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014790852841378916, + "loss": 0.0106, "step": 391160 }, { - "epoch": 1.97, - "learning_rate": 3.974552370958221e-06, - "loss": 0.0056, + "epoch": 1.01, + "learning_rate": 0.0001479046401974177, + "loss": 0.0107, "step": 391170 }, { - "epoch": 1.97, - "learning_rate": 3.96698467794421e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014790075198104624, + "loss": 0.0124, "step": 391180 }, { - "epoch": 1.97, - "learning_rate": 3.9594169849302e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014789686376467476, + "loss": 0.0083, "step": 391190 }, { - "epoch": 1.97, - "learning_rate": 3.95184929191619e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.0001478929755483033, + "loss": 0.0165, "step": 391200 }, { - "epoch": 1.97, - "learning_rate": 3.94428159890218e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014788908733193184, + "loss": 0.012, "step": 391210 }, { - "epoch": 1.97, - "learning_rate": 3.936713905888169e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014788519911556038, + "loss": 0.0098, "step": 391220 }, { - "epoch": 1.97, - "learning_rate": 3.929146212874159e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.0001478813108991889, + "loss": 0.0117, "step": 391230 }, { - "epoch": 1.97, - "learning_rate": 3.921578519860149e-06, - "loss": 0.0072, + "epoch": 1.01, + "learning_rate": 0.00014787742268281744, + "loss": 0.0145, "step": 391240 }, { - "epoch": 1.97, - "learning_rate": 3.914010826846139e-06, - "loss": 0.0052, + "epoch": 1.01, + "learning_rate": 0.00014787353446644598, + "loss": 0.0108, "step": 391250 }, { - "epoch": 1.97, - "learning_rate": 3.906443133832128e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014786964625007452, + "loss": 0.0124, "step": 391260 }, { - "epoch": 1.97, - "learning_rate": 3.898875440818118e-06, - "loss": 0.0041, + "epoch": 1.01, + "learning_rate": 0.00014786575803370304, + "loss": 0.0125, "step": 391270 }, { - "epoch": 1.97, - "learning_rate": 3.891307747804108e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014786186981733158, + "loss": 0.0099, "step": 391280 }, { - "epoch": 1.97, - "learning_rate": 3.8837400547900975e-06, - "loss": 0.0046, + "epoch": 1.01, + "learning_rate": 0.00014785798160096012, + "loss": 0.0118, "step": 391290 }, { - "epoch": 1.97, - "learning_rate": 3.876172361776087e-06, - "loss": 0.0065, + "epoch": 1.01, + "learning_rate": 0.00014785409338458863, + "loss": 0.0132, "step": 391300 }, { - "epoch": 1.97, - "learning_rate": 3.8686046687620765e-06, - "loss": 0.0061, + "epoch": 1.01, + "learning_rate": 0.0001478502051682172, + "loss": 0.0123, "step": 391310 }, { - "epoch": 1.97, - "learning_rate": 3.861036975748066e-06, - "loss": 0.0092, + "epoch": 1.01, + "learning_rate": 0.00014784631695184572, + "loss": 0.0108, "step": 391320 }, { - "epoch": 1.97, - "learning_rate": 3.853469282734056e-06, - "loss": 0.0039, + "epoch": 1.01, + "learning_rate": 0.00014784242873547426, + "loss": 0.0111, "step": 391330 }, { - "epoch": 1.97, - "learning_rate": 3.845901589720045e-06, - "loss": 0.0042, + "epoch": 1.01, + "learning_rate": 0.0001478385405191028, + "loss": 0.0126, "step": 391340 }, { - "epoch": 1.97, - "learning_rate": 3.838333896706035e-06, - "loss": 0.0051, + "epoch": 1.01, + "learning_rate": 0.00014783465230273134, + "loss": 0.0136, "step": 391350 }, { - "epoch": 1.97, - "learning_rate": 3.830766203692024e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014783076408635986, + "loss": 0.0108, "step": 391360 }, { - "epoch": 1.97, - "learning_rate": 3.823198510678014e-06, - "loss": 0.0039, + "epoch": 1.01, + "learning_rate": 0.0001478268758699884, + "loss": 0.0107, "step": 391370 }, { - "epoch": 1.97, - "learning_rate": 3.815630817664004e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014782298765361694, + "loss": 0.0102, "step": 391380 }, { - "epoch": 1.97, - "learning_rate": 3.808063124649994e-06, - "loss": 0.0062, + "epoch": 1.01, + "learning_rate": 0.00014781909943724548, + "loss": 0.0107, "step": 391390 }, { - "epoch": 1.97, - "learning_rate": 3.8004954316359836e-06, - "loss": 0.0057, + "epoch": 1.01, + "learning_rate": 0.000147815211220874, + "loss": 0.0116, "step": 391400 }, { - "epoch": 1.97, - "learning_rate": 3.7929277386219735e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014781132300450254, + "loss": 0.0127, "step": 391410 }, { - "epoch": 1.97, - "learning_rate": 3.785360045607963e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014780743478813108, + "loss": 0.0109, "step": 391420 }, { - "epoch": 1.97, - "learning_rate": 3.777792352593953e-06, - "loss": 0.006, + "epoch": 1.01, + "learning_rate": 0.00014780354657175962, + "loss": 0.0104, "step": 391430 }, { - "epoch": 1.97, - "learning_rate": 3.7702246595799424e-06, - "loss": 0.0035, + "epoch": 1.01, + "learning_rate": 0.00014779965835538814, + "loss": 0.0099, "step": 391440 }, { - "epoch": 1.97, - "learning_rate": 3.7626569665659323e-06, - "loss": 0.0038, + "epoch": 1.01, + "learning_rate": 0.00014779577013901668, + "loss": 0.0128, "step": 391450 }, { - "epoch": 1.97, - "learning_rate": 3.7550892735519214e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014779188192264522, + "loss": 0.0097, "step": 391460 }, { - "epoch": 1.98, - "learning_rate": 3.7475215805379117e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.00014778799370627376, + "loss": 0.0142, "step": 391470 }, { - "epoch": 1.98, - "learning_rate": 3.7399538875239008e-06, - "loss": 0.0048, + "epoch": 1.01, + "learning_rate": 0.00014778410548990227, + "loss": 0.0167, "step": 391480 }, { - "epoch": 1.98, - "learning_rate": 3.7323861945098907e-06, - "loss": 0.0047, + "epoch": 1.01, + "learning_rate": 0.00014778021727353084, + "loss": 0.0122, "step": 391490 }, { - "epoch": 1.98, - "learning_rate": 3.72481850149588e-06, - "loss": 0.0091, + "epoch": 1.01, + "learning_rate": 0.00014777632905715936, + "loss": 0.0122, "step": 391500 }, { - "epoch": 1.98, - "learning_rate": 3.71725080848187e-06, - "loss": 0.0053, + "epoch": 1.01, + "learning_rate": 0.0001477724408407879, + "loss": 0.0119, "step": 391510 }, { - "epoch": 1.98, - "learning_rate": 3.7096831154678596e-06, - "loss": 0.0064, + "epoch": 1.01, + "learning_rate": 0.00014776855262441644, + "loss": 0.0105, "step": 391520 }, { - "epoch": 1.98, - "learning_rate": 3.702115422453849e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014776466440804496, + "loss": 0.0085, "step": 391530 }, { - "epoch": 1.98, - "learning_rate": 3.694547729439839e-06, - "loss": 0.0063, + "epoch": 1.01, + "learning_rate": 0.0001477607761916735, + "loss": 0.0134, "step": 391540 }, { - "epoch": 1.98, - "learning_rate": 3.6869800364258285e-06, - "loss": 0.0049, + "epoch": 1.01, + "learning_rate": 0.00014775688797530204, + "loss": 0.0097, "step": 391550 }, { - "epoch": 1.98, - "learning_rate": 3.6794123434118184e-06, - "loss": 0.0054, + "epoch": 1.01, + "learning_rate": 0.00014775299975893058, + "loss": 0.0121, "step": 391560 }, { - "epoch": 1.98, - "learning_rate": 3.671844650397808e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.0001477491115425591, + "loss": 0.0114, "step": 391570 }, { - "epoch": 1.98, - "learning_rate": 3.6642769573837978e-06, - "loss": 0.0064, + "epoch": 1.02, + "learning_rate": 0.00014774522332618764, + "loss": 0.0107, "step": 391580 }, { - "epoch": 1.98, - "learning_rate": 3.6567092643697873e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014774133510981618, + "loss": 0.016, "step": 391590 }, { - "epoch": 1.98, - "learning_rate": 3.649141571355777e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014773744689344472, + "loss": 0.0125, "step": 391600 }, { - "epoch": 1.98, - "learning_rate": 3.6415738783417667e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.00014773355867707323, + "loss": 0.0119, "step": 391610 }, { - "epoch": 1.98, - "learning_rate": 3.6340061853277566e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014772967046070178, + "loss": 0.0136, "step": 391620 }, { - "epoch": 1.98, - "learning_rate": 3.626438492313746e-06, - "loss": 0.0081, + "epoch": 1.02, + "learning_rate": 0.00014772578224433032, + "loss": 0.0109, "step": 391630 }, { - "epoch": 1.98, - "learning_rate": 3.618870799299736e-06, - "loss": 0.009, + "epoch": 1.02, + "learning_rate": 0.00014772189402795886, + "loss": 0.0139, "step": 391640 }, { - "epoch": 1.98, - "learning_rate": 3.6113031062857255e-06, - "loss": 0.0033, + "epoch": 1.02, + "learning_rate": 0.00014771800581158737, + "loss": 0.0143, "step": 391650 }, { - "epoch": 1.98, - "learning_rate": 3.6037354132717154e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.00014771411759521594, + "loss": 0.0122, "step": 391660 }, { - "epoch": 1.98, - "learning_rate": 3.5961677202577045e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014771022937884446, + "loss": 0.0134, "step": 391670 }, { - "epoch": 1.98, - "learning_rate": 3.588600027243695e-06, - "loss": 0.0057, + "epoch": 1.02, + "learning_rate": 0.000147706341162473, + "loss": 0.0126, "step": 391680 }, { - "epoch": 1.98, - "learning_rate": 3.581032334229684e-06, - "loss": 0.0076, + "epoch": 1.02, + "learning_rate": 0.00014770245294610154, + "loss": 0.0095, "step": 391690 }, { - "epoch": 1.98, - "learning_rate": 3.5734646412156738e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014769856472973008, + "loss": 0.0105, "step": 391700 }, { - "epoch": 1.98, - "learning_rate": 3.5658969482016633e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.0001476946765133586, + "loss": 0.0084, "step": 391710 }, { - "epoch": 1.98, - "learning_rate": 3.558329255187653e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014769078829698714, + "loss": 0.0118, "step": 391720 }, { - "epoch": 1.98, - "learning_rate": 3.5507615621736427e-06, - "loss": 0.0072, + "epoch": 1.02, + "learning_rate": 0.00014768690008061568, + "loss": 0.0141, "step": 391730 }, { - "epoch": 1.98, - "learning_rate": 3.5431938691596326e-06, - "loss": 0.0058, + "epoch": 1.02, + "learning_rate": 0.00014768301186424422, + "loss": 0.0119, "step": 391740 }, { - "epoch": 1.98, - "learning_rate": 3.535626176145622e-06, - "loss": 0.0039, + "epoch": 1.02, + "learning_rate": 0.00014767912364787274, + "loss": 0.0118, "step": 391750 }, { - "epoch": 1.98, - "learning_rate": 3.528058483131612e-06, - "loss": 0.0067, + "epoch": 1.02, + "learning_rate": 0.00014767523543150128, + "loss": 0.0129, "step": 391760 }, { - "epoch": 1.98, - "learning_rate": 3.5204907901176015e-06, - "loss": 0.0043, + "epoch": 1.02, + "learning_rate": 0.00014767134721512982, + "loss": 0.0114, "step": 391770 }, { - "epoch": 1.98, - "learning_rate": 3.5129230971035914e-06, - "loss": 0.0057, + "epoch": 1.02, + "learning_rate": 0.00014766745899875833, + "loss": 0.0101, "step": 391780 }, { - "epoch": 1.98, - "learning_rate": 3.505355404089581e-06, - "loss": 0.0087, + "epoch": 1.02, + "learning_rate": 0.00014766357078238688, + "loss": 0.0112, "step": 391790 }, { - "epoch": 1.98, - "learning_rate": 3.4977877110755708e-06, - "loss": 0.0045, + "epoch": 1.02, + "learning_rate": 0.00014765968256601542, + "loss": 0.0113, "step": 391800 }, { - "epoch": 1.98, - "learning_rate": 3.4902200180615603e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014765579434964396, + "loss": 0.0097, "step": 391810 }, { - "epoch": 1.98, - "learning_rate": 3.48265232504755e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014765190613327247, + "loss": 0.01, "step": 391820 }, { - "epoch": 1.98, - "learning_rate": 3.4750846320335397e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.00014764801791690104, + "loss": 0.0126, "step": 391830 }, { - "epoch": 1.98, - "learning_rate": 3.4675169390195296e-06, - "loss": 0.0066, + "epoch": 1.02, + "learning_rate": 0.00014764412970052956, + "loss": 0.0099, "step": 391840 }, { - "epoch": 1.98, - "learning_rate": 3.459949246005519e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.0001476402414841581, + "loss": 0.0135, "step": 391850 }, { - "epoch": 1.98, - "learning_rate": 3.452381552991509e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014763635326778664, + "loss": 0.0128, "step": 391860 }, { - "epoch": 1.98, - "learning_rate": 3.4448138599774985e-06, - "loss": 0.009, + "epoch": 1.02, + "learning_rate": 0.00014763246505141518, + "loss": 0.0091, "step": 391870 }, { - "epoch": 1.98, - "learning_rate": 3.4372461669634884e-06, - "loss": 0.0059, + "epoch": 1.02, + "learning_rate": 0.0001476285768350437, + "loss": 0.0118, "step": 391880 }, { - "epoch": 1.98, - "learning_rate": 3.429678473949478e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014762468861867224, + "loss": 0.0156, "step": 391890 }, { - "epoch": 1.98, - "learning_rate": 3.422110780935468e-06, - "loss": 0.0061, + "epoch": 1.02, + "learning_rate": 0.00014762080040230078, + "loss": 0.0141, "step": 391900 }, { - "epoch": 1.98, - "learning_rate": 3.414543087921457e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014761691218592932, + "loss": 0.0196, "step": 391910 }, { - "epoch": 1.98, - "learning_rate": 3.406975394907447e-06, - "loss": 0.008, + "epoch": 1.02, + "learning_rate": 0.00014761302396955784, + "loss": 0.0109, "step": 391920 }, { - "epoch": 1.98, - "learning_rate": 3.3994077018934363e-06, - "loss": 0.0062, + "epoch": 1.02, + "learning_rate": 0.00014760913575318638, + "loss": 0.0143, "step": 391930 }, { - "epoch": 1.98, - "learning_rate": 3.391840008879426e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014760524753681492, + "loss": 0.013, "step": 391940 }, { - "epoch": 1.98, - "learning_rate": 3.3842723158654157e-06, - "loss": 0.0044, + "epoch": 1.02, + "learning_rate": 0.00014760135932044346, + "loss": 0.0103, "step": 391950 }, { - "epoch": 1.98, - "learning_rate": 3.3767046228514056e-06, - "loss": 0.0078, + "epoch": 1.02, + "learning_rate": 0.00014759747110407198, + "loss": 0.0097, "step": 391960 }, { - "epoch": 1.98, - "learning_rate": 3.369136929837395e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014759358288770052, + "loss": 0.0104, "step": 391970 }, { - "epoch": 1.98, - "learning_rate": 3.361569236823385e-06, - "loss": 0.0071, + "epoch": 1.02, + "learning_rate": 0.00014758969467132906, + "loss": 0.0109, "step": 391980 }, { - "epoch": 1.98, - "learning_rate": 3.3540015438093745e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.0001475858064549576, + "loss": 0.0133, "step": 391990 }, { - "epoch": 1.98, - "learning_rate": 3.3464338507953644e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014758191823858611, + "loss": 0.0114, "step": 392000 }, { - "epoch": 1.98, - "eval_cer": 0.9144130025317635, - "eval_loss": 0.004128037486225367, - "eval_runtime": 116.0593, - "eval_samples_per_second": 17.233, - "eval_steps_per_second": 4.308, + "epoch": 1.02, + "eval_cer": 0.8817488743419957, + "eval_loss": 0.007738828659057617, + "eval_runtime": 107.489, + "eval_samples_per_second": 18.607, + "eval_steps_per_second": 4.652, "step": 392000 }, { - "epoch": 1.98, - "learning_rate": 3.338866157781354e-06, - "loss": 0.0077, + "epoch": 1.02, + "learning_rate": 0.00014757803002221466, + "loss": 0.0153, "step": 392010 }, { - "epoch": 1.98, - "learning_rate": 3.331298464767344e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.0001475741418058432, + "loss": 0.0097, "step": 392020 }, { - "epoch": 1.98, - "learning_rate": 3.3237307717533333e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.00014757025358947174, + "loss": 0.0129, "step": 392030 }, { - "epoch": 1.98, - "learning_rate": 3.316163078739323e-06, - "loss": 0.0056, + "epoch": 1.02, + "learning_rate": 0.00014756636537310028, + "loss": 0.0159, "step": 392040 }, { - "epoch": 1.98, - "learning_rate": 3.3085953857253127e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.0001475624771567288, + "loss": 0.0127, "step": 392050 }, { - "epoch": 1.98, - "learning_rate": 3.3010276927113026e-06, - "loss": 0.0064, + "epoch": 1.02, + "learning_rate": 0.00014755858894035734, + "loss": 0.0104, "step": 392060 }, { - "epoch": 1.98, - "learning_rate": 3.293459999697292e-06, - "loss": 0.0061, + "epoch": 1.02, + "learning_rate": 0.00014755470072398588, + "loss": 0.0096, "step": 392070 }, { - "epoch": 1.98, - "learning_rate": 3.2858923066832816e-06, - "loss": 0.0061, + "epoch": 1.02, + "learning_rate": 0.00014755081250761442, + "loss": 0.0109, "step": 392080 }, { - "epoch": 1.98, - "learning_rate": 3.2783246136692715e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014754692429124294, + "loss": 0.0106, "step": 392090 }, { - "epoch": 1.98, - "learning_rate": 3.270756920655261e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014754303607487148, + "loss": 0.0174, "step": 392100 }, { - "epoch": 1.98, - "learning_rate": 3.263189227641251e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014753914785850002, + "loss": 0.0128, "step": 392110 }, { - "epoch": 1.98, - "learning_rate": 3.25562153462724e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014753525964212856, + "loss": 0.0129, "step": 392120 }, { - "epoch": 1.98, - "learning_rate": 3.2480538416132303e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.00014753137142575707, + "loss": 0.0126, "step": 392130 }, { - "epoch": 1.98, - "learning_rate": 3.2404861485992194e-06, - "loss": 0.0061, + "epoch": 1.02, + "learning_rate": 0.00014752748320938562, + "loss": 0.0092, "step": 392140 }, { - "epoch": 1.98, - "learning_rate": 3.2329184555852093e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014752359499301416, + "loss": 0.0159, "step": 392150 }, { - "epoch": 1.98, - "learning_rate": 3.2253507625711988e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.0001475197067766427, + "loss": 0.0128, "step": 392160 }, { - "epoch": 1.98, - "learning_rate": 3.2177830695571887e-06, - "loss": 0.01, + "epoch": 1.02, + "learning_rate": 0.00014751581856027121, + "loss": 0.0118, "step": 392170 }, { - "epoch": 1.98, - "learning_rate": 3.210215376543178e-06, - "loss": 0.0038, + "epoch": 1.02, + "learning_rate": 0.00014751193034389978, + "loss": 0.0111, "step": 392180 }, { - "epoch": 1.98, - "learning_rate": 3.202647683529168e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.0001475080421275283, + "loss": 0.0136, "step": 392190 }, { - "epoch": 1.98, - "learning_rate": 3.1950799905151576e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014750415391115684, + "loss": 0.0122, "step": 392200 }, { - "epoch": 1.98, - "learning_rate": 3.1875122975011475e-06, - "loss": 0.0056, + "epoch": 1.02, + "learning_rate": 0.00014750026569478538, + "loss": 0.0119, "step": 392210 }, { - "epoch": 1.98, - "learning_rate": 3.179944604487137e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014749637747841392, + "loss": 0.0125, "step": 392220 }, { - "epoch": 1.98, - "learning_rate": 3.172376911473127e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.00014749248926204244, + "loss": 0.0132, "step": 392230 }, { - "epoch": 1.98, - "learning_rate": 3.1648092184591164e-06, - "loss": 0.0033, + "epoch": 1.02, + "learning_rate": 0.00014748860104567098, + "loss": 0.012, "step": 392240 }, { - "epoch": 1.98, - "learning_rate": 3.1572415254451063e-06, - "loss": 0.0056, + "epoch": 1.02, + "learning_rate": 0.00014748471282929952, + "loss": 0.0092, "step": 392250 }, { - "epoch": 1.98, - "learning_rate": 3.1496738324310958e-06, - "loss": 0.0044, + "epoch": 1.02, + "learning_rate": 0.00014748082461292803, + "loss": 0.0115, "step": 392260 }, { - "epoch": 1.98, - "learning_rate": 3.1421061394170857e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014747693639655658, + "loss": 0.0116, "step": 392270 }, { - "epoch": 1.98, - "learning_rate": 3.134538446403075e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014747304818018512, + "loss": 0.0092, "step": 392280 }, { - "epoch": 1.98, - "learning_rate": 3.126970753389065e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014746915996381366, + "loss": 0.0167, "step": 392290 }, { - "epoch": 1.98, - "learning_rate": 3.1194030603750546e-06, - "loss": 0.0047, + "epoch": 1.02, + "learning_rate": 0.00014746527174744217, + "loss": 0.0119, "step": 392300 }, { - "epoch": 1.98, - "learning_rate": 3.1118353673610445e-06, - "loss": 0.0059, + "epoch": 1.02, + "learning_rate": 0.00014746138353107072, + "loss": 0.0125, "step": 392310 }, { - "epoch": 1.98, - "learning_rate": 3.104267674347034e-06, - "loss": 0.0068, + "epoch": 1.02, + "learning_rate": 0.00014745749531469926, + "loss": 0.0107, "step": 392320 }, { - "epoch": 1.98, - "learning_rate": 3.096699981333024e-06, - "loss": 0.0064, + "epoch": 1.02, + "learning_rate": 0.0001474536070983278, + "loss": 0.0151, "step": 392330 }, { - "epoch": 1.98, - "learning_rate": 3.0891322883190134e-06, - "loss": 0.0061, + "epoch": 1.02, + "learning_rate": 0.00014744971888195631, + "loss": 0.0124, "step": 392340 }, { - "epoch": 1.98, - "learning_rate": 3.0815645953050033e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014744583066558486, + "loss": 0.013, "step": 392350 }, { - "epoch": 1.98, - "learning_rate": 3.0739969022909924e-06, - "loss": 0.0095, + "epoch": 1.02, + "learning_rate": 0.0001474419424492134, + "loss": 0.0116, "step": 392360 }, { - "epoch": 1.98, - "learning_rate": 3.0664292092769827e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014743805423284194, + "loss": 0.0165, "step": 392370 }, { - "epoch": 1.98, - "learning_rate": 3.0588615162629718e-06, - "loss": 0.0036, + "epoch": 1.02, + "learning_rate": 0.00014743416601647048, + "loss": 0.0108, "step": 392380 }, { - "epoch": 1.98, - "learning_rate": 3.0512938232489617e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.00014743027780009902, + "loss": 0.0101, "step": 392390 }, { - "epoch": 1.98, - "learning_rate": 3.043726130234951e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014742638958372754, + "loss": 0.0117, "step": 392400 }, { - "epoch": 1.98, - "learning_rate": 3.036158437220941e-06, - "loss": 0.0077, + "epoch": 1.02, + "learning_rate": 0.00014742250136735608, + "loss": 0.0108, "step": 392410 }, { - "epoch": 1.98, - "learning_rate": 3.0285907442069306e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014741861315098462, + "loss": 0.0094, "step": 392420 }, { - "epoch": 1.98, - "learning_rate": 3.0210230511929205e-06, - "loss": 0.0034, + "epoch": 1.02, + "learning_rate": 0.00014741472493461316, + "loss": 0.0094, "step": 392430 }, { - "epoch": 1.98, - "learning_rate": 3.01345535817891e-06, - "loss": 0.0081, + "epoch": 1.02, + "learning_rate": 0.00014741083671824168, + "loss": 0.0107, "step": 392440 }, { - "epoch": 1.98, - "learning_rate": 3.0058876651649e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014740694850187022, + "loss": 0.0122, "step": 392450 }, { - "epoch": 1.98, - "learning_rate": 2.9983199721508894e-06, - "loss": 0.0056, + "epoch": 1.02, + "learning_rate": 0.00014740306028549876, + "loss": 0.011, "step": 392460 }, { - "epoch": 1.98, - "learning_rate": 2.9907522791368793e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.0001473991720691273, + "loss": 0.0109, "step": 392470 }, { - "epoch": 1.98, - "learning_rate": 2.9831845861228688e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014739528385275582, + "loss": 0.0121, "step": 392480 }, { - "epoch": 1.98, - "learning_rate": 2.9756168931088587e-06, - "loss": 0.0078, + "epoch": 1.02, + "learning_rate": 0.00014739139563638436, + "loss": 0.0124, "step": 392490 }, { - "epoch": 1.98, - "learning_rate": 2.968049200094848e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.0001473875074200129, + "loss": 0.0113, "step": 392500 }, { - "epoch": 1.98, - "learning_rate": 2.960481507080838e-06, - "loss": 0.0044, + "epoch": 1.02, + "learning_rate": 0.0001473836192036414, + "loss": 0.0108, "step": 392510 }, { - "epoch": 1.98, - "learning_rate": 2.9529138140668276e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014737973098726995, + "loss": 0.0156, "step": 392520 }, { - "epoch": 1.98, - "learning_rate": 2.9453461210528175e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.0001473758427708985, + "loss": 0.0108, "step": 392530 }, { - "epoch": 1.98, - "learning_rate": 2.937778428038807e-06, - "loss": 0.0075, + "epoch": 1.02, + "learning_rate": 0.00014737195455452704, + "loss": 0.0112, "step": 392540 }, { - "epoch": 1.98, - "learning_rate": 2.930210735024797e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.00014736806633815555, + "loss": 0.0124, "step": 392550 }, { - "epoch": 1.98, - "learning_rate": 2.9226430420107864e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.00014736417812178412, + "loss": 0.0158, "step": 392560 }, { - "epoch": 1.98, - "learning_rate": 2.9150753489967763e-06, - "loss": 0.0062, + "epoch": 1.02, + "learning_rate": 0.00014736028990541264, + "loss": 0.0111, "step": 392570 }, { - "epoch": 1.98, - "learning_rate": 2.9075076559827658e-06, - "loss": 0.0094, + "epoch": 1.02, + "learning_rate": 0.00014735640168904118, + "loss": 0.0122, "step": 392580 }, { - "epoch": 1.98, - "learning_rate": 2.8999399629687557e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.00014735251347266972, + "loss": 0.0242, "step": 392590 }, { - "epoch": 1.98, - "learning_rate": 2.8923722699547448e-06, - "loss": 0.0071, + "epoch": 1.02, + "learning_rate": 0.00014734862525629826, + "loss": 0.0129, "step": 392600 }, { - "epoch": 1.98, - "learning_rate": 2.8848045769407347e-06, - "loss": 0.0082, + "epoch": 1.02, + "learning_rate": 0.00014734473703992678, + "loss": 0.0103, "step": 392610 }, { - "epoch": 1.98, - "learning_rate": 2.877236883926724e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014734084882355532, + "loss": 0.0083, "step": 392620 }, { - "epoch": 1.98, - "learning_rate": 2.8696691909127136e-06, - "loss": 0.0043, + "epoch": 1.02, + "learning_rate": 0.00014733696060718386, + "loss": 0.01, "step": 392630 }, { - "epoch": 1.98, - "learning_rate": 2.8621014978987036e-06, - "loss": 0.004, + "epoch": 1.02, + "learning_rate": 0.0001473330723908124, + "loss": 0.0101, "step": 392640 }, { - "epoch": 1.98, - "learning_rate": 2.854533804884693e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.00014732918417444091, + "loss": 0.0102, "step": 392650 }, { - "epoch": 1.98, - "learning_rate": 2.846966111870683e-06, - "loss": 0.0045, + "epoch": 1.02, + "learning_rate": 0.00014732529595806946, + "loss": 0.0097, "step": 392660 }, { - "epoch": 1.98, - "learning_rate": 2.8393984188566725e-06, - "loss": 0.0035, + "epoch": 1.02, + "learning_rate": 0.000147321407741698, + "loss": 0.0113, "step": 392670 }, { - "epoch": 1.98, - "learning_rate": 2.8318307258426624e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014731751952532654, + "loss": 0.0149, "step": 392680 }, { - "epoch": 1.98, - "learning_rate": 2.824263032828652e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014731363130895505, + "loss": 0.0152, "step": 392690 }, { - "epoch": 1.98, - "learning_rate": 2.8166953398146418e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.00014730974309258362, + "loss": 0.009, "step": 392700 }, { - "epoch": 1.98, - "learning_rate": 2.8091276468006313e-06, - "loss": 0.0047, + "epoch": 1.02, + "learning_rate": 0.00014730585487621214, + "loss": 0.0104, "step": 392710 }, { - "epoch": 1.98, - "learning_rate": 2.801559953786621e-06, - "loss": 0.0072, + "epoch": 1.02, + "learning_rate": 0.00014730196665984068, + "loss": 0.0108, "step": 392720 }, { - "epoch": 1.98, - "learning_rate": 2.7939922607726107e-06, - "loss": 0.0072, + "epoch": 1.02, + "learning_rate": 0.00014729807844346922, + "loss": 0.0116, "step": 392730 }, { - "epoch": 1.98, - "learning_rate": 2.7864245677586006e-06, - "loss": 0.0058, + "epoch": 1.02, + "learning_rate": 0.00014729419022709776, + "loss": 0.0109, "step": 392740 }, { - "epoch": 1.98, - "learning_rate": 2.77885687474459e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014729030201072628, + "loss": 0.0178, "step": 392750 }, { - "epoch": 1.98, - "learning_rate": 2.77128918173058e-06, - "loss": 0.0057, + "epoch": 1.02, + "learning_rate": 0.00014728641379435482, + "loss": 0.0109, "step": 392760 }, { - "epoch": 1.98, - "learning_rate": 2.7637214887165695e-06, - "loss": 0.0065, + "epoch": 1.02, + "learning_rate": 0.00014728252557798336, + "loss": 0.0183, "step": 392770 }, { - "epoch": 1.98, - "learning_rate": 2.7561537957025594e-06, - "loss": 0.0039, + "epoch": 1.02, + "learning_rate": 0.00014727863736161187, + "loss": 0.0121, "step": 392780 }, { - "epoch": 1.98, - "learning_rate": 2.7485861026885484e-06, - "loss": 0.0066, + "epoch": 1.02, + "learning_rate": 0.00014727474914524042, + "loss": 0.0158, "step": 392790 }, { - "epoch": 1.98, - "learning_rate": 2.7410184096745388e-06, - "loss": 0.0073, + "epoch": 1.02, + "learning_rate": 0.00014727086092886896, + "loss": 0.0121, "step": 392800 }, { - "epoch": 1.98, - "learning_rate": 2.733450716660528e-06, - "loss": 0.0041, + "epoch": 1.02, + "learning_rate": 0.0001472669727124975, + "loss": 0.0103, "step": 392810 }, { - "epoch": 1.98, - "learning_rate": 2.7258830236465178e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014726308449612601, + "loss": 0.0108, "step": 392820 }, { - "epoch": 1.98, - "learning_rate": 2.7183153306325072e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014725919627975456, + "loss": 0.0129, "step": 392830 }, { - "epoch": 1.98, - "learning_rate": 2.710747637618497e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.0001472553080633831, + "loss": 0.0106, "step": 392840 }, { - "epoch": 1.98, - "learning_rate": 2.7031799446044866e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014725141984701164, + "loss": 0.0119, "step": 392850 }, { - "epoch": 1.98, - "learning_rate": 2.6956122515904766e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014724753163064015, + "loss": 0.0109, "step": 392860 }, { - "epoch": 1.98, - "learning_rate": 2.688044558576466e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.0001472436434142687, + "loss": 0.0088, "step": 392870 }, { - "epoch": 1.98, - "learning_rate": 2.680476865562456e-06, - "loss": 0.0038, + "epoch": 1.02, + "learning_rate": 0.00014723975519789724, + "loss": 0.0107, "step": 392880 }, { - "epoch": 1.98, - "learning_rate": 2.6729091725484455e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014723586698152578, + "loss": 0.0113, "step": 392890 }, { - "epoch": 1.98, - "learning_rate": 2.6653414795344354e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.00014723197876515432, + "loss": 0.015, "step": 392900 }, { - "epoch": 1.98, - "learning_rate": 2.657773786520425e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.00014722809054878286, + "loss": 0.0119, "step": 392910 }, { - "epoch": 1.98, - "learning_rate": 2.6502060935064148e-06, - "loss": 0.0067, + "epoch": 1.02, + "learning_rate": 0.00014722420233241138, + "loss": 0.0132, "step": 392920 }, { - "epoch": 1.98, - "learning_rate": 2.6426384004924043e-06, - "loss": 0.0068, + "epoch": 1.02, + "learning_rate": 0.00014722031411603992, + "loss": 0.0159, "step": 392930 }, { - "epoch": 1.98, - "learning_rate": 2.635070707478394e-06, - "loss": 0.0044, + "epoch": 1.02, + "learning_rate": 0.00014721642589966846, + "loss": 0.0097, "step": 392940 }, { - "epoch": 1.98, - "learning_rate": 2.6275030144643837e-06, - "loss": 0.0058, + "epoch": 1.02, + "learning_rate": 0.000147212537683297, + "loss": 0.0112, "step": 392950 }, { - "epoch": 1.98, - "learning_rate": 2.6199353214503736e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.00014720864946692552, + "loss": 0.0129, "step": 392960 }, { - "epoch": 1.98, - "learning_rate": 2.612367628436363e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014720476125055406, + "loss": 0.0189, "step": 392970 }, { - "epoch": 1.98, - "learning_rate": 2.604799935422353e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.0001472008730341826, + "loss": 0.0119, "step": 392980 }, { - "epoch": 1.98, - "learning_rate": 2.5972322424083425e-06, - "loss": 0.0045, + "epoch": 1.02, + "learning_rate": 0.00014719698481781114, + "loss": 0.0102, "step": 392990 }, { - "epoch": 1.98, - "learning_rate": 2.5896645493943324e-06, - "loss": 0.0069, + "epoch": 1.02, + "learning_rate": 0.00014719309660143966, + "loss": 0.0101, "step": 393000 }, { - "epoch": 1.98, - "eval_cer": 0.9144188249085159, - "eval_loss": 0.004126059357076883, - "eval_runtime": 116.0572, - "eval_samples_per_second": 17.233, - "eval_steps_per_second": 4.308, + "epoch": 1.02, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.008117906749248505, + "eval_runtime": 107.5812, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, "step": 393000 }, { - "epoch": 1.98, - "learning_rate": 2.582096856380322e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.0001471892083850682, + "loss": 0.0108, "step": 393010 }, { - "epoch": 1.98, - "learning_rate": 2.5745291633663118e-06, - "loss": 0.01, + "epoch": 1.02, + "learning_rate": 0.00014718532016869674, + "loss": 0.013, "step": 393020 }, { - "epoch": 1.98, - "learning_rate": 2.566961470352301e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014718143195232525, + "loss": 0.0116, "step": 393030 }, { - "epoch": 1.98, - "learning_rate": 2.559393777338291e-06, - "loss": 0.0069, + "epoch": 1.02, + "learning_rate": 0.0001471775437359538, + "loss": 0.0129, "step": 393040 }, { - "epoch": 1.98, - "learning_rate": 2.5518260843242802e-06, - "loss": 0.0043, + "epoch": 1.02, + "learning_rate": 0.00014717365551958234, + "loss": 0.0113, "step": 393050 }, { - "epoch": 1.98, - "learning_rate": 2.54425839131027e-06, - "loss": 0.0065, + "epoch": 1.02, + "learning_rate": 0.00014716976730321088, + "loss": 0.0117, "step": 393060 }, { - "epoch": 1.98, - "learning_rate": 2.5366906982962596e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.0001471658790868394, + "loss": 0.0105, "step": 393070 }, { - "epoch": 1.98, - "learning_rate": 2.5291230052822496e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014716199087046796, + "loss": 0.0118, "step": 393080 }, { - "epoch": 1.98, - "learning_rate": 2.521555312268239e-06, - "loss": 0.0072, + "epoch": 1.02, + "learning_rate": 0.00014715810265409648, + "loss": 0.0078, "step": 393090 }, { - "epoch": 1.98, - "learning_rate": 2.513987619254229e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014715421443772502, + "loss": 0.0121, "step": 393100 }, { - "epoch": 1.98, - "learning_rate": 2.5064199262402185e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014715032622135356, + "loss": 0.0067, "step": 393110 }, { - "epoch": 1.98, - "learning_rate": 2.4988522332262084e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.0001471464380049821, + "loss": 0.0152, "step": 393120 }, { - "epoch": 1.98, - "learning_rate": 2.491284540212198e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014714254978861062, + "loss": 0.0113, "step": 393130 }, { - "epoch": 1.98, - "learning_rate": 2.4837168471981878e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014713866157223916, + "loss": 0.0106, "step": 393140 }, { - "epoch": 1.98, - "learning_rate": 2.4761491541841773e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.0001471347733558677, + "loss": 0.0112, "step": 393150 }, { - "epoch": 1.98, - "learning_rate": 2.4685814611701667e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.00014713088513949624, + "loss": 0.0106, "step": 393160 }, { - "epoch": 1.98, - "learning_rate": 2.4610137681561567e-06, - "loss": 0.0057, + "epoch": 1.02, + "learning_rate": 0.00014712699692312475, + "loss": 0.0126, "step": 393170 }, { - "epoch": 1.98, - "learning_rate": 2.453446075142146e-06, - "loss": 0.0075, + "epoch": 1.02, + "learning_rate": 0.0001471231087067533, + "loss": 0.0094, "step": 393180 }, { - "epoch": 1.98, - "learning_rate": 2.445878382128136e-06, - "loss": 0.0069, + "epoch": 1.02, + "learning_rate": 0.00014711922049038184, + "loss": 0.0104, "step": 393190 }, { - "epoch": 1.98, - "learning_rate": 2.4383106891141256e-06, - "loss": 0.0038, + "epoch": 1.02, + "learning_rate": 0.00014711533227401038, + "loss": 0.0119, "step": 393200 }, { - "epoch": 1.98, - "learning_rate": 2.4307429961001155e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.0001471114440576389, + "loss": 0.0141, "step": 393210 }, { - "epoch": 1.98, - "learning_rate": 2.423175303086105e-06, - "loss": 0.007, + "epoch": 1.02, + "learning_rate": 0.00014710755584126746, + "loss": 0.0102, "step": 393220 }, { - "epoch": 1.98, - "learning_rate": 2.415607610072095e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014710366762489598, + "loss": 0.0144, "step": 393230 }, { - "epoch": 1.98, - "learning_rate": 2.408039917058084e-06, - "loss": 0.0062, + "epoch": 1.02, + "learning_rate": 0.00014709977940852452, + "loss": 0.0084, "step": 393240 }, { - "epoch": 1.98, - "learning_rate": 2.4004722240440743e-06, - "loss": 0.0051, + "epoch": 1.02, + "learning_rate": 0.00014709589119215306, + "loss": 0.014, "step": 393250 }, { - "epoch": 1.98, - "learning_rate": 2.3929045310300633e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014709200297578158, + "loss": 0.0253, "step": 393260 }, { - "epoch": 1.98, - "learning_rate": 2.3853368380160532e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014708811475941012, + "loss": 0.0128, "step": 393270 }, { - "epoch": 1.98, - "learning_rate": 2.3777691450020427e-06, - "loss": 0.0047, + "epoch": 1.02, + "learning_rate": 0.00014708422654303866, + "loss": 0.0135, "step": 393280 }, { - "epoch": 1.98, - "learning_rate": 2.3702014519880327e-06, - "loss": 0.0045, + "epoch": 1.02, + "learning_rate": 0.0001470803383266672, + "loss": 0.0145, "step": 393290 }, { - "epoch": 1.98, - "learning_rate": 2.362633758974022e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014707645011029571, + "loss": 0.012, "step": 393300 }, { - "epoch": 1.98, - "learning_rate": 2.355066065960012e-06, - "loss": 0.0052, + "epoch": 1.02, + "learning_rate": 0.00014707256189392426, + "loss": 0.0116, "step": 393310 }, { - "epoch": 1.98, - "learning_rate": 2.3474983729460015e-06, - "loss": 0.0064, + "epoch": 1.02, + "learning_rate": 0.0001470686736775528, + "loss": 0.013, "step": 393320 }, { - "epoch": 1.98, - "learning_rate": 2.3399306799319915e-06, - "loss": 0.0075, + "epoch": 1.02, + "learning_rate": 0.00014706478546118134, + "loss": 0.016, "step": 393330 }, { - "epoch": 1.98, - "learning_rate": 2.3323629869179814e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014706089724480985, + "loss": 0.0117, "step": 393340 }, { - "epoch": 1.98, - "learning_rate": 2.324795293903971e-06, - "loss": 0.0092, + "epoch": 1.02, + "learning_rate": 0.0001470570090284384, + "loss": 0.0104, "step": 393350 }, { - "epoch": 1.98, - "learning_rate": 2.3172276008899608e-06, - "loss": 0.0072, + "epoch": 1.02, + "learning_rate": 0.00014705312081206694, + "loss": 0.0131, "step": 393360 }, { - "epoch": 1.98, - "learning_rate": 2.3096599078759503e-06, - "loss": 0.0064, + "epoch": 1.02, + "learning_rate": 0.00014704923259569548, + "loss": 0.0127, "step": 393370 }, { - "epoch": 1.98, - "learning_rate": 2.3020922148619397e-06, - "loss": 0.008, + "epoch": 1.02, + "learning_rate": 0.000147045344379324, + "loss": 0.0167, "step": 393380 }, { - "epoch": 1.98, - "learning_rate": 2.2945245218479297e-06, - "loss": 0.0091, + "epoch": 1.02, + "learning_rate": 0.00014704145616295253, + "loss": 0.0107, "step": 393390 }, { - "epoch": 1.98, - "learning_rate": 2.286956828833919e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014703756794658108, + "loss": 0.0106, "step": 393400 }, { - "epoch": 1.98, - "learning_rate": 2.279389135819909e-06, - "loss": 0.0055, + "epoch": 1.02, + "learning_rate": 0.00014703367973020962, + "loss": 0.0121, "step": 393410 }, { - "epoch": 1.98, - "learning_rate": 2.2718214428058986e-06, - "loss": 0.0047, + "epoch": 1.02, + "learning_rate": 0.00014702979151383816, + "loss": 0.0146, "step": 393420 }, { - "epoch": 1.98, - "learning_rate": 2.2642537497918885e-06, - "loss": 0.0053, + "epoch": 1.02, + "learning_rate": 0.0001470259032974667, + "loss": 0.0105, "step": 393430 }, { - "epoch": 1.98, - "learning_rate": 2.256686056777878e-06, - "loss": 0.0059, + "epoch": 1.02, + "learning_rate": 0.00014702201508109522, + "loss": 0.0117, "step": 393440 }, { - "epoch": 1.98, - "learning_rate": 2.2491183637638674e-06, - "loss": 0.0043, + "epoch": 1.02, + "learning_rate": 0.00014701812686472376, + "loss": 0.0119, "step": 393450 }, { - "epoch": 1.99, - "learning_rate": 2.2415506707498574e-06, - "loss": 0.006, + "epoch": 1.02, + "learning_rate": 0.0001470142386483523, + "loss": 0.0118, "step": 393460 }, { - "epoch": 1.99, - "learning_rate": 2.233982977735847e-06, - "loss": 0.0056, + "epoch": 1.02, + "learning_rate": 0.00014701035043198084, + "loss": 0.0124, "step": 393470 }, { - "epoch": 1.99, - "learning_rate": 2.2264152847218363e-06, - "loss": 0.0046, + "epoch": 1.02, + "learning_rate": 0.00014700646221560936, + "loss": 0.0104, "step": 393480 }, { - "epoch": 1.99, - "learning_rate": 2.2188475917078262e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.0001470025739992379, + "loss": 0.0119, "step": 393490 }, { - "epoch": 1.99, - "learning_rate": 2.2112798986938157e-06, - "loss": 0.0049, + "epoch": 1.02, + "learning_rate": 0.00014699868578286644, + "loss": 0.011, "step": 393500 }, { - "epoch": 1.99, - "learning_rate": 2.2037122056798057e-06, - "loss": 0.0059, + "epoch": 1.02, + "learning_rate": 0.00014699479756649495, + "loss": 0.0093, "step": 393510 }, { - "epoch": 1.99, - "learning_rate": 2.196144512665795e-06, - "loss": 0.0071, + "epoch": 1.02, + "learning_rate": 0.0001469909093501235, + "loss": 0.0163, "step": 393520 }, { - "epoch": 1.99, - "learning_rate": 2.188576819651785e-06, - "loss": 0.0075, + "epoch": 1.02, + "learning_rate": 0.00014698702113375204, + "loss": 0.0088, "step": 393530 }, { - "epoch": 1.99, - "learning_rate": 2.1810091266377745e-06, - "loss": 0.0065, + "epoch": 1.02, + "learning_rate": 0.00014698313291738058, + "loss": 0.0121, "step": 393540 }, { - "epoch": 1.99, - "learning_rate": 2.1734414336237645e-06, - "loss": 0.007, + "epoch": 1.02, + "learning_rate": 0.0001469792447010091, + "loss": 0.0097, "step": 393550 }, { - "epoch": 1.99, - "learning_rate": 2.165873740609754e-06, - "loss": 0.007, + "epoch": 1.02, + "learning_rate": 0.00014697535648463763, + "loss": 0.0091, "step": 393560 }, { - "epoch": 1.99, - "learning_rate": 2.158306047595744e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014697146826826618, + "loss": 0.0121, "step": 393570 }, { - "epoch": 1.99, - "learning_rate": 2.1507383545817333e-06, - "loss": 0.0037, + "epoch": 1.02, + "learning_rate": 0.00014696758005189472, + "loss": 0.0107, "step": 393580 }, { - "epoch": 1.99, - "learning_rate": 2.143170661567723e-06, - "loss": 0.005, + "epoch": 1.02, + "learning_rate": 0.00014696369183552323, + "loss": 0.0153, "step": 393590 }, { - "epoch": 1.99, - "learning_rate": 2.1356029685537127e-06, - "loss": 0.0076, + "epoch": 1.02, + "learning_rate": 0.0001469598036191518, + "loss": 0.013, "step": 393600 }, { - "epoch": 1.99, - "learning_rate": 2.1280352755397022e-06, - "loss": 0.0066, + "epoch": 1.02, + "learning_rate": 0.00014695591540278032, + "loss": 0.013, "step": 393610 }, { - "epoch": 1.99, - "learning_rate": 2.120467582525692e-06, - "loss": 0.0054, + "epoch": 1.02, + "learning_rate": 0.00014695202718640886, + "loss": 0.0151, "step": 393620 }, { - "epoch": 1.99, - "learning_rate": 2.1128998895116816e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.0001469481389700374, + "loss": 0.0108, "step": 393630 }, { - "epoch": 1.99, - "learning_rate": 2.1053321964976716e-06, - "loss": 0.0085, + "epoch": 1.02, + "learning_rate": 0.00014694425075366594, + "loss": 0.0098, "step": 393640 }, { - "epoch": 1.99, - "learning_rate": 2.097764503483661e-06, - "loss": 0.0042, + "epoch": 1.02, + "learning_rate": 0.00014694036253729445, + "loss": 0.0117, "step": 393650 }, { - "epoch": 1.99, - "learning_rate": 2.090196810469651e-06, - "loss": 0.0063, + "epoch": 1.02, + "learning_rate": 0.000146936474320923, + "loss": 0.0129, "step": 393660 }, { - "epoch": 1.99, - "learning_rate": 2.0826291174556404e-06, - "loss": 0.0067, + "epoch": 1.02, + "learning_rate": 0.00014693258610455154, + "loss": 0.0129, "step": 393670 }, { - "epoch": 1.99, - "learning_rate": 2.0750614244416304e-06, - "loss": 0.0048, + "epoch": 1.02, + "learning_rate": 0.00014692869788818008, + "loss": 0.0133, "step": 393680 }, + { + "epoch": 1.02, + "learning_rate": 0.0001469248096718086, + "loss": 0.0107, + "step": 393690 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014692092145543714, + "loss": 0.0112, + "step": 393700 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014691703323906568, + "loss": 0.0129, + "step": 393710 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014691314502269422, + "loss": 0.01, + "step": 393720 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014690925680632273, + "loss": 0.0106, + "step": 393730 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014690536858995128, + "loss": 0.0106, + "step": 393740 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014690148037357982, + "loss": 0.0086, + "step": 393750 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014689759215720833, + "loss": 0.0109, + "step": 393760 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468937039408369, + "loss": 0.0121, + "step": 393770 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014688981572446541, + "loss": 0.0094, + "step": 393780 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014688592750809396, + "loss": 0.0123, + "step": 393790 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468820392917225, + "loss": 0.0116, + "step": 393800 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014687815107535104, + "loss": 0.0106, + "step": 393810 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014687426285897955, + "loss": 0.0104, + "step": 393820 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468703746426081, + "loss": 0.0098, + "step": 393830 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014686648642623664, + "loss": 0.0142, + "step": 393840 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014686259820986518, + "loss": 0.0129, + "step": 393850 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468587099934937, + "loss": 0.0133, + "step": 393860 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014685482177712224, + "loss": 0.0103, + "step": 393870 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014685093356075078, + "loss": 0.0097, + "step": 393880 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014684704534437932, + "loss": 0.0123, + "step": 393890 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014684315712800783, + "loss": 0.0089, + "step": 393900 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014683926891163637, + "loss": 0.0111, + "step": 393910 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014683538069526492, + "loss": 0.0102, + "step": 393920 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014683149247889346, + "loss": 0.0106, + "step": 393930 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014682760426252197, + "loss": 0.0149, + "step": 393940 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014682371604615054, + "loss": 0.0102, + "step": 393950 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014681982782977906, + "loss": 0.0166, + "step": 393960 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468159396134076, + "loss": 0.0136, + "step": 393970 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014681205139703614, + "loss": 0.0137, + "step": 393980 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014680816318066468, + "loss": 0.0101, + "step": 393990 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001468042749642932, + "loss": 0.0095, + "step": 394000 + }, + { + "epoch": 1.02, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.0077973357401788235, + "eval_runtime": 107.7965, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 394000 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014680038674792174, + "loss": 0.0125, + "step": 394010 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014679649853155028, + "loss": 0.0099, + "step": 394020 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001467926103151788, + "loss": 0.0104, + "step": 394030 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014678872209880733, + "loss": 0.0111, + "step": 394040 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014678483388243588, + "loss": 0.01, + "step": 394050 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014678094566606442, + "loss": 0.0101, + "step": 394060 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014677705744969293, + "loss": 0.0164, + "step": 394070 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014677316923332147, + "loss": 0.009, + "step": 394080 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014676928101695002, + "loss": 0.0151, + "step": 394090 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014676539280057856, + "loss": 0.0094, + "step": 394100 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014676150458420707, + "loss": 0.0092, + "step": 394110 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014675761636783564, + "loss": 0.0146, + "step": 394120 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014675372815146416, + "loss": 0.0123, + "step": 394130 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001467498399350927, + "loss": 0.017, + "step": 394140 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014674595171872124, + "loss": 0.012, + "step": 394150 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014674206350234978, + "loss": 0.0138, + "step": 394160 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001467381752859783, + "loss": 0.0136, + "step": 394170 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014673428706960684, + "loss": 0.0111, + "step": 394180 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014673039885323538, + "loss": 0.0125, + "step": 394190 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014672651063686392, + "loss": 0.0134, + "step": 394200 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014672262242049243, + "loss": 0.0101, + "step": 394210 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014671873420412098, + "loss": 0.0117, + "step": 394220 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014671484598774952, + "loss": 0.012, + "step": 394230 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014671095777137806, + "loss": 0.0093, + "step": 394240 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014670706955500657, + "loss": 0.0096, + "step": 394250 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014670318133863512, + "loss": 0.0127, + "step": 394260 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014669929312226366, + "loss": 0.0117, + "step": 394270 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014669540490589217, + "loss": 0.0114, + "step": 394280 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014669151668952074, + "loss": 0.0123, + "step": 394290 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014668762847314925, + "loss": 0.0125, + "step": 394300 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466837402567778, + "loss": 0.011, + "step": 394310 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014667985204040634, + "loss": 0.0126, + "step": 394320 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014667596382403488, + "loss": 0.0115, + "step": 394330 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466720756076634, + "loss": 0.0103, + "step": 394340 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014666818739129194, + "loss": 0.0133, + "step": 394350 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014666429917492048, + "loss": 0.0096, + "step": 394360 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014666041095854902, + "loss": 0.0133, + "step": 394370 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014665652274217753, + "loss": 0.0121, + "step": 394380 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014665263452580608, + "loss": 0.0149, + "step": 394390 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014664874630943462, + "loss": 0.0158, + "step": 394400 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014664485809306316, + "loss": 0.0102, + "step": 394410 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014664096987669167, + "loss": 0.01, + "step": 394420 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014663708166032021, + "loss": 0.0121, + "step": 394430 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014663319344394876, + "loss": 0.0092, + "step": 394440 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466293052275773, + "loss": 0.0124, + "step": 394450 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466254170112058, + "loss": 0.0126, + "step": 394460 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014662152879483438, + "loss": 0.0124, + "step": 394470 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466176405784629, + "loss": 0.0084, + "step": 394480 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014661375236209144, + "loss": 0.0112, + "step": 394490 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014660986414571998, + "loss": 0.0109, + "step": 394500 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001466059759293485, + "loss": 0.0112, + "step": 394510 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014660208771297704, + "loss": 0.012, + "step": 394520 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014659819949660558, + "loss": 0.0111, + "step": 394530 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014659431128023412, + "loss": 0.0095, + "step": 394540 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014659042306386263, + "loss": 0.0099, + "step": 394550 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014658653484749117, + "loss": 0.0102, + "step": 394560 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014658264663111972, + "loss": 0.0119, + "step": 394570 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014657875841474826, + "loss": 0.0127, + "step": 394580 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014657487019837677, + "loss": 0.0103, + "step": 394590 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014657098198200531, + "loss": 0.0109, + "step": 394600 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014656709376563386, + "loss": 0.0098, + "step": 394610 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465632055492624, + "loss": 0.0085, + "step": 394620 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001465593173328909, + "loss": 0.0109, + "step": 394630 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014655542911651948, + "loss": 0.0106, + "step": 394640 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146551540900148, + "loss": 0.0137, + "step": 394650 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014654765268377654, + "loss": 0.013, + "step": 394660 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014654376446740508, + "loss": 0.0112, + "step": 394670 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014653987625103362, + "loss": 0.0096, + "step": 394680 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014653598803466213, + "loss": 0.0127, + "step": 394690 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014653209981829068, + "loss": 0.0107, + "step": 394700 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014652821160191922, + "loss": 0.0119, + "step": 394710 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014652432338554776, + "loss": 0.018, + "step": 394720 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014652043516917627, + "loss": 0.0127, + "step": 394730 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014651654695280482, + "loss": 0.0165, + "step": 394740 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014651265873643336, + "loss": 0.013, + "step": 394750 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014650877052006187, + "loss": 0.0118, + "step": 394760 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014650488230369041, + "loss": 0.0146, + "step": 394770 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014650099408731896, + "loss": 0.0147, + "step": 394780 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464971058709475, + "loss": 0.009, + "step": 394790 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146493217654576, + "loss": 0.0119, + "step": 394800 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014648932943820458, + "loss": 0.0097, + "step": 394810 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464854412218331, + "loss": 0.0115, + "step": 394820 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014648155300546164, + "loss": 0.0144, + "step": 394830 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014647766478909018, + "loss": 0.0145, + "step": 394840 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014647377657271872, + "loss": 0.0078, + "step": 394850 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014646988835634723, + "loss": 0.0091, + "step": 394860 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014646600013997578, + "loss": 0.0113, + "step": 394870 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014646211192360432, + "loss": 0.0107, + "step": 394880 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014645822370723286, + "loss": 0.0121, + "step": 394890 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014645433549086137, + "loss": 0.0113, + "step": 394900 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014645044727448992, + "loss": 0.0122, + "step": 394910 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014644655905811846, + "loss": 0.0102, + "step": 394920 + }, + { + "epoch": 1.02, + "learning_rate": 0.000146442670841747, + "loss": 0.0107, + "step": 394930 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464387826253755, + "loss": 0.0129, + "step": 394940 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014643489440900405, + "loss": 0.0101, + "step": 394950 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464310061926326, + "loss": 0.0158, + "step": 394960 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014642711797626114, + "loss": 0.0127, + "step": 394970 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014642322975988965, + "loss": 0.0098, + "step": 394980 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001464193415435182, + "loss": 0.0129, + "step": 394990 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014641545332714674, + "loss": 0.0121, + "step": 395000 + }, + { + "epoch": 1.02, + "eval_cer": 0.8816970877754311, + "eval_loss": 0.007893171161413193, + "eval_runtime": 107.5146, + "eval_samples_per_second": 18.602, + "eval_steps_per_second": 4.651, + "step": 395000 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014641156511077528, + "loss": 0.0108, + "step": 395010 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014640767689440382, + "loss": 0.0098, + "step": 395020 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014640378867803233, + "loss": 0.0089, + "step": 395030 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014639990046166088, + "loss": 0.0092, + "step": 395040 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014639601224528942, + "loss": 0.0132, + "step": 395050 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014639212402891796, + "loss": 0.0141, + "step": 395060 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014638823581254647, + "loss": 0.0105, + "step": 395070 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014638434759617501, + "loss": 0.0146, + "step": 395080 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014638045937980356, + "loss": 0.0109, + "step": 395090 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463765711634321, + "loss": 0.0114, + "step": 395100 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463726829470606, + "loss": 0.0095, + "step": 395110 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014636879473068915, + "loss": 0.0136, + "step": 395120 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463649065143177, + "loss": 0.0113, + "step": 395130 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014636101829794624, + "loss": 0.0118, + "step": 395140 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014635713008157475, + "loss": 0.0162, + "step": 395150 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014635324186520332, + "loss": 0.0162, + "step": 395160 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014634935364883184, + "loss": 0.0122, + "step": 395170 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014634546543246038, + "loss": 0.0096, + "step": 395180 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014634157721608892, + "loss": 0.0144, + "step": 395190 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014633768899971746, + "loss": 0.012, + "step": 395200 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014633380078334597, + "loss": 0.0099, + "step": 395210 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014632991256697452, + "loss": 0.012, + "step": 395220 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014632602435060306, + "loss": 0.0088, + "step": 395230 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014632213613423157, + "loss": 0.0105, + "step": 395240 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014631824791786011, + "loss": 0.0104, + "step": 395250 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014631435970148866, + "loss": 0.0086, + "step": 395260 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463104714851172, + "loss": 0.011, + "step": 395270 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001463065832687457, + "loss": 0.0154, + "step": 395280 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014630269505237425, + "loss": 0.0138, + "step": 395290 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462988068360028, + "loss": 0.0148, + "step": 395300 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014629491861963134, + "loss": 0.0153, + "step": 395310 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014629103040325985, + "loss": 0.0109, + "step": 395320 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462871421868884, + "loss": 0.0106, + "step": 395330 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014628325397051693, + "loss": 0.0115, + "step": 395340 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014627936575414548, + "loss": 0.0157, + "step": 395350 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014627547753777402, + "loss": 0.0137, + "step": 395360 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014627158932140256, + "loss": 0.0135, + "step": 395370 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014626770110503107, + "loss": 0.0105, + "step": 395380 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014626381288865962, + "loss": 0.0096, + "step": 395390 + }, + { + "epoch": 1.02, + "learning_rate": 0.00014625992467228816, + "loss": 0.0081, + "step": 395400 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462560364559167, + "loss": 0.0107, + "step": 395410 + }, + { + "epoch": 1.02, + "learning_rate": 0.0001462521482395452, + "loss": 0.0096, + "step": 395420 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014624826002317376, + "loss": 0.0082, + "step": 395430 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001462443718068023, + "loss": 0.0105, + "step": 395440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014624048359043084, + "loss": 0.0102, + "step": 395450 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014623659537405935, + "loss": 0.0138, + "step": 395460 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001462327071576879, + "loss": 0.0094, + "step": 395470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014622881894131644, + "loss": 0.0124, + "step": 395480 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014622493072494495, + "loss": 0.0095, + "step": 395490 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001462210425085735, + "loss": 0.0096, + "step": 395500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014621715429220203, + "loss": 0.0096, + "step": 395510 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014621326607583058, + "loss": 0.0104, + "step": 395520 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001462093778594591, + "loss": 0.0123, + "step": 395530 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014620548964308766, + "loss": 0.0138, + "step": 395540 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014620160142671617, + "loss": 0.0106, + "step": 395550 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014619771321034472, + "loss": 0.0118, + "step": 395560 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014619382499397326, + "loss": 0.014, + "step": 395570 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461899367776018, + "loss": 0.0106, + "step": 395580 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461860485612303, + "loss": 0.0107, + "step": 395590 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014618216034485885, + "loss": 0.0124, + "step": 395600 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461782721284874, + "loss": 0.0123, + "step": 395610 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014617438391211594, + "loss": 0.0106, + "step": 395620 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014617049569574445, + "loss": 0.0124, + "step": 395630 + }, + { + "epoch": 1.03, + "learning_rate": 0.000146166607479373, + "loss": 0.0164, + "step": 395640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014616271926300154, + "loss": 0.0101, + "step": 395650 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014615883104663008, + "loss": 0.0131, + "step": 395660 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461549428302586, + "loss": 0.0108, + "step": 395670 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014615105461388716, + "loss": 0.0113, + "step": 395680 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014614716639751568, + "loss": 0.0154, + "step": 395690 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014614327818114422, + "loss": 0.0112, + "step": 395700 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014613938996477276, + "loss": 0.0126, + "step": 395710 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461355017484013, + "loss": 0.0123, + "step": 395720 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014613161353202981, + "loss": 0.0117, + "step": 395730 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014612772531565836, + "loss": 0.011, + "step": 395740 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461238370992869, + "loss": 0.0091, + "step": 395750 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461199488829154, + "loss": 0.0092, + "step": 395760 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014611606066654395, + "loss": 0.0135, + "step": 395770 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461121724501725, + "loss": 0.0143, + "step": 395780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014610828423380104, + "loss": 0.0124, + "step": 395790 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014610439601742955, + "loss": 0.0131, + "step": 395800 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001461005078010581, + "loss": 0.0164, + "step": 395810 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014609661958468664, + "loss": 0.0155, + "step": 395820 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014609273136831518, + "loss": 0.0131, + "step": 395830 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460888431519437, + "loss": 0.0121, + "step": 395840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014608495493557223, + "loss": 0.01, + "step": 395850 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014608106671920077, + "loss": 0.0124, + "step": 395860 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014607717850282932, + "loss": 0.0123, + "step": 395870 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014607329028645786, + "loss": 0.01, + "step": 395880 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460694020700864, + "loss": 0.012, + "step": 395890 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014606551385371491, + "loss": 0.0111, + "step": 395900 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014606162563734346, + "loss": 0.0118, + "step": 395910 + }, + { + "epoch": 1.03, + "learning_rate": 0.000146057737420972, + "loss": 0.0101, + "step": 395920 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014605384920460054, + "loss": 0.0133, + "step": 395930 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014604996098822905, + "loss": 0.0113, + "step": 395940 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460460727718576, + "loss": 0.011, + "step": 395950 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014604218455548614, + "loss": 0.0128, + "step": 395960 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014603829633911468, + "loss": 0.0113, + "step": 395970 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460344081227432, + "loss": 0.0113, + "step": 395980 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014603051990637173, + "loss": 0.011, + "step": 395990 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014602663169000028, + "loss": 0.0115, + "step": 396000 + }, + { + "epoch": 1.03, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.007747070398181677, + "eval_runtime": 107.5107, + "eval_samples_per_second": 18.603, + "eval_steps_per_second": 4.651, + "step": 396000 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460227434736288, + "loss": 0.0157, + "step": 396010 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014601885525725733, + "loss": 0.0104, + "step": 396020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014601496704088587, + "loss": 0.0117, + "step": 396030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014601107882451442, + "loss": 0.0098, + "step": 396040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014600719060814293, + "loss": 0.0116, + "step": 396050 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001460033023917715, + "loss": 0.0115, + "step": 396060 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459994141754, + "loss": 0.0131, + "step": 396070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014599552595902856, + "loss": 0.0111, + "step": 396080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459916377426571, + "loss": 0.0116, + "step": 396090 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014598774952628564, + "loss": 0.0098, + "step": 396100 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014598386130991415, + "loss": 0.0134, + "step": 396110 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459799730935427, + "loss": 0.0119, + "step": 396120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014597608487717124, + "loss": 0.0103, + "step": 396130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014597219666079978, + "loss": 0.0105, + "step": 396140 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459683084444283, + "loss": 0.0115, + "step": 396150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014596442022805683, + "loss": 0.0096, + "step": 396160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014596053201168538, + "loss": 0.0109, + "step": 396170 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014595664379531392, + "loss": 0.0099, + "step": 396180 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014595275557894243, + "loss": 0.0133, + "step": 396190 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145948867362571, + "loss": 0.0109, + "step": 396200 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014594497914619952, + "loss": 0.0121, + "step": 396210 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014594109092982806, + "loss": 0.0104, + "step": 396220 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459372027134566, + "loss": 0.0121, + "step": 396230 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459333144970851, + "loss": 0.0124, + "step": 396240 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014592942628071365, + "loss": 0.0104, + "step": 396250 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459255380643422, + "loss": 0.0087, + "step": 396260 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014592164984797074, + "loss": 0.0103, + "step": 396270 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014591776163159925, + "loss": 0.013, + "step": 396280 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459138734152278, + "loss": 0.0166, + "step": 396290 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014590998519885634, + "loss": 0.0096, + "step": 396300 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014590609698248488, + "loss": 0.0099, + "step": 396310 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001459022087661134, + "loss": 0.0163, + "step": 396320 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014589832054974193, + "loss": 0.0089, + "step": 396330 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014589443233337047, + "loss": 0.0099, + "step": 396340 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014589054411699902, + "loss": 0.0123, + "step": 396350 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014588665590062753, + "loss": 0.0176, + "step": 396360 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014588276768425607, + "loss": 0.0147, + "step": 396370 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014587887946788461, + "loss": 0.0138, + "step": 396380 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014587499125151316, + "loss": 0.01, + "step": 396390 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458711030351417, + "loss": 0.0144, + "step": 396400 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014586721481877024, + "loss": 0.0104, + "step": 396410 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014586332660239875, + "loss": 0.0119, + "step": 396420 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458594383860273, + "loss": 0.009, + "step": 396430 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014585555016965584, + "loss": 0.0163, + "step": 396440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014585166195328438, + "loss": 0.011, + "step": 396450 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458477737369129, + "loss": 0.0087, + "step": 396460 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014584388552054143, + "loss": 0.0124, + "step": 396470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014583999730416998, + "loss": 0.0108, + "step": 396480 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001458361090877985, + "loss": 0.013, + "step": 396490 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014583222087142703, + "loss": 0.0144, + "step": 396500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014582833265505557, + "loss": 0.0117, + "step": 396510 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014582444443868412, + "loss": 0.0139, + "step": 396520 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014582055622231263, + "loss": 0.0129, + "step": 396530 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014581666800594117, + "loss": 0.0093, + "step": 396540 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014581277978956971, + "loss": 0.0179, + "step": 396550 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014580889157319826, + "loss": 0.0099, + "step": 396560 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014580500335682677, + "loss": 0.0105, + "step": 396570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014580111514045534, + "loss": 0.011, + "step": 396580 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014579722692408385, + "loss": 0.0115, + "step": 396590 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457933387077124, + "loss": 0.0117, + "step": 396600 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014578945049134094, + "loss": 0.0092, + "step": 396610 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014578556227496948, + "loss": 0.0098, + "step": 396620 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145781674058598, + "loss": 0.0106, + "step": 396630 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014577778584222653, + "loss": 0.0104, + "step": 396640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014577389762585508, + "loss": 0.0118, + "step": 396650 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014577000940948362, + "loss": 0.012, + "step": 396660 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014576612119311213, + "loss": 0.0113, + "step": 396670 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014576223297674067, + "loss": 0.0112, + "step": 396680 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014575834476036922, + "loss": 0.0143, + "step": 396690 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014575445654399776, + "loss": 0.0091, + "step": 396700 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014575056832762627, + "loss": 0.0107, + "step": 396710 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457466801112548, + "loss": 0.013, + "step": 396720 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014574279189488335, + "loss": 0.0148, + "step": 396730 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014573890367851187, + "loss": 0.0124, + "step": 396740 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014573501546214044, + "loss": 0.0092, + "step": 396750 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014573112724576895, + "loss": 0.0105, + "step": 396760 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457272390293975, + "loss": 0.0115, + "step": 396770 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014572335081302604, + "loss": 0.009, + "step": 396780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014571946259665458, + "loss": 0.0101, + "step": 396790 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001457155743802831, + "loss": 0.0116, + "step": 396800 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014571168616391163, + "loss": 0.0097, + "step": 396810 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014570779794754018, + "loss": 0.0093, + "step": 396820 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014570390973116872, + "loss": 0.0121, + "step": 396830 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014570002151479723, + "loss": 0.0094, + "step": 396840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014569613329842577, + "loss": 0.0161, + "step": 396850 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014569224508205431, + "loss": 0.0121, + "step": 396860 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014568835686568286, + "loss": 0.0141, + "step": 396870 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014568446864931137, + "loss": 0.0156, + "step": 396880 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456805804329399, + "loss": 0.0107, + "step": 396890 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014567669221656845, + "loss": 0.0145, + "step": 396900 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145672804000197, + "loss": 0.0125, + "step": 396910 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456689157838255, + "loss": 0.011, + "step": 396920 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014566502756745408, + "loss": 0.0105, + "step": 396930 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456611393510826, + "loss": 0.0137, + "step": 396940 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014565725113471114, + "loss": 0.0119, + "step": 396950 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014565336291833968, + "loss": 0.0089, + "step": 396960 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014564947470196822, + "loss": 0.0124, + "step": 396970 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014564558648559673, + "loss": 0.0098, + "step": 396980 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014564169826922527, + "loss": 0.0139, + "step": 396990 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014563781005285382, + "loss": 0.0146, + "step": 397000 + }, + { + "epoch": 1.03, + "eval_cer": 0.8817628707113375, + "eval_loss": 0.0079797999933362, + "eval_runtime": 107.7727, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.639, + "step": 397000 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014563392183648233, + "loss": 0.0106, + "step": 397010 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014563003362011087, + "loss": 0.0102, + "step": 397020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014562614540373941, + "loss": 0.0144, + "step": 397030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014562225718736796, + "loss": 0.0096, + "step": 397040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014561836897099647, + "loss": 0.0112, + "step": 397050 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145614480754625, + "loss": 0.0101, + "step": 397060 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014561059253825355, + "loss": 0.0097, + "step": 397070 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456067043218821, + "loss": 0.0144, + "step": 397080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001456028161055106, + "loss": 0.0122, + "step": 397090 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014559892788913918, + "loss": 0.0098, + "step": 397100 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455950396727677, + "loss": 0.0112, + "step": 397110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014559115145639623, + "loss": 0.0129, + "step": 397120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014558726324002478, + "loss": 0.0112, + "step": 397130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014558337502365332, + "loss": 0.0094, + "step": 397140 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014557948680728183, + "loss": 0.0115, + "step": 397150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014557559859091037, + "loss": 0.0088, + "step": 397160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014557171037453892, + "loss": 0.0196, + "step": 397170 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014556782215816746, + "loss": 0.0154, + "step": 397180 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014556393394179597, + "loss": 0.0133, + "step": 397190 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014556004572542451, + "loss": 0.0134, + "step": 397200 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014555615750905306, + "loss": 0.0106, + "step": 397210 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014555226929268157, + "loss": 0.0135, + "step": 397220 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455483810763101, + "loss": 0.0116, + "step": 397230 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014554449285993865, + "loss": 0.0142, + "step": 397240 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455406046435672, + "loss": 0.0137, + "step": 397250 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455367164271957, + "loss": 0.0117, + "step": 397260 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014553282821082428, + "loss": 0.0137, + "step": 397270 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001455289399944528, + "loss": 0.0094, + "step": 397280 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014552505177808133, + "loss": 0.012, + "step": 397290 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014552116356170988, + "loss": 0.0093, + "step": 397300 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014551727534533842, + "loss": 0.0125, + "step": 397310 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014551338712896693, + "loss": 0.0097, + "step": 397320 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014550949891259547, + "loss": 0.0096, + "step": 397330 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014550561069622402, + "loss": 0.0122, + "step": 397340 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014550172247985256, + "loss": 0.0096, + "step": 397350 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014549783426348107, + "loss": 0.012, + "step": 397360 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454939460471096, + "loss": 0.0117, + "step": 397370 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014549005783073815, + "loss": 0.0176, + "step": 397380 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454861696143667, + "loss": 0.0084, + "step": 397390 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454822813979952, + "loss": 0.0077, + "step": 397400 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014547839318162375, + "loss": 0.0129, + "step": 397410 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454745049652523, + "loss": 0.0118, + "step": 397420 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014547061674888084, + "loss": 0.0101, + "step": 397430 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014546672853250935, + "loss": 0.0123, + "step": 397440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014546284031613792, + "loss": 0.0196, + "step": 397450 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014545895209976643, + "loss": 0.0125, + "step": 397460 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014545506388339498, + "loss": 0.0099, + "step": 397470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014545117566702352, + "loss": 0.0095, + "step": 397480 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014544728745065203, + "loss": 0.0112, + "step": 397490 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014544339923428057, + "loss": 0.0139, + "step": 397500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014543951101790911, + "loss": 0.0115, + "step": 397510 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014543562280153766, + "loss": 0.0089, + "step": 397520 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014543173458516617, + "loss": 0.0081, + "step": 397530 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454278463687947, + "loss": 0.0097, + "step": 397540 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014542395815242325, + "loss": 0.0095, + "step": 397550 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454200699360518, + "loss": 0.0124, + "step": 397560 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454161817196803, + "loss": 0.0132, + "step": 397570 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014541229350330885, + "loss": 0.0108, + "step": 397580 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001454084052869374, + "loss": 0.0162, + "step": 397590 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014540451707056594, + "loss": 0.0102, + "step": 397600 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014540062885419445, + "loss": 0.0128, + "step": 397610 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014539674063782302, + "loss": 0.0097, + "step": 397620 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014539285242145153, + "loss": 0.0111, + "step": 397630 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014538896420508007, + "loss": 0.0123, + "step": 397640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014538507598870862, + "loss": 0.0124, + "step": 397650 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014538118777233716, + "loss": 0.0096, + "step": 397660 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014537729955596567, + "loss": 0.0093, + "step": 397670 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014537341133959421, + "loss": 0.0138, + "step": 397680 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014536952312322276, + "loss": 0.0126, + "step": 397690 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453656349068513, + "loss": 0.0122, + "step": 397700 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453617466904798, + "loss": 0.0137, + "step": 397710 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014535785847410835, + "loss": 0.0134, + "step": 397720 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453539702577369, + "loss": 0.0135, + "step": 397730 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453500820413654, + "loss": 0.0128, + "step": 397740 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014534619382499395, + "loss": 0.0118, + "step": 397750 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001453423056086225, + "loss": 0.0126, + "step": 397760 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014533841739225103, + "loss": 0.0146, + "step": 397770 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014533452917587955, + "loss": 0.014, + "step": 397780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014533064095950812, + "loss": 0.0128, + "step": 397790 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014532675274313663, + "loss": 0.012, + "step": 397800 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014532286452676517, + "loss": 0.015, + "step": 397810 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014531897631039372, + "loss": 0.0157, + "step": 397820 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014531508809402226, + "loss": 0.0113, + "step": 397830 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014531119987765077, + "loss": 0.0119, + "step": 397840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014530731166127931, + "loss": 0.0112, + "step": 397850 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014530342344490786, + "loss": 0.0115, + "step": 397860 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452995352285364, + "loss": 0.013, + "step": 397870 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452956470121649, + "loss": 0.0126, + "step": 397880 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014529175879579345, + "loss": 0.012, + "step": 397890 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145287870579422, + "loss": 0.01, + "step": 397900 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014528398236305054, + "loss": 0.0119, + "step": 397910 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014528009414667905, + "loss": 0.0125, + "step": 397920 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452762059303076, + "loss": 0.0115, + "step": 397930 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014527231771393613, + "loss": 0.0134, + "step": 397940 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014526842949756468, + "loss": 0.0112, + "step": 397950 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452645412811932, + "loss": 0.0109, + "step": 397960 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014526065306482173, + "loss": 0.0136, + "step": 397970 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014525676484845027, + "loss": 0.0115, + "step": 397980 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014525287663207882, + "loss": 0.0101, + "step": 397990 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014524898841570736, + "loss": 0.012, + "step": 398000 + }, + { + "epoch": 1.03, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.007515719626098871, + "eval_runtime": 107.6857, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, + "step": 398000 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014524510019933587, + "loss": 0.0112, + "step": 398010 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452412119829644, + "loss": 0.01, + "step": 398020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014523732376659295, + "loss": 0.0098, + "step": 398030 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452334355502215, + "loss": 0.0124, + "step": 398040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014522954733385, + "loss": 0.011, + "step": 398050 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014522565911747855, + "loss": 0.0139, + "step": 398060 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452217709011071, + "loss": 0.0128, + "step": 398070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014521788268473564, + "loss": 0.011, + "step": 398080 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014521399446836415, + "loss": 0.0109, + "step": 398090 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001452101062519927, + "loss": 0.0123, + "step": 398100 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014520621803562123, + "loss": 0.0112, + "step": 398110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014520232981924978, + "loss": 0.0102, + "step": 398120 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451984416028783, + "loss": 0.0119, + "step": 398130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014519455338650686, + "loss": 0.0142, + "step": 398140 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014519066517013537, + "loss": 0.0117, + "step": 398150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014518677695376391, + "loss": 0.0111, + "step": 398160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014518288873739246, + "loss": 0.011, + "step": 398170 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145179000521021, + "loss": 0.0106, + "step": 398180 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451751123046495, + "loss": 0.0127, + "step": 398190 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014517122408827805, + "loss": 0.0103, + "step": 398200 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451673358719066, + "loss": 0.0116, + "step": 398210 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451634476555351, + "loss": 0.0123, + "step": 398220 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014515955943916365, + "loss": 0.0099, + "step": 398230 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451556712227922, + "loss": 0.0111, + "step": 398240 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014515178300642074, + "loss": 0.0095, + "step": 398250 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014514789479004925, + "loss": 0.0118, + "step": 398260 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451440065736778, + "loss": 0.0091, + "step": 398270 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014514011835730633, + "loss": 0.0126, + "step": 398280 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014513623014093487, + "loss": 0.0106, + "step": 398290 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451323419245634, + "loss": 0.0129, + "step": 398300 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014512845370819193, + "loss": 0.0118, + "step": 398310 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014512456549182047, + "loss": 0.0117, + "step": 398320 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014512067727544901, + "loss": 0.0117, + "step": 398330 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014511678905907756, + "loss": 0.0087, + "step": 398340 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451129008427061, + "loss": 0.0086, + "step": 398350 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451090126263346, + "loss": 0.0119, + "step": 398360 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014510512440996315, + "loss": 0.0105, + "step": 398370 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001451012361935917, + "loss": 0.0115, + "step": 398380 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014509734797722024, + "loss": 0.0101, + "step": 398390 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014509345976084875, + "loss": 0.0126, + "step": 398400 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450895715444773, + "loss": 0.0085, + "step": 398410 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014508568332810583, + "loss": 0.0099, + "step": 398420 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014508179511173438, + "loss": 0.0108, + "step": 398430 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450779068953629, + "loss": 0.0113, + "step": 398440 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014507401867899143, + "loss": 0.0125, + "step": 398450 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014507013046261997, + "loss": 0.0106, + "step": 398460 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450662422462485, + "loss": 0.0104, + "step": 398470 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014506235402987703, + "loss": 0.012, + "step": 398480 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014505846581350557, + "loss": 0.0142, + "step": 398490 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450545775971341, + "loss": 0.0114, + "step": 398500 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014505068938076263, + "loss": 0.0119, + "step": 398510 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450468011643912, + "loss": 0.0121, + "step": 398520 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450429129480197, + "loss": 0.0113, + "step": 398530 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014503902473164825, + "loss": 0.0129, + "step": 398540 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450351365152768, + "loss": 0.0125, + "step": 398550 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014503124829890534, + "loss": 0.0099, + "step": 398560 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014502736008253385, + "loss": 0.0119, + "step": 398570 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001450234718661624, + "loss": 0.0142, + "step": 398580 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014501958364979093, + "loss": 0.01, + "step": 398590 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014501569543341948, + "loss": 0.0131, + "step": 398600 + }, + { + "epoch": 1.03, + "learning_rate": 0.000145011807217048, + "loss": 0.0131, + "step": 398610 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014500791900067653, + "loss": 0.0114, + "step": 398620 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014500403078430507, + "loss": 0.0114, + "step": 398630 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014500014256793362, + "loss": 0.0098, + "step": 398640 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014499625435156213, + "loss": 0.0133, + "step": 398650 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449923661351907, + "loss": 0.013, + "step": 398660 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449884779188192, + "loss": 0.0106, + "step": 398670 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014498458970244775, + "loss": 0.0123, + "step": 398680 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449807014860763, + "loss": 0.0089, + "step": 398690 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014497681326970484, + "loss": 0.0132, + "step": 398700 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014497292505333335, + "loss": 0.0186, + "step": 398710 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449690368369619, + "loss": 0.0115, + "step": 398720 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014496514862059044, + "loss": 0.0127, + "step": 398730 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014496126040421895, + "loss": 0.011, + "step": 398740 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449573721878475, + "loss": 0.0147, + "step": 398750 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014495348397147603, + "loss": 0.0105, + "step": 398760 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014494959575510458, + "loss": 0.0102, + "step": 398770 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449457075387331, + "loss": 0.0102, + "step": 398780 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014494181932236163, + "loss": 0.0085, + "step": 398790 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014493793110599017, + "loss": 0.0149, + "step": 398800 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014493404288961871, + "loss": 0.0146, + "step": 398810 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014493015467324723, + "loss": 0.0116, + "step": 398820 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014492626645687577, + "loss": 0.01, + "step": 398830 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449223782405043, + "loss": 0.0092, + "step": 398840 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014491849002413285, + "loss": 0.0131, + "step": 398850 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001449146018077614, + "loss": 0.0103, + "step": 398860 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014491071359138994, + "loss": 0.0171, + "step": 398870 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014490682537501845, + "loss": 0.0115, + "step": 398880 + }, + { + "epoch": 1.03, + "learning_rate": 0.000144902937158647, + "loss": 0.012, + "step": 398890 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014489904894227554, + "loss": 0.0137, + "step": 398900 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014489516072590408, + "loss": 0.0117, + "step": 398910 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448912725095326, + "loss": 0.0114, + "step": 398920 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014488738429316113, + "loss": 0.0101, + "step": 398930 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014488349607678967, + "loss": 0.0084, + "step": 398940 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014487960786041822, + "loss": 0.011, + "step": 398950 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014487571964404673, + "loss": 0.0117, + "step": 398960 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014487183142767527, + "loss": 0.012, + "step": 398970 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014486794321130381, + "loss": 0.013, + "step": 398980 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014486405499493233, + "loss": 0.0093, + "step": 398990 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014486016677856087, + "loss": 0.0127, + "step": 399000 + }, + { + "epoch": 1.03, + "eval_cer": 0.881688689953826, + "eval_loss": 0.00787573866546154, + "eval_runtime": 107.4938, + "eval_samples_per_second": 18.606, + "eval_steps_per_second": 4.651, + "step": 399000 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448562785621894, + "loss": 0.01, + "step": 399010 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014485239034581795, + "loss": 0.0104, + "step": 399020 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014484850212944647, + "loss": 0.0176, + "step": 399030 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014484461391307504, + "loss": 0.0113, + "step": 399040 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014484072569670355, + "loss": 0.0124, + "step": 399050 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448368374803321, + "loss": 0.0111, + "step": 399060 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014483294926396063, + "loss": 0.0093, + "step": 399070 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014482906104758918, + "loss": 0.0124, + "step": 399080 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448251728312177, + "loss": 0.0113, + "step": 399090 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014482128461484623, + "loss": 0.0114, + "step": 399100 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014481739639847477, + "loss": 0.0141, + "step": 399110 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014481350818210332, + "loss": 0.0202, + "step": 399120 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014480961996573183, + "loss": 0.0132, + "step": 399130 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014480573174936037, + "loss": 0.017, + "step": 399140 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001448018435329889, + "loss": 0.0103, + "step": 399150 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014479795531661746, + "loss": 0.0122, + "step": 399160 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014479406710024597, + "loss": 0.0123, + "step": 399170 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001447901788838745, + "loss": 0.0104, + "step": 399180 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014478629066750305, + "loss": 0.0118, + "step": 399190 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001447824024511316, + "loss": 0.0107, + "step": 399200 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014477851423476014, + "loss": 0.0094, + "step": 399210 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014477462601838865, + "loss": 0.0131, + "step": 399220 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001447707378020172, + "loss": 0.0133, + "step": 399230 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014476684958564573, + "loss": 0.0155, + "step": 399240 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014476296136927428, + "loss": 0.0128, + "step": 399250 + }, + { + "epoch": 1.03, + "learning_rate": 0.0001447590731529028, + "loss": 0.0135, + "step": 399260 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014475518493653133, + "loss": 0.0159, + "step": 399270 + }, + { + "epoch": 1.03, + "learning_rate": 0.00014475129672015987, + "loss": 0.0115, + "step": 399280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014474740850378841, + "loss": 0.0098, + "step": 399290 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014474352028741693, + "loss": 0.0088, + "step": 399300 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014473963207104547, + "loss": 0.0103, + "step": 399310 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144735743854674, + "loss": 0.0176, + "step": 399320 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014473185563830255, + "loss": 0.0124, + "step": 399330 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014472796742193107, + "loss": 0.0111, + "step": 399340 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001447240792055596, + "loss": 0.0118, + "step": 399350 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014472019098918815, + "loss": 0.0105, + "step": 399360 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001447163027728167, + "loss": 0.0116, + "step": 399370 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014471241455644524, + "loss": 0.0103, + "step": 399380 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014470852634007378, + "loss": 0.0112, + "step": 399390 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001447046381237023, + "loss": 0.012, + "step": 399400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014470074990733083, + "loss": 0.0118, + "step": 399410 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014469686169095937, + "loss": 0.0126, + "step": 399420 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014469297347458792, + "loss": 0.0105, + "step": 399430 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014468908525821643, + "loss": 0.0108, + "step": 399440 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014468519704184497, + "loss": 0.0112, + "step": 399450 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014468130882547351, + "loss": 0.0143, + "step": 399460 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014467742060910203, + "loss": 0.0185, + "step": 399470 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014467353239273057, + "loss": 0.0149, + "step": 399480 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446696441763591, + "loss": 0.0129, + "step": 399490 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014466575595998765, + "loss": 0.0111, + "step": 399500 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014466186774361617, + "loss": 0.0136, + "step": 399510 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446579795272447, + "loss": 0.0133, + "step": 399520 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014465409131087325, + "loss": 0.0121, + "step": 399530 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446502030945018, + "loss": 0.0173, + "step": 399540 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446463148781303, + "loss": 0.0133, + "step": 399550 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014464242666175888, + "loss": 0.0104, + "step": 399560 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446385384453874, + "loss": 0.0134, + "step": 399570 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014463465022901593, + "loss": 0.0093, + "step": 399580 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014463076201264447, + "loss": 0.0128, + "step": 399590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014462687379627302, + "loss": 0.0131, + "step": 399600 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014462298557990153, + "loss": 0.0138, + "step": 399610 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014461909736353007, + "loss": 0.0101, + "step": 399620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014461520914715861, + "loss": 0.0103, + "step": 399630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014461132093078716, + "loss": 0.0118, + "step": 399640 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014460743271441567, + "loss": 0.0117, + "step": 399650 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001446035444980442, + "loss": 0.013, + "step": 399660 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014459965628167275, + "loss": 0.0128, + "step": 399670 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445957680653013, + "loss": 0.0114, + "step": 399680 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445918798489298, + "loss": 0.0102, + "step": 399690 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014458799163255835, + "loss": 0.0138, + "step": 399700 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445841034161869, + "loss": 0.0111, + "step": 399710 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445802151998154, + "loss": 0.0146, + "step": 399720 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014457632698344398, + "loss": 0.0144, + "step": 399730 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445724387670725, + "loss": 0.0138, + "step": 399740 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014456855055070103, + "loss": 0.0107, + "step": 399750 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014456466233432957, + "loss": 0.0125, + "step": 399760 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014456077411795812, + "loss": 0.0122, + "step": 399770 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014455688590158663, + "loss": 0.0127, + "step": 399780 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014455299768521517, + "loss": 0.009, + "step": 399790 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445491094688437, + "loss": 0.0102, + "step": 399800 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014454522125247225, + "loss": 0.0122, + "step": 399810 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014454133303610077, + "loss": 0.0112, + "step": 399820 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445374448197293, + "loss": 0.0138, + "step": 399830 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014453355660335785, + "loss": 0.0135, + "step": 399840 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445296683869864, + "loss": 0.0162, + "step": 399850 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001445257801706149, + "loss": 0.0101, + "step": 399860 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014452189195424345, + "loss": 0.0126, + "step": 399870 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144518003737872, + "loss": 0.0135, + "step": 399880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014451411552150053, + "loss": 0.0116, + "step": 399890 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014451022730512905, + "loss": 0.0154, + "step": 399900 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014450633908875762, + "loss": 0.0142, + "step": 399910 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014450245087238613, + "loss": 0.0149, + "step": 399920 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014449856265601467, + "loss": 0.0517, + "step": 399930 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014449467443964321, + "loss": 0.0142, + "step": 399940 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014449078622327173, + "loss": 0.0147, + "step": 399950 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014448689800690027, + "loss": 0.0106, + "step": 399960 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444830097905288, + "loss": 0.0115, + "step": 399970 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014447912157415735, + "loss": 0.0116, + "step": 399980 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014447523335778587, + "loss": 0.0112, + "step": 399990 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444713451414144, + "loss": 0.0136, + "step": 400000 + }, + { + "epoch": 1.04, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.007727402728050947, + "eval_runtime": 107.7237, + "eval_samples_per_second": 18.566, + "eval_steps_per_second": 4.642, + "step": 400000 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014446745692504295, + "loss": 0.0131, + "step": 400010 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444635687086715, + "loss": 0.0137, + "step": 400020 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444596804923, + "loss": 0.0108, + "step": 400030 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014445579227592855, + "loss": 0.0106, + "step": 400040 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444519040595571, + "loss": 0.0098, + "step": 400050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014444801584318563, + "loss": 0.0097, + "step": 400060 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014444412762681415, + "loss": 0.0143, + "step": 400070 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014444023941044272, + "loss": 0.0122, + "step": 400080 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014443635119407123, + "loss": 0.0131, + "step": 400090 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014443246297769977, + "loss": 0.0135, + "step": 400100 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014442857476132831, + "loss": 0.0105, + "step": 400110 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014442468654495686, + "loss": 0.0139, + "step": 400120 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014442079832858537, + "loss": 0.0162, + "step": 400130 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444169101122139, + "loss": 0.0137, + "step": 400140 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014441302189584245, + "loss": 0.0119, + "step": 400150 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144409133679471, + "loss": 0.0113, + "step": 400160 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001444052454630995, + "loss": 0.0127, + "step": 400170 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014440135724672805, + "loss": 0.0168, + "step": 400180 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443974690303566, + "loss": 0.0116, + "step": 400190 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443935808139851, + "loss": 0.011, + "step": 400200 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014438969259761365, + "loss": 0.0097, + "step": 400210 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443858043812422, + "loss": 0.012, + "step": 400220 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014438191616487073, + "loss": 0.0111, + "step": 400230 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014437802794849925, + "loss": 0.0112, + "step": 400240 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014437413973212782, + "loss": 0.0092, + "step": 400250 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014437025151575633, + "loss": 0.0112, + "step": 400260 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014436636329938487, + "loss": 0.015, + "step": 400270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014436247508301341, + "loss": 0.0114, + "step": 400280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014435858686664196, + "loss": 0.0124, + "step": 400290 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014435469865027047, + "loss": 0.0116, + "step": 400300 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144350810433899, + "loss": 0.0166, + "step": 400310 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014434692221752755, + "loss": 0.0101, + "step": 400320 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443430340011561, + "loss": 0.0121, + "step": 400330 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443391457847846, + "loss": 0.0088, + "step": 400340 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014433525756841315, + "loss": 0.0091, + "step": 400350 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443313693520417, + "loss": 0.0121, + "step": 400360 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014432748113567023, + "loss": 0.0117, + "step": 400370 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014432359291929875, + "loss": 0.0122, + "step": 400380 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443197047029273, + "loss": 0.0096, + "step": 400390 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014431581648655583, + "loss": 0.0109, + "step": 400400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014431192827018437, + "loss": 0.0113, + "step": 400410 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001443080400538129, + "loss": 0.0111, + "step": 400420 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014430415183744146, + "loss": 0.0133, + "step": 400430 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014430026362106997, + "loss": 0.0129, + "step": 400440 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442963754046985, + "loss": 0.0127, + "step": 400450 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014429248718832705, + "loss": 0.0137, + "step": 400460 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014428859897195557, + "loss": 0.01, + "step": 400470 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442847107555841, + "loss": 0.0116, + "step": 400480 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014428082253921265, + "loss": 0.0105, + "step": 400490 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442769343228412, + "loss": 0.0146, + "step": 400500 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442730461064697, + "loss": 0.0099, + "step": 400510 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014426915789009825, + "loss": 0.0084, + "step": 400520 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442652696737268, + "loss": 0.0107, + "step": 400530 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014426138145735533, + "loss": 0.0099, + "step": 400540 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014425749324098385, + "loss": 0.0098, + "step": 400550 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442536050246124, + "loss": 0.0087, + "step": 400560 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014424971680824093, + "loss": 0.0093, + "step": 400570 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014424582859186947, + "loss": 0.0104, + "step": 400580 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144241940375498, + "loss": 0.0126, + "step": 400590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014423805215912656, + "loss": 0.0133, + "step": 400600 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014423416394275507, + "loss": 0.0099, + "step": 400610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442302757263836, + "loss": 0.0108, + "step": 400620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014422638751001215, + "loss": 0.0114, + "step": 400630 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442224992936407, + "loss": 0.0115, + "step": 400640 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442186110772692, + "loss": 0.0129, + "step": 400650 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014421472286089775, + "loss": 0.0108, + "step": 400660 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001442108346445263, + "loss": 0.0133, + "step": 400670 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014420694642815484, + "loss": 0.0108, + "step": 400680 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014420305821178335, + "loss": 0.0135, + "step": 400690 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441991699954119, + "loss": 0.0141, + "step": 400700 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014419528177904043, + "loss": 0.0151, + "step": 400710 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014419139356266895, + "loss": 0.0105, + "step": 400720 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441875053462975, + "loss": 0.0132, + "step": 400730 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014418361712992603, + "loss": 0.0124, + "step": 400740 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014417972891355457, + "loss": 0.0133, + "step": 400750 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441758406971831, + "loss": 0.0147, + "step": 400760 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014417195248081163, + "loss": 0.0129, + "step": 400770 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014416806426444017, + "loss": 0.0116, + "step": 400780 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441641760480687, + "loss": 0.0113, + "step": 400790 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014416028783169725, + "loss": 0.0113, + "step": 400800 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441563996153258, + "loss": 0.0108, + "step": 400810 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441525113989543, + "loss": 0.0157, + "step": 400820 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014414862318258285, + "loss": 0.0129, + "step": 400830 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441447349662114, + "loss": 0.0138, + "step": 400840 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014414084674983993, + "loss": 0.0116, + "step": 400850 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014413695853346845, + "loss": 0.0175, + "step": 400860 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144133070317097, + "loss": 0.014, + "step": 400870 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014412918210072553, + "loss": 0.0163, + "step": 400880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014412529388435407, + "loss": 0.0134, + "step": 400890 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001441214056679826, + "loss": 0.0128, + "step": 400900 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014411751745161113, + "loss": 0.0103, + "step": 400910 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014411362923523967, + "loss": 0.011, + "step": 400920 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014410974101886821, + "loss": 0.0121, + "step": 400930 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014410585280249673, + "loss": 0.0134, + "step": 400940 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014410196458612527, + "loss": 0.0096, + "step": 400950 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440980763697538, + "loss": 0.0099, + "step": 400960 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014409418815338233, + "loss": 0.0106, + "step": 400970 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440902999370109, + "loss": 0.0157, + "step": 400980 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440864117206394, + "loss": 0.0118, + "step": 400990 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014408252350426795, + "loss": 0.0129, + "step": 401000 + }, + { + "epoch": 1.04, + "eval_cer": 0.8817012866862336, + "eval_loss": 0.0077420733869075775, + "eval_runtime": 107.3386, + "eval_samples_per_second": 18.633, + "eval_steps_per_second": 4.658, + "step": 401000 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440786352878965, + "loss": 0.0098, + "step": 401010 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014407474707152503, + "loss": 0.0108, + "step": 401020 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014407085885515355, + "loss": 0.0123, + "step": 401030 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440669706387821, + "loss": 0.0113, + "step": 401040 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014406308242241063, + "loss": 0.0136, + "step": 401050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014405919420603917, + "loss": 0.0139, + "step": 401060 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440553059896677, + "loss": 0.012, + "step": 401070 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014405141777329623, + "loss": 0.0114, + "step": 401080 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014404752955692477, + "loss": 0.0121, + "step": 401090 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440436413405533, + "loss": 0.0103, + "step": 401100 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014403975312418183, + "loss": 0.0108, + "step": 401110 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440358649078104, + "loss": 0.0104, + "step": 401120 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440319766914389, + "loss": 0.0106, + "step": 401130 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014402808847506745, + "loss": 0.0133, + "step": 401140 + }, + { + "epoch": 1.04, + "learning_rate": 0.000144024200258696, + "loss": 0.0123, + "step": 401150 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014402031204232454, + "loss": 0.0206, + "step": 401160 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014401642382595305, + "loss": 0.0103, + "step": 401170 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440125356095816, + "loss": 0.0095, + "step": 401180 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014400864739321013, + "loss": 0.011, + "step": 401190 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014400475917683865, + "loss": 0.0082, + "step": 401200 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001440008709604672, + "loss": 0.0112, + "step": 401210 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014399698274409573, + "loss": 0.0095, + "step": 401220 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014399309452772427, + "loss": 0.0129, + "step": 401230 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439892063113528, + "loss": 0.0135, + "step": 401240 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014398531809498133, + "loss": 0.0107, + "step": 401250 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014398142987860987, + "loss": 0.0108, + "step": 401260 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439775416622384, + "loss": 0.0103, + "step": 401270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014397365344586693, + "loss": 0.0128, + "step": 401280 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014396976522949547, + "loss": 0.0114, + "step": 401290 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143965877013124, + "loss": 0.0121, + "step": 401300 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014396198879675255, + "loss": 0.013, + "step": 401310 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439581005803811, + "loss": 0.01, + "step": 401320 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014395421236400964, + "loss": 0.0081, + "step": 401330 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014395032414763815, + "loss": 0.0107, + "step": 401340 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439464359312667, + "loss": 0.01, + "step": 401350 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014394254771489523, + "loss": 0.0113, + "step": 401360 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014393865949852377, + "loss": 0.0146, + "step": 401370 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439347712821523, + "loss": 0.0116, + "step": 401380 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014393088306578083, + "loss": 0.014, + "step": 401390 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014392699484940937, + "loss": 0.0109, + "step": 401400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014392310663303791, + "loss": 0.0094, + "step": 401410 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014391921841666643, + "loss": 0.015, + "step": 401420 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014391533020029497, + "loss": 0.0135, + "step": 401430 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001439114419839235, + "loss": 0.0099, + "step": 401440 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014390755376755203, + "loss": 0.014, + "step": 401450 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014390366555118057, + "loss": 0.015, + "step": 401460 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438997773348091, + "loss": 0.0126, + "step": 401470 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014389588911843765, + "loss": 0.0114, + "step": 401480 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014389200090206617, + "loss": 0.0104, + "step": 401490 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014388811268569473, + "loss": 0.0112, + "step": 401500 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014388422446932325, + "loss": 0.0114, + "step": 401510 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438803362529518, + "loss": 0.0129, + "step": 401520 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014387644803658033, + "loss": 0.0089, + "step": 401530 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014387255982020887, + "loss": 0.0103, + "step": 401540 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438686716038374, + "loss": 0.0138, + "step": 401550 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014386478338746593, + "loss": 0.0084, + "step": 401560 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014386089517109447, + "loss": 0.0115, + "step": 401570 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143857006954723, + "loss": 0.0097, + "step": 401580 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014385311873835153, + "loss": 0.0126, + "step": 401590 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014384923052198007, + "loss": 0.0129, + "step": 401600 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438453423056086, + "loss": 0.0109, + "step": 401610 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014384145408923715, + "loss": 0.0107, + "step": 401620 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014383756587286567, + "loss": 0.0112, + "step": 401630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014383367765649424, + "loss": 0.0111, + "step": 401640 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014382978944012275, + "loss": 0.0135, + "step": 401650 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438259012237513, + "loss": 0.0098, + "step": 401660 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014382201300737983, + "loss": 0.0123, + "step": 401670 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014381812479100838, + "loss": 0.0112, + "step": 401680 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438142365746369, + "loss": 0.0154, + "step": 401690 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014381034835826543, + "loss": 0.0111, + "step": 401700 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014380646014189397, + "loss": 0.0135, + "step": 401710 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001438025719255225, + "loss": 0.0096, + "step": 401720 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014379868370915103, + "loss": 0.0123, + "step": 401730 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014379479549277957, + "loss": 0.0127, + "step": 401740 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437909072764081, + "loss": 0.0118, + "step": 401750 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014378701906003663, + "loss": 0.0143, + "step": 401760 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014378313084366517, + "loss": 0.0123, + "step": 401770 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437792426272937, + "loss": 0.0115, + "step": 401780 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014377535441092225, + "loss": 0.0145, + "step": 401790 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014377146619455077, + "loss": 0.0107, + "step": 401800 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437675779781793, + "loss": 0.0092, + "step": 401810 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014376368976180785, + "loss": 0.0133, + "step": 401820 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437598015454364, + "loss": 0.0115, + "step": 401830 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014375591332906493, + "loss": 0.0125, + "step": 401840 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014375202511269348, + "loss": 0.0126, + "step": 401850 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143748136896322, + "loss": 0.0159, + "step": 401860 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014374424867995053, + "loss": 0.0106, + "step": 401870 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014374036046357907, + "loss": 0.0127, + "step": 401880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014373647224720761, + "loss": 0.0112, + "step": 401890 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014373258403083613, + "loss": 0.0127, + "step": 401900 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014372869581446467, + "loss": 0.0109, + "step": 401910 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437248075980932, + "loss": 0.0124, + "step": 401920 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014372091938172175, + "loss": 0.0147, + "step": 401930 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014371703116535027, + "loss": 0.0097, + "step": 401940 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437131429489788, + "loss": 0.0152, + "step": 401950 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014370925473260735, + "loss": 0.0126, + "step": 401960 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014370536651623587, + "loss": 0.0107, + "step": 401970 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001437014782998644, + "loss": 0.0108, + "step": 401980 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014369759008349295, + "loss": 0.0128, + "step": 401990 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436937018671215, + "loss": 0.0132, + "step": 402000 + }, + { + "epoch": 1.04, + "eval_cer": 0.8817012866862336, + "eval_loss": 0.007718118838965893, + "eval_runtime": 107.504, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, + "step": 402000 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014368981365075, + "loss": 0.0112, + "step": 402010 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014368592543437857, + "loss": 0.0122, + "step": 402020 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436820372180071, + "loss": 0.0119, + "step": 402030 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014367814900163563, + "loss": 0.0127, + "step": 402040 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014367426078526417, + "loss": 0.015, + "step": 402050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014367037256889271, + "loss": 0.0107, + "step": 402060 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014366648435252123, + "loss": 0.0101, + "step": 402070 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014366259613614977, + "loss": 0.0134, + "step": 402080 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436587079197783, + "loss": 0.0112, + "step": 402090 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014365481970340685, + "loss": 0.0122, + "step": 402100 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014365093148703537, + "loss": 0.0117, + "step": 402110 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436470432706639, + "loss": 0.0133, + "step": 402120 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014364315505429245, + "loss": 0.0239, + "step": 402130 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143639266837921, + "loss": 0.0099, + "step": 402140 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436353786215495, + "loss": 0.0097, + "step": 402150 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014363149040517805, + "loss": 0.0091, + "step": 402160 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436276021888066, + "loss": 0.013, + "step": 402170 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014362371397243513, + "loss": 0.0135, + "step": 402180 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014361982575606367, + "loss": 0.0119, + "step": 402190 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436159375396922, + "loss": 0.0097, + "step": 402200 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014361204932332073, + "loss": 0.0092, + "step": 402210 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014360816110694927, + "loss": 0.0136, + "step": 402220 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001436042728905778, + "loss": 0.0113, + "step": 402230 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014360038467420633, + "loss": 0.0137, + "step": 402240 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014359649645783487, + "loss": 0.0137, + "step": 402250 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435926082414634, + "loss": 0.0111, + "step": 402260 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014358872002509195, + "loss": 0.0108, + "step": 402270 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014358483180872047, + "loss": 0.0128, + "step": 402280 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143580943592349, + "loss": 0.0156, + "step": 402290 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014357705537597755, + "loss": 0.0102, + "step": 402300 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435731671596061, + "loss": 0.01, + "step": 402310 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435692789432346, + "loss": 0.011, + "step": 402320 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014356539072686315, + "loss": 0.0101, + "step": 402330 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435615025104917, + "loss": 0.0103, + "step": 402340 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014355761429412023, + "loss": 0.0121, + "step": 402350 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014355372607774875, + "loss": 0.011, + "step": 402360 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014354983786137731, + "loss": 0.0209, + "step": 402370 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014354594964500583, + "loss": 0.0137, + "step": 402380 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014354206142863437, + "loss": 0.012, + "step": 402390 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435381732122629, + "loss": 0.0121, + "step": 402400 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014353428499589145, + "loss": 0.0219, + "step": 402410 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014353039677951997, + "loss": 0.0112, + "step": 402420 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435265085631485, + "loss": 0.0123, + "step": 402430 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014352262034677705, + "loss": 0.0112, + "step": 402440 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014351873213040557, + "loss": 0.0095, + "step": 402450 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435148439140341, + "loss": 0.0113, + "step": 402460 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014351095569766265, + "loss": 0.0094, + "step": 402470 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435070674812912, + "loss": 0.0114, + "step": 402480 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001435031792649197, + "loss": 0.0123, + "step": 402490 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014349929104854825, + "loss": 0.0138, + "step": 402500 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434954028321768, + "loss": 0.0132, + "step": 402510 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014349151461580533, + "loss": 0.0116, + "step": 402520 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014348762639943385, + "loss": 0.0112, + "step": 402530 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014348373818306241, + "loss": 0.0109, + "step": 402540 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014347984996669093, + "loss": 0.0109, + "step": 402550 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014347596175031947, + "loss": 0.0104, + "step": 402560 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143472073533948, + "loss": 0.0093, + "step": 402570 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014346818531757655, + "loss": 0.0096, + "step": 402580 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014346429710120507, + "loss": 0.0094, + "step": 402590 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434604088848336, + "loss": 0.0146, + "step": 402600 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014345652066846215, + "loss": 0.0145, + "step": 402610 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434526324520907, + "loss": 0.0116, + "step": 402620 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434487442357192, + "loss": 0.0107, + "step": 402630 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014344485601934775, + "loss": 0.0143, + "step": 402640 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434409678029763, + "loss": 0.0097, + "step": 402650 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014343707958660483, + "loss": 0.0109, + "step": 402660 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014343319137023335, + "loss": 0.0112, + "step": 402670 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434293031538619, + "loss": 0.0098, + "step": 402680 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014342541493749043, + "loss": 0.011, + "step": 402690 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014342152672111895, + "loss": 0.0111, + "step": 402700 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014341763850474751, + "loss": 0.0112, + "step": 402710 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014341375028837603, + "loss": 0.008, + "step": 402720 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014340986207200457, + "loss": 0.0117, + "step": 402730 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001434059738556331, + "loss": 0.013, + "step": 402740 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014340208563926165, + "loss": 0.0099, + "step": 402750 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014339819742289017, + "loss": 0.0122, + "step": 402760 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433943092065187, + "loss": 0.0108, + "step": 402770 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014339042099014725, + "loss": 0.0102, + "step": 402780 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433865327737758, + "loss": 0.0122, + "step": 402790 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433826445574043, + "loss": 0.013, + "step": 402800 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014337875634103285, + "loss": 0.0122, + "step": 402810 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433748681246614, + "loss": 0.0118, + "step": 402820 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014337097990828993, + "loss": 0.0103, + "step": 402830 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014336709169191845, + "loss": 0.0136, + "step": 402840 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143363203475547, + "loss": 0.0106, + "step": 402850 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014335931525917553, + "loss": 0.0115, + "step": 402860 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014335542704280407, + "loss": 0.0117, + "step": 402870 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014335153882643259, + "loss": 0.0158, + "step": 402880 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014334765061006115, + "loss": 0.0115, + "step": 402890 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014334376239368967, + "loss": 0.0135, + "step": 402900 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433398741773182, + "loss": 0.0132, + "step": 402910 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014333598596094675, + "loss": 0.0134, + "step": 402920 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014333209774457527, + "loss": 0.0124, + "step": 402930 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433282095282038, + "loss": 0.0178, + "step": 402940 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014332432131183235, + "loss": 0.0131, + "step": 402950 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433204330954609, + "loss": 0.0136, + "step": 402960 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433165448790894, + "loss": 0.0152, + "step": 402970 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014331265666271795, + "loss": 0.012, + "step": 402980 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001433087684463465, + "loss": 0.0107, + "step": 402990 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014330488022997503, + "loss": 0.0077, + "step": 403000 + }, + { + "epoch": 1.04, + "eval_cer": 0.8816970877754311, + "eval_loss": 0.007720929104834795, + "eval_runtime": 107.8049, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, + "step": 403000 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014330099201360355, + "loss": 0.0107, + "step": 403010 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432971037972321, + "loss": 0.0111, + "step": 403020 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014329321558086063, + "loss": 0.0138, + "step": 403030 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014328932736448917, + "loss": 0.008, + "step": 403040 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014328543914811769, + "loss": 0.0087, + "step": 403050 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014328155093174625, + "loss": 0.0101, + "step": 403060 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014327766271537477, + "loss": 0.0132, + "step": 403070 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432737744990033, + "loss": 0.0115, + "step": 403080 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014326988628263185, + "loss": 0.0084, + "step": 403090 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432659980662604, + "loss": 0.0103, + "step": 403100 + }, + { + "epoch": 1.04, + "learning_rate": 0.0001432621098498889, + "loss": 0.0095, + "step": 403110 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014325822163351745, + "loss": 0.0136, + "step": 403120 + }, + { + "epoch": 1.04, + "learning_rate": 0.000143254333417146, + "loss": 0.0102, + "step": 403130 + }, + { + "epoch": 1.04, + "learning_rate": 0.00014325044520077453, + "loss": 0.0103, + "step": 403140 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014324655698440305, + "loss": 0.0094, + "step": 403150 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001432426687680316, + "loss": 0.0145, + "step": 403160 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014323878055166013, + "loss": 0.0154, + "step": 403170 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014323489233528865, + "loss": 0.0099, + "step": 403180 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001432310041189172, + "loss": 0.0122, + "step": 403190 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014322711590254573, + "loss": 0.0112, + "step": 403200 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014322322768617427, + "loss": 0.0112, + "step": 403210 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014321933946980278, + "loss": 0.0108, + "step": 403220 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014321545125343135, + "loss": 0.0093, + "step": 403230 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014321156303705987, + "loss": 0.0107, + "step": 403240 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001432076748206884, + "loss": 0.0107, + "step": 403250 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014320378660431695, + "loss": 0.0104, + "step": 403260 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431998983879455, + "loss": 0.0138, + "step": 403270 + }, + { + "epoch": 1.05, + "learning_rate": 0.000143196010171574, + "loss": 0.0144, + "step": 403280 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014319212195520255, + "loss": 0.014, + "step": 403290 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431882337388311, + "loss": 0.0103, + "step": 403300 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014318434552245963, + "loss": 0.0149, + "step": 403310 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014318045730608815, + "loss": 0.0101, + "step": 403320 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431765690897167, + "loss": 0.0097, + "step": 403330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014317268087334523, + "loss": 0.0112, + "step": 403340 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014316879265697377, + "loss": 0.0095, + "step": 403350 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431649044406023, + "loss": 0.0108, + "step": 403360 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014316101622423083, + "loss": 0.0119, + "step": 403370 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014315712800785937, + "loss": 0.0129, + "step": 403380 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431532397914879, + "loss": 0.0144, + "step": 403390 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014314935157511643, + "loss": 0.0113, + "step": 403400 + }, + { + "epoch": 1.05, + "learning_rate": 0.000143145463358745, + "loss": 0.0107, + "step": 403410 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431415751423735, + "loss": 0.0126, + "step": 403420 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014313768692600205, + "loss": 0.0111, + "step": 403430 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431337987096306, + "loss": 0.0306, + "step": 403440 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431299104932591, + "loss": 0.0085, + "step": 403450 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014312602227688765, + "loss": 0.0121, + "step": 403460 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431221340605162, + "loss": 0.0107, + "step": 403470 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014311824584414473, + "loss": 0.01, + "step": 403480 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014311435762777325, + "loss": 0.0124, + "step": 403490 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001431104694114018, + "loss": 0.0091, + "step": 403500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014310658119503033, + "loss": 0.013, + "step": 403510 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014310269297865887, + "loss": 0.0111, + "step": 403520 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014309880476228739, + "loss": 0.0124, + "step": 403530 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014309491654591593, + "loss": 0.0106, + "step": 403540 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014309102832954447, + "loss": 0.0112, + "step": 403550 + }, + { + "epoch": 1.05, + "learning_rate": 0.000143087140113173, + "loss": 0.0156, + "step": 403560 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014308325189680153, + "loss": 0.013, + "step": 403570 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430793636804301, + "loss": 0.0094, + "step": 403580 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430754754640586, + "loss": 0.0148, + "step": 403590 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014307158724768715, + "loss": 0.0122, + "step": 403600 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430676990313157, + "loss": 0.0107, + "step": 403610 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014306381081494423, + "loss": 0.0131, + "step": 403620 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014305992259857275, + "loss": 0.0102, + "step": 403630 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430560343822013, + "loss": 0.0103, + "step": 403640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014305214616582983, + "loss": 0.0129, + "step": 403650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014304825794945837, + "loss": 0.0125, + "step": 403660 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430443697330869, + "loss": 0.0111, + "step": 403670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014304048151671543, + "loss": 0.009, + "step": 403680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014303659330034397, + "loss": 0.0108, + "step": 403690 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014303270508397249, + "loss": 0.0211, + "step": 403700 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014302881686760103, + "loss": 0.0147, + "step": 403710 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014302492865122957, + "loss": 0.0113, + "step": 403720 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430210404348581, + "loss": 0.01, + "step": 403730 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014301715221848662, + "loss": 0.01, + "step": 403740 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014301326400211517, + "loss": 0.0126, + "step": 403750 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430093757857437, + "loss": 0.0145, + "step": 403760 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014300548756937225, + "loss": 0.0125, + "step": 403770 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001430015993530008, + "loss": 0.0131, + "step": 403780 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014299771113662933, + "loss": 0.0109, + "step": 403790 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014299382292025785, + "loss": 0.0162, + "step": 403800 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429899347038864, + "loss": 0.0147, + "step": 403810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014298604648751493, + "loss": 0.0132, + "step": 403820 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014298215827114347, + "loss": 0.012, + "step": 403830 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142978270054772, + "loss": 0.0087, + "step": 403840 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014297438183840053, + "loss": 0.0114, + "step": 403850 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014297049362202907, + "loss": 0.0104, + "step": 403860 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429666054056576, + "loss": 0.0109, + "step": 403870 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014296271718928613, + "loss": 0.0106, + "step": 403880 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014295882897291467, + "loss": 0.0103, + "step": 403890 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429549407565432, + "loss": 0.0115, + "step": 403900 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014295105254017175, + "loss": 0.0131, + "step": 403910 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014294716432380027, + "loss": 0.0182, + "step": 403920 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429432761074288, + "loss": 0.0115, + "step": 403930 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014293938789105735, + "loss": 0.0114, + "step": 403940 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014293549967468586, + "loss": 0.0105, + "step": 403950 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014293161145831443, + "loss": 0.015, + "step": 403960 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014292772324194295, + "loss": 0.0111, + "step": 403970 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429238350255715, + "loss": 0.0101, + "step": 403980 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014291994680920003, + "loss": 0.0112, + "step": 403990 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014291605859282857, + "loss": 0.013, + "step": 404000 + }, + { + "epoch": 1.05, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.009204316884279251, + "eval_runtime": 107.4647, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, + "step": 404000 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429121703764571, + "loss": 0.0083, + "step": 404010 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014290828216008563, + "loss": 0.0128, + "step": 404020 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014290439394371417, + "loss": 0.0101, + "step": 404030 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001429005057273427, + "loss": 0.0138, + "step": 404040 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014289661751097123, + "loss": 0.0102, + "step": 404050 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014289272929459977, + "loss": 0.0119, + "step": 404060 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428888410782283, + "loss": 0.0117, + "step": 404070 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014288495286185685, + "loss": 0.0124, + "step": 404080 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014288106464548537, + "loss": 0.0108, + "step": 404090 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014287717642911393, + "loss": 0.015, + "step": 404100 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014287328821274245, + "loss": 0.0166, + "step": 404110 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142869399996371, + "loss": 0.0108, + "step": 404120 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014286551177999953, + "loss": 0.0132, + "step": 404130 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014286162356362807, + "loss": 0.0122, + "step": 404140 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428577353472566, + "loss": 0.0121, + "step": 404150 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014285384713088513, + "loss": 0.0105, + "step": 404160 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014284995891451367, + "loss": 0.0111, + "step": 404170 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014284607069814219, + "loss": 0.0119, + "step": 404180 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014284218248177073, + "loss": 0.013, + "step": 404190 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014283829426539927, + "loss": 0.0094, + "step": 404200 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428344060490278, + "loss": 0.0089, + "step": 404210 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014283051783265633, + "loss": 0.0096, + "step": 404220 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014282662961628487, + "loss": 0.0115, + "step": 404230 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428227413999134, + "loss": 0.0106, + "step": 404240 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014281885318354195, + "loss": 0.0084, + "step": 404250 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014281496496717046, + "loss": 0.0134, + "step": 404260 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142811076750799, + "loss": 0.0113, + "step": 404270 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014280718853442755, + "loss": 0.0116, + "step": 404280 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001428033003180561, + "loss": 0.0122, + "step": 404290 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014279941210168463, + "loss": 0.0106, + "step": 404300 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014279552388531317, + "loss": 0.0118, + "step": 404310 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427916356689417, + "loss": 0.0105, + "step": 404320 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014278774745257023, + "loss": 0.01, + "step": 404330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014278385923619877, + "loss": 0.0121, + "step": 404340 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427799710198273, + "loss": 0.0087, + "step": 404350 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014277608280345583, + "loss": 0.0092, + "step": 404360 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014277219458708437, + "loss": 0.012, + "step": 404370 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427683063707129, + "loss": 0.0119, + "step": 404380 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014276441815434145, + "loss": 0.0101, + "step": 404390 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014276052993796997, + "loss": 0.0152, + "step": 404400 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427566417215985, + "loss": 0.0114, + "step": 404410 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014275275350522705, + "loss": 0.01, + "step": 404420 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014274886528885556, + "loss": 0.0132, + "step": 404430 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427449770724841, + "loss": 0.0094, + "step": 404440 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014274108885611265, + "loss": 0.0129, + "step": 404450 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427372006397412, + "loss": 0.0131, + "step": 404460 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427333124233697, + "loss": 0.0108, + "step": 404470 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014272942420699827, + "loss": 0.0101, + "step": 404480 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427255359906268, + "loss": 0.012, + "step": 404490 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014272164777425533, + "loss": 0.0104, + "step": 404500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014271775955788387, + "loss": 0.0117, + "step": 404510 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001427138713415124, + "loss": 0.0105, + "step": 404520 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014270998312514093, + "loss": 0.0119, + "step": 404530 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014270609490876947, + "loss": 0.0114, + "step": 404540 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142702206692398, + "loss": 0.0168, + "step": 404550 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014269831847602655, + "loss": 0.0119, + "step": 404560 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014269443025965507, + "loss": 0.012, + "step": 404570 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426905420432836, + "loss": 0.0149, + "step": 404580 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014268665382691215, + "loss": 0.0116, + "step": 404590 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426827656105407, + "loss": 0.0127, + "step": 404600 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426788773941692, + "loss": 0.0111, + "step": 404610 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014267498917779777, + "loss": 0.0088, + "step": 404620 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426711009614263, + "loss": 0.0171, + "step": 404630 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014266721274505483, + "loss": 0.0111, + "step": 404640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014266332452868337, + "loss": 0.0119, + "step": 404650 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426594363123119, + "loss": 0.012, + "step": 404660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014265554809594043, + "loss": 0.0121, + "step": 404670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014265165987956897, + "loss": 0.0118, + "step": 404680 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426477716631975, + "loss": 0.0108, + "step": 404690 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014264388344682603, + "loss": 0.0115, + "step": 404700 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014263999523045457, + "loss": 0.0109, + "step": 404710 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426361070140831, + "loss": 0.0099, + "step": 404720 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014263221879771165, + "loss": 0.0116, + "step": 404730 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014262833058134017, + "loss": 0.0108, + "step": 404740 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426244423649687, + "loss": 0.0106, + "step": 404750 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014262055414859725, + "loss": 0.0127, + "step": 404760 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426166659322258, + "loss": 0.0138, + "step": 404770 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426127777158543, + "loss": 0.014, + "step": 404780 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014260888949948285, + "loss": 0.0096, + "step": 404790 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001426050012831114, + "loss": 0.0117, + "step": 404800 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014260111306673993, + "loss": 0.0112, + "step": 404810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014259722485036847, + "loss": 0.0106, + "step": 404820 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142593336633997, + "loss": 0.0127, + "step": 404830 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014258944841762553, + "loss": 0.0151, + "step": 404840 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014258556020125407, + "loss": 0.0165, + "step": 404850 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425816719848826, + "loss": 0.0115, + "step": 404860 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014257778376851115, + "loss": 0.0102, + "step": 404870 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014257389555213967, + "loss": 0.0099, + "step": 404880 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425700073357682, + "loss": 0.0107, + "step": 404890 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014256611911939675, + "loss": 0.0127, + "step": 404900 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425622309030253, + "loss": 0.0124, + "step": 404910 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425583426866538, + "loss": 0.0148, + "step": 404920 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014255445447028235, + "loss": 0.0115, + "step": 404930 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425505662539109, + "loss": 0.0111, + "step": 404940 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425466780375394, + "loss": 0.0123, + "step": 404950 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014254278982116795, + "loss": 0.012, + "step": 404960 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425389016047965, + "loss": 0.0147, + "step": 404970 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014253501338842503, + "loss": 0.0133, + "step": 404980 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014253112517205354, + "loss": 0.0122, + "step": 404990 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425272369556821, + "loss": 0.0136, + "step": 405000 + }, + { + "epoch": 1.05, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.007998434826731682, + "eval_runtime": 107.3073, + "eval_samples_per_second": 18.638, + "eval_steps_per_second": 4.66, + "step": 405000 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014252334873931063, + "loss": 0.0107, + "step": 405010 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014251946052293917, + "loss": 0.0139, + "step": 405020 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425155723065677, + "loss": 0.0128, + "step": 405030 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014251168409019625, + "loss": 0.015, + "step": 405040 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014250779587382477, + "loss": 0.0122, + "step": 405050 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001425039076574533, + "loss": 0.009, + "step": 405060 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014250001944108185, + "loss": 0.0099, + "step": 405070 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424961312247104, + "loss": 0.013, + "step": 405080 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424922430083389, + "loss": 0.0091, + "step": 405090 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014248835479196745, + "loss": 0.01, + "step": 405100 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142484466575596, + "loss": 0.012, + "step": 405110 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014248057835922453, + "loss": 0.0132, + "step": 405120 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014247669014285305, + "loss": 0.0106, + "step": 405130 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424728019264816, + "loss": 0.0117, + "step": 405140 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014246891371011013, + "loss": 0.0139, + "step": 405150 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014246502549373864, + "loss": 0.0142, + "step": 405160 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424611372773672, + "loss": 0.016, + "step": 405170 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014245724906099573, + "loss": 0.0184, + "step": 405180 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014245336084462427, + "loss": 0.0111, + "step": 405190 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424494726282528, + "loss": 0.0112, + "step": 405200 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014244558441188135, + "loss": 0.0134, + "step": 405210 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014244169619550987, + "loss": 0.0132, + "step": 405220 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424378079791384, + "loss": 0.0105, + "step": 405230 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014243391976276695, + "loss": 0.0115, + "step": 405240 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424300315463955, + "loss": 0.0137, + "step": 405250 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142426143330024, + "loss": 0.0123, + "step": 405260 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014242225511365255, + "loss": 0.0089, + "step": 405270 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001424183668972811, + "loss": 0.01, + "step": 405280 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014241447868090963, + "loss": 0.0095, + "step": 405290 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014241059046453814, + "loss": 0.015, + "step": 405300 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014240670224816669, + "loss": 0.0132, + "step": 405310 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014240281403179523, + "loss": 0.0126, + "step": 405320 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014239892581542377, + "loss": 0.0146, + "step": 405330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014239503759905228, + "loss": 0.0132, + "step": 405340 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014239114938268085, + "loss": 0.0131, + "step": 405350 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014238726116630937, + "loss": 0.0116, + "step": 405360 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423833729499379, + "loss": 0.0126, + "step": 405370 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014237948473356645, + "loss": 0.0123, + "step": 405380 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142375596517195, + "loss": 0.01, + "step": 405390 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423717083008235, + "loss": 0.0118, + "step": 405400 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014236782008445205, + "loss": 0.0141, + "step": 405410 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423639318680806, + "loss": 0.0122, + "step": 405420 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423600436517091, + "loss": 0.0133, + "step": 405430 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014235615543533765, + "loss": 0.0119, + "step": 405440 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423522672189662, + "loss": 0.011, + "step": 405450 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014234837900259473, + "loss": 0.011, + "step": 405460 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014234449078622324, + "loss": 0.0124, + "step": 405470 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014234060256985179, + "loss": 0.0097, + "step": 405480 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014233671435348033, + "loss": 0.0121, + "step": 405490 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014233282613710887, + "loss": 0.0109, + "step": 405500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014232893792073738, + "loss": 0.0128, + "step": 405510 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014232504970436595, + "loss": 0.0092, + "step": 405520 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014232116148799447, + "loss": 0.0108, + "step": 405530 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142317273271623, + "loss": 0.0102, + "step": 405540 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014231338505525155, + "loss": 0.0127, + "step": 405550 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423094968388801, + "loss": 0.0124, + "step": 405560 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001423056086225086, + "loss": 0.0149, + "step": 405570 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014230172040613715, + "loss": 0.0128, + "step": 405580 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422978321897657, + "loss": 0.0114, + "step": 405590 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014229394397339423, + "loss": 0.0136, + "step": 405600 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014229005575702275, + "loss": 0.0089, + "step": 405610 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422861675406513, + "loss": 0.0156, + "step": 405620 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014228227932427983, + "loss": 0.0104, + "step": 405630 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014227839110790837, + "loss": 0.0104, + "step": 405640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014227450289153689, + "loss": 0.0101, + "step": 405650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014227061467516543, + "loss": 0.0131, + "step": 405660 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014226672645879397, + "loss": 0.0117, + "step": 405670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014226283824242248, + "loss": 0.013, + "step": 405680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014225895002605105, + "loss": 0.0149, + "step": 405690 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014225506180967957, + "loss": 0.0088, + "step": 405700 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422511735933081, + "loss": 0.0117, + "step": 405710 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014224728537693665, + "loss": 0.0096, + "step": 405720 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422433971605652, + "loss": 0.0143, + "step": 405730 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422395089441937, + "loss": 0.0142, + "step": 405740 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014223562072782225, + "loss": 0.0109, + "step": 405750 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422317325114508, + "loss": 0.0119, + "step": 405760 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014222784429507933, + "loss": 0.0113, + "step": 405770 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014222395607870785, + "loss": 0.0134, + "step": 405780 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001422200678623364, + "loss": 0.0101, + "step": 405790 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014221617964596493, + "loss": 0.011, + "step": 405800 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014221229142959347, + "loss": 0.0123, + "step": 405810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014220840321322198, + "loss": 0.0114, + "step": 405820 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014220451499685053, + "loss": 0.0109, + "step": 405830 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014220062678047907, + "loss": 0.0121, + "step": 405840 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421967385641076, + "loss": 0.015, + "step": 405850 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014219285034773612, + "loss": 0.0117, + "step": 405860 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421889621313647, + "loss": 0.0109, + "step": 405870 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421850739149932, + "loss": 0.0093, + "step": 405880 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014218118569862175, + "loss": 0.0101, + "step": 405890 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421772974822503, + "loss": 0.0116, + "step": 405900 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421734092658788, + "loss": 0.0104, + "step": 405910 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014216952104950735, + "loss": 0.0101, + "step": 405920 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421656328331359, + "loss": 0.0102, + "step": 405930 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014216174461676443, + "loss": 0.0124, + "step": 405940 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014215785640039294, + "loss": 0.0129, + "step": 405950 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014215396818402149, + "loss": 0.0106, + "step": 405960 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014215007996765003, + "loss": 0.0112, + "step": 405970 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014214619175127857, + "loss": 0.0135, + "step": 405980 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014214230353490708, + "loss": 0.0132, + "step": 405990 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014213841531853563, + "loss": 0.012, + "step": 406000 + }, + { + "epoch": 1.05, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.007497414480894804, + "eval_runtime": 107.7608, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, + "step": 406000 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014213452710216417, + "loss": 0.0128, + "step": 406010 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421306388857927, + "loss": 0.0107, + "step": 406020 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014212675066942122, + "loss": 0.0152, + "step": 406030 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421228624530498, + "loss": 0.0119, + "step": 406040 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421189742366783, + "loss": 0.0126, + "step": 406050 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014211508602030685, + "loss": 0.0116, + "step": 406060 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001421111978039354, + "loss": 0.0119, + "step": 406070 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014210730958756393, + "loss": 0.0136, + "step": 406080 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014210342137119245, + "loss": 0.0139, + "step": 406090 + }, + { + "epoch": 1.05, + "learning_rate": 0.000142099533154821, + "loss": 0.014, + "step": 406100 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014209564493844953, + "loss": 0.0115, + "step": 406110 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014209175672207807, + "loss": 0.017, + "step": 406120 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014208786850570659, + "loss": 0.0111, + "step": 406130 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014208398028933513, + "loss": 0.0098, + "step": 406140 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014208009207296367, + "loss": 0.0105, + "step": 406150 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014207620385659218, + "loss": 0.011, + "step": 406160 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014207231564022072, + "loss": 0.0116, + "step": 406170 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014206842742384927, + "loss": 0.0132, + "step": 406180 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420645392074778, + "loss": 0.01, + "step": 406190 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014206065099110632, + "loss": 0.0115, + "step": 406200 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420567627747349, + "loss": 0.01, + "step": 406210 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420528745583634, + "loss": 0.011, + "step": 406220 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014204898634199195, + "loss": 0.0161, + "step": 406230 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420450981256205, + "loss": 0.0157, + "step": 406240 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014204120990924903, + "loss": 0.0112, + "step": 406250 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014203732169287755, + "loss": 0.0123, + "step": 406260 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420334334765061, + "loss": 0.012, + "step": 406270 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014202954526013463, + "loss": 0.0105, + "step": 406280 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014202565704376317, + "loss": 0.0137, + "step": 406290 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014202176882739168, + "loss": 0.0122, + "step": 406300 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014201788061102023, + "loss": 0.013, + "step": 406310 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014201399239464877, + "loss": 0.0079, + "step": 406320 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001420101041782773, + "loss": 0.0168, + "step": 406330 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014200621596190582, + "loss": 0.0092, + "step": 406340 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014200232774553437, + "loss": 0.0131, + "step": 406350 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419984395291629, + "loss": 0.0092, + "step": 406360 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014199455131279145, + "loss": 0.0099, + "step": 406370 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014199066309641996, + "loss": 0.0088, + "step": 406380 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014198677488004853, + "loss": 0.0132, + "step": 406390 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014198288666367705, + "loss": 0.0105, + "step": 406400 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419789984473056, + "loss": 0.0107, + "step": 406410 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014197511023093413, + "loss": 0.0108, + "step": 406420 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014197122201456264, + "loss": 0.0137, + "step": 406430 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419673337981912, + "loss": 0.012, + "step": 406440 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014196344558181973, + "loss": 0.0148, + "step": 406450 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014195955736544827, + "loss": 0.0118, + "step": 406460 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014195566914907678, + "loss": 0.009, + "step": 406470 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014195178093270533, + "loss": 0.0156, + "step": 406480 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014194789271633387, + "loss": 0.011, + "step": 406490 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419440044999624, + "loss": 0.0109, + "step": 406500 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014194011628359092, + "loss": 0.0107, + "step": 406510 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014193622806721947, + "loss": 0.0132, + "step": 406520 + }, + { + "epoch": 1.05, + "learning_rate": 0.000141932339850848, + "loss": 0.0116, + "step": 406530 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014192845163447655, + "loss": 0.011, + "step": 406540 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014192456341810506, + "loss": 0.0113, + "step": 406550 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014192067520173363, + "loss": 0.0112, + "step": 406560 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014191678698536215, + "loss": 0.0099, + "step": 406570 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001419128987689907, + "loss": 0.013, + "step": 406580 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014190901055261923, + "loss": 0.0127, + "step": 406590 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014190512233624777, + "loss": 0.0097, + "step": 406600 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014190123411987629, + "loss": 0.0116, + "step": 406610 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014189734590350483, + "loss": 0.0133, + "step": 406620 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014189345768713337, + "loss": 0.0106, + "step": 406630 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418895694707619, + "loss": 0.0105, + "step": 406640 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014188568125439043, + "loss": 0.0132, + "step": 406650 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014188179303801897, + "loss": 0.0108, + "step": 406660 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418779048216475, + "loss": 0.0167, + "step": 406670 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014187401660527602, + "loss": 0.0084, + "step": 406680 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014187012838890456, + "loss": 0.0105, + "step": 406690 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418662401725331, + "loss": 0.0094, + "step": 406700 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014186235195616165, + "loss": 0.0116, + "step": 406710 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014185846373979016, + "loss": 0.0113, + "step": 406720 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418545755234187, + "loss": 0.0139, + "step": 406730 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014185068730704725, + "loss": 0.0092, + "step": 406740 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418467990906758, + "loss": 0.0123, + "step": 406750 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014184291087430433, + "loss": 0.0134, + "step": 406760 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014183902265793287, + "loss": 0.0106, + "step": 406770 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014183513444156139, + "loss": 0.0132, + "step": 406780 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014183124622518993, + "loss": 0.0121, + "step": 406790 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014182735800881847, + "loss": 0.0104, + "step": 406800 + }, + { + "epoch": 1.05, + "learning_rate": 0.000141823469792447, + "loss": 0.0101, + "step": 406810 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014181958157607552, + "loss": 0.0115, + "step": 406820 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014181569335970407, + "loss": 0.0159, + "step": 406830 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418118051433326, + "loss": 0.0128, + "step": 406840 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014180791692696115, + "loss": 0.0097, + "step": 406850 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014180402871058966, + "loss": 0.0114, + "step": 406860 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001418001404942182, + "loss": 0.0098, + "step": 406870 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014179625227784675, + "loss": 0.0156, + "step": 406880 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417923640614753, + "loss": 0.0132, + "step": 406890 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417884758451038, + "loss": 0.0096, + "step": 406900 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014178458762873235, + "loss": 0.0116, + "step": 406910 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417806994123609, + "loss": 0.0162, + "step": 406920 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417768111959894, + "loss": 0.0105, + "step": 406930 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014177292297961797, + "loss": 0.0137, + "step": 406940 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014176903476324648, + "loss": 0.0141, + "step": 406950 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014176514654687503, + "loss": 0.0113, + "step": 406960 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014176125833050357, + "loss": 0.0116, + "step": 406970 + }, + { + "epoch": 1.05, + "learning_rate": 0.0001417573701141321, + "loss": 0.0102, + "step": 406980 + }, + { + "epoch": 1.05, + "learning_rate": 0.00014175348189776062, + "loss": 0.0113, + "step": 406990 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014174959368138917, + "loss": 0.013, + "step": 407000 + }, + { + "epoch": 1.06, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.007594889495521784, + "eval_runtime": 107.3439, + "eval_samples_per_second": 18.632, + "eval_steps_per_second": 4.658, + "step": 407000 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417457054650177, + "loss": 0.0087, + "step": 407010 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014174181724864625, + "loss": 0.0162, + "step": 407020 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014173792903227476, + "loss": 0.0139, + "step": 407030 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417340408159033, + "loss": 0.0108, + "step": 407040 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014173015259953185, + "loss": 0.014, + "step": 407050 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417262643831604, + "loss": 0.0138, + "step": 407060 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417223761667889, + "loss": 0.0109, + "step": 407070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014171848795041747, + "loss": 0.0123, + "step": 407080 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014171459973404599, + "loss": 0.0127, + "step": 407090 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014171071151767453, + "loss": 0.0178, + "step": 407100 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014170682330130307, + "loss": 0.0093, + "step": 407110 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001417029350849316, + "loss": 0.0131, + "step": 407120 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014169904686856013, + "loss": 0.0124, + "step": 407130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014169515865218867, + "loss": 0.013, + "step": 407140 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416912704358172, + "loss": 0.0113, + "step": 407150 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014168738221944572, + "loss": 0.0101, + "step": 407160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014168349400307427, + "loss": 0.0139, + "step": 407170 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416796057867028, + "loss": 0.0121, + "step": 407180 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014167571757033135, + "loss": 0.0101, + "step": 407190 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014167182935395986, + "loss": 0.0114, + "step": 407200 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416679411375884, + "loss": 0.0149, + "step": 407210 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014166405292121695, + "loss": 0.0091, + "step": 407220 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416601647048455, + "loss": 0.0167, + "step": 407230 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141656276488474, + "loss": 0.0107, + "step": 407240 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014165238827210254, + "loss": 0.016, + "step": 407250 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014164850005573109, + "loss": 0.0173, + "step": 407260 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014164461183935963, + "loss": 0.0087, + "step": 407270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014164072362298817, + "loss": 0.0141, + "step": 407280 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416368354066167, + "loss": 0.0083, + "step": 407290 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014163294719024523, + "loss": 0.0132, + "step": 407300 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014162905897387377, + "loss": 0.0146, + "step": 407310 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416251707575023, + "loss": 0.0137, + "step": 407320 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014162128254113085, + "loss": 0.0131, + "step": 407330 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014161739432475936, + "loss": 0.0123, + "step": 407340 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416135061083879, + "loss": 0.011, + "step": 407350 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014160961789201645, + "loss": 0.0142, + "step": 407360 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141605729675645, + "loss": 0.0123, + "step": 407370 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001416018414592735, + "loss": 0.0114, + "step": 407380 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014159795324290205, + "loss": 0.0137, + "step": 407390 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415940650265306, + "loss": 0.0129, + "step": 407400 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415901768101591, + "loss": 0.0157, + "step": 407410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014158628859378764, + "loss": 0.0139, + "step": 407420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014158240037741619, + "loss": 0.0131, + "step": 407430 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014157851216104473, + "loss": 0.0113, + "step": 407440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014157462394467324, + "loss": 0.0114, + "step": 407450 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415707357283018, + "loss": 0.0119, + "step": 407460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014156684751193032, + "loss": 0.0183, + "step": 407470 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014156295929555887, + "loss": 0.0099, + "step": 407480 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415590710791874, + "loss": 0.0103, + "step": 407490 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014155518286281595, + "loss": 0.012, + "step": 407500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014155129464644446, + "loss": 0.0117, + "step": 407510 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141547406430073, + "loss": 0.0112, + "step": 407520 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014154351821370155, + "loss": 0.0108, + "step": 407530 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415396299973301, + "loss": 0.0098, + "step": 407540 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415357417809586, + "loss": 0.0096, + "step": 407550 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014153185356458715, + "loss": 0.0111, + "step": 407560 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415279653482157, + "loss": 0.0113, + "step": 407570 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014152407713184423, + "loss": 0.0106, + "step": 407580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014152018891547274, + "loss": 0.0091, + "step": 407590 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014151630069910128, + "loss": 0.0131, + "step": 407600 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014151241248272983, + "loss": 0.0143, + "step": 407610 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014150852426635837, + "loss": 0.0101, + "step": 407620 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001415046360499869, + "loss": 0.01, + "step": 407630 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014150074783361542, + "loss": 0.0109, + "step": 407640 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014149685961724397, + "loss": 0.0154, + "step": 407650 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414929714008725, + "loss": 0.0113, + "step": 407660 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014148908318450105, + "loss": 0.012, + "step": 407670 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014148519496812956, + "loss": 0.0108, + "step": 407680 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414813067517581, + "loss": 0.0128, + "step": 407690 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014147741853538665, + "loss": 0.0078, + "step": 407700 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414735303190152, + "loss": 0.0108, + "step": 407710 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414696421026437, + "loss": 0.0106, + "step": 407720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014146575388627224, + "loss": 0.0113, + "step": 407730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014146186566990079, + "loss": 0.0105, + "step": 407740 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014145797745352933, + "loss": 0.012, + "step": 407750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014145408923715784, + "loss": 0.0097, + "step": 407760 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014145020102078638, + "loss": 0.0098, + "step": 407770 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014144631280441493, + "loss": 0.0126, + "step": 407780 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014144242458804347, + "loss": 0.0087, + "step": 407790 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014143853637167198, + "loss": 0.0118, + "step": 407800 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014143464815530055, + "loss": 0.0077, + "step": 407810 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014143075993892907, + "loss": 0.0144, + "step": 407820 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414268717225576, + "loss": 0.0117, + "step": 407830 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014142298350618615, + "loss": 0.0113, + "step": 407840 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414190952898147, + "loss": 0.0144, + "step": 407850 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414152070734432, + "loss": 0.0116, + "step": 407860 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014141131885707175, + "loss": 0.0131, + "step": 407870 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414074306407003, + "loss": 0.0109, + "step": 407880 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001414035424243288, + "loss": 0.0107, + "step": 407890 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014139965420795734, + "loss": 0.0107, + "step": 407900 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014139576599158589, + "loss": 0.0117, + "step": 407910 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014139187777521443, + "loss": 0.0098, + "step": 407920 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014138798955884294, + "loss": 0.0131, + "step": 407930 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014138410134247148, + "loss": 0.0137, + "step": 407940 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014138021312610003, + "loss": 0.0132, + "step": 407950 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014137632490972857, + "loss": 0.0112, + "step": 407960 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014137243669335708, + "loss": 0.0102, + "step": 407970 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014136854847698565, + "loss": 0.0101, + "step": 407980 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014136466026061416, + "loss": 0.0118, + "step": 407990 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413607720442427, + "loss": 0.0123, + "step": 408000 + }, + { + "epoch": 1.06, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.007572217844426632, + "eval_runtime": 107.5486, + "eval_samples_per_second": 18.596, + "eval_steps_per_second": 4.649, + "step": 408000 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014135688382787125, + "loss": 0.0114, + "step": 408010 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413529956114998, + "loss": 0.0106, + "step": 408020 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413491073951283, + "loss": 0.0138, + "step": 408030 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014134521917875685, + "loss": 0.0118, + "step": 408040 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001413413309623854, + "loss": 0.0105, + "step": 408050 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014133744274601393, + "loss": 0.0108, + "step": 408060 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014133355452964244, + "loss": 0.0114, + "step": 408070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014132966631327099, + "loss": 0.0082, + "step": 408080 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014132577809689953, + "loss": 0.0138, + "step": 408090 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014132188988052807, + "loss": 0.0126, + "step": 408100 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014131800166415658, + "loss": 0.0133, + "step": 408110 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014131411344778512, + "loss": 0.0138, + "step": 408120 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014131022523141367, + "loss": 0.0125, + "step": 408130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014130633701504218, + "loss": 0.013, + "step": 408140 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014130244879867075, + "loss": 0.011, + "step": 408150 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014129856058229926, + "loss": 0.0096, + "step": 408160 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412946723659278, + "loss": 0.0136, + "step": 408170 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014129078414955635, + "loss": 0.0118, + "step": 408180 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412868959331849, + "loss": 0.0135, + "step": 408190 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412830077168134, + "loss": 0.0132, + "step": 408200 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014127911950044195, + "loss": 0.0131, + "step": 408210 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412752312840705, + "loss": 0.0093, + "step": 408220 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014127134306769903, + "loss": 0.0148, + "step": 408230 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014126745485132754, + "loss": 0.0232, + "step": 408240 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014126356663495608, + "loss": 0.0235, + "step": 408250 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014125967841858463, + "loss": 0.0115, + "step": 408260 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014125579020221317, + "loss": 0.0107, + "step": 408270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014125190198584168, + "loss": 0.0121, + "step": 408280 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014124801376947022, + "loss": 0.0111, + "step": 408290 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014124412555309877, + "loss": 0.0127, + "step": 408300 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412402373367273, + "loss": 0.0107, + "step": 408310 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014123634912035582, + "loss": 0.0079, + "step": 408320 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412324609039844, + "loss": 0.017, + "step": 408330 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001412285726876129, + "loss": 0.0157, + "step": 408340 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014122468447124145, + "loss": 0.008, + "step": 408350 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014122079625487, + "loss": 0.0131, + "step": 408360 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014121690803849853, + "loss": 0.0136, + "step": 408370 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014121301982212704, + "loss": 0.0107, + "step": 408380 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014120913160575559, + "loss": 0.0105, + "step": 408390 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014120524338938413, + "loss": 0.0094, + "step": 408400 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014120135517301264, + "loss": 0.0084, + "step": 408410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014119746695664118, + "loss": 0.0101, + "step": 408420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014119357874026973, + "loss": 0.0112, + "step": 408430 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014118969052389827, + "loss": 0.0124, + "step": 408440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014118580230752678, + "loss": 0.0142, + "step": 408450 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014118191409115532, + "loss": 0.0113, + "step": 408460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014117802587478387, + "loss": 0.012, + "step": 408470 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411741376584124, + "loss": 0.0104, + "step": 408480 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014117024944204092, + "loss": 0.0113, + "step": 408490 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411663612256695, + "loss": 0.0148, + "step": 408500 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141162473009298, + "loss": 0.0112, + "step": 408510 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014115858479292655, + "loss": 0.0114, + "step": 408520 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411546965765551, + "loss": 0.0106, + "step": 408530 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014115080836018363, + "loss": 0.0089, + "step": 408540 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014114692014381214, + "loss": 0.0146, + "step": 408550 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014114303192744069, + "loss": 0.0118, + "step": 408560 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014113914371106923, + "loss": 0.0089, + "step": 408570 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014113525549469777, + "loss": 0.0123, + "step": 408580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014113136727832628, + "loss": 0.0141, + "step": 408590 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014112747906195483, + "loss": 0.0107, + "step": 408600 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014112359084558337, + "loss": 0.0108, + "step": 408610 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411197026292119, + "loss": 0.0107, + "step": 408620 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014111581441284042, + "loss": 0.0113, + "step": 408630 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014111192619646896, + "loss": 0.0109, + "step": 408640 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411080379800975, + "loss": 0.0093, + "step": 408650 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014110414976372602, + "loss": 0.011, + "step": 408660 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001411002615473546, + "loss": 0.011, + "step": 408670 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410963733309831, + "loss": 0.01, + "step": 408680 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014109248511461165, + "loss": 0.0129, + "step": 408690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410885968982402, + "loss": 0.0113, + "step": 408700 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014108470868186873, + "loss": 0.0203, + "step": 408710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014108082046549724, + "loss": 0.0108, + "step": 408720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014107693224912579, + "loss": 0.0159, + "step": 408730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014107304403275433, + "loss": 0.0116, + "step": 408740 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014106915581638287, + "loss": 0.0095, + "step": 408750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014106526760001138, + "loss": 0.0102, + "step": 408760 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014106137938363992, + "loss": 0.0127, + "step": 408770 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014105749116726847, + "loss": 0.0146, + "step": 408780 + }, + { + "epoch": 1.06, + "learning_rate": 0.000141053602950897, + "loss": 0.0101, + "step": 408790 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014104971473452552, + "loss": 0.0122, + "step": 408800 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014104582651815406, + "loss": 0.0124, + "step": 408810 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410419383017826, + "loss": 0.0116, + "step": 408820 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014103805008541115, + "loss": 0.012, + "step": 408830 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014103416186903966, + "loss": 0.0126, + "step": 408840 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014103027365266823, + "loss": 0.011, + "step": 408850 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014102638543629675, + "loss": 0.0142, + "step": 408860 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001410224972199253, + "loss": 0.0117, + "step": 408870 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014101860900355383, + "loss": 0.0111, + "step": 408880 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014101472078718234, + "loss": 0.0107, + "step": 408890 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014101083257081088, + "loss": 0.0111, + "step": 408900 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014100694435443943, + "loss": 0.0112, + "step": 408910 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014100305613806797, + "loss": 0.0084, + "step": 408920 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014099916792169648, + "loss": 0.0113, + "step": 408930 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014099527970532502, + "loss": 0.01, + "step": 408940 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014099139148895357, + "loss": 0.0087, + "step": 408950 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409875032725821, + "loss": 0.0111, + "step": 408960 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014098361505621062, + "loss": 0.0098, + "step": 408970 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014097972683983916, + "loss": 0.013, + "step": 408980 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409758386234677, + "loss": 0.0111, + "step": 408990 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014097195040709625, + "loss": 0.0106, + "step": 409000 + }, + { + "epoch": 1.06, + "eval_cer": 0.8817390768834564, + "eval_loss": 0.007736441679298878, + "eval_runtime": 107.4459, + "eval_samples_per_second": 18.614, + "eval_steps_per_second": 4.654, + "step": 409000 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014096806219072476, + "loss": 0.0107, + "step": 409010 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014096417397435333, + "loss": 0.0108, + "step": 409020 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014096028575798184, + "loss": 0.0295, + "step": 409030 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014095639754161039, + "loss": 0.0122, + "step": 409040 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014095250932523893, + "loss": 0.0106, + "step": 409050 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014094862110886747, + "loss": 0.0121, + "step": 409060 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014094473289249598, + "loss": 0.0162, + "step": 409070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014094084467612453, + "loss": 0.0128, + "step": 409080 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014093695645975307, + "loss": 0.0122, + "step": 409090 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409330682433816, + "loss": 0.0106, + "step": 409100 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014092918002701012, + "loss": 0.0108, + "step": 409110 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014092529181063866, + "loss": 0.0102, + "step": 409120 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409214035942672, + "loss": 0.0117, + "step": 409130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014091751537789572, + "loss": 0.0119, + "step": 409140 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014091362716152426, + "loss": 0.0117, + "step": 409150 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001409097389451528, + "loss": 0.0105, + "step": 409160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014090585072878135, + "loss": 0.0118, + "step": 409170 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014090196251240986, + "loss": 0.0094, + "step": 409180 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408980742960384, + "loss": 0.0104, + "step": 409190 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014089418607966694, + "loss": 0.013, + "step": 409200 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014089029786329549, + "loss": 0.0082, + "step": 409210 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014088640964692403, + "loss": 0.0119, + "step": 409220 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014088252143055257, + "loss": 0.011, + "step": 409230 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014087863321418108, + "loss": 0.0126, + "step": 409240 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014087474499780962, + "loss": 0.0122, + "step": 409250 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014087085678143817, + "loss": 0.0097, + "step": 409260 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408669685650667, + "loss": 0.0118, + "step": 409270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014086308034869522, + "loss": 0.0099, + "step": 409280 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014085919213232376, + "loss": 0.0092, + "step": 409290 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408553039159523, + "loss": 0.0106, + "step": 409300 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014085141569958085, + "loss": 0.0134, + "step": 409310 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014084752748320936, + "loss": 0.0134, + "step": 409320 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408436392668379, + "loss": 0.0091, + "step": 409330 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014083975105046645, + "loss": 0.014, + "step": 409340 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140835862834095, + "loss": 0.0096, + "step": 409350 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408319746177235, + "loss": 0.0096, + "step": 409360 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014082808640135207, + "loss": 0.009, + "step": 409370 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014082419818498058, + "loss": 0.0101, + "step": 409380 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408203099686091, + "loss": 0.0122, + "step": 409390 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014081642175223767, + "loss": 0.0096, + "step": 409400 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014081253353586618, + "loss": 0.0122, + "step": 409410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014080864531949472, + "loss": 0.0091, + "step": 409420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014080475710312327, + "loss": 0.0134, + "step": 409430 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001408008688867518, + "loss": 0.0109, + "step": 409440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014079698067038032, + "loss": 0.011, + "step": 409450 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014079309245400886, + "loss": 0.0118, + "step": 409460 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407892042376374, + "loss": 0.0158, + "step": 409470 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014078531602126595, + "loss": 0.0095, + "step": 409480 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014078142780489446, + "loss": 0.0161, + "step": 409490 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140777539588523, + "loss": 0.0106, + "step": 409500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014077365137215154, + "loss": 0.0097, + "step": 409510 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407697631557801, + "loss": 0.0137, + "step": 409520 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407658749394086, + "loss": 0.0104, + "step": 409530 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014076198672303717, + "loss": 0.011, + "step": 409540 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014075809850666568, + "loss": 0.0114, + "step": 409550 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014075421029029423, + "loss": 0.011, + "step": 409560 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014075032207392277, + "loss": 0.0125, + "step": 409570 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407464338575513, + "loss": 0.0103, + "step": 409580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014074254564117982, + "loss": 0.0114, + "step": 409590 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014073865742480837, + "loss": 0.0117, + "step": 409600 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407347692084369, + "loss": 0.0157, + "step": 409610 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014073088099206545, + "loss": 0.0108, + "step": 409620 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014072699277569396, + "loss": 0.0106, + "step": 409630 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407231045593225, + "loss": 0.0162, + "step": 409640 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014071921634295105, + "loss": 0.0152, + "step": 409650 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014071532812657956, + "loss": 0.0097, + "step": 409660 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001407114399102081, + "loss": 0.0128, + "step": 409670 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014070755169383664, + "loss": 0.0119, + "step": 409680 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014070366347746519, + "loss": 0.0112, + "step": 409690 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406997752610937, + "loss": 0.0118, + "step": 409700 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014069588704472224, + "loss": 0.0206, + "step": 409710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014069199882835078, + "loss": 0.0131, + "step": 409720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014068811061197933, + "loss": 0.0112, + "step": 409730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014068422239560787, + "loss": 0.0119, + "step": 409740 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406803341792364, + "loss": 0.0098, + "step": 409750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014067644596286492, + "loss": 0.0117, + "step": 409760 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014067255774649346, + "loss": 0.013, + "step": 409770 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140668669530122, + "loss": 0.0131, + "step": 409780 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014066478131375055, + "loss": 0.0109, + "step": 409790 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014066089309737906, + "loss": 0.008, + "step": 409800 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406570048810076, + "loss": 0.0113, + "step": 409810 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014065311666463615, + "loss": 0.0133, + "step": 409820 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406492284482647, + "loss": 0.01, + "step": 409830 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406453402318932, + "loss": 0.0107, + "step": 409840 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014064145201552174, + "loss": 0.0119, + "step": 409850 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014063756379915029, + "loss": 0.0107, + "step": 409860 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014063367558277883, + "loss": 0.0092, + "step": 409870 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014062978736640734, + "loss": 0.0131, + "step": 409880 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014062589915003588, + "loss": 0.0119, + "step": 409890 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014062201093366442, + "loss": 0.0112, + "step": 409900 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014061812271729294, + "loss": 0.0101, + "step": 409910 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406142345009215, + "loss": 0.0114, + "step": 409920 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014061034628455002, + "loss": 0.0106, + "step": 409930 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014060645806817856, + "loss": 0.0097, + "step": 409940 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001406025698518071, + "loss": 0.01, + "step": 409950 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014059868163543565, + "loss": 0.014, + "step": 409960 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014059479341906416, + "loss": 0.0108, + "step": 409970 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405909052026927, + "loss": 0.0108, + "step": 409980 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014058701698632125, + "loss": 0.0125, + "step": 409990 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405831287699498, + "loss": 0.0103, + "step": 410000 + }, + { + "epoch": 1.06, + "eval_cer": 0.8817068852339703, + "eval_loss": 0.007638953160494566, + "eval_runtime": 107.3836, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, + "step": 410000 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405792405535783, + "loss": 0.0136, + "step": 410010 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014057535233720684, + "loss": 0.0094, + "step": 410020 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014057146412083538, + "loss": 0.0103, + "step": 410030 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014056757590446393, + "loss": 0.0122, + "step": 410040 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014056368768809244, + "loss": 0.0133, + "step": 410050 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140559799471721, + "loss": 0.0119, + "step": 410060 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014055591125534952, + "loss": 0.009, + "step": 410070 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014055202303897807, + "loss": 0.009, + "step": 410080 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405481348226066, + "loss": 0.0118, + "step": 410090 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014054424660623515, + "loss": 0.0096, + "step": 410100 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014054035838986366, + "loss": 0.0156, + "step": 410110 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405364701734922, + "loss": 0.0137, + "step": 410120 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014053258195712075, + "loss": 0.0084, + "step": 410130 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014052869374074926, + "loss": 0.0121, + "step": 410140 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405248055243778, + "loss": 0.0163, + "step": 410150 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014052091730800634, + "loss": 0.0128, + "step": 410160 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014051702909163489, + "loss": 0.0118, + "step": 410170 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001405131408752634, + "loss": 0.009, + "step": 410180 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014050925265889194, + "loss": 0.0113, + "step": 410190 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014050536444252048, + "loss": 0.0081, + "step": 410200 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014050147622614903, + "loss": 0.0132, + "step": 410210 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014049758800977754, + "loss": 0.0145, + "step": 410220 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014049369979340608, + "loss": 0.0157, + "step": 410230 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014048981157703462, + "loss": 0.0096, + "step": 410240 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014048592336066317, + "loss": 0.0114, + "step": 410250 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404820351442917, + "loss": 0.0117, + "step": 410260 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014047814692792025, + "loss": 0.0152, + "step": 410270 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014047425871154876, + "loss": 0.013, + "step": 410280 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404703704951773, + "loss": 0.0112, + "step": 410290 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014046648227880585, + "loss": 0.0166, + "step": 410300 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404625940624344, + "loss": 0.0113, + "step": 410310 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404587058460629, + "loss": 0.0243, + "step": 410320 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014045481762969144, + "loss": 0.0102, + "step": 410330 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014045092941331999, + "loss": 0.0138, + "step": 410340 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014044704119694853, + "loss": 0.0104, + "step": 410350 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014044315298057704, + "loss": 0.0116, + "step": 410360 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014043926476420558, + "loss": 0.0093, + "step": 410370 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014043537654783413, + "loss": 0.0136, + "step": 410380 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014043148833146264, + "loss": 0.0104, + "step": 410390 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014042760011509118, + "loss": 0.0098, + "step": 410400 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014042371189871972, + "loss": 0.0099, + "step": 410410 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014041982368234826, + "loss": 0.0122, + "step": 410420 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014041593546597678, + "loss": 0.0111, + "step": 410430 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014041204724960535, + "loss": 0.014, + "step": 410440 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014040815903323386, + "loss": 0.0109, + "step": 410450 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001404042708168624, + "loss": 0.0094, + "step": 410460 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014040038260049095, + "loss": 0.0124, + "step": 410470 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403964943841195, + "loss": 0.0113, + "step": 410480 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140392606167748, + "loss": 0.0121, + "step": 410490 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014038871795137654, + "loss": 0.0104, + "step": 410500 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014038482973500509, + "loss": 0.0137, + "step": 410510 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014038094151863363, + "loss": 0.0101, + "step": 410520 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014037705330226214, + "loss": 0.0098, + "step": 410530 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014037316508589068, + "loss": 0.0115, + "step": 410540 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014036927686951922, + "loss": 0.0112, + "step": 410550 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014036538865314777, + "loss": 0.0101, + "step": 410560 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014036150043677628, + "loss": 0.013, + "step": 410570 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014035761222040482, + "loss": 0.0087, + "step": 410580 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014035372400403336, + "loss": 0.0102, + "step": 410590 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403498357876619, + "loss": 0.0081, + "step": 410600 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014034594757129045, + "loss": 0.0206, + "step": 410610 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014034205935491896, + "loss": 0.0113, + "step": 410620 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403381711385475, + "loss": 0.0105, + "step": 410630 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014033428292217605, + "loss": 0.0188, + "step": 410640 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403303947058046, + "loss": 0.012, + "step": 410650 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001403265064894331, + "loss": 0.0112, + "step": 410660 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014032261827306164, + "loss": 0.0112, + "step": 410670 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014031873005669018, + "loss": 0.0111, + "step": 410680 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014031484184031873, + "loss": 0.0138, + "step": 410690 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014031095362394724, + "loss": 0.0128, + "step": 410700 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014030706540757578, + "loss": 0.0132, + "step": 410710 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014030317719120432, + "loss": 0.013, + "step": 410720 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014029928897483287, + "loss": 0.0135, + "step": 410730 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014029540075846138, + "loss": 0.0117, + "step": 410740 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014029151254208992, + "loss": 0.0109, + "step": 410750 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014028762432571846, + "loss": 0.0088, + "step": 410760 + }, + { + "epoch": 1.06, + "learning_rate": 0.000140283736109347, + "loss": 0.0118, + "step": 410770 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014027984789297552, + "loss": 0.0111, + "step": 410780 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001402759596766041, + "loss": 0.0136, + "step": 410790 + }, + { + "epoch": 1.06, + "learning_rate": 0.0001402720714602326, + "loss": 0.0107, + "step": 410800 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014026818324386114, + "loss": 0.0112, + "step": 410810 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014026429502748969, + "loss": 0.0129, + "step": 410820 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014026040681111823, + "loss": 0.0153, + "step": 410830 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014025651859474674, + "loss": 0.015, + "step": 410840 + }, + { + "epoch": 1.06, + "learning_rate": 0.00014025263037837528, + "loss": 0.0126, + "step": 410850 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014024874216200383, + "loss": 0.0112, + "step": 410860 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014024485394563234, + "loss": 0.0092, + "step": 410870 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014024096572926088, + "loss": 0.0113, + "step": 410880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014023707751288942, + "loss": 0.0109, + "step": 410890 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014023318929651797, + "loss": 0.01, + "step": 410900 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014022930108014648, + "loss": 0.0141, + "step": 410910 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014022541286377502, + "loss": 0.0136, + "step": 410920 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014022152464740356, + "loss": 0.0113, + "step": 410930 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001402176364310321, + "loss": 0.0134, + "step": 410940 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014021374821466062, + "loss": 0.0116, + "step": 410950 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001402098599982892, + "loss": 0.0121, + "step": 410960 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001402059717819177, + "loss": 0.0107, + "step": 410970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014020208356554624, + "loss": 0.0095, + "step": 410980 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014019819534917479, + "loss": 0.0158, + "step": 410990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014019430713280333, + "loss": 0.0111, + "step": 411000 + }, + { + "epoch": 1.07, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.007736830040812492, + "eval_runtime": 107.3663, + "eval_samples_per_second": 18.628, + "eval_steps_per_second": 4.657, + "step": 411000 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014019041891643184, + "loss": 0.0112, + "step": 411010 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014018653070006038, + "loss": 0.0119, + "step": 411020 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014018264248368893, + "loss": 0.0118, + "step": 411030 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014017875426731747, + "loss": 0.0093, + "step": 411040 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014017486605094598, + "loss": 0.0111, + "step": 411050 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014017097783457452, + "loss": 0.0127, + "step": 411060 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014016708961820306, + "loss": 0.0084, + "step": 411070 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401632014018316, + "loss": 0.0106, + "step": 411080 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014015931318546012, + "loss": 0.0093, + "step": 411090 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014015542496908866, + "loss": 0.0106, + "step": 411100 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401515367527172, + "loss": 0.0092, + "step": 411110 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014014764853634572, + "loss": 0.0113, + "step": 411120 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401437603199743, + "loss": 0.011, + "step": 411130 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001401398721036028, + "loss": 0.0104, + "step": 411140 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014013598388723134, + "loss": 0.0101, + "step": 411150 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014013209567085989, + "loss": 0.0095, + "step": 411160 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014012820745448843, + "loss": 0.016, + "step": 411170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014012431923811694, + "loss": 0.0089, + "step": 411180 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014012043102174548, + "loss": 0.0101, + "step": 411190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014011654280537402, + "loss": 0.0084, + "step": 411200 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014011265458900257, + "loss": 0.0131, + "step": 411210 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014010876637263108, + "loss": 0.0102, + "step": 411220 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014010487815625962, + "loss": 0.0091, + "step": 411230 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014010098993988816, + "loss": 0.0115, + "step": 411240 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400971017235167, + "loss": 0.0111, + "step": 411250 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014009321350714522, + "loss": 0.0127, + "step": 411260 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014008932529077376, + "loss": 0.0118, + "step": 411270 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400854370744023, + "loss": 0.0102, + "step": 411280 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014008154885803085, + "loss": 0.0108, + "step": 411290 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014007766064165936, + "loss": 0.0106, + "step": 411300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014007377242528793, + "loss": 0.0131, + "step": 411310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014006988420891644, + "loss": 0.0131, + "step": 411320 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014006599599254498, + "loss": 0.013, + "step": 411330 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014006210777617353, + "loss": 0.0115, + "step": 411340 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014005821955980207, + "loss": 0.0148, + "step": 411350 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014005433134343058, + "loss": 0.0154, + "step": 411360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014005044312705912, + "loss": 0.0117, + "step": 411370 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014004655491068767, + "loss": 0.012, + "step": 411380 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014004266669431618, + "loss": 0.0105, + "step": 411390 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014003877847794472, + "loss": 0.0088, + "step": 411400 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014003489026157326, + "loss": 0.0088, + "step": 411410 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400310020452018, + "loss": 0.0089, + "step": 411420 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014002711382883032, + "loss": 0.0174, + "step": 411430 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014002322561245886, + "loss": 0.0115, + "step": 411440 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001400193373960874, + "loss": 0.0115, + "step": 411450 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014001544917971594, + "loss": 0.0122, + "step": 411460 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014001156096334446, + "loss": 0.0113, + "step": 411470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014000767274697303, + "loss": 0.0094, + "step": 411480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00014000378453060154, + "loss": 0.0121, + "step": 411490 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013999989631423008, + "loss": 0.0128, + "step": 411500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013999600809785863, + "loss": 0.0133, + "step": 411510 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013999211988148717, + "loss": 0.0092, + "step": 411520 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013998823166511568, + "loss": 0.0129, + "step": 411530 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013998434344874422, + "loss": 0.016, + "step": 411540 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013998045523237277, + "loss": 0.0128, + "step": 411550 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399765670160013, + "loss": 0.0161, + "step": 411560 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013997267879962982, + "loss": 0.01, + "step": 411570 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013996879058325836, + "loss": 0.0125, + "step": 411580 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399649023668869, + "loss": 0.0125, + "step": 411590 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013996101415051545, + "loss": 0.0089, + "step": 411600 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013995712593414396, + "loss": 0.0124, + "step": 411610 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399532377177725, + "loss": 0.0089, + "step": 411620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013994934950140104, + "loss": 0.0077, + "step": 411630 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013994546128502956, + "loss": 0.0096, + "step": 411640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013994157306865813, + "loss": 0.0095, + "step": 411650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013993768485228664, + "loss": 0.0123, + "step": 411660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013993379663591518, + "loss": 0.0094, + "step": 411670 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013992990841954373, + "loss": 0.012, + "step": 411680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013992602020317227, + "loss": 0.0104, + "step": 411690 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013992213198680078, + "loss": 0.015, + "step": 411700 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013991824377042932, + "loss": 0.014, + "step": 411710 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013991435555405786, + "loss": 0.011, + "step": 411720 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001399104673376864, + "loss": 0.011, + "step": 411730 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013990657912131492, + "loss": 0.0134, + "step": 411740 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013990269090494346, + "loss": 0.0129, + "step": 411750 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139898802688572, + "loss": 0.0087, + "step": 411760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013989491447220055, + "loss": 0.0129, + "step": 411770 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013989102625582906, + "loss": 0.014, + "step": 411780 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398871380394576, + "loss": 0.0112, + "step": 411790 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013988324982308614, + "loss": 0.0124, + "step": 411800 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013987936160671469, + "loss": 0.0131, + "step": 411810 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398754733903432, + "loss": 0.0108, + "step": 411820 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013987158517397177, + "loss": 0.0126, + "step": 411830 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013986769695760028, + "loss": 0.0108, + "step": 411840 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013986380874122882, + "loss": 0.0105, + "step": 411850 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013985992052485737, + "loss": 0.0136, + "step": 411860 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013985603230848588, + "loss": 0.0104, + "step": 411870 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013985214409211442, + "loss": 0.0107, + "step": 411880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013984825587574296, + "loss": 0.011, + "step": 411890 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398443676593715, + "loss": 0.0092, + "step": 411900 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013984047944300002, + "loss": 0.0105, + "step": 411910 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013983659122662856, + "loss": 0.0108, + "step": 411920 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398327030102571, + "loss": 0.0162, + "step": 411930 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013982881479388564, + "loss": 0.0086, + "step": 411940 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013982492657751416, + "loss": 0.0106, + "step": 411950 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398210383611427, + "loss": 0.0106, + "step": 411960 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013981715014477124, + "loss": 0.0137, + "step": 411970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013981326192839978, + "loss": 0.0126, + "step": 411980 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001398093737120283, + "loss": 0.0127, + "step": 411990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013980548549565687, + "loss": 0.0119, + "step": 412000 + }, + { + "epoch": 1.07, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.007703993935137987, + "eval_runtime": 107.4229, + "eval_samples_per_second": 18.618, + "eval_steps_per_second": 4.655, + "step": 412000 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013980159727928538, + "loss": 0.0126, + "step": 412010 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013979770906291392, + "loss": 0.0141, + "step": 412020 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013979382084654247, + "loss": 0.0113, + "step": 412030 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139789932630171, + "loss": 0.0115, + "step": 412040 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013978604441379952, + "loss": 0.0127, + "step": 412050 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013978215619742806, + "loss": 0.0121, + "step": 412060 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397782679810566, + "loss": 0.0098, + "step": 412070 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013977437976468515, + "loss": 0.0113, + "step": 412080 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013977049154831366, + "loss": 0.0091, + "step": 412090 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397666033319422, + "loss": 0.0111, + "step": 412100 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013976271511557074, + "loss": 0.0107, + "step": 412110 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013975882689919926, + "loss": 0.0108, + "step": 412120 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397549386828278, + "loss": 0.012, + "step": 412130 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013975105046645634, + "loss": 0.0107, + "step": 412140 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013974716225008488, + "loss": 0.0114, + "step": 412150 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397432740337134, + "loss": 0.0097, + "step": 412160 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013973938581734194, + "loss": 0.0086, + "step": 412170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013973549760097048, + "loss": 0.0117, + "step": 412180 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013973160938459902, + "loss": 0.0095, + "step": 412190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013972772116822756, + "loss": 0.0128, + "step": 412200 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397238329518561, + "loss": 0.0105, + "step": 412210 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013971994473548462, + "loss": 0.0105, + "step": 412220 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013971605651911316, + "loss": 0.013, + "step": 412230 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397121683027417, + "loss": 0.0152, + "step": 412240 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013970828008637025, + "loss": 0.0109, + "step": 412250 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013970439186999876, + "loss": 0.013, + "step": 412260 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001397005036536273, + "loss": 0.0081, + "step": 412270 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013969661543725584, + "loss": 0.0117, + "step": 412280 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013969272722088439, + "loss": 0.0221, + "step": 412290 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396888390045129, + "loss": 0.0123, + "step": 412300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013968495078814144, + "loss": 0.0094, + "step": 412310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013968106257176998, + "loss": 0.0139, + "step": 412320 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013967717435539852, + "loss": 0.0115, + "step": 412330 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013967328613902704, + "loss": 0.0139, + "step": 412340 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396693979226556, + "loss": 0.0098, + "step": 412350 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013966550970628412, + "loss": 0.011, + "step": 412360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013966162148991264, + "loss": 0.0091, + "step": 412370 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396577332735412, + "loss": 0.0116, + "step": 412380 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013965384505716972, + "loss": 0.0117, + "step": 412390 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013964995684079826, + "loss": 0.0135, + "step": 412400 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396460686244268, + "loss": 0.009, + "step": 412410 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013964218040805535, + "loss": 0.0105, + "step": 412420 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013963829219168386, + "loss": 0.0125, + "step": 412430 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396344039753124, + "loss": 0.0089, + "step": 412440 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013963051575894094, + "loss": 0.01, + "step": 412450 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013962662754256948, + "loss": 0.0109, + "step": 412460 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139622739326198, + "loss": 0.0104, + "step": 412470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013961885110982654, + "loss": 0.0119, + "step": 412480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013961496289345508, + "loss": 0.0161, + "step": 412490 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013961107467708362, + "loss": 0.0092, + "step": 412500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013960718646071214, + "loss": 0.0131, + "step": 412510 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001396032982443407, + "loss": 0.0108, + "step": 412520 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013959941002796922, + "loss": 0.0097, + "step": 412530 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013959552181159776, + "loss": 0.0123, + "step": 412540 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395916335952263, + "loss": 0.0092, + "step": 412550 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013958774537885485, + "loss": 0.0115, + "step": 412560 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013958385716248336, + "loss": 0.0113, + "step": 412570 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395799689461119, + "loss": 0.0135, + "step": 412580 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013957608072974044, + "loss": 0.0149, + "step": 412590 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139572192513369, + "loss": 0.0105, + "step": 412600 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395683042969975, + "loss": 0.0099, + "step": 412610 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013956441608062604, + "loss": 0.0106, + "step": 412620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013956052786425458, + "loss": 0.0099, + "step": 412630 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395566396478831, + "loss": 0.0097, + "step": 412640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013955275143151164, + "loss": 0.0115, + "step": 412650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013954886321514018, + "loss": 0.0112, + "step": 412660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013954497499876872, + "loss": 0.0081, + "step": 412670 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013954108678239724, + "loss": 0.009, + "step": 412680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013953719856602578, + "loss": 0.0126, + "step": 412690 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013953331034965432, + "loss": 0.0102, + "step": 412700 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013952942213328286, + "loss": 0.0099, + "step": 412710 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395255339169114, + "loss": 0.0104, + "step": 412720 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013952164570053995, + "loss": 0.0101, + "step": 412730 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013951775748416846, + "loss": 0.0135, + "step": 412740 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139513869267797, + "loss": 0.0141, + "step": 412750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013950998105142554, + "loss": 0.015, + "step": 412760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013950609283505409, + "loss": 0.0088, + "step": 412770 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001395022046186826, + "loss": 0.0109, + "step": 412780 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013949831640231114, + "loss": 0.0111, + "step": 412790 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013949442818593968, + "loss": 0.0135, + "step": 412800 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013949053996956823, + "loss": 0.0133, + "step": 412810 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013948665175319674, + "loss": 0.0086, + "step": 412820 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013948276353682528, + "loss": 0.0146, + "step": 412830 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013947887532045382, + "loss": 0.0098, + "step": 412840 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013947498710408234, + "loss": 0.0101, + "step": 412850 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013947109888771088, + "loss": 0.0105, + "step": 412860 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013946721067133942, + "loss": 0.0125, + "step": 412870 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013946332245496796, + "loss": 0.0103, + "step": 412880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013945943423859648, + "loss": 0.0142, + "step": 412890 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013945554602222505, + "loss": 0.01, + "step": 412900 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013945165780585356, + "loss": 0.0087, + "step": 412910 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001394477695894821, + "loss": 0.0104, + "step": 412920 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013944388137311064, + "loss": 0.0099, + "step": 412930 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013943999315673919, + "loss": 0.0172, + "step": 412940 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001394361049403677, + "loss": 0.0106, + "step": 412950 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013943221672399624, + "loss": 0.0143, + "step": 412960 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013942832850762478, + "loss": 0.0094, + "step": 412970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013942444029125332, + "loss": 0.0125, + "step": 412980 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013942055207488184, + "loss": 0.0136, + "step": 412990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013941666385851038, + "loss": 0.0098, + "step": 413000 + }, + { + "epoch": 1.07, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.007829415611922741, + "eval_runtime": 107.3445, + "eval_samples_per_second": 18.632, + "eval_steps_per_second": 4.658, + "step": 413000 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013941277564213892, + "loss": 0.0109, + "step": 413010 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013940888742576746, + "loss": 0.0114, + "step": 413020 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013940499920939598, + "loss": 0.0108, + "step": 413030 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013940111099302455, + "loss": 0.0212, + "step": 413040 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013939722277665306, + "loss": 0.013, + "step": 413050 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393933345602816, + "loss": 0.012, + "step": 413060 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013938944634391015, + "loss": 0.0123, + "step": 413070 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393855581275387, + "loss": 0.0132, + "step": 413080 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393816699111672, + "loss": 0.0112, + "step": 413090 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013937778169479574, + "loss": 0.0124, + "step": 413100 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013937389347842428, + "loss": 0.0118, + "step": 413110 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393700052620528, + "loss": 0.0135, + "step": 413120 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013936611704568134, + "loss": 0.0162, + "step": 413130 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013936222882930988, + "loss": 0.0097, + "step": 413140 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013935834061293842, + "loss": 0.0102, + "step": 413150 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013935445239656694, + "loss": 0.0098, + "step": 413160 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013935056418019548, + "loss": 0.0163, + "step": 413170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013934667596382402, + "loss": 0.0092, + "step": 413180 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013934278774745256, + "loss": 0.013, + "step": 413190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013933889953108108, + "loss": 0.0103, + "step": 413200 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013933501131470962, + "loss": 0.0106, + "step": 413210 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013933112309833816, + "loss": 0.0115, + "step": 413220 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393272348819667, + "loss": 0.012, + "step": 413230 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013932334666559524, + "loss": 0.0113, + "step": 413240 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013931945844922379, + "loss": 0.0129, + "step": 413250 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001393155702328523, + "loss": 0.0097, + "step": 413260 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013931168201648084, + "loss": 0.0109, + "step": 413270 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013930779380010938, + "loss": 0.0085, + "step": 413280 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013930390558373793, + "loss": 0.0124, + "step": 413290 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013930001736736644, + "loss": 0.0123, + "step": 413300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013929612915099498, + "loss": 0.0104, + "step": 413310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013929224093462352, + "loss": 0.013, + "step": 413320 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013928835271825207, + "loss": 0.0119, + "step": 413330 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013928446450188058, + "loss": 0.0135, + "step": 413340 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013928057628550912, + "loss": 0.01, + "step": 413350 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013927668806913766, + "loss": 0.0133, + "step": 413360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013927279985276618, + "loss": 0.0145, + "step": 413370 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013926891163639472, + "loss": 0.0123, + "step": 413380 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013926502342002326, + "loss": 0.0132, + "step": 413390 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392611352036518, + "loss": 0.0092, + "step": 413400 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013925724698728032, + "loss": 0.0169, + "step": 413410 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013925335877090889, + "loss": 0.0126, + "step": 413420 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392494705545374, + "loss": 0.0145, + "step": 413430 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013924558233816594, + "loss": 0.0113, + "step": 413440 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013924169412179448, + "loss": 0.0128, + "step": 413450 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013923780590542303, + "loss": 0.0107, + "step": 413460 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013923391768905154, + "loss": 0.0127, + "step": 413470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013923002947268008, + "loss": 0.0106, + "step": 413480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013922614125630862, + "loss": 0.0099, + "step": 413490 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013922225303993716, + "loss": 0.0129, + "step": 413500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013921836482356568, + "loss": 0.0082, + "step": 413510 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013921447660719422, + "loss": 0.01, + "step": 413520 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013921058839082276, + "loss": 0.0118, + "step": 413530 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001392067001744513, + "loss": 0.0098, + "step": 413540 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013920281195807982, + "loss": 0.0093, + "step": 413550 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013919892374170836, + "loss": 0.0091, + "step": 413560 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391950355253369, + "loss": 0.0103, + "step": 413570 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013919114730896544, + "loss": 0.0102, + "step": 413580 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013918725909259399, + "loss": 0.0104, + "step": 413590 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391833708762225, + "loss": 0.0096, + "step": 413600 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013917948265985104, + "loss": 0.0135, + "step": 413610 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013917559444347958, + "loss": 0.0122, + "step": 413620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013917170622710812, + "loss": 0.0121, + "step": 413630 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013916781801073664, + "loss": 0.0111, + "step": 413640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013916392979436518, + "loss": 0.013, + "step": 413650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013916004157799372, + "loss": 0.0157, + "step": 413660 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013915615336162226, + "loss": 0.0099, + "step": 413670 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013915226514525078, + "loss": 0.0085, + "step": 413680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013914837692887932, + "loss": 0.0143, + "step": 413690 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013914448871250786, + "loss": 0.0139, + "step": 413700 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001391406004961364, + "loss": 0.0122, + "step": 413710 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013913671227976492, + "loss": 0.0116, + "step": 413720 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013913282406339346, + "loss": 0.0135, + "step": 413730 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139128935847022, + "loss": 0.0128, + "step": 413740 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013912504763065054, + "loss": 0.0104, + "step": 413750 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013912115941427906, + "loss": 0.0093, + "step": 413760 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013911727119790763, + "loss": 0.0094, + "step": 413770 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013911338298153614, + "loss": 0.0093, + "step": 413780 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013910949476516468, + "loss": 0.0109, + "step": 413790 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013910560654879322, + "loss": 0.0096, + "step": 413800 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013910171833242177, + "loss": 0.0092, + "step": 413810 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013909783011605028, + "loss": 0.013, + "step": 413820 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013909394189967882, + "loss": 0.0144, + "step": 413830 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013909005368330736, + "loss": 0.0109, + "step": 413840 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013908616546693588, + "loss": 0.0114, + "step": 413850 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013908227725056442, + "loss": 0.0111, + "step": 413860 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013907838903419296, + "loss": 0.0099, + "step": 413870 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390745008178215, + "loss": 0.0139, + "step": 413880 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013907061260145002, + "loss": 0.0107, + "step": 413890 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013906672438507856, + "loss": 0.0112, + "step": 413900 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390628361687071, + "loss": 0.0107, + "step": 413910 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013905894795233564, + "loss": 0.011, + "step": 413920 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013905505973596416, + "loss": 0.0111, + "step": 413930 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013905117151959273, + "loss": 0.0132, + "step": 413940 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013904728330322124, + "loss": 0.0143, + "step": 413950 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013904339508684978, + "loss": 0.0126, + "step": 413960 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013903950687047832, + "loss": 0.0098, + "step": 413970 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013903561865410687, + "loss": 0.0108, + "step": 413980 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013903173043773538, + "loss": 0.0113, + "step": 413990 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013902784222136392, + "loss": 0.0139, + "step": 414000 + }, + { + "epoch": 1.07, + "eval_cer": 0.881704085960102, + "eval_loss": 0.007683408912271261, + "eval_runtime": 107.5812, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, + "step": 414000 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013902395400499246, + "loss": 0.0113, + "step": 414010 + }, + { + "epoch": 1.07, + "learning_rate": 0.000139020065788621, + "loss": 0.0096, + "step": 414020 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013901617757224952, + "loss": 0.0124, + "step": 414030 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013901228935587806, + "loss": 0.0115, + "step": 414040 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001390084011395066, + "loss": 0.0086, + "step": 414050 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013900451292313514, + "loss": 0.0141, + "step": 414060 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013900062470676366, + "loss": 0.0089, + "step": 414070 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389967364903922, + "loss": 0.0117, + "step": 414080 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013899284827402074, + "loss": 0.0108, + "step": 414090 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013898896005764926, + "loss": 0.011, + "step": 414100 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013898507184127783, + "loss": 0.0145, + "step": 414110 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013898118362490634, + "loss": 0.0109, + "step": 414120 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013897729540853488, + "loss": 0.009, + "step": 414130 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013897340719216342, + "loss": 0.0092, + "step": 414140 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013896951897579196, + "loss": 0.0115, + "step": 414150 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013896563075942048, + "loss": 0.0125, + "step": 414160 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013896174254304902, + "loss": 0.0125, + "step": 414170 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013895785432667756, + "loss": 0.0109, + "step": 414180 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389539661103061, + "loss": 0.01, + "step": 414190 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013895007789393462, + "loss": 0.0122, + "step": 414200 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013894618967756316, + "loss": 0.0097, + "step": 414210 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389423014611917, + "loss": 0.0095, + "step": 414220 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013893841324482024, + "loss": 0.0123, + "step": 414230 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013893452502844876, + "loss": 0.0103, + "step": 414240 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389306368120773, + "loss": 0.0103, + "step": 414250 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013892674859570584, + "loss": 0.0132, + "step": 414260 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013892286037933438, + "loss": 0.0119, + "step": 414270 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001389189721629629, + "loss": 0.0133, + "step": 414280 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013891508394659147, + "loss": 0.0142, + "step": 414290 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013891119573021998, + "loss": 0.0105, + "step": 414300 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013890730751384852, + "loss": 0.0107, + "step": 414310 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013890341929747706, + "loss": 0.0129, + "step": 414320 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388995310811056, + "loss": 0.0092, + "step": 414330 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013889564286473412, + "loss": 0.0116, + "step": 414340 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013889175464836266, + "loss": 0.0176, + "step": 414350 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388878664319912, + "loss": 0.0113, + "step": 414360 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013888397821561972, + "loss": 0.0129, + "step": 414370 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013888008999924826, + "loss": 0.017, + "step": 414380 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388762017828768, + "loss": 0.012, + "step": 414390 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013887231356650534, + "loss": 0.0097, + "step": 414400 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013886842535013386, + "loss": 0.0083, + "step": 414410 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388645371337624, + "loss": 0.0107, + "step": 414420 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013886064891739094, + "loss": 0.011, + "step": 414430 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013885676070101948, + "loss": 0.0085, + "step": 414440 + }, + { + "epoch": 1.07, + "learning_rate": 0.000138852872484648, + "loss": 0.0128, + "step": 414450 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013884898426827657, + "loss": 0.0096, + "step": 414460 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013884509605190508, + "loss": 0.0141, + "step": 414470 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013884120783553362, + "loss": 0.0181, + "step": 414480 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013883731961916216, + "loss": 0.011, + "step": 414490 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388334314027907, + "loss": 0.0136, + "step": 414500 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013882954318641922, + "loss": 0.0113, + "step": 414510 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013882565497004776, + "loss": 0.0159, + "step": 414520 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388217667536763, + "loss": 0.0087, + "step": 414530 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013881787853730484, + "loss": 0.0115, + "step": 414540 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013881399032093336, + "loss": 0.0102, + "step": 414550 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001388101021045619, + "loss": 0.0118, + "step": 414560 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013880621388819044, + "loss": 0.0128, + "step": 414570 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013880232567181898, + "loss": 0.0098, + "step": 414580 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387984374554475, + "loss": 0.0118, + "step": 414590 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013879454923907604, + "loss": 0.0094, + "step": 414600 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013879066102270458, + "loss": 0.0122, + "step": 414610 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387867728063331, + "loss": 0.009, + "step": 414620 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013878288458996167, + "loss": 0.0117, + "step": 414630 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013877899637359018, + "loss": 0.0162, + "step": 414640 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013877510815721872, + "loss": 0.0104, + "step": 414650 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013877121994084726, + "loss": 0.0127, + "step": 414660 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387673317244758, + "loss": 0.0101, + "step": 414670 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013876344350810432, + "loss": 0.0138, + "step": 414680 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013875955529173286, + "loss": 0.0171, + "step": 414690 + }, + { + "epoch": 1.07, + "learning_rate": 0.0001387556670753614, + "loss": 0.0101, + "step": 414700 + }, + { + "epoch": 1.07, + "learning_rate": 0.00013875177885898994, + "loss": 0.011, + "step": 414710 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013874789064261846, + "loss": 0.0127, + "step": 414720 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138744002426247, + "loss": 0.0124, + "step": 414730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013874011420987554, + "loss": 0.01, + "step": 414740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013873622599350408, + "loss": 0.0147, + "step": 414750 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001387323377771326, + "loss": 0.0106, + "step": 414760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013872844956076114, + "loss": 0.01, + "step": 414770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013872456134438968, + "loss": 0.0108, + "step": 414780 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013872067312801822, + "loss": 0.0119, + "step": 414790 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013871678491164674, + "loss": 0.0118, + "step": 414800 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001387128966952753, + "loss": 0.0108, + "step": 414810 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013870900847890382, + "loss": 0.0102, + "step": 414820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013870512026253236, + "loss": 0.0078, + "step": 414830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001387012320461609, + "loss": 0.0094, + "step": 414840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013869734382978942, + "loss": 0.0106, + "step": 414850 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013869345561341796, + "loss": 0.0125, + "step": 414860 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386895673970465, + "loss": 0.0107, + "step": 414870 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013868567918067504, + "loss": 0.0102, + "step": 414880 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013868179096430356, + "loss": 0.0111, + "step": 414890 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386779027479321, + "loss": 0.0109, + "step": 414900 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013867401453156064, + "loss": 0.0123, + "step": 414910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013867012631518918, + "loss": 0.0114, + "step": 414920 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386662380988177, + "loss": 0.0103, + "step": 414930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013866234988244624, + "loss": 0.009, + "step": 414940 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013865846166607478, + "loss": 0.014, + "step": 414950 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013865457344970332, + "loss": 0.0104, + "step": 414960 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013865068523333184, + "loss": 0.0108, + "step": 414970 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386467970169604, + "loss": 0.0118, + "step": 414980 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013864290880058892, + "loss": 0.0142, + "step": 414990 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013863902058421746, + "loss": 0.0093, + "step": 415000 + }, + { + "epoch": 1.08, + "eval_cer": 0.881727879787983, + "eval_loss": 0.0076110344380140305, + "eval_runtime": 107.5209, + "eval_samples_per_second": 18.601, + "eval_steps_per_second": 4.65, + "step": 415000 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138635132367846, + "loss": 0.0094, + "step": 415010 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013863124415147454, + "loss": 0.0102, + "step": 415020 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013862735593510306, + "loss": 0.0091, + "step": 415030 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386234677187316, + "loss": 0.0133, + "step": 415040 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013861957950236014, + "loss": 0.0136, + "step": 415050 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013861569128598868, + "loss": 0.0098, + "step": 415060 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386118030696172, + "loss": 0.0167, + "step": 415070 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013860791485324574, + "loss": 0.0138, + "step": 415080 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013860402663687428, + "loss": 0.011, + "step": 415090 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001386001384205028, + "loss": 0.0099, + "step": 415100 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013859625020413134, + "loss": 0.0093, + "step": 415110 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013859236198775988, + "loss": 0.0076, + "step": 415120 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013858847377138842, + "loss": 0.0085, + "step": 415130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013858458555501694, + "loss": 0.0129, + "step": 415140 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013858069733864548, + "loss": 0.0121, + "step": 415150 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013857680912227402, + "loss": 0.0108, + "step": 415160 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013857292090590256, + "loss": 0.0104, + "step": 415170 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385690326895311, + "loss": 0.0142, + "step": 415180 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013856514447315964, + "loss": 0.0109, + "step": 415190 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013856125625678816, + "loss": 0.0106, + "step": 415200 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385573680404167, + "loss": 0.0147, + "step": 415210 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013855347982404524, + "loss": 0.0149, + "step": 415220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013854959160767378, + "loss": 0.0111, + "step": 415230 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001385457033913023, + "loss": 0.0104, + "step": 415240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013854181517493084, + "loss": 0.0117, + "step": 415250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013853792695855938, + "loss": 0.013, + "step": 415260 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013853403874218792, + "loss": 0.0128, + "step": 415270 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013853015052581644, + "loss": 0.009, + "step": 415280 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013852626230944498, + "loss": 0.0121, + "step": 415290 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013852237409307352, + "loss": 0.013, + "step": 415300 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013851848587670206, + "loss": 0.0073, + "step": 415310 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013851459766033058, + "loss": 0.0116, + "step": 415320 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013851070944395915, + "loss": 0.0112, + "step": 415330 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013850682122758766, + "loss": 0.0134, + "step": 415340 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013850293301121618, + "loss": 0.0121, + "step": 415350 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013849904479484474, + "loss": 0.0122, + "step": 415360 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013849515657847326, + "loss": 0.0138, + "step": 415370 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384912683621018, + "loss": 0.0135, + "step": 415380 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013848738014573034, + "loss": 0.01, + "step": 415390 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013848349192935888, + "loss": 0.0125, + "step": 415400 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384796037129874, + "loss": 0.0116, + "step": 415410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013847571549661594, + "loss": 0.0097, + "step": 415420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013847182728024448, + "loss": 0.01, + "step": 415430 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013846793906387302, + "loss": 0.0099, + "step": 415440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013846405084750154, + "loss": 0.0098, + "step": 415450 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013846016263113008, + "loss": 0.0107, + "step": 415460 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013845627441475862, + "loss": 0.0105, + "step": 415470 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013845238619838716, + "loss": 0.0109, + "step": 415480 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013844849798201568, + "loss": 0.0112, + "step": 415490 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013844460976564425, + "loss": 0.0114, + "step": 415500 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013844072154927276, + "loss": 0.0106, + "step": 415510 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384368333329013, + "loss": 0.011, + "step": 415520 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013843294511652984, + "loss": 0.0131, + "step": 415530 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013842905690015838, + "loss": 0.0193, + "step": 415540 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384251686837869, + "loss": 0.0167, + "step": 415550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013842128046741544, + "loss": 0.0155, + "step": 415560 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013841739225104398, + "loss": 0.0115, + "step": 415570 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001384135040346725, + "loss": 0.0099, + "step": 415580 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013840961581830104, + "loss": 0.0126, + "step": 415590 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013840572760192958, + "loss": 0.0106, + "step": 415600 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013840183938555812, + "loss": 0.0115, + "step": 415610 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013839795116918664, + "loss": 0.0133, + "step": 415620 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013839406295281518, + "loss": 0.0131, + "step": 415630 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013839017473644372, + "loss": 0.0133, + "step": 415640 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013838628652007226, + "loss": 0.0109, + "step": 415650 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013838239830370078, + "loss": 0.0121, + "step": 415660 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013837851008732932, + "loss": 0.0133, + "step": 415670 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013837462187095786, + "loss": 0.0105, + "step": 415680 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001383707336545864, + "loss": 0.0093, + "step": 415690 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013836684543821494, + "loss": 0.0128, + "step": 415700 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013836295722184348, + "loss": 0.0114, + "step": 415710 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138359069005472, + "loss": 0.0102, + "step": 415720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013835518078910054, + "loss": 0.0108, + "step": 415730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013835129257272908, + "loss": 0.0155, + "step": 415740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013834740435635762, + "loss": 0.012, + "step": 415750 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013834351613998614, + "loss": 0.0096, + "step": 415760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013833962792361468, + "loss": 0.0077, + "step": 415770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013833573970724322, + "loss": 0.015, + "step": 415780 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013833185149087176, + "loss": 0.0105, + "step": 415790 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013832796327450028, + "loss": 0.0073, + "step": 415800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013832407505812882, + "loss": 0.0136, + "step": 415810 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013832018684175736, + "loss": 0.014, + "step": 415820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013831629862538588, + "loss": 0.0124, + "step": 415830 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013831241040901442, + "loss": 0.013, + "step": 415840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013830852219264296, + "loss": 0.0126, + "step": 415850 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001383046339762715, + "loss": 0.0125, + "step": 415860 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013830074575990001, + "loss": 0.014, + "step": 415870 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013829685754352858, + "loss": 0.0122, + "step": 415880 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382929693271571, + "loss": 0.0096, + "step": 415890 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013828908111078564, + "loss": 0.0118, + "step": 415900 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013828519289441418, + "loss": 0.0103, + "step": 415910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013828130467804272, + "loss": 0.0101, + "step": 415920 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013827741646167124, + "loss": 0.0127, + "step": 415930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013827352824529978, + "loss": 0.013, + "step": 415940 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013826964002892832, + "loss": 0.0124, + "step": 415950 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013826575181255686, + "loss": 0.0125, + "step": 415960 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013826186359618538, + "loss": 0.0107, + "step": 415970 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013825797537981392, + "loss": 0.0104, + "step": 415980 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013825408716344246, + "loss": 0.012, + "step": 415990 + }, + { + "epoch": 1.08, + "learning_rate": 0.000138250198947071, + "loss": 0.0121, + "step": 416000 + }, + { + "epoch": 1.08, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.007917557843029499, + "eval_runtime": 107.4603, + "eval_samples_per_second": 18.612, + "eval_steps_per_second": 4.653, + "step": 416000 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013824631073069952, + "loss": 0.0113, + "step": 416010 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013824242251432806, + "loss": 0.0124, + "step": 416020 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001382385342979566, + "loss": 0.0116, + "step": 416030 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013823464608158514, + "loss": 0.0114, + "step": 416040 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013823075786521368, + "loss": 0.0082, + "step": 416050 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013822686964884222, + "loss": 0.0111, + "step": 416060 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013822298143247074, + "loss": 0.0157, + "step": 416070 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013821909321609928, + "loss": 0.0159, + "step": 416080 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013821520499972782, + "loss": 0.012, + "step": 416090 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013821131678335634, + "loss": 0.0164, + "step": 416100 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013820742856698488, + "loss": 0.01, + "step": 416110 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013820354035061342, + "loss": 0.0113, + "step": 416120 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013819965213424196, + "loss": 0.0102, + "step": 416130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013819576391787048, + "loss": 0.0105, + "step": 416140 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013819187570149902, + "loss": 0.0106, + "step": 416150 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013818798748512756, + "loss": 0.0103, + "step": 416160 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381840992687561, + "loss": 0.0087, + "step": 416170 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013818021105238462, + "loss": 0.0135, + "step": 416180 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013817632283601316, + "loss": 0.0125, + "step": 416190 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381724346196417, + "loss": 0.0094, + "step": 416200 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013816854640327024, + "loss": 0.0132, + "step": 416210 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013816465818689876, + "loss": 0.0126, + "step": 416220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013816076997052732, + "loss": 0.0114, + "step": 416230 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013815688175415584, + "loss": 0.0118, + "step": 416240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013815299353778438, + "loss": 0.0086, + "step": 416250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013814910532141292, + "loss": 0.011, + "step": 416260 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013814521710504146, + "loss": 0.0107, + "step": 416270 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013814132888866998, + "loss": 0.0087, + "step": 416280 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013813744067229852, + "loss": 0.0118, + "step": 416290 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013813355245592706, + "loss": 0.0108, + "step": 416300 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381296642395556, + "loss": 0.0087, + "step": 416310 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013812577602318412, + "loss": 0.0134, + "step": 416320 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013812188780681266, + "loss": 0.0106, + "step": 416330 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381179995904412, + "loss": 0.0123, + "step": 416340 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013811411137406972, + "loss": 0.0122, + "step": 416350 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013811022315769826, + "loss": 0.0137, + "step": 416360 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001381063349413268, + "loss": 0.0127, + "step": 416370 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013810244672495534, + "loss": 0.0105, + "step": 416380 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013809855850858385, + "loss": 0.0132, + "step": 416390 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013809467029221242, + "loss": 0.0132, + "step": 416400 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013809078207584094, + "loss": 0.0131, + "step": 416410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013808689385946948, + "loss": 0.0093, + "step": 416420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013808300564309802, + "loss": 0.0096, + "step": 416430 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013807911742672656, + "loss": 0.012, + "step": 416440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013807522921035508, + "loss": 0.01, + "step": 416450 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013807134099398362, + "loss": 0.0105, + "step": 416460 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013806745277761216, + "loss": 0.0114, + "step": 416470 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001380635645612407, + "loss": 0.0098, + "step": 416480 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013805967634486922, + "loss": 0.0128, + "step": 416490 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013805578812849776, + "loss": 0.0094, + "step": 416500 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001380518999121263, + "loss": 0.0118, + "step": 416510 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013804801169575484, + "loss": 0.0118, + "step": 416520 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013804412347938336, + "loss": 0.0109, + "step": 416530 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001380402352630119, + "loss": 0.0082, + "step": 416540 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013803634704664044, + "loss": 0.0131, + "step": 416550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013803245883026898, + "loss": 0.0107, + "step": 416560 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013802857061389752, + "loss": 0.0123, + "step": 416570 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013802468239752604, + "loss": 0.0125, + "step": 416580 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013802079418115458, + "loss": 0.0119, + "step": 416590 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013801690596478312, + "loss": 0.0138, + "step": 416600 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013801301774841166, + "loss": 0.011, + "step": 416610 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013800912953204018, + "loss": 0.0119, + "step": 416620 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013800524131566872, + "loss": 0.0133, + "step": 416630 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013800135309929726, + "loss": 0.011, + "step": 416640 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379974648829258, + "loss": 0.0097, + "step": 416650 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013799357666655432, + "loss": 0.0117, + "step": 416660 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013798968845018286, + "loss": 0.0125, + "step": 416670 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379858002338114, + "loss": 0.0107, + "step": 416680 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013798191201743994, + "loss": 0.0138, + "step": 416690 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013797802380106846, + "loss": 0.0105, + "step": 416700 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137974135584697, + "loss": 0.0081, + "step": 416710 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013797024736832554, + "loss": 0.0084, + "step": 416720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013796635915195408, + "loss": 0.0151, + "step": 416730 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379624709355826, + "loss": 0.0109, + "step": 416740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013795858271921116, + "loss": 0.0111, + "step": 416750 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013795469450283968, + "loss": 0.0118, + "step": 416760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013795080628646822, + "loss": 0.0107, + "step": 416770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013794691807009676, + "loss": 0.0101, + "step": 416780 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379430298537253, + "loss": 0.0115, + "step": 416790 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013793914163735382, + "loss": 0.0111, + "step": 416800 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013793525342098236, + "loss": 0.0085, + "step": 416810 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379313652046109, + "loss": 0.0093, + "step": 416820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013792747698823942, + "loss": 0.012, + "step": 416830 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013792358877186796, + "loss": 0.0101, + "step": 416840 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379197005554965, + "loss": 0.0101, + "step": 416850 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013791581233912504, + "loss": 0.0115, + "step": 416860 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013791192412275356, + "loss": 0.0096, + "step": 416870 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001379080359063821, + "loss": 0.0119, + "step": 416880 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013790414769001064, + "loss": 0.0117, + "step": 416890 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013790025947363918, + "loss": 0.0133, + "step": 416900 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378963712572677, + "loss": 0.0114, + "step": 416910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013789248304089626, + "loss": 0.0099, + "step": 416920 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013788859482452478, + "loss": 0.0133, + "step": 416930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013788470660815332, + "loss": 0.0095, + "step": 416940 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013788081839178186, + "loss": 0.0124, + "step": 416950 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378769301754104, + "loss": 0.0125, + "step": 416960 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013787304195903892, + "loss": 0.012, + "step": 416970 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013786915374266746, + "loss": 0.0104, + "step": 416980 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137865265526296, + "loss": 0.0096, + "step": 416990 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013786137730992454, + "loss": 0.014, + "step": 417000 + }, + { + "epoch": 1.08, + "eval_cer": 0.8817166826925096, + "eval_loss": 0.007632073480635881, + "eval_runtime": 107.6798, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, + "step": 417000 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013785748909355306, + "loss": 0.0112, + "step": 417010 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378536008771816, + "loss": 0.0123, + "step": 417020 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013784971266081014, + "loss": 0.0114, + "step": 417030 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013784582444443868, + "loss": 0.0165, + "step": 417040 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378419362280672, + "loss": 0.0085, + "step": 417050 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013783804801169574, + "loss": 0.01, + "step": 417060 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013783415979532428, + "loss": 0.0106, + "step": 417070 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378302715789528, + "loss": 0.0113, + "step": 417080 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013782638336258136, + "loss": 0.0136, + "step": 417090 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013782249514620988, + "loss": 0.009, + "step": 417100 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013781860692983842, + "loss": 0.012, + "step": 417110 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013781471871346696, + "loss": 0.0126, + "step": 417120 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001378108304970955, + "loss": 0.0127, + "step": 417130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013780694228072402, + "loss": 0.0091, + "step": 417140 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013780305406435256, + "loss": 0.0106, + "step": 417150 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377991658479811, + "loss": 0.0101, + "step": 417160 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013779527763160964, + "loss": 0.0105, + "step": 417170 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013779138941523816, + "loss": 0.0117, + "step": 417180 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377875011988667, + "loss": 0.0099, + "step": 417190 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013778361298249524, + "loss": 0.0113, + "step": 417200 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013777972476612378, + "loss": 0.0102, + "step": 417210 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377758365497523, + "loss": 0.0112, + "step": 417220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013777194833338084, + "loss": 0.011, + "step": 417230 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013776806011700938, + "loss": 0.0112, + "step": 417240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013776417190063792, + "loss": 0.0118, + "step": 417250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013776028368426644, + "loss": 0.0083, + "step": 417260 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137756395467895, + "loss": 0.0105, + "step": 417270 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013775250725152352, + "loss": 0.0124, + "step": 417280 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013774861903515206, + "loss": 0.0113, + "step": 417290 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377447308187806, + "loss": 0.0125, + "step": 417300 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013774084260240914, + "loss": 0.0103, + "step": 417310 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013773695438603766, + "loss": 0.0111, + "step": 417320 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377330661696662, + "loss": 0.012, + "step": 417330 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013772917795329474, + "loss": 0.0115, + "step": 417340 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013772528973692326, + "loss": 0.0099, + "step": 417350 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377214015205518, + "loss": 0.0122, + "step": 417360 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013771751330418034, + "loss": 0.0138, + "step": 417370 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013771362508780888, + "loss": 0.0103, + "step": 417380 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001377097368714374, + "loss": 0.0098, + "step": 417390 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013770584865506594, + "loss": 0.0112, + "step": 417400 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013770196043869448, + "loss": 0.0122, + "step": 417410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013769807222232302, + "loss": 0.011, + "step": 417420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013769418400595153, + "loss": 0.0091, + "step": 417430 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376902957895801, + "loss": 0.0136, + "step": 417440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013768640757320862, + "loss": 0.0104, + "step": 417450 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013768251935683716, + "loss": 0.0174, + "step": 417460 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376786311404657, + "loss": 0.0119, + "step": 417470 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013767474292409424, + "loss": 0.0112, + "step": 417480 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013767085470772276, + "loss": 0.0085, + "step": 417490 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376669664913513, + "loss": 0.0125, + "step": 417500 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013766307827497984, + "loss": 0.0083, + "step": 417510 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013765919005860838, + "loss": 0.0131, + "step": 417520 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376553018422369, + "loss": 0.0104, + "step": 417530 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013765141362586544, + "loss": 0.0129, + "step": 417540 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013764752540949398, + "loss": 0.0137, + "step": 417550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013764363719312252, + "loss": 0.0127, + "step": 417560 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013763974897675104, + "loss": 0.0168, + "step": 417570 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013763586076037958, + "loss": 0.0111, + "step": 417580 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013763197254400812, + "loss": 0.0102, + "step": 417590 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013762808432763663, + "loss": 0.0119, + "step": 417600 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013762419611126518, + "loss": 0.012, + "step": 417610 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013762030789489372, + "loss": 0.0102, + "step": 417620 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013761641967852226, + "loss": 0.0118, + "step": 417630 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376125314621508, + "loss": 0.0122, + "step": 417640 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013760864324577934, + "loss": 0.0111, + "step": 417650 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013760475502940786, + "loss": 0.0082, + "step": 417660 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001376008668130364, + "loss": 0.0114, + "step": 417670 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013759697859666494, + "loss": 0.0082, + "step": 417680 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013759309038029348, + "loss": 0.0144, + "step": 417690 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137589202163922, + "loss": 0.012, + "step": 417700 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013758531394755054, + "loss": 0.022, + "step": 417710 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013758142573117908, + "loss": 0.0142, + "step": 417720 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013757753751480762, + "loss": 0.0105, + "step": 417730 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013757364929843614, + "loss": 0.0122, + "step": 417740 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013756976108206468, + "loss": 0.0131, + "step": 417750 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013756587286569322, + "loss": 0.0122, + "step": 417760 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013756198464932176, + "loss": 0.0097, + "step": 417770 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013755809643295028, + "loss": 0.0123, + "step": 417780 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013755420821657884, + "loss": 0.0136, + "step": 417790 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013755032000020736, + "loss": 0.0113, + "step": 417800 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001375464317838359, + "loss": 0.0126, + "step": 417810 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013754254356746444, + "loss": 0.0112, + "step": 417820 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013753865535109296, + "loss": 0.0132, + "step": 417830 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001375347671347215, + "loss": 0.0092, + "step": 417840 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013753087891835004, + "loss": 0.011, + "step": 417850 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013752699070197858, + "loss": 0.0095, + "step": 417860 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001375231024856071, + "loss": 0.0114, + "step": 417870 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013751921426923564, + "loss": 0.0104, + "step": 417880 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013751532605286418, + "loss": 0.0113, + "step": 417890 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013751143783649272, + "loss": 0.0147, + "step": 417900 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013750754962012124, + "loss": 0.0111, + "step": 417910 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013750366140374978, + "loss": 0.0127, + "step": 417920 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013749977318737832, + "loss": 0.0083, + "step": 417930 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013749588497100686, + "loss": 0.0104, + "step": 417940 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013749199675463537, + "loss": 0.0103, + "step": 417950 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013748810853826394, + "loss": 0.0108, + "step": 417960 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013748422032189246, + "loss": 0.0093, + "step": 417970 + }, + { + "epoch": 1.08, + "learning_rate": 0.000137480332105521, + "loss": 0.0108, + "step": 417980 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013747644388914954, + "loss": 0.0118, + "step": 417990 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013747255567277808, + "loss": 0.0118, + "step": 418000 + }, + { + "epoch": 1.08, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.007763538043946028, + "eval_runtime": 107.433, + "eval_samples_per_second": 18.616, + "eval_steps_per_second": 4.654, + "step": 418000 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374686674564066, + "loss": 0.0093, + "step": 418010 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013746477924003514, + "loss": 0.0115, + "step": 418020 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013746089102366368, + "loss": 0.0112, + "step": 418030 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013745700280729222, + "loss": 0.01, + "step": 418040 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013745311459092074, + "loss": 0.0095, + "step": 418050 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013744922637454928, + "loss": 0.0094, + "step": 418060 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013744533815817782, + "loss": 0.0164, + "step": 418070 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013744144994180633, + "loss": 0.0117, + "step": 418080 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013743756172543488, + "loss": 0.0096, + "step": 418090 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013743367350906342, + "loss": 0.0119, + "step": 418100 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013742978529269196, + "loss": 0.0086, + "step": 418110 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013742589707632047, + "loss": 0.0104, + "step": 418120 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013742200885994902, + "loss": 0.008, + "step": 418130 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013741812064357756, + "loss": 0.0102, + "step": 418140 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374142324272061, + "loss": 0.0108, + "step": 418150 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013741034421083464, + "loss": 0.0105, + "step": 418160 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013740645599446318, + "loss": 0.0122, + "step": 418170 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001374025677780917, + "loss": 0.0093, + "step": 418180 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013739867956172024, + "loss": 0.0087, + "step": 418190 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013739479134534878, + "loss": 0.0154, + "step": 418200 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013739090312897732, + "loss": 0.0109, + "step": 418210 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013738701491260584, + "loss": 0.0095, + "step": 418220 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013738312669623438, + "loss": 0.0103, + "step": 418230 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013737923847986292, + "loss": 0.01, + "step": 418240 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013737535026349146, + "loss": 0.0101, + "step": 418250 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013737146204711998, + "loss": 0.014, + "step": 418260 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013736757383074852, + "loss": 0.0135, + "step": 418270 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013736368561437706, + "loss": 0.0136, + "step": 418280 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373597973980056, + "loss": 0.0133, + "step": 418290 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013735590918163412, + "loss": 0.0096, + "step": 418300 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013735202096526266, + "loss": 0.0096, + "step": 418310 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373481327488912, + "loss": 0.0131, + "step": 418320 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373442445325197, + "loss": 0.0119, + "step": 418330 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013734035631614828, + "loss": 0.0113, + "step": 418340 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001373364680997768, + "loss": 0.0089, + "step": 418350 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013733257988340534, + "loss": 0.0114, + "step": 418360 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013732869166703388, + "loss": 0.0111, + "step": 418370 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013732480345066242, + "loss": 0.0155, + "step": 418380 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013732091523429094, + "loss": 0.0113, + "step": 418390 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013731702701791948, + "loss": 0.01, + "step": 418400 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013731313880154802, + "loss": 0.0101, + "step": 418410 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013730925058517656, + "loss": 0.0123, + "step": 418420 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013730536236880508, + "loss": 0.0149, + "step": 418430 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013730147415243362, + "loss": 0.0118, + "step": 418440 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013729758593606216, + "loss": 0.0108, + "step": 418450 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001372936977196907, + "loss": 0.0111, + "step": 418460 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013728980950331921, + "loss": 0.0139, + "step": 418470 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013728592128694778, + "loss": 0.0101, + "step": 418480 + }, + { + "epoch": 1.08, + "learning_rate": 0.0001372820330705763, + "loss": 0.0114, + "step": 418490 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013727814485420484, + "loss": 0.0109, + "step": 418500 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013727425663783338, + "loss": 0.0124, + "step": 418510 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013727036842146192, + "loss": 0.0115, + "step": 418520 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013726648020509044, + "loss": 0.0121, + "step": 418530 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013726259198871898, + "loss": 0.0097, + "step": 418540 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013725870377234752, + "loss": 0.0101, + "step": 418550 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013725481555597604, + "loss": 0.014, + "step": 418560 + }, + { + "epoch": 1.08, + "learning_rate": 0.00013725092733960458, + "loss": 0.0087, + "step": 418570 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013724703912323312, + "loss": 0.0113, + "step": 418580 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013724315090686166, + "loss": 0.0099, + "step": 418590 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013723926269049017, + "loss": 0.014, + "step": 418600 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013723537447411872, + "loss": 0.0098, + "step": 418610 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013723148625774726, + "loss": 0.0111, + "step": 418620 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001372275980413758, + "loss": 0.0114, + "step": 418630 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013722370982500431, + "loss": 0.0142, + "step": 418640 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013721982160863286, + "loss": 0.0105, + "step": 418650 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001372159333922614, + "loss": 0.0102, + "step": 418660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013721204517588994, + "loss": 0.0128, + "step": 418670 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013720815695951848, + "loss": 0.01, + "step": 418680 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013720426874314702, + "loss": 0.0107, + "step": 418690 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013720038052677554, + "loss": 0.0115, + "step": 418700 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013719649231040408, + "loss": 0.0114, + "step": 418710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013719260409403262, + "loss": 0.0127, + "step": 418720 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013718871587766116, + "loss": 0.0114, + "step": 418730 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013718482766128968, + "loss": 0.0127, + "step": 418740 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013718093944491822, + "loss": 0.0117, + "step": 418750 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013717705122854676, + "loss": 0.0131, + "step": 418760 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371731630121753, + "loss": 0.0126, + "step": 418770 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013716927479580382, + "loss": 0.0076, + "step": 418780 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013716538657943236, + "loss": 0.0134, + "step": 418790 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371614983630609, + "loss": 0.0105, + "step": 418800 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371576101466894, + "loss": 0.0105, + "step": 418810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013715372193031795, + "loss": 0.0109, + "step": 418820 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371498337139465, + "loss": 0.0172, + "step": 418830 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013714594549757504, + "loss": 0.0135, + "step": 418840 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013714205728120355, + "loss": 0.0117, + "step": 418850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013713816906483212, + "loss": 0.0133, + "step": 418860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013713428084846064, + "loss": 0.0128, + "step": 418870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013713039263208918, + "loss": 0.0154, + "step": 418880 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013712650441571772, + "loss": 0.0158, + "step": 418890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013712261619934626, + "loss": 0.0123, + "step": 418900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013711872798297478, + "loss": 0.0087, + "step": 418910 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013711483976660332, + "loss": 0.0095, + "step": 418920 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013711095155023186, + "loss": 0.0117, + "step": 418930 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001371070633338604, + "loss": 0.0098, + "step": 418940 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013710317511748891, + "loss": 0.0119, + "step": 418950 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013709928690111746, + "loss": 0.0071, + "step": 418960 + }, + { + "epoch": 1.09, + "learning_rate": 0.000137095398684746, + "loss": 0.0103, + "step": 418970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013709151046837454, + "loss": 0.009, + "step": 418980 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013708762225200305, + "loss": 0.013, + "step": 418990 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370837340356316, + "loss": 0.0105, + "step": 419000 + }, + { + "epoch": 1.09, + "eval_cer": 0.881751673615864, + "eval_loss": 0.007565063424408436, + "eval_runtime": 107.4764, + "eval_samples_per_second": 18.609, + "eval_steps_per_second": 4.652, + "step": 419000 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013707984581926014, + "loss": 0.0118, + "step": 419010 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013707595760288868, + "loss": 0.0109, + "step": 419020 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013707206938651722, + "loss": 0.0136, + "step": 419030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013706818117014576, + "loss": 0.0149, + "step": 419040 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013706429295377428, + "loss": 0.0147, + "step": 419050 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013706040473740282, + "loss": 0.0107, + "step": 419060 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013705651652103136, + "loss": 0.0127, + "step": 419070 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013705262830465987, + "loss": 0.0123, + "step": 419080 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013704874008828842, + "loss": 0.0099, + "step": 419090 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013704485187191696, + "loss": 0.0125, + "step": 419100 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370409636555455, + "loss": 0.0126, + "step": 419110 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013703707543917401, + "loss": 0.0132, + "step": 419120 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013703318722280256, + "loss": 0.0143, + "step": 419130 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370292990064311, + "loss": 0.0122, + "step": 419140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013702541079005964, + "loss": 0.0128, + "step": 419150 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013702152257368815, + "loss": 0.011, + "step": 419160 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370176343573167, + "loss": 0.0135, + "step": 419170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013701374614094524, + "loss": 0.0114, + "step": 419180 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013700985792457378, + "loss": 0.0133, + "step": 419190 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001370059697082023, + "loss": 0.0115, + "step": 419200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013700208149183086, + "loss": 0.0095, + "step": 419210 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013699819327545938, + "loss": 0.0113, + "step": 419220 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013699430505908792, + "loss": 0.0114, + "step": 419230 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013699041684271646, + "loss": 0.0094, + "step": 419240 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136986528626345, + "loss": 0.0091, + "step": 419250 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013698264040997352, + "loss": 0.012, + "step": 419260 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013697875219360206, + "loss": 0.0098, + "step": 419270 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369748639772306, + "loss": 0.0114, + "step": 419280 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013697097576085914, + "loss": 0.0099, + "step": 419290 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013696708754448766, + "loss": 0.0099, + "step": 419300 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369631993281162, + "loss": 0.0114, + "step": 419310 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013695931111174474, + "loss": 0.0107, + "step": 419320 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013695542289537325, + "loss": 0.0091, + "step": 419330 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369515346790018, + "loss": 0.0151, + "step": 419340 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013694764646263034, + "loss": 0.0151, + "step": 419350 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013694375824625888, + "loss": 0.0122, + "step": 419360 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369398700298874, + "loss": 0.0112, + "step": 419370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013693598181351596, + "loss": 0.0144, + "step": 419380 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013693209359714448, + "loss": 0.0117, + "step": 419390 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013692820538077302, + "loss": 0.0116, + "step": 419400 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013692431716440156, + "loss": 0.0165, + "step": 419410 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369204289480301, + "loss": 0.0112, + "step": 419420 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013691654073165862, + "loss": 0.0115, + "step": 419430 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013691265251528716, + "loss": 0.0115, + "step": 419440 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001369087642989157, + "loss": 0.0104, + "step": 419450 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013690487608254424, + "loss": 0.0104, + "step": 419460 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013690098786617275, + "loss": 0.0117, + "step": 419470 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368970996498013, + "loss": 0.0122, + "step": 419480 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013689321143342984, + "loss": 0.012, + "step": 419490 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013688932321705838, + "loss": 0.0109, + "step": 419500 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368854350006869, + "loss": 0.0145, + "step": 419510 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013688154678431544, + "loss": 0.0105, + "step": 419520 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013687765856794398, + "loss": 0.0119, + "step": 419530 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013687377035157252, + "loss": 0.0121, + "step": 419540 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013686988213520106, + "loss": 0.011, + "step": 419550 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013686599391882958, + "loss": 0.0116, + "step": 419560 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013686210570245812, + "loss": 0.0112, + "step": 419570 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013685821748608666, + "loss": 0.0103, + "step": 419580 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368543292697152, + "loss": 0.0132, + "step": 419590 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013685044105334371, + "loss": 0.0101, + "step": 419600 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013684655283697226, + "loss": 0.0132, + "step": 419610 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368426646206008, + "loss": 0.0117, + "step": 419620 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013683877640422934, + "loss": 0.0124, + "step": 419630 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013683488818785785, + "loss": 0.0118, + "step": 419640 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001368309999714864, + "loss": 0.009, + "step": 419650 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013682711175511494, + "loss": 0.012, + "step": 419660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013682322353874348, + "loss": 0.011, + "step": 419670 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136819335322372, + "loss": 0.0125, + "step": 419680 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013681544710600054, + "loss": 0.0119, + "step": 419690 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013681155888962908, + "loss": 0.0133, + "step": 419700 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013680767067325762, + "loss": 0.0096, + "step": 419710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013680378245688613, + "loss": 0.0112, + "step": 419720 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367998942405147, + "loss": 0.0152, + "step": 419730 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013679600602414322, + "loss": 0.0113, + "step": 419740 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013679211780777176, + "loss": 0.0081, + "step": 419750 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367882295914003, + "loss": 0.0124, + "step": 419760 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013678434137502884, + "loss": 0.0077, + "step": 419770 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013678045315865736, + "loss": 0.0116, + "step": 419780 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367765649422859, + "loss": 0.0109, + "step": 419790 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013677267672591444, + "loss": 0.0109, + "step": 419800 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013676878850954295, + "loss": 0.0118, + "step": 419810 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367649002931715, + "loss": 0.0112, + "step": 419820 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013676101207680004, + "loss": 0.0125, + "step": 419830 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013675712386042858, + "loss": 0.0096, + "step": 419840 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367532356440571, + "loss": 0.0105, + "step": 419850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013674934742768563, + "loss": 0.0094, + "step": 419860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013674545921131418, + "loss": 0.0135, + "step": 419870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013674157099494272, + "loss": 0.0085, + "step": 419880 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013673768277857123, + "loss": 0.0116, + "step": 419890 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367337945621998, + "loss": 0.0147, + "step": 419900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013672990634582832, + "loss": 0.0099, + "step": 419910 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013672601812945686, + "loss": 0.01, + "step": 419920 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001367221299130854, + "loss": 0.0105, + "step": 419930 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013671824169671394, + "loss": 0.0147, + "step": 419940 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013671435348034246, + "loss": 0.0133, + "step": 419950 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136710465263971, + "loss": 0.013, + "step": 419960 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013670657704759954, + "loss": 0.0112, + "step": 419970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013670268883122808, + "loss": 0.0096, + "step": 419980 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366988006148566, + "loss": 0.0123, + "step": 419990 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013669491239848514, + "loss": 0.0102, + "step": 420000 + }, + { + "epoch": 1.09, + "eval_cer": 0.8817488743419957, + "eval_loss": 0.007611589971929789, + "eval_runtime": 107.4861, + "eval_samples_per_second": 18.607, + "eval_steps_per_second": 4.652, + "step": 420000 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013669102418211368, + "loss": 0.0117, + "step": 420010 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013668713596574222, + "loss": 0.0129, + "step": 420020 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013668324774937073, + "loss": 0.0097, + "step": 420030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013667935953299928, + "loss": 0.0129, + "step": 420040 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013667547131662782, + "loss": 0.0102, + "step": 420050 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013667158310025633, + "loss": 0.0096, + "step": 420060 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366676948838849, + "loss": 0.0111, + "step": 420070 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013666380666751342, + "loss": 0.0146, + "step": 420080 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013665991845114196, + "loss": 0.0143, + "step": 420090 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366560302347705, + "loss": 0.0131, + "step": 420100 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013665214201839904, + "loss": 0.0138, + "step": 420110 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013664825380202755, + "loss": 0.0088, + "step": 420120 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366443655856561, + "loss": 0.0106, + "step": 420130 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013664047736928464, + "loss": 0.008, + "step": 420140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013663658915291318, + "loss": 0.01, + "step": 420150 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001366327009365417, + "loss": 0.0103, + "step": 420160 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013662881272017024, + "loss": 0.0104, + "step": 420170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013662492450379878, + "loss": 0.0111, + "step": 420180 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013662103628742732, + "loss": 0.0116, + "step": 420190 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013661714807105583, + "loss": 0.0116, + "step": 420200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013661325985468438, + "loss": 0.0079, + "step": 420210 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013660937163831292, + "loss": 0.0097, + "step": 420220 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013660548342194146, + "loss": 0.0124, + "step": 420230 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013660159520556997, + "loss": 0.0116, + "step": 420240 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013659770698919854, + "loss": 0.0084, + "step": 420250 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013659381877282706, + "loss": 0.0124, + "step": 420260 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365899305564556, + "loss": 0.0115, + "step": 420270 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013658604234008414, + "loss": 0.0107, + "step": 420280 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013658215412371268, + "loss": 0.0093, + "step": 420290 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365782659073412, + "loss": 0.013, + "step": 420300 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013657437769096974, + "loss": 0.0107, + "step": 420310 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013657048947459828, + "loss": 0.0085, + "step": 420320 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365666012582268, + "loss": 0.013, + "step": 420330 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013656271304185534, + "loss": 0.0153, + "step": 420340 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013655882482548388, + "loss": 0.0124, + "step": 420350 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013655493660911242, + "loss": 0.0109, + "step": 420360 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013655104839274093, + "loss": 0.009, + "step": 420370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013654716017636947, + "loss": 0.0109, + "step": 420380 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013654327195999802, + "loss": 0.0107, + "step": 420390 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013653938374362656, + "loss": 0.0106, + "step": 420400 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013653549552725507, + "loss": 0.01, + "step": 420410 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013653160731088364, + "loss": 0.013, + "step": 420420 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013652771909451216, + "loss": 0.0118, + "step": 420430 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365238308781407, + "loss": 0.013, + "step": 420440 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013651994266176924, + "loss": 0.0107, + "step": 420450 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013651605444539778, + "loss": 0.0113, + "step": 420460 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001365121662290263, + "loss": 0.0109, + "step": 420470 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013650827801265484, + "loss": 0.0151, + "step": 420480 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013650438979628338, + "loss": 0.0115, + "step": 420490 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013650050157991192, + "loss": 0.0174, + "step": 420500 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013649661336354043, + "loss": 0.0088, + "step": 420510 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013649272514716898, + "loss": 0.011, + "step": 420520 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013648883693079752, + "loss": 0.0112, + "step": 420530 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013648494871442606, + "loss": 0.0126, + "step": 420540 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013648106049805457, + "loss": 0.0098, + "step": 420550 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013647717228168312, + "loss": 0.0117, + "step": 420560 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013647328406531166, + "loss": 0.0083, + "step": 420570 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013646939584894017, + "loss": 0.0142, + "step": 420580 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013646550763256871, + "loss": 0.0152, + "step": 420590 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013646161941619726, + "loss": 0.0096, + "step": 420600 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364577311998258, + "loss": 0.0108, + "step": 420610 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013645384298345434, + "loss": 0.0076, + "step": 420620 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013644995476708288, + "loss": 0.0107, + "step": 420630 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364460665507114, + "loss": 0.012, + "step": 420640 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013644217833433994, + "loss": 0.0106, + "step": 420650 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013643829011796848, + "loss": 0.0139, + "step": 420660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013643440190159702, + "loss": 0.0152, + "step": 420670 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013643051368522553, + "loss": 0.0124, + "step": 420680 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013642662546885408, + "loss": 0.0087, + "step": 420690 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013642273725248262, + "loss": 0.0093, + "step": 420700 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013641884903611116, + "loss": 0.0094, + "step": 420710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013641496081973967, + "loss": 0.0126, + "step": 420720 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013641107260336822, + "loss": 0.0087, + "step": 420730 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013640718438699676, + "loss": 0.0114, + "step": 420740 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001364032961706253, + "loss": 0.0163, + "step": 420750 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363994079542538, + "loss": 0.0115, + "step": 420760 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013639551973788238, + "loss": 0.0113, + "step": 420770 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363916315215109, + "loss": 0.0144, + "step": 420780 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363877433051394, + "loss": 0.014, + "step": 420790 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013638385508876798, + "loss": 0.0111, + "step": 420800 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363799668723965, + "loss": 0.0123, + "step": 420810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013637607865602504, + "loss": 0.014, + "step": 420820 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013637219043965358, + "loss": 0.0094, + "step": 420830 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013636830222328212, + "loss": 0.0086, + "step": 420840 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013636441400691063, + "loss": 0.0145, + "step": 420850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013636052579053918, + "loss": 0.0122, + "step": 420860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013635663757416772, + "loss": 0.01, + "step": 420870 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013635274935779626, + "loss": 0.0112, + "step": 420880 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013634886114142477, + "loss": 0.0106, + "step": 420890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013634497292505331, + "loss": 0.009, + "step": 420900 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013634108470868186, + "loss": 0.0108, + "step": 420910 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363371964923104, + "loss": 0.0095, + "step": 420920 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001363333082759389, + "loss": 0.0111, + "step": 420930 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013632942005956748, + "loss": 0.013, + "step": 420940 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136325531843196, + "loss": 0.0125, + "step": 420950 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013632164362682454, + "loss": 0.0101, + "step": 420960 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013631775541045308, + "loss": 0.0163, + "step": 420970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013631386719408162, + "loss": 0.0112, + "step": 420980 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013630997897771014, + "loss": 0.0112, + "step": 420990 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013630609076133868, + "loss": 0.0104, + "step": 421000 + }, + { + "epoch": 1.09, + "eval_cer": 0.8817152830555753, + "eval_loss": 0.007646199781447649, + "eval_runtime": 107.458, + "eval_samples_per_second": 18.612, + "eval_steps_per_second": 4.653, + "step": 421000 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013630220254496722, + "loss": 0.0119, + "step": 421010 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013629831432859576, + "loss": 0.0128, + "step": 421020 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013629442611222427, + "loss": 0.0133, + "step": 421030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013629053789585282, + "loss": 0.0121, + "step": 421040 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013628664967948136, + "loss": 0.0104, + "step": 421050 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013628276146310987, + "loss": 0.0098, + "step": 421060 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013627887324673841, + "loss": 0.0097, + "step": 421070 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013627498503036696, + "loss": 0.0118, + "step": 421080 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362710968139955, + "loss": 0.0115, + "step": 421090 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136267208597624, + "loss": 0.0111, + "step": 421100 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013626332038125255, + "loss": 0.0096, + "step": 421110 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362594321648811, + "loss": 0.0156, + "step": 421120 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013625554394850964, + "loss": 0.011, + "step": 421130 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013625165573213818, + "loss": 0.0128, + "step": 421140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013624776751576672, + "loss": 0.0106, + "step": 421150 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013624387929939523, + "loss": 0.0103, + "step": 421160 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013623999108302378, + "loss": 0.0081, + "step": 421170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013623610286665232, + "loss": 0.0111, + "step": 421180 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013623221465028086, + "loss": 0.0091, + "step": 421190 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013622832643390937, + "loss": 0.0152, + "step": 421200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013622443821753792, + "loss": 0.0138, + "step": 421210 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013622055000116646, + "loss": 0.0132, + "step": 421220 + }, + { + "epoch": 1.09, + "learning_rate": 0.000136216661784795, + "loss": 0.0112, + "step": 421230 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362127735684235, + "loss": 0.0268, + "step": 421240 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013620888535205206, + "loss": 0.0143, + "step": 421250 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001362049971356806, + "loss": 0.0121, + "step": 421260 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013620110891930914, + "loss": 0.0105, + "step": 421270 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013619722070293765, + "loss": 0.0097, + "step": 421280 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361933324865662, + "loss": 0.0149, + "step": 421290 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013618944427019474, + "loss": 0.0101, + "step": 421300 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013618555605382325, + "loss": 0.0108, + "step": 421310 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013618166783745182, + "loss": 0.0097, + "step": 421320 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013617777962108033, + "loss": 0.0132, + "step": 421330 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013617389140470888, + "loss": 0.011, + "step": 421340 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013617000318833742, + "loss": 0.0149, + "step": 421350 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013616611497196596, + "loss": 0.0117, + "step": 421360 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013616222675559447, + "loss": 0.0146, + "step": 421370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013615833853922302, + "loss": 0.0124, + "step": 421380 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013615445032285156, + "loss": 0.0149, + "step": 421390 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361505621064801, + "loss": 0.0121, + "step": 421400 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361466738901086, + "loss": 0.0101, + "step": 421410 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013614278567373715, + "loss": 0.0097, + "step": 421420 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001361388974573657, + "loss": 0.0121, + "step": 421430 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013613500924099424, + "loss": 0.0115, + "step": 421440 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013613112102462275, + "loss": 0.012, + "step": 421450 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013612723280825132, + "loss": 0.0152, + "step": 421460 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013612334459187984, + "loss": 0.0097, + "step": 421470 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013611945637550838, + "loss": 0.0109, + "step": 421480 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013611556815913692, + "loss": 0.0128, + "step": 421490 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013611167994276546, + "loss": 0.0091, + "step": 421500 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013610779172639398, + "loss": 0.0102, + "step": 421510 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013610390351002252, + "loss": 0.0126, + "step": 421520 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013610001529365106, + "loss": 0.0109, + "step": 421530 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013609612707727957, + "loss": 0.0122, + "step": 421540 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013609223886090811, + "loss": 0.0121, + "step": 421550 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013608835064453666, + "loss": 0.0137, + "step": 421560 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360844624281652, + "loss": 0.0123, + "step": 421570 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360805742117937, + "loss": 0.0101, + "step": 421580 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013607668599542225, + "loss": 0.0098, + "step": 421590 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360727977790508, + "loss": 0.0108, + "step": 421600 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013606890956267934, + "loss": 0.0129, + "step": 421610 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013606502134630785, + "loss": 0.0142, + "step": 421620 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360611331299364, + "loss": 0.0136, + "step": 421630 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013605724491356493, + "loss": 0.0093, + "step": 421640 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013605335669719348, + "loss": 0.0121, + "step": 421650 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013604946848082202, + "loss": 0.0104, + "step": 421660 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013604558026445056, + "loss": 0.0128, + "step": 421670 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013604169204807907, + "loss": 0.0102, + "step": 421680 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013603780383170762, + "loss": 0.0142, + "step": 421690 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013603391561533616, + "loss": 0.0118, + "step": 421700 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360300273989647, + "loss": 0.0103, + "step": 421710 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013602613918259321, + "loss": 0.0103, + "step": 421720 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013602225096622176, + "loss": 0.0088, + "step": 421730 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360183627498503, + "loss": 0.0109, + "step": 421740 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013601447453347884, + "loss": 0.0116, + "step": 421750 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013601058631710735, + "loss": 0.0136, + "step": 421760 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001360066981007359, + "loss": 0.0093, + "step": 421770 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013600280988436444, + "loss": 0.0097, + "step": 421780 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013599892166799295, + "loss": 0.0122, + "step": 421790 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359950334516215, + "loss": 0.0092, + "step": 421800 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013599114523525003, + "loss": 0.01, + "step": 421810 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013598725701887858, + "loss": 0.0095, + "step": 421820 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359833688025071, + "loss": 0.0147, + "step": 421830 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013597948058613566, + "loss": 0.0101, + "step": 421840 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013597559236976417, + "loss": 0.014, + "step": 421850 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013597170415339272, + "loss": 0.0105, + "step": 421860 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013596781593702126, + "loss": 0.0111, + "step": 421870 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359639277206498, + "loss": 0.0108, + "step": 421880 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359600395042783, + "loss": 0.0105, + "step": 421890 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013595615128790685, + "loss": 0.0139, + "step": 421900 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359522630715354, + "loss": 0.0119, + "step": 421910 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013594837485516394, + "loss": 0.0099, + "step": 421920 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013594448663879245, + "loss": 0.0104, + "step": 421930 + }, + { + "epoch": 1.09, + "learning_rate": 0.000135940598422421, + "loss": 0.0103, + "step": 421940 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013593671020604954, + "loss": 0.0123, + "step": 421950 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013593282198967808, + "loss": 0.0127, + "step": 421960 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359289337733066, + "loss": 0.0127, + "step": 421970 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013592504555693513, + "loss": 0.0106, + "step": 421980 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013592115734056368, + "loss": 0.0132, + "step": 421990 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013591726912419222, + "loss": 0.0109, + "step": 422000 + }, + { + "epoch": 1.09, + "eval_cer": 0.881727879787983, + "eval_loss": 0.008169938810169697, + "eval_runtime": 107.7698, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.64, + "step": 422000 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013591338090782076, + "loss": 0.0138, + "step": 422010 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001359094926914493, + "loss": 0.0087, + "step": 422020 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013590560447507781, + "loss": 0.0119, + "step": 422030 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013590171625870636, + "loss": 0.0113, + "step": 422040 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358978280423349, + "loss": 0.0149, + "step": 422050 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358939398259634, + "loss": 0.0113, + "step": 422060 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013589005160959195, + "loss": 0.0162, + "step": 422070 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358861633932205, + "loss": 0.0132, + "step": 422080 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013588227517684904, + "loss": 0.0106, + "step": 422090 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013587838696047755, + "loss": 0.0094, + "step": 422100 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358744987441061, + "loss": 0.0141, + "step": 422110 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013587061052773464, + "loss": 0.0109, + "step": 422120 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013586672231136318, + "loss": 0.0126, + "step": 422130 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358628340949917, + "loss": 0.0124, + "step": 422140 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013585894587862023, + "loss": 0.0116, + "step": 422150 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013585505766224877, + "loss": 0.0092, + "step": 422160 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013585116944587732, + "loss": 0.0088, + "step": 422170 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013584728122950583, + "loss": 0.0134, + "step": 422180 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358433930131344, + "loss": 0.0127, + "step": 422190 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013583950479676291, + "loss": 0.0114, + "step": 422200 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013583561658039146, + "loss": 0.0095, + "step": 422210 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013583172836402, + "loss": 0.0111, + "step": 422220 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013582784014764854, + "loss": 0.0096, + "step": 422230 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013582395193127705, + "loss": 0.0134, + "step": 422240 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358200637149056, + "loss": 0.0096, + "step": 422250 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013581617549853414, + "loss": 0.0081, + "step": 422260 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013581228728216268, + "loss": 0.0132, + "step": 422270 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001358083990657912, + "loss": 0.0128, + "step": 422280 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013580451084941973, + "loss": 0.0115, + "step": 422290 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013580062263304828, + "loss": 0.01, + "step": 422300 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001357967344166768, + "loss": 0.0108, + "step": 422310 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013579284620030533, + "loss": 0.0108, + "step": 422320 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013578895798393387, + "loss": 0.0104, + "step": 422330 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013578506976756242, + "loss": 0.0118, + "step": 422340 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013578118155119093, + "loss": 0.0121, + "step": 422350 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001357772933348195, + "loss": 0.0112, + "step": 422360 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013577340511844801, + "loss": 0.0097, + "step": 422370 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013576951690207656, + "loss": 0.0143, + "step": 422380 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001357656286857051, + "loss": 0.0129, + "step": 422390 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013576174046933364, + "loss": 0.0097, + "step": 422400 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013575785225296215, + "loss": 0.0183, + "step": 422410 + }, + { + "epoch": 1.09, + "learning_rate": 0.0001357539640365907, + "loss": 0.0093, + "step": 422420 + }, + { + "epoch": 1.09, + "learning_rate": 0.00013575007582021924, + "loss": 0.0154, + "step": 422430 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013574618760384778, + "loss": 0.0124, + "step": 422440 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001357422993874763, + "loss": 0.0104, + "step": 422450 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013573841117110483, + "loss": 0.0142, + "step": 422460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013573452295473338, + "loss": 0.009, + "step": 422470 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013573063473836192, + "loss": 0.0098, + "step": 422480 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013572674652199043, + "loss": 0.0116, + "step": 422490 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013572285830561897, + "loss": 0.0114, + "step": 422500 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013571897008924752, + "loss": 0.0112, + "step": 422510 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013571508187287606, + "loss": 0.0108, + "step": 422520 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001357111936565046, + "loss": 0.0147, + "step": 422530 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001357073054401331, + "loss": 0.0148, + "step": 422540 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013570341722376165, + "loss": 0.011, + "step": 422550 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356995290073902, + "loss": 0.0103, + "step": 422560 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013569564079101874, + "loss": 0.0127, + "step": 422570 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013569175257464725, + "loss": 0.0128, + "step": 422580 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356878643582758, + "loss": 0.0113, + "step": 422590 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013568397614190434, + "loss": 0.0112, + "step": 422600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013568008792553288, + "loss": 0.0092, + "step": 422610 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356761997091614, + "loss": 0.0096, + "step": 422620 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013567231149278993, + "loss": 0.0098, + "step": 422630 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013566842327641848, + "loss": 0.0096, + "step": 422640 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013566453506004702, + "loss": 0.0105, + "step": 422650 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013566064684367553, + "loss": 0.0112, + "step": 422660 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013565675862730407, + "loss": 0.0101, + "step": 422670 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013565287041093261, + "loss": 0.0095, + "step": 422680 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013564898219456116, + "loss": 0.0112, + "step": 422690 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013564509397818967, + "loss": 0.0126, + "step": 422700 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013564120576181824, + "loss": 0.01, + "step": 422710 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013563731754544675, + "loss": 0.0131, + "step": 422720 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356334293290753, + "loss": 0.0137, + "step": 422730 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013562954111270384, + "loss": 0.0095, + "step": 422740 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013562565289633238, + "loss": 0.0095, + "step": 422750 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356217646799609, + "loss": 0.0113, + "step": 422760 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013561787646358944, + "loss": 0.0111, + "step": 422770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013561398824721798, + "loss": 0.0113, + "step": 422780 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001356101000308465, + "loss": 0.0113, + "step": 422790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013560621181447503, + "loss": 0.0109, + "step": 422800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013560232359810357, + "loss": 0.01, + "step": 422810 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013559843538173212, + "loss": 0.0142, + "step": 422820 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013559454716536063, + "loss": 0.0166, + "step": 422830 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013559065894898917, + "loss": 0.01, + "step": 422840 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013558677073261771, + "loss": 0.0132, + "step": 422850 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013558288251624626, + "loss": 0.0109, + "step": 422860 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013557899429987477, + "loss": 0.0124, + "step": 422870 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013557510608350334, + "loss": 0.0118, + "step": 422880 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013557121786713185, + "loss": 0.0095, + "step": 422890 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001355673296507604, + "loss": 0.0126, + "step": 422900 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013556344143438894, + "loss": 0.0109, + "step": 422910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013555955321801748, + "loss": 0.0125, + "step": 422920 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135555665001646, + "loss": 0.0116, + "step": 422930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013555177678527453, + "loss": 0.01, + "step": 422940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013554788856890308, + "loss": 0.01, + "step": 422950 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013554400035253162, + "loss": 0.0115, + "step": 422960 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013554011213616013, + "loss": 0.0109, + "step": 422970 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013553622391978867, + "loss": 0.0106, + "step": 422980 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013553233570341722, + "loss": 0.0113, + "step": 422990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013552844748704576, + "loss": 0.0092, + "step": 423000 + }, + { + "epoch": 1.1, + "eval_cer": 0.8817054855970361, + "eval_loss": 0.007950132712721825, + "eval_runtime": 107.536, + "eval_samples_per_second": 18.598, + "eval_steps_per_second": 4.65, + "step": 423000 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013552455927067427, + "loss": 0.0104, + "step": 423010 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013552067105430281, + "loss": 0.0089, + "step": 423020 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013551678283793136, + "loss": 0.0105, + "step": 423030 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013551289462155987, + "loss": 0.0116, + "step": 423040 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001355090064051884, + "loss": 0.0084, + "step": 423050 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013550511818881695, + "loss": 0.0116, + "step": 423060 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001355012299724455, + "loss": 0.012, + "step": 423070 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013549734175607404, + "loss": 0.0133, + "step": 423080 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013549345353970258, + "loss": 0.0111, + "step": 423090 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354895653233311, + "loss": 0.0091, + "step": 423100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013548567710695963, + "loss": 0.0142, + "step": 423110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013548178889058818, + "loss": 0.0102, + "step": 423120 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013547790067421672, + "loss": 0.0116, + "step": 423130 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013547401245784523, + "loss": 0.0137, + "step": 423140 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013547012424147377, + "loss": 0.0152, + "step": 423150 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013546623602510232, + "loss": 0.0102, + "step": 423160 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013546234780873086, + "loss": 0.0102, + "step": 423170 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013545845959235937, + "loss": 0.0116, + "step": 423180 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354545713759879, + "loss": 0.0096, + "step": 423190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013545068315961645, + "loss": 0.0098, + "step": 423200 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135446794943245, + "loss": 0.0115, + "step": 423210 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354429067268735, + "loss": 0.0112, + "step": 423220 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013543901851050208, + "loss": 0.0104, + "step": 423230 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354351302941306, + "loss": 0.0092, + "step": 423240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013543124207775914, + "loss": 0.0097, + "step": 423250 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013542735386138768, + "loss": 0.0135, + "step": 423260 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001354234656450162, + "loss": 0.0107, + "step": 423270 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013541957742864473, + "loss": 0.0084, + "step": 423280 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013541568921227328, + "loss": 0.0094, + "step": 423290 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013541180099590182, + "loss": 0.0132, + "step": 423300 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013540791277953033, + "loss": 0.0111, + "step": 423310 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013540402456315887, + "loss": 0.0154, + "step": 423320 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013540013634678741, + "loss": 0.011, + "step": 423330 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013539624813041596, + "loss": 0.011, + "step": 423340 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013539235991404447, + "loss": 0.0139, + "step": 423350 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135388471697673, + "loss": 0.0133, + "step": 423360 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013538458348130155, + "loss": 0.0131, + "step": 423370 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353806952649301, + "loss": 0.0077, + "step": 423380 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353768070485586, + "loss": 0.0126, + "step": 423390 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013537291883218718, + "loss": 0.0077, + "step": 423400 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353690306158157, + "loss": 0.0101, + "step": 423410 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013536514239944424, + "loss": 0.0099, + "step": 423420 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013536125418307278, + "loss": 0.0103, + "step": 423430 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013535736596670132, + "loss": 0.0125, + "step": 423440 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013535347775032983, + "loss": 0.0092, + "step": 423450 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013534958953395837, + "loss": 0.012, + "step": 423460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013534570131758692, + "loss": 0.0106, + "step": 423470 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013534181310121546, + "loss": 0.013, + "step": 423480 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013533792488484397, + "loss": 0.0109, + "step": 423490 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013533403666847251, + "loss": 0.0122, + "step": 423500 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013533014845210106, + "loss": 0.0147, + "step": 423510 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013532626023572957, + "loss": 0.0101, + "step": 423520 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353223720193581, + "loss": 0.0123, + "step": 423530 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013531848380298665, + "loss": 0.0094, + "step": 423540 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353145955866152, + "loss": 0.0134, + "step": 423550 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353107073702437, + "loss": 0.0101, + "step": 423560 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013530681915387225, + "loss": 0.0117, + "step": 423570 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001353029309375008, + "loss": 0.0129, + "step": 423580 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013529904272112933, + "loss": 0.0107, + "step": 423590 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013529515450475788, + "loss": 0.0144, + "step": 423600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013529126628838642, + "loss": 0.0092, + "step": 423610 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013528737807201493, + "loss": 0.01, + "step": 423620 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013528348985564347, + "loss": 0.0089, + "step": 423630 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013527960163927202, + "loss": 0.0146, + "step": 423640 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013527571342290056, + "loss": 0.0142, + "step": 423650 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013527182520652907, + "loss": 0.0144, + "step": 423660 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352679369901576, + "loss": 0.0122, + "step": 423670 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013526404877378616, + "loss": 0.0082, + "step": 423680 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352601605574147, + "loss": 0.0111, + "step": 423690 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352562723410432, + "loss": 0.0112, + "step": 423700 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013525238412467175, + "loss": 0.014, + "step": 423710 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352484959083003, + "loss": 0.0098, + "step": 423720 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013524460769192884, + "loss": 0.0112, + "step": 423730 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013524071947555735, + "loss": 0.0092, + "step": 423740 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013523683125918592, + "loss": 0.0144, + "step": 423750 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013523294304281443, + "loss": 0.0126, + "step": 423760 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013522905482644295, + "loss": 0.0083, + "step": 423770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013522516661007152, + "loss": 0.0125, + "step": 423780 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013522127839370003, + "loss": 0.0141, + "step": 423790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013521739017732857, + "loss": 0.0122, + "step": 423800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013521350196095712, + "loss": 0.0114, + "step": 423810 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013520961374458566, + "loss": 0.0129, + "step": 423820 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013520572552821417, + "loss": 0.0092, + "step": 423830 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001352018373118427, + "loss": 0.01, + "step": 423840 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013519794909547125, + "loss": 0.0079, + "step": 423850 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351940608790998, + "loss": 0.0105, + "step": 423860 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351901726627283, + "loss": 0.013, + "step": 423870 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013518628444635685, + "loss": 0.0121, + "step": 423880 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351823962299854, + "loss": 0.0118, + "step": 423890 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013517850801361394, + "loss": 0.0114, + "step": 423900 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013517461979724245, + "loss": 0.0119, + "step": 423910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013517073158087102, + "loss": 0.0144, + "step": 423920 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013516684336449953, + "loss": 0.0137, + "step": 423930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013516295514812808, + "loss": 0.0137, + "step": 423940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013515906693175662, + "loss": 0.0109, + "step": 423950 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013515517871538516, + "loss": 0.0091, + "step": 423960 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013515129049901367, + "loss": 0.0111, + "step": 423970 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013514740228264221, + "loss": 0.0134, + "step": 423980 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013514351406627076, + "loss": 0.0105, + "step": 423990 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351396258498993, + "loss": 0.0127, + "step": 424000 + }, + { + "epoch": 1.1, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.007645982783287764, + "eval_runtime": 107.6093, + "eval_samples_per_second": 18.586, + "eval_steps_per_second": 4.646, + "step": 424000 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351357376335278, + "loss": 0.0093, + "step": 424010 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013513184941715635, + "loss": 0.0107, + "step": 424020 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351279612007849, + "loss": 0.0145, + "step": 424030 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351240729844134, + "loss": 0.0112, + "step": 424040 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013512018476804195, + "loss": 0.0108, + "step": 424050 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351162965516705, + "loss": 0.0096, + "step": 424060 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013511240833529904, + "loss": 0.0136, + "step": 424070 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013510852011892755, + "loss": 0.0087, + "step": 424080 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001351046319025561, + "loss": 0.0102, + "step": 424090 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013510074368618463, + "loss": 0.0164, + "step": 424100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013509685546981317, + "loss": 0.0145, + "step": 424110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013509296725344172, + "loss": 0.0113, + "step": 424120 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013508907903707026, + "loss": 0.011, + "step": 424130 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013508519082069877, + "loss": 0.0113, + "step": 424140 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013508130260432731, + "loss": 0.0121, + "step": 424150 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013507741438795586, + "loss": 0.0123, + "step": 424160 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350735261715844, + "loss": 0.0094, + "step": 424170 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350696379552129, + "loss": 0.0125, + "step": 424180 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013506574973884145, + "loss": 0.0121, + "step": 424190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013506186152247, + "loss": 0.0111, + "step": 424200 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013505797330609854, + "loss": 0.0129, + "step": 424210 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013505408508972705, + "loss": 0.0124, + "step": 424220 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350501968733556, + "loss": 0.013, + "step": 424230 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013504630865698413, + "loss": 0.018, + "step": 424240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013504242044061268, + "loss": 0.0087, + "step": 424250 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350385322242412, + "loss": 0.0085, + "step": 424260 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013503464400786973, + "loss": 0.0092, + "step": 424270 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013503075579149827, + "loss": 0.0099, + "step": 424280 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350268675751268, + "loss": 0.0129, + "step": 424290 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013502297935875536, + "loss": 0.0123, + "step": 424300 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013501909114238387, + "loss": 0.0112, + "step": 424310 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350152029260124, + "loss": 0.0093, + "step": 424320 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013501131470964096, + "loss": 0.0092, + "step": 424330 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001350074264932695, + "loss": 0.0123, + "step": 424340 + }, + { + "epoch": 1.1, + "learning_rate": 0.000135003538276898, + "loss": 0.012, + "step": 424350 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013499965006052655, + "loss": 0.0111, + "step": 424360 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349957618441551, + "loss": 0.0119, + "step": 424370 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013499187362778364, + "loss": 0.0127, + "step": 424380 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013498798541141215, + "loss": 0.0103, + "step": 424390 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349840971950407, + "loss": 0.011, + "step": 424400 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013498020897866923, + "loss": 0.0115, + "step": 424410 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013497632076229778, + "loss": 0.0107, + "step": 424420 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349724325459263, + "loss": 0.013, + "step": 424430 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013496854432955483, + "loss": 0.0129, + "step": 424440 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013496465611318337, + "loss": 0.0094, + "step": 424450 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013496076789681192, + "loss": 0.0113, + "step": 424460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013495687968044046, + "loss": 0.0093, + "step": 424470 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134952991464069, + "loss": 0.0094, + "step": 424480 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349491032476975, + "loss": 0.0106, + "step": 424490 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013494521503132605, + "loss": 0.0098, + "step": 424500 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349413268149546, + "loss": 0.0104, + "step": 424510 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349374385985831, + "loss": 0.0105, + "step": 424520 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013493355038221165, + "loss": 0.0102, + "step": 424530 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349296621658402, + "loss": 0.0142, + "step": 424540 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013492577394946874, + "loss": 0.0098, + "step": 424550 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013492188573309725, + "loss": 0.0142, + "step": 424560 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349179975167258, + "loss": 0.0088, + "step": 424570 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013491410930035433, + "loss": 0.0119, + "step": 424580 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013491022108398287, + "loss": 0.0126, + "step": 424590 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001349063328676114, + "loss": 0.0084, + "step": 424600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013490244465123993, + "loss": 0.0092, + "step": 424610 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013489855643486847, + "loss": 0.0114, + "step": 424620 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013489466821849701, + "loss": 0.0101, + "step": 424630 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013489078000212553, + "loss": 0.0098, + "step": 424640 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348868917857541, + "loss": 0.0105, + "step": 424650 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348830035693826, + "loss": 0.0094, + "step": 424660 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013487911535301115, + "loss": 0.0091, + "step": 424670 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348752271366397, + "loss": 0.0117, + "step": 424680 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013487133892026824, + "loss": 0.0085, + "step": 424690 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013486745070389675, + "loss": 0.0096, + "step": 424700 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348635624875253, + "loss": 0.0092, + "step": 424710 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013485967427115383, + "loss": 0.0135, + "step": 424720 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013485578605478238, + "loss": 0.0113, + "step": 424730 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348518978384109, + "loss": 0.0111, + "step": 424740 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013484800962203943, + "loss": 0.0101, + "step": 424750 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013484412140566797, + "loss": 0.0111, + "step": 424760 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348402331892965, + "loss": 0.008, + "step": 424770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013483634497292503, + "loss": 0.0074, + "step": 424780 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013483245675655357, + "loss": 0.0113, + "step": 424790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013482856854018211, + "loss": 0.0114, + "step": 424800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013482468032381063, + "loss": 0.0102, + "step": 424810 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348207921074392, + "loss": 0.0133, + "step": 424820 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348169038910677, + "loss": 0.009, + "step": 424830 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013481301567469625, + "loss": 0.0101, + "step": 424840 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001348091274583248, + "loss": 0.0105, + "step": 424850 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013480523924195334, + "loss": 0.0143, + "step": 424860 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013480135102558185, + "loss": 0.0113, + "step": 424870 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347974628092104, + "loss": 0.0131, + "step": 424880 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013479357459283893, + "loss": 0.0131, + "step": 424890 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013478968637646748, + "loss": 0.0123, + "step": 424900 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134785798160096, + "loss": 0.012, + "step": 424910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013478190994372453, + "loss": 0.0137, + "step": 424920 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013477802172735307, + "loss": 0.0111, + "step": 424930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013477413351098162, + "loss": 0.0145, + "step": 424940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013477024529461013, + "loss": 0.0105, + "step": 424950 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013476635707823867, + "loss": 0.0157, + "step": 424960 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347624688618672, + "loss": 0.0083, + "step": 424970 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013475858064549575, + "loss": 0.0094, + "step": 424980 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347546924291243, + "loss": 0.0105, + "step": 424990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013475080421275284, + "loss": 0.0111, + "step": 425000 + }, + { + "epoch": 1.1, + "eval_cer": 0.8817292794249172, + "eval_loss": 0.007522050756961107, + "eval_runtime": 107.5853, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.647, + "step": 425000 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013474691599638135, + "loss": 0.0102, + "step": 425010 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347430277800099, + "loss": 0.0075, + "step": 425020 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013473913956363844, + "loss": 0.0116, + "step": 425030 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013473525134726695, + "loss": 0.0116, + "step": 425040 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347313631308955, + "loss": 0.0105, + "step": 425050 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013472747491452403, + "loss": 0.0097, + "step": 425060 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013472358669815258, + "loss": 0.0106, + "step": 425070 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001347196984817811, + "loss": 0.0115, + "step": 425080 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013471581026540963, + "loss": 0.0089, + "step": 425090 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013471192204903817, + "loss": 0.0121, + "step": 425100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013470803383266671, + "loss": 0.0117, + "step": 425110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013470414561629523, + "loss": 0.0117, + "step": 425120 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013470025739992377, + "loss": 0.0109, + "step": 425130 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346963691835523, + "loss": 0.0134, + "step": 425140 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013469248096718085, + "loss": 0.0124, + "step": 425150 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013468859275080937, + "loss": 0.012, + "step": 425160 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013468470453443794, + "loss": 0.0103, + "step": 425170 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013468081631806645, + "loss": 0.0102, + "step": 425180 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134676928101695, + "loss": 0.0112, + "step": 425190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013467303988532354, + "loss": 0.0091, + "step": 425200 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013466915166895208, + "loss": 0.0111, + "step": 425210 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346652634525806, + "loss": 0.0105, + "step": 425220 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013466137523620913, + "loss": 0.0122, + "step": 425230 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013465748701983767, + "loss": 0.0147, + "step": 425240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013465359880346622, + "loss": 0.0101, + "step": 425250 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013464971058709473, + "loss": 0.0099, + "step": 425260 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013464582237072327, + "loss": 0.0137, + "step": 425270 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013464193415435181, + "loss": 0.0115, + "step": 425280 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013463804593798033, + "loss": 0.0119, + "step": 425290 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013463415772160887, + "loss": 0.011, + "step": 425300 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346302695052374, + "loss": 0.0114, + "step": 425310 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013462638128886595, + "loss": 0.0097, + "step": 425320 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013462249307249447, + "loss": 0.0113, + "step": 425330 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013461860485612304, + "loss": 0.0113, + "step": 425340 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013461471663975155, + "loss": 0.0112, + "step": 425350 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001346108284233801, + "loss": 0.0128, + "step": 425360 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013460694020700863, + "loss": 0.0114, + "step": 425370 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013460305199063718, + "loss": 0.0106, + "step": 425380 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345991637742657, + "loss": 0.0103, + "step": 425390 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013459527555789423, + "loss": 0.0095, + "step": 425400 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013459138734152277, + "loss": 0.0111, + "step": 425410 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013458749912515132, + "loss": 0.0109, + "step": 425420 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013458361090877983, + "loss": 0.0119, + "step": 425430 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013457972269240837, + "loss": 0.0106, + "step": 425440 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013457583447603691, + "loss": 0.0164, + "step": 425450 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013457194625966546, + "loss": 0.0108, + "step": 425460 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013456805804329397, + "loss": 0.0121, + "step": 425470 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345641698269225, + "loss": 0.0179, + "step": 425480 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013456028161055105, + "loss": 0.01, + "step": 425490 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345563933941796, + "loss": 0.0112, + "step": 425500 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013455250517780814, + "loss": 0.0107, + "step": 425510 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013454861696143665, + "loss": 0.0124, + "step": 425520 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345447287450652, + "loss": 0.012, + "step": 425530 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013454084052869373, + "loss": 0.0106, + "step": 425540 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013453695231232228, + "loss": 0.0109, + "step": 425550 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001345330640959508, + "loss": 0.0087, + "step": 425560 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013452917587957933, + "loss": 0.0095, + "step": 425570 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013452528766320787, + "loss": 0.0125, + "step": 425580 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013452139944683642, + "loss": 0.0091, + "step": 425590 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013451751123046493, + "loss": 0.0138, + "step": 425600 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013451362301409347, + "loss": 0.0132, + "step": 425610 + }, + { + "epoch": 1.1, + "learning_rate": 0.000134509734797722, + "loss": 0.0207, + "step": 425620 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013450584658135055, + "loss": 0.0106, + "step": 425630 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013450195836497907, + "loss": 0.0119, + "step": 425640 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344980701486076, + "loss": 0.0146, + "step": 425650 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013449418193223615, + "loss": 0.0158, + "step": 425660 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344902937158647, + "loss": 0.0111, + "step": 425670 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344864054994932, + "loss": 0.0094, + "step": 425680 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013448251728312178, + "loss": 0.0098, + "step": 425690 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344786290667503, + "loss": 0.0112, + "step": 425700 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013447474085037883, + "loss": 0.0102, + "step": 425710 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013447085263400738, + "loss": 0.0146, + "step": 425720 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013446696441763592, + "loss": 0.0103, + "step": 425730 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013446307620126443, + "loss": 0.0112, + "step": 425740 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013445918798489297, + "loss": 0.012, + "step": 425750 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013445529976852151, + "loss": 0.0109, + "step": 425760 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013445141155215003, + "loss": 0.0128, + "step": 425770 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013444752333577857, + "loss": 0.0125, + "step": 425780 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344436351194071, + "loss": 0.0101, + "step": 425790 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013443974690303565, + "loss": 0.0091, + "step": 425800 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013443585868666417, + "loss": 0.0104, + "step": 425810 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344319704702927, + "loss": 0.0149, + "step": 425820 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013442808225392125, + "loss": 0.0106, + "step": 425830 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344241940375498, + "loss": 0.0111, + "step": 425840 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344203058211783, + "loss": 0.0111, + "step": 425850 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013441641760480688, + "loss": 0.0097, + "step": 425860 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001344125293884354, + "loss": 0.0087, + "step": 425870 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013440864117206393, + "loss": 0.0106, + "step": 425880 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013440475295569247, + "loss": 0.0099, + "step": 425890 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013440086473932102, + "loss": 0.0136, + "step": 425900 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013439697652294953, + "loss": 0.0106, + "step": 425910 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013439308830657807, + "loss": 0.0117, + "step": 425920 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013438920009020661, + "loss": 0.011, + "step": 425930 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013438531187383516, + "loss": 0.0112, + "step": 425940 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013438142365746367, + "loss": 0.0099, + "step": 425950 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343775354410922, + "loss": 0.0111, + "step": 425960 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013437364722472075, + "loss": 0.0096, + "step": 425970 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343697590083493, + "loss": 0.0128, + "step": 425980 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343658707919778, + "loss": 0.0134, + "step": 425990 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013436198257560635, + "loss": 0.0125, + "step": 426000 + }, + { + "epoch": 1.1, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.007685732562094927, + "eval_runtime": 107.9705, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 426000 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343580943592349, + "loss": 0.009, + "step": 426010 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343542061428634, + "loss": 0.0102, + "step": 426020 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013435031792649195, + "loss": 0.0105, + "step": 426030 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343464297101205, + "loss": 0.0089, + "step": 426040 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013434254149374903, + "loss": 0.0133, + "step": 426050 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013433865327737757, + "loss": 0.0111, + "step": 426060 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013433476506100612, + "loss": 0.0095, + "step": 426070 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013433087684463463, + "loss": 0.0142, + "step": 426080 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013432698862826317, + "loss": 0.0077, + "step": 426090 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013432310041189171, + "loss": 0.0102, + "step": 426100 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013431921219552026, + "loss": 0.0079, + "step": 426110 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013431532397914877, + "loss": 0.0128, + "step": 426120 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343114357627773, + "loss": 0.0141, + "step": 426130 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013430754754640585, + "loss": 0.0148, + "step": 426140 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001343036593300344, + "loss": 0.0076, + "step": 426150 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001342997711136629, + "loss": 0.0092, + "step": 426160 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013429588289729145, + "loss": 0.0122, + "step": 426170 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013429199468092, + "loss": 0.0154, + "step": 426180 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013428810646454853, + "loss": 0.0121, + "step": 426190 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013428421824817705, + "loss": 0.0095, + "step": 426200 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013428033003180562, + "loss": 0.0119, + "step": 426210 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013427644181543413, + "loss": 0.0135, + "step": 426220 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013427255359906267, + "loss": 0.0099, + "step": 426230 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013426866538269122, + "loss": 0.011, + "step": 426240 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013426477716631973, + "loss": 0.0129, + "step": 426250 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013426088894994827, + "loss": 0.0117, + "step": 426260 + }, + { + "epoch": 1.1, + "learning_rate": 0.0001342570007335768, + "loss": 0.0156, + "step": 426270 + }, + { + "epoch": 1.1, + "learning_rate": 0.00013425311251720535, + "loss": 0.0117, + "step": 426280 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013424922430083387, + "loss": 0.0125, + "step": 426290 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001342453360844624, + "loss": 0.0122, + "step": 426300 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013424144786809095, + "loss": 0.0155, + "step": 426310 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001342375596517195, + "loss": 0.0169, + "step": 426320 + }, + { + "epoch": 1.11, + "learning_rate": 0.000134233671435348, + "loss": 0.0137, + "step": 426330 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013422978321897655, + "loss": 0.0092, + "step": 426340 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001342258950026051, + "loss": 0.0126, + "step": 426350 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013422200678623363, + "loss": 0.0127, + "step": 426360 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013421811856986215, + "loss": 0.0112, + "step": 426370 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013421423035349072, + "loss": 0.0139, + "step": 426380 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013421034213711923, + "loss": 0.0098, + "step": 426390 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013420645392074777, + "loss": 0.0106, + "step": 426400 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013420256570437631, + "loss": 0.011, + "step": 426410 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013419867748800486, + "loss": 0.0104, + "step": 426420 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013419478927163337, + "loss": 0.0128, + "step": 426430 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341909010552619, + "loss": 0.0111, + "step": 426440 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013418701283889045, + "loss": 0.0156, + "step": 426450 + }, + { + "epoch": 1.11, + "learning_rate": 0.000134183124622519, + "loss": 0.0098, + "step": 426460 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341792364061475, + "loss": 0.0107, + "step": 426470 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013417534818977605, + "loss": 0.0101, + "step": 426480 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341714599734046, + "loss": 0.0128, + "step": 426490 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341675717570331, + "loss": 0.0122, + "step": 426500 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013416368354066165, + "loss": 0.0094, + "step": 426510 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341597953242902, + "loss": 0.0121, + "step": 426520 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013415590710791873, + "loss": 0.0123, + "step": 426530 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013415201889154725, + "loss": 0.0129, + "step": 426540 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341481306751758, + "loss": 0.0124, + "step": 426550 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013414424245880433, + "loss": 0.0091, + "step": 426560 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013414035424243287, + "loss": 0.0151, + "step": 426570 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013413646602606141, + "loss": 0.0147, + "step": 426580 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013413257780968996, + "loss": 0.0104, + "step": 426590 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013412868959331847, + "loss": 0.0104, + "step": 426600 + }, + { + "epoch": 1.11, + "learning_rate": 0.000134124801376947, + "loss": 0.0089, + "step": 426610 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013412091316057555, + "loss": 0.0141, + "step": 426620 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341170249442041, + "loss": 0.0096, + "step": 426630 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341131367278326, + "loss": 0.0108, + "step": 426640 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013410924851146115, + "loss": 0.0103, + "step": 426650 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001341053602950897, + "loss": 0.0132, + "step": 426660 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013410147207871823, + "loss": 0.0118, + "step": 426670 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013409758386234675, + "loss": 0.0111, + "step": 426680 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340936956459753, + "loss": 0.0093, + "step": 426690 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013408980742960383, + "loss": 0.0126, + "step": 426700 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013408591921323237, + "loss": 0.0091, + "step": 426710 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340820309968609, + "loss": 0.0073, + "step": 426720 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013407814278048946, + "loss": 0.0079, + "step": 426730 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013407425456411797, + "loss": 0.012, + "step": 426740 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013407036634774649, + "loss": 0.0106, + "step": 426750 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013406647813137506, + "loss": 0.0113, + "step": 426760 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013406258991500357, + "loss": 0.0109, + "step": 426770 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340587016986321, + "loss": 0.0131, + "step": 426780 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013405481348226065, + "loss": 0.0136, + "step": 426790 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340509252658892, + "loss": 0.0116, + "step": 426800 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340470370495177, + "loss": 0.0131, + "step": 426810 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013404314883314625, + "loss": 0.0145, + "step": 426820 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340392606167748, + "loss": 0.0107, + "step": 426830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013403537240040333, + "loss": 0.01, + "step": 426840 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013403148418403185, + "loss": 0.013, + "step": 426850 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340275959676604, + "loss": 0.0098, + "step": 426860 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013402370775128893, + "loss": 0.0081, + "step": 426870 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013401981953491747, + "loss": 0.009, + "step": 426880 + }, + { + "epoch": 1.11, + "learning_rate": 0.000134015931318546, + "loss": 0.011, + "step": 426890 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013401204310217456, + "loss": 0.0131, + "step": 426900 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013400815488580307, + "loss": 0.0125, + "step": 426910 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001340042666694316, + "loss": 0.0097, + "step": 426920 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013400037845306015, + "loss": 0.0118, + "step": 426930 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339964902366887, + "loss": 0.0129, + "step": 426940 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339926020203172, + "loss": 0.01, + "step": 426950 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013398871380394575, + "loss": 0.0107, + "step": 426960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339848255875743, + "loss": 0.0094, + "step": 426970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013398093737120284, + "loss": 0.0143, + "step": 426980 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013397704915483135, + "loss": 0.0142, + "step": 426990 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339731609384599, + "loss": 0.0135, + "step": 427000 + }, + { + "epoch": 1.11, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.007585541810840368, + "eval_runtime": 107.5996, + "eval_samples_per_second": 18.587, + "eval_steps_per_second": 4.647, + "step": 427000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013396927272208843, + "loss": 0.0115, + "step": 427010 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013396538450571695, + "loss": 0.0112, + "step": 427020 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339614962893455, + "loss": 0.0111, + "step": 427030 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013395760807297403, + "loss": 0.0109, + "step": 427040 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013395371985660257, + "loss": 0.0094, + "step": 427050 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339498316402311, + "loss": 0.0112, + "step": 427060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013394594342385963, + "loss": 0.0126, + "step": 427070 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013394205520748817, + "loss": 0.0137, + "step": 427080 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339381669911167, + "loss": 0.0127, + "step": 427090 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013393427877474525, + "loss": 0.0127, + "step": 427100 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339303905583738, + "loss": 0.0132, + "step": 427110 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339265023420023, + "loss": 0.0089, + "step": 427120 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013392261412563085, + "loss": 0.0097, + "step": 427130 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001339187259092594, + "loss": 0.0116, + "step": 427140 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013391483769288794, + "loss": 0.0109, + "step": 427150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013391094947651645, + "loss": 0.0101, + "step": 427160 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133907061260145, + "loss": 0.0113, + "step": 427170 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013390317304377353, + "loss": 0.0134, + "step": 427180 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013389928482740207, + "loss": 0.012, + "step": 427190 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338953966110306, + "loss": 0.0121, + "step": 427200 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013389150839465913, + "loss": 0.0115, + "step": 427210 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013388762017828767, + "loss": 0.0135, + "step": 427220 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013388373196191621, + "loss": 0.0126, + "step": 427230 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013387984374554473, + "loss": 0.0076, + "step": 427240 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013387595552917327, + "loss": 0.0115, + "step": 427250 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338720673128018, + "loss": 0.0099, + "step": 427260 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013386817909643033, + "loss": 0.009, + "step": 427270 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338642908800589, + "loss": 0.0136, + "step": 427280 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338604026636874, + "loss": 0.0144, + "step": 427290 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013385651444731595, + "loss": 0.0109, + "step": 427300 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338526262309445, + "loss": 0.0111, + "step": 427310 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013384873801457303, + "loss": 0.0114, + "step": 427320 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013384484979820155, + "loss": 0.0105, + "step": 427330 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338409615818301, + "loss": 0.0093, + "step": 427340 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013383707336545863, + "loss": 0.0096, + "step": 427350 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013383318514908717, + "loss": 0.0107, + "step": 427360 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338292969327157, + "loss": 0.015, + "step": 427370 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013382540871634423, + "loss": 0.0113, + "step": 427380 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013382152049997277, + "loss": 0.0099, + "step": 427390 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338176322836013, + "loss": 0.0105, + "step": 427400 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013381374406722983, + "loss": 0.013, + "step": 427410 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013380985585085837, + "loss": 0.0133, + "step": 427420 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001338059676344869, + "loss": 0.0149, + "step": 427430 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013380207941811545, + "loss": 0.0112, + "step": 427440 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133798191201744, + "loss": 0.0106, + "step": 427450 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013379430298537254, + "loss": 0.0102, + "step": 427460 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013379041476900105, + "loss": 0.0092, + "step": 427470 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337865265526296, + "loss": 0.0107, + "step": 427480 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013378263833625813, + "loss": 0.0103, + "step": 427490 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013377875011988665, + "loss": 0.0092, + "step": 427500 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337748619035152, + "loss": 0.0139, + "step": 427510 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013377097368714373, + "loss": 0.0194, + "step": 427520 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013376708547077227, + "loss": 0.0087, + "step": 427530 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337631972544008, + "loss": 0.0119, + "step": 427540 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013375930903802933, + "loss": 0.0089, + "step": 427550 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013375542082165787, + "loss": 0.0108, + "step": 427560 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337515326052864, + "loss": 0.0114, + "step": 427570 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013374764438891493, + "loss": 0.0108, + "step": 427580 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013374375617254347, + "loss": 0.0111, + "step": 427590 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133739867956172, + "loss": 0.0109, + "step": 427600 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013373597973980055, + "loss": 0.009, + "step": 427610 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013373209152342907, + "loss": 0.0128, + "step": 427620 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013372820330705764, + "loss": 0.0114, + "step": 427630 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013372431509068615, + "loss": 0.0097, + "step": 427640 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337204268743147, + "loss": 0.0129, + "step": 427650 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013371653865794323, + "loss": 0.0106, + "step": 427660 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013371265044157177, + "loss": 0.0099, + "step": 427670 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001337087622252003, + "loss": 0.0118, + "step": 427680 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013370487400882883, + "loss": 0.0078, + "step": 427690 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013370098579245737, + "loss": 0.0132, + "step": 427700 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013369709757608591, + "loss": 0.0107, + "step": 427710 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013369320935971443, + "loss": 0.0097, + "step": 427720 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013368932114334297, + "loss": 0.0121, + "step": 427730 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336854329269715, + "loss": 0.011, + "step": 427740 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013368154471060003, + "loss": 0.0091, + "step": 427750 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013367765649422857, + "loss": 0.0093, + "step": 427760 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336737682778571, + "loss": 0.0094, + "step": 427770 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013366988006148565, + "loss": 0.0095, + "step": 427780 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013366599184511417, + "loss": 0.0094, + "step": 427790 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013366210362874273, + "loss": 0.0143, + "step": 427800 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013365821541237125, + "loss": 0.0138, + "step": 427810 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336543271959998, + "loss": 0.0105, + "step": 427820 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013365043897962833, + "loss": 0.0092, + "step": 427830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013364655076325687, + "loss": 0.01, + "step": 427840 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336426625468854, + "loss": 0.012, + "step": 427850 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013363877433051393, + "loss": 0.0086, + "step": 427860 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013363488611414247, + "loss": 0.0114, + "step": 427870 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013363099789777101, + "loss": 0.0131, + "step": 427880 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013362710968139953, + "loss": 0.0105, + "step": 427890 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013362322146502807, + "loss": 0.0121, + "step": 427900 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336193332486566, + "loss": 0.0098, + "step": 427910 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013361544503228515, + "loss": 0.0106, + "step": 427920 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013361155681591367, + "loss": 0.0106, + "step": 427930 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001336076685995422, + "loss": 0.0109, + "step": 427940 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013360378038317075, + "loss": 0.012, + "step": 427950 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335998921667993, + "loss": 0.0112, + "step": 427960 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013359600395042783, + "loss": 0.0117, + "step": 427970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013359211573405638, + "loss": 0.0117, + "step": 427980 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335882275176849, + "loss": 0.0095, + "step": 427990 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013358433930131343, + "loss": 0.012, + "step": 428000 + }, + { + "epoch": 1.11, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.007801650557667017, + "eval_runtime": 107.5281, + "eval_samples_per_second": 18.6, + "eval_steps_per_second": 4.65, + "step": 428000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013358045108494197, + "loss": 0.0129, + "step": 428010 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335765628685705, + "loss": 0.0122, + "step": 428020 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013357267465219903, + "loss": 0.0098, + "step": 428030 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013356878643582757, + "loss": 0.0117, + "step": 428040 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335648982194561, + "loss": 0.011, + "step": 428050 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013356101000308463, + "loss": 0.0077, + "step": 428060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013355712178671317, + "loss": 0.0088, + "step": 428070 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335532335703417, + "loss": 0.011, + "step": 428080 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013354934535397025, + "loss": 0.0084, + "step": 428090 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013354545713759877, + "loss": 0.0117, + "step": 428100 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335415689212273, + "loss": 0.0096, + "step": 428110 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013353768070485585, + "loss": 0.0105, + "step": 428120 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335337924884844, + "loss": 0.0105, + "step": 428130 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001335299042721129, + "loss": 0.0099, + "step": 428140 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013352601605574148, + "loss": 0.0105, + "step": 428150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013352212783937, + "loss": 0.0118, + "step": 428160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013351823962299853, + "loss": 0.0111, + "step": 428170 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013351435140662707, + "loss": 0.0133, + "step": 428180 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013351046319025561, + "loss": 0.0111, + "step": 428190 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013350657497388413, + "loss": 0.0107, + "step": 428200 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013350268675751267, + "loss": 0.0152, + "step": 428210 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334987985411412, + "loss": 0.0153, + "step": 428220 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013349491032476975, + "loss": 0.0105, + "step": 428230 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013349102210839827, + "loss": 0.0135, + "step": 428240 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334871338920268, + "loss": 0.0108, + "step": 428250 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013348324567565535, + "loss": 0.0122, + "step": 428260 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013347935745928387, + "loss": 0.0118, + "step": 428270 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334754692429124, + "loss": 0.0106, + "step": 428280 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013347158102654095, + "loss": 0.0097, + "step": 428290 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334676928101695, + "loss": 0.0079, + "step": 428300 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133463804593798, + "loss": 0.0103, + "step": 428310 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013345991637742657, + "loss": 0.0221, + "step": 428320 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334560281610551, + "loss": 0.0112, + "step": 428330 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013345213994468363, + "loss": 0.0089, + "step": 428340 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013344825172831217, + "loss": 0.0085, + "step": 428350 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013344436351194071, + "loss": 0.011, + "step": 428360 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013344047529556923, + "loss": 0.0098, + "step": 428370 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013343658707919777, + "loss": 0.0087, + "step": 428380 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334326988628263, + "loss": 0.0105, + "step": 428390 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013342881064645485, + "loss": 0.0123, + "step": 428400 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013342492243008337, + "loss": 0.0099, + "step": 428410 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334210342137119, + "loss": 0.0113, + "step": 428420 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013341714599734045, + "loss": 0.0121, + "step": 428430 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133413257780969, + "loss": 0.0097, + "step": 428440 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334093695645975, + "loss": 0.0091, + "step": 428450 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013340548134822605, + "loss": 0.0145, + "step": 428460 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001334015931318546, + "loss": 0.0103, + "step": 428470 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013339770491548313, + "loss": 0.01, + "step": 428480 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013339381669911167, + "loss": 0.0132, + "step": 428490 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333899284827402, + "loss": 0.0103, + "step": 428500 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013338604026636873, + "loss": 0.0115, + "step": 428510 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013338215204999727, + "loss": 0.0107, + "step": 428520 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013337826383362581, + "loss": 0.0113, + "step": 428530 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013337437561725433, + "loss": 0.0123, + "step": 428540 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013337048740088287, + "loss": 0.0093, + "step": 428550 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333665991845114, + "loss": 0.0105, + "step": 428560 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013336271096813995, + "loss": 0.0122, + "step": 428570 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013335882275176847, + "loss": 0.0132, + "step": 428580 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133354934535397, + "loss": 0.0109, + "step": 428590 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013335104631902555, + "loss": 0.0137, + "step": 428600 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333471581026541, + "loss": 0.0135, + "step": 428610 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333432698862826, + "loss": 0.0103, + "step": 428620 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013333938166991115, + "loss": 0.0094, + "step": 428630 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333354934535397, + "loss": 0.0104, + "step": 428640 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013333160523716823, + "loss": 0.014, + "step": 428650 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013332771702079675, + "loss": 0.0112, + "step": 428660 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013332382880442532, + "loss": 0.0073, + "step": 428670 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013331994058805383, + "loss": 0.0142, + "step": 428680 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013331605237168237, + "loss": 0.0117, + "step": 428690 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333121641553109, + "loss": 0.0114, + "step": 428700 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013330827593893945, + "loss": 0.0109, + "step": 428710 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013330438772256797, + "loss": 0.0123, + "step": 428720 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001333004995061965, + "loss": 0.0111, + "step": 428730 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013329661128982505, + "loss": 0.0101, + "step": 428740 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013329272307345357, + "loss": 0.0089, + "step": 428750 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332888348570821, + "loss": 0.0127, + "step": 428760 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013328494664071065, + "loss": 0.0134, + "step": 428770 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332810584243392, + "loss": 0.0099, + "step": 428780 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332771702079677, + "loss": 0.0128, + "step": 428790 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013327328199159625, + "loss": 0.0088, + "step": 428800 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332693937752248, + "loss": 0.0098, + "step": 428810 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013326550555885333, + "loss": 0.0075, + "step": 428820 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013326161734248185, + "loss": 0.0127, + "step": 428830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013325772912611041, + "loss": 0.0122, + "step": 428840 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013325384090973893, + "loss": 0.0126, + "step": 428850 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013324995269336747, + "loss": 0.0093, + "step": 428860 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133246064476996, + "loss": 0.0105, + "step": 428870 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013324217626062455, + "loss": 0.0125, + "step": 428880 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013323828804425307, + "loss": 0.0107, + "step": 428890 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332343998278816, + "loss": 0.0136, + "step": 428900 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013323051161151015, + "loss": 0.011, + "step": 428910 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332266233951387, + "loss": 0.0086, + "step": 428920 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332227351787672, + "loss": 0.0124, + "step": 428930 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013321884696239575, + "loss": 0.0107, + "step": 428940 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332149587460243, + "loss": 0.0113, + "step": 428950 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013321107052965283, + "loss": 0.0123, + "step": 428960 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013320718231328135, + "loss": 0.0123, + "step": 428970 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001332032940969099, + "loss": 0.0124, + "step": 428980 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013319940588053843, + "loss": 0.0139, + "step": 428990 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013319551766416695, + "loss": 0.0133, + "step": 429000 + }, + { + "epoch": 1.11, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.007387722842395306, + "eval_runtime": 107.4783, + "eval_samples_per_second": 18.608, + "eval_steps_per_second": 4.652, + "step": 429000 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331916294477955, + "loss": 0.0122, + "step": 429010 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013318774123142403, + "loss": 0.01, + "step": 429020 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013318385301505257, + "loss": 0.0116, + "step": 429030 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331799647986811, + "loss": 0.0109, + "step": 429040 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013317607658230965, + "loss": 0.0122, + "step": 429050 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013317218836593817, + "loss": 0.0097, + "step": 429060 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331683001495667, + "loss": 0.0111, + "step": 429070 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013316441193319525, + "loss": 0.0142, + "step": 429080 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331605237168238, + "loss": 0.0139, + "step": 429090 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331566355004523, + "loss": 0.0125, + "step": 429100 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013315274728408085, + "loss": 0.011, + "step": 429110 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331488590677094, + "loss": 0.0124, + "step": 429120 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013314497085133793, + "loss": 0.0101, + "step": 429130 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013314108263496645, + "loss": 0.015, + "step": 429140 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133137194418595, + "loss": 0.0101, + "step": 429150 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013313330620222353, + "loss": 0.0129, + "step": 429160 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013312941798585207, + "loss": 0.0142, + "step": 429170 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331255297694806, + "loss": 0.0092, + "step": 429180 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013312164155310916, + "loss": 0.0106, + "step": 429190 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013311775333673767, + "loss": 0.0097, + "step": 429200 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331138651203662, + "loss": 0.0116, + "step": 429210 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013310997690399475, + "loss": 0.01, + "step": 429220 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013310608868762327, + "loss": 0.0091, + "step": 429230 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001331022004712518, + "loss": 0.0111, + "step": 429240 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013309831225488035, + "loss": 0.0108, + "step": 429250 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330944240385089, + "loss": 0.0103, + "step": 429260 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330905358221374, + "loss": 0.0117, + "step": 429270 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013308664760576595, + "loss": 0.0104, + "step": 429280 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330827593893945, + "loss": 0.0089, + "step": 429290 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013307887117302303, + "loss": 0.0112, + "step": 429300 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013307498295665155, + "loss": 0.0122, + "step": 429310 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330710947402801, + "loss": 0.013, + "step": 429320 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013306720652390863, + "loss": 0.0126, + "step": 429330 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013306331830753717, + "loss": 0.0094, + "step": 429340 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013305943009116569, + "loss": 0.0095, + "step": 429350 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013305554187479425, + "loss": 0.0122, + "step": 429360 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013305165365842277, + "loss": 0.0113, + "step": 429370 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330477654420513, + "loss": 0.0107, + "step": 429380 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013304387722567985, + "loss": 0.0138, + "step": 429390 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330399890093084, + "loss": 0.0109, + "step": 429400 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330361007929369, + "loss": 0.0111, + "step": 429410 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013303221257656545, + "loss": 0.0098, + "step": 429420 + }, + { + "epoch": 1.11, + "learning_rate": 0.000133028324360194, + "loss": 0.0109, + "step": 429430 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013302443614382253, + "loss": 0.0149, + "step": 429440 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013302054792745105, + "loss": 0.0096, + "step": 429450 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330166597110796, + "loss": 0.0101, + "step": 429460 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013301277149470813, + "loss": 0.0115, + "step": 429470 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013300888327833665, + "loss": 0.0117, + "step": 429480 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001330049950619652, + "loss": 0.0131, + "step": 429490 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013300110684559373, + "loss": 0.0085, + "step": 429500 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013299721862922227, + "loss": 0.0127, + "step": 429510 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013299333041285079, + "loss": 0.0107, + "step": 429520 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013298944219647933, + "loss": 0.0102, + "step": 429530 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013298555398010787, + "loss": 0.0123, + "step": 429540 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329816657637364, + "loss": 0.0095, + "step": 429550 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013297777754736495, + "loss": 0.0087, + "step": 429560 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329738893309935, + "loss": 0.0116, + "step": 429570 + }, + { + "epoch": 1.11, + "learning_rate": 0.000132970001114622, + "loss": 0.01, + "step": 429580 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013296611289825055, + "loss": 0.0098, + "step": 429590 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329622246818791, + "loss": 0.0083, + "step": 429600 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013295833646550763, + "loss": 0.013, + "step": 429610 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013295444824913615, + "loss": 0.0135, + "step": 429620 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329505600327647, + "loss": 0.013, + "step": 429630 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013294667181639323, + "loss": 0.01, + "step": 429640 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013294278360002177, + "loss": 0.0165, + "step": 429650 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329388953836503, + "loss": 0.0087, + "step": 429660 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013293500716727883, + "loss": 0.0119, + "step": 429670 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013293111895090737, + "loss": 0.0135, + "step": 429680 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329272307345359, + "loss": 0.0114, + "step": 429690 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013292334251816443, + "loss": 0.0129, + "step": 429700 + }, + { + "epoch": 1.11, + "learning_rate": 0.000132919454301793, + "loss": 0.0099, + "step": 429710 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329155660854215, + "loss": 0.0076, + "step": 429720 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013291167786905002, + "loss": 0.0121, + "step": 429730 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329077896526786, + "loss": 0.0084, + "step": 429740 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001329039014363071, + "loss": 0.0109, + "step": 429750 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013290001321993565, + "loss": 0.0086, + "step": 429760 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328961250035642, + "loss": 0.0153, + "step": 429770 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013289223678719273, + "loss": 0.0116, + "step": 429780 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013288834857082125, + "loss": 0.0095, + "step": 429790 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328844603544498, + "loss": 0.0177, + "step": 429800 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013288057213807833, + "loss": 0.0157, + "step": 429810 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013287668392170687, + "loss": 0.0118, + "step": 429820 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013287279570533539, + "loss": 0.0108, + "step": 429830 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013286890748896393, + "loss": 0.009, + "step": 429840 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013286501927259247, + "loss": 0.0138, + "step": 429850 + }, + { + "epoch": 1.11, + "learning_rate": 0.000132861131056221, + "loss": 0.0115, + "step": 429860 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013285724283984953, + "loss": 0.0095, + "step": 429870 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328533546234781, + "loss": 0.0112, + "step": 429880 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328494664071066, + "loss": 0.0109, + "step": 429890 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013284557819073515, + "loss": 0.0089, + "step": 429900 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328416899743637, + "loss": 0.0119, + "step": 429910 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013283780175799223, + "loss": 0.016, + "step": 429920 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013283391354162075, + "loss": 0.0147, + "step": 429930 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328300253252493, + "loss": 0.015, + "step": 429940 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013282613710887783, + "loss": 0.0123, + "step": 429950 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013282224889250637, + "loss": 0.012, + "step": 429960 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001328183606761349, + "loss": 0.0113, + "step": 429970 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013281447245976343, + "loss": 0.0128, + "step": 429980 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013281058424339197, + "loss": 0.011, + "step": 429990 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013280669602702049, + "loss": 0.0108, + "step": 430000 + }, + { + "epoch": 1.11, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.007531081326305866, + "eval_runtime": 107.5849, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.647, + "step": 430000 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013280280781064903, + "loss": 0.0092, + "step": 430010 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013279891959427757, + "loss": 0.0132, + "step": 430020 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327950313779061, + "loss": 0.0124, + "step": 430030 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013279114316153463, + "loss": 0.0084, + "step": 430040 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013278725494516317, + "loss": 0.0094, + "step": 430050 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327833667287917, + "loss": 0.0163, + "step": 430060 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013277947851242025, + "loss": 0.0102, + "step": 430070 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327755902960488, + "loss": 0.0117, + "step": 430080 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013277170207967733, + "loss": 0.0113, + "step": 430090 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013276781386330585, + "loss": 0.0085, + "step": 430100 + }, + { + "epoch": 1.11, + "learning_rate": 0.0001327639256469344, + "loss": 0.0147, + "step": 430110 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013276003743056293, + "loss": 0.0139, + "step": 430120 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013275614921419147, + "loss": 0.0114, + "step": 430130 + }, + { + "epoch": 1.11, + "learning_rate": 0.00013275226099782, + "loss": 0.0131, + "step": 430140 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013274837278144853, + "loss": 0.0093, + "step": 430150 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013274448456507707, + "loss": 0.0086, + "step": 430160 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327405963487056, + "loss": 0.0111, + "step": 430170 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013273670813233413, + "loss": 0.0106, + "step": 430180 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013273281991596267, + "loss": 0.0076, + "step": 430190 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327289316995912, + "loss": 0.0124, + "step": 430200 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013272504348321975, + "loss": 0.0148, + "step": 430210 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013272115526684827, + "loss": 0.0093, + "step": 430220 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001327172670504768, + "loss": 0.0111, + "step": 430230 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013271337883410535, + "loss": 0.0109, + "step": 430240 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013270949061773386, + "loss": 0.0114, + "step": 430250 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013270560240136243, + "loss": 0.0106, + "step": 430260 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013270171418499095, + "loss": 0.0105, + "step": 430270 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326978259686195, + "loss": 0.0095, + "step": 430280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013269393775224803, + "loss": 0.0093, + "step": 430290 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013269004953587657, + "loss": 0.0111, + "step": 430300 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326861613195051, + "loss": 0.0088, + "step": 430310 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013268227310313363, + "loss": 0.0115, + "step": 430320 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013267838488676217, + "loss": 0.0112, + "step": 430330 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326744966703907, + "loss": 0.0115, + "step": 430340 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013267060845401923, + "loss": 0.0099, + "step": 430350 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013266672023764777, + "loss": 0.0149, + "step": 430360 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326628320212763, + "loss": 0.0101, + "step": 430370 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013265894380490485, + "loss": 0.0133, + "step": 430380 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013265505558853337, + "loss": 0.014, + "step": 430390 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326511673721619, + "loss": 0.0124, + "step": 430400 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013264727915579045, + "loss": 0.0112, + "step": 430410 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132643390939419, + "loss": 0.013, + "step": 430420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013263950272304753, + "loss": 0.0098, + "step": 430430 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013263561450667607, + "loss": 0.0117, + "step": 430440 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326317262903046, + "loss": 0.0132, + "step": 430450 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013262783807393313, + "loss": 0.0094, + "step": 430460 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013262394985756167, + "loss": 0.0153, + "step": 430470 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013262006164119019, + "loss": 0.009, + "step": 430480 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013261617342481873, + "loss": 0.01, + "step": 430490 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013261228520844727, + "loss": 0.0119, + "step": 430500 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001326083969920758, + "loss": 0.015, + "step": 430510 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013260450877570433, + "loss": 0.0104, + "step": 430520 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013260062055933287, + "loss": 0.0154, + "step": 430530 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325967323429614, + "loss": 0.0092, + "step": 430540 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013259284412658995, + "loss": 0.0094, + "step": 430550 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013258895591021847, + "loss": 0.0099, + "step": 430560 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132585067693847, + "loss": 0.0094, + "step": 430570 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013258117947747555, + "loss": 0.0114, + "step": 430580 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325772912611041, + "loss": 0.009, + "step": 430590 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325734030447326, + "loss": 0.0141, + "step": 430600 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013256951482836117, + "loss": 0.0113, + "step": 430610 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325656266119897, + "loss": 0.0136, + "step": 430620 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013256173839561823, + "loss": 0.0085, + "step": 430630 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013255785017924677, + "loss": 0.0109, + "step": 430640 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325539619628753, + "loss": 0.0094, + "step": 430650 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013255007374650383, + "loss": 0.0128, + "step": 430660 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013254618553013237, + "loss": 0.0086, + "step": 430670 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325422973137609, + "loss": 0.011, + "step": 430680 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013253840909738945, + "loss": 0.0084, + "step": 430690 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013253452088101797, + "loss": 0.0123, + "step": 430700 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325306326646465, + "loss": 0.0107, + "step": 430710 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013252674444827505, + "loss": 0.0127, + "step": 430720 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013252285623190356, + "loss": 0.01, + "step": 430730 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325189680155321, + "loss": 0.0102, + "step": 430740 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013251507979916065, + "loss": 0.0098, + "step": 430750 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325111915827892, + "loss": 0.01, + "step": 430760 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001325073033664177, + "loss": 0.0105, + "step": 430770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013250341515004627, + "loss": 0.0103, + "step": 430780 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324995269336748, + "loss": 0.0099, + "step": 430790 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013249563871730333, + "loss": 0.0148, + "step": 430800 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013249175050093187, + "loss": 0.0131, + "step": 430810 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324878622845604, + "loss": 0.0128, + "step": 430820 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013248397406818893, + "loss": 0.0101, + "step": 430830 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013248008585181747, + "loss": 0.012, + "step": 430840 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132476197635446, + "loss": 0.0129, + "step": 430850 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013247230941907455, + "loss": 0.0117, + "step": 430860 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013246842120270307, + "loss": 0.0125, + "step": 430870 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324645329863316, + "loss": 0.0086, + "step": 430880 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013246064476996015, + "loss": 0.0084, + "step": 430890 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324567565535887, + "loss": 0.0109, + "step": 430900 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324528683372172, + "loss": 0.0105, + "step": 430910 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013244898012084575, + "loss": 0.0121, + "step": 430920 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324450919044743, + "loss": 0.0108, + "step": 430930 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013244120368810283, + "loss": 0.0142, + "step": 430940 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013243731547173137, + "loss": 0.0116, + "step": 430950 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013243342725535991, + "loss": 0.0109, + "step": 430960 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013242953903898843, + "loss": 0.0093, + "step": 430970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013242565082261697, + "loss": 0.0123, + "step": 430980 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324217626062455, + "loss": 0.0132, + "step": 430990 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013241787438987403, + "loss": 0.0104, + "step": 431000 + }, + { + "epoch": 1.12, + "eval_cer": 0.881719481966378, + "eval_loss": 0.007422698196023703, + "eval_runtime": 107.6404, + "eval_samples_per_second": 18.58, + "eval_steps_per_second": 4.645, + "step": 431000 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013241398617350257, + "loss": 0.0093, + "step": 431010 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001324100979571311, + "loss": 0.0085, + "step": 431020 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013240620974075965, + "loss": 0.0123, + "step": 431030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013240232152438817, + "loss": 0.0102, + "step": 431040 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323984333080167, + "loss": 0.0128, + "step": 431050 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013239454509164525, + "loss": 0.0095, + "step": 431060 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323906568752738, + "loss": 0.0105, + "step": 431070 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323867686589023, + "loss": 0.0103, + "step": 431080 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013238288044253085, + "loss": 0.0083, + "step": 431090 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323789922261594, + "loss": 0.0148, + "step": 431100 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013237510400978793, + "loss": 0.0108, + "step": 431110 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013237121579341644, + "loss": 0.0113, + "step": 431120 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132367327577045, + "loss": 0.009, + "step": 431130 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013236343936067353, + "loss": 0.0105, + "step": 431140 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013235955114430207, + "loss": 0.0095, + "step": 431150 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323556629279306, + "loss": 0.0112, + "step": 431160 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013235177471155915, + "loss": 0.0105, + "step": 431170 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013234788649518767, + "loss": 0.0133, + "step": 431180 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323439982788162, + "loss": 0.0109, + "step": 431190 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013234011006244475, + "loss": 0.0128, + "step": 431200 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013233622184607327, + "loss": 0.0114, + "step": 431210 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323323336297018, + "loss": 0.0106, + "step": 431220 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013232844541333035, + "loss": 0.0128, + "step": 431230 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323245571969589, + "loss": 0.0109, + "step": 431240 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323206689805874, + "loss": 0.0119, + "step": 431250 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013231678076421595, + "loss": 0.0104, + "step": 431260 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323128925478445, + "loss": 0.0119, + "step": 431270 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013230900433147303, + "loss": 0.0098, + "step": 431280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013230511611510154, + "loss": 0.0103, + "step": 431290 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001323012278987301, + "loss": 0.0091, + "step": 431300 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013229733968235863, + "loss": 0.0132, + "step": 431310 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013229345146598717, + "loss": 0.0103, + "step": 431320 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322895632496157, + "loss": 0.0112, + "step": 431330 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013228567503324425, + "loss": 0.0105, + "step": 431340 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013228178681687277, + "loss": 0.0094, + "step": 431350 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322778986005013, + "loss": 0.0124, + "step": 431360 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013227401038412985, + "loss": 0.009, + "step": 431370 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322701221677584, + "loss": 0.0106, + "step": 431380 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322662339513869, + "loss": 0.0118, + "step": 431390 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013226234573501545, + "loss": 0.0149, + "step": 431400 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132258457518644, + "loss": 0.0118, + "step": 431410 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013225456930227253, + "loss": 0.0135, + "step": 431420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013225068108590105, + "loss": 0.0135, + "step": 431430 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322467928695296, + "loss": 0.0113, + "step": 431440 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013224290465315813, + "loss": 0.0159, + "step": 431450 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013223901643678664, + "loss": 0.0099, + "step": 431460 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013223512822041518, + "loss": 0.0114, + "step": 431470 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013223124000404373, + "loss": 0.0115, + "step": 431480 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013222735178767227, + "loss": 0.0093, + "step": 431490 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322234635713008, + "loss": 0.0123, + "step": 431500 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013221957535492935, + "loss": 0.0087, + "step": 431510 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013221568713855787, + "loss": 0.0104, + "step": 431520 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322117989221864, + "loss": 0.0105, + "step": 431530 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013220791070581495, + "loss": 0.0111, + "step": 431540 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001322040224894435, + "loss": 0.0095, + "step": 431550 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132200134273072, + "loss": 0.0118, + "step": 431560 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013219624605670055, + "loss": 0.0107, + "step": 431570 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321923578403291, + "loss": 0.0117, + "step": 431580 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013218846962395763, + "loss": 0.0118, + "step": 431590 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013218458140758614, + "loss": 0.0117, + "step": 431600 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321806931912147, + "loss": 0.0094, + "step": 431610 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013217680497484323, + "loss": 0.0097, + "step": 431620 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013217291675847177, + "loss": 0.0112, + "step": 431630 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013216902854210028, + "loss": 0.012, + "step": 431640 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013216514032572885, + "loss": 0.0109, + "step": 431650 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013216125210935737, + "loss": 0.0111, + "step": 431660 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321573638929859, + "loss": 0.0114, + "step": 431670 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013215347567661445, + "loss": 0.0137, + "step": 431680 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132149587460243, + "loss": 0.0108, + "step": 431690 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321456992438715, + "loss": 0.0083, + "step": 431700 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013214181102750005, + "loss": 0.01, + "step": 431710 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321379228111286, + "loss": 0.0107, + "step": 431720 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321340345947571, + "loss": 0.0135, + "step": 431730 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013213014637838565, + "loss": 0.012, + "step": 431740 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001321262581620142, + "loss": 0.0097, + "step": 431750 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013212236994564273, + "loss": 0.0113, + "step": 431760 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013211848172927124, + "loss": 0.0121, + "step": 431770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013211459351289979, + "loss": 0.0108, + "step": 431780 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013211070529652833, + "loss": 0.0104, + "step": 431790 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013210681708015687, + "loss": 0.0099, + "step": 431800 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013210292886378538, + "loss": 0.0083, + "step": 431810 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013209904064741395, + "loss": 0.0097, + "step": 431820 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013209515243104247, + "loss": 0.011, + "step": 431830 + }, + { + "epoch": 1.12, + "learning_rate": 0.000132091264214671, + "loss": 0.0104, + "step": 431840 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013208737599829955, + "loss": 0.0105, + "step": 431850 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320834877819281, + "loss": 0.0125, + "step": 431860 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320795995655566, + "loss": 0.0127, + "step": 431870 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013207571134918515, + "loss": 0.0131, + "step": 431880 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320718231328137, + "loss": 0.013, + "step": 431890 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013206793491644223, + "loss": 0.0085, + "step": 431900 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013206404670007075, + "loss": 0.0102, + "step": 431910 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320601584836993, + "loss": 0.0111, + "step": 431920 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013205627026732783, + "loss": 0.0128, + "step": 431930 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013205238205095637, + "loss": 0.0107, + "step": 431940 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013204849383458489, + "loss": 0.0133, + "step": 431950 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013204460561821343, + "loss": 0.0127, + "step": 431960 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013204071740184197, + "loss": 0.0147, + "step": 431970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013203682918547048, + "loss": 0.0122, + "step": 431980 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013203294096909902, + "loss": 0.0154, + "step": 431990 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013202905275272757, + "loss": 0.0126, + "step": 432000 + }, + { + "epoch": 1.12, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.007582567632198334, + "eval_runtime": 107.5055, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, + "step": 432000 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320251645363561, + "loss": 0.0113, + "step": 432010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013202127631998465, + "loss": 0.0096, + "step": 432020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320173881036132, + "loss": 0.0113, + "step": 432030 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320134998872417, + "loss": 0.0116, + "step": 432040 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013200961167087025, + "loss": 0.0132, + "step": 432050 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001320057234544988, + "loss": 0.0098, + "step": 432060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013200183523812733, + "loss": 0.0099, + "step": 432070 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013199794702175585, + "loss": 0.0152, + "step": 432080 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319940588053844, + "loss": 0.0102, + "step": 432090 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013199017058901293, + "loss": 0.0114, + "step": 432100 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013198628237264147, + "loss": 0.0125, + "step": 432110 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013198239415626998, + "loss": 0.0135, + "step": 432120 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013197850593989853, + "loss": 0.0118, + "step": 432130 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013197461772352707, + "loss": 0.0122, + "step": 432140 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319707295071556, + "loss": 0.01, + "step": 432150 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013196684129078412, + "loss": 0.0138, + "step": 432160 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319629530744127, + "loss": 0.0121, + "step": 432170 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319590648580412, + "loss": 0.0182, + "step": 432180 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013195517664166975, + "loss": 0.0144, + "step": 432190 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319512884252983, + "loss": 0.0114, + "step": 432200 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319474002089268, + "loss": 0.0142, + "step": 432210 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013194351199255535, + "loss": 0.0086, + "step": 432220 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319396237761839, + "loss": 0.0146, + "step": 432230 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013193573555981243, + "loss": 0.0116, + "step": 432240 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013193184734344094, + "loss": 0.0117, + "step": 432250 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319279591270695, + "loss": 0.0091, + "step": 432260 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013192407091069803, + "loss": 0.0142, + "step": 432270 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013192018269432657, + "loss": 0.0149, + "step": 432280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013191629447795508, + "loss": 0.0137, + "step": 432290 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013191240626158363, + "loss": 0.0114, + "step": 432300 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013190851804521217, + "loss": 0.0094, + "step": 432310 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001319046298288407, + "loss": 0.0161, + "step": 432320 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013190074161246922, + "loss": 0.0083, + "step": 432330 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318968533960978, + "loss": 0.0113, + "step": 432340 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318929651797263, + "loss": 0.0089, + "step": 432350 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013188907696335485, + "loss": 0.0152, + "step": 432360 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318851887469834, + "loss": 0.0116, + "step": 432370 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013188130053061193, + "loss": 0.0115, + "step": 432380 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013187741231424045, + "loss": 0.0104, + "step": 432390 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131873524097869, + "loss": 0.0154, + "step": 432400 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013186963588149753, + "loss": 0.0108, + "step": 432410 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013186574766512607, + "loss": 0.0108, + "step": 432420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013186185944875459, + "loss": 0.014, + "step": 432430 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013185797123238313, + "loss": 0.0097, + "step": 432440 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013185408301601167, + "loss": 0.008, + "step": 432450 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013185019479964018, + "loss": 0.0114, + "step": 432460 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013184630658326873, + "loss": 0.013, + "step": 432470 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013184241836689727, + "loss": 0.01, + "step": 432480 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318385301505258, + "loss": 0.0087, + "step": 432490 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013183464193415432, + "loss": 0.011, + "step": 432500 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013183075371778286, + "loss": 0.0102, + "step": 432510 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318268655014114, + "loss": 0.011, + "step": 432520 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013182297728503995, + "loss": 0.0091, + "step": 432530 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318190890686685, + "loss": 0.0105, + "step": 432540 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013181520085229703, + "loss": 0.0125, + "step": 432550 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013181131263592555, + "loss": 0.0109, + "step": 432560 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001318074244195541, + "loss": 0.0151, + "step": 432570 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013180353620318263, + "loss": 0.0098, + "step": 432580 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013179964798681117, + "loss": 0.0103, + "step": 432590 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013179575977043969, + "loss": 0.0096, + "step": 432600 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013179187155406823, + "loss": 0.0109, + "step": 432610 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013178798333769677, + "loss": 0.0071, + "step": 432620 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317840951213253, + "loss": 0.0148, + "step": 432630 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013178020690495382, + "loss": 0.0115, + "step": 432640 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013177631868858237, + "loss": 0.016, + "step": 432650 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317724304722109, + "loss": 0.0133, + "step": 432660 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013176854225583945, + "loss": 0.0111, + "step": 432670 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013176465403946796, + "loss": 0.0123, + "step": 432680 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013176076582309653, + "loss": 0.0149, + "step": 432690 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013175687760672505, + "loss": 0.0127, + "step": 432700 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013175298939035356, + "loss": 0.0105, + "step": 432710 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013174910117398213, + "loss": 0.0104, + "step": 432720 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013174521295761065, + "loss": 0.011, + "step": 432730 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317413247412392, + "loss": 0.0105, + "step": 432740 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013173743652486773, + "loss": 0.0109, + "step": 432750 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013173354830849627, + "loss": 0.0099, + "step": 432760 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013172966009212478, + "loss": 0.0076, + "step": 432770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013172577187575333, + "loss": 0.0111, + "step": 432780 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013172188365938187, + "loss": 0.0119, + "step": 432790 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001317179954430104, + "loss": 0.0144, + "step": 432800 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013171410722663892, + "loss": 0.011, + "step": 432810 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013171021901026747, + "loss": 0.0094, + "step": 432820 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131706330793896, + "loss": 0.0097, + "step": 432830 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013170244257752455, + "loss": 0.0131, + "step": 432840 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013169855436115306, + "loss": 0.0112, + "step": 432850 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316946661447816, + "loss": 0.0139, + "step": 432860 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013169077792841015, + "loss": 0.0106, + "step": 432870 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316868897120387, + "loss": 0.0113, + "step": 432880 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013168300149566723, + "loss": 0.0121, + "step": 432890 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013167911327929577, + "loss": 0.0181, + "step": 432900 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013167522506292429, + "loss": 0.0156, + "step": 432910 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013167133684655283, + "loss": 0.011, + "step": 432920 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013166744863018137, + "loss": 0.0106, + "step": 432930 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316635604138099, + "loss": 0.0107, + "step": 432940 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013165967219743843, + "loss": 0.0119, + "step": 432950 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013165578398106697, + "loss": 0.0126, + "step": 432960 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316518957646955, + "loss": 0.0121, + "step": 432970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013164800754832402, + "loss": 0.0111, + "step": 432980 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013164411933195257, + "loss": 0.0116, + "step": 432990 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316402311155811, + "loss": 0.0123, + "step": 433000 + }, + { + "epoch": 1.12, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.0072698756121098995, + "eval_runtime": 107.5529, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, + "step": 433000 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013163634289920965, + "loss": 0.0104, + "step": 433010 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013163245468283816, + "loss": 0.0115, + "step": 433020 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316285664664667, + "loss": 0.0112, + "step": 433030 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013162467825009525, + "loss": 0.012, + "step": 433040 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316207900337238, + "loss": 0.0158, + "step": 433050 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001316169018173523, + "loss": 0.01, + "step": 433060 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013161301360098087, + "loss": 0.0142, + "step": 433070 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013160912538460939, + "loss": 0.0084, + "step": 433080 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013160523716823793, + "loss": 0.0111, + "step": 433090 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013160134895186647, + "loss": 0.0114, + "step": 433100 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131597460735495, + "loss": 0.0125, + "step": 433110 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013159357251912353, + "loss": 0.0112, + "step": 433120 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013158968430275207, + "loss": 0.0134, + "step": 433130 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315857960863806, + "loss": 0.0112, + "step": 433140 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013158190787000915, + "loss": 0.014, + "step": 433150 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013157801965363766, + "loss": 0.01, + "step": 433160 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315741314372662, + "loss": 0.0109, + "step": 433170 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013157024322089475, + "loss": 0.0117, + "step": 433180 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315663550045233, + "loss": 0.0147, + "step": 433190 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315624667881518, + "loss": 0.0109, + "step": 433200 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013155857857178035, + "loss": 0.0097, + "step": 433210 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315546903554089, + "loss": 0.0141, + "step": 433220 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315508021390374, + "loss": 0.0117, + "step": 433230 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013154691392266597, + "loss": 0.0148, + "step": 433240 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013154302570629449, + "loss": 0.0102, + "step": 433250 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013153913748992303, + "loss": 0.011, + "step": 433260 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013153524927355157, + "loss": 0.0123, + "step": 433270 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315313610571801, + "loss": 0.0098, + "step": 433280 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013152747284080862, + "loss": 0.0088, + "step": 433290 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013152358462443717, + "loss": 0.0094, + "step": 433300 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315196964080657, + "loss": 0.0122, + "step": 433310 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013151580819169425, + "loss": 0.009, + "step": 433320 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013151191997532276, + "loss": 0.0104, + "step": 433330 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315080317589513, + "loss": 0.011, + "step": 433340 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013150414354257985, + "loss": 0.0121, + "step": 433350 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001315002553262084, + "loss": 0.0105, + "step": 433360 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314963671098369, + "loss": 0.0087, + "step": 433370 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013149247889346545, + "loss": 0.0147, + "step": 433380 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131488590677094, + "loss": 0.0138, + "step": 433390 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013148470246072253, + "loss": 0.0132, + "step": 433400 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013148081424435107, + "loss": 0.0113, + "step": 433410 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314769260279796, + "loss": 0.014, + "step": 433420 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013147303781160813, + "loss": 0.0103, + "step": 433430 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013146914959523667, + "loss": 0.0134, + "step": 433440 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314652613788652, + "loss": 0.0119, + "step": 433450 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013146137316249372, + "loss": 0.0115, + "step": 433460 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013145748494612227, + "loss": 0.01, + "step": 433470 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314535967297508, + "loss": 0.0151, + "step": 433480 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013144970851337935, + "loss": 0.0105, + "step": 433490 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013144582029700786, + "loss": 0.011, + "step": 433500 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314419320806364, + "loss": 0.0128, + "step": 433510 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013143804386426495, + "loss": 0.0145, + "step": 433520 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314341556478935, + "loss": 0.0104, + "step": 433530 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131430267431522, + "loss": 0.0128, + "step": 433540 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013142637921515054, + "loss": 0.0097, + "step": 433550 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013142249099877909, + "loss": 0.0111, + "step": 433560 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013141860278240763, + "loss": 0.0113, + "step": 433570 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013141471456603614, + "loss": 0.0092, + "step": 433580 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001314108263496647, + "loss": 0.0106, + "step": 433590 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013140693813329323, + "loss": 0.011, + "step": 433600 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013140304991692177, + "loss": 0.0106, + "step": 433610 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313991617005503, + "loss": 0.0107, + "step": 433620 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013139527348417885, + "loss": 0.0109, + "step": 433630 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013139138526780737, + "loss": 0.0111, + "step": 433640 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313874970514359, + "loss": 0.0111, + "step": 433650 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013138360883506445, + "loss": 0.0139, + "step": 433660 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131379720618693, + "loss": 0.0138, + "step": 433670 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313758324023215, + "loss": 0.0126, + "step": 433680 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013137194418595005, + "loss": 0.0127, + "step": 433690 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313680559695786, + "loss": 0.0105, + "step": 433700 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313641677532071, + "loss": 0.0113, + "step": 433710 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013136027953683564, + "loss": 0.01, + "step": 433720 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013135639132046419, + "loss": 0.0105, + "step": 433730 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013135250310409273, + "loss": 0.0108, + "step": 433740 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013134861488772124, + "loss": 0.0106, + "step": 433750 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313447266713498, + "loss": 0.0095, + "step": 433760 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013134083845497833, + "loss": 0.0093, + "step": 433770 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013133695023860687, + "loss": 0.0089, + "step": 433780 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313330620222354, + "loss": 0.0107, + "step": 433790 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013132917380586395, + "loss": 0.0135, + "step": 433800 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013132528558949246, + "loss": 0.0118, + "step": 433810 + }, + { + "epoch": 1.12, + "learning_rate": 0.000131321397373121, + "loss": 0.0094, + "step": 433820 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013131750915674955, + "loss": 0.01, + "step": 433830 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313136209403781, + "loss": 0.0091, + "step": 433840 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313097327240066, + "loss": 0.0126, + "step": 433850 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013130584450763515, + "loss": 0.0136, + "step": 433860 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001313019562912637, + "loss": 0.0083, + "step": 433870 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013129806807489223, + "loss": 0.0107, + "step": 433880 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013129417985852074, + "loss": 0.0137, + "step": 433890 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013129029164214929, + "loss": 0.0109, + "step": 433900 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013128640342577783, + "loss": 0.0094, + "step": 433910 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013128251520940637, + "loss": 0.012, + "step": 433920 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001312786269930349, + "loss": 0.0125, + "step": 433930 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013127473877666342, + "loss": 0.011, + "step": 433940 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013127085056029197, + "loss": 0.0152, + "step": 433950 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001312669623439205, + "loss": 0.0104, + "step": 433960 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013126307412754905, + "loss": 0.0109, + "step": 433970 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013125918591117756, + "loss": 0.0133, + "step": 433980 + }, + { + "epoch": 1.12, + "learning_rate": 0.0001312552976948061, + "loss": 0.0126, + "step": 433990 + }, + { + "epoch": 1.12, + "learning_rate": 0.00013125140947843465, + "loss": 0.0104, + "step": 434000 + }, + { + "epoch": 1.12, + "eval_cer": 0.8817334783357197, + "eval_loss": 0.007528600748628378, + "eval_runtime": 107.4782, + "eval_samples_per_second": 18.608, + "eval_steps_per_second": 4.652, + "step": 434000 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312475212620632, + "loss": 0.0124, + "step": 434010 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312436330456917, + "loss": 0.0109, + "step": 434020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013123974482932025, + "loss": 0.0125, + "step": 434030 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312358566129488, + "loss": 0.0147, + "step": 434040 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013123196839657733, + "loss": 0.014, + "step": 434050 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013122808018020584, + "loss": 0.0158, + "step": 434060 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013122419196383438, + "loss": 0.0117, + "step": 434070 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013122030374746293, + "loss": 0.0135, + "step": 434080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013121641553109147, + "loss": 0.0116, + "step": 434090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013121252731471998, + "loss": 0.0102, + "step": 434100 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013120863909834855, + "loss": 0.0103, + "step": 434110 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013120475088197707, + "loss": 0.0127, + "step": 434120 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001312008626656056, + "loss": 0.0122, + "step": 434130 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013119697444923415, + "loss": 0.0131, + "step": 434140 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311930862328627, + "loss": 0.0094, + "step": 434150 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311891980164912, + "loss": 0.0115, + "step": 434160 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013118530980011975, + "loss": 0.0125, + "step": 434170 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311814215837483, + "loss": 0.0123, + "step": 434180 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311775333673768, + "loss": 0.0129, + "step": 434190 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013117364515100534, + "loss": 0.012, + "step": 434200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013116975693463389, + "loss": 0.0117, + "step": 434210 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013116586871826243, + "loss": 0.0117, + "step": 434220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013116198050189094, + "loss": 0.0108, + "step": 434230 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013115809228551948, + "loss": 0.0112, + "step": 434240 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013115420406914803, + "loss": 0.0106, + "step": 434250 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013115031585277657, + "loss": 0.0093, + "step": 434260 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013114642763640508, + "loss": 0.0105, + "step": 434270 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013114253942003365, + "loss": 0.0142, + "step": 434280 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013113865120366217, + "loss": 0.0136, + "step": 434290 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311347629872907, + "loss": 0.0104, + "step": 434300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013113087477091925, + "loss": 0.0129, + "step": 434310 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311269865545478, + "loss": 0.009, + "step": 434320 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311230983381763, + "loss": 0.0111, + "step": 434330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013111921012180485, + "loss": 0.0152, + "step": 434340 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001311153219054334, + "loss": 0.01, + "step": 434350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013111143368906193, + "loss": 0.0089, + "step": 434360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013110754547269044, + "loss": 0.0097, + "step": 434370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013110365725631899, + "loss": 0.0097, + "step": 434380 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013109976903994753, + "loss": 0.013, + "step": 434390 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013109588082357607, + "loss": 0.0118, + "step": 434400 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013109199260720458, + "loss": 0.011, + "step": 434410 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013108810439083312, + "loss": 0.0097, + "step": 434420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013108421617446167, + "loss": 0.0163, + "step": 434430 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013108032795809018, + "loss": 0.0118, + "step": 434440 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013107643974171872, + "loss": 0.0143, + "step": 434450 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013107255152534726, + "loss": 0.009, + "step": 434460 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310686633089758, + "loss": 0.0138, + "step": 434470 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013106477509260435, + "loss": 0.0099, + "step": 434480 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310608868762329, + "loss": 0.0105, + "step": 434490 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310569986598614, + "loss": 0.0129, + "step": 434500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013105311044348995, + "loss": 0.0128, + "step": 434510 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310492222271185, + "loss": 0.0168, + "step": 434520 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013104533401074703, + "loss": 0.0144, + "step": 434530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013104144579437554, + "loss": 0.0075, + "step": 434540 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013103755757800408, + "loss": 0.0189, + "step": 434550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013103366936163263, + "loss": 0.0122, + "step": 434560 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013102978114526117, + "loss": 0.01, + "step": 434570 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013102589292888968, + "loss": 0.0125, + "step": 434580 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013102200471251822, + "loss": 0.0094, + "step": 434590 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013101811649614677, + "loss": 0.0141, + "step": 434600 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310142282797753, + "loss": 0.0111, + "step": 434610 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013101034006340382, + "loss": 0.0106, + "step": 434620 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310064518470324, + "loss": 0.0115, + "step": 434630 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001310025636306609, + "loss": 0.0119, + "step": 434640 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013099867541428945, + "loss": 0.0135, + "step": 434650 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130994787197918, + "loss": 0.0132, + "step": 434660 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013099089898154653, + "loss": 0.0118, + "step": 434670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013098701076517504, + "loss": 0.0115, + "step": 434680 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309831225488036, + "loss": 0.0095, + "step": 434690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013097923433243213, + "loss": 0.0135, + "step": 434700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013097534611606064, + "loss": 0.0116, + "step": 434710 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013097145789968918, + "loss": 0.0111, + "step": 434720 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013096756968331773, + "loss": 0.0104, + "step": 434730 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013096368146694627, + "loss": 0.0103, + "step": 434740 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013095979325057478, + "loss": 0.0094, + "step": 434750 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013095590503420332, + "loss": 0.0107, + "step": 434760 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013095201681783187, + "loss": 0.0087, + "step": 434770 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309481286014604, + "loss": 0.0136, + "step": 434780 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013094424038508892, + "loss": 0.0113, + "step": 434790 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309403521687175, + "loss": 0.0123, + "step": 434800 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130936463952346, + "loss": 0.0138, + "step": 434810 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013093257573597455, + "loss": 0.0105, + "step": 434820 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001309286875196031, + "loss": 0.0095, + "step": 434830 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013092479930323163, + "loss": 0.0091, + "step": 434840 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013092091108686014, + "loss": 0.0108, + "step": 434850 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013091702287048869, + "loss": 0.0103, + "step": 434860 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013091313465411723, + "loss": 0.0103, + "step": 434870 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013090924643774577, + "loss": 0.0116, + "step": 434880 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013090535822137428, + "loss": 0.0085, + "step": 434890 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013090147000500283, + "loss": 0.0131, + "step": 434900 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013089758178863137, + "loss": 0.0096, + "step": 434910 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308936935722599, + "loss": 0.0143, + "step": 434920 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013088980535588842, + "loss": 0.0158, + "step": 434930 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013088591713951696, + "loss": 0.0126, + "step": 434940 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308820289231455, + "loss": 0.0105, + "step": 434950 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013087814070677402, + "loss": 0.007, + "step": 434960 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013087425249040256, + "loss": 0.0143, + "step": 434970 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308703642740311, + "loss": 0.0103, + "step": 434980 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013086647605765965, + "loss": 0.0142, + "step": 434990 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308625878412882, + "loss": 0.0142, + "step": 435000 + }, + { + "epoch": 1.13, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.007556126918643713, + "eval_runtime": 107.935, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.632, + "step": 435000 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013085869962491673, + "loss": 0.0123, + "step": 435010 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013085481140854524, + "loss": 0.0085, + "step": 435020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013085092319217379, + "loss": 0.014, + "step": 435030 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013084703497580233, + "loss": 0.0111, + "step": 435040 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013084314675943087, + "loss": 0.0114, + "step": 435050 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013083925854305938, + "loss": 0.0089, + "step": 435060 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013083537032668792, + "loss": 0.0106, + "step": 435070 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013083148211031647, + "loss": 0.0092, + "step": 435080 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130827593893945, + "loss": 0.0124, + "step": 435090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013082370567757352, + "loss": 0.0149, + "step": 435100 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013081981746120206, + "loss": 0.0098, + "step": 435110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001308159292448306, + "loss": 0.0104, + "step": 435120 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013081204102845915, + "loss": 0.0115, + "step": 435130 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013080815281208766, + "loss": 0.01, + "step": 435140 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013080426459571623, + "loss": 0.01, + "step": 435150 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013080037637934475, + "loss": 0.0099, + "step": 435160 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307964881629733, + "loss": 0.0108, + "step": 435170 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013079259994660183, + "loss": 0.0085, + "step": 435180 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013078871173023034, + "loss": 0.0119, + "step": 435190 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013078482351385888, + "loss": 0.0134, + "step": 435200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013078093529748743, + "loss": 0.0187, + "step": 435210 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013077704708111597, + "loss": 0.0138, + "step": 435220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013077315886474448, + "loss": 0.012, + "step": 435230 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013076927064837302, + "loss": 0.0239, + "step": 435240 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013076538243200157, + "loss": 0.0131, + "step": 435250 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307614942156301, + "loss": 0.0108, + "step": 435260 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013075760599925862, + "loss": 0.0128, + "step": 435270 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013075371778288716, + "loss": 0.015, + "step": 435280 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307498295665157, + "loss": 0.0097, + "step": 435290 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013074594135014425, + "loss": 0.0085, + "step": 435300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013074205313377276, + "loss": 0.0103, + "step": 435310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013073816491740133, + "loss": 0.0157, + "step": 435320 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013073427670102984, + "loss": 0.0266, + "step": 435330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013073038848465839, + "loss": 0.0214, + "step": 435340 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013072650026828693, + "loss": 0.0147, + "step": 435350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013072261205191547, + "loss": 0.0114, + "step": 435360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013071872383554398, + "loss": 0.0088, + "step": 435370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013071483561917253, + "loss": 0.0128, + "step": 435380 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013071094740280107, + "loss": 0.018, + "step": 435390 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001307070591864296, + "loss": 0.0095, + "step": 435400 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013070317097005812, + "loss": 0.0111, + "step": 435410 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013069928275368667, + "loss": 0.0098, + "step": 435420 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306953945373152, + "loss": 0.0138, + "step": 435430 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013069150632094372, + "loss": 0.0126, + "step": 435440 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013068761810457226, + "loss": 0.012, + "step": 435450 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306837298882008, + "loss": 0.0107, + "step": 435460 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013067984167182935, + "loss": 0.0114, + "step": 435470 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013067595345545786, + "loss": 0.0129, + "step": 435480 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306720652390864, + "loss": 0.0131, + "step": 435490 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013066817702271494, + "loss": 0.0129, + "step": 435500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013066428880634349, + "loss": 0.0119, + "step": 435510 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013066040058997203, + "loss": 0.0121, + "step": 435520 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013065651237360057, + "loss": 0.0106, + "step": 435530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013065262415722908, + "loss": 0.0098, + "step": 435540 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013064873594085763, + "loss": 0.0117, + "step": 435550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013064484772448617, + "loss": 0.0131, + "step": 435560 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306409595081147, + "loss": 0.0116, + "step": 435570 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013063707129174322, + "loss": 0.0124, + "step": 435580 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013063318307537176, + "loss": 0.0104, + "step": 435590 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306292948590003, + "loss": 0.0134, + "step": 435600 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013062540664262885, + "loss": 0.0086, + "step": 435610 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013062151842625736, + "loss": 0.0086, + "step": 435620 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306176302098859, + "loss": 0.0154, + "step": 435630 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013061374199351445, + "loss": 0.0098, + "step": 435640 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130609853777143, + "loss": 0.013, + "step": 435650 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001306059655607715, + "loss": 0.0123, + "step": 435660 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013060207734440007, + "loss": 0.0112, + "step": 435670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013059818912802859, + "loss": 0.0124, + "step": 435680 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305943009116571, + "loss": 0.0158, + "step": 435690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013059041269528567, + "loss": 0.0115, + "step": 435700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013058652447891418, + "loss": 0.0153, + "step": 435710 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013058263626254272, + "loss": 0.0124, + "step": 435720 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013057874804617127, + "loss": 0.0093, + "step": 435730 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305748598297998, + "loss": 0.011, + "step": 435740 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013057097161342832, + "loss": 0.0113, + "step": 435750 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013056708339705686, + "loss": 0.0117, + "step": 435760 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305631951806854, + "loss": 0.0102, + "step": 435770 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013055930696431395, + "loss": 0.0128, + "step": 435780 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013055541874794246, + "loss": 0.0093, + "step": 435790 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130551530531571, + "loss": 0.0109, + "step": 435800 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013054764231519955, + "loss": 0.0116, + "step": 435810 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305437540988281, + "loss": 0.0201, + "step": 435820 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305398658824566, + "loss": 0.0126, + "step": 435830 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013053597766608514, + "loss": 0.0138, + "step": 435840 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013053208944971368, + "loss": 0.0118, + "step": 435850 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013052820123334223, + "loss": 0.0119, + "step": 435860 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013052431301697077, + "loss": 0.0088, + "step": 435870 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305204248005993, + "loss": 0.0101, + "step": 435880 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013051653658422782, + "loss": 0.0092, + "step": 435890 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013051264836785637, + "loss": 0.0092, + "step": 435900 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001305087601514849, + "loss": 0.0247, + "step": 435910 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013050487193511345, + "loss": 0.0105, + "step": 435920 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013050098371874196, + "loss": 0.0089, + "step": 435930 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304970955023705, + "loss": 0.0091, + "step": 435940 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013049320728599905, + "loss": 0.0141, + "step": 435950 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013048931906962756, + "loss": 0.0117, + "step": 435960 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304854308532561, + "loss": 0.0121, + "step": 435970 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013048154263688464, + "loss": 0.0117, + "step": 435980 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013047765442051319, + "loss": 0.0098, + "step": 435990 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304737662041417, + "loss": 0.0133, + "step": 436000 + }, + { + "epoch": 1.13, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.007555661257356405, + "eval_runtime": 107.5039, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, + "step": 436000 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013046987798777024, + "loss": 0.0105, + "step": 436010 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013046598977139878, + "loss": 0.0112, + "step": 436020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013046210155502733, + "loss": 0.0091, + "step": 436030 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013045821333865584, + "loss": 0.0123, + "step": 436040 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304543251222844, + "loss": 0.0092, + "step": 436050 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013045043690591292, + "loss": 0.0114, + "step": 436060 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013044654868954147, + "loss": 0.0106, + "step": 436070 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013044266047317, + "loss": 0.0103, + "step": 436080 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013043877225679855, + "loss": 0.0115, + "step": 436090 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013043488404042706, + "loss": 0.0082, + "step": 436100 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304309958240556, + "loss": 0.01, + "step": 436110 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013042710760768415, + "loss": 0.0144, + "step": 436120 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304232193913127, + "loss": 0.0134, + "step": 436130 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001304193311749412, + "loss": 0.0102, + "step": 436140 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013041544295856974, + "loss": 0.0113, + "step": 436150 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013041155474219829, + "loss": 0.009, + "step": 436160 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013040766652582683, + "loss": 0.0119, + "step": 436170 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013040377830945534, + "loss": 0.0096, + "step": 436180 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013039989009308388, + "loss": 0.0156, + "step": 436190 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013039600187671243, + "loss": 0.0111, + "step": 436200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013039211366034094, + "loss": 0.0132, + "step": 436210 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303882254439695, + "loss": 0.0107, + "step": 436220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013038433722759802, + "loss": 0.0095, + "step": 436230 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013038044901122656, + "loss": 0.0117, + "step": 436240 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303765607948551, + "loss": 0.0095, + "step": 436250 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013037267257848365, + "loss": 0.0146, + "step": 436260 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013036878436211216, + "loss": 0.0114, + "step": 436270 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303648961457407, + "loss": 0.0121, + "step": 436280 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013036100792936925, + "loss": 0.0109, + "step": 436290 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303571197129978, + "loss": 0.0143, + "step": 436300 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303532314966263, + "loss": 0.0101, + "step": 436310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013034934328025484, + "loss": 0.0122, + "step": 436320 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013034545506388339, + "loss": 0.011, + "step": 436330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013034156684751193, + "loss": 0.0088, + "step": 436340 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013033767863114044, + "loss": 0.015, + "step": 436350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013033379041476898, + "loss": 0.0115, + "step": 436360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013032990219839752, + "loss": 0.0121, + "step": 436370 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013032601398202607, + "loss": 0.014, + "step": 436380 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303221257656546, + "loss": 0.0133, + "step": 436390 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013031823754928315, + "loss": 0.0103, + "step": 436400 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013031434933291166, + "loss": 0.0095, + "step": 436410 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001303104611165402, + "loss": 0.0108, + "step": 436420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013030657290016875, + "loss": 0.0091, + "step": 436430 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013030268468379726, + "loss": 0.01, + "step": 436440 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302987964674258, + "loss": 0.0111, + "step": 436450 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013029490825105435, + "loss": 0.0132, + "step": 436460 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302910200346829, + "loss": 0.0146, + "step": 436470 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302871318183114, + "loss": 0.0099, + "step": 436480 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013028324360193994, + "loss": 0.0113, + "step": 436490 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013027935538556848, + "loss": 0.0113, + "step": 436500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013027546716919703, + "loss": 0.025, + "step": 436510 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013027157895282554, + "loss": 0.0114, + "step": 436520 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013026769073645408, + "loss": 0.0107, + "step": 436530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013026380252008262, + "loss": 0.0093, + "step": 436540 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013025991430371117, + "loss": 0.0113, + "step": 436550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013025602608733968, + "loss": 0.013, + "step": 436560 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013025213787096825, + "loss": 0.0129, + "step": 436570 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013024824965459676, + "loss": 0.0074, + "step": 436580 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302443614382253, + "loss": 0.016, + "step": 436590 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013024047322185385, + "loss": 0.0109, + "step": 436600 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302365850054824, + "loss": 0.0151, + "step": 436610 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001302326967891109, + "loss": 0.0119, + "step": 436620 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013022880857273944, + "loss": 0.0101, + "step": 436630 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013022492035636799, + "loss": 0.0126, + "step": 436640 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013022103213999653, + "loss": 0.0124, + "step": 436650 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013021714392362504, + "loss": 0.0105, + "step": 436660 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013021325570725358, + "loss": 0.0103, + "step": 436670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013020936749088213, + "loss": 0.0115, + "step": 436680 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013020547927451064, + "loss": 0.014, + "step": 436690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013020159105813918, + "loss": 0.0138, + "step": 436700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013019770284176772, + "loss": 0.0305, + "step": 436710 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013019381462539627, + "loss": 0.0112, + "step": 436720 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013018992640902478, + "loss": 0.0117, + "step": 436730 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013018603819265335, + "loss": 0.011, + "step": 436740 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013018214997628186, + "loss": 0.0111, + "step": 436750 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301782617599104, + "loss": 0.0097, + "step": 436760 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013017437354353895, + "loss": 0.0162, + "step": 436770 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301704853271675, + "loss": 0.0117, + "step": 436780 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130166597110796, + "loss": 0.0116, + "step": 436790 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013016270889442454, + "loss": 0.0094, + "step": 436800 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013015882067805309, + "loss": 0.0096, + "step": 436810 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013015493246168163, + "loss": 0.0092, + "step": 436820 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013015104424531014, + "loss": 0.0098, + "step": 436830 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013014715602893868, + "loss": 0.0107, + "step": 436840 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013014326781256723, + "loss": 0.0103, + "step": 436850 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013013937959619577, + "loss": 0.0092, + "step": 436860 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013013549137982428, + "loss": 0.0124, + "step": 436870 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013013160316345282, + "loss": 0.0113, + "step": 436880 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013012771494708136, + "loss": 0.0114, + "step": 436890 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301238267307099, + "loss": 0.0112, + "step": 436900 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013011993851433845, + "loss": 0.0175, + "step": 436910 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013011605029796696, + "loss": 0.0118, + "step": 436920 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301121620815955, + "loss": 0.0118, + "step": 436930 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013010827386522405, + "loss": 0.0128, + "step": 436940 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301043856488526, + "loss": 0.0083, + "step": 436950 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001301004974324811, + "loss": 0.0137, + "step": 436960 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013009660921610964, + "loss": 0.0101, + "step": 436970 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013009272099973819, + "loss": 0.0151, + "step": 436980 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013008883278336673, + "loss": 0.0092, + "step": 436990 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013008494456699524, + "loss": 0.0111, + "step": 437000 + }, + { + "epoch": 1.13, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.007372898980975151, + "eval_runtime": 107.4604, + "eval_samples_per_second": 18.612, + "eval_steps_per_second": 4.653, + "step": 437000 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013008105635062378, + "loss": 0.0105, + "step": 437010 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013007716813425232, + "loss": 0.0099, + "step": 437020 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013007327991788087, + "loss": 0.0135, + "step": 437030 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013006939170150938, + "loss": 0.0106, + "step": 437040 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013006550348513792, + "loss": 0.0103, + "step": 437050 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013006161526876646, + "loss": 0.0108, + "step": 437060 + }, + { + "epoch": 1.13, + "learning_rate": 0.000130057727052395, + "loss": 0.0107, + "step": 437070 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013005383883602352, + "loss": 0.0159, + "step": 437080 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300499506196521, + "loss": 0.0108, + "step": 437090 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300460624032806, + "loss": 0.0128, + "step": 437100 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013004217418690915, + "loss": 0.0092, + "step": 437110 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001300382859705377, + "loss": 0.0106, + "step": 437120 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013003439775416623, + "loss": 0.0124, + "step": 437130 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013003050953779474, + "loss": 0.0121, + "step": 437140 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013002662132142328, + "loss": 0.0115, + "step": 437150 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013002273310505183, + "loss": 0.0091, + "step": 437160 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013001884488868034, + "loss": 0.0091, + "step": 437170 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013001495667230888, + "loss": 0.0107, + "step": 437180 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013001106845593742, + "loss": 0.0112, + "step": 437190 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013000718023956597, + "loss": 0.0155, + "step": 437200 + }, + { + "epoch": 1.13, + "learning_rate": 0.00013000329202319448, + "loss": 0.0108, + "step": 437210 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012999940380682302, + "loss": 0.0127, + "step": 437220 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012999551559045156, + "loss": 0.0095, + "step": 437230 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299916273740801, + "loss": 0.0117, + "step": 437240 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012998773915770862, + "loss": 0.0114, + "step": 437250 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299838509413372, + "loss": 0.0098, + "step": 437260 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299799627249657, + "loss": 0.0116, + "step": 437270 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012997607450859424, + "loss": 0.0145, + "step": 437280 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012997218629222279, + "loss": 0.01, + "step": 437290 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012996829807585133, + "loss": 0.0097, + "step": 437300 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012996440985947984, + "loss": 0.009, + "step": 437310 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012996052164310838, + "loss": 0.0123, + "step": 437320 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012995663342673693, + "loss": 0.0117, + "step": 437330 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012995274521036547, + "loss": 0.0095, + "step": 437340 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012994885699399398, + "loss": 0.0092, + "step": 437350 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012994496877762252, + "loss": 0.0128, + "step": 437360 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012994108056125106, + "loss": 0.01, + "step": 437370 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299371923448796, + "loss": 0.0095, + "step": 437380 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012993330412850812, + "loss": 0.0117, + "step": 437390 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012992941591213666, + "loss": 0.0088, + "step": 437400 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299255276957652, + "loss": 0.0097, + "step": 437410 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012992163947939372, + "loss": 0.0111, + "step": 437420 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012991775126302226, + "loss": 0.0086, + "step": 437430 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001299138630466508, + "loss": 0.008, + "step": 437440 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012990997483027934, + "loss": 0.0089, + "step": 437450 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012990608661390789, + "loss": 0.0084, + "step": 437460 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012990219839753643, + "loss": 0.0134, + "step": 437470 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012989831018116494, + "loss": 0.0092, + "step": 437480 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012989442196479348, + "loss": 0.0119, + "step": 437490 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012989053374842202, + "loss": 0.0132, + "step": 437500 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012988664553205057, + "loss": 0.0121, + "step": 437510 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012988275731567908, + "loss": 0.0096, + "step": 437520 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012987886909930762, + "loss": 0.01, + "step": 437530 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012987498088293616, + "loss": 0.0111, + "step": 437540 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298710926665647, + "loss": 0.0105, + "step": 437550 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012986720445019322, + "loss": 0.0276, + "step": 437560 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012986331623382176, + "loss": 0.0106, + "step": 437570 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298594280174503, + "loss": 0.0104, + "step": 437580 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012985553980107885, + "loss": 0.0125, + "step": 437590 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012985165158470736, + "loss": 0.0111, + "step": 437600 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012984776336833593, + "loss": 0.011, + "step": 437610 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012984387515196444, + "loss": 0.0089, + "step": 437620 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012983998693559298, + "loss": 0.0104, + "step": 437630 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012983609871922153, + "loss": 0.0118, + "step": 437640 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012983221050285007, + "loss": 0.0108, + "step": 437650 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012982832228647858, + "loss": 0.0085, + "step": 437660 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012982443407010712, + "loss": 0.0126, + "step": 437670 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012982054585373567, + "loss": 0.0119, + "step": 437680 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012981665763736418, + "loss": 0.0092, + "step": 437690 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012981276942099272, + "loss": 0.0135, + "step": 437700 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012980888120462126, + "loss": 0.0084, + "step": 437710 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001298049929882498, + "loss": 0.0108, + "step": 437720 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012980110477187832, + "loss": 0.0156, + "step": 437730 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012979721655550686, + "loss": 0.0116, + "step": 437740 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001297933283391354, + "loss": 0.0109, + "step": 437750 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012978944012276394, + "loss": 0.0092, + "step": 437760 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012978555190639246, + "loss": 0.0141, + "step": 437770 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012978166369002103, + "loss": 0.0112, + "step": 437780 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012977777547364954, + "loss": 0.0106, + "step": 437790 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012977388725727808, + "loss": 0.0129, + "step": 437800 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012976999904090663, + "loss": 0.0097, + "step": 437810 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012976611082453517, + "loss": 0.0109, + "step": 437820 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012976222260816368, + "loss": 0.0119, + "step": 437830 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012975833439179222, + "loss": 0.0114, + "step": 437840 + }, + { + "epoch": 1.13, + "learning_rate": 0.00012975444617542077, + "loss": 0.0107, + "step": 437850 + }, + { + "epoch": 1.13, + "learning_rate": 0.0001297505579590493, + "loss": 0.0133, + "step": 437860 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012974666974267782, + "loss": 0.0146, + "step": 437870 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012974278152630636, + "loss": 0.0092, + "step": 437880 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001297388933099349, + "loss": 0.0099, + "step": 437890 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012973500509356345, + "loss": 0.0124, + "step": 437900 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012973111687719196, + "loss": 0.01, + "step": 437910 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001297272286608205, + "loss": 0.0102, + "step": 437920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012972334044444904, + "loss": 0.0119, + "step": 437930 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012971945222807756, + "loss": 0.0116, + "step": 437940 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001297155640117061, + "loss": 0.0102, + "step": 437950 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012971167579533464, + "loss": 0.0133, + "step": 437960 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012970778757896318, + "loss": 0.0099, + "step": 437970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012970389936259173, + "loss": 0.0105, + "step": 437980 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012970001114622027, + "loss": 0.0137, + "step": 437990 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012969612292984878, + "loss": 0.0114, + "step": 438000 + }, + { + "epoch": 1.14, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.007308073341846466, + "eval_runtime": 107.3816, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, + "step": 438000 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012969223471347732, + "loss": 0.0099, + "step": 438010 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012968834649710586, + "loss": 0.0121, + "step": 438020 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296844582807344, + "loss": 0.0094, + "step": 438030 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012968057006436292, + "loss": 0.0107, + "step": 438040 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012967668184799146, + "loss": 0.0106, + "step": 438050 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012967279363162, + "loss": 0.0119, + "step": 438060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012966890541524855, + "loss": 0.0148, + "step": 438070 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012966501719887706, + "loss": 0.0123, + "step": 438080 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296611289825056, + "loss": 0.0105, + "step": 438090 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012965724076613414, + "loss": 0.01, + "step": 438100 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012965335254976269, + "loss": 0.0088, + "step": 438110 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296494643333912, + "loss": 0.0266, + "step": 438120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012964557611701977, + "loss": 0.0132, + "step": 438130 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012964168790064828, + "loss": 0.0119, + "step": 438140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012963779968427682, + "loss": 0.009, + "step": 438150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012963391146790537, + "loss": 0.0111, + "step": 438160 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012963002325153388, + "loss": 0.0114, + "step": 438170 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012962613503516242, + "loss": 0.013, + "step": 438180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012962224681879096, + "loss": 0.0118, + "step": 438190 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296183586024195, + "loss": 0.0108, + "step": 438200 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012961447038604802, + "loss": 0.0191, + "step": 438210 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012961058216967656, + "loss": 0.0124, + "step": 438220 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001296066939533051, + "loss": 0.0107, + "step": 438230 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012960280573693365, + "loss": 0.0139, + "step": 438240 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012959891752056216, + "loss": 0.0098, + "step": 438250 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295950293041907, + "loss": 0.0108, + "step": 438260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012959114108781924, + "loss": 0.0091, + "step": 438270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012958725287144778, + "loss": 0.0093, + "step": 438280 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295833646550763, + "loss": 0.0116, + "step": 438290 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012957947643870484, + "loss": 0.0089, + "step": 438300 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012957558822233338, + "loss": 0.0093, + "step": 438310 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012957170000596192, + "loss": 0.0146, + "step": 438320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012956781178959047, + "loss": 0.0116, + "step": 438330 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129563923573219, + "loss": 0.0116, + "step": 438340 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012956003535684752, + "loss": 0.0093, + "step": 438350 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012955614714047606, + "loss": 0.0109, + "step": 438360 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295522589241046, + "loss": 0.0102, + "step": 438370 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012954837070773315, + "loss": 0.0113, + "step": 438380 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012954448249136166, + "loss": 0.0091, + "step": 438390 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295405942749902, + "loss": 0.0098, + "step": 438400 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012953670605861874, + "loss": 0.0112, + "step": 438410 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012953281784224726, + "loss": 0.0102, + "step": 438420 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295289296258758, + "loss": 0.0118, + "step": 438430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012952504140950434, + "loss": 0.0117, + "step": 438440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012952115319313288, + "loss": 0.0121, + "step": 438450 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001295172649767614, + "loss": 0.01, + "step": 438460 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012951337676038994, + "loss": 0.0162, + "step": 438470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012950948854401848, + "loss": 0.0125, + "step": 438480 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012950560032764702, + "loss": 0.0135, + "step": 438490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012950171211127557, + "loss": 0.0098, + "step": 438500 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294978238949041, + "loss": 0.01, + "step": 438510 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012949393567853262, + "loss": 0.0102, + "step": 438520 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012949004746216116, + "loss": 0.0112, + "step": 438530 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294861592457897, + "loss": 0.011, + "step": 438540 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012948227102941825, + "loss": 0.0104, + "step": 438550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012947838281304676, + "loss": 0.0108, + "step": 438560 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294744945966753, + "loss": 0.0108, + "step": 438570 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012947060638030384, + "loss": 0.0131, + "step": 438580 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012946671816393239, + "loss": 0.01, + "step": 438590 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294628299475609, + "loss": 0.0114, + "step": 438600 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012945894173118944, + "loss": 0.0091, + "step": 438610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012945505351481798, + "loss": 0.0109, + "step": 438620 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012945116529844653, + "loss": 0.0115, + "step": 438630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012944727708207504, + "loss": 0.0128, + "step": 438640 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294433888657036, + "loss": 0.0123, + "step": 438650 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012943950064933212, + "loss": 0.0121, + "step": 438660 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012943561243296064, + "loss": 0.0113, + "step": 438670 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294317242165892, + "loss": 0.0108, + "step": 438680 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012942783600021772, + "loss": 0.0161, + "step": 438690 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012942394778384626, + "loss": 0.0114, + "step": 438700 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294200595674748, + "loss": 0.0133, + "step": 438710 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012941617135110335, + "loss": 0.017, + "step": 438720 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012941228313473186, + "loss": 0.0101, + "step": 438730 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001294083949183604, + "loss": 0.0112, + "step": 438740 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012940450670198894, + "loss": 0.0095, + "step": 438750 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012940061848561749, + "loss": 0.0117, + "step": 438760 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129396730269246, + "loss": 0.0089, + "step": 438770 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012939284205287454, + "loss": 0.013, + "step": 438780 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012938895383650308, + "loss": 0.0105, + "step": 438790 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012938506562013162, + "loss": 0.0091, + "step": 438800 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012938117740376014, + "loss": 0.0086, + "step": 438810 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012937728918738868, + "loss": 0.0084, + "step": 438820 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012937340097101722, + "loss": 0.0111, + "step": 438830 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012936951275464576, + "loss": 0.0109, + "step": 438840 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293656245382743, + "loss": 0.0079, + "step": 438850 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012936173632190285, + "loss": 0.013, + "step": 438860 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012935784810553136, + "loss": 0.0115, + "step": 438870 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293539598891599, + "loss": 0.0139, + "step": 438880 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012935007167278845, + "loss": 0.0094, + "step": 438890 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129346183456417, + "loss": 0.0093, + "step": 438900 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293422952400455, + "loss": 0.0121, + "step": 438910 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012933840702367404, + "loss": 0.0126, + "step": 438920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012933451880730258, + "loss": 0.0105, + "step": 438930 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001293306305909311, + "loss": 0.0116, + "step": 438940 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012932674237455964, + "loss": 0.0173, + "step": 438950 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012932285415818818, + "loss": 0.0117, + "step": 438960 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012931896594181672, + "loss": 0.0126, + "step": 438970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012931507772544524, + "loss": 0.0154, + "step": 438980 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012931118950907378, + "loss": 0.0102, + "step": 438990 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012930730129270232, + "loss": 0.0122, + "step": 439000 + }, + { + "epoch": 1.14, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.0074248588643968105, + "eval_runtime": 107.7068, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 439000 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012930341307633086, + "loss": 0.0102, + "step": 439010 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012929952485995938, + "loss": 0.0084, + "step": 439020 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012929563664358795, + "loss": 0.0113, + "step": 439030 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012929174842721646, + "loss": 0.0119, + "step": 439040 + }, + { + "epoch": 1.14, + "learning_rate": 0.000129287860210845, + "loss": 0.0124, + "step": 439050 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012928397199447354, + "loss": 0.0099, + "step": 439060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012928008377810209, + "loss": 0.0089, + "step": 439070 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292761955617306, + "loss": 0.009, + "step": 439080 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012927230734535914, + "loss": 0.0136, + "step": 439090 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012926841912898768, + "loss": 0.0106, + "step": 439100 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012926453091261623, + "loss": 0.009, + "step": 439110 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012926064269624474, + "loss": 0.0099, + "step": 439120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012925675447987328, + "loss": 0.0096, + "step": 439130 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012925286626350182, + "loss": 0.0097, + "step": 439140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012924897804713034, + "loss": 0.0116, + "step": 439150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012924508983075888, + "loss": 0.0085, + "step": 439160 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012924120161438742, + "loss": 0.012, + "step": 439170 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012923731339801596, + "loss": 0.0107, + "step": 439180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012923342518164448, + "loss": 0.0118, + "step": 439190 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012922953696527305, + "loss": 0.0086, + "step": 439200 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012922564874890156, + "loss": 0.0145, + "step": 439210 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292217605325301, + "loss": 0.012, + "step": 439220 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012921787231615864, + "loss": 0.0107, + "step": 439230 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012921398409978719, + "loss": 0.0089, + "step": 439240 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001292100958834157, + "loss": 0.0119, + "step": 439250 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012920620766704424, + "loss": 0.012, + "step": 439260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012920231945067278, + "loss": 0.0102, + "step": 439270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012919843123430133, + "loss": 0.0109, + "step": 439280 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012919454301792984, + "loss": 0.0107, + "step": 439290 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012919065480155838, + "loss": 0.0107, + "step": 439300 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012918676658518692, + "loss": 0.0129, + "step": 439310 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012918287836881546, + "loss": 0.0098, + "step": 439320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012917899015244398, + "loss": 0.012, + "step": 439330 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012917510193607252, + "loss": 0.0135, + "step": 439340 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012917121371970106, + "loss": 0.0105, + "step": 439350 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291673255033296, + "loss": 0.01, + "step": 439360 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012916343728695815, + "loss": 0.0087, + "step": 439370 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291595490705867, + "loss": 0.0097, + "step": 439380 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291556608542152, + "loss": 0.0107, + "step": 439390 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012915177263784374, + "loss": 0.011, + "step": 439400 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012914788442147229, + "loss": 0.0109, + "step": 439410 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291439962051008, + "loss": 0.0133, + "step": 439420 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012914010798872934, + "loss": 0.0154, + "step": 439430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012913621977235788, + "loss": 0.0118, + "step": 439440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012913233155598642, + "loss": 0.0118, + "step": 439450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012912844333961494, + "loss": 0.0101, + "step": 439460 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012912455512324348, + "loss": 0.012, + "step": 439470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012912066690687202, + "loss": 0.0099, + "step": 439480 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012911677869050056, + "loss": 0.0101, + "step": 439490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012911289047412908, + "loss": 0.0117, + "step": 439500 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012910900225775762, + "loss": 0.0128, + "step": 439510 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012910511404138616, + "loss": 0.0117, + "step": 439520 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001291012258250147, + "loss": 0.0119, + "step": 439530 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012909733760864322, + "loss": 0.011, + "step": 439540 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290934493922718, + "loss": 0.0157, + "step": 439550 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290895611759003, + "loss": 0.009, + "step": 439560 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012908567295952884, + "loss": 0.0162, + "step": 439570 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012908178474315738, + "loss": 0.013, + "step": 439580 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012907789652678593, + "loss": 0.0101, + "step": 439590 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012907400831041444, + "loss": 0.0105, + "step": 439600 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012907012009404298, + "loss": 0.0116, + "step": 439610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012906623187767152, + "loss": 0.0096, + "step": 439620 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012906234366130007, + "loss": 0.0103, + "step": 439630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012905845544492858, + "loss": 0.0098, + "step": 439640 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012905456722855712, + "loss": 0.0104, + "step": 439650 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012905067901218566, + "loss": 0.0102, + "step": 439660 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012904679079581418, + "loss": 0.012, + "step": 439670 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012904290257944272, + "loss": 0.011, + "step": 439680 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012903901436307126, + "loss": 0.0089, + "step": 439690 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290351261466998, + "loss": 0.0124, + "step": 439700 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012903123793032832, + "loss": 0.0089, + "step": 439710 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012902734971395689, + "loss": 0.0111, + "step": 439720 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001290234614975854, + "loss": 0.0122, + "step": 439730 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012901957328121394, + "loss": 0.0128, + "step": 439740 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012901568506484248, + "loss": 0.0115, + "step": 439750 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012901179684847103, + "loss": 0.0129, + "step": 439760 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012900790863209954, + "loss": 0.01, + "step": 439770 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012900402041572808, + "loss": 0.0097, + "step": 439780 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012900013219935662, + "loss": 0.0119, + "step": 439790 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012899624398298517, + "loss": 0.016, + "step": 439800 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012899235576661368, + "loss": 0.0095, + "step": 439810 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012898846755024222, + "loss": 0.0122, + "step": 439820 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012898457933387076, + "loss": 0.0113, + "step": 439830 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289806911174993, + "loss": 0.0087, + "step": 439840 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012897680290112782, + "loss": 0.0098, + "step": 439850 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012897291468475636, + "loss": 0.0101, + "step": 439860 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289690264683849, + "loss": 0.013, + "step": 439870 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012896513825201344, + "loss": 0.0123, + "step": 439880 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012896125003564196, + "loss": 0.0103, + "step": 439890 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289573618192705, + "loss": 0.0124, + "step": 439900 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012895347360289904, + "loss": 0.011, + "step": 439910 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012894958538652758, + "loss": 0.0088, + "step": 439920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012894569717015613, + "loss": 0.0147, + "step": 439930 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012894180895378464, + "loss": 0.0117, + "step": 439940 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012893792073741318, + "loss": 0.0141, + "step": 439950 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012893403252104172, + "loss": 0.0102, + "step": 439960 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012893014430467026, + "loss": 0.012, + "step": 439970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012892625608829878, + "loss": 0.013, + "step": 439980 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012892236787192732, + "loss": 0.0117, + "step": 439990 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012891847965555586, + "loss": 0.0118, + "step": 440000 + }, + { + "epoch": 1.14, + "eval_cer": 0.8817236808771804, + "eval_loss": 0.007295154966413975, + "eval_runtime": 107.4949, + "eval_samples_per_second": 18.606, + "eval_steps_per_second": 4.651, + "step": 440000 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001289145914391844, + "loss": 0.0117, + "step": 440010 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012891070322281292, + "loss": 0.0141, + "step": 440020 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012890681500644146, + "loss": 0.0151, + "step": 440030 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012890292679007, + "loss": 0.0126, + "step": 440040 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012889903857369854, + "loss": 0.0107, + "step": 440050 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012889515035732706, + "loss": 0.0065, + "step": 440060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012889126214095563, + "loss": 0.0108, + "step": 440070 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012888737392458414, + "loss": 0.0132, + "step": 440080 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012888348570821268, + "loss": 0.0119, + "step": 440090 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012887959749184122, + "loss": 0.0106, + "step": 440100 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012887570927546977, + "loss": 0.0112, + "step": 440110 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012887182105909828, + "loss": 0.0088, + "step": 440120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012886793284272682, + "loss": 0.011, + "step": 440130 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012886404462635536, + "loss": 0.0088, + "step": 440140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012886015640998388, + "loss": 0.0101, + "step": 440150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012885626819361242, + "loss": 0.0114, + "step": 440160 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012885237997724096, + "loss": 0.0139, + "step": 440170 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001288484917608695, + "loss": 0.012, + "step": 440180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012884460354449802, + "loss": 0.0116, + "step": 440190 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012884071532812656, + "loss": 0.0139, + "step": 440200 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001288368271117551, + "loss": 0.0104, + "step": 440210 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012883293889538364, + "loss": 0.0098, + "step": 440220 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012882905067901216, + "loss": 0.0114, + "step": 440230 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012882516246264073, + "loss": 0.0086, + "step": 440240 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012882127424626924, + "loss": 0.0134, + "step": 440250 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012881738602989778, + "loss": 0.0128, + "step": 440260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012881349781352632, + "loss": 0.0148, + "step": 440270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012880960959715487, + "loss": 0.0115, + "step": 440280 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012880572138078338, + "loss": 0.0107, + "step": 440290 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012880183316441192, + "loss": 0.0086, + "step": 440300 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012879794494804046, + "loss": 0.0086, + "step": 440310 + }, + { + "epoch": 1.14, + "learning_rate": 0.000128794056731669, + "loss": 0.0128, + "step": 440320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012879016851529752, + "loss": 0.0106, + "step": 440330 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012878628029892606, + "loss": 0.0121, + "step": 440340 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287823920825546, + "loss": 0.0103, + "step": 440350 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012877850386618314, + "loss": 0.0107, + "step": 440360 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012877461564981166, + "loss": 0.0102, + "step": 440370 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287707274334402, + "loss": 0.0087, + "step": 440380 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012876683921706874, + "loss": 0.0125, + "step": 440390 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012876295100069726, + "loss": 0.0131, + "step": 440400 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287590627843258, + "loss": 0.0092, + "step": 440410 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012875517456795434, + "loss": 0.0098, + "step": 440420 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012875128635158288, + "loss": 0.0113, + "step": 440430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012874739813521142, + "loss": 0.0091, + "step": 440440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012874350991883996, + "loss": 0.0119, + "step": 440450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012873962170246848, + "loss": 0.0106, + "step": 440460 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012873573348609702, + "loss": 0.0119, + "step": 440470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012873184526972556, + "loss": 0.0144, + "step": 440480 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287279570533541, + "loss": 0.0109, + "step": 440490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012872406883698262, + "loss": 0.0137, + "step": 440500 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012872018062061116, + "loss": 0.0115, + "step": 440510 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287162924042397, + "loss": 0.0123, + "step": 440520 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012871240418786824, + "loss": 0.0111, + "step": 440530 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012870851597149676, + "loss": 0.0096, + "step": 440540 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001287046277551253, + "loss": 0.0094, + "step": 440550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012870073953875384, + "loss": 0.0109, + "step": 440560 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012869685132238238, + "loss": 0.0099, + "step": 440570 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286929631060109, + "loss": 0.0094, + "step": 440580 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012868907488963947, + "loss": 0.0122, + "step": 440590 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012868518667326798, + "loss": 0.0098, + "step": 440600 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012868129845689652, + "loss": 0.0093, + "step": 440610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012867741024052506, + "loss": 0.0091, + "step": 440620 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286735220241536, + "loss": 0.0129, + "step": 440630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012866963380778212, + "loss": 0.0097, + "step": 440640 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012866574559141066, + "loss": 0.0123, + "step": 440650 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286618573750392, + "loss": 0.0121, + "step": 440660 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012865796915866772, + "loss": 0.011, + "step": 440670 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012865408094229626, + "loss": 0.0092, + "step": 440680 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286501927259248, + "loss": 0.0111, + "step": 440690 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012864630450955334, + "loss": 0.0127, + "step": 440700 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012864241629318186, + "loss": 0.0108, + "step": 440710 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286385280768104, + "loss": 0.0122, + "step": 440720 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012863463986043894, + "loss": 0.009, + "step": 440730 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012863075164406748, + "loss": 0.0115, + "step": 440740 + }, + { + "epoch": 1.14, + "learning_rate": 0.000128626863427696, + "loss": 0.0139, + "step": 440750 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012862297521132457, + "loss": 0.01, + "step": 440760 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012861908699495308, + "loss": 0.0178, + "step": 440770 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012861519877858162, + "loss": 0.01, + "step": 440780 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012861131056221016, + "loss": 0.0125, + "step": 440790 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001286074223458387, + "loss": 0.0121, + "step": 440800 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012860353412946722, + "loss": 0.0171, + "step": 440810 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012859964591309576, + "loss": 0.0101, + "step": 440820 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285957576967243, + "loss": 0.0119, + "step": 440830 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012859186948035284, + "loss": 0.0099, + "step": 440840 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012858798126398136, + "loss": 0.0125, + "step": 440850 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285840930476099, + "loss": 0.0121, + "step": 440860 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012858020483123844, + "loss": 0.0096, + "step": 440870 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012857631661486698, + "loss": 0.0131, + "step": 440880 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285724283984955, + "loss": 0.0138, + "step": 440890 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012856854018212404, + "loss": 0.0121, + "step": 440900 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012856465196575258, + "loss": 0.0185, + "step": 440910 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285607637493811, + "loss": 0.0141, + "step": 440920 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012855687553300964, + "loss": 0.0115, + "step": 440930 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012855298731663818, + "loss": 0.0119, + "step": 440940 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012854909910026672, + "loss": 0.0094, + "step": 440950 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012854521088389526, + "loss": 0.0114, + "step": 440960 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285413226675238, + "loss": 0.0108, + "step": 440970 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012853743445115232, + "loss": 0.0089, + "step": 440980 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012853354623478086, + "loss": 0.0106, + "step": 440990 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285296580184094, + "loss": 0.0112, + "step": 441000 + }, + { + "epoch": 1.14, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.007312288507819176, + "eval_runtime": 107.3849, + "eval_samples_per_second": 18.625, + "eval_steps_per_second": 4.656, + "step": 441000 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012852576980203794, + "loss": 0.0139, + "step": 441010 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012852188158566646, + "loss": 0.0109, + "step": 441020 + }, + { + "epoch": 1.14, + "learning_rate": 0.000128517993369295, + "loss": 0.0113, + "step": 441030 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012851410515292354, + "loss": 0.0104, + "step": 441040 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012851021693655208, + "loss": 0.0113, + "step": 441050 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001285063287201806, + "loss": 0.0128, + "step": 441060 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012850244050380914, + "loss": 0.012, + "step": 441070 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012849855228743768, + "loss": 0.0128, + "step": 441080 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012849466407106622, + "loss": 0.0103, + "step": 441090 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012849077585469474, + "loss": 0.0121, + "step": 441100 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284868876383233, + "loss": 0.0115, + "step": 441110 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012848299942195182, + "loss": 0.0128, + "step": 441120 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012847911120558036, + "loss": 0.0116, + "step": 441130 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284752229892089, + "loss": 0.0109, + "step": 441140 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012847133477283742, + "loss": 0.0098, + "step": 441150 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012846744655646596, + "loss": 0.0137, + "step": 441160 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284635583400945, + "loss": 0.0099, + "step": 441170 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012845967012372304, + "loss": 0.016, + "step": 441180 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012845578190735156, + "loss": 0.0096, + "step": 441190 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284518936909801, + "loss": 0.0092, + "step": 441200 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012844800547460864, + "loss": 0.0124, + "step": 441210 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012844411725823718, + "loss": 0.0116, + "step": 441220 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001284402290418657, + "loss": 0.0114, + "step": 441230 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012843634082549424, + "loss": 0.0112, + "step": 441240 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012843245260912278, + "loss": 0.0104, + "step": 441250 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012842856439275132, + "loss": 0.011, + "step": 441260 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012842467617637984, + "loss": 0.0106, + "step": 441270 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012842078796000838, + "loss": 0.0103, + "step": 441280 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012841689974363692, + "loss": 0.0156, + "step": 441290 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012841301152726546, + "loss": 0.0106, + "step": 441300 + }, + { + "epoch": 1.14, + "learning_rate": 0.000128409123310894, + "loss": 0.0104, + "step": 441310 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012840523509452255, + "loss": 0.0093, + "step": 441320 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012840134687815106, + "loss": 0.0135, + "step": 441330 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283974586617796, + "loss": 0.0133, + "step": 441340 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012839357044540814, + "loss": 0.0098, + "step": 441350 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012838968222903668, + "loss": 0.0104, + "step": 441360 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283857940126652, + "loss": 0.0108, + "step": 441370 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012838190579629374, + "loss": 0.0109, + "step": 441380 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012837801757992228, + "loss": 0.0099, + "step": 441390 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283741293635508, + "loss": 0.0117, + "step": 441400 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012837024114717934, + "loss": 0.0106, + "step": 441410 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012836635293080788, + "loss": 0.011, + "step": 441420 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012836246471443642, + "loss": 0.0156, + "step": 441430 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012835857649806494, + "loss": 0.0121, + "step": 441440 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012835468828169348, + "loss": 0.0135, + "step": 441450 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012835080006532202, + "loss": 0.0111, + "step": 441460 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012834691184895056, + "loss": 0.0154, + "step": 441470 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012834302363257908, + "loss": 0.0102, + "step": 441480 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012833913541620764, + "loss": 0.0122, + "step": 441490 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012833524719983616, + "loss": 0.0097, + "step": 441500 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283313589834647, + "loss": 0.0115, + "step": 441510 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012832747076709324, + "loss": 0.0138, + "step": 441520 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012832358255072178, + "loss": 0.0107, + "step": 441530 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001283196943343503, + "loss": 0.0113, + "step": 441540 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012831580611797884, + "loss": 0.0109, + "step": 441550 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012831191790160738, + "loss": 0.0141, + "step": 441560 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012830802968523592, + "loss": 0.0081, + "step": 441570 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012830414146886444, + "loss": 0.0094, + "step": 441580 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012830025325249298, + "loss": 0.0106, + "step": 441590 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012829636503612152, + "loss": 0.0117, + "step": 441600 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012829247681975006, + "loss": 0.0147, + "step": 441610 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012828858860337858, + "loss": 0.0101, + "step": 441620 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012828470038700712, + "loss": 0.0097, + "step": 441630 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012828081217063566, + "loss": 0.0091, + "step": 441640 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012827692395426418, + "loss": 0.0086, + "step": 441650 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012827303573789274, + "loss": 0.0125, + "step": 441660 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012826914752152126, + "loss": 0.0111, + "step": 441670 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001282652593051498, + "loss": 0.0122, + "step": 441680 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012826137108877834, + "loss": 0.0152, + "step": 441690 + }, + { + "epoch": 1.14, + "learning_rate": 0.00012825748287240688, + "loss": 0.0112, + "step": 441700 + }, + { + "epoch": 1.14, + "learning_rate": 0.0001282535946560354, + "loss": 0.0089, + "step": 441710 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012824970643966394, + "loss": 0.0126, + "step": 441720 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012824581822329248, + "loss": 0.0112, + "step": 441730 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012824193000692102, + "loss": 0.0091, + "step": 441740 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012823804179054954, + "loss": 0.0096, + "step": 441750 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012823415357417808, + "loss": 0.0106, + "step": 441760 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012823026535780662, + "loss": 0.0111, + "step": 441770 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012822637714143516, + "loss": 0.0076, + "step": 441780 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012822248892506368, + "loss": 0.0109, + "step": 441790 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012821860070869222, + "loss": 0.01, + "step": 441800 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012821471249232076, + "loss": 0.0158, + "step": 441810 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001282108242759493, + "loss": 0.012, + "step": 441820 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012820693605957784, + "loss": 0.0103, + "step": 441830 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012820304784320639, + "loss": 0.0102, + "step": 441840 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001281991596268349, + "loss": 0.0107, + "step": 441850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012819527141046344, + "loss": 0.0112, + "step": 441860 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012819138319409198, + "loss": 0.0082, + "step": 441870 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001281874949777205, + "loss": 0.0095, + "step": 441880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012818360676134904, + "loss": 0.0094, + "step": 441890 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012817971854497758, + "loss": 0.0115, + "step": 441900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012817583032860612, + "loss": 0.0098, + "step": 441910 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012817194211223464, + "loss": 0.0082, + "step": 441920 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012816805389586318, + "loss": 0.0099, + "step": 441930 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012816416567949172, + "loss": 0.0112, + "step": 441940 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012816027746312026, + "loss": 0.0116, + "step": 441950 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012815638924674878, + "loss": 0.0113, + "step": 441960 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012815250103037732, + "loss": 0.009, + "step": 441970 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012814861281400586, + "loss": 0.0099, + "step": 441980 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001281447245976344, + "loss": 0.0111, + "step": 441990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012814083638126292, + "loss": 0.0101, + "step": 442000 + }, + { + "epoch": 1.15, + "eval_cer": 0.881688689953826, + "eval_loss": 0.007025611121207476, + "eval_runtime": 107.5769, + "eval_samples_per_second": 18.591, + "eval_steps_per_second": 4.648, + "step": 442000 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012813694816489148, + "loss": 0.011, + "step": 442010 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012813305994852, + "loss": 0.0092, + "step": 442020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012812917173214854, + "loss": 0.015, + "step": 442030 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012812528351577708, + "loss": 0.0092, + "step": 442040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012812139529940562, + "loss": 0.0105, + "step": 442050 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012811750708303414, + "loss": 0.0116, + "step": 442060 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012811361886666268, + "loss": 0.0118, + "step": 442070 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012810973065029122, + "loss": 0.0145, + "step": 442080 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012810584243391976, + "loss": 0.0097, + "step": 442090 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012810195421754828, + "loss": 0.0126, + "step": 442100 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012809806600117682, + "loss": 0.0117, + "step": 442110 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012809417778480536, + "loss": 0.0105, + "step": 442120 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012809028956843388, + "loss": 0.0093, + "step": 442130 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012808640135206242, + "loss": 0.0134, + "step": 442140 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012808251313569096, + "loss": 0.013, + "step": 442150 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280786249193195, + "loss": 0.0101, + "step": 442160 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012807473670294802, + "loss": 0.0115, + "step": 442170 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012807084848657658, + "loss": 0.012, + "step": 442180 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280669602702051, + "loss": 0.0105, + "step": 442190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012806307205383364, + "loss": 0.0091, + "step": 442200 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012805918383746218, + "loss": 0.0156, + "step": 442210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012805529562109072, + "loss": 0.0111, + "step": 442220 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012805140740471924, + "loss": 0.0101, + "step": 442230 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012804751918834778, + "loss": 0.0088, + "step": 442240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012804363097197632, + "loss": 0.0093, + "step": 442250 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012803974275560486, + "loss": 0.0109, + "step": 442260 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012803585453923338, + "loss": 0.0114, + "step": 442270 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012803196632286192, + "loss": 0.0132, + "step": 442280 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012802807810649046, + "loss": 0.0107, + "step": 442290 + }, + { + "epoch": 1.15, + "learning_rate": 0.000128024189890119, + "loss": 0.0114, + "step": 442300 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012802030167374752, + "loss": 0.0108, + "step": 442310 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012801641345737606, + "loss": 0.0121, + "step": 442320 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001280125252410046, + "loss": 0.0111, + "step": 442330 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012800863702463314, + "loss": 0.0063, + "step": 442340 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012800474880826168, + "loss": 0.0134, + "step": 442350 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012800086059189023, + "loss": 0.0102, + "step": 442360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012799697237551874, + "loss": 0.0081, + "step": 442370 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012799308415914728, + "loss": 0.0097, + "step": 442380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012798919594277582, + "loss": 0.0103, + "step": 442390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012798530772640434, + "loss": 0.0123, + "step": 442400 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012798141951003288, + "loss": 0.0082, + "step": 442410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012797753129366142, + "loss": 0.0134, + "step": 442420 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012797364307728996, + "loss": 0.0114, + "step": 442430 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012796975486091848, + "loss": 0.0117, + "step": 442440 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012796586664454702, + "loss": 0.0108, + "step": 442450 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012796197842817556, + "loss": 0.0124, + "step": 442460 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001279580902118041, + "loss": 0.0134, + "step": 442470 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012795420199543262, + "loss": 0.0108, + "step": 442480 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012795031377906116, + "loss": 0.0118, + "step": 442490 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001279464255626897, + "loss": 0.0126, + "step": 442500 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012794253734631824, + "loss": 0.0105, + "step": 442510 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012793864912994676, + "loss": 0.0118, + "step": 442520 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012793476091357532, + "loss": 0.0111, + "step": 442530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012793087269720384, + "loss": 0.0102, + "step": 442540 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012792698448083238, + "loss": 0.0113, + "step": 442550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012792309626446092, + "loss": 0.0093, + "step": 442560 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012791920804808946, + "loss": 0.0117, + "step": 442570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012791531983171798, + "loss": 0.0128, + "step": 442580 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012791143161534652, + "loss": 0.0111, + "step": 442590 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012790754339897506, + "loss": 0.0105, + "step": 442600 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001279036551826036, + "loss": 0.0117, + "step": 442610 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012789976696623212, + "loss": 0.013, + "step": 442620 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012789587874986066, + "loss": 0.0146, + "step": 442630 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278919905334892, + "loss": 0.012, + "step": 442640 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012788810231711772, + "loss": 0.0125, + "step": 442650 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012788421410074626, + "loss": 0.011, + "step": 442660 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278803258843748, + "loss": 0.0108, + "step": 442670 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012787643766800334, + "loss": 0.0098, + "step": 442680 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012787254945163186, + "loss": 0.0115, + "step": 442690 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012786866123526042, + "loss": 0.0149, + "step": 442700 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012786477301888894, + "loss": 0.012, + "step": 442710 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012786088480251748, + "loss": 0.0108, + "step": 442720 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012785699658614602, + "loss": 0.0122, + "step": 442730 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012785310836977456, + "loss": 0.0115, + "step": 442740 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012784922015340308, + "loss": 0.0098, + "step": 442750 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012784533193703162, + "loss": 0.0104, + "step": 442760 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012784144372066016, + "loss": 0.0095, + "step": 442770 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278375555042887, + "loss": 0.0099, + "step": 442780 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012783366728791722, + "loss": 0.0105, + "step": 442790 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012782977907154576, + "loss": 0.0104, + "step": 442800 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278258908551743, + "loss": 0.0089, + "step": 442810 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012782200263880284, + "loss": 0.0116, + "step": 442820 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012781811442243136, + "loss": 0.0103, + "step": 442830 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278142262060599, + "loss": 0.0112, + "step": 442840 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012781033798968844, + "loss": 0.0162, + "step": 442850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012780644977331698, + "loss": 0.0094, + "step": 442860 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001278025615569455, + "loss": 0.0088, + "step": 442870 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012779867334057404, + "loss": 0.0157, + "step": 442880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012779478512420258, + "loss": 0.0122, + "step": 442890 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012779089690783112, + "loss": 0.0123, + "step": 442900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012778700869145966, + "loss": 0.0141, + "step": 442910 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012778312047508818, + "loss": 0.0114, + "step": 442920 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012777923225871672, + "loss": 0.011, + "step": 442930 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012777534404234526, + "loss": 0.0095, + "step": 442940 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277714558259738, + "loss": 0.0096, + "step": 442950 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012776756760960232, + "loss": 0.0106, + "step": 442960 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012776367939323086, + "loss": 0.0101, + "step": 442970 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277597911768594, + "loss": 0.0114, + "step": 442980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012775590296048794, + "loss": 0.0094, + "step": 442990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012775201474411646, + "loss": 0.0128, + "step": 443000 + }, + { + "epoch": 1.15, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.007168120238929987, + "eval_runtime": 107.6791, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, + "step": 443000 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127748126527745, + "loss": 0.0116, + "step": 443010 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012774423831137354, + "loss": 0.0096, + "step": 443020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012774035009500208, + "loss": 0.0092, + "step": 443030 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277364618786306, + "loss": 0.0109, + "step": 443040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012773257366225916, + "loss": 0.0077, + "step": 443050 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012772868544588768, + "loss": 0.0146, + "step": 443060 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012772479722951622, + "loss": 0.0157, + "step": 443070 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012772090901314476, + "loss": 0.0078, + "step": 443080 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277170207967733, + "loss": 0.0119, + "step": 443090 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012771313258040182, + "loss": 0.0102, + "step": 443100 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012770924436403036, + "loss": 0.0125, + "step": 443110 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001277053561476589, + "loss": 0.014, + "step": 443120 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012770146793128742, + "loss": 0.0104, + "step": 443130 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012769757971491596, + "loss": 0.0128, + "step": 443140 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276936914985445, + "loss": 0.0131, + "step": 443150 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012768980328217304, + "loss": 0.0105, + "step": 443160 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012768591506580156, + "loss": 0.0096, + "step": 443170 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276820268494301, + "loss": 0.0105, + "step": 443180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012767813863305864, + "loss": 0.0087, + "step": 443190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012767425041668718, + "loss": 0.0096, + "step": 443200 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276703622003157, + "loss": 0.012, + "step": 443210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012766647398394426, + "loss": 0.0122, + "step": 443220 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012766258576757278, + "loss": 0.0099, + "step": 443230 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012765869755120132, + "loss": 0.0113, + "step": 443240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012765480933482986, + "loss": 0.0123, + "step": 443250 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276509211184584, + "loss": 0.0144, + "step": 443260 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012764703290208692, + "loss": 0.011, + "step": 443270 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012764314468571546, + "loss": 0.0116, + "step": 443280 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127639256469344, + "loss": 0.0107, + "step": 443290 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012763536825297254, + "loss": 0.0106, + "step": 443300 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012763148003660106, + "loss": 0.0113, + "step": 443310 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276275918202296, + "loss": 0.0104, + "step": 443320 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012762370360385814, + "loss": 0.0085, + "step": 443330 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012761981538748668, + "loss": 0.0096, + "step": 443340 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276159271711152, + "loss": 0.0125, + "step": 443350 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012761203895474374, + "loss": 0.011, + "step": 443360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012760815073837228, + "loss": 0.0157, + "step": 443370 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001276042625220008, + "loss": 0.0128, + "step": 443380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012760037430562934, + "loss": 0.0122, + "step": 443390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012759648608925788, + "loss": 0.0108, + "step": 443400 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012759259787288642, + "loss": 0.0117, + "step": 443410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012758870965651496, + "loss": 0.0112, + "step": 443420 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275848214401435, + "loss": 0.0116, + "step": 443430 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012758093322377202, + "loss": 0.012, + "step": 443440 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012757704500740056, + "loss": 0.0099, + "step": 443450 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275731567910291, + "loss": 0.0105, + "step": 443460 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012756926857465764, + "loss": 0.009, + "step": 443470 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012756538035828616, + "loss": 0.0092, + "step": 443480 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275614921419147, + "loss": 0.0117, + "step": 443490 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012755760392554324, + "loss": 0.0104, + "step": 443500 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012755371570917178, + "loss": 0.0125, + "step": 443510 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275498274928003, + "loss": 0.0126, + "step": 443520 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012754593927642884, + "loss": 0.0124, + "step": 443530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012754205106005738, + "loss": 0.0083, + "step": 443540 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012753816284368592, + "loss": 0.0116, + "step": 443550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012753427462731444, + "loss": 0.0096, + "step": 443560 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127530386410943, + "loss": 0.0111, + "step": 443570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012752649819457152, + "loss": 0.0113, + "step": 443580 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012752260997820006, + "loss": 0.0089, + "step": 443590 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275187217618286, + "loss": 0.0083, + "step": 443600 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012751483354545714, + "loss": 0.0146, + "step": 443610 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012751094532908566, + "loss": 0.008, + "step": 443620 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001275070571127142, + "loss": 0.0099, + "step": 443630 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012750316889634274, + "loss": 0.0111, + "step": 443640 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012749928067997126, + "loss": 0.0106, + "step": 443650 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274953924635998, + "loss": 0.0124, + "step": 443660 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012749150424722834, + "loss": 0.0103, + "step": 443670 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012748761603085688, + "loss": 0.0351, + "step": 443680 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274837278144854, + "loss": 0.0102, + "step": 443690 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012747983959811394, + "loss": 0.0114, + "step": 443700 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012747595138174248, + "loss": 0.0117, + "step": 443710 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012747206316537102, + "loss": 0.0104, + "step": 443720 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012746817494899954, + "loss": 0.014, + "step": 443730 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274642867326281, + "loss": 0.0119, + "step": 443740 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012746039851625662, + "loss": 0.0144, + "step": 443750 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012745651029988516, + "loss": 0.0094, + "step": 443760 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274526220835137, + "loss": 0.0114, + "step": 443770 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012744873386714224, + "loss": 0.0125, + "step": 443780 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012744484565077076, + "loss": 0.0094, + "step": 443790 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274409574343993, + "loss": 0.0131, + "step": 443800 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012743706921802784, + "loss": 0.0127, + "step": 443810 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012743318100165638, + "loss": 0.0095, + "step": 443820 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001274292927852849, + "loss": 0.0117, + "step": 443830 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012742540456891344, + "loss": 0.0118, + "step": 443840 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012742151635254198, + "loss": 0.0091, + "step": 443850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012741762813617052, + "loss": 0.0129, + "step": 443860 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012741373991979904, + "loss": 0.0163, + "step": 443870 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012740985170342758, + "loss": 0.0149, + "step": 443880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012740596348705612, + "loss": 0.0086, + "step": 443890 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012740207527068463, + "loss": 0.0091, + "step": 443900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012739818705431318, + "loss": 0.013, + "step": 443910 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012739429883794172, + "loss": 0.0096, + "step": 443920 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012739041062157026, + "loss": 0.0119, + "step": 443930 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273865224051988, + "loss": 0.0091, + "step": 443940 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012738263418882734, + "loss": 0.0081, + "step": 443950 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012737874597245586, + "loss": 0.012, + "step": 443960 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273748577560844, + "loss": 0.0125, + "step": 443970 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012737096953971294, + "loss": 0.0105, + "step": 443980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012736708132334148, + "loss": 0.0178, + "step": 443990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012736319310697, + "loss": 0.0141, + "step": 444000 + }, + { + "epoch": 1.15, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.007035560440272093, + "eval_runtime": 107.7478, + "eval_samples_per_second": 18.562, + "eval_steps_per_second": 4.64, + "step": 444000 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012735930489059854, + "loss": 0.0124, + "step": 444010 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012735541667422708, + "loss": 0.0107, + "step": 444020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012735152845785562, + "loss": 0.0163, + "step": 444030 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012734764024148414, + "loss": 0.0098, + "step": 444040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012734375202511268, + "loss": 0.0118, + "step": 444050 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012733986380874122, + "loss": 0.0108, + "step": 444060 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012733597559236976, + "loss": 0.0104, + "step": 444070 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012733208737599828, + "loss": 0.0145, + "step": 444080 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012732819915962684, + "loss": 0.0127, + "step": 444090 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012732431094325536, + "loss": 0.0088, + "step": 444100 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273204227268839, + "loss": 0.0096, + "step": 444110 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012731653451051244, + "loss": 0.0098, + "step": 444120 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012731264629414096, + "loss": 0.0095, + "step": 444130 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001273087580777695, + "loss": 0.0112, + "step": 444140 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012730486986139804, + "loss": 0.0103, + "step": 444150 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012730098164502658, + "loss": 0.0141, + "step": 444160 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001272970934286551, + "loss": 0.0092, + "step": 444170 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012729320521228364, + "loss": 0.0117, + "step": 444180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012728931699591218, + "loss": 0.0121, + "step": 444190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012728542877954072, + "loss": 0.0131, + "step": 444200 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012728154056316924, + "loss": 0.0091, + "step": 444210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012727765234679778, + "loss": 0.0123, + "step": 444220 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012727376413042632, + "loss": 0.0092, + "step": 444230 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012726987591405486, + "loss": 0.0111, + "step": 444240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012726598769768337, + "loss": 0.0126, + "step": 444250 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012726209948131192, + "loss": 0.0115, + "step": 444260 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012725821126494046, + "loss": 0.0089, + "step": 444270 + }, + { + "epoch": 1.15, + "learning_rate": 0.000127254323048569, + "loss": 0.0101, + "step": 444280 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012725043483219754, + "loss": 0.0132, + "step": 444290 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012724654661582608, + "loss": 0.0101, + "step": 444300 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001272426583994546, + "loss": 0.0096, + "step": 444310 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012723877018308314, + "loss": 0.012, + "step": 444320 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012723488196671168, + "loss": 0.0096, + "step": 444330 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012723099375034022, + "loss": 0.0129, + "step": 444340 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012722710553396874, + "loss": 0.012, + "step": 444350 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012722321731759728, + "loss": 0.0125, + "step": 444360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012721932910122582, + "loss": 0.0102, + "step": 444370 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012721544088485433, + "loss": 0.0095, + "step": 444380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012721155266848288, + "loss": 0.0132, + "step": 444390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012720766445211142, + "loss": 0.0067, + "step": 444400 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012720377623573996, + "loss": 0.0117, + "step": 444410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012719988801936847, + "loss": 0.0104, + "step": 444420 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012719599980299702, + "loss": 0.0121, + "step": 444430 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012719211158662556, + "loss": 0.0094, + "step": 444440 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271882233702541, + "loss": 0.0105, + "step": 444450 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012718433515388261, + "loss": 0.0123, + "step": 444460 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012718044693751118, + "loss": 0.0106, + "step": 444470 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271765587211397, + "loss": 0.0089, + "step": 444480 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012717267050476824, + "loss": 0.0103, + "step": 444490 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012716878228839678, + "loss": 0.0105, + "step": 444500 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012716489407202532, + "loss": 0.0138, + "step": 444510 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012716100585565384, + "loss": 0.0117, + "step": 444520 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012715711763928238, + "loss": 0.0118, + "step": 444530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012715322942291092, + "loss": 0.0109, + "step": 444540 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012714934120653946, + "loss": 0.0084, + "step": 444550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012714545299016798, + "loss": 0.015, + "step": 444560 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012714156477379652, + "loss": 0.0119, + "step": 444570 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012713767655742506, + "loss": 0.0087, + "step": 444580 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271337883410536, + "loss": 0.0156, + "step": 444590 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012712990012468212, + "loss": 0.0104, + "step": 444600 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012712601190831066, + "loss": 0.0109, + "step": 444610 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271221236919392, + "loss": 0.0125, + "step": 444620 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271182354755677, + "loss": 0.0105, + "step": 444630 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012711434725919628, + "loss": 0.0094, + "step": 444640 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001271104590428248, + "loss": 0.0113, + "step": 444650 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012710657082645334, + "loss": 0.0124, + "step": 444660 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012710268261008188, + "loss": 0.01, + "step": 444670 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012709879439371042, + "loss": 0.0107, + "step": 444680 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012709490617733894, + "loss": 0.0124, + "step": 444690 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012709101796096748, + "loss": 0.012, + "step": 444700 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012708712974459602, + "loss": 0.0126, + "step": 444710 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012708324152822456, + "loss": 0.0099, + "step": 444720 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012707935331185308, + "loss": 0.0183, + "step": 444730 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012707546509548162, + "loss": 0.0119, + "step": 444740 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012707157687911016, + "loss": 0.0145, + "step": 444750 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270676886627387, + "loss": 0.011, + "step": 444760 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012706380044636721, + "loss": 0.0127, + "step": 444770 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012705991222999576, + "loss": 0.0104, + "step": 444780 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270560240136243, + "loss": 0.0105, + "step": 444790 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012705213579725284, + "loss": 0.0111, + "step": 444800 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012704824758088138, + "loss": 0.0091, + "step": 444810 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012704435936450992, + "loss": 0.0098, + "step": 444820 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012704047114813844, + "loss": 0.0124, + "step": 444830 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012703658293176698, + "loss": 0.0098, + "step": 444840 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012703269471539552, + "loss": 0.0112, + "step": 444850 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012702880649902404, + "loss": 0.0129, + "step": 444860 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012702491828265258, + "loss": 0.0115, + "step": 444870 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012702103006628112, + "loss": 0.0126, + "step": 444880 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012701714184990966, + "loss": 0.0083, + "step": 444890 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012701325363353817, + "loss": 0.0109, + "step": 444900 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012700936541716672, + "loss": 0.0094, + "step": 444910 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012700547720079526, + "loss": 0.014, + "step": 444920 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001270015889844238, + "loss": 0.0131, + "step": 444930 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012699770076805231, + "loss": 0.0108, + "step": 444940 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012699381255168086, + "loss": 0.0099, + "step": 444950 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269899243353094, + "loss": 0.0109, + "step": 444960 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012698603611893794, + "loss": 0.0117, + "step": 444970 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012698214790256645, + "loss": 0.0126, + "step": 444980 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012697825968619502, + "loss": 0.0106, + "step": 444990 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012697437146982354, + "loss": 0.0111, + "step": 445000 + }, + { + "epoch": 1.15, + "eval_cer": 0.8817152830555753, + "eval_loss": 0.0074842702597379684, + "eval_runtime": 107.1551, + "eval_samples_per_second": 18.665, + "eval_steps_per_second": 4.666, + "step": 445000 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012697048325345208, + "loss": 0.0119, + "step": 445010 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012696659503708062, + "loss": 0.0057, + "step": 445020 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012696270682070916, + "loss": 0.0092, + "step": 445030 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012695881860433768, + "loss": 0.0106, + "step": 445040 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012695493038796622, + "loss": 0.0132, + "step": 445050 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012695104217159476, + "loss": 0.0132, + "step": 445060 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269471539552233, + "loss": 0.0126, + "step": 445070 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012694326573885182, + "loss": 0.0109, + "step": 445080 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012693937752248036, + "loss": 0.0095, + "step": 445090 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269354893061089, + "loss": 0.0139, + "step": 445100 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012693160108973741, + "loss": 0.0123, + "step": 445110 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012692771287336596, + "loss": 0.0115, + "step": 445120 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001269238246569945, + "loss": 0.0115, + "step": 445130 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012691993644062304, + "loss": 0.0086, + "step": 445140 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012691604822425155, + "loss": 0.009, + "step": 445150 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012691216000788012, + "loss": 0.0094, + "step": 445160 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012690827179150864, + "loss": 0.011, + "step": 445170 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012690438357513718, + "loss": 0.0102, + "step": 445180 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012690049535876572, + "loss": 0.0119, + "step": 445190 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012689660714239426, + "loss": 0.0122, + "step": 445200 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012689271892602278, + "loss": 0.0079, + "step": 445210 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012688883070965132, + "loss": 0.0083, + "step": 445220 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012688494249327986, + "loss": 0.0132, + "step": 445230 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268810542769084, + "loss": 0.0118, + "step": 445240 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012687716606053692, + "loss": 0.0103, + "step": 445250 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012687327784416546, + "loss": 0.013, + "step": 445260 + }, + { + "epoch": 1.15, + "learning_rate": 0.000126869389627794, + "loss": 0.0112, + "step": 445270 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012686550141142254, + "loss": 0.0147, + "step": 445280 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012686161319505105, + "loss": 0.0101, + "step": 445290 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268577249786796, + "loss": 0.0122, + "step": 445300 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012685383676230814, + "loss": 0.0104, + "step": 445310 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012684994854593668, + "loss": 0.01, + "step": 445320 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012684606032956522, + "loss": 0.0094, + "step": 445330 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012684217211319376, + "loss": 0.0109, + "step": 445340 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012683828389682228, + "loss": 0.0112, + "step": 445350 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012683439568045082, + "loss": 0.0138, + "step": 445360 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012683050746407936, + "loss": 0.011, + "step": 445370 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012682661924770788, + "loss": 0.0109, + "step": 445380 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012682273103133642, + "loss": 0.0129, + "step": 445390 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012681884281496496, + "loss": 0.0098, + "step": 445400 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268149545985935, + "loss": 0.0134, + "step": 445410 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012681106638222201, + "loss": 0.0109, + "step": 445420 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012680717816585056, + "loss": 0.0103, + "step": 445430 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001268032899494791, + "loss": 0.0109, + "step": 445440 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012679940173310764, + "loss": 0.0103, + "step": 445450 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012679551351673615, + "loss": 0.0138, + "step": 445460 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001267916253003647, + "loss": 0.011, + "step": 445470 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012678773708399324, + "loss": 0.0107, + "step": 445480 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012678384886762178, + "loss": 0.0156, + "step": 445490 + }, + { + "epoch": 1.15, + "learning_rate": 0.0001267799606512503, + "loss": 0.0083, + "step": 445500 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012677607243487886, + "loss": 0.0105, + "step": 445510 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012677218421850738, + "loss": 0.01, + "step": 445520 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012676829600213592, + "loss": 0.0128, + "step": 445530 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012676440778576446, + "loss": 0.0117, + "step": 445540 + }, + { + "epoch": 1.15, + "learning_rate": 0.000126760519569393, + "loss": 0.0102, + "step": 445550 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012675663135302152, + "loss": 0.0099, + "step": 445560 + }, + { + "epoch": 1.15, + "learning_rate": 0.00012675274313665006, + "loss": 0.0099, + "step": 445570 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001267488549202786, + "loss": 0.0102, + "step": 445580 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012674496670390714, + "loss": 0.0117, + "step": 445590 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012674107848753566, + "loss": 0.0091, + "step": 445600 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001267371902711642, + "loss": 0.0095, + "step": 445610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012673330205479274, + "loss": 0.0104, + "step": 445620 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012672941383842125, + "loss": 0.013, + "step": 445630 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001267255256220498, + "loss": 0.0159, + "step": 445640 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012672163740567834, + "loss": 0.0143, + "step": 445650 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012671774918930688, + "loss": 0.0111, + "step": 445660 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001267138609729354, + "loss": 0.0078, + "step": 445670 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012670997275656396, + "loss": 0.0076, + "step": 445680 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012670608454019248, + "loss": 0.0154, + "step": 445690 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012670219632382102, + "loss": 0.0127, + "step": 445700 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012669830810744956, + "loss": 0.0094, + "step": 445710 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266944198910781, + "loss": 0.0105, + "step": 445720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012669053167470662, + "loss": 0.0108, + "step": 445730 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012668664345833516, + "loss": 0.0092, + "step": 445740 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266827552419637, + "loss": 0.0108, + "step": 445750 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012667886702559224, + "loss": 0.01, + "step": 445760 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012667497880922076, + "loss": 0.0108, + "step": 445770 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266710905928493, + "loss": 0.0107, + "step": 445780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012666720237647784, + "loss": 0.0114, + "step": 445790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012666331416010638, + "loss": 0.0092, + "step": 445800 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266594259437349, + "loss": 0.0145, + "step": 445810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012665553772736344, + "loss": 0.0143, + "step": 445820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012665164951099198, + "loss": 0.0114, + "step": 445830 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012664776129462052, + "loss": 0.0116, + "step": 445840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012664387307824903, + "loss": 0.0125, + "step": 445850 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012663998486187758, + "loss": 0.0113, + "step": 445860 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012663609664550612, + "loss": 0.0071, + "step": 445870 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012663220842913466, + "loss": 0.022, + "step": 445880 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266283202127632, + "loss": 0.0099, + "step": 445890 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012662443199639172, + "loss": 0.013, + "step": 445900 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012662054378002026, + "loss": 0.0106, + "step": 445910 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266166555636488, + "loss": 0.0121, + "step": 445920 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012661276734727734, + "loss": 0.0152, + "step": 445930 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012660887913090585, + "loss": 0.0137, + "step": 445940 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001266049909145344, + "loss": 0.0101, + "step": 445950 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012660110269816294, + "loss": 0.011, + "step": 445960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012659721448179148, + "loss": 0.0117, + "step": 445970 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012659332626542, + "loss": 0.0094, + "step": 445980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012658943804904854, + "loss": 0.0074, + "step": 445990 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012658554983267708, + "loss": 0.0116, + "step": 446000 + }, + { + "epoch": 1.16, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.007201557978987694, + "eval_runtime": 107.397, + "eval_samples_per_second": 18.622, + "eval_steps_per_second": 4.656, + "step": 446000 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012658166161630562, + "loss": 0.0083, + "step": 446010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012657777339993413, + "loss": 0.0113, + "step": 446020 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265738851835627, + "loss": 0.0161, + "step": 446030 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012656999696719122, + "loss": 0.0103, + "step": 446040 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012656610875081976, + "loss": 0.0126, + "step": 446050 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265622205344483, + "loss": 0.0123, + "step": 446060 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012655833231807684, + "loss": 0.0102, + "step": 446070 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012655444410170536, + "loss": 0.0115, + "step": 446080 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265505558853339, + "loss": 0.0106, + "step": 446090 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012654666766896244, + "loss": 0.0116, + "step": 446100 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012654277945259095, + "loss": 0.0133, + "step": 446110 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265388912362195, + "loss": 0.0136, + "step": 446120 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012653500301984804, + "loss": 0.0127, + "step": 446130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012653111480347658, + "loss": 0.0111, + "step": 446140 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265272265871051, + "loss": 0.0091, + "step": 446150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012652333837073364, + "loss": 0.0152, + "step": 446160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012651945015436218, + "loss": 0.0087, + "step": 446170 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012651556193799072, + "loss": 0.0123, + "step": 446180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012651167372161923, + "loss": 0.0111, + "step": 446190 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001265077855052478, + "loss": 0.0112, + "step": 446200 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012650389728887632, + "loss": 0.0139, + "step": 446210 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012650000907250486, + "loss": 0.014, + "step": 446220 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264961208561334, + "loss": 0.0096, + "step": 446230 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012649223263976194, + "loss": 0.0118, + "step": 446240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012648834442339046, + "loss": 0.0156, + "step": 446250 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126484456207019, + "loss": 0.0102, + "step": 446260 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012648056799064754, + "loss": 0.0093, + "step": 446270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012647667977427608, + "loss": 0.0105, + "step": 446280 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264727915579046, + "loss": 0.0137, + "step": 446290 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012646890334153314, + "loss": 0.009, + "step": 446300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012646501512516168, + "loss": 0.0087, + "step": 446310 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012646112690879022, + "loss": 0.0098, + "step": 446320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012645723869241873, + "loss": 0.0155, + "step": 446330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012645335047604728, + "loss": 0.0101, + "step": 446340 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012644946225967582, + "loss": 0.0106, + "step": 446350 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012644557404330433, + "loss": 0.0104, + "step": 446360 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012644168582693287, + "loss": 0.0101, + "step": 446370 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012643779761056142, + "loss": 0.01, + "step": 446380 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012643390939418996, + "loss": 0.0109, + "step": 446390 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264300211778185, + "loss": 0.0098, + "step": 446400 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012642613296144704, + "loss": 0.0098, + "step": 446410 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012642224474507556, + "loss": 0.0118, + "step": 446420 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264183565287041, + "loss": 0.0109, + "step": 446430 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012641446831233264, + "loss": 0.0113, + "step": 446440 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012641058009596118, + "loss": 0.0082, + "step": 446450 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001264066918795897, + "loss": 0.0118, + "step": 446460 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012640280366321824, + "loss": 0.0127, + "step": 446470 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012639891544684678, + "loss": 0.0111, + "step": 446480 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012639502723047532, + "loss": 0.0103, + "step": 446490 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012639113901410383, + "loss": 0.0139, + "step": 446500 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012638725079773238, + "loss": 0.0137, + "step": 446510 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012638336258136092, + "loss": 0.0123, + "step": 446520 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012637947436498946, + "loss": 0.013, + "step": 446530 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012637558614861797, + "loss": 0.0136, + "step": 446540 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012637169793224654, + "loss": 0.0098, + "step": 446550 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012636780971587506, + "loss": 0.0102, + "step": 446560 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263639214995036, + "loss": 0.0126, + "step": 446570 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012636003328313214, + "loss": 0.0083, + "step": 446580 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012635614506676068, + "loss": 0.0126, + "step": 446590 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263522568503892, + "loss": 0.0125, + "step": 446600 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012634836863401774, + "loss": 0.0121, + "step": 446610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012634448041764628, + "loss": 0.0121, + "step": 446620 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001263405922012748, + "loss": 0.0132, + "step": 446630 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012633670398490334, + "loss": 0.0117, + "step": 446640 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012633281576853188, + "loss": 0.0113, + "step": 446650 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012632892755216042, + "loss": 0.0088, + "step": 446660 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012632503933578893, + "loss": 0.0097, + "step": 446670 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012632115111941748, + "loss": 0.01, + "step": 446680 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012631726290304602, + "loss": 0.0099, + "step": 446690 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012631337468667456, + "loss": 0.01, + "step": 446700 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012630948647030307, + "loss": 0.0099, + "step": 446710 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012630559825393161, + "loss": 0.0136, + "step": 446720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012630171003756016, + "loss": 0.0112, + "step": 446730 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001262978218211887, + "loss": 0.0101, + "step": 446740 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012629393360481724, + "loss": 0.0108, + "step": 446750 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012629004538844578, + "loss": 0.0086, + "step": 446760 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001262861571720743, + "loss": 0.0108, + "step": 446770 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012628226895570284, + "loss": 0.0128, + "step": 446780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012627838073933138, + "loss": 0.01, + "step": 446790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012627449252295992, + "loss": 0.0126, + "step": 446800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012627060430658844, + "loss": 0.0117, + "step": 446810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012626671609021698, + "loss": 0.0155, + "step": 446820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012626282787384552, + "loss": 0.0132, + "step": 446830 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012625893965747406, + "loss": 0.01, + "step": 446840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012625505144110257, + "loss": 0.0109, + "step": 446850 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012625116322473112, + "loss": 0.0115, + "step": 446860 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012624727500835966, + "loss": 0.0134, + "step": 446870 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012624338679198817, + "loss": 0.009, + "step": 446880 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012623949857561671, + "loss": 0.0109, + "step": 446890 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012623561035924526, + "loss": 0.0089, + "step": 446900 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001262317221428738, + "loss": 0.0101, + "step": 446910 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012622783392650234, + "loss": 0.0096, + "step": 446920 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012622394571013088, + "loss": 0.0117, + "step": 446930 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001262200574937594, + "loss": 0.0086, + "step": 446940 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012621616927738794, + "loss": 0.0111, + "step": 446950 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012621228106101648, + "loss": 0.0108, + "step": 446960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012620839284464502, + "loss": 0.01, + "step": 446970 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012620450462827353, + "loss": 0.0092, + "step": 446980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012620061641190208, + "loss": 0.0144, + "step": 446990 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012619672819553062, + "loss": 0.0123, + "step": 447000 + }, + { + "epoch": 1.16, + "eval_cer": 0.8817054855970361, + "eval_loss": 0.007263442501425743, + "eval_runtime": 107.2268, + "eval_samples_per_second": 18.652, + "eval_steps_per_second": 4.663, + "step": 447000 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012619283997915916, + "loss": 0.0073, + "step": 447010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012618895176278767, + "loss": 0.0123, + "step": 447020 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012618506354641622, + "loss": 0.0104, + "step": 447030 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012618117533004476, + "loss": 0.0112, + "step": 447040 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261772871136733, + "loss": 0.0092, + "step": 447050 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261733988973018, + "loss": 0.0101, + "step": 447060 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012616951068093038, + "loss": 0.0117, + "step": 447070 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261656224645589, + "loss": 0.0119, + "step": 447080 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261617342481874, + "loss": 0.0108, + "step": 447090 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012615784603181598, + "loss": 0.0097, + "step": 447100 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261539578154445, + "loss": 0.0115, + "step": 447110 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012615006959907304, + "loss": 0.0137, + "step": 447120 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012614618138270158, + "loss": 0.0121, + "step": 447130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012614229316633012, + "loss": 0.0108, + "step": 447140 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012613840494995863, + "loss": 0.0075, + "step": 447150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012613451673358718, + "loss": 0.0086, + "step": 447160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012613062851721572, + "loss": 0.0083, + "step": 447170 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012612674030084426, + "loss": 0.0128, + "step": 447180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012612285208447277, + "loss": 0.0112, + "step": 447190 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012611896386810131, + "loss": 0.0136, + "step": 447200 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012611507565172986, + "loss": 0.0101, + "step": 447210 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261111874353584, + "loss": 0.0096, + "step": 447220 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001261072992189869, + "loss": 0.0114, + "step": 447230 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012610341100261545, + "loss": 0.0103, + "step": 447240 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126099522786244, + "loss": 0.0117, + "step": 447250 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012609563456987254, + "loss": 0.0135, + "step": 447260 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012609174635350108, + "loss": 0.0095, + "step": 447270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012608785813712962, + "loss": 0.0106, + "step": 447280 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012608396992075814, + "loss": 0.0092, + "step": 447290 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012608008170438668, + "loss": 0.0115, + "step": 447300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012607619348801522, + "loss": 0.0082, + "step": 447310 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012607230527164376, + "loss": 0.013, + "step": 447320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012606841705527227, + "loss": 0.0138, + "step": 447330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012606452883890082, + "loss": 0.0081, + "step": 447340 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012606064062252936, + "loss": 0.0149, + "step": 447350 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012605675240615787, + "loss": 0.0123, + "step": 447360 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012605286418978641, + "loss": 0.0151, + "step": 447370 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012604897597341496, + "loss": 0.0095, + "step": 447380 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001260450877570435, + "loss": 0.0107, + "step": 447390 + }, + { + "epoch": 1.16, + "learning_rate": 0.000126041199540672, + "loss": 0.0082, + "step": 447400 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012603731132430055, + "loss": 0.0115, + "step": 447410 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001260334231079291, + "loss": 0.0109, + "step": 447420 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012602953489155764, + "loss": 0.0106, + "step": 447430 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012602564667518615, + "loss": 0.0127, + "step": 447440 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012602175845881472, + "loss": 0.012, + "step": 447450 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012601787024244323, + "loss": 0.0105, + "step": 447460 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012601398202607178, + "loss": 0.0099, + "step": 447470 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012601009380970032, + "loss": 0.0103, + "step": 447480 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012600620559332886, + "loss": 0.0115, + "step": 447490 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012600231737695737, + "loss": 0.0123, + "step": 447500 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012599842916058592, + "loss": 0.0079, + "step": 447510 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012599454094421446, + "loss": 0.0111, + "step": 447520 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125990652727843, + "loss": 0.0126, + "step": 447530 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012598676451147151, + "loss": 0.008, + "step": 447540 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012598287629510006, + "loss": 0.0124, + "step": 447550 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259789880787286, + "loss": 0.0078, + "step": 447560 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012597509986235714, + "loss": 0.01, + "step": 447570 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012597121164598565, + "loss": 0.0123, + "step": 447580 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259673234296142, + "loss": 0.013, + "step": 447590 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012596343521324274, + "loss": 0.0099, + "step": 447600 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012595954699687125, + "loss": 0.0103, + "step": 447610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012595565878049982, + "loss": 0.0112, + "step": 447620 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012595177056412833, + "loss": 0.012, + "step": 447630 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012594788234775688, + "loss": 0.011, + "step": 447640 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012594399413138542, + "loss": 0.0101, + "step": 447650 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012594010591501396, + "loss": 0.0097, + "step": 447660 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012593621769864247, + "loss": 0.0087, + "step": 447670 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012593232948227102, + "loss": 0.0162, + "step": 447680 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012592844126589956, + "loss": 0.0118, + "step": 447690 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259245530495281, + "loss": 0.0111, + "step": 447700 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259206648331566, + "loss": 0.012, + "step": 447710 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012591677661678515, + "loss": 0.0103, + "step": 447720 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259128884004137, + "loss": 0.0138, + "step": 447730 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012590900018404224, + "loss": 0.0149, + "step": 447740 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012590511196767075, + "loss": 0.0091, + "step": 447750 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001259012237512993, + "loss": 0.0087, + "step": 447760 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012589733553492784, + "loss": 0.0092, + "step": 447770 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012589344731855638, + "loss": 0.0107, + "step": 447780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012588955910218492, + "loss": 0.0116, + "step": 447790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012588567088581346, + "loss": 0.0097, + "step": 447800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012588178266944198, + "loss": 0.0143, + "step": 447810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012587789445307052, + "loss": 0.0097, + "step": 447820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012587400623669906, + "loss": 0.013, + "step": 447830 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012587011802032757, + "loss": 0.0096, + "step": 447840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012586622980395611, + "loss": 0.0113, + "step": 447850 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012586234158758466, + "loss": 0.0124, + "step": 447860 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258584533712132, + "loss": 0.011, + "step": 447870 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258545651548417, + "loss": 0.0096, + "step": 447880 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012585067693847025, + "loss": 0.0107, + "step": 447890 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258467887220988, + "loss": 0.0108, + "step": 447900 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012584290050572734, + "loss": 0.0116, + "step": 447910 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012583901228935585, + "loss": 0.0093, + "step": 447920 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258351240729844, + "loss": 0.0086, + "step": 447930 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012583123585661294, + "loss": 0.015, + "step": 447940 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012582734764024148, + "loss": 0.0099, + "step": 447950 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012582345942387, + "loss": 0.0121, + "step": 447960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012581957120749856, + "loss": 0.0101, + "step": 447970 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012581568299112707, + "loss": 0.0119, + "step": 447980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012581179477475562, + "loss": 0.0151, + "step": 447990 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012580790655838416, + "loss": 0.009, + "step": 448000 + }, + { + "epoch": 1.16, + "eval_cer": 0.8817068852339703, + "eval_loss": 0.007401402574032545, + "eval_runtime": 107.5857, + "eval_samples_per_second": 18.59, + "eval_steps_per_second": 4.647, + "step": 448000 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001258040183420127, + "loss": 0.0098, + "step": 448010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012580013012564121, + "loss": 0.01, + "step": 448020 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012579624190926976, + "loss": 0.0082, + "step": 448030 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257923536928983, + "loss": 0.0101, + "step": 448040 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012578846547652684, + "loss": 0.0125, + "step": 448050 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012578457726015535, + "loss": 0.0111, + "step": 448060 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257806890437839, + "loss": 0.0093, + "step": 448070 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012577680082741244, + "loss": 0.0094, + "step": 448080 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012577291261104095, + "loss": 0.012, + "step": 448090 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257690243946695, + "loss": 0.0125, + "step": 448100 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012576513617829803, + "loss": 0.0107, + "step": 448110 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012576124796192658, + "loss": 0.0133, + "step": 448120 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257573597455551, + "loss": 0.0085, + "step": 448130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012575347152918366, + "loss": 0.0126, + "step": 448140 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012574958331281217, + "loss": 0.0088, + "step": 448150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012574569509644072, + "loss": 0.0105, + "step": 448160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012574180688006926, + "loss": 0.0162, + "step": 448170 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257379186636978, + "loss": 0.0098, + "step": 448180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012573403044732631, + "loss": 0.0096, + "step": 448190 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012573014223095486, + "loss": 0.0106, + "step": 448200 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257262540145834, + "loss": 0.0091, + "step": 448210 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012572236579821194, + "loss": 0.008, + "step": 448220 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012571847758184045, + "loss": 0.0126, + "step": 448230 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125714589365469, + "loss": 0.0143, + "step": 448240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012571070114909754, + "loss": 0.0101, + "step": 448250 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012570681293272608, + "loss": 0.0101, + "step": 448260 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001257029247163546, + "loss": 0.0112, + "step": 448270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012569903649998313, + "loss": 0.0123, + "step": 448280 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012569514828361168, + "loss": 0.009, + "step": 448290 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012569126006724022, + "loss": 0.0111, + "step": 448300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012568737185086873, + "loss": 0.0112, + "step": 448310 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256834836344973, + "loss": 0.0092, + "step": 448320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012567959541812582, + "loss": 0.0091, + "step": 448330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012567570720175436, + "loss": 0.0097, + "step": 448340 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256718189853829, + "loss": 0.0131, + "step": 448350 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256679307690114, + "loss": 0.0119, + "step": 448360 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012566404255263995, + "loss": 0.0126, + "step": 448370 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256601543362685, + "loss": 0.0114, + "step": 448380 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012565626611989704, + "loss": 0.0098, + "step": 448390 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012565237790352555, + "loss": 0.0107, + "step": 448400 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256484896871541, + "loss": 0.0114, + "step": 448410 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012564460147078264, + "loss": 0.0118, + "step": 448420 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012564071325441118, + "loss": 0.0095, + "step": 448430 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256368250380397, + "loss": 0.0101, + "step": 448440 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012563293682166823, + "loss": 0.0154, + "step": 448450 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012562904860529678, + "loss": 0.0115, + "step": 448460 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012562516038892532, + "loss": 0.0122, + "step": 448470 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012562127217255383, + "loss": 0.01, + "step": 448480 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001256173839561824, + "loss": 0.0115, + "step": 448490 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012561349573981091, + "loss": 0.0113, + "step": 448500 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012560960752343946, + "loss": 0.0087, + "step": 448510 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125605719307068, + "loss": 0.0104, + "step": 448520 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012560183109069654, + "loss": 0.0133, + "step": 448530 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012559794287432505, + "loss": 0.0118, + "step": 448540 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255940546579536, + "loss": 0.01, + "step": 448550 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012559016644158214, + "loss": 0.0123, + "step": 448560 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012558627822521068, + "loss": 0.0085, + "step": 448570 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255823900088392, + "loss": 0.0105, + "step": 448580 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012557850179246774, + "loss": 0.0135, + "step": 448590 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012557461357609628, + "loss": 0.0107, + "step": 448600 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255707253597248, + "loss": 0.0142, + "step": 448610 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012556683714335333, + "loss": 0.0117, + "step": 448620 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012556294892698187, + "loss": 0.0092, + "step": 448630 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012555906071061042, + "loss": 0.0098, + "step": 448640 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012555517249423893, + "loss": 0.0114, + "step": 448650 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255512842778675, + "loss": 0.0115, + "step": 448660 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012554739606149601, + "loss": 0.0095, + "step": 448670 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012554350784512456, + "loss": 0.0109, + "step": 448680 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255396196287531, + "loss": 0.0096, + "step": 448690 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012553573141238164, + "loss": 0.0133, + "step": 448700 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012553184319601015, + "loss": 0.0112, + "step": 448710 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255279549796387, + "loss": 0.011, + "step": 448720 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012552406676326724, + "loss": 0.0081, + "step": 448730 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012552017854689578, + "loss": 0.012, + "step": 448740 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001255162903305243, + "loss": 0.0126, + "step": 448750 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012551240211415283, + "loss": 0.0107, + "step": 448760 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012550851389778138, + "loss": 0.0114, + "step": 448770 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012550462568140992, + "loss": 0.0119, + "step": 448780 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012550073746503843, + "loss": 0.0091, + "step": 448790 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012549684924866697, + "loss": 0.0083, + "step": 448800 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012549296103229552, + "loss": 0.0122, + "step": 448810 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012548907281592406, + "loss": 0.0126, + "step": 448820 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012548518459955257, + "loss": 0.0118, + "step": 448830 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012548129638318111, + "loss": 0.0083, + "step": 448840 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012547740816680966, + "loss": 0.0108, + "step": 448850 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254735199504382, + "loss": 0.0109, + "step": 448860 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012546963173406674, + "loss": 0.014, + "step": 448870 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012546574351769525, + "loss": 0.0109, + "step": 448880 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254618553013238, + "loss": 0.0135, + "step": 448890 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012545796708495234, + "loss": 0.0088, + "step": 448900 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012545407886858088, + "loss": 0.011, + "step": 448910 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254501906522094, + "loss": 0.0118, + "step": 448920 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012544630243583793, + "loss": 0.0097, + "step": 448930 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012544241421946648, + "loss": 0.012, + "step": 448940 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012543852600309502, + "loss": 0.0103, + "step": 448950 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012543463778672353, + "loss": 0.0106, + "step": 448960 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012543074957035207, + "loss": 0.0114, + "step": 448970 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012542686135398062, + "loss": 0.0099, + "step": 448980 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012542297313760916, + "loss": 0.0102, + "step": 448990 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012541908492123767, + "loss": 0.0122, + "step": 449000 + }, + { + "epoch": 1.16, + "eval_cer": 0.8817446754311932, + "eval_loss": 0.0073244315572083, + "eval_runtime": 107.5578, + "eval_samples_per_second": 18.595, + "eval_steps_per_second": 4.649, + "step": 449000 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012541519670486624, + "loss": 0.0118, + "step": 449010 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012541130848849475, + "loss": 0.0152, + "step": 449020 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001254074202721233, + "loss": 0.0105, + "step": 449030 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012540353205575184, + "loss": 0.0114, + "step": 449040 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012539964383938038, + "loss": 0.01, + "step": 449050 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253957556230089, + "loss": 0.0122, + "step": 449060 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012539186740663744, + "loss": 0.015, + "step": 449070 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012538797919026598, + "loss": 0.0096, + "step": 449080 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253840909738945, + "loss": 0.0088, + "step": 449090 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012538020275752303, + "loss": 0.0115, + "step": 449100 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012537631454115158, + "loss": 0.0089, + "step": 449110 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012537242632478012, + "loss": 0.0122, + "step": 449120 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012536853810840863, + "loss": 0.0151, + "step": 449130 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012536464989203717, + "loss": 0.0095, + "step": 449140 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012536076167566571, + "loss": 0.0127, + "step": 449150 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012535687345929426, + "loss": 0.0094, + "step": 449160 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012535298524292277, + "loss": 0.0092, + "step": 449170 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012534909702655134, + "loss": 0.0093, + "step": 449180 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012534520881017985, + "loss": 0.0128, + "step": 449190 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001253413205938084, + "loss": 0.0108, + "step": 449200 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012533743237743694, + "loss": 0.0139, + "step": 449210 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012533354416106548, + "loss": 0.013, + "step": 449220 + }, + { + "epoch": 1.16, + "learning_rate": 0.000125329655944694, + "loss": 0.0099, + "step": 449230 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012532576772832254, + "loss": 0.0111, + "step": 449240 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012532187951195108, + "loss": 0.0092, + "step": 449250 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012531799129557962, + "loss": 0.0105, + "step": 449260 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012531410307920813, + "loss": 0.0099, + "step": 449270 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012531021486283667, + "loss": 0.0107, + "step": 449280 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012530632664646522, + "loss": 0.0148, + "step": 449290 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012530243843009376, + "loss": 0.0111, + "step": 449300 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012529855021372227, + "loss": 0.0087, + "step": 449310 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012529466199735081, + "loss": 0.0093, + "step": 449320 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012529077378097936, + "loss": 0.0114, + "step": 449330 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012528688556460787, + "loss": 0.0101, + "step": 449340 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001252829973482364, + "loss": 0.0102, + "step": 449350 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012527910913186495, + "loss": 0.0113, + "step": 449360 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001252752209154935, + "loss": 0.0104, + "step": 449370 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012527133269912204, + "loss": 0.0122, + "step": 449380 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012526744448275058, + "loss": 0.015, + "step": 449390 + }, + { + "epoch": 1.16, + "learning_rate": 0.0001252635562663791, + "loss": 0.012, + "step": 449400 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012525966805000763, + "loss": 0.0101, + "step": 449410 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012525577983363618, + "loss": 0.0087, + "step": 449420 + }, + { + "epoch": 1.16, + "learning_rate": 0.00012525189161726472, + "loss": 0.0107, + "step": 449430 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012524800340089323, + "loss": 0.0097, + "step": 449440 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012524411518452177, + "loss": 0.0124, + "step": 449450 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012524022696815032, + "loss": 0.0111, + "step": 449460 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012523633875177886, + "loss": 0.0137, + "step": 449470 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012523245053540737, + "loss": 0.0114, + "step": 449480 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001252285623190359, + "loss": 0.0128, + "step": 449490 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012522467410266446, + "loss": 0.0098, + "step": 449500 + }, + { + "epoch": 1.17, + "learning_rate": 0.000125220785886293, + "loss": 0.0119, + "step": 449510 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001252168976699215, + "loss": 0.0132, + "step": 449520 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012521300945355008, + "loss": 0.012, + "step": 449530 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001252091212371786, + "loss": 0.0097, + "step": 449540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012520523302080714, + "loss": 0.0114, + "step": 449550 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012520134480443568, + "loss": 0.0157, + "step": 449560 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251974565880642, + "loss": 0.0115, + "step": 449570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012519356837169273, + "loss": 0.0094, + "step": 449580 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012518968015532128, + "loss": 0.0101, + "step": 449590 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012518579193894982, + "loss": 0.0108, + "step": 449600 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012518190372257833, + "loss": 0.0113, + "step": 449610 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012517801550620687, + "loss": 0.0104, + "step": 449620 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012517412728983542, + "loss": 0.0098, + "step": 449630 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012517023907346396, + "loss": 0.0093, + "step": 449640 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012516635085709247, + "loss": 0.0114, + "step": 449650 + }, + { + "epoch": 1.17, + "learning_rate": 0.000125162462640721, + "loss": 0.013, + "step": 449660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012515857442434955, + "loss": 0.0084, + "step": 449670 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251546862079781, + "loss": 0.0098, + "step": 449680 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251507979916066, + "loss": 0.0101, + "step": 449690 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012514690977523515, + "loss": 0.0078, + "step": 449700 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001251430215588637, + "loss": 0.0106, + "step": 449710 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012513913334249224, + "loss": 0.0081, + "step": 449720 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012513524512612078, + "loss": 0.0114, + "step": 449730 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012513135690974932, + "loss": 0.0115, + "step": 449740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012512746869337783, + "loss": 0.0094, + "step": 449750 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012512358047700638, + "loss": 0.0112, + "step": 449760 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012511969226063492, + "loss": 0.0078, + "step": 449770 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012511580404426346, + "loss": 0.0115, + "step": 449780 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012511191582789197, + "loss": 0.0102, + "step": 449790 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012510802761152051, + "loss": 0.0108, + "step": 449800 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012510413939514906, + "loss": 0.0115, + "step": 449810 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012510025117877757, + "loss": 0.009, + "step": 449820 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250963629624061, + "loss": 0.0114, + "step": 449830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012509247474603465, + "loss": 0.0067, + "step": 449840 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250885865296632, + "loss": 0.0158, + "step": 449850 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250846983132917, + "loss": 0.0095, + "step": 449860 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012508081009692025, + "loss": 0.0104, + "step": 449870 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250769218805488, + "loss": 0.0075, + "step": 449880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012507303366417734, + "loss": 0.0126, + "step": 449890 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012506914544780585, + "loss": 0.0101, + "step": 449900 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012506525723143442, + "loss": 0.0067, + "step": 449910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012506136901506293, + "loss": 0.034, + "step": 449920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012505748079869147, + "loss": 0.0121, + "step": 449930 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012505359258232002, + "loss": 0.0121, + "step": 449940 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012504970436594856, + "loss": 0.0097, + "step": 449950 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012504581614957707, + "loss": 0.0093, + "step": 449960 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012504192793320561, + "loss": 0.0113, + "step": 449970 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012503803971683416, + "loss": 0.0149, + "step": 449980 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250341515004627, + "loss": 0.0106, + "step": 449990 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250302632840912, + "loss": 0.0107, + "step": 450000 + }, + { + "epoch": 1.17, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.007372671272605658, + "eval_runtime": 107.4625, + "eval_samples_per_second": 18.611, + "eval_steps_per_second": 4.653, + "step": 450000 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012502637506771975, + "loss": 0.0104, + "step": 450010 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001250224868513483, + "loss": 0.012, + "step": 450020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012501859863497684, + "loss": 0.0088, + "step": 450030 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012501471041860535, + "loss": 0.014, + "step": 450040 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012501082220223392, + "loss": 0.0095, + "step": 450050 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012500693398586243, + "loss": 0.0098, + "step": 450060 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012500304576949095, + "loss": 0.0119, + "step": 450070 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012499915755311952, + "loss": 0.0109, + "step": 450080 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012499526933674803, + "loss": 0.0104, + "step": 450090 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012499138112037657, + "loss": 0.0091, + "step": 450100 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012498749290400512, + "loss": 0.0096, + "step": 450110 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012498360468763366, + "loss": 0.0095, + "step": 450120 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012497971647126217, + "loss": 0.0116, + "step": 450130 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249758282548907, + "loss": 0.0094, + "step": 450140 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012497194003851925, + "loss": 0.0113, + "step": 450150 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249680518221478, + "loss": 0.013, + "step": 450160 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249641636057763, + "loss": 0.0144, + "step": 450170 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012496027538940485, + "loss": 0.0108, + "step": 450180 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249563871730334, + "loss": 0.0126, + "step": 450190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012495249895666194, + "loss": 0.0123, + "step": 450200 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012494861074029045, + "loss": 0.0119, + "step": 450210 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124944722523919, + "loss": 0.0117, + "step": 450220 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012494083430754753, + "loss": 0.0107, + "step": 450230 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012493694609117608, + "loss": 0.0118, + "step": 450240 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012493305787480462, + "loss": 0.0107, + "step": 450250 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012492916965843316, + "loss": 0.01, + "step": 450260 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012492528144206167, + "loss": 0.0092, + "step": 450270 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012492139322569021, + "loss": 0.0093, + "step": 450280 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012491750500931876, + "loss": 0.01, + "step": 450290 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249136167929473, + "loss": 0.0108, + "step": 450300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249097285765758, + "loss": 0.0087, + "step": 450310 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012490584036020435, + "loss": 0.011, + "step": 450320 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001249019521438329, + "loss": 0.0115, + "step": 450330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248980639274614, + "loss": 0.0129, + "step": 450340 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012489417571108995, + "loss": 0.0112, + "step": 450350 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248902874947185, + "loss": 0.0112, + "step": 450360 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012488639927834704, + "loss": 0.0102, + "step": 450370 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012488251106197555, + "loss": 0.0139, + "step": 450380 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248786228456041, + "loss": 0.0105, + "step": 450390 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012487473462923263, + "loss": 0.0154, + "step": 450400 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012487084641286117, + "loss": 0.0134, + "step": 450410 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248669581964897, + "loss": 0.0113, + "step": 450420 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012486306998011826, + "loss": 0.0114, + "step": 450430 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012485918176374677, + "loss": 0.013, + "step": 450440 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012485529354737531, + "loss": 0.0104, + "step": 450450 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012485140533100386, + "loss": 0.0111, + "step": 450460 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248475171146324, + "loss": 0.0152, + "step": 450470 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248436288982609, + "loss": 0.0113, + "step": 450480 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012483974068188945, + "loss": 0.0106, + "step": 450490 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124835852465518, + "loss": 0.0113, + "step": 450500 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012483196424914654, + "loss": 0.0118, + "step": 450510 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012482807603277505, + "loss": 0.0094, + "step": 450520 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248241878164036, + "loss": 0.0109, + "step": 450530 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012482029960003213, + "loss": 0.0096, + "step": 450540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012481641138366068, + "loss": 0.0131, + "step": 450550 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248125231672892, + "loss": 0.0145, + "step": 450560 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012480863495091773, + "loss": 0.0124, + "step": 450570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012480474673454627, + "loss": 0.0145, + "step": 450580 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001248008585181748, + "loss": 0.0124, + "step": 450590 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012479697030180336, + "loss": 0.0117, + "step": 450600 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012479308208543187, + "loss": 0.0082, + "step": 450610 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012478919386906041, + "loss": 0.0094, + "step": 450620 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012478530565268896, + "loss": 0.01, + "step": 450630 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247814174363175, + "loss": 0.0077, + "step": 450640 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124777529219946, + "loss": 0.0112, + "step": 450650 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012477364100357455, + "loss": 0.016, + "step": 450660 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247697527872031, + "loss": 0.009, + "step": 450670 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012476586457083164, + "loss": 0.0117, + "step": 450680 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012476197635446015, + "loss": 0.0106, + "step": 450690 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247580881380887, + "loss": 0.011, + "step": 450700 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012475419992171723, + "loss": 0.0146, + "step": 450710 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012475031170534578, + "loss": 0.0123, + "step": 450720 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247464234889743, + "loss": 0.0127, + "step": 450730 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012474253527260283, + "loss": 0.0106, + "step": 450740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012473864705623137, + "loss": 0.0101, + "step": 450750 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012473475883985992, + "loss": 0.0118, + "step": 450760 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012473087062348846, + "loss": 0.0122, + "step": 450770 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124726982407117, + "loss": 0.0142, + "step": 450780 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247230941907455, + "loss": 0.0145, + "step": 450790 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012471920597437405, + "loss": 0.0105, + "step": 450800 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247153177580026, + "loss": 0.0095, + "step": 450810 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247114295416311, + "loss": 0.0098, + "step": 450820 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012470754132525965, + "loss": 0.0108, + "step": 450830 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001247036531088882, + "loss": 0.0106, + "step": 450840 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012469976489251674, + "loss": 0.0094, + "step": 450850 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012469587667614525, + "loss": 0.0103, + "step": 450860 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246919884597738, + "loss": 0.0103, + "step": 450870 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012468810024340233, + "loss": 0.0103, + "step": 450880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012468421202703088, + "loss": 0.0093, + "step": 450890 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246803238106594, + "loss": 0.0139, + "step": 450900 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012467643559428793, + "loss": 0.0093, + "step": 450910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012467254737791647, + "loss": 0.0079, + "step": 450920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012466865916154501, + "loss": 0.0114, + "step": 450930 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012466477094517353, + "loss": 0.0086, + "step": 450940 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246608827288021, + "loss": 0.0111, + "step": 450950 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246569945124306, + "loss": 0.0161, + "step": 450960 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012465310629605915, + "loss": 0.0176, + "step": 450970 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246492180796877, + "loss": 0.012, + "step": 450980 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012464532986331624, + "loss": 0.0102, + "step": 450990 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012464144164694475, + "loss": 0.0114, + "step": 451000 + }, + { + "epoch": 1.17, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.007332668174058199, + "eval_runtime": 107.5021, + "eval_samples_per_second": 18.604, + "eval_steps_per_second": 4.651, + "step": 451000 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246375534305733, + "loss": 0.0121, + "step": 451010 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012463366521420184, + "loss": 0.0107, + "step": 451020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012462977699783038, + "loss": 0.0098, + "step": 451030 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246258887814589, + "loss": 0.0119, + "step": 451040 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012462200056508743, + "loss": 0.0099, + "step": 451050 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012461811234871597, + "loss": 0.0106, + "step": 451060 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001246142241323445, + "loss": 0.0091, + "step": 451070 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012461033591597303, + "loss": 0.0114, + "step": 451080 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012460644769960157, + "loss": 0.0124, + "step": 451090 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012460255948323011, + "loss": 0.0174, + "step": 451100 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012459867126685863, + "loss": 0.0093, + "step": 451110 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245947830504872, + "loss": 0.0109, + "step": 451120 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245908948341157, + "loss": 0.0117, + "step": 451130 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012458700661774425, + "loss": 0.0113, + "step": 451140 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245831184013728, + "loss": 0.0116, + "step": 451150 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012457923018500134, + "loss": 0.0135, + "step": 451160 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012457534196862985, + "loss": 0.0108, + "step": 451170 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245714537522584, + "loss": 0.0086, + "step": 451180 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012456756553588693, + "loss": 0.0116, + "step": 451190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012456367731951548, + "loss": 0.0088, + "step": 451200 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124559789103144, + "loss": 0.0119, + "step": 451210 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012455590088677253, + "loss": 0.0111, + "step": 451220 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012455201267040107, + "loss": 0.01, + "step": 451230 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012454812445402962, + "loss": 0.0103, + "step": 451240 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012454423623765813, + "loss": 0.0132, + "step": 451250 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012454034802128667, + "loss": 0.0089, + "step": 451260 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012453645980491521, + "loss": 0.0094, + "step": 451270 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012453257158854376, + "loss": 0.0108, + "step": 451280 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012452868337217227, + "loss": 0.0128, + "step": 451290 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012452479515580084, + "loss": 0.0109, + "step": 451300 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012452090693942935, + "loss": 0.0117, + "step": 451310 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245170187230579, + "loss": 0.0114, + "step": 451320 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012451313050668644, + "loss": 0.0115, + "step": 451330 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012450924229031495, + "loss": 0.0097, + "step": 451340 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001245053540739435, + "loss": 0.0099, + "step": 451350 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012450146585757203, + "loss": 0.0095, + "step": 451360 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012449757764120058, + "loss": 0.0122, + "step": 451370 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244936894248291, + "loss": 0.0111, + "step": 451380 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012448980120845763, + "loss": 0.0102, + "step": 451390 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012448591299208617, + "loss": 0.0108, + "step": 451400 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012448202477571472, + "loss": 0.0082, + "step": 451410 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012447813655934323, + "loss": 0.0108, + "step": 451420 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012447424834297177, + "loss": 0.0116, + "step": 451430 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244703601266003, + "loss": 0.0094, + "step": 451440 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012446647191022885, + "loss": 0.0095, + "step": 451450 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012446258369385737, + "loss": 0.0118, + "step": 451460 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012445869547748594, + "loss": 0.0083, + "step": 451470 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012445480726111445, + "loss": 0.0098, + "step": 451480 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124450919044743, + "loss": 0.0112, + "step": 451490 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012444703082837154, + "loss": 0.0101, + "step": 451500 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012444314261200008, + "loss": 0.0096, + "step": 451510 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244392543956286, + "loss": 0.0098, + "step": 451520 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012443536617925713, + "loss": 0.0181, + "step": 451530 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012443147796288568, + "loss": 0.0164, + "step": 451540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012442758974651422, + "loss": 0.0095, + "step": 451550 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012442370153014273, + "loss": 0.0137, + "step": 451560 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012441981331377127, + "loss": 0.0129, + "step": 451570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012441592509739981, + "loss": 0.0091, + "step": 451580 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012441203688102833, + "loss": 0.0138, + "step": 451590 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012440814866465687, + "loss": 0.0116, + "step": 451600 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001244042604482854, + "loss": 0.0115, + "step": 451610 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012440037223191395, + "loss": 0.0124, + "step": 451620 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012439648401554247, + "loss": 0.0112, + "step": 451630 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012439259579917104, + "loss": 0.0114, + "step": 451640 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012438870758279955, + "loss": 0.009, + "step": 451650 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243848193664281, + "loss": 0.0091, + "step": 451660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012438093115005664, + "loss": 0.01, + "step": 451670 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012437704293368518, + "loss": 0.0101, + "step": 451680 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243731547173137, + "loss": 0.0116, + "step": 451690 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012436926650094223, + "loss": 0.0126, + "step": 451700 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012436537828457077, + "loss": 0.0101, + "step": 451710 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012436149006819932, + "loss": 0.0095, + "step": 451720 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012435760185182783, + "loss": 0.0153, + "step": 451730 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012435371363545637, + "loss": 0.0093, + "step": 451740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012434982541908491, + "loss": 0.0131, + "step": 451750 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012434593720271346, + "loss": 0.0154, + "step": 451760 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012434204898634197, + "loss": 0.0085, + "step": 451770 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243381607699705, + "loss": 0.0142, + "step": 451780 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012433427255359905, + "loss": 0.0113, + "step": 451790 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243303843372276, + "loss": 0.0141, + "step": 451800 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243264961208561, + "loss": 0.0102, + "step": 451810 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012432260790448465, + "loss": 0.0121, + "step": 451820 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243187196881132, + "loss": 0.0107, + "step": 451830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012431483147174173, + "loss": 0.0094, + "step": 451840 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012431094325537028, + "loss": 0.0097, + "step": 451850 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001243070550389988, + "loss": 0.0142, + "step": 451860 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012430316682262733, + "loss": 0.0128, + "step": 451870 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012429927860625587, + "loss": 0.0097, + "step": 451880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012429539038988442, + "loss": 0.0096, + "step": 451890 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012429150217351293, + "loss": 0.0118, + "step": 451900 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012428761395714147, + "loss": 0.0112, + "step": 451910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012428372574077, + "loss": 0.0108, + "step": 451920 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012427983752439856, + "loss": 0.0084, + "step": 451930 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012427594930802707, + "loss": 0.0094, + "step": 451940 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242720610916556, + "loss": 0.01, + "step": 451950 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012426817287528415, + "loss": 0.0119, + "step": 451960 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242642846589127, + "loss": 0.0117, + "step": 451970 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242603964425412, + "loss": 0.0094, + "step": 451980 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012425650822616978, + "loss": 0.0125, + "step": 451990 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242526200097983, + "loss": 0.0134, + "step": 452000 + }, + { + "epoch": 1.17, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.007198153994977474, + "eval_runtime": 107.5259, + "eval_samples_per_second": 18.6, + "eval_steps_per_second": 4.65, + "step": 452000 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012424873179342683, + "loss": 0.0107, + "step": 452010 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012424484357705538, + "loss": 0.0084, + "step": 452020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012424095536068392, + "loss": 0.0103, + "step": 452030 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012423706714431243, + "loss": 0.0102, + "step": 452040 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012423317892794097, + "loss": 0.0102, + "step": 452050 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012422929071156952, + "loss": 0.0117, + "step": 452060 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012422540249519803, + "loss": 0.0126, + "step": 452070 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012422151427882657, + "loss": 0.0118, + "step": 452080 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242176260624551, + "loss": 0.0085, + "step": 452090 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012421373784608365, + "loss": 0.0098, + "step": 452100 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012420984962971217, + "loss": 0.0102, + "step": 452110 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001242059614133407, + "loss": 0.0091, + "step": 452120 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012420207319696925, + "loss": 0.0084, + "step": 452130 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241981849805978, + "loss": 0.0108, + "step": 452140 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241942967642263, + "loss": 0.0125, + "step": 452150 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012419040854785488, + "loss": 0.0104, + "step": 452160 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241865203314834, + "loss": 0.0094, + "step": 452170 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012418263211511193, + "loss": 0.0106, + "step": 452180 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012417874389874048, + "loss": 0.0177, + "step": 452190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012417485568236902, + "loss": 0.0116, + "step": 452200 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012417096746599753, + "loss": 0.0111, + "step": 452210 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012416707924962607, + "loss": 0.0105, + "step": 452220 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012416319103325461, + "loss": 0.0117, + "step": 452230 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012415930281688316, + "loss": 0.0089, + "step": 452240 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012415541460051167, + "loss": 0.0099, + "step": 452250 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241515263841402, + "loss": 0.0175, + "step": 452260 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012414763816776875, + "loss": 0.0103, + "step": 452270 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241437499513973, + "loss": 0.0082, + "step": 452280 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241398617350258, + "loss": 0.0118, + "step": 452290 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012413597351865435, + "loss": 0.0098, + "step": 452300 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241320853022829, + "loss": 0.0132, + "step": 452310 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241281970859114, + "loss": 0.0071, + "step": 452320 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012412430886953995, + "loss": 0.0089, + "step": 452330 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001241204206531685, + "loss": 0.0104, + "step": 452340 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012411653243679703, + "loss": 0.0081, + "step": 452350 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012411264422042557, + "loss": 0.0101, + "step": 452360 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012410875600405412, + "loss": 0.0103, + "step": 452370 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012410486778768263, + "loss": 0.0114, + "step": 452380 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012410097957131117, + "loss": 0.0118, + "step": 452390 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012409709135493971, + "loss": 0.0093, + "step": 452400 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012409320313856826, + "loss": 0.0125, + "step": 452410 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012408931492219677, + "loss": 0.0113, + "step": 452420 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240854267058253, + "loss": 0.0126, + "step": 452430 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012408153848945385, + "loss": 0.0116, + "step": 452440 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240776502730824, + "loss": 0.01, + "step": 452450 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240737620567109, + "loss": 0.0098, + "step": 452460 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012406987384033945, + "loss": 0.0109, + "step": 452470 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124065985623968, + "loss": 0.0141, + "step": 452480 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012406209740759653, + "loss": 0.0107, + "step": 452490 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012405820919122505, + "loss": 0.014, + "step": 452500 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012405432097485362, + "loss": 0.0125, + "step": 452510 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012405043275848213, + "loss": 0.0093, + "step": 452520 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012404654454211067, + "loss": 0.0101, + "step": 452530 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012404265632573922, + "loss": 0.0104, + "step": 452540 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012403876810936773, + "loss": 0.0135, + "step": 452550 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012403487989299627, + "loss": 0.0116, + "step": 452560 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240309916766248, + "loss": 0.0108, + "step": 452570 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012402710346025336, + "loss": 0.0097, + "step": 452580 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012402321524388187, + "loss": 0.0122, + "step": 452590 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240193270275104, + "loss": 0.0093, + "step": 452600 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012401543881113895, + "loss": 0.011, + "step": 452610 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001240115505947675, + "loss": 0.0077, + "step": 452620 + }, + { + "epoch": 1.17, + "learning_rate": 0.000124007662378396, + "loss": 0.0113, + "step": 452630 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012400377416202455, + "loss": 0.0143, + "step": 452640 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239998859456531, + "loss": 0.0121, + "step": 452650 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012399599772928163, + "loss": 0.0147, + "step": 452660 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012399210951291015, + "loss": 0.0081, + "step": 452670 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239882212965387, + "loss": 0.0095, + "step": 452680 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012398433308016723, + "loss": 0.0094, + "step": 452690 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012398044486379577, + "loss": 0.0128, + "step": 452700 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012397655664742432, + "loss": 0.011, + "step": 452710 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012397266843105286, + "loss": 0.0086, + "step": 452720 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012396878021468137, + "loss": 0.0111, + "step": 452730 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239648919983099, + "loss": 0.0125, + "step": 452740 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012396100378193845, + "loss": 0.0087, + "step": 452750 + }, + { + "epoch": 1.17, + "learning_rate": 0.000123957115565567, + "loss": 0.0088, + "step": 452760 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239532273491955, + "loss": 0.0099, + "step": 452770 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012394933913282405, + "loss": 0.0111, + "step": 452780 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239454509164526, + "loss": 0.0102, + "step": 452790 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239415627000811, + "loss": 0.0103, + "step": 452800 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012393767448370965, + "loss": 0.0082, + "step": 452810 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239337862673382, + "loss": 0.0094, + "step": 452820 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012392989805096673, + "loss": 0.01, + "step": 452830 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012392600983459525, + "loss": 0.0117, + "step": 452840 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239221216182238, + "loss": 0.0121, + "step": 452850 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012391823340185233, + "loss": 0.0131, + "step": 452860 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012391434518548087, + "loss": 0.0147, + "step": 452870 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001239104569691094, + "loss": 0.0108, + "step": 452880 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012390656875273796, + "loss": 0.0099, + "step": 452890 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012390268053636647, + "loss": 0.0119, + "step": 452900 + }, + { + "epoch": 1.17, + "learning_rate": 0.000123898792319995, + "loss": 0.0123, + "step": 452910 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012389490410362355, + "loss": 0.0098, + "step": 452920 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238910158872521, + "loss": 0.0111, + "step": 452930 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238871276708806, + "loss": 0.012, + "step": 452940 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012388323945450915, + "loss": 0.0106, + "step": 452950 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238793512381377, + "loss": 0.0093, + "step": 452960 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012387546302176623, + "loss": 0.013, + "step": 452970 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012387157480539475, + "loss": 0.0087, + "step": 452980 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238676865890233, + "loss": 0.0141, + "step": 452990 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012386379837265183, + "loss": 0.0119, + "step": 453000 + }, + { + "epoch": 1.17, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.007030075415968895, + "eval_runtime": 108.0107, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, + "step": 453000 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012385991015628037, + "loss": 0.0109, + "step": 453010 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238560219399089, + "loss": 0.0104, + "step": 453020 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012385213372353746, + "loss": 0.0107, + "step": 453030 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012384824550716597, + "loss": 0.0107, + "step": 453040 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238443572907945, + "loss": 0.01, + "step": 453050 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012384046907442306, + "loss": 0.0132, + "step": 453060 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012383658085805157, + "loss": 0.0108, + "step": 453070 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238326926416801, + "loss": 0.0234, + "step": 453080 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012382880442530865, + "loss": 0.0119, + "step": 453090 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238249162089372, + "loss": 0.0086, + "step": 453100 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238210279925657, + "loss": 0.0084, + "step": 453110 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012381713977619425, + "loss": 0.0093, + "step": 453120 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238132515598228, + "loss": 0.0135, + "step": 453130 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012380936334345133, + "loss": 0.0098, + "step": 453140 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012380547512707985, + "loss": 0.0099, + "step": 453150 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001238015869107084, + "loss": 0.0089, + "step": 453160 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012379769869433693, + "loss": 0.016, + "step": 453170 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012379381047796547, + "loss": 0.0116, + "step": 453180 + }, + { + "epoch": 1.17, + "learning_rate": 0.000123789922261594, + "loss": 0.0119, + "step": 453190 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012378603404522253, + "loss": 0.0127, + "step": 453200 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012378214582885107, + "loss": 0.0087, + "step": 453210 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237782576124796, + "loss": 0.0112, + "step": 453220 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012377436939610815, + "loss": 0.0098, + "step": 453230 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237704811797367, + "loss": 0.0096, + "step": 453240 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237665929633652, + "loss": 0.0082, + "step": 453250 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012376270474699375, + "loss": 0.0078, + "step": 453260 + }, + { + "epoch": 1.17, + "learning_rate": 0.0001237588165306223, + "loss": 0.0094, + "step": 453270 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012375492831425084, + "loss": 0.0113, + "step": 453280 + }, + { + "epoch": 1.17, + "learning_rate": 0.00012375104009787935, + "loss": 0.0112, + "step": 453290 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237471518815079, + "loss": 0.0098, + "step": 453300 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012374326366513643, + "loss": 0.0092, + "step": 453310 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012373937544876495, + "loss": 0.0132, + "step": 453320 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237354872323935, + "loss": 0.0148, + "step": 453330 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012373159901602203, + "loss": 0.0093, + "step": 453340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012372771079965057, + "loss": 0.0112, + "step": 453350 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237238225832791, + "loss": 0.0107, + "step": 453360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012371993436690763, + "loss": 0.0099, + "step": 453370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012371604615053617, + "loss": 0.0093, + "step": 453380 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237121579341647, + "loss": 0.0106, + "step": 453390 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012370826971779323, + "loss": 0.0143, + "step": 453400 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237043815014218, + "loss": 0.0105, + "step": 453410 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001237004932850503, + "loss": 0.0092, + "step": 453420 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012369660506867885, + "loss": 0.0107, + "step": 453430 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236927168523074, + "loss": 0.0102, + "step": 453440 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012368882863593594, + "loss": 0.0125, + "step": 453450 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012368494041956445, + "loss": 0.0129, + "step": 453460 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123681052203193, + "loss": 0.014, + "step": 453470 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012367716398682153, + "loss": 0.0145, + "step": 453480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012367327577045007, + "loss": 0.0088, + "step": 453490 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236693875540786, + "loss": 0.0109, + "step": 453500 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012366549933770713, + "loss": 0.0113, + "step": 453510 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012366161112133567, + "loss": 0.0101, + "step": 453520 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012365772290496421, + "loss": 0.0123, + "step": 453530 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012365383468859273, + "loss": 0.0127, + "step": 453540 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012364994647222127, + "loss": 0.0146, + "step": 453550 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236460582558498, + "loss": 0.009, + "step": 453560 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012364217003947833, + "loss": 0.0106, + "step": 453570 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236382818231069, + "loss": 0.0088, + "step": 453580 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236343936067354, + "loss": 0.0128, + "step": 453590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012363050539036395, + "loss": 0.0145, + "step": 453600 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236266171739925, + "loss": 0.0132, + "step": 453610 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012362272895762103, + "loss": 0.011, + "step": 453620 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012361884074124955, + "loss": 0.0097, + "step": 453630 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236149525248781, + "loss": 0.017, + "step": 453640 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012361106430850663, + "loss": 0.0106, + "step": 453650 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012360717609213517, + "loss": 0.0094, + "step": 453660 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001236032878757637, + "loss": 0.0123, + "step": 453670 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012359939965939223, + "loss": 0.0082, + "step": 453680 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012359551144302077, + "loss": 0.0104, + "step": 453690 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012359162322664931, + "loss": 0.0141, + "step": 453700 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012358773501027783, + "loss": 0.01, + "step": 453710 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012358384679390637, + "loss": 0.0117, + "step": 453720 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235799585775349, + "loss": 0.0081, + "step": 453730 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012357607036116345, + "loss": 0.0099, + "step": 453740 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123572182144792, + "loss": 0.0119, + "step": 453750 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012356829392842054, + "loss": 0.0165, + "step": 453760 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012356440571204905, + "loss": 0.0109, + "step": 453770 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235605174956776, + "loss": 0.0114, + "step": 453780 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012355662927930613, + "loss": 0.0101, + "step": 453790 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012355274106293465, + "loss": 0.0098, + "step": 453800 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235488528465632, + "loss": 0.0113, + "step": 453810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012354496463019173, + "loss": 0.0106, + "step": 453820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012354107641382027, + "loss": 0.0081, + "step": 453830 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235371881974488, + "loss": 0.0087, + "step": 453840 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012353329998107733, + "loss": 0.009, + "step": 453850 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012352941176470587, + "loss": 0.0094, + "step": 453860 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001235255235483344, + "loss": 0.0125, + "step": 453870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012352163533196293, + "loss": 0.0093, + "step": 453880 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012351774711559147, + "loss": 0.0105, + "step": 453890 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012351385889922, + "loss": 0.0085, + "step": 453900 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012350997068284855, + "loss": 0.0094, + "step": 453910 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012350608246647707, + "loss": 0.0088, + "step": 453920 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012350219425010564, + "loss": 0.0102, + "step": 453930 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012349830603373415, + "loss": 0.0129, + "step": 453940 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234944178173627, + "loss": 0.0119, + "step": 453950 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012349052960099123, + "loss": 0.0105, + "step": 453960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012348664138461978, + "loss": 0.01, + "step": 453970 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234827531682483, + "loss": 0.0105, + "step": 453980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012347886495187683, + "loss": 0.0146, + "step": 453990 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012347497673550537, + "loss": 0.0125, + "step": 454000 + }, + { + "epoch": 1.18, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.0068307314068078995, + "eval_runtime": 107.3869, + "eval_samples_per_second": 18.624, + "eval_steps_per_second": 4.656, + "step": 454000 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012347108851913391, + "loss": 0.0114, + "step": 454010 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012346720030276243, + "loss": 0.0114, + "step": 454020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012346331208639097, + "loss": 0.0146, + "step": 454030 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234594238700195, + "loss": 0.012, + "step": 454040 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012345553565364803, + "loss": 0.0123, + "step": 454050 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012345164743727657, + "loss": 0.0102, + "step": 454060 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234477592209051, + "loss": 0.0149, + "step": 454070 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012344387100453365, + "loss": 0.0102, + "step": 454080 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012343998278816217, + "loss": 0.0088, + "step": 454090 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012343609457179074, + "loss": 0.0119, + "step": 454100 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012343220635541925, + "loss": 0.0128, + "step": 454110 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234283181390478, + "loss": 0.0123, + "step": 454120 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012342442992267633, + "loss": 0.0121, + "step": 454130 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012342054170630487, + "loss": 0.0164, + "step": 454140 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001234166534899334, + "loss": 0.009, + "step": 454150 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012341276527356193, + "loss": 0.0093, + "step": 454160 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012340887705719047, + "loss": 0.013, + "step": 454170 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012340498884081901, + "loss": 0.0111, + "step": 454180 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012340110062444753, + "loss": 0.0098, + "step": 454190 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012339721240807607, + "loss": 0.0097, + "step": 454200 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233933241917046, + "loss": 0.0127, + "step": 454210 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012338943597533315, + "loss": 0.012, + "step": 454220 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012338554775896167, + "loss": 0.01, + "step": 454230 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233816595425902, + "loss": 0.0126, + "step": 454240 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012337777132621875, + "loss": 0.0145, + "step": 454250 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233738831098473, + "loss": 0.0086, + "step": 454260 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233699948934758, + "loss": 0.0103, + "step": 454270 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012336610667710438, + "loss": 0.0089, + "step": 454280 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233622184607329, + "loss": 0.0124, + "step": 454290 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012335833024436143, + "loss": 0.0141, + "step": 454300 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012335444202798997, + "loss": 0.0113, + "step": 454310 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233505538116185, + "loss": 0.012, + "step": 454320 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012334666559524703, + "loss": 0.0123, + "step": 454330 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012334277737887557, + "loss": 0.0104, + "step": 454340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012333888916250411, + "loss": 0.0101, + "step": 454350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012333500094613263, + "loss": 0.0123, + "step": 454360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012333111272976117, + "loss": 0.0132, + "step": 454370 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233272245133897, + "loss": 0.0103, + "step": 454380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012332333629701825, + "loss": 0.0133, + "step": 454390 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012331944808064677, + "loss": 0.0114, + "step": 454400 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233155598642753, + "loss": 0.0108, + "step": 454410 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012331167164790385, + "loss": 0.0108, + "step": 454420 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233077834315324, + "loss": 0.0094, + "step": 454430 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001233038952151609, + "loss": 0.0127, + "step": 454440 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012330000699878948, + "loss": 0.0104, + "step": 454450 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123296118782418, + "loss": 0.0114, + "step": 454460 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012329223056604653, + "loss": 0.013, + "step": 454470 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012328834234967507, + "loss": 0.0128, + "step": 454480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012328445413330362, + "loss": 0.0114, + "step": 454490 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012328056591693213, + "loss": 0.0109, + "step": 454500 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012327667770056067, + "loss": 0.0125, + "step": 454510 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232727894841892, + "loss": 0.0107, + "step": 454520 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012326890126781775, + "loss": 0.0107, + "step": 454530 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012326501305144627, + "loss": 0.0114, + "step": 454540 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232611248350748, + "loss": 0.0105, + "step": 454550 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012325723661870335, + "loss": 0.011, + "step": 454560 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012325334840233187, + "loss": 0.0111, + "step": 454570 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232494601859604, + "loss": 0.0134, + "step": 454580 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012324557196958895, + "loss": 0.0115, + "step": 454590 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232416837532175, + "loss": 0.0104, + "step": 454600 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123237795536846, + "loss": 0.0096, + "step": 454610 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012323390732047458, + "loss": 0.0111, + "step": 454620 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232300191041031, + "loss": 0.0148, + "step": 454630 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012322613088773163, + "loss": 0.0083, + "step": 454640 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012322224267136017, + "loss": 0.0133, + "step": 454650 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012321835445498871, + "loss": 0.0091, + "step": 454660 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012321446623861723, + "loss": 0.0125, + "step": 454670 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012321057802224577, + "loss": 0.0087, + "step": 454680 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001232066898058743, + "loss": 0.0115, + "step": 454690 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012320280158950285, + "loss": 0.0115, + "step": 454700 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012319891337313137, + "loss": 0.0094, + "step": 454710 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231950251567599, + "loss": 0.0138, + "step": 454720 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012319113694038845, + "loss": 0.011, + "step": 454730 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123187248724017, + "loss": 0.0101, + "step": 454740 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231833605076455, + "loss": 0.0102, + "step": 454750 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012317947229127405, + "loss": 0.0099, + "step": 454760 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231755840749026, + "loss": 0.0108, + "step": 454770 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231716958585311, + "loss": 0.0082, + "step": 454780 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012316780764215965, + "loss": 0.0151, + "step": 454790 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231639194257882, + "loss": 0.01, + "step": 454800 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012316003120941673, + "loss": 0.0116, + "step": 454810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012315614299304527, + "loss": 0.008, + "step": 454820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012315225477667381, + "loss": 0.0107, + "step": 454830 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012314836656030233, + "loss": 0.0107, + "step": 454840 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012314447834393087, + "loss": 0.0123, + "step": 454850 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231405901275594, + "loss": 0.0083, + "step": 454860 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012313670191118795, + "loss": 0.0077, + "step": 454870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012313281369481647, + "loss": 0.0139, + "step": 454880 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123128925478445, + "loss": 0.0129, + "step": 454890 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012312503726207355, + "loss": 0.0095, + "step": 454900 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231211490457021, + "loss": 0.0173, + "step": 454910 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231172608293306, + "loss": 0.0107, + "step": 454920 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012311337261295915, + "loss": 0.0097, + "step": 454930 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001231094843965877, + "loss": 0.0109, + "step": 454940 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012310559618021623, + "loss": 0.0122, + "step": 454950 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012310170796384475, + "loss": 0.0111, + "step": 454960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012309781974747332, + "loss": 0.0079, + "step": 454970 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012309393153110183, + "loss": 0.0104, + "step": 454980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012309004331473037, + "loss": 0.0108, + "step": 454990 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230861550983589, + "loss": 0.0104, + "step": 455000 + }, + { + "epoch": 1.18, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.007326171267777681, + "eval_runtime": 107.2391, + "eval_samples_per_second": 18.65, + "eval_steps_per_second": 4.662, + "step": 455000 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012308226688198746, + "loss": 0.0138, + "step": 455010 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012307837866561597, + "loss": 0.0125, + "step": 455020 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230744904492445, + "loss": 0.0083, + "step": 455030 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012307060223287305, + "loss": 0.0109, + "step": 455040 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012306671401650157, + "loss": 0.0098, + "step": 455050 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230628258001301, + "loss": 0.0123, + "step": 455060 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012305893758375865, + "loss": 0.0101, + "step": 455070 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230550493673872, + "loss": 0.0114, + "step": 455080 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230511611510157, + "loss": 0.0121, + "step": 455090 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012304727293464425, + "loss": 0.0098, + "step": 455100 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230433847182728, + "loss": 0.0105, + "step": 455110 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012303949650190133, + "loss": 0.0101, + "step": 455120 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012303560828552985, + "loss": 0.0107, + "step": 455130 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230317200691584, + "loss": 0.0107, + "step": 455140 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012302783185278693, + "loss": 0.0095, + "step": 455150 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012302394363641547, + "loss": 0.0106, + "step": 455160 + }, + { + "epoch": 1.18, + "learning_rate": 0.000123020055420044, + "loss": 0.0105, + "step": 455170 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012301616720367255, + "loss": 0.0109, + "step": 455180 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012301227898730107, + "loss": 0.0092, + "step": 455190 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230083907709296, + "loss": 0.0095, + "step": 455200 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012300450255455815, + "loss": 0.0092, + "step": 455210 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001230006143381867, + "loss": 0.0129, + "step": 455220 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229967261218152, + "loss": 0.0115, + "step": 455230 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012299283790544375, + "loss": 0.0108, + "step": 455240 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229889496890723, + "loss": 0.0091, + "step": 455250 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012298506147270083, + "loss": 0.0121, + "step": 455260 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012298117325632935, + "loss": 0.0136, + "step": 455270 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229772850399579, + "loss": 0.0081, + "step": 455280 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012297339682358643, + "loss": 0.0125, + "step": 455290 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012296950860721495, + "loss": 0.0136, + "step": 455300 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229656203908435, + "loss": 0.0074, + "step": 455310 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012296173217447203, + "loss": 0.0088, + "step": 455320 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012295784395810057, + "loss": 0.0113, + "step": 455330 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229539557417291, + "loss": 0.0115, + "step": 455340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012295006752535765, + "loss": 0.0096, + "step": 455350 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012294617930898617, + "loss": 0.0107, + "step": 455360 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229422910926147, + "loss": 0.0099, + "step": 455370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012293840287624325, + "loss": 0.0125, + "step": 455380 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229345146598718, + "loss": 0.0094, + "step": 455390 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229306264435003, + "loss": 0.0132, + "step": 455400 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012292673822712885, + "loss": 0.0115, + "step": 455410 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001229228500107574, + "loss": 0.0097, + "step": 455420 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012291896179438593, + "loss": 0.0118, + "step": 455430 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012291507357801445, + "loss": 0.01, + "step": 455440 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122911185361643, + "loss": 0.013, + "step": 455450 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012290729714527153, + "loss": 0.0133, + "step": 455460 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012290340892890007, + "loss": 0.0093, + "step": 455470 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228995207125286, + "loss": 0.0099, + "step": 455480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012289563249615716, + "loss": 0.0081, + "step": 455490 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012289174427978567, + "loss": 0.0085, + "step": 455500 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228878560634142, + "loss": 0.0111, + "step": 455510 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012288396784704275, + "loss": 0.0113, + "step": 455520 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012288007963067127, + "loss": 0.011, + "step": 455530 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228761914142998, + "loss": 0.0129, + "step": 455540 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012287230319792835, + "loss": 0.0112, + "step": 455550 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228684149815569, + "loss": 0.0097, + "step": 455560 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228645267651854, + "loss": 0.0102, + "step": 455570 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012286063854881395, + "loss": 0.0106, + "step": 455580 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228567503324425, + "loss": 0.0098, + "step": 455590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012285286211607103, + "loss": 0.01, + "step": 455600 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012284897389969955, + "loss": 0.0081, + "step": 455610 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228450856833281, + "loss": 0.0114, + "step": 455620 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012284119746695663, + "loss": 0.014, + "step": 455630 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012283730925058517, + "loss": 0.0079, + "step": 455640 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012283342103421369, + "loss": 0.0133, + "step": 455650 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012282953281784223, + "loss": 0.0116, + "step": 455660 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012282564460147077, + "loss": 0.0094, + "step": 455670 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228217563850993, + "loss": 0.0122, + "step": 455680 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012281786816872785, + "loss": 0.0079, + "step": 455690 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228139799523564, + "loss": 0.0106, + "step": 455700 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001228100917359849, + "loss": 0.0104, + "step": 455710 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012280620351961345, + "loss": 0.008, + "step": 455720 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122802315303242, + "loss": 0.0099, + "step": 455730 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012279842708687053, + "loss": 0.0111, + "step": 455740 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012279453887049905, + "loss": 0.0106, + "step": 455750 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227906506541276, + "loss": 0.0129, + "step": 455760 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012278676243775613, + "loss": 0.0087, + "step": 455770 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012278287422138465, + "loss": 0.0095, + "step": 455780 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227789860050132, + "loss": 0.0104, + "step": 455790 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012277509778864173, + "loss": 0.0105, + "step": 455800 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012277120957227027, + "loss": 0.0112, + "step": 455810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012276732135589879, + "loss": 0.0103, + "step": 455820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012276343313952733, + "loss": 0.0093, + "step": 455830 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012275954492315587, + "loss": 0.0087, + "step": 455840 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227556567067844, + "loss": 0.0099, + "step": 455850 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012275176849041293, + "loss": 0.0091, + "step": 455860 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227478802740415, + "loss": 0.0111, + "step": 455870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012274399205767, + "loss": 0.0103, + "step": 455880 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012274010384129855, + "loss": 0.0111, + "step": 455890 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227362156249271, + "loss": 0.0122, + "step": 455900 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012273232740855563, + "loss": 0.009, + "step": 455910 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012272843919218415, + "loss": 0.0111, + "step": 455920 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227245509758127, + "loss": 0.0137, + "step": 455930 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012272066275944123, + "loss": 0.0095, + "step": 455940 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012271677454306977, + "loss": 0.0093, + "step": 455950 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227128863266983, + "loss": 0.0103, + "step": 455960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012270899811032683, + "loss": 0.0118, + "step": 455970 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012270510989395537, + "loss": 0.0132, + "step": 455980 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001227012216775839, + "loss": 0.0105, + "step": 455990 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012269733346121243, + "loss": 0.0092, + "step": 456000 + }, + { + "epoch": 1.18, + "eval_cer": 0.881688689953826, + "eval_loss": 0.0070779649540781975, + "eval_runtime": 107.4452, + "eval_samples_per_second": 18.614, + "eval_steps_per_second": 4.654, + "step": 456000 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122693445244841, + "loss": 0.0093, + "step": 456010 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226895570284695, + "loss": 0.0095, + "step": 456020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012268566881209802, + "loss": 0.0106, + "step": 456030 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226817805957266, + "loss": 0.0143, + "step": 456040 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226778923793551, + "loss": 0.0096, + "step": 456050 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012267400416298365, + "loss": 0.0108, + "step": 456060 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226701159466122, + "loss": 0.0114, + "step": 456070 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012266622773024073, + "loss": 0.0089, + "step": 456080 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012266233951386925, + "loss": 0.0088, + "step": 456090 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226584512974978, + "loss": 0.0121, + "step": 456100 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012265456308112633, + "loss": 0.0125, + "step": 456110 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012265067486475487, + "loss": 0.0139, + "step": 456120 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226467866483834, + "loss": 0.0132, + "step": 456130 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012264289843201193, + "loss": 0.0107, + "step": 456140 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012263901021564047, + "loss": 0.0107, + "step": 456150 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122635121999269, + "loss": 0.0114, + "step": 456160 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012263123378289753, + "loss": 0.0119, + "step": 456170 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012262734556652607, + "loss": 0.0115, + "step": 456180 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226234573501546, + "loss": 0.0127, + "step": 456190 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012261956913378315, + "loss": 0.0104, + "step": 456200 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226156809174117, + "loss": 0.0094, + "step": 456210 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012261179270104023, + "loss": 0.0145, + "step": 456220 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012260790448466875, + "loss": 0.0101, + "step": 456230 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001226040162682973, + "loss": 0.0106, + "step": 456240 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012260012805192583, + "loss": 0.0112, + "step": 456250 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012259623983555437, + "loss": 0.0172, + "step": 456260 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225923516191829, + "loss": 0.01, + "step": 456270 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012258846340281143, + "loss": 0.0092, + "step": 456280 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012258457518643997, + "loss": 0.0113, + "step": 456290 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012258068697006849, + "loss": 0.0099, + "step": 456300 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012257679875369703, + "loss": 0.0145, + "step": 456310 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012257291053732557, + "loss": 0.0087, + "step": 456320 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225690223209541, + "loss": 0.0134, + "step": 456330 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012256513410458263, + "loss": 0.0121, + "step": 456340 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012256124588821117, + "loss": 0.0109, + "step": 456350 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225573576718397, + "loss": 0.0111, + "step": 456360 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012255346945546825, + "loss": 0.017, + "step": 456370 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012254958123909677, + "loss": 0.0087, + "step": 456380 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012254569302272533, + "loss": 0.0113, + "step": 456390 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012254180480635385, + "loss": 0.0125, + "step": 456400 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225379165899824, + "loss": 0.0103, + "step": 456410 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012253402837361093, + "loss": 0.0094, + "step": 456420 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012253014015723947, + "loss": 0.0123, + "step": 456430 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122526251940868, + "loss": 0.0086, + "step": 456440 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012252236372449653, + "loss": 0.0131, + "step": 456450 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012251847550812507, + "loss": 0.0112, + "step": 456460 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225145872917536, + "loss": 0.0099, + "step": 456470 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012251069907538213, + "loss": 0.0145, + "step": 456480 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012250681085901067, + "loss": 0.0117, + "step": 456490 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001225029226426392, + "loss": 0.0111, + "step": 456500 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012249903442626775, + "loss": 0.011, + "step": 456510 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012249514620989627, + "loss": 0.0151, + "step": 456520 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224912579935248, + "loss": 0.0102, + "step": 456530 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012248736977715335, + "loss": 0.0138, + "step": 456540 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012248348156078186, + "loss": 0.0093, + "step": 456550 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012247959334441043, + "loss": 0.0102, + "step": 456560 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012247570512803895, + "loss": 0.0145, + "step": 456570 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224718169116675, + "loss": 0.0119, + "step": 456580 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012246792869529603, + "loss": 0.01, + "step": 456590 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012246404047892457, + "loss": 0.0109, + "step": 456600 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224601522625531, + "loss": 0.0112, + "step": 456610 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012245626404618163, + "loss": 0.0106, + "step": 456620 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012245237582981017, + "loss": 0.0111, + "step": 456630 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224484876134387, + "loss": 0.0129, + "step": 456640 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012244459939706723, + "loss": 0.0095, + "step": 456650 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012244071118069577, + "loss": 0.0141, + "step": 456660 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224368229643243, + "loss": 0.0084, + "step": 456670 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012243293474795285, + "loss": 0.0101, + "step": 456680 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012242904653158137, + "loss": 0.0108, + "step": 456690 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224251583152099, + "loss": 0.011, + "step": 456700 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012242127009883845, + "loss": 0.0122, + "step": 456710 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122417381882467, + "loss": 0.0172, + "step": 456720 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224134936660955, + "loss": 0.0114, + "step": 456730 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012240960544972407, + "loss": 0.01, + "step": 456740 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001224057172333526, + "loss": 0.0099, + "step": 456750 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012240182901698113, + "loss": 0.0107, + "step": 456760 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012239794080060967, + "loss": 0.0118, + "step": 456770 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223940525842382, + "loss": 0.01, + "step": 456780 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012239016436786673, + "loss": 0.0093, + "step": 456790 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012238627615149527, + "loss": 0.0111, + "step": 456800 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223823879351238, + "loss": 0.0095, + "step": 456810 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012237849971875233, + "loss": 0.0143, + "step": 456820 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012237461150238087, + "loss": 0.0128, + "step": 456830 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223707232860094, + "loss": 0.0129, + "step": 456840 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012236683506963795, + "loss": 0.0087, + "step": 456850 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012236294685326647, + "loss": 0.0138, + "step": 456860 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122359058636895, + "loss": 0.0134, + "step": 456870 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012235517042052355, + "loss": 0.0131, + "step": 456880 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223512822041521, + "loss": 0.012, + "step": 456890 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223473939877806, + "loss": 0.0156, + "step": 456900 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012234350577140917, + "loss": 0.0062, + "step": 456910 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223396175550377, + "loss": 0.0093, + "step": 456920 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012233572933866623, + "loss": 0.0104, + "step": 456930 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012233184112229477, + "loss": 0.0111, + "step": 456940 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223279529059233, + "loss": 0.013, + "step": 456950 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012232406468955183, + "loss": 0.0155, + "step": 456960 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012232017647318037, + "loss": 0.0117, + "step": 456970 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223162882568089, + "loss": 0.0081, + "step": 456980 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012231240004043745, + "loss": 0.0083, + "step": 456990 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012230851182406597, + "loss": 0.0129, + "step": 457000 + }, + { + "epoch": 1.18, + "eval_cer": 0.8816970877754311, + "eval_loss": 0.0070222471840679646, + "eval_runtime": 107.5432, + "eval_samples_per_second": 18.597, + "eval_steps_per_second": 4.649, + "step": 457000 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001223046236076945, + "loss": 0.0156, + "step": 457010 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012230073539132305, + "loss": 0.0108, + "step": 457020 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012229684717495156, + "loss": 0.0125, + "step": 457030 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222929589585801, + "loss": 0.0118, + "step": 457040 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012228907074220865, + "loss": 0.0109, + "step": 457050 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222851825258372, + "loss": 0.0089, + "step": 457060 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222812943094657, + "loss": 0.013, + "step": 457070 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012227740609309427, + "loss": 0.0111, + "step": 457080 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222735178767228, + "loss": 0.0111, + "step": 457090 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012226962966035133, + "loss": 0.0162, + "step": 457100 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012226574144397987, + "loss": 0.0162, + "step": 457110 + }, + { + "epoch": 1.18, + "learning_rate": 0.0001222618532276084, + "loss": 0.0088, + "step": 457120 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012225796501123693, + "loss": 0.0096, + "step": 457130 + }, + { + "epoch": 1.18, + "learning_rate": 0.00012225407679486547, + "loss": 0.01, + "step": 457140 + }, + { + "epoch": 1.18, + "learning_rate": 0.000122250188578494, + "loss": 0.0115, + "step": 457150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012224630036212255, + "loss": 0.006, + "step": 457160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012224241214575107, + "loss": 0.0103, + "step": 457170 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222385239293796, + "loss": 0.0125, + "step": 457180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012223463571300815, + "loss": 0.0097, + "step": 457190 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222307474966367, + "loss": 0.0149, + "step": 457200 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222268592802652, + "loss": 0.0129, + "step": 457210 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012222297106389375, + "loss": 0.0121, + "step": 457220 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001222190828475223, + "loss": 0.0099, + "step": 457230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012221519463115083, + "loss": 0.0134, + "step": 457240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012221130641477935, + "loss": 0.0135, + "step": 457250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012220741819840791, + "loss": 0.0111, + "step": 457260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012220352998203643, + "loss": 0.0104, + "step": 457270 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012219964176566497, + "loss": 0.0103, + "step": 457280 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221957535492935, + "loss": 0.0112, + "step": 457290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012219186533292203, + "loss": 0.0094, + "step": 457300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012218797711655057, + "loss": 0.009, + "step": 457310 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221840889001791, + "loss": 0.01, + "step": 457320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012218020068380765, + "loss": 0.0093, + "step": 457330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012217631246743617, + "loss": 0.0089, + "step": 457340 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221724242510647, + "loss": 0.0115, + "step": 457350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012216853603469325, + "loss": 0.0126, + "step": 457360 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221646478183218, + "loss": 0.0129, + "step": 457370 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221607596019503, + "loss": 0.017, + "step": 457380 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012215687138557885, + "loss": 0.0132, + "step": 457390 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221529831692074, + "loss": 0.0096, + "step": 457400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012214909495283593, + "loss": 0.0106, + "step": 457410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012214520673646444, + "loss": 0.0097, + "step": 457420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012214131852009301, + "loss": 0.0121, + "step": 457430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012213743030372153, + "loss": 0.0107, + "step": 457440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012213354208735007, + "loss": 0.0097, + "step": 457450 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221296538709786, + "loss": 0.0125, + "step": 457460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012212576565460715, + "loss": 0.0137, + "step": 457470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012212187743823567, + "loss": 0.008, + "step": 457480 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221179892218642, + "loss": 0.0118, + "step": 457490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012211410100549275, + "loss": 0.0144, + "step": 457500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012211021278912127, + "loss": 0.0144, + "step": 457510 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001221063245727498, + "loss": 0.0099, + "step": 457520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012210243635637835, + "loss": 0.0117, + "step": 457530 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220985481400069, + "loss": 0.0088, + "step": 457540 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220946599236354, + "loss": 0.0096, + "step": 457550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012209077170726395, + "loss": 0.0114, + "step": 457560 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220868834908925, + "loss": 0.0092, + "step": 457570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012208299527452103, + "loss": 0.0107, + "step": 457580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012207910705814954, + "loss": 0.0128, + "step": 457590 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220752188417781, + "loss": 0.012, + "step": 457600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012207133062540663, + "loss": 0.0146, + "step": 457610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012206744240903517, + "loss": 0.0147, + "step": 457620 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220635541926637, + "loss": 0.0121, + "step": 457630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012205966597629224, + "loss": 0.0138, + "step": 457640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012205577775992077, + "loss": 0.0119, + "step": 457650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012205188954354931, + "loss": 0.0133, + "step": 457660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012204800132717784, + "loss": 0.01, + "step": 457670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012204411311080639, + "loss": 0.0112, + "step": 457680 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220402248944349, + "loss": 0.0103, + "step": 457690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012203633667806346, + "loss": 0.0112, + "step": 457700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012203244846169199, + "loss": 0.013, + "step": 457710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012202856024532053, + "loss": 0.0129, + "step": 457720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012202467202894906, + "loss": 0.0146, + "step": 457730 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220207838125776, + "loss": 0.012, + "step": 457740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012201689559620613, + "loss": 0.0095, + "step": 457750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012201300737983466, + "loss": 0.0114, + "step": 457760 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001220091191634632, + "loss": 0.0119, + "step": 457770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012200523094709173, + "loss": 0.0098, + "step": 457780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012200134273072027, + "loss": 0.0116, + "step": 457790 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219974545143488, + "loss": 0.0115, + "step": 457800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012199356629797734, + "loss": 0.0101, + "step": 457810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012198967808160587, + "loss": 0.0085, + "step": 457820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012198578986523441, + "loss": 0.0096, + "step": 457830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012198190164886294, + "loss": 0.0154, + "step": 457840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197801343249148, + "loss": 0.0128, + "step": 457850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197412521612, + "loss": 0.0084, + "step": 457860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012197023699974856, + "loss": 0.0137, + "step": 457870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012196634878337709, + "loss": 0.0101, + "step": 457880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012196246056700563, + "loss": 0.0104, + "step": 457890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012195857235063416, + "loss": 0.0143, + "step": 457900 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219546841342627, + "loss": 0.0153, + "step": 457910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012195079591789123, + "loss": 0.0138, + "step": 457920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012194690770151977, + "loss": 0.0153, + "step": 457930 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219430194851483, + "loss": 0.0158, + "step": 457940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193913126877684, + "loss": 0.0099, + "step": 457950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193524305240537, + "loss": 0.0174, + "step": 457960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012193135483603391, + "loss": 0.0113, + "step": 457970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012192746661966244, + "loss": 0.0107, + "step": 457980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012192357840329098, + "loss": 0.0105, + "step": 457990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012191969018691951, + "loss": 0.0124, + "step": 458000 + }, + { + "epoch": 1.19, + "eval_cer": 0.8817250805141147, + "eval_loss": 0.007128569763153791, + "eval_runtime": 107.4871, + "eval_samples_per_second": 18.607, + "eval_steps_per_second": 4.652, + "step": 458000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012191580197054804, + "loss": 0.0095, + "step": 458010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012191191375417658, + "loss": 0.0121, + "step": 458020 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001219080255378051, + "loss": 0.0137, + "step": 458030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012190413732143365, + "loss": 0.015, + "step": 458040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012190024910506218, + "loss": 0.0168, + "step": 458050 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012189636088869073, + "loss": 0.0097, + "step": 458060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012189247267231926, + "loss": 0.0115, + "step": 458070 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001218885844559478, + "loss": 0.0093, + "step": 458080 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012188469623957633, + "loss": 0.0121, + "step": 458090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012188080802320487, + "loss": 0.0127, + "step": 458100 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001218769198068334, + "loss": 0.0121, + "step": 458110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012187303159046194, + "loss": 0.0086, + "step": 458120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012186914337409047, + "loss": 0.0106, + "step": 458130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012186525515771901, + "loss": 0.01, + "step": 458140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012186136694134754, + "loss": 0.0113, + "step": 458150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012185747872497608, + "loss": 0.0151, + "step": 458160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012185359050860461, + "loss": 0.0116, + "step": 458170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184970229223315, + "loss": 0.015, + "step": 458180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184581407586168, + "loss": 0.0115, + "step": 458190 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012184192585949022, + "loss": 0.0121, + "step": 458200 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012183803764311875, + "loss": 0.0115, + "step": 458210 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001218341494267473, + "loss": 0.0109, + "step": 458220 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012183026121037583, + "loss": 0.0116, + "step": 458230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012182637299400437, + "loss": 0.0092, + "step": 458240 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001218224847776329, + "loss": 0.015, + "step": 458250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012181859656126143, + "loss": 0.009, + "step": 458260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012181470834488997, + "loss": 0.0092, + "step": 458270 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001218108201285185, + "loss": 0.0131, + "step": 458280 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012180693191214704, + "loss": 0.0108, + "step": 458290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012180304369577557, + "loss": 0.01, + "step": 458300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012179915547940411, + "loss": 0.0135, + "step": 458310 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012179526726303264, + "loss": 0.0133, + "step": 458320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012179137904666118, + "loss": 0.0135, + "step": 458330 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001217874908302897, + "loss": 0.0089, + "step": 458340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012178360261391825, + "loss": 0.0113, + "step": 458350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012177971439754678, + "loss": 0.0138, + "step": 458360 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012177582618117532, + "loss": 0.013, + "step": 458370 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012177193796480385, + "loss": 0.0092, + "step": 458380 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001217680497484324, + "loss": 0.0136, + "step": 458390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012176416153206092, + "loss": 0.0104, + "step": 458400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012176027331568947, + "loss": 0.0109, + "step": 458410 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121756385099318, + "loss": 0.0102, + "step": 458420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012175249688294654, + "loss": 0.0149, + "step": 458430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012174860866657507, + "loss": 0.0109, + "step": 458440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012174472045020361, + "loss": 0.0085, + "step": 458450 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012174083223383214, + "loss": 0.0116, + "step": 458460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012173694401746068, + "loss": 0.0125, + "step": 458470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012173305580108921, + "loss": 0.0111, + "step": 458480 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012172916758471775, + "loss": 0.0106, + "step": 458490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012172527936834628, + "loss": 0.0111, + "step": 458500 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001217213911519748, + "loss": 0.0095, + "step": 458510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012171750293560335, + "loss": 0.0107, + "step": 458520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012171361471923188, + "loss": 0.0115, + "step": 458530 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012170972650286042, + "loss": 0.0088, + "step": 458540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012170583828648895, + "loss": 0.0128, + "step": 458550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012170195007011749, + "loss": 0.014, + "step": 458560 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012169806185374601, + "loss": 0.0138, + "step": 458570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012169417363737457, + "loss": 0.0085, + "step": 458580 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001216902854210031, + "loss": 0.013, + "step": 458590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012168639720463164, + "loss": 0.0422, + "step": 458600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012168250898826017, + "loss": 0.0098, + "step": 458610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012167862077188871, + "loss": 0.0097, + "step": 458620 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012167473255551724, + "loss": 0.0117, + "step": 458630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012167084433914578, + "loss": 0.0102, + "step": 458640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012166695612277431, + "loss": 0.0118, + "step": 458650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012166306790640285, + "loss": 0.0116, + "step": 458660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165917969003138, + "loss": 0.0136, + "step": 458670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165529147365992, + "loss": 0.0113, + "step": 458680 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012165140325728845, + "loss": 0.0122, + "step": 458690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012164751504091699, + "loss": 0.0098, + "step": 458700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012164362682454552, + "loss": 0.0094, + "step": 458710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012163973860817406, + "loss": 0.0113, + "step": 458720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012163585039180259, + "loss": 0.0103, + "step": 458730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012163196217543114, + "loss": 0.015, + "step": 458740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162807395905967, + "loss": 0.0092, + "step": 458750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162418574268818, + "loss": 0.0103, + "step": 458760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012162029752631674, + "loss": 0.0105, + "step": 458770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012161640930994527, + "loss": 0.0106, + "step": 458780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012161252109357381, + "loss": 0.0131, + "step": 458790 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012160863287720234, + "loss": 0.0194, + "step": 458800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012160474466083088, + "loss": 0.0102, + "step": 458810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012160085644445941, + "loss": 0.0144, + "step": 458820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012159696822808795, + "loss": 0.0109, + "step": 458830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012159308001171648, + "loss": 0.0103, + "step": 458840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012158919179534502, + "loss": 0.0133, + "step": 458850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012158530357897355, + "loss": 0.013, + "step": 458860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012158141536260209, + "loss": 0.0116, + "step": 458870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012157752714623062, + "loss": 0.0107, + "step": 458880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012157363892985916, + "loss": 0.0109, + "step": 458890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012156975071348769, + "loss": 0.0122, + "step": 458900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012156586249711624, + "loss": 0.0098, + "step": 458910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012156197428074476, + "loss": 0.0106, + "step": 458920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012155808606437331, + "loss": 0.0077, + "step": 458930 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012155419784800184, + "loss": 0.014, + "step": 458940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012155030963163038, + "loss": 0.0106, + "step": 458950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012154642141525891, + "loss": 0.011, + "step": 458960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012154253319888745, + "loss": 0.0126, + "step": 458970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153864498251598, + "loss": 0.008, + "step": 458980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153475676614452, + "loss": 0.0212, + "step": 458990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012153086854977305, + "loss": 0.0102, + "step": 459000 + }, + { + "epoch": 1.19, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.007249526679515839, + "eval_runtime": 107.419, + "eval_samples_per_second": 18.619, + "eval_steps_per_second": 4.655, + "step": 459000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012152698033340158, + "loss": 0.0112, + "step": 459010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012152309211703012, + "loss": 0.0101, + "step": 459020 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012151920390065865, + "loss": 0.0127, + "step": 459030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012151531568428719, + "loss": 0.0084, + "step": 459040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012151142746791572, + "loss": 0.008, + "step": 459050 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012150753925154426, + "loss": 0.0135, + "step": 459060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012150365103517279, + "loss": 0.0093, + "step": 459070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012149976281880133, + "loss": 0.0111, + "step": 459080 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012149587460242985, + "loss": 0.0098, + "step": 459090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012149198638605841, + "loss": 0.0132, + "step": 459100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012148809816968694, + "loss": 0.0111, + "step": 459110 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012148420995331548, + "loss": 0.0113, + "step": 459120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012148032173694401, + "loss": 0.0137, + "step": 459130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012147643352057255, + "loss": 0.0109, + "step": 459140 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012147254530420108, + "loss": 0.0098, + "step": 459150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012146865708782962, + "loss": 0.0119, + "step": 459160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012146476887145815, + "loss": 0.0107, + "step": 459170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012146088065508669, + "loss": 0.0065, + "step": 459180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012145699243871522, + "loss": 0.0106, + "step": 459190 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012145310422234376, + "loss": 0.0083, + "step": 459200 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144921600597229, + "loss": 0.0105, + "step": 459210 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144532778960083, + "loss": 0.0097, + "step": 459220 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012144143957322936, + "loss": 0.0083, + "step": 459230 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001214375513568579, + "loss": 0.0088, + "step": 459240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012143366314048643, + "loss": 0.0109, + "step": 459250 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012142977492411495, + "loss": 0.01, + "step": 459260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012142588670774351, + "loss": 0.0104, + "step": 459270 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012142199849137202, + "loss": 0.0099, + "step": 459280 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141811027500058, + "loss": 0.0094, + "step": 459290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141422205862911, + "loss": 0.0121, + "step": 459300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012141033384225765, + "loss": 0.0105, + "step": 459310 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012140644562588618, + "loss": 0.0094, + "step": 459320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012140255740951472, + "loss": 0.0098, + "step": 459330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012139866919314325, + "loss": 0.0151, + "step": 459340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012139478097677179, + "loss": 0.0109, + "step": 459350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012139089276040032, + "loss": 0.0101, + "step": 459360 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012138700454402886, + "loss": 0.0123, + "step": 459370 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012138311632765739, + "loss": 0.0099, + "step": 459380 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012137922811128593, + "loss": 0.0098, + "step": 459390 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012137533989491446, + "loss": 0.0081, + "step": 459400 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121371451678543, + "loss": 0.0147, + "step": 459410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012136756346217153, + "loss": 0.0095, + "step": 459420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012136367524580007, + "loss": 0.0138, + "step": 459430 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001213597870294286, + "loss": 0.0122, + "step": 459440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012135589881305715, + "loss": 0.0096, + "step": 459450 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012135201059668568, + "loss": 0.0145, + "step": 459460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134812238031422, + "loss": 0.0125, + "step": 459470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134423416394275, + "loss": 0.01, + "step": 459480 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012134034594757129, + "loss": 0.0111, + "step": 459490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012133645773119982, + "loss": 0.0101, + "step": 459500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012133256951482835, + "loss": 0.0087, + "step": 459510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012132868129845689, + "loss": 0.0079, + "step": 459520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012132479308208542, + "loss": 0.0115, + "step": 459530 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012132090486571396, + "loss": 0.0118, + "step": 459540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012131701664934249, + "loss": 0.0097, + "step": 459550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012131312843297103, + "loss": 0.011, + "step": 459560 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012130924021659956, + "loss": 0.0104, + "step": 459570 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001213053520002281, + "loss": 0.011, + "step": 459580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012130146378385663, + "loss": 0.0102, + "step": 459590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012129757556748517, + "loss": 0.009, + "step": 459600 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001212936873511137, + "loss": 0.0102, + "step": 459610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128979913474225, + "loss": 0.0109, + "step": 459620 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128591091837076, + "loss": 0.01, + "step": 459630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012128202270199932, + "loss": 0.0101, + "step": 459640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012127813448562785, + "loss": 0.0126, + "step": 459650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012127424626925639, + "loss": 0.0136, + "step": 459660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012127035805288492, + "loss": 0.0131, + "step": 459670 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012126646983651346, + "loss": 0.0109, + "step": 459680 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012126258162014199, + "loss": 0.0097, + "step": 459690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012125869340377053, + "loss": 0.014, + "step": 459700 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012125480518739906, + "loss": 0.0123, + "step": 459710 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001212509169710276, + "loss": 0.0098, + "step": 459720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012124702875465613, + "loss": 0.0112, + "step": 459730 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012124314053828467, + "loss": 0.0105, + "step": 459740 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001212392523219132, + "loss": 0.0122, + "step": 459750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012123536410554172, + "loss": 0.0088, + "step": 459760 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012123147588917027, + "loss": 0.01, + "step": 459770 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001212275876727988, + "loss": 0.0096, + "step": 459780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012122369945642734, + "loss": 0.01, + "step": 459790 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012121981124005586, + "loss": 0.0093, + "step": 459800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012121592302368442, + "loss": 0.0122, + "step": 459810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012121203480731295, + "loss": 0.0118, + "step": 459820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012120814659094149, + "loss": 0.0092, + "step": 459830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012120425837457002, + "loss": 0.008, + "step": 459840 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012120037015819856, + "loss": 0.0093, + "step": 459850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012119648194182709, + "loss": 0.0102, + "step": 459860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012119259372545563, + "loss": 0.0117, + "step": 459870 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012118870550908416, + "loss": 0.0136, + "step": 459880 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211848172927127, + "loss": 0.0093, + "step": 459890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012118092907634123, + "loss": 0.0111, + "step": 459900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012117704085996977, + "loss": 0.0108, + "step": 459910 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211731526435983, + "loss": 0.0122, + "step": 459920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116926442722684, + "loss": 0.01, + "step": 459930 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116537621085537, + "loss": 0.0096, + "step": 459940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012116148799448391, + "loss": 0.0108, + "step": 459950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012115759977811244, + "loss": 0.0103, + "step": 459960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012115371156174099, + "loss": 0.0125, + "step": 459970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012114982334536952, + "loss": 0.0104, + "step": 459980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012114593512899803, + "loss": 0.0105, + "step": 459990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012114204691262659, + "loss": 0.0159, + "step": 460000 + }, + { + "epoch": 1.19, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.007131533697247505, + "eval_runtime": 107.4528, + "eval_samples_per_second": 18.613, + "eval_steps_per_second": 4.653, + "step": 460000 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113815869625512, + "loss": 0.0106, + "step": 460010 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113427047988366, + "loss": 0.0105, + "step": 460020 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012113038226351219, + "loss": 0.01, + "step": 460030 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012112649404714073, + "loss": 0.0081, + "step": 460040 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012112260583076926, + "loss": 0.0114, + "step": 460050 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211187176143978, + "loss": 0.0109, + "step": 460060 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012111482939802633, + "loss": 0.0132, + "step": 460070 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012111094118165487, + "loss": 0.0097, + "step": 460080 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001211070529652834, + "loss": 0.01, + "step": 460090 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012110316474891194, + "loss": 0.0112, + "step": 460100 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012109927653254046, + "loss": 0.0087, + "step": 460110 + }, + { + "epoch": 1.19, + "learning_rate": 0.000121095388316169, + "loss": 0.0103, + "step": 460120 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012109150009979753, + "loss": 0.0178, + "step": 460130 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012108761188342609, + "loss": 0.0128, + "step": 460140 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210837236670546, + "loss": 0.0132, + "step": 460150 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012107983545068316, + "loss": 0.0094, + "step": 460160 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012107594723431169, + "loss": 0.0142, + "step": 460170 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012107205901794023, + "loss": 0.0124, + "step": 460180 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012106817080156876, + "loss": 0.0123, + "step": 460190 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210642825851973, + "loss": 0.01, + "step": 460200 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012106039436882583, + "loss": 0.0099, + "step": 460210 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012105650615245437, + "loss": 0.0125, + "step": 460220 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210526179360829, + "loss": 0.0105, + "step": 460230 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012104872971971142, + "loss": 0.0145, + "step": 460240 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012104484150333997, + "loss": 0.008, + "step": 460250 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210409532869685, + "loss": 0.0101, + "step": 460260 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012103706507059704, + "loss": 0.0094, + "step": 460270 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012103317685422556, + "loss": 0.0121, + "step": 460280 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210292886378541, + "loss": 0.0114, + "step": 460290 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012102540042148263, + "loss": 0.009, + "step": 460300 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012102151220511118, + "loss": 0.008, + "step": 460310 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001210176239887397, + "loss": 0.0152, + "step": 460320 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012101373577236826, + "loss": 0.01, + "step": 460330 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100984755599679, + "loss": 0.0105, + "step": 460340 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100595933962533, + "loss": 0.0119, + "step": 460350 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012100207112325386, + "loss": 0.0136, + "step": 460360 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209981829068824, + "loss": 0.0101, + "step": 460370 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012099429469051093, + "loss": 0.0099, + "step": 460380 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012099040647413947, + "loss": 0.0099, + "step": 460390 + }, + { + "epoch": 1.19, + "learning_rate": 0.000120986518257768, + "loss": 0.0109, + "step": 460400 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012098263004139654, + "loss": 0.0082, + "step": 460410 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012097874182502507, + "loss": 0.0096, + "step": 460420 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012097485360865361, + "loss": 0.0113, + "step": 460430 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012097096539228214, + "loss": 0.0101, + "step": 460440 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012096707717591068, + "loss": 0.0102, + "step": 460450 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209631889595392, + "loss": 0.0106, + "step": 460460 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012095930074316775, + "loss": 0.0106, + "step": 460470 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012095541252679628, + "loss": 0.0101, + "step": 460480 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209515243104248, + "loss": 0.0091, + "step": 460490 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012094763609405336, + "loss": 0.0118, + "step": 460500 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012094374787768187, + "loss": 0.0092, + "step": 460510 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012093985966131043, + "loss": 0.0119, + "step": 460520 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012093597144493896, + "loss": 0.0105, + "step": 460530 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209320832285675, + "loss": 0.0082, + "step": 460540 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012092819501219603, + "loss": 0.012, + "step": 460550 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012092430679582457, + "loss": 0.0115, + "step": 460560 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001209204185794531, + "loss": 0.0108, + "step": 460570 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012091653036308164, + "loss": 0.0117, + "step": 460580 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012091264214671017, + "loss": 0.0093, + "step": 460590 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012090875393033871, + "loss": 0.0098, + "step": 460600 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012090486571396724, + "loss": 0.0093, + "step": 460610 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012090097749759578, + "loss": 0.011, + "step": 460620 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208970892812243, + "loss": 0.0108, + "step": 460630 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012089320106485285, + "loss": 0.0131, + "step": 460640 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088931284848137, + "loss": 0.0075, + "step": 460650 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088542463210992, + "loss": 0.0126, + "step": 460660 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012088153641573844, + "loss": 0.0097, + "step": 460670 + }, + { + "epoch": 1.19, + "learning_rate": 0.000120877648199367, + "loss": 0.0125, + "step": 460680 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012087375998299553, + "loss": 0.0121, + "step": 460690 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012086987176662407, + "loss": 0.0119, + "step": 460700 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208659835502526, + "loss": 0.0087, + "step": 460710 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012086209533388114, + "loss": 0.01, + "step": 460720 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012085820711750967, + "loss": 0.0108, + "step": 460730 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208543189011382, + "loss": 0.01, + "step": 460740 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012085043068476674, + "loss": 0.0111, + "step": 460750 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012084654246839526, + "loss": 0.0108, + "step": 460760 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208426542520238, + "loss": 0.0093, + "step": 460770 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012083876603565233, + "loss": 0.0116, + "step": 460780 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012083487781928088, + "loss": 0.0107, + "step": 460790 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208309896029094, + "loss": 0.0109, + "step": 460800 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012082710138653795, + "loss": 0.0108, + "step": 460810 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012082321317016647, + "loss": 0.0098, + "step": 460820 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012081932495379502, + "loss": 0.0105, + "step": 460830 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012081543673742354, + "loss": 0.0087, + "step": 460840 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001208115485210521, + "loss": 0.0115, + "step": 460850 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012080766030468063, + "loss": 0.0121, + "step": 460860 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012080377208830917, + "loss": 0.0104, + "step": 460870 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001207998838719377, + "loss": 0.0123, + "step": 460880 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012079599565556624, + "loss": 0.0087, + "step": 460890 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012079210743919477, + "loss": 0.0139, + "step": 460900 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078821922282331, + "loss": 0.013, + "step": 460910 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078433100645184, + "loss": 0.0092, + "step": 460920 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012078044279008038, + "loss": 0.0127, + "step": 460930 + }, + { + "epoch": 1.19, + "learning_rate": 0.0001207765545737089, + "loss": 0.0106, + "step": 460940 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012077266635733745, + "loss": 0.0123, + "step": 460950 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012076877814096598, + "loss": 0.0125, + "step": 460960 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012076488992459452, + "loss": 0.0176, + "step": 460970 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012076100170822305, + "loss": 0.0107, + "step": 460980 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012075711349185157, + "loss": 0.0092, + "step": 460990 + }, + { + "epoch": 1.19, + "learning_rate": 0.00012075322527548012, + "loss": 0.0109, + "step": 461000 + }, + { + "epoch": 1.19, + "eval_cer": 0.881719481966378, + "eval_loss": 0.0072724465280771255, + "eval_runtime": 107.8929, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 461000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012074933705910864, + "loss": 0.0117, + "step": 461010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012074544884273718, + "loss": 0.0106, + "step": 461020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012074156062636571, + "loss": 0.0139, + "step": 461030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012073767240999427, + "loss": 0.0107, + "step": 461040 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001207337841936228, + "loss": 0.0116, + "step": 461050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072989597725134, + "loss": 0.0112, + "step": 461060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072600776087987, + "loss": 0.0116, + "step": 461070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012072211954450841, + "loss": 0.011, + "step": 461080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012071823132813694, + "loss": 0.0094, + "step": 461090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012071434311176548, + "loss": 0.0084, + "step": 461100 + }, + { + "epoch": 1.2, + "learning_rate": 0.000120710454895394, + "loss": 0.0115, + "step": 461110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012070656667902255, + "loss": 0.0095, + "step": 461120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012070267846265107, + "loss": 0.0109, + "step": 461130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069879024627962, + "loss": 0.0113, + "step": 461140 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069490202990814, + "loss": 0.0113, + "step": 461150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012069101381353669, + "loss": 0.0274, + "step": 461160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012068712559716521, + "loss": 0.0101, + "step": 461170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012068323738079376, + "loss": 0.0142, + "step": 461180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012067934916442228, + "loss": 0.0129, + "step": 461190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012067546094805084, + "loss": 0.0098, + "step": 461200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012067157273167937, + "loss": 0.0093, + "step": 461210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012066768451530791, + "loss": 0.0109, + "step": 461220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012066379629893644, + "loss": 0.0096, + "step": 461230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012065990808256497, + "loss": 0.0136, + "step": 461240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012065601986619351, + "loss": 0.0125, + "step": 461250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012065213164982203, + "loss": 0.0099, + "step": 461260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012064824343345058, + "loss": 0.0135, + "step": 461270 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001206443552170791, + "loss": 0.0089, + "step": 461280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012064046700070765, + "loss": 0.0138, + "step": 461290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012063657878433617, + "loss": 0.0123, + "step": 461300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012063269056796472, + "loss": 0.0108, + "step": 461310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012062880235159324, + "loss": 0.0094, + "step": 461320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012062491413522179, + "loss": 0.0093, + "step": 461330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012062102591885031, + "loss": 0.0125, + "step": 461340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012061713770247886, + "loss": 0.0089, + "step": 461350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012061324948610738, + "loss": 0.0127, + "step": 461360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012060936126973594, + "loss": 0.0125, + "step": 461370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012060547305336445, + "loss": 0.0093, + "step": 461380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012060158483699301, + "loss": 0.0103, + "step": 461390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012059769662062154, + "loss": 0.0118, + "step": 461400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012059380840425008, + "loss": 0.0096, + "step": 461410 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001205899201878786, + "loss": 0.0141, + "step": 461420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012058603197150715, + "loss": 0.0099, + "step": 461430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012058214375513568, + "loss": 0.0112, + "step": 461440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012057825553876422, + "loss": 0.0099, + "step": 461450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012057436732239275, + "loss": 0.0098, + "step": 461460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012057047910602129, + "loss": 0.0123, + "step": 461470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012056659088964982, + "loss": 0.0093, + "step": 461480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012056270267327834, + "loss": 0.0118, + "step": 461490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012055881445690689, + "loss": 0.0079, + "step": 461500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012055492624053541, + "loss": 0.0084, + "step": 461510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012055103802416395, + "loss": 0.0109, + "step": 461520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012054714980779248, + "loss": 0.0116, + "step": 461530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012054326159142102, + "loss": 0.0118, + "step": 461540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012053937337504955, + "loss": 0.0091, + "step": 461550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012053548515867811, + "loss": 0.0123, + "step": 461560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012053159694230664, + "loss": 0.0129, + "step": 461570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012052770872593518, + "loss": 0.0113, + "step": 461580 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001205238205095637, + "loss": 0.0106, + "step": 461590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012051993229319225, + "loss": 0.0161, + "step": 461600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012051604407682078, + "loss": 0.0093, + "step": 461610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012051215586044932, + "loss": 0.0108, + "step": 461620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050826764407785, + "loss": 0.0173, + "step": 461630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050437942770639, + "loss": 0.0102, + "step": 461640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012050049121133491, + "loss": 0.0105, + "step": 461650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012049660299496346, + "loss": 0.0086, + "step": 461660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012049271477859198, + "loss": 0.0123, + "step": 461670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012048882656222053, + "loss": 0.01, + "step": 461680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012048493834584905, + "loss": 0.0142, + "step": 461690 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001204810501294776, + "loss": 0.0109, + "step": 461700 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012047716191310612, + "loss": 0.0096, + "step": 461710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012047327369673468, + "loss": 0.0131, + "step": 461720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012046938548036321, + "loss": 0.0108, + "step": 461730 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012046549726399172, + "loss": 0.0104, + "step": 461740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012046160904762028, + "loss": 0.0118, + "step": 461750 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001204577208312488, + "loss": 0.0104, + "step": 461760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012045383261487735, + "loss": 0.0104, + "step": 461770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044994439850587, + "loss": 0.0124, + "step": 461780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044605618213442, + "loss": 0.0088, + "step": 461790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012044216796576294, + "loss": 0.0126, + "step": 461800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043827974939149, + "loss": 0.0079, + "step": 461810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043439153302001, + "loss": 0.0106, + "step": 461820 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012043050331664856, + "loss": 0.0126, + "step": 461830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012042661510027708, + "loss": 0.0119, + "step": 461840 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012042272688390563, + "loss": 0.0098, + "step": 461850 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012041883866753415, + "loss": 0.0169, + "step": 461860 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001204149504511627, + "loss": 0.0126, + "step": 461870 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012041106223479122, + "loss": 0.0113, + "step": 461880 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012040717401841978, + "loss": 0.0096, + "step": 461890 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012040328580204829, + "loss": 0.0117, + "step": 461900 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012039939758567685, + "loss": 0.0209, + "step": 461910 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012039550936930538, + "loss": 0.0093, + "step": 461920 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012039162115293392, + "loss": 0.0106, + "step": 461930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012038773293656245, + "loss": 0.0118, + "step": 461940 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012038384472019099, + "loss": 0.0105, + "step": 461950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012037995650381952, + "loss": 0.012, + "step": 461960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012037606828744806, + "loss": 0.011, + "step": 461970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012037218007107659, + "loss": 0.0089, + "step": 461980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012036829185470511, + "loss": 0.0097, + "step": 461990 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012036440363833366, + "loss": 0.0085, + "step": 462000 + }, + { + "epoch": 1.2, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.00711864186450839, + "eval_runtime": 107.836, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, + "step": 462000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012036051542196218, + "loss": 0.0141, + "step": 462010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012035662720559073, + "loss": 0.0089, + "step": 462020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012035273898921925, + "loss": 0.0109, + "step": 462030 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001203488507728478, + "loss": 0.0099, + "step": 462040 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012034496255647632, + "loss": 0.0109, + "step": 462050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012034107434010486, + "loss": 0.0159, + "step": 462060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012033718612373339, + "loss": 0.0113, + "step": 462070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012033329790736195, + "loss": 0.0114, + "step": 462080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012032940969099048, + "loss": 0.0097, + "step": 462090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012032552147461902, + "loss": 0.0115, + "step": 462100 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012032163325824755, + "loss": 0.0127, + "step": 462110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012031774504187609, + "loss": 0.0108, + "step": 462120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012031385682550462, + "loss": 0.0113, + "step": 462130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012030996860913316, + "loss": 0.0119, + "step": 462140 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012030608039276169, + "loss": 0.0115, + "step": 462150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012030219217639023, + "loss": 0.0119, + "step": 462160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012029830396001875, + "loss": 0.0102, + "step": 462170 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202944157436473, + "loss": 0.0099, + "step": 462180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012029052752727582, + "loss": 0.0119, + "step": 462190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012028663931090437, + "loss": 0.0126, + "step": 462200 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202827510945329, + "loss": 0.0102, + "step": 462210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012027886287816144, + "loss": 0.0098, + "step": 462220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012027497466178996, + "loss": 0.0113, + "step": 462230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012027108644541849, + "loss": 0.0092, + "step": 462240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012026719822904703, + "loss": 0.0135, + "step": 462250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012026331001267556, + "loss": 0.0105, + "step": 462260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025942179630412, + "loss": 0.0117, + "step": 462270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025553357993265, + "loss": 0.0123, + "step": 462280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012025164536356119, + "loss": 0.012, + "step": 462290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012024775714718971, + "loss": 0.0094, + "step": 462300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012024386893081826, + "loss": 0.0107, + "step": 462310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012023998071444678, + "loss": 0.0144, + "step": 462320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012023609249807533, + "loss": 0.0125, + "step": 462330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012023220428170385, + "loss": 0.0106, + "step": 462340 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202283160653324, + "loss": 0.0106, + "step": 462350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012022442784896092, + "loss": 0.0099, + "step": 462360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012022053963258947, + "loss": 0.0089, + "step": 462370 + }, + { + "epoch": 1.2, + "learning_rate": 0.000120216651416218, + "loss": 0.0152, + "step": 462380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012021276319984654, + "loss": 0.014, + "step": 462390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012020887498347506, + "loss": 0.0116, + "step": 462400 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001202049867671036, + "loss": 0.0103, + "step": 462410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012020109855073213, + "loss": 0.0091, + "step": 462420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012019721033436069, + "loss": 0.0097, + "step": 462430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012019332211798922, + "loss": 0.0109, + "step": 462440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012018943390161776, + "loss": 0.011, + "step": 462450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012018554568524629, + "loss": 0.0125, + "step": 462460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012018165746887483, + "loss": 0.0116, + "step": 462470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012017776925250336, + "loss": 0.0134, + "step": 462480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012017388103613188, + "loss": 0.0162, + "step": 462490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012016999281976043, + "loss": 0.0109, + "step": 462500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012016610460338895, + "loss": 0.0139, + "step": 462510 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001201622163870175, + "loss": 0.0093, + "step": 462520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012015832817064602, + "loss": 0.0087, + "step": 462530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012015443995427457, + "loss": 0.0106, + "step": 462540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012015055173790309, + "loss": 0.0105, + "step": 462550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012014666352153163, + "loss": 0.01, + "step": 462560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012014277530516016, + "loss": 0.0098, + "step": 462570 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001201388870887887, + "loss": 0.0146, + "step": 462580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013499887241723, + "loss": 0.0156, + "step": 462590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012013111065604579, + "loss": 0.0111, + "step": 462600 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001201272224396743, + "loss": 0.0094, + "step": 462610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012012333422330286, + "loss": 0.0127, + "step": 462620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012011944600693139, + "loss": 0.0086, + "step": 462630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012011555779055993, + "loss": 0.008, + "step": 462640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012011166957418846, + "loss": 0.0089, + "step": 462650 + }, + { + "epoch": 1.2, + "learning_rate": 0.000120107781357817, + "loss": 0.0095, + "step": 462660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012010389314144552, + "loss": 0.0114, + "step": 462670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012010000492507407, + "loss": 0.0105, + "step": 462680 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200961167087026, + "loss": 0.0117, + "step": 462690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012009222849233114, + "loss": 0.0098, + "step": 462700 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012008834027595966, + "loss": 0.0117, + "step": 462710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012008445205958819, + "loss": 0.0108, + "step": 462720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012008056384321673, + "loss": 0.0082, + "step": 462730 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012007667562684526, + "loss": 0.012, + "step": 462740 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200727874104738, + "loss": 0.0129, + "step": 462750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012006889919410233, + "loss": 0.0113, + "step": 462760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012006501097773087, + "loss": 0.0101, + "step": 462770 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200611227613594, + "loss": 0.0101, + "step": 462780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012005723454498796, + "loss": 0.0142, + "step": 462790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012005334632861648, + "loss": 0.0108, + "step": 462800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012004945811224503, + "loss": 0.012, + "step": 462810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012004556989587355, + "loss": 0.0087, + "step": 462820 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200416816795021, + "loss": 0.0108, + "step": 462830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012003779346313062, + "loss": 0.0109, + "step": 462840 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012003390524675917, + "loss": 0.0086, + "step": 462850 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200300170303877, + "loss": 0.0086, + "step": 462860 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012002612881401624, + "loss": 0.0142, + "step": 462870 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012002224059764476, + "loss": 0.0117, + "step": 462880 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200183523812733, + "loss": 0.0102, + "step": 462890 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012001446416490183, + "loss": 0.0096, + "step": 462900 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012001057594853038, + "loss": 0.0102, + "step": 462910 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001200066877321589, + "loss": 0.0105, + "step": 462920 + }, + { + "epoch": 1.2, + "learning_rate": 0.00012000279951578744, + "loss": 0.0077, + "step": 462930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011999891129941597, + "loss": 0.0125, + "step": 462940 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011999502308304453, + "loss": 0.0121, + "step": 462950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011999113486667306, + "loss": 0.0109, + "step": 462960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011998724665030157, + "loss": 0.0113, + "step": 462970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011998335843393013, + "loss": 0.0108, + "step": 462980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011997947021755865, + "loss": 0.0168, + "step": 462990 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199755820011872, + "loss": 0.0126, + "step": 463000 + }, + { + "epoch": 1.2, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.006891580764204264, + "eval_runtime": 108.0948, + "eval_samples_per_second": 18.502, + "eval_steps_per_second": 4.626, + "step": 463000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011997169378481572, + "loss": 0.0089, + "step": 463010 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011996780556844427, + "loss": 0.0089, + "step": 463020 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199639173520728, + "loss": 0.0124, + "step": 463030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011996002913570134, + "loss": 0.0142, + "step": 463040 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011995614091932986, + "loss": 0.0176, + "step": 463050 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199522527029584, + "loss": 0.0095, + "step": 463060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011994836448658693, + "loss": 0.0092, + "step": 463070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011994447627021547, + "loss": 0.0102, + "step": 463080 + }, + { + "epoch": 1.2, + "learning_rate": 0.000119940588053844, + "loss": 0.0098, + "step": 463090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011993669983747254, + "loss": 0.011, + "step": 463100 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011993281162110107, + "loss": 0.0106, + "step": 463110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011992892340472963, + "loss": 0.0114, + "step": 463120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011992503518835814, + "loss": 0.0114, + "step": 463130 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199211469719867, + "loss": 0.0099, + "step": 463140 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011991725875561523, + "loss": 0.011, + "step": 463150 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011991337053924377, + "loss": 0.0127, + "step": 463160 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001199094823228723, + "loss": 0.0104, + "step": 463170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011990559410650084, + "loss": 0.0076, + "step": 463180 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011990170589012936, + "loss": 0.0139, + "step": 463190 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198978176737579, + "loss": 0.0132, + "step": 463200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011989392945738643, + "loss": 0.0075, + "step": 463210 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011989004124101496, + "loss": 0.0106, + "step": 463220 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198861530246435, + "loss": 0.0106, + "step": 463230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011988226480827203, + "loss": 0.0097, + "step": 463240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011987837659190057, + "loss": 0.0095, + "step": 463250 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198744883755291, + "loss": 0.0109, + "step": 463260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011987060015915764, + "loss": 0.0097, + "step": 463270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011986671194278617, + "loss": 0.0102, + "step": 463280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011986282372641471, + "loss": 0.0087, + "step": 463290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011985893551004324, + "loss": 0.0093, + "step": 463300 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198550472936718, + "loss": 0.0128, + "step": 463310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011985115907730032, + "loss": 0.0133, + "step": 463320 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011984727086092887, + "loss": 0.0118, + "step": 463330 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198433826445574, + "loss": 0.0106, + "step": 463340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011983949442818594, + "loss": 0.0108, + "step": 463350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011983560621181446, + "loss": 0.0101, + "step": 463360 + }, + { + "epoch": 1.2, + "learning_rate": 0.000119831717995443, + "loss": 0.0105, + "step": 463370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982782977907153, + "loss": 0.0131, + "step": 463380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011982394156270008, + "loss": 0.0084, + "step": 463390 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001198200533463286, + "loss": 0.0111, + "step": 463400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011981616512995715, + "loss": 0.0095, + "step": 463410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011981227691358567, + "loss": 0.0095, + "step": 463420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011980838869721422, + "loss": 0.0084, + "step": 463430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011980450048084274, + "loss": 0.0112, + "step": 463440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011980061226447128, + "loss": 0.014, + "step": 463450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011979672404809981, + "loss": 0.0131, + "step": 463460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011979283583172834, + "loss": 0.0121, + "step": 463470 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197889476153569, + "loss": 0.014, + "step": 463480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011978505939898541, + "loss": 0.0116, + "step": 463490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011978117118261397, + "loss": 0.0095, + "step": 463500 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197772829662425, + "loss": 0.0109, + "step": 463510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011977339474987104, + "loss": 0.0116, + "step": 463520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011976950653349956, + "loss": 0.0094, + "step": 463530 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197656183171281, + "loss": 0.0127, + "step": 463540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011976173010075663, + "loss": 0.0112, + "step": 463550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011975784188438518, + "loss": 0.0093, + "step": 463560 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001197539536680137, + "loss": 0.0096, + "step": 463570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011975006545164224, + "loss": 0.0106, + "step": 463580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011974617723527077, + "loss": 0.0113, + "step": 463590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011974228901889931, + "loss": 0.0097, + "step": 463600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011973840080252784, + "loss": 0.0118, + "step": 463610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011973451258615638, + "loss": 0.0093, + "step": 463620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011973062436978491, + "loss": 0.0098, + "step": 463630 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011972673615341345, + "loss": 0.0136, + "step": 463640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011972284793704198, + "loss": 0.0122, + "step": 463650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011971895972067054, + "loss": 0.0104, + "step": 463660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011971507150429907, + "loss": 0.0114, + "step": 463670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011971118328792761, + "loss": 0.013, + "step": 463680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011970729507155614, + "loss": 0.0132, + "step": 463690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011970340685518468, + "loss": 0.0091, + "step": 463700 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001196995186388132, + "loss": 0.0116, + "step": 463710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011969563042244173, + "loss": 0.0113, + "step": 463720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011969174220607027, + "loss": 0.0091, + "step": 463730 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001196878539896988, + "loss": 0.0125, + "step": 463740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011968396577332734, + "loss": 0.0126, + "step": 463750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011968007755695587, + "loss": 0.0099, + "step": 463760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011967618934058441, + "loss": 0.0145, + "step": 463770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011967230112421294, + "loss": 0.0099, + "step": 463780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966841290784148, + "loss": 0.0195, + "step": 463790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966452469147001, + "loss": 0.0156, + "step": 463800 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011966063647509855, + "loss": 0.0087, + "step": 463810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011965674825872708, + "loss": 0.0101, + "step": 463820 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011965286004235564, + "loss": 0.0102, + "step": 463830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011964897182598415, + "loss": 0.0083, + "step": 463840 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001196450836096127, + "loss": 0.009, + "step": 463850 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011964119539324123, + "loss": 0.0112, + "step": 463860 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011963730717686978, + "loss": 0.0117, + "step": 463870 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001196334189604983, + "loss": 0.011, + "step": 463880 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011962953074412685, + "loss": 0.0095, + "step": 463890 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011962564252775537, + "loss": 0.0098, + "step": 463900 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011962175431138392, + "loss": 0.0093, + "step": 463910 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011961786609501244, + "loss": 0.0133, + "step": 463920 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011961397787864099, + "loss": 0.0097, + "step": 463930 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011961008966226951, + "loss": 0.0109, + "step": 463940 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011960620144589806, + "loss": 0.0101, + "step": 463950 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011960231322952658, + "loss": 0.0122, + "step": 463960 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011959842501315511, + "loss": 0.009, + "step": 463970 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011959453679678365, + "loss": 0.0079, + "step": 463980 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011959064858041218, + "loss": 0.0137, + "step": 463990 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011958676036404072, + "loss": 0.01, + "step": 464000 + }, + { + "epoch": 1.2, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.0069192503578960896, + "eval_runtime": 107.9208, + "eval_samples_per_second": 18.532, + "eval_steps_per_second": 4.633, + "step": 464000 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011958287214766925, + "loss": 0.0094, + "step": 464010 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195789839312978, + "loss": 0.012, + "step": 464020 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011957509571492633, + "loss": 0.0083, + "step": 464030 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011957120749855488, + "loss": 0.0109, + "step": 464040 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195673192821834, + "loss": 0.01, + "step": 464050 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011956343106581195, + "loss": 0.0102, + "step": 464060 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011955954284944047, + "loss": 0.0113, + "step": 464070 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011955565463306901, + "loss": 0.012, + "step": 464080 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011955176641669754, + "loss": 0.0123, + "step": 464090 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954787820032608, + "loss": 0.0142, + "step": 464100 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954398998395461, + "loss": 0.009, + "step": 464110 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011954010176758315, + "loss": 0.0111, + "step": 464120 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011953621355121168, + "loss": 0.0104, + "step": 464130 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011953232533484022, + "loss": 0.0137, + "step": 464140 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011952843711846875, + "loss": 0.0103, + "step": 464150 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195245489020973, + "loss": 0.0089, + "step": 464160 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011952066068572582, + "loss": 0.016, + "step": 464170 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011951677246935438, + "loss": 0.0095, + "step": 464180 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195128842529829, + "loss": 0.0081, + "step": 464190 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011950899603661145, + "loss": 0.0093, + "step": 464200 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011950510782023997, + "loss": 0.0089, + "step": 464210 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001195012196038685, + "loss": 0.0087, + "step": 464220 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011949733138749704, + "loss": 0.0099, + "step": 464230 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011949344317112557, + "loss": 0.0128, + "step": 464240 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948955495475411, + "loss": 0.0111, + "step": 464250 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948566673838264, + "loss": 0.0099, + "step": 464260 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011948177852201118, + "loss": 0.0124, + "step": 464270 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011947789030563971, + "loss": 0.0108, + "step": 464280 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011947400208926825, + "loss": 0.0101, + "step": 464290 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011947011387289678, + "loss": 0.0089, + "step": 464300 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011946622565652532, + "loss": 0.0071, + "step": 464310 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011946233744015385, + "loss": 0.0085, + "step": 464320 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001194584492237824, + "loss": 0.0078, + "step": 464330 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011945456100741092, + "loss": 0.0115, + "step": 464340 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011945067279103948, + "loss": 0.0085, + "step": 464350 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011944678457466799, + "loss": 0.009, + "step": 464360 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011944289635829655, + "loss": 0.0086, + "step": 464370 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011943900814192507, + "loss": 0.0158, + "step": 464380 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011943511992555362, + "loss": 0.0122, + "step": 464390 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011943123170918214, + "loss": 0.0092, + "step": 464400 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011942734349281069, + "loss": 0.0166, + "step": 464410 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011942345527643921, + "loss": 0.014, + "step": 464420 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941956706006776, + "loss": 0.0125, + "step": 464430 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941567884369628, + "loss": 0.0119, + "step": 464440 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011941179062732483, + "loss": 0.0125, + "step": 464450 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011940790241095335, + "loss": 0.0144, + "step": 464460 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011940401419458188, + "loss": 0.0101, + "step": 464470 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011940012597821042, + "loss": 0.0104, + "step": 464480 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011939623776183895, + "loss": 0.0171, + "step": 464490 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011939234954546749, + "loss": 0.0109, + "step": 464500 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938846132909602, + "loss": 0.0108, + "step": 464510 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938457311272456, + "loss": 0.0124, + "step": 464520 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011938068489635309, + "loss": 0.0107, + "step": 464530 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011937679667998165, + "loss": 0.0098, + "step": 464540 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011937290846361017, + "loss": 0.0167, + "step": 464550 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011936902024723872, + "loss": 0.0102, + "step": 464560 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011936513203086724, + "loss": 0.0104, + "step": 464570 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011936124381449579, + "loss": 0.0102, + "step": 464580 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011935735559812431, + "loss": 0.0089, + "step": 464590 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011935346738175285, + "loss": 0.0109, + "step": 464600 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011934957916538138, + "loss": 0.0087, + "step": 464610 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011934569094900992, + "loss": 0.0108, + "step": 464620 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011934180273263845, + "loss": 0.0098, + "step": 464630 + }, + { + "epoch": 1.2, + "learning_rate": 0.000119337914516267, + "loss": 0.0128, + "step": 464640 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011933402629989552, + "loss": 0.0095, + "step": 464650 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011933013808352406, + "loss": 0.0091, + "step": 464660 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011932624986715259, + "loss": 0.0092, + "step": 464670 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011932236165078113, + "loss": 0.0082, + "step": 464680 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011931847343440966, + "loss": 0.012, + "step": 464690 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011931458521803822, + "loss": 0.0088, + "step": 464700 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011931069700166675, + "loss": 0.0094, + "step": 464710 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011930680878529526, + "loss": 0.0099, + "step": 464720 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011930292056892381, + "loss": 0.015, + "step": 464730 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011929903235255234, + "loss": 0.0103, + "step": 464740 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011929514413618088, + "loss": 0.0112, + "step": 464750 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011929125591980941, + "loss": 0.0113, + "step": 464760 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011928736770343795, + "loss": 0.0093, + "step": 464770 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011928347948706648, + "loss": 0.0123, + "step": 464780 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011927959127069502, + "loss": 0.0123, + "step": 464790 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011927570305432355, + "loss": 0.0137, + "step": 464800 + }, + { + "epoch": 1.2, + "learning_rate": 0.0001192718148379521, + "loss": 0.0088, + "step": 464810 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011926792662158062, + "loss": 0.011, + "step": 464820 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011926403840520916, + "loss": 0.0131, + "step": 464830 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011926015018883769, + "loss": 0.0123, + "step": 464840 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011925626197246623, + "loss": 0.0106, + "step": 464850 + }, + { + "epoch": 1.2, + "learning_rate": 0.00011925237375609476, + "loss": 0.0095, + "step": 464860 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001192484855397233, + "loss": 0.0106, + "step": 464870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011924459732335183, + "loss": 0.0098, + "step": 464880 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011924070910698039, + "loss": 0.0083, + "step": 464890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011923682089060891, + "loss": 0.0091, + "step": 464900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011923293267423746, + "loss": 0.0136, + "step": 464910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922904445786598, + "loss": 0.0113, + "step": 464920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922515624149453, + "loss": 0.0128, + "step": 464930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011922126802512305, + "loss": 0.0081, + "step": 464940 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001192173798087516, + "loss": 0.0122, + "step": 464950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011921349159238012, + "loss": 0.0129, + "step": 464960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920960337600865, + "loss": 0.0126, + "step": 464970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920571515963719, + "loss": 0.0088, + "step": 464980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011920182694326572, + "loss": 0.0098, + "step": 464990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011919793872689426, + "loss": 0.0108, + "step": 465000 + }, + { + "epoch": 1.21, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.006845335941761732, + "eval_runtime": 107.9447, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 465000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011919405051052279, + "loss": 0.0135, + "step": 465010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011919016229415133, + "loss": 0.0116, + "step": 465020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011918627407777986, + "loss": 0.0099, + "step": 465030 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191823858614084, + "loss": 0.0106, + "step": 465040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011917849764503693, + "loss": 0.0108, + "step": 465050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011917460942866549, + "loss": 0.0096, + "step": 465060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011917072121229401, + "loss": 0.0094, + "step": 465070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011916683299592256, + "loss": 0.0149, + "step": 465080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011916294477955108, + "loss": 0.0083, + "step": 465090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011915905656317963, + "loss": 0.0113, + "step": 465100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011915516834680815, + "loss": 0.0122, + "step": 465110 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191512801304367, + "loss": 0.0091, + "step": 465120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011914739191406522, + "loss": 0.0135, + "step": 465130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011914350369769376, + "loss": 0.0096, + "step": 465140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011913961548132229, + "loss": 0.0112, + "step": 465150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011913572726495083, + "loss": 0.009, + "step": 465160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011913183904857936, + "loss": 0.0103, + "step": 465170 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191279508322079, + "loss": 0.0096, + "step": 465180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011912406261583643, + "loss": 0.0106, + "step": 465190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011912017439946496, + "loss": 0.01, + "step": 465200 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191162861830935, + "loss": 0.0095, + "step": 465210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011911239796672203, + "loss": 0.0122, + "step": 465220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011910850975035057, + "loss": 0.0114, + "step": 465230 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001191046215339791, + "loss": 0.0116, + "step": 465240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011910073331760765, + "loss": 0.0111, + "step": 465250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011909684510123618, + "loss": 0.0102, + "step": 465260 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011909295688486472, + "loss": 0.011, + "step": 465270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011908906866849325, + "loss": 0.0118, + "step": 465280 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190851804521218, + "loss": 0.0104, + "step": 465290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011908129223575032, + "loss": 0.0117, + "step": 465300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011907740401937886, + "loss": 0.0102, + "step": 465310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011907351580300739, + "loss": 0.0113, + "step": 465320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011906962758663593, + "loss": 0.012, + "step": 465330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011906573937026446, + "loss": 0.0192, + "step": 465340 + }, + { + "epoch": 1.21, + "learning_rate": 0.000119061851153893, + "loss": 0.0087, + "step": 465350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011905796293752153, + "loss": 0.0188, + "step": 465360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011905407472115007, + "loss": 0.0102, + "step": 465370 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190501865047786, + "loss": 0.0099, + "step": 465380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011904629828840714, + "loss": 0.0086, + "step": 465390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011904241007203567, + "loss": 0.0121, + "step": 465400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011903852185566423, + "loss": 0.0136, + "step": 465410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011903463363929275, + "loss": 0.0113, + "step": 465420 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190307454229213, + "loss": 0.0148, + "step": 465430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011902685720654982, + "loss": 0.0096, + "step": 465440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011902296899017835, + "loss": 0.0105, + "step": 465450 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001190190807738069, + "loss": 0.0109, + "step": 465460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011901519255743542, + "loss": 0.0112, + "step": 465470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011901130434106396, + "loss": 0.0124, + "step": 465480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011900741612469249, + "loss": 0.011, + "step": 465490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011900352790832103, + "loss": 0.0072, + "step": 465500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011899963969194956, + "loss": 0.0122, + "step": 465510 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189957514755781, + "loss": 0.0102, + "step": 465520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011899186325920663, + "loss": 0.01, + "step": 465530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011898797504283517, + "loss": 0.0091, + "step": 465540 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189840868264637, + "loss": 0.0093, + "step": 465550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011898019861009224, + "loss": 0.0123, + "step": 465560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011897631039372077, + "loss": 0.011, + "step": 465570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011897242217734933, + "loss": 0.0088, + "step": 465580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011896853396097784, + "loss": 0.011, + "step": 465590 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189646457446064, + "loss": 0.0137, + "step": 465600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011896075752823492, + "loss": 0.0105, + "step": 465610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011895686931186346, + "loss": 0.011, + "step": 465620 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011895298109549199, + "loss": 0.0077, + "step": 465630 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011894909287912053, + "loss": 0.0088, + "step": 465640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011894520466274906, + "loss": 0.0084, + "step": 465650 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189413164463776, + "loss": 0.0096, + "step": 465660 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011893742823000613, + "loss": 0.0172, + "step": 465670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011893354001363467, + "loss": 0.0115, + "step": 465680 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189296517972632, + "loss": 0.0129, + "step": 465690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011892576358089173, + "loss": 0.0141, + "step": 465700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011892187536452027, + "loss": 0.012, + "step": 465710 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001189179871481488, + "loss": 0.0123, + "step": 465720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011891409893177734, + "loss": 0.0096, + "step": 465730 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011891021071540587, + "loss": 0.01, + "step": 465740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011890632249903441, + "loss": 0.0093, + "step": 465750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011890243428266294, + "loss": 0.0135, + "step": 465760 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188985460662915, + "loss": 0.0135, + "step": 465770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011889465784992002, + "loss": 0.0146, + "step": 465780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011889076963354856, + "loss": 0.0124, + "step": 465790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011888688141717709, + "loss": 0.0126, + "step": 465800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011888299320080563, + "loss": 0.0099, + "step": 465810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011887910498443416, + "loss": 0.0114, + "step": 465820 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188752167680627, + "loss": 0.0112, + "step": 465830 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011887132855169123, + "loss": 0.0111, + "step": 465840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011886744033531977, + "loss": 0.0101, + "step": 465850 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188635521189483, + "loss": 0.0121, + "step": 465860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011885966390257684, + "loss": 0.0082, + "step": 465870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011885577568620537, + "loss": 0.0103, + "step": 465880 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011885188746983391, + "loss": 0.0102, + "step": 465890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011884799925346244, + "loss": 0.0104, + "step": 465900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011884411103709098, + "loss": 0.0135, + "step": 465910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011884022282071951, + "loss": 0.0098, + "step": 465920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011883633460434807, + "loss": 0.0102, + "step": 465930 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188324463879766, + "loss": 0.0078, + "step": 465940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882855817160511, + "loss": 0.0087, + "step": 465950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882466995523366, + "loss": 0.0125, + "step": 465960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011882078173886219, + "loss": 0.0105, + "step": 465970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011881689352249073, + "loss": 0.0091, + "step": 465980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011881300530611926, + "loss": 0.0089, + "step": 465990 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001188091170897478, + "loss": 0.0101, + "step": 466000 + }, + { + "epoch": 1.21, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.00721912644803524, + "eval_runtime": 107.9087, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.634, + "step": 466000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011880522887337633, + "loss": 0.0107, + "step": 466010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011880134065700487, + "loss": 0.0171, + "step": 466020 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001187974524406334, + "loss": 0.0106, + "step": 466030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011879356422426194, + "loss": 0.0062, + "step": 466040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011878967600789047, + "loss": 0.0086, + "step": 466050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011878578779151901, + "loss": 0.0103, + "step": 466060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011878189957514754, + "loss": 0.0101, + "step": 466070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011877801135877608, + "loss": 0.0105, + "step": 466080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011877412314240461, + "loss": 0.0144, + "step": 466090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011877023492603317, + "loss": 0.0096, + "step": 466100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011876634670966168, + "loss": 0.0095, + "step": 466110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011876245849329024, + "loss": 0.0115, + "step": 466120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011875857027691876, + "loss": 0.013, + "step": 466130 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001187546820605473, + "loss": 0.0096, + "step": 466140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011875079384417583, + "loss": 0.0121, + "step": 466150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011874690562780437, + "loss": 0.0097, + "step": 466160 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001187430174114329, + "loss": 0.0137, + "step": 466170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011873912919506144, + "loss": 0.0094, + "step": 466180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011873524097868997, + "loss": 0.0112, + "step": 466190 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001187313527623185, + "loss": 0.0105, + "step": 466200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011872746454594704, + "loss": 0.0143, + "step": 466210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011872357632957557, + "loss": 0.0118, + "step": 466220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011871968811320411, + "loss": 0.0069, + "step": 466230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011871579989683264, + "loss": 0.0102, + "step": 466240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011871191168046118, + "loss": 0.0134, + "step": 466250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011870802346408971, + "loss": 0.009, + "step": 466260 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011870413524771825, + "loss": 0.0103, + "step": 466270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011870024703134678, + "loss": 0.0102, + "step": 466280 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011869635881497533, + "loss": 0.0108, + "step": 466290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011869247059860386, + "loss": 0.0132, + "step": 466300 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186885823822324, + "loss": 0.0108, + "step": 466310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011868469416586093, + "loss": 0.0094, + "step": 466320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011868080594948947, + "loss": 0.0098, + "step": 466330 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118676917733118, + "loss": 0.0099, + "step": 466340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011867302951674654, + "loss": 0.0118, + "step": 466350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011866914130037507, + "loss": 0.0111, + "step": 466360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011866525308400361, + "loss": 0.0084, + "step": 466370 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011866136486763214, + "loss": 0.0106, + "step": 466380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011865747665126068, + "loss": 0.0112, + "step": 466390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011865358843488921, + "loss": 0.0081, + "step": 466400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864970021851775, + "loss": 0.0131, + "step": 466410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864581200214628, + "loss": 0.0123, + "step": 466420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011864192378577482, + "loss": 0.0127, + "step": 466430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011863803556940335, + "loss": 0.0134, + "step": 466440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011863414735303188, + "loss": 0.0119, + "step": 466450 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011863025913666042, + "loss": 0.0153, + "step": 466460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011862637092028895, + "loss": 0.0097, + "step": 466470 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186224827039175, + "loss": 0.0093, + "step": 466480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011861859448754603, + "loss": 0.0117, + "step": 466490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011861470627117457, + "loss": 0.0118, + "step": 466500 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001186108180548031, + "loss": 0.0165, + "step": 466510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011860692983843164, + "loss": 0.0087, + "step": 466520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011860304162206017, + "loss": 0.0105, + "step": 466530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011859915340568871, + "loss": 0.0117, + "step": 466540 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011859526518931724, + "loss": 0.0093, + "step": 466550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011859137697294578, + "loss": 0.0124, + "step": 466560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011858748875657431, + "loss": 0.0142, + "step": 466570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011858360054020285, + "loss": 0.0142, + "step": 466580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857971232383138, + "loss": 0.0118, + "step": 466590 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857582410745992, + "loss": 0.013, + "step": 466600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011857193589108845, + "loss": 0.0097, + "step": 466610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011856804767471699, + "loss": 0.0098, + "step": 466620 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011856415945834552, + "loss": 0.0107, + "step": 466630 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011856027124197408, + "loss": 0.0108, + "step": 466640 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001185563830256026, + "loss": 0.0126, + "step": 466650 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011855249480923114, + "loss": 0.0133, + "step": 466660 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854860659285967, + "loss": 0.011, + "step": 466670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854471837648821, + "loss": 0.0081, + "step": 466680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011854083016011674, + "loss": 0.0101, + "step": 466690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011853694194374527, + "loss": 0.0103, + "step": 466700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011853305372737381, + "loss": 0.0097, + "step": 466710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011852916551100234, + "loss": 0.0096, + "step": 466720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011852527729463088, + "loss": 0.012, + "step": 466730 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011852138907825941, + "loss": 0.0095, + "step": 466740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011851750086188795, + "loss": 0.0122, + "step": 466750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011851361264551648, + "loss": 0.0144, + "step": 466760 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011850972442914502, + "loss": 0.0134, + "step": 466770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011850583621277355, + "loss": 0.0142, + "step": 466780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011850194799640209, + "loss": 0.0088, + "step": 466790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011849805978003062, + "loss": 0.0185, + "step": 466800 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011849417156365917, + "loss": 0.0098, + "step": 466810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011849028334728769, + "loss": 0.0109, + "step": 466820 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011848639513091624, + "loss": 0.0103, + "step": 466830 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011848250691454477, + "loss": 0.0091, + "step": 466840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011847861869817331, + "loss": 0.0113, + "step": 466850 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011847473048180184, + "loss": 0.0094, + "step": 466860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011847084226543038, + "loss": 0.01, + "step": 466870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011846695404905891, + "loss": 0.0112, + "step": 466880 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011846306583268745, + "loss": 0.0103, + "step": 466890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011845917761631598, + "loss": 0.0135, + "step": 466900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011845528939994452, + "loss": 0.0086, + "step": 466910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011845140118357305, + "loss": 0.0077, + "step": 466920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011844751296720159, + "loss": 0.012, + "step": 466930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011844362475083012, + "loss": 0.0095, + "step": 466940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011843973653445865, + "loss": 0.0102, + "step": 466950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011843584831808719, + "loss": 0.0123, + "step": 466960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011843196010171572, + "loss": 0.0098, + "step": 466970 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011842807188534426, + "loss": 0.0085, + "step": 466980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011842418366897279, + "loss": 0.011, + "step": 466990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011842029545260134, + "loss": 0.0113, + "step": 467000 + }, + { + "epoch": 1.21, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.006742514204233885, + "eval_runtime": 107.864, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, + "step": 467000 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011841640723622987, + "loss": 0.0108, + "step": 467010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011841251901985841, + "loss": 0.0096, + "step": 467020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011840863080348694, + "loss": 0.009, + "step": 467030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011840474258711548, + "loss": 0.0076, + "step": 467040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011840085437074401, + "loss": 0.0111, + "step": 467050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011839696615437255, + "loss": 0.0119, + "step": 467060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011839307793800108, + "loss": 0.0098, + "step": 467070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011838918972162962, + "loss": 0.0166, + "step": 467080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011838530150525815, + "loss": 0.0122, + "step": 467090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011838141328888669, + "loss": 0.0095, + "step": 467100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011837752507251522, + "loss": 0.0101, + "step": 467110 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011837363685614376, + "loss": 0.009, + "step": 467120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011836974863977229, + "loss": 0.0103, + "step": 467130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011836586042340083, + "loss": 0.0115, + "step": 467140 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011836197220702936, + "loss": 0.0098, + "step": 467150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011835808399065791, + "loss": 0.0094, + "step": 467160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011835419577428644, + "loss": 0.0095, + "step": 467170 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011835030755791498, + "loss": 0.0091, + "step": 467180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011834641934154351, + "loss": 0.0109, + "step": 467190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011834253112517204, + "loss": 0.0123, + "step": 467200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011833864290880058, + "loss": 0.01, + "step": 467210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011833475469242911, + "loss": 0.013, + "step": 467220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011833086647605765, + "loss": 0.0127, + "step": 467230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011832697825968618, + "loss": 0.0085, + "step": 467240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011832309004331472, + "loss": 0.0114, + "step": 467250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011831920182694325, + "loss": 0.0112, + "step": 467260 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011831531361057179, + "loss": 0.0098, + "step": 467270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011831142539420032, + "loss": 0.0095, + "step": 467280 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011830753717782886, + "loss": 0.0112, + "step": 467290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011830364896145739, + "loss": 0.0081, + "step": 467300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829976074508593, + "loss": 0.0088, + "step": 467310 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829587252871446, + "loss": 0.0092, + "step": 467320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011829198431234301, + "loss": 0.007, + "step": 467330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011828809609597153, + "loss": 0.0106, + "step": 467340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011828420787960008, + "loss": 0.0099, + "step": 467350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011828031966322861, + "loss": 0.0085, + "step": 467360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011827643144685715, + "loss": 0.0124, + "step": 467370 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011827254323048568, + "loss": 0.0089, + "step": 467380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011826865501411422, + "loss": 0.0112, + "step": 467390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011826476679774275, + "loss": 0.0086, + "step": 467400 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001182608785813713, + "loss": 0.0113, + "step": 467410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011825699036499982, + "loss": 0.0112, + "step": 467420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011825310214862836, + "loss": 0.011, + "step": 467430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011824921393225689, + "loss": 0.01, + "step": 467440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011824532571588542, + "loss": 0.0102, + "step": 467450 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011824143749951396, + "loss": 0.0083, + "step": 467460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011823754928314249, + "loss": 0.0122, + "step": 467470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011823366106677103, + "loss": 0.0091, + "step": 467480 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011822977285039956, + "loss": 0.0101, + "step": 467490 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001182258846340281, + "loss": 0.0106, + "step": 467500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011822199641765663, + "loss": 0.0119, + "step": 467510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011821810820128518, + "loss": 0.0098, + "step": 467520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011821421998491371, + "loss": 0.0147, + "step": 467530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011821033176854225, + "loss": 0.011, + "step": 467540 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011820644355217078, + "loss": 0.0086, + "step": 467550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011820255533579932, + "loss": 0.01, + "step": 467560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011819866711942785, + "loss": 0.0103, + "step": 467570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011819477890305639, + "loss": 0.0098, + "step": 467580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011819089068668492, + "loss": 0.01, + "step": 467590 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011818700247031346, + "loss": 0.0134, + "step": 467600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011818311425394199, + "loss": 0.0083, + "step": 467610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011817922603757053, + "loss": 0.0126, + "step": 467620 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011817533782119906, + "loss": 0.0104, + "step": 467630 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181714496048276, + "loss": 0.0106, + "step": 467640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011816756138845613, + "loss": 0.0105, + "step": 467650 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011816367317208467, + "loss": 0.0113, + "step": 467660 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181597849557132, + "loss": 0.0092, + "step": 467670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011815589673934175, + "loss": 0.0105, + "step": 467680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011815200852297028, + "loss": 0.0122, + "step": 467690 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181481203065988, + "loss": 0.0103, + "step": 467700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011814423209022735, + "loss": 0.0128, + "step": 467710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011814034387385588, + "loss": 0.0102, + "step": 467720 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011813645565748442, + "loss": 0.0083, + "step": 467730 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011813256744111295, + "loss": 0.0139, + "step": 467740 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011812867922474149, + "loss": 0.0095, + "step": 467750 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011812479100837002, + "loss": 0.0133, + "step": 467760 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011812090279199856, + "loss": 0.0087, + "step": 467770 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011811701457562709, + "loss": 0.0127, + "step": 467780 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011811312635925563, + "loss": 0.0083, + "step": 467790 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011810923814288416, + "loss": 0.0092, + "step": 467800 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001181053499265127, + "loss": 0.0119, + "step": 467810 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011810146171014123, + "loss": 0.0123, + "step": 467820 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011809757349376977, + "loss": 0.0113, + "step": 467830 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180936852773983, + "loss": 0.0091, + "step": 467840 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808979706102684, + "loss": 0.0102, + "step": 467850 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808590884465537, + "loss": 0.0118, + "step": 467860 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011808202062828392, + "loss": 0.0129, + "step": 467870 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011807813241191245, + "loss": 0.0098, + "step": 467880 + }, + { + "epoch": 1.21, + "learning_rate": 0.000118074244195541, + "loss": 0.0142, + "step": 467890 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011807035597916952, + "loss": 0.0114, + "step": 467900 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011806646776279806, + "loss": 0.0111, + "step": 467910 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011806257954642659, + "loss": 0.0123, + "step": 467920 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011805869133005512, + "loss": 0.0092, + "step": 467930 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011805480311368366, + "loss": 0.0102, + "step": 467940 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011805091489731219, + "loss": 0.0092, + "step": 467950 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011804702668094073, + "loss": 0.0113, + "step": 467960 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011804313846456926, + "loss": 0.0096, + "step": 467970 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180392502481978, + "loss": 0.0105, + "step": 467980 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011803536203182633, + "loss": 0.0112, + "step": 467990 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011803147381545487, + "loss": 0.011, + "step": 468000 + }, + { + "epoch": 1.21, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.007058866787701845, + "eval_runtime": 107.9524, + "eval_samples_per_second": 18.527, + "eval_steps_per_second": 4.632, + "step": 468000 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001180275855990834, + "loss": 0.0111, + "step": 468010 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011802369738271194, + "loss": 0.0116, + "step": 468020 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801980916634047, + "loss": 0.0092, + "step": 468030 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801592094996902, + "loss": 0.011, + "step": 468040 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011801203273359754, + "loss": 0.0099, + "step": 468050 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800814451722609, + "loss": 0.0128, + "step": 468060 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800425630085462, + "loss": 0.0122, + "step": 468070 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011800036808448316, + "loss": 0.0081, + "step": 468080 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011799647986811169, + "loss": 0.0117, + "step": 468090 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011799259165174023, + "loss": 0.0127, + "step": 468100 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011798870343536876, + "loss": 0.0081, + "step": 468110 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001179848152189973, + "loss": 0.0106, + "step": 468120 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011798092700262583, + "loss": 0.0107, + "step": 468130 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011797703878625437, + "loss": 0.0095, + "step": 468140 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001179731505698829, + "loss": 0.0124, + "step": 468150 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011796926235351144, + "loss": 0.0134, + "step": 468160 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011796537413713997, + "loss": 0.0105, + "step": 468170 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001179614859207685, + "loss": 0.0083, + "step": 468180 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011795759770439704, + "loss": 0.0121, + "step": 468190 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011795370948802557, + "loss": 0.0091, + "step": 468200 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011794982127165411, + "loss": 0.0116, + "step": 468210 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011794593305528264, + "loss": 0.0126, + "step": 468220 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011794204483891119, + "loss": 0.0128, + "step": 468230 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011793815662253972, + "loss": 0.0098, + "step": 468240 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011793426840616826, + "loss": 0.0112, + "step": 468250 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011793038018979679, + "loss": 0.0128, + "step": 468260 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011792649197342533, + "loss": 0.0133, + "step": 468270 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011792260375705386, + "loss": 0.0095, + "step": 468280 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001179187155406824, + "loss": 0.0112, + "step": 468290 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011791482732431093, + "loss": 0.0115, + "step": 468300 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011791093910793947, + "loss": 0.0093, + "step": 468310 + }, + { + "epoch": 1.21, + "learning_rate": 0.000117907050891568, + "loss": 0.0124, + "step": 468320 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011790316267519654, + "loss": 0.0091, + "step": 468330 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011789927445882507, + "loss": 0.0105, + "step": 468340 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011789538624245361, + "loss": 0.0104, + "step": 468350 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011789149802608214, + "loss": 0.0127, + "step": 468360 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011788760980971068, + "loss": 0.0088, + "step": 468370 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011788372159333921, + "loss": 0.0114, + "step": 468380 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011787983337696776, + "loss": 0.0174, + "step": 468390 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011787594516059629, + "loss": 0.0123, + "step": 468400 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011787205694422483, + "loss": 0.0094, + "step": 468410 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786816872785336, + "loss": 0.0093, + "step": 468420 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786428051148189, + "loss": 0.0119, + "step": 468430 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011786039229511043, + "loss": 0.0082, + "step": 468440 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011785650407873896, + "loss": 0.0131, + "step": 468450 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178526158623675, + "loss": 0.0099, + "step": 468460 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011784872764599603, + "loss": 0.0106, + "step": 468470 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011784483942962457, + "loss": 0.0111, + "step": 468480 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001178409512132531, + "loss": 0.0107, + "step": 468490 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011783706299688164, + "loss": 0.0108, + "step": 468500 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011783317478051017, + "loss": 0.0111, + "step": 468510 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011782928656413871, + "loss": 0.0098, + "step": 468520 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011782539834776724, + "loss": 0.0134, + "step": 468530 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011782151013139578, + "loss": 0.0103, + "step": 468540 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011781762191502431, + "loss": 0.011, + "step": 468550 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011781373369865286, + "loss": 0.0095, + "step": 468560 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780984548228138, + "loss": 0.0121, + "step": 468570 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780595726590993, + "loss": 0.0094, + "step": 468580 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011780206904953846, + "loss": 0.0075, + "step": 468590 + }, + { + "epoch": 1.21, + "learning_rate": 0.000117798180833167, + "loss": 0.0122, + "step": 468600 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011779429261679553, + "loss": 0.0105, + "step": 468610 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011779040440042407, + "loss": 0.0093, + "step": 468620 + }, + { + "epoch": 1.21, + "learning_rate": 0.0001177865161840526, + "loss": 0.0087, + "step": 468630 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011778262796768114, + "loss": 0.0103, + "step": 468640 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011777873975130967, + "loss": 0.0114, + "step": 468650 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011777485153493821, + "loss": 0.0087, + "step": 468660 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011777096331856674, + "loss": 0.0138, + "step": 468670 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011776707510219527, + "loss": 0.0103, + "step": 468680 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011776318688582381, + "loss": 0.0105, + "step": 468690 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011775929866945234, + "loss": 0.0111, + "step": 468700 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011775541045308088, + "loss": 0.0131, + "step": 468710 + }, + { + "epoch": 1.21, + "learning_rate": 0.00011775152223670941, + "loss": 0.0108, + "step": 468720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011774763402033795, + "loss": 0.0122, + "step": 468730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011774374580396648, + "loss": 0.0097, + "step": 468740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011773985758759503, + "loss": 0.01, + "step": 468750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011773596937122356, + "loss": 0.0103, + "step": 468760 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001177320811548521, + "loss": 0.009, + "step": 468770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011772819293848063, + "loss": 0.0123, + "step": 468780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011772430472210917, + "loss": 0.0088, + "step": 468790 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001177204165057377, + "loss": 0.0095, + "step": 468800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011771652828936624, + "loss": 0.0114, + "step": 468810 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011771264007299477, + "loss": 0.0116, + "step": 468820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770875185662331, + "loss": 0.0129, + "step": 468830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770486364025184, + "loss": 0.0094, + "step": 468840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011770097542388038, + "loss": 0.0126, + "step": 468850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011769708720750891, + "loss": 0.0117, + "step": 468860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011769319899113745, + "loss": 0.01, + "step": 468870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011768931077476598, + "loss": 0.0105, + "step": 468880 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011768542255839452, + "loss": 0.0122, + "step": 468890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011768153434202305, + "loss": 0.0093, + "step": 468900 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176776461256516, + "loss": 0.0092, + "step": 468910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011767375790928013, + "loss": 0.0167, + "step": 468920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011766986969290865, + "loss": 0.0117, + "step": 468930 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176659814765372, + "loss": 0.0121, + "step": 468940 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011766209326016573, + "loss": 0.0102, + "step": 468950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011765820504379427, + "loss": 0.0098, + "step": 468960 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001176543168274228, + "loss": 0.011, + "step": 468970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011765042861105134, + "loss": 0.0135, + "step": 468980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011764654039467987, + "loss": 0.0092, + "step": 468990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011764265217830841, + "loss": 0.01, + "step": 469000 + }, + { + "epoch": 1.22, + "eval_cer": 0.881719481966378, + "eval_loss": 0.007160056848078966, + "eval_runtime": 107.8978, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, + "step": 469000 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011763876396193694, + "loss": 0.0109, + "step": 469010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011763487574556548, + "loss": 0.0092, + "step": 469020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011763098752919401, + "loss": 0.0111, + "step": 469030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011762709931282255, + "loss": 0.0135, + "step": 469040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011762321109645108, + "loss": 0.0127, + "step": 469050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011761932288007962, + "loss": 0.0091, + "step": 469060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011761543466370815, + "loss": 0.0118, + "step": 469070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011761154644733669, + "loss": 0.0077, + "step": 469080 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011760765823096522, + "loss": 0.0095, + "step": 469090 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011760377001459377, + "loss": 0.0092, + "step": 469100 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001175998817982223, + "loss": 0.0108, + "step": 469110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011759599358185084, + "loss": 0.0091, + "step": 469120 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011759210536547937, + "loss": 0.008, + "step": 469130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011758821714910791, + "loss": 0.008, + "step": 469140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011758432893273644, + "loss": 0.0104, + "step": 469150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011758044071636498, + "loss": 0.0117, + "step": 469160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011757655249999351, + "loss": 0.0145, + "step": 469170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011757266428362204, + "loss": 0.0105, + "step": 469180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011756877606725058, + "loss": 0.0095, + "step": 469190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011756488785087911, + "loss": 0.0117, + "step": 469200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011756099963450765, + "loss": 0.0122, + "step": 469210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011755711141813618, + "loss": 0.0143, + "step": 469220 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011755322320176472, + "loss": 0.013, + "step": 469230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011754933498539325, + "loss": 0.0131, + "step": 469240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011754544676902179, + "loss": 0.0086, + "step": 469250 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011754155855265032, + "loss": 0.0117, + "step": 469260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011753767033627887, + "loss": 0.0138, + "step": 469270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011753378211990739, + "loss": 0.0101, + "step": 469280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011752989390353594, + "loss": 0.0096, + "step": 469290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011752600568716447, + "loss": 0.0099, + "step": 469300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011752211747079301, + "loss": 0.0137, + "step": 469310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011751822925442154, + "loss": 0.0106, + "step": 469320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011751434103805008, + "loss": 0.0116, + "step": 469330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011751045282167861, + "loss": 0.0154, + "step": 469340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011750656460530715, + "loss": 0.0102, + "step": 469350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011750267638893568, + "loss": 0.0097, + "step": 469360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011749878817256422, + "loss": 0.0119, + "step": 469370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011749489995619275, + "loss": 0.0109, + "step": 469380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011749101173982129, + "loss": 0.0121, + "step": 469390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011748712352344982, + "loss": 0.0084, + "step": 469400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011748323530707836, + "loss": 0.0068, + "step": 469410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011747934709070689, + "loss": 0.0131, + "step": 469420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011747545887433542, + "loss": 0.0152, + "step": 469430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011747157065796396, + "loss": 0.0099, + "step": 469440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011746768244159249, + "loss": 0.0086, + "step": 469450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011746379422522104, + "loss": 0.0091, + "step": 469460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011745990600884957, + "loss": 0.0118, + "step": 469470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011745601779247811, + "loss": 0.0092, + "step": 469480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011745212957610664, + "loss": 0.0082, + "step": 469490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011744824135973518, + "loss": 0.013, + "step": 469500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011744435314336371, + "loss": 0.0094, + "step": 469510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011744046492699225, + "loss": 0.0088, + "step": 469520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011743657671062078, + "loss": 0.0125, + "step": 469530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011743268849424932, + "loss": 0.0123, + "step": 469540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742880027787785, + "loss": 0.0109, + "step": 469550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742491206150639, + "loss": 0.008, + "step": 469560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011742102384513492, + "loss": 0.0116, + "step": 469570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011741713562876346, + "loss": 0.0093, + "step": 469580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011741324741239199, + "loss": 0.0147, + "step": 469590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011740935919602053, + "loss": 0.011, + "step": 469600 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011740547097964906, + "loss": 0.0138, + "step": 469610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011740158276327761, + "loss": 0.0101, + "step": 469620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739769454690614, + "loss": 0.0145, + "step": 469630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011739380633053468, + "loss": 0.0096, + "step": 469640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011738991811416321, + "loss": 0.0081, + "step": 469650 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011738602989779175, + "loss": 0.0139, + "step": 469660 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011738214168142028, + "loss": 0.0104, + "step": 469670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011737825346504881, + "loss": 0.0123, + "step": 469680 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011737436524867735, + "loss": 0.0115, + "step": 469690 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011737047703230588, + "loss": 0.0094, + "step": 469700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011736658881593442, + "loss": 0.0143, + "step": 469710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011736270059956295, + "loss": 0.0086, + "step": 469720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011735881238319149, + "loss": 0.0102, + "step": 469730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011735492416682002, + "loss": 0.0082, + "step": 469740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011735103595044856, + "loss": 0.0103, + "step": 469750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011734714773407709, + "loss": 0.0125, + "step": 469760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011734325951770563, + "loss": 0.0143, + "step": 469770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733937130133416, + "loss": 0.01, + "step": 469780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733548308496271, + "loss": 0.0128, + "step": 469790 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011733159486859123, + "loss": 0.0118, + "step": 469800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011732770665221978, + "loss": 0.0115, + "step": 469810 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011732381843584831, + "loss": 0.0114, + "step": 469820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011731993021947685, + "loss": 0.0102, + "step": 469830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011731604200310538, + "loss": 0.0122, + "step": 469840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011731215378673392, + "loss": 0.0135, + "step": 469850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011730826557036245, + "loss": 0.0102, + "step": 469860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011730437735399099, + "loss": 0.0118, + "step": 469870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011730048913761952, + "loss": 0.0117, + "step": 469880 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011729660092124806, + "loss": 0.0098, + "step": 469890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011729271270487659, + "loss": 0.0102, + "step": 469900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011728882448850513, + "loss": 0.0114, + "step": 469910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011728493627213366, + "loss": 0.0088, + "step": 469920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011728104805576219, + "loss": 0.0114, + "step": 469930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011727715983939073, + "loss": 0.0157, + "step": 469940 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011727327162301926, + "loss": 0.0126, + "step": 469950 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001172693834066478, + "loss": 0.0141, + "step": 469960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011726549519027633, + "loss": 0.0138, + "step": 469970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011726160697390488, + "loss": 0.011, + "step": 469980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011725771875753341, + "loss": 0.0093, + "step": 469990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011725383054116195, + "loss": 0.0104, + "step": 470000 + }, + { + "epoch": 1.22, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.007257182616740465, + "eval_runtime": 107.971, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, + "step": 470000 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724994232479048, + "loss": 0.0113, + "step": 470010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724605410841902, + "loss": 0.0108, + "step": 470020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011724216589204755, + "loss": 0.0117, + "step": 470030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011723827767567609, + "loss": 0.0102, + "step": 470040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011723438945930462, + "loss": 0.0101, + "step": 470050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011723050124293316, + "loss": 0.0085, + "step": 470060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011722661302656169, + "loss": 0.0097, + "step": 470070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011722272481019023, + "loss": 0.0091, + "step": 470080 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011721883659381876, + "loss": 0.0101, + "step": 470090 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001172149483774473, + "loss": 0.01, + "step": 470100 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011721106016107583, + "loss": 0.0114, + "step": 470110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011720717194470437, + "loss": 0.0123, + "step": 470120 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001172032837283329, + "loss": 0.0109, + "step": 470130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011719939551196145, + "loss": 0.0113, + "step": 470140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011719550729558998, + "loss": 0.0117, + "step": 470150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011719161907921852, + "loss": 0.0087, + "step": 470160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011718773086284705, + "loss": 0.0133, + "step": 470170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011718384264647558, + "loss": 0.0117, + "step": 470180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717995443010412, + "loss": 0.0124, + "step": 470190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717606621373265, + "loss": 0.014, + "step": 470200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011717217799736119, + "loss": 0.0111, + "step": 470210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011716828978098972, + "loss": 0.0115, + "step": 470220 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011716440156461826, + "loss": 0.0103, + "step": 470230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011716051334824679, + "loss": 0.0118, + "step": 470240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011715662513187533, + "loss": 0.0134, + "step": 470250 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011715273691550386, + "loss": 0.008, + "step": 470260 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001171488486991324, + "loss": 0.0116, + "step": 470270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011714496048276093, + "loss": 0.0129, + "step": 470280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011714107226638947, + "loss": 0.0128, + "step": 470290 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117137184050018, + "loss": 0.0095, + "step": 470300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011713329583364655, + "loss": 0.0102, + "step": 470310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011712940761727507, + "loss": 0.0107, + "step": 470320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011712551940090362, + "loss": 0.0098, + "step": 470330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011712163118453215, + "loss": 0.0075, + "step": 470340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011711774296816069, + "loss": 0.0107, + "step": 470350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011711385475178922, + "loss": 0.0111, + "step": 470360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011710996653541776, + "loss": 0.0105, + "step": 470370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011710607831904629, + "loss": 0.0099, + "step": 470380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011710219010267483, + "loss": 0.0095, + "step": 470390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011709830188630336, + "loss": 0.0102, + "step": 470400 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170944136699319, + "loss": 0.0093, + "step": 470410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011709052545356043, + "loss": 0.0088, + "step": 470420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011708663723718896, + "loss": 0.0155, + "step": 470430 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170827490208175, + "loss": 0.0159, + "step": 470440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011707886080444603, + "loss": 0.0127, + "step": 470450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011707497258807457, + "loss": 0.0105, + "step": 470460 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170710843717031, + "loss": 0.0112, + "step": 470470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011706719615533164, + "loss": 0.0121, + "step": 470480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011706330793896017, + "loss": 0.0153, + "step": 470490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705941972258872, + "loss": 0.0085, + "step": 470500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705553150621725, + "loss": 0.0112, + "step": 470510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011705164328984579, + "loss": 0.0106, + "step": 470520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011704775507347432, + "loss": 0.009, + "step": 470530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011704386685710286, + "loss": 0.016, + "step": 470540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011703997864073139, + "loss": 0.0089, + "step": 470550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011703609042435993, + "loss": 0.0131, + "step": 470560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011703220220798846, + "loss": 0.0095, + "step": 470570 + }, + { + "epoch": 1.22, + "learning_rate": 0.000117028313991617, + "loss": 0.0096, + "step": 470580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011702442577524553, + "loss": 0.0103, + "step": 470590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011702053755887407, + "loss": 0.0138, + "step": 470600 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001170166493425026, + "loss": 0.0098, + "step": 470610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011701276112613114, + "loss": 0.0094, + "step": 470620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011700887290975967, + "loss": 0.0092, + "step": 470630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011700498469338821, + "loss": 0.0097, + "step": 470640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011700109647701674, + "loss": 0.0122, + "step": 470650 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011699720826064527, + "loss": 0.01, + "step": 470660 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011699332004427381, + "loss": 0.0102, + "step": 470670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011698943182790234, + "loss": 0.0121, + "step": 470680 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011698554361153089, + "loss": 0.0107, + "step": 470690 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011698165539515942, + "loss": 0.0117, + "step": 470700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011697776717878796, + "loss": 0.0084, + "step": 470710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011697387896241649, + "loss": 0.0145, + "step": 470720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011696999074604503, + "loss": 0.012, + "step": 470730 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011696610252967356, + "loss": 0.0094, + "step": 470740 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169622143133021, + "loss": 0.0116, + "step": 470750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011695832609693063, + "loss": 0.0093, + "step": 470760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011695443788055917, + "loss": 0.0104, + "step": 470770 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169505496641877, + "loss": 0.0139, + "step": 470780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011694666144781624, + "loss": 0.0139, + "step": 470790 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011694277323144477, + "loss": 0.0106, + "step": 470800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011693888501507331, + "loss": 0.0099, + "step": 470810 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011693499679870184, + "loss": 0.0102, + "step": 470820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011693110858233038, + "loss": 0.0093, + "step": 470830 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169272203659589, + "loss": 0.0102, + "step": 470840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011692333214958746, + "loss": 0.01, + "step": 470850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011691944393321599, + "loss": 0.0122, + "step": 470860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011691555571684453, + "loss": 0.0106, + "step": 470870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011691166750047306, + "loss": 0.0096, + "step": 470880 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001169077792841016, + "loss": 0.0113, + "step": 470890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011690389106773013, + "loss": 0.0125, + "step": 470900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011690000285135866, + "loss": 0.011, + "step": 470910 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168961146349872, + "loss": 0.0096, + "step": 470920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011689222641861573, + "loss": 0.0113, + "step": 470930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011688833820224427, + "loss": 0.0124, + "step": 470940 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168844499858728, + "loss": 0.0082, + "step": 470950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011688056176950134, + "loss": 0.0073, + "step": 470960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011687667355312987, + "loss": 0.0117, + "step": 470970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011687278533675841, + "loss": 0.0121, + "step": 470980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011686889712038694, + "loss": 0.0088, + "step": 470990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011686500890401548, + "loss": 0.0131, + "step": 471000 + }, + { + "epoch": 1.22, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.007188483607023954, + "eval_runtime": 107.8616, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.636, + "step": 471000 + }, + { + "epoch": 1.22, + "learning_rate": 0.000116861120687644, + "loss": 0.0163, + "step": 471010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011685723247127256, + "loss": 0.0105, + "step": 471020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011685334425490108, + "loss": 0.0102, + "step": 471030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011684945603852963, + "loss": 0.008, + "step": 471040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011684556782215816, + "loss": 0.0135, + "step": 471050 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168416796057867, + "loss": 0.0144, + "step": 471060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011683779138941523, + "loss": 0.0104, + "step": 471070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011683390317304377, + "loss": 0.0133, + "step": 471080 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001168300149566723, + "loss": 0.0118, + "step": 471090 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011682612674030084, + "loss": 0.009, + "step": 471100 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011682223852392937, + "loss": 0.0094, + "step": 471110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011681835030755791, + "loss": 0.0104, + "step": 471120 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011681446209118644, + "loss": 0.0109, + "step": 471130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011681057387481498, + "loss": 0.0118, + "step": 471140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011680668565844351, + "loss": 0.0102, + "step": 471150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011680279744207204, + "loss": 0.0119, + "step": 471160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011679890922570058, + "loss": 0.0116, + "step": 471170 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167950210093291, + "loss": 0.0065, + "step": 471180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011679113279295765, + "loss": 0.0106, + "step": 471190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011678724457658618, + "loss": 0.0131, + "step": 471200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011678335636021473, + "loss": 0.0098, + "step": 471210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011677946814384326, + "loss": 0.0146, + "step": 471220 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167755799274718, + "loss": 0.0099, + "step": 471230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011677169171110033, + "loss": 0.0098, + "step": 471240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011676780349472887, + "loss": 0.011, + "step": 471250 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167639152783574, + "loss": 0.0087, + "step": 471260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011676002706198594, + "loss": 0.0115, + "step": 471270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011675613884561447, + "loss": 0.008, + "step": 471280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011675225062924301, + "loss": 0.0109, + "step": 471290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011674836241287154, + "loss": 0.007, + "step": 471300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011674447419650008, + "loss": 0.0102, + "step": 471310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011674058598012861, + "loss": 0.0103, + "step": 471320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011673669776375715, + "loss": 0.0093, + "step": 471330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011673280954738568, + "loss": 0.0138, + "step": 471340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011672892133101422, + "loss": 0.0085, + "step": 471350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011672503311464275, + "loss": 0.0087, + "step": 471360 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167211448982713, + "loss": 0.0082, + "step": 471370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011671725668189983, + "loss": 0.0121, + "step": 471380 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011671336846552837, + "loss": 0.0089, + "step": 471390 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001167094802491569, + "loss": 0.011, + "step": 471400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011670559203278543, + "loss": 0.0112, + "step": 471410 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011670170381641397, + "loss": 0.0121, + "step": 471420 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166978156000425, + "loss": 0.0129, + "step": 471430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011669392738367104, + "loss": 0.0092, + "step": 471440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011669003916729957, + "loss": 0.0152, + "step": 471450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011668615095092811, + "loss": 0.0086, + "step": 471460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011668226273455664, + "loss": 0.011, + "step": 471470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011667837451818518, + "loss": 0.014, + "step": 471480 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166744863018137, + "loss": 0.0086, + "step": 471490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011667059808544225, + "loss": 0.0098, + "step": 471500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011666670986907078, + "loss": 0.0107, + "step": 471510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011666282165269932, + "loss": 0.0123, + "step": 471520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011665893343632785, + "loss": 0.0103, + "step": 471530 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166550452199564, + "loss": 0.01, + "step": 471540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011665115700358492, + "loss": 0.0106, + "step": 471550 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011664726878721347, + "loss": 0.0091, + "step": 471560 + }, + { + "epoch": 1.22, + "learning_rate": 0.000116643380570842, + "loss": 0.013, + "step": 471570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011663949235447054, + "loss": 0.015, + "step": 471580 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011663560413809907, + "loss": 0.0076, + "step": 471590 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011663171592172761, + "loss": 0.0092, + "step": 471600 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011662782770535614, + "loss": 0.0129, + "step": 471610 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011662393948898468, + "loss": 0.0096, + "step": 471620 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011662005127261321, + "loss": 0.0089, + "step": 471630 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011661616305624175, + "loss": 0.009, + "step": 471640 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011661227483987028, + "loss": 0.0104, + "step": 471650 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001166083866234988, + "loss": 0.0093, + "step": 471660 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011660449840712735, + "loss": 0.0079, + "step": 471670 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011660061019075588, + "loss": 0.0132, + "step": 471680 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011659672197438442, + "loss": 0.014, + "step": 471690 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011659283375801295, + "loss": 0.0104, + "step": 471700 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011658894554164149, + "loss": 0.0107, + "step": 471710 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011658505732527002, + "loss": 0.0097, + "step": 471720 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011658116910889857, + "loss": 0.0096, + "step": 471730 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001165772808925271, + "loss": 0.0134, + "step": 471740 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011657339267615564, + "loss": 0.0121, + "step": 471750 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011656950445978417, + "loss": 0.0101, + "step": 471760 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011656561624341271, + "loss": 0.0105, + "step": 471770 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011656172802704124, + "loss": 0.0124, + "step": 471780 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655783981066978, + "loss": 0.0125, + "step": 471790 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655395159429831, + "loss": 0.0082, + "step": 471800 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011655006337792685, + "loss": 0.0115, + "step": 471810 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011654617516155538, + "loss": 0.0134, + "step": 471820 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011654228694518392, + "loss": 0.0094, + "step": 471830 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011653839872881245, + "loss": 0.009, + "step": 471840 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011653451051244099, + "loss": 0.0125, + "step": 471850 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011653062229606952, + "loss": 0.0095, + "step": 471860 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011652673407969806, + "loss": 0.0119, + "step": 471870 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011652284586332659, + "loss": 0.0106, + "step": 471880 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011651895764695514, + "loss": 0.01, + "step": 471890 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011651506943058367, + "loss": 0.0109, + "step": 471900 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011651118121421218, + "loss": 0.0118, + "step": 471910 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011650729299784074, + "loss": 0.007, + "step": 471920 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011650340478146927, + "loss": 0.0105, + "step": 471930 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011649951656509781, + "loss": 0.0083, + "step": 471940 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011649562834872634, + "loss": 0.0106, + "step": 471950 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011649174013235488, + "loss": 0.011, + "step": 471960 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648785191598341, + "loss": 0.0095, + "step": 471970 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648396369961195, + "loss": 0.0096, + "step": 471980 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011648007548324048, + "loss": 0.0129, + "step": 471990 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011647618726686902, + "loss": 0.0108, + "step": 472000 + }, + { + "epoch": 1.22, + "eval_cer": 0.8817012866862336, + "eval_loss": 0.007290003355592489, + "eval_runtime": 108.0416, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, + "step": 472000 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011647229905049755, + "loss": 0.0118, + "step": 472010 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646841083412609, + "loss": 0.0106, + "step": 472020 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646452261775462, + "loss": 0.0121, + "step": 472030 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011646063440138316, + "loss": 0.011, + "step": 472040 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011645674618501169, + "loss": 0.012, + "step": 472050 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011645285796864023, + "loss": 0.0146, + "step": 472060 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011644896975226876, + "loss": 0.0111, + "step": 472070 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011644508153589731, + "loss": 0.0118, + "step": 472080 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011644119331952584, + "loss": 0.0142, + "step": 472090 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011643730510315438, + "loss": 0.0111, + "step": 472100 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011643341688678291, + "loss": 0.0095, + "step": 472110 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011642952867041145, + "loss": 0.0083, + "step": 472120 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011642564045403998, + "loss": 0.0081, + "step": 472130 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011642175223766852, + "loss": 0.0076, + "step": 472140 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011641786402129705, + "loss": 0.0111, + "step": 472150 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011641397580492558, + "loss": 0.0105, + "step": 472160 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011641008758855412, + "loss": 0.0092, + "step": 472170 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011640619937218265, + "loss": 0.0163, + "step": 472180 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011640231115581119, + "loss": 0.0099, + "step": 472190 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011639842293943972, + "loss": 0.0103, + "step": 472200 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011639453472306826, + "loss": 0.0085, + "step": 472210 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011639064650669679, + "loss": 0.0092, + "step": 472220 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011638675829032533, + "loss": 0.0109, + "step": 472230 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011638287007395386, + "loss": 0.0086, + "step": 472240 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011637898185758241, + "loss": 0.0108, + "step": 472250 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011637509364121092, + "loss": 0.0104, + "step": 472260 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011637120542483948, + "loss": 0.0083, + "step": 472270 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011636731720846801, + "loss": 0.0093, + "step": 472280 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011636342899209655, + "loss": 0.0113, + "step": 472290 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011635954077572508, + "loss": 0.0061, + "step": 472300 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011635565255935362, + "loss": 0.011, + "step": 472310 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011635176434298215, + "loss": 0.0099, + "step": 472320 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011634787612661069, + "loss": 0.012, + "step": 472330 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011634398791023922, + "loss": 0.009, + "step": 472340 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011634009969386776, + "loss": 0.0075, + "step": 472350 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011633621147749629, + "loss": 0.0117, + "step": 472360 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011633232326112483, + "loss": 0.0147, + "step": 472370 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011632843504475336, + "loss": 0.0099, + "step": 472380 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163245468283819, + "loss": 0.0107, + "step": 472390 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011632065861201043, + "loss": 0.0115, + "step": 472400 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011631677039563895, + "loss": 0.0101, + "step": 472410 + }, + { + "epoch": 1.22, + "learning_rate": 0.0001163128821792675, + "loss": 0.0107, + "step": 472420 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630899396289602, + "loss": 0.0137, + "step": 472430 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630510574652458, + "loss": 0.0089, + "step": 472440 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011630121753015311, + "loss": 0.0112, + "step": 472450 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011629732931378165, + "loss": 0.0127, + "step": 472460 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011629344109741018, + "loss": 0.012, + "step": 472470 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011628955288103872, + "loss": 0.0101, + "step": 472480 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011628566466466725, + "loss": 0.0116, + "step": 472490 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011628177644829579, + "loss": 0.0102, + "step": 472500 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011627788823192432, + "loss": 0.0094, + "step": 472510 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011627400001555286, + "loss": 0.0098, + "step": 472520 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011627011179918139, + "loss": 0.0099, + "step": 472530 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011626622358280993, + "loss": 0.012, + "step": 472540 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011626233536643846, + "loss": 0.0102, + "step": 472550 + }, + { + "epoch": 1.22, + "learning_rate": 0.000116258447150067, + "loss": 0.0109, + "step": 472560 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011625455893369553, + "loss": 0.0086, + "step": 472570 + }, + { + "epoch": 1.22, + "learning_rate": 0.00011625067071732407, + "loss": 0.0086, + "step": 472580 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001162467825009526, + "loss": 0.0132, + "step": 472590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011624289428458115, + "loss": 0.0092, + "step": 472600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011623900606820968, + "loss": 0.0114, + "step": 472610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011623511785183822, + "loss": 0.0078, + "step": 472620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011623122963546675, + "loss": 0.0095, + "step": 472630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011622734141909529, + "loss": 0.01, + "step": 472640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011622345320272382, + "loss": 0.0094, + "step": 472650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621956498635235, + "loss": 0.0118, + "step": 472660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621567676998089, + "loss": 0.009, + "step": 472670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011621178855360942, + "loss": 0.009, + "step": 472680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011620790033723796, + "loss": 0.0107, + "step": 472690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011620401212086649, + "loss": 0.0089, + "step": 472700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011620012390449503, + "loss": 0.0097, + "step": 472710 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011619623568812356, + "loss": 0.0091, + "step": 472720 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161923474717521, + "loss": 0.0121, + "step": 472730 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618845925538063, + "loss": 0.0141, + "step": 472740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011618457103900917, + "loss": 0.0146, + "step": 472750 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161806828226377, + "loss": 0.0104, + "step": 472760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011617679460626625, + "loss": 0.0102, + "step": 472770 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011617290638989476, + "loss": 0.0114, + "step": 472780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011616901817352332, + "loss": 0.0102, + "step": 472790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011616512995715185, + "loss": 0.0081, + "step": 472800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011616124174078039, + "loss": 0.0094, + "step": 472810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011615735352440892, + "loss": 0.0127, + "step": 472820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011615346530803746, + "loss": 0.0087, + "step": 472830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011614957709166599, + "loss": 0.0083, + "step": 472840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011614568887529453, + "loss": 0.0114, + "step": 472850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011614180065892306, + "loss": 0.0104, + "step": 472860 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161379124425516, + "loss": 0.0096, + "step": 472870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011613402422618013, + "loss": 0.0097, + "step": 472880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011613013600980867, + "loss": 0.011, + "step": 472890 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161262477934372, + "loss": 0.01, + "step": 472900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011612235957706572, + "loss": 0.0102, + "step": 472910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011611847136069427, + "loss": 0.008, + "step": 472920 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001161145831443228, + "loss": 0.0114, + "step": 472930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011611069492795134, + "loss": 0.01, + "step": 472940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011610680671157986, + "loss": 0.0101, + "step": 472950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011610291849520842, + "loss": 0.0109, + "step": 472960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011609903027883695, + "loss": 0.0114, + "step": 472970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011609514206246549, + "loss": 0.0085, + "step": 472980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011609125384609402, + "loss": 0.0132, + "step": 472990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011608736562972256, + "loss": 0.0106, + "step": 473000 + }, + { + "epoch": 1.23, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.0070616379380226135, + "eval_runtime": 108.0667, + "eval_samples_per_second": 18.507, + "eval_steps_per_second": 4.627, + "step": 473000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011608347741335109, + "loss": 0.0117, + "step": 473010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011607958919697963, + "loss": 0.0147, + "step": 473020 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011607570098060816, + "loss": 0.0096, + "step": 473030 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001160718127642367, + "loss": 0.0139, + "step": 473040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011606792454786523, + "loss": 0.0106, + "step": 473050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011606403633149377, + "loss": 0.0097, + "step": 473060 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001160601481151223, + "loss": 0.0086, + "step": 473070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011605625989875084, + "loss": 0.0143, + "step": 473080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011605237168237937, + "loss": 0.0095, + "step": 473090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011604848346600791, + "loss": 0.0099, + "step": 473100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011604459524963644, + "loss": 0.011, + "step": 473110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011604070703326499, + "loss": 0.0092, + "step": 473120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011603681881689352, + "loss": 0.0095, + "step": 473130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011603293060052203, + "loss": 0.0106, + "step": 473140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602904238415059, + "loss": 0.01, + "step": 473150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602515416777912, + "loss": 0.0101, + "step": 473160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011602126595140766, + "loss": 0.0098, + "step": 473170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011601737773503619, + "loss": 0.0099, + "step": 473180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011601348951866473, + "loss": 0.0102, + "step": 473190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011600960130229326, + "loss": 0.0097, + "step": 473200 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001160057130859218, + "loss": 0.0098, + "step": 473210 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011600182486955033, + "loss": 0.0097, + "step": 473220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011599793665317887, + "loss": 0.0095, + "step": 473230 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159940484368074, + "loss": 0.0129, + "step": 473240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011599016022043594, + "loss": 0.0122, + "step": 473250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011598627200406447, + "loss": 0.0108, + "step": 473260 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115982383787693, + "loss": 0.0131, + "step": 473270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011597849557132153, + "loss": 0.0121, + "step": 473280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011597460735495008, + "loss": 0.011, + "step": 473290 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159707191385786, + "loss": 0.0137, + "step": 473300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011596683092220716, + "loss": 0.0117, + "step": 473310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011596294270583569, + "loss": 0.009, + "step": 473320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011595905448946423, + "loss": 0.008, + "step": 473330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011595516627309276, + "loss": 0.0303, + "step": 473340 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159512780567213, + "loss": 0.0126, + "step": 473350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011594738984034983, + "loss": 0.0102, + "step": 473360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011594350162397837, + "loss": 0.0107, + "step": 473370 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159396134076069, + "loss": 0.0081, + "step": 473380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011593572519123543, + "loss": 0.0107, + "step": 473390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011593183697486397, + "loss": 0.0087, + "step": 473400 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159279487584925, + "loss": 0.0082, + "step": 473410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011592406054212104, + "loss": 0.0106, + "step": 473420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011592017232574956, + "loss": 0.0091, + "step": 473430 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159162841093781, + "loss": 0.0083, + "step": 473440 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011591239589300663, + "loss": 0.0126, + "step": 473450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011590850767663518, + "loss": 0.0106, + "step": 473460 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001159046194602637, + "loss": 0.0069, + "step": 473470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011590073124389226, + "loss": 0.0116, + "step": 473480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011589684302752077, + "loss": 0.012, + "step": 473490 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011589295481114933, + "loss": 0.0114, + "step": 473500 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011588906659477786, + "loss": 0.0128, + "step": 473510 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158851783784064, + "loss": 0.0103, + "step": 473520 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011588129016203493, + "loss": 0.0118, + "step": 473530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011587740194566347, + "loss": 0.0109, + "step": 473540 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115873513729292, + "loss": 0.0093, + "step": 473550 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011586962551292054, + "loss": 0.0131, + "step": 473560 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011586573729654907, + "loss": 0.0129, + "step": 473570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011586184908017761, + "loss": 0.0074, + "step": 473580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011585796086380614, + "loss": 0.008, + "step": 473590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011585407264743468, + "loss": 0.0114, + "step": 473600 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158501844310632, + "loss": 0.0106, + "step": 473610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011584629621469175, + "loss": 0.0108, + "step": 473620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011584240799832028, + "loss": 0.0098, + "step": 473630 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158385197819488, + "loss": 0.0075, + "step": 473640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011583463156557735, + "loss": 0.0081, + "step": 473650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011583074334920587, + "loss": 0.0127, + "step": 473660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011582685513283443, + "loss": 0.01, + "step": 473670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011582296691646296, + "loss": 0.0093, + "step": 473680 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158190787000915, + "loss": 0.011, + "step": 473690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011581519048372003, + "loss": 0.0124, + "step": 473700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011581130226734857, + "loss": 0.0126, + "step": 473710 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001158074140509771, + "loss": 0.0095, + "step": 473720 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011580352583460564, + "loss": 0.0108, + "step": 473730 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011579963761823417, + "loss": 0.0099, + "step": 473740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011579574940186271, + "loss": 0.0108, + "step": 473750 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011579186118549124, + "loss": 0.0118, + "step": 473760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011578797296911978, + "loss": 0.0112, + "step": 473770 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157840847527483, + "loss": 0.0118, + "step": 473780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011578019653637685, + "loss": 0.0106, + "step": 473790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011577630832000537, + "loss": 0.0141, + "step": 473800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011577242010363392, + "loss": 0.0141, + "step": 473810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011576853188726244, + "loss": 0.0116, + "step": 473820 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115764643670891, + "loss": 0.0095, + "step": 473830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011576075545451953, + "loss": 0.0099, + "step": 473840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011575686723814807, + "loss": 0.0089, + "step": 473850 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157529790217766, + "loss": 0.0133, + "step": 473860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011574909080540514, + "loss": 0.0088, + "step": 473870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011574520258903367, + "loss": 0.0131, + "step": 473880 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157413143726622, + "loss": 0.0132, + "step": 473890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011573742615629074, + "loss": 0.0099, + "step": 473900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011573353793991926, + "loss": 0.0108, + "step": 473910 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157296497235478, + "loss": 0.0103, + "step": 473920 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011572576150717633, + "loss": 0.0101, + "step": 473930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011572187329080488, + "loss": 0.0101, + "step": 473940 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001157179850744334, + "loss": 0.0117, + "step": 473950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011571409685806195, + "loss": 0.0123, + "step": 473960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011571020864169047, + "loss": 0.0114, + "step": 473970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011570632042531902, + "loss": 0.0123, + "step": 473980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011570243220894754, + "loss": 0.0127, + "step": 473990 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156985439925761, + "loss": 0.0116, + "step": 474000 + }, + { + "epoch": 1.23, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.007081829011440277, + "eval_runtime": 107.9934, + "eval_samples_per_second": 18.52, + "eval_steps_per_second": 4.63, + "step": 474000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011569465577620461, + "loss": 0.0095, + "step": 474010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011569076755983317, + "loss": 0.0094, + "step": 474020 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156868793434617, + "loss": 0.0109, + "step": 474030 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011568299112709024, + "loss": 0.0108, + "step": 474040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011567910291071877, + "loss": 0.0091, + "step": 474050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011567521469434731, + "loss": 0.0075, + "step": 474060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011567132647797584, + "loss": 0.0091, + "step": 474070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011566743826160438, + "loss": 0.0106, + "step": 474080 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156635500452329, + "loss": 0.0118, + "step": 474090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011565966182886145, + "loss": 0.0143, + "step": 474100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011565577361248998, + "loss": 0.0089, + "step": 474110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011565188539611852, + "loss": 0.0117, + "step": 474120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011564799717974705, + "loss": 0.0122, + "step": 474130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011564410896337557, + "loss": 0.0117, + "step": 474140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011564022074700412, + "loss": 0.0109, + "step": 474150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011563633253063264, + "loss": 0.0132, + "step": 474160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011563244431426118, + "loss": 0.0118, + "step": 474170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011562855609788971, + "loss": 0.0095, + "step": 474180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011562466788151827, + "loss": 0.0138, + "step": 474190 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001156207796651468, + "loss": 0.0153, + "step": 474200 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011561689144877534, + "loss": 0.0141, + "step": 474210 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011561300323240387, + "loss": 0.0108, + "step": 474220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011560911501603241, + "loss": 0.0085, + "step": 474230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011560522679966094, + "loss": 0.0122, + "step": 474240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011560133858328948, + "loss": 0.0091, + "step": 474250 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115597450366918, + "loss": 0.008, + "step": 474260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011559356215054655, + "loss": 0.0108, + "step": 474270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011558967393417508, + "loss": 0.01, + "step": 474280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011558578571780362, + "loss": 0.0077, + "step": 474290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011558189750143214, + "loss": 0.0114, + "step": 474300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011557800928506069, + "loss": 0.0099, + "step": 474310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011557412106868921, + "loss": 0.0098, + "step": 474320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011557023285231776, + "loss": 0.0099, + "step": 474330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011556634463594628, + "loss": 0.0107, + "step": 474340 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011556245641957484, + "loss": 0.0116, + "step": 474350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011555856820320337, + "loss": 0.0121, + "step": 474360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011555467998683191, + "loss": 0.0104, + "step": 474370 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011555079177046044, + "loss": 0.0117, + "step": 474380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011554690355408897, + "loss": 0.0096, + "step": 474390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011554301533771751, + "loss": 0.0129, + "step": 474400 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011553912712134604, + "loss": 0.0087, + "step": 474410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011553523890497458, + "loss": 0.0083, + "step": 474420 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001155313506886031, + "loss": 0.0103, + "step": 474430 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011552746247223165, + "loss": 0.0121, + "step": 474440 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011552357425586017, + "loss": 0.0127, + "step": 474450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011551968603948872, + "loss": 0.0091, + "step": 474460 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011551579782311724, + "loss": 0.0105, + "step": 474470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011551190960674579, + "loss": 0.0104, + "step": 474480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011550802139037431, + "loss": 0.0129, + "step": 474490 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011550413317400286, + "loss": 0.0094, + "step": 474500 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011550024495763138, + "loss": 0.0093, + "step": 474510 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011549635674125994, + "loss": 0.0139, + "step": 474520 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011549246852488845, + "loss": 0.0091, + "step": 474530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011548858030851701, + "loss": 0.0145, + "step": 474540 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011548469209214554, + "loss": 0.0105, + "step": 474550 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011548080387577408, + "loss": 0.0144, + "step": 474560 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001154769156594026, + "loss": 0.0101, + "step": 474570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011547302744303115, + "loss": 0.0084, + "step": 474580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546913922665968, + "loss": 0.0113, + "step": 474590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546525101028822, + "loss": 0.0098, + "step": 474600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011546136279391675, + "loss": 0.0103, + "step": 474610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011545747457754529, + "loss": 0.0104, + "step": 474620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011545358636117382, + "loss": 0.0092, + "step": 474630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011544969814480234, + "loss": 0.0134, + "step": 474640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011544580992843089, + "loss": 0.0086, + "step": 474650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011544192171205941, + "loss": 0.0106, + "step": 474660 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543803349568796, + "loss": 0.0086, + "step": 474670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543414527931648, + "loss": 0.0087, + "step": 474680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011543025706294502, + "loss": 0.0119, + "step": 474690 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011542636884657355, + "loss": 0.0076, + "step": 474700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011542248063020211, + "loss": 0.0078, + "step": 474710 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011541859241383064, + "loss": 0.0114, + "step": 474720 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011541470419745918, + "loss": 0.0121, + "step": 474730 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001154108159810877, + "loss": 0.009, + "step": 474740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011540692776471625, + "loss": 0.0111, + "step": 474750 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011540303954834478, + "loss": 0.0133, + "step": 474760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011539915133197332, + "loss": 0.0122, + "step": 474770 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011539526311560185, + "loss": 0.0121, + "step": 474780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011539137489923039, + "loss": 0.0111, + "step": 474790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011538748668285892, + "loss": 0.0133, + "step": 474800 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011538359846648746, + "loss": 0.0128, + "step": 474810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537971025011598, + "loss": 0.0151, + "step": 474820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537582203374453, + "loss": 0.0098, + "step": 474830 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011537193381737305, + "loss": 0.0105, + "step": 474840 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153680456010016, + "loss": 0.0104, + "step": 474850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011536415738463012, + "loss": 0.0109, + "step": 474860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011536026916825868, + "loss": 0.0111, + "step": 474870 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153563809518872, + "loss": 0.0108, + "step": 474880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011535249273551572, + "loss": 0.0101, + "step": 474890 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011534860451914428, + "loss": 0.014, + "step": 474900 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153447163027728, + "loss": 0.0122, + "step": 474910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011534082808640135, + "loss": 0.0107, + "step": 474920 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011533693987002988, + "loss": 0.01, + "step": 474930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011533305165365842, + "loss": 0.0078, + "step": 474940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011532916343728694, + "loss": 0.013, + "step": 474950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011532527522091549, + "loss": 0.0104, + "step": 474960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011532138700454401, + "loss": 0.0126, + "step": 474970 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011531749878817256, + "loss": 0.0139, + "step": 474980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011531361057180108, + "loss": 0.0101, + "step": 474990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011530972235542963, + "loss": 0.0109, + "step": 475000 + }, + { + "epoch": 1.23, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.007072898093611002, + "eval_runtime": 108.0529, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 475000 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011530583413905815, + "loss": 0.014, + "step": 475010 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001153019459226867, + "loss": 0.0102, + "step": 475020 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011529805770631522, + "loss": 0.0092, + "step": 475030 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011529416948994377, + "loss": 0.0121, + "step": 475040 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001152902812735723, + "loss": 0.0123, + "step": 475050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011528639305720085, + "loss": 0.0109, + "step": 475060 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011528250484082938, + "loss": 0.0114, + "step": 475070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011527861662445792, + "loss": 0.0114, + "step": 475080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011527472840808645, + "loss": 0.0067, + "step": 475090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011527084019171499, + "loss": 0.0107, + "step": 475100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011526695197534352, + "loss": 0.0081, + "step": 475110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011526306375897206, + "loss": 0.0077, + "step": 475120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011525917554260059, + "loss": 0.0108, + "step": 475130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011525528732622911, + "loss": 0.008, + "step": 475140 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011525139910985766, + "loss": 0.0101, + "step": 475150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011524751089348618, + "loss": 0.0099, + "step": 475160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011524362267711473, + "loss": 0.0098, + "step": 475170 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011523973446074325, + "loss": 0.0111, + "step": 475180 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001152358462443718, + "loss": 0.0099, + "step": 475190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011523195802800032, + "loss": 0.0146, + "step": 475200 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011522806981162886, + "loss": 0.0124, + "step": 475210 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011522418159525739, + "loss": 0.0111, + "step": 475220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011522029337888595, + "loss": 0.0095, + "step": 475230 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011521640516251446, + "loss": 0.0122, + "step": 475240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011521251694614302, + "loss": 0.0115, + "step": 475250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011520862872977155, + "loss": 0.0129, + "step": 475260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011520474051340009, + "loss": 0.0098, + "step": 475270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011520085229702862, + "loss": 0.0118, + "step": 475280 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011519696408065716, + "loss": 0.0193, + "step": 475290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011519307586428569, + "loss": 0.0095, + "step": 475300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011518918764791423, + "loss": 0.0088, + "step": 475310 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011518529943154275, + "loss": 0.0086, + "step": 475320 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151814112151713, + "loss": 0.0096, + "step": 475330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011517752299879982, + "loss": 0.0117, + "step": 475340 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011517363478242837, + "loss": 0.0108, + "step": 475350 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151697465660569, + "loss": 0.0103, + "step": 475360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011516585834968544, + "loss": 0.009, + "step": 475370 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011516197013331396, + "loss": 0.0108, + "step": 475380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515808191694249, + "loss": 0.0092, + "step": 475390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515419370057103, + "loss": 0.01, + "step": 475400 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011515030548419956, + "loss": 0.0103, + "step": 475410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011514641726782812, + "loss": 0.0125, + "step": 475420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011514252905145665, + "loss": 0.0091, + "step": 475430 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011513864083508519, + "loss": 0.0124, + "step": 475440 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011513475261871371, + "loss": 0.0124, + "step": 475450 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011513086440234226, + "loss": 0.0133, + "step": 475460 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011512697618597078, + "loss": 0.009, + "step": 475470 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011512308796959933, + "loss": 0.0135, + "step": 475480 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011511919975322785, + "loss": 0.0112, + "step": 475490 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001151153115368564, + "loss": 0.0088, + "step": 475500 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011511142332048492, + "loss": 0.0106, + "step": 475510 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011510753510411347, + "loss": 0.0102, + "step": 475520 + }, + { + "epoch": 1.23, + "learning_rate": 0.000115103646887742, + "loss": 0.0089, + "step": 475530 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011509975867137054, + "loss": 0.0106, + "step": 475540 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011509587045499906, + "loss": 0.0087, + "step": 475550 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150919822386276, + "loss": 0.0109, + "step": 475560 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011508809402225613, + "loss": 0.0122, + "step": 475570 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011508420580588469, + "loss": 0.0129, + "step": 475580 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011508031758951322, + "loss": 0.0093, + "step": 475590 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011507642937314176, + "loss": 0.0142, + "step": 475600 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011507254115677029, + "loss": 0.0115, + "step": 475610 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506865294039883, + "loss": 0.0131, + "step": 475620 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506476472402736, + "loss": 0.0108, + "step": 475630 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011506087650765588, + "loss": 0.0095, + "step": 475640 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011505698829128443, + "loss": 0.0121, + "step": 475650 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011505310007491295, + "loss": 0.0118, + "step": 475660 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150492118585415, + "loss": 0.0087, + "step": 475670 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011504532364217002, + "loss": 0.0083, + "step": 475680 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011504143542579857, + "loss": 0.0071, + "step": 475690 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150375472094271, + "loss": 0.0115, + "step": 475700 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011503365899305563, + "loss": 0.0115, + "step": 475710 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011502977077668416, + "loss": 0.0108, + "step": 475720 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150258825603127, + "loss": 0.0104, + "step": 475730 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011502199434394123, + "loss": 0.0111, + "step": 475740 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011501810612756979, + "loss": 0.0124, + "step": 475750 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001150142179111983, + "loss": 0.0102, + "step": 475760 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011501032969482686, + "loss": 0.0111, + "step": 475770 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011500644147845539, + "loss": 0.0077, + "step": 475780 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011500255326208393, + "loss": 0.0096, + "step": 475790 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011499866504571246, + "loss": 0.0141, + "step": 475800 + }, + { + "epoch": 1.23, + "learning_rate": 0.000114994776829341, + "loss": 0.0098, + "step": 475810 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011499088861296953, + "loss": 0.0111, + "step": 475820 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011498700039659807, + "loss": 0.012, + "step": 475830 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149831121802266, + "loss": 0.0097, + "step": 475840 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011497922396385514, + "loss": 0.0093, + "step": 475850 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011497533574748366, + "loss": 0.0128, + "step": 475860 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011497144753111219, + "loss": 0.0113, + "step": 475870 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011496755931474073, + "loss": 0.009, + "step": 475880 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011496367109836926, + "loss": 0.0116, + "step": 475890 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149597828819978, + "loss": 0.0105, + "step": 475900 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011495589466562633, + "loss": 0.0091, + "step": 475910 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011495200644925487, + "loss": 0.0088, + "step": 475920 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149481182328834, + "loss": 0.0133, + "step": 475930 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011494423001651196, + "loss": 0.0126, + "step": 475940 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011494034180014049, + "loss": 0.0101, + "step": 475950 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011493645358376903, + "loss": 0.01, + "step": 475960 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011493256536739755, + "loss": 0.0104, + "step": 475970 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149286771510261, + "loss": 0.0124, + "step": 475980 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011492478893465462, + "loss": 0.0081, + "step": 475990 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011492090071828317, + "loss": 0.0087, + "step": 476000 + }, + { + "epoch": 1.23, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.00715318787842989, + "eval_runtime": 108.0552, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 476000 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149170125019117, + "loss": 0.0087, + "step": 476010 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011491312428554024, + "loss": 0.0087, + "step": 476020 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011490923606916876, + "loss": 0.0108, + "step": 476030 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001149053478527973, + "loss": 0.0096, + "step": 476040 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011490145963642583, + "loss": 0.0109, + "step": 476050 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011489757142005438, + "loss": 0.0089, + "step": 476060 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148936832036829, + "loss": 0.012, + "step": 476070 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011488979498731145, + "loss": 0.0095, + "step": 476080 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011488590677093997, + "loss": 0.0109, + "step": 476090 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011488201855456853, + "loss": 0.0091, + "step": 476100 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011487813033819706, + "loss": 0.0106, + "step": 476110 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011487424212182557, + "loss": 0.0099, + "step": 476120 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011487035390545413, + "loss": 0.0098, + "step": 476130 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011486646568908265, + "loss": 0.0108, + "step": 476140 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148625774727112, + "loss": 0.0106, + "step": 476150 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011485868925633972, + "loss": 0.0072, + "step": 476160 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011485480103996827, + "loss": 0.0098, + "step": 476170 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148509128235968, + "loss": 0.009, + "step": 476180 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011484702460722534, + "loss": 0.0102, + "step": 476190 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011484313639085386, + "loss": 0.0103, + "step": 476200 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148392481744824, + "loss": 0.0118, + "step": 476210 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011483535995811093, + "loss": 0.0093, + "step": 476220 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011483147174173947, + "loss": 0.0108, + "step": 476230 + }, + { + "epoch": 1.23, + "learning_rate": 0.000114827583525368, + "loss": 0.0094, + "step": 476240 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011482369530899654, + "loss": 0.011, + "step": 476250 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011481980709262507, + "loss": 0.009, + "step": 476260 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011481591887625361, + "loss": 0.0116, + "step": 476270 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011481203065988214, + "loss": 0.0086, + "step": 476280 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001148081424435107, + "loss": 0.0098, + "step": 476290 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011480425422713923, + "loss": 0.0117, + "step": 476300 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011480036601076777, + "loss": 0.0127, + "step": 476310 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147964777943963, + "loss": 0.0113, + "step": 476320 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011479258957802484, + "loss": 0.0089, + "step": 476330 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011478870136165337, + "loss": 0.011, + "step": 476340 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147848131452819, + "loss": 0.0114, + "step": 476350 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011478092492891043, + "loss": 0.0089, + "step": 476360 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011477703671253896, + "loss": 0.0093, + "step": 476370 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147731484961675, + "loss": 0.0128, + "step": 476380 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011476926027979603, + "loss": 0.0188, + "step": 476390 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011476537206342457, + "loss": 0.0083, + "step": 476400 + }, + { + "epoch": 1.23, + "learning_rate": 0.0001147614838470531, + "loss": 0.0077, + "step": 476410 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011475759563068164, + "loss": 0.012, + "step": 476420 + }, + { + "epoch": 1.23, + "learning_rate": 0.00011475370741431017, + "loss": 0.009, + "step": 476430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011474981919793871, + "loss": 0.0103, + "step": 476440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011474593098156724, + "loss": 0.0114, + "step": 476450 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001147420427651958, + "loss": 0.0106, + "step": 476460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011473815454882431, + "loss": 0.0108, + "step": 476470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011473426633245287, + "loss": 0.0089, + "step": 476480 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001147303781160814, + "loss": 0.0108, + "step": 476490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011472648989970994, + "loss": 0.0084, + "step": 476500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011472260168333846, + "loss": 0.0145, + "step": 476510 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114718713466967, + "loss": 0.0111, + "step": 476520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011471482525059553, + "loss": 0.0127, + "step": 476530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011471093703422408, + "loss": 0.0112, + "step": 476540 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001147070488178526, + "loss": 0.009, + "step": 476550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011470316060148115, + "loss": 0.0098, + "step": 476560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011469927238510967, + "loss": 0.0104, + "step": 476570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011469538416873822, + "loss": 0.0118, + "step": 476580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011469149595236674, + "loss": 0.0087, + "step": 476590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011468760773599529, + "loss": 0.0103, + "step": 476600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011468371951962381, + "loss": 0.0117, + "step": 476610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011467983130325234, + "loss": 0.0114, + "step": 476620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011467594308688088, + "loss": 0.0108, + "step": 476630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011467205487050941, + "loss": 0.01, + "step": 476640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011466816665413797, + "loss": 0.0099, + "step": 476650 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001146642784377665, + "loss": 0.009, + "step": 476660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011466039022139504, + "loss": 0.0103, + "step": 476670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011465650200502356, + "loss": 0.0101, + "step": 476680 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001146526137886521, + "loss": 0.0093, + "step": 476690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011464872557228063, + "loss": 0.0082, + "step": 476700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011464483735590918, + "loss": 0.0089, + "step": 476710 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001146409491395377, + "loss": 0.0106, + "step": 476720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011463706092316624, + "loss": 0.0096, + "step": 476730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011463317270679477, + "loss": 0.0097, + "step": 476740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462928449042331, + "loss": 0.0106, + "step": 476750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462539627405184, + "loss": 0.0119, + "step": 476760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011462150805768038, + "loss": 0.0095, + "step": 476770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011461761984130891, + "loss": 0.0102, + "step": 476780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011461373162493745, + "loss": 0.0132, + "step": 476790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011460984340856598, + "loss": 0.0113, + "step": 476800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011460595519219454, + "loss": 0.0127, + "step": 476810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011460206697582307, + "loss": 0.0115, + "step": 476820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011459817875945161, + "loss": 0.0087, + "step": 476830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011459429054308014, + "loss": 0.01, + "step": 476840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011459040232670868, + "loss": 0.0109, + "step": 476850 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145865141103372, + "loss": 0.0134, + "step": 476860 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011458262589396573, + "loss": 0.0107, + "step": 476870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011457873767759427, + "loss": 0.0111, + "step": 476880 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145748494612228, + "loss": 0.0061, + "step": 476890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011457096124485134, + "loss": 0.0144, + "step": 476900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011456707302847987, + "loss": 0.0116, + "step": 476910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011456318481210841, + "loss": 0.0098, + "step": 476920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011455929659573694, + "loss": 0.0115, + "step": 476930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011455540837936548, + "loss": 0.0099, + "step": 476940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011455152016299401, + "loss": 0.0092, + "step": 476950 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011454763194662255, + "loss": 0.011, + "step": 476960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011454374373025108, + "loss": 0.0089, + "step": 476970 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011453985551387964, + "loss": 0.0083, + "step": 476980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011453596729750815, + "loss": 0.0089, + "step": 476990 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145320790811367, + "loss": 0.0112, + "step": 477000 + }, + { + "epoch": 1.24, + "eval_cer": 0.8817054855970361, + "eval_loss": 0.0070707546547055244, + "eval_runtime": 108.0477, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.628, + "step": 477000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011452819086476523, + "loss": 0.011, + "step": 477010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011452430264839378, + "loss": 0.0081, + "step": 477020 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001145204144320223, + "loss": 0.0096, + "step": 477030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011451652621565085, + "loss": 0.0095, + "step": 477040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011451263799927937, + "loss": 0.0121, + "step": 477050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450874978290792, + "loss": 0.01, + "step": 477060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450486156653644, + "loss": 0.0177, + "step": 477070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011450097335016499, + "loss": 0.0117, + "step": 477080 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011449708513379351, + "loss": 0.0082, + "step": 477090 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011449319691742206, + "loss": 0.013, + "step": 477100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011448930870105058, + "loss": 0.0111, + "step": 477110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011448542048467911, + "loss": 0.0115, + "step": 477120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011448153226830765, + "loss": 0.0104, + "step": 477130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011447764405193618, + "loss": 0.011, + "step": 477140 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011447375583556472, + "loss": 0.0111, + "step": 477150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011446986761919325, + "loss": 0.0123, + "step": 477160 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144659794028218, + "loss": 0.0127, + "step": 477170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011446209118645033, + "loss": 0.0096, + "step": 477180 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011445820297007888, + "loss": 0.0097, + "step": 477190 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144543147537074, + "loss": 0.0116, + "step": 477200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011445042653733595, + "loss": 0.0088, + "step": 477210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011444653832096447, + "loss": 0.0103, + "step": 477220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011444265010459302, + "loss": 0.0077, + "step": 477230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011443876188822154, + "loss": 0.0105, + "step": 477240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011443487367185008, + "loss": 0.01, + "step": 477250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011443098545547861, + "loss": 0.0099, + "step": 477260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011442709723910715, + "loss": 0.0104, + "step": 477270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011442320902273568, + "loss": 0.0116, + "step": 477280 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011441932080636422, + "loss": 0.0105, + "step": 477290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011441543258999275, + "loss": 0.0113, + "step": 477300 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001144115443736213, + "loss": 0.0123, + "step": 477310 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011440765615724982, + "loss": 0.0129, + "step": 477320 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011440376794087838, + "loss": 0.012, + "step": 477330 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001143998797245069, + "loss": 0.0111, + "step": 477340 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011439599150813545, + "loss": 0.0109, + "step": 477350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011439210329176398, + "loss": 0.0116, + "step": 477360 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001143882150753925, + "loss": 0.008, + "step": 477370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011438432685902104, + "loss": 0.0074, + "step": 477380 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011438043864264957, + "loss": 0.0083, + "step": 477390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011437655042627811, + "loss": 0.0105, + "step": 477400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011437266220990664, + "loss": 0.0125, + "step": 477410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436877399353518, + "loss": 0.0092, + "step": 477420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436488577716371, + "loss": 0.0085, + "step": 477430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011436099756079225, + "loss": 0.0079, + "step": 477440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011435710934442078, + "loss": 0.0097, + "step": 477450 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011435322112804932, + "loss": 0.0088, + "step": 477460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011434933291167785, + "loss": 0.0119, + "step": 477470 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001143454446953064, + "loss": 0.0099, + "step": 477480 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011434155647893492, + "loss": 0.0106, + "step": 477490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011433766826256346, + "loss": 0.0105, + "step": 477500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011433378004619199, + "loss": 0.0131, + "step": 477510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011432989182982055, + "loss": 0.012, + "step": 477520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011432600361344907, + "loss": 0.0088, + "step": 477530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011432211539707762, + "loss": 0.0099, + "step": 477540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431822718070614, + "loss": 0.0158, + "step": 477550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431433896433469, + "loss": 0.013, + "step": 477560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011431045074796321, + "loss": 0.0102, + "step": 477570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011430656253159176, + "loss": 0.0115, + "step": 477580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011430267431522028, + "loss": 0.0094, + "step": 477590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011429878609884883, + "loss": 0.0127, + "step": 477600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011429489788247735, + "loss": 0.0114, + "step": 477610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011429100966610588, + "loss": 0.0103, + "step": 477620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011428712144973442, + "loss": 0.0083, + "step": 477630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011428323323336295, + "loss": 0.0093, + "step": 477640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011427934501699149, + "loss": 0.01, + "step": 477650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011427545680062002, + "loss": 0.0113, + "step": 477660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011427156858424856, + "loss": 0.0117, + "step": 477670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011426768036787709, + "loss": 0.0112, + "step": 477680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011426379215150565, + "loss": 0.0116, + "step": 477690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425990393513416, + "loss": 0.0104, + "step": 477700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425601571876272, + "loss": 0.0086, + "step": 477710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011425212750239124, + "loss": 0.0106, + "step": 477720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011424823928601979, + "loss": 0.0091, + "step": 477730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011424435106964831, + "loss": 0.0101, + "step": 477740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011424046285327686, + "loss": 0.0116, + "step": 477750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011423657463690538, + "loss": 0.0106, + "step": 477760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011423268642053392, + "loss": 0.0106, + "step": 477770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011422879820416245, + "loss": 0.0084, + "step": 477780 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114224909987791, + "loss": 0.0129, + "step": 477790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011422102177141952, + "loss": 0.0096, + "step": 477800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011421713355504806, + "loss": 0.0088, + "step": 477810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011421324533867659, + "loss": 0.0092, + "step": 477820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011420935712230513, + "loss": 0.0096, + "step": 477830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011420546890593366, + "loss": 0.0086, + "step": 477840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011420158068956222, + "loss": 0.0099, + "step": 477850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011419769247319073, + "loss": 0.008, + "step": 477860 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011419380425681926, + "loss": 0.01, + "step": 477870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011418991604044782, + "loss": 0.0094, + "step": 477880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011418602782407634, + "loss": 0.0139, + "step": 477890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011418213960770488, + "loss": 0.0148, + "step": 477900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011417825139133341, + "loss": 0.0126, + "step": 477910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011417436317496195, + "loss": 0.0111, + "step": 477920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011417047495859048, + "loss": 0.0116, + "step": 477930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011416658674221902, + "loss": 0.0103, + "step": 477940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011416269852584755, + "loss": 0.0118, + "step": 477950 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141588103094761, + "loss": 0.01, + "step": 477960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011415492209310462, + "loss": 0.0123, + "step": 477970 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011415103387673316, + "loss": 0.0114, + "step": 477980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011414714566036169, + "loss": 0.0126, + "step": 477990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011414325744399023, + "loss": 0.0094, + "step": 478000 + }, + { + "epoch": 1.24, + "eval_cer": 0.881688689953826, + "eval_loss": 0.007163301110267639, + "eval_runtime": 107.8483, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, + "step": 478000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011413936922761876, + "loss": 0.0111, + "step": 478010 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141354810112473, + "loss": 0.0131, + "step": 478020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011413159279487583, + "loss": 0.0115, + "step": 478030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011412770457850439, + "loss": 0.0126, + "step": 478040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011412381636213291, + "loss": 0.0079, + "step": 478050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011411992814576146, + "loss": 0.0113, + "step": 478060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011411603992938998, + "loss": 0.0117, + "step": 478070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011411215171301853, + "loss": 0.0086, + "step": 478080 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011410826349664705, + "loss": 0.0129, + "step": 478090 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001141043752802756, + "loss": 0.0121, + "step": 478100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011410048706390412, + "loss": 0.0105, + "step": 478110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011409659884753265, + "loss": 0.0125, + "step": 478120 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140927106311612, + "loss": 0.0103, + "step": 478130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011408882241478972, + "loss": 0.0083, + "step": 478140 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011408493419841826, + "loss": 0.0119, + "step": 478150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011408104598204679, + "loss": 0.0082, + "step": 478160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011407715776567533, + "loss": 0.0087, + "step": 478170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011407326954930386, + "loss": 0.0109, + "step": 478180 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140693813329324, + "loss": 0.0182, + "step": 478190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011406549311656093, + "loss": 0.0094, + "step": 478200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011406160490018949, + "loss": 0.012, + "step": 478210 + }, + { + "epoch": 1.24, + "learning_rate": 0.000114057716683818, + "loss": 0.0096, + "step": 478220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011405382846744656, + "loss": 0.0097, + "step": 478230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011404994025107508, + "loss": 0.0109, + "step": 478240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011404605203470363, + "loss": 0.0112, + "step": 478250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011404216381833215, + "loss": 0.0136, + "step": 478260 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140382756019607, + "loss": 0.0095, + "step": 478270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011403438738558922, + "loss": 0.0098, + "step": 478280 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011403049916921776, + "loss": 0.0105, + "step": 478290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011402661095284629, + "loss": 0.0133, + "step": 478300 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011402272273647483, + "loss": 0.0102, + "step": 478310 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011401883452010336, + "loss": 0.0083, + "step": 478320 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140149463037319, + "loss": 0.0112, + "step": 478330 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011401105808736043, + "loss": 0.0128, + "step": 478340 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011400716987098896, + "loss": 0.0095, + "step": 478350 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001140032816546175, + "loss": 0.012, + "step": 478360 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011399939343824603, + "loss": 0.0087, + "step": 478370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011399550522187457, + "loss": 0.0084, + "step": 478380 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139916170055031, + "loss": 0.0109, + "step": 478390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011398772878913165, + "loss": 0.0118, + "step": 478400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011398384057276018, + "loss": 0.0107, + "step": 478410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011397995235638872, + "loss": 0.0087, + "step": 478420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011397606414001725, + "loss": 0.0093, + "step": 478430 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139721759236458, + "loss": 0.0093, + "step": 478440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011396828770727432, + "loss": 0.0108, + "step": 478450 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011396439949090286, + "loss": 0.009, + "step": 478460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011396051127453139, + "loss": 0.0126, + "step": 478470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011395662305815993, + "loss": 0.0118, + "step": 478480 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011395273484178846, + "loss": 0.0105, + "step": 478490 + }, + { + "epoch": 1.24, + "learning_rate": 0.000113948846625417, + "loss": 0.0097, + "step": 478500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011394495840904553, + "loss": 0.0103, + "step": 478510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011394107019267407, + "loss": 0.0098, + "step": 478520 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139371819763026, + "loss": 0.0119, + "step": 478530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011393329375993114, + "loss": 0.0117, + "step": 478540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011392940554355967, + "loss": 0.0098, + "step": 478550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011392551732718823, + "loss": 0.0118, + "step": 478560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011392162911081675, + "loss": 0.0102, + "step": 478570 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139177408944453, + "loss": 0.0101, + "step": 478580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011391385267807382, + "loss": 0.0108, + "step": 478590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011390996446170235, + "loss": 0.0077, + "step": 478600 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001139060762453309, + "loss": 0.0097, + "step": 478610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011390218802895942, + "loss": 0.0082, + "step": 478620 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011389829981258796, + "loss": 0.01, + "step": 478630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011389441159621649, + "loss": 0.0085, + "step": 478640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011389052337984503, + "loss": 0.0094, + "step": 478650 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011388663516347356, + "loss": 0.0127, + "step": 478660 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138827469471021, + "loss": 0.0082, + "step": 478670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011387885873073063, + "loss": 0.0118, + "step": 478680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011387497051435917, + "loss": 0.0077, + "step": 478690 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138710822979877, + "loss": 0.0095, + "step": 478700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011386719408161624, + "loss": 0.0103, + "step": 478710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011386330586524477, + "loss": 0.0082, + "step": 478720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011385941764887333, + "loss": 0.0093, + "step": 478730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011385552943250184, + "loss": 0.0074, + "step": 478740 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138516412161304, + "loss": 0.0087, + "step": 478750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011384775299975892, + "loss": 0.0098, + "step": 478760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011384386478338747, + "loss": 0.0082, + "step": 478770 + }, + { + "epoch": 1.24, + "learning_rate": 0.000113839976567016, + "loss": 0.0089, + "step": 478780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011383608835064453, + "loss": 0.0099, + "step": 478790 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011383220013427306, + "loss": 0.0113, + "step": 478800 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138283119179016, + "loss": 0.0191, + "step": 478810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011382442370153013, + "loss": 0.0108, + "step": 478820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011382053548515867, + "loss": 0.0108, + "step": 478830 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138166472687872, + "loss": 0.0107, + "step": 478840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011381275905241573, + "loss": 0.0113, + "step": 478850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011380887083604427, + "loss": 0.0119, + "step": 478860 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001138049826196728, + "loss": 0.0104, + "step": 478870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011380109440330134, + "loss": 0.0079, + "step": 478880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011379720618692987, + "loss": 0.013, + "step": 478890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011379331797055841, + "loss": 0.01, + "step": 478900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011378942975418694, + "loss": 0.0092, + "step": 478910 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137855415378155, + "loss": 0.0106, + "step": 478920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011378165332144402, + "loss": 0.0097, + "step": 478930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011377776510507256, + "loss": 0.011, + "step": 478940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011377387688870109, + "loss": 0.0092, + "step": 478950 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011376998867232963, + "loss": 0.0109, + "step": 478960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011376610045595816, + "loss": 0.0111, + "step": 478970 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137622122395867, + "loss": 0.0119, + "step": 478980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375832402321523, + "loss": 0.0116, + "step": 478990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011375443580684377, + "loss": 0.0129, + "step": 479000 + }, + { + "epoch": 1.24, + "eval_cer": 0.88167329394755, + "eval_loss": 0.006849655415862799, + "eval_runtime": 107.8443, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, + "step": 479000 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001137505475904723, + "loss": 0.0105, + "step": 479010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011374665937410084, + "loss": 0.0131, + "step": 479020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011374277115772937, + "loss": 0.0097, + "step": 479030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011373888294135791, + "loss": 0.0103, + "step": 479040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011373499472498644, + "loss": 0.0093, + "step": 479050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011373110650861498, + "loss": 0.0115, + "step": 479060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011372721829224351, + "loss": 0.0153, + "step": 479070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011372333007587207, + "loss": 0.0104, + "step": 479080 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011371944185950058, + "loss": 0.0125, + "step": 479090 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011371555364312911, + "loss": 0.013, + "step": 479100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011371166542675766, + "loss": 0.0094, + "step": 479110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011370777721038619, + "loss": 0.0137, + "step": 479120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011370388899401473, + "loss": 0.0106, + "step": 479130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011370000077764326, + "loss": 0.0121, + "step": 479140 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136961125612718, + "loss": 0.01, + "step": 479150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011369222434490033, + "loss": 0.0098, + "step": 479160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011368833612852887, + "loss": 0.0124, + "step": 479170 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136844479121574, + "loss": 0.0104, + "step": 479180 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011368055969578594, + "loss": 0.0125, + "step": 479190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011367667147941447, + "loss": 0.0091, + "step": 479200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011367278326304301, + "loss": 0.0102, + "step": 479210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366889504667154, + "loss": 0.0096, + "step": 479220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366500683030008, + "loss": 0.0102, + "step": 479230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011366111861392861, + "loss": 0.0079, + "step": 479240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011365723039755715, + "loss": 0.0098, + "step": 479250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011365334218118568, + "loss": 0.0137, + "step": 479260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011364945396481424, + "loss": 0.0161, + "step": 479270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011364556574844276, + "loss": 0.0123, + "step": 479280 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136416775320713, + "loss": 0.0094, + "step": 479290 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011363778931569983, + "loss": 0.0109, + "step": 479300 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011363390109932837, + "loss": 0.0074, + "step": 479310 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136300128829569, + "loss": 0.0099, + "step": 479320 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011362612466658544, + "loss": 0.0129, + "step": 479330 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011362223645021397, + "loss": 0.0094, + "step": 479340 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001136183482338425, + "loss": 0.0086, + "step": 479350 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011361446001747104, + "loss": 0.0116, + "step": 479360 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011361057180109957, + "loss": 0.0136, + "step": 479370 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011360668358472811, + "loss": 0.012, + "step": 479380 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011360279536835664, + "loss": 0.0069, + "step": 479390 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011359890715198518, + "loss": 0.0095, + "step": 479400 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011359501893561371, + "loss": 0.0105, + "step": 479410 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011359113071924225, + "loss": 0.0103, + "step": 479420 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011358724250287078, + "loss": 0.0143, + "step": 479430 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011358335428649933, + "loss": 0.0097, + "step": 479440 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011357946607012785, + "loss": 0.0103, + "step": 479450 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001135755778537564, + "loss": 0.0092, + "step": 479460 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011357168963738493, + "loss": 0.0112, + "step": 479470 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011356780142101347, + "loss": 0.0117, + "step": 479480 + }, + { + "epoch": 1.24, + "learning_rate": 0.000113563913204642, + "loss": 0.0142, + "step": 479490 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011356002498827054, + "loss": 0.0134, + "step": 479500 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011355613677189907, + "loss": 0.01, + "step": 479510 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011355224855552761, + "loss": 0.0133, + "step": 479520 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011354836033915614, + "loss": 0.0085, + "step": 479530 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011354447212278468, + "loss": 0.0116, + "step": 479540 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011354058390641321, + "loss": 0.0149, + "step": 479550 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011353669569004175, + "loss": 0.0098, + "step": 479560 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011353280747367028, + "loss": 0.0112, + "step": 479570 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011352891925729882, + "loss": 0.0115, + "step": 479580 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011352503104092735, + "loss": 0.0081, + "step": 479590 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011352114282455588, + "loss": 0.0114, + "step": 479600 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011351725460818442, + "loss": 0.0088, + "step": 479610 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011351336639181295, + "loss": 0.009, + "step": 479620 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001135094781754415, + "loss": 0.0084, + "step": 479630 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011350558995907003, + "loss": 0.0093, + "step": 479640 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011350170174269857, + "loss": 0.0093, + "step": 479650 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134978135263271, + "loss": 0.0061, + "step": 479660 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011349392530995564, + "loss": 0.0105, + "step": 479670 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011349003709358417, + "loss": 0.013, + "step": 479680 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011348614887721271, + "loss": 0.0126, + "step": 479690 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011348226066084124, + "loss": 0.019, + "step": 479700 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347837244446978, + "loss": 0.0089, + "step": 479710 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347448422809831, + "loss": 0.0127, + "step": 479720 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011347059601172685, + "loss": 0.01, + "step": 479730 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011346670779535538, + "loss": 0.0106, + "step": 479740 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011346281957898392, + "loss": 0.0091, + "step": 479750 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011345893136261245, + "loss": 0.0167, + "step": 479760 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011345504314624099, + "loss": 0.0074, + "step": 479770 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011345115492986952, + "loss": 0.0075, + "step": 479780 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011344726671349808, + "loss": 0.0131, + "step": 479790 + }, + { + "epoch": 1.24, + "learning_rate": 0.0001134433784971266, + "loss": 0.0173, + "step": 479800 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011343949028075514, + "loss": 0.0098, + "step": 479810 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011343560206438367, + "loss": 0.0154, + "step": 479820 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011343171384801221, + "loss": 0.0086, + "step": 479830 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011342782563164074, + "loss": 0.0107, + "step": 479840 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011342393741526927, + "loss": 0.0091, + "step": 479850 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011342004919889781, + "loss": 0.0096, + "step": 479860 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011341616098252634, + "loss": 0.0121, + "step": 479870 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011341227276615488, + "loss": 0.012, + "step": 479880 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011340838454978341, + "loss": 0.0109, + "step": 479890 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011340449633341195, + "loss": 0.0088, + "step": 479900 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011340060811704048, + "loss": 0.0106, + "step": 479910 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011339671990066902, + "loss": 0.012, + "step": 479920 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011339283168429755, + "loss": 0.0112, + "step": 479930 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338894346792609, + "loss": 0.0077, + "step": 479940 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338505525155462, + "loss": 0.0136, + "step": 479950 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011338116703518317, + "loss": 0.0107, + "step": 479960 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011337727881881169, + "loss": 0.0087, + "step": 479970 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011337339060244024, + "loss": 0.0121, + "step": 479980 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011336950238606877, + "loss": 0.011, + "step": 479990 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011336561416969731, + "loss": 0.0108, + "step": 480000 + }, + { + "epoch": 1.24, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.0065583763644099236, + "eval_runtime": 107.8502, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 480000 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011336172595332584, + "loss": 0.0118, + "step": 480010 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335783773695438, + "loss": 0.0136, + "step": 480020 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335394952058291, + "loss": 0.0105, + "step": 480030 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011335006130421145, + "loss": 0.0116, + "step": 480040 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011334617308783998, + "loss": 0.009, + "step": 480050 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011334228487146852, + "loss": 0.0127, + "step": 480060 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011333839665509705, + "loss": 0.0081, + "step": 480070 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011333450843872559, + "loss": 0.0088, + "step": 480080 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011333062022235412, + "loss": 0.0115, + "step": 480090 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011332673200598265, + "loss": 0.0085, + "step": 480100 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011332284378961119, + "loss": 0.0093, + "step": 480110 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011331895557323972, + "loss": 0.0095, + "step": 480120 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011331506735686826, + "loss": 0.0125, + "step": 480130 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011331117914049679, + "loss": 0.0182, + "step": 480140 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011330729092412534, + "loss": 0.0109, + "step": 480150 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011330340270775387, + "loss": 0.0134, + "step": 480160 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011329951449138241, + "loss": 0.007, + "step": 480170 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011329562627501094, + "loss": 0.014, + "step": 480180 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011329173805863948, + "loss": 0.0105, + "step": 480190 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011328784984226801, + "loss": 0.0121, + "step": 480200 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011328396162589655, + "loss": 0.0127, + "step": 480210 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011328007340952508, + "loss": 0.0082, + "step": 480220 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011327618519315362, + "loss": 0.0107, + "step": 480230 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011327229697678215, + "loss": 0.0089, + "step": 480240 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011326840876041069, + "loss": 0.0138, + "step": 480250 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011326452054403922, + "loss": 0.01, + "step": 480260 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011326063232766776, + "loss": 0.0108, + "step": 480270 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011325674411129629, + "loss": 0.0122, + "step": 480280 + }, + { + "epoch": 1.24, + "learning_rate": 0.00011325285589492483, + "loss": 0.0105, + "step": 480290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011324896767855336, + "loss": 0.0093, + "step": 480300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011324507946218192, + "loss": 0.0076, + "step": 480310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011324119124581044, + "loss": 0.0098, + "step": 480320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011323730302943898, + "loss": 0.011, + "step": 480330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011323341481306751, + "loss": 0.0087, + "step": 480340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322952659669604, + "loss": 0.0082, + "step": 480350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322563838032458, + "loss": 0.0111, + "step": 480360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011322175016395311, + "loss": 0.0098, + "step": 480370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011321786194758165, + "loss": 0.0124, + "step": 480380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011321397373121018, + "loss": 0.0088, + "step": 480390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011321008551483872, + "loss": 0.012, + "step": 480400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011320619729846725, + "loss": 0.0115, + "step": 480410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011320230908209579, + "loss": 0.0092, + "step": 480420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319842086572432, + "loss": 0.0099, + "step": 480430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319453264935286, + "loss": 0.0112, + "step": 480440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011319064443298139, + "loss": 0.0081, + "step": 480450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011318675621660993, + "loss": 0.0105, + "step": 480460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011318286800023846, + "loss": 0.0132, + "step": 480470 + }, + { + "epoch": 1.25, + "learning_rate": 0.000113178979783867, + "loss": 0.0127, + "step": 480480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011317509156749553, + "loss": 0.0138, + "step": 480490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011317120335112408, + "loss": 0.0109, + "step": 480500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011316731513475261, + "loss": 0.0118, + "step": 480510 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011316342691838115, + "loss": 0.0103, + "step": 480520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011315953870200968, + "loss": 0.0093, + "step": 480530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011315565048563822, + "loss": 0.0102, + "step": 480540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011315176226926675, + "loss": 0.0089, + "step": 480550 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131478740528953, + "loss": 0.0096, + "step": 480560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011314398583652382, + "loss": 0.0162, + "step": 480570 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011314009762015236, + "loss": 0.0075, + "step": 480580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011313620940378089, + "loss": 0.0113, + "step": 480590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011313232118740942, + "loss": 0.0097, + "step": 480600 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011312843297103796, + "loss": 0.0087, + "step": 480610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011312454475466649, + "loss": 0.0081, + "step": 480620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011312065653829503, + "loss": 0.0103, + "step": 480630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011311676832192356, + "loss": 0.0107, + "step": 480640 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131128801055521, + "loss": 0.0093, + "step": 480650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011310899188918063, + "loss": 0.0086, + "step": 480660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011310510367280918, + "loss": 0.0079, + "step": 480670 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001131012154564377, + "loss": 0.0149, + "step": 480680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011309732724006625, + "loss": 0.0069, + "step": 480690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011309343902369478, + "loss": 0.0093, + "step": 480700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011308955080732332, + "loss": 0.0089, + "step": 480710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011308566259095185, + "loss": 0.0096, + "step": 480720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011308177437458039, + "loss": 0.0088, + "step": 480730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011307788615820892, + "loss": 0.01, + "step": 480740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011307399794183746, + "loss": 0.0134, + "step": 480750 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011307010972546599, + "loss": 0.0105, + "step": 480760 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011306622150909453, + "loss": 0.0092, + "step": 480770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011306233329272306, + "loss": 0.0129, + "step": 480780 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001130584450763516, + "loss": 0.0135, + "step": 480790 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011305455685998013, + "loss": 0.0089, + "step": 480800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011305066864360867, + "loss": 0.0095, + "step": 480810 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001130467804272372, + "loss": 0.0134, + "step": 480820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011304289221086576, + "loss": 0.0093, + "step": 480830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011303900399449427, + "loss": 0.0124, + "step": 480840 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001130351157781228, + "loss": 0.0124, + "step": 480850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011303122756175135, + "loss": 0.0081, + "step": 480860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011302733934537988, + "loss": 0.0068, + "step": 480870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011302345112900842, + "loss": 0.012, + "step": 480880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011301956291263695, + "loss": 0.0127, + "step": 480890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011301567469626549, + "loss": 0.0102, + "step": 480900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011301178647989402, + "loss": 0.0103, + "step": 480910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300789826352256, + "loss": 0.0107, + "step": 480920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300401004715109, + "loss": 0.0113, + "step": 480930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011300012183077963, + "loss": 0.0122, + "step": 480940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011299623361440816, + "loss": 0.011, + "step": 480950 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129923453980367, + "loss": 0.0103, + "step": 480960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011298845718166523, + "loss": 0.0138, + "step": 480970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011298456896529377, + "loss": 0.0079, + "step": 480980 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129806807489223, + "loss": 0.0094, + "step": 480990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011297679253255084, + "loss": 0.0123, + "step": 481000 + }, + { + "epoch": 1.25, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.006680840160697699, + "eval_runtime": 108.1021, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, + "step": 481000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011297290431617937, + "loss": 0.0169, + "step": 481010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011296901609980792, + "loss": 0.0127, + "step": 481020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011296512788343645, + "loss": 0.0091, + "step": 481030 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112961239667065, + "loss": 0.0098, + "step": 481040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011295735145069352, + "loss": 0.0087, + "step": 481050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011295346323432206, + "loss": 0.0097, + "step": 481060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294957501795059, + "loss": 0.0094, + "step": 481070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294568680157912, + "loss": 0.0102, + "step": 481080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011294179858520766, + "loss": 0.0107, + "step": 481090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011293791036883619, + "loss": 0.0088, + "step": 481100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011293402215246473, + "loss": 0.0086, + "step": 481110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011293013393609326, + "loss": 0.0107, + "step": 481120 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129262457197218, + "loss": 0.0097, + "step": 481130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011292235750335033, + "loss": 0.0107, + "step": 481140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011291846928697887, + "loss": 0.0117, + "step": 481150 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001129145810706074, + "loss": 0.0089, + "step": 481160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011291069285423594, + "loss": 0.0131, + "step": 481170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011290680463786447, + "loss": 0.0125, + "step": 481180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011290291642149302, + "loss": 0.0091, + "step": 481190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011289902820512154, + "loss": 0.0129, + "step": 481200 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128951399887501, + "loss": 0.0105, + "step": 481210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011289125177237862, + "loss": 0.0119, + "step": 481220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011288736355600716, + "loss": 0.0099, + "step": 481230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011288347533963569, + "loss": 0.0124, + "step": 481240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011287958712326423, + "loss": 0.0106, + "step": 481250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011287569890689276, + "loss": 0.0095, + "step": 481260 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128718106905213, + "loss": 0.0134, + "step": 481270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011286792247414983, + "loss": 0.0111, + "step": 481280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011286403425777837, + "loss": 0.0091, + "step": 481290 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128601460414069, + "loss": 0.0113, + "step": 481300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011285625782503544, + "loss": 0.0131, + "step": 481310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011285236960866397, + "loss": 0.0093, + "step": 481320 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128484813922925, + "loss": 0.0114, + "step": 481330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011284459317592104, + "loss": 0.0178, + "step": 481340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011284070495954957, + "loss": 0.0146, + "step": 481350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011283681674317811, + "loss": 0.0113, + "step": 481360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011283292852680664, + "loss": 0.0176, + "step": 481370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282904031043519, + "loss": 0.0125, + "step": 481380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282515209406372, + "loss": 0.0101, + "step": 481390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011282126387769226, + "loss": 0.0125, + "step": 481400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011281737566132079, + "loss": 0.0148, + "step": 481410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011281348744494933, + "loss": 0.0117, + "step": 481420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011280959922857786, + "loss": 0.009, + "step": 481430 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001128057110122064, + "loss": 0.0101, + "step": 481440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011280182279583493, + "loss": 0.013, + "step": 481450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011279793457946347, + "loss": 0.0126, + "step": 481460 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112794046363092, + "loss": 0.0087, + "step": 481470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011279015814672054, + "loss": 0.0135, + "step": 481480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011278626993034907, + "loss": 0.0088, + "step": 481490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011278238171397761, + "loss": 0.0082, + "step": 481500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011277849349760614, + "loss": 0.0083, + "step": 481510 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011277460528123468, + "loss": 0.0075, + "step": 481520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011277071706486321, + "loss": 0.011, + "step": 481530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011276682884849176, + "loss": 0.0095, + "step": 481540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011276294063212029, + "loss": 0.0112, + "step": 481550 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011275905241574883, + "loss": 0.0144, + "step": 481560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011275516419937736, + "loss": 0.0101, + "step": 481570 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011275127598300589, + "loss": 0.0138, + "step": 481580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011274738776663443, + "loss": 0.0094, + "step": 481590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011274349955026296, + "loss": 0.0108, + "step": 481600 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001127396113338915, + "loss": 0.0093, + "step": 481610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011273572311752003, + "loss": 0.009, + "step": 481620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011273183490114857, + "loss": 0.0094, + "step": 481630 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001127279466847771, + "loss": 0.0111, + "step": 481640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011272405846840564, + "loss": 0.0092, + "step": 481650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011272017025203417, + "loss": 0.0106, + "step": 481660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011271628203566271, + "loss": 0.0104, + "step": 481670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011271239381929124, + "loss": 0.0087, + "step": 481680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011270850560291978, + "loss": 0.0081, + "step": 481690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011270461738654831, + "loss": 0.0123, + "step": 481700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011270072917017685, + "loss": 0.0107, + "step": 481710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011269684095380538, + "loss": 0.0099, + "step": 481720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011269295273743393, + "loss": 0.0099, + "step": 481730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011268906452106246, + "loss": 0.0088, + "step": 481740 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112685176304691, + "loss": 0.0113, + "step": 481750 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011268128808831953, + "loss": 0.0094, + "step": 481760 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011267739987194807, + "loss": 0.0098, + "step": 481770 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126735116555766, + "loss": 0.0118, + "step": 481780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266962343920514, + "loss": 0.0109, + "step": 481790 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266573522283367, + "loss": 0.0101, + "step": 481800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011266184700646221, + "loss": 0.012, + "step": 481810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011265795879009074, + "loss": 0.0092, + "step": 481820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011265407057371927, + "loss": 0.0098, + "step": 481830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011265018235734781, + "loss": 0.0141, + "step": 481840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011264629414097634, + "loss": 0.009, + "step": 481850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011264240592460488, + "loss": 0.0092, + "step": 481860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263851770823341, + "loss": 0.0089, + "step": 481870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263462949186195, + "loss": 0.0085, + "step": 481880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011263074127549048, + "loss": 0.0113, + "step": 481890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011262685305911903, + "loss": 0.0169, + "step": 481900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011262296484274755, + "loss": 0.0111, + "step": 481910 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126190766263761, + "loss": 0.0108, + "step": 481920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011261518841000463, + "loss": 0.0114, + "step": 481930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011261130019363317, + "loss": 0.0093, + "step": 481940 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001126074119772617, + "loss": 0.0127, + "step": 481950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011260352376089024, + "loss": 0.0096, + "step": 481960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011259963554451877, + "loss": 0.0095, + "step": 481970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011259574732814731, + "loss": 0.0088, + "step": 481980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011259185911177584, + "loss": 0.0082, + "step": 481990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011258797089540438, + "loss": 0.0084, + "step": 482000 + }, + { + "epoch": 1.25, + "eval_cer": 0.8817404765203906, + "eval_loss": 0.0068023488856852055, + "eval_runtime": 107.9256, + "eval_samples_per_second": 18.531, + "eval_steps_per_second": 4.633, + "step": 482000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011258408267903291, + "loss": 0.0117, + "step": 482010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011258019446266145, + "loss": 0.0093, + "step": 482020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011257630624628998, + "loss": 0.0091, + "step": 482030 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011257241802991852, + "loss": 0.009, + "step": 482040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011256852981354705, + "loss": 0.0155, + "step": 482050 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001125646415971756, + "loss": 0.0116, + "step": 482060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011256075338080412, + "loss": 0.0093, + "step": 482070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011255686516443265, + "loss": 0.0097, + "step": 482080 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001125529769480612, + "loss": 0.0132, + "step": 482090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011254908873168973, + "loss": 0.0089, + "step": 482100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011254520051531827, + "loss": 0.0136, + "step": 482110 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001125413122989468, + "loss": 0.0141, + "step": 482120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011253742408257534, + "loss": 0.0161, + "step": 482130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011253353586620387, + "loss": 0.0105, + "step": 482140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011252964764983241, + "loss": 0.0099, + "step": 482150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011252575943346094, + "loss": 0.0115, + "step": 482160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011252187121708948, + "loss": 0.0084, + "step": 482170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251798300071801, + "loss": 0.0106, + "step": 482180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251409478434655, + "loss": 0.012, + "step": 482190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011251020656797508, + "loss": 0.0149, + "step": 482200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011250631835160362, + "loss": 0.0098, + "step": 482210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011250243013523215, + "loss": 0.0108, + "step": 482220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011249854191886069, + "loss": 0.0081, + "step": 482230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011249465370248922, + "loss": 0.0149, + "step": 482240 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011249076548611777, + "loss": 0.0159, + "step": 482250 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001124868772697463, + "loss": 0.0126, + "step": 482260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011248298905337484, + "loss": 0.0106, + "step": 482270 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011247910083700337, + "loss": 0.0092, + "step": 482280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011247521262063191, + "loss": 0.0133, + "step": 482290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011247132440426044, + "loss": 0.011, + "step": 482300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011246743618788898, + "loss": 0.0128, + "step": 482310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011246354797151751, + "loss": 0.0089, + "step": 482320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011245965975514604, + "loss": 0.0083, + "step": 482330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011245577153877458, + "loss": 0.0124, + "step": 482340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011245188332240311, + "loss": 0.0105, + "step": 482350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244799510603165, + "loss": 0.0101, + "step": 482360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244410688966018, + "loss": 0.0091, + "step": 482370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011244021867328872, + "loss": 0.0094, + "step": 482380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011243633045691725, + "loss": 0.0091, + "step": 482390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011243244224054579, + "loss": 0.0136, + "step": 482400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011242855402417432, + "loss": 0.0087, + "step": 482410 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011242466580780287, + "loss": 0.0104, + "step": 482420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011242077759143139, + "loss": 0.0102, + "step": 482430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011241688937505994, + "loss": 0.0109, + "step": 482440 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011241300115868847, + "loss": 0.0089, + "step": 482450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011240911294231701, + "loss": 0.0098, + "step": 482460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011240522472594554, + "loss": 0.0098, + "step": 482470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011240133650957408, + "loss": 0.0113, + "step": 482480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011239744829320261, + "loss": 0.0123, + "step": 482490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011239356007683115, + "loss": 0.0135, + "step": 482500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011238967186045968, + "loss": 0.0095, + "step": 482510 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011238578364408822, + "loss": 0.0111, + "step": 482520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011238189542771675, + "loss": 0.0137, + "step": 482530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011237800721134529, + "loss": 0.0071, + "step": 482540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011237411899497382, + "loss": 0.0119, + "step": 482550 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011237023077860236, + "loss": 0.0079, + "step": 482560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011236634256223089, + "loss": 0.0069, + "step": 482570 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011236245434585942, + "loss": 0.009, + "step": 482580 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235856612948796, + "loss": 0.0109, + "step": 482590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235467791311649, + "loss": 0.01, + "step": 482600 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011235078969674504, + "loss": 0.0098, + "step": 482610 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011234690148037357, + "loss": 0.0121, + "step": 482620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011234301326400211, + "loss": 0.0123, + "step": 482630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011233912504763064, + "loss": 0.0107, + "step": 482640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011233523683125918, + "loss": 0.0098, + "step": 482650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011233134861488771, + "loss": 0.012, + "step": 482660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011232746039851625, + "loss": 0.0102, + "step": 482670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011232357218214478, + "loss": 0.0106, + "step": 482680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011231968396577332, + "loss": 0.01, + "step": 482690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011231579574940185, + "loss": 0.0107, + "step": 482700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011231190753303039, + "loss": 0.0112, + "step": 482710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011230801931665892, + "loss": 0.0112, + "step": 482720 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011230413110028746, + "loss": 0.0124, + "step": 482730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011230024288391599, + "loss": 0.0109, + "step": 482740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011229635466754453, + "loss": 0.0082, + "step": 482750 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011229246645117306, + "loss": 0.0138, + "step": 482760 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011228857823480161, + "loss": 0.0109, + "step": 482770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011228469001843014, + "loss": 0.01, + "step": 482780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011228080180205868, + "loss": 0.0095, + "step": 482790 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011227691358568721, + "loss": 0.0139, + "step": 482800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011227302536931575, + "loss": 0.0134, + "step": 482810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011226913715294428, + "loss": 0.0159, + "step": 482820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011226524893657281, + "loss": 0.0097, + "step": 482830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011226136072020135, + "loss": 0.0149, + "step": 482840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011225747250382988, + "loss": 0.0092, + "step": 482850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011225358428745842, + "loss": 0.0106, + "step": 482860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011224969607108695, + "loss": 0.0128, + "step": 482870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011224580785471549, + "loss": 0.0114, + "step": 482880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011224191963834402, + "loss": 0.0074, + "step": 482890 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223803142197256, + "loss": 0.0113, + "step": 482900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223414320560109, + "loss": 0.0105, + "step": 482910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011223025498922963, + "loss": 0.0127, + "step": 482920 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011222636677285816, + "loss": 0.0138, + "step": 482930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011222247855648671, + "loss": 0.0109, + "step": 482940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011221859034011523, + "loss": 0.0128, + "step": 482950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011221470212374378, + "loss": 0.0094, + "step": 482960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011221081390737231, + "loss": 0.0131, + "step": 482970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011220692569100085, + "loss": 0.0131, + "step": 482980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011220303747462938, + "loss": 0.0117, + "step": 482990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011219914925825792, + "loss": 0.0086, + "step": 483000 + }, + { + "epoch": 1.25, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.006821894086897373, + "eval_runtime": 108.1122, + "eval_samples_per_second": 18.499, + "eval_steps_per_second": 4.625, + "step": 483000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011219526104188645, + "loss": 0.0116, + "step": 483010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011219137282551499, + "loss": 0.0119, + "step": 483020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011218748460914352, + "loss": 0.0102, + "step": 483030 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011218359639277206, + "loss": 0.0115, + "step": 483040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011217970817640059, + "loss": 0.0167, + "step": 483050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011217581996002913, + "loss": 0.0088, + "step": 483060 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011217193174365766, + "loss": 0.0074, + "step": 483070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216804352728619, + "loss": 0.0087, + "step": 483080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216415531091473, + "loss": 0.0137, + "step": 483090 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011216026709454326, + "loss": 0.0126, + "step": 483100 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001121563788781718, + "loss": 0.0093, + "step": 483110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011215249066180033, + "loss": 0.0106, + "step": 483120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011214860244542888, + "loss": 0.0124, + "step": 483130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011214471422905741, + "loss": 0.009, + "step": 483140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011214082601268595, + "loss": 0.0108, + "step": 483150 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011213693779631448, + "loss": 0.0112, + "step": 483160 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011213304957994302, + "loss": 0.0093, + "step": 483170 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011212916136357155, + "loss": 0.0098, + "step": 483180 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011212527314720009, + "loss": 0.0101, + "step": 483190 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011212138493082862, + "loss": 0.0141, + "step": 483200 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011211749671445716, + "loss": 0.0114, + "step": 483210 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011211360849808569, + "loss": 0.0178, + "step": 483220 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011210972028171423, + "loss": 0.01, + "step": 483230 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011210583206534276, + "loss": 0.0098, + "step": 483240 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001121019438489713, + "loss": 0.0075, + "step": 483250 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011209805563259983, + "loss": 0.0121, + "step": 483260 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011209416741622837, + "loss": 0.0113, + "step": 483270 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001120902791998569, + "loss": 0.0106, + "step": 483280 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011208639098348545, + "loss": 0.0082, + "step": 483290 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011208250276711397, + "loss": 0.0065, + "step": 483300 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207861455074252, + "loss": 0.0135, + "step": 483310 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207472633437105, + "loss": 0.0109, + "step": 483320 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011207083811799958, + "loss": 0.0103, + "step": 483330 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011206694990162812, + "loss": 0.0088, + "step": 483340 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011206306168525665, + "loss": 0.0115, + "step": 483350 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011205917346888519, + "loss": 0.0078, + "step": 483360 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011205528525251372, + "loss": 0.0103, + "step": 483370 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011205139703614226, + "loss": 0.0113, + "step": 483380 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011204750881977079, + "loss": 0.0135, + "step": 483390 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011204362060339933, + "loss": 0.0099, + "step": 483400 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011203973238702786, + "loss": 0.0099, + "step": 483410 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001120358441706564, + "loss": 0.0093, + "step": 483420 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011203195595428493, + "loss": 0.012, + "step": 483430 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011202806773791347, + "loss": 0.0104, + "step": 483440 + }, + { + "epoch": 1.25, + "learning_rate": 0.000112024179521542, + "loss": 0.0102, + "step": 483450 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011202029130517054, + "loss": 0.0105, + "step": 483460 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011201640308879907, + "loss": 0.0118, + "step": 483470 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011201251487242762, + "loss": 0.0102, + "step": 483480 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011200862665605615, + "loss": 0.01, + "step": 483490 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011200473843968469, + "loss": 0.0115, + "step": 483500 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011200085022331322, + "loss": 0.0114, + "step": 483510 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011199696200694176, + "loss": 0.0098, + "step": 483520 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011199307379057029, + "loss": 0.0122, + "step": 483530 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011198918557419883, + "loss": 0.0075, + "step": 483540 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011198529735782736, + "loss": 0.0105, + "step": 483550 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011198140914145589, + "loss": 0.0106, + "step": 483560 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011197752092508443, + "loss": 0.0112, + "step": 483570 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011197363270871296, + "loss": 0.013, + "step": 483580 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001119697444923415, + "loss": 0.0128, + "step": 483590 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011196585627597003, + "loss": 0.0134, + "step": 483600 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011196196805959857, + "loss": 0.0152, + "step": 483610 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001119580798432271, + "loss": 0.0071, + "step": 483620 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011195419162685564, + "loss": 0.0101, + "step": 483630 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011195030341048417, + "loss": 0.0149, + "step": 483640 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011194641519411272, + "loss": 0.0089, + "step": 483650 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011194252697774124, + "loss": 0.0098, + "step": 483660 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193863876136979, + "loss": 0.012, + "step": 483670 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193475054499832, + "loss": 0.0097, + "step": 483680 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011193086232862686, + "loss": 0.0115, + "step": 483690 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011192697411225539, + "loss": 0.0126, + "step": 483700 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011192308589588393, + "loss": 0.0116, + "step": 483710 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011191919767951246, + "loss": 0.0131, + "step": 483720 + }, + { + "epoch": 1.25, + "learning_rate": 0.000111915309463141, + "loss": 0.011, + "step": 483730 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011191142124676953, + "loss": 0.0111, + "step": 483740 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011190753303039807, + "loss": 0.0155, + "step": 483750 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001119036448140266, + "loss": 0.0101, + "step": 483760 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011189975659765514, + "loss": 0.011, + "step": 483770 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011189586838128367, + "loss": 0.013, + "step": 483780 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011189198016491221, + "loss": 0.0109, + "step": 483790 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011188809194854074, + "loss": 0.011, + "step": 483800 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011188420373216927, + "loss": 0.009, + "step": 483810 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011188031551579781, + "loss": 0.0121, + "step": 483820 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011187642729942634, + "loss": 0.0114, + "step": 483830 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011187253908305489, + "loss": 0.0137, + "step": 483840 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011186865086668342, + "loss": 0.0082, + "step": 483850 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011186476265031196, + "loss": 0.0125, + "step": 483860 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011186087443394049, + "loss": 0.0106, + "step": 483870 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011185698621756903, + "loss": 0.0132, + "step": 483880 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011185309800119756, + "loss": 0.01, + "step": 483890 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118492097848261, + "loss": 0.0093, + "step": 483900 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011184532156845463, + "loss": 0.0088, + "step": 483910 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011184143335208317, + "loss": 0.011, + "step": 483920 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001118375451357117, + "loss": 0.0109, + "step": 483930 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011183365691934024, + "loss": 0.0096, + "step": 483940 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182976870296877, + "loss": 0.0115, + "step": 483950 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182588048659731, + "loss": 0.0101, + "step": 483960 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011182199227022584, + "loss": 0.0109, + "step": 483970 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011181810405385438, + "loss": 0.0112, + "step": 483980 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011181421583748291, + "loss": 0.0116, + "step": 483990 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011181032762111146, + "loss": 0.0101, + "step": 484000 + }, + { + "epoch": 1.25, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.0068328119814395905, + "eval_runtime": 108.0595, + "eval_samples_per_second": 18.508, + "eval_steps_per_second": 4.627, + "step": 484000 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011180643940473999, + "loss": 0.0086, + "step": 484010 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011180255118836853, + "loss": 0.0102, + "step": 484020 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011179866297199706, + "loss": 0.0113, + "step": 484030 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001117947747556256, + "loss": 0.0096, + "step": 484040 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011179088653925413, + "loss": 0.0107, + "step": 484050 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011178699832288266, + "loss": 0.0091, + "step": 484060 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001117831101065112, + "loss": 0.0125, + "step": 484070 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011177922189013973, + "loss": 0.0098, + "step": 484080 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011177533367376827, + "loss": 0.0119, + "step": 484090 + }, + { + "epoch": 1.25, + "learning_rate": 0.0001117714454573968, + "loss": 0.0104, + "step": 484100 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011176755724102534, + "loss": 0.0085, + "step": 484110 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011176366902465387, + "loss": 0.0104, + "step": 484120 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011175978080828241, + "loss": 0.0097, + "step": 484130 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011175589259191094, + "loss": 0.0102, + "step": 484140 + }, + { + "epoch": 1.25, + "learning_rate": 0.00011175200437553948, + "loss": 0.0092, + "step": 484150 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111748116159168, + "loss": 0.0101, + "step": 484160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011174422794279656, + "loss": 0.0125, + "step": 484170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011174033972642508, + "loss": 0.0101, + "step": 484180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011173645151005363, + "loss": 0.0082, + "step": 484190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011173256329368216, + "loss": 0.0116, + "step": 484200 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001117286750773107, + "loss": 0.0109, + "step": 484210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011172478686093923, + "loss": 0.01, + "step": 484220 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011172089864456777, + "loss": 0.0093, + "step": 484230 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001117170104281963, + "loss": 0.0096, + "step": 484240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011171312221182484, + "loss": 0.0096, + "step": 484250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170923399545337, + "loss": 0.0102, + "step": 484260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170534577908191, + "loss": 0.0083, + "step": 484270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011170145756271044, + "loss": 0.0111, + "step": 484280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011169756934633898, + "loss": 0.0115, + "step": 484290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011169368112996751, + "loss": 0.0094, + "step": 484300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011168979291359604, + "loss": 0.0114, + "step": 484310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011168590469722458, + "loss": 0.0126, + "step": 484320 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001116820164808531, + "loss": 0.0106, + "step": 484330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167812826448165, + "loss": 0.013, + "step": 484340 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167424004811018, + "loss": 0.0105, + "step": 484350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011167035183173873, + "loss": 0.0095, + "step": 484360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011166646361536726, + "loss": 0.009, + "step": 484370 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001116625753989958, + "loss": 0.0101, + "step": 484380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011165868718262433, + "loss": 0.0145, + "step": 484390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011165479896625287, + "loss": 0.0094, + "step": 484400 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001116509107498814, + "loss": 0.0152, + "step": 484410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011164702253350994, + "loss": 0.01, + "step": 484420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011164313431713847, + "loss": 0.0098, + "step": 484430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011163924610076701, + "loss": 0.0094, + "step": 484440 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011163535788439554, + "loss": 0.0128, + "step": 484450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011163146966802408, + "loss": 0.0098, + "step": 484460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011162758145165261, + "loss": 0.0085, + "step": 484470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011162369323528115, + "loss": 0.0107, + "step": 484480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011161980501890968, + "loss": 0.0122, + "step": 484490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011161591680253822, + "loss": 0.0084, + "step": 484500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011161202858616675, + "loss": 0.0087, + "step": 484510 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001116081403697953, + "loss": 0.0123, + "step": 484520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011160425215342382, + "loss": 0.0112, + "step": 484530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011160036393705237, + "loss": 0.0079, + "step": 484540 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001115964757206809, + "loss": 0.0105, + "step": 484550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011159258750430943, + "loss": 0.0123, + "step": 484560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011158869928793797, + "loss": 0.0108, + "step": 484570 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001115848110715665, + "loss": 0.0108, + "step": 484580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011158092285519504, + "loss": 0.0141, + "step": 484590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011157703463882357, + "loss": 0.0116, + "step": 484600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011157314642245211, + "loss": 0.0133, + "step": 484610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011156925820608064, + "loss": 0.0107, + "step": 484620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011156536998970918, + "loss": 0.009, + "step": 484630 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001115614817733377, + "loss": 0.0121, + "step": 484640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011155759355696625, + "loss": 0.0115, + "step": 484650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011155370534059478, + "loss": 0.0084, + "step": 484660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154981712422332, + "loss": 0.008, + "step": 484670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154592890785185, + "loss": 0.0123, + "step": 484680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011154204069148039, + "loss": 0.0097, + "step": 484690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011153815247510892, + "loss": 0.0122, + "step": 484700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011153426425873747, + "loss": 0.0124, + "step": 484710 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111530376042366, + "loss": 0.01, + "step": 484720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011152648782599454, + "loss": 0.0132, + "step": 484730 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011152259960962307, + "loss": 0.0099, + "step": 484740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011151871139325161, + "loss": 0.0103, + "step": 484750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011151482317688014, + "loss": 0.0117, + "step": 484760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011151093496050868, + "loss": 0.0094, + "step": 484770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011150704674413721, + "loss": 0.0099, + "step": 484780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011150315852776575, + "loss": 0.0107, + "step": 484790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011149927031139428, + "loss": 0.0098, + "step": 484800 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001114953820950228, + "loss": 0.0088, + "step": 484810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011149149387865135, + "loss": 0.0082, + "step": 484820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011148760566227988, + "loss": 0.0108, + "step": 484830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011148371744590842, + "loss": 0.0101, + "step": 484840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011147982922953695, + "loss": 0.0131, + "step": 484850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011147594101316549, + "loss": 0.0094, + "step": 484860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011147205279679402, + "loss": 0.0118, + "step": 484870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011146816458042257, + "loss": 0.0086, + "step": 484880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011146427636405109, + "loss": 0.0111, + "step": 484890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011146038814767964, + "loss": 0.01, + "step": 484900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011145649993130817, + "loss": 0.0089, + "step": 484910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011145261171493671, + "loss": 0.0155, + "step": 484920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011144872349856524, + "loss": 0.0098, + "step": 484930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011144483528219378, + "loss": 0.0091, + "step": 484940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011144094706582231, + "loss": 0.0107, + "step": 484950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011143705884945085, + "loss": 0.0082, + "step": 484960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011143317063307938, + "loss": 0.0144, + "step": 484970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142928241670792, + "loss": 0.0134, + "step": 484980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142539420033645, + "loss": 0.0102, + "step": 484990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011142150598396499, + "loss": 0.0097, + "step": 485000 + }, + { + "epoch": 1.26, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.006655857898294926, + "eval_runtime": 107.9871, + "eval_samples_per_second": 18.521, + "eval_steps_per_second": 4.63, + "step": 485000 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011141761776759352, + "loss": 0.0088, + "step": 485010 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011141372955122206, + "loss": 0.0101, + "step": 485020 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011140984133485059, + "loss": 0.013, + "step": 485030 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011140595311847914, + "loss": 0.0106, + "step": 485040 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011140206490210766, + "loss": 0.0111, + "step": 485050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139817668573618, + "loss": 0.0115, + "step": 485060 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139428846936474, + "loss": 0.0099, + "step": 485070 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011139040025299327, + "loss": 0.0101, + "step": 485080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011138651203662181, + "loss": 0.0118, + "step": 485090 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011138262382025034, + "loss": 0.0145, + "step": 485100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011137873560387888, + "loss": 0.0095, + "step": 485110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011137484738750741, + "loss": 0.0103, + "step": 485120 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011137095917113595, + "loss": 0.0094, + "step": 485130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011136707095476448, + "loss": 0.0106, + "step": 485140 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011136318273839302, + "loss": 0.0097, + "step": 485150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011135929452202155, + "loss": 0.0118, + "step": 485160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011135540630565009, + "loss": 0.0106, + "step": 485170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011135151808927862, + "loss": 0.0089, + "step": 485180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011134762987290716, + "loss": 0.0127, + "step": 485190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011134374165653569, + "loss": 0.0111, + "step": 485200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011133985344016423, + "loss": 0.0114, + "step": 485210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011133596522379276, + "loss": 0.0133, + "step": 485220 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011133207700742131, + "loss": 0.0103, + "step": 485230 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132818879104984, + "loss": 0.0117, + "step": 485240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132430057467838, + "loss": 0.0087, + "step": 485250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011132041235830691, + "loss": 0.0102, + "step": 485260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011131652414193545, + "loss": 0.0106, + "step": 485270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011131263592556398, + "loss": 0.0082, + "step": 485280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011130874770919252, + "loss": 0.0077, + "step": 485290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011130485949282105, + "loss": 0.0106, + "step": 485300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011130097127644958, + "loss": 0.0107, + "step": 485310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011129708306007812, + "loss": 0.0083, + "step": 485320 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011129319484370665, + "loss": 0.01, + "step": 485330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011128930662733519, + "loss": 0.01, + "step": 485340 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011128541841096372, + "loss": 0.0134, + "step": 485350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011128153019459226, + "loss": 0.0096, + "step": 485360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011127764197822079, + "loss": 0.012, + "step": 485370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011127375376184933, + "loss": 0.0075, + "step": 485380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126986554547786, + "loss": 0.0094, + "step": 485390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126597732910641, + "loss": 0.0102, + "step": 485400 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011126208911273492, + "loss": 0.0103, + "step": 485410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011125820089636348, + "loss": 0.0114, + "step": 485420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011125431267999201, + "loss": 0.0104, + "step": 485430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011125042446362055, + "loss": 0.0092, + "step": 485440 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011124653624724908, + "loss": 0.0098, + "step": 485450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011124264803087762, + "loss": 0.0093, + "step": 485460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011123875981450615, + "loss": 0.0136, + "step": 485470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011123487159813469, + "loss": 0.0102, + "step": 485480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011123098338176322, + "loss": 0.0102, + "step": 485490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011122709516539176, + "loss": 0.014, + "step": 485500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011122320694902029, + "loss": 0.0141, + "step": 485510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011121931873264883, + "loss": 0.0117, + "step": 485520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011121543051627736, + "loss": 0.0104, + "step": 485530 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001112115422999059, + "loss": 0.0104, + "step": 485540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011120765408353443, + "loss": 0.0088, + "step": 485550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011120376586716295, + "loss": 0.0111, + "step": 485560 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001111998776507915, + "loss": 0.009, + "step": 485570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011119598943442002, + "loss": 0.0089, + "step": 485580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011119210121804858, + "loss": 0.0075, + "step": 485590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011118821300167711, + "loss": 0.0108, + "step": 485600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011118432478530565, + "loss": 0.0092, + "step": 485610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011118043656893418, + "loss": 0.01, + "step": 485620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011117654835256272, + "loss": 0.0111, + "step": 485630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011117266013619125, + "loss": 0.0095, + "step": 485640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011116877191981979, + "loss": 0.0084, + "step": 485650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011116488370344832, + "loss": 0.0124, + "step": 485660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011116099548707686, + "loss": 0.0148, + "step": 485670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011115710727070539, + "loss": 0.016, + "step": 485680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011115321905433393, + "loss": 0.0112, + "step": 485690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011114933083796246, + "loss": 0.0103, + "step": 485700 + }, + { + "epoch": 1.26, + "learning_rate": 0.000111145442621591, + "loss": 0.01, + "step": 485710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011114155440521953, + "loss": 0.0105, + "step": 485720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011113766618884807, + "loss": 0.0109, + "step": 485730 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001111337779724766, + "loss": 0.0098, + "step": 485740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011112988975610515, + "loss": 0.0088, + "step": 485750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011112600153973368, + "loss": 0.011, + "step": 485760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011112211332336222, + "loss": 0.0113, + "step": 485770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111822510699075, + "loss": 0.0083, + "step": 485780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111433689061929, + "loss": 0.012, + "step": 485790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011111044867424782, + "loss": 0.0116, + "step": 485800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011110656045787635, + "loss": 0.0116, + "step": 485810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011110267224150489, + "loss": 0.0145, + "step": 485820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011109878402513342, + "loss": 0.0087, + "step": 485830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011109489580876196, + "loss": 0.0094, + "step": 485840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011109100759239049, + "loss": 0.0116, + "step": 485850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011108711937601903, + "loss": 0.0131, + "step": 485860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011108323115964756, + "loss": 0.0091, + "step": 485870 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110793429432761, + "loss": 0.0105, + "step": 485880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011107545472690463, + "loss": 0.0075, + "step": 485890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011107156651053317, + "loss": 0.0099, + "step": 485900 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110676782941617, + "loss": 0.011, + "step": 485910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011106379007779024, + "loss": 0.0117, + "step": 485920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011105990186141876, + "loss": 0.0116, + "step": 485930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011105601364504732, + "loss": 0.0074, + "step": 485940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011105212542867585, + "loss": 0.0082, + "step": 485950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104823721230439, + "loss": 0.0112, + "step": 485960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104434899593292, + "loss": 0.0121, + "step": 485970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011104046077956146, + "loss": 0.0108, + "step": 485980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011103657256318999, + "loss": 0.0106, + "step": 485990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011103268434681853, + "loss": 0.012, + "step": 486000 + }, + { + "epoch": 1.26, + "eval_cer": 0.8816550986674057, + "eval_loss": 0.006589991506189108, + "eval_runtime": 108.066, + "eval_samples_per_second": 18.507, + "eval_steps_per_second": 4.627, + "step": 486000 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011102879613044706, + "loss": 0.0113, + "step": 486010 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110249079140756, + "loss": 0.0146, + "step": 486020 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011102101969770413, + "loss": 0.0101, + "step": 486030 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011101713148133267, + "loss": 0.0102, + "step": 486040 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110132432649612, + "loss": 0.0092, + "step": 486050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011100935504858972, + "loss": 0.0102, + "step": 486060 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011100546683221827, + "loss": 0.0116, + "step": 486070 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001110015786158468, + "loss": 0.0148, + "step": 486080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011099769039947534, + "loss": 0.0085, + "step": 486090 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011099380218310386, + "loss": 0.0128, + "step": 486100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098991396673242, + "loss": 0.0108, + "step": 486110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098602575036093, + "loss": 0.01, + "step": 486120 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011098213753398949, + "loss": 0.0099, + "step": 486130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011097824931761802, + "loss": 0.008, + "step": 486140 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011097436110124656, + "loss": 0.011, + "step": 486150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011097047288487509, + "loss": 0.0106, + "step": 486160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011096658466850363, + "loss": 0.0091, + "step": 486170 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011096269645213216, + "loss": 0.014, + "step": 486180 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109588082357607, + "loss": 0.0116, + "step": 486190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011095492001938923, + "loss": 0.0113, + "step": 486200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011095103180301777, + "loss": 0.0092, + "step": 486210 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109471435866463, + "loss": 0.011, + "step": 486220 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011094325537027484, + "loss": 0.0103, + "step": 486230 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011093936715390337, + "loss": 0.0101, + "step": 486240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011093547893753191, + "loss": 0.0117, + "step": 486250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011093159072116044, + "loss": 0.0081, + "step": 486260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011092770250478899, + "loss": 0.0098, + "step": 486270 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001109238142884175, + "loss": 0.0096, + "step": 486280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011091992607204603, + "loss": 0.0091, + "step": 486290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011091603785567459, + "loss": 0.0095, + "step": 486300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011091214963930312, + "loss": 0.0097, + "step": 486310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011090826142293166, + "loss": 0.0123, + "step": 486320 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011090437320656019, + "loss": 0.0085, + "step": 486330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011090048499018873, + "loss": 0.0097, + "step": 486340 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011089659677381726, + "loss": 0.0098, + "step": 486350 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108927085574458, + "loss": 0.0092, + "step": 486360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011088882034107433, + "loss": 0.0096, + "step": 486370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011088493212470287, + "loss": 0.0074, + "step": 486380 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108810439083314, + "loss": 0.0082, + "step": 486390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011087715569195994, + "loss": 0.0095, + "step": 486400 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011087326747558847, + "loss": 0.0128, + "step": 486410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086937925921701, + "loss": 0.0123, + "step": 486420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086549104284553, + "loss": 0.0106, + "step": 486430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011086160282647408, + "loss": 0.0105, + "step": 486440 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108577146101026, + "loss": 0.016, + "step": 486450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011085382639373116, + "loss": 0.0138, + "step": 486460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011084993817735969, + "loss": 0.0091, + "step": 486470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011084604996098823, + "loss": 0.0077, + "step": 486480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011084216174461676, + "loss": 0.0085, + "step": 486490 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108382735282453, + "loss": 0.0119, + "step": 486500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011083438531187383, + "loss": 0.0105, + "step": 486510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011083049709550237, + "loss": 0.0104, + "step": 486520 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108266088791309, + "loss": 0.0128, + "step": 486530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011082272066275943, + "loss": 0.0126, + "step": 486540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011081883244638797, + "loss": 0.01, + "step": 486550 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108149442300165, + "loss": 0.0121, + "step": 486560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011081105601364504, + "loss": 0.0084, + "step": 486570 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011080716779727356, + "loss": 0.0126, + "step": 486580 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001108032795809021, + "loss": 0.0099, + "step": 486590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011079939136453063, + "loss": 0.0098, + "step": 486600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011079550314815918, + "loss": 0.0104, + "step": 486610 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107916149317877, + "loss": 0.012, + "step": 486620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011078772671541626, + "loss": 0.0152, + "step": 486630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011078383849904477, + "loss": 0.0105, + "step": 486640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011077995028267333, + "loss": 0.0108, + "step": 486650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011077606206630186, + "loss": 0.012, + "step": 486660 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107721738499304, + "loss": 0.013, + "step": 486670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011076828563355893, + "loss": 0.0105, + "step": 486680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011076439741718747, + "loss": 0.01, + "step": 486690 + }, + { + "epoch": 1.26, + "learning_rate": 0.000110760509200816, + "loss": 0.0146, + "step": 486700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011075662098444454, + "loss": 0.0114, + "step": 486710 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011075273276807307, + "loss": 0.0079, + "step": 486720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011074884455170161, + "loss": 0.0077, + "step": 486730 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011074495633533014, + "loss": 0.0125, + "step": 486740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011074106811895868, + "loss": 0.0079, + "step": 486750 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107371799025872, + "loss": 0.012, + "step": 486760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011073329168621575, + "loss": 0.0095, + "step": 486770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011072940346984428, + "loss": 0.0148, + "step": 486780 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107255152534728, + "loss": 0.0133, + "step": 486790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011072162703710135, + "loss": 0.0094, + "step": 486800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011071773882072987, + "loss": 0.0101, + "step": 486810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011071385060435843, + "loss": 0.0111, + "step": 486820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011070996238798696, + "loss": 0.0121, + "step": 486830 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001107060741716155, + "loss": 0.0132, + "step": 486840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011070218595524403, + "loss": 0.0116, + "step": 486850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011069829773887257, + "loss": 0.0119, + "step": 486860 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106944095225011, + "loss": 0.0089, + "step": 486870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011069052130612964, + "loss": 0.0144, + "step": 486880 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011068663308975817, + "loss": 0.0073, + "step": 486890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011068274487338671, + "loss": 0.0131, + "step": 486900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011067885665701524, + "loss": 0.0091, + "step": 486910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011067496844064378, + "loss": 0.0093, + "step": 486920 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106710802242723, + "loss": 0.0105, + "step": 486930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011066719200790085, + "loss": 0.011, + "step": 486940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011066330379152937, + "loss": 0.0097, + "step": 486950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011065941557515792, + "loss": 0.0068, + "step": 486960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011065552735878644, + "loss": 0.0113, + "step": 486970 + }, + { + "epoch": 1.26, + "learning_rate": 0.000110651639142415, + "loss": 0.0103, + "step": 486980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011064775092604353, + "loss": 0.0088, + "step": 486990 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011064386270967207, + "loss": 0.0107, + "step": 487000 + }, + { + "epoch": 1.26, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.0066790650598704815, + "eval_runtime": 108.1004, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, + "step": 487000 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106399744933006, + "loss": 0.0097, + "step": 487010 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011063608627692914, + "loss": 0.0121, + "step": 487020 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011063219806055767, + "loss": 0.0081, + "step": 487030 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106283098441862, + "loss": 0.0098, + "step": 487040 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011062442162781474, + "loss": 0.0128, + "step": 487050 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011062053341144327, + "loss": 0.0141, + "step": 487060 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011061664519507181, + "loss": 0.0104, + "step": 487070 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011061275697870033, + "loss": 0.0077, + "step": 487080 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011060886876232888, + "loss": 0.0102, + "step": 487090 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001106049805459574, + "loss": 0.0143, + "step": 487100 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011060109232958595, + "loss": 0.0094, + "step": 487110 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011059720411321447, + "loss": 0.0103, + "step": 487120 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011059331589684302, + "loss": 0.011, + "step": 487130 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011058942768047154, + "loss": 0.0092, + "step": 487140 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105855394641001, + "loss": 0.0095, + "step": 487150 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011058165124772861, + "loss": 0.007, + "step": 487160 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011057776303135717, + "loss": 0.0104, + "step": 487170 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105738748149857, + "loss": 0.0141, + "step": 487180 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011056998659861424, + "loss": 0.0103, + "step": 487190 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011056609838224277, + "loss": 0.0094, + "step": 487200 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011056221016587131, + "loss": 0.0124, + "step": 487210 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011055832194949984, + "loss": 0.0125, + "step": 487220 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011055443373312838, + "loss": 0.0073, + "step": 487230 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105505455167569, + "loss": 0.0095, + "step": 487240 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011054665730038545, + "loss": 0.0116, + "step": 487250 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011054276908401398, + "loss": 0.0105, + "step": 487260 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011053888086764252, + "loss": 0.0096, + "step": 487270 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011053499265127105, + "loss": 0.0105, + "step": 487280 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011053110443489957, + "loss": 0.0079, + "step": 487290 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011052721621852812, + "loss": 0.0092, + "step": 487300 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011052332800215664, + "loss": 0.0104, + "step": 487310 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011051943978578519, + "loss": 0.0104, + "step": 487320 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011051555156941371, + "loss": 0.0122, + "step": 487330 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011051166335304227, + "loss": 0.0096, + "step": 487340 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001105077751366708, + "loss": 0.0086, + "step": 487350 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011050388692029934, + "loss": 0.0107, + "step": 487360 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011049999870392787, + "loss": 0.0103, + "step": 487370 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011049611048755641, + "loss": 0.011, + "step": 487380 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011049222227118494, + "loss": 0.0092, + "step": 487390 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011048833405481348, + "loss": 0.0115, + "step": 487400 + }, + { + "epoch": 1.26, + "learning_rate": 0.000110484445838442, + "loss": 0.0115, + "step": 487410 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011048055762207055, + "loss": 0.0114, + "step": 487420 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011047666940569908, + "loss": 0.0093, + "step": 487430 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011047278118932762, + "loss": 0.0112, + "step": 487440 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011046889297295615, + "loss": 0.0101, + "step": 487450 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011046500475658469, + "loss": 0.0121, + "step": 487460 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011046111654021321, + "loss": 0.0106, + "step": 487470 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011045722832384176, + "loss": 0.0134, + "step": 487480 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011045334010747028, + "loss": 0.0107, + "step": 487490 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011044945189109884, + "loss": 0.0092, + "step": 487500 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011044556367472735, + "loss": 0.0109, + "step": 487510 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011044167545835591, + "loss": 0.0081, + "step": 487520 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011043778724198444, + "loss": 0.0128, + "step": 487530 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011043389902561297, + "loss": 0.0098, + "step": 487540 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011043001080924151, + "loss": 0.0097, + "step": 487550 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011042612259287004, + "loss": 0.009, + "step": 487560 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011042223437649858, + "loss": 0.0144, + "step": 487570 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001104183461601271, + "loss": 0.0088, + "step": 487580 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011041445794375565, + "loss": 0.0102, + "step": 487590 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011041056972738417, + "loss": 0.0122, + "step": 487600 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011040668151101272, + "loss": 0.0108, + "step": 487610 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011040279329464124, + "loss": 0.0142, + "step": 487620 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039890507826979, + "loss": 0.0112, + "step": 487630 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039501686189831, + "loss": 0.015, + "step": 487640 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011039112864552686, + "loss": 0.0127, + "step": 487650 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011038724042915538, + "loss": 0.0156, + "step": 487660 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011038335221278393, + "loss": 0.0223, + "step": 487670 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011037946399641245, + "loss": 0.008, + "step": 487680 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011037557578004101, + "loss": 0.0095, + "step": 487690 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011037168756366954, + "loss": 0.0083, + "step": 487700 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011036779934729808, + "loss": 0.0178, + "step": 487710 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001103639111309266, + "loss": 0.0099, + "step": 487720 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011036002291455515, + "loss": 0.0109, + "step": 487730 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011035613469818368, + "loss": 0.0129, + "step": 487740 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011035224648181222, + "loss": 0.0105, + "step": 487750 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011034835826544075, + "loss": 0.0093, + "step": 487760 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011034447004906929, + "loss": 0.0117, + "step": 487770 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011034058183269782, + "loss": 0.0077, + "step": 487780 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011033669361632634, + "loss": 0.0117, + "step": 487790 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011033280539995489, + "loss": 0.0124, + "step": 487800 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011032891718358341, + "loss": 0.011, + "step": 487810 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011032502896721196, + "loss": 0.0077, + "step": 487820 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011032114075084048, + "loss": 0.0138, + "step": 487830 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011031725253446903, + "loss": 0.0115, + "step": 487840 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011031336431809755, + "loss": 0.0129, + "step": 487850 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030947610172611, + "loss": 0.0106, + "step": 487860 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030558788535462, + "loss": 0.0132, + "step": 487870 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011030169966898318, + "loss": 0.013, + "step": 487880 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001102978114526117, + "loss": 0.0101, + "step": 487890 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011029392323624025, + "loss": 0.0091, + "step": 487900 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011029003501986878, + "loss": 0.0095, + "step": 487910 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011028614680349732, + "loss": 0.0118, + "step": 487920 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011028225858712585, + "loss": 0.0134, + "step": 487930 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011027837037075439, + "loss": 0.0135, + "step": 487940 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011027448215438292, + "loss": 0.0111, + "step": 487950 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011027059393801146, + "loss": 0.0097, + "step": 487960 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011026670572163998, + "loss": 0.0122, + "step": 487970 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011026281750526853, + "loss": 0.0113, + "step": 487980 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011025892928889705, + "loss": 0.0112, + "step": 487990 + }, + { + "epoch": 1.26, + "learning_rate": 0.0001102550410725256, + "loss": 0.0118, + "step": 488000 + }, + { + "epoch": 1.26, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.006483182776719332, + "eval_runtime": 108.0759, + "eval_samples_per_second": 18.506, + "eval_steps_per_second": 4.626, + "step": 488000 + }, + { + "epoch": 1.26, + "learning_rate": 0.00011025115285615412, + "loss": 0.0104, + "step": 488010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011024726463978268, + "loss": 0.013, + "step": 488020 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001102433764234112, + "loss": 0.0083, + "step": 488030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011023948820703972, + "loss": 0.0072, + "step": 488040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011023559999066828, + "loss": 0.0094, + "step": 488050 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001102317117742968, + "loss": 0.0112, + "step": 488060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011022782355792535, + "loss": 0.0139, + "step": 488070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011022393534155388, + "loss": 0.014, + "step": 488080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011022004712518242, + "loss": 0.0125, + "step": 488090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011021615890881094, + "loss": 0.0078, + "step": 488100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011021227069243949, + "loss": 0.0101, + "step": 488110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011020838247606801, + "loss": 0.0135, + "step": 488120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011020449425969656, + "loss": 0.0105, + "step": 488130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011020060604332508, + "loss": 0.0073, + "step": 488140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011019671782695363, + "loss": 0.0117, + "step": 488150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011019282961058215, + "loss": 0.0126, + "step": 488160 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001101889413942107, + "loss": 0.0092, + "step": 488170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011018505317783922, + "loss": 0.0125, + "step": 488180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011018116496146777, + "loss": 0.0103, + "step": 488190 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001101772767450963, + "loss": 0.0096, + "step": 488200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011017338852872485, + "loss": 0.0085, + "step": 488210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011016950031235338, + "loss": 0.0116, + "step": 488220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011016561209598192, + "loss": 0.0085, + "step": 488230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011016172387961045, + "loss": 0.009, + "step": 488240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011015783566323899, + "loss": 0.0092, + "step": 488250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011015394744686752, + "loss": 0.0094, + "step": 488260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011015005923049606, + "loss": 0.0092, + "step": 488270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011014617101412459, + "loss": 0.0082, + "step": 488280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011014228279775311, + "loss": 0.0078, + "step": 488290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011013839458138166, + "loss": 0.0099, + "step": 488300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011013450636501018, + "loss": 0.0108, + "step": 488310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011013061814863873, + "loss": 0.0099, + "step": 488320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011012672993226725, + "loss": 0.0121, + "step": 488330 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001101228417158958, + "loss": 0.0127, + "step": 488340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011011895349952432, + "loss": 0.0124, + "step": 488350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011011506528315286, + "loss": 0.0098, + "step": 488360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011011117706678139, + "loss": 0.0084, + "step": 488370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011010728885040995, + "loss": 0.0082, + "step": 488380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011010340063403846, + "loss": 0.0131, + "step": 488390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011009951241766702, + "loss": 0.0094, + "step": 488400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011009562420129555, + "loss": 0.0117, + "step": 488410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011009173598492409, + "loss": 0.0146, + "step": 488420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008784776855262, + "loss": 0.0136, + "step": 488430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008395955218116, + "loss": 0.0089, + "step": 488440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011008007133580969, + "loss": 0.0154, + "step": 488450 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011007618311943823, + "loss": 0.0116, + "step": 488460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011007229490306676, + "loss": 0.0113, + "step": 488470 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001100684066866953, + "loss": 0.0109, + "step": 488480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011006451847032382, + "loss": 0.009, + "step": 488490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011006063025395237, + "loss": 0.0091, + "step": 488500 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001100567420375809, + "loss": 0.0092, + "step": 488510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011005285382120944, + "loss": 0.009, + "step": 488520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011004896560483796, + "loss": 0.0093, + "step": 488530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011004507738846649, + "loss": 0.0084, + "step": 488540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011004118917209503, + "loss": 0.0103, + "step": 488550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011003730095572356, + "loss": 0.0085, + "step": 488560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011003341273935212, + "loss": 0.0125, + "step": 488570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002952452298065, + "loss": 0.0143, + "step": 488580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002563630660919, + "loss": 0.0115, + "step": 488590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011002174809023772, + "loss": 0.0123, + "step": 488600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011001785987386626, + "loss": 0.0095, + "step": 488610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011001397165749478, + "loss": 0.013, + "step": 488620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011001008344112333, + "loss": 0.0084, + "step": 488630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00011000619522475185, + "loss": 0.0128, + "step": 488640 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001100023070083804, + "loss": 0.0126, + "step": 488650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010999841879200892, + "loss": 0.0136, + "step": 488660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010999453057563747, + "loss": 0.0143, + "step": 488670 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109990642359266, + "loss": 0.0114, + "step": 488680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010998675414289454, + "loss": 0.01, + "step": 488690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010998286592652306, + "loss": 0.0098, + "step": 488700 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099789777101516, + "loss": 0.008, + "step": 488710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010997508949378013, + "loss": 0.0094, + "step": 488720 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010997120127740869, + "loss": 0.0089, + "step": 488730 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099673130610372, + "loss": 0.0087, + "step": 488740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010996342484466576, + "loss": 0.009, + "step": 488750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010995953662829429, + "loss": 0.0094, + "step": 488760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010995564841192283, + "loss": 0.01, + "step": 488770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010995176019555136, + "loss": 0.0088, + "step": 488780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010994787197917988, + "loss": 0.0091, + "step": 488790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010994398376280843, + "loss": 0.0096, + "step": 488800 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010994009554643695, + "loss": 0.0096, + "step": 488810 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099362073300655, + "loss": 0.012, + "step": 488820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010993231911369402, + "loss": 0.0132, + "step": 488830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010992843089732257, + "loss": 0.0092, + "step": 488840 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099245426809511, + "loss": 0.0118, + "step": 488850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010992065446457964, + "loss": 0.01, + "step": 488860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010991676624820816, + "loss": 0.0099, + "step": 488870 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099128780318367, + "loss": 0.0139, + "step": 488880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010990898981546523, + "loss": 0.0103, + "step": 488890 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010990510159909377, + "loss": 0.011, + "step": 488900 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001099012133827223, + "loss": 0.0131, + "step": 488910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010989732516635086, + "loss": 0.0073, + "step": 488920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010989343694997939, + "loss": 0.0094, + "step": 488930 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010988954873360793, + "loss": 0.0109, + "step": 488940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010988566051723646, + "loss": 0.0098, + "step": 488950 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109881772300865, + "loss": 0.0078, + "step": 488960 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010987788408449353, + "loss": 0.011, + "step": 488970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010987399586812207, + "loss": 0.011, + "step": 488980 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098701076517506, + "loss": 0.0107, + "step": 488990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010986621943537914, + "loss": 0.0093, + "step": 489000 + }, + { + "epoch": 1.27, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.0065433569252491, + "eval_runtime": 108.073, + "eval_samples_per_second": 18.506, + "eval_steps_per_second": 4.627, + "step": 489000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010986233121900766, + "loss": 0.009, + "step": 489010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010985844300263619, + "loss": 0.0112, + "step": 489020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010985455478626473, + "loss": 0.0096, + "step": 489030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010985066656989326, + "loss": 0.0103, + "step": 489040 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098467783535218, + "loss": 0.0092, + "step": 489050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010984289013715033, + "loss": 0.0089, + "step": 489060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010983900192077887, + "loss": 0.0086, + "step": 489070 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098351137044074, + "loss": 0.0095, + "step": 489080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010983122548803596, + "loss": 0.0096, + "step": 489090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010982733727166447, + "loss": 0.0114, + "step": 489100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010982344905529303, + "loss": 0.0086, + "step": 489110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010981956083892156, + "loss": 0.0093, + "step": 489120 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098156726225501, + "loss": 0.0116, + "step": 489130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010981178440617862, + "loss": 0.0117, + "step": 489140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980789618980717, + "loss": 0.0115, + "step": 489150 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001098040079734357, + "loss": 0.0127, + "step": 489160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010980011975706424, + "loss": 0.0097, + "step": 489170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010979623154069276, + "loss": 0.0107, + "step": 489180 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097923433243213, + "loss": 0.0112, + "step": 489190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010978845510794983, + "loss": 0.012, + "step": 489200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010978456689157838, + "loss": 0.0072, + "step": 489210 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097806786752069, + "loss": 0.0117, + "step": 489220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010977679045883545, + "loss": 0.0091, + "step": 489230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010977290224246397, + "loss": 0.0102, + "step": 489240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010976901402609253, + "loss": 0.0114, + "step": 489250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010976512580972104, + "loss": 0.009, + "step": 489260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010976123759334957, + "loss": 0.0117, + "step": 489270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010975734937697813, + "loss": 0.012, + "step": 489280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010975346116060665, + "loss": 0.012, + "step": 489290 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097495729442352, + "loss": 0.0092, + "step": 489300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010974568472786372, + "loss": 0.0101, + "step": 489310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010974179651149227, + "loss": 0.0082, + "step": 489320 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097379082951208, + "loss": 0.0085, + "step": 489330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010973402007874934, + "loss": 0.0093, + "step": 489340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010973013186237786, + "loss": 0.0088, + "step": 489350 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001097262436460064, + "loss": 0.0087, + "step": 489360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010972235542963493, + "loss": 0.009, + "step": 489370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010971846721326347, + "loss": 0.008, + "step": 489380 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109714578996892, + "loss": 0.0088, + "step": 489390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010971069078052054, + "loss": 0.0111, + "step": 489400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010970680256414907, + "loss": 0.0154, + "step": 489410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010970291434777761, + "loss": 0.0122, + "step": 489420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010969902613140614, + "loss": 0.0102, + "step": 489430 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096951379150347, + "loss": 0.0141, + "step": 489440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010969124969866323, + "loss": 0.019, + "step": 489450 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010968736148229177, + "loss": 0.0091, + "step": 489460 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096834732659203, + "loss": 0.0102, + "step": 489470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010967958504954884, + "loss": 0.01, + "step": 489480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010967569683317737, + "loss": 0.0081, + "step": 489490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010967180861680591, + "loss": 0.0092, + "step": 489500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010966792040043443, + "loss": 0.0084, + "step": 489510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010966403218406296, + "loss": 0.0107, + "step": 489520 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096601439676915, + "loss": 0.0102, + "step": 489530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010965625575132003, + "loss": 0.0109, + "step": 489540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010965236753494857, + "loss": 0.011, + "step": 489550 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096484793185771, + "loss": 0.0091, + "step": 489560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010964459110220564, + "loss": 0.0099, + "step": 489570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010964070288583417, + "loss": 0.0109, + "step": 489580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010963681466946271, + "loss": 0.0079, + "step": 489590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010963292645309124, + "loss": 0.0107, + "step": 489600 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096290382367198, + "loss": 0.011, + "step": 489610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010962515002034831, + "loss": 0.0091, + "step": 489620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010962126180397687, + "loss": 0.0089, + "step": 489630 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001096173735876054, + "loss": 0.0098, + "step": 489640 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010961348537123394, + "loss": 0.0096, + "step": 489650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010960959715486246, + "loss": 0.0092, + "step": 489660 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109605708938491, + "loss": 0.0102, + "step": 489670 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010960182072211953, + "loss": 0.0096, + "step": 489680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010959793250574808, + "loss": 0.0074, + "step": 489690 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095940442893766, + "loss": 0.0095, + "step": 489700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010959015607300515, + "loss": 0.0126, + "step": 489710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010958626785663367, + "loss": 0.0083, + "step": 489720 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010958237964026222, + "loss": 0.0116, + "step": 489730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010957849142389074, + "loss": 0.0126, + "step": 489740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010957460320751929, + "loss": 0.0093, + "step": 489750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010957071499114781, + "loss": 0.0106, + "step": 489760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010956682677477634, + "loss": 0.0111, + "step": 489770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010956293855840488, + "loss": 0.0107, + "step": 489780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010955905034203341, + "loss": 0.009, + "step": 489790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010955516212566197, + "loss": 0.0101, + "step": 489800 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095512739092905, + "loss": 0.0123, + "step": 489810 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010954738569291904, + "loss": 0.0083, + "step": 489820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010954349747654756, + "loss": 0.0087, + "step": 489830 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095396092601761, + "loss": 0.013, + "step": 489840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010953572104380463, + "loss": 0.0123, + "step": 489850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010953183282743318, + "loss": 0.0118, + "step": 489860 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001095279446110617, + "loss": 0.0101, + "step": 489870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010952405639469025, + "loss": 0.0078, + "step": 489880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010952016817831877, + "loss": 0.0093, + "step": 489890 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010951627996194731, + "loss": 0.008, + "step": 489900 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010951239174557584, + "loss": 0.0142, + "step": 489910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010950850352920438, + "loss": 0.0092, + "step": 489920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010950461531283291, + "loss": 0.0106, + "step": 489930 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010950072709646145, + "loss": 0.0092, + "step": 489940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949683888008998, + "loss": 0.0081, + "step": 489950 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010949295066371854, + "loss": 0.011, + "step": 489960 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010948906244734707, + "loss": 0.0088, + "step": 489970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010948517423097561, + "loss": 0.0132, + "step": 489980 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010948128601460414, + "loss": 0.0085, + "step": 489990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010947739779823268, + "loss": 0.008, + "step": 490000 + }, + { + "epoch": 1.27, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.006557569373399019, + "eval_runtime": 107.9754, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, + "step": 490000 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094735095818612, + "loss": 0.0084, + "step": 490010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010946962136548973, + "loss": 0.0097, + "step": 490020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010946573314911827, + "loss": 0.0102, + "step": 490030 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094618449327468, + "loss": 0.0091, + "step": 490040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010945795671637534, + "loss": 0.0095, + "step": 490050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010945406850000387, + "loss": 0.0085, + "step": 490060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010945018028363241, + "loss": 0.01, + "step": 490070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010944629206726094, + "loss": 0.0139, + "step": 490080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010944240385088948, + "loss": 0.0146, + "step": 490090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010943851563451801, + "loss": 0.0104, + "step": 490100 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010943462741814655, + "loss": 0.0111, + "step": 490110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010943073920177508, + "loss": 0.0132, + "step": 490120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010942685098540362, + "loss": 0.0084, + "step": 490130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010942296276903215, + "loss": 0.0062, + "step": 490140 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094190745526607, + "loss": 0.0099, + "step": 490150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010941518633628923, + "loss": 0.0133, + "step": 490160 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010941129811991778, + "loss": 0.0093, + "step": 490170 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001094074099035463, + "loss": 0.0098, + "step": 490180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010940352168717485, + "loss": 0.0146, + "step": 490190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010939963347080337, + "loss": 0.0098, + "step": 490200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010939574525443192, + "loss": 0.0117, + "step": 490210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010939185703806044, + "loss": 0.0113, + "step": 490220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010938796882168899, + "loss": 0.0166, + "step": 490230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010938408060531751, + "loss": 0.0132, + "step": 490240 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010938019238894606, + "loss": 0.0142, + "step": 490250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010937630417257458, + "loss": 0.0089, + "step": 490260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010937241595620311, + "loss": 0.0088, + "step": 490270 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936852773983165, + "loss": 0.0094, + "step": 490280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936463952346018, + "loss": 0.0096, + "step": 490290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010936075130708872, + "loss": 0.0091, + "step": 490300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010935686309071725, + "loss": 0.0104, + "step": 490310 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001093529748743458, + "loss": 0.0102, + "step": 490320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010934908665797432, + "loss": 0.0108, + "step": 490330 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010934519844160288, + "loss": 0.0112, + "step": 490340 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001093413102252314, + "loss": 0.0091, + "step": 490350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010933742200885995, + "loss": 0.011, + "step": 490360 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010933353379248847, + "loss": 0.0107, + "step": 490370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010932964557611702, + "loss": 0.0121, + "step": 490380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010932575735974554, + "loss": 0.0151, + "step": 490390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010932186914337409, + "loss": 0.0122, + "step": 490400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010931798092700261, + "loss": 0.0086, + "step": 490410 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010931409271063115, + "loss": 0.0099, + "step": 490420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010931020449425968, + "loss": 0.0099, + "step": 490430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010930631627788822, + "loss": 0.0119, + "step": 490440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010930242806151675, + "loss": 0.013, + "step": 490450 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001092985398451453, + "loss": 0.0116, + "step": 490460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010929465162877382, + "loss": 0.0108, + "step": 490470 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010929076341240238, + "loss": 0.0127, + "step": 490480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010928687519603089, + "loss": 0.0098, + "step": 490490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010928298697965945, + "loss": 0.0146, + "step": 490500 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010927909876328798, + "loss": 0.0098, + "step": 490510 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001092752105469165, + "loss": 0.009, + "step": 490520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010927132233054505, + "loss": 0.011, + "step": 490530 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010926743411417357, + "loss": 0.0118, + "step": 490540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010926354589780211, + "loss": 0.0087, + "step": 490550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010925965768143064, + "loss": 0.0117, + "step": 490560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010925576946505918, + "loss": 0.0107, + "step": 490570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010925188124868771, + "loss": 0.0099, + "step": 490580 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924799303231625, + "loss": 0.0092, + "step": 490590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924410481594478, + "loss": 0.0239, + "step": 490600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010924021659957332, + "loss": 0.0085, + "step": 490610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010923632838320185, + "loss": 0.0093, + "step": 490620 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001092324401668304, + "loss": 0.0103, + "step": 490630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010922855195045892, + "loss": 0.0133, + "step": 490640 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010922466373408746, + "loss": 0.0091, + "step": 490650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010922077551771599, + "loss": 0.0102, + "step": 490660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010921688730134455, + "loss": 0.0132, + "step": 490670 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010921299908497307, + "loss": 0.0083, + "step": 490680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010920911086860162, + "loss": 0.0111, + "step": 490690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010920522265223014, + "loss": 0.011, + "step": 490700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010920133443585869, + "loss": 0.0082, + "step": 490710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010919744621948721, + "loss": 0.0091, + "step": 490720 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010919355800311576, + "loss": 0.0122, + "step": 490730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918966978674428, + "loss": 0.0105, + "step": 490740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918578157037283, + "loss": 0.0063, + "step": 490750 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010918189335400135, + "loss": 0.0099, + "step": 490760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010917800513762988, + "loss": 0.0106, + "step": 490770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010917411692125842, + "loss": 0.0114, + "step": 490780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010917022870488695, + "loss": 0.011, + "step": 490790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010916634048851549, + "loss": 0.0138, + "step": 490800 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010916245227214402, + "loss": 0.0087, + "step": 490810 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915856405577256, + "loss": 0.0112, + "step": 490820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915467583940109, + "loss": 0.0071, + "step": 490830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010915078762302965, + "loss": 0.0091, + "step": 490840 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010914689940665816, + "loss": 0.0087, + "step": 490850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010914301119028672, + "loss": 0.0106, + "step": 490860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010913912297391524, + "loss": 0.0119, + "step": 490870 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010913523475754379, + "loss": 0.0109, + "step": 490880 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010913134654117231, + "loss": 0.0092, + "step": 490890 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010912745832480086, + "loss": 0.0132, + "step": 490900 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010912357010842938, + "loss": 0.0092, + "step": 490910 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010911968189205792, + "loss": 0.0122, + "step": 490920 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010911579367568645, + "loss": 0.01, + "step": 490930 + }, + { + "epoch": 1.27, + "learning_rate": 0.000109111905459315, + "loss": 0.0116, + "step": 490940 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010910801724294352, + "loss": 0.0112, + "step": 490950 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010910412902657206, + "loss": 0.0124, + "step": 490960 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010910024081020059, + "loss": 0.0115, + "step": 490970 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010909635259382913, + "loss": 0.0104, + "step": 490980 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010909246437745766, + "loss": 0.0092, + "step": 490990 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010908857616108622, + "loss": 0.0107, + "step": 491000 + }, + { + "epoch": 1.27, + "eval_cer": 0.881688689953826, + "eval_loss": 0.0065551563166081905, + "eval_runtime": 108.1856, + "eval_samples_per_second": 18.487, + "eval_steps_per_second": 4.622, + "step": 491000 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010908468794471473, + "loss": 0.0098, + "step": 491010 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010908079972834326, + "loss": 0.012, + "step": 491020 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010907691151197182, + "loss": 0.0071, + "step": 491030 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010907302329560034, + "loss": 0.0105, + "step": 491040 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010906913507922888, + "loss": 0.0105, + "step": 491050 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010906524686285741, + "loss": 0.0105, + "step": 491060 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010906135864648595, + "loss": 0.0108, + "step": 491070 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010905747043011448, + "loss": 0.01, + "step": 491080 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010905358221374302, + "loss": 0.012, + "step": 491090 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010904969399737155, + "loss": 0.0113, + "step": 491100 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001090458057810001, + "loss": 0.0099, + "step": 491110 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010904191756462862, + "loss": 0.0106, + "step": 491120 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010903802934825716, + "loss": 0.0084, + "step": 491130 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010903414113188569, + "loss": 0.0151, + "step": 491140 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010903025291551423, + "loss": 0.0129, + "step": 491150 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010902636469914276, + "loss": 0.0115, + "step": 491160 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001090224764827713, + "loss": 0.0089, + "step": 491170 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010901858826639983, + "loss": 0.0119, + "step": 491180 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010901470005002839, + "loss": 0.0122, + "step": 491190 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010901081183365691, + "loss": 0.0085, + "step": 491200 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010900692361728546, + "loss": 0.0139, + "step": 491210 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010900303540091398, + "loss": 0.0117, + "step": 491220 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010899914718454253, + "loss": 0.014, + "step": 491230 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010899525896817105, + "loss": 0.0108, + "step": 491240 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089913707517996, + "loss": 0.0077, + "step": 491250 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010898748253542812, + "loss": 0.0142, + "step": 491260 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010898359431905665, + "loss": 0.0101, + "step": 491270 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089797061026852, + "loss": 0.013, + "step": 491280 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010897581788631372, + "loss": 0.0086, + "step": 491290 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010897192966994226, + "loss": 0.0127, + "step": 491300 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010896804145357079, + "loss": 0.0085, + "step": 491310 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010896415323719933, + "loss": 0.0094, + "step": 491320 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010896026502082786, + "loss": 0.0106, + "step": 491330 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089563768044564, + "loss": 0.01, + "step": 491340 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010895248858808493, + "loss": 0.0105, + "step": 491350 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010894860037171349, + "loss": 0.0118, + "step": 491360 + }, + { + "epoch": 1.27, + "learning_rate": 0.000108944712155342, + "loss": 0.0167, + "step": 491370 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010894082393897056, + "loss": 0.012, + "step": 491380 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010893693572259908, + "loss": 0.0094, + "step": 491390 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010893304750622763, + "loss": 0.0114, + "step": 491400 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010892915928985615, + "loss": 0.0108, + "step": 491410 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089252710734847, + "loss": 0.0079, + "step": 491420 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010892138285711322, + "loss": 0.0091, + "step": 491430 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010891749464074176, + "loss": 0.0118, + "step": 491440 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010891360642437029, + "loss": 0.0102, + "step": 491450 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010890971820799883, + "loss": 0.0084, + "step": 491460 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010890582999162736, + "loss": 0.0085, + "step": 491470 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001089019417752559, + "loss": 0.0111, + "step": 491480 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010889805355888443, + "loss": 0.0087, + "step": 491490 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010889416534251296, + "loss": 0.0128, + "step": 491500 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088902771261415, + "loss": 0.0105, + "step": 491510 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010888638890977003, + "loss": 0.01, + "step": 491520 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010888250069339857, + "loss": 0.0089, + "step": 491530 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088786124770271, + "loss": 0.0122, + "step": 491540 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010887472426065566, + "loss": 0.0119, + "step": 491550 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010887083604428418, + "loss": 0.0105, + "step": 491560 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010886694782791272, + "loss": 0.0089, + "step": 491570 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010886305961154125, + "loss": 0.0103, + "step": 491580 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088591713951698, + "loss": 0.0123, + "step": 491590 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010885528317879832, + "loss": 0.0108, + "step": 491600 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010885139496242686, + "loss": 0.0095, + "step": 491610 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010884750674605539, + "loss": 0.0141, + "step": 491620 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010884361852968393, + "loss": 0.0106, + "step": 491630 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010883973031331246, + "loss": 0.016, + "step": 491640 + }, + { + "epoch": 1.27, + "learning_rate": 0.000108835842096941, + "loss": 0.0118, + "step": 491650 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010883195388056953, + "loss": 0.0128, + "step": 491660 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010882806566419807, + "loss": 0.01, + "step": 491670 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088241774478266, + "loss": 0.0087, + "step": 491680 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010882028923145514, + "loss": 0.0138, + "step": 491690 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010881640101508367, + "loss": 0.0082, + "step": 491700 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010881251279871223, + "loss": 0.0109, + "step": 491710 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010880862458234074, + "loss": 0.0095, + "step": 491720 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001088047363659693, + "loss": 0.0119, + "step": 491730 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010880084814959782, + "loss": 0.0093, + "step": 491740 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010879695993322635, + "loss": 0.0083, + "step": 491750 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001087930717168549, + "loss": 0.008, + "step": 491760 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010878918350048342, + "loss": 0.0147, + "step": 491770 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010878529528411196, + "loss": 0.0082, + "step": 491780 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010878140706774049, + "loss": 0.0161, + "step": 491790 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010877751885136903, + "loss": 0.0102, + "step": 491800 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010877363063499756, + "loss": 0.0142, + "step": 491810 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001087697424186261, + "loss": 0.009, + "step": 491820 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010876585420225463, + "loss": 0.0105, + "step": 491830 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010876196598588317, + "loss": 0.0081, + "step": 491840 + }, + { + "epoch": 1.27, + "learning_rate": 0.0001087580777695117, + "loss": 0.0109, + "step": 491850 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010875418955314024, + "loss": 0.0072, + "step": 491860 + }, + { + "epoch": 1.27, + "learning_rate": 0.00010875030133676877, + "loss": 0.0088, + "step": 491870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010874641312039731, + "loss": 0.0093, + "step": 491880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010874252490402584, + "loss": 0.0104, + "step": 491890 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087386366876544, + "loss": 0.0114, + "step": 491900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010873474847128292, + "loss": 0.0133, + "step": 491910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010873086025491147, + "loss": 0.0139, + "step": 491920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010872697203854, + "loss": 0.007, + "step": 491930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010872308382216854, + "loss": 0.0099, + "step": 491940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010871919560579706, + "loss": 0.0114, + "step": 491950 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087153073894256, + "loss": 0.0061, + "step": 491960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010871141917305413, + "loss": 0.0075, + "step": 491970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010870753095668267, + "loss": 0.0091, + "step": 491980 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001087036427403112, + "loss": 0.009, + "step": 491990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010869975452393973, + "loss": 0.0135, + "step": 492000 + }, + { + "epoch": 1.28, + "eval_cer": 0.8816453012088664, + "eval_loss": 0.006531266961246729, + "eval_runtime": 108.0198, + "eval_samples_per_second": 18.515, + "eval_steps_per_second": 4.629, + "step": 492000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010869586630756827, + "loss": 0.0092, + "step": 492010 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086919780911968, + "loss": 0.0085, + "step": 492020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868808987482534, + "loss": 0.0098, + "step": 492030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868420165845387, + "loss": 0.014, + "step": 492040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010868031344208241, + "loss": 0.0102, + "step": 492050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010867642522571094, + "loss": 0.0096, + "step": 492060 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086725370093395, + "loss": 0.0102, + "step": 492070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010866864879296801, + "loss": 0.0113, + "step": 492080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010866476057659656, + "loss": 0.0103, + "step": 492090 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010866087236022509, + "loss": 0.0127, + "step": 492100 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010865698414385363, + "loss": 0.0083, + "step": 492110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010865309592748216, + "loss": 0.0093, + "step": 492120 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086492077111107, + "loss": 0.0074, + "step": 492130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010864531949473923, + "loss": 0.0087, + "step": 492140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010864143127836777, + "loss": 0.0124, + "step": 492150 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001086375430619963, + "loss": 0.0106, + "step": 492160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010863365484562484, + "loss": 0.0103, + "step": 492170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862976662925337, + "loss": 0.0111, + "step": 492180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862587841288191, + "loss": 0.0125, + "step": 492190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010862199019651044, + "loss": 0.0103, + "step": 492200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010861810198013898, + "loss": 0.0108, + "step": 492210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010861421376376751, + "loss": 0.0109, + "step": 492220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010861032554739607, + "loss": 0.01, + "step": 492230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010860643733102458, + "loss": 0.0089, + "step": 492240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010860254911465311, + "loss": 0.0096, + "step": 492250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859866089828166, + "loss": 0.0131, + "step": 492260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859477268191019, + "loss": 0.0119, + "step": 492270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010859088446553873, + "loss": 0.0091, + "step": 492280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010858699624916726, + "loss": 0.0076, + "step": 492290 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085831080327958, + "loss": 0.01, + "step": 492300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010857921981642433, + "loss": 0.0108, + "step": 492310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010857533160005287, + "loss": 0.0112, + "step": 492320 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085714433836814, + "loss": 0.0125, + "step": 492330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010856755516730994, + "loss": 0.0097, + "step": 492340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010856366695093847, + "loss": 0.0105, + "step": 492350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010855977873456701, + "loss": 0.0121, + "step": 492360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010855589051819554, + "loss": 0.0102, + "step": 492370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010855200230182408, + "loss": 0.0108, + "step": 492380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010854811408545261, + "loss": 0.0084, + "step": 492390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010854422586908115, + "loss": 0.0094, + "step": 492400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010854033765270968, + "loss": 0.0104, + "step": 492410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010853644943633824, + "loss": 0.0079, + "step": 492420 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010853256121996676, + "loss": 0.0129, + "step": 492430 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085286730035953, + "loss": 0.0104, + "step": 492440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010852478478722383, + "loss": 0.0123, + "step": 492450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010852089657085237, + "loss": 0.0111, + "step": 492460 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085170083544809, + "loss": 0.0116, + "step": 492470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010851312013810944, + "loss": 0.0098, + "step": 492480 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010850923192173797, + "loss": 0.0104, + "step": 492490 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001085053437053665, + "loss": 0.0107, + "step": 492500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010850145548899504, + "loss": 0.0131, + "step": 492510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010849756727262357, + "loss": 0.0113, + "step": 492520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010849367905625211, + "loss": 0.0102, + "step": 492530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010848979083988064, + "loss": 0.0104, + "step": 492540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010848590262350918, + "loss": 0.0079, + "step": 492550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010848201440713771, + "loss": 0.0106, + "step": 492560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010847812619076625, + "loss": 0.0141, + "step": 492570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010847423797439478, + "loss": 0.0074, + "step": 492580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010847034975802333, + "loss": 0.0109, + "step": 492590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010846646154165185, + "loss": 0.0102, + "step": 492600 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001084625733252804, + "loss": 0.0123, + "step": 492610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010845868510890893, + "loss": 0.0109, + "step": 492620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010845479689253747, + "loss": 0.0111, + "step": 492630 + }, + { + "epoch": 1.28, + "learning_rate": 0.000108450908676166, + "loss": 0.0102, + "step": 492640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010844702045979454, + "loss": 0.0093, + "step": 492650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010844313224342307, + "loss": 0.0136, + "step": 492660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843924402705161, + "loss": 0.0103, + "step": 492670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843535581068014, + "loss": 0.0098, + "step": 492680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010843146759430868, + "loss": 0.0106, + "step": 492690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010842757937793721, + "loss": 0.009, + "step": 492700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010842369116156575, + "loss": 0.0105, + "step": 492710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010841980294519428, + "loss": 0.0102, + "step": 492720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010841591472882282, + "loss": 0.0106, + "step": 492730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010841202651245135, + "loss": 0.0057, + "step": 492740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010840813829607988, + "loss": 0.0092, + "step": 492750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010840425007970842, + "loss": 0.0085, + "step": 492760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010840036186333695, + "loss": 0.0131, + "step": 492770 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001083964736469655, + "loss": 0.0114, + "step": 492780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010839258543059403, + "loss": 0.0098, + "step": 492790 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010838869721422257, + "loss": 0.0096, + "step": 492800 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001083848089978511, + "loss": 0.0114, + "step": 492810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010838092078147964, + "loss": 0.0105, + "step": 492820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010837703256510817, + "loss": 0.01, + "step": 492830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010837314434873671, + "loss": 0.0104, + "step": 492840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010836925613236524, + "loss": 0.0147, + "step": 492850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010836536791599378, + "loss": 0.011, + "step": 492860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010836147969962231, + "loss": 0.0141, + "step": 492870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010835759148325085, + "loss": 0.0142, + "step": 492880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010835370326687938, + "loss": 0.012, + "step": 492890 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834981505050792, + "loss": 0.0092, + "step": 492900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834592683413645, + "loss": 0.0144, + "step": 492910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010834203861776499, + "loss": 0.0133, + "step": 492920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010833815040139352, + "loss": 0.0113, + "step": 492930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010833426218502208, + "loss": 0.0066, + "step": 492940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010833037396865059, + "loss": 0.0123, + "step": 492950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010832648575227915, + "loss": 0.0134, + "step": 492960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010832259753590767, + "loss": 0.0112, + "step": 492970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831870931953621, + "loss": 0.0103, + "step": 492980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831482110316474, + "loss": 0.0117, + "step": 492990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010831093288679327, + "loss": 0.0076, + "step": 493000 + }, + { + "epoch": 1.28, + "eval_cer": 0.8816564983043399, + "eval_loss": 0.006680097430944443, + "eval_runtime": 108.037, + "eval_samples_per_second": 18.512, + "eval_steps_per_second": 4.628, + "step": 493000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010830704467042181, + "loss": 0.0096, + "step": 493010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010830315645405034, + "loss": 0.0117, + "step": 493020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010829926823767888, + "loss": 0.0087, + "step": 493030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010829538002130741, + "loss": 0.008, + "step": 493040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010829149180493595, + "loss": 0.0101, + "step": 493050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010828760358856448, + "loss": 0.0079, + "step": 493060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010828371537219302, + "loss": 0.0122, + "step": 493070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010827982715582155, + "loss": 0.0109, + "step": 493080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010827593893945009, + "loss": 0.0112, + "step": 493090 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010827205072307862, + "loss": 0.0115, + "step": 493100 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010826816250670716, + "loss": 0.0114, + "step": 493110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010826427429033569, + "loss": 0.0081, + "step": 493120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010826038607396424, + "loss": 0.0095, + "step": 493130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010825649785759277, + "loss": 0.0097, + "step": 493140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010825260964122131, + "loss": 0.0108, + "step": 493150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824872142484984, + "loss": 0.0094, + "step": 493160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824483320847838, + "loss": 0.01, + "step": 493170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010824094499210691, + "loss": 0.0093, + "step": 493180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010823705677573545, + "loss": 0.0085, + "step": 493190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010823316855936398, + "loss": 0.0076, + "step": 493200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010822928034299252, + "loss": 0.0091, + "step": 493210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010822539212662105, + "loss": 0.0094, + "step": 493220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010822150391024959, + "loss": 0.0085, + "step": 493230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010821761569387812, + "loss": 0.0118, + "step": 493240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010821372747750665, + "loss": 0.0116, + "step": 493250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010820983926113519, + "loss": 0.014, + "step": 493260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010820595104476372, + "loss": 0.0081, + "step": 493270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010820206282839226, + "loss": 0.008, + "step": 493280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010819817461202079, + "loss": 0.0096, + "step": 493290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010819428639564934, + "loss": 0.0114, + "step": 493300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010819039817927786, + "loss": 0.0104, + "step": 493310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010818650996290641, + "loss": 0.0109, + "step": 493320 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010818262174653494, + "loss": 0.0128, + "step": 493330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010817873353016348, + "loss": 0.0108, + "step": 493340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010817484531379201, + "loss": 0.0123, + "step": 493350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010817095709742055, + "loss": 0.0093, + "step": 493360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010816706888104908, + "loss": 0.0168, + "step": 493370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010816318066467762, + "loss": 0.0118, + "step": 493380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815929244830615, + "loss": 0.0097, + "step": 493390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815540423193469, + "loss": 0.0072, + "step": 493400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010815151601556322, + "loss": 0.0117, + "step": 493410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010814762779919176, + "loss": 0.0099, + "step": 493420 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010814373958282029, + "loss": 0.0135, + "step": 493430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010813985136644883, + "loss": 0.0103, + "step": 493440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010813596315007736, + "loss": 0.0111, + "step": 493450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010813207493370592, + "loss": 0.0122, + "step": 493460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812818671733443, + "loss": 0.0086, + "step": 493470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812429850096299, + "loss": 0.0115, + "step": 493480 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010812041028459151, + "loss": 0.0086, + "step": 493490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010811652206822004, + "loss": 0.0097, + "step": 493500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010811263385184858, + "loss": 0.0098, + "step": 493510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010810874563547711, + "loss": 0.008, + "step": 493520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010810485741910565, + "loss": 0.0091, + "step": 493530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010810096920273418, + "loss": 0.0098, + "step": 493540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010809708098636272, + "loss": 0.0086, + "step": 493550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010809319276999125, + "loss": 0.0081, + "step": 493560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010808930455361979, + "loss": 0.0085, + "step": 493570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010808541633724832, + "loss": 0.009, + "step": 493580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010808152812087686, + "loss": 0.0109, + "step": 493590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010807763990450539, + "loss": 0.0103, + "step": 493600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010807375168813393, + "loss": 0.0078, + "step": 493610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010806986347176246, + "loss": 0.0082, + "step": 493620 + }, + { + "epoch": 1.28, + "learning_rate": 0.000108065975255391, + "loss": 0.0101, + "step": 493630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010806208703901953, + "loss": 0.0092, + "step": 493640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010805819882264808, + "loss": 0.0116, + "step": 493650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010805431060627661, + "loss": 0.012, + "step": 493660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010805042238990515, + "loss": 0.0082, + "step": 493670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010804653417353368, + "loss": 0.0146, + "step": 493680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010804264595716222, + "loss": 0.0109, + "step": 493690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010803875774079075, + "loss": 0.0108, + "step": 493700 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001080348695244193, + "loss": 0.0137, + "step": 493710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010803098130804782, + "loss": 0.011, + "step": 493720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010802709309167636, + "loss": 0.0073, + "step": 493730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010802320487530489, + "loss": 0.0096, + "step": 493740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010801931665893342, + "loss": 0.0104, + "step": 493750 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010801542844256196, + "loss": 0.013, + "step": 493760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010801154022619049, + "loss": 0.01, + "step": 493770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010800765200981903, + "loss": 0.0115, + "step": 493780 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010800376379344756, + "loss": 0.0109, + "step": 493790 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001079998755770761, + "loss": 0.0077, + "step": 493800 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010799598736070463, + "loss": 0.0107, + "step": 493810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010799209914433318, + "loss": 0.0069, + "step": 493820 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001079882109279617, + "loss": 0.0101, + "step": 493830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010798432271159025, + "loss": 0.01, + "step": 493840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010798043449521878, + "loss": 0.0096, + "step": 493850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010797654627884732, + "loss": 0.0104, + "step": 493860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010797265806247585, + "loss": 0.009, + "step": 493870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796876984610439, + "loss": 0.0083, + "step": 493880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796488162973292, + "loss": 0.0104, + "step": 493890 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010796099341336146, + "loss": 0.0081, + "step": 493900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010795710519698999, + "loss": 0.0093, + "step": 493910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010795321698061853, + "loss": 0.0082, + "step": 493920 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010794932876424706, + "loss": 0.0086, + "step": 493930 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001079454405478756, + "loss": 0.0103, + "step": 493940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010794155233150413, + "loss": 0.0098, + "step": 493950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010793766411513267, + "loss": 0.0116, + "step": 493960 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001079337758987612, + "loss": 0.0096, + "step": 493970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010792988768238976, + "loss": 0.008, + "step": 493980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010792599946601827, + "loss": 0.0093, + "step": 493990 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001079221112496468, + "loss": 0.01, + "step": 494000 + }, + { + "epoch": 1.28, + "eval_cer": 0.88167329394755, + "eval_loss": 0.006551279220730066, + "eval_runtime": 107.9937, + "eval_samples_per_second": 18.52, + "eval_steps_per_second": 4.63, + "step": 494000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010791822303327535, + "loss": 0.0097, + "step": 494010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010791433481690388, + "loss": 0.0124, + "step": 494020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010791044660053242, + "loss": 0.0112, + "step": 494030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010790655838416095, + "loss": 0.0111, + "step": 494040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010790267016778949, + "loss": 0.0097, + "step": 494050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010789878195141802, + "loss": 0.0103, + "step": 494060 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010789489373504656, + "loss": 0.0115, + "step": 494070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010789100551867509, + "loss": 0.0091, + "step": 494080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010788711730230363, + "loss": 0.0099, + "step": 494090 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010788322908593216, + "loss": 0.0139, + "step": 494100 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078793408695607, + "loss": 0.0087, + "step": 494110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010787545265318923, + "loss": 0.0086, + "step": 494120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010787156443681777, + "loss": 0.0093, + "step": 494130 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078676762204463, + "loss": 0.0089, + "step": 494140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010786378800407484, + "loss": 0.0122, + "step": 494150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010785989978770337, + "loss": 0.0164, + "step": 494160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010785601157133192, + "loss": 0.0125, + "step": 494170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010785212335496045, + "loss": 0.0124, + "step": 494180 + }, + { + "epoch": 1.28, + "learning_rate": 0.000107848235138589, + "loss": 0.0105, + "step": 494190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010784434692221752, + "loss": 0.01, + "step": 494200 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010784045870584606, + "loss": 0.0107, + "step": 494210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010783657048947459, + "loss": 0.0095, + "step": 494220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010783268227310312, + "loss": 0.0137, + "step": 494230 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010782879405673166, + "loss": 0.0096, + "step": 494240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010782490584036019, + "loss": 0.0117, + "step": 494250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010782101762398873, + "loss": 0.0115, + "step": 494260 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010781712940761726, + "loss": 0.0091, + "step": 494270 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078132411912458, + "loss": 0.0117, + "step": 494280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010780935297487433, + "loss": 0.0095, + "step": 494290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010780546475850287, + "loss": 0.0148, + "step": 494300 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001078015765421314, + "loss": 0.0091, + "step": 494310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010779768832575994, + "loss": 0.0097, + "step": 494320 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010779380010938847, + "loss": 0.009, + "step": 494330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010778991189301701, + "loss": 0.0124, + "step": 494340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010778602367664554, + "loss": 0.0123, + "step": 494350 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077821354602741, + "loss": 0.0111, + "step": 494360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010777824724390262, + "loss": 0.0104, + "step": 494370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010777435902753116, + "loss": 0.01, + "step": 494380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010777047081115969, + "loss": 0.0111, + "step": 494390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010776658259478823, + "loss": 0.0104, + "step": 494400 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010776269437841676, + "loss": 0.0129, + "step": 494410 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077588061620453, + "loss": 0.0094, + "step": 494420 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010775491794567383, + "loss": 0.0113, + "step": 494430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010775102972930237, + "loss": 0.0101, + "step": 494440 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077471415129309, + "loss": 0.0119, + "step": 494450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010774325329655944, + "loss": 0.0101, + "step": 494460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010773936508018797, + "loss": 0.0111, + "step": 494470 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001077354768638165, + "loss": 0.0064, + "step": 494480 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010773158864744504, + "loss": 0.0087, + "step": 494490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010772770043107357, + "loss": 0.0076, + "step": 494500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010772381221470211, + "loss": 0.0131, + "step": 494510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010771992399833064, + "loss": 0.0092, + "step": 494520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010771603578195919, + "loss": 0.0089, + "step": 494530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010771214756558771, + "loss": 0.008, + "step": 494540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010770825934921626, + "loss": 0.0106, + "step": 494550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010770437113284479, + "loss": 0.0095, + "step": 494560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010770048291647333, + "loss": 0.0074, + "step": 494570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010769659470010186, + "loss": 0.0081, + "step": 494580 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001076927064837304, + "loss": 0.0077, + "step": 494590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010768881826735893, + "loss": 0.0075, + "step": 494600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010768493005098747, + "loss": 0.0107, + "step": 494610 + }, + { + "epoch": 1.28, + "learning_rate": 0.000107681041834616, + "loss": 0.0087, + "step": 494620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010767715361824454, + "loss": 0.0085, + "step": 494630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010767326540187307, + "loss": 0.0124, + "step": 494640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010766937718550161, + "loss": 0.0107, + "step": 494650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010766548896913014, + "loss": 0.0097, + "step": 494660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010766160075275868, + "loss": 0.0089, + "step": 494670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010765771253638721, + "loss": 0.011, + "step": 494680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010765382432001576, + "loss": 0.0099, + "step": 494690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010764993610364428, + "loss": 0.0092, + "step": 494700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010764604788727283, + "loss": 0.0106, + "step": 494710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010764215967090136, + "loss": 0.0087, + "step": 494720 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010763827145452989, + "loss": 0.0082, + "step": 494730 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010763438323815843, + "loss": 0.0084, + "step": 494740 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010763049502178696, + "loss": 0.0099, + "step": 494750 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001076266068054155, + "loss": 0.0092, + "step": 494760 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010762271858904403, + "loss": 0.0197, + "step": 494770 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010761883037267257, + "loss": 0.0097, + "step": 494780 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001076149421563011, + "loss": 0.0088, + "step": 494790 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010761105393992964, + "loss": 0.0119, + "step": 494800 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010760716572355817, + "loss": 0.0114, + "step": 494810 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010760327750718671, + "loss": 0.0111, + "step": 494820 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759938929081524, + "loss": 0.0129, + "step": 494830 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759550107444378, + "loss": 0.0085, + "step": 494840 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010759161285807231, + "loss": 0.0108, + "step": 494850 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010758772464170085, + "loss": 0.009, + "step": 494860 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010758383642532938, + "loss": 0.0092, + "step": 494870 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010757994820895793, + "loss": 0.0102, + "step": 494880 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010757605999258646, + "loss": 0.0106, + "step": 494890 + }, + { + "epoch": 1.28, + "learning_rate": 0.000107572171776215, + "loss": 0.0135, + "step": 494900 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010756828355984353, + "loss": 0.0169, + "step": 494910 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010756439534347207, + "loss": 0.0116, + "step": 494920 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001075605071271006, + "loss": 0.0101, + "step": 494930 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010755661891072914, + "loss": 0.0085, + "step": 494940 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010755273069435767, + "loss": 0.0112, + "step": 494950 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010754884247798621, + "loss": 0.0095, + "step": 494960 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010754495426161474, + "loss": 0.0103, + "step": 494970 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010754106604524327, + "loss": 0.007, + "step": 494980 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010753717782887181, + "loss": 0.0136, + "step": 494990 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010753328961250034, + "loss": 0.0112, + "step": 495000 + }, + { + "epoch": 1.28, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.006601433735340834, + "eval_runtime": 108.0099, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, + "step": 495000 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010752940139612888, + "loss": 0.0162, + "step": 495010 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010752551317975741, + "loss": 0.0107, + "step": 495020 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010752162496338595, + "loss": 0.0105, + "step": 495030 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010751773674701448, + "loss": 0.0094, + "step": 495040 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010751384853064303, + "loss": 0.0117, + "step": 495050 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010750996031427155, + "loss": 0.0102, + "step": 495060 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001075060720979001, + "loss": 0.0123, + "step": 495070 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010750218388152863, + "loss": 0.0124, + "step": 495080 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010749829566515717, + "loss": 0.0106, + "step": 495090 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074944074487857, + "loss": 0.0078, + "step": 495100 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010749051923241424, + "loss": 0.0091, + "step": 495110 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010748663101604277, + "loss": 0.0098, + "step": 495120 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010748274279967131, + "loss": 0.011, + "step": 495130 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010747885458329984, + "loss": 0.0107, + "step": 495140 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010747496636692838, + "loss": 0.0094, + "step": 495150 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010747107815055691, + "loss": 0.008, + "step": 495160 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010746718993418545, + "loss": 0.0103, + "step": 495170 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010746330171781398, + "loss": 0.0087, + "step": 495180 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010745941350144252, + "loss": 0.012, + "step": 495190 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010745552528507105, + "loss": 0.008, + "step": 495200 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074516370686996, + "loss": 0.0086, + "step": 495210 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010744774885232812, + "loss": 0.0092, + "step": 495220 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010744386063595665, + "loss": 0.0114, + "step": 495230 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074399724195852, + "loss": 0.0091, + "step": 495240 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010743608420321373, + "loss": 0.0103, + "step": 495250 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010743219598684227, + "loss": 0.0085, + "step": 495260 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001074283077704708, + "loss": 0.0093, + "step": 495270 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010742441955409934, + "loss": 0.0122, + "step": 495280 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010742053133772787, + "loss": 0.0153, + "step": 495290 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010741664312135641, + "loss": 0.0086, + "step": 495300 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010741275490498494, + "loss": 0.0117, + "step": 495310 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010740886668861348, + "loss": 0.0085, + "step": 495320 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010740497847224201, + "loss": 0.0105, + "step": 495330 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010740109025587055, + "loss": 0.0085, + "step": 495340 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010739720203949908, + "loss": 0.0107, + "step": 495350 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010739331382312762, + "loss": 0.0087, + "step": 495360 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010738942560675615, + "loss": 0.009, + "step": 495370 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010738553739038469, + "loss": 0.0093, + "step": 495380 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010738164917401322, + "loss": 0.0095, + "step": 495390 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010737776095764177, + "loss": 0.0169, + "step": 495400 + }, + { + "epoch": 1.28, + "learning_rate": 0.0001073738727412703, + "loss": 0.0092, + "step": 495410 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010736998452489884, + "loss": 0.0122, + "step": 495420 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010736609630852737, + "loss": 0.0087, + "step": 495430 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010736220809215591, + "loss": 0.0078, + "step": 495440 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010735831987578444, + "loss": 0.0091, + "step": 495450 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010735443165941298, + "loss": 0.0102, + "step": 495460 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010735054344304151, + "loss": 0.0084, + "step": 495470 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010734665522667004, + "loss": 0.0078, + "step": 495480 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010734276701029858, + "loss": 0.0092, + "step": 495490 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010733887879392711, + "loss": 0.0099, + "step": 495500 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010733499057755565, + "loss": 0.0082, + "step": 495510 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010733110236118418, + "loss": 0.0118, + "step": 495520 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010732721414481272, + "loss": 0.0091, + "step": 495530 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010732332592844125, + "loss": 0.0106, + "step": 495540 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731943771206979, + "loss": 0.0077, + "step": 495550 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731554949569832, + "loss": 0.0123, + "step": 495560 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010731166127932686, + "loss": 0.0086, + "step": 495570 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010730777306295539, + "loss": 0.0101, + "step": 495580 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010730388484658394, + "loss": 0.0121, + "step": 495590 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010729999663021247, + "loss": 0.0114, + "step": 495600 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010729610841384101, + "loss": 0.0099, + "step": 495610 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010729222019746954, + "loss": 0.0106, + "step": 495620 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728833198109808, + "loss": 0.0101, + "step": 495630 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728444376472661, + "loss": 0.0119, + "step": 495640 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010728055554835515, + "loss": 0.0122, + "step": 495650 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010727666733198368, + "loss": 0.0145, + "step": 495660 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010727277911561222, + "loss": 0.0088, + "step": 495670 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010726889089924075, + "loss": 0.0093, + "step": 495680 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010726500268286929, + "loss": 0.0104, + "step": 495690 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010726111446649782, + "loss": 0.0111, + "step": 495700 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010725722625012636, + "loss": 0.0111, + "step": 495710 + }, + { + "epoch": 1.28, + "learning_rate": 0.00010725333803375489, + "loss": 0.0097, + "step": 495720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010724944981738342, + "loss": 0.0108, + "step": 495730 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010724556160101196, + "loss": 0.0108, + "step": 495740 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010724167338464049, + "loss": 0.0105, + "step": 495750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010723778516826904, + "loss": 0.0145, + "step": 495760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010723389695189757, + "loss": 0.0082, + "step": 495770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010723000873552611, + "loss": 0.0109, + "step": 495780 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010722612051915464, + "loss": 0.0108, + "step": 495790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010722223230278318, + "loss": 0.0104, + "step": 495800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010721834408641171, + "loss": 0.0078, + "step": 495810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010721445587004025, + "loss": 0.0085, + "step": 495820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010721056765366878, + "loss": 0.0082, + "step": 495830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010720667943729732, + "loss": 0.0093, + "step": 495840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010720279122092585, + "loss": 0.0099, + "step": 495850 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010719890300455439, + "loss": 0.0122, + "step": 495860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010719501478818292, + "loss": 0.0092, + "step": 495870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010719112657181146, + "loss": 0.0109, + "step": 495880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010718723835543999, + "loss": 0.0101, + "step": 495890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010718335013906853, + "loss": 0.0135, + "step": 495900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010717946192269706, + "loss": 0.0102, + "step": 495910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010717557370632561, + "loss": 0.0068, + "step": 495920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010717168548995413, + "loss": 0.0115, + "step": 495930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716779727358268, + "loss": 0.0155, + "step": 495940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716390905721121, + "loss": 0.0086, + "step": 495950 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010716002084083975, + "loss": 0.0116, + "step": 495960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010715613262446828, + "loss": 0.0096, + "step": 495970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010715224440809681, + "loss": 0.0116, + "step": 495980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010714835619172535, + "loss": 0.0115, + "step": 495990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010714446797535388, + "loss": 0.0088, + "step": 496000 + }, + { + "epoch": 1.29, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.006738040130585432, + "eval_runtime": 107.9676, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 496000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010714057975898242, + "loss": 0.0116, + "step": 496010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010713669154261095, + "loss": 0.0111, + "step": 496020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010713280332623949, + "loss": 0.0107, + "step": 496030 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010712891510986802, + "loss": 0.011, + "step": 496040 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010712502689349656, + "loss": 0.0103, + "step": 496050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010712113867712509, + "loss": 0.0132, + "step": 496060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010711725046075363, + "loss": 0.0085, + "step": 496070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010711336224438216, + "loss": 0.0088, + "step": 496080 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001071094740280107, + "loss": 0.0131, + "step": 496090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010710558581163923, + "loss": 0.0156, + "step": 496100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010710169759526778, + "loss": 0.0097, + "step": 496110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709780937889631, + "loss": 0.0092, + "step": 496120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709392116252485, + "loss": 0.0118, + "step": 496130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010709003294615338, + "loss": 0.0121, + "step": 496140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010708614472978192, + "loss": 0.0135, + "step": 496150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010708225651341045, + "loss": 0.0092, + "step": 496160 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010707836829703899, + "loss": 0.0097, + "step": 496170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010707448008066752, + "loss": 0.0109, + "step": 496180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010707059186429606, + "loss": 0.0089, + "step": 496190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706670364792459, + "loss": 0.0139, + "step": 496200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010706281543155313, + "loss": 0.011, + "step": 496210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010705892721518166, + "loss": 0.0124, + "step": 496220 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010705503899881019, + "loss": 0.0108, + "step": 496230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010705115078243873, + "loss": 0.0127, + "step": 496240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010704726256606726, + "loss": 0.0099, + "step": 496250 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001070433743496958, + "loss": 0.0101, + "step": 496260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010703948613332433, + "loss": 0.0122, + "step": 496270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010703559791695288, + "loss": 0.0091, + "step": 496280 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001070317097005814, + "loss": 0.0109, + "step": 496290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010702782148420995, + "loss": 0.0103, + "step": 496300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010702393326783848, + "loss": 0.0081, + "step": 496310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010702004505146702, + "loss": 0.0093, + "step": 496320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010701615683509555, + "loss": 0.01, + "step": 496330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010701226861872409, + "loss": 0.0078, + "step": 496340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700838040235262, + "loss": 0.0103, + "step": 496350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700449218598116, + "loss": 0.008, + "step": 496360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010700060396960969, + "loss": 0.0079, + "step": 496370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010699671575323823, + "loss": 0.0134, + "step": 496380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010699282753686676, + "loss": 0.0094, + "step": 496390 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069889393204953, + "loss": 0.0101, + "step": 496400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010698505110412383, + "loss": 0.0126, + "step": 496410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010698116288775237, + "loss": 0.0115, + "step": 496420 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069772746713809, + "loss": 0.0108, + "step": 496430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010697338645500945, + "loss": 0.012, + "step": 496440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010696949823863797, + "loss": 0.0081, + "step": 496450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010696561002226652, + "loss": 0.013, + "step": 496460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010696172180589505, + "loss": 0.012, + "step": 496470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010695783358952358, + "loss": 0.012, + "step": 496480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010695394537315212, + "loss": 0.0088, + "step": 496490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010695005715678065, + "loss": 0.0107, + "step": 496500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010694616894040919, + "loss": 0.0118, + "step": 496510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010694228072403772, + "loss": 0.0155, + "step": 496520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010693839250766626, + "loss": 0.01, + "step": 496530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010693450429129479, + "loss": 0.0084, + "step": 496540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010693061607492333, + "loss": 0.0116, + "step": 496550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010692672785855186, + "loss": 0.0137, + "step": 496560 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001069228396421804, + "loss": 0.0096, + "step": 496570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010691895142580893, + "loss": 0.0094, + "step": 496580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010691506320943747, + "loss": 0.0089, + "step": 496590 + }, + { + "epoch": 1.29, + "learning_rate": 0.000106911174993066, + "loss": 0.0083, + "step": 496600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010690728677669454, + "loss": 0.0116, + "step": 496610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010690339856032307, + "loss": 0.0115, + "step": 496620 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010689951034395162, + "loss": 0.0113, + "step": 496630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010689562212758015, + "loss": 0.0094, + "step": 496640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010689173391120869, + "loss": 0.0097, + "step": 496650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688784569483722, + "loss": 0.0098, + "step": 496660 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688395747846576, + "loss": 0.0095, + "step": 496670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010688006926209429, + "loss": 0.0087, + "step": 496680 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010687618104572283, + "loss": 0.0123, + "step": 496690 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010687229282935136, + "loss": 0.0117, + "step": 496700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010686840461297989, + "loss": 0.0094, + "step": 496710 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010686451639660843, + "loss": 0.011, + "step": 496720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010686062818023696, + "loss": 0.0142, + "step": 496730 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001068567399638655, + "loss": 0.0084, + "step": 496740 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010685285174749403, + "loss": 0.0105, + "step": 496750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010684896353112257, + "loss": 0.012, + "step": 496760 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001068450753147511, + "loss": 0.0099, + "step": 496770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010684118709837964, + "loss": 0.0086, + "step": 496780 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010683729888200817, + "loss": 0.0152, + "step": 496790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010683341066563672, + "loss": 0.0131, + "step": 496800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010682952244926524, + "loss": 0.0103, + "step": 496810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010682563423289379, + "loss": 0.0128, + "step": 496820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010682174601652232, + "loss": 0.0106, + "step": 496830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010681785780015086, + "loss": 0.0084, + "step": 496840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010681396958377939, + "loss": 0.009, + "step": 496850 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010681008136740793, + "loss": 0.0095, + "step": 496860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010680619315103646, + "loss": 0.0098, + "step": 496870 + }, + { + "epoch": 1.29, + "learning_rate": 0.000106802304934665, + "loss": 0.0098, + "step": 496880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010679841671829353, + "loss": 0.0075, + "step": 496890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010679452850192207, + "loss": 0.0086, + "step": 496900 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001067906402855506, + "loss": 0.0099, + "step": 496910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010678675206917914, + "loss": 0.0096, + "step": 496920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010678286385280767, + "loss": 0.0104, + "step": 496930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010677897563643621, + "loss": 0.0099, + "step": 496940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010677508742006474, + "loss": 0.0124, + "step": 496950 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010677119920369327, + "loss": 0.0116, + "step": 496960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010676731098732181, + "loss": 0.0104, + "step": 496970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010676342277095034, + "loss": 0.0131, + "step": 496980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010675953455457889, + "loss": 0.0099, + "step": 496990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010675564633820742, + "loss": 0.0082, + "step": 497000 + }, + { + "epoch": 1.29, + "eval_cer": 0.881657897941274, + "eval_loss": 0.006887293886393309, + "eval_runtime": 108.0582, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 497000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010675175812183596, + "loss": 0.0097, + "step": 497010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010674786990546449, + "loss": 0.0097, + "step": 497020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010674398168909303, + "loss": 0.01, + "step": 497030 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010674009347272156, + "loss": 0.011, + "step": 497040 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001067362052563501, + "loss": 0.0094, + "step": 497050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010673231703997863, + "loss": 0.0088, + "step": 497060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010672842882360717, + "loss": 0.0109, + "step": 497070 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001067245406072357, + "loss": 0.0114, + "step": 497080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010672065239086424, + "loss": 0.0101, + "step": 497090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010671676417449277, + "loss": 0.011, + "step": 497100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010671287595812131, + "loss": 0.01, + "step": 497110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010670898774174984, + "loss": 0.024, + "step": 497120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010670509952537838, + "loss": 0.011, + "step": 497130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010670121130900691, + "loss": 0.0094, + "step": 497140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010669732309263546, + "loss": 0.0108, + "step": 497150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010669343487626398, + "loss": 0.0074, + "step": 497160 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010668954665989253, + "loss": 0.0088, + "step": 497170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010668565844352106, + "loss": 0.0114, + "step": 497180 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066817702271496, + "loss": 0.0072, + "step": 497190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010667788201077813, + "loss": 0.0092, + "step": 497200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010667399379440666, + "loss": 0.0104, + "step": 497210 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066701055780352, + "loss": 0.0128, + "step": 497220 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010666621736166373, + "loss": 0.0117, + "step": 497230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010666232914529227, + "loss": 0.0088, + "step": 497240 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066584409289208, + "loss": 0.0107, + "step": 497250 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010665455271254934, + "loss": 0.0105, + "step": 497260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010665066449617787, + "loss": 0.0089, + "step": 497270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010664677627980641, + "loss": 0.0091, + "step": 497280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010664288806343494, + "loss": 0.0094, + "step": 497290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010663899984706348, + "loss": 0.0107, + "step": 497300 + }, + { + "epoch": 1.29, + "learning_rate": 0.000106635111630692, + "loss": 0.0105, + "step": 497310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010663122341432055, + "loss": 0.0134, + "step": 497320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010662733519794908, + "loss": 0.0085, + "step": 497330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010662344698157763, + "loss": 0.0091, + "step": 497340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010661955876520616, + "loss": 0.0109, + "step": 497350 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066156705488347, + "loss": 0.0122, + "step": 497360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010661178233246323, + "loss": 0.0096, + "step": 497370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010660789411609177, + "loss": 0.0124, + "step": 497380 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001066040058997203, + "loss": 0.0126, + "step": 497390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010660011768334884, + "loss": 0.0088, + "step": 497400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010659622946697737, + "loss": 0.0094, + "step": 497410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010659234125060591, + "loss": 0.0132, + "step": 497420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010658845303423444, + "loss": 0.0093, + "step": 497430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010658456481786298, + "loss": 0.0119, + "step": 497440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010658067660149151, + "loss": 0.0106, + "step": 497450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010657678838512004, + "loss": 0.008, + "step": 497460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010657290016874858, + "loss": 0.0126, + "step": 497470 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001065690119523771, + "loss": 0.0118, + "step": 497480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010656512373600565, + "loss": 0.0107, + "step": 497490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010656123551963418, + "loss": 0.0111, + "step": 497500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010655734730326273, + "loss": 0.0104, + "step": 497510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010655345908689125, + "loss": 0.0101, + "step": 497520 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001065495708705198, + "loss": 0.0111, + "step": 497530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010654568265414833, + "loss": 0.0109, + "step": 497540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010654179443777687, + "loss": 0.0082, + "step": 497550 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001065379062214054, + "loss": 0.0094, + "step": 497560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010653401800503394, + "loss": 0.0098, + "step": 497570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010653012978866247, + "loss": 0.0154, + "step": 497580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010652624157229101, + "loss": 0.0121, + "step": 497590 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010652235335591954, + "loss": 0.0124, + "step": 497600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010651846513954808, + "loss": 0.0085, + "step": 497610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010651457692317661, + "loss": 0.0077, + "step": 497620 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010651068870680515, + "loss": 0.0105, + "step": 497630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010650680049043368, + "loss": 0.0107, + "step": 497640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010650291227406222, + "loss": 0.0113, + "step": 497650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010649902405769075, + "loss": 0.0109, + "step": 497660 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001064951358413193, + "loss": 0.0105, + "step": 497670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010649124762494782, + "loss": 0.0097, + "step": 497680 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010648735940857637, + "loss": 0.0099, + "step": 497690 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001064834711922049, + "loss": 0.0098, + "step": 497700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010647958297583343, + "loss": 0.0091, + "step": 497710 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010647569475946197, + "loss": 0.0095, + "step": 497720 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001064718065430905, + "loss": 0.0151, + "step": 497730 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010646791832671904, + "loss": 0.0129, + "step": 497740 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010646403011034757, + "loss": 0.0085, + "step": 497750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010646014189397611, + "loss": 0.0123, + "step": 497760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010645625367760464, + "loss": 0.0091, + "step": 497770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010645236546123318, + "loss": 0.0091, + "step": 497780 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644847724486171, + "loss": 0.0086, + "step": 497790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644458902849025, + "loss": 0.008, + "step": 497800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010644070081211878, + "loss": 0.0093, + "step": 497810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010643681259574732, + "loss": 0.0064, + "step": 497820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010643292437937585, + "loss": 0.0117, + "step": 497830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010642903616300439, + "loss": 0.0109, + "step": 497840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010642514794663292, + "loss": 0.0098, + "step": 497850 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010642125973026147, + "loss": 0.0084, + "step": 497860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010641737151389, + "loss": 0.0085, + "step": 497870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010641348329751854, + "loss": 0.0117, + "step": 497880 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010640959508114707, + "loss": 0.0088, + "step": 497890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010640570686477561, + "loss": 0.0092, + "step": 497900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010640181864840414, + "loss": 0.0115, + "step": 497910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010639793043203268, + "loss": 0.0121, + "step": 497920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010639404221566121, + "loss": 0.0092, + "step": 497930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010639015399928975, + "loss": 0.0122, + "step": 497940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010638626578291828, + "loss": 0.0075, + "step": 497950 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001063823775665468, + "loss": 0.0114, + "step": 497960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010637848935017535, + "loss": 0.0096, + "step": 497970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010637460113380388, + "loss": 0.0102, + "step": 497980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010637071291743242, + "loss": 0.0128, + "step": 497990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010636682470106095, + "loss": 0.0096, + "step": 498000 + }, + { + "epoch": 1.29, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.0066691674292087555, + "eval_runtime": 108.0801, + "eval_samples_per_second": 18.505, + "eval_steps_per_second": 4.626, + "step": 498000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010636293648468949, + "loss": 0.0116, + "step": 498010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635904826831802, + "loss": 0.0074, + "step": 498020 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635516005194657, + "loss": 0.0088, + "step": 498030 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010635127183557509, + "loss": 0.0076, + "step": 498040 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010634738361920364, + "loss": 0.0083, + "step": 498050 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010634349540283217, + "loss": 0.0153, + "step": 498060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010633960718646071, + "loss": 0.011, + "step": 498070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010633571897008924, + "loss": 0.0111, + "step": 498080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010633183075371778, + "loss": 0.0111, + "step": 498090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632794253734631, + "loss": 0.0113, + "step": 498100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632405432097485, + "loss": 0.0134, + "step": 498110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010632016610460338, + "loss": 0.016, + "step": 498120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010631627788823192, + "loss": 0.0103, + "step": 498130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010631238967186045, + "loss": 0.0112, + "step": 498140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010630850145548899, + "loss": 0.0106, + "step": 498150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010630461323911752, + "loss": 0.0065, + "step": 498160 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010630072502274606, + "loss": 0.0101, + "step": 498170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010629683680637459, + "loss": 0.0105, + "step": 498180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010629294859000314, + "loss": 0.0108, + "step": 498190 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628906037363166, + "loss": 0.0082, + "step": 498200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628517215726018, + "loss": 0.0092, + "step": 498210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010628128394088874, + "loss": 0.01, + "step": 498220 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010627739572451727, + "loss": 0.0104, + "step": 498230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010627350750814581, + "loss": 0.0109, + "step": 498240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010626961929177434, + "loss": 0.0088, + "step": 498250 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010626573107540288, + "loss": 0.0097, + "step": 498260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010626184285903141, + "loss": 0.0098, + "step": 498270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625795464265995, + "loss": 0.0096, + "step": 498280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625406642628848, + "loss": 0.0103, + "step": 498290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010625017820991702, + "loss": 0.012, + "step": 498300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010624628999354555, + "loss": 0.0104, + "step": 498310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010624240177717409, + "loss": 0.0114, + "step": 498320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010623851356080262, + "loss": 0.0084, + "step": 498330 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010623462534443116, + "loss": 0.0129, + "step": 498340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010623073712805969, + "loss": 0.0117, + "step": 498350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010622684891168823, + "loss": 0.0112, + "step": 498360 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010622296069531676, + "loss": 0.0125, + "step": 498370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010621907247894531, + "loss": 0.0104, + "step": 498380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010621518426257384, + "loss": 0.0122, + "step": 498390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010621129604620238, + "loss": 0.0116, + "step": 498400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010620740782983091, + "loss": 0.0092, + "step": 498410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010620351961345945, + "loss": 0.0103, + "step": 498420 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619963139708798, + "loss": 0.0108, + "step": 498430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619574318071652, + "loss": 0.0083, + "step": 498440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010619185496434505, + "loss": 0.0107, + "step": 498450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010618796674797358, + "loss": 0.0098, + "step": 498460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010618407853160212, + "loss": 0.0102, + "step": 498470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010618019031523065, + "loss": 0.0091, + "step": 498480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010617630209885919, + "loss": 0.0104, + "step": 498490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010617241388248772, + "loss": 0.0105, + "step": 498500 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616852566611626, + "loss": 0.012, + "step": 498510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616463744974479, + "loss": 0.0097, + "step": 498520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010616074923337333, + "loss": 0.0135, + "step": 498530 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010615686101700186, + "loss": 0.0111, + "step": 498540 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001061529728006304, + "loss": 0.0118, + "step": 498550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010614908458425893, + "loss": 0.0097, + "step": 498560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010614519636788748, + "loss": 0.0099, + "step": 498570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010614130815151601, + "loss": 0.0139, + "step": 498580 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010613741993514455, + "loss": 0.0133, + "step": 498590 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010613353171877308, + "loss": 0.0138, + "step": 498600 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010612964350240162, + "loss": 0.0097, + "step": 498610 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010612575528603015, + "loss": 0.0084, + "step": 498620 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010612186706965869, + "loss": 0.0085, + "step": 498630 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010611797885328722, + "loss": 0.0107, + "step": 498640 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010611409063691576, + "loss": 0.0094, + "step": 498650 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010611020242054429, + "loss": 0.0112, + "step": 498660 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010610631420417283, + "loss": 0.009, + "step": 498670 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010610242598780136, + "loss": 0.0077, + "step": 498680 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060985377714299, + "loss": 0.0099, + "step": 498690 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010609464955505843, + "loss": 0.0135, + "step": 498700 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010609076133868695, + "loss": 0.0118, + "step": 498710 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060868731223155, + "loss": 0.0094, + "step": 498720 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010608298490594402, + "loss": 0.015, + "step": 498730 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010607909668957258, + "loss": 0.01, + "step": 498740 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060752084732011, + "loss": 0.0088, + "step": 498750 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010607132025682965, + "loss": 0.0102, + "step": 498760 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010606743204045818, + "loss": 0.0114, + "step": 498770 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010606354382408672, + "loss": 0.0105, + "step": 498780 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010605965560771525, + "loss": 0.0139, + "step": 498790 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010605576739134379, + "loss": 0.0105, + "step": 498800 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010605187917497232, + "loss": 0.0109, + "step": 498810 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604799095860086, + "loss": 0.0125, + "step": 498820 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604410274222939, + "loss": 0.0097, + "step": 498830 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010604021452585793, + "loss": 0.0115, + "step": 498840 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010603632630948646, + "loss": 0.011, + "step": 498850 + }, + { + "epoch": 1.29, + "learning_rate": 0.000106032438093115, + "loss": 0.0103, + "step": 498860 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010602854987674353, + "loss": 0.0106, + "step": 498870 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010602466166037207, + "loss": 0.0089, + "step": 498880 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001060207734440006, + "loss": 0.0096, + "step": 498890 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010601688522762915, + "loss": 0.0126, + "step": 498900 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010601299701125767, + "loss": 0.0119, + "step": 498910 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600910879488622, + "loss": 0.0086, + "step": 498920 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600522057851475, + "loss": 0.0106, + "step": 498930 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010600133236214329, + "loss": 0.0085, + "step": 498940 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010599744414577182, + "loss": 0.0095, + "step": 498950 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010599355592940035, + "loss": 0.0088, + "step": 498960 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010598966771302889, + "loss": 0.0081, + "step": 498970 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010598577949665742, + "loss": 0.0107, + "step": 498980 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010598189128028596, + "loss": 0.0129, + "step": 498990 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597800306391449, + "loss": 0.0127, + "step": 499000 + }, + { + "epoch": 1.29, + "eval_cer": 0.8816467008458005, + "eval_loss": 0.006797228939831257, + "eval_runtime": 108.108, + "eval_samples_per_second": 18.5, + "eval_steps_per_second": 4.625, + "step": 499000 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597411484754303, + "loss": 0.011, + "step": 499010 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010597022663117156, + "loss": 0.0117, + "step": 499020 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059663384148001, + "loss": 0.0096, + "step": 499030 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010596245019842863, + "loss": 0.0089, + "step": 499040 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010595856198205717, + "loss": 0.0096, + "step": 499050 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059546737656857, + "loss": 0.0102, + "step": 499060 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010595078554931424, + "loss": 0.0096, + "step": 499070 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010594689733294276, + "loss": 0.0119, + "step": 499080 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010594300911657132, + "loss": 0.0077, + "step": 499090 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010593912090019985, + "loss": 0.01, + "step": 499100 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010593523268382839, + "loss": 0.0111, + "step": 499110 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010593134446745692, + "loss": 0.0111, + "step": 499120 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010592745625108546, + "loss": 0.0084, + "step": 499130 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010592356803471399, + "loss": 0.0091, + "step": 499140 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010591967981834253, + "loss": 0.0127, + "step": 499150 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010591579160197106, + "loss": 0.0105, + "step": 499160 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059119033855996, + "loss": 0.0111, + "step": 499170 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010590801516922813, + "loss": 0.0137, + "step": 499180 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010590412695285667, + "loss": 0.0119, + "step": 499190 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001059002387364852, + "loss": 0.0086, + "step": 499200 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010589635052011372, + "loss": 0.0134, + "step": 499210 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010589246230374227, + "loss": 0.0103, + "step": 499220 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001058885740873708, + "loss": 0.0083, + "step": 499230 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010588468587099934, + "loss": 0.0098, + "step": 499240 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010588079765462786, + "loss": 0.0113, + "step": 499250 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010587690943825642, + "loss": 0.0101, + "step": 499260 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010587302122188493, + "loss": 0.0085, + "step": 499270 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010586913300551349, + "loss": 0.0101, + "step": 499280 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010586524478914202, + "loss": 0.0098, + "step": 499290 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010586135657277056, + "loss": 0.0124, + "step": 499300 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585746835639909, + "loss": 0.01, + "step": 499310 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010585358014002763, + "loss": 0.0095, + "step": 499320 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010584969192365616, + "loss": 0.0089, + "step": 499330 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001058458037072847, + "loss": 0.0095, + "step": 499340 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010584191549091323, + "loss": 0.0089, + "step": 499350 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010583802727454177, + "loss": 0.0083, + "step": 499360 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001058341390581703, + "loss": 0.0085, + "step": 499370 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010583025084179884, + "loss": 0.0094, + "step": 499380 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010582636262542737, + "loss": 0.0106, + "step": 499390 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010582247440905591, + "loss": 0.0128, + "step": 499400 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010581858619268444, + "loss": 0.008, + "step": 499410 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010581469797631299, + "loss": 0.0118, + "step": 499420 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001058108097599415, + "loss": 0.0124, + "step": 499430 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010580692154357003, + "loss": 0.0083, + "step": 499440 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010580303332719859, + "loss": 0.0074, + "step": 499450 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010579914511082712, + "loss": 0.009, + "step": 499460 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010579525689445566, + "loss": 0.0092, + "step": 499470 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010579136867808419, + "loss": 0.0126, + "step": 499480 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010578748046171273, + "loss": 0.0093, + "step": 499490 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010578359224534126, + "loss": 0.0138, + "step": 499500 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057797040289698, + "loss": 0.0097, + "step": 499510 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010577581581259833, + "loss": 0.0082, + "step": 499520 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010577192759622687, + "loss": 0.0108, + "step": 499530 + }, + { + "epoch": 1.29, + "learning_rate": 0.0001057680393798554, + "loss": 0.0114, + "step": 499540 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010576415116348394, + "loss": 0.0112, + "step": 499550 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010576026294711247, + "loss": 0.0108, + "step": 499560 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010575637473074101, + "loss": 0.0093, + "step": 499570 + }, + { + "epoch": 1.29, + "learning_rate": 0.00010575248651436954, + "loss": 0.0093, + "step": 499580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010574859829799808, + "loss": 0.0094, + "step": 499590 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001057447100816266, + "loss": 0.0101, + "step": 499600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010574082186525516, + "loss": 0.007, + "step": 499610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010573693364888369, + "loss": 0.0096, + "step": 499620 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010573304543251223, + "loss": 0.0084, + "step": 499630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010572915721614076, + "loss": 0.0071, + "step": 499640 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001057252689997693, + "loss": 0.0102, + "step": 499650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010572138078339783, + "loss": 0.0114, + "step": 499660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010571749256702637, + "loss": 0.0108, + "step": 499670 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001057136043506549, + "loss": 0.0093, + "step": 499680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010570971613428343, + "loss": 0.0112, + "step": 499690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010570582791791197, + "loss": 0.0078, + "step": 499700 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001057019397015405, + "loss": 0.0098, + "step": 499710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010569805148516904, + "loss": 0.0111, + "step": 499720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010569416326879756, + "loss": 0.0096, + "step": 499730 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056902750524261, + "loss": 0.0115, + "step": 499740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010568638683605463, + "loss": 0.0062, + "step": 499750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010568249861968318, + "loss": 0.0081, + "step": 499760 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056786104033117, + "loss": 0.0132, + "step": 499770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010567472218694025, + "loss": 0.013, + "step": 499780 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010567083397056877, + "loss": 0.0087, + "step": 499790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010566694575419733, + "loss": 0.0095, + "step": 499800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010566305753782586, + "loss": 0.0075, + "step": 499810 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056591693214544, + "loss": 0.0078, + "step": 499820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010565528110508293, + "loss": 0.0104, + "step": 499830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010565139288871147, + "loss": 0.0121, + "step": 499840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010564750467234, + "loss": 0.0106, + "step": 499850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010564361645596854, + "loss": 0.0132, + "step": 499860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563972823959707, + "loss": 0.0079, + "step": 499870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563584002322561, + "loss": 0.0106, + "step": 499880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010563195180685414, + "loss": 0.0101, + "step": 499890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010562806359048268, + "loss": 0.0104, + "step": 499900 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056241753741112, + "loss": 0.0111, + "step": 499910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010562028715773975, + "loss": 0.0105, + "step": 499920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010561639894136828, + "loss": 0.0103, + "step": 499930 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001056125107249968, + "loss": 0.0106, + "step": 499940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010560862250862535, + "loss": 0.0145, + "step": 499950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010560473429225387, + "loss": 0.0126, + "step": 499960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010560084607588243, + "loss": 0.0132, + "step": 499970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010559695785951096, + "loss": 0.0125, + "step": 499980 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055930696431395, + "loss": 0.0102, + "step": 499990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010558918142676803, + "loss": 0.0084, + "step": 500000 + }, + { + "epoch": 1.3, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.006844638846814632, + "eval_runtime": 107.9782, + "eval_samples_per_second": 18.522, + "eval_steps_per_second": 4.631, + "step": 500000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010558529321039657, + "loss": 0.0109, + "step": 500010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055814049940251, + "loss": 0.0125, + "step": 500020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010557751677765364, + "loss": 0.0096, + "step": 500030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010557362856128217, + "loss": 0.0089, + "step": 500040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010556974034491071, + "loss": 0.0113, + "step": 500050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010556585212853924, + "loss": 0.0097, + "step": 500060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010556196391216778, + "loss": 0.0098, + "step": 500070 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055580756957963, + "loss": 0.0094, + "step": 500080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010555418747942485, + "loss": 0.0122, + "step": 500090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010555029926305338, + "loss": 0.0096, + "step": 500100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010554641104668192, + "loss": 0.0077, + "step": 500110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010554252283031044, + "loss": 0.0099, + "step": 500120 + }, + { + "epoch": 1.3, + "learning_rate": 0.000105538634613939, + "loss": 0.01, + "step": 500130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010553474639756751, + "loss": 0.0127, + "step": 500140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010553085818119607, + "loss": 0.01, + "step": 500150 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055269699648246, + "loss": 0.0094, + "step": 500160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010552308174845314, + "loss": 0.0077, + "step": 500170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010551919353208167, + "loss": 0.0128, + "step": 500180 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001055153053157102, + "loss": 0.0099, + "step": 500190 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010551141709933874, + "loss": 0.0079, + "step": 500200 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010550752888296727, + "loss": 0.013, + "step": 500210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010550364066659581, + "loss": 0.011, + "step": 500220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010549975245022434, + "loss": 0.0083, + "step": 500230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010549586423385288, + "loss": 0.011, + "step": 500240 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001054919760174814, + "loss": 0.0077, + "step": 500250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548808780110995, + "loss": 0.0109, + "step": 500260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548419958473847, + "loss": 0.0102, + "step": 500270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010548031136836702, + "loss": 0.0095, + "step": 500280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010547642315199554, + "loss": 0.0123, + "step": 500290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010547253493562409, + "loss": 0.011, + "step": 500300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010546864671925261, + "loss": 0.0111, + "step": 500310 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010546475850288117, + "loss": 0.0099, + "step": 500320 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001054608702865097, + "loss": 0.0086, + "step": 500330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010545698207013824, + "loss": 0.0092, + "step": 500340 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010545309385376677, + "loss": 0.0095, + "step": 500350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544920563739531, + "loss": 0.0098, + "step": 500360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544531742102384, + "loss": 0.0108, + "step": 500370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010544142920465238, + "loss": 0.0105, + "step": 500380 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001054375409882809, + "loss": 0.0136, + "step": 500390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010543365277190945, + "loss": 0.0123, + "step": 500400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010542976455553798, + "loss": 0.0067, + "step": 500410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010542587633916652, + "loss": 0.0099, + "step": 500420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010542198812279505, + "loss": 0.0106, + "step": 500430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541809990642357, + "loss": 0.0099, + "step": 500440 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541421169005212, + "loss": 0.0127, + "step": 500450 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010541032347368064, + "loss": 0.0116, + "step": 500460 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010540643525730919, + "loss": 0.0116, + "step": 500470 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010540254704093771, + "loss": 0.011, + "step": 500480 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010539865882456627, + "loss": 0.0084, + "step": 500490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010539477060819478, + "loss": 0.0104, + "step": 500500 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010539088239182334, + "loss": 0.0099, + "step": 500510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010538699417545187, + "loss": 0.0098, + "step": 500520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010538310595908041, + "loss": 0.0112, + "step": 500530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010537921774270894, + "loss": 0.0126, + "step": 500540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010537532952633748, + "loss": 0.0085, + "step": 500550 + }, + { + "epoch": 1.3, + "learning_rate": 0.000105371441309966, + "loss": 0.0126, + "step": 500560 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010536755309359455, + "loss": 0.0088, + "step": 500570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010536366487722308, + "loss": 0.0141, + "step": 500580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010535977666085162, + "loss": 0.0113, + "step": 500590 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010535588844448015, + "loss": 0.0109, + "step": 500600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010535200022810869, + "loss": 0.0133, + "step": 500610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010534811201173721, + "loss": 0.0102, + "step": 500620 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010534422379536576, + "loss": 0.0086, + "step": 500630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010534033557899428, + "loss": 0.0124, + "step": 500640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010533644736262284, + "loss": 0.0112, + "step": 500650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010533255914625135, + "loss": 0.0096, + "step": 500660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532867092987991, + "loss": 0.0114, + "step": 500670 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532478271350844, + "loss": 0.0112, + "step": 500680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010532089449713697, + "loss": 0.0105, + "step": 500690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010531700628076551, + "loss": 0.0094, + "step": 500700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010531311806439404, + "loss": 0.0086, + "step": 500710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010530922984802258, + "loss": 0.0118, + "step": 500720 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001053053416316511, + "loss": 0.0108, + "step": 500730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010530145341527965, + "loss": 0.0118, + "step": 500740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010529756519890817, + "loss": 0.0084, + "step": 500750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010529367698253672, + "loss": 0.0105, + "step": 500760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010528978876616524, + "loss": 0.0104, + "step": 500770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010528590054979379, + "loss": 0.0124, + "step": 500780 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010528201233342231, + "loss": 0.0106, + "step": 500790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010527812411705086, + "loss": 0.0108, + "step": 500800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010527423590067938, + "loss": 0.0101, + "step": 500810 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010527034768430793, + "loss": 0.0156, + "step": 500820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010526645946793645, + "loss": 0.0085, + "step": 500830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010526257125156501, + "loss": 0.0102, + "step": 500840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010525868303519354, + "loss": 0.0099, + "step": 500850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010525479481882208, + "loss": 0.0102, + "step": 500860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010525090660245061, + "loss": 0.0096, + "step": 500870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010524701838607915, + "loss": 0.0093, + "step": 500880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010524313016970768, + "loss": 0.0103, + "step": 500890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523924195333622, + "loss": 0.0117, + "step": 500900 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523535373696475, + "loss": 0.0115, + "step": 500910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010523146552059329, + "loss": 0.0101, + "step": 500920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010522757730422182, + "loss": 0.0117, + "step": 500930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010522368908785034, + "loss": 0.0111, + "step": 500940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010521980087147889, + "loss": 0.0111, + "step": 500950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010521591265510741, + "loss": 0.01, + "step": 500960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010521202443873596, + "loss": 0.0098, + "step": 500970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520813622236448, + "loss": 0.0097, + "step": 500980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520424800599303, + "loss": 0.0117, + "step": 500990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010520035978962155, + "loss": 0.0122, + "step": 501000 + }, + { + "epoch": 1.3, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.0065152887254953384, + "eval_runtime": 107.805, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, + "step": 501000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010519647157325011, + "loss": 0.0084, + "step": 501010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010519258335687862, + "loss": 0.0108, + "step": 501020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010518869514050718, + "loss": 0.01, + "step": 501030 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051848069241357, + "loss": 0.0146, + "step": 501040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010518091870776425, + "loss": 0.0115, + "step": 501050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010517703049139278, + "loss": 0.0106, + "step": 501060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010517314227502132, + "loss": 0.0098, + "step": 501070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516925405864985, + "loss": 0.0124, + "step": 501080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516536584227839, + "loss": 0.0086, + "step": 501090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010516147762590692, + "loss": 0.008, + "step": 501100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010515758940953546, + "loss": 0.0105, + "step": 501110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010515370119316399, + "loss": 0.0118, + "step": 501120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010514981297679253, + "loss": 0.0119, + "step": 501130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010514592476042105, + "loss": 0.0084, + "step": 501140 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051420365440496, + "loss": 0.0113, + "step": 501150 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010513814832767812, + "loss": 0.0083, + "step": 501160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010513426011130667, + "loss": 0.0116, + "step": 501170 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051303718949352, + "loss": 0.0102, + "step": 501180 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010512648367856372, + "loss": 0.011, + "step": 501190 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010512259546219228, + "loss": 0.008, + "step": 501200 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001051187072458208, + "loss": 0.0085, + "step": 501210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010511481902944935, + "loss": 0.0105, + "step": 501220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010511093081307788, + "loss": 0.0126, + "step": 501230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010510704259670642, + "loss": 0.0116, + "step": 501240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010510315438033495, + "loss": 0.0083, + "step": 501250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010509926616396349, + "loss": 0.0099, + "step": 501260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010509537794759201, + "loss": 0.0115, + "step": 501270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010509148973122056, + "loss": 0.0086, + "step": 501280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010508760151484908, + "loss": 0.0089, + "step": 501290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010508371329847763, + "loss": 0.0105, + "step": 501300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010507982508210615, + "loss": 0.009, + "step": 501310 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001050759368657347, + "loss": 0.0099, + "step": 501320 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010507204864936322, + "loss": 0.0118, + "step": 501330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010506816043299177, + "loss": 0.0126, + "step": 501340 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001050642722166203, + "loss": 0.0077, + "step": 501350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010506038400024885, + "loss": 0.0099, + "step": 501360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010505649578387736, + "loss": 0.0088, + "step": 501370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010505260756750592, + "loss": 0.0087, + "step": 501380 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504871935113445, + "loss": 0.0088, + "step": 501390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504483113476299, + "loss": 0.0084, + "step": 501400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010504094291839152, + "loss": 0.0068, + "step": 501410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010503705470202006, + "loss": 0.0103, + "step": 501420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010503316648564859, + "loss": 0.0088, + "step": 501430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010502927826927711, + "loss": 0.0127, + "step": 501440 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010502539005290566, + "loss": 0.0101, + "step": 501450 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010502150183653418, + "loss": 0.0135, + "step": 501460 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010501761362016273, + "loss": 0.0108, + "step": 501470 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010501372540379125, + "loss": 0.0091, + "step": 501480 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001050098371874198, + "loss": 0.0091, + "step": 501490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010500594897104832, + "loss": 0.0094, + "step": 501500 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010500206075467687, + "loss": 0.0084, + "step": 501510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010499817253830539, + "loss": 0.0117, + "step": 501520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010499428432193393, + "loss": 0.0085, + "step": 501530 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010499039610556246, + "loss": 0.0105, + "step": 501540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010498650788919102, + "loss": 0.0085, + "step": 501550 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010498261967281955, + "loss": 0.0085, + "step": 501560 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010497873145644809, + "loss": 0.0097, + "step": 501570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010497484324007662, + "loss": 0.0085, + "step": 501580 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010497095502370516, + "loss": 0.0126, + "step": 501590 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010496706680733369, + "loss": 0.0092, + "step": 501600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010496317859096223, + "loss": 0.0085, + "step": 501610 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010495929037459076, + "loss": 0.0077, + "step": 501620 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049554021582193, + "loss": 0.0108, + "step": 501630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010495151394184783, + "loss": 0.0121, + "step": 501640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010494762572547637, + "loss": 0.0107, + "step": 501650 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001049437375091049, + "loss": 0.0123, + "step": 501660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010493984929273344, + "loss": 0.0105, + "step": 501670 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010493596107636196, + "loss": 0.0099, + "step": 501680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010493207285999049, + "loss": 0.0125, + "step": 501690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010492818464361903, + "loss": 0.0102, + "step": 501700 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010492429642724756, + "loss": 0.0081, + "step": 501710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010492040821087612, + "loss": 0.0108, + "step": 501720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010491651999450463, + "loss": 0.017, + "step": 501730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010491263177813319, + "loss": 0.0109, + "step": 501740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010490874356176172, + "loss": 0.0096, + "step": 501750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010490485534539026, + "loss": 0.0103, + "step": 501760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010490096712901879, + "loss": 0.0114, + "step": 501770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010489707891264733, + "loss": 0.0103, + "step": 501780 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010489319069627585, + "loss": 0.0082, + "step": 501790 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048893024799044, + "loss": 0.0106, + "step": 501800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010488541426353292, + "loss": 0.0112, + "step": 501810 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010488152604716147, + "loss": 0.0092, + "step": 501820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010487763783079, + "loss": 0.0093, + "step": 501830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010487374961441854, + "loss": 0.0091, + "step": 501840 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010486986139804706, + "loss": 0.0118, + "step": 501850 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048659731816756, + "loss": 0.0078, + "step": 501860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010486208496530413, + "loss": 0.0066, + "step": 501870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010485819674893269, + "loss": 0.0106, + "step": 501880 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048543085325612, + "loss": 0.0109, + "step": 501890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010485042031618976, + "loss": 0.0121, + "step": 501900 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010484653209981829, + "loss": 0.0088, + "step": 501910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010484264388344681, + "loss": 0.0098, + "step": 501920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010483875566707536, + "loss": 0.01, + "step": 501930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010483486745070388, + "loss": 0.0083, + "step": 501940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010483097923433243, + "loss": 0.011, + "step": 501950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010482709101796095, + "loss": 0.011, + "step": 501960 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048232028015895, + "loss": 0.0086, + "step": 501970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010481931458521802, + "loss": 0.0094, + "step": 501980 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010481542636884657, + "loss": 0.0152, + "step": 501990 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001048115381524751, + "loss": 0.0114, + "step": 502000 + }, + { + "epoch": 1.3, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.006790985353291035, + "eval_runtime": 107.9811, + "eval_samples_per_second": 18.522, + "eval_steps_per_second": 4.63, + "step": 502000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010480764993610364, + "loss": 0.0103, + "step": 502010 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010480376171973216, + "loss": 0.0105, + "step": 502020 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047998735033607, + "loss": 0.0098, + "step": 502030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010479598528698923, + "loss": 0.0104, + "step": 502040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010479209707061777, + "loss": 0.009, + "step": 502050 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047882088542463, + "loss": 0.0087, + "step": 502060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010478432063787486, + "loss": 0.0098, + "step": 502070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010478043242150339, + "loss": 0.0089, + "step": 502080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010477654420513193, + "loss": 0.0086, + "step": 502090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010477265598876046, + "loss": 0.0145, + "step": 502100 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104768767772389, + "loss": 0.0072, + "step": 502110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010476487955601753, + "loss": 0.009, + "step": 502120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010476099133964607, + "loss": 0.0082, + "step": 502130 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047571031232746, + "loss": 0.0123, + "step": 502140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010475321490690314, + "loss": 0.0098, + "step": 502150 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010474932669053166, + "loss": 0.0107, + "step": 502160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010474543847416019, + "loss": 0.0101, + "step": 502170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010474155025778873, + "loss": 0.0104, + "step": 502180 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010473766204141726, + "loss": 0.013, + "step": 502190 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047337738250458, + "loss": 0.0089, + "step": 502200 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010472988560867433, + "loss": 0.0108, + "step": 502210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010472599739230287, + "loss": 0.0119, + "step": 502220 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047221091759314, + "loss": 0.009, + "step": 502230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010471822095955996, + "loss": 0.0118, + "step": 502240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010471433274318847, + "loss": 0.0121, + "step": 502250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010471044452681703, + "loss": 0.0085, + "step": 502260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010470655631044556, + "loss": 0.0124, + "step": 502270 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001047026680940741, + "loss": 0.0105, + "step": 502280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010469877987770262, + "loss": 0.0106, + "step": 502290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010469489166133117, + "loss": 0.0119, + "step": 502300 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046910034449597, + "loss": 0.0099, + "step": 502310 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010468711522858824, + "loss": 0.0085, + "step": 502320 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010468322701221676, + "loss": 0.0082, + "step": 502330 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046793387958453, + "loss": 0.0123, + "step": 502340 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010467545057947383, + "loss": 0.0113, + "step": 502350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010467156236310238, + "loss": 0.0102, + "step": 502360 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046676741467309, + "loss": 0.0111, + "step": 502370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010466378593035945, + "loss": 0.01, + "step": 502380 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010465989771398797, + "loss": 0.0118, + "step": 502390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010465600949761653, + "loss": 0.0089, + "step": 502400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010465212128124504, + "loss": 0.011, + "step": 502410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464823306487357, + "loss": 0.0096, + "step": 502420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464434484850213, + "loss": 0.0119, + "step": 502430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010464045663213065, + "loss": 0.0087, + "step": 502440 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046365684157592, + "loss": 0.0103, + "step": 502450 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010463268019938772, + "loss": 0.0089, + "step": 502460 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010462879198301627, + "loss": 0.0117, + "step": 502470 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046249037666448, + "loss": 0.0089, + "step": 502480 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010462101555027334, + "loss": 0.0109, + "step": 502490 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010461712733390186, + "loss": 0.011, + "step": 502500 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001046132391175304, + "loss": 0.0072, + "step": 502510 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010460935090115893, + "loss": 0.0109, + "step": 502520 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010460546268478748, + "loss": 0.0084, + "step": 502530 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104601574468416, + "loss": 0.0152, + "step": 502540 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010459768625204454, + "loss": 0.0097, + "step": 502550 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010459379803567307, + "loss": 0.0092, + "step": 502560 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010458990981930161, + "loss": 0.0122, + "step": 502570 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010458602160293014, + "loss": 0.009, + "step": 502580 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045821333865587, + "loss": 0.0099, + "step": 502590 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010457824517018723, + "loss": 0.0098, + "step": 502600 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010457435695381577, + "loss": 0.0121, + "step": 502610 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045704687374443, + "loss": 0.0081, + "step": 502620 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010456658052107284, + "loss": 0.0068, + "step": 502630 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010456269230470137, + "loss": 0.0142, + "step": 502640 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010455880408832991, + "loss": 0.012, + "step": 502650 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010455491587195844, + "loss": 0.0098, + "step": 502660 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010455102765558696, + "loss": 0.0092, + "step": 502670 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045471394392155, + "loss": 0.0089, + "step": 502680 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010454325122284403, + "loss": 0.0108, + "step": 502690 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010453936300647257, + "loss": 0.0111, + "step": 502700 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045354747901011, + "loss": 0.0105, + "step": 502710 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010453158657372964, + "loss": 0.0118, + "step": 502720 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010452769835735817, + "loss": 0.0106, + "step": 502730 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010452381014098671, + "loss": 0.0108, + "step": 502740 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451992192461524, + "loss": 0.0102, + "step": 502750 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451603370824378, + "loss": 0.0103, + "step": 502760 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010451214549187231, + "loss": 0.0169, + "step": 502770 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010450825727550087, + "loss": 0.0117, + "step": 502780 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001045043690591294, + "loss": 0.0157, + "step": 502790 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010450048084275794, + "loss": 0.0121, + "step": 502800 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010449659262638646, + "loss": 0.0102, + "step": 502810 + }, + { + "epoch": 1.3, + "learning_rate": 0.000104492704410015, + "loss": 0.0109, + "step": 502820 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010448881619364353, + "loss": 0.0092, + "step": 502830 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010448492797727208, + "loss": 0.0107, + "step": 502840 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044810397609006, + "loss": 0.0104, + "step": 502850 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010447715154452915, + "loss": 0.0093, + "step": 502860 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010447326332815767, + "loss": 0.0103, + "step": 502870 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010446937511178622, + "loss": 0.0076, + "step": 502880 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010446548689541474, + "loss": 0.0085, + "step": 502890 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010446159867904329, + "loss": 0.0088, + "step": 502900 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010445771046267181, + "loss": 0.0108, + "step": 502910 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010445382224630034, + "loss": 0.0078, + "step": 502920 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010444993402992888, + "loss": 0.0086, + "step": 502930 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010444604581355741, + "loss": 0.0106, + "step": 502940 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010444215759718597, + "loss": 0.0129, + "step": 502950 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010443826938081448, + "loss": 0.0062, + "step": 502960 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010443438116444304, + "loss": 0.0105, + "step": 502970 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010443049294807156, + "loss": 0.0075, + "step": 502980 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044266047317001, + "loss": 0.0116, + "step": 502990 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010442271651532863, + "loss": 0.0093, + "step": 503000 + }, + { + "epoch": 1.3, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.006540039554238319, + "eval_runtime": 108.0994, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, + "step": 503000 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010441882829895718, + "loss": 0.0084, + "step": 503010 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001044149400825857, + "loss": 0.014, + "step": 503020 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010441105186621425, + "loss": 0.0129, + "step": 503030 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010440716364984277, + "loss": 0.013, + "step": 503040 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010440327543347132, + "loss": 0.0099, + "step": 503050 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439938721709984, + "loss": 0.0118, + "step": 503060 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439549900072838, + "loss": 0.0091, + "step": 503070 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010439161078435691, + "loss": 0.0107, + "step": 503080 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010438772256798545, + "loss": 0.0095, + "step": 503090 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010438383435161398, + "loss": 0.0118, + "step": 503100 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010437994613524254, + "loss": 0.0096, + "step": 503110 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010437605791887105, + "loss": 0.0104, + "step": 503120 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010437216970249961, + "loss": 0.0072, + "step": 503130 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010436828148612814, + "loss": 0.008, + "step": 503140 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010436439326975668, + "loss": 0.0105, + "step": 503150 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001043605050533852, + "loss": 0.0106, + "step": 503160 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010435661683701373, + "loss": 0.0093, + "step": 503170 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010435272862064228, + "loss": 0.0108, + "step": 503180 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001043488404042708, + "loss": 0.01, + "step": 503190 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010434495218789934, + "loss": 0.01, + "step": 503200 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010434106397152787, + "loss": 0.009, + "step": 503210 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010433717575515641, + "loss": 0.0089, + "step": 503220 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010433328753878494, + "loss": 0.0077, + "step": 503230 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010432939932241348, + "loss": 0.0091, + "step": 503240 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010432551110604201, + "loss": 0.0096, + "step": 503250 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010432162288967055, + "loss": 0.0109, + "step": 503260 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010431773467329908, + "loss": 0.0127, + "step": 503270 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010431384645692762, + "loss": 0.0117, + "step": 503280 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010430995824055615, + "loss": 0.0139, + "step": 503290 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010430607002418471, + "loss": 0.009, + "step": 503300 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010430218180781324, + "loss": 0.0119, + "step": 503310 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010429829359144178, + "loss": 0.0098, + "step": 503320 + }, + { + "epoch": 1.3, + "learning_rate": 0.0001042944053750703, + "loss": 0.0106, + "step": 503330 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010429051715869885, + "loss": 0.0118, + "step": 503340 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010428662894232737, + "loss": 0.0087, + "step": 503350 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010428274072595592, + "loss": 0.0106, + "step": 503360 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010427885250958444, + "loss": 0.0094, + "step": 503370 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010427496429321299, + "loss": 0.0093, + "step": 503380 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010427107607684151, + "loss": 0.0098, + "step": 503390 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010426718786047006, + "loss": 0.0106, + "step": 503400 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010426329964409858, + "loss": 0.0119, + "step": 503410 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010425941142772711, + "loss": 0.0104, + "step": 503420 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010425552321135565, + "loss": 0.0101, + "step": 503430 + }, + { + "epoch": 1.3, + "learning_rate": 0.00010425163499498418, + "loss": 0.0091, + "step": 503440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010424774677861272, + "loss": 0.0103, + "step": 503450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010424385856224125, + "loss": 0.0096, + "step": 503460 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001042399703458698, + "loss": 0.0093, + "step": 503470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010423608212949832, + "loss": 0.0107, + "step": 503480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010423219391312688, + "loss": 0.0198, + "step": 503490 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001042283056967554, + "loss": 0.0073, + "step": 503500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010422441748038395, + "loss": 0.0135, + "step": 503510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010422052926401247, + "loss": 0.0092, + "step": 503520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010421664104764102, + "loss": 0.0102, + "step": 503530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010421275283126954, + "loss": 0.01, + "step": 503540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420886461489809, + "loss": 0.0113, + "step": 503550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420497639852661, + "loss": 0.0134, + "step": 503560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010420108818215515, + "loss": 0.015, + "step": 503570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010419719996578368, + "loss": 0.0077, + "step": 503580 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010419331174941222, + "loss": 0.0106, + "step": 503590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010418942353304075, + "loss": 0.0094, + "step": 503600 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041855353166693, + "loss": 0.0093, + "step": 503610 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010418164710029782, + "loss": 0.0089, + "step": 503620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010417775888392638, + "loss": 0.0146, + "step": 503630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010417387066755489, + "loss": 0.009, + "step": 503640 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010416998245118345, + "loss": 0.0103, + "step": 503650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010416609423481198, + "loss": 0.0127, + "step": 503660 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041622060184405, + "loss": 0.0092, + "step": 503670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010415831780206905, + "loss": 0.0109, + "step": 503680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010415442958569757, + "loss": 0.0077, + "step": 503690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010415054136932611, + "loss": 0.0068, + "step": 503700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010414665315295464, + "loss": 0.0088, + "step": 503710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010414276493658318, + "loss": 0.01, + "step": 503720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010413887672021171, + "loss": 0.0068, + "step": 503730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010413498850384025, + "loss": 0.0071, + "step": 503740 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010413110028746878, + "loss": 0.0094, + "step": 503750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010412721207109732, + "loss": 0.0104, + "step": 503760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010412332385472585, + "loss": 0.0105, + "step": 503770 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001041194356383544, + "loss": 0.0077, + "step": 503780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010411554742198292, + "loss": 0.0097, + "step": 503790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010411165920561146, + "loss": 0.0101, + "step": 503800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010410777098923999, + "loss": 0.0104, + "step": 503810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010410388277286855, + "loss": 0.0122, + "step": 503820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010409999455649707, + "loss": 0.0079, + "step": 503830 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010409610634012562, + "loss": 0.0099, + "step": 503840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010409221812375414, + "loss": 0.0102, + "step": 503850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010408832990738269, + "loss": 0.0086, + "step": 503860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010408444169101121, + "loss": 0.0092, + "step": 503870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010408055347463976, + "loss": 0.0126, + "step": 503880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010407666525826828, + "loss": 0.0101, + "step": 503890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010407277704189683, + "loss": 0.0088, + "step": 503900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010406888882552535, + "loss": 0.0079, + "step": 503910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010406500060915388, + "loss": 0.0109, + "step": 503920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010406111239278242, + "loss": 0.0072, + "step": 503930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010405722417641095, + "loss": 0.0098, + "step": 503940 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001040533359600395, + "loss": 0.012, + "step": 503950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404944774366802, + "loss": 0.0136, + "step": 503960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404555952729656, + "loss": 0.0109, + "step": 503970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010404167131092509, + "loss": 0.01, + "step": 503980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403778309455363, + "loss": 0.0102, + "step": 503990 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403389487818216, + "loss": 0.0122, + "step": 504000 + }, + { + "epoch": 1.31, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.0066497717052698135, + "eval_runtime": 108.0868, + "eval_samples_per_second": 18.504, + "eval_steps_per_second": 4.626, + "step": 504000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010403000666181072, + "loss": 0.0098, + "step": 504010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010402611844543924, + "loss": 0.0094, + "step": 504020 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010402223022906779, + "loss": 0.0102, + "step": 504030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401834201269631, + "loss": 0.0081, + "step": 504040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401445379632486, + "loss": 0.009, + "step": 504050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010401056557995338, + "loss": 0.0144, + "step": 504060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010400667736358193, + "loss": 0.0088, + "step": 504070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010400278914721045, + "loss": 0.012, + "step": 504080 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103998900930839, + "loss": 0.009, + "step": 504090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010399501271446752, + "loss": 0.0127, + "step": 504100 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010399112449809606, + "loss": 0.0113, + "step": 504110 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010398723628172459, + "loss": 0.0105, + "step": 504120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010398334806535313, + "loss": 0.0101, + "step": 504130 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010397945984898166, + "loss": 0.0091, + "step": 504140 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039755716326102, + "loss": 0.0135, + "step": 504150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010397168341623873, + "loss": 0.0115, + "step": 504160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010396779519986726, + "loss": 0.0113, + "step": 504170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010396390698349582, + "loss": 0.01, + "step": 504180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010396001876712434, + "loss": 0.0119, + "step": 504190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010395613055075289, + "loss": 0.0146, + "step": 504200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010395224233438141, + "loss": 0.0106, + "step": 504210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010394835411800995, + "loss": 0.0094, + "step": 504220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010394446590163848, + "loss": 0.0126, + "step": 504230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010394057768526702, + "loss": 0.0092, + "step": 504240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010393668946889555, + "loss": 0.0068, + "step": 504250 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039328012525241, + "loss": 0.0129, + "step": 504260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010392891303615262, + "loss": 0.0098, + "step": 504270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010392502481978116, + "loss": 0.0096, + "step": 504280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010392113660340969, + "loss": 0.0095, + "step": 504290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010391724838703823, + "loss": 0.0078, + "step": 504300 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010391336017066676, + "loss": 0.0079, + "step": 504310 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001039094719542953, + "loss": 0.0117, + "step": 504320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010390558373792383, + "loss": 0.0098, + "step": 504330 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010390169552155239, + "loss": 0.009, + "step": 504340 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038978073051809, + "loss": 0.0126, + "step": 504350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010389391908880946, + "loss": 0.0104, + "step": 504360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010389003087243798, + "loss": 0.0123, + "step": 504370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010388614265606653, + "loss": 0.0072, + "step": 504380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010388225443969505, + "loss": 0.0118, + "step": 504390 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038783662233236, + "loss": 0.0084, + "step": 504400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010387447800695212, + "loss": 0.0112, + "step": 504410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010387058979058065, + "loss": 0.0113, + "step": 504420 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038667015742092, + "loss": 0.0088, + "step": 504430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010386281335783772, + "loss": 0.0088, + "step": 504440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010385892514146626, + "loss": 0.0093, + "step": 504450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010385503692509479, + "loss": 0.0113, + "step": 504460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010385114870872333, + "loss": 0.013, + "step": 504470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010384726049235186, + "loss": 0.0138, + "step": 504480 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038433722759804, + "loss": 0.0097, + "step": 504490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010383948405960893, + "loss": 0.0323, + "step": 504500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010383559584323747, + "loss": 0.0113, + "step": 504510 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103831707626866, + "loss": 0.0146, + "step": 504520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010382781941049456, + "loss": 0.0085, + "step": 504530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010382393119412308, + "loss": 0.0099, + "step": 504540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010382004297775163, + "loss": 0.0099, + "step": 504550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010381615476138015, + "loss": 0.0121, + "step": 504560 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001038122665450087, + "loss": 0.0104, + "step": 504570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010380837832863722, + "loss": 0.0115, + "step": 504580 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010380449011226577, + "loss": 0.0118, + "step": 504590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010380060189589429, + "loss": 0.0109, + "step": 504600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010379671367952283, + "loss": 0.0101, + "step": 504610 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010379282546315136, + "loss": 0.0101, + "step": 504620 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037889372467799, + "loss": 0.0108, + "step": 504630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010378504903040843, + "loss": 0.012, + "step": 504640 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010378116081403696, + "loss": 0.0145, + "step": 504650 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037772725976655, + "loss": 0.011, + "step": 504660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010377338438129403, + "loss": 0.0124, + "step": 504670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010376949616492257, + "loss": 0.0105, + "step": 504680 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037656079485511, + "loss": 0.0093, + "step": 504690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010376171973217966, + "loss": 0.0107, + "step": 504700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010375783151580817, + "loss": 0.0084, + "step": 504710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010375394329943673, + "loss": 0.0086, + "step": 504720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010375005508306525, + "loss": 0.008, + "step": 504730 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037461668666938, + "loss": 0.0106, + "step": 504740 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010374227865032232, + "loss": 0.0101, + "step": 504750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010373839043395086, + "loss": 0.0081, + "step": 504760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010373450221757939, + "loss": 0.0085, + "step": 504770 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010373061400120793, + "loss": 0.0113, + "step": 504780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010372672578483646, + "loss": 0.007, + "step": 504790 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103722837568465, + "loss": 0.0074, + "step": 504800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010371894935209353, + "loss": 0.0118, + "step": 504810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010371506113572207, + "loss": 0.0105, + "step": 504820 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001037111729193506, + "loss": 0.0141, + "step": 504830 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010370728470297914, + "loss": 0.0104, + "step": 504840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010370339648660767, + "loss": 0.0091, + "step": 504850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010369950827023623, + "loss": 0.0099, + "step": 504860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010369562005386474, + "loss": 0.0105, + "step": 504870 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036917318374933, + "loss": 0.0123, + "step": 504880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010368784362112182, + "loss": 0.0104, + "step": 504890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010368395540475035, + "loss": 0.0127, + "step": 504900 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036800671883789, + "loss": 0.008, + "step": 504910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010367617897200742, + "loss": 0.0132, + "step": 504920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010367229075563596, + "loss": 0.0102, + "step": 504930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010366840253926449, + "loss": 0.012, + "step": 504940 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010366451432289303, + "loss": 0.0088, + "step": 504950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010366062610652156, + "loss": 0.0094, + "step": 504960 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036567378901501, + "loss": 0.0099, + "step": 504970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010365284967377863, + "loss": 0.0112, + "step": 504980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010364896145740717, + "loss": 0.0099, + "step": 504990 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036450732410357, + "loss": 0.008, + "step": 505000 + }, + { + "epoch": 1.31, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.006840614136308432, + "eval_runtime": 108.1691, + "eval_samples_per_second": 18.49, + "eval_steps_per_second": 4.622, + "step": 505000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010364118502466424, + "loss": 0.0109, + "step": 505010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010363729680829277, + "loss": 0.0099, + "step": 505020 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010363340859192131, + "loss": 0.0087, + "step": 505030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010362952037554984, + "loss": 0.0103, + "step": 505040 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036256321591784, + "loss": 0.0114, + "step": 505050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010362174394280692, + "loss": 0.0117, + "step": 505060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010361785572643547, + "loss": 0.0103, + "step": 505070 + }, + { + "epoch": 1.31, + "learning_rate": 0.000103613967510064, + "loss": 0.0093, + "step": 505080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010361007929369254, + "loss": 0.0106, + "step": 505090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010360619107732106, + "loss": 0.0129, + "step": 505100 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001036023028609496, + "loss": 0.0094, + "step": 505110 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010359841464457813, + "loss": 0.0089, + "step": 505120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010359452642820667, + "loss": 0.0126, + "step": 505130 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001035906382118352, + "loss": 0.0099, + "step": 505140 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010358674999546373, + "loss": 0.0106, + "step": 505150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010358286177909227, + "loss": 0.0085, + "step": 505160 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001035789735627208, + "loss": 0.0079, + "step": 505170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010357508534634934, + "loss": 0.009, + "step": 505180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010357119712997787, + "loss": 0.0112, + "step": 505190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010356730891360641, + "loss": 0.0111, + "step": 505200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010356342069723494, + "loss": 0.0112, + "step": 505210 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001035595324808635, + "loss": 0.0089, + "step": 505220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010355564426449201, + "loss": 0.0076, + "step": 505230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010355175604812056, + "loss": 0.01, + "step": 505240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010354786783174909, + "loss": 0.008, + "step": 505250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010354397961537763, + "loss": 0.0108, + "step": 505260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010354009139900616, + "loss": 0.0099, + "step": 505270 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001035362031826347, + "loss": 0.0101, + "step": 505280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010353231496626323, + "loss": 0.0105, + "step": 505290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010352842674989177, + "loss": 0.0111, + "step": 505300 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001035245385335203, + "loss": 0.0097, + "step": 505310 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010352065031714884, + "loss": 0.008, + "step": 505320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010351676210077737, + "loss": 0.0128, + "step": 505330 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010351287388440591, + "loss": 0.0082, + "step": 505340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010350898566803444, + "loss": 0.0097, + "step": 505350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010350509745166298, + "loss": 0.0092, + "step": 505360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010350120923529151, + "loss": 0.0125, + "step": 505370 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010349732101892005, + "loss": 0.0108, + "step": 505380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010349343280254858, + "loss": 0.0115, + "step": 505390 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348954458617711, + "loss": 0.0112, + "step": 505400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348565636980566, + "loss": 0.0101, + "step": 505410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010348176815343419, + "loss": 0.0087, + "step": 505420 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010347787993706273, + "loss": 0.0111, + "step": 505430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010347399172069126, + "loss": 0.0107, + "step": 505440 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034701035043198, + "loss": 0.0095, + "step": 505450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010346621528794833, + "loss": 0.0112, + "step": 505460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010346232707157687, + "loss": 0.0107, + "step": 505470 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034584388552054, + "loss": 0.0092, + "step": 505480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010345455063883394, + "loss": 0.0093, + "step": 505490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010345066242246247, + "loss": 0.0117, + "step": 505500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010344677420609101, + "loss": 0.0075, + "step": 505510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010344288598971954, + "loss": 0.0107, + "step": 505520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010343899777334808, + "loss": 0.0118, + "step": 505530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010343510955697661, + "loss": 0.0152, + "step": 505540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010343122134060515, + "loss": 0.0088, + "step": 505550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342733312423368, + "loss": 0.0092, + "step": 505560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010342344490786224, + "loss": 0.0101, + "step": 505570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010341955669149075, + "loss": 0.0115, + "step": 505580 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034156684751193, + "loss": 0.0099, + "step": 505590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010341178025874783, + "loss": 0.009, + "step": 505600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010340789204237638, + "loss": 0.0083, + "step": 505610 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001034040038260049, + "loss": 0.0092, + "step": 505620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010340011560963344, + "loss": 0.0113, + "step": 505630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010339622739326197, + "loss": 0.0136, + "step": 505640 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033923391768905, + "loss": 0.0114, + "step": 505650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010338845096051904, + "loss": 0.0075, + "step": 505660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010338456274414757, + "loss": 0.0106, + "step": 505670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010338067452777611, + "loss": 0.0078, + "step": 505680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010337678631140464, + "loss": 0.014, + "step": 505690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010337289809503318, + "loss": 0.011, + "step": 505700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336900987866171, + "loss": 0.009, + "step": 505710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336512166229025, + "loss": 0.0089, + "step": 505720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010336123344591878, + "loss": 0.0094, + "step": 505730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010335734522954732, + "loss": 0.0091, + "step": 505740 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010335345701317585, + "loss": 0.0117, + "step": 505750 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001033495687968044, + "loss": 0.0069, + "step": 505760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010334568058043293, + "loss": 0.0102, + "step": 505770 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010334179236406147, + "loss": 0.0114, + "step": 505780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333790414769, + "loss": 0.0121, + "step": 505790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333401593131854, + "loss": 0.0107, + "step": 505800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010333012771494707, + "loss": 0.0087, + "step": 505810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010332623949857561, + "loss": 0.0133, + "step": 505820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010332235128220414, + "loss": 0.0098, + "step": 505830 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010331846306583268, + "loss": 0.0139, + "step": 505840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010331457484946121, + "loss": 0.0095, + "step": 505850 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010331068663308975, + "loss": 0.0163, + "step": 505860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010330679841671828, + "loss": 0.0107, + "step": 505870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010330291020034682, + "loss": 0.0139, + "step": 505880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010329902198397535, + "loss": 0.0096, + "step": 505890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010329513376760388, + "loss": 0.0188, + "step": 505900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010329124555123242, + "loss": 0.0081, + "step": 505910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010328735733486095, + "loss": 0.0133, + "step": 505920 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001032834691184895, + "loss": 0.0101, + "step": 505930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010327958090211802, + "loss": 0.0078, + "step": 505940 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010327569268574657, + "loss": 0.0319, + "step": 505950 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001032718044693751, + "loss": 0.0085, + "step": 505960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010326791625300364, + "loss": 0.0111, + "step": 505970 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010326402803663217, + "loss": 0.0087, + "step": 505980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010326013982026071, + "loss": 0.0171, + "step": 505990 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010325625160388924, + "loss": 0.0131, + "step": 506000 + }, + { + "epoch": 1.31, + "eval_cer": 0.88167329394755, + "eval_loss": 0.006615667603909969, + "eval_runtime": 107.9151, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 506000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010325236338751778, + "loss": 0.0095, + "step": 506010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010324847517114631, + "loss": 0.0094, + "step": 506020 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010324458695477485, + "loss": 0.0105, + "step": 506030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010324069873840338, + "loss": 0.0091, + "step": 506040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010323681052203192, + "loss": 0.0147, + "step": 506050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010323292230566045, + "loss": 0.0101, + "step": 506060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010322903408928899, + "loss": 0.0099, + "step": 506070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010322514587291752, + "loss": 0.0073, + "step": 506080 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010322125765654608, + "loss": 0.0114, + "step": 506090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010321736944017459, + "loss": 0.0113, + "step": 506100 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010321348122380315, + "loss": 0.008, + "step": 506110 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320959300743167, + "loss": 0.0109, + "step": 506120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320570479106022, + "loss": 0.0118, + "step": 506130 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010320181657468874, + "loss": 0.0092, + "step": 506140 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010319792835831727, + "loss": 0.0109, + "step": 506150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010319404014194581, + "loss": 0.008, + "step": 506160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010319015192557434, + "loss": 0.0103, + "step": 506170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010318626370920288, + "loss": 0.0104, + "step": 506180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010318237549283141, + "loss": 0.0117, + "step": 506190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317848727645995, + "loss": 0.0101, + "step": 506200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317459906008848, + "loss": 0.0112, + "step": 506210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010317071084371702, + "loss": 0.0082, + "step": 506220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010316682262734555, + "loss": 0.0109, + "step": 506230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010316293441097409, + "loss": 0.012, + "step": 506240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010315904619460262, + "loss": 0.0124, + "step": 506250 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010315515797823116, + "loss": 0.0084, + "step": 506260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010315126976185969, + "loss": 0.0088, + "step": 506270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010314738154548824, + "loss": 0.011, + "step": 506280 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010314349332911677, + "loss": 0.0085, + "step": 506290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010313960511274531, + "loss": 0.0095, + "step": 506300 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010313571689637384, + "loss": 0.0118, + "step": 506310 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010313182868000238, + "loss": 0.0108, + "step": 506320 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010312794046363091, + "loss": 0.0096, + "step": 506330 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010312405224725945, + "loss": 0.0118, + "step": 506340 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010312016403088798, + "loss": 0.0117, + "step": 506350 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010311627581451652, + "loss": 0.0068, + "step": 506360 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010311238759814505, + "loss": 0.0096, + "step": 506370 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001031084993817736, + "loss": 0.0096, + "step": 506380 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010310461116540212, + "loss": 0.0128, + "step": 506390 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010310072294903065, + "loss": 0.0107, + "step": 506400 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010309683473265919, + "loss": 0.0134, + "step": 506410 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010309294651628772, + "loss": 0.0135, + "step": 506420 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010308905829991626, + "loss": 0.0081, + "step": 506430 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010308517008354479, + "loss": 0.0075, + "step": 506440 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010308128186717334, + "loss": 0.0105, + "step": 506450 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010307739365080186, + "loss": 0.0085, + "step": 506460 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010307350543443041, + "loss": 0.0123, + "step": 506470 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010306961721805894, + "loss": 0.0062, + "step": 506480 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010306572900168748, + "loss": 0.0072, + "step": 506490 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010306184078531601, + "loss": 0.0129, + "step": 506500 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010305795256894455, + "loss": 0.0119, + "step": 506510 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010305406435257308, + "loss": 0.0088, + "step": 506520 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010305017613620162, + "loss": 0.0121, + "step": 506530 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010304628791983015, + "loss": 0.0119, + "step": 506540 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010304239970345869, + "loss": 0.0093, + "step": 506550 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010303851148708722, + "loss": 0.0095, + "step": 506560 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010303462327071576, + "loss": 0.0117, + "step": 506570 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010303073505434429, + "loss": 0.0087, + "step": 506580 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010302684683797283, + "loss": 0.0076, + "step": 506590 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010302295862160136, + "loss": 0.0117, + "step": 506600 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010301907040522992, + "loss": 0.0082, + "step": 506610 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010301518218885843, + "loss": 0.0115, + "step": 506620 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010301129397248699, + "loss": 0.0091, + "step": 506630 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010300740575611551, + "loss": 0.0105, + "step": 506640 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010300351753974404, + "loss": 0.0147, + "step": 506650 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299962932337258, + "loss": 0.0101, + "step": 506660 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299574110700111, + "loss": 0.0088, + "step": 506670 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010299185289062965, + "loss": 0.0084, + "step": 506680 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010298796467425818, + "loss": 0.0113, + "step": 506690 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010298407645788672, + "loss": 0.0089, + "step": 506700 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010298018824151525, + "loss": 0.0145, + "step": 506710 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010297630002514379, + "loss": 0.0107, + "step": 506720 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010297241180877232, + "loss": 0.0127, + "step": 506730 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010296852359240086, + "loss": 0.0122, + "step": 506740 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010296463537602939, + "loss": 0.0133, + "step": 506750 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010296074715965793, + "loss": 0.0111, + "step": 506760 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010295685894328646, + "loss": 0.0113, + "step": 506770 + }, + { + "epoch": 1.31, + "learning_rate": 0.000102952970726915, + "loss": 0.0119, + "step": 506780 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010294908251054353, + "loss": 0.008, + "step": 506790 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010294519429417208, + "loss": 0.0104, + "step": 506800 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010294130607780061, + "loss": 0.0115, + "step": 506810 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010293741786142915, + "loss": 0.0123, + "step": 506820 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010293352964505768, + "loss": 0.0106, + "step": 506830 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010292964142868622, + "loss": 0.0097, + "step": 506840 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010292575321231475, + "loss": 0.0112, + "step": 506850 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001029218649959433, + "loss": 0.0095, + "step": 506860 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010291797677957182, + "loss": 0.0082, + "step": 506870 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010291408856320036, + "loss": 0.0136, + "step": 506880 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010291020034682889, + "loss": 0.0074, + "step": 506890 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010290631213045742, + "loss": 0.0113, + "step": 506900 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010290242391408596, + "loss": 0.0081, + "step": 506910 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010289853569771449, + "loss": 0.0103, + "step": 506920 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010289464748134303, + "loss": 0.0099, + "step": 506930 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010289075926497156, + "loss": 0.0118, + "step": 506940 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028868710486001, + "loss": 0.0102, + "step": 506950 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010288298283222863, + "loss": 0.0095, + "step": 506960 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010287909461585717, + "loss": 0.0099, + "step": 506970 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028752063994857, + "loss": 0.0116, + "step": 506980 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010287131818311425, + "loss": 0.0101, + "step": 506990 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010286742996674278, + "loss": 0.0111, + "step": 507000 + }, + { + "epoch": 1.31, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.0065526701509952545, + "eval_runtime": 108.0305, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, + "step": 507000 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010286354175037132, + "loss": 0.0113, + "step": 507010 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010285965353399985, + "loss": 0.0081, + "step": 507020 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028557653176284, + "loss": 0.0106, + "step": 507030 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010285187710125692, + "loss": 0.0078, + "step": 507040 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010284798888488546, + "loss": 0.0133, + "step": 507050 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010284410066851399, + "loss": 0.0107, + "step": 507060 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010284021245214253, + "loss": 0.0099, + "step": 507070 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010283632423577106, + "loss": 0.0105, + "step": 507080 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028324360193996, + "loss": 0.0091, + "step": 507090 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010282854780302813, + "loss": 0.0098, + "step": 507100 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010282465958665667, + "loss": 0.0104, + "step": 507110 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028207713702852, + "loss": 0.0102, + "step": 507120 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010281688315391373, + "loss": 0.0082, + "step": 507130 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010281299493754227, + "loss": 0.0105, + "step": 507140 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001028091067211708, + "loss": 0.0118, + "step": 507150 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010280521850479935, + "loss": 0.0087, + "step": 507160 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010280133028842787, + "loss": 0.011, + "step": 507170 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010279744207205642, + "loss": 0.01, + "step": 507180 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010279355385568495, + "loss": 0.011, + "step": 507190 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010278966563931349, + "loss": 0.0096, + "step": 507200 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010278577742294202, + "loss": 0.0118, + "step": 507210 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010278188920657056, + "loss": 0.011, + "step": 507220 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277800099019909, + "loss": 0.01, + "step": 507230 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277411277382763, + "loss": 0.0129, + "step": 507240 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010277022455745616, + "loss": 0.0097, + "step": 507250 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001027663363410847, + "loss": 0.0095, + "step": 507260 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010276244812471323, + "loss": 0.0086, + "step": 507270 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010275855990834177, + "loss": 0.0114, + "step": 507280 + }, + { + "epoch": 1.31, + "learning_rate": 0.0001027546716919703, + "loss": 0.0094, + "step": 507290 + }, + { + "epoch": 1.31, + "learning_rate": 0.00010275078347559884, + "loss": 0.0123, + "step": 507300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010274689525922737, + "loss": 0.0096, + "step": 507310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010274300704285592, + "loss": 0.0097, + "step": 507320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010273911882648444, + "loss": 0.0122, + "step": 507330 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102735230610113, + "loss": 0.0126, + "step": 507340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010273134239374152, + "loss": 0.0087, + "step": 507350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010272745417737006, + "loss": 0.0094, + "step": 507360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010272356596099859, + "loss": 0.0112, + "step": 507370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010271967774462712, + "loss": 0.0103, + "step": 507380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010271578952825566, + "loss": 0.0071, + "step": 507390 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010271190131188419, + "loss": 0.0104, + "step": 507400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010270801309551273, + "loss": 0.0111, + "step": 507410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010270412487914126, + "loss": 0.0081, + "step": 507420 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001027002366627698, + "loss": 0.0093, + "step": 507430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010269634844639833, + "loss": 0.0111, + "step": 507440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010269246023002687, + "loss": 0.0119, + "step": 507450 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026885720136554, + "loss": 0.0066, + "step": 507460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010268468379728394, + "loss": 0.0113, + "step": 507470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010268079558091247, + "loss": 0.0146, + "step": 507480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010267690736454101, + "loss": 0.0097, + "step": 507490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010267301914816954, + "loss": 0.0117, + "step": 507500 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026691309317981, + "loss": 0.0104, + "step": 507510 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010266524271542662, + "loss": 0.0138, + "step": 507520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010266135449905516, + "loss": 0.009, + "step": 507530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010265746628268369, + "loss": 0.0087, + "step": 507540 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010265357806631223, + "loss": 0.0107, + "step": 507550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010264968984994076, + "loss": 0.0136, + "step": 507560 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026458016335693, + "loss": 0.0107, + "step": 507570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010264191341719783, + "loss": 0.0115, + "step": 507580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010263802520082637, + "loss": 0.0085, + "step": 507590 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026341369844549, + "loss": 0.0094, + "step": 507600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010263024876808344, + "loss": 0.0081, + "step": 507610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010262636055171197, + "loss": 0.0103, + "step": 507620 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001026224723353405, + "loss": 0.0097, + "step": 507630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261858411896904, + "loss": 0.0103, + "step": 507640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261469590259757, + "loss": 0.0082, + "step": 507650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010261080768622611, + "loss": 0.0103, + "step": 507660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010260691946985464, + "loss": 0.0112, + "step": 507670 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010260303125348319, + "loss": 0.0108, + "step": 507680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010259914303711171, + "loss": 0.009, + "step": 507690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010259525482074026, + "loss": 0.0084, + "step": 507700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010259136660436879, + "loss": 0.0118, + "step": 507710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010258747838799733, + "loss": 0.0099, + "step": 507720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010258359017162586, + "loss": 0.0092, + "step": 507730 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001025797019552544, + "loss": 0.0084, + "step": 507740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010257581373888293, + "loss": 0.0133, + "step": 507750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010257192552251147, + "loss": 0.0078, + "step": 507760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010256803730614, + "loss": 0.0095, + "step": 507770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010256414908976854, + "loss": 0.0146, + "step": 507780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010256026087339707, + "loss": 0.0119, + "step": 507790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010255637265702561, + "loss": 0.0095, + "step": 507800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010255248444065414, + "loss": 0.0086, + "step": 507810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010254859622428268, + "loss": 0.0091, + "step": 507820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010254470800791121, + "loss": 0.01, + "step": 507830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010254081979153976, + "loss": 0.0087, + "step": 507840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010253693157516828, + "loss": 0.0098, + "step": 507850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010253304335879683, + "loss": 0.0083, + "step": 507860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252915514242536, + "loss": 0.0132, + "step": 507870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252526692605389, + "loss": 0.0093, + "step": 507880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010252137870968243, + "loss": 0.0105, + "step": 507890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010251749049331096, + "loss": 0.0098, + "step": 507900 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001025136022769395, + "loss": 0.0079, + "step": 507910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010250971406056803, + "loss": 0.0098, + "step": 507920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010250582584419657, + "loss": 0.0071, + "step": 507930 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001025019376278251, + "loss": 0.0104, + "step": 507940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010249804941145364, + "loss": 0.0109, + "step": 507950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010249416119508217, + "loss": 0.0089, + "step": 507960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010249027297871071, + "loss": 0.0156, + "step": 507970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010248638476233924, + "loss": 0.0077, + "step": 507980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010248249654596778, + "loss": 0.0086, + "step": 507990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010247860832959631, + "loss": 0.01, + "step": 508000 + }, + { + "epoch": 1.32, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.00661470415070653, + "eval_runtime": 108.0315, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, + "step": 508000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010247472011322485, + "loss": 0.0111, + "step": 508010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010247083189685338, + "loss": 0.0104, + "step": 508020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010246694368048193, + "loss": 0.0098, + "step": 508030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010246305546411046, + "loss": 0.0123, + "step": 508040 + }, + { + "epoch": 1.32, + "learning_rate": 0.000102459167247739, + "loss": 0.0106, + "step": 508050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010245527903136753, + "loss": 0.0093, + "step": 508060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010245139081499607, + "loss": 0.02, + "step": 508070 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001024475025986246, + "loss": 0.0108, + "step": 508080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010244361438225314, + "loss": 0.01, + "step": 508090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243972616588167, + "loss": 0.0108, + "step": 508100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243583794951021, + "loss": 0.009, + "step": 508110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010243194973313874, + "loss": 0.0104, + "step": 508120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010242806151676727, + "loss": 0.0081, + "step": 508130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010242417330039581, + "loss": 0.0085, + "step": 508140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010242028508402434, + "loss": 0.0101, + "step": 508150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010241639686765288, + "loss": 0.0112, + "step": 508160 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010241250865128141, + "loss": 0.0088, + "step": 508170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010240862043490995, + "loss": 0.0105, + "step": 508180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010240473221853848, + "loss": 0.0097, + "step": 508190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010240084400216702, + "loss": 0.0105, + "step": 508200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010239695578579555, + "loss": 0.0072, + "step": 508210 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023930675694241, + "loss": 0.0109, + "step": 508220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010238917935305263, + "loss": 0.0092, + "step": 508230 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010238529113668117, + "loss": 0.0119, + "step": 508240 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023814029203097, + "loss": 0.0078, + "step": 508250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010237751470393824, + "loss": 0.0118, + "step": 508260 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010237362648756677, + "loss": 0.008, + "step": 508270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010236973827119531, + "loss": 0.0112, + "step": 508280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010236585005482384, + "loss": 0.0103, + "step": 508290 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010236196183845238, + "loss": 0.0095, + "step": 508300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010235807362208091, + "loss": 0.0101, + "step": 508310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010235418540570945, + "loss": 0.0097, + "step": 508320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010235029718933798, + "loss": 0.0125, + "step": 508330 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010234640897296652, + "loss": 0.011, + "step": 508340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010234252075659505, + "loss": 0.0084, + "step": 508350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233863254022359, + "loss": 0.0075, + "step": 508360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233474432385212, + "loss": 0.0101, + "step": 508370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010233085610748065, + "loss": 0.0067, + "step": 508380 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023269678911092, + "loss": 0.0075, + "step": 508390 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010232307967473773, + "loss": 0.0101, + "step": 508400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010231919145836627, + "loss": 0.0092, + "step": 508410 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001023153032419948, + "loss": 0.0115, + "step": 508420 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010231141502562334, + "loss": 0.0095, + "step": 508430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010230752680925187, + "loss": 0.0098, + "step": 508440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010230363859288041, + "loss": 0.0128, + "step": 508450 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010229975037650894, + "loss": 0.0108, + "step": 508460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010229586216013748, + "loss": 0.0128, + "step": 508470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010229197394376601, + "loss": 0.0101, + "step": 508480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010228808572739455, + "loss": 0.0079, + "step": 508490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010228419751102308, + "loss": 0.0083, + "step": 508500 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010228030929465162, + "loss": 0.0075, + "step": 508510 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010227642107828015, + "loss": 0.012, + "step": 508520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010227253286190869, + "loss": 0.0072, + "step": 508530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010226864464553722, + "loss": 0.0086, + "step": 508540 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010226475642916577, + "loss": 0.0127, + "step": 508550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010226086821279429, + "loss": 0.0105, + "step": 508560 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010225697999642284, + "loss": 0.0097, + "step": 508570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010225309178005137, + "loss": 0.0101, + "step": 508580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224920356367991, + "loss": 0.014, + "step": 508590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224531534730844, + "loss": 0.0113, + "step": 508600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010224142713093698, + "loss": 0.0103, + "step": 508610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010223753891456551, + "loss": 0.0091, + "step": 508620 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010223365069819404, + "loss": 0.0134, + "step": 508630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010222976248182258, + "loss": 0.011, + "step": 508640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010222587426545111, + "loss": 0.0101, + "step": 508650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010222198604907965, + "loss": 0.0092, + "step": 508660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221809783270818, + "loss": 0.0126, + "step": 508670 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221420961633672, + "loss": 0.0121, + "step": 508680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010221032139996525, + "loss": 0.0102, + "step": 508690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010220643318359379, + "loss": 0.0117, + "step": 508700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010220254496722232, + "loss": 0.0095, + "step": 508710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010219865675085086, + "loss": 0.0097, + "step": 508720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010219476853447939, + "loss": 0.0094, + "step": 508730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010219088031810794, + "loss": 0.0088, + "step": 508740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010218699210173647, + "loss": 0.0113, + "step": 508750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010218310388536501, + "loss": 0.0099, + "step": 508760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010217921566899354, + "loss": 0.0097, + "step": 508770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010217532745262208, + "loss": 0.0111, + "step": 508780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010217143923625061, + "loss": 0.0096, + "step": 508790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010216755101987915, + "loss": 0.0146, + "step": 508800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010216366280350768, + "loss": 0.0095, + "step": 508810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215977458713622, + "loss": 0.0138, + "step": 508820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215588637076475, + "loss": 0.0082, + "step": 508830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010215199815439329, + "loss": 0.0095, + "step": 508840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010214810993802182, + "loss": 0.0136, + "step": 508850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010214422172165036, + "loss": 0.0117, + "step": 508860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010214033350527889, + "loss": 0.0127, + "step": 508870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010213644528890742, + "loss": 0.0138, + "step": 508880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010213255707253596, + "loss": 0.0138, + "step": 508890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010212866885616449, + "loss": 0.0083, + "step": 508900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010212478063979304, + "loss": 0.0101, + "step": 508910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010212089242342156, + "loss": 0.0108, + "step": 508920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010211700420705011, + "loss": 0.0079, + "step": 508930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010211311599067864, + "loss": 0.0097, + "step": 508940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010210922777430718, + "loss": 0.0077, + "step": 508950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010210533955793571, + "loss": 0.0094, + "step": 508960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010210145134156425, + "loss": 0.011, + "step": 508970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010209756312519278, + "loss": 0.0117, + "step": 508980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010209367490882132, + "loss": 0.0131, + "step": 508990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010208978669244985, + "loss": 0.011, + "step": 509000 + }, + { + "epoch": 1.32, + "eval_cer": 0.881704085960102, + "eval_loss": 0.0064851148054003716, + "eval_runtime": 108.0593, + "eval_samples_per_second": 18.508, + "eval_steps_per_second": 4.627, + "step": 509000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010208589847607839, + "loss": 0.0097, + "step": 509010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010208201025970692, + "loss": 0.0071, + "step": 509020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010207812204333546, + "loss": 0.0133, + "step": 509030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010207423382696399, + "loss": 0.008, + "step": 509040 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010207034561059253, + "loss": 0.0089, + "step": 509050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010206645739422106, + "loss": 0.0088, + "step": 509060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010206256917784961, + "loss": 0.0088, + "step": 509070 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010205868096147813, + "loss": 0.0147, + "step": 509080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010205479274510668, + "loss": 0.0114, + "step": 509090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010205090452873521, + "loss": 0.0107, + "step": 509100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010204701631236375, + "loss": 0.0133, + "step": 509110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010204312809599228, + "loss": 0.0117, + "step": 509120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010203923987962081, + "loss": 0.0091, + "step": 509130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010203535166324935, + "loss": 0.0075, + "step": 509140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010203146344687788, + "loss": 0.0121, + "step": 509150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010202757523050642, + "loss": 0.0076, + "step": 509160 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010202368701413495, + "loss": 0.0083, + "step": 509170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010201979879776349, + "loss": 0.0116, + "step": 509180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010201591058139202, + "loss": 0.0097, + "step": 509190 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010201202236502056, + "loss": 0.0145, + "step": 509200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010200813414864909, + "loss": 0.0108, + "step": 509210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010200424593227763, + "loss": 0.0109, + "step": 509220 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010200035771590616, + "loss": 0.0102, + "step": 509230 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019964694995347, + "loss": 0.0156, + "step": 509240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010199258128316323, + "loss": 0.0098, + "step": 509250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010198869306679178, + "loss": 0.0095, + "step": 509260 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010198480485042031, + "loss": 0.0118, + "step": 509270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010198091663404885, + "loss": 0.0102, + "step": 509280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010197702841767738, + "loss": 0.0112, + "step": 509290 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010197314020130592, + "loss": 0.0097, + "step": 509300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010196925198493445, + "loss": 0.0066, + "step": 509310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010196536376856299, + "loss": 0.0083, + "step": 509320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010196147555219152, + "loss": 0.0084, + "step": 509330 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010195758733582006, + "loss": 0.0095, + "step": 509340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010195369911944859, + "loss": 0.0111, + "step": 509350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010194981090307713, + "loss": 0.0085, + "step": 509360 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010194592268670566, + "loss": 0.0157, + "step": 509370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010194203447033419, + "loss": 0.01, + "step": 509380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010193814625396273, + "loss": 0.0121, + "step": 509390 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010193425803759126, + "loss": 0.0112, + "step": 509400 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019303698212198, + "loss": 0.0099, + "step": 509410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010192648160484833, + "loss": 0.0115, + "step": 509420 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010192259338847688, + "loss": 0.009, + "step": 509430 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001019187051721054, + "loss": 0.0107, + "step": 509440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010191481695573395, + "loss": 0.0128, + "step": 509450 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010191092873936248, + "loss": 0.0093, + "step": 509460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190704052299102, + "loss": 0.0123, + "step": 509470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010190315230661955, + "loss": 0.0077, + "step": 509480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010189926409024809, + "loss": 0.0124, + "step": 509490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010189537587387662, + "loss": 0.0079, + "step": 509500 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010189148765750516, + "loss": 0.0127, + "step": 509510 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010188759944113369, + "loss": 0.0099, + "step": 509520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010188371122476223, + "loss": 0.0136, + "step": 509530 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010187982300839076, + "loss": 0.0086, + "step": 509540 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018759347920193, + "loss": 0.0134, + "step": 509550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010187204657564783, + "loss": 0.0091, + "step": 509560 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010186815835927637, + "loss": 0.0099, + "step": 509570 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018642701429049, + "loss": 0.0088, + "step": 509580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010186038192653344, + "loss": 0.011, + "step": 509590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010185649371016197, + "loss": 0.0153, + "step": 509600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010185260549379052, + "loss": 0.0126, + "step": 509610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010184871727741905, + "loss": 0.0134, + "step": 509620 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010184482906104758, + "loss": 0.009, + "step": 509630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010184094084467612, + "loss": 0.01, + "step": 509640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010183705262830465, + "loss": 0.0109, + "step": 509650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010183316441193319, + "loss": 0.0094, + "step": 509660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010182927619556172, + "loss": 0.008, + "step": 509670 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010182538797919026, + "loss": 0.0113, + "step": 509680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010182149976281879, + "loss": 0.0091, + "step": 509690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010181761154644733, + "loss": 0.0119, + "step": 509700 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010181372333007586, + "loss": 0.0114, + "step": 509710 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001018098351137044, + "loss": 0.0099, + "step": 509720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010180594689733293, + "loss": 0.0072, + "step": 509730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010180205868096147, + "loss": 0.0105, + "step": 509740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010179817046459, + "loss": 0.0098, + "step": 509750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010179428224821854, + "loss": 0.0098, + "step": 509760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010179039403184707, + "loss": 0.0115, + "step": 509770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010178650581547562, + "loss": 0.0106, + "step": 509780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010178261759910414, + "loss": 0.0125, + "step": 509790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177872938273269, + "loss": 0.0077, + "step": 509800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177484116636122, + "loss": 0.0112, + "step": 509810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010177095294998976, + "loss": 0.0111, + "step": 509820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010176706473361829, + "loss": 0.0108, + "step": 509830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010176317651724683, + "loss": 0.01, + "step": 509840 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010175928830087536, + "loss": 0.0093, + "step": 509850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010175540008450389, + "loss": 0.0108, + "step": 509860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010175151186813243, + "loss": 0.008, + "step": 509870 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010174762365176096, + "loss": 0.0091, + "step": 509880 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001017437354353895, + "loss": 0.0088, + "step": 509890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010173984721901803, + "loss": 0.0099, + "step": 509900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010173595900264657, + "loss": 0.0082, + "step": 509910 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001017320707862751, + "loss": 0.0112, + "step": 509920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010172818256990364, + "loss": 0.0098, + "step": 509930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010172429435353217, + "loss": 0.0122, + "step": 509940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010172040613716071, + "loss": 0.0102, + "step": 509950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010171651792078924, + "loss": 0.0131, + "step": 509960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010171262970441779, + "loss": 0.0095, + "step": 509970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010170874148804632, + "loss": 0.012, + "step": 509980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010170485327167486, + "loss": 0.0123, + "step": 509990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010170096505530339, + "loss": 0.0113, + "step": 510000 + }, + { + "epoch": 1.32, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.0066459812223911285, + "eval_runtime": 108.1498, + "eval_samples_per_second": 18.493, + "eval_steps_per_second": 4.623, + "step": 510000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010169707683893193, + "loss": 0.0081, + "step": 510010 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010169318862256046, + "loss": 0.0139, + "step": 510020 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101689300406189, + "loss": 0.0092, + "step": 510030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010168541218981753, + "loss": 0.0157, + "step": 510040 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010168152397344607, + "loss": 0.0113, + "step": 510050 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016776357570746, + "loss": 0.0098, + "step": 510060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010167374754070314, + "loss": 0.0112, + "step": 510070 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010166985932433167, + "loss": 0.0099, + "step": 510080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010166597110796021, + "loss": 0.0089, + "step": 510090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010166208289158874, + "loss": 0.0095, + "step": 510100 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165819467521727, + "loss": 0.012, + "step": 510110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165430645884581, + "loss": 0.0119, + "step": 510120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010165041824247434, + "loss": 0.0095, + "step": 510130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010164653002610289, + "loss": 0.01, + "step": 510140 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016426418097314, + "loss": 0.0099, + "step": 510150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010163875359335996, + "loss": 0.0103, + "step": 510160 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010163486537698849, + "loss": 0.0109, + "step": 510170 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010163097716061703, + "loss": 0.01, + "step": 510180 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010162708894424556, + "loss": 0.0099, + "step": 510190 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016232007278741, + "loss": 0.0088, + "step": 510200 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010161931251150263, + "loss": 0.0101, + "step": 510210 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010161542429513117, + "loss": 0.0103, + "step": 510220 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001016115360787597, + "loss": 0.0086, + "step": 510230 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010160764786238824, + "loss": 0.0095, + "step": 510240 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010160375964601677, + "loss": 0.0087, + "step": 510250 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159987142964531, + "loss": 0.0098, + "step": 510260 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159598321327384, + "loss": 0.0087, + "step": 510270 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010159209499690238, + "loss": 0.0093, + "step": 510280 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010158820678053091, + "loss": 0.0108, + "step": 510290 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010158431856415946, + "loss": 0.0124, + "step": 510300 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010158043034778798, + "loss": 0.0109, + "step": 510310 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010157654213141653, + "loss": 0.0107, + "step": 510320 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010157265391504506, + "loss": 0.0085, + "step": 510330 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001015687656986736, + "loss": 0.0138, + "step": 510340 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010156487748230213, + "loss": 0.0098, + "step": 510350 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010156098926593066, + "loss": 0.0125, + "step": 510360 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001015571010495592, + "loss": 0.0093, + "step": 510370 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010155321283318773, + "loss": 0.0112, + "step": 510380 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010154932461681627, + "loss": 0.0112, + "step": 510390 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001015454364004448, + "loss": 0.0112, + "step": 510400 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010154154818407334, + "loss": 0.0093, + "step": 510410 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010153765996770187, + "loss": 0.0088, + "step": 510420 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010153377175133041, + "loss": 0.0078, + "step": 510430 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010152988353495894, + "loss": 0.0142, + "step": 510440 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010152599531858748, + "loss": 0.0083, + "step": 510450 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101522107102216, + "loss": 0.0068, + "step": 510460 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010151821888584455, + "loss": 0.009, + "step": 510470 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010151433066947308, + "loss": 0.01, + "step": 510480 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010151044245310163, + "loss": 0.012, + "step": 510490 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010150655423673016, + "loss": 0.0136, + "step": 510500 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001015026660203587, + "loss": 0.0116, + "step": 510510 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010149877780398723, + "loss": 0.0106, + "step": 510520 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010149488958761577, + "loss": 0.0087, + "step": 510530 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014910013712443, + "loss": 0.0095, + "step": 510540 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010148711315487284, + "loss": 0.0104, + "step": 510550 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010148322493850137, + "loss": 0.0112, + "step": 510560 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010147933672212991, + "loss": 0.0083, + "step": 510570 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010147544850575844, + "loss": 0.0139, + "step": 510580 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010147156028938698, + "loss": 0.0104, + "step": 510590 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010146767207301551, + "loss": 0.0083, + "step": 510600 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010146378385664404, + "loss": 0.0088, + "step": 510610 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010145989564027258, + "loss": 0.0105, + "step": 510620 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014560074239011, + "loss": 0.0097, + "step": 510630 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010145211920752965, + "loss": 0.0092, + "step": 510640 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010144823099115818, + "loss": 0.0102, + "step": 510650 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010144434277478673, + "loss": 0.0071, + "step": 510660 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010144045455841525, + "loss": 0.0065, + "step": 510670 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014365663420438, + "loss": 0.0105, + "step": 510680 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010143267812567233, + "loss": 0.0108, + "step": 510690 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010142878990930087, + "loss": 0.0118, + "step": 510700 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001014249016929294, + "loss": 0.0136, + "step": 510710 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010142101347655794, + "loss": 0.0086, + "step": 510720 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010141712526018647, + "loss": 0.0111, + "step": 510730 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010141323704381501, + "loss": 0.0093, + "step": 510740 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140934882744354, + "loss": 0.0079, + "step": 510750 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140546061107208, + "loss": 0.0087, + "step": 510760 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010140157239470061, + "loss": 0.0088, + "step": 510770 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010139768417832915, + "loss": 0.0089, + "step": 510780 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010139379596195768, + "loss": 0.008, + "step": 510790 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010138990774558622, + "loss": 0.0116, + "step": 510800 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010138601952921475, + "loss": 0.0084, + "step": 510810 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010138213131284329, + "loss": 0.0101, + "step": 510820 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010137824309647182, + "loss": 0.0097, + "step": 510830 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010137435488010037, + "loss": 0.0072, + "step": 510840 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001013704666637289, + "loss": 0.0081, + "step": 510850 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010136657844735743, + "loss": 0.0102, + "step": 510860 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010136269023098597, + "loss": 0.0088, + "step": 510870 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001013588020146145, + "loss": 0.0085, + "step": 510880 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010135491379824304, + "loss": 0.0118, + "step": 510890 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010135102558187157, + "loss": 0.0093, + "step": 510900 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010134713736550011, + "loss": 0.0102, + "step": 510910 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010134324914912864, + "loss": 0.0122, + "step": 510920 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010133936093275718, + "loss": 0.0073, + "step": 510930 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010133547271638571, + "loss": 0.0121, + "step": 510940 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010133158450001425, + "loss": 0.0112, + "step": 510950 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010132769628364278, + "loss": 0.0092, + "step": 510960 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010132380806727132, + "loss": 0.0131, + "step": 510970 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131991985089985, + "loss": 0.0083, + "step": 510980 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131603163452839, + "loss": 0.0109, + "step": 510990 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010131214341815692, + "loss": 0.0086, + "step": 511000 + }, + { + "epoch": 1.32, + "eval_cer": 0.8816564983043399, + "eval_loss": 0.006579502020031214, + "eval_runtime": 107.825, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 511000 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010130825520178547, + "loss": 0.0117, + "step": 511010 + }, + { + "epoch": 1.32, + "learning_rate": 0.000101304366985414, + "loss": 0.0068, + "step": 511020 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010130047876904254, + "loss": 0.0092, + "step": 511030 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010129659055267107, + "loss": 0.0089, + "step": 511040 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010129270233629961, + "loss": 0.0089, + "step": 511050 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010128881411992814, + "loss": 0.0108, + "step": 511060 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010128492590355668, + "loss": 0.0105, + "step": 511070 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010128103768718521, + "loss": 0.0119, + "step": 511080 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010127714947081375, + "loss": 0.009, + "step": 511090 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010127326125444228, + "loss": 0.0121, + "step": 511100 + }, + { + "epoch": 1.32, + "learning_rate": 0.0001012693730380708, + "loss": 0.016, + "step": 511110 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010126548482169935, + "loss": 0.0099, + "step": 511120 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010126159660532788, + "loss": 0.0123, + "step": 511130 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010125770838895642, + "loss": 0.01, + "step": 511140 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010125382017258495, + "loss": 0.0107, + "step": 511150 + }, + { + "epoch": 1.32, + "learning_rate": 0.00010124993195621349, + "loss": 0.0103, + "step": 511160 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010124604373984202, + "loss": 0.0095, + "step": 511170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010124215552347056, + "loss": 0.0119, + "step": 511180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010123826730709909, + "loss": 0.0077, + "step": 511190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010123437909072764, + "loss": 0.0115, + "step": 511200 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010123049087435617, + "loss": 0.0112, + "step": 511210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010122660265798471, + "loss": 0.0094, + "step": 511220 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010122271444161324, + "loss": 0.013, + "step": 511230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010121882622524178, + "loss": 0.0091, + "step": 511240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010121493800887031, + "loss": 0.0112, + "step": 511250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010121104979249885, + "loss": 0.0095, + "step": 511260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010120716157612738, + "loss": 0.0111, + "step": 511270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010120327335975592, + "loss": 0.0108, + "step": 511280 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010119938514338445, + "loss": 0.0101, + "step": 511290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010119549692701299, + "loss": 0.0155, + "step": 511300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010119160871064152, + "loss": 0.0113, + "step": 511310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010118772049427006, + "loss": 0.0103, + "step": 511320 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010118383227789859, + "loss": 0.0067, + "step": 511330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010117994406152713, + "loss": 0.0094, + "step": 511340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010117605584515566, + "loss": 0.0103, + "step": 511350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010117216762878418, + "loss": 0.0087, + "step": 511360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010116827941241274, + "loss": 0.0106, + "step": 511370 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010116439119604125, + "loss": 0.007, + "step": 511380 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010116050297966981, + "loss": 0.0144, + "step": 511390 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010115661476329834, + "loss": 0.013, + "step": 511400 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010115272654692688, + "loss": 0.0129, + "step": 511410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010114883833055541, + "loss": 0.0117, + "step": 511420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010114495011418395, + "loss": 0.0104, + "step": 511430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010114106189781248, + "loss": 0.012, + "step": 511440 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010113717368144102, + "loss": 0.0101, + "step": 511450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010113328546506955, + "loss": 0.0114, + "step": 511460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112939724869809, + "loss": 0.0073, + "step": 511470 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112550903232662, + "loss": 0.0113, + "step": 511480 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010112162081595516, + "loss": 0.0096, + "step": 511490 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010111773259958369, + "loss": 0.0096, + "step": 511500 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010111384438321223, + "loss": 0.0077, + "step": 511510 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010110995616684076, + "loss": 0.0096, + "step": 511520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010110606795046931, + "loss": 0.013, + "step": 511530 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010110217973409783, + "loss": 0.0109, + "step": 511540 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010109829151772638, + "loss": 0.009, + "step": 511550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010109440330135491, + "loss": 0.0092, + "step": 511560 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010109051508498345, + "loss": 0.0099, + "step": 511570 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010108662686861198, + "loss": 0.0105, + "step": 511580 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010108273865224052, + "loss": 0.0113, + "step": 511590 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010107885043586905, + "loss": 0.0095, + "step": 511600 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010107496221949758, + "loss": 0.0075, + "step": 511610 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010107107400312612, + "loss": 0.0096, + "step": 511620 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010106718578675465, + "loss": 0.0089, + "step": 511630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010106329757038319, + "loss": 0.0073, + "step": 511640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010105940935401172, + "loss": 0.0096, + "step": 511650 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010105552113764026, + "loss": 0.0097, + "step": 511660 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010105163292126879, + "loss": 0.0102, + "step": 511670 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010104774470489733, + "loss": 0.0115, + "step": 511680 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010104385648852586, + "loss": 0.0097, + "step": 511690 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001010399682721544, + "loss": 0.0078, + "step": 511700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010103608005578293, + "loss": 0.0063, + "step": 511710 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010103219183941148, + "loss": 0.009, + "step": 511720 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010102830362304001, + "loss": 0.0121, + "step": 511730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010102441540666855, + "loss": 0.0118, + "step": 511740 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010102052719029708, + "loss": 0.0126, + "step": 511750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010101663897392562, + "loss": 0.0085, + "step": 511760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010101275075755415, + "loss": 0.0078, + "step": 511770 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010100886254118269, + "loss": 0.0079, + "step": 511780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010100497432481122, + "loss": 0.0097, + "step": 511790 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010100108610843976, + "loss": 0.0071, + "step": 511800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010099719789206829, + "loss": 0.0099, + "step": 511810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010099330967569683, + "loss": 0.0085, + "step": 511820 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010098942145932536, + "loss": 0.0104, + "step": 511830 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009855332429539, + "loss": 0.0091, + "step": 511840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010098164502658243, + "loss": 0.0085, + "step": 511850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010097775681021095, + "loss": 0.0083, + "step": 511860 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009738685938395, + "loss": 0.012, + "step": 511870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010096998037746802, + "loss": 0.0105, + "step": 511880 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010096609216109658, + "loss": 0.0101, + "step": 511890 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009622039447251, + "loss": 0.0127, + "step": 511900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010095831572835365, + "loss": 0.0128, + "step": 511910 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010095442751198218, + "loss": 0.0071, + "step": 511920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010095053929561072, + "loss": 0.0078, + "step": 511930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010094665107923925, + "loss": 0.0088, + "step": 511940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010094276286286779, + "loss": 0.0091, + "step": 511950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093887464649632, + "loss": 0.0081, + "step": 511960 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093498643012486, + "loss": 0.0087, + "step": 511970 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010093109821375339, + "loss": 0.0112, + "step": 511980 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010092720999738193, + "loss": 0.0113, + "step": 511990 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010092332178101046, + "loss": 0.0088, + "step": 512000 + }, + { + "epoch": 1.33, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.006633738521486521, + "eval_runtime": 107.8155, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.638, + "step": 512000 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100919433564639, + "loss": 0.0103, + "step": 512010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010091554534826753, + "loss": 0.0086, + "step": 512020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010091165713189607, + "loss": 0.0127, + "step": 512030 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001009077689155246, + "loss": 0.0105, + "step": 512040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010090388069915315, + "loss": 0.0104, + "step": 512050 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010089999248278167, + "loss": 0.014, + "step": 512060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010089610426641022, + "loss": 0.008, + "step": 512070 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010089221605003875, + "loss": 0.0077, + "step": 512080 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010088832783366729, + "loss": 0.0124, + "step": 512090 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010088443961729582, + "loss": 0.0103, + "step": 512100 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010088055140092435, + "loss": 0.0091, + "step": 512110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010087666318455289, + "loss": 0.0108, + "step": 512120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010087277496818142, + "loss": 0.0104, + "step": 512130 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010086888675180996, + "loss": 0.0095, + "step": 512140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010086499853543849, + "loss": 0.0101, + "step": 512150 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010086111031906703, + "loss": 0.0113, + "step": 512160 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010085722210269556, + "loss": 0.0069, + "step": 512170 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008533338863241, + "loss": 0.0085, + "step": 512180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010084944566995263, + "loss": 0.0093, + "step": 512190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010084555745358117, + "loss": 0.0097, + "step": 512200 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001008416692372097, + "loss": 0.0104, + "step": 512210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010083778102083824, + "loss": 0.0088, + "step": 512220 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010083389280446677, + "loss": 0.0106, + "step": 512230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010083000458809532, + "loss": 0.0125, + "step": 512240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010082611637172385, + "loss": 0.0114, + "step": 512250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010082222815535239, + "loss": 0.0094, + "step": 512260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010081833993898092, + "loss": 0.0106, + "step": 512270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010081445172260946, + "loss": 0.01, + "step": 512280 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010081056350623799, + "loss": 0.0117, + "step": 512290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010080667528986653, + "loss": 0.009, + "step": 512300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010080278707349506, + "loss": 0.0104, + "step": 512310 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007988988571236, + "loss": 0.0103, + "step": 512320 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010079501064075213, + "loss": 0.0101, + "step": 512330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010079112242438067, + "loss": 0.0112, + "step": 512340 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007872342080092, + "loss": 0.0109, + "step": 512350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010078334599163773, + "loss": 0.0093, + "step": 512360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010077945777526627, + "loss": 0.008, + "step": 512370 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007755695588948, + "loss": 0.0114, + "step": 512380 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010077168134252334, + "loss": 0.0107, + "step": 512390 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010076779312615186, + "loss": 0.0146, + "step": 512400 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007639049097804, + "loss": 0.0136, + "step": 512410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010076001669340893, + "loss": 0.0106, + "step": 512420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010075612847703749, + "loss": 0.0083, + "step": 512430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010075224026066602, + "loss": 0.0152, + "step": 512440 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010074835204429456, + "loss": 0.0113, + "step": 512450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010074446382792309, + "loss": 0.0097, + "step": 512460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010074057561155163, + "loss": 0.0099, + "step": 512470 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010073668739518016, + "loss": 0.0143, + "step": 512480 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007327991788087, + "loss": 0.009, + "step": 512490 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010072891096243723, + "loss": 0.0085, + "step": 512500 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010072502274606577, + "loss": 0.0093, + "step": 512510 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001007211345296943, + "loss": 0.0094, + "step": 512520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010071724631332284, + "loss": 0.0115, + "step": 512530 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010071335809695137, + "loss": 0.0085, + "step": 512540 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010070946988057991, + "loss": 0.0068, + "step": 512550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010070558166420844, + "loss": 0.0084, + "step": 512560 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010070169344783698, + "loss": 0.0106, + "step": 512570 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006978052314655, + "loss": 0.0098, + "step": 512580 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010069391701509403, + "loss": 0.0113, + "step": 512590 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010069002879872259, + "loss": 0.0095, + "step": 512600 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068614058235112, + "loss": 0.0089, + "step": 512610 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010068225236597966, + "loss": 0.0113, + "step": 512620 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010067836414960819, + "loss": 0.0094, + "step": 512630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010067447593323673, + "loss": 0.0104, + "step": 512640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010067058771686526, + "loss": 0.012, + "step": 512650 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006666995004938, + "loss": 0.0107, + "step": 512660 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010066281128412233, + "loss": 0.0096, + "step": 512670 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010065892306775087, + "loss": 0.0094, + "step": 512680 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006550348513794, + "loss": 0.0089, + "step": 512690 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010065114663500794, + "loss": 0.0074, + "step": 512700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010064725841863647, + "loss": 0.0108, + "step": 512710 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010064337020226501, + "loss": 0.0089, + "step": 512720 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010063948198589354, + "loss": 0.0086, + "step": 512730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010063559376952208, + "loss": 0.0104, + "step": 512740 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006317055531506, + "loss": 0.0116, + "step": 512750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062781733677916, + "loss": 0.0105, + "step": 512760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062392912040767, + "loss": 0.011, + "step": 512770 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010062004090403623, + "loss": 0.0109, + "step": 512780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010061615268766476, + "loss": 0.0085, + "step": 512790 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006122644712933, + "loss": 0.0093, + "step": 512800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010060837625492183, + "loss": 0.0131, + "step": 512810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010060448803855037, + "loss": 0.0095, + "step": 512820 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001006005998221789, + "loss": 0.0135, + "step": 512830 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010059671160580743, + "loss": 0.0106, + "step": 512840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010059282338943597, + "loss": 0.0117, + "step": 512850 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005889351730645, + "loss": 0.0116, + "step": 512860 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010058504695669304, + "loss": 0.0085, + "step": 512870 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010058115874032157, + "loss": 0.0093, + "step": 512880 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005772705239501, + "loss": 0.0132, + "step": 512890 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010057338230757863, + "loss": 0.0111, + "step": 512900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010056949409120718, + "loss": 0.0092, + "step": 512910 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005656058748357, + "loss": 0.0093, + "step": 512920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010056171765846425, + "loss": 0.0095, + "step": 512930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010055782944209277, + "loss": 0.0097, + "step": 512940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010055394122572133, + "loss": 0.0105, + "step": 512950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010055005300934986, + "loss": 0.0117, + "step": 512960 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005461647929784, + "loss": 0.0083, + "step": 512970 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010054227657660693, + "loss": 0.0115, + "step": 512980 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010053838836023547, + "loss": 0.0069, + "step": 512990 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100534500143864, + "loss": 0.0112, + "step": 513000 + }, + { + "epoch": 1.33, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.006440384313464165, + "eval_runtime": 107.8594, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 513000 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010053061192749254, + "loss": 0.0088, + "step": 513010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010052672371112107, + "loss": 0.0093, + "step": 513020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010052283549474961, + "loss": 0.0079, + "step": 513030 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010051894727837814, + "loss": 0.0106, + "step": 513040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010051505906200668, + "loss": 0.0099, + "step": 513050 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001005111708456352, + "loss": 0.0101, + "step": 513060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010050728262926375, + "loss": 0.0102, + "step": 513070 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010050339441289228, + "loss": 0.0119, + "step": 513080 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004995061965208, + "loss": 0.008, + "step": 513090 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010049561798014935, + "loss": 0.0078, + "step": 513100 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010049172976377787, + "loss": 0.0088, + "step": 513110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010048784154740643, + "loss": 0.0111, + "step": 513120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010048395333103494, + "loss": 0.0094, + "step": 513130 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004800651146635, + "loss": 0.0081, + "step": 513140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010047617689829203, + "loss": 0.0089, + "step": 513150 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010047228868192057, + "loss": 0.0086, + "step": 513160 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004684004655491, + "loss": 0.0107, + "step": 513170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010046451224917764, + "loss": 0.0119, + "step": 513180 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010046062403280617, + "loss": 0.009, + "step": 513190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010045673581643471, + "loss": 0.0099, + "step": 513200 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010045284760006324, + "loss": 0.0093, + "step": 513210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010044895938369178, + "loss": 0.0095, + "step": 513220 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004450711673203, + "loss": 0.0104, + "step": 513230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010044118295094885, + "loss": 0.0096, + "step": 513240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010043729473457738, + "loss": 0.0149, + "step": 513250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010043340651820592, + "loss": 0.0108, + "step": 513260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010042951830183444, + "loss": 0.0092, + "step": 513270 + }, + { + "epoch": 1.33, + "learning_rate": 0.000100425630085463, + "loss": 0.0102, + "step": 513280 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010042174186909151, + "loss": 0.0091, + "step": 513290 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010041785365272007, + "loss": 0.0078, + "step": 513300 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004139654363486, + "loss": 0.0153, + "step": 513310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010041007721997714, + "loss": 0.0092, + "step": 513320 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010040618900360567, + "loss": 0.0107, + "step": 513330 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001004023007872342, + "loss": 0.009, + "step": 513340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010039841257086274, + "loss": 0.0123, + "step": 513350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010039452435449127, + "loss": 0.0099, + "step": 513360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010039063613811981, + "loss": 0.012, + "step": 513370 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010038674792174834, + "loss": 0.0087, + "step": 513380 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010038285970537688, + "loss": 0.0079, + "step": 513390 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003789714890054, + "loss": 0.009, + "step": 513400 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010037508327263395, + "loss": 0.0102, + "step": 513410 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010037119505626247, + "loss": 0.0093, + "step": 513420 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010036730683989102, + "loss": 0.0097, + "step": 513430 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010036341862351954, + "loss": 0.01, + "step": 513440 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010035953040714809, + "loss": 0.009, + "step": 513450 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010035564219077661, + "loss": 0.0104, + "step": 513460 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010035175397440517, + "loss": 0.0091, + "step": 513470 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003478657580337, + "loss": 0.0083, + "step": 513480 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010034397754166224, + "loss": 0.0095, + "step": 513490 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010034008932529077, + "loss": 0.0102, + "step": 513500 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010033620110891931, + "loss": 0.0089, + "step": 513510 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010033231289254784, + "loss": 0.0101, + "step": 513520 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010032842467617638, + "loss": 0.0102, + "step": 513530 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001003245364598049, + "loss": 0.0099, + "step": 513540 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010032064824343345, + "loss": 0.0097, + "step": 513550 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010031676002706198, + "loss": 0.0082, + "step": 513560 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010031287181069052, + "loss": 0.0106, + "step": 513570 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010030898359431905, + "loss": 0.0073, + "step": 513580 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010030509537794757, + "loss": 0.0103, + "step": 513590 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010030120716157612, + "loss": 0.0113, + "step": 513600 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010029731894520464, + "loss": 0.0103, + "step": 513610 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010029343072883319, + "loss": 0.0159, + "step": 513620 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010028954251246171, + "loss": 0.0107, + "step": 513630 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010028565429609027, + "loss": 0.0083, + "step": 513640 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010028176607971878, + "loss": 0.0091, + "step": 513650 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010027787786334734, + "loss": 0.0108, + "step": 513660 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010027398964697587, + "loss": 0.0076, + "step": 513670 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010027010143060441, + "loss": 0.0119, + "step": 513680 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010026621321423294, + "loss": 0.0079, + "step": 513690 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010026232499786148, + "loss": 0.0087, + "step": 513700 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025843678149, + "loss": 0.0138, + "step": 513710 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025454856511855, + "loss": 0.0131, + "step": 513720 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010025066034874708, + "loss": 0.0083, + "step": 513730 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010024677213237562, + "loss": 0.0082, + "step": 513740 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010024288391600415, + "loss": 0.0115, + "step": 513750 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010023899569963269, + "loss": 0.0077, + "step": 513760 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010023510748326122, + "loss": 0.0109, + "step": 513770 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010023121926688976, + "loss": 0.0131, + "step": 513780 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010022733105051828, + "loss": 0.0099, + "step": 513790 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010022344283414683, + "loss": 0.0111, + "step": 513800 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010021955461777535, + "loss": 0.0129, + "step": 513810 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010021566640140391, + "loss": 0.0068, + "step": 513820 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010021177818503244, + "loss": 0.0108, + "step": 513830 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010020788996866097, + "loss": 0.0122, + "step": 513840 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010020400175228951, + "loss": 0.0117, + "step": 513850 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010020011353591804, + "loss": 0.0095, + "step": 513860 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010019622531954658, + "loss": 0.0122, + "step": 513870 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001001923371031751, + "loss": 0.009, + "step": 513880 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010018844888680365, + "loss": 0.0084, + "step": 513890 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010018456067043218, + "loss": 0.0121, + "step": 513900 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010018067245406072, + "loss": 0.0095, + "step": 513910 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010017678423768924, + "loss": 0.0073, + "step": 513920 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010017289602131779, + "loss": 0.0062, + "step": 513930 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010016900780494631, + "loss": 0.0145, + "step": 513940 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010016511958857486, + "loss": 0.0087, + "step": 513950 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010016123137220338, + "loss": 0.0095, + "step": 513960 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010015734315583193, + "loss": 0.0132, + "step": 513970 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010015345493946045, + "loss": 0.0082, + "step": 513980 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010014956672308901, + "loss": 0.0084, + "step": 513990 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010014567850671752, + "loss": 0.0073, + "step": 514000 + }, + { + "epoch": 1.33, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.006481009069830179, + "eval_runtime": 108.0446, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, + "step": 514000 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010014179029034608, + "loss": 0.0106, + "step": 514010 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010013790207397461, + "loss": 0.0117, + "step": 514020 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010013401385760315, + "loss": 0.0088, + "step": 514030 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010013012564123168, + "loss": 0.0116, + "step": 514040 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010012623742486022, + "loss": 0.0089, + "step": 514050 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010012234920848875, + "loss": 0.011, + "step": 514060 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010011846099211729, + "loss": 0.0108, + "step": 514070 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010011457277574582, + "loss": 0.0091, + "step": 514080 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010011068455937434, + "loss": 0.0139, + "step": 514090 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010010679634300289, + "loss": 0.0082, + "step": 514100 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010010290812663141, + "loss": 0.0092, + "step": 514110 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009901991025996, + "loss": 0.0145, + "step": 514120 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009513169388848, + "loss": 0.0119, + "step": 514130 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010009124347751703, + "loss": 0.0082, + "step": 514140 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010008735526114555, + "loss": 0.0131, + "step": 514150 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000834670447741, + "loss": 0.0093, + "step": 514160 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010007957882840262, + "loss": 0.0117, + "step": 514170 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010007569061203118, + "loss": 0.0087, + "step": 514180 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000718023956597, + "loss": 0.01, + "step": 514190 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006791417928825, + "loss": 0.0099, + "step": 514200 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006402596291678, + "loss": 0.0084, + "step": 514210 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010006013774654532, + "loss": 0.0127, + "step": 514220 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010005624953017385, + "loss": 0.0101, + "step": 514230 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010005236131380239, + "loss": 0.0113, + "step": 514240 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010004847309743092, + "loss": 0.0091, + "step": 514250 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010004458488105946, + "loss": 0.0114, + "step": 514260 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010004069666468799, + "loss": 0.012, + "step": 514270 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010003680844831653, + "loss": 0.0088, + "step": 514280 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010003292023194506, + "loss": 0.0101, + "step": 514290 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000290320155736, + "loss": 0.0091, + "step": 514300 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010002514379920212, + "loss": 0.0119, + "step": 514310 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010002125558283067, + "loss": 0.0095, + "step": 514320 + }, + { + "epoch": 1.33, + "learning_rate": 0.0001000173673664592, + "loss": 0.0088, + "step": 514330 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010001347915008772, + "loss": 0.0077, + "step": 514340 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010000959093371628, + "loss": 0.0128, + "step": 514350 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010000570271734479, + "loss": 0.009, + "step": 514360 + }, + { + "epoch": 1.33, + "learning_rate": 0.00010000181450097335, + "loss": 0.0083, + "step": 514370 + }, + { + "epoch": 1.33, + "learning_rate": 9.999792628460188e-05, + "loss": 0.0085, + "step": 514380 + }, + { + "epoch": 1.33, + "learning_rate": 9.999403806823042e-05, + "loss": 0.01, + "step": 514390 + }, + { + "epoch": 1.33, + "learning_rate": 9.999014985185895e-05, + "loss": 0.0146, + "step": 514400 + }, + { + "epoch": 1.33, + "learning_rate": 9.998626163548749e-05, + "loss": 0.0117, + "step": 514410 + }, + { + "epoch": 1.33, + "learning_rate": 9.998237341911602e-05, + "loss": 0.0086, + "step": 514420 + }, + { + "epoch": 1.33, + "learning_rate": 9.997848520274456e-05, + "loss": 0.0091, + "step": 514430 + }, + { + "epoch": 1.33, + "learning_rate": 9.997459698637308e-05, + "loss": 0.0085, + "step": 514440 + }, + { + "epoch": 1.33, + "learning_rate": 9.997070877000163e-05, + "loss": 0.0095, + "step": 514450 + }, + { + "epoch": 1.33, + "learning_rate": 9.996682055363015e-05, + "loss": 0.0084, + "step": 514460 + }, + { + "epoch": 1.33, + "learning_rate": 9.99629323372587e-05, + "loss": 0.011, + "step": 514470 + }, + { + "epoch": 1.33, + "learning_rate": 9.995904412088722e-05, + "loss": 0.0088, + "step": 514480 + }, + { + "epoch": 1.33, + "learning_rate": 9.995515590451577e-05, + "loss": 0.0073, + "step": 514490 + }, + { + "epoch": 1.33, + "learning_rate": 9.99512676881443e-05, + "loss": 0.0141, + "step": 514500 + }, + { + "epoch": 1.33, + "learning_rate": 9.994737947177285e-05, + "loss": 0.0099, + "step": 514510 + }, + { + "epoch": 1.33, + "learning_rate": 9.994349125540136e-05, + "loss": 0.0088, + "step": 514520 + }, + { + "epoch": 1.33, + "learning_rate": 9.993960303902992e-05, + "loss": 0.0095, + "step": 514530 + }, + { + "epoch": 1.33, + "learning_rate": 9.993571482265845e-05, + "loss": 0.0107, + "step": 514540 + }, + { + "epoch": 1.33, + "learning_rate": 9.993182660628699e-05, + "loss": 0.0089, + "step": 514550 + }, + { + "epoch": 1.33, + "learning_rate": 9.992793838991552e-05, + "loss": 0.009, + "step": 514560 + }, + { + "epoch": 1.33, + "learning_rate": 9.992405017354406e-05, + "loss": 0.0085, + "step": 514570 + }, + { + "epoch": 1.33, + "learning_rate": 9.992016195717259e-05, + "loss": 0.0123, + "step": 514580 + }, + { + "epoch": 1.33, + "learning_rate": 9.991627374080111e-05, + "loss": 0.0112, + "step": 514590 + }, + { + "epoch": 1.33, + "learning_rate": 9.991238552442966e-05, + "loss": 0.0125, + "step": 514600 + }, + { + "epoch": 1.33, + "learning_rate": 9.990849730805818e-05, + "loss": 0.0116, + "step": 514610 + }, + { + "epoch": 1.33, + "learning_rate": 9.990460909168673e-05, + "loss": 0.0122, + "step": 514620 + }, + { + "epoch": 1.33, + "learning_rate": 9.990072087531525e-05, + "loss": 0.0084, + "step": 514630 + }, + { + "epoch": 1.33, + "learning_rate": 9.98968326589438e-05, + "loss": 0.0125, + "step": 514640 + }, + { + "epoch": 1.33, + "learning_rate": 9.989294444257232e-05, + "loss": 0.0069, + "step": 514650 + }, + { + "epoch": 1.33, + "learning_rate": 9.988905622620087e-05, + "loss": 0.0087, + "step": 514660 + }, + { + "epoch": 1.33, + "learning_rate": 9.98851680098294e-05, + "loss": 0.0083, + "step": 514670 + }, + { + "epoch": 1.33, + "learning_rate": 9.988127979345793e-05, + "loss": 0.0098, + "step": 514680 + }, + { + "epoch": 1.33, + "learning_rate": 9.987739157708646e-05, + "loss": 0.0121, + "step": 514690 + }, + { + "epoch": 1.33, + "learning_rate": 9.987350336071502e-05, + "loss": 0.0078, + "step": 514700 + }, + { + "epoch": 1.33, + "learning_rate": 9.986961514434355e-05, + "loss": 0.0084, + "step": 514710 + }, + { + "epoch": 1.33, + "learning_rate": 9.986572692797209e-05, + "loss": 0.0199, + "step": 514720 + }, + { + "epoch": 1.33, + "learning_rate": 9.986183871160062e-05, + "loss": 0.0079, + "step": 514730 + }, + { + "epoch": 1.33, + "learning_rate": 9.985795049522916e-05, + "loss": 0.0089, + "step": 514740 + }, + { + "epoch": 1.33, + "learning_rate": 9.985406227885769e-05, + "loss": 0.0096, + "step": 514750 + }, + { + "epoch": 1.33, + "learning_rate": 9.985017406248623e-05, + "loss": 0.0108, + "step": 514760 + }, + { + "epoch": 1.33, + "learning_rate": 9.984628584611476e-05, + "loss": 0.0096, + "step": 514770 + }, + { + "epoch": 1.33, + "learning_rate": 9.98423976297433e-05, + "loss": 0.0193, + "step": 514780 + }, + { + "epoch": 1.33, + "learning_rate": 9.983850941337183e-05, + "loss": 0.01, + "step": 514790 + }, + { + "epoch": 1.33, + "learning_rate": 9.983462119700037e-05, + "loss": 0.0115, + "step": 514800 + }, + { + "epoch": 1.33, + "learning_rate": 9.98307329806289e-05, + "loss": 0.0099, + "step": 514810 + }, + { + "epoch": 1.33, + "learning_rate": 9.982684476425744e-05, + "loss": 0.0085, + "step": 514820 + }, + { + "epoch": 1.33, + "learning_rate": 9.982295654788596e-05, + "loss": 0.0066, + "step": 514830 + }, + { + "epoch": 1.33, + "learning_rate": 9.981906833151449e-05, + "loss": 0.0123, + "step": 514840 + }, + { + "epoch": 1.33, + "learning_rate": 9.981518011514303e-05, + "loss": 0.0103, + "step": 514850 + }, + { + "epoch": 1.33, + "learning_rate": 9.981129189877156e-05, + "loss": 0.0122, + "step": 514860 + }, + { + "epoch": 1.33, + "learning_rate": 9.980740368240012e-05, + "loss": 0.0093, + "step": 514870 + }, + { + "epoch": 1.33, + "learning_rate": 9.980351546602863e-05, + "loss": 0.0073, + "step": 514880 + }, + { + "epoch": 1.33, + "learning_rate": 9.979962724965719e-05, + "loss": 0.0087, + "step": 514890 + }, + { + "epoch": 1.33, + "learning_rate": 9.979573903328572e-05, + "loss": 0.0101, + "step": 514900 + }, + { + "epoch": 1.33, + "learning_rate": 9.979185081691426e-05, + "loss": 0.0091, + "step": 514910 + }, + { + "epoch": 1.33, + "learning_rate": 9.978796260054279e-05, + "loss": 0.0075, + "step": 514920 + }, + { + "epoch": 1.33, + "learning_rate": 9.978407438417133e-05, + "loss": 0.011, + "step": 514930 + }, + { + "epoch": 1.33, + "learning_rate": 9.978018616779985e-05, + "loss": 0.0107, + "step": 514940 + }, + { + "epoch": 1.33, + "learning_rate": 9.97762979514284e-05, + "loss": 0.0083, + "step": 514950 + }, + { + "epoch": 1.33, + "learning_rate": 9.977240973505692e-05, + "loss": 0.0106, + "step": 514960 + }, + { + "epoch": 1.33, + "learning_rate": 9.976852151868547e-05, + "loss": 0.0083, + "step": 514970 + }, + { + "epoch": 1.33, + "learning_rate": 9.9764633302314e-05, + "loss": 0.0093, + "step": 514980 + }, + { + "epoch": 1.33, + "learning_rate": 9.976074508594254e-05, + "loss": 0.0101, + "step": 514990 + }, + { + "epoch": 1.33, + "learning_rate": 9.975685686957106e-05, + "loss": 0.0079, + "step": 515000 + }, + { + "epoch": 1.33, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.006493269931524992, + "eval_runtime": 108.0338, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, + "step": 515000 + }, + { + "epoch": 1.33, + "learning_rate": 9.97529686531996e-05, + "loss": 0.0072, + "step": 515010 + }, + { + "epoch": 1.34, + "learning_rate": 9.974908043682813e-05, + "loss": 0.0088, + "step": 515020 + }, + { + "epoch": 1.34, + "learning_rate": 9.974519222045668e-05, + "loss": 0.0101, + "step": 515030 + }, + { + "epoch": 1.34, + "learning_rate": 9.97413040040852e-05, + "loss": 0.0084, + "step": 515040 + }, + { + "epoch": 1.34, + "learning_rate": 9.973741578771376e-05, + "loss": 0.0128, + "step": 515050 + }, + { + "epoch": 1.34, + "learning_rate": 9.973352757134229e-05, + "loss": 0.0101, + "step": 515060 + }, + { + "epoch": 1.34, + "learning_rate": 9.972963935497081e-05, + "loss": 0.0098, + "step": 515070 + }, + { + "epoch": 1.34, + "learning_rate": 9.972575113859936e-05, + "loss": 0.0117, + "step": 515080 + }, + { + "epoch": 1.34, + "learning_rate": 9.972186292222788e-05, + "loss": 0.0095, + "step": 515090 + }, + { + "epoch": 1.34, + "learning_rate": 9.971797470585643e-05, + "loss": 0.0107, + "step": 515100 + }, + { + "epoch": 1.34, + "learning_rate": 9.971408648948495e-05, + "loss": 0.0095, + "step": 515110 + }, + { + "epoch": 1.34, + "learning_rate": 9.97101982731135e-05, + "loss": 0.0098, + "step": 515120 + }, + { + "epoch": 1.34, + "learning_rate": 9.970631005674202e-05, + "loss": 0.0099, + "step": 515130 + }, + { + "epoch": 1.34, + "learning_rate": 9.970242184037057e-05, + "loss": 0.0095, + "step": 515140 + }, + { + "epoch": 1.34, + "learning_rate": 9.96985336239991e-05, + "loss": 0.0125, + "step": 515150 + }, + { + "epoch": 1.34, + "learning_rate": 9.969464540762764e-05, + "loss": 0.0086, + "step": 515160 + }, + { + "epoch": 1.34, + "learning_rate": 9.969075719125616e-05, + "loss": 0.0108, + "step": 515170 + }, + { + "epoch": 1.34, + "learning_rate": 9.96868689748847e-05, + "loss": 0.0097, + "step": 515180 + }, + { + "epoch": 1.34, + "learning_rate": 9.968298075851323e-05, + "loss": 0.0081, + "step": 515190 + }, + { + "epoch": 1.34, + "learning_rate": 9.967909254214177e-05, + "loss": 0.0082, + "step": 515200 + }, + { + "epoch": 1.34, + "learning_rate": 9.96752043257703e-05, + "loss": 0.0071, + "step": 515210 + }, + { + "epoch": 1.34, + "learning_rate": 9.967131610939886e-05, + "loss": 0.0125, + "step": 515220 + }, + { + "epoch": 1.34, + "learning_rate": 9.966742789302739e-05, + "loss": 0.0108, + "step": 515230 + }, + { + "epoch": 1.34, + "learning_rate": 9.966353967665593e-05, + "loss": 0.0087, + "step": 515240 + }, + { + "epoch": 1.34, + "learning_rate": 9.965965146028446e-05, + "loss": 0.0091, + "step": 515250 + }, + { + "epoch": 1.34, + "learning_rate": 9.9655763243913e-05, + "loss": 0.0109, + "step": 515260 + }, + { + "epoch": 1.34, + "learning_rate": 9.965187502754153e-05, + "loss": 0.0087, + "step": 515270 + }, + { + "epoch": 1.34, + "learning_rate": 9.964798681117007e-05, + "loss": 0.0104, + "step": 515280 + }, + { + "epoch": 1.34, + "learning_rate": 9.96440985947986e-05, + "loss": 0.0103, + "step": 515290 + }, + { + "epoch": 1.34, + "learning_rate": 9.964021037842714e-05, + "loss": 0.0086, + "step": 515300 + }, + { + "epoch": 1.34, + "learning_rate": 9.963632216205567e-05, + "loss": 0.0107, + "step": 515310 + }, + { + "epoch": 1.34, + "learning_rate": 9.96324339456842e-05, + "loss": 0.0107, + "step": 515320 + }, + { + "epoch": 1.34, + "learning_rate": 9.962854572931273e-05, + "loss": 0.0074, + "step": 515330 + }, + { + "epoch": 1.34, + "learning_rate": 9.962465751294126e-05, + "loss": 0.015, + "step": 515340 + }, + { + "epoch": 1.34, + "learning_rate": 9.96207692965698e-05, + "loss": 0.0123, + "step": 515350 + }, + { + "epoch": 1.34, + "learning_rate": 9.961688108019833e-05, + "loss": 0.0099, + "step": 515360 + }, + { + "epoch": 1.34, + "learning_rate": 9.961299286382687e-05, + "loss": 0.012, + "step": 515370 + }, + { + "epoch": 1.34, + "learning_rate": 9.96091046474554e-05, + "loss": 0.0089, + "step": 515380 + }, + { + "epoch": 1.34, + "learning_rate": 9.960521643108394e-05, + "loss": 0.0128, + "step": 515390 + }, + { + "epoch": 1.34, + "learning_rate": 9.960132821471247e-05, + "loss": 0.0116, + "step": 515400 + }, + { + "epoch": 1.34, + "learning_rate": 9.959743999834103e-05, + "loss": 0.0083, + "step": 515410 + }, + { + "epoch": 1.34, + "learning_rate": 9.959355178196956e-05, + "loss": 0.0078, + "step": 515420 + }, + { + "epoch": 1.34, + "learning_rate": 9.95896635655981e-05, + "loss": 0.0117, + "step": 515430 + }, + { + "epoch": 1.34, + "learning_rate": 9.958577534922663e-05, + "loss": 0.0086, + "step": 515440 + }, + { + "epoch": 1.34, + "learning_rate": 9.958188713285517e-05, + "loss": 0.0091, + "step": 515450 + }, + { + "epoch": 1.34, + "learning_rate": 9.95779989164837e-05, + "loss": 0.0097, + "step": 515460 + }, + { + "epoch": 1.34, + "learning_rate": 9.957411070011224e-05, + "loss": 0.0079, + "step": 515470 + }, + { + "epoch": 1.34, + "learning_rate": 9.957022248374076e-05, + "loss": 0.007, + "step": 515480 + }, + { + "epoch": 1.34, + "learning_rate": 9.95663342673693e-05, + "loss": 0.0109, + "step": 515490 + }, + { + "epoch": 1.34, + "learning_rate": 9.956244605099783e-05, + "loss": 0.011, + "step": 515500 + }, + { + "epoch": 1.34, + "learning_rate": 9.955855783462638e-05, + "loss": 0.013, + "step": 515510 + }, + { + "epoch": 1.34, + "learning_rate": 9.95546696182549e-05, + "loss": 0.0085, + "step": 515520 + }, + { + "epoch": 1.34, + "learning_rate": 9.955078140188345e-05, + "loss": 0.0121, + "step": 515530 + }, + { + "epoch": 1.34, + "learning_rate": 9.954689318551197e-05, + "loss": 0.0123, + "step": 515540 + }, + { + "epoch": 1.34, + "learning_rate": 9.954300496914052e-05, + "loss": 0.0133, + "step": 515550 + }, + { + "epoch": 1.34, + "learning_rate": 9.953911675276904e-05, + "loss": 0.0102, + "step": 515560 + }, + { + "epoch": 1.34, + "learning_rate": 9.953522853639757e-05, + "loss": 0.0084, + "step": 515570 + }, + { + "epoch": 1.34, + "learning_rate": 9.953134032002613e-05, + "loss": 0.0121, + "step": 515580 + }, + { + "epoch": 1.34, + "learning_rate": 9.952745210365464e-05, + "loss": 0.0122, + "step": 515590 + }, + { + "epoch": 1.34, + "learning_rate": 9.95235638872832e-05, + "loss": 0.0109, + "step": 515600 + }, + { + "epoch": 1.34, + "learning_rate": 9.951967567091172e-05, + "loss": 0.0092, + "step": 515610 + }, + { + "epoch": 1.34, + "learning_rate": 9.951578745454027e-05, + "loss": 0.0113, + "step": 515620 + }, + { + "epoch": 1.34, + "learning_rate": 9.95118992381688e-05, + "loss": 0.0086, + "step": 515630 + }, + { + "epoch": 1.34, + "learning_rate": 9.950801102179734e-05, + "loss": 0.0109, + "step": 515640 + }, + { + "epoch": 1.34, + "learning_rate": 9.950412280542586e-05, + "loss": 0.0101, + "step": 515650 + }, + { + "epoch": 1.34, + "learning_rate": 9.95002345890544e-05, + "loss": 0.0099, + "step": 515660 + }, + { + "epoch": 1.34, + "learning_rate": 9.949634637268293e-05, + "loss": 0.0082, + "step": 515670 + }, + { + "epoch": 1.34, + "learning_rate": 9.949245815631148e-05, + "loss": 0.0115, + "step": 515680 + }, + { + "epoch": 1.34, + "learning_rate": 9.948856993994e-05, + "loss": 0.0132, + "step": 515690 + }, + { + "epoch": 1.34, + "learning_rate": 9.948468172356855e-05, + "loss": 0.0085, + "step": 515700 + }, + { + "epoch": 1.34, + "learning_rate": 9.948079350719707e-05, + "loss": 0.0093, + "step": 515710 + }, + { + "epoch": 1.34, + "learning_rate": 9.947690529082561e-05, + "loss": 0.0104, + "step": 515720 + }, + { + "epoch": 1.34, + "learning_rate": 9.947301707445414e-05, + "loss": 0.0094, + "step": 515730 + }, + { + "epoch": 1.34, + "learning_rate": 9.94691288580827e-05, + "loss": 0.0085, + "step": 515740 + }, + { + "epoch": 1.34, + "learning_rate": 9.946524064171121e-05, + "loss": 0.0111, + "step": 515750 + }, + { + "epoch": 1.34, + "learning_rate": 9.946135242533977e-05, + "loss": 0.0118, + "step": 515760 + }, + { + "epoch": 1.34, + "learning_rate": 9.94574642089683e-05, + "loss": 0.0115, + "step": 515770 + }, + { + "epoch": 1.34, + "learning_rate": 9.945357599259684e-05, + "loss": 0.0082, + "step": 515780 + }, + { + "epoch": 1.34, + "learning_rate": 9.944968777622537e-05, + "loss": 0.0081, + "step": 515790 + }, + { + "epoch": 1.34, + "learning_rate": 9.944579955985391e-05, + "loss": 0.0084, + "step": 515800 + }, + { + "epoch": 1.34, + "learning_rate": 9.944191134348244e-05, + "loss": 0.009, + "step": 515810 + }, + { + "epoch": 1.34, + "learning_rate": 9.943802312711096e-05, + "loss": 0.0092, + "step": 515820 + }, + { + "epoch": 1.34, + "learning_rate": 9.94341349107395e-05, + "loss": 0.01, + "step": 515830 + }, + { + "epoch": 1.34, + "learning_rate": 9.943024669436803e-05, + "loss": 0.0082, + "step": 515840 + }, + { + "epoch": 1.34, + "learning_rate": 9.942635847799657e-05, + "loss": 0.0077, + "step": 515850 + }, + { + "epoch": 1.34, + "learning_rate": 9.94224702616251e-05, + "loss": 0.0132, + "step": 515860 + }, + { + "epoch": 1.34, + "learning_rate": 9.941858204525364e-05, + "loss": 0.012, + "step": 515870 + }, + { + "epoch": 1.34, + "learning_rate": 9.941469382888217e-05, + "loss": 0.0112, + "step": 515880 + }, + { + "epoch": 1.34, + "learning_rate": 9.941080561251071e-05, + "loss": 0.0101, + "step": 515890 + }, + { + "epoch": 1.34, + "learning_rate": 9.940691739613924e-05, + "loss": 0.0073, + "step": 515900 + }, + { + "epoch": 1.34, + "learning_rate": 9.940302917976778e-05, + "loss": 0.0103, + "step": 515910 + }, + { + "epoch": 1.34, + "learning_rate": 9.939914096339631e-05, + "loss": 0.0092, + "step": 515920 + }, + { + "epoch": 1.34, + "learning_rate": 9.939525274702487e-05, + "loss": 0.0105, + "step": 515930 + }, + { + "epoch": 1.34, + "learning_rate": 9.93913645306534e-05, + "loss": 0.0093, + "step": 515940 + }, + { + "epoch": 1.34, + "learning_rate": 9.938747631428194e-05, + "loss": 0.0088, + "step": 515950 + }, + { + "epoch": 1.34, + "learning_rate": 9.938358809791047e-05, + "loss": 0.0099, + "step": 515960 + }, + { + "epoch": 1.34, + "learning_rate": 9.9379699881539e-05, + "loss": 0.0111, + "step": 515970 + }, + { + "epoch": 1.34, + "learning_rate": 9.937581166516753e-05, + "loss": 0.0086, + "step": 515980 + }, + { + "epoch": 1.34, + "learning_rate": 9.937192344879608e-05, + "loss": 0.01, + "step": 515990 + }, + { + "epoch": 1.34, + "learning_rate": 9.93680352324246e-05, + "loss": 0.0092, + "step": 516000 + }, + { + "epoch": 1.34, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.006371052470058203, + "eval_runtime": 107.8941, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 516000 + }, + { + "epoch": 1.34, + "learning_rate": 9.936414701605315e-05, + "loss": 0.0107, + "step": 516010 + }, + { + "epoch": 1.34, + "learning_rate": 9.936025879968167e-05, + "loss": 0.0106, + "step": 516020 + }, + { + "epoch": 1.34, + "learning_rate": 9.935637058331022e-05, + "loss": 0.009, + "step": 516030 + }, + { + "epoch": 1.34, + "learning_rate": 9.935248236693874e-05, + "loss": 0.0084, + "step": 516040 + }, + { + "epoch": 1.34, + "learning_rate": 9.934859415056729e-05, + "loss": 0.0073, + "step": 516050 + }, + { + "epoch": 1.34, + "learning_rate": 9.934470593419581e-05, + "loss": 0.0123, + "step": 516060 + }, + { + "epoch": 1.34, + "learning_rate": 9.934081771782434e-05, + "loss": 0.0102, + "step": 516070 + }, + { + "epoch": 1.34, + "learning_rate": 9.933692950145288e-05, + "loss": 0.0109, + "step": 516080 + }, + { + "epoch": 1.34, + "learning_rate": 9.933304128508141e-05, + "loss": 0.009, + "step": 516090 + }, + { + "epoch": 1.34, + "learning_rate": 9.932915306870997e-05, + "loss": 0.0074, + "step": 516100 + }, + { + "epoch": 1.34, + "learning_rate": 9.932526485233848e-05, + "loss": 0.0088, + "step": 516110 + }, + { + "epoch": 1.34, + "learning_rate": 9.932137663596704e-05, + "loss": 0.0091, + "step": 516120 + }, + { + "epoch": 1.34, + "learning_rate": 9.931748841959556e-05, + "loss": 0.0107, + "step": 516130 + }, + { + "epoch": 1.34, + "learning_rate": 9.93136002032241e-05, + "loss": 0.0151, + "step": 516140 + }, + { + "epoch": 1.34, + "learning_rate": 9.930971198685263e-05, + "loss": 0.012, + "step": 516150 + }, + { + "epoch": 1.34, + "learning_rate": 9.930582377048118e-05, + "loss": 0.0078, + "step": 516160 + }, + { + "epoch": 1.34, + "learning_rate": 9.93019355541097e-05, + "loss": 0.0081, + "step": 516170 + }, + { + "epoch": 1.34, + "learning_rate": 9.929804733773825e-05, + "loss": 0.012, + "step": 516180 + }, + { + "epoch": 1.34, + "learning_rate": 9.929415912136677e-05, + "loss": 0.0099, + "step": 516190 + }, + { + "epoch": 1.34, + "learning_rate": 9.929027090499532e-05, + "loss": 0.011, + "step": 516200 + }, + { + "epoch": 1.34, + "learning_rate": 9.928638268862384e-05, + "loss": 0.0103, + "step": 516210 + }, + { + "epoch": 1.34, + "learning_rate": 9.928249447225238e-05, + "loss": 0.0079, + "step": 516220 + }, + { + "epoch": 1.34, + "learning_rate": 9.927860625588091e-05, + "loss": 0.0084, + "step": 516230 + }, + { + "epoch": 1.34, + "learning_rate": 9.927471803950945e-05, + "loss": 0.0093, + "step": 516240 + }, + { + "epoch": 1.34, + "learning_rate": 9.927082982313798e-05, + "loss": 0.0087, + "step": 516250 + }, + { + "epoch": 1.34, + "learning_rate": 9.926694160676654e-05, + "loss": 0.0084, + "step": 516260 + }, + { + "epoch": 1.34, + "learning_rate": 9.926305339039505e-05, + "loss": 0.0082, + "step": 516270 + }, + { + "epoch": 1.34, + "learning_rate": 9.925916517402361e-05, + "loss": 0.0102, + "step": 516280 + }, + { + "epoch": 1.34, + "learning_rate": 9.925527695765214e-05, + "loss": 0.0113, + "step": 516290 + }, + { + "epoch": 1.34, + "learning_rate": 9.925138874128068e-05, + "loss": 0.0119, + "step": 516300 + }, + { + "epoch": 1.34, + "learning_rate": 9.92475005249092e-05, + "loss": 0.0074, + "step": 516310 + }, + { + "epoch": 1.34, + "learning_rate": 9.924361230853773e-05, + "loss": 0.012, + "step": 516320 + }, + { + "epoch": 1.34, + "learning_rate": 9.923972409216628e-05, + "loss": 0.0116, + "step": 516330 + }, + { + "epoch": 1.34, + "learning_rate": 9.92358358757948e-05, + "loss": 0.0101, + "step": 516340 + }, + { + "epoch": 1.34, + "learning_rate": 9.923194765942334e-05, + "loss": 0.0097, + "step": 516350 + }, + { + "epoch": 1.34, + "learning_rate": 9.922805944305187e-05, + "loss": 0.011, + "step": 516360 + }, + { + "epoch": 1.34, + "learning_rate": 9.922417122668041e-05, + "loss": 0.0092, + "step": 516370 + }, + { + "epoch": 1.34, + "learning_rate": 9.922028301030894e-05, + "loss": 0.0098, + "step": 516380 + }, + { + "epoch": 1.34, + "learning_rate": 9.921639479393748e-05, + "loss": 0.0081, + "step": 516390 + }, + { + "epoch": 1.34, + "learning_rate": 9.921250657756601e-05, + "loss": 0.0095, + "step": 516400 + }, + { + "epoch": 1.34, + "learning_rate": 9.920861836119455e-05, + "loss": 0.0108, + "step": 516410 + }, + { + "epoch": 1.34, + "learning_rate": 9.920473014482308e-05, + "loss": 0.0113, + "step": 516420 + }, + { + "epoch": 1.34, + "learning_rate": 9.920084192845162e-05, + "loss": 0.0104, + "step": 516430 + }, + { + "epoch": 1.34, + "learning_rate": 9.919695371208015e-05, + "loss": 0.0093, + "step": 516440 + }, + { + "epoch": 1.34, + "learning_rate": 9.919306549570871e-05, + "loss": 0.0079, + "step": 516450 + }, + { + "epoch": 1.34, + "learning_rate": 9.918917727933724e-05, + "loss": 0.0091, + "step": 516460 + }, + { + "epoch": 1.34, + "learning_rate": 9.918528906296578e-05, + "loss": 0.0089, + "step": 516470 + }, + { + "epoch": 1.34, + "learning_rate": 9.91814008465943e-05, + "loss": 0.0089, + "step": 516480 + }, + { + "epoch": 1.34, + "learning_rate": 9.917751263022285e-05, + "loss": 0.0085, + "step": 516490 + }, + { + "epoch": 1.34, + "learning_rate": 9.917362441385137e-05, + "loss": 0.0083, + "step": 516500 + }, + { + "epoch": 1.34, + "learning_rate": 9.916973619747992e-05, + "loss": 0.0102, + "step": 516510 + }, + { + "epoch": 1.34, + "learning_rate": 9.916584798110844e-05, + "loss": 0.0133, + "step": 516520 + }, + { + "epoch": 1.34, + "learning_rate": 9.916195976473699e-05, + "loss": 0.0127, + "step": 516530 + }, + { + "epoch": 1.34, + "learning_rate": 9.915807154836551e-05, + "loss": 0.0097, + "step": 516540 + }, + { + "epoch": 1.34, + "learning_rate": 9.915418333199406e-05, + "loss": 0.0107, + "step": 516550 + }, + { + "epoch": 1.34, + "learning_rate": 9.915029511562258e-05, + "loss": 0.0125, + "step": 516560 + }, + { + "epoch": 1.34, + "learning_rate": 9.914640689925111e-05, + "loss": 0.0094, + "step": 516570 + }, + { + "epoch": 1.34, + "learning_rate": 9.914251868287965e-05, + "loss": 0.0101, + "step": 516580 + }, + { + "epoch": 1.34, + "learning_rate": 9.913863046650818e-05, + "loss": 0.0109, + "step": 516590 + }, + { + "epoch": 1.34, + "learning_rate": 9.913474225013672e-05, + "loss": 0.0113, + "step": 516600 + }, + { + "epoch": 1.34, + "learning_rate": 9.913085403376525e-05, + "loss": 0.0081, + "step": 516610 + }, + { + "epoch": 1.34, + "learning_rate": 9.912696581739379e-05, + "loss": 0.0083, + "step": 516620 + }, + { + "epoch": 1.34, + "learning_rate": 9.912307760102232e-05, + "loss": 0.0078, + "step": 516630 + }, + { + "epoch": 1.34, + "learning_rate": 9.911918938465088e-05, + "loss": 0.0094, + "step": 516640 + }, + { + "epoch": 1.34, + "learning_rate": 9.91153011682794e-05, + "loss": 0.0107, + "step": 516650 + }, + { + "epoch": 1.34, + "learning_rate": 9.911141295190795e-05, + "loss": 0.0122, + "step": 516660 + }, + { + "epoch": 1.34, + "learning_rate": 9.910752473553647e-05, + "loss": 0.0142, + "step": 516670 + }, + { + "epoch": 1.34, + "learning_rate": 9.910363651916502e-05, + "loss": 0.0088, + "step": 516680 + }, + { + "epoch": 1.34, + "learning_rate": 9.909974830279354e-05, + "loss": 0.0089, + "step": 516690 + }, + { + "epoch": 1.34, + "learning_rate": 9.909586008642209e-05, + "loss": 0.0082, + "step": 516700 + }, + { + "epoch": 1.34, + "learning_rate": 9.909197187005061e-05, + "loss": 0.0089, + "step": 516710 + }, + { + "epoch": 1.34, + "learning_rate": 9.908808365367916e-05, + "loss": 0.007, + "step": 516720 + }, + { + "epoch": 1.34, + "learning_rate": 9.908419543730768e-05, + "loss": 0.0096, + "step": 516730 + }, + { + "epoch": 1.34, + "learning_rate": 9.908030722093622e-05, + "loss": 0.0093, + "step": 516740 + }, + { + "epoch": 1.34, + "learning_rate": 9.907641900456475e-05, + "loss": 0.01, + "step": 516750 + }, + { + "epoch": 1.34, + "learning_rate": 9.90725307881933e-05, + "loss": 0.0065, + "step": 516760 + }, + { + "epoch": 1.34, + "learning_rate": 9.906864257182182e-05, + "loss": 0.0105, + "step": 516770 + }, + { + "epoch": 1.34, + "learning_rate": 9.906475435545036e-05, + "loss": 0.0076, + "step": 516780 + }, + { + "epoch": 1.34, + "learning_rate": 9.906086613907889e-05, + "loss": 0.0095, + "step": 516790 + }, + { + "epoch": 1.34, + "learning_rate": 9.905697792270745e-05, + "loss": 0.0088, + "step": 516800 + }, + { + "epoch": 1.34, + "learning_rate": 9.905308970633598e-05, + "loss": 0.0087, + "step": 516810 + }, + { + "epoch": 1.34, + "learning_rate": 9.90492014899645e-05, + "loss": 0.0101, + "step": 516820 + }, + { + "epoch": 1.34, + "learning_rate": 9.904531327359305e-05, + "loss": 0.0089, + "step": 516830 + }, + { + "epoch": 1.34, + "learning_rate": 9.904142505722157e-05, + "loss": 0.0082, + "step": 516840 + }, + { + "epoch": 1.34, + "learning_rate": 9.903753684085012e-05, + "loss": 0.0069, + "step": 516850 + }, + { + "epoch": 1.34, + "learning_rate": 9.903364862447864e-05, + "loss": 0.0097, + "step": 516860 + }, + { + "epoch": 1.34, + "learning_rate": 9.902976040810718e-05, + "loss": 0.0096, + "step": 516870 + }, + { + "epoch": 1.34, + "learning_rate": 9.902587219173571e-05, + "loss": 0.0108, + "step": 516880 + }, + { + "epoch": 1.34, + "learning_rate": 9.902198397536425e-05, + "loss": 0.0103, + "step": 516890 + }, + { + "epoch": 1.34, + "learning_rate": 9.901809575899278e-05, + "loss": 0.0116, + "step": 516900 + }, + { + "epoch": 1.34, + "learning_rate": 9.901420754262132e-05, + "loss": 0.0091, + "step": 516910 + }, + { + "epoch": 1.34, + "learning_rate": 9.901031932624985e-05, + "loss": 0.0104, + "step": 516920 + }, + { + "epoch": 1.34, + "learning_rate": 9.90064311098784e-05, + "loss": 0.0092, + "step": 516930 + }, + { + "epoch": 1.34, + "learning_rate": 9.900254289350692e-05, + "loss": 0.0089, + "step": 516940 + }, + { + "epoch": 1.34, + "learning_rate": 9.899865467713546e-05, + "loss": 0.0127, + "step": 516950 + }, + { + "epoch": 1.34, + "learning_rate": 9.899476646076399e-05, + "loss": 0.0077, + "step": 516960 + }, + { + "epoch": 1.34, + "learning_rate": 9.899087824439255e-05, + "loss": 0.0112, + "step": 516970 + }, + { + "epoch": 1.34, + "learning_rate": 9.898699002802106e-05, + "loss": 0.0102, + "step": 516980 + }, + { + "epoch": 1.34, + "learning_rate": 9.898310181164962e-05, + "loss": 0.0115, + "step": 516990 + }, + { + "epoch": 1.34, + "learning_rate": 9.897921359527814e-05, + "loss": 0.0112, + "step": 517000 + }, + { + "epoch": 1.34, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.006507012993097305, + "eval_runtime": 107.881, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 517000 + }, + { + "epoch": 1.34, + "learning_rate": 9.897532537890669e-05, + "loss": 0.0128, + "step": 517010 + }, + { + "epoch": 1.34, + "learning_rate": 9.897143716253521e-05, + "loss": 0.0128, + "step": 517020 + }, + { + "epoch": 1.34, + "learning_rate": 9.896754894616376e-05, + "loss": 0.0094, + "step": 517030 + }, + { + "epoch": 1.34, + "learning_rate": 9.896366072979228e-05, + "loss": 0.0101, + "step": 517040 + }, + { + "epoch": 1.34, + "learning_rate": 9.895977251342083e-05, + "loss": 0.012, + "step": 517050 + }, + { + "epoch": 1.34, + "learning_rate": 9.895588429704935e-05, + "loss": 0.0129, + "step": 517060 + }, + { + "epoch": 1.34, + "learning_rate": 9.895199608067788e-05, + "loss": 0.0094, + "step": 517070 + }, + { + "epoch": 1.34, + "learning_rate": 9.894810786430642e-05, + "loss": 0.0082, + "step": 517080 + }, + { + "epoch": 1.34, + "learning_rate": 9.894421964793495e-05, + "loss": 0.0092, + "step": 517090 + }, + { + "epoch": 1.34, + "learning_rate": 9.89403314315635e-05, + "loss": 0.008, + "step": 517100 + }, + { + "epoch": 1.34, + "learning_rate": 9.893644321519202e-05, + "loss": 0.0096, + "step": 517110 + }, + { + "epoch": 1.34, + "learning_rate": 9.893255499882056e-05, + "loss": 0.01, + "step": 517120 + }, + { + "epoch": 1.34, + "learning_rate": 9.892866678244909e-05, + "loss": 0.0107, + "step": 517130 + }, + { + "epoch": 1.34, + "learning_rate": 9.892477856607763e-05, + "loss": 0.0095, + "step": 517140 + }, + { + "epoch": 1.34, + "learning_rate": 9.892089034970616e-05, + "loss": 0.0099, + "step": 517150 + }, + { + "epoch": 1.34, + "learning_rate": 9.891700213333472e-05, + "loss": 0.0084, + "step": 517160 + }, + { + "epoch": 1.34, + "learning_rate": 9.891311391696324e-05, + "loss": 0.008, + "step": 517170 + }, + { + "epoch": 1.34, + "learning_rate": 9.890922570059179e-05, + "loss": 0.0104, + "step": 517180 + }, + { + "epoch": 1.34, + "learning_rate": 9.890533748422031e-05, + "loss": 0.0093, + "step": 517190 + }, + { + "epoch": 1.34, + "learning_rate": 9.890144926784886e-05, + "loss": 0.0114, + "step": 517200 + }, + { + "epoch": 1.34, + "learning_rate": 9.889756105147738e-05, + "loss": 0.0093, + "step": 517210 + }, + { + "epoch": 1.34, + "learning_rate": 9.889367283510593e-05, + "loss": 0.0124, + "step": 517220 + }, + { + "epoch": 1.34, + "learning_rate": 9.888978461873445e-05, + "loss": 0.0117, + "step": 517230 + }, + { + "epoch": 1.34, + "learning_rate": 9.8885896402363e-05, + "loss": 0.0087, + "step": 517240 + }, + { + "epoch": 1.34, + "learning_rate": 9.888200818599152e-05, + "loss": 0.0076, + "step": 517250 + }, + { + "epoch": 1.34, + "learning_rate": 9.887811996962006e-05, + "loss": 0.0118, + "step": 517260 + }, + { + "epoch": 1.34, + "learning_rate": 9.887423175324859e-05, + "loss": 0.007, + "step": 517270 + }, + { + "epoch": 1.34, + "learning_rate": 9.887034353687713e-05, + "loss": 0.01, + "step": 517280 + }, + { + "epoch": 1.34, + "learning_rate": 9.886645532050566e-05, + "loss": 0.0082, + "step": 517290 + }, + { + "epoch": 1.34, + "learning_rate": 9.88625671041342e-05, + "loss": 0.0095, + "step": 517300 + }, + { + "epoch": 1.34, + "learning_rate": 9.885867888776273e-05, + "loss": 0.0114, + "step": 517310 + }, + { + "epoch": 1.34, + "learning_rate": 9.885479067139126e-05, + "loss": 0.0107, + "step": 517320 + }, + { + "epoch": 1.34, + "learning_rate": 9.885090245501982e-05, + "loss": 0.0066, + "step": 517330 + }, + { + "epoch": 1.34, + "learning_rate": 9.884701423864833e-05, + "loss": 0.0081, + "step": 517340 + }, + { + "epoch": 1.34, + "learning_rate": 9.884312602227689e-05, + "loss": 0.0115, + "step": 517350 + }, + { + "epoch": 1.34, + "learning_rate": 9.883923780590541e-05, + "loss": 0.0106, + "step": 517360 + }, + { + "epoch": 1.34, + "learning_rate": 9.883534958953396e-05, + "loss": 0.0076, + "step": 517370 + }, + { + "epoch": 1.34, + "learning_rate": 9.883146137316248e-05, + "loss": 0.0121, + "step": 517380 + }, + { + "epoch": 1.34, + "learning_rate": 9.882757315679102e-05, + "loss": 0.0072, + "step": 517390 + }, + { + "epoch": 1.34, + "learning_rate": 9.882368494041955e-05, + "loss": 0.0079, + "step": 517400 + }, + { + "epoch": 1.34, + "learning_rate": 9.88197967240481e-05, + "loss": 0.0096, + "step": 517410 + }, + { + "epoch": 1.34, + "learning_rate": 9.881590850767662e-05, + "loss": 0.0124, + "step": 517420 + }, + { + "epoch": 1.34, + "learning_rate": 9.881202029130516e-05, + "loss": 0.0102, + "step": 517430 + }, + { + "epoch": 1.34, + "learning_rate": 9.880813207493369e-05, + "loss": 0.0091, + "step": 517440 + }, + { + "epoch": 1.34, + "learning_rate": 9.880424385856223e-05, + "loss": 0.0138, + "step": 517450 + }, + { + "epoch": 1.34, + "learning_rate": 9.880035564219076e-05, + "loss": 0.0085, + "step": 517460 + }, + { + "epoch": 1.34, + "learning_rate": 9.87964674258193e-05, + "loss": 0.0147, + "step": 517470 + }, + { + "epoch": 1.34, + "learning_rate": 9.879257920944783e-05, + "loss": 0.0095, + "step": 517480 + }, + { + "epoch": 1.34, + "learning_rate": 9.878869099307639e-05, + "loss": 0.0118, + "step": 517490 + }, + { + "epoch": 1.34, + "learning_rate": 9.87848027767049e-05, + "loss": 0.0103, + "step": 517500 + }, + { + "epoch": 1.34, + "learning_rate": 9.878091456033346e-05, + "loss": 0.0098, + "step": 517510 + }, + { + "epoch": 1.34, + "learning_rate": 9.877702634396198e-05, + "loss": 0.0099, + "step": 517520 + }, + { + "epoch": 1.34, + "learning_rate": 9.877313812759053e-05, + "loss": 0.0074, + "step": 517530 + }, + { + "epoch": 1.34, + "learning_rate": 9.876924991121905e-05, + "loss": 0.0108, + "step": 517540 + }, + { + "epoch": 1.34, + "learning_rate": 9.87653616948476e-05, + "loss": 0.0108, + "step": 517550 + }, + { + "epoch": 1.34, + "learning_rate": 9.876147347847612e-05, + "loss": 0.0116, + "step": 517560 + }, + { + "epoch": 1.34, + "learning_rate": 9.875758526210465e-05, + "loss": 0.0127, + "step": 517570 + }, + { + "epoch": 1.34, + "learning_rate": 9.87536970457332e-05, + "loss": 0.0108, + "step": 517580 + }, + { + "epoch": 1.34, + "learning_rate": 9.874980882936172e-05, + "loss": 0.0078, + "step": 517590 + }, + { + "epoch": 1.34, + "learning_rate": 9.874592061299026e-05, + "loss": 0.0098, + "step": 517600 + }, + { + "epoch": 1.34, + "learning_rate": 9.874203239661879e-05, + "loss": 0.0096, + "step": 517610 + }, + { + "epoch": 1.34, + "learning_rate": 9.873814418024733e-05, + "loss": 0.0107, + "step": 517620 + }, + { + "epoch": 1.34, + "learning_rate": 9.873425596387586e-05, + "loss": 0.0099, + "step": 517630 + }, + { + "epoch": 1.34, + "learning_rate": 9.87303677475044e-05, + "loss": 0.0103, + "step": 517640 + }, + { + "epoch": 1.34, + "learning_rate": 9.872647953113293e-05, + "loss": 0.0084, + "step": 517650 + }, + { + "epoch": 1.34, + "learning_rate": 9.872259131476147e-05, + "loss": 0.0122, + "step": 517660 + }, + { + "epoch": 1.34, + "learning_rate": 9.871870309839e-05, + "loss": 0.0086, + "step": 517670 + }, + { + "epoch": 1.34, + "learning_rate": 9.871481488201856e-05, + "loss": 0.0117, + "step": 517680 + }, + { + "epoch": 1.34, + "learning_rate": 9.871092666564708e-05, + "loss": 0.0126, + "step": 517690 + }, + { + "epoch": 1.34, + "learning_rate": 9.870703844927563e-05, + "loss": 0.012, + "step": 517700 + }, + { + "epoch": 1.34, + "learning_rate": 9.870315023290415e-05, + "loss": 0.0079, + "step": 517710 + }, + { + "epoch": 1.34, + "learning_rate": 9.86992620165327e-05, + "loss": 0.0092, + "step": 517720 + }, + { + "epoch": 1.34, + "learning_rate": 9.869537380016122e-05, + "loss": 0.0164, + "step": 517730 + }, + { + "epoch": 1.34, + "learning_rate": 9.869148558378977e-05, + "loss": 0.0112, + "step": 517740 + }, + { + "epoch": 1.34, + "learning_rate": 9.86875973674183e-05, + "loss": 0.0116, + "step": 517750 + }, + { + "epoch": 1.34, + "learning_rate": 9.868370915104683e-05, + "loss": 0.0131, + "step": 517760 + }, + { + "epoch": 1.34, + "learning_rate": 9.867982093467536e-05, + "loss": 0.0122, + "step": 517770 + }, + { + "epoch": 1.34, + "learning_rate": 9.86759327183039e-05, + "loss": 0.01, + "step": 517780 + }, + { + "epoch": 1.34, + "learning_rate": 9.867204450193243e-05, + "loss": 0.0109, + "step": 517790 + }, + { + "epoch": 1.34, + "learning_rate": 9.866815628556096e-05, + "loss": 0.0118, + "step": 517800 + }, + { + "epoch": 1.34, + "learning_rate": 9.86642680691895e-05, + "loss": 0.01, + "step": 517810 + }, + { + "epoch": 1.34, + "learning_rate": 9.866037985281803e-05, + "loss": 0.0111, + "step": 517820 + }, + { + "epoch": 1.34, + "learning_rate": 9.865649163644657e-05, + "loss": 0.009, + "step": 517830 + }, + { + "epoch": 1.34, + "learning_rate": 9.86526034200751e-05, + "loss": 0.0122, + "step": 517840 + }, + { + "epoch": 1.34, + "learning_rate": 9.864871520370366e-05, + "loss": 0.0102, + "step": 517850 + }, + { + "epoch": 1.34, + "learning_rate": 9.864482698733217e-05, + "loss": 0.0106, + "step": 517860 + }, + { + "epoch": 1.34, + "learning_rate": 9.864093877096073e-05, + "loss": 0.0078, + "step": 517870 + }, + { + "epoch": 1.34, + "learning_rate": 9.863705055458925e-05, + "loss": 0.0088, + "step": 517880 + }, + { + "epoch": 1.34, + "learning_rate": 9.86331623382178e-05, + "loss": 0.009, + "step": 517890 + }, + { + "epoch": 1.34, + "learning_rate": 9.862927412184632e-05, + "loss": 0.0094, + "step": 517900 + }, + { + "epoch": 1.34, + "learning_rate": 9.862538590547486e-05, + "loss": 0.0099, + "step": 517910 + }, + { + "epoch": 1.34, + "learning_rate": 9.862149768910339e-05, + "loss": 0.012, + "step": 517920 + }, + { + "epoch": 1.34, + "learning_rate": 9.861760947273193e-05, + "loss": 0.0073, + "step": 517930 + }, + { + "epoch": 1.34, + "learning_rate": 9.861372125636046e-05, + "loss": 0.0121, + "step": 517940 + }, + { + "epoch": 1.34, + "learning_rate": 9.8609833039989e-05, + "loss": 0.008, + "step": 517950 + }, + { + "epoch": 1.34, + "learning_rate": 9.860594482361753e-05, + "loss": 0.0097, + "step": 517960 + }, + { + "epoch": 1.34, + "learning_rate": 9.860205660724607e-05, + "loss": 0.0108, + "step": 517970 + }, + { + "epoch": 1.34, + "learning_rate": 9.85981683908746e-05, + "loss": 0.0088, + "step": 517980 + }, + { + "epoch": 1.34, + "learning_rate": 9.859428017450314e-05, + "loss": 0.0128, + "step": 517990 + }, + { + "epoch": 1.34, + "learning_rate": 9.859039195813167e-05, + "loss": 0.0113, + "step": 518000 + }, + { + "epoch": 1.34, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.006467238999903202, + "eval_runtime": 107.9416, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 518000 + }, + { + "epoch": 1.34, + "learning_rate": 9.858650374176021e-05, + "loss": 0.0113, + "step": 518010 + }, + { + "epoch": 1.34, + "learning_rate": 9.858261552538874e-05, + "loss": 0.0135, + "step": 518020 + }, + { + "epoch": 1.34, + "learning_rate": 9.85787273090173e-05, + "loss": 0.0081, + "step": 518030 + }, + { + "epoch": 1.34, + "learning_rate": 9.857483909264582e-05, + "loss": 0.0122, + "step": 518040 + }, + { + "epoch": 1.34, + "learning_rate": 9.857095087627435e-05, + "loss": 0.011, + "step": 518050 + }, + { + "epoch": 1.34, + "learning_rate": 9.85670626599029e-05, + "loss": 0.0107, + "step": 518060 + }, + { + "epoch": 1.34, + "learning_rate": 9.856317444353142e-05, + "loss": 0.0103, + "step": 518070 + }, + { + "epoch": 1.34, + "learning_rate": 9.855928622715996e-05, + "loss": 0.0098, + "step": 518080 + }, + { + "epoch": 1.34, + "learning_rate": 9.855539801078849e-05, + "loss": 0.0121, + "step": 518090 + }, + { + "epoch": 1.34, + "learning_rate": 9.855150979441703e-05, + "loss": 0.0102, + "step": 518100 + }, + { + "epoch": 1.34, + "learning_rate": 9.854762157804556e-05, + "loss": 0.0097, + "step": 518110 + }, + { + "epoch": 1.34, + "learning_rate": 9.85437333616741e-05, + "loss": 0.0106, + "step": 518120 + }, + { + "epoch": 1.34, + "learning_rate": 9.853984514530263e-05, + "loss": 0.0102, + "step": 518130 + }, + { + "epoch": 1.34, + "learning_rate": 9.853595692893117e-05, + "loss": 0.0129, + "step": 518140 + }, + { + "epoch": 1.34, + "learning_rate": 9.85320687125597e-05, + "loss": 0.0076, + "step": 518150 + }, + { + "epoch": 1.34, + "learning_rate": 9.852818049618824e-05, + "loss": 0.0158, + "step": 518160 + }, + { + "epoch": 1.34, + "learning_rate": 9.852429227981677e-05, + "loss": 0.0094, + "step": 518170 + }, + { + "epoch": 1.34, + "learning_rate": 9.852040406344531e-05, + "loss": 0.0085, + "step": 518180 + }, + { + "epoch": 1.34, + "learning_rate": 9.851651584707384e-05, + "loss": 0.0121, + "step": 518190 + }, + { + "epoch": 1.34, + "learning_rate": 9.85126276307024e-05, + "loss": 0.0089, + "step": 518200 + }, + { + "epoch": 1.34, + "learning_rate": 9.850873941433091e-05, + "loss": 0.0101, + "step": 518210 + }, + { + "epoch": 1.34, + "learning_rate": 9.850485119795947e-05, + "loss": 0.0095, + "step": 518220 + }, + { + "epoch": 1.34, + "learning_rate": 9.8500962981588e-05, + "loss": 0.01, + "step": 518230 + }, + { + "epoch": 1.34, + "learning_rate": 9.849707476521654e-05, + "loss": 0.0103, + "step": 518240 + }, + { + "epoch": 1.34, + "learning_rate": 9.849318654884506e-05, + "loss": 0.008, + "step": 518250 + }, + { + "epoch": 1.34, + "learning_rate": 9.84892983324736e-05, + "loss": 0.0095, + "step": 518260 + }, + { + "epoch": 1.34, + "learning_rate": 9.848541011610213e-05, + "loss": 0.0078, + "step": 518270 + }, + { + "epoch": 1.34, + "learning_rate": 9.848152189973067e-05, + "loss": 0.0094, + "step": 518280 + }, + { + "epoch": 1.34, + "learning_rate": 9.84776336833592e-05, + "loss": 0.0123, + "step": 518290 + }, + { + "epoch": 1.34, + "learning_rate": 9.847374546698773e-05, + "loss": 0.0104, + "step": 518300 + }, + { + "epoch": 1.34, + "learning_rate": 9.846985725061627e-05, + "loss": 0.0092, + "step": 518310 + }, + { + "epoch": 1.34, + "learning_rate": 9.84659690342448e-05, + "loss": 0.0086, + "step": 518320 + }, + { + "epoch": 1.34, + "learning_rate": 9.846208081787334e-05, + "loss": 0.0101, + "step": 518330 + }, + { + "epoch": 1.34, + "learning_rate": 9.845819260150187e-05, + "loss": 0.0088, + "step": 518340 + }, + { + "epoch": 1.34, + "learning_rate": 9.845430438513041e-05, + "loss": 0.0089, + "step": 518350 + }, + { + "epoch": 1.34, + "learning_rate": 9.845041616875894e-05, + "loss": 0.0108, + "step": 518360 + }, + { + "epoch": 1.34, + "learning_rate": 9.844652795238748e-05, + "loss": 0.0078, + "step": 518370 + }, + { + "epoch": 1.34, + "learning_rate": 9.844263973601601e-05, + "loss": 0.008, + "step": 518380 + }, + { + "epoch": 1.34, + "learning_rate": 9.843875151964457e-05, + "loss": 0.0106, + "step": 518390 + }, + { + "epoch": 1.34, + "learning_rate": 9.843486330327309e-05, + "loss": 0.0109, + "step": 518400 + }, + { + "epoch": 1.34, + "learning_rate": 9.843097508690163e-05, + "loss": 0.0098, + "step": 518410 + }, + { + "epoch": 1.34, + "learning_rate": 9.842708687053016e-05, + "loss": 0.0114, + "step": 518420 + }, + { + "epoch": 1.34, + "learning_rate": 9.84231986541587e-05, + "loss": 0.0116, + "step": 518430 + }, + { + "epoch": 1.34, + "learning_rate": 9.841931043778723e-05, + "loss": 0.0081, + "step": 518440 + }, + { + "epoch": 1.34, + "learning_rate": 9.841542222141577e-05, + "loss": 0.0111, + "step": 518450 + }, + { + "epoch": 1.34, + "learning_rate": 9.84115340050443e-05, + "loss": 0.0094, + "step": 518460 + }, + { + "epoch": 1.34, + "learning_rate": 9.840764578867284e-05, + "loss": 0.0109, + "step": 518470 + }, + { + "epoch": 1.34, + "learning_rate": 9.840375757230137e-05, + "loss": 0.0078, + "step": 518480 + }, + { + "epoch": 1.34, + "learning_rate": 9.839986935592991e-05, + "loss": 0.0104, + "step": 518490 + }, + { + "epoch": 1.34, + "learning_rate": 9.839598113955844e-05, + "loss": 0.0109, + "step": 518500 + }, + { + "epoch": 1.34, + "learning_rate": 9.839209292318698e-05, + "loss": 0.0106, + "step": 518510 + }, + { + "epoch": 1.34, + "learning_rate": 9.838820470681551e-05, + "loss": 0.0135, + "step": 518520 + }, + { + "epoch": 1.34, + "learning_rate": 9.838431649044405e-05, + "loss": 0.0077, + "step": 518530 + }, + { + "epoch": 1.34, + "learning_rate": 9.838042827407258e-05, + "loss": 0.0082, + "step": 518540 + }, + { + "epoch": 1.34, + "learning_rate": 9.837654005770111e-05, + "loss": 0.0086, + "step": 518550 + }, + { + "epoch": 1.34, + "learning_rate": 9.837265184132966e-05, + "loss": 0.0115, + "step": 518560 + }, + { + "epoch": 1.34, + "learning_rate": 9.836876362495818e-05, + "loss": 0.0111, + "step": 518570 + }, + { + "epoch": 1.34, + "learning_rate": 9.836487540858673e-05, + "loss": 0.0096, + "step": 518580 + }, + { + "epoch": 1.34, + "learning_rate": 9.836098719221526e-05, + "loss": 0.011, + "step": 518590 + }, + { + "epoch": 1.34, + "learning_rate": 9.83570989758438e-05, + "loss": 0.01, + "step": 518600 + }, + { + "epoch": 1.34, + "learning_rate": 9.835321075947233e-05, + "loss": 0.0119, + "step": 518610 + }, + { + "epoch": 1.34, + "learning_rate": 9.834932254310087e-05, + "loss": 0.0109, + "step": 518620 + }, + { + "epoch": 1.34, + "learning_rate": 9.83454343267294e-05, + "loss": 0.0103, + "step": 518630 + }, + { + "epoch": 1.34, + "learning_rate": 9.834154611035794e-05, + "loss": 0.0084, + "step": 518640 + }, + { + "epoch": 1.34, + "learning_rate": 9.833765789398647e-05, + "loss": 0.0097, + "step": 518650 + }, + { + "epoch": 1.34, + "learning_rate": 9.833376967761501e-05, + "loss": 0.0097, + "step": 518660 + }, + { + "epoch": 1.34, + "learning_rate": 9.832988146124354e-05, + "loss": 0.0106, + "step": 518670 + }, + { + "epoch": 1.34, + "learning_rate": 9.832599324487208e-05, + "loss": 0.0089, + "step": 518680 + }, + { + "epoch": 1.34, + "learning_rate": 9.832210502850061e-05, + "loss": 0.0067, + "step": 518690 + }, + { + "epoch": 1.34, + "learning_rate": 9.831821681212915e-05, + "loss": 0.0171, + "step": 518700 + }, + { + "epoch": 1.34, + "learning_rate": 9.831432859575768e-05, + "loss": 0.009, + "step": 518710 + }, + { + "epoch": 1.34, + "learning_rate": 9.831044037938624e-05, + "loss": 0.0085, + "step": 518720 + }, + { + "epoch": 1.34, + "learning_rate": 9.830655216301475e-05, + "loss": 0.008, + "step": 518730 + }, + { + "epoch": 1.34, + "learning_rate": 9.83026639466433e-05, + "loss": 0.0117, + "step": 518740 + }, + { + "epoch": 1.34, + "learning_rate": 9.829877573027183e-05, + "loss": 0.009, + "step": 518750 + }, + { + "epoch": 1.34, + "learning_rate": 9.829488751390038e-05, + "loss": 0.0096, + "step": 518760 + }, + { + "epoch": 1.34, + "learning_rate": 9.82909992975289e-05, + "loss": 0.0096, + "step": 518770 + }, + { + "epoch": 1.34, + "learning_rate": 9.828711108115745e-05, + "loss": 0.0144, + "step": 518780 + }, + { + "epoch": 1.34, + "learning_rate": 9.828322286478597e-05, + "loss": 0.0083, + "step": 518790 + }, + { + "epoch": 1.34, + "learning_rate": 9.82793346484145e-05, + "loss": 0.0094, + "step": 518800 + }, + { + "epoch": 1.34, + "learning_rate": 9.827544643204304e-05, + "loss": 0.0092, + "step": 518810 + }, + { + "epoch": 1.34, + "learning_rate": 9.827155821567157e-05, + "loss": 0.0111, + "step": 518820 + }, + { + "epoch": 1.34, + "learning_rate": 9.826766999930011e-05, + "loss": 0.0095, + "step": 518830 + }, + { + "epoch": 1.34, + "learning_rate": 9.826378178292864e-05, + "loss": 0.0103, + "step": 518840 + }, + { + "epoch": 1.34, + "learning_rate": 9.825989356655718e-05, + "loss": 0.0122, + "step": 518850 + }, + { + "epoch": 1.34, + "learning_rate": 9.825600535018571e-05, + "loss": 0.0109, + "step": 518860 + }, + { + "epoch": 1.34, + "learning_rate": 9.825211713381425e-05, + "loss": 0.0092, + "step": 518870 + }, + { + "epoch": 1.35, + "learning_rate": 9.824822891744278e-05, + "loss": 0.0108, + "step": 518880 + }, + { + "epoch": 1.35, + "learning_rate": 9.824434070107132e-05, + "loss": 0.0084, + "step": 518890 + }, + { + "epoch": 1.35, + "learning_rate": 9.824045248469985e-05, + "loss": 0.0088, + "step": 518900 + }, + { + "epoch": 1.35, + "learning_rate": 9.82365642683284e-05, + "loss": 0.008, + "step": 518910 + }, + { + "epoch": 1.35, + "learning_rate": 9.823267605195693e-05, + "loss": 0.0096, + "step": 518920 + }, + { + "epoch": 1.35, + "learning_rate": 9.822878783558547e-05, + "loss": 0.0074, + "step": 518930 + }, + { + "epoch": 1.35, + "learning_rate": 9.8224899619214e-05, + "loss": 0.0094, + "step": 518940 + }, + { + "epoch": 1.35, + "learning_rate": 9.822101140284254e-05, + "loss": 0.0101, + "step": 518950 + }, + { + "epoch": 1.35, + "learning_rate": 9.821712318647107e-05, + "loss": 0.007, + "step": 518960 + }, + { + "epoch": 1.35, + "learning_rate": 9.821323497009961e-05, + "loss": 0.0115, + "step": 518970 + }, + { + "epoch": 1.35, + "learning_rate": 9.820934675372814e-05, + "loss": 0.0089, + "step": 518980 + }, + { + "epoch": 1.35, + "learning_rate": 9.820545853735668e-05, + "loss": 0.0079, + "step": 518990 + }, + { + "epoch": 1.35, + "learning_rate": 9.820157032098521e-05, + "loss": 0.0079, + "step": 519000 + }, + { + "epoch": 1.35, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.006426098756492138, + "eval_runtime": 107.8933, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 519000 + }, + { + "epoch": 1.35, + "learning_rate": 9.819768210461375e-05, + "loss": 0.0138, + "step": 519010 + }, + { + "epoch": 1.35, + "learning_rate": 9.819379388824228e-05, + "loss": 0.009, + "step": 519020 + }, + { + "epoch": 1.35, + "learning_rate": 9.818990567187082e-05, + "loss": 0.0089, + "step": 519030 + }, + { + "epoch": 1.35, + "learning_rate": 9.818601745549935e-05, + "loss": 0.0121, + "step": 519040 + }, + { + "epoch": 1.35, + "learning_rate": 9.818212923912788e-05, + "loss": 0.0104, + "step": 519050 + }, + { + "epoch": 1.35, + "learning_rate": 9.817824102275642e-05, + "loss": 0.011, + "step": 519060 + }, + { + "epoch": 1.35, + "learning_rate": 9.817435280638495e-05, + "loss": 0.0119, + "step": 519070 + }, + { + "epoch": 1.35, + "learning_rate": 9.81704645900135e-05, + "loss": 0.0111, + "step": 519080 + }, + { + "epoch": 1.35, + "learning_rate": 9.816657637364202e-05, + "loss": 0.011, + "step": 519090 + }, + { + "epoch": 1.35, + "learning_rate": 9.816268815727057e-05, + "loss": 0.0089, + "step": 519100 + }, + { + "epoch": 1.35, + "learning_rate": 9.81587999408991e-05, + "loss": 0.0106, + "step": 519110 + }, + { + "epoch": 1.35, + "learning_rate": 9.815491172452764e-05, + "loss": 0.0093, + "step": 519120 + }, + { + "epoch": 1.35, + "learning_rate": 9.815102350815617e-05, + "loss": 0.009, + "step": 519130 + }, + { + "epoch": 1.35, + "learning_rate": 9.814713529178471e-05, + "loss": 0.012, + "step": 519140 + }, + { + "epoch": 1.35, + "learning_rate": 9.814324707541324e-05, + "loss": 0.009, + "step": 519150 + }, + { + "epoch": 1.35, + "learning_rate": 9.813935885904178e-05, + "loss": 0.0102, + "step": 519160 + }, + { + "epoch": 1.35, + "learning_rate": 9.813547064267031e-05, + "loss": 0.0091, + "step": 519170 + }, + { + "epoch": 1.35, + "learning_rate": 9.813158242629885e-05, + "loss": 0.0075, + "step": 519180 + }, + { + "epoch": 1.35, + "learning_rate": 9.812769420992738e-05, + "loss": 0.0093, + "step": 519190 + }, + { + "epoch": 1.35, + "learning_rate": 9.812380599355592e-05, + "loss": 0.007, + "step": 519200 + }, + { + "epoch": 1.35, + "learning_rate": 9.811991777718445e-05, + "loss": 0.0117, + "step": 519210 + }, + { + "epoch": 1.35, + "learning_rate": 9.811602956081299e-05, + "loss": 0.0102, + "step": 519220 + }, + { + "epoch": 1.35, + "learning_rate": 9.811214134444152e-05, + "loss": 0.0105, + "step": 519230 + }, + { + "epoch": 1.35, + "learning_rate": 9.810825312807006e-05, + "loss": 0.0101, + "step": 519240 + }, + { + "epoch": 1.35, + "learning_rate": 9.810436491169859e-05, + "loss": 0.0098, + "step": 519250 + }, + { + "epoch": 1.35, + "learning_rate": 9.810047669532715e-05, + "loss": 0.008, + "step": 519260 + }, + { + "epoch": 1.35, + "learning_rate": 9.809658847895567e-05, + "loss": 0.0105, + "step": 519270 + }, + { + "epoch": 1.35, + "learning_rate": 9.809270026258422e-05, + "loss": 0.0168, + "step": 519280 + }, + { + "epoch": 1.35, + "learning_rate": 9.808881204621274e-05, + "loss": 0.0081, + "step": 519290 + }, + { + "epoch": 1.35, + "learning_rate": 9.808492382984127e-05, + "loss": 0.0077, + "step": 519300 + }, + { + "epoch": 1.35, + "learning_rate": 9.808103561346981e-05, + "loss": 0.0102, + "step": 519310 + }, + { + "epoch": 1.35, + "learning_rate": 9.807714739709834e-05, + "loss": 0.0109, + "step": 519320 + }, + { + "epoch": 1.35, + "learning_rate": 9.807325918072688e-05, + "loss": 0.0129, + "step": 519330 + }, + { + "epoch": 1.35, + "learning_rate": 9.806937096435541e-05, + "loss": 0.0086, + "step": 519340 + }, + { + "epoch": 1.35, + "learning_rate": 9.806548274798395e-05, + "loss": 0.0082, + "step": 519350 + }, + { + "epoch": 1.35, + "learning_rate": 9.806159453161248e-05, + "loss": 0.0153, + "step": 519360 + }, + { + "epoch": 1.35, + "learning_rate": 9.805770631524102e-05, + "loss": 0.0123, + "step": 519370 + }, + { + "epoch": 1.35, + "learning_rate": 9.805381809886955e-05, + "loss": 0.0121, + "step": 519380 + }, + { + "epoch": 1.35, + "learning_rate": 9.804992988249809e-05, + "loss": 0.0096, + "step": 519390 + }, + { + "epoch": 1.35, + "learning_rate": 9.804604166612662e-05, + "loss": 0.0172, + "step": 519400 + }, + { + "epoch": 1.35, + "learning_rate": 9.804215344975516e-05, + "loss": 0.0087, + "step": 519410 + }, + { + "epoch": 1.35, + "learning_rate": 9.803826523338369e-05, + "loss": 0.008, + "step": 519420 + }, + { + "epoch": 1.35, + "learning_rate": 9.803437701701224e-05, + "loss": 0.0106, + "step": 519430 + }, + { + "epoch": 1.35, + "learning_rate": 9.803048880064077e-05, + "loss": 0.0098, + "step": 519440 + }, + { + "epoch": 1.35, + "learning_rate": 9.802660058426931e-05, + "loss": 0.0085, + "step": 519450 + }, + { + "epoch": 1.35, + "learning_rate": 9.802271236789784e-05, + "loss": 0.0095, + "step": 519460 + }, + { + "epoch": 1.35, + "learning_rate": 9.801882415152638e-05, + "loss": 0.0082, + "step": 519470 + }, + { + "epoch": 1.35, + "learning_rate": 9.801493593515491e-05, + "loss": 0.0106, + "step": 519480 + }, + { + "epoch": 1.35, + "learning_rate": 9.801104771878345e-05, + "loss": 0.0109, + "step": 519490 + }, + { + "epoch": 1.35, + "learning_rate": 9.800715950241198e-05, + "loss": 0.0091, + "step": 519500 + }, + { + "epoch": 1.35, + "learning_rate": 9.800327128604052e-05, + "loss": 0.011, + "step": 519510 + }, + { + "epoch": 1.35, + "learning_rate": 9.799938306966905e-05, + "loss": 0.0092, + "step": 519520 + }, + { + "epoch": 1.35, + "learning_rate": 9.79954948532976e-05, + "loss": 0.0105, + "step": 519530 + }, + { + "epoch": 1.35, + "learning_rate": 9.799160663692612e-05, + "loss": 0.009, + "step": 519540 + }, + { + "epoch": 1.35, + "learning_rate": 9.798771842055465e-05, + "loss": 0.0091, + "step": 519550 + }, + { + "epoch": 1.35, + "learning_rate": 9.798383020418319e-05, + "loss": 0.0098, + "step": 519560 + }, + { + "epoch": 1.35, + "learning_rate": 9.797994198781172e-05, + "loss": 0.0095, + "step": 519570 + }, + { + "epoch": 1.35, + "learning_rate": 9.797605377144026e-05, + "loss": 0.0077, + "step": 519580 + }, + { + "epoch": 1.35, + "learning_rate": 9.797216555506879e-05, + "loss": 0.0119, + "step": 519590 + }, + { + "epoch": 1.35, + "learning_rate": 9.796827733869733e-05, + "loss": 0.0092, + "step": 519600 + }, + { + "epoch": 1.35, + "learning_rate": 9.796438912232586e-05, + "loss": 0.0095, + "step": 519610 + }, + { + "epoch": 1.35, + "learning_rate": 9.796050090595441e-05, + "loss": 0.0101, + "step": 519620 + }, + { + "epoch": 1.35, + "learning_rate": 9.795661268958294e-05, + "loss": 0.0078, + "step": 519630 + }, + { + "epoch": 1.35, + "learning_rate": 9.795272447321148e-05, + "loss": 0.0092, + "step": 519640 + }, + { + "epoch": 1.35, + "learning_rate": 9.794883625684001e-05, + "loss": 0.0116, + "step": 519650 + }, + { + "epoch": 1.35, + "learning_rate": 9.794494804046855e-05, + "loss": 0.0084, + "step": 519660 + }, + { + "epoch": 1.35, + "learning_rate": 9.794105982409708e-05, + "loss": 0.0109, + "step": 519670 + }, + { + "epoch": 1.35, + "learning_rate": 9.793717160772562e-05, + "loss": 0.0109, + "step": 519680 + }, + { + "epoch": 1.35, + "learning_rate": 9.793328339135415e-05, + "loss": 0.0097, + "step": 519690 + }, + { + "epoch": 1.35, + "learning_rate": 9.792939517498269e-05, + "loss": 0.0077, + "step": 519700 + }, + { + "epoch": 1.35, + "learning_rate": 9.792550695861122e-05, + "loss": 0.0069, + "step": 519710 + }, + { + "epoch": 1.35, + "learning_rate": 9.792161874223976e-05, + "loss": 0.0086, + "step": 519720 + }, + { + "epoch": 1.35, + "learning_rate": 9.791773052586829e-05, + "loss": 0.0081, + "step": 519730 + }, + { + "epoch": 1.35, + "learning_rate": 9.791384230949683e-05, + "loss": 0.0088, + "step": 519740 + }, + { + "epoch": 1.35, + "learning_rate": 9.790995409312536e-05, + "loss": 0.0141, + "step": 519750 + }, + { + "epoch": 1.35, + "learning_rate": 9.79060658767539e-05, + "loss": 0.012, + "step": 519760 + }, + { + "epoch": 1.35, + "learning_rate": 9.790217766038243e-05, + "loss": 0.0116, + "step": 519770 + }, + { + "epoch": 1.35, + "learning_rate": 9.789828944401099e-05, + "loss": 0.0154, + "step": 519780 + }, + { + "epoch": 1.35, + "learning_rate": 9.789440122763951e-05, + "loss": 0.0173, + "step": 519790 + }, + { + "epoch": 1.35, + "learning_rate": 9.789051301126803e-05, + "loss": 0.007, + "step": 519800 + }, + { + "epoch": 1.35, + "learning_rate": 9.788662479489658e-05, + "loss": 0.0111, + "step": 519810 + }, + { + "epoch": 1.35, + "learning_rate": 9.788273657852511e-05, + "loss": 0.0131, + "step": 519820 + }, + { + "epoch": 1.35, + "learning_rate": 9.787884836215365e-05, + "loss": 0.0147, + "step": 519830 + }, + { + "epoch": 1.35, + "learning_rate": 9.787496014578218e-05, + "loss": 0.0087, + "step": 519840 + }, + { + "epoch": 1.35, + "learning_rate": 9.787107192941072e-05, + "loss": 0.0107, + "step": 519850 + }, + { + "epoch": 1.35, + "learning_rate": 9.786718371303925e-05, + "loss": 0.011, + "step": 519860 + }, + { + "epoch": 1.35, + "learning_rate": 9.786329549666779e-05, + "loss": 0.0113, + "step": 519870 + }, + { + "epoch": 1.35, + "learning_rate": 9.785940728029632e-05, + "loss": 0.0097, + "step": 519880 + }, + { + "epoch": 1.35, + "learning_rate": 9.785551906392486e-05, + "loss": 0.0094, + "step": 519890 + }, + { + "epoch": 1.35, + "learning_rate": 9.785163084755339e-05, + "loss": 0.0147, + "step": 519900 + }, + { + "epoch": 1.35, + "learning_rate": 9.784774263118193e-05, + "loss": 0.0102, + "step": 519910 + }, + { + "epoch": 1.35, + "learning_rate": 9.784385441481046e-05, + "loss": 0.0115, + "step": 519920 + }, + { + "epoch": 1.35, + "learning_rate": 9.7839966198439e-05, + "loss": 0.0086, + "step": 519930 + }, + { + "epoch": 1.35, + "learning_rate": 9.783607798206753e-05, + "loss": 0.0102, + "step": 519940 + }, + { + "epoch": 1.35, + "learning_rate": 9.783218976569608e-05, + "loss": 0.009, + "step": 519950 + }, + { + "epoch": 1.35, + "learning_rate": 9.78283015493246e-05, + "loss": 0.0099, + "step": 519960 + }, + { + "epoch": 1.35, + "learning_rate": 9.782441333295315e-05, + "loss": 0.0102, + "step": 519970 + }, + { + "epoch": 1.35, + "learning_rate": 9.782052511658168e-05, + "loss": 0.0092, + "step": 519980 + }, + { + "epoch": 1.35, + "learning_rate": 9.781663690021022e-05, + "loss": 0.0107, + "step": 519990 + }, + { + "epoch": 1.35, + "learning_rate": 9.781274868383875e-05, + "loss": 0.0105, + "step": 520000 + }, + { + "epoch": 1.35, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.006626142654567957, + "eval_runtime": 107.8646, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, + "step": 520000 + }, + { + "epoch": 1.35, + "learning_rate": 9.78088604674673e-05, + "loss": 0.0113, + "step": 520010 + }, + { + "epoch": 1.35, + "learning_rate": 9.780497225109582e-05, + "loss": 0.0097, + "step": 520020 + }, + { + "epoch": 1.35, + "learning_rate": 9.780108403472436e-05, + "loss": 0.0088, + "step": 520030 + }, + { + "epoch": 1.35, + "learning_rate": 9.779719581835289e-05, + "loss": 0.0105, + "step": 520040 + }, + { + "epoch": 1.35, + "learning_rate": 9.779330760198142e-05, + "loss": 0.0097, + "step": 520050 + }, + { + "epoch": 1.35, + "learning_rate": 9.778941938560996e-05, + "loss": 0.0105, + "step": 520060 + }, + { + "epoch": 1.35, + "learning_rate": 9.778553116923849e-05, + "loss": 0.0084, + "step": 520070 + }, + { + "epoch": 1.35, + "learning_rate": 9.778164295286703e-05, + "loss": 0.0079, + "step": 520080 + }, + { + "epoch": 1.35, + "learning_rate": 9.777775473649556e-05, + "loss": 0.0233, + "step": 520090 + }, + { + "epoch": 1.35, + "learning_rate": 9.77738665201241e-05, + "loss": 0.0116, + "step": 520100 + }, + { + "epoch": 1.35, + "learning_rate": 9.776997830375263e-05, + "loss": 0.0131, + "step": 520110 + }, + { + "epoch": 1.35, + "learning_rate": 9.776609008738117e-05, + "loss": 0.0085, + "step": 520120 + }, + { + "epoch": 1.35, + "learning_rate": 9.77622018710097e-05, + "loss": 0.0087, + "step": 520130 + }, + { + "epoch": 1.35, + "learning_rate": 9.775831365463825e-05, + "loss": 0.0073, + "step": 520140 + }, + { + "epoch": 1.35, + "learning_rate": 9.775442543826678e-05, + "loss": 0.0085, + "step": 520150 + }, + { + "epoch": 1.35, + "learning_rate": 9.775053722189532e-05, + "loss": 0.016, + "step": 520160 + }, + { + "epoch": 1.35, + "learning_rate": 9.774664900552385e-05, + "loss": 0.012, + "step": 520170 + }, + { + "epoch": 1.35, + "learning_rate": 9.77427607891524e-05, + "loss": 0.0075, + "step": 520180 + }, + { + "epoch": 1.35, + "learning_rate": 9.773887257278092e-05, + "loss": 0.0087, + "step": 520190 + }, + { + "epoch": 1.35, + "learning_rate": 9.773498435640946e-05, + "loss": 0.0081, + "step": 520200 + }, + { + "epoch": 1.35, + "learning_rate": 9.773109614003799e-05, + "loss": 0.0134, + "step": 520210 + }, + { + "epoch": 1.35, + "learning_rate": 9.772720792366653e-05, + "loss": 0.0082, + "step": 520220 + }, + { + "epoch": 1.35, + "learning_rate": 9.772331970729506e-05, + "loss": 0.01, + "step": 520230 + }, + { + "epoch": 1.35, + "learning_rate": 9.77194314909236e-05, + "loss": 0.0081, + "step": 520240 + }, + { + "epoch": 1.35, + "learning_rate": 9.771554327455213e-05, + "loss": 0.0082, + "step": 520250 + }, + { + "epoch": 1.35, + "learning_rate": 9.771165505818067e-05, + "loss": 0.0094, + "step": 520260 + }, + { + "epoch": 1.35, + "learning_rate": 9.77077668418092e-05, + "loss": 0.0078, + "step": 520270 + }, + { + "epoch": 1.35, + "learning_rate": 9.770387862543773e-05, + "loss": 0.0093, + "step": 520280 + }, + { + "epoch": 1.35, + "learning_rate": 9.769999040906627e-05, + "loss": 0.0085, + "step": 520290 + }, + { + "epoch": 1.35, + "learning_rate": 9.76961021926948e-05, + "loss": 0.0098, + "step": 520300 + }, + { + "epoch": 1.35, + "learning_rate": 9.769221397632335e-05, + "loss": 0.011, + "step": 520310 + }, + { + "epoch": 1.35, + "learning_rate": 9.768832575995187e-05, + "loss": 0.0107, + "step": 520320 + }, + { + "epoch": 1.35, + "learning_rate": 9.768443754358042e-05, + "loss": 0.0149, + "step": 520330 + }, + { + "epoch": 1.35, + "learning_rate": 9.768054932720895e-05, + "loss": 0.0095, + "step": 520340 + }, + { + "epoch": 1.35, + "learning_rate": 9.767666111083749e-05, + "loss": 0.0086, + "step": 520350 + }, + { + "epoch": 1.35, + "learning_rate": 9.767277289446602e-05, + "loss": 0.009, + "step": 520360 + }, + { + "epoch": 1.35, + "learning_rate": 9.766888467809456e-05, + "loss": 0.0134, + "step": 520370 + }, + { + "epoch": 1.35, + "learning_rate": 9.766499646172309e-05, + "loss": 0.0107, + "step": 520380 + }, + { + "epoch": 1.35, + "learning_rate": 9.766110824535163e-05, + "loss": 0.0092, + "step": 520390 + }, + { + "epoch": 1.35, + "learning_rate": 9.765722002898016e-05, + "loss": 0.0109, + "step": 520400 + }, + { + "epoch": 1.35, + "learning_rate": 9.76533318126087e-05, + "loss": 0.0115, + "step": 520410 + }, + { + "epoch": 1.35, + "learning_rate": 9.764944359623723e-05, + "loss": 0.0089, + "step": 520420 + }, + { + "epoch": 1.35, + "learning_rate": 9.764555537986577e-05, + "loss": 0.0105, + "step": 520430 + }, + { + "epoch": 1.35, + "learning_rate": 9.76416671634943e-05, + "loss": 0.0088, + "step": 520440 + }, + { + "epoch": 1.35, + "learning_rate": 9.763777894712284e-05, + "loss": 0.0114, + "step": 520450 + }, + { + "epoch": 1.35, + "learning_rate": 9.763389073075137e-05, + "loss": 0.0069, + "step": 520460 + }, + { + "epoch": 1.35, + "learning_rate": 9.763000251437992e-05, + "loss": 0.0097, + "step": 520470 + }, + { + "epoch": 1.35, + "learning_rate": 9.762611429800844e-05, + "loss": 0.0117, + "step": 520480 + }, + { + "epoch": 1.35, + "learning_rate": 9.7622226081637e-05, + "loss": 0.0105, + "step": 520490 + }, + { + "epoch": 1.35, + "learning_rate": 9.761833786526552e-05, + "loss": 0.01, + "step": 520500 + }, + { + "epoch": 1.35, + "learning_rate": 9.761444964889406e-05, + "loss": 0.0134, + "step": 520510 + }, + { + "epoch": 1.35, + "learning_rate": 9.761056143252259e-05, + "loss": 0.0114, + "step": 520520 + }, + { + "epoch": 1.35, + "learning_rate": 9.760667321615112e-05, + "loss": 0.011, + "step": 520530 + }, + { + "epoch": 1.35, + "learning_rate": 9.760278499977966e-05, + "loss": 0.0104, + "step": 520540 + }, + { + "epoch": 1.35, + "learning_rate": 9.759889678340819e-05, + "loss": 0.0083, + "step": 520550 + }, + { + "epoch": 1.35, + "learning_rate": 9.759500856703673e-05, + "loss": 0.0083, + "step": 520560 + }, + { + "epoch": 1.35, + "learning_rate": 9.759112035066526e-05, + "loss": 0.01, + "step": 520570 + }, + { + "epoch": 1.35, + "learning_rate": 9.75872321342938e-05, + "loss": 0.0151, + "step": 520580 + }, + { + "epoch": 1.35, + "learning_rate": 9.758334391792233e-05, + "loss": 0.011, + "step": 520590 + }, + { + "epoch": 1.35, + "learning_rate": 9.757945570155087e-05, + "loss": 0.0098, + "step": 520600 + }, + { + "epoch": 1.35, + "learning_rate": 9.75755674851794e-05, + "loss": 0.0078, + "step": 520610 + }, + { + "epoch": 1.35, + "learning_rate": 9.757167926880794e-05, + "loss": 0.0146, + "step": 520620 + }, + { + "epoch": 1.35, + "learning_rate": 9.756779105243647e-05, + "loss": 0.0071, + "step": 520630 + }, + { + "epoch": 1.35, + "learning_rate": 9.756390283606501e-05, + "loss": 0.0117, + "step": 520640 + }, + { + "epoch": 1.35, + "learning_rate": 9.756001461969354e-05, + "loss": 0.0101, + "step": 520650 + }, + { + "epoch": 1.35, + "learning_rate": 9.75561264033221e-05, + "loss": 0.01, + "step": 520660 + }, + { + "epoch": 1.35, + "learning_rate": 9.755223818695062e-05, + "loss": 0.0113, + "step": 520670 + }, + { + "epoch": 1.35, + "learning_rate": 9.754834997057916e-05, + "loss": 0.0098, + "step": 520680 + }, + { + "epoch": 1.35, + "learning_rate": 9.754446175420769e-05, + "loss": 0.0101, + "step": 520690 + }, + { + "epoch": 1.35, + "learning_rate": 9.754057353783623e-05, + "loss": 0.0088, + "step": 520700 + }, + { + "epoch": 1.35, + "learning_rate": 9.753668532146476e-05, + "loss": 0.0086, + "step": 520710 + }, + { + "epoch": 1.35, + "learning_rate": 9.75327971050933e-05, + "loss": 0.0113, + "step": 520720 + }, + { + "epoch": 1.35, + "learning_rate": 9.752890888872183e-05, + "loss": 0.0109, + "step": 520730 + }, + { + "epoch": 1.35, + "learning_rate": 9.752502067235037e-05, + "loss": 0.0082, + "step": 520740 + }, + { + "epoch": 1.35, + "learning_rate": 9.75211324559789e-05, + "loss": 0.0104, + "step": 520750 + }, + { + "epoch": 1.35, + "learning_rate": 9.751724423960744e-05, + "loss": 0.013, + "step": 520760 + }, + { + "epoch": 1.35, + "learning_rate": 9.751335602323597e-05, + "loss": 0.0079, + "step": 520770 + }, + { + "epoch": 1.35, + "learning_rate": 9.75094678068645e-05, + "loss": 0.0104, + "step": 520780 + }, + { + "epoch": 1.35, + "learning_rate": 9.750557959049304e-05, + "loss": 0.0085, + "step": 520790 + }, + { + "epoch": 1.35, + "learning_rate": 9.750169137412157e-05, + "loss": 0.0112, + "step": 520800 + }, + { + "epoch": 1.35, + "learning_rate": 9.749780315775011e-05, + "loss": 0.0111, + "step": 520810 + }, + { + "epoch": 1.35, + "learning_rate": 9.749391494137864e-05, + "loss": 0.0086, + "step": 520820 + }, + { + "epoch": 1.35, + "learning_rate": 9.749002672500718e-05, + "loss": 0.0092, + "step": 520830 + }, + { + "epoch": 1.35, + "learning_rate": 9.748613850863571e-05, + "loss": 0.0102, + "step": 520840 + }, + { + "epoch": 1.35, + "learning_rate": 9.748225029226426e-05, + "loss": 0.01, + "step": 520850 + }, + { + "epoch": 1.35, + "learning_rate": 9.747836207589279e-05, + "loss": 0.0089, + "step": 520860 + }, + { + "epoch": 1.35, + "learning_rate": 9.747447385952133e-05, + "loss": 0.0083, + "step": 520870 + }, + { + "epoch": 1.35, + "learning_rate": 9.747058564314986e-05, + "loss": 0.0122, + "step": 520880 + }, + { + "epoch": 1.35, + "learning_rate": 9.74666974267784e-05, + "loss": 0.012, + "step": 520890 + }, + { + "epoch": 1.35, + "learning_rate": 9.746280921040693e-05, + "loss": 0.0106, + "step": 520900 + }, + { + "epoch": 1.35, + "learning_rate": 9.745892099403547e-05, + "loss": 0.0097, + "step": 520910 + }, + { + "epoch": 1.35, + "learning_rate": 9.7455032777664e-05, + "loss": 0.0097, + "step": 520920 + }, + { + "epoch": 1.35, + "learning_rate": 9.745114456129254e-05, + "loss": 0.0074, + "step": 520930 + }, + { + "epoch": 1.35, + "learning_rate": 9.744725634492107e-05, + "loss": 0.0113, + "step": 520940 + }, + { + "epoch": 1.35, + "learning_rate": 9.744336812854961e-05, + "loss": 0.0122, + "step": 520950 + }, + { + "epoch": 1.35, + "learning_rate": 9.743947991217814e-05, + "loss": 0.0129, + "step": 520960 + }, + { + "epoch": 1.35, + "learning_rate": 9.743559169580668e-05, + "loss": 0.014, + "step": 520970 + }, + { + "epoch": 1.35, + "learning_rate": 9.743170347943521e-05, + "loss": 0.0108, + "step": 520980 + }, + { + "epoch": 1.35, + "learning_rate": 9.742781526306375e-05, + "loss": 0.0142, + "step": 520990 + }, + { + "epoch": 1.35, + "learning_rate": 9.742392704669228e-05, + "loss": 0.0098, + "step": 521000 + }, + { + "epoch": 1.35, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.006592988967895508, + "eval_runtime": 107.9088, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.634, + "step": 521000 + }, + { + "epoch": 1.35, + "learning_rate": 9.742003883032083e-05, + "loss": 0.011, + "step": 521010 + }, + { + "epoch": 1.35, + "learning_rate": 9.741615061394936e-05, + "loss": 0.0093, + "step": 521020 + }, + { + "epoch": 1.35, + "learning_rate": 9.741226239757788e-05, + "loss": 0.009, + "step": 521030 + }, + { + "epoch": 1.35, + "learning_rate": 9.740837418120643e-05, + "loss": 0.0084, + "step": 521040 + }, + { + "epoch": 1.35, + "learning_rate": 9.740448596483496e-05, + "loss": 0.0088, + "step": 521050 + }, + { + "epoch": 1.35, + "learning_rate": 9.74005977484635e-05, + "loss": 0.01, + "step": 521060 + }, + { + "epoch": 1.35, + "learning_rate": 9.739670953209203e-05, + "loss": 0.0094, + "step": 521070 + }, + { + "epoch": 1.35, + "learning_rate": 9.739282131572057e-05, + "loss": 0.0098, + "step": 521080 + }, + { + "epoch": 1.35, + "learning_rate": 9.73889330993491e-05, + "loss": 0.0091, + "step": 521090 + }, + { + "epoch": 1.35, + "learning_rate": 9.738504488297764e-05, + "loss": 0.0104, + "step": 521100 + }, + { + "epoch": 1.35, + "learning_rate": 9.738115666660617e-05, + "loss": 0.0084, + "step": 521110 + }, + { + "epoch": 1.35, + "learning_rate": 9.737726845023471e-05, + "loss": 0.0104, + "step": 521120 + }, + { + "epoch": 1.35, + "learning_rate": 9.737338023386324e-05, + "loss": 0.0097, + "step": 521130 + }, + { + "epoch": 1.35, + "learning_rate": 9.736949201749178e-05, + "loss": 0.0088, + "step": 521140 + }, + { + "epoch": 1.35, + "learning_rate": 9.736560380112031e-05, + "loss": 0.0076, + "step": 521150 + }, + { + "epoch": 1.35, + "learning_rate": 9.736171558474885e-05, + "loss": 0.0118, + "step": 521160 + }, + { + "epoch": 1.35, + "learning_rate": 9.735782736837738e-05, + "loss": 0.0083, + "step": 521170 + }, + { + "epoch": 1.35, + "learning_rate": 9.735393915200593e-05, + "loss": 0.0124, + "step": 521180 + }, + { + "epoch": 1.35, + "learning_rate": 9.735005093563445e-05, + "loss": 0.0082, + "step": 521190 + }, + { + "epoch": 1.35, + "learning_rate": 9.7346162719263e-05, + "loss": 0.0118, + "step": 521200 + }, + { + "epoch": 1.35, + "learning_rate": 9.734227450289153e-05, + "loss": 0.0076, + "step": 521210 + }, + { + "epoch": 1.35, + "learning_rate": 9.733838628652007e-05, + "loss": 0.0093, + "step": 521220 + }, + { + "epoch": 1.35, + "learning_rate": 9.73344980701486e-05, + "loss": 0.0106, + "step": 521230 + }, + { + "epoch": 1.35, + "learning_rate": 9.733060985377714e-05, + "loss": 0.0092, + "step": 521240 + }, + { + "epoch": 1.35, + "learning_rate": 9.732672163740567e-05, + "loss": 0.0103, + "step": 521250 + }, + { + "epoch": 1.35, + "learning_rate": 9.732283342103421e-05, + "loss": 0.0097, + "step": 521260 + }, + { + "epoch": 1.35, + "learning_rate": 9.731894520466274e-05, + "loss": 0.0114, + "step": 521270 + }, + { + "epoch": 1.35, + "learning_rate": 9.731505698829127e-05, + "loss": 0.0129, + "step": 521280 + }, + { + "epoch": 1.35, + "learning_rate": 9.731116877191981e-05, + "loss": 0.0118, + "step": 521290 + }, + { + "epoch": 1.35, + "learning_rate": 9.730728055554834e-05, + "loss": 0.0115, + "step": 521300 + }, + { + "epoch": 1.35, + "learning_rate": 9.730339233917688e-05, + "loss": 0.0097, + "step": 521310 + }, + { + "epoch": 1.35, + "learning_rate": 9.729950412280541e-05, + "loss": 0.0122, + "step": 521320 + }, + { + "epoch": 1.35, + "learning_rate": 9.729561590643395e-05, + "loss": 0.0071, + "step": 521330 + }, + { + "epoch": 1.35, + "learning_rate": 9.729172769006248e-05, + "loss": 0.0091, + "step": 521340 + }, + { + "epoch": 1.35, + "learning_rate": 9.728783947369102e-05, + "loss": 0.0205, + "step": 521350 + }, + { + "epoch": 1.35, + "learning_rate": 9.728395125731955e-05, + "loss": 0.0123, + "step": 521360 + }, + { + "epoch": 1.35, + "learning_rate": 9.72800630409481e-05, + "loss": 0.011, + "step": 521370 + }, + { + "epoch": 1.35, + "learning_rate": 9.727617482457663e-05, + "loss": 0.0095, + "step": 521380 + }, + { + "epoch": 1.35, + "learning_rate": 9.727228660820517e-05, + "loss": 0.0114, + "step": 521390 + }, + { + "epoch": 1.35, + "learning_rate": 9.72683983918337e-05, + "loss": 0.011, + "step": 521400 + }, + { + "epoch": 1.35, + "learning_rate": 9.726451017546224e-05, + "loss": 0.0107, + "step": 521410 + }, + { + "epoch": 1.35, + "learning_rate": 9.726062195909077e-05, + "loss": 0.0172, + "step": 521420 + }, + { + "epoch": 1.35, + "learning_rate": 9.725673374271931e-05, + "loss": 0.0119, + "step": 521430 + }, + { + "epoch": 1.35, + "learning_rate": 9.725284552634784e-05, + "loss": 0.009, + "step": 521440 + }, + { + "epoch": 1.35, + "learning_rate": 9.724895730997638e-05, + "loss": 0.0105, + "step": 521450 + }, + { + "epoch": 1.35, + "learning_rate": 9.724506909360491e-05, + "loss": 0.0095, + "step": 521460 + }, + { + "epoch": 1.35, + "learning_rate": 9.724118087723345e-05, + "loss": 0.0088, + "step": 521470 + }, + { + "epoch": 1.35, + "learning_rate": 9.723729266086198e-05, + "loss": 0.0103, + "step": 521480 + }, + { + "epoch": 1.35, + "learning_rate": 9.723340444449052e-05, + "loss": 0.011, + "step": 521490 + }, + { + "epoch": 1.35, + "learning_rate": 9.722951622811905e-05, + "loss": 0.0097, + "step": 521500 + }, + { + "epoch": 1.35, + "learning_rate": 9.722562801174759e-05, + "loss": 0.0086, + "step": 521510 + }, + { + "epoch": 1.35, + "learning_rate": 9.722173979537612e-05, + "loss": 0.0082, + "step": 521520 + }, + { + "epoch": 1.35, + "learning_rate": 9.721785157900465e-05, + "loss": 0.0108, + "step": 521530 + }, + { + "epoch": 1.35, + "learning_rate": 9.72139633626332e-05, + "loss": 0.0075, + "step": 521540 + }, + { + "epoch": 1.35, + "learning_rate": 9.721007514626172e-05, + "loss": 0.009, + "step": 521550 + }, + { + "epoch": 1.35, + "learning_rate": 9.720618692989027e-05, + "loss": 0.0071, + "step": 521560 + }, + { + "epoch": 1.35, + "learning_rate": 9.72022987135188e-05, + "loss": 0.0079, + "step": 521570 + }, + { + "epoch": 1.35, + "learning_rate": 9.719841049714734e-05, + "loss": 0.0106, + "step": 521580 + }, + { + "epoch": 1.35, + "learning_rate": 9.719452228077587e-05, + "loss": 0.0153, + "step": 521590 + }, + { + "epoch": 1.35, + "learning_rate": 9.719063406440441e-05, + "loss": 0.0068, + "step": 521600 + }, + { + "epoch": 1.35, + "learning_rate": 9.718674584803294e-05, + "loss": 0.0091, + "step": 521610 + }, + { + "epoch": 1.35, + "learning_rate": 9.718285763166148e-05, + "loss": 0.0097, + "step": 521620 + }, + { + "epoch": 1.35, + "learning_rate": 9.717896941529001e-05, + "loss": 0.0103, + "step": 521630 + }, + { + "epoch": 1.35, + "learning_rate": 9.717508119891855e-05, + "loss": 0.0068, + "step": 521640 + }, + { + "epoch": 1.35, + "learning_rate": 9.717119298254708e-05, + "loss": 0.0068, + "step": 521650 + }, + { + "epoch": 1.35, + "learning_rate": 9.716730476617562e-05, + "loss": 0.0088, + "step": 521660 + }, + { + "epoch": 1.35, + "learning_rate": 9.716341654980415e-05, + "loss": 0.0081, + "step": 521670 + }, + { + "epoch": 1.35, + "learning_rate": 9.715952833343269e-05, + "loss": 0.0101, + "step": 521680 + }, + { + "epoch": 1.35, + "learning_rate": 9.715564011706122e-05, + "loss": 0.0094, + "step": 521690 + }, + { + "epoch": 1.35, + "learning_rate": 9.715175190068977e-05, + "loss": 0.009, + "step": 521700 + }, + { + "epoch": 1.35, + "learning_rate": 9.714786368431829e-05, + "loss": 0.0112, + "step": 521710 + }, + { + "epoch": 1.35, + "learning_rate": 9.714397546794684e-05, + "loss": 0.0091, + "step": 521720 + }, + { + "epoch": 1.35, + "learning_rate": 9.714008725157537e-05, + "loss": 0.0108, + "step": 521730 + }, + { + "epoch": 1.35, + "learning_rate": 9.713619903520391e-05, + "loss": 0.0077, + "step": 521740 + }, + { + "epoch": 1.35, + "learning_rate": 9.713231081883244e-05, + "loss": 0.0105, + "step": 521750 + }, + { + "epoch": 1.35, + "learning_rate": 9.712842260246098e-05, + "loss": 0.0076, + "step": 521760 + }, + { + "epoch": 1.35, + "learning_rate": 9.712453438608951e-05, + "loss": 0.0109, + "step": 521770 + }, + { + "epoch": 1.35, + "learning_rate": 9.712064616971804e-05, + "loss": 0.0098, + "step": 521780 + }, + { + "epoch": 1.35, + "learning_rate": 9.711675795334658e-05, + "loss": 0.0116, + "step": 521790 + }, + { + "epoch": 1.35, + "learning_rate": 9.711286973697511e-05, + "loss": 0.0121, + "step": 521800 + }, + { + "epoch": 1.35, + "learning_rate": 9.710898152060365e-05, + "loss": 0.0142, + "step": 521810 + }, + { + "epoch": 1.35, + "learning_rate": 9.710509330423218e-05, + "loss": 0.0079, + "step": 521820 + }, + { + "epoch": 1.35, + "learning_rate": 9.710120508786072e-05, + "loss": 0.011, + "step": 521830 + }, + { + "epoch": 1.35, + "learning_rate": 9.709731687148925e-05, + "loss": 0.0097, + "step": 521840 + }, + { + "epoch": 1.35, + "learning_rate": 9.709342865511779e-05, + "loss": 0.0096, + "step": 521850 + }, + { + "epoch": 1.35, + "learning_rate": 9.708954043874632e-05, + "loss": 0.0071, + "step": 521860 + }, + { + "epoch": 1.35, + "learning_rate": 9.708565222237486e-05, + "loss": 0.0101, + "step": 521870 + }, + { + "epoch": 1.35, + "learning_rate": 9.708176400600339e-05, + "loss": 0.0116, + "step": 521880 + }, + { + "epoch": 1.35, + "learning_rate": 9.707787578963194e-05, + "loss": 0.0069, + "step": 521890 + }, + { + "epoch": 1.35, + "learning_rate": 9.707398757326047e-05, + "loss": 0.0127, + "step": 521900 + }, + { + "epoch": 1.35, + "learning_rate": 9.707009935688901e-05, + "loss": 0.0117, + "step": 521910 + }, + { + "epoch": 1.35, + "learning_rate": 9.706621114051754e-05, + "loss": 0.01, + "step": 521920 + }, + { + "epoch": 1.35, + "learning_rate": 9.706232292414608e-05, + "loss": 0.0101, + "step": 521930 + }, + { + "epoch": 1.35, + "learning_rate": 9.705843470777461e-05, + "loss": 0.008, + "step": 521940 + }, + { + "epoch": 1.35, + "learning_rate": 9.705454649140315e-05, + "loss": 0.0098, + "step": 521950 + }, + { + "epoch": 1.35, + "learning_rate": 9.705065827503168e-05, + "loss": 0.0132, + "step": 521960 + }, + { + "epoch": 1.35, + "learning_rate": 9.704677005866022e-05, + "loss": 0.0102, + "step": 521970 + }, + { + "epoch": 1.35, + "learning_rate": 9.704288184228875e-05, + "loss": 0.0072, + "step": 521980 + }, + { + "epoch": 1.35, + "learning_rate": 9.703899362591729e-05, + "loss": 0.0073, + "step": 521990 + }, + { + "epoch": 1.35, + "learning_rate": 9.703510540954582e-05, + "loss": 0.0131, + "step": 522000 + }, + { + "epoch": 1.35, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.006435697432607412, + "eval_runtime": 107.8203, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 522000 + }, + { + "epoch": 1.35, + "learning_rate": 9.703121719317436e-05, + "loss": 0.0104, + "step": 522010 + }, + { + "epoch": 1.35, + "learning_rate": 9.702732897680289e-05, + "loss": 0.0084, + "step": 522020 + }, + { + "epoch": 1.35, + "learning_rate": 9.702344076043142e-05, + "loss": 0.009, + "step": 522030 + }, + { + "epoch": 1.35, + "learning_rate": 9.701955254405996e-05, + "loss": 0.0069, + "step": 522040 + }, + { + "epoch": 1.35, + "learning_rate": 9.701566432768849e-05, + "loss": 0.0133, + "step": 522050 + }, + { + "epoch": 1.35, + "learning_rate": 9.701177611131704e-05, + "loss": 0.0086, + "step": 522060 + }, + { + "epoch": 1.35, + "learning_rate": 9.700788789494556e-05, + "loss": 0.0083, + "step": 522070 + }, + { + "epoch": 1.35, + "learning_rate": 9.700399967857411e-05, + "loss": 0.0104, + "step": 522080 + }, + { + "epoch": 1.35, + "learning_rate": 9.700011146220264e-05, + "loss": 0.0108, + "step": 522090 + }, + { + "epoch": 1.35, + "learning_rate": 9.699622324583118e-05, + "loss": 0.0075, + "step": 522100 + }, + { + "epoch": 1.35, + "learning_rate": 9.699233502945971e-05, + "loss": 0.0093, + "step": 522110 + }, + { + "epoch": 1.35, + "learning_rate": 9.698844681308825e-05, + "loss": 0.0097, + "step": 522120 + }, + { + "epoch": 1.35, + "learning_rate": 9.698455859671678e-05, + "loss": 0.0105, + "step": 522130 + }, + { + "epoch": 1.35, + "learning_rate": 9.698067038034532e-05, + "loss": 0.0093, + "step": 522140 + }, + { + "epoch": 1.35, + "learning_rate": 9.697678216397385e-05, + "loss": 0.0078, + "step": 522150 + }, + { + "epoch": 1.35, + "learning_rate": 9.697289394760239e-05, + "loss": 0.0077, + "step": 522160 + }, + { + "epoch": 1.35, + "learning_rate": 9.696900573123092e-05, + "loss": 0.0109, + "step": 522170 + }, + { + "epoch": 1.35, + "learning_rate": 9.696511751485946e-05, + "loss": 0.0103, + "step": 522180 + }, + { + "epoch": 1.35, + "learning_rate": 9.696122929848799e-05, + "loss": 0.0117, + "step": 522190 + }, + { + "epoch": 1.35, + "learning_rate": 9.695734108211653e-05, + "loss": 0.01, + "step": 522200 + }, + { + "epoch": 1.35, + "learning_rate": 9.695345286574506e-05, + "loss": 0.0087, + "step": 522210 + }, + { + "epoch": 1.35, + "learning_rate": 9.69495646493736e-05, + "loss": 0.0115, + "step": 522220 + }, + { + "epoch": 1.35, + "learning_rate": 9.694567643300213e-05, + "loss": 0.0106, + "step": 522230 + }, + { + "epoch": 1.35, + "learning_rate": 9.694178821663068e-05, + "loss": 0.0112, + "step": 522240 + }, + { + "epoch": 1.35, + "learning_rate": 9.693790000025921e-05, + "loss": 0.0063, + "step": 522250 + }, + { + "epoch": 1.35, + "learning_rate": 9.693401178388775e-05, + "loss": 0.0083, + "step": 522260 + }, + { + "epoch": 1.35, + "learning_rate": 9.693012356751628e-05, + "loss": 0.0091, + "step": 522270 + }, + { + "epoch": 1.35, + "learning_rate": 9.692623535114481e-05, + "loss": 0.0096, + "step": 522280 + }, + { + "epoch": 1.35, + "learning_rate": 9.692234713477335e-05, + "loss": 0.0089, + "step": 522290 + }, + { + "epoch": 1.35, + "learning_rate": 9.691845891840188e-05, + "loss": 0.01, + "step": 522300 + }, + { + "epoch": 1.35, + "learning_rate": 9.691457070203042e-05, + "loss": 0.0073, + "step": 522310 + }, + { + "epoch": 1.35, + "learning_rate": 9.691068248565895e-05, + "loss": 0.0053, + "step": 522320 + }, + { + "epoch": 1.35, + "learning_rate": 9.690679426928749e-05, + "loss": 0.0082, + "step": 522330 + }, + { + "epoch": 1.35, + "learning_rate": 9.690290605291602e-05, + "loss": 0.0102, + "step": 522340 + }, + { + "epoch": 1.35, + "learning_rate": 9.689901783654456e-05, + "loss": 0.0134, + "step": 522350 + }, + { + "epoch": 1.35, + "learning_rate": 9.689512962017309e-05, + "loss": 0.0118, + "step": 522360 + }, + { + "epoch": 1.35, + "learning_rate": 9.689124140380163e-05, + "loss": 0.0093, + "step": 522370 + }, + { + "epoch": 1.35, + "learning_rate": 9.688735318743016e-05, + "loss": 0.01, + "step": 522380 + }, + { + "epoch": 1.35, + "learning_rate": 9.68834649710587e-05, + "loss": 0.0085, + "step": 522390 + }, + { + "epoch": 1.35, + "learning_rate": 9.687957675468723e-05, + "loss": 0.01, + "step": 522400 + }, + { + "epoch": 1.35, + "learning_rate": 9.687568853831578e-05, + "loss": 0.0094, + "step": 522410 + }, + { + "epoch": 1.35, + "learning_rate": 9.68718003219443e-05, + "loss": 0.009, + "step": 522420 + }, + { + "epoch": 1.35, + "learning_rate": 9.686791210557285e-05, + "loss": 0.0066, + "step": 522430 + }, + { + "epoch": 1.35, + "learning_rate": 9.686402388920138e-05, + "loss": 0.0101, + "step": 522440 + }, + { + "epoch": 1.35, + "learning_rate": 9.686013567282992e-05, + "loss": 0.0088, + "step": 522450 + }, + { + "epoch": 1.35, + "learning_rate": 9.685624745645845e-05, + "loss": 0.0103, + "step": 522460 + }, + { + "epoch": 1.35, + "learning_rate": 9.685235924008699e-05, + "loss": 0.0266, + "step": 522470 + }, + { + "epoch": 1.35, + "learning_rate": 9.684847102371552e-05, + "loss": 0.0144, + "step": 522480 + }, + { + "epoch": 1.35, + "learning_rate": 9.684458280734406e-05, + "loss": 0.0119, + "step": 522490 + }, + { + "epoch": 1.35, + "learning_rate": 9.684069459097259e-05, + "loss": 0.0092, + "step": 522500 + }, + { + "epoch": 1.35, + "learning_rate": 9.683680637460113e-05, + "loss": 0.0078, + "step": 522510 + }, + { + "epoch": 1.35, + "learning_rate": 9.683291815822966e-05, + "loss": 0.011, + "step": 522520 + }, + { + "epoch": 1.35, + "learning_rate": 9.682902994185819e-05, + "loss": 0.0127, + "step": 522530 + }, + { + "epoch": 1.35, + "learning_rate": 9.682514172548673e-05, + "loss": 0.0075, + "step": 522540 + }, + { + "epoch": 1.35, + "learning_rate": 9.682125350911526e-05, + "loss": 0.0143, + "step": 522550 + }, + { + "epoch": 1.35, + "learning_rate": 9.68173652927438e-05, + "loss": 0.0121, + "step": 522560 + }, + { + "epoch": 1.35, + "learning_rate": 9.681347707637233e-05, + "loss": 0.0098, + "step": 522570 + }, + { + "epoch": 1.35, + "learning_rate": 9.680958886000087e-05, + "loss": 0.0083, + "step": 522580 + }, + { + "epoch": 1.35, + "learning_rate": 9.68057006436294e-05, + "loss": 0.0073, + "step": 522590 + }, + { + "epoch": 1.35, + "learning_rate": 9.680181242725795e-05, + "loss": 0.0106, + "step": 522600 + }, + { + "epoch": 1.35, + "learning_rate": 9.679792421088648e-05, + "loss": 0.0103, + "step": 522610 + }, + { + "epoch": 1.35, + "learning_rate": 9.679403599451502e-05, + "loss": 0.0085, + "step": 522620 + }, + { + "epoch": 1.35, + "learning_rate": 9.679014777814355e-05, + "loss": 0.0098, + "step": 522630 + }, + { + "epoch": 1.35, + "learning_rate": 9.678625956177209e-05, + "loss": 0.0152, + "step": 522640 + }, + { + "epoch": 1.35, + "learning_rate": 9.678237134540062e-05, + "loss": 0.0093, + "step": 522650 + }, + { + "epoch": 1.35, + "learning_rate": 9.677848312902916e-05, + "loss": 0.0079, + "step": 522660 + }, + { + "epoch": 1.35, + "learning_rate": 9.677459491265769e-05, + "loss": 0.0101, + "step": 522670 + }, + { + "epoch": 1.35, + "learning_rate": 9.677070669628623e-05, + "loss": 0.0082, + "step": 522680 + }, + { + "epoch": 1.35, + "learning_rate": 9.676681847991476e-05, + "loss": 0.0097, + "step": 522690 + }, + { + "epoch": 1.35, + "learning_rate": 9.67629302635433e-05, + "loss": 0.0105, + "step": 522700 + }, + { + "epoch": 1.35, + "learning_rate": 9.675904204717183e-05, + "loss": 0.0104, + "step": 522710 + }, + { + "epoch": 1.35, + "learning_rate": 9.675515383080037e-05, + "loss": 0.0088, + "step": 522720 + }, + { + "epoch": 1.35, + "learning_rate": 9.67512656144289e-05, + "loss": 0.0078, + "step": 522730 + }, + { + "epoch": 1.36, + "learning_rate": 9.674737739805744e-05, + "loss": 0.0102, + "step": 522740 + }, + { + "epoch": 1.36, + "learning_rate": 9.674348918168597e-05, + "loss": 0.0129, + "step": 522750 + }, + { + "epoch": 1.36, + "learning_rate": 9.673960096531452e-05, + "loss": 0.0078, + "step": 522760 + }, + { + "epoch": 1.36, + "learning_rate": 9.673571274894305e-05, + "loss": 0.0123, + "step": 522770 + }, + { + "epoch": 1.36, + "learning_rate": 9.673182453257157e-05, + "loss": 0.0092, + "step": 522780 + }, + { + "epoch": 1.36, + "learning_rate": 9.672793631620012e-05, + "loss": 0.0127, + "step": 522790 + }, + { + "epoch": 1.36, + "learning_rate": 9.672404809982865e-05, + "loss": 0.01, + "step": 522800 + }, + { + "epoch": 1.36, + "learning_rate": 9.672015988345719e-05, + "loss": 0.0097, + "step": 522810 + }, + { + "epoch": 1.36, + "learning_rate": 9.671627166708572e-05, + "loss": 0.0124, + "step": 522820 + }, + { + "epoch": 1.36, + "learning_rate": 9.671238345071426e-05, + "loss": 0.0067, + "step": 522830 + }, + { + "epoch": 1.36, + "learning_rate": 9.670849523434279e-05, + "loss": 0.0118, + "step": 522840 + }, + { + "epoch": 1.36, + "learning_rate": 9.670460701797133e-05, + "loss": 0.0085, + "step": 522850 + }, + { + "epoch": 1.36, + "learning_rate": 9.670071880159986e-05, + "loss": 0.0124, + "step": 522860 + }, + { + "epoch": 1.36, + "learning_rate": 9.66968305852284e-05, + "loss": 0.0081, + "step": 522870 + }, + { + "epoch": 1.36, + "learning_rate": 9.669294236885693e-05, + "loss": 0.0085, + "step": 522880 + }, + { + "epoch": 1.36, + "learning_rate": 9.668905415248547e-05, + "loss": 0.0082, + "step": 522890 + }, + { + "epoch": 1.36, + "learning_rate": 9.6685165936114e-05, + "loss": 0.01, + "step": 522900 + }, + { + "epoch": 1.36, + "learning_rate": 9.668127771974254e-05, + "loss": 0.0108, + "step": 522910 + }, + { + "epoch": 1.36, + "learning_rate": 9.667738950337107e-05, + "loss": 0.009, + "step": 522920 + }, + { + "epoch": 1.36, + "learning_rate": 9.667350128699962e-05, + "loss": 0.01, + "step": 522930 + }, + { + "epoch": 1.36, + "learning_rate": 9.666961307062814e-05, + "loss": 0.0084, + "step": 522940 + }, + { + "epoch": 1.36, + "learning_rate": 9.666572485425669e-05, + "loss": 0.0079, + "step": 522950 + }, + { + "epoch": 1.36, + "learning_rate": 9.666183663788522e-05, + "loss": 0.011, + "step": 522960 + }, + { + "epoch": 1.36, + "learning_rate": 9.665794842151376e-05, + "loss": 0.0094, + "step": 522970 + }, + { + "epoch": 1.36, + "learning_rate": 9.665406020514229e-05, + "loss": 0.0061, + "step": 522980 + }, + { + "epoch": 1.36, + "learning_rate": 9.665017198877083e-05, + "loss": 0.0097, + "step": 522990 + }, + { + "epoch": 1.36, + "learning_rate": 9.664628377239936e-05, + "loss": 0.01, + "step": 523000 + }, + { + "epoch": 1.36, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.006541228387504816, + "eval_runtime": 107.8789, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 523000 + }, + { + "epoch": 1.36, + "learning_rate": 9.664239555602789e-05, + "loss": 0.0105, + "step": 523010 + }, + { + "epoch": 1.36, + "learning_rate": 9.663850733965643e-05, + "loss": 0.0105, + "step": 523020 + }, + { + "epoch": 1.36, + "learning_rate": 9.663461912328496e-05, + "loss": 0.0089, + "step": 523030 + }, + { + "epoch": 1.36, + "learning_rate": 9.66307309069135e-05, + "loss": 0.0093, + "step": 523040 + }, + { + "epoch": 1.36, + "learning_rate": 9.662684269054203e-05, + "loss": 0.0104, + "step": 523050 + }, + { + "epoch": 1.36, + "learning_rate": 9.662295447417057e-05, + "loss": 0.0094, + "step": 523060 + }, + { + "epoch": 1.36, + "learning_rate": 9.66190662577991e-05, + "loss": 0.0118, + "step": 523070 + }, + { + "epoch": 1.36, + "learning_rate": 9.661517804142764e-05, + "loss": 0.0118, + "step": 523080 + }, + { + "epoch": 1.36, + "learning_rate": 9.661128982505617e-05, + "loss": 0.0102, + "step": 523090 + }, + { + "epoch": 1.36, + "learning_rate": 9.660740160868471e-05, + "loss": 0.0069, + "step": 523100 + }, + { + "epoch": 1.36, + "learning_rate": 9.660351339231324e-05, + "loss": 0.0075, + "step": 523110 + }, + { + "epoch": 1.36, + "learning_rate": 9.659962517594179e-05, + "loss": 0.0137, + "step": 523120 + }, + { + "epoch": 1.36, + "learning_rate": 9.659573695957032e-05, + "loss": 0.014, + "step": 523130 + }, + { + "epoch": 1.36, + "learning_rate": 9.659184874319886e-05, + "loss": 0.0105, + "step": 523140 + }, + { + "epoch": 1.36, + "learning_rate": 9.658796052682739e-05, + "loss": 0.0079, + "step": 523150 + }, + { + "epoch": 1.36, + "learning_rate": 9.658407231045593e-05, + "loss": 0.009, + "step": 523160 + }, + { + "epoch": 1.36, + "learning_rate": 9.658018409408446e-05, + "loss": 0.0095, + "step": 523170 + }, + { + "epoch": 1.36, + "learning_rate": 9.6576295877713e-05, + "loss": 0.0085, + "step": 523180 + }, + { + "epoch": 1.36, + "learning_rate": 9.657240766134153e-05, + "loss": 0.0144, + "step": 523190 + }, + { + "epoch": 1.36, + "learning_rate": 9.656851944497007e-05, + "loss": 0.0118, + "step": 523200 + }, + { + "epoch": 1.36, + "learning_rate": 9.65646312285986e-05, + "loss": 0.0084, + "step": 523210 + }, + { + "epoch": 1.36, + "learning_rate": 9.656074301222714e-05, + "loss": 0.0104, + "step": 523220 + }, + { + "epoch": 1.36, + "learning_rate": 9.655685479585567e-05, + "loss": 0.0079, + "step": 523230 + }, + { + "epoch": 1.36, + "learning_rate": 9.655296657948421e-05, + "loss": 0.0082, + "step": 523240 + }, + { + "epoch": 1.36, + "learning_rate": 9.654907836311274e-05, + "loss": 0.01, + "step": 523250 + }, + { + "epoch": 1.36, + "learning_rate": 9.654519014674127e-05, + "loss": 0.0106, + "step": 523260 + }, + { + "epoch": 1.36, + "learning_rate": 9.654130193036981e-05, + "loss": 0.0118, + "step": 523270 + }, + { + "epoch": 1.36, + "learning_rate": 9.653741371399834e-05, + "loss": 0.0119, + "step": 523280 + }, + { + "epoch": 1.36, + "learning_rate": 9.653352549762689e-05, + "loss": 0.0075, + "step": 523290 + }, + { + "epoch": 1.36, + "learning_rate": 9.65296372812554e-05, + "loss": 0.0086, + "step": 523300 + }, + { + "epoch": 1.36, + "learning_rate": 9.652574906488396e-05, + "loss": 0.0113, + "step": 523310 + }, + { + "epoch": 1.36, + "learning_rate": 9.652186084851249e-05, + "loss": 0.0095, + "step": 523320 + }, + { + "epoch": 1.36, + "learning_rate": 9.651797263214103e-05, + "loss": 0.0079, + "step": 523330 + }, + { + "epoch": 1.36, + "learning_rate": 9.651408441576956e-05, + "loss": 0.0111, + "step": 523340 + }, + { + "epoch": 1.36, + "learning_rate": 9.65101961993981e-05, + "loss": 0.0094, + "step": 523350 + }, + { + "epoch": 1.36, + "learning_rate": 9.650630798302663e-05, + "loss": 0.0082, + "step": 523360 + }, + { + "epoch": 1.36, + "learning_rate": 9.650241976665517e-05, + "loss": 0.0089, + "step": 523370 + }, + { + "epoch": 1.36, + "learning_rate": 9.64985315502837e-05, + "loss": 0.0089, + "step": 523380 + }, + { + "epoch": 1.36, + "learning_rate": 9.649464333391224e-05, + "loss": 0.01, + "step": 523390 + }, + { + "epoch": 1.36, + "learning_rate": 9.649075511754077e-05, + "loss": 0.0098, + "step": 523400 + }, + { + "epoch": 1.36, + "learning_rate": 9.648686690116931e-05, + "loss": 0.0101, + "step": 523410 + }, + { + "epoch": 1.36, + "learning_rate": 9.648297868479784e-05, + "loss": 0.0098, + "step": 523420 + }, + { + "epoch": 1.36, + "learning_rate": 9.647909046842638e-05, + "loss": 0.0124, + "step": 523430 + }, + { + "epoch": 1.36, + "learning_rate": 9.647520225205491e-05, + "loss": 0.0118, + "step": 523440 + }, + { + "epoch": 1.36, + "learning_rate": 9.647131403568345e-05, + "loss": 0.0112, + "step": 523450 + }, + { + "epoch": 1.36, + "learning_rate": 9.646742581931198e-05, + "loss": 0.0107, + "step": 523460 + }, + { + "epoch": 1.36, + "learning_rate": 9.646353760294053e-05, + "loss": 0.0103, + "step": 523470 + }, + { + "epoch": 1.36, + "learning_rate": 9.645964938656906e-05, + "loss": 0.0084, + "step": 523480 + }, + { + "epoch": 1.36, + "learning_rate": 9.64557611701976e-05, + "loss": 0.0133, + "step": 523490 + }, + { + "epoch": 1.36, + "learning_rate": 9.645187295382613e-05, + "loss": 0.0104, + "step": 523500 + }, + { + "epoch": 1.36, + "learning_rate": 9.644798473745466e-05, + "loss": 0.0092, + "step": 523510 + }, + { + "epoch": 1.36, + "learning_rate": 9.64440965210832e-05, + "loss": 0.0106, + "step": 523520 + }, + { + "epoch": 1.36, + "learning_rate": 9.644020830471173e-05, + "loss": 0.01, + "step": 523530 + }, + { + "epoch": 1.36, + "learning_rate": 9.643632008834027e-05, + "loss": 0.009, + "step": 523540 + }, + { + "epoch": 1.36, + "learning_rate": 9.64324318719688e-05, + "loss": 0.0137, + "step": 523550 + }, + { + "epoch": 1.36, + "learning_rate": 9.642854365559734e-05, + "loss": 0.0076, + "step": 523560 + }, + { + "epoch": 1.36, + "learning_rate": 9.642465543922587e-05, + "loss": 0.0084, + "step": 523570 + }, + { + "epoch": 1.36, + "learning_rate": 9.642076722285441e-05, + "loss": 0.0126, + "step": 523580 + }, + { + "epoch": 1.36, + "learning_rate": 9.641687900648294e-05, + "loss": 0.0102, + "step": 523590 + }, + { + "epoch": 1.36, + "learning_rate": 9.641299079011148e-05, + "loss": 0.0083, + "step": 523600 + }, + { + "epoch": 1.36, + "learning_rate": 9.640910257374001e-05, + "loss": 0.0084, + "step": 523610 + }, + { + "epoch": 1.36, + "learning_rate": 9.640521435736855e-05, + "loss": 0.0107, + "step": 523620 + }, + { + "epoch": 1.36, + "learning_rate": 9.640132614099708e-05, + "loss": 0.0083, + "step": 523630 + }, + { + "epoch": 1.36, + "learning_rate": 9.639743792462563e-05, + "loss": 0.0115, + "step": 523640 + }, + { + "epoch": 1.36, + "learning_rate": 9.639354970825416e-05, + "loss": 0.0115, + "step": 523650 + }, + { + "epoch": 1.36, + "learning_rate": 9.63896614918827e-05, + "loss": 0.0108, + "step": 523660 + }, + { + "epoch": 1.36, + "learning_rate": 9.638577327551123e-05, + "loss": 0.0084, + "step": 523670 + }, + { + "epoch": 1.36, + "learning_rate": 9.638188505913977e-05, + "loss": 0.0083, + "step": 523680 + }, + { + "epoch": 1.36, + "learning_rate": 9.63779968427683e-05, + "loss": 0.0123, + "step": 523690 + }, + { + "epoch": 1.36, + "learning_rate": 9.637410862639684e-05, + "loss": 0.0095, + "step": 523700 + }, + { + "epoch": 1.36, + "learning_rate": 9.637022041002537e-05, + "loss": 0.0083, + "step": 523710 + }, + { + "epoch": 1.36, + "learning_rate": 9.636633219365391e-05, + "loss": 0.0109, + "step": 523720 + }, + { + "epoch": 1.36, + "learning_rate": 9.636244397728244e-05, + "loss": 0.0115, + "step": 523730 + }, + { + "epoch": 1.36, + "learning_rate": 9.635855576091098e-05, + "loss": 0.0106, + "step": 523740 + }, + { + "epoch": 1.36, + "learning_rate": 9.635466754453951e-05, + "loss": 0.0089, + "step": 523750 + }, + { + "epoch": 1.36, + "learning_rate": 9.635077932816804e-05, + "loss": 0.015, + "step": 523760 + }, + { + "epoch": 1.36, + "learning_rate": 9.634689111179658e-05, + "loss": 0.0094, + "step": 523770 + }, + { + "epoch": 1.36, + "learning_rate": 9.63430028954251e-05, + "loss": 0.01, + "step": 523780 + }, + { + "epoch": 1.36, + "learning_rate": 9.633911467905365e-05, + "loss": 0.0069, + "step": 523790 + }, + { + "epoch": 1.36, + "learning_rate": 9.633522646268218e-05, + "loss": 0.0089, + "step": 523800 + }, + { + "epoch": 1.36, + "learning_rate": 9.633133824631072e-05, + "loss": 0.0095, + "step": 523810 + }, + { + "epoch": 1.36, + "learning_rate": 9.632745002993925e-05, + "loss": 0.009, + "step": 523820 + }, + { + "epoch": 1.36, + "learning_rate": 9.63235618135678e-05, + "loss": 0.0146, + "step": 523830 + }, + { + "epoch": 1.36, + "learning_rate": 9.631967359719633e-05, + "loss": 0.0115, + "step": 523840 + }, + { + "epoch": 1.36, + "learning_rate": 9.631578538082487e-05, + "loss": 0.0079, + "step": 523850 + }, + { + "epoch": 1.36, + "learning_rate": 9.63118971644534e-05, + "loss": 0.01, + "step": 523860 + }, + { + "epoch": 1.36, + "learning_rate": 9.630800894808194e-05, + "loss": 0.0111, + "step": 523870 + }, + { + "epoch": 1.36, + "learning_rate": 9.630412073171047e-05, + "loss": 0.0169, + "step": 523880 + }, + { + "epoch": 1.36, + "learning_rate": 9.630023251533901e-05, + "loss": 0.0085, + "step": 523890 + }, + { + "epoch": 1.36, + "learning_rate": 9.629634429896754e-05, + "loss": 0.0101, + "step": 523900 + }, + { + "epoch": 1.36, + "learning_rate": 9.629245608259608e-05, + "loss": 0.0102, + "step": 523910 + }, + { + "epoch": 1.36, + "learning_rate": 9.628856786622461e-05, + "loss": 0.011, + "step": 523920 + }, + { + "epoch": 1.36, + "learning_rate": 9.628467964985315e-05, + "loss": 0.0115, + "step": 523930 + }, + { + "epoch": 1.36, + "learning_rate": 9.628079143348168e-05, + "loss": 0.0114, + "step": 523940 + }, + { + "epoch": 1.36, + "learning_rate": 9.627690321711022e-05, + "loss": 0.0097, + "step": 523950 + }, + { + "epoch": 1.36, + "learning_rate": 9.627301500073875e-05, + "loss": 0.0102, + "step": 523960 + }, + { + "epoch": 1.36, + "learning_rate": 9.626912678436729e-05, + "loss": 0.0087, + "step": 523970 + }, + { + "epoch": 1.36, + "learning_rate": 9.626523856799582e-05, + "loss": 0.0099, + "step": 523980 + }, + { + "epoch": 1.36, + "learning_rate": 9.626135035162437e-05, + "loss": 0.009, + "step": 523990 + }, + { + "epoch": 1.36, + "learning_rate": 9.62574621352529e-05, + "loss": 0.0124, + "step": 524000 + }, + { + "epoch": 1.36, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.0065029398538172245, + "eval_runtime": 107.8132, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, + "step": 524000 + }, + { + "epoch": 1.36, + "learning_rate": 9.625357391888141e-05, + "loss": 0.008, + "step": 524010 + }, + { + "epoch": 1.36, + "learning_rate": 9.624968570250997e-05, + "loss": 0.0115, + "step": 524020 + }, + { + "epoch": 1.36, + "learning_rate": 9.62457974861385e-05, + "loss": 0.011, + "step": 524030 + }, + { + "epoch": 1.36, + "learning_rate": 9.624190926976704e-05, + "loss": 0.0105, + "step": 524040 + }, + { + "epoch": 1.36, + "learning_rate": 9.623802105339557e-05, + "loss": 0.0124, + "step": 524050 + }, + { + "epoch": 1.36, + "learning_rate": 9.623413283702411e-05, + "loss": 0.0074, + "step": 524060 + }, + { + "epoch": 1.36, + "learning_rate": 9.623024462065264e-05, + "loss": 0.0106, + "step": 524070 + }, + { + "epoch": 1.36, + "learning_rate": 9.622635640428118e-05, + "loss": 0.0089, + "step": 524080 + }, + { + "epoch": 1.36, + "learning_rate": 9.622246818790971e-05, + "loss": 0.0102, + "step": 524090 + }, + { + "epoch": 1.36, + "learning_rate": 9.621857997153825e-05, + "loss": 0.0116, + "step": 524100 + }, + { + "epoch": 1.36, + "learning_rate": 9.621469175516678e-05, + "loss": 0.0088, + "step": 524110 + }, + { + "epoch": 1.36, + "learning_rate": 9.621080353879532e-05, + "loss": 0.0091, + "step": 524120 + }, + { + "epoch": 1.36, + "learning_rate": 9.620691532242385e-05, + "loss": 0.0087, + "step": 524130 + }, + { + "epoch": 1.36, + "learning_rate": 9.620302710605239e-05, + "loss": 0.0092, + "step": 524140 + }, + { + "epoch": 1.36, + "learning_rate": 9.619913888968092e-05, + "loss": 0.009, + "step": 524150 + }, + { + "epoch": 1.36, + "learning_rate": 9.619525067330947e-05, + "loss": 0.0112, + "step": 524160 + }, + { + "epoch": 1.36, + "learning_rate": 9.619136245693799e-05, + "loss": 0.0094, + "step": 524170 + }, + { + "epoch": 1.36, + "learning_rate": 9.618747424056654e-05, + "loss": 0.0166, + "step": 524180 + }, + { + "epoch": 1.36, + "learning_rate": 9.618358602419507e-05, + "loss": 0.0093, + "step": 524190 + }, + { + "epoch": 1.36, + "learning_rate": 9.617969780782361e-05, + "loss": 0.0117, + "step": 524200 + }, + { + "epoch": 1.36, + "learning_rate": 9.617580959145214e-05, + "loss": 0.009, + "step": 524210 + }, + { + "epoch": 1.36, + "learning_rate": 9.617192137508068e-05, + "loss": 0.008, + "step": 524220 + }, + { + "epoch": 1.36, + "learning_rate": 9.616803315870921e-05, + "loss": 0.0106, + "step": 524230 + }, + { + "epoch": 1.36, + "learning_rate": 9.616414494233775e-05, + "loss": 0.009, + "step": 524240 + }, + { + "epoch": 1.36, + "learning_rate": 9.616025672596628e-05, + "loss": 0.0082, + "step": 524250 + }, + { + "epoch": 1.36, + "learning_rate": 9.61563685095948e-05, + "loss": 0.0084, + "step": 524260 + }, + { + "epoch": 1.36, + "learning_rate": 9.615248029322335e-05, + "loss": 0.0099, + "step": 524270 + }, + { + "epoch": 1.36, + "learning_rate": 9.614859207685188e-05, + "loss": 0.0094, + "step": 524280 + }, + { + "epoch": 1.36, + "learning_rate": 9.614470386048042e-05, + "loss": 0.0128, + "step": 524290 + }, + { + "epoch": 1.36, + "learning_rate": 9.614081564410895e-05, + "loss": 0.0093, + "step": 524300 + }, + { + "epoch": 1.36, + "learning_rate": 9.613692742773749e-05, + "loss": 0.0134, + "step": 524310 + }, + { + "epoch": 1.36, + "learning_rate": 9.613303921136602e-05, + "loss": 0.0103, + "step": 524320 + }, + { + "epoch": 1.36, + "learning_rate": 9.612915099499456e-05, + "loss": 0.0085, + "step": 524330 + }, + { + "epoch": 1.36, + "learning_rate": 9.612526277862309e-05, + "loss": 0.0076, + "step": 524340 + }, + { + "epoch": 1.36, + "learning_rate": 9.612137456225164e-05, + "loss": 0.0085, + "step": 524350 + }, + { + "epoch": 1.36, + "learning_rate": 9.611748634588017e-05, + "loss": 0.0083, + "step": 524360 + }, + { + "epoch": 1.36, + "learning_rate": 9.611359812950871e-05, + "loss": 0.0131, + "step": 524370 + }, + { + "epoch": 1.36, + "learning_rate": 9.610970991313724e-05, + "loss": 0.0116, + "step": 524380 + }, + { + "epoch": 1.36, + "learning_rate": 9.610582169676578e-05, + "loss": 0.0094, + "step": 524390 + }, + { + "epoch": 1.36, + "learning_rate": 9.610193348039431e-05, + "loss": 0.0072, + "step": 524400 + }, + { + "epoch": 1.36, + "learning_rate": 9.609804526402285e-05, + "loss": 0.0103, + "step": 524410 + }, + { + "epoch": 1.36, + "learning_rate": 9.609415704765138e-05, + "loss": 0.0112, + "step": 524420 + }, + { + "epoch": 1.36, + "learning_rate": 9.609026883127992e-05, + "loss": 0.0097, + "step": 524430 + }, + { + "epoch": 1.36, + "learning_rate": 9.608638061490845e-05, + "loss": 0.0097, + "step": 524440 + }, + { + "epoch": 1.36, + "learning_rate": 9.608249239853699e-05, + "loss": 0.0116, + "step": 524450 + }, + { + "epoch": 1.36, + "learning_rate": 9.607860418216552e-05, + "loss": 0.0088, + "step": 524460 + }, + { + "epoch": 1.36, + "learning_rate": 9.607471596579406e-05, + "loss": 0.0081, + "step": 524470 + }, + { + "epoch": 1.36, + "learning_rate": 9.607082774942259e-05, + "loss": 0.0115, + "step": 524480 + }, + { + "epoch": 1.36, + "learning_rate": 9.606693953305113e-05, + "loss": 0.0081, + "step": 524490 + }, + { + "epoch": 1.36, + "learning_rate": 9.606305131667966e-05, + "loss": 0.0107, + "step": 524500 + }, + { + "epoch": 1.36, + "learning_rate": 9.605916310030818e-05, + "loss": 0.0095, + "step": 524510 + }, + { + "epoch": 1.36, + "learning_rate": 9.605527488393674e-05, + "loss": 0.0092, + "step": 524520 + }, + { + "epoch": 1.36, + "learning_rate": 9.605138666756525e-05, + "loss": 0.0081, + "step": 524530 + }, + { + "epoch": 1.36, + "learning_rate": 9.604749845119381e-05, + "loss": 0.009, + "step": 524540 + }, + { + "epoch": 1.36, + "learning_rate": 9.604361023482234e-05, + "loss": 0.0101, + "step": 524550 + }, + { + "epoch": 1.36, + "learning_rate": 9.603972201845088e-05, + "loss": 0.0078, + "step": 524560 + }, + { + "epoch": 1.36, + "learning_rate": 9.603583380207941e-05, + "loss": 0.0097, + "step": 524570 + }, + { + "epoch": 1.36, + "learning_rate": 9.603194558570795e-05, + "loss": 0.0085, + "step": 524580 + }, + { + "epoch": 1.36, + "learning_rate": 9.602805736933648e-05, + "loss": 0.0094, + "step": 524590 + }, + { + "epoch": 1.36, + "learning_rate": 9.602416915296502e-05, + "loss": 0.0092, + "step": 524600 + }, + { + "epoch": 1.36, + "learning_rate": 9.602028093659355e-05, + "loss": 0.0077, + "step": 524610 + }, + { + "epoch": 1.36, + "learning_rate": 9.601639272022209e-05, + "loss": 0.0094, + "step": 524620 + }, + { + "epoch": 1.36, + "learning_rate": 9.601250450385062e-05, + "loss": 0.0106, + "step": 524630 + }, + { + "epoch": 1.36, + "learning_rate": 9.600861628747916e-05, + "loss": 0.0088, + "step": 524640 + }, + { + "epoch": 1.36, + "learning_rate": 9.600472807110769e-05, + "loss": 0.0105, + "step": 524650 + }, + { + "epoch": 1.36, + "learning_rate": 9.600083985473623e-05, + "loss": 0.0263, + "step": 524660 + }, + { + "epoch": 1.36, + "learning_rate": 9.599695163836476e-05, + "loss": 0.0128, + "step": 524670 + }, + { + "epoch": 1.36, + "learning_rate": 9.599306342199331e-05, + "loss": 0.0088, + "step": 524680 + }, + { + "epoch": 1.36, + "learning_rate": 9.598917520562183e-05, + "loss": 0.0117, + "step": 524690 + }, + { + "epoch": 1.36, + "learning_rate": 9.598528698925038e-05, + "loss": 0.0122, + "step": 524700 + }, + { + "epoch": 1.36, + "learning_rate": 9.598139877287891e-05, + "loss": 0.0097, + "step": 524710 + }, + { + "epoch": 1.36, + "learning_rate": 9.597751055650745e-05, + "loss": 0.0121, + "step": 524720 + }, + { + "epoch": 1.36, + "learning_rate": 9.597362234013598e-05, + "loss": 0.0101, + "step": 524730 + }, + { + "epoch": 1.36, + "learning_rate": 9.596973412376452e-05, + "loss": 0.0099, + "step": 524740 + }, + { + "epoch": 1.36, + "learning_rate": 9.596584590739305e-05, + "loss": 0.0097, + "step": 524750 + }, + { + "epoch": 1.36, + "learning_rate": 9.596195769102158e-05, + "loss": 0.0072, + "step": 524760 + }, + { + "epoch": 1.36, + "learning_rate": 9.595806947465012e-05, + "loss": 0.0074, + "step": 524770 + }, + { + "epoch": 1.36, + "learning_rate": 9.595418125827865e-05, + "loss": 0.01, + "step": 524780 + }, + { + "epoch": 1.36, + "learning_rate": 9.595029304190719e-05, + "loss": 0.0087, + "step": 524790 + }, + { + "epoch": 1.36, + "learning_rate": 9.594640482553572e-05, + "loss": 0.0099, + "step": 524800 + }, + { + "epoch": 1.36, + "learning_rate": 9.594251660916426e-05, + "loss": 0.0094, + "step": 524810 + }, + { + "epoch": 1.36, + "learning_rate": 9.593862839279279e-05, + "loss": 0.0104, + "step": 524820 + }, + { + "epoch": 1.36, + "learning_rate": 9.593474017642133e-05, + "loss": 0.0111, + "step": 524830 + }, + { + "epoch": 1.36, + "learning_rate": 9.593085196004986e-05, + "loss": 0.014, + "step": 524840 + }, + { + "epoch": 1.36, + "learning_rate": 9.59269637436784e-05, + "loss": 0.0079, + "step": 524850 + }, + { + "epoch": 1.36, + "learning_rate": 9.592307552730693e-05, + "loss": 0.0124, + "step": 524860 + }, + { + "epoch": 1.36, + "learning_rate": 9.591918731093548e-05, + "loss": 0.0084, + "step": 524870 + }, + { + "epoch": 1.36, + "learning_rate": 9.591529909456401e-05, + "loss": 0.0076, + "step": 524880 + }, + { + "epoch": 1.36, + "learning_rate": 9.591141087819255e-05, + "loss": 0.0081, + "step": 524890 + }, + { + "epoch": 1.36, + "learning_rate": 9.590752266182108e-05, + "loss": 0.0091, + "step": 524900 + }, + { + "epoch": 1.36, + "learning_rate": 9.590363444544962e-05, + "loss": 0.0108, + "step": 524910 + }, + { + "epoch": 1.36, + "learning_rate": 9.589974622907815e-05, + "loss": 0.0093, + "step": 524920 + }, + { + "epoch": 1.36, + "learning_rate": 9.589585801270669e-05, + "loss": 0.0114, + "step": 524930 + }, + { + "epoch": 1.36, + "learning_rate": 9.589196979633522e-05, + "loss": 0.0095, + "step": 524940 + }, + { + "epoch": 1.36, + "learning_rate": 9.588808157996376e-05, + "loss": 0.0115, + "step": 524950 + }, + { + "epoch": 1.36, + "learning_rate": 9.588419336359229e-05, + "loss": 0.0082, + "step": 524960 + }, + { + "epoch": 1.36, + "learning_rate": 9.588030514722083e-05, + "loss": 0.0116, + "step": 524970 + }, + { + "epoch": 1.36, + "learning_rate": 9.587641693084936e-05, + "loss": 0.009, + "step": 524980 + }, + { + "epoch": 1.36, + "learning_rate": 9.58725287144779e-05, + "loss": 0.0093, + "step": 524990 + }, + { + "epoch": 1.36, + "learning_rate": 9.586864049810643e-05, + "loss": 0.0099, + "step": 525000 + }, + { + "epoch": 1.36, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.006309923715889454, + "eval_runtime": 107.932, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, + "step": 525000 + }, + { + "epoch": 1.36, + "learning_rate": 9.586475228173496e-05, + "loss": 0.0128, + "step": 525010 + }, + { + "epoch": 1.36, + "learning_rate": 9.58608640653635e-05, + "loss": 0.0118, + "step": 525020 + }, + { + "epoch": 1.36, + "learning_rate": 9.585697584899202e-05, + "loss": 0.0076, + "step": 525030 + }, + { + "epoch": 1.36, + "learning_rate": 9.585308763262057e-05, + "loss": 0.0097, + "step": 525040 + }, + { + "epoch": 1.36, + "learning_rate": 9.58491994162491e-05, + "loss": 0.0079, + "step": 525050 + }, + { + "epoch": 1.36, + "learning_rate": 9.584531119987765e-05, + "loss": 0.0098, + "step": 525060 + }, + { + "epoch": 1.36, + "learning_rate": 9.584142298350618e-05, + "loss": 0.0138, + "step": 525070 + }, + { + "epoch": 1.36, + "learning_rate": 9.583753476713472e-05, + "loss": 0.009, + "step": 525080 + }, + { + "epoch": 1.36, + "learning_rate": 9.583364655076325e-05, + "loss": 0.0115, + "step": 525090 + }, + { + "epoch": 1.36, + "learning_rate": 9.582975833439179e-05, + "loss": 0.0106, + "step": 525100 + }, + { + "epoch": 1.36, + "learning_rate": 9.582587011802032e-05, + "loss": 0.0104, + "step": 525110 + }, + { + "epoch": 1.36, + "learning_rate": 9.582198190164886e-05, + "loss": 0.0082, + "step": 525120 + }, + { + "epoch": 1.36, + "learning_rate": 9.581809368527739e-05, + "loss": 0.01, + "step": 525130 + }, + { + "epoch": 1.36, + "learning_rate": 9.581420546890593e-05, + "loss": 0.0075, + "step": 525140 + }, + { + "epoch": 1.36, + "learning_rate": 9.581031725253446e-05, + "loss": 0.009, + "step": 525150 + }, + { + "epoch": 1.36, + "learning_rate": 9.5806429036163e-05, + "loss": 0.0097, + "step": 525160 + }, + { + "epoch": 1.36, + "learning_rate": 9.580254081979153e-05, + "loss": 0.0118, + "step": 525170 + }, + { + "epoch": 1.36, + "learning_rate": 9.579865260342007e-05, + "loss": 0.0112, + "step": 525180 + }, + { + "epoch": 1.36, + "learning_rate": 9.57947643870486e-05, + "loss": 0.0092, + "step": 525190 + }, + { + "epoch": 1.36, + "learning_rate": 9.579087617067714e-05, + "loss": 0.0077, + "step": 525200 + }, + { + "epoch": 1.36, + "learning_rate": 9.578698795430567e-05, + "loss": 0.0088, + "step": 525210 + }, + { + "epoch": 1.36, + "learning_rate": 9.578309973793422e-05, + "loss": 0.0094, + "step": 525220 + }, + { + "epoch": 1.36, + "learning_rate": 9.577921152156275e-05, + "loss": 0.0113, + "step": 525230 + }, + { + "epoch": 1.36, + "learning_rate": 9.577532330519129e-05, + "loss": 0.0096, + "step": 525240 + }, + { + "epoch": 1.36, + "learning_rate": 9.577143508881982e-05, + "loss": 0.0087, + "step": 525250 + }, + { + "epoch": 1.36, + "learning_rate": 9.576754687244835e-05, + "loss": 0.012, + "step": 525260 + }, + { + "epoch": 1.36, + "learning_rate": 9.576365865607689e-05, + "loss": 0.0097, + "step": 525270 + }, + { + "epoch": 1.36, + "learning_rate": 9.575977043970542e-05, + "loss": 0.0148, + "step": 525280 + }, + { + "epoch": 1.36, + "learning_rate": 9.575588222333396e-05, + "loss": 0.0098, + "step": 525290 + }, + { + "epoch": 1.36, + "learning_rate": 9.575199400696249e-05, + "loss": 0.0113, + "step": 525300 + }, + { + "epoch": 1.36, + "learning_rate": 9.574810579059103e-05, + "loss": 0.0109, + "step": 525310 + }, + { + "epoch": 1.36, + "learning_rate": 9.574421757421956e-05, + "loss": 0.0079, + "step": 525320 + }, + { + "epoch": 1.36, + "learning_rate": 9.57403293578481e-05, + "loss": 0.0103, + "step": 525330 + }, + { + "epoch": 1.36, + "learning_rate": 9.573644114147663e-05, + "loss": 0.0094, + "step": 525340 + }, + { + "epoch": 1.36, + "learning_rate": 9.573255292510517e-05, + "loss": 0.0074, + "step": 525350 + }, + { + "epoch": 1.36, + "learning_rate": 9.57286647087337e-05, + "loss": 0.0089, + "step": 525360 + }, + { + "epoch": 1.36, + "learning_rate": 9.572477649236224e-05, + "loss": 0.0118, + "step": 525370 + }, + { + "epoch": 1.36, + "learning_rate": 9.572088827599077e-05, + "loss": 0.0101, + "step": 525380 + }, + { + "epoch": 1.36, + "learning_rate": 9.571700005961932e-05, + "loss": 0.0127, + "step": 525390 + }, + { + "epoch": 1.36, + "learning_rate": 9.571311184324784e-05, + "loss": 0.0091, + "step": 525400 + }, + { + "epoch": 1.36, + "learning_rate": 9.570922362687639e-05, + "loss": 0.0113, + "step": 525410 + }, + { + "epoch": 1.36, + "learning_rate": 9.570533541050492e-05, + "loss": 0.0085, + "step": 525420 + }, + { + "epoch": 1.36, + "learning_rate": 9.570144719413346e-05, + "loss": 0.0119, + "step": 525430 + }, + { + "epoch": 1.36, + "learning_rate": 9.569755897776199e-05, + "loss": 0.0109, + "step": 525440 + }, + { + "epoch": 1.36, + "learning_rate": 9.569367076139053e-05, + "loss": 0.0139, + "step": 525450 + }, + { + "epoch": 1.36, + "learning_rate": 9.568978254501906e-05, + "loss": 0.0092, + "step": 525460 + }, + { + "epoch": 1.36, + "learning_rate": 9.56858943286476e-05, + "loss": 0.02, + "step": 525470 + }, + { + "epoch": 1.36, + "learning_rate": 9.568200611227613e-05, + "loss": 0.009, + "step": 525480 + }, + { + "epoch": 1.36, + "learning_rate": 9.567811789590466e-05, + "loss": 0.0084, + "step": 525490 + }, + { + "epoch": 1.36, + "learning_rate": 9.56742296795332e-05, + "loss": 0.0091, + "step": 525500 + }, + { + "epoch": 1.36, + "learning_rate": 9.567034146316173e-05, + "loss": 0.0091, + "step": 525510 + }, + { + "epoch": 1.36, + "learning_rate": 9.566645324679027e-05, + "loss": 0.0119, + "step": 525520 + }, + { + "epoch": 1.36, + "learning_rate": 9.56625650304188e-05, + "loss": 0.0087, + "step": 525530 + }, + { + "epoch": 1.36, + "learning_rate": 9.565867681404734e-05, + "loss": 0.0089, + "step": 525540 + }, + { + "epoch": 1.36, + "learning_rate": 9.565478859767586e-05, + "loss": 0.0093, + "step": 525550 + }, + { + "epoch": 1.36, + "learning_rate": 9.56509003813044e-05, + "loss": 0.0095, + "step": 525560 + }, + { + "epoch": 1.36, + "learning_rate": 9.564701216493293e-05, + "loss": 0.0107, + "step": 525570 + }, + { + "epoch": 1.36, + "learning_rate": 9.564312394856149e-05, + "loss": 0.0092, + "step": 525580 + }, + { + "epoch": 1.36, + "learning_rate": 9.563923573219002e-05, + "loss": 0.0075, + "step": 525590 + }, + { + "epoch": 1.36, + "learning_rate": 9.563534751581856e-05, + "loss": 0.014, + "step": 525600 + }, + { + "epoch": 1.36, + "learning_rate": 9.563145929944709e-05, + "loss": 0.008, + "step": 525610 + }, + { + "epoch": 1.36, + "learning_rate": 9.562757108307563e-05, + "loss": 0.0108, + "step": 525620 + }, + { + "epoch": 1.36, + "learning_rate": 9.562368286670416e-05, + "loss": 0.009, + "step": 525630 + }, + { + "epoch": 1.36, + "learning_rate": 9.56197946503327e-05, + "loss": 0.0085, + "step": 525640 + }, + { + "epoch": 1.36, + "learning_rate": 9.561590643396123e-05, + "loss": 0.0103, + "step": 525650 + }, + { + "epoch": 1.36, + "learning_rate": 9.561201821758977e-05, + "loss": 0.0078, + "step": 525660 + }, + { + "epoch": 1.36, + "learning_rate": 9.56081300012183e-05, + "loss": 0.0079, + "step": 525670 + }, + { + "epoch": 1.36, + "learning_rate": 9.560424178484684e-05, + "loss": 0.0106, + "step": 525680 + }, + { + "epoch": 1.36, + "learning_rate": 9.560035356847537e-05, + "loss": 0.0093, + "step": 525690 + }, + { + "epoch": 1.36, + "learning_rate": 9.559646535210391e-05, + "loss": 0.0115, + "step": 525700 + }, + { + "epoch": 1.36, + "learning_rate": 9.559257713573244e-05, + "loss": 0.0092, + "step": 525710 + }, + { + "epoch": 1.36, + "learning_rate": 9.558868891936098e-05, + "loss": 0.008, + "step": 525720 + }, + { + "epoch": 1.36, + "learning_rate": 9.55848007029895e-05, + "loss": 0.0146, + "step": 525730 + }, + { + "epoch": 1.36, + "learning_rate": 9.558091248661803e-05, + "loss": 0.0095, + "step": 525740 + }, + { + "epoch": 1.36, + "learning_rate": 9.557702427024659e-05, + "loss": 0.0099, + "step": 525750 + }, + { + "epoch": 1.36, + "learning_rate": 9.55731360538751e-05, + "loss": 0.0096, + "step": 525760 + }, + { + "epoch": 1.36, + "learning_rate": 9.556924783750366e-05, + "loss": 0.0122, + "step": 525770 + }, + { + "epoch": 1.36, + "learning_rate": 9.556535962113219e-05, + "loss": 0.0081, + "step": 525780 + }, + { + "epoch": 1.36, + "learning_rate": 9.556147140476073e-05, + "loss": 0.0084, + "step": 525790 + }, + { + "epoch": 1.36, + "learning_rate": 9.555758318838926e-05, + "loss": 0.0092, + "step": 525800 + }, + { + "epoch": 1.36, + "learning_rate": 9.55536949720178e-05, + "loss": 0.0084, + "step": 525810 + }, + { + "epoch": 1.36, + "learning_rate": 9.554980675564633e-05, + "loss": 0.0071, + "step": 525820 + }, + { + "epoch": 1.36, + "learning_rate": 9.554591853927487e-05, + "loss": 0.0168, + "step": 525830 + }, + { + "epoch": 1.36, + "learning_rate": 9.55420303229034e-05, + "loss": 0.0083, + "step": 525840 + }, + { + "epoch": 1.36, + "learning_rate": 9.553814210653194e-05, + "loss": 0.0093, + "step": 525850 + }, + { + "epoch": 1.36, + "learning_rate": 9.553425389016047e-05, + "loss": 0.0076, + "step": 525860 + }, + { + "epoch": 1.36, + "learning_rate": 9.553036567378901e-05, + "loss": 0.0087, + "step": 525870 + }, + { + "epoch": 1.36, + "learning_rate": 9.552647745741754e-05, + "loss": 0.0095, + "step": 525880 + }, + { + "epoch": 1.36, + "learning_rate": 9.552258924104608e-05, + "loss": 0.0127, + "step": 525890 + }, + { + "epoch": 1.36, + "learning_rate": 9.55187010246746e-05, + "loss": 0.0108, + "step": 525900 + }, + { + "epoch": 1.36, + "learning_rate": 9.551481280830316e-05, + "loss": 0.0089, + "step": 525910 + }, + { + "epoch": 1.36, + "learning_rate": 9.551092459193167e-05, + "loss": 0.0096, + "step": 525920 + }, + { + "epoch": 1.36, + "learning_rate": 9.550703637556023e-05, + "loss": 0.0079, + "step": 525930 + }, + { + "epoch": 1.36, + "learning_rate": 9.550314815918876e-05, + "loss": 0.0096, + "step": 525940 + }, + { + "epoch": 1.36, + "learning_rate": 9.54992599428173e-05, + "loss": 0.0101, + "step": 525950 + }, + { + "epoch": 1.36, + "learning_rate": 9.549537172644583e-05, + "loss": 0.0097, + "step": 525960 + }, + { + "epoch": 1.36, + "learning_rate": 9.549148351007437e-05, + "loss": 0.0079, + "step": 525970 + }, + { + "epoch": 1.36, + "learning_rate": 9.54875952937029e-05, + "loss": 0.0092, + "step": 525980 + }, + { + "epoch": 1.36, + "learning_rate": 9.548370707733143e-05, + "loss": 0.0075, + "step": 525990 + }, + { + "epoch": 1.36, + "learning_rate": 9.547981886095997e-05, + "loss": 0.0104, + "step": 526000 + }, + { + "epoch": 1.36, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.006388062611222267, + "eval_runtime": 107.8148, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.638, + "step": 526000 + }, + { + "epoch": 1.36, + "learning_rate": 9.54759306445885e-05, + "loss": 0.0081, + "step": 526010 + }, + { + "epoch": 1.36, + "learning_rate": 9.547204242821704e-05, + "loss": 0.009, + "step": 526020 + }, + { + "epoch": 1.36, + "learning_rate": 9.546815421184557e-05, + "loss": 0.0082, + "step": 526030 + }, + { + "epoch": 1.36, + "learning_rate": 9.546426599547411e-05, + "loss": 0.0087, + "step": 526040 + }, + { + "epoch": 1.36, + "learning_rate": 9.546037777910263e-05, + "loss": 0.0113, + "step": 526050 + }, + { + "epoch": 1.36, + "learning_rate": 9.545648956273118e-05, + "loss": 0.0105, + "step": 526060 + }, + { + "epoch": 1.36, + "learning_rate": 9.54526013463597e-05, + "loss": 0.0082, + "step": 526070 + }, + { + "epoch": 1.36, + "learning_rate": 9.544871312998825e-05, + "loss": 0.0066, + "step": 526080 + }, + { + "epoch": 1.36, + "learning_rate": 9.544482491361677e-05, + "loss": 0.0095, + "step": 526090 + }, + { + "epoch": 1.36, + "learning_rate": 9.544093669724533e-05, + "loss": 0.0118, + "step": 526100 + }, + { + "epoch": 1.36, + "learning_rate": 9.543704848087386e-05, + "loss": 0.0121, + "step": 526110 + }, + { + "epoch": 1.36, + "learning_rate": 9.54331602645024e-05, + "loss": 0.0086, + "step": 526120 + }, + { + "epoch": 1.36, + "learning_rate": 9.542927204813093e-05, + "loss": 0.0105, + "step": 526130 + }, + { + "epoch": 1.36, + "learning_rate": 9.542538383175947e-05, + "loss": 0.0095, + "step": 526140 + }, + { + "epoch": 1.36, + "learning_rate": 9.5421495615388e-05, + "loss": 0.0111, + "step": 526150 + }, + { + "epoch": 1.36, + "learning_rate": 9.541760739901654e-05, + "loss": 0.0116, + "step": 526160 + }, + { + "epoch": 1.36, + "learning_rate": 9.541371918264507e-05, + "loss": 0.0102, + "step": 526170 + }, + { + "epoch": 1.36, + "learning_rate": 9.540983096627361e-05, + "loss": 0.0121, + "step": 526180 + }, + { + "epoch": 1.36, + "learning_rate": 9.540594274990214e-05, + "loss": 0.0125, + "step": 526190 + }, + { + "epoch": 1.36, + "learning_rate": 9.540205453353068e-05, + "loss": 0.0096, + "step": 526200 + }, + { + "epoch": 1.36, + "learning_rate": 9.53981663171592e-05, + "loss": 0.0093, + "step": 526210 + }, + { + "epoch": 1.36, + "learning_rate": 9.539427810078775e-05, + "loss": 0.0086, + "step": 526220 + }, + { + "epoch": 1.36, + "learning_rate": 9.539038988441628e-05, + "loss": 0.0089, + "step": 526230 + }, + { + "epoch": 1.36, + "learning_rate": 9.53865016680448e-05, + "loss": 0.0118, + "step": 526240 + }, + { + "epoch": 1.36, + "learning_rate": 9.538261345167335e-05, + "loss": 0.0124, + "step": 526250 + }, + { + "epoch": 1.36, + "learning_rate": 9.537872523530187e-05, + "loss": 0.0074, + "step": 526260 + }, + { + "epoch": 1.36, + "learning_rate": 9.537483701893043e-05, + "loss": 0.0082, + "step": 526270 + }, + { + "epoch": 1.36, + "learning_rate": 9.537094880255894e-05, + "loss": 0.0077, + "step": 526280 + }, + { + "epoch": 1.36, + "learning_rate": 9.53670605861875e-05, + "loss": 0.0068, + "step": 526290 + }, + { + "epoch": 1.36, + "learning_rate": 9.536317236981603e-05, + "loss": 0.0079, + "step": 526300 + }, + { + "epoch": 1.36, + "learning_rate": 9.535928415344457e-05, + "loss": 0.0095, + "step": 526310 + }, + { + "epoch": 1.36, + "learning_rate": 9.53553959370731e-05, + "loss": 0.0082, + "step": 526320 + }, + { + "epoch": 1.36, + "learning_rate": 9.535150772070164e-05, + "loss": 0.0101, + "step": 526330 + }, + { + "epoch": 1.36, + "learning_rate": 9.534761950433017e-05, + "loss": 0.0093, + "step": 526340 + }, + { + "epoch": 1.36, + "learning_rate": 9.534373128795871e-05, + "loss": 0.0114, + "step": 526350 + }, + { + "epoch": 1.36, + "learning_rate": 9.533984307158724e-05, + "loss": 0.0131, + "step": 526360 + }, + { + "epoch": 1.36, + "learning_rate": 9.533595485521578e-05, + "loss": 0.0092, + "step": 526370 + }, + { + "epoch": 1.36, + "learning_rate": 9.53320666388443e-05, + "loss": 0.0098, + "step": 526380 + }, + { + "epoch": 1.36, + "learning_rate": 9.532817842247285e-05, + "loss": 0.0081, + "step": 526390 + }, + { + "epoch": 1.36, + "learning_rate": 9.532429020610138e-05, + "loss": 0.0105, + "step": 526400 + }, + { + "epoch": 1.36, + "learning_rate": 9.532040198972992e-05, + "loss": 0.0106, + "step": 526410 + }, + { + "epoch": 1.36, + "learning_rate": 9.531651377335845e-05, + "loss": 0.013, + "step": 526420 + }, + { + "epoch": 1.36, + "learning_rate": 9.531262555698699e-05, + "loss": 0.0071, + "step": 526430 + }, + { + "epoch": 1.36, + "learning_rate": 9.530873734061551e-05, + "loss": 0.008, + "step": 526440 + }, + { + "epoch": 1.36, + "learning_rate": 9.530484912424407e-05, + "loss": 0.0064, + "step": 526450 + }, + { + "epoch": 1.36, + "learning_rate": 9.53009609078726e-05, + "loss": 0.0119, + "step": 526460 + }, + { + "epoch": 1.36, + "learning_rate": 9.529707269150114e-05, + "loss": 0.0142, + "step": 526470 + }, + { + "epoch": 1.36, + "learning_rate": 9.529318447512967e-05, + "loss": 0.0112, + "step": 526480 + }, + { + "epoch": 1.36, + "learning_rate": 9.52892962587582e-05, + "loss": 0.0096, + "step": 526490 + }, + { + "epoch": 1.36, + "learning_rate": 9.528540804238674e-05, + "loss": 0.0108, + "step": 526500 + }, + { + "epoch": 1.36, + "learning_rate": 9.528151982601527e-05, + "loss": 0.009, + "step": 526510 + }, + { + "epoch": 1.36, + "learning_rate": 9.527763160964381e-05, + "loss": 0.0115, + "step": 526520 + }, + { + "epoch": 1.36, + "learning_rate": 9.527374339327234e-05, + "loss": 0.0099, + "step": 526530 + }, + { + "epoch": 1.36, + "learning_rate": 9.526985517690088e-05, + "loss": 0.0087, + "step": 526540 + }, + { + "epoch": 1.36, + "learning_rate": 9.52659669605294e-05, + "loss": 0.0097, + "step": 526550 + }, + { + "epoch": 1.36, + "learning_rate": 9.526207874415795e-05, + "loss": 0.0114, + "step": 526560 + }, + { + "epoch": 1.36, + "learning_rate": 9.525819052778647e-05, + "loss": 0.0099, + "step": 526570 + }, + { + "epoch": 1.36, + "learning_rate": 9.525430231141502e-05, + "loss": 0.0098, + "step": 526580 + }, + { + "epoch": 1.36, + "learning_rate": 9.525041409504354e-05, + "loss": 0.0104, + "step": 526590 + }, + { + "epoch": 1.37, + "learning_rate": 9.524652587867209e-05, + "loss": 0.0086, + "step": 526600 + }, + { + "epoch": 1.37, + "learning_rate": 9.524263766230061e-05, + "loss": 0.0085, + "step": 526610 + }, + { + "epoch": 1.37, + "learning_rate": 9.523874944592917e-05, + "loss": 0.0092, + "step": 526620 + }, + { + "epoch": 1.37, + "learning_rate": 9.523486122955768e-05, + "loss": 0.01, + "step": 526630 + }, + { + "epoch": 1.37, + "learning_rate": 9.523097301318624e-05, + "loss": 0.0107, + "step": 526640 + }, + { + "epoch": 1.37, + "learning_rate": 9.522708479681477e-05, + "loss": 0.0101, + "step": 526650 + }, + { + "epoch": 1.37, + "learning_rate": 9.522319658044331e-05, + "loss": 0.0062, + "step": 526660 + }, + { + "epoch": 1.37, + "learning_rate": 9.521930836407184e-05, + "loss": 0.0072, + "step": 526670 + }, + { + "epoch": 1.37, + "learning_rate": 9.521542014770038e-05, + "loss": 0.0093, + "step": 526680 + }, + { + "epoch": 1.37, + "learning_rate": 9.52115319313289e-05, + "loss": 0.0078, + "step": 526690 + }, + { + "epoch": 1.37, + "learning_rate": 9.520764371495745e-05, + "loss": 0.0101, + "step": 526700 + }, + { + "epoch": 1.37, + "learning_rate": 9.520375549858598e-05, + "loss": 0.0097, + "step": 526710 + }, + { + "epoch": 1.37, + "learning_rate": 9.519986728221452e-05, + "loss": 0.0097, + "step": 526720 + }, + { + "epoch": 1.37, + "learning_rate": 9.519597906584305e-05, + "loss": 0.0082, + "step": 526730 + }, + { + "epoch": 1.37, + "learning_rate": 9.519209084947157e-05, + "loss": 0.0124, + "step": 526740 + }, + { + "epoch": 1.37, + "learning_rate": 9.518820263310012e-05, + "loss": 0.0104, + "step": 526750 + }, + { + "epoch": 1.37, + "learning_rate": 9.518431441672864e-05, + "loss": 0.0093, + "step": 526760 + }, + { + "epoch": 1.37, + "learning_rate": 9.518042620035719e-05, + "loss": 0.0113, + "step": 526770 + }, + { + "epoch": 1.37, + "learning_rate": 9.517653798398571e-05, + "loss": 0.0098, + "step": 526780 + }, + { + "epoch": 1.37, + "learning_rate": 9.517264976761426e-05, + "loss": 0.0099, + "step": 526790 + }, + { + "epoch": 1.37, + "learning_rate": 9.516876155124278e-05, + "loss": 0.0111, + "step": 526800 + }, + { + "epoch": 1.37, + "learning_rate": 9.516487333487134e-05, + "loss": 0.0102, + "step": 526810 + }, + { + "epoch": 1.37, + "learning_rate": 9.516098511849987e-05, + "loss": 0.0077, + "step": 526820 + }, + { + "epoch": 1.37, + "learning_rate": 9.515709690212841e-05, + "loss": 0.0098, + "step": 526830 + }, + { + "epoch": 1.37, + "learning_rate": 9.515320868575694e-05, + "loss": 0.0125, + "step": 526840 + }, + { + "epoch": 1.37, + "learning_rate": 9.514932046938548e-05, + "loss": 0.0081, + "step": 526850 + }, + { + "epoch": 1.37, + "learning_rate": 9.5145432253014e-05, + "loss": 0.0095, + "step": 526860 + }, + { + "epoch": 1.37, + "learning_rate": 9.514154403664255e-05, + "loss": 0.0098, + "step": 526870 + }, + { + "epoch": 1.37, + "learning_rate": 9.513765582027108e-05, + "loss": 0.0078, + "step": 526880 + }, + { + "epoch": 1.37, + "learning_rate": 9.513376760389962e-05, + "loss": 0.0105, + "step": 526890 + }, + { + "epoch": 1.37, + "learning_rate": 9.512987938752815e-05, + "loss": 0.0104, + "step": 526900 + }, + { + "epoch": 1.37, + "learning_rate": 9.512599117115669e-05, + "loss": 0.0092, + "step": 526910 + }, + { + "epoch": 1.37, + "learning_rate": 9.512210295478522e-05, + "loss": 0.0068, + "step": 526920 + }, + { + "epoch": 1.37, + "learning_rate": 9.511821473841376e-05, + "loss": 0.0085, + "step": 526930 + }, + { + "epoch": 1.37, + "learning_rate": 9.511432652204229e-05, + "loss": 0.01, + "step": 526940 + }, + { + "epoch": 1.37, + "learning_rate": 9.511043830567083e-05, + "loss": 0.0095, + "step": 526950 + }, + { + "epoch": 1.37, + "learning_rate": 9.510655008929935e-05, + "loss": 0.0105, + "step": 526960 + }, + { + "epoch": 1.37, + "learning_rate": 9.510266187292791e-05, + "loss": 0.0123, + "step": 526970 + }, + { + "epoch": 1.37, + "learning_rate": 9.509877365655644e-05, + "loss": 0.0092, + "step": 526980 + }, + { + "epoch": 1.37, + "learning_rate": 9.509488544018495e-05, + "loss": 0.0066, + "step": 526990 + }, + { + "epoch": 1.37, + "learning_rate": 9.509099722381351e-05, + "loss": 0.0091, + "step": 527000 + }, + { + "epoch": 1.37, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.006512734107673168, + "eval_runtime": 108.0004, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.63, + "step": 527000 + }, + { + "epoch": 1.37, + "learning_rate": 9.508710900744204e-05, + "loss": 0.011, + "step": 527010 + }, + { + "epoch": 1.37, + "learning_rate": 9.508322079107058e-05, + "loss": 0.0086, + "step": 527020 + }, + { + "epoch": 1.37, + "learning_rate": 9.50793325746991e-05, + "loss": 0.0087, + "step": 527030 + }, + { + "epoch": 1.37, + "learning_rate": 9.507544435832765e-05, + "loss": 0.0106, + "step": 527040 + }, + { + "epoch": 1.37, + "learning_rate": 9.507155614195618e-05, + "loss": 0.0102, + "step": 527050 + }, + { + "epoch": 1.37, + "learning_rate": 9.506766792558472e-05, + "loss": 0.0098, + "step": 527060 + }, + { + "epoch": 1.37, + "learning_rate": 9.506377970921325e-05, + "loss": 0.0095, + "step": 527070 + }, + { + "epoch": 1.37, + "learning_rate": 9.505989149284179e-05, + "loss": 0.0102, + "step": 527080 + }, + { + "epoch": 1.37, + "learning_rate": 9.505600327647031e-05, + "loss": 0.0102, + "step": 527090 + }, + { + "epoch": 1.37, + "learning_rate": 9.505211506009886e-05, + "loss": 0.008, + "step": 527100 + }, + { + "epoch": 1.37, + "learning_rate": 9.504822684372738e-05, + "loss": 0.0108, + "step": 527110 + }, + { + "epoch": 1.37, + "learning_rate": 9.504433862735593e-05, + "loss": 0.0094, + "step": 527120 + }, + { + "epoch": 1.37, + "learning_rate": 9.504045041098445e-05, + "loss": 0.0128, + "step": 527130 + }, + { + "epoch": 1.37, + "learning_rate": 9.503656219461301e-05, + "loss": 0.0097, + "step": 527140 + }, + { + "epoch": 1.37, + "learning_rate": 9.503267397824152e-05, + "loss": 0.009, + "step": 527150 + }, + { + "epoch": 1.37, + "learning_rate": 9.502878576187008e-05, + "loss": 0.0104, + "step": 527160 + }, + { + "epoch": 1.37, + "learning_rate": 9.502489754549861e-05, + "loss": 0.0093, + "step": 527170 + }, + { + "epoch": 1.37, + "learning_rate": 9.502100932912715e-05, + "loss": 0.0102, + "step": 527180 + }, + { + "epoch": 1.37, + "learning_rate": 9.501712111275568e-05, + "loss": 0.0087, + "step": 527190 + }, + { + "epoch": 1.37, + "learning_rate": 9.501323289638422e-05, + "loss": 0.0111, + "step": 527200 + }, + { + "epoch": 1.37, + "learning_rate": 9.500934468001275e-05, + "loss": 0.008, + "step": 527210 + }, + { + "epoch": 1.37, + "learning_rate": 9.500545646364129e-05, + "loss": 0.0094, + "step": 527220 + }, + { + "epoch": 1.37, + "learning_rate": 9.500156824726982e-05, + "loss": 0.016, + "step": 527230 + }, + { + "epoch": 1.37, + "learning_rate": 9.499768003089834e-05, + "loss": 0.0098, + "step": 527240 + }, + { + "epoch": 1.37, + "learning_rate": 9.499379181452689e-05, + "loss": 0.0098, + "step": 527250 + }, + { + "epoch": 1.37, + "learning_rate": 9.498990359815541e-05, + "loss": 0.0074, + "step": 527260 + }, + { + "epoch": 1.37, + "learning_rate": 9.498601538178396e-05, + "loss": 0.0076, + "step": 527270 + }, + { + "epoch": 1.37, + "learning_rate": 9.498212716541248e-05, + "loss": 0.0096, + "step": 527280 + }, + { + "epoch": 1.37, + "learning_rate": 9.497823894904103e-05, + "loss": 0.0103, + "step": 527290 + }, + { + "epoch": 1.37, + "learning_rate": 9.497435073266955e-05, + "loss": 0.0071, + "step": 527300 + }, + { + "epoch": 1.37, + "learning_rate": 9.49704625162981e-05, + "loss": 0.0095, + "step": 527310 + }, + { + "epoch": 1.37, + "learning_rate": 9.496657429992662e-05, + "loss": 0.0135, + "step": 527320 + }, + { + "epoch": 1.37, + "learning_rate": 9.496268608355518e-05, + "loss": 0.0079, + "step": 527330 + }, + { + "epoch": 1.37, + "learning_rate": 9.49587978671837e-05, + "loss": 0.0075, + "step": 527340 + }, + { + "epoch": 1.37, + "learning_rate": 9.495490965081225e-05, + "loss": 0.011, + "step": 527350 + }, + { + "epoch": 1.37, + "learning_rate": 9.495102143444078e-05, + "loss": 0.0084, + "step": 527360 + }, + { + "epoch": 1.37, + "learning_rate": 9.494713321806932e-05, + "loss": 0.009, + "step": 527370 + }, + { + "epoch": 1.37, + "learning_rate": 9.494324500169785e-05, + "loss": 0.0134, + "step": 527380 + }, + { + "epoch": 1.37, + "learning_rate": 9.493935678532639e-05, + "loss": 0.0125, + "step": 527390 + }, + { + "epoch": 1.37, + "learning_rate": 9.493546856895492e-05, + "loss": 0.0089, + "step": 527400 + }, + { + "epoch": 1.37, + "learning_rate": 9.493158035258346e-05, + "loss": 0.0094, + "step": 527410 + }, + { + "epoch": 1.37, + "learning_rate": 9.492769213621199e-05, + "loss": 0.0127, + "step": 527420 + }, + { + "epoch": 1.37, + "learning_rate": 9.492380391984053e-05, + "loss": 0.0083, + "step": 527430 + }, + { + "epoch": 1.37, + "learning_rate": 9.491991570346906e-05, + "loss": 0.0104, + "step": 527440 + }, + { + "epoch": 1.37, + "learning_rate": 9.49160274870976e-05, + "loss": 0.0114, + "step": 527450 + }, + { + "epoch": 1.37, + "learning_rate": 9.491213927072612e-05, + "loss": 0.0107, + "step": 527460 + }, + { + "epoch": 1.37, + "learning_rate": 9.490825105435467e-05, + "loss": 0.0094, + "step": 527470 + }, + { + "epoch": 1.37, + "learning_rate": 9.49043628379832e-05, + "loss": 0.0081, + "step": 527480 + }, + { + "epoch": 1.37, + "learning_rate": 9.490047462161172e-05, + "loss": 0.0094, + "step": 527490 + }, + { + "epoch": 1.37, + "learning_rate": 9.489658640524028e-05, + "loss": 0.0087, + "step": 527500 + }, + { + "epoch": 1.37, + "learning_rate": 9.489269818886879e-05, + "loss": 0.0139, + "step": 527510 + }, + { + "epoch": 1.37, + "learning_rate": 9.488880997249735e-05, + "loss": 0.0086, + "step": 527520 + }, + { + "epoch": 1.37, + "learning_rate": 9.488492175612588e-05, + "loss": 0.0096, + "step": 527530 + }, + { + "epoch": 1.37, + "learning_rate": 9.488103353975442e-05, + "loss": 0.0074, + "step": 527540 + }, + { + "epoch": 1.37, + "learning_rate": 9.487714532338295e-05, + "loss": 0.0086, + "step": 527550 + }, + { + "epoch": 1.37, + "learning_rate": 9.487325710701149e-05, + "loss": 0.0101, + "step": 527560 + }, + { + "epoch": 1.37, + "learning_rate": 9.486936889064002e-05, + "loss": 0.0071, + "step": 527570 + }, + { + "epoch": 1.37, + "learning_rate": 9.486548067426856e-05, + "loss": 0.0102, + "step": 527580 + }, + { + "epoch": 1.37, + "learning_rate": 9.486159245789708e-05, + "loss": 0.0074, + "step": 527590 + }, + { + "epoch": 1.37, + "learning_rate": 9.485770424152563e-05, + "loss": 0.0094, + "step": 527600 + }, + { + "epoch": 1.37, + "learning_rate": 9.485381602515415e-05, + "loss": 0.0102, + "step": 527610 + }, + { + "epoch": 1.37, + "learning_rate": 9.48499278087827e-05, + "loss": 0.0071, + "step": 527620 + }, + { + "epoch": 1.37, + "learning_rate": 9.484603959241122e-05, + "loss": 0.0122, + "step": 527630 + }, + { + "epoch": 1.37, + "learning_rate": 9.484215137603977e-05, + "loss": 0.0094, + "step": 527640 + }, + { + "epoch": 1.37, + "learning_rate": 9.48382631596683e-05, + "loss": 0.011, + "step": 527650 + }, + { + "epoch": 1.37, + "learning_rate": 9.483437494329684e-05, + "loss": 0.009, + "step": 527660 + }, + { + "epoch": 1.37, + "learning_rate": 9.483048672692536e-05, + "loss": 0.011, + "step": 527670 + }, + { + "epoch": 1.37, + "learning_rate": 9.482659851055392e-05, + "loss": 0.0083, + "step": 527680 + }, + { + "epoch": 1.37, + "learning_rate": 9.482271029418245e-05, + "loss": 0.0122, + "step": 527690 + }, + { + "epoch": 1.37, + "learning_rate": 9.481882207781099e-05, + "loss": 0.0107, + "step": 527700 + }, + { + "epoch": 1.37, + "learning_rate": 9.481493386143952e-05, + "loss": 0.0087, + "step": 527710 + }, + { + "epoch": 1.37, + "learning_rate": 9.481104564506806e-05, + "loss": 0.0088, + "step": 527720 + }, + { + "epoch": 1.37, + "learning_rate": 9.480715742869659e-05, + "loss": 0.0113, + "step": 527730 + }, + { + "epoch": 1.37, + "learning_rate": 9.480326921232511e-05, + "loss": 0.0088, + "step": 527740 + }, + { + "epoch": 1.37, + "learning_rate": 9.479938099595366e-05, + "loss": 0.0082, + "step": 527750 + }, + { + "epoch": 1.37, + "learning_rate": 9.479549277958218e-05, + "loss": 0.0072, + "step": 527760 + }, + { + "epoch": 1.37, + "learning_rate": 9.479160456321073e-05, + "loss": 0.0117, + "step": 527770 + }, + { + "epoch": 1.37, + "learning_rate": 9.478771634683925e-05, + "loss": 0.0128, + "step": 527780 + }, + { + "epoch": 1.37, + "learning_rate": 9.47838281304678e-05, + "loss": 0.0107, + "step": 527790 + }, + { + "epoch": 1.37, + "learning_rate": 9.477993991409632e-05, + "loss": 0.012, + "step": 527800 + }, + { + "epoch": 1.37, + "learning_rate": 9.477605169772487e-05, + "loss": 0.0083, + "step": 527810 + }, + { + "epoch": 1.37, + "learning_rate": 9.47721634813534e-05, + "loss": 0.0102, + "step": 527820 + }, + { + "epoch": 1.37, + "learning_rate": 9.476827526498194e-05, + "loss": 0.0088, + "step": 527830 + }, + { + "epoch": 1.37, + "learning_rate": 9.476438704861046e-05, + "loss": 0.0135, + "step": 527840 + }, + { + "epoch": 1.37, + "learning_rate": 9.476049883223902e-05, + "loss": 0.0117, + "step": 527850 + }, + { + "epoch": 1.37, + "learning_rate": 9.475661061586755e-05, + "loss": 0.0096, + "step": 527860 + }, + { + "epoch": 1.37, + "learning_rate": 9.475272239949609e-05, + "loss": 0.0087, + "step": 527870 + }, + { + "epoch": 1.37, + "learning_rate": 9.474883418312462e-05, + "loss": 0.008, + "step": 527880 + }, + { + "epoch": 1.37, + "learning_rate": 9.474494596675316e-05, + "loss": 0.0082, + "step": 527890 + }, + { + "epoch": 1.37, + "learning_rate": 9.474105775038169e-05, + "loss": 0.008, + "step": 527900 + }, + { + "epoch": 1.37, + "learning_rate": 9.473716953401023e-05, + "loss": 0.0091, + "step": 527910 + }, + { + "epoch": 1.37, + "learning_rate": 9.473328131763876e-05, + "loss": 0.0125, + "step": 527920 + }, + { + "epoch": 1.37, + "learning_rate": 9.47293931012673e-05, + "loss": 0.0082, + "step": 527930 + }, + { + "epoch": 1.37, + "learning_rate": 9.472550488489583e-05, + "loss": 0.0126, + "step": 527940 + }, + { + "epoch": 1.37, + "learning_rate": 9.472161666852437e-05, + "loss": 0.0092, + "step": 527950 + }, + { + "epoch": 1.37, + "learning_rate": 9.47177284521529e-05, + "loss": 0.0094, + "step": 527960 + }, + { + "epoch": 1.37, + "learning_rate": 9.471384023578144e-05, + "loss": 0.0078, + "step": 527970 + }, + { + "epoch": 1.37, + "learning_rate": 9.470995201940996e-05, + "loss": 0.0116, + "step": 527980 + }, + { + "epoch": 1.37, + "learning_rate": 9.470606380303849e-05, + "loss": 0.008, + "step": 527990 + }, + { + "epoch": 1.37, + "learning_rate": 9.470217558666703e-05, + "loss": 0.0101, + "step": 528000 + }, + { + "epoch": 1.37, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.006410685367882252, + "eval_runtime": 108.0197, + "eval_samples_per_second": 18.515, + "eval_steps_per_second": 4.629, + "step": 528000 + }, + { + "epoch": 1.37, + "learning_rate": 9.469828737029556e-05, + "loss": 0.009, + "step": 528010 + }, + { + "epoch": 1.37, + "learning_rate": 9.46943991539241e-05, + "loss": 0.009, + "step": 528020 + }, + { + "epoch": 1.37, + "learning_rate": 9.469051093755263e-05, + "loss": 0.0081, + "step": 528030 + }, + { + "epoch": 1.37, + "learning_rate": 9.468662272118119e-05, + "loss": 0.0097, + "step": 528040 + }, + { + "epoch": 1.37, + "learning_rate": 9.468273450480972e-05, + "loss": 0.009, + "step": 528050 + }, + { + "epoch": 1.37, + "learning_rate": 9.467884628843826e-05, + "loss": 0.0121, + "step": 528060 + }, + { + "epoch": 1.37, + "learning_rate": 9.467495807206679e-05, + "loss": 0.0086, + "step": 528070 + }, + { + "epoch": 1.37, + "learning_rate": 9.467106985569533e-05, + "loss": 0.0085, + "step": 528080 + }, + { + "epoch": 1.37, + "learning_rate": 9.466718163932386e-05, + "loss": 0.0104, + "step": 528090 + }, + { + "epoch": 1.37, + "learning_rate": 9.46632934229524e-05, + "loss": 0.011, + "step": 528100 + }, + { + "epoch": 1.37, + "learning_rate": 9.465940520658092e-05, + "loss": 0.0101, + "step": 528110 + }, + { + "epoch": 1.37, + "learning_rate": 9.465551699020947e-05, + "loss": 0.011, + "step": 528120 + }, + { + "epoch": 1.37, + "learning_rate": 9.4651628773838e-05, + "loss": 0.012, + "step": 528130 + }, + { + "epoch": 1.37, + "learning_rate": 9.464774055746654e-05, + "loss": 0.0115, + "step": 528140 + }, + { + "epoch": 1.37, + "learning_rate": 9.464385234109506e-05, + "loss": 0.0126, + "step": 528150 + }, + { + "epoch": 1.37, + "learning_rate": 9.46399641247236e-05, + "loss": 0.008, + "step": 528160 + }, + { + "epoch": 1.37, + "learning_rate": 9.463607590835213e-05, + "loss": 0.0117, + "step": 528170 + }, + { + "epoch": 1.37, + "learning_rate": 9.463218769198068e-05, + "loss": 0.0084, + "step": 528180 + }, + { + "epoch": 1.37, + "learning_rate": 9.46282994756092e-05, + "loss": 0.0121, + "step": 528190 + }, + { + "epoch": 1.37, + "learning_rate": 9.462441125923776e-05, + "loss": 0.0089, + "step": 528200 + }, + { + "epoch": 1.37, + "learning_rate": 9.462052304286629e-05, + "loss": 0.0103, + "step": 528210 + }, + { + "epoch": 1.37, + "learning_rate": 9.46166348264948e-05, + "loss": 0.0094, + "step": 528220 + }, + { + "epoch": 1.37, + "learning_rate": 9.461274661012336e-05, + "loss": 0.0113, + "step": 528230 + }, + { + "epoch": 1.37, + "learning_rate": 9.460885839375188e-05, + "loss": 0.0106, + "step": 528240 + }, + { + "epoch": 1.37, + "learning_rate": 9.460497017738043e-05, + "loss": 0.0112, + "step": 528250 + }, + { + "epoch": 1.37, + "learning_rate": 9.460108196100895e-05, + "loss": 0.012, + "step": 528260 + }, + { + "epoch": 1.37, + "learning_rate": 9.45971937446375e-05, + "loss": 0.0087, + "step": 528270 + }, + { + "epoch": 1.37, + "learning_rate": 9.459330552826602e-05, + "loss": 0.0084, + "step": 528280 + }, + { + "epoch": 1.37, + "learning_rate": 9.458941731189457e-05, + "loss": 0.0091, + "step": 528290 + }, + { + "epoch": 1.37, + "learning_rate": 9.45855290955231e-05, + "loss": 0.0111, + "step": 528300 + }, + { + "epoch": 1.37, + "learning_rate": 9.458164087915164e-05, + "loss": 0.0135, + "step": 528310 + }, + { + "epoch": 1.37, + "learning_rate": 9.457775266278016e-05, + "loss": 0.012, + "step": 528320 + }, + { + "epoch": 1.37, + "learning_rate": 9.45738644464087e-05, + "loss": 0.0093, + "step": 528330 + }, + { + "epoch": 1.37, + "learning_rate": 9.456997623003723e-05, + "loss": 0.0076, + "step": 528340 + }, + { + "epoch": 1.37, + "learning_rate": 9.456608801366578e-05, + "loss": 0.0066, + "step": 528350 + }, + { + "epoch": 1.37, + "learning_rate": 9.45621997972943e-05, + "loss": 0.0113, + "step": 528360 + }, + { + "epoch": 1.37, + "learning_rate": 9.455831158092286e-05, + "loss": 0.0087, + "step": 528370 + }, + { + "epoch": 1.37, + "learning_rate": 9.455442336455137e-05, + "loss": 0.0086, + "step": 528380 + }, + { + "epoch": 1.37, + "learning_rate": 9.455053514817993e-05, + "loss": 0.0142, + "step": 528390 + }, + { + "epoch": 1.37, + "learning_rate": 9.454664693180846e-05, + "loss": 0.0118, + "step": 528400 + }, + { + "epoch": 1.37, + "learning_rate": 9.4542758715437e-05, + "loss": 0.0101, + "step": 528410 + }, + { + "epoch": 1.37, + "learning_rate": 9.453887049906553e-05, + "loss": 0.0101, + "step": 528420 + }, + { + "epoch": 1.37, + "learning_rate": 9.453498228269407e-05, + "loss": 0.0121, + "step": 528430 + }, + { + "epoch": 1.37, + "learning_rate": 9.45310940663226e-05, + "loss": 0.0121, + "step": 528440 + }, + { + "epoch": 1.37, + "learning_rate": 9.452720584995114e-05, + "loss": 0.0098, + "step": 528450 + }, + { + "epoch": 1.37, + "learning_rate": 9.452331763357967e-05, + "loss": 0.0075, + "step": 528460 + }, + { + "epoch": 1.37, + "learning_rate": 9.45194294172082e-05, + "loss": 0.0118, + "step": 528470 + }, + { + "epoch": 1.37, + "learning_rate": 9.451554120083674e-05, + "loss": 0.0121, + "step": 528480 + }, + { + "epoch": 1.37, + "learning_rate": 9.451165298446526e-05, + "loss": 0.0093, + "step": 528490 + }, + { + "epoch": 1.37, + "learning_rate": 9.45077647680938e-05, + "loss": 0.0107, + "step": 528500 + }, + { + "epoch": 1.37, + "learning_rate": 9.450387655172233e-05, + "loss": 0.0113, + "step": 528510 + }, + { + "epoch": 1.37, + "learning_rate": 9.449998833535087e-05, + "loss": 0.0091, + "step": 528520 + }, + { + "epoch": 1.37, + "learning_rate": 9.44961001189794e-05, + "loss": 0.0116, + "step": 528530 + }, + { + "epoch": 1.37, + "learning_rate": 9.449221190260794e-05, + "loss": 0.0094, + "step": 528540 + }, + { + "epoch": 1.37, + "learning_rate": 9.448832368623647e-05, + "loss": 0.0096, + "step": 528550 + }, + { + "epoch": 1.37, + "learning_rate": 9.448443546986503e-05, + "loss": 0.0105, + "step": 528560 + }, + { + "epoch": 1.37, + "learning_rate": 9.448054725349356e-05, + "loss": 0.0077, + "step": 528570 + }, + { + "epoch": 1.37, + "learning_rate": 9.44766590371221e-05, + "loss": 0.0085, + "step": 528580 + }, + { + "epoch": 1.37, + "learning_rate": 9.447277082075063e-05, + "loss": 0.0085, + "step": 528590 + }, + { + "epoch": 1.37, + "learning_rate": 9.446888260437917e-05, + "loss": 0.0113, + "step": 528600 + }, + { + "epoch": 1.37, + "learning_rate": 9.44649943880077e-05, + "loss": 0.0109, + "step": 528610 + }, + { + "epoch": 1.37, + "learning_rate": 9.446110617163624e-05, + "loss": 0.0135, + "step": 528620 + }, + { + "epoch": 1.37, + "learning_rate": 9.445721795526476e-05, + "loss": 0.0094, + "step": 528630 + }, + { + "epoch": 1.37, + "learning_rate": 9.44533297388933e-05, + "loss": 0.0098, + "step": 528640 + }, + { + "epoch": 1.37, + "learning_rate": 9.444944152252183e-05, + "loss": 0.0111, + "step": 528650 + }, + { + "epoch": 1.37, + "learning_rate": 9.444555330615038e-05, + "loss": 0.0092, + "step": 528660 + }, + { + "epoch": 1.37, + "learning_rate": 9.44416650897789e-05, + "loss": 0.0096, + "step": 528670 + }, + { + "epoch": 1.37, + "learning_rate": 9.443777687340745e-05, + "loss": 0.0109, + "step": 528680 + }, + { + "epoch": 1.37, + "learning_rate": 9.443388865703597e-05, + "loss": 0.0089, + "step": 528690 + }, + { + "epoch": 1.37, + "learning_rate": 9.443000044066452e-05, + "loss": 0.0097, + "step": 528700 + }, + { + "epoch": 1.37, + "learning_rate": 9.442611222429304e-05, + "loss": 0.0078, + "step": 528710 + }, + { + "epoch": 1.37, + "learning_rate": 9.442222400792157e-05, + "loss": 0.0107, + "step": 528720 + }, + { + "epoch": 1.37, + "learning_rate": 9.441833579155013e-05, + "loss": 0.0074, + "step": 528730 + }, + { + "epoch": 1.37, + "learning_rate": 9.441444757517864e-05, + "loss": 0.0095, + "step": 528740 + }, + { + "epoch": 1.37, + "learning_rate": 9.44105593588072e-05, + "loss": 0.0112, + "step": 528750 + }, + { + "epoch": 1.37, + "learning_rate": 9.440667114243572e-05, + "loss": 0.0094, + "step": 528760 + }, + { + "epoch": 1.37, + "learning_rate": 9.440278292606427e-05, + "loss": 0.0125, + "step": 528770 + }, + { + "epoch": 1.37, + "learning_rate": 9.43988947096928e-05, + "loss": 0.0099, + "step": 528780 + }, + { + "epoch": 1.37, + "learning_rate": 9.439500649332134e-05, + "loss": 0.0111, + "step": 528790 + }, + { + "epoch": 1.37, + "learning_rate": 9.439111827694986e-05, + "loss": 0.0087, + "step": 528800 + }, + { + "epoch": 1.37, + "learning_rate": 9.43872300605784e-05, + "loss": 0.0087, + "step": 528810 + }, + { + "epoch": 1.37, + "learning_rate": 9.438334184420693e-05, + "loss": 0.0128, + "step": 528820 + }, + { + "epoch": 1.37, + "learning_rate": 9.437945362783548e-05, + "loss": 0.0096, + "step": 528830 + }, + { + "epoch": 1.37, + "learning_rate": 9.4375565411464e-05, + "loss": 0.0097, + "step": 528840 + }, + { + "epoch": 1.37, + "learning_rate": 9.437167719509255e-05, + "loss": 0.0119, + "step": 528850 + }, + { + "epoch": 1.37, + "learning_rate": 9.436778897872107e-05, + "loss": 0.0119, + "step": 528860 + }, + { + "epoch": 1.37, + "learning_rate": 9.436390076234961e-05, + "loss": 0.0118, + "step": 528870 + }, + { + "epoch": 1.37, + "learning_rate": 9.436001254597814e-05, + "loss": 0.01, + "step": 528880 + }, + { + "epoch": 1.37, + "learning_rate": 9.43561243296067e-05, + "loss": 0.0081, + "step": 528890 + }, + { + "epoch": 1.37, + "learning_rate": 9.435223611323521e-05, + "loss": 0.0124, + "step": 528900 + }, + { + "epoch": 1.37, + "learning_rate": 9.434834789686377e-05, + "loss": 0.0114, + "step": 528910 + }, + { + "epoch": 1.37, + "learning_rate": 9.43444596804923e-05, + "loss": 0.0099, + "step": 528920 + }, + { + "epoch": 1.37, + "learning_rate": 9.434057146412084e-05, + "loss": 0.0074, + "step": 528930 + }, + { + "epoch": 1.37, + "learning_rate": 9.433668324774937e-05, + "loss": 0.0084, + "step": 528940 + }, + { + "epoch": 1.37, + "learning_rate": 9.433279503137791e-05, + "loss": 0.009, + "step": 528950 + }, + { + "epoch": 1.37, + "learning_rate": 9.432890681500644e-05, + "loss": 0.0098, + "step": 528960 + }, + { + "epoch": 1.37, + "learning_rate": 9.432501859863496e-05, + "loss": 0.0105, + "step": 528970 + }, + { + "epoch": 1.37, + "learning_rate": 9.43211303822635e-05, + "loss": 0.0095, + "step": 528980 + }, + { + "epoch": 1.37, + "learning_rate": 9.431724216589203e-05, + "loss": 0.0076, + "step": 528990 + }, + { + "epoch": 1.37, + "learning_rate": 9.431335394952057e-05, + "loss": 0.0091, + "step": 529000 + }, + { + "epoch": 1.37, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.006558180321007967, + "eval_runtime": 107.9692, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 529000 + }, + { + "epoch": 1.37, + "learning_rate": 9.43094657331491e-05, + "loss": 0.0104, + "step": 529010 + }, + { + "epoch": 1.37, + "learning_rate": 9.430557751677764e-05, + "loss": 0.0106, + "step": 529020 + }, + { + "epoch": 1.37, + "learning_rate": 9.430168930040617e-05, + "loss": 0.0078, + "step": 529030 + }, + { + "epoch": 1.37, + "learning_rate": 9.429780108403471e-05, + "loss": 0.0066, + "step": 529040 + }, + { + "epoch": 1.37, + "learning_rate": 9.429391286766324e-05, + "loss": 0.0099, + "step": 529050 + }, + { + "epoch": 1.37, + "learning_rate": 9.429002465129178e-05, + "loss": 0.0115, + "step": 529060 + }, + { + "epoch": 1.37, + "learning_rate": 9.428613643492031e-05, + "loss": 0.0097, + "step": 529070 + }, + { + "epoch": 1.37, + "learning_rate": 9.428224821854887e-05, + "loss": 0.012, + "step": 529080 + }, + { + "epoch": 1.37, + "learning_rate": 9.42783600021774e-05, + "loss": 0.0087, + "step": 529090 + }, + { + "epoch": 1.37, + "learning_rate": 9.427447178580594e-05, + "loss": 0.0115, + "step": 529100 + }, + { + "epoch": 1.37, + "learning_rate": 9.427058356943447e-05, + "loss": 0.0087, + "step": 529110 + }, + { + "epoch": 1.37, + "learning_rate": 9.426669535306301e-05, + "loss": 0.0101, + "step": 529120 + }, + { + "epoch": 1.37, + "learning_rate": 9.426280713669153e-05, + "loss": 0.0109, + "step": 529130 + }, + { + "epoch": 1.37, + "learning_rate": 9.425891892032008e-05, + "loss": 0.0082, + "step": 529140 + }, + { + "epoch": 1.37, + "learning_rate": 9.42550307039486e-05, + "loss": 0.0087, + "step": 529150 + }, + { + "epoch": 1.37, + "learning_rate": 9.425114248757715e-05, + "loss": 0.0083, + "step": 529160 + }, + { + "epoch": 1.37, + "learning_rate": 9.424725427120567e-05, + "loss": 0.008, + "step": 529170 + }, + { + "epoch": 1.37, + "learning_rate": 9.424336605483422e-05, + "loss": 0.0094, + "step": 529180 + }, + { + "epoch": 1.37, + "learning_rate": 9.423947783846274e-05, + "loss": 0.0096, + "step": 529190 + }, + { + "epoch": 1.37, + "learning_rate": 9.423558962209129e-05, + "loss": 0.0086, + "step": 529200 + }, + { + "epoch": 1.37, + "learning_rate": 9.423170140571981e-05, + "loss": 0.0126, + "step": 529210 + }, + { + "epoch": 1.37, + "learning_rate": 9.422781318934834e-05, + "loss": 0.0105, + "step": 529220 + }, + { + "epoch": 1.37, + "learning_rate": 9.422392497297688e-05, + "loss": 0.0079, + "step": 529230 + }, + { + "epoch": 1.37, + "learning_rate": 9.422003675660541e-05, + "loss": 0.0068, + "step": 529240 + }, + { + "epoch": 1.37, + "learning_rate": 9.421614854023395e-05, + "loss": 0.009, + "step": 529250 + }, + { + "epoch": 1.37, + "learning_rate": 9.421226032386248e-05, + "loss": 0.0068, + "step": 529260 + }, + { + "epoch": 1.37, + "learning_rate": 9.420837210749104e-05, + "loss": 0.0085, + "step": 529270 + }, + { + "epoch": 1.37, + "learning_rate": 9.420448389111956e-05, + "loss": 0.0132, + "step": 529280 + }, + { + "epoch": 1.37, + "learning_rate": 9.42005956747481e-05, + "loss": 0.009, + "step": 529290 + }, + { + "epoch": 1.37, + "learning_rate": 9.419670745837663e-05, + "loss": 0.0116, + "step": 529300 + }, + { + "epoch": 1.37, + "learning_rate": 9.419281924200518e-05, + "loss": 0.0135, + "step": 529310 + }, + { + "epoch": 1.37, + "learning_rate": 9.41889310256337e-05, + "loss": 0.0082, + "step": 529320 + }, + { + "epoch": 1.37, + "learning_rate": 9.418504280926225e-05, + "loss": 0.0114, + "step": 529330 + }, + { + "epoch": 1.37, + "learning_rate": 9.418115459289077e-05, + "loss": 0.0071, + "step": 529340 + }, + { + "epoch": 1.37, + "learning_rate": 9.417726637651932e-05, + "loss": 0.0112, + "step": 529350 + }, + { + "epoch": 1.37, + "learning_rate": 9.417337816014784e-05, + "loss": 0.0096, + "step": 529360 + }, + { + "epoch": 1.37, + "learning_rate": 9.416948994377639e-05, + "loss": 0.0103, + "step": 529370 + }, + { + "epoch": 1.37, + "learning_rate": 9.416560172740491e-05, + "loss": 0.0107, + "step": 529380 + }, + { + "epoch": 1.37, + "learning_rate": 9.416171351103345e-05, + "loss": 0.0093, + "step": 529390 + }, + { + "epoch": 1.37, + "learning_rate": 9.415782529466198e-05, + "loss": 0.0132, + "step": 529400 + }, + { + "epoch": 1.37, + "learning_rate": 9.415393707829052e-05, + "loss": 0.011, + "step": 529410 + }, + { + "epoch": 1.37, + "learning_rate": 9.415004886191905e-05, + "loss": 0.0119, + "step": 529420 + }, + { + "epoch": 1.37, + "learning_rate": 9.414616064554761e-05, + "loss": 0.0108, + "step": 529430 + }, + { + "epoch": 1.37, + "learning_rate": 9.414227242917614e-05, + "loss": 0.0106, + "step": 529440 + }, + { + "epoch": 1.37, + "learning_rate": 9.413838421280468e-05, + "loss": 0.0096, + "step": 529450 + }, + { + "epoch": 1.37, + "learning_rate": 9.41344959964332e-05, + "loss": 0.0096, + "step": 529460 + }, + { + "epoch": 1.37, + "learning_rate": 9.413060778006173e-05, + "loss": 0.0089, + "step": 529470 + }, + { + "epoch": 1.37, + "learning_rate": 9.412671956369028e-05, + "loss": 0.0087, + "step": 529480 + }, + { + "epoch": 1.37, + "learning_rate": 9.41228313473188e-05, + "loss": 0.0111, + "step": 529490 + }, + { + "epoch": 1.37, + "learning_rate": 9.411894313094735e-05, + "loss": 0.0072, + "step": 529500 + }, + { + "epoch": 1.37, + "learning_rate": 9.411505491457587e-05, + "loss": 0.0126, + "step": 529510 + }, + { + "epoch": 1.37, + "learning_rate": 9.411116669820441e-05, + "loss": 0.0082, + "step": 529520 + }, + { + "epoch": 1.37, + "learning_rate": 9.410727848183294e-05, + "loss": 0.0139, + "step": 529530 + }, + { + "epoch": 1.37, + "learning_rate": 9.410339026546148e-05, + "loss": 0.0105, + "step": 529540 + }, + { + "epoch": 1.37, + "learning_rate": 9.409950204909001e-05, + "loss": 0.0087, + "step": 529550 + }, + { + "epoch": 1.37, + "learning_rate": 9.409561383271855e-05, + "loss": 0.0106, + "step": 529560 + }, + { + "epoch": 1.37, + "learning_rate": 9.409172561634708e-05, + "loss": 0.0095, + "step": 529570 + }, + { + "epoch": 1.37, + "learning_rate": 9.408783739997562e-05, + "loss": 0.0095, + "step": 529580 + }, + { + "epoch": 1.37, + "learning_rate": 9.408394918360415e-05, + "loss": 0.0094, + "step": 529590 + }, + { + "epoch": 1.37, + "learning_rate": 9.408006096723271e-05, + "loss": 0.0093, + "step": 529600 + }, + { + "epoch": 1.37, + "learning_rate": 9.407617275086122e-05, + "loss": 0.0063, + "step": 529610 + }, + { + "epoch": 1.37, + "learning_rate": 9.407228453448978e-05, + "loss": 0.0092, + "step": 529620 + }, + { + "epoch": 1.37, + "learning_rate": 9.40683963181183e-05, + "loss": 0.0119, + "step": 529630 + }, + { + "epoch": 1.37, + "learning_rate": 9.406450810174685e-05, + "loss": 0.0101, + "step": 529640 + }, + { + "epoch": 1.37, + "learning_rate": 9.406061988537537e-05, + "loss": 0.011, + "step": 529650 + }, + { + "epoch": 1.37, + "learning_rate": 9.405673166900392e-05, + "loss": 0.0117, + "step": 529660 + }, + { + "epoch": 1.37, + "learning_rate": 9.405284345263244e-05, + "loss": 0.013, + "step": 529670 + }, + { + "epoch": 1.37, + "learning_rate": 9.404895523626099e-05, + "loss": 0.0111, + "step": 529680 + }, + { + "epoch": 1.37, + "learning_rate": 9.404506701988951e-05, + "loss": 0.0086, + "step": 529690 + }, + { + "epoch": 1.37, + "learning_rate": 9.404117880351806e-05, + "loss": 0.0123, + "step": 529700 + }, + { + "epoch": 1.37, + "learning_rate": 9.403729058714658e-05, + "loss": 0.0078, + "step": 529710 + }, + { + "epoch": 1.37, + "learning_rate": 9.403340237077511e-05, + "loss": 0.0072, + "step": 529720 + }, + { + "epoch": 1.37, + "learning_rate": 9.402951415440365e-05, + "loss": 0.0097, + "step": 529730 + }, + { + "epoch": 1.37, + "learning_rate": 9.402562593803218e-05, + "loss": 0.0087, + "step": 529740 + }, + { + "epoch": 1.37, + "learning_rate": 9.402173772166072e-05, + "loss": 0.0077, + "step": 529750 + }, + { + "epoch": 1.37, + "learning_rate": 9.401784950528925e-05, + "loss": 0.0077, + "step": 529760 + }, + { + "epoch": 1.37, + "learning_rate": 9.401396128891779e-05, + "loss": 0.0101, + "step": 529770 + }, + { + "epoch": 1.37, + "learning_rate": 9.401007307254632e-05, + "loss": 0.0097, + "step": 529780 + }, + { + "epoch": 1.37, + "learning_rate": 9.400618485617488e-05, + "loss": 0.0096, + "step": 529790 + }, + { + "epoch": 1.37, + "learning_rate": 9.40022966398034e-05, + "loss": 0.0108, + "step": 529800 + }, + { + "epoch": 1.37, + "learning_rate": 9.399840842343195e-05, + "loss": 0.0094, + "step": 529810 + }, + { + "epoch": 1.37, + "learning_rate": 9.399452020706047e-05, + "loss": 0.0112, + "step": 529820 + }, + { + "epoch": 1.37, + "learning_rate": 9.399063199068902e-05, + "loss": 0.0085, + "step": 529830 + }, + { + "epoch": 1.37, + "learning_rate": 9.398674377431754e-05, + "loss": 0.0081, + "step": 529840 + }, + { + "epoch": 1.37, + "learning_rate": 9.398285555794609e-05, + "loss": 0.0106, + "step": 529850 + }, + { + "epoch": 1.37, + "learning_rate": 9.397896734157461e-05, + "loss": 0.0107, + "step": 529860 + }, + { + "epoch": 1.37, + "learning_rate": 9.397507912520316e-05, + "loss": 0.0097, + "step": 529870 + }, + { + "epoch": 1.37, + "learning_rate": 9.397119090883168e-05, + "loss": 0.0101, + "step": 529880 + }, + { + "epoch": 1.37, + "learning_rate": 9.396730269246023e-05, + "loss": 0.0137, + "step": 529890 + }, + { + "epoch": 1.37, + "learning_rate": 9.396341447608875e-05, + "loss": 0.0101, + "step": 529900 + }, + { + "epoch": 1.37, + "learning_rate": 9.39595262597173e-05, + "loss": 0.0133, + "step": 529910 + }, + { + "epoch": 1.37, + "learning_rate": 9.395563804334582e-05, + "loss": 0.0097, + "step": 529920 + }, + { + "epoch": 1.37, + "learning_rate": 9.395174982697436e-05, + "loss": 0.0115, + "step": 529930 + }, + { + "epoch": 1.37, + "learning_rate": 9.394786161060289e-05, + "loss": 0.0092, + "step": 529940 + }, + { + "epoch": 1.37, + "learning_rate": 9.394397339423145e-05, + "loss": 0.0095, + "step": 529950 + }, + { + "epoch": 1.37, + "learning_rate": 9.394008517785998e-05, + "loss": 0.009, + "step": 529960 + }, + { + "epoch": 1.37, + "learning_rate": 9.393619696148849e-05, + "loss": 0.0113, + "step": 529970 + }, + { + "epoch": 1.37, + "learning_rate": 9.393230874511705e-05, + "loss": 0.0078, + "step": 529980 + }, + { + "epoch": 1.37, + "learning_rate": 9.392842052874557e-05, + "loss": 0.0088, + "step": 529990 + }, + { + "epoch": 1.37, + "learning_rate": 9.392453231237412e-05, + "loss": 0.0123, + "step": 530000 + }, + { + "epoch": 1.37, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.0064879064448177814, + "eval_runtime": 107.9436, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 530000 + }, + { + "epoch": 1.37, + "learning_rate": 9.392064409600264e-05, + "loss": 0.0073, + "step": 530010 + }, + { + "epoch": 1.37, + "learning_rate": 9.391675587963119e-05, + "loss": 0.009, + "step": 530020 + }, + { + "epoch": 1.37, + "learning_rate": 9.391286766325971e-05, + "loss": 0.0111, + "step": 530030 + }, + { + "epoch": 1.37, + "learning_rate": 9.390897944688825e-05, + "loss": 0.0094, + "step": 530040 + }, + { + "epoch": 1.37, + "learning_rate": 9.390509123051678e-05, + "loss": 0.0087, + "step": 530050 + }, + { + "epoch": 1.37, + "learning_rate": 9.390120301414532e-05, + "loss": 0.0112, + "step": 530060 + }, + { + "epoch": 1.37, + "learning_rate": 9.389731479777385e-05, + "loss": 0.0121, + "step": 530070 + }, + { + "epoch": 1.37, + "learning_rate": 9.38934265814024e-05, + "loss": 0.0092, + "step": 530080 + }, + { + "epoch": 1.37, + "learning_rate": 9.388953836503092e-05, + "loss": 0.0122, + "step": 530090 + }, + { + "epoch": 1.37, + "learning_rate": 9.388565014865946e-05, + "loss": 0.0135, + "step": 530100 + }, + { + "epoch": 1.37, + "learning_rate": 9.388176193228799e-05, + "loss": 0.0086, + "step": 530110 + }, + { + "epoch": 1.37, + "learning_rate": 9.387787371591655e-05, + "loss": 0.0175, + "step": 530120 + }, + { + "epoch": 1.37, + "learning_rate": 9.387398549954506e-05, + "loss": 0.0096, + "step": 530130 + }, + { + "epoch": 1.37, + "learning_rate": 9.387009728317362e-05, + "loss": 0.0089, + "step": 530140 + }, + { + "epoch": 1.37, + "learning_rate": 9.386620906680215e-05, + "loss": 0.0082, + "step": 530150 + }, + { + "epoch": 1.37, + "learning_rate": 9.386232085043069e-05, + "loss": 0.0092, + "step": 530160 + }, + { + "epoch": 1.37, + "learning_rate": 9.385843263405921e-05, + "loss": 0.0098, + "step": 530170 + }, + { + "epoch": 1.37, + "learning_rate": 9.385454441768776e-05, + "loss": 0.0092, + "step": 530180 + }, + { + "epoch": 1.37, + "learning_rate": 9.385065620131628e-05, + "loss": 0.0077, + "step": 530190 + }, + { + "epoch": 1.37, + "learning_rate": 9.384676798494483e-05, + "loss": 0.0191, + "step": 530200 + }, + { + "epoch": 1.37, + "learning_rate": 9.384287976857335e-05, + "loss": 0.0118, + "step": 530210 + }, + { + "epoch": 1.37, + "learning_rate": 9.383899155220188e-05, + "loss": 0.0122, + "step": 530220 + }, + { + "epoch": 1.37, + "learning_rate": 9.383510333583042e-05, + "loss": 0.009, + "step": 530230 + }, + { + "epoch": 1.37, + "learning_rate": 9.383121511945895e-05, + "loss": 0.0086, + "step": 530240 + }, + { + "epoch": 1.37, + "learning_rate": 9.38273269030875e-05, + "loss": 0.0098, + "step": 530250 + }, + { + "epoch": 1.37, + "learning_rate": 9.382343868671602e-05, + "loss": 0.0128, + "step": 530260 + }, + { + "epoch": 1.37, + "learning_rate": 9.381955047034456e-05, + "loss": 0.0089, + "step": 530270 + }, + { + "epoch": 1.37, + "learning_rate": 9.381566225397309e-05, + "loss": 0.008, + "step": 530280 + }, + { + "epoch": 1.37, + "learning_rate": 9.381177403760163e-05, + "loss": 0.0069, + "step": 530290 + }, + { + "epoch": 1.37, + "learning_rate": 9.380788582123016e-05, + "loss": 0.0118, + "step": 530300 + }, + { + "epoch": 1.37, + "learning_rate": 9.380399760485872e-05, + "loss": 0.0079, + "step": 530310 + }, + { + "epoch": 1.37, + "learning_rate": 9.380010938848724e-05, + "loss": 0.0075, + "step": 530320 + }, + { + "epoch": 1.37, + "learning_rate": 9.379622117211579e-05, + "loss": 0.0079, + "step": 530330 + }, + { + "epoch": 1.37, + "learning_rate": 9.379233295574431e-05, + "loss": 0.0109, + "step": 530340 + }, + { + "epoch": 1.37, + "learning_rate": 9.378844473937286e-05, + "loss": 0.0093, + "step": 530350 + }, + { + "epoch": 1.37, + "learning_rate": 9.378455652300138e-05, + "loss": 0.0089, + "step": 530360 + }, + { + "epoch": 1.37, + "learning_rate": 9.378066830662993e-05, + "loss": 0.0103, + "step": 530370 + }, + { + "epoch": 1.37, + "learning_rate": 9.377678009025845e-05, + "loss": 0.0112, + "step": 530380 + }, + { + "epoch": 1.37, + "learning_rate": 9.3772891873887e-05, + "loss": 0.0119, + "step": 530390 + }, + { + "epoch": 1.37, + "learning_rate": 9.376900365751552e-05, + "loss": 0.0091, + "step": 530400 + }, + { + "epoch": 1.37, + "learning_rate": 9.376511544114406e-05, + "loss": 0.0076, + "step": 530410 + }, + { + "epoch": 1.37, + "learning_rate": 9.376122722477259e-05, + "loss": 0.0088, + "step": 530420 + }, + { + "epoch": 1.37, + "learning_rate": 9.375733900840113e-05, + "loss": 0.009, + "step": 530430 + }, + { + "epoch": 1.37, + "learning_rate": 9.375345079202966e-05, + "loss": 0.0084, + "step": 530440 + }, + { + "epoch": 1.38, + "learning_rate": 9.37495625756582e-05, + "loss": 0.0099, + "step": 530450 + }, + { + "epoch": 1.38, + "learning_rate": 9.374567435928673e-05, + "loss": 0.0085, + "step": 530460 + }, + { + "epoch": 1.38, + "learning_rate": 9.374178614291526e-05, + "loss": 0.0088, + "step": 530470 + }, + { + "epoch": 1.38, + "learning_rate": 9.373789792654382e-05, + "loss": 0.0092, + "step": 530480 + }, + { + "epoch": 1.38, + "learning_rate": 9.373400971017233e-05, + "loss": 0.0115, + "step": 530490 + }, + { + "epoch": 1.38, + "learning_rate": 9.373012149380089e-05, + "loss": 0.0103, + "step": 530500 + }, + { + "epoch": 1.38, + "learning_rate": 9.372623327742941e-05, + "loss": 0.0087, + "step": 530510 + }, + { + "epoch": 1.38, + "learning_rate": 9.372234506105796e-05, + "loss": 0.0078, + "step": 530520 + }, + { + "epoch": 1.38, + "learning_rate": 9.371845684468648e-05, + "loss": 0.0091, + "step": 530530 + }, + { + "epoch": 1.38, + "learning_rate": 9.371456862831502e-05, + "loss": 0.0112, + "step": 530540 + }, + { + "epoch": 1.38, + "learning_rate": 9.371068041194355e-05, + "loss": 0.0108, + "step": 530550 + }, + { + "epoch": 1.38, + "learning_rate": 9.37067921955721e-05, + "loss": 0.012, + "step": 530560 + }, + { + "epoch": 1.38, + "learning_rate": 9.370290397920062e-05, + "loss": 0.009, + "step": 530570 + }, + { + "epoch": 1.38, + "learning_rate": 9.369901576282916e-05, + "loss": 0.009, + "step": 530580 + }, + { + "epoch": 1.38, + "learning_rate": 9.369512754645769e-05, + "loss": 0.0144, + "step": 530590 + }, + { + "epoch": 1.38, + "learning_rate": 9.369123933008623e-05, + "loss": 0.0092, + "step": 530600 + }, + { + "epoch": 1.38, + "learning_rate": 9.368735111371476e-05, + "loss": 0.0102, + "step": 530610 + }, + { + "epoch": 1.38, + "learning_rate": 9.36834628973433e-05, + "loss": 0.0101, + "step": 530620 + }, + { + "epoch": 1.38, + "learning_rate": 9.367957468097183e-05, + "loss": 0.012, + "step": 530630 + }, + { + "epoch": 1.38, + "learning_rate": 9.367568646460037e-05, + "loss": 0.0109, + "step": 530640 + }, + { + "epoch": 1.38, + "learning_rate": 9.36717982482289e-05, + "loss": 0.0145, + "step": 530650 + }, + { + "epoch": 1.38, + "learning_rate": 9.366791003185746e-05, + "loss": 0.0065, + "step": 530660 + }, + { + "epoch": 1.38, + "learning_rate": 9.366402181548598e-05, + "loss": 0.0106, + "step": 530670 + }, + { + "epoch": 1.38, + "learning_rate": 9.366013359911453e-05, + "loss": 0.0089, + "step": 530680 + }, + { + "epoch": 1.38, + "learning_rate": 9.365624538274305e-05, + "loss": 0.0087, + "step": 530690 + }, + { + "epoch": 1.38, + "learning_rate": 9.36523571663716e-05, + "loss": 0.0078, + "step": 530700 + }, + { + "epoch": 1.38, + "learning_rate": 9.364846895000012e-05, + "loss": 0.0107, + "step": 530710 + }, + { + "epoch": 1.38, + "learning_rate": 9.364458073362865e-05, + "loss": 0.008, + "step": 530720 + }, + { + "epoch": 1.38, + "learning_rate": 9.36406925172572e-05, + "loss": 0.0113, + "step": 530730 + }, + { + "epoch": 1.38, + "learning_rate": 9.363680430088572e-05, + "loss": 0.0156, + "step": 530740 + }, + { + "epoch": 1.38, + "learning_rate": 9.363291608451426e-05, + "loss": 0.0102, + "step": 530750 + }, + { + "epoch": 1.38, + "learning_rate": 9.362902786814279e-05, + "loss": 0.0115, + "step": 530760 + }, + { + "epoch": 1.38, + "learning_rate": 9.362513965177133e-05, + "loss": 0.0185, + "step": 530770 + }, + { + "epoch": 1.38, + "learning_rate": 9.362125143539986e-05, + "loss": 0.0083, + "step": 530780 + }, + { + "epoch": 1.38, + "learning_rate": 9.36173632190284e-05, + "loss": 0.0081, + "step": 530790 + }, + { + "epoch": 1.38, + "learning_rate": 9.361347500265693e-05, + "loss": 0.01, + "step": 530800 + }, + { + "epoch": 1.38, + "learning_rate": 9.360958678628547e-05, + "loss": 0.0103, + "step": 530810 + }, + { + "epoch": 1.38, + "learning_rate": 9.3605698569914e-05, + "loss": 0.0115, + "step": 530820 + }, + { + "epoch": 1.38, + "learning_rate": 9.360181035354256e-05, + "loss": 0.0119, + "step": 530830 + }, + { + "epoch": 1.38, + "learning_rate": 9.359792213717107e-05, + "loss": 0.0077, + "step": 530840 + }, + { + "epoch": 1.38, + "learning_rate": 9.359403392079963e-05, + "loss": 0.0094, + "step": 530850 + }, + { + "epoch": 1.38, + "learning_rate": 9.359014570442815e-05, + "loss": 0.0115, + "step": 530860 + }, + { + "epoch": 1.38, + "learning_rate": 9.35862574880567e-05, + "loss": 0.0099, + "step": 530870 + }, + { + "epoch": 1.38, + "learning_rate": 9.358236927168522e-05, + "loss": 0.011, + "step": 530880 + }, + { + "epoch": 1.38, + "learning_rate": 9.357848105531377e-05, + "loss": 0.0081, + "step": 530890 + }, + { + "epoch": 1.38, + "learning_rate": 9.35745928389423e-05, + "loss": 0.0105, + "step": 530900 + }, + { + "epoch": 1.38, + "learning_rate": 9.357070462257084e-05, + "loss": 0.0094, + "step": 530910 + }, + { + "epoch": 1.38, + "learning_rate": 9.356681640619936e-05, + "loss": 0.0077, + "step": 530920 + }, + { + "epoch": 1.38, + "learning_rate": 9.35629281898279e-05, + "loss": 0.0103, + "step": 530930 + }, + { + "epoch": 1.38, + "learning_rate": 9.355903997345643e-05, + "loss": 0.0092, + "step": 530940 + }, + { + "epoch": 1.38, + "learning_rate": 9.355515175708496e-05, + "loss": 0.0088, + "step": 530950 + }, + { + "epoch": 1.38, + "learning_rate": 9.35512635407135e-05, + "loss": 0.0105, + "step": 530960 + }, + { + "epoch": 1.38, + "learning_rate": 9.354737532434203e-05, + "loss": 0.0122, + "step": 530970 + }, + { + "epoch": 1.38, + "learning_rate": 9.354348710797057e-05, + "loss": 0.0102, + "step": 530980 + }, + { + "epoch": 1.38, + "learning_rate": 9.35395988915991e-05, + "loss": 0.0093, + "step": 530990 + }, + { + "epoch": 1.38, + "learning_rate": 9.353571067522764e-05, + "loss": 0.0123, + "step": 531000 + }, + { + "epoch": 1.38, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.006338402628898621, + "eval_runtime": 107.8828, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 531000 + }, + { + "epoch": 1.38, + "learning_rate": 9.353182245885617e-05, + "loss": 0.0096, + "step": 531010 + }, + { + "epoch": 1.38, + "learning_rate": 9.352793424248473e-05, + "loss": 0.0123, + "step": 531020 + }, + { + "epoch": 1.38, + "learning_rate": 9.352404602611325e-05, + "loss": 0.0192, + "step": 531030 + }, + { + "epoch": 1.38, + "learning_rate": 9.35201578097418e-05, + "loss": 0.0083, + "step": 531040 + }, + { + "epoch": 1.38, + "learning_rate": 9.351626959337032e-05, + "loss": 0.01, + "step": 531050 + }, + { + "epoch": 1.38, + "learning_rate": 9.351238137699886e-05, + "loss": 0.0099, + "step": 531060 + }, + { + "epoch": 1.38, + "learning_rate": 9.350849316062739e-05, + "loss": 0.0096, + "step": 531070 + }, + { + "epoch": 1.38, + "learning_rate": 9.350460494425593e-05, + "loss": 0.0089, + "step": 531080 + }, + { + "epoch": 1.38, + "learning_rate": 9.350071672788446e-05, + "loss": 0.0084, + "step": 531090 + }, + { + "epoch": 1.38, + "learning_rate": 9.3496828511513e-05, + "loss": 0.0112, + "step": 531100 + }, + { + "epoch": 1.38, + "learning_rate": 9.349294029514153e-05, + "loss": 0.0114, + "step": 531110 + }, + { + "epoch": 1.38, + "learning_rate": 9.348905207877007e-05, + "loss": 0.0074, + "step": 531120 + }, + { + "epoch": 1.38, + "learning_rate": 9.34851638623986e-05, + "loss": 0.009, + "step": 531130 + }, + { + "epoch": 1.38, + "learning_rate": 9.348127564602714e-05, + "loss": 0.0074, + "step": 531140 + }, + { + "epoch": 1.38, + "learning_rate": 9.347738742965567e-05, + "loss": 0.0094, + "step": 531150 + }, + { + "epoch": 1.38, + "learning_rate": 9.347349921328421e-05, + "loss": 0.0117, + "step": 531160 + }, + { + "epoch": 1.38, + "learning_rate": 9.346961099691274e-05, + "loss": 0.008, + "step": 531170 + }, + { + "epoch": 1.38, + "learning_rate": 9.34657227805413e-05, + "loss": 0.0097, + "step": 531180 + }, + { + "epoch": 1.38, + "learning_rate": 9.346183456416982e-05, + "loss": 0.0093, + "step": 531190 + }, + { + "epoch": 1.38, + "learning_rate": 9.345794634779834e-05, + "loss": 0.01, + "step": 531200 + }, + { + "epoch": 1.38, + "learning_rate": 9.34540581314269e-05, + "loss": 0.0093, + "step": 531210 + }, + { + "epoch": 1.38, + "learning_rate": 9.345016991505542e-05, + "loss": 0.0086, + "step": 531220 + }, + { + "epoch": 1.38, + "learning_rate": 9.344628169868396e-05, + "loss": 0.011, + "step": 531230 + }, + { + "epoch": 1.38, + "learning_rate": 9.344239348231249e-05, + "loss": 0.0086, + "step": 531240 + }, + { + "epoch": 1.38, + "learning_rate": 9.343850526594103e-05, + "loss": 0.0105, + "step": 531250 + }, + { + "epoch": 1.38, + "learning_rate": 9.343461704956956e-05, + "loss": 0.008, + "step": 531260 + }, + { + "epoch": 1.38, + "learning_rate": 9.34307288331981e-05, + "loss": 0.0102, + "step": 531270 + }, + { + "epoch": 1.38, + "learning_rate": 9.342684061682663e-05, + "loss": 0.0087, + "step": 531280 + }, + { + "epoch": 1.38, + "learning_rate": 9.342295240045517e-05, + "loss": 0.0116, + "step": 531290 + }, + { + "epoch": 1.38, + "learning_rate": 9.34190641840837e-05, + "loss": 0.0089, + "step": 531300 + }, + { + "epoch": 1.38, + "learning_rate": 9.341517596771224e-05, + "loss": 0.0077, + "step": 531310 + }, + { + "epoch": 1.38, + "learning_rate": 9.341128775134077e-05, + "loss": 0.0083, + "step": 531320 + }, + { + "epoch": 1.38, + "learning_rate": 9.340739953496931e-05, + "loss": 0.0089, + "step": 531330 + }, + { + "epoch": 1.38, + "learning_rate": 9.340351131859784e-05, + "loss": 0.01, + "step": 531340 + }, + { + "epoch": 1.38, + "learning_rate": 9.33996231022264e-05, + "loss": 0.0081, + "step": 531350 + }, + { + "epoch": 1.38, + "learning_rate": 9.339573488585491e-05, + "loss": 0.0095, + "step": 531360 + }, + { + "epoch": 1.38, + "learning_rate": 9.339184666948347e-05, + "loss": 0.0078, + "step": 531370 + }, + { + "epoch": 1.38, + "learning_rate": 9.3387958453112e-05, + "loss": 0.0077, + "step": 531380 + }, + { + "epoch": 1.38, + "learning_rate": 9.338407023674054e-05, + "loss": 0.0108, + "step": 531390 + }, + { + "epoch": 1.38, + "learning_rate": 9.338018202036906e-05, + "loss": 0.0094, + "step": 531400 + }, + { + "epoch": 1.38, + "learning_rate": 9.33762938039976e-05, + "loss": 0.0102, + "step": 531410 + }, + { + "epoch": 1.38, + "learning_rate": 9.337240558762613e-05, + "loss": 0.0084, + "step": 531420 + }, + { + "epoch": 1.38, + "learning_rate": 9.336851737125468e-05, + "loss": 0.0095, + "step": 531430 + }, + { + "epoch": 1.38, + "learning_rate": 9.33646291548832e-05, + "loss": 0.0103, + "step": 531440 + }, + { + "epoch": 1.38, + "learning_rate": 9.336074093851173e-05, + "loss": 0.0109, + "step": 531450 + }, + { + "epoch": 1.38, + "learning_rate": 9.335685272214027e-05, + "loss": 0.0088, + "step": 531460 + }, + { + "epoch": 1.38, + "learning_rate": 9.33529645057688e-05, + "loss": 0.0091, + "step": 531470 + }, + { + "epoch": 1.38, + "learning_rate": 9.334907628939734e-05, + "loss": 0.0088, + "step": 531480 + }, + { + "epoch": 1.38, + "learning_rate": 9.334518807302587e-05, + "loss": 0.0095, + "step": 531490 + }, + { + "epoch": 1.38, + "learning_rate": 9.334129985665441e-05, + "loss": 0.0102, + "step": 531500 + }, + { + "epoch": 1.38, + "learning_rate": 9.333741164028294e-05, + "loss": 0.0106, + "step": 531510 + }, + { + "epoch": 1.38, + "learning_rate": 9.333352342391148e-05, + "loss": 0.0091, + "step": 531520 + }, + { + "epoch": 1.38, + "learning_rate": 9.332963520754001e-05, + "loss": 0.0077, + "step": 531530 + }, + { + "epoch": 1.38, + "learning_rate": 9.332574699116857e-05, + "loss": 0.0114, + "step": 531540 + }, + { + "epoch": 1.38, + "learning_rate": 9.33218587747971e-05, + "loss": 0.0127, + "step": 531550 + }, + { + "epoch": 1.38, + "learning_rate": 9.331797055842564e-05, + "loss": 0.0088, + "step": 531560 + }, + { + "epoch": 1.38, + "learning_rate": 9.331408234205416e-05, + "loss": 0.0107, + "step": 531570 + }, + { + "epoch": 1.38, + "learning_rate": 9.33101941256827e-05, + "loss": 0.0103, + "step": 531580 + }, + { + "epoch": 1.38, + "learning_rate": 9.330630590931123e-05, + "loss": 0.0093, + "step": 531590 + }, + { + "epoch": 1.38, + "learning_rate": 9.330241769293977e-05, + "loss": 0.0081, + "step": 531600 + }, + { + "epoch": 1.38, + "learning_rate": 9.32985294765683e-05, + "loss": 0.0089, + "step": 531610 + }, + { + "epoch": 1.38, + "learning_rate": 9.329464126019684e-05, + "loss": 0.008, + "step": 531620 + }, + { + "epoch": 1.38, + "learning_rate": 9.329075304382537e-05, + "loss": 0.0091, + "step": 531630 + }, + { + "epoch": 1.38, + "learning_rate": 9.328686482745391e-05, + "loss": 0.011, + "step": 531640 + }, + { + "epoch": 1.38, + "learning_rate": 9.328297661108244e-05, + "loss": 0.0132, + "step": 531650 + }, + { + "epoch": 1.38, + "learning_rate": 9.327908839471098e-05, + "loss": 0.0093, + "step": 531660 + }, + { + "epoch": 1.38, + "learning_rate": 9.327520017833951e-05, + "loss": 0.0076, + "step": 531670 + }, + { + "epoch": 1.38, + "learning_rate": 9.327131196196805e-05, + "loss": 0.0112, + "step": 531680 + }, + { + "epoch": 1.38, + "learning_rate": 9.326742374559658e-05, + "loss": 0.0152, + "step": 531690 + }, + { + "epoch": 1.38, + "learning_rate": 9.326353552922511e-05, + "loss": 0.0104, + "step": 531700 + }, + { + "epoch": 1.38, + "learning_rate": 9.325964731285366e-05, + "loss": 0.0093, + "step": 531710 + }, + { + "epoch": 1.38, + "learning_rate": 9.325575909648218e-05, + "loss": 0.0111, + "step": 531720 + }, + { + "epoch": 1.38, + "learning_rate": 9.325187088011073e-05, + "loss": 0.0075, + "step": 531730 + }, + { + "epoch": 1.38, + "learning_rate": 9.324798266373926e-05, + "loss": 0.007, + "step": 531740 + }, + { + "epoch": 1.38, + "learning_rate": 9.32440944473678e-05, + "loss": 0.0114, + "step": 531750 + }, + { + "epoch": 1.38, + "learning_rate": 9.324020623099633e-05, + "loss": 0.0088, + "step": 531760 + }, + { + "epoch": 1.38, + "learning_rate": 9.323631801462487e-05, + "loss": 0.0086, + "step": 531770 + }, + { + "epoch": 1.38, + "learning_rate": 9.32324297982534e-05, + "loss": 0.0091, + "step": 531780 + }, + { + "epoch": 1.38, + "learning_rate": 9.322854158188194e-05, + "loss": 0.0105, + "step": 531790 + }, + { + "epoch": 1.38, + "learning_rate": 9.322465336551047e-05, + "loss": 0.0098, + "step": 531800 + }, + { + "epoch": 1.38, + "learning_rate": 9.322076514913901e-05, + "loss": 0.0093, + "step": 531810 + }, + { + "epoch": 1.38, + "learning_rate": 9.321687693276754e-05, + "loss": 0.0101, + "step": 531820 + }, + { + "epoch": 1.38, + "learning_rate": 9.321298871639608e-05, + "loss": 0.0068, + "step": 531830 + }, + { + "epoch": 1.38, + "learning_rate": 9.320910050002461e-05, + "loss": 0.0081, + "step": 531840 + }, + { + "epoch": 1.38, + "learning_rate": 9.320521228365315e-05, + "loss": 0.0114, + "step": 531850 + }, + { + "epoch": 1.38, + "learning_rate": 9.320132406728168e-05, + "loss": 0.0113, + "step": 531860 + }, + { + "epoch": 1.38, + "learning_rate": 9.319743585091022e-05, + "loss": 0.0092, + "step": 531870 + }, + { + "epoch": 1.38, + "learning_rate": 9.319354763453875e-05, + "loss": 0.0083, + "step": 531880 + }, + { + "epoch": 1.38, + "learning_rate": 9.31896594181673e-05, + "loss": 0.0088, + "step": 531890 + }, + { + "epoch": 1.38, + "learning_rate": 9.318577120179583e-05, + "loss": 0.0106, + "step": 531900 + }, + { + "epoch": 1.38, + "learning_rate": 9.318188298542438e-05, + "loss": 0.0104, + "step": 531910 + }, + { + "epoch": 1.38, + "learning_rate": 9.31779947690529e-05, + "loss": 0.0117, + "step": 531920 + }, + { + "epoch": 1.38, + "learning_rate": 9.317410655268145e-05, + "loss": 0.0125, + "step": 531930 + }, + { + "epoch": 1.38, + "learning_rate": 9.317021833630997e-05, + "loss": 0.011, + "step": 531940 + }, + { + "epoch": 1.38, + "learning_rate": 9.31663301199385e-05, + "loss": 0.0088, + "step": 531950 + }, + { + "epoch": 1.38, + "learning_rate": 9.316244190356704e-05, + "loss": 0.0088, + "step": 531960 + }, + { + "epoch": 1.38, + "learning_rate": 9.315855368719557e-05, + "loss": 0.0078, + "step": 531970 + }, + { + "epoch": 1.38, + "learning_rate": 9.315466547082411e-05, + "loss": 0.0075, + "step": 531980 + }, + { + "epoch": 1.38, + "learning_rate": 9.315077725445264e-05, + "loss": 0.0095, + "step": 531990 + }, + { + "epoch": 1.38, + "learning_rate": 9.314688903808118e-05, + "loss": 0.0085, + "step": 532000 + }, + { + "epoch": 1.38, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.0063028521835803986, + "eval_runtime": 108.1012, + "eval_samples_per_second": 18.501, + "eval_steps_per_second": 4.625, + "step": 532000 + }, + { + "epoch": 1.38, + "learning_rate": 9.314300082170971e-05, + "loss": 0.006, + "step": 532010 + }, + { + "epoch": 1.38, + "learning_rate": 9.313911260533825e-05, + "loss": 0.0104, + "step": 532020 + }, + { + "epoch": 1.38, + "learning_rate": 9.313522438896678e-05, + "loss": 0.0101, + "step": 532030 + }, + { + "epoch": 1.38, + "learning_rate": 9.313133617259532e-05, + "loss": 0.0079, + "step": 532040 + }, + { + "epoch": 1.38, + "learning_rate": 9.312744795622385e-05, + "loss": 0.012, + "step": 532050 + }, + { + "epoch": 1.38, + "learning_rate": 9.31235597398524e-05, + "loss": 0.0101, + "step": 532060 + }, + { + "epoch": 1.38, + "learning_rate": 9.311967152348093e-05, + "loss": 0.0085, + "step": 532070 + }, + { + "epoch": 1.38, + "learning_rate": 9.311578330710947e-05, + "loss": 0.0106, + "step": 532080 + }, + { + "epoch": 1.38, + "learning_rate": 9.3111895090738e-05, + "loss": 0.0092, + "step": 532090 + }, + { + "epoch": 1.38, + "learning_rate": 9.310800687436654e-05, + "loss": 0.0094, + "step": 532100 + }, + { + "epoch": 1.38, + "learning_rate": 9.310411865799507e-05, + "loss": 0.0074, + "step": 532110 + }, + { + "epoch": 1.38, + "learning_rate": 9.310023044162361e-05, + "loss": 0.0072, + "step": 532120 + }, + { + "epoch": 1.38, + "learning_rate": 9.309634222525214e-05, + "loss": 0.0132, + "step": 532130 + }, + { + "epoch": 1.38, + "learning_rate": 9.309245400888068e-05, + "loss": 0.0091, + "step": 532140 + }, + { + "epoch": 1.38, + "learning_rate": 9.308856579250921e-05, + "loss": 0.0105, + "step": 532150 + }, + { + "epoch": 1.38, + "learning_rate": 9.308467757613775e-05, + "loss": 0.0105, + "step": 532160 + }, + { + "epoch": 1.38, + "learning_rate": 9.308078935976628e-05, + "loss": 0.0111, + "step": 532170 + }, + { + "epoch": 1.38, + "learning_rate": 9.307690114339482e-05, + "loss": 0.0106, + "step": 532180 + }, + { + "epoch": 1.38, + "learning_rate": 9.307301292702335e-05, + "loss": 0.0111, + "step": 532190 + }, + { + "epoch": 1.38, + "learning_rate": 9.306912471065188e-05, + "loss": 0.0079, + "step": 532200 + }, + { + "epoch": 1.38, + "learning_rate": 9.306523649428042e-05, + "loss": 0.0081, + "step": 532210 + }, + { + "epoch": 1.38, + "learning_rate": 9.306134827790895e-05, + "loss": 0.0102, + "step": 532220 + }, + { + "epoch": 1.38, + "learning_rate": 9.305746006153749e-05, + "loss": 0.0115, + "step": 532230 + }, + { + "epoch": 1.38, + "learning_rate": 9.305357184516602e-05, + "loss": 0.0118, + "step": 532240 + }, + { + "epoch": 1.38, + "learning_rate": 9.304968362879457e-05, + "loss": 0.0117, + "step": 532250 + }, + { + "epoch": 1.38, + "learning_rate": 9.30457954124231e-05, + "loss": 0.011, + "step": 532260 + }, + { + "epoch": 1.38, + "learning_rate": 9.304190719605164e-05, + "loss": 0.0129, + "step": 532270 + }, + { + "epoch": 1.38, + "learning_rate": 9.303801897968017e-05, + "loss": 0.0127, + "step": 532280 + }, + { + "epoch": 1.38, + "learning_rate": 9.303413076330871e-05, + "loss": 0.0085, + "step": 532290 + }, + { + "epoch": 1.38, + "learning_rate": 9.303024254693724e-05, + "loss": 0.011, + "step": 532300 + }, + { + "epoch": 1.38, + "learning_rate": 9.302635433056578e-05, + "loss": 0.0074, + "step": 532310 + }, + { + "epoch": 1.38, + "learning_rate": 9.302246611419431e-05, + "loss": 0.0145, + "step": 532320 + }, + { + "epoch": 1.38, + "learning_rate": 9.301857789782285e-05, + "loss": 0.0108, + "step": 532330 + }, + { + "epoch": 1.38, + "learning_rate": 9.301468968145138e-05, + "loss": 0.0083, + "step": 532340 + }, + { + "epoch": 1.38, + "learning_rate": 9.301080146507992e-05, + "loss": 0.0097, + "step": 532350 + }, + { + "epoch": 1.38, + "learning_rate": 9.300691324870845e-05, + "loss": 0.011, + "step": 532360 + }, + { + "epoch": 1.38, + "learning_rate": 9.300302503233699e-05, + "loss": 0.0083, + "step": 532370 + }, + { + "epoch": 1.38, + "learning_rate": 9.299913681596552e-05, + "loss": 0.0111, + "step": 532380 + }, + { + "epoch": 1.38, + "learning_rate": 9.299524859959406e-05, + "loss": 0.0095, + "step": 532390 + }, + { + "epoch": 1.38, + "learning_rate": 9.299136038322259e-05, + "loss": 0.0108, + "step": 532400 + }, + { + "epoch": 1.38, + "learning_rate": 9.298747216685115e-05, + "loss": 0.009, + "step": 532410 + }, + { + "epoch": 1.38, + "learning_rate": 9.298358395047967e-05, + "loss": 0.008, + "step": 532420 + }, + { + "epoch": 1.38, + "learning_rate": 9.297969573410822e-05, + "loss": 0.0058, + "step": 532430 + }, + { + "epoch": 1.38, + "learning_rate": 9.297580751773674e-05, + "loss": 0.0092, + "step": 532440 + }, + { + "epoch": 1.38, + "learning_rate": 9.297191930136527e-05, + "loss": 0.0077, + "step": 532450 + }, + { + "epoch": 1.38, + "learning_rate": 9.296803108499381e-05, + "loss": 0.0096, + "step": 532460 + }, + { + "epoch": 1.38, + "learning_rate": 9.296414286862234e-05, + "loss": 0.0114, + "step": 532470 + }, + { + "epoch": 1.38, + "learning_rate": 9.296025465225088e-05, + "loss": 0.0076, + "step": 532480 + }, + { + "epoch": 1.38, + "learning_rate": 9.295636643587941e-05, + "loss": 0.0116, + "step": 532490 + }, + { + "epoch": 1.38, + "learning_rate": 9.295247821950795e-05, + "loss": 0.0108, + "step": 532500 + }, + { + "epoch": 1.38, + "learning_rate": 9.294859000313648e-05, + "loss": 0.0096, + "step": 532510 + }, + { + "epoch": 1.38, + "learning_rate": 9.294470178676502e-05, + "loss": 0.0098, + "step": 532520 + }, + { + "epoch": 1.38, + "learning_rate": 9.294081357039355e-05, + "loss": 0.008, + "step": 532530 + }, + { + "epoch": 1.38, + "learning_rate": 9.293692535402209e-05, + "loss": 0.0093, + "step": 532540 + }, + { + "epoch": 1.38, + "learning_rate": 9.293303713765062e-05, + "loss": 0.0084, + "step": 532550 + }, + { + "epoch": 1.38, + "learning_rate": 9.292914892127916e-05, + "loss": 0.0092, + "step": 532560 + }, + { + "epoch": 1.38, + "learning_rate": 9.292526070490769e-05, + "loss": 0.0079, + "step": 532570 + }, + { + "epoch": 1.38, + "learning_rate": 9.292137248853625e-05, + "loss": 0.0101, + "step": 532580 + }, + { + "epoch": 1.38, + "learning_rate": 9.291748427216476e-05, + "loss": 0.0093, + "step": 532590 + }, + { + "epoch": 1.38, + "learning_rate": 9.291359605579331e-05, + "loss": 0.011, + "step": 532600 + }, + { + "epoch": 1.38, + "learning_rate": 9.290970783942184e-05, + "loss": 0.0108, + "step": 532610 + }, + { + "epoch": 1.38, + "learning_rate": 9.290581962305038e-05, + "loss": 0.0093, + "step": 532620 + }, + { + "epoch": 1.38, + "learning_rate": 9.290193140667891e-05, + "loss": 0.0091, + "step": 532630 + }, + { + "epoch": 1.38, + "learning_rate": 9.289804319030745e-05, + "loss": 0.0087, + "step": 532640 + }, + { + "epoch": 1.38, + "learning_rate": 9.289415497393598e-05, + "loss": 0.0098, + "step": 532650 + }, + { + "epoch": 1.38, + "learning_rate": 9.289026675756452e-05, + "loss": 0.0072, + "step": 532660 + }, + { + "epoch": 1.38, + "learning_rate": 9.288637854119305e-05, + "loss": 0.0109, + "step": 532670 + }, + { + "epoch": 1.38, + "learning_rate": 9.28824903248216e-05, + "loss": 0.0113, + "step": 532680 + }, + { + "epoch": 1.38, + "learning_rate": 9.287860210845012e-05, + "loss": 0.0136, + "step": 532690 + }, + { + "epoch": 1.38, + "learning_rate": 9.287471389207865e-05, + "loss": 0.0101, + "step": 532700 + }, + { + "epoch": 1.38, + "learning_rate": 9.287082567570719e-05, + "loss": 0.0073, + "step": 532710 + }, + { + "epoch": 1.38, + "learning_rate": 9.286693745933572e-05, + "loss": 0.0101, + "step": 532720 + }, + { + "epoch": 1.38, + "learning_rate": 9.286304924296426e-05, + "loss": 0.0206, + "step": 532730 + }, + { + "epoch": 1.38, + "learning_rate": 9.285916102659279e-05, + "loss": 0.0087, + "step": 532740 + }, + { + "epoch": 1.38, + "learning_rate": 9.285527281022133e-05, + "loss": 0.0091, + "step": 532750 + }, + { + "epoch": 1.38, + "learning_rate": 9.285138459384986e-05, + "loss": 0.0085, + "step": 532760 + }, + { + "epoch": 1.38, + "learning_rate": 9.284749637747841e-05, + "loss": 0.01, + "step": 532770 + }, + { + "epoch": 1.38, + "learning_rate": 9.284360816110694e-05, + "loss": 0.0097, + "step": 532780 + }, + { + "epoch": 1.38, + "learning_rate": 9.283971994473548e-05, + "loss": 0.009, + "step": 532790 + }, + { + "epoch": 1.38, + "learning_rate": 9.283583172836401e-05, + "loss": 0.0101, + "step": 532800 + }, + { + "epoch": 1.38, + "learning_rate": 9.283194351199255e-05, + "loss": 0.0114, + "step": 532810 + }, + { + "epoch": 1.38, + "learning_rate": 9.282805529562108e-05, + "loss": 0.0086, + "step": 532820 + }, + { + "epoch": 1.38, + "learning_rate": 9.282416707924962e-05, + "loss": 0.0148, + "step": 532830 + }, + { + "epoch": 1.38, + "learning_rate": 9.282027886287815e-05, + "loss": 0.0085, + "step": 532840 + }, + { + "epoch": 1.38, + "learning_rate": 9.281639064650669e-05, + "loss": 0.0074, + "step": 532850 + }, + { + "epoch": 1.38, + "learning_rate": 9.281250243013522e-05, + "loss": 0.0102, + "step": 532860 + }, + { + "epoch": 1.38, + "learning_rate": 9.280861421376376e-05, + "loss": 0.012, + "step": 532870 + }, + { + "epoch": 1.38, + "learning_rate": 9.280472599739229e-05, + "loss": 0.0076, + "step": 532880 + }, + { + "epoch": 1.38, + "learning_rate": 9.280083778102083e-05, + "loss": 0.0132, + "step": 532890 + }, + { + "epoch": 1.38, + "learning_rate": 9.279694956464936e-05, + "loss": 0.0095, + "step": 532900 + }, + { + "epoch": 1.38, + "learning_rate": 9.27930613482779e-05, + "loss": 0.0084, + "step": 532910 + }, + { + "epoch": 1.38, + "learning_rate": 9.278917313190643e-05, + "loss": 0.0101, + "step": 532920 + }, + { + "epoch": 1.38, + "learning_rate": 9.278528491553499e-05, + "loss": 0.0089, + "step": 532930 + }, + { + "epoch": 1.38, + "learning_rate": 9.278139669916351e-05, + "loss": 0.0083, + "step": 532940 + }, + { + "epoch": 1.38, + "learning_rate": 9.277750848279203e-05, + "loss": 0.0087, + "step": 532950 + }, + { + "epoch": 1.38, + "learning_rate": 9.277362026642058e-05, + "loss": 0.011, + "step": 532960 + }, + { + "epoch": 1.38, + "learning_rate": 9.276973205004911e-05, + "loss": 0.009, + "step": 532970 + }, + { + "epoch": 1.38, + "learning_rate": 9.276584383367765e-05, + "loss": 0.014, + "step": 532980 + }, + { + "epoch": 1.38, + "learning_rate": 9.276195561730618e-05, + "loss": 0.0064, + "step": 532990 + }, + { + "epoch": 1.38, + "learning_rate": 9.275806740093472e-05, + "loss": 0.0092, + "step": 533000 + }, + { + "epoch": 1.38, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.006268115248531103, + "eval_runtime": 107.8458, + "eval_samples_per_second": 18.545, + "eval_steps_per_second": 4.636, + "step": 533000 + }, + { + "epoch": 1.38, + "learning_rate": 9.275417918456325e-05, + "loss": 0.0076, + "step": 533010 + }, + { + "epoch": 1.38, + "learning_rate": 9.275029096819179e-05, + "loss": 0.0086, + "step": 533020 + }, + { + "epoch": 1.38, + "learning_rate": 9.274640275182032e-05, + "loss": 0.0094, + "step": 533030 + }, + { + "epoch": 1.38, + "learning_rate": 9.274251453544886e-05, + "loss": 0.0094, + "step": 533040 + }, + { + "epoch": 1.38, + "learning_rate": 9.273862631907739e-05, + "loss": 0.0104, + "step": 533050 + }, + { + "epoch": 1.38, + "learning_rate": 9.273473810270593e-05, + "loss": 0.0095, + "step": 533060 + }, + { + "epoch": 1.38, + "learning_rate": 9.273084988633446e-05, + "loss": 0.0086, + "step": 533070 + }, + { + "epoch": 1.38, + "learning_rate": 9.2726961669963e-05, + "loss": 0.0093, + "step": 533080 + }, + { + "epoch": 1.38, + "learning_rate": 9.272307345359153e-05, + "loss": 0.0094, + "step": 533090 + }, + { + "epoch": 1.38, + "learning_rate": 9.271918523722009e-05, + "loss": 0.0094, + "step": 533100 + }, + { + "epoch": 1.38, + "learning_rate": 9.27152970208486e-05, + "loss": 0.0106, + "step": 533110 + }, + { + "epoch": 1.38, + "learning_rate": 9.271140880447715e-05, + "loss": 0.0081, + "step": 533120 + }, + { + "epoch": 1.38, + "learning_rate": 9.270752058810568e-05, + "loss": 0.0092, + "step": 533130 + }, + { + "epoch": 1.38, + "learning_rate": 9.270363237173422e-05, + "loss": 0.0116, + "step": 533140 + }, + { + "epoch": 1.38, + "learning_rate": 9.269974415536275e-05, + "loss": 0.0119, + "step": 533150 + }, + { + "epoch": 1.38, + "learning_rate": 9.26958559389913e-05, + "loss": 0.0085, + "step": 533160 + }, + { + "epoch": 1.38, + "learning_rate": 9.269196772261982e-05, + "loss": 0.011, + "step": 533170 + }, + { + "epoch": 1.38, + "learning_rate": 9.268807950624836e-05, + "loss": 0.0108, + "step": 533180 + }, + { + "epoch": 1.38, + "learning_rate": 9.268419128987689e-05, + "loss": 0.0092, + "step": 533190 + }, + { + "epoch": 1.38, + "learning_rate": 9.268030307350542e-05, + "loss": 0.014, + "step": 533200 + }, + { + "epoch": 1.38, + "learning_rate": 9.267641485713396e-05, + "loss": 0.0085, + "step": 533210 + }, + { + "epoch": 1.38, + "learning_rate": 9.267252664076249e-05, + "loss": 0.0106, + "step": 533220 + }, + { + "epoch": 1.38, + "learning_rate": 9.266863842439103e-05, + "loss": 0.0084, + "step": 533230 + }, + { + "epoch": 1.38, + "learning_rate": 9.266475020801956e-05, + "loss": 0.0089, + "step": 533240 + }, + { + "epoch": 1.38, + "learning_rate": 9.26608619916481e-05, + "loss": 0.009, + "step": 533250 + }, + { + "epoch": 1.38, + "learning_rate": 9.265697377527663e-05, + "loss": 0.0107, + "step": 533260 + }, + { + "epoch": 1.38, + "learning_rate": 9.265308555890517e-05, + "loss": 0.0143, + "step": 533270 + }, + { + "epoch": 1.38, + "learning_rate": 9.26491973425337e-05, + "loss": 0.0078, + "step": 533280 + }, + { + "epoch": 1.38, + "learning_rate": 9.264530912616225e-05, + "loss": 0.0093, + "step": 533290 + }, + { + "epoch": 1.38, + "learning_rate": 9.264142090979078e-05, + "loss": 0.0078, + "step": 533300 + }, + { + "epoch": 1.38, + "learning_rate": 9.263753269341932e-05, + "loss": 0.0093, + "step": 533310 + }, + { + "epoch": 1.38, + "learning_rate": 9.263364447704785e-05, + "loss": 0.0084, + "step": 533320 + }, + { + "epoch": 1.38, + "learning_rate": 9.26297562606764e-05, + "loss": 0.0101, + "step": 533330 + }, + { + "epoch": 1.38, + "learning_rate": 9.262586804430492e-05, + "loss": 0.0075, + "step": 533340 + }, + { + "epoch": 1.38, + "learning_rate": 9.262197982793346e-05, + "loss": 0.0135, + "step": 533350 + }, + { + "epoch": 1.38, + "learning_rate": 9.261809161156199e-05, + "loss": 0.009, + "step": 533360 + }, + { + "epoch": 1.38, + "learning_rate": 9.261420339519053e-05, + "loss": 0.0109, + "step": 533370 + }, + { + "epoch": 1.38, + "learning_rate": 9.261031517881906e-05, + "loss": 0.0121, + "step": 533380 + }, + { + "epoch": 1.38, + "learning_rate": 9.26064269624476e-05, + "loss": 0.0133, + "step": 533390 + }, + { + "epoch": 1.38, + "learning_rate": 9.260253874607613e-05, + "loss": 0.0094, + "step": 533400 + }, + { + "epoch": 1.38, + "learning_rate": 9.259865052970467e-05, + "loss": 0.0137, + "step": 533410 + }, + { + "epoch": 1.38, + "learning_rate": 9.25947623133332e-05, + "loss": 0.0117, + "step": 533420 + }, + { + "epoch": 1.38, + "learning_rate": 9.259087409696173e-05, + "loss": 0.0082, + "step": 533430 + }, + { + "epoch": 1.38, + "learning_rate": 9.258698588059027e-05, + "loss": 0.0085, + "step": 533440 + }, + { + "epoch": 1.38, + "learning_rate": 9.25830976642188e-05, + "loss": 0.0074, + "step": 533450 + }, + { + "epoch": 1.38, + "learning_rate": 9.257920944784734e-05, + "loss": 0.01, + "step": 533460 + }, + { + "epoch": 1.38, + "learning_rate": 9.257532123147587e-05, + "loss": 0.01, + "step": 533470 + }, + { + "epoch": 1.38, + "learning_rate": 9.257143301510442e-05, + "loss": 0.0123, + "step": 533480 + }, + { + "epoch": 1.38, + "learning_rate": 9.256754479873295e-05, + "loss": 0.0103, + "step": 533490 + }, + { + "epoch": 1.38, + "learning_rate": 9.256365658236149e-05, + "loss": 0.0074, + "step": 533500 + }, + { + "epoch": 1.38, + "learning_rate": 9.255976836599002e-05, + "loss": 0.0099, + "step": 533510 + }, + { + "epoch": 1.38, + "learning_rate": 9.255588014961856e-05, + "loss": 0.0085, + "step": 533520 + }, + { + "epoch": 1.38, + "learning_rate": 9.255199193324709e-05, + "loss": 0.0115, + "step": 533530 + }, + { + "epoch": 1.38, + "learning_rate": 9.254810371687563e-05, + "loss": 0.0148, + "step": 533540 + }, + { + "epoch": 1.38, + "learning_rate": 9.254421550050416e-05, + "loss": 0.0114, + "step": 533550 + }, + { + "epoch": 1.38, + "learning_rate": 9.25403272841327e-05, + "loss": 0.011, + "step": 533560 + }, + { + "epoch": 1.38, + "learning_rate": 9.253643906776123e-05, + "loss": 0.0094, + "step": 533570 + }, + { + "epoch": 1.38, + "learning_rate": 9.253255085138977e-05, + "loss": 0.0086, + "step": 533580 + }, + { + "epoch": 1.38, + "learning_rate": 9.25286626350183e-05, + "loss": 0.0078, + "step": 533590 + }, + { + "epoch": 1.38, + "learning_rate": 9.252477441864684e-05, + "loss": 0.0126, + "step": 533600 + }, + { + "epoch": 1.38, + "learning_rate": 9.252088620227537e-05, + "loss": 0.0116, + "step": 533610 + }, + { + "epoch": 1.38, + "learning_rate": 9.251699798590391e-05, + "loss": 0.0099, + "step": 533620 + }, + { + "epoch": 1.38, + "learning_rate": 9.251310976953244e-05, + "loss": 0.0118, + "step": 533630 + }, + { + "epoch": 1.38, + "learning_rate": 9.2509221553161e-05, + "loss": 0.01, + "step": 533640 + }, + { + "epoch": 1.38, + "learning_rate": 9.250533333678952e-05, + "loss": 0.0082, + "step": 533650 + }, + { + "epoch": 1.38, + "learning_rate": 9.250144512041806e-05, + "loss": 0.0125, + "step": 533660 + }, + { + "epoch": 1.38, + "learning_rate": 9.249755690404659e-05, + "loss": 0.0112, + "step": 533670 + }, + { + "epoch": 1.38, + "learning_rate": 9.249366868767512e-05, + "loss": 0.0077, + "step": 533680 + }, + { + "epoch": 1.38, + "learning_rate": 9.248978047130366e-05, + "loss": 0.0098, + "step": 533690 + }, + { + "epoch": 1.38, + "learning_rate": 9.248589225493219e-05, + "loss": 0.009, + "step": 533700 + }, + { + "epoch": 1.38, + "learning_rate": 9.248200403856073e-05, + "loss": 0.0109, + "step": 533710 + }, + { + "epoch": 1.38, + "learning_rate": 9.247811582218926e-05, + "loss": 0.009, + "step": 533720 + }, + { + "epoch": 1.38, + "learning_rate": 9.24742276058178e-05, + "loss": 0.0104, + "step": 533730 + }, + { + "epoch": 1.38, + "learning_rate": 9.247033938944633e-05, + "loss": 0.0071, + "step": 533740 + }, + { + "epoch": 1.38, + "learning_rate": 9.246645117307487e-05, + "loss": 0.0093, + "step": 533750 + }, + { + "epoch": 1.38, + "learning_rate": 9.24625629567034e-05, + "loss": 0.0079, + "step": 533760 + }, + { + "epoch": 1.38, + "learning_rate": 9.245867474033194e-05, + "loss": 0.0093, + "step": 533770 + }, + { + "epoch": 1.38, + "learning_rate": 9.245478652396047e-05, + "loss": 0.0087, + "step": 533780 + }, + { + "epoch": 1.38, + "learning_rate": 9.245089830758901e-05, + "loss": 0.0095, + "step": 533790 + }, + { + "epoch": 1.38, + "learning_rate": 9.244701009121754e-05, + "loss": 0.008, + "step": 533800 + }, + { + "epoch": 1.38, + "learning_rate": 9.24431218748461e-05, + "loss": 0.0139, + "step": 533810 + }, + { + "epoch": 1.38, + "learning_rate": 9.243923365847461e-05, + "loss": 0.0108, + "step": 533820 + }, + { + "epoch": 1.38, + "learning_rate": 9.243534544210316e-05, + "loss": 0.0082, + "step": 533830 + }, + { + "epoch": 1.38, + "learning_rate": 9.243145722573169e-05, + "loss": 0.0123, + "step": 533840 + }, + { + "epoch": 1.38, + "learning_rate": 9.242756900936023e-05, + "loss": 0.0107, + "step": 533850 + }, + { + "epoch": 1.38, + "learning_rate": 9.242368079298876e-05, + "loss": 0.0084, + "step": 533860 + }, + { + "epoch": 1.38, + "learning_rate": 9.24197925766173e-05, + "loss": 0.0119, + "step": 533870 + }, + { + "epoch": 1.38, + "learning_rate": 9.241590436024583e-05, + "loss": 0.0095, + "step": 533880 + }, + { + "epoch": 1.38, + "learning_rate": 9.241201614387437e-05, + "loss": 0.0094, + "step": 533890 + }, + { + "epoch": 1.38, + "learning_rate": 9.24081279275029e-05, + "loss": 0.0086, + "step": 533900 + }, + { + "epoch": 1.38, + "learning_rate": 9.240423971113144e-05, + "loss": 0.0082, + "step": 533910 + }, + { + "epoch": 1.38, + "learning_rate": 9.240035149475997e-05, + "loss": 0.0087, + "step": 533920 + }, + { + "epoch": 1.38, + "learning_rate": 9.23964632783885e-05, + "loss": 0.0102, + "step": 533930 + }, + { + "epoch": 1.38, + "learning_rate": 9.239257506201704e-05, + "loss": 0.0103, + "step": 533940 + }, + { + "epoch": 1.38, + "learning_rate": 9.238868684564557e-05, + "loss": 0.0096, + "step": 533950 + }, + { + "epoch": 1.38, + "learning_rate": 9.238479862927411e-05, + "loss": 0.0093, + "step": 533960 + }, + { + "epoch": 1.38, + "learning_rate": 9.238091041290264e-05, + "loss": 0.0111, + "step": 533970 + }, + { + "epoch": 1.38, + "learning_rate": 9.237702219653118e-05, + "loss": 0.0109, + "step": 533980 + }, + { + "epoch": 1.38, + "learning_rate": 9.237313398015971e-05, + "loss": 0.0128, + "step": 533990 + }, + { + "epoch": 1.38, + "learning_rate": 9.236924576378826e-05, + "loss": 0.0091, + "step": 534000 + }, + { + "epoch": 1.38, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.0059846206568181515, + "eval_runtime": 107.6906, + "eval_samples_per_second": 18.572, + "eval_steps_per_second": 4.643, + "step": 534000 + }, + { + "epoch": 1.38, + "learning_rate": 9.236535754741679e-05, + "loss": 0.0112, + "step": 534010 + }, + { + "epoch": 1.38, + "learning_rate": 9.236146933104533e-05, + "loss": 0.0117, + "step": 534020 + }, + { + "epoch": 1.38, + "learning_rate": 9.235758111467386e-05, + "loss": 0.0094, + "step": 534030 + }, + { + "epoch": 1.38, + "learning_rate": 9.23536928983024e-05, + "loss": 0.0092, + "step": 534040 + }, + { + "epoch": 1.38, + "learning_rate": 9.234980468193093e-05, + "loss": 0.0064, + "step": 534050 + }, + { + "epoch": 1.38, + "learning_rate": 9.234591646555947e-05, + "loss": 0.0108, + "step": 534060 + }, + { + "epoch": 1.38, + "learning_rate": 9.2342028249188e-05, + "loss": 0.008, + "step": 534070 + }, + { + "epoch": 1.38, + "learning_rate": 9.233814003281654e-05, + "loss": 0.0117, + "step": 534080 + }, + { + "epoch": 1.38, + "learning_rate": 9.233425181644507e-05, + "loss": 0.0069, + "step": 534090 + }, + { + "epoch": 1.38, + "learning_rate": 9.233036360007361e-05, + "loss": 0.0096, + "step": 534100 + }, + { + "epoch": 1.38, + "learning_rate": 9.232647538370214e-05, + "loss": 0.0091, + "step": 534110 + }, + { + "epoch": 1.38, + "learning_rate": 9.232258716733068e-05, + "loss": 0.0097, + "step": 534120 + }, + { + "epoch": 1.38, + "learning_rate": 9.231869895095921e-05, + "loss": 0.0107, + "step": 534130 + }, + { + "epoch": 1.38, + "learning_rate": 9.231481073458775e-05, + "loss": 0.0108, + "step": 534140 + }, + { + "epoch": 1.38, + "learning_rate": 9.231092251821628e-05, + "loss": 0.0099, + "step": 534150 + }, + { + "epoch": 1.38, + "learning_rate": 9.230703430184483e-05, + "loss": 0.0106, + "step": 534160 + }, + { + "epoch": 1.38, + "learning_rate": 9.230314608547336e-05, + "loss": 0.0092, + "step": 534170 + }, + { + "epoch": 1.38, + "learning_rate": 9.229925786910188e-05, + "loss": 0.0139, + "step": 534180 + }, + { + "epoch": 1.38, + "learning_rate": 9.229536965273043e-05, + "loss": 0.0089, + "step": 534190 + }, + { + "epoch": 1.38, + "learning_rate": 9.229148143635896e-05, + "loss": 0.0088, + "step": 534200 + }, + { + "epoch": 1.38, + "learning_rate": 9.22875932199875e-05, + "loss": 0.0105, + "step": 534210 + }, + { + "epoch": 1.38, + "learning_rate": 9.228370500361603e-05, + "loss": 0.0095, + "step": 534220 + }, + { + "epoch": 1.38, + "learning_rate": 9.227981678724457e-05, + "loss": 0.0093, + "step": 534230 + }, + { + "epoch": 1.38, + "learning_rate": 9.22759285708731e-05, + "loss": 0.0088, + "step": 534240 + }, + { + "epoch": 1.38, + "learning_rate": 9.227204035450164e-05, + "loss": 0.0094, + "step": 534250 + }, + { + "epoch": 1.38, + "learning_rate": 9.226815213813017e-05, + "loss": 0.0102, + "step": 534260 + }, + { + "epoch": 1.38, + "learning_rate": 9.226426392175871e-05, + "loss": 0.0117, + "step": 534270 + }, + { + "epoch": 1.38, + "learning_rate": 9.226037570538724e-05, + "loss": 0.0081, + "step": 534280 + }, + { + "epoch": 1.38, + "learning_rate": 9.225648748901578e-05, + "loss": 0.0098, + "step": 534290 + }, + { + "epoch": 1.38, + "learning_rate": 9.225259927264431e-05, + "loss": 0.0076, + "step": 534300 + }, + { + "epoch": 1.39, + "learning_rate": 9.224871105627285e-05, + "loss": 0.0084, + "step": 534310 + }, + { + "epoch": 1.39, + "learning_rate": 9.224482283990138e-05, + "loss": 0.0114, + "step": 534320 + }, + { + "epoch": 1.39, + "learning_rate": 9.224093462352993e-05, + "loss": 0.0081, + "step": 534330 + }, + { + "epoch": 1.39, + "learning_rate": 9.223704640715845e-05, + "loss": 0.0102, + "step": 534340 + }, + { + "epoch": 1.39, + "learning_rate": 9.2233158190787e-05, + "loss": 0.0085, + "step": 534350 + }, + { + "epoch": 1.39, + "learning_rate": 9.222926997441553e-05, + "loss": 0.0099, + "step": 534360 + }, + { + "epoch": 1.39, + "learning_rate": 9.222538175804407e-05, + "loss": 0.0081, + "step": 534370 + }, + { + "epoch": 1.39, + "learning_rate": 9.22214935416726e-05, + "loss": 0.0111, + "step": 534380 + }, + { + "epoch": 1.39, + "learning_rate": 9.221760532530114e-05, + "loss": 0.0101, + "step": 534390 + }, + { + "epoch": 1.39, + "learning_rate": 9.221371710892967e-05, + "loss": 0.0121, + "step": 534400 + }, + { + "epoch": 1.39, + "learning_rate": 9.220982889255821e-05, + "loss": 0.01, + "step": 534410 + }, + { + "epoch": 1.39, + "learning_rate": 9.220594067618674e-05, + "loss": 0.0126, + "step": 534420 + }, + { + "epoch": 1.39, + "learning_rate": 9.220205245981527e-05, + "loss": 0.0106, + "step": 534430 + }, + { + "epoch": 1.39, + "learning_rate": 9.219816424344381e-05, + "loss": 0.0082, + "step": 534440 + }, + { + "epoch": 1.39, + "learning_rate": 9.219427602707234e-05, + "loss": 0.0093, + "step": 534450 + }, + { + "epoch": 1.39, + "learning_rate": 9.219038781070088e-05, + "loss": 0.0099, + "step": 534460 + }, + { + "epoch": 1.39, + "learning_rate": 9.218649959432941e-05, + "loss": 0.0075, + "step": 534470 + }, + { + "epoch": 1.39, + "learning_rate": 9.218261137795795e-05, + "loss": 0.0102, + "step": 534480 + }, + { + "epoch": 1.39, + "learning_rate": 9.217872316158648e-05, + "loss": 0.0101, + "step": 534490 + }, + { + "epoch": 1.39, + "learning_rate": 9.217483494521502e-05, + "loss": 0.0102, + "step": 534500 + }, + { + "epoch": 1.39, + "learning_rate": 9.217094672884355e-05, + "loss": 0.0082, + "step": 534510 + }, + { + "epoch": 1.39, + "learning_rate": 9.21670585124721e-05, + "loss": 0.0091, + "step": 534520 + }, + { + "epoch": 1.39, + "learning_rate": 9.216317029610063e-05, + "loss": 0.0092, + "step": 534530 + }, + { + "epoch": 1.39, + "learning_rate": 9.215928207972917e-05, + "loss": 0.0092, + "step": 534540 + }, + { + "epoch": 1.39, + "learning_rate": 9.21553938633577e-05, + "loss": 0.0093, + "step": 534550 + }, + { + "epoch": 1.39, + "learning_rate": 9.215150564698624e-05, + "loss": 0.0106, + "step": 534560 + }, + { + "epoch": 1.39, + "learning_rate": 9.214761743061477e-05, + "loss": 0.0079, + "step": 534570 + }, + { + "epoch": 1.39, + "learning_rate": 9.214372921424331e-05, + "loss": 0.0084, + "step": 534580 + }, + { + "epoch": 1.39, + "learning_rate": 9.213984099787184e-05, + "loss": 0.0096, + "step": 534590 + }, + { + "epoch": 1.39, + "learning_rate": 9.213595278150038e-05, + "loss": 0.0096, + "step": 534600 + }, + { + "epoch": 1.39, + "learning_rate": 9.213206456512891e-05, + "loss": 0.0108, + "step": 534610 + }, + { + "epoch": 1.39, + "learning_rate": 9.212817634875745e-05, + "loss": 0.0099, + "step": 534620 + }, + { + "epoch": 1.39, + "learning_rate": 9.212428813238598e-05, + "loss": 0.0093, + "step": 534630 + }, + { + "epoch": 1.39, + "learning_rate": 9.212039991601452e-05, + "loss": 0.008, + "step": 534640 + }, + { + "epoch": 1.39, + "learning_rate": 9.211651169964305e-05, + "loss": 0.01, + "step": 534650 + }, + { + "epoch": 1.39, + "learning_rate": 9.211262348327159e-05, + "loss": 0.0155, + "step": 534660 + }, + { + "epoch": 1.39, + "learning_rate": 9.210873526690012e-05, + "loss": 0.0094, + "step": 534670 + }, + { + "epoch": 1.39, + "learning_rate": 9.210484705052865e-05, + "loss": 0.0075, + "step": 534680 + }, + { + "epoch": 1.39, + "learning_rate": 9.21009588341572e-05, + "loss": 0.0093, + "step": 534690 + }, + { + "epoch": 1.39, + "learning_rate": 9.209707061778572e-05, + "loss": 0.0075, + "step": 534700 + }, + { + "epoch": 1.39, + "learning_rate": 9.209318240141427e-05, + "loss": 0.0086, + "step": 534710 + }, + { + "epoch": 1.39, + "learning_rate": 9.20892941850428e-05, + "loss": 0.0081, + "step": 534720 + }, + { + "epoch": 1.39, + "learning_rate": 9.208540596867134e-05, + "loss": 0.0078, + "step": 534730 + }, + { + "epoch": 1.39, + "learning_rate": 9.208151775229987e-05, + "loss": 0.0074, + "step": 534740 + }, + { + "epoch": 1.39, + "learning_rate": 9.207762953592841e-05, + "loss": 0.0091, + "step": 534750 + }, + { + "epoch": 1.39, + "learning_rate": 9.207374131955694e-05, + "loss": 0.0095, + "step": 534760 + }, + { + "epoch": 1.39, + "learning_rate": 9.206985310318548e-05, + "loss": 0.0082, + "step": 534770 + }, + { + "epoch": 1.39, + "learning_rate": 9.206596488681401e-05, + "loss": 0.0093, + "step": 534780 + }, + { + "epoch": 1.39, + "learning_rate": 9.206207667044255e-05, + "loss": 0.0079, + "step": 534790 + }, + { + "epoch": 1.39, + "learning_rate": 9.205818845407108e-05, + "loss": 0.0079, + "step": 534800 + }, + { + "epoch": 1.39, + "learning_rate": 9.205430023769962e-05, + "loss": 0.0095, + "step": 534810 + }, + { + "epoch": 1.39, + "learning_rate": 9.205041202132815e-05, + "loss": 0.0106, + "step": 534820 + }, + { + "epoch": 1.39, + "learning_rate": 9.204652380495669e-05, + "loss": 0.0077, + "step": 534830 + }, + { + "epoch": 1.39, + "learning_rate": 9.204263558858522e-05, + "loss": 0.0071, + "step": 534840 + }, + { + "epoch": 1.39, + "learning_rate": 9.203874737221376e-05, + "loss": 0.0108, + "step": 534850 + }, + { + "epoch": 1.39, + "learning_rate": 9.203485915584229e-05, + "loss": 0.0074, + "step": 534860 + }, + { + "epoch": 1.39, + "learning_rate": 9.203097093947084e-05, + "loss": 0.0084, + "step": 534870 + }, + { + "epoch": 1.39, + "learning_rate": 9.202708272309937e-05, + "loss": 0.0087, + "step": 534880 + }, + { + "epoch": 1.39, + "learning_rate": 9.202319450672791e-05, + "loss": 0.0098, + "step": 534890 + }, + { + "epoch": 1.39, + "learning_rate": 9.201930629035644e-05, + "loss": 0.0083, + "step": 534900 + }, + { + "epoch": 1.39, + "learning_rate": 9.201541807398498e-05, + "loss": 0.0075, + "step": 534910 + }, + { + "epoch": 1.39, + "learning_rate": 9.201152985761351e-05, + "loss": 0.0088, + "step": 534920 + }, + { + "epoch": 1.39, + "learning_rate": 9.200764164124204e-05, + "loss": 0.0122, + "step": 534930 + }, + { + "epoch": 1.39, + "learning_rate": 9.200375342487058e-05, + "loss": 0.0083, + "step": 534940 + }, + { + "epoch": 1.39, + "learning_rate": 9.199986520849911e-05, + "loss": 0.01, + "step": 534950 + }, + { + "epoch": 1.39, + "learning_rate": 9.199597699212765e-05, + "loss": 0.0097, + "step": 534960 + }, + { + "epoch": 1.39, + "learning_rate": 9.199208877575618e-05, + "loss": 0.0122, + "step": 534970 + }, + { + "epoch": 1.39, + "learning_rate": 9.198820055938472e-05, + "loss": 0.0076, + "step": 534980 + }, + { + "epoch": 1.39, + "learning_rate": 9.198431234301325e-05, + "loss": 0.009, + "step": 534990 + }, + { + "epoch": 1.39, + "learning_rate": 9.198042412664179e-05, + "loss": 0.0105, + "step": 535000 + }, + { + "epoch": 1.39, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.0063683707267045975, + "eval_runtime": 107.8309, + "eval_samples_per_second": 18.548, + "eval_steps_per_second": 4.637, + "step": 535000 + }, + { + "epoch": 1.39, + "learning_rate": 9.197653591027032e-05, + "loss": 0.0114, + "step": 535010 + }, + { + "epoch": 1.39, + "learning_rate": 9.197264769389886e-05, + "loss": 0.0086, + "step": 535020 + }, + { + "epoch": 1.39, + "learning_rate": 9.196875947752739e-05, + "loss": 0.0101, + "step": 535030 + }, + { + "epoch": 1.39, + "learning_rate": 9.196487126115594e-05, + "loss": 0.0121, + "step": 535040 + }, + { + "epoch": 1.39, + "learning_rate": 9.196098304478446e-05, + "loss": 0.0115, + "step": 535050 + }, + { + "epoch": 1.39, + "learning_rate": 9.195709482841301e-05, + "loss": 0.0124, + "step": 535060 + }, + { + "epoch": 1.39, + "learning_rate": 9.195320661204154e-05, + "loss": 0.0079, + "step": 535070 + }, + { + "epoch": 1.39, + "learning_rate": 9.194931839567008e-05, + "loss": 0.012, + "step": 535080 + }, + { + "epoch": 1.39, + "learning_rate": 9.194543017929861e-05, + "loss": 0.0095, + "step": 535090 + }, + { + "epoch": 1.39, + "learning_rate": 9.194154196292715e-05, + "loss": 0.0083, + "step": 535100 + }, + { + "epoch": 1.39, + "learning_rate": 9.193765374655568e-05, + "loss": 0.0091, + "step": 535110 + }, + { + "epoch": 1.39, + "learning_rate": 9.193376553018422e-05, + "loss": 0.0097, + "step": 535120 + }, + { + "epoch": 1.39, + "learning_rate": 9.192987731381275e-05, + "loss": 0.0109, + "step": 535130 + }, + { + "epoch": 1.39, + "learning_rate": 9.192598909744129e-05, + "loss": 0.0109, + "step": 535140 + }, + { + "epoch": 1.39, + "learning_rate": 9.192210088106982e-05, + "loss": 0.0107, + "step": 535150 + }, + { + "epoch": 1.39, + "learning_rate": 9.191821266469836e-05, + "loss": 0.009, + "step": 535160 + }, + { + "epoch": 1.39, + "learning_rate": 9.191432444832689e-05, + "loss": 0.0101, + "step": 535170 + }, + { + "epoch": 1.39, + "learning_rate": 9.191043623195542e-05, + "loss": 0.0101, + "step": 535180 + }, + { + "epoch": 1.39, + "learning_rate": 9.190654801558396e-05, + "loss": 0.0095, + "step": 535190 + }, + { + "epoch": 1.39, + "learning_rate": 9.190265979921249e-05, + "loss": 0.0143, + "step": 535200 + }, + { + "epoch": 1.39, + "learning_rate": 9.189877158284103e-05, + "loss": 0.0089, + "step": 535210 + }, + { + "epoch": 1.39, + "learning_rate": 9.189488336646956e-05, + "loss": 0.0076, + "step": 535220 + }, + { + "epoch": 1.39, + "learning_rate": 9.189099515009811e-05, + "loss": 0.0103, + "step": 535230 + }, + { + "epoch": 1.39, + "learning_rate": 9.188710693372664e-05, + "loss": 0.0117, + "step": 535240 + }, + { + "epoch": 1.39, + "learning_rate": 9.188321871735518e-05, + "loss": 0.0087, + "step": 535250 + }, + { + "epoch": 1.39, + "learning_rate": 9.187933050098371e-05, + "loss": 0.0093, + "step": 535260 + }, + { + "epoch": 1.39, + "learning_rate": 9.187544228461225e-05, + "loss": 0.01, + "step": 535270 + }, + { + "epoch": 1.39, + "learning_rate": 9.187155406824078e-05, + "loss": 0.0105, + "step": 535280 + }, + { + "epoch": 1.39, + "learning_rate": 9.186766585186932e-05, + "loss": 0.0098, + "step": 535290 + }, + { + "epoch": 1.39, + "learning_rate": 9.186377763549785e-05, + "loss": 0.0091, + "step": 535300 + }, + { + "epoch": 1.39, + "learning_rate": 9.185988941912639e-05, + "loss": 0.0092, + "step": 535310 + }, + { + "epoch": 1.39, + "learning_rate": 9.185600120275492e-05, + "loss": 0.0097, + "step": 535320 + }, + { + "epoch": 1.39, + "learning_rate": 9.185211298638346e-05, + "loss": 0.0096, + "step": 535330 + }, + { + "epoch": 1.39, + "learning_rate": 9.184822477001199e-05, + "loss": 0.0073, + "step": 535340 + }, + { + "epoch": 1.39, + "learning_rate": 9.184433655364053e-05, + "loss": 0.0103, + "step": 535350 + }, + { + "epoch": 1.39, + "learning_rate": 9.184044833726906e-05, + "loss": 0.0071, + "step": 535360 + }, + { + "epoch": 1.39, + "learning_rate": 9.18365601208976e-05, + "loss": 0.0065, + "step": 535370 + }, + { + "epoch": 1.39, + "learning_rate": 9.183267190452613e-05, + "loss": 0.0108, + "step": 535380 + }, + { + "epoch": 1.39, + "learning_rate": 9.182878368815468e-05, + "loss": 0.0087, + "step": 535390 + }, + { + "epoch": 1.39, + "learning_rate": 9.182489547178321e-05, + "loss": 0.0089, + "step": 535400 + }, + { + "epoch": 1.39, + "learning_rate": 9.182100725541175e-05, + "loss": 0.0103, + "step": 535410 + }, + { + "epoch": 1.39, + "learning_rate": 9.181711903904028e-05, + "loss": 0.0118, + "step": 535420 + }, + { + "epoch": 1.39, + "learning_rate": 9.181323082266881e-05, + "loss": 0.0114, + "step": 535430 + }, + { + "epoch": 1.39, + "learning_rate": 9.180934260629735e-05, + "loss": 0.009, + "step": 535440 + }, + { + "epoch": 1.39, + "learning_rate": 9.180545438992588e-05, + "loss": 0.0067, + "step": 535450 + }, + { + "epoch": 1.39, + "learning_rate": 9.180156617355442e-05, + "loss": 0.0108, + "step": 535460 + }, + { + "epoch": 1.39, + "learning_rate": 9.179767795718295e-05, + "loss": 0.0091, + "step": 535470 + }, + { + "epoch": 1.39, + "learning_rate": 9.179378974081149e-05, + "loss": 0.0079, + "step": 535480 + }, + { + "epoch": 1.39, + "learning_rate": 9.178990152444002e-05, + "loss": 0.0121, + "step": 535490 + }, + { + "epoch": 1.39, + "learning_rate": 9.178601330806856e-05, + "loss": 0.0109, + "step": 535500 + }, + { + "epoch": 1.39, + "learning_rate": 9.178212509169709e-05, + "loss": 0.0069, + "step": 535510 + }, + { + "epoch": 1.39, + "learning_rate": 9.177823687532563e-05, + "loss": 0.0095, + "step": 535520 + }, + { + "epoch": 1.39, + "learning_rate": 9.177434865895416e-05, + "loss": 0.0075, + "step": 535530 + }, + { + "epoch": 1.39, + "learning_rate": 9.17704604425827e-05, + "loss": 0.0101, + "step": 535540 + }, + { + "epoch": 1.39, + "learning_rate": 9.176657222621123e-05, + "loss": 0.0088, + "step": 535550 + }, + { + "epoch": 1.39, + "learning_rate": 9.176268400983978e-05, + "loss": 0.0051, + "step": 535560 + }, + { + "epoch": 1.39, + "learning_rate": 9.17587957934683e-05, + "loss": 0.0108, + "step": 535570 + }, + { + "epoch": 1.39, + "learning_rate": 9.175490757709685e-05, + "loss": 0.0064, + "step": 535580 + }, + { + "epoch": 1.39, + "learning_rate": 9.175101936072538e-05, + "loss": 0.0097, + "step": 535590 + }, + { + "epoch": 1.39, + "learning_rate": 9.174713114435392e-05, + "loss": 0.0134, + "step": 535600 + }, + { + "epoch": 1.39, + "learning_rate": 9.174324292798245e-05, + "loss": 0.0092, + "step": 535610 + }, + { + "epoch": 1.39, + "learning_rate": 9.173935471161099e-05, + "loss": 0.0087, + "step": 535620 + }, + { + "epoch": 1.39, + "learning_rate": 9.173546649523952e-05, + "loss": 0.0083, + "step": 535630 + }, + { + "epoch": 1.39, + "learning_rate": 9.173157827886806e-05, + "loss": 0.0114, + "step": 535640 + }, + { + "epoch": 1.39, + "learning_rate": 9.172769006249659e-05, + "loss": 0.0092, + "step": 535650 + }, + { + "epoch": 1.39, + "learning_rate": 9.172380184612513e-05, + "loss": 0.0078, + "step": 535660 + }, + { + "epoch": 1.39, + "learning_rate": 9.171991362975366e-05, + "loss": 0.0088, + "step": 535670 + }, + { + "epoch": 1.39, + "learning_rate": 9.171602541338219e-05, + "loss": 0.0112, + "step": 535680 + }, + { + "epoch": 1.39, + "learning_rate": 9.171213719701073e-05, + "loss": 0.0096, + "step": 535690 + }, + { + "epoch": 1.39, + "learning_rate": 9.170824898063926e-05, + "loss": 0.01, + "step": 535700 + }, + { + "epoch": 1.39, + "learning_rate": 9.17043607642678e-05, + "loss": 0.0083, + "step": 535710 + }, + { + "epoch": 1.39, + "learning_rate": 9.170047254789633e-05, + "loss": 0.0098, + "step": 535720 + }, + { + "epoch": 1.39, + "learning_rate": 9.169658433152487e-05, + "loss": 0.01, + "step": 535730 + }, + { + "epoch": 1.39, + "learning_rate": 9.16926961151534e-05, + "loss": 0.0207, + "step": 535740 + }, + { + "epoch": 1.39, + "learning_rate": 9.168880789878195e-05, + "loss": 0.0081, + "step": 535750 + }, + { + "epoch": 1.39, + "learning_rate": 9.168491968241048e-05, + "loss": 0.0102, + "step": 535760 + }, + { + "epoch": 1.39, + "learning_rate": 9.168103146603902e-05, + "loss": 0.0088, + "step": 535770 + }, + { + "epoch": 1.39, + "learning_rate": 9.167714324966755e-05, + "loss": 0.0101, + "step": 535780 + }, + { + "epoch": 1.39, + "learning_rate": 9.167325503329609e-05, + "loss": 0.0075, + "step": 535790 + }, + { + "epoch": 1.39, + "learning_rate": 9.166936681692462e-05, + "loss": 0.0143, + "step": 535800 + }, + { + "epoch": 1.39, + "learning_rate": 9.166547860055316e-05, + "loss": 0.0101, + "step": 535810 + }, + { + "epoch": 1.39, + "learning_rate": 9.166159038418169e-05, + "loss": 0.0113, + "step": 535820 + }, + { + "epoch": 1.39, + "learning_rate": 9.165770216781023e-05, + "loss": 0.01, + "step": 535830 + }, + { + "epoch": 1.39, + "learning_rate": 9.165381395143876e-05, + "loss": 0.009, + "step": 535840 + }, + { + "epoch": 1.39, + "learning_rate": 9.16499257350673e-05, + "loss": 0.0109, + "step": 535850 + }, + { + "epoch": 1.39, + "learning_rate": 9.164603751869583e-05, + "loss": 0.0088, + "step": 535860 + }, + { + "epoch": 1.39, + "learning_rate": 9.164214930232437e-05, + "loss": 0.0095, + "step": 535870 + }, + { + "epoch": 1.39, + "learning_rate": 9.16382610859529e-05, + "loss": 0.0099, + "step": 535880 + }, + { + "epoch": 1.39, + "learning_rate": 9.163437286958144e-05, + "loss": 0.011, + "step": 535890 + }, + { + "epoch": 1.39, + "learning_rate": 9.163048465320997e-05, + "loss": 0.01, + "step": 535900 + }, + { + "epoch": 1.39, + "learning_rate": 9.162659643683852e-05, + "loss": 0.0104, + "step": 535910 + }, + { + "epoch": 1.39, + "learning_rate": 9.162270822046705e-05, + "loss": 0.0116, + "step": 535920 + }, + { + "epoch": 1.39, + "learning_rate": 9.161882000409557e-05, + "loss": 0.0074, + "step": 535930 + }, + { + "epoch": 1.39, + "learning_rate": 9.161493178772412e-05, + "loss": 0.0121, + "step": 535940 + }, + { + "epoch": 1.39, + "learning_rate": 9.161104357135265e-05, + "loss": 0.011, + "step": 535950 + }, + { + "epoch": 1.39, + "learning_rate": 9.160715535498119e-05, + "loss": 0.0113, + "step": 535960 + }, + { + "epoch": 1.39, + "learning_rate": 9.160326713860972e-05, + "loss": 0.0101, + "step": 535970 + }, + { + "epoch": 1.39, + "learning_rate": 9.159937892223826e-05, + "loss": 0.0097, + "step": 535980 + }, + { + "epoch": 1.39, + "learning_rate": 9.159549070586679e-05, + "loss": 0.0083, + "step": 535990 + }, + { + "epoch": 1.39, + "learning_rate": 9.159160248949533e-05, + "loss": 0.0079, + "step": 536000 + }, + { + "epoch": 1.39, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.006177127361297607, + "eval_runtime": 107.7114, + "eval_samples_per_second": 18.568, + "eval_steps_per_second": 4.642, + "step": 536000 + }, + { + "epoch": 1.39, + "learning_rate": 9.158771427312386e-05, + "loss": 0.0102, + "step": 536010 + }, + { + "epoch": 1.39, + "learning_rate": 9.15838260567524e-05, + "loss": 0.0093, + "step": 536020 + }, + { + "epoch": 1.39, + "learning_rate": 9.157993784038093e-05, + "loss": 0.0102, + "step": 536030 + }, + { + "epoch": 1.39, + "learning_rate": 9.157604962400947e-05, + "loss": 0.0107, + "step": 536040 + }, + { + "epoch": 1.39, + "learning_rate": 9.1572161407638e-05, + "loss": 0.0125, + "step": 536050 + }, + { + "epoch": 1.39, + "learning_rate": 9.156827319126654e-05, + "loss": 0.0101, + "step": 536060 + }, + { + "epoch": 1.39, + "learning_rate": 9.156438497489507e-05, + "loss": 0.0091, + "step": 536070 + }, + { + "epoch": 1.39, + "learning_rate": 9.156049675852361e-05, + "loss": 0.0107, + "step": 536080 + }, + { + "epoch": 1.39, + "learning_rate": 9.155660854215214e-05, + "loss": 0.0079, + "step": 536090 + }, + { + "epoch": 1.39, + "learning_rate": 9.155272032578069e-05, + "loss": 0.0098, + "step": 536100 + }, + { + "epoch": 1.39, + "learning_rate": 9.154883210940922e-05, + "loss": 0.0092, + "step": 536110 + }, + { + "epoch": 1.39, + "learning_rate": 9.154494389303776e-05, + "loss": 0.0096, + "step": 536120 + }, + { + "epoch": 1.39, + "learning_rate": 9.154105567666629e-05, + "loss": 0.0079, + "step": 536130 + }, + { + "epoch": 1.39, + "learning_rate": 9.153716746029483e-05, + "loss": 0.0095, + "step": 536140 + }, + { + "epoch": 1.39, + "learning_rate": 9.153327924392336e-05, + "loss": 0.0087, + "step": 536150 + }, + { + "epoch": 1.39, + "learning_rate": 9.152939102755189e-05, + "loss": 0.0093, + "step": 536160 + }, + { + "epoch": 1.39, + "learning_rate": 9.152550281118043e-05, + "loss": 0.0089, + "step": 536170 + }, + { + "epoch": 1.39, + "learning_rate": 9.152161459480896e-05, + "loss": 0.0078, + "step": 536180 + }, + { + "epoch": 1.39, + "learning_rate": 9.15177263784375e-05, + "loss": 0.0098, + "step": 536190 + }, + { + "epoch": 1.39, + "learning_rate": 9.151383816206603e-05, + "loss": 0.011, + "step": 536200 + }, + { + "epoch": 1.39, + "learning_rate": 9.150994994569457e-05, + "loss": 0.0074, + "step": 536210 + }, + { + "epoch": 1.39, + "learning_rate": 9.15060617293231e-05, + "loss": 0.0097, + "step": 536220 + }, + { + "epoch": 1.39, + "learning_rate": 9.150217351295164e-05, + "loss": 0.011, + "step": 536230 + }, + { + "epoch": 1.39, + "learning_rate": 9.149828529658017e-05, + "loss": 0.0084, + "step": 536240 + }, + { + "epoch": 1.39, + "learning_rate": 9.149439708020871e-05, + "loss": 0.0102, + "step": 536250 + }, + { + "epoch": 1.39, + "learning_rate": 9.149050886383724e-05, + "loss": 0.0096, + "step": 536260 + }, + { + "epoch": 1.39, + "learning_rate": 9.148662064746579e-05, + "loss": 0.0077, + "step": 536270 + }, + { + "epoch": 1.39, + "learning_rate": 9.14827324310943e-05, + "loss": 0.0088, + "step": 536280 + }, + { + "epoch": 1.39, + "learning_rate": 9.147884421472286e-05, + "loss": 0.0083, + "step": 536290 + }, + { + "epoch": 1.39, + "learning_rate": 9.147495599835139e-05, + "loss": 0.0096, + "step": 536300 + }, + { + "epoch": 1.39, + "learning_rate": 9.147106778197993e-05, + "loss": 0.01, + "step": 536310 + }, + { + "epoch": 1.39, + "learning_rate": 9.146717956560846e-05, + "loss": 0.0084, + "step": 536320 + }, + { + "epoch": 1.39, + "learning_rate": 9.1463291349237e-05, + "loss": 0.0087, + "step": 536330 + }, + { + "epoch": 1.39, + "learning_rate": 9.145940313286553e-05, + "loss": 0.0112, + "step": 536340 + }, + { + "epoch": 1.39, + "learning_rate": 9.145551491649407e-05, + "loss": 0.0066, + "step": 536350 + }, + { + "epoch": 1.39, + "learning_rate": 9.14516267001226e-05, + "loss": 0.0096, + "step": 536360 + }, + { + "epoch": 1.39, + "learning_rate": 9.144773848375114e-05, + "loss": 0.0074, + "step": 536370 + }, + { + "epoch": 1.39, + "learning_rate": 9.144385026737967e-05, + "loss": 0.0073, + "step": 536380 + }, + { + "epoch": 1.39, + "learning_rate": 9.143996205100821e-05, + "loss": 0.0082, + "step": 536390 + }, + { + "epoch": 1.39, + "learning_rate": 9.143607383463674e-05, + "loss": 0.0093, + "step": 536400 + }, + { + "epoch": 1.39, + "learning_rate": 9.143218561826527e-05, + "loss": 0.0109, + "step": 536410 + }, + { + "epoch": 1.39, + "learning_rate": 9.142829740189381e-05, + "loss": 0.0119, + "step": 536420 + }, + { + "epoch": 1.39, + "learning_rate": 9.142440918552234e-05, + "loss": 0.0081, + "step": 536430 + }, + { + "epoch": 1.39, + "learning_rate": 9.142052096915088e-05, + "loss": 0.0079, + "step": 536440 + }, + { + "epoch": 1.39, + "learning_rate": 9.14166327527794e-05, + "loss": 0.0069, + "step": 536450 + }, + { + "epoch": 1.39, + "learning_rate": 9.141274453640796e-05, + "loss": 0.0075, + "step": 536460 + }, + { + "epoch": 1.39, + "learning_rate": 9.140885632003649e-05, + "loss": 0.0091, + "step": 536470 + }, + { + "epoch": 1.39, + "learning_rate": 9.140496810366503e-05, + "loss": 0.0092, + "step": 536480 + }, + { + "epoch": 1.39, + "learning_rate": 9.140107988729356e-05, + "loss": 0.0087, + "step": 536490 + }, + { + "epoch": 1.39, + "learning_rate": 9.13971916709221e-05, + "loss": 0.0077, + "step": 536500 + }, + { + "epoch": 1.39, + "learning_rate": 9.139330345455063e-05, + "loss": 0.0066, + "step": 536510 + }, + { + "epoch": 1.39, + "learning_rate": 9.138941523817917e-05, + "loss": 0.0093, + "step": 536520 + }, + { + "epoch": 1.39, + "learning_rate": 9.13855270218077e-05, + "loss": 0.0106, + "step": 536530 + }, + { + "epoch": 1.39, + "learning_rate": 9.138163880543624e-05, + "loss": 0.0129, + "step": 536540 + }, + { + "epoch": 1.39, + "learning_rate": 9.137775058906477e-05, + "loss": 0.0105, + "step": 536550 + }, + { + "epoch": 1.39, + "learning_rate": 9.137386237269331e-05, + "loss": 0.0129, + "step": 536560 + }, + { + "epoch": 1.39, + "learning_rate": 9.136997415632184e-05, + "loss": 0.0091, + "step": 536570 + }, + { + "epoch": 1.39, + "learning_rate": 9.136608593995038e-05, + "loss": 0.0104, + "step": 536580 + }, + { + "epoch": 1.39, + "learning_rate": 9.136219772357891e-05, + "loss": 0.0086, + "step": 536590 + }, + { + "epoch": 1.39, + "learning_rate": 9.135830950720745e-05, + "loss": 0.0092, + "step": 536600 + }, + { + "epoch": 1.39, + "learning_rate": 9.135442129083598e-05, + "loss": 0.0098, + "step": 536610 + }, + { + "epoch": 1.39, + "learning_rate": 9.135053307446453e-05, + "loss": 0.0094, + "step": 536620 + }, + { + "epoch": 1.39, + "learning_rate": 9.134664485809306e-05, + "loss": 0.0116, + "step": 536630 + }, + { + "epoch": 1.39, + "learning_rate": 9.13427566417216e-05, + "loss": 0.0129, + "step": 536640 + }, + { + "epoch": 1.39, + "learning_rate": 9.133886842535013e-05, + "loss": 0.0079, + "step": 536650 + }, + { + "epoch": 1.39, + "learning_rate": 9.133498020897866e-05, + "loss": 0.009, + "step": 536660 + }, + { + "epoch": 1.39, + "learning_rate": 9.13310919926072e-05, + "loss": 0.0074, + "step": 536670 + }, + { + "epoch": 1.39, + "learning_rate": 9.132720377623573e-05, + "loss": 0.0088, + "step": 536680 + }, + { + "epoch": 1.39, + "learning_rate": 9.132331555986427e-05, + "loss": 0.0066, + "step": 536690 + }, + { + "epoch": 1.39, + "learning_rate": 9.13194273434928e-05, + "loss": 0.0125, + "step": 536700 + }, + { + "epoch": 1.39, + "learning_rate": 9.131553912712134e-05, + "loss": 0.0099, + "step": 536710 + }, + { + "epoch": 1.39, + "learning_rate": 9.131165091074987e-05, + "loss": 0.0099, + "step": 536720 + }, + { + "epoch": 1.39, + "learning_rate": 9.130776269437841e-05, + "loss": 0.0087, + "step": 536730 + }, + { + "epoch": 1.39, + "learning_rate": 9.130387447800694e-05, + "loss": 0.0119, + "step": 536740 + }, + { + "epoch": 1.39, + "learning_rate": 9.129998626163548e-05, + "loss": 0.0099, + "step": 536750 + }, + { + "epoch": 1.39, + "learning_rate": 9.129609804526401e-05, + "loss": 0.0086, + "step": 536760 + }, + { + "epoch": 1.39, + "learning_rate": 9.129220982889255e-05, + "loss": 0.0079, + "step": 536770 + }, + { + "epoch": 1.39, + "learning_rate": 9.128832161252108e-05, + "loss": 0.0089, + "step": 536780 + }, + { + "epoch": 1.39, + "learning_rate": 9.128443339614963e-05, + "loss": 0.0113, + "step": 536790 + }, + { + "epoch": 1.39, + "learning_rate": 9.128054517977815e-05, + "loss": 0.009, + "step": 536800 + }, + { + "epoch": 1.39, + "learning_rate": 9.12766569634067e-05, + "loss": 0.0099, + "step": 536810 + }, + { + "epoch": 1.39, + "learning_rate": 9.127276874703523e-05, + "loss": 0.0107, + "step": 536820 + }, + { + "epoch": 1.39, + "learning_rate": 9.126888053066377e-05, + "loss": 0.009, + "step": 536830 + }, + { + "epoch": 1.39, + "learning_rate": 9.12649923142923e-05, + "loss": 0.0083, + "step": 536840 + }, + { + "epoch": 1.39, + "learning_rate": 9.126110409792084e-05, + "loss": 0.0108, + "step": 536850 + }, + { + "epoch": 1.39, + "learning_rate": 9.125721588154937e-05, + "loss": 0.0089, + "step": 536860 + }, + { + "epoch": 1.39, + "learning_rate": 9.125332766517791e-05, + "loss": 0.0073, + "step": 536870 + }, + { + "epoch": 1.39, + "learning_rate": 9.124943944880644e-05, + "loss": 0.009, + "step": 536880 + }, + { + "epoch": 1.39, + "learning_rate": 9.124555123243498e-05, + "loss": 0.0092, + "step": 536890 + }, + { + "epoch": 1.39, + "learning_rate": 9.124166301606351e-05, + "loss": 0.0079, + "step": 536900 + }, + { + "epoch": 1.39, + "learning_rate": 9.123777479969204e-05, + "loss": 0.0125, + "step": 536910 + }, + { + "epoch": 1.39, + "learning_rate": 9.123388658332058e-05, + "loss": 0.0079, + "step": 536920 + }, + { + "epoch": 1.39, + "learning_rate": 9.12299983669491e-05, + "loss": 0.0078, + "step": 536930 + }, + { + "epoch": 1.39, + "learning_rate": 9.122611015057765e-05, + "loss": 0.0059, + "step": 536940 + }, + { + "epoch": 1.39, + "learning_rate": 9.122222193420618e-05, + "loss": 0.0086, + "step": 536950 + }, + { + "epoch": 1.39, + "learning_rate": 9.121833371783472e-05, + "loss": 0.0104, + "step": 536960 + }, + { + "epoch": 1.39, + "learning_rate": 9.121444550146325e-05, + "loss": 0.0094, + "step": 536970 + }, + { + "epoch": 1.39, + "learning_rate": 9.12105572850918e-05, + "loss": 0.01, + "step": 536980 + }, + { + "epoch": 1.39, + "learning_rate": 9.120666906872033e-05, + "loss": 0.011, + "step": 536990 + }, + { + "epoch": 1.39, + "learning_rate": 9.120278085234887e-05, + "loss": 0.01, + "step": 537000 + }, + { + "epoch": 1.39, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.006287885829806328, + "eval_runtime": 107.8496, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 537000 + }, + { + "epoch": 1.39, + "learning_rate": 9.11988926359774e-05, + "loss": 0.0101, + "step": 537010 + }, + { + "epoch": 1.39, + "learning_rate": 9.119500441960594e-05, + "loss": 0.0075, + "step": 537020 + }, + { + "epoch": 1.39, + "learning_rate": 9.119111620323447e-05, + "loss": 0.0102, + "step": 537030 + }, + { + "epoch": 1.39, + "learning_rate": 9.118722798686301e-05, + "loss": 0.0087, + "step": 537040 + }, + { + "epoch": 1.39, + "learning_rate": 9.118333977049154e-05, + "loss": 0.0124, + "step": 537050 + }, + { + "epoch": 1.39, + "learning_rate": 9.117945155412008e-05, + "loss": 0.0104, + "step": 537060 + }, + { + "epoch": 1.39, + "learning_rate": 9.117556333774861e-05, + "loss": 0.0086, + "step": 537070 + }, + { + "epoch": 1.39, + "learning_rate": 9.117167512137715e-05, + "loss": 0.0089, + "step": 537080 + }, + { + "epoch": 1.39, + "learning_rate": 9.116778690500568e-05, + "loss": 0.0104, + "step": 537090 + }, + { + "epoch": 1.39, + "learning_rate": 9.116389868863422e-05, + "loss": 0.0103, + "step": 537100 + }, + { + "epoch": 1.39, + "learning_rate": 9.116001047226275e-05, + "loss": 0.0075, + "step": 537110 + }, + { + "epoch": 1.39, + "learning_rate": 9.115612225589129e-05, + "loss": 0.0096, + "step": 537120 + }, + { + "epoch": 1.39, + "learning_rate": 9.115223403951982e-05, + "loss": 0.0089, + "step": 537130 + }, + { + "epoch": 1.39, + "learning_rate": 9.114834582314837e-05, + "loss": 0.0092, + "step": 537140 + }, + { + "epoch": 1.39, + "learning_rate": 9.11444576067769e-05, + "loss": 0.0125, + "step": 537150 + }, + { + "epoch": 1.39, + "learning_rate": 9.114056939040541e-05, + "loss": 0.0091, + "step": 537160 + }, + { + "epoch": 1.39, + "learning_rate": 9.113668117403397e-05, + "loss": 0.0112, + "step": 537170 + }, + { + "epoch": 1.39, + "learning_rate": 9.11327929576625e-05, + "loss": 0.0099, + "step": 537180 + }, + { + "epoch": 1.39, + "learning_rate": 9.112890474129104e-05, + "loss": 0.0099, + "step": 537190 + }, + { + "epoch": 1.39, + "learning_rate": 9.112501652491957e-05, + "loss": 0.0093, + "step": 537200 + }, + { + "epoch": 1.39, + "learning_rate": 9.112112830854811e-05, + "loss": 0.0099, + "step": 537210 + }, + { + "epoch": 1.39, + "learning_rate": 9.111724009217664e-05, + "loss": 0.0108, + "step": 537220 + }, + { + "epoch": 1.39, + "learning_rate": 9.111335187580518e-05, + "loss": 0.0091, + "step": 537230 + }, + { + "epoch": 1.39, + "learning_rate": 9.110946365943371e-05, + "loss": 0.0097, + "step": 537240 + }, + { + "epoch": 1.39, + "learning_rate": 9.110557544306225e-05, + "loss": 0.0113, + "step": 537250 + }, + { + "epoch": 1.39, + "learning_rate": 9.110168722669078e-05, + "loss": 0.0105, + "step": 537260 + }, + { + "epoch": 1.39, + "learning_rate": 9.109779901031932e-05, + "loss": 0.0084, + "step": 537270 + }, + { + "epoch": 1.39, + "learning_rate": 9.109391079394785e-05, + "loss": 0.0105, + "step": 537280 + }, + { + "epoch": 1.39, + "learning_rate": 9.109002257757639e-05, + "loss": 0.0075, + "step": 537290 + }, + { + "epoch": 1.39, + "learning_rate": 9.108613436120492e-05, + "loss": 0.0118, + "step": 537300 + }, + { + "epoch": 1.39, + "learning_rate": 9.108224614483347e-05, + "loss": 0.0079, + "step": 537310 + }, + { + "epoch": 1.39, + "learning_rate": 9.107835792846199e-05, + "loss": 0.0086, + "step": 537320 + }, + { + "epoch": 1.39, + "learning_rate": 9.107446971209054e-05, + "loss": 0.0095, + "step": 537330 + }, + { + "epoch": 1.39, + "learning_rate": 9.107058149571907e-05, + "loss": 0.0103, + "step": 537340 + }, + { + "epoch": 1.39, + "learning_rate": 9.106669327934761e-05, + "loss": 0.0077, + "step": 537350 + }, + { + "epoch": 1.39, + "learning_rate": 9.106280506297614e-05, + "loss": 0.0106, + "step": 537360 + }, + { + "epoch": 1.39, + "learning_rate": 9.105891684660468e-05, + "loss": 0.0118, + "step": 537370 + }, + { + "epoch": 1.39, + "learning_rate": 9.105502863023321e-05, + "loss": 0.0088, + "step": 537380 + }, + { + "epoch": 1.39, + "learning_rate": 9.105114041386175e-05, + "loss": 0.0091, + "step": 537390 + }, + { + "epoch": 1.39, + "learning_rate": 9.104725219749028e-05, + "loss": 0.0101, + "step": 537400 + }, + { + "epoch": 1.39, + "learning_rate": 9.104336398111881e-05, + "loss": 0.0104, + "step": 537410 + }, + { + "epoch": 1.39, + "learning_rate": 9.103947576474735e-05, + "loss": 0.0074, + "step": 537420 + }, + { + "epoch": 1.39, + "learning_rate": 9.103558754837588e-05, + "loss": 0.0102, + "step": 537430 + }, + { + "epoch": 1.39, + "learning_rate": 9.103169933200442e-05, + "loss": 0.0112, + "step": 537440 + }, + { + "epoch": 1.39, + "learning_rate": 9.102781111563295e-05, + "loss": 0.0104, + "step": 537450 + }, + { + "epoch": 1.39, + "learning_rate": 9.102392289926149e-05, + "loss": 0.0101, + "step": 537460 + }, + { + "epoch": 1.39, + "learning_rate": 9.102003468289002e-05, + "loss": 0.0091, + "step": 537470 + }, + { + "epoch": 1.39, + "learning_rate": 9.101614646651856e-05, + "loss": 0.008, + "step": 537480 + }, + { + "epoch": 1.39, + "learning_rate": 9.101225825014709e-05, + "loss": 0.0103, + "step": 537490 + }, + { + "epoch": 1.39, + "learning_rate": 9.100837003377564e-05, + "loss": 0.0126, + "step": 537500 + }, + { + "epoch": 1.39, + "learning_rate": 9.100448181740417e-05, + "loss": 0.0104, + "step": 537510 + }, + { + "epoch": 1.39, + "learning_rate": 9.100059360103271e-05, + "loss": 0.0099, + "step": 537520 + }, + { + "epoch": 1.39, + "learning_rate": 9.099670538466124e-05, + "loss": 0.0128, + "step": 537530 + }, + { + "epoch": 1.39, + "learning_rate": 9.099281716828978e-05, + "loss": 0.0103, + "step": 537540 + }, + { + "epoch": 1.39, + "learning_rate": 9.098892895191831e-05, + "loss": 0.0088, + "step": 537550 + }, + { + "epoch": 1.39, + "learning_rate": 9.098504073554685e-05, + "loss": 0.0118, + "step": 537560 + }, + { + "epoch": 1.39, + "learning_rate": 9.098115251917538e-05, + "loss": 0.0105, + "step": 537570 + }, + { + "epoch": 1.39, + "learning_rate": 9.097726430280392e-05, + "loss": 0.0088, + "step": 537580 + }, + { + "epoch": 1.39, + "learning_rate": 9.097337608643245e-05, + "loss": 0.0091, + "step": 537590 + }, + { + "epoch": 1.39, + "learning_rate": 9.096948787006099e-05, + "loss": 0.008, + "step": 537600 + }, + { + "epoch": 1.39, + "learning_rate": 9.096559965368952e-05, + "loss": 0.0154, + "step": 537610 + }, + { + "epoch": 1.39, + "learning_rate": 9.096171143731806e-05, + "loss": 0.0085, + "step": 537620 + }, + { + "epoch": 1.39, + "learning_rate": 9.095782322094659e-05, + "loss": 0.007, + "step": 537630 + }, + { + "epoch": 1.39, + "learning_rate": 9.095393500457513e-05, + "loss": 0.0101, + "step": 537640 + }, + { + "epoch": 1.39, + "learning_rate": 9.095004678820366e-05, + "loss": 0.0106, + "step": 537650 + }, + { + "epoch": 1.39, + "learning_rate": 9.094615857183219e-05, + "loss": 0.0089, + "step": 537660 + }, + { + "epoch": 1.39, + "learning_rate": 9.094227035546073e-05, + "loss": 0.0082, + "step": 537670 + }, + { + "epoch": 1.39, + "learning_rate": 9.093838213908925e-05, + "loss": 0.0069, + "step": 537680 + }, + { + "epoch": 1.39, + "learning_rate": 9.093449392271781e-05, + "loss": 0.0114, + "step": 537690 + }, + { + "epoch": 1.39, + "learning_rate": 9.093060570634634e-05, + "loss": 0.0128, + "step": 537700 + }, + { + "epoch": 1.39, + "learning_rate": 9.092671748997488e-05, + "loss": 0.0094, + "step": 537710 + }, + { + "epoch": 1.39, + "learning_rate": 9.092282927360341e-05, + "loss": 0.009, + "step": 537720 + }, + { + "epoch": 1.39, + "learning_rate": 9.091894105723195e-05, + "loss": 0.0088, + "step": 537730 + }, + { + "epoch": 1.39, + "learning_rate": 9.091505284086048e-05, + "loss": 0.0105, + "step": 537740 + }, + { + "epoch": 1.39, + "learning_rate": 9.091116462448902e-05, + "loss": 0.0077, + "step": 537750 + }, + { + "epoch": 1.39, + "learning_rate": 9.090727640811755e-05, + "loss": 0.0151, + "step": 537760 + }, + { + "epoch": 1.39, + "learning_rate": 9.090338819174609e-05, + "loss": 0.0075, + "step": 537770 + }, + { + "epoch": 1.39, + "learning_rate": 9.089949997537462e-05, + "loss": 0.0096, + "step": 537780 + }, + { + "epoch": 1.39, + "learning_rate": 9.089561175900316e-05, + "loss": 0.0103, + "step": 537790 + }, + { + "epoch": 1.39, + "learning_rate": 9.089172354263169e-05, + "loss": 0.0092, + "step": 537800 + }, + { + "epoch": 1.39, + "learning_rate": 9.088783532626023e-05, + "loss": 0.0099, + "step": 537810 + }, + { + "epoch": 1.39, + "learning_rate": 9.088394710988876e-05, + "loss": 0.0083, + "step": 537820 + }, + { + "epoch": 1.39, + "learning_rate": 9.08800588935173e-05, + "loss": 0.0096, + "step": 537830 + }, + { + "epoch": 1.39, + "learning_rate": 9.087617067714583e-05, + "loss": 0.0081, + "step": 537840 + }, + { + "epoch": 1.39, + "learning_rate": 9.087228246077438e-05, + "loss": 0.0118, + "step": 537850 + }, + { + "epoch": 1.39, + "learning_rate": 9.086839424440291e-05, + "loss": 0.0107, + "step": 537860 + }, + { + "epoch": 1.39, + "learning_rate": 9.086450602803145e-05, + "loss": 0.0099, + "step": 537870 + }, + { + "epoch": 1.39, + "learning_rate": 9.086061781165998e-05, + "loss": 0.0079, + "step": 537880 + }, + { + "epoch": 1.39, + "learning_rate": 9.085672959528852e-05, + "loss": 0.0089, + "step": 537890 + }, + { + "epoch": 1.39, + "learning_rate": 9.085284137891705e-05, + "loss": 0.0117, + "step": 537900 + }, + { + "epoch": 1.39, + "learning_rate": 9.084895316254558e-05, + "loss": 0.0091, + "step": 537910 + }, + { + "epoch": 1.39, + "learning_rate": 9.084506494617412e-05, + "loss": 0.0085, + "step": 537920 + }, + { + "epoch": 1.39, + "learning_rate": 9.084117672980265e-05, + "loss": 0.0097, + "step": 537930 + }, + { + "epoch": 1.39, + "learning_rate": 9.083728851343119e-05, + "loss": 0.0103, + "step": 537940 + }, + { + "epoch": 1.39, + "learning_rate": 9.083340029705972e-05, + "loss": 0.0097, + "step": 537950 + }, + { + "epoch": 1.39, + "learning_rate": 9.082951208068826e-05, + "loss": 0.0065, + "step": 537960 + }, + { + "epoch": 1.39, + "learning_rate": 9.082562386431679e-05, + "loss": 0.0105, + "step": 537970 + }, + { + "epoch": 1.39, + "learning_rate": 9.082173564794533e-05, + "loss": 0.0107, + "step": 537980 + }, + { + "epoch": 1.39, + "learning_rate": 9.081784743157386e-05, + "loss": 0.0082, + "step": 537990 + }, + { + "epoch": 1.39, + "learning_rate": 9.08139592152024e-05, + "loss": 0.0126, + "step": 538000 + }, + { + "epoch": 1.39, + "eval_cer": 0.8816522993935373, + "eval_loss": 0.006265460047870874, + "eval_runtime": 107.8561, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 538000 + }, + { + "epoch": 1.39, + "learning_rate": 9.081007099883093e-05, + "loss": 0.0092, + "step": 538010 + }, + { + "epoch": 1.39, + "learning_rate": 9.080618278245948e-05, + "loss": 0.0089, + "step": 538020 + }, + { + "epoch": 1.39, + "learning_rate": 9.0802294566088e-05, + "loss": 0.0136, + "step": 538030 + }, + { + "epoch": 1.39, + "learning_rate": 9.079840634971655e-05, + "loss": 0.0128, + "step": 538040 + }, + { + "epoch": 1.39, + "learning_rate": 9.079451813334508e-05, + "loss": 0.011, + "step": 538050 + }, + { + "epoch": 1.39, + "learning_rate": 9.079062991697362e-05, + "loss": 0.0102, + "step": 538060 + }, + { + "epoch": 1.39, + "learning_rate": 9.078674170060215e-05, + "loss": 0.0084, + "step": 538070 + }, + { + "epoch": 1.39, + "learning_rate": 9.078285348423069e-05, + "loss": 0.0117, + "step": 538080 + }, + { + "epoch": 1.39, + "learning_rate": 9.077896526785922e-05, + "loss": 0.012, + "step": 538090 + }, + { + "epoch": 1.39, + "learning_rate": 9.077507705148776e-05, + "loss": 0.0074, + "step": 538100 + }, + { + "epoch": 1.39, + "learning_rate": 9.077118883511629e-05, + "loss": 0.0108, + "step": 538110 + }, + { + "epoch": 1.39, + "learning_rate": 9.076730061874483e-05, + "loss": 0.0122, + "step": 538120 + }, + { + "epoch": 1.39, + "learning_rate": 9.076341240237336e-05, + "loss": 0.0099, + "step": 538130 + }, + { + "epoch": 1.39, + "learning_rate": 9.07595241860019e-05, + "loss": 0.0073, + "step": 538140 + }, + { + "epoch": 1.39, + "learning_rate": 9.075563596963043e-05, + "loss": 0.0138, + "step": 538150 + }, + { + "epoch": 1.39, + "learning_rate": 9.075174775325896e-05, + "loss": 0.0083, + "step": 538160 + }, + { + "epoch": 1.4, + "learning_rate": 9.07478595368875e-05, + "loss": 0.0133, + "step": 538170 + }, + { + "epoch": 1.4, + "learning_rate": 9.074397132051603e-05, + "loss": 0.0073, + "step": 538180 + }, + { + "epoch": 1.4, + "learning_rate": 9.074008310414457e-05, + "loss": 0.0087, + "step": 538190 + }, + { + "epoch": 1.4, + "learning_rate": 9.07361948877731e-05, + "loss": 0.0075, + "step": 538200 + }, + { + "epoch": 1.4, + "learning_rate": 9.073230667140165e-05, + "loss": 0.0082, + "step": 538210 + }, + { + "epoch": 1.4, + "learning_rate": 9.072841845503018e-05, + "loss": 0.0109, + "step": 538220 + }, + { + "epoch": 1.4, + "learning_rate": 9.072453023865872e-05, + "loss": 0.0065, + "step": 538230 + }, + { + "epoch": 1.4, + "learning_rate": 9.072064202228725e-05, + "loss": 0.0102, + "step": 538240 + }, + { + "epoch": 1.4, + "learning_rate": 9.071675380591579e-05, + "loss": 0.0087, + "step": 538250 + }, + { + "epoch": 1.4, + "learning_rate": 9.071286558954432e-05, + "loss": 0.0085, + "step": 538260 + }, + { + "epoch": 1.4, + "learning_rate": 9.070897737317286e-05, + "loss": 0.012, + "step": 538270 + }, + { + "epoch": 1.4, + "learning_rate": 9.070508915680139e-05, + "loss": 0.0087, + "step": 538280 + }, + { + "epoch": 1.4, + "learning_rate": 9.070120094042993e-05, + "loss": 0.0065, + "step": 538290 + }, + { + "epoch": 1.4, + "learning_rate": 9.069731272405846e-05, + "loss": 0.0214, + "step": 538300 + }, + { + "epoch": 1.4, + "learning_rate": 9.0693424507687e-05, + "loss": 0.0093, + "step": 538310 + }, + { + "epoch": 1.4, + "learning_rate": 9.068953629131553e-05, + "loss": 0.0111, + "step": 538320 + }, + { + "epoch": 1.4, + "learning_rate": 9.068564807494407e-05, + "loss": 0.0102, + "step": 538330 + }, + { + "epoch": 1.4, + "learning_rate": 9.06817598585726e-05, + "loss": 0.0086, + "step": 538340 + }, + { + "epoch": 1.4, + "learning_rate": 9.067787164220114e-05, + "loss": 0.009, + "step": 538350 + }, + { + "epoch": 1.4, + "learning_rate": 9.067398342582967e-05, + "loss": 0.01, + "step": 538360 + }, + { + "epoch": 1.4, + "learning_rate": 9.067009520945822e-05, + "loss": 0.009, + "step": 538370 + }, + { + "epoch": 1.4, + "learning_rate": 9.066620699308675e-05, + "loss": 0.011, + "step": 538380 + }, + { + "epoch": 1.4, + "learning_rate": 9.066231877671529e-05, + "loss": 0.0084, + "step": 538390 + }, + { + "epoch": 1.4, + "learning_rate": 9.065843056034382e-05, + "loss": 0.0069, + "step": 538400 + }, + { + "epoch": 1.4, + "learning_rate": 9.065454234397235e-05, + "loss": 0.0083, + "step": 538410 + }, + { + "epoch": 1.4, + "learning_rate": 9.065065412760089e-05, + "loss": 0.0084, + "step": 538420 + }, + { + "epoch": 1.4, + "learning_rate": 9.064676591122942e-05, + "loss": 0.0097, + "step": 538430 + }, + { + "epoch": 1.4, + "learning_rate": 9.064287769485796e-05, + "loss": 0.0085, + "step": 538440 + }, + { + "epoch": 1.4, + "learning_rate": 9.063898947848649e-05, + "loss": 0.0114, + "step": 538450 + }, + { + "epoch": 1.4, + "learning_rate": 9.063510126211503e-05, + "loss": 0.0083, + "step": 538460 + }, + { + "epoch": 1.4, + "learning_rate": 9.063121304574356e-05, + "loss": 0.0095, + "step": 538470 + }, + { + "epoch": 1.4, + "learning_rate": 9.06273248293721e-05, + "loss": 0.0107, + "step": 538480 + }, + { + "epoch": 1.4, + "learning_rate": 9.062343661300063e-05, + "loss": 0.0087, + "step": 538490 + }, + { + "epoch": 1.4, + "learning_rate": 9.061954839662917e-05, + "loss": 0.0105, + "step": 538500 + }, + { + "epoch": 1.4, + "learning_rate": 9.06156601802577e-05, + "loss": 0.0096, + "step": 538510 + }, + { + "epoch": 1.4, + "learning_rate": 9.061177196388624e-05, + "loss": 0.0108, + "step": 538520 + }, + { + "epoch": 1.4, + "learning_rate": 9.060788374751477e-05, + "loss": 0.0087, + "step": 538530 + }, + { + "epoch": 1.4, + "learning_rate": 9.060399553114332e-05, + "loss": 0.0087, + "step": 538540 + }, + { + "epoch": 1.4, + "learning_rate": 9.060010731477184e-05, + "loss": 0.0125, + "step": 538550 + }, + { + "epoch": 1.4, + "learning_rate": 9.059621909840039e-05, + "loss": 0.0105, + "step": 538560 + }, + { + "epoch": 1.4, + "learning_rate": 9.059233088202892e-05, + "loss": 0.0078, + "step": 538570 + }, + { + "epoch": 1.4, + "learning_rate": 9.058844266565746e-05, + "loss": 0.0078, + "step": 538580 + }, + { + "epoch": 1.4, + "learning_rate": 9.058455444928599e-05, + "loss": 0.008, + "step": 538590 + }, + { + "epoch": 1.4, + "learning_rate": 9.058066623291453e-05, + "loss": 0.0104, + "step": 538600 + }, + { + "epoch": 1.4, + "learning_rate": 9.057677801654306e-05, + "loss": 0.0087, + "step": 538610 + }, + { + "epoch": 1.4, + "learning_rate": 9.05728898001716e-05, + "loss": 0.0078, + "step": 538620 + }, + { + "epoch": 1.4, + "learning_rate": 9.056900158380013e-05, + "loss": 0.0076, + "step": 538630 + }, + { + "epoch": 1.4, + "learning_rate": 9.056511336742866e-05, + "loss": 0.0078, + "step": 538640 + }, + { + "epoch": 1.4, + "learning_rate": 9.05612251510572e-05, + "loss": 0.0097, + "step": 538650 + }, + { + "epoch": 1.4, + "learning_rate": 9.055733693468573e-05, + "loss": 0.009, + "step": 538660 + }, + { + "epoch": 1.4, + "learning_rate": 9.055344871831427e-05, + "loss": 0.0089, + "step": 538670 + }, + { + "epoch": 1.4, + "learning_rate": 9.05495605019428e-05, + "loss": 0.0096, + "step": 538680 + }, + { + "epoch": 1.4, + "learning_rate": 9.054567228557134e-05, + "loss": 0.0143, + "step": 538690 + }, + { + "epoch": 1.4, + "learning_rate": 9.054178406919986e-05, + "loss": 0.0086, + "step": 538700 + }, + { + "epoch": 1.4, + "learning_rate": 9.05378958528284e-05, + "loss": 0.0083, + "step": 538710 + }, + { + "epoch": 1.4, + "learning_rate": 9.053400763645693e-05, + "loss": 0.0081, + "step": 538720 + }, + { + "epoch": 1.4, + "learning_rate": 9.053011942008549e-05, + "loss": 0.0104, + "step": 538730 + }, + { + "epoch": 1.4, + "learning_rate": 9.052623120371402e-05, + "loss": 0.0086, + "step": 538740 + }, + { + "epoch": 1.4, + "learning_rate": 9.052234298734256e-05, + "loss": 0.0083, + "step": 538750 + }, + { + "epoch": 1.4, + "learning_rate": 9.051845477097109e-05, + "loss": 0.007, + "step": 538760 + }, + { + "epoch": 1.4, + "learning_rate": 9.051456655459963e-05, + "loss": 0.0065, + "step": 538770 + }, + { + "epoch": 1.4, + "learning_rate": 9.051067833822816e-05, + "loss": 0.0082, + "step": 538780 + }, + { + "epoch": 1.4, + "learning_rate": 9.05067901218567e-05, + "loss": 0.0097, + "step": 538790 + }, + { + "epoch": 1.4, + "learning_rate": 9.050290190548523e-05, + "loss": 0.0102, + "step": 538800 + }, + { + "epoch": 1.4, + "learning_rate": 9.049901368911377e-05, + "loss": 0.0085, + "step": 538810 + }, + { + "epoch": 1.4, + "learning_rate": 9.04951254727423e-05, + "loss": 0.0087, + "step": 538820 + }, + { + "epoch": 1.4, + "learning_rate": 9.049123725637084e-05, + "loss": 0.0075, + "step": 538830 + }, + { + "epoch": 1.4, + "learning_rate": 9.048734903999937e-05, + "loss": 0.008, + "step": 538840 + }, + { + "epoch": 1.4, + "learning_rate": 9.048346082362791e-05, + "loss": 0.0091, + "step": 538850 + }, + { + "epoch": 1.4, + "learning_rate": 9.047957260725644e-05, + "loss": 0.0118, + "step": 538860 + }, + { + "epoch": 1.4, + "learning_rate": 9.047568439088498e-05, + "loss": 0.0084, + "step": 538870 + }, + { + "epoch": 1.4, + "learning_rate": 9.04717961745135e-05, + "loss": 0.0081, + "step": 538880 + }, + { + "epoch": 1.4, + "learning_rate": 9.046790795814203e-05, + "loss": 0.0099, + "step": 538890 + }, + { + "epoch": 1.4, + "learning_rate": 9.046401974177059e-05, + "loss": 0.0079, + "step": 538900 + }, + { + "epoch": 1.4, + "learning_rate": 9.04601315253991e-05, + "loss": 0.0091, + "step": 538910 + }, + { + "epoch": 1.4, + "learning_rate": 9.045624330902766e-05, + "loss": 0.01, + "step": 538920 + }, + { + "epoch": 1.4, + "learning_rate": 9.045235509265619e-05, + "loss": 0.0082, + "step": 538930 + }, + { + "epoch": 1.4, + "learning_rate": 9.044846687628473e-05, + "loss": 0.0079, + "step": 538940 + }, + { + "epoch": 1.4, + "learning_rate": 9.044457865991326e-05, + "loss": 0.0119, + "step": 538950 + }, + { + "epoch": 1.4, + "learning_rate": 9.04406904435418e-05, + "loss": 0.0086, + "step": 538960 + }, + { + "epoch": 1.4, + "learning_rate": 9.043680222717033e-05, + "loss": 0.009, + "step": 538970 + }, + { + "epoch": 1.4, + "learning_rate": 9.043291401079887e-05, + "loss": 0.012, + "step": 538980 + }, + { + "epoch": 1.4, + "learning_rate": 9.04290257944274e-05, + "loss": 0.0085, + "step": 538990 + }, + { + "epoch": 1.4, + "learning_rate": 9.042513757805594e-05, + "loss": 0.0103, + "step": 539000 + }, + { + "epoch": 1.4, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.006161821540445089, + "eval_runtime": 107.9304, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, + "step": 539000 + }, + { + "epoch": 1.4, + "learning_rate": 9.042124936168447e-05, + "loss": 0.0105, + "step": 539010 + }, + { + "epoch": 1.4, + "learning_rate": 9.041736114531301e-05, + "loss": 0.0132, + "step": 539020 + }, + { + "epoch": 1.4, + "learning_rate": 9.041347292894154e-05, + "loss": 0.0101, + "step": 539030 + }, + { + "epoch": 1.4, + "learning_rate": 9.040958471257008e-05, + "loss": 0.0095, + "step": 539040 + }, + { + "epoch": 1.4, + "learning_rate": 9.04056964961986e-05, + "loss": 0.0071, + "step": 539050 + }, + { + "epoch": 1.4, + "learning_rate": 9.040180827982715e-05, + "loss": 0.0112, + "step": 539060 + }, + { + "epoch": 1.4, + "learning_rate": 9.039792006345568e-05, + "loss": 0.009, + "step": 539070 + }, + { + "epoch": 1.4, + "learning_rate": 9.039403184708423e-05, + "loss": 0.0141, + "step": 539080 + }, + { + "epoch": 1.4, + "learning_rate": 9.039014363071276e-05, + "loss": 0.0119, + "step": 539090 + }, + { + "epoch": 1.4, + "learning_rate": 9.03862554143413e-05, + "loss": 0.0117, + "step": 539100 + }, + { + "epoch": 1.4, + "learning_rate": 9.038236719796983e-05, + "loss": 0.012, + "step": 539110 + }, + { + "epoch": 1.4, + "learning_rate": 9.037847898159837e-05, + "loss": 0.0107, + "step": 539120 + }, + { + "epoch": 1.4, + "learning_rate": 9.03745907652269e-05, + "loss": 0.0083, + "step": 539130 + }, + { + "epoch": 1.4, + "learning_rate": 9.037070254885543e-05, + "loss": 0.0106, + "step": 539140 + }, + { + "epoch": 1.4, + "learning_rate": 9.036681433248397e-05, + "loss": 0.0102, + "step": 539150 + }, + { + "epoch": 1.4, + "learning_rate": 9.03629261161125e-05, + "loss": 0.0113, + "step": 539160 + }, + { + "epoch": 1.4, + "learning_rate": 9.035903789974104e-05, + "loss": 0.0099, + "step": 539170 + }, + { + "epoch": 1.4, + "learning_rate": 9.035514968336957e-05, + "loss": 0.0089, + "step": 539180 + }, + { + "epoch": 1.4, + "learning_rate": 9.035126146699811e-05, + "loss": 0.01, + "step": 539190 + }, + { + "epoch": 1.4, + "learning_rate": 9.034737325062664e-05, + "loss": 0.0099, + "step": 539200 + }, + { + "epoch": 1.4, + "learning_rate": 9.034348503425518e-05, + "loss": 0.0084, + "step": 539210 + }, + { + "epoch": 1.4, + "learning_rate": 9.03395968178837e-05, + "loss": 0.0118, + "step": 539220 + }, + { + "epoch": 1.4, + "learning_rate": 9.033570860151225e-05, + "loss": 0.008, + "step": 539230 + }, + { + "epoch": 1.4, + "learning_rate": 9.033182038514077e-05, + "loss": 0.0096, + "step": 539240 + }, + { + "epoch": 1.4, + "learning_rate": 9.032793216876933e-05, + "loss": 0.0117, + "step": 539250 + }, + { + "epoch": 1.4, + "learning_rate": 9.032404395239784e-05, + "loss": 0.008, + "step": 539260 + }, + { + "epoch": 1.4, + "learning_rate": 9.03201557360264e-05, + "loss": 0.0102, + "step": 539270 + }, + { + "epoch": 1.4, + "learning_rate": 9.031626751965493e-05, + "loss": 0.0127, + "step": 539280 + }, + { + "epoch": 1.4, + "learning_rate": 9.031237930328347e-05, + "loss": 0.0101, + "step": 539290 + }, + { + "epoch": 1.4, + "learning_rate": 9.0308491086912e-05, + "loss": 0.0087, + "step": 539300 + }, + { + "epoch": 1.4, + "learning_rate": 9.030460287054054e-05, + "loss": 0.009, + "step": 539310 + }, + { + "epoch": 1.4, + "learning_rate": 9.030071465416907e-05, + "loss": 0.0067, + "step": 539320 + }, + { + "epoch": 1.4, + "learning_rate": 9.029682643779761e-05, + "loss": 0.0085, + "step": 539330 + }, + { + "epoch": 1.4, + "learning_rate": 9.029293822142614e-05, + "loss": 0.007, + "step": 539340 + }, + { + "epoch": 1.4, + "learning_rate": 9.028905000505468e-05, + "loss": 0.0101, + "step": 539350 + }, + { + "epoch": 1.4, + "learning_rate": 9.02851617886832e-05, + "loss": 0.0078, + "step": 539360 + }, + { + "epoch": 1.4, + "learning_rate": 9.028127357231175e-05, + "loss": 0.0094, + "step": 539370 + }, + { + "epoch": 1.4, + "learning_rate": 9.027738535594028e-05, + "loss": 0.0061, + "step": 539380 + }, + { + "epoch": 1.4, + "learning_rate": 9.02734971395688e-05, + "loss": 0.0088, + "step": 539390 + }, + { + "epoch": 1.4, + "learning_rate": 9.026960892319735e-05, + "loss": 0.0084, + "step": 539400 + }, + { + "epoch": 1.4, + "learning_rate": 9.026572070682587e-05, + "loss": 0.0112, + "step": 539410 + }, + { + "epoch": 1.4, + "learning_rate": 9.026183249045442e-05, + "loss": 0.0093, + "step": 539420 + }, + { + "epoch": 1.4, + "learning_rate": 9.025794427408294e-05, + "loss": 0.0066, + "step": 539430 + }, + { + "epoch": 1.4, + "learning_rate": 9.02540560577115e-05, + "loss": 0.0089, + "step": 539440 + }, + { + "epoch": 1.4, + "learning_rate": 9.025016784134003e-05, + "loss": 0.0085, + "step": 539450 + }, + { + "epoch": 1.4, + "learning_rate": 9.024627962496857e-05, + "loss": 0.0104, + "step": 539460 + }, + { + "epoch": 1.4, + "learning_rate": 9.02423914085971e-05, + "loss": 0.0106, + "step": 539470 + }, + { + "epoch": 1.4, + "learning_rate": 9.023850319222564e-05, + "loss": 0.014, + "step": 539480 + }, + { + "epoch": 1.4, + "learning_rate": 9.023461497585417e-05, + "loss": 0.0112, + "step": 539490 + }, + { + "epoch": 1.4, + "learning_rate": 9.023072675948271e-05, + "loss": 0.0082, + "step": 539500 + }, + { + "epoch": 1.4, + "learning_rate": 9.022683854311124e-05, + "loss": 0.0116, + "step": 539510 + }, + { + "epoch": 1.4, + "learning_rate": 9.022295032673978e-05, + "loss": 0.0082, + "step": 539520 + }, + { + "epoch": 1.4, + "learning_rate": 9.02190621103683e-05, + "loss": 0.0146, + "step": 539530 + }, + { + "epoch": 1.4, + "learning_rate": 9.021517389399685e-05, + "loss": 0.0098, + "step": 539540 + }, + { + "epoch": 1.4, + "learning_rate": 9.021128567762538e-05, + "loss": 0.0098, + "step": 539550 + }, + { + "epoch": 1.4, + "learning_rate": 9.020739746125392e-05, + "loss": 0.0077, + "step": 539560 + }, + { + "epoch": 1.4, + "learning_rate": 9.020350924488245e-05, + "loss": 0.0092, + "step": 539570 + }, + { + "epoch": 1.4, + "learning_rate": 9.019962102851099e-05, + "loss": 0.008, + "step": 539580 + }, + { + "epoch": 1.4, + "learning_rate": 9.019573281213952e-05, + "loss": 0.0062, + "step": 539590 + }, + { + "epoch": 1.4, + "learning_rate": 9.019184459576807e-05, + "loss": 0.0092, + "step": 539600 + }, + { + "epoch": 1.4, + "learning_rate": 9.01879563793966e-05, + "loss": 0.0099, + "step": 539610 + }, + { + "epoch": 1.4, + "learning_rate": 9.018406816302514e-05, + "loss": 0.0073, + "step": 539620 + }, + { + "epoch": 1.4, + "learning_rate": 9.018017994665367e-05, + "loss": 0.0108, + "step": 539630 + }, + { + "epoch": 1.4, + "learning_rate": 9.01762917302822e-05, + "loss": 0.0097, + "step": 539640 + }, + { + "epoch": 1.4, + "learning_rate": 9.017240351391074e-05, + "loss": 0.0079, + "step": 539650 + }, + { + "epoch": 1.4, + "learning_rate": 9.016851529753927e-05, + "loss": 0.0068, + "step": 539660 + }, + { + "epoch": 1.4, + "learning_rate": 9.016462708116781e-05, + "loss": 0.0105, + "step": 539670 + }, + { + "epoch": 1.4, + "learning_rate": 9.016073886479634e-05, + "loss": 0.0115, + "step": 539680 + }, + { + "epoch": 1.4, + "learning_rate": 9.015685064842488e-05, + "loss": 0.0097, + "step": 539690 + }, + { + "epoch": 1.4, + "learning_rate": 9.01529624320534e-05, + "loss": 0.0111, + "step": 539700 + }, + { + "epoch": 1.4, + "learning_rate": 9.014907421568195e-05, + "loss": 0.01, + "step": 539710 + }, + { + "epoch": 1.4, + "learning_rate": 9.014518599931048e-05, + "loss": 0.0073, + "step": 539720 + }, + { + "epoch": 1.4, + "learning_rate": 9.014129778293902e-05, + "loss": 0.012, + "step": 539730 + }, + { + "epoch": 1.4, + "learning_rate": 9.013740956656754e-05, + "loss": 0.009, + "step": 539740 + }, + { + "epoch": 1.4, + "learning_rate": 9.013352135019609e-05, + "loss": 0.0089, + "step": 539750 + }, + { + "epoch": 1.4, + "learning_rate": 9.012963313382461e-05, + "loss": 0.0096, + "step": 539760 + }, + { + "epoch": 1.4, + "learning_rate": 9.012574491745317e-05, + "loss": 0.01, + "step": 539770 + }, + { + "epoch": 1.4, + "learning_rate": 9.012185670108168e-05, + "loss": 0.0099, + "step": 539780 + }, + { + "epoch": 1.4, + "learning_rate": 9.011796848471024e-05, + "loss": 0.0101, + "step": 539790 + }, + { + "epoch": 1.4, + "learning_rate": 9.011408026833877e-05, + "loss": 0.0108, + "step": 539800 + }, + { + "epoch": 1.4, + "learning_rate": 9.011019205196731e-05, + "loss": 0.0121, + "step": 539810 + }, + { + "epoch": 1.4, + "learning_rate": 9.010630383559584e-05, + "loss": 0.0104, + "step": 539820 + }, + { + "epoch": 1.4, + "learning_rate": 9.010241561922438e-05, + "loss": 0.0076, + "step": 539830 + }, + { + "epoch": 1.4, + "learning_rate": 9.009852740285291e-05, + "loss": 0.0087, + "step": 539840 + }, + { + "epoch": 1.4, + "learning_rate": 9.009463918648145e-05, + "loss": 0.0082, + "step": 539850 + }, + { + "epoch": 1.4, + "learning_rate": 9.009075097010998e-05, + "loss": 0.0094, + "step": 539860 + }, + { + "epoch": 1.4, + "learning_rate": 9.008686275373852e-05, + "loss": 0.0115, + "step": 539870 + }, + { + "epoch": 1.4, + "learning_rate": 9.008297453736705e-05, + "loss": 0.0072, + "step": 539880 + }, + { + "epoch": 1.4, + "learning_rate": 9.007908632099557e-05, + "loss": 0.0091, + "step": 539890 + }, + { + "epoch": 1.4, + "learning_rate": 9.007519810462412e-05, + "loss": 0.0086, + "step": 539900 + }, + { + "epoch": 1.4, + "learning_rate": 9.007130988825264e-05, + "loss": 0.0079, + "step": 539910 + }, + { + "epoch": 1.4, + "learning_rate": 9.006742167188119e-05, + "loss": 0.0077, + "step": 539920 + }, + { + "epoch": 1.4, + "learning_rate": 9.006353345550971e-05, + "loss": 0.0106, + "step": 539930 + }, + { + "epoch": 1.4, + "learning_rate": 9.005964523913826e-05, + "loss": 0.0082, + "step": 539940 + }, + { + "epoch": 1.4, + "learning_rate": 9.005575702276678e-05, + "loss": 0.0098, + "step": 539950 + }, + { + "epoch": 1.4, + "learning_rate": 9.005186880639534e-05, + "loss": 0.0075, + "step": 539960 + }, + { + "epoch": 1.4, + "learning_rate": 9.004798059002387e-05, + "loss": 0.011, + "step": 539970 + }, + { + "epoch": 1.4, + "learning_rate": 9.004409237365241e-05, + "loss": 0.0096, + "step": 539980 + }, + { + "epoch": 1.4, + "learning_rate": 9.004020415728094e-05, + "loss": 0.0085, + "step": 539990 + }, + { + "epoch": 1.4, + "learning_rate": 9.003631594090948e-05, + "loss": 0.0109, + "step": 540000 + }, + { + "epoch": 1.4, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.006191324442625046, + "eval_runtime": 107.7847, + "eval_samples_per_second": 18.556, + "eval_steps_per_second": 4.639, + "step": 540000 + }, + { + "epoch": 1.4, + "learning_rate": 9.0032427724538e-05, + "loss": 0.013, + "step": 540010 + }, + { + "epoch": 1.4, + "learning_rate": 9.002853950816655e-05, + "loss": 0.0101, + "step": 540020 + }, + { + "epoch": 1.4, + "learning_rate": 9.002465129179508e-05, + "loss": 0.0075, + "step": 540030 + }, + { + "epoch": 1.4, + "learning_rate": 9.002076307542362e-05, + "loss": 0.0117, + "step": 540040 + }, + { + "epoch": 1.4, + "learning_rate": 9.001687485905215e-05, + "loss": 0.0109, + "step": 540050 + }, + { + "epoch": 1.4, + "learning_rate": 9.001298664268069e-05, + "loss": 0.0096, + "step": 540060 + }, + { + "epoch": 1.4, + "learning_rate": 9.000909842630922e-05, + "loss": 0.0093, + "step": 540070 + }, + { + "epoch": 1.4, + "learning_rate": 9.000521020993776e-05, + "loss": 0.0088, + "step": 540080 + }, + { + "epoch": 1.4, + "learning_rate": 9.000132199356629e-05, + "loss": 0.0104, + "step": 540090 + }, + { + "epoch": 1.4, + "learning_rate": 8.999743377719483e-05, + "loss": 0.008, + "step": 540100 + }, + { + "epoch": 1.4, + "learning_rate": 8.999354556082335e-05, + "loss": 0.0109, + "step": 540110 + }, + { + "epoch": 1.4, + "learning_rate": 8.998965734445191e-05, + "loss": 0.0129, + "step": 540120 + }, + { + "epoch": 1.4, + "learning_rate": 8.998576912808044e-05, + "loss": 0.0095, + "step": 540130 + }, + { + "epoch": 1.4, + "learning_rate": 8.998188091170895e-05, + "loss": 0.0102, + "step": 540140 + }, + { + "epoch": 1.4, + "learning_rate": 8.997799269533751e-05, + "loss": 0.0073, + "step": 540150 + }, + { + "epoch": 1.4, + "learning_rate": 8.997410447896604e-05, + "loss": 0.008, + "step": 540160 + }, + { + "epoch": 1.4, + "learning_rate": 8.997021626259458e-05, + "loss": 0.0112, + "step": 540170 + }, + { + "epoch": 1.4, + "learning_rate": 8.99663280462231e-05, + "loss": 0.008, + "step": 540180 + }, + { + "epoch": 1.4, + "learning_rate": 8.996243982985165e-05, + "loss": 0.0099, + "step": 540190 + }, + { + "epoch": 1.4, + "learning_rate": 8.995855161348018e-05, + "loss": 0.0084, + "step": 540200 + }, + { + "epoch": 1.4, + "learning_rate": 8.995466339710872e-05, + "loss": 0.0106, + "step": 540210 + }, + { + "epoch": 1.4, + "learning_rate": 8.995077518073725e-05, + "loss": 0.0081, + "step": 540220 + }, + { + "epoch": 1.4, + "learning_rate": 8.994688696436579e-05, + "loss": 0.0081, + "step": 540230 + }, + { + "epoch": 1.4, + "learning_rate": 8.994299874799431e-05, + "loss": 0.0089, + "step": 540240 + }, + { + "epoch": 1.4, + "learning_rate": 8.993911053162286e-05, + "loss": 0.0073, + "step": 540250 + }, + { + "epoch": 1.4, + "learning_rate": 8.993522231525138e-05, + "loss": 0.0143, + "step": 540260 + }, + { + "epoch": 1.4, + "learning_rate": 8.993133409887993e-05, + "loss": 0.0091, + "step": 540270 + }, + { + "epoch": 1.4, + "learning_rate": 8.992744588250845e-05, + "loss": 0.0097, + "step": 540280 + }, + { + "epoch": 1.4, + "learning_rate": 8.9923557666137e-05, + "loss": 0.0098, + "step": 540290 + }, + { + "epoch": 1.4, + "learning_rate": 8.991966944976552e-05, + "loss": 0.0098, + "step": 540300 + }, + { + "epoch": 1.4, + "learning_rate": 8.991578123339408e-05, + "loss": 0.0096, + "step": 540310 + }, + { + "epoch": 1.4, + "learning_rate": 8.991189301702261e-05, + "loss": 0.0088, + "step": 540320 + }, + { + "epoch": 1.4, + "learning_rate": 8.990800480065115e-05, + "loss": 0.0077, + "step": 540330 + }, + { + "epoch": 1.4, + "learning_rate": 8.990411658427968e-05, + "loss": 0.0089, + "step": 540340 + }, + { + "epoch": 1.4, + "learning_rate": 8.990022836790822e-05, + "loss": 0.0084, + "step": 540350 + }, + { + "epoch": 1.4, + "learning_rate": 8.989634015153675e-05, + "loss": 0.0083, + "step": 540360 + }, + { + "epoch": 1.4, + "learning_rate": 8.989245193516529e-05, + "loss": 0.0085, + "step": 540370 + }, + { + "epoch": 1.4, + "learning_rate": 8.988856371879382e-05, + "loss": 0.009, + "step": 540380 + }, + { + "epoch": 1.4, + "learning_rate": 8.988467550242234e-05, + "loss": 0.0067, + "step": 540390 + }, + { + "epoch": 1.4, + "learning_rate": 8.988078728605089e-05, + "loss": 0.0082, + "step": 540400 + }, + { + "epoch": 1.4, + "learning_rate": 8.987689906967941e-05, + "loss": 0.0108, + "step": 540410 + }, + { + "epoch": 1.4, + "learning_rate": 8.987301085330796e-05, + "loss": 0.0091, + "step": 540420 + }, + { + "epoch": 1.4, + "learning_rate": 8.986912263693648e-05, + "loss": 0.0105, + "step": 540430 + }, + { + "epoch": 1.4, + "learning_rate": 8.986523442056503e-05, + "loss": 0.0114, + "step": 540440 + }, + { + "epoch": 1.4, + "learning_rate": 8.986134620419355e-05, + "loss": 0.0073, + "step": 540450 + }, + { + "epoch": 1.4, + "learning_rate": 8.98574579878221e-05, + "loss": 0.0093, + "step": 540460 + }, + { + "epoch": 1.4, + "learning_rate": 8.985356977145062e-05, + "loss": 0.0097, + "step": 540470 + }, + { + "epoch": 1.4, + "learning_rate": 8.984968155507918e-05, + "loss": 0.0104, + "step": 540480 + }, + { + "epoch": 1.4, + "learning_rate": 8.98457933387077e-05, + "loss": 0.0103, + "step": 540490 + }, + { + "epoch": 1.4, + "learning_rate": 8.984190512233625e-05, + "loss": 0.0111, + "step": 540500 + }, + { + "epoch": 1.4, + "learning_rate": 8.983801690596478e-05, + "loss": 0.0095, + "step": 540510 + }, + { + "epoch": 1.4, + "learning_rate": 8.983412868959332e-05, + "loss": 0.0111, + "step": 540520 + }, + { + "epoch": 1.4, + "learning_rate": 8.983024047322185e-05, + "loss": 0.0118, + "step": 540530 + }, + { + "epoch": 1.4, + "learning_rate": 8.982635225685039e-05, + "loss": 0.0091, + "step": 540540 + }, + { + "epoch": 1.4, + "learning_rate": 8.982246404047892e-05, + "loss": 0.009, + "step": 540550 + }, + { + "epoch": 1.4, + "learning_rate": 8.981857582410746e-05, + "loss": 0.0085, + "step": 540560 + }, + { + "epoch": 1.4, + "learning_rate": 8.981468760773599e-05, + "loss": 0.0095, + "step": 540570 + }, + { + "epoch": 1.4, + "learning_rate": 8.981079939136453e-05, + "loss": 0.0114, + "step": 540580 + }, + { + "epoch": 1.4, + "learning_rate": 8.980691117499306e-05, + "loss": 0.0118, + "step": 540590 + }, + { + "epoch": 1.4, + "learning_rate": 8.98030229586216e-05, + "loss": 0.0076, + "step": 540600 + }, + { + "epoch": 1.4, + "learning_rate": 8.979913474225013e-05, + "loss": 0.0096, + "step": 540610 + }, + { + "epoch": 1.4, + "learning_rate": 8.979524652587867e-05, + "loss": 0.01, + "step": 540620 + }, + { + "epoch": 1.4, + "learning_rate": 8.97913583095072e-05, + "loss": 0.0098, + "step": 540630 + }, + { + "epoch": 1.4, + "learning_rate": 8.978747009313572e-05, + "loss": 0.009, + "step": 540640 + }, + { + "epoch": 1.4, + "learning_rate": 8.978358187676426e-05, + "loss": 0.0108, + "step": 540650 + }, + { + "epoch": 1.4, + "learning_rate": 8.977969366039279e-05, + "loss": 0.0126, + "step": 540660 + }, + { + "epoch": 1.4, + "learning_rate": 8.977580544402135e-05, + "loss": 0.0081, + "step": 540670 + }, + { + "epoch": 1.4, + "learning_rate": 8.977191722764988e-05, + "loss": 0.0118, + "step": 540680 + }, + { + "epoch": 1.4, + "learning_rate": 8.976802901127842e-05, + "loss": 0.0076, + "step": 540690 + }, + { + "epoch": 1.4, + "learning_rate": 8.976414079490695e-05, + "loss": 0.0115, + "step": 540700 + }, + { + "epoch": 1.4, + "learning_rate": 8.976025257853549e-05, + "loss": 0.0083, + "step": 540710 + }, + { + "epoch": 1.4, + "learning_rate": 8.975636436216402e-05, + "loss": 0.0091, + "step": 540720 + }, + { + "epoch": 1.4, + "learning_rate": 8.975247614579256e-05, + "loss": 0.0089, + "step": 540730 + }, + { + "epoch": 1.4, + "learning_rate": 8.974858792942109e-05, + "loss": 0.0091, + "step": 540740 + }, + { + "epoch": 1.4, + "learning_rate": 8.974469971304963e-05, + "loss": 0.0109, + "step": 540750 + }, + { + "epoch": 1.4, + "learning_rate": 8.974081149667815e-05, + "loss": 0.0131, + "step": 540760 + }, + { + "epoch": 1.4, + "learning_rate": 8.97369232803067e-05, + "loss": 0.0098, + "step": 540770 + }, + { + "epoch": 1.4, + "learning_rate": 8.973303506393522e-05, + "loss": 0.0098, + "step": 540780 + }, + { + "epoch": 1.4, + "learning_rate": 8.972914684756377e-05, + "loss": 0.0086, + "step": 540790 + }, + { + "epoch": 1.4, + "learning_rate": 8.97252586311923e-05, + "loss": 0.01, + "step": 540800 + }, + { + "epoch": 1.4, + "learning_rate": 8.972137041482084e-05, + "loss": 0.0088, + "step": 540810 + }, + { + "epoch": 1.4, + "learning_rate": 8.971748219844936e-05, + "loss": 0.0088, + "step": 540820 + }, + { + "epoch": 1.4, + "learning_rate": 8.971359398207792e-05, + "loss": 0.0081, + "step": 540830 + }, + { + "epoch": 1.4, + "learning_rate": 8.970970576570645e-05, + "loss": 0.0078, + "step": 540840 + }, + { + "epoch": 1.4, + "learning_rate": 8.970581754933499e-05, + "loss": 0.0118, + "step": 540850 + }, + { + "epoch": 1.4, + "learning_rate": 8.970192933296352e-05, + "loss": 0.0081, + "step": 540860 + }, + { + "epoch": 1.4, + "learning_rate": 8.969804111659206e-05, + "loss": 0.0085, + "step": 540870 + }, + { + "epoch": 1.4, + "learning_rate": 8.969415290022059e-05, + "loss": 0.0103, + "step": 540880 + }, + { + "epoch": 1.4, + "learning_rate": 8.969026468384911e-05, + "loss": 0.0081, + "step": 540890 + }, + { + "epoch": 1.4, + "learning_rate": 8.968637646747766e-05, + "loss": 0.0108, + "step": 540900 + }, + { + "epoch": 1.4, + "learning_rate": 8.968248825110618e-05, + "loss": 0.0084, + "step": 540910 + }, + { + "epoch": 1.4, + "learning_rate": 8.967860003473473e-05, + "loss": 0.0092, + "step": 540920 + }, + { + "epoch": 1.4, + "learning_rate": 8.967471181836325e-05, + "loss": 0.0093, + "step": 540930 + }, + { + "epoch": 1.4, + "learning_rate": 8.96708236019918e-05, + "loss": 0.0094, + "step": 540940 + }, + { + "epoch": 1.4, + "learning_rate": 8.966693538562032e-05, + "loss": 0.0089, + "step": 540950 + }, + { + "epoch": 1.4, + "learning_rate": 8.966304716924887e-05, + "loss": 0.0079, + "step": 540960 + }, + { + "epoch": 1.4, + "learning_rate": 8.96591589528774e-05, + "loss": 0.0108, + "step": 540970 + }, + { + "epoch": 1.4, + "learning_rate": 8.965527073650594e-05, + "loss": 0.0109, + "step": 540980 + }, + { + "epoch": 1.4, + "learning_rate": 8.965138252013446e-05, + "loss": 0.0085, + "step": 540990 + }, + { + "epoch": 1.4, + "learning_rate": 8.964749430376302e-05, + "loss": 0.0108, + "step": 541000 + }, + { + "epoch": 1.4, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.006157417315989733, + "eval_runtime": 107.7568, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, + "step": 541000 + }, + { + "epoch": 1.4, + "learning_rate": 8.964360608739153e-05, + "loss": 0.0082, + "step": 541010 + }, + { + "epoch": 1.4, + "learning_rate": 8.963971787102009e-05, + "loss": 0.0103, + "step": 541020 + }, + { + "epoch": 1.4, + "learning_rate": 8.963582965464862e-05, + "loss": 0.0087, + "step": 541030 + }, + { + "epoch": 1.4, + "learning_rate": 8.963194143827716e-05, + "loss": 0.0075, + "step": 541040 + }, + { + "epoch": 1.4, + "learning_rate": 8.962805322190569e-05, + "loss": 0.0114, + "step": 541050 + }, + { + "epoch": 1.4, + "learning_rate": 8.962416500553423e-05, + "loss": 0.0093, + "step": 541060 + }, + { + "epoch": 1.4, + "learning_rate": 8.962027678916276e-05, + "loss": 0.0103, + "step": 541070 + }, + { + "epoch": 1.4, + "learning_rate": 8.96163885727913e-05, + "loss": 0.0078, + "step": 541080 + }, + { + "epoch": 1.4, + "learning_rate": 8.961250035641983e-05, + "loss": 0.0108, + "step": 541090 + }, + { + "epoch": 1.4, + "learning_rate": 8.960861214004837e-05, + "loss": 0.0068, + "step": 541100 + }, + { + "epoch": 1.4, + "learning_rate": 8.96047239236769e-05, + "loss": 0.0094, + "step": 541110 + }, + { + "epoch": 1.4, + "learning_rate": 8.960083570730544e-05, + "loss": 0.0121, + "step": 541120 + }, + { + "epoch": 1.4, + "learning_rate": 8.959694749093397e-05, + "loss": 0.0082, + "step": 541130 + }, + { + "epoch": 1.4, + "learning_rate": 8.959305927456249e-05, + "loss": 0.0086, + "step": 541140 + }, + { + "epoch": 1.4, + "learning_rate": 8.958917105819103e-05, + "loss": 0.0074, + "step": 541150 + }, + { + "epoch": 1.4, + "learning_rate": 8.958528284181956e-05, + "loss": 0.0101, + "step": 541160 + }, + { + "epoch": 1.4, + "learning_rate": 8.95813946254481e-05, + "loss": 0.0094, + "step": 541170 + }, + { + "epoch": 1.4, + "learning_rate": 8.957750640907663e-05, + "loss": 0.0086, + "step": 541180 + }, + { + "epoch": 1.4, + "learning_rate": 8.957361819270519e-05, + "loss": 0.0078, + "step": 541190 + }, + { + "epoch": 1.4, + "learning_rate": 8.956972997633372e-05, + "loss": 0.0116, + "step": 541200 + }, + { + "epoch": 1.4, + "learning_rate": 8.956584175996226e-05, + "loss": 0.0075, + "step": 541210 + }, + { + "epoch": 1.4, + "learning_rate": 8.956195354359079e-05, + "loss": 0.0137, + "step": 541220 + }, + { + "epoch": 1.4, + "learning_rate": 8.955806532721933e-05, + "loss": 0.0082, + "step": 541230 + }, + { + "epoch": 1.4, + "learning_rate": 8.955417711084786e-05, + "loss": 0.018, + "step": 541240 + }, + { + "epoch": 1.4, + "learning_rate": 8.95502888944764e-05, + "loss": 0.0147, + "step": 541250 + }, + { + "epoch": 1.4, + "learning_rate": 8.954640067810493e-05, + "loss": 0.0104, + "step": 541260 + }, + { + "epoch": 1.4, + "learning_rate": 8.954251246173347e-05, + "loss": 0.0082, + "step": 541270 + }, + { + "epoch": 1.4, + "learning_rate": 8.9538624245362e-05, + "loss": 0.012, + "step": 541280 + }, + { + "epoch": 1.4, + "learning_rate": 8.953473602899054e-05, + "loss": 0.0104, + "step": 541290 + }, + { + "epoch": 1.4, + "learning_rate": 8.953084781261906e-05, + "loss": 0.0093, + "step": 541300 + }, + { + "epoch": 1.4, + "learning_rate": 8.95269595962476e-05, + "loss": 0.008, + "step": 541310 + }, + { + "epoch": 1.4, + "learning_rate": 8.952307137987613e-05, + "loss": 0.0116, + "step": 541320 + }, + { + "epoch": 1.4, + "learning_rate": 8.951918316350468e-05, + "loss": 0.0109, + "step": 541330 + }, + { + "epoch": 1.4, + "learning_rate": 8.95152949471332e-05, + "loss": 0.0104, + "step": 541340 + }, + { + "epoch": 1.4, + "learning_rate": 8.951140673076176e-05, + "loss": 0.0091, + "step": 541350 + }, + { + "epoch": 1.4, + "learning_rate": 8.950751851439029e-05, + "loss": 0.0116, + "step": 541360 + }, + { + "epoch": 1.4, + "learning_rate": 8.95036302980188e-05, + "loss": 0.009, + "step": 541370 + }, + { + "epoch": 1.4, + "learning_rate": 8.949974208164736e-05, + "loss": 0.0092, + "step": 541380 + }, + { + "epoch": 1.4, + "learning_rate": 8.949585386527589e-05, + "loss": 0.0061, + "step": 541390 + }, + { + "epoch": 1.4, + "learning_rate": 8.949196564890443e-05, + "loss": 0.009, + "step": 541400 + }, + { + "epoch": 1.4, + "learning_rate": 8.948807743253295e-05, + "loss": 0.0083, + "step": 541410 + }, + { + "epoch": 1.4, + "learning_rate": 8.94841892161615e-05, + "loss": 0.0079, + "step": 541420 + }, + { + "epoch": 1.4, + "learning_rate": 8.948030099979002e-05, + "loss": 0.0167, + "step": 541430 + }, + { + "epoch": 1.4, + "learning_rate": 8.947641278341857e-05, + "loss": 0.0109, + "step": 541440 + }, + { + "epoch": 1.4, + "learning_rate": 8.94725245670471e-05, + "loss": 0.0125, + "step": 541450 + }, + { + "epoch": 1.4, + "learning_rate": 8.946863635067564e-05, + "loss": 0.0091, + "step": 541460 + }, + { + "epoch": 1.4, + "learning_rate": 8.946474813430416e-05, + "loss": 0.0093, + "step": 541470 + }, + { + "epoch": 1.4, + "learning_rate": 8.94608599179327e-05, + "loss": 0.0107, + "step": 541480 + }, + { + "epoch": 1.4, + "learning_rate": 8.945697170156123e-05, + "loss": 0.0089, + "step": 541490 + }, + { + "epoch": 1.4, + "learning_rate": 8.945308348518978e-05, + "loss": 0.0097, + "step": 541500 + }, + { + "epoch": 1.4, + "learning_rate": 8.94491952688183e-05, + "loss": 0.0122, + "step": 541510 + }, + { + "epoch": 1.4, + "learning_rate": 8.944530705244686e-05, + "loss": 0.0088, + "step": 541520 + }, + { + "epoch": 1.4, + "learning_rate": 8.944141883607537e-05, + "loss": 0.0097, + "step": 541530 + }, + { + "epoch": 1.4, + "learning_rate": 8.943753061970393e-05, + "loss": 0.0087, + "step": 541540 + }, + { + "epoch": 1.4, + "learning_rate": 8.943364240333246e-05, + "loss": 0.0111, + "step": 541550 + }, + { + "epoch": 1.4, + "learning_rate": 8.9429754186961e-05, + "loss": 0.0102, + "step": 541560 + }, + { + "epoch": 1.4, + "learning_rate": 8.942586597058953e-05, + "loss": 0.0098, + "step": 541570 + }, + { + "epoch": 1.4, + "learning_rate": 8.942197775421807e-05, + "loss": 0.0111, + "step": 541580 + }, + { + "epoch": 1.4, + "learning_rate": 8.94180895378466e-05, + "loss": 0.0132, + "step": 541590 + }, + { + "epoch": 1.4, + "learning_rate": 8.941420132147514e-05, + "loss": 0.0101, + "step": 541600 + }, + { + "epoch": 1.4, + "learning_rate": 8.941031310510367e-05, + "loss": 0.0105, + "step": 541610 + }, + { + "epoch": 1.4, + "learning_rate": 8.94064248887322e-05, + "loss": 0.01, + "step": 541620 + }, + { + "epoch": 1.4, + "learning_rate": 8.940253667236074e-05, + "loss": 0.0087, + "step": 541630 + }, + { + "epoch": 1.4, + "learning_rate": 8.939864845598926e-05, + "loss": 0.0128, + "step": 541640 + }, + { + "epoch": 1.4, + "learning_rate": 8.93947602396178e-05, + "loss": 0.0134, + "step": 541650 + }, + { + "epoch": 1.4, + "learning_rate": 8.939087202324633e-05, + "loss": 0.0098, + "step": 541660 + }, + { + "epoch": 1.4, + "learning_rate": 8.938698380687487e-05, + "loss": 0.0099, + "step": 541670 + }, + { + "epoch": 1.4, + "learning_rate": 8.93830955905034e-05, + "loss": 0.0105, + "step": 541680 + }, + { + "epoch": 1.4, + "learning_rate": 8.937920737413194e-05, + "loss": 0.0077, + "step": 541690 + }, + { + "epoch": 1.4, + "learning_rate": 8.937531915776047e-05, + "loss": 0.0087, + "step": 541700 + }, + { + "epoch": 1.4, + "learning_rate": 8.937143094138903e-05, + "loss": 0.0111, + "step": 541710 + }, + { + "epoch": 1.4, + "learning_rate": 8.936754272501756e-05, + "loss": 0.008, + "step": 541720 + }, + { + "epoch": 1.4, + "learning_rate": 8.93636545086461e-05, + "loss": 0.0109, + "step": 541730 + }, + { + "epoch": 1.4, + "learning_rate": 8.935976629227463e-05, + "loss": 0.0095, + "step": 541740 + }, + { + "epoch": 1.4, + "learning_rate": 8.935587807590317e-05, + "loss": 0.0148, + "step": 541750 + }, + { + "epoch": 1.4, + "learning_rate": 8.93519898595317e-05, + "loss": 0.0101, + "step": 541760 + }, + { + "epoch": 1.4, + "learning_rate": 8.934810164316024e-05, + "loss": 0.0107, + "step": 541770 + }, + { + "epoch": 1.4, + "learning_rate": 8.934421342678876e-05, + "loss": 0.0088, + "step": 541780 + }, + { + "epoch": 1.4, + "learning_rate": 8.93403252104173e-05, + "loss": 0.0122, + "step": 541790 + }, + { + "epoch": 1.4, + "learning_rate": 8.933643699404583e-05, + "loss": 0.0094, + "step": 541800 + }, + { + "epoch": 1.4, + "learning_rate": 8.933254877767438e-05, + "loss": 0.0091, + "step": 541810 + }, + { + "epoch": 1.4, + "learning_rate": 8.93286605613029e-05, + "loss": 0.0091, + "step": 541820 + }, + { + "epoch": 1.4, + "learning_rate": 8.932477234493145e-05, + "loss": 0.009, + "step": 541830 + }, + { + "epoch": 1.4, + "learning_rate": 8.932088412855997e-05, + "loss": 0.0083, + "step": 541840 + }, + { + "epoch": 1.4, + "learning_rate": 8.931699591218852e-05, + "loss": 0.0084, + "step": 541850 + }, + { + "epoch": 1.4, + "learning_rate": 8.931310769581704e-05, + "loss": 0.0099, + "step": 541860 + }, + { + "epoch": 1.4, + "learning_rate": 8.930921947944557e-05, + "loss": 0.0092, + "step": 541870 + }, + { + "epoch": 1.4, + "learning_rate": 8.930533126307411e-05, + "loss": 0.0108, + "step": 541880 + }, + { + "epoch": 1.4, + "learning_rate": 8.930144304670264e-05, + "loss": 0.0082, + "step": 541890 + }, + { + "epoch": 1.4, + "learning_rate": 8.92975548303312e-05, + "loss": 0.0112, + "step": 541900 + }, + { + "epoch": 1.4, + "learning_rate": 8.929366661395972e-05, + "loss": 0.0095, + "step": 541910 + }, + { + "epoch": 1.4, + "learning_rate": 8.928977839758827e-05, + "loss": 0.0078, + "step": 541920 + }, + { + "epoch": 1.4, + "learning_rate": 8.92858901812168e-05, + "loss": 0.0087, + "step": 541930 + }, + { + "epoch": 1.4, + "learning_rate": 8.928200196484534e-05, + "loss": 0.009, + "step": 541940 + }, + { + "epoch": 1.4, + "learning_rate": 8.927811374847386e-05, + "loss": 0.0099, + "step": 541950 + }, + { + "epoch": 1.4, + "learning_rate": 8.92742255321024e-05, + "loss": 0.0113, + "step": 541960 + }, + { + "epoch": 1.4, + "learning_rate": 8.927033731573093e-05, + "loss": 0.0099, + "step": 541970 + }, + { + "epoch": 1.4, + "learning_rate": 8.926644909935948e-05, + "loss": 0.0086, + "step": 541980 + }, + { + "epoch": 1.4, + "learning_rate": 8.9262560882988e-05, + "loss": 0.0098, + "step": 541990 + }, + { + "epoch": 1.4, + "learning_rate": 8.925867266661655e-05, + "loss": 0.0122, + "step": 542000 + }, + { + "epoch": 1.4, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.005949368700385094, + "eval_runtime": 107.8552, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 542000 + }, + { + "epoch": 1.4, + "learning_rate": 8.925478445024507e-05, + "loss": 0.0109, + "step": 542010 + }, + { + "epoch": 1.4, + "learning_rate": 8.925089623387362e-05, + "loss": 0.009, + "step": 542020 + }, + { + "epoch": 1.41, + "learning_rate": 8.924700801750214e-05, + "loss": 0.0094, + "step": 542030 + }, + { + "epoch": 1.41, + "learning_rate": 8.924311980113068e-05, + "loss": 0.0126, + "step": 542040 + }, + { + "epoch": 1.41, + "learning_rate": 8.923923158475921e-05, + "loss": 0.0084, + "step": 542050 + }, + { + "epoch": 1.41, + "learning_rate": 8.923534336838777e-05, + "loss": 0.0109, + "step": 542060 + }, + { + "epoch": 1.41, + "learning_rate": 8.92314551520163e-05, + "loss": 0.013, + "step": 542070 + }, + { + "epoch": 1.41, + "learning_rate": 8.922756693564484e-05, + "loss": 0.0098, + "step": 542080 + }, + { + "epoch": 1.41, + "learning_rate": 8.922367871927337e-05, + "loss": 0.0101, + "step": 542090 + }, + { + "epoch": 1.41, + "learning_rate": 8.921979050290191e-05, + "loss": 0.0134, + "step": 542100 + }, + { + "epoch": 1.41, + "learning_rate": 8.921590228653044e-05, + "loss": 0.01, + "step": 542110 + }, + { + "epoch": 1.41, + "learning_rate": 8.921201407015896e-05, + "loss": 0.0118, + "step": 542120 + }, + { + "epoch": 1.41, + "learning_rate": 8.92081258537875e-05, + "loss": 0.0106, + "step": 542130 + }, + { + "epoch": 1.41, + "learning_rate": 8.920423763741603e-05, + "loss": 0.0119, + "step": 542140 + }, + { + "epoch": 1.41, + "learning_rate": 8.920034942104458e-05, + "loss": 0.0083, + "step": 542150 + }, + { + "epoch": 1.41, + "learning_rate": 8.91964612046731e-05, + "loss": 0.0127, + "step": 542160 + }, + { + "epoch": 1.41, + "learning_rate": 8.919257298830164e-05, + "loss": 0.0089, + "step": 542170 + }, + { + "epoch": 1.41, + "learning_rate": 8.918868477193017e-05, + "loss": 0.0086, + "step": 542180 + }, + { + "epoch": 1.41, + "learning_rate": 8.918479655555871e-05, + "loss": 0.0098, + "step": 542190 + }, + { + "epoch": 1.41, + "learning_rate": 8.918090833918724e-05, + "loss": 0.0112, + "step": 542200 + }, + { + "epoch": 1.41, + "learning_rate": 8.917702012281578e-05, + "loss": 0.0075, + "step": 542210 + }, + { + "epoch": 1.41, + "learning_rate": 8.917313190644431e-05, + "loss": 0.0105, + "step": 542220 + }, + { + "epoch": 1.41, + "learning_rate": 8.916924369007287e-05, + "loss": 0.0096, + "step": 542230 + }, + { + "epoch": 1.41, + "learning_rate": 8.916535547370138e-05, + "loss": 0.0095, + "step": 542240 + }, + { + "epoch": 1.41, + "learning_rate": 8.916146725732994e-05, + "loss": 0.0096, + "step": 542250 + }, + { + "epoch": 1.41, + "learning_rate": 8.915757904095847e-05, + "loss": 0.0077, + "step": 542260 + }, + { + "epoch": 1.41, + "learning_rate": 8.915369082458701e-05, + "loss": 0.0101, + "step": 542270 + }, + { + "epoch": 1.41, + "learning_rate": 8.914980260821554e-05, + "loss": 0.014, + "step": 542280 + }, + { + "epoch": 1.41, + "learning_rate": 8.914591439184408e-05, + "loss": 0.0102, + "step": 542290 + }, + { + "epoch": 1.41, + "learning_rate": 8.91420261754726e-05, + "loss": 0.0096, + "step": 542300 + }, + { + "epoch": 1.41, + "learning_rate": 8.913813795910115e-05, + "loss": 0.0073, + "step": 542310 + }, + { + "epoch": 1.41, + "learning_rate": 8.913424974272967e-05, + "loss": 0.0074, + "step": 542320 + }, + { + "epoch": 1.41, + "learning_rate": 8.913036152635822e-05, + "loss": 0.0111, + "step": 542330 + }, + { + "epoch": 1.41, + "learning_rate": 8.912647330998674e-05, + "loss": 0.0094, + "step": 542340 + }, + { + "epoch": 1.41, + "learning_rate": 8.912258509361529e-05, + "loss": 0.0122, + "step": 542350 + }, + { + "epoch": 1.41, + "learning_rate": 8.911869687724381e-05, + "loss": 0.0094, + "step": 542360 + }, + { + "epoch": 1.41, + "learning_rate": 8.911480866087234e-05, + "loss": 0.009, + "step": 542370 + }, + { + "epoch": 1.41, + "learning_rate": 8.911092044450088e-05, + "loss": 0.0107, + "step": 542380 + }, + { + "epoch": 1.41, + "learning_rate": 8.910703222812941e-05, + "loss": 0.007, + "step": 542390 + }, + { + "epoch": 1.41, + "learning_rate": 8.910314401175795e-05, + "loss": 0.0094, + "step": 542400 + }, + { + "epoch": 1.41, + "learning_rate": 8.909925579538648e-05, + "loss": 0.0085, + "step": 542410 + }, + { + "epoch": 1.41, + "learning_rate": 8.909536757901504e-05, + "loss": 0.0077, + "step": 542420 + }, + { + "epoch": 1.41, + "learning_rate": 8.909147936264356e-05, + "loss": 0.0136, + "step": 542430 + }, + { + "epoch": 1.41, + "learning_rate": 8.90875911462721e-05, + "loss": 0.0098, + "step": 542440 + }, + { + "epoch": 1.41, + "learning_rate": 8.908370292990063e-05, + "loss": 0.0077, + "step": 542450 + }, + { + "epoch": 1.41, + "learning_rate": 8.907981471352918e-05, + "loss": 0.0094, + "step": 542460 + }, + { + "epoch": 1.41, + "learning_rate": 8.90759264971577e-05, + "loss": 0.0092, + "step": 542470 + }, + { + "epoch": 1.41, + "learning_rate": 8.907203828078625e-05, + "loss": 0.0072, + "step": 542480 + }, + { + "epoch": 1.41, + "learning_rate": 8.906815006441477e-05, + "loss": 0.0084, + "step": 542490 + }, + { + "epoch": 1.41, + "learning_rate": 8.906426184804332e-05, + "loss": 0.0097, + "step": 542500 + }, + { + "epoch": 1.41, + "learning_rate": 8.906037363167184e-05, + "loss": 0.0122, + "step": 542510 + }, + { + "epoch": 1.41, + "learning_rate": 8.905648541530039e-05, + "loss": 0.0118, + "step": 542520 + }, + { + "epoch": 1.41, + "learning_rate": 8.905259719892891e-05, + "loss": 0.0087, + "step": 542530 + }, + { + "epoch": 1.41, + "learning_rate": 8.904870898255746e-05, + "loss": 0.0091, + "step": 542540 + }, + { + "epoch": 1.41, + "learning_rate": 8.904482076618598e-05, + "loss": 0.0095, + "step": 542550 + }, + { + "epoch": 1.41, + "learning_rate": 8.904093254981452e-05, + "loss": 0.0114, + "step": 542560 + }, + { + "epoch": 1.41, + "learning_rate": 8.903704433344305e-05, + "loss": 0.0103, + "step": 542570 + }, + { + "epoch": 1.41, + "learning_rate": 8.903315611707161e-05, + "loss": 0.0104, + "step": 542580 + }, + { + "epoch": 1.41, + "learning_rate": 8.902926790070014e-05, + "loss": 0.0089, + "step": 542590 + }, + { + "epoch": 1.41, + "learning_rate": 8.902537968432868e-05, + "loss": 0.0109, + "step": 542600 + }, + { + "epoch": 1.41, + "learning_rate": 8.90214914679572e-05, + "loss": 0.0106, + "step": 542610 + }, + { + "epoch": 1.41, + "learning_rate": 8.901760325158573e-05, + "loss": 0.0066, + "step": 542620 + }, + { + "epoch": 1.41, + "learning_rate": 8.901371503521428e-05, + "loss": 0.0098, + "step": 542630 + }, + { + "epoch": 1.41, + "learning_rate": 8.90098268188428e-05, + "loss": 0.008, + "step": 542640 + }, + { + "epoch": 1.41, + "learning_rate": 8.900593860247135e-05, + "loss": 0.0087, + "step": 542650 + }, + { + "epoch": 1.41, + "learning_rate": 8.900205038609987e-05, + "loss": 0.0079, + "step": 542660 + }, + { + "epoch": 1.41, + "learning_rate": 8.899816216972842e-05, + "loss": 0.0102, + "step": 542670 + }, + { + "epoch": 1.41, + "learning_rate": 8.899427395335694e-05, + "loss": 0.0166, + "step": 542680 + }, + { + "epoch": 1.41, + "learning_rate": 8.899038573698548e-05, + "loss": 0.0154, + "step": 542690 + }, + { + "epoch": 1.41, + "learning_rate": 8.898649752061401e-05, + "loss": 0.0135, + "step": 542700 + }, + { + "epoch": 1.41, + "learning_rate": 8.898260930424255e-05, + "loss": 0.0088, + "step": 542710 + }, + { + "epoch": 1.41, + "learning_rate": 8.897872108787108e-05, + "loss": 0.0126, + "step": 542720 + }, + { + "epoch": 1.41, + "learning_rate": 8.897483287149962e-05, + "loss": 0.0098, + "step": 542730 + }, + { + "epoch": 1.41, + "learning_rate": 8.897094465512815e-05, + "loss": 0.0077, + "step": 542740 + }, + { + "epoch": 1.41, + "learning_rate": 8.896705643875671e-05, + "loss": 0.0104, + "step": 542750 + }, + { + "epoch": 1.41, + "learning_rate": 8.896316822238522e-05, + "loss": 0.0098, + "step": 542760 + }, + { + "epoch": 1.41, + "learning_rate": 8.895928000601378e-05, + "loss": 0.0102, + "step": 542770 + }, + { + "epoch": 1.41, + "learning_rate": 8.89553917896423e-05, + "loss": 0.0104, + "step": 542780 + }, + { + "epoch": 1.41, + "learning_rate": 8.895150357327085e-05, + "loss": 0.008, + "step": 542790 + }, + { + "epoch": 1.41, + "learning_rate": 8.894761535689938e-05, + "loss": 0.0075, + "step": 542800 + }, + { + "epoch": 1.41, + "learning_rate": 8.894372714052792e-05, + "loss": 0.0088, + "step": 542810 + }, + { + "epoch": 1.41, + "learning_rate": 8.893983892415644e-05, + "loss": 0.0119, + "step": 542820 + }, + { + "epoch": 1.41, + "learning_rate": 8.893595070778499e-05, + "loss": 0.0133, + "step": 542830 + }, + { + "epoch": 1.41, + "learning_rate": 8.893206249141351e-05, + "loss": 0.0114, + "step": 542840 + }, + { + "epoch": 1.41, + "learning_rate": 8.892817427504206e-05, + "loss": 0.0069, + "step": 542850 + }, + { + "epoch": 1.41, + "learning_rate": 8.892428605867058e-05, + "loss": 0.0083, + "step": 542860 + }, + { + "epoch": 1.41, + "learning_rate": 8.892039784229911e-05, + "loss": 0.0094, + "step": 542870 + }, + { + "epoch": 1.41, + "learning_rate": 8.891650962592765e-05, + "loss": 0.0107, + "step": 542880 + }, + { + "epoch": 1.41, + "learning_rate": 8.891262140955618e-05, + "loss": 0.0098, + "step": 542890 + }, + { + "epoch": 1.41, + "learning_rate": 8.890873319318472e-05, + "loss": 0.0084, + "step": 542900 + }, + { + "epoch": 1.41, + "learning_rate": 8.890484497681325e-05, + "loss": 0.008, + "step": 542910 + }, + { + "epoch": 1.41, + "learning_rate": 8.89009567604418e-05, + "loss": 0.0093, + "step": 542920 + }, + { + "epoch": 1.41, + "learning_rate": 8.889706854407032e-05, + "loss": 0.0087, + "step": 542930 + }, + { + "epoch": 1.41, + "learning_rate": 8.889318032769888e-05, + "loss": 0.0092, + "step": 542940 + }, + { + "epoch": 1.41, + "learning_rate": 8.88892921113274e-05, + "loss": 0.0086, + "step": 542950 + }, + { + "epoch": 1.41, + "learning_rate": 8.888540389495595e-05, + "loss": 0.0107, + "step": 542960 + }, + { + "epoch": 1.41, + "learning_rate": 8.888151567858447e-05, + "loss": 0.0066, + "step": 542970 + }, + { + "epoch": 1.41, + "learning_rate": 8.887762746221302e-05, + "loss": 0.01, + "step": 542980 + }, + { + "epoch": 1.41, + "learning_rate": 8.887373924584154e-05, + "loss": 0.0121, + "step": 542990 + }, + { + "epoch": 1.41, + "learning_rate": 8.886985102947009e-05, + "loss": 0.0093, + "step": 543000 + }, + { + "epoch": 1.41, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.006007141899317503, + "eval_runtime": 107.8179, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.637, + "step": 543000 + }, + { + "epoch": 1.41, + "learning_rate": 8.886596281309861e-05, + "loss": 0.0093, + "step": 543010 + }, + { + "epoch": 1.41, + "learning_rate": 8.886207459672716e-05, + "loss": 0.0089, + "step": 543020 + }, + { + "epoch": 1.41, + "learning_rate": 8.885818638035568e-05, + "loss": 0.0076, + "step": 543030 + }, + { + "epoch": 1.41, + "learning_rate": 8.885429816398423e-05, + "loss": 0.0086, + "step": 543040 + }, + { + "epoch": 1.41, + "learning_rate": 8.885040994761275e-05, + "loss": 0.0094, + "step": 543050 + }, + { + "epoch": 1.41, + "learning_rate": 8.88465217312413e-05, + "loss": 0.0076, + "step": 543060 + }, + { + "epoch": 1.41, + "learning_rate": 8.884263351486982e-05, + "loss": 0.0086, + "step": 543070 + }, + { + "epoch": 1.41, + "learning_rate": 8.883874529849836e-05, + "loss": 0.0094, + "step": 543080 + }, + { + "epoch": 1.41, + "learning_rate": 8.883485708212689e-05, + "loss": 0.0089, + "step": 543090 + }, + { + "epoch": 1.41, + "learning_rate": 8.883096886575545e-05, + "loss": 0.0075, + "step": 543100 + }, + { + "epoch": 1.41, + "learning_rate": 8.882708064938398e-05, + "loss": 0.0088, + "step": 543110 + }, + { + "epoch": 1.41, + "learning_rate": 8.882319243301249e-05, + "loss": 0.0107, + "step": 543120 + }, + { + "epoch": 1.41, + "learning_rate": 8.881930421664105e-05, + "loss": 0.0101, + "step": 543130 + }, + { + "epoch": 1.41, + "learning_rate": 8.881541600026957e-05, + "loss": 0.0067, + "step": 543140 + }, + { + "epoch": 1.41, + "learning_rate": 8.881152778389812e-05, + "loss": 0.0082, + "step": 543150 + }, + { + "epoch": 1.41, + "learning_rate": 8.880763956752664e-05, + "loss": 0.0075, + "step": 543160 + }, + { + "epoch": 1.41, + "learning_rate": 8.880375135115519e-05, + "loss": 0.0098, + "step": 543170 + }, + { + "epoch": 1.41, + "learning_rate": 8.879986313478371e-05, + "loss": 0.0081, + "step": 543180 + }, + { + "epoch": 1.41, + "learning_rate": 8.879597491841225e-05, + "loss": 0.0106, + "step": 543190 + }, + { + "epoch": 1.41, + "learning_rate": 8.879208670204078e-05, + "loss": 0.009, + "step": 543200 + }, + { + "epoch": 1.41, + "learning_rate": 8.878819848566932e-05, + "loss": 0.0121, + "step": 543210 + }, + { + "epoch": 1.41, + "learning_rate": 8.878431026929785e-05, + "loss": 0.0061, + "step": 543220 + }, + { + "epoch": 1.41, + "learning_rate": 8.87804220529264e-05, + "loss": 0.0088, + "step": 543230 + }, + { + "epoch": 1.41, + "learning_rate": 8.877653383655492e-05, + "loss": 0.0088, + "step": 543240 + }, + { + "epoch": 1.41, + "learning_rate": 8.877264562018346e-05, + "loss": 0.0064, + "step": 543250 + }, + { + "epoch": 1.41, + "learning_rate": 8.876875740381199e-05, + "loss": 0.0092, + "step": 543260 + }, + { + "epoch": 1.41, + "learning_rate": 8.876486918744053e-05, + "loss": 0.0117, + "step": 543270 + }, + { + "epoch": 1.41, + "learning_rate": 8.876098097106906e-05, + "loss": 0.0075, + "step": 543280 + }, + { + "epoch": 1.41, + "learning_rate": 8.875709275469762e-05, + "loss": 0.0107, + "step": 543290 + }, + { + "epoch": 1.41, + "learning_rate": 8.875320453832615e-05, + "loss": 0.0166, + "step": 543300 + }, + { + "epoch": 1.41, + "learning_rate": 8.874931632195469e-05, + "loss": 0.0088, + "step": 543310 + }, + { + "epoch": 1.41, + "learning_rate": 8.874542810558321e-05, + "loss": 0.0123, + "step": 543320 + }, + { + "epoch": 1.41, + "learning_rate": 8.874153988921176e-05, + "loss": 0.008, + "step": 543330 + }, + { + "epoch": 1.41, + "learning_rate": 8.873765167284028e-05, + "loss": 0.0114, + "step": 543340 + }, + { + "epoch": 1.41, + "learning_rate": 8.873376345646883e-05, + "loss": 0.0095, + "step": 543350 + }, + { + "epoch": 1.41, + "learning_rate": 8.872987524009735e-05, + "loss": 0.0123, + "step": 543360 + }, + { + "epoch": 1.41, + "learning_rate": 8.872598702372588e-05, + "loss": 0.0085, + "step": 543370 + }, + { + "epoch": 1.41, + "learning_rate": 8.872209880735442e-05, + "loss": 0.0079, + "step": 543380 + }, + { + "epoch": 1.41, + "learning_rate": 8.871821059098295e-05, + "loss": 0.0086, + "step": 543390 + }, + { + "epoch": 1.41, + "learning_rate": 8.87143223746115e-05, + "loss": 0.0114, + "step": 543400 + }, + { + "epoch": 1.41, + "learning_rate": 8.871043415824002e-05, + "loss": 0.0102, + "step": 543410 + }, + { + "epoch": 1.41, + "learning_rate": 8.870654594186856e-05, + "loss": 0.0097, + "step": 543420 + }, + { + "epoch": 1.41, + "learning_rate": 8.870265772549709e-05, + "loss": 0.0133, + "step": 543430 + }, + { + "epoch": 1.41, + "learning_rate": 8.869876950912563e-05, + "loss": 0.0112, + "step": 543440 + }, + { + "epoch": 1.41, + "learning_rate": 8.869488129275416e-05, + "loss": 0.0156, + "step": 543450 + }, + { + "epoch": 1.41, + "learning_rate": 8.869099307638272e-05, + "loss": 0.0084, + "step": 543460 + }, + { + "epoch": 1.41, + "learning_rate": 8.868710486001123e-05, + "loss": 0.0101, + "step": 543470 + }, + { + "epoch": 1.41, + "learning_rate": 8.868321664363979e-05, + "loss": 0.0103, + "step": 543480 + }, + { + "epoch": 1.41, + "learning_rate": 8.867932842726831e-05, + "loss": 0.0095, + "step": 543490 + }, + { + "epoch": 1.41, + "learning_rate": 8.867544021089686e-05, + "loss": 0.0059, + "step": 543500 + }, + { + "epoch": 1.41, + "learning_rate": 8.867155199452538e-05, + "loss": 0.011, + "step": 543510 + }, + { + "epoch": 1.41, + "learning_rate": 8.866766377815393e-05, + "loss": 0.0098, + "step": 543520 + }, + { + "epoch": 1.41, + "learning_rate": 8.866377556178245e-05, + "loss": 0.0105, + "step": 543530 + }, + { + "epoch": 1.41, + "learning_rate": 8.8659887345411e-05, + "loss": 0.009, + "step": 543540 + }, + { + "epoch": 1.41, + "learning_rate": 8.865599912903952e-05, + "loss": 0.0112, + "step": 543550 + }, + { + "epoch": 1.41, + "learning_rate": 8.865211091266807e-05, + "loss": 0.0108, + "step": 543560 + }, + { + "epoch": 1.41, + "learning_rate": 8.86482226962966e-05, + "loss": 0.0087, + "step": 543570 + }, + { + "epoch": 1.41, + "learning_rate": 8.864433447992513e-05, + "loss": 0.0095, + "step": 543580 + }, + { + "epoch": 1.41, + "learning_rate": 8.864044626355366e-05, + "loss": 0.0085, + "step": 543590 + }, + { + "epoch": 1.41, + "learning_rate": 8.86365580471822e-05, + "loss": 0.0104, + "step": 543600 + }, + { + "epoch": 1.41, + "learning_rate": 8.863266983081073e-05, + "loss": 0.0123, + "step": 543610 + }, + { + "epoch": 1.41, + "learning_rate": 8.862878161443926e-05, + "loss": 0.0099, + "step": 543620 + }, + { + "epoch": 1.41, + "learning_rate": 8.86248933980678e-05, + "loss": 0.0119, + "step": 543630 + }, + { + "epoch": 1.41, + "learning_rate": 8.862100518169633e-05, + "loss": 0.0097, + "step": 543640 + }, + { + "epoch": 1.41, + "learning_rate": 8.861711696532489e-05, + "loss": 0.0132, + "step": 543650 + }, + { + "epoch": 1.41, + "learning_rate": 8.861322874895341e-05, + "loss": 0.0087, + "step": 543660 + }, + { + "epoch": 1.41, + "learning_rate": 8.860934053258196e-05, + "loss": 0.0108, + "step": 543670 + }, + { + "epoch": 1.41, + "learning_rate": 8.860545231621048e-05, + "loss": 0.0107, + "step": 543680 + }, + { + "epoch": 1.41, + "learning_rate": 8.860156409983903e-05, + "loss": 0.01, + "step": 543690 + }, + { + "epoch": 1.41, + "learning_rate": 8.859767588346755e-05, + "loss": 0.0108, + "step": 543700 + }, + { + "epoch": 1.41, + "learning_rate": 8.85937876670961e-05, + "loss": 0.0083, + "step": 543710 + }, + { + "epoch": 1.41, + "learning_rate": 8.858989945072462e-05, + "loss": 0.0083, + "step": 543720 + }, + { + "epoch": 1.41, + "learning_rate": 8.858601123435316e-05, + "loss": 0.0119, + "step": 543730 + }, + { + "epoch": 1.41, + "learning_rate": 8.858212301798169e-05, + "loss": 0.0075, + "step": 543740 + }, + { + "epoch": 1.41, + "learning_rate": 8.857823480161023e-05, + "loss": 0.0137, + "step": 543750 + }, + { + "epoch": 1.41, + "learning_rate": 8.857434658523876e-05, + "loss": 0.0087, + "step": 543760 + }, + { + "epoch": 1.41, + "learning_rate": 8.85704583688673e-05, + "loss": 0.009, + "step": 543770 + }, + { + "epoch": 1.41, + "learning_rate": 8.856657015249583e-05, + "loss": 0.0091, + "step": 543780 + }, + { + "epoch": 1.41, + "learning_rate": 8.856268193612437e-05, + "loss": 0.0079, + "step": 543790 + }, + { + "epoch": 1.41, + "learning_rate": 8.85587937197529e-05, + "loss": 0.0091, + "step": 543800 + }, + { + "epoch": 1.41, + "learning_rate": 8.855490550338146e-05, + "loss": 0.0089, + "step": 543810 + }, + { + "epoch": 1.41, + "learning_rate": 8.855101728700999e-05, + "loss": 0.0093, + "step": 543820 + }, + { + "epoch": 1.41, + "learning_rate": 8.854712907063853e-05, + "loss": 0.011, + "step": 543830 + }, + { + "epoch": 1.41, + "learning_rate": 8.854324085426705e-05, + "loss": 0.0096, + "step": 543840 + }, + { + "epoch": 1.41, + "learning_rate": 8.853935263789558e-05, + "loss": 0.0088, + "step": 543850 + }, + { + "epoch": 1.41, + "learning_rate": 8.853546442152412e-05, + "loss": 0.011, + "step": 543860 + }, + { + "epoch": 1.41, + "learning_rate": 8.853157620515265e-05, + "loss": 0.0107, + "step": 543870 + }, + { + "epoch": 1.41, + "learning_rate": 8.85276879887812e-05, + "loss": 0.0111, + "step": 543880 + }, + { + "epoch": 1.41, + "learning_rate": 8.852379977240972e-05, + "loss": 0.011, + "step": 543890 + }, + { + "epoch": 1.41, + "learning_rate": 8.851991155603826e-05, + "loss": 0.0126, + "step": 543900 + }, + { + "epoch": 1.41, + "learning_rate": 8.851602333966679e-05, + "loss": 0.0087, + "step": 543910 + }, + { + "epoch": 1.41, + "learning_rate": 8.851213512329533e-05, + "loss": 0.0116, + "step": 543920 + }, + { + "epoch": 1.41, + "learning_rate": 8.850824690692386e-05, + "loss": 0.0102, + "step": 543930 + }, + { + "epoch": 1.41, + "learning_rate": 8.85043586905524e-05, + "loss": 0.0142, + "step": 543940 + }, + { + "epoch": 1.41, + "learning_rate": 8.850047047418093e-05, + "loss": 0.009, + "step": 543950 + }, + { + "epoch": 1.41, + "learning_rate": 8.849658225780947e-05, + "loss": 0.0105, + "step": 543960 + }, + { + "epoch": 1.41, + "learning_rate": 8.8492694041438e-05, + "loss": 0.0069, + "step": 543970 + }, + { + "epoch": 1.41, + "learning_rate": 8.848880582506656e-05, + "loss": 0.0078, + "step": 543980 + }, + { + "epoch": 1.41, + "learning_rate": 8.848491760869507e-05, + "loss": 0.009, + "step": 543990 + }, + { + "epoch": 1.41, + "learning_rate": 8.848102939232363e-05, + "loss": 0.0133, + "step": 544000 + }, + { + "epoch": 1.41, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.006026812829077244, + "eval_runtime": 107.9103, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.633, + "step": 544000 + }, + { + "epoch": 1.41, + "learning_rate": 8.847714117595215e-05, + "loss": 0.0129, + "step": 544010 + }, + { + "epoch": 1.41, + "learning_rate": 8.84732529595807e-05, + "loss": 0.0113, + "step": 544020 + }, + { + "epoch": 1.41, + "learning_rate": 8.846936474320922e-05, + "loss": 0.0088, + "step": 544030 + }, + { + "epoch": 1.41, + "learning_rate": 8.846547652683777e-05, + "loss": 0.0132, + "step": 544040 + }, + { + "epoch": 1.41, + "learning_rate": 8.84615883104663e-05, + "loss": 0.0107, + "step": 544050 + }, + { + "epoch": 1.41, + "learning_rate": 8.845770009409484e-05, + "loss": 0.0091, + "step": 544060 + }, + { + "epoch": 1.41, + "learning_rate": 8.845381187772336e-05, + "loss": 0.0086, + "step": 544070 + }, + { + "epoch": 1.41, + "learning_rate": 8.84499236613519e-05, + "loss": 0.0097, + "step": 544080 + }, + { + "epoch": 1.41, + "learning_rate": 8.844603544498043e-05, + "loss": 0.0117, + "step": 544090 + }, + { + "epoch": 1.41, + "learning_rate": 8.844214722860896e-05, + "loss": 0.0078, + "step": 544100 + }, + { + "epoch": 1.41, + "learning_rate": 8.84382590122375e-05, + "loss": 0.0091, + "step": 544110 + }, + { + "epoch": 1.41, + "learning_rate": 8.843437079586603e-05, + "loss": 0.0097, + "step": 544120 + }, + { + "epoch": 1.41, + "learning_rate": 8.843048257949457e-05, + "loss": 0.0092, + "step": 544130 + }, + { + "epoch": 1.41, + "learning_rate": 8.84265943631231e-05, + "loss": 0.006, + "step": 544140 + }, + { + "epoch": 1.41, + "learning_rate": 8.842270614675164e-05, + "loss": 0.0097, + "step": 544150 + }, + { + "epoch": 1.41, + "learning_rate": 8.841881793038017e-05, + "loss": 0.0133, + "step": 544160 + }, + { + "epoch": 1.41, + "learning_rate": 8.841492971400873e-05, + "loss": 0.0093, + "step": 544170 + }, + { + "epoch": 1.41, + "learning_rate": 8.841104149763725e-05, + "loss": 0.0069, + "step": 544180 + }, + { + "epoch": 1.41, + "learning_rate": 8.84071532812658e-05, + "loss": 0.0125, + "step": 544190 + }, + { + "epoch": 1.41, + "learning_rate": 8.840326506489432e-05, + "loss": 0.0081, + "step": 544200 + }, + { + "epoch": 1.41, + "learning_rate": 8.839937684852287e-05, + "loss": 0.0092, + "step": 544210 + }, + { + "epoch": 1.41, + "learning_rate": 8.839548863215139e-05, + "loss": 0.0082, + "step": 544220 + }, + { + "epoch": 1.41, + "learning_rate": 8.839160041577993e-05, + "loss": 0.0109, + "step": 544230 + }, + { + "epoch": 1.41, + "learning_rate": 8.838771219940846e-05, + "loss": 0.0101, + "step": 544240 + }, + { + "epoch": 1.41, + "learning_rate": 8.8383823983037e-05, + "loss": 0.0117, + "step": 544250 + }, + { + "epoch": 1.41, + "learning_rate": 8.837993576666553e-05, + "loss": 0.0067, + "step": 544260 + }, + { + "epoch": 1.41, + "learning_rate": 8.837604755029407e-05, + "loss": 0.009, + "step": 544270 + }, + { + "epoch": 1.41, + "learning_rate": 8.83721593339226e-05, + "loss": 0.0065, + "step": 544280 + }, + { + "epoch": 1.41, + "learning_rate": 8.836827111755114e-05, + "loss": 0.0095, + "step": 544290 + }, + { + "epoch": 1.41, + "learning_rate": 8.836438290117967e-05, + "loss": 0.008, + "step": 544300 + }, + { + "epoch": 1.41, + "learning_rate": 8.836049468480821e-05, + "loss": 0.0059, + "step": 544310 + }, + { + "epoch": 1.41, + "learning_rate": 8.835660646843674e-05, + "loss": 0.0107, + "step": 544320 + }, + { + "epoch": 1.41, + "learning_rate": 8.83527182520653e-05, + "loss": 0.0106, + "step": 544330 + }, + { + "epoch": 1.41, + "learning_rate": 8.834883003569383e-05, + "loss": 0.0092, + "step": 544340 + }, + { + "epoch": 1.41, + "learning_rate": 8.834494181932234e-05, + "loss": 0.0093, + "step": 544350 + }, + { + "epoch": 1.41, + "learning_rate": 8.83410536029509e-05, + "loss": 0.0089, + "step": 544360 + }, + { + "epoch": 1.41, + "learning_rate": 8.833716538657942e-05, + "loss": 0.0088, + "step": 544370 + }, + { + "epoch": 1.41, + "learning_rate": 8.833327717020796e-05, + "loss": 0.0083, + "step": 544380 + }, + { + "epoch": 1.41, + "learning_rate": 8.832938895383649e-05, + "loss": 0.0074, + "step": 544390 + }, + { + "epoch": 1.41, + "learning_rate": 8.832550073746503e-05, + "loss": 0.0117, + "step": 544400 + }, + { + "epoch": 1.41, + "learning_rate": 8.832161252109356e-05, + "loss": 0.0087, + "step": 544410 + }, + { + "epoch": 1.41, + "learning_rate": 8.83177243047221e-05, + "loss": 0.0057, + "step": 544420 + }, + { + "epoch": 1.41, + "learning_rate": 8.831383608835063e-05, + "loss": 0.0101, + "step": 544430 + }, + { + "epoch": 1.41, + "learning_rate": 8.830994787197917e-05, + "loss": 0.0084, + "step": 544440 + }, + { + "epoch": 1.41, + "learning_rate": 8.83060596556077e-05, + "loss": 0.0094, + "step": 544450 + }, + { + "epoch": 1.41, + "learning_rate": 8.830217143923624e-05, + "loss": 0.0127, + "step": 544460 + }, + { + "epoch": 1.41, + "learning_rate": 8.829828322286477e-05, + "loss": 0.0101, + "step": 544470 + }, + { + "epoch": 1.41, + "learning_rate": 8.829439500649331e-05, + "loss": 0.01, + "step": 544480 + }, + { + "epoch": 1.41, + "learning_rate": 8.829050679012184e-05, + "loss": 0.0083, + "step": 544490 + }, + { + "epoch": 1.41, + "learning_rate": 8.828661857375038e-05, + "loss": 0.0081, + "step": 544500 + }, + { + "epoch": 1.41, + "learning_rate": 8.828273035737891e-05, + "loss": 0.0087, + "step": 544510 + }, + { + "epoch": 1.41, + "learning_rate": 8.827884214100747e-05, + "loss": 0.0108, + "step": 544520 + }, + { + "epoch": 1.41, + "learning_rate": 8.8274953924636e-05, + "loss": 0.009, + "step": 544530 + }, + { + "epoch": 1.41, + "learning_rate": 8.827106570826454e-05, + "loss": 0.0104, + "step": 544540 + }, + { + "epoch": 1.41, + "learning_rate": 8.826717749189306e-05, + "loss": 0.0086, + "step": 544550 + }, + { + "epoch": 1.41, + "learning_rate": 8.82632892755216e-05, + "loss": 0.0092, + "step": 544560 + }, + { + "epoch": 1.41, + "learning_rate": 8.825940105915013e-05, + "loss": 0.009, + "step": 544570 + }, + { + "epoch": 1.41, + "learning_rate": 8.825551284277868e-05, + "loss": 0.0128, + "step": 544580 + }, + { + "epoch": 1.41, + "learning_rate": 8.82516246264072e-05, + "loss": 0.0095, + "step": 544590 + }, + { + "epoch": 1.41, + "learning_rate": 8.824773641003573e-05, + "loss": 0.0097, + "step": 544600 + }, + { + "epoch": 1.41, + "learning_rate": 8.824384819366427e-05, + "loss": 0.0101, + "step": 544610 + }, + { + "epoch": 1.41, + "learning_rate": 8.82399599772928e-05, + "loss": 0.0117, + "step": 544620 + }, + { + "epoch": 1.41, + "learning_rate": 8.823607176092134e-05, + "loss": 0.0097, + "step": 544630 + }, + { + "epoch": 1.41, + "learning_rate": 8.823218354454987e-05, + "loss": 0.0117, + "step": 544640 + }, + { + "epoch": 1.41, + "learning_rate": 8.822829532817841e-05, + "loss": 0.0131, + "step": 544650 + }, + { + "epoch": 1.41, + "learning_rate": 8.822440711180694e-05, + "loss": 0.01, + "step": 544660 + }, + { + "epoch": 1.41, + "learning_rate": 8.822051889543548e-05, + "loss": 0.0081, + "step": 544670 + }, + { + "epoch": 1.41, + "learning_rate": 8.821663067906401e-05, + "loss": 0.0081, + "step": 544680 + }, + { + "epoch": 1.41, + "learning_rate": 8.821274246269257e-05, + "loss": 0.007, + "step": 544690 + }, + { + "epoch": 1.41, + "learning_rate": 8.820885424632108e-05, + "loss": 0.0173, + "step": 544700 + }, + { + "epoch": 1.41, + "learning_rate": 8.820496602994964e-05, + "loss": 0.0086, + "step": 544710 + }, + { + "epoch": 1.41, + "learning_rate": 8.820107781357816e-05, + "loss": 0.0105, + "step": 544720 + }, + { + "epoch": 1.41, + "learning_rate": 8.81971895972067e-05, + "loss": 0.0109, + "step": 544730 + }, + { + "epoch": 1.41, + "learning_rate": 8.819330138083523e-05, + "loss": 0.0118, + "step": 544740 + }, + { + "epoch": 1.41, + "learning_rate": 8.818941316446377e-05, + "loss": 0.0121, + "step": 544750 + }, + { + "epoch": 1.41, + "learning_rate": 8.81855249480923e-05, + "loss": 0.0107, + "step": 544760 + }, + { + "epoch": 1.41, + "learning_rate": 8.818163673172084e-05, + "loss": 0.0096, + "step": 544770 + }, + { + "epoch": 1.41, + "learning_rate": 8.817774851534937e-05, + "loss": 0.0076, + "step": 544780 + }, + { + "epoch": 1.41, + "learning_rate": 8.817386029897791e-05, + "loss": 0.0101, + "step": 544790 + }, + { + "epoch": 1.41, + "learning_rate": 8.816997208260644e-05, + "loss": 0.0099, + "step": 544800 + }, + { + "epoch": 1.41, + "learning_rate": 8.816608386623498e-05, + "loss": 0.0064, + "step": 544810 + }, + { + "epoch": 1.41, + "learning_rate": 8.816219564986351e-05, + "loss": 0.0121, + "step": 544820 + }, + { + "epoch": 1.41, + "learning_rate": 8.815830743349205e-05, + "loss": 0.0097, + "step": 544830 + }, + { + "epoch": 1.41, + "learning_rate": 8.815441921712058e-05, + "loss": 0.0105, + "step": 544840 + }, + { + "epoch": 1.41, + "learning_rate": 8.815053100074911e-05, + "loss": 0.0071, + "step": 544850 + }, + { + "epoch": 1.41, + "learning_rate": 8.814664278437765e-05, + "loss": 0.0074, + "step": 544860 + }, + { + "epoch": 1.41, + "learning_rate": 8.814275456800618e-05, + "loss": 0.0098, + "step": 544870 + }, + { + "epoch": 1.41, + "learning_rate": 8.813886635163473e-05, + "loss": 0.0099, + "step": 544880 + }, + { + "epoch": 1.41, + "learning_rate": 8.813497813526326e-05, + "loss": 0.01, + "step": 544890 + }, + { + "epoch": 1.41, + "learning_rate": 8.81310899188918e-05, + "loss": 0.0084, + "step": 544900 + }, + { + "epoch": 1.41, + "learning_rate": 8.812720170252033e-05, + "loss": 0.0091, + "step": 544910 + }, + { + "epoch": 1.41, + "learning_rate": 8.812331348614887e-05, + "loss": 0.008, + "step": 544920 + }, + { + "epoch": 1.41, + "learning_rate": 8.81194252697774e-05, + "loss": 0.0087, + "step": 544930 + }, + { + "epoch": 1.41, + "learning_rate": 8.811553705340594e-05, + "loss": 0.0105, + "step": 544940 + }, + { + "epoch": 1.41, + "learning_rate": 8.811164883703447e-05, + "loss": 0.0087, + "step": 544950 + }, + { + "epoch": 1.41, + "learning_rate": 8.810776062066301e-05, + "loss": 0.0102, + "step": 544960 + }, + { + "epoch": 1.41, + "learning_rate": 8.810387240429154e-05, + "loss": 0.0073, + "step": 544970 + }, + { + "epoch": 1.41, + "learning_rate": 8.809998418792008e-05, + "loss": 0.0095, + "step": 544980 + }, + { + "epoch": 1.41, + "learning_rate": 8.809609597154861e-05, + "loss": 0.0086, + "step": 544990 + }, + { + "epoch": 1.41, + "learning_rate": 8.809220775517715e-05, + "loss": 0.0092, + "step": 545000 + }, + { + "epoch": 1.41, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.0062423269264400005, + "eval_runtime": 107.912, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.633, + "step": 545000 + }, + { + "epoch": 1.41, + "learning_rate": 8.808831953880568e-05, + "loss": 0.0121, + "step": 545010 + }, + { + "epoch": 1.41, + "learning_rate": 8.808443132243422e-05, + "loss": 0.0095, + "step": 545020 + }, + { + "epoch": 1.41, + "learning_rate": 8.808054310606275e-05, + "loss": 0.0098, + "step": 545030 + }, + { + "epoch": 1.41, + "learning_rate": 8.80766548896913e-05, + "loss": 0.0109, + "step": 545040 + }, + { + "epoch": 1.41, + "learning_rate": 8.807276667331983e-05, + "loss": 0.009, + "step": 545050 + }, + { + "epoch": 1.41, + "learning_rate": 8.806887845694838e-05, + "loss": 0.0078, + "step": 545060 + }, + { + "epoch": 1.41, + "learning_rate": 8.80649902405769e-05, + "loss": 0.011, + "step": 545070 + }, + { + "epoch": 1.41, + "learning_rate": 8.806110202420545e-05, + "loss": 0.0093, + "step": 545080 + }, + { + "epoch": 1.41, + "learning_rate": 8.805721380783397e-05, + "loss": 0.0072, + "step": 545090 + }, + { + "epoch": 1.41, + "learning_rate": 8.80533255914625e-05, + "loss": 0.0099, + "step": 545100 + }, + { + "epoch": 1.41, + "learning_rate": 8.804943737509104e-05, + "loss": 0.0104, + "step": 545110 + }, + { + "epoch": 1.41, + "learning_rate": 8.804554915871957e-05, + "loss": 0.0086, + "step": 545120 + }, + { + "epoch": 1.41, + "learning_rate": 8.804166094234811e-05, + "loss": 0.0084, + "step": 545130 + }, + { + "epoch": 1.41, + "learning_rate": 8.803777272597664e-05, + "loss": 0.0085, + "step": 545140 + }, + { + "epoch": 1.41, + "learning_rate": 8.803388450960518e-05, + "loss": 0.0093, + "step": 545150 + }, + { + "epoch": 1.41, + "learning_rate": 8.802999629323371e-05, + "loss": 0.0091, + "step": 545160 + }, + { + "epoch": 1.41, + "learning_rate": 8.802610807686225e-05, + "loss": 0.0095, + "step": 545170 + }, + { + "epoch": 1.41, + "learning_rate": 8.802221986049078e-05, + "loss": 0.0079, + "step": 545180 + }, + { + "epoch": 1.41, + "learning_rate": 8.801833164411932e-05, + "loss": 0.0087, + "step": 545190 + }, + { + "epoch": 1.41, + "learning_rate": 8.801444342774785e-05, + "loss": 0.0106, + "step": 545200 + }, + { + "epoch": 1.41, + "learning_rate": 8.80105552113764e-05, + "loss": 0.0084, + "step": 545210 + }, + { + "epoch": 1.41, + "learning_rate": 8.800666699500492e-05, + "loss": 0.0102, + "step": 545220 + }, + { + "epoch": 1.41, + "learning_rate": 8.800277877863348e-05, + "loss": 0.0119, + "step": 545230 + }, + { + "epoch": 1.41, + "learning_rate": 8.7998890562262e-05, + "loss": 0.0093, + "step": 545240 + }, + { + "epoch": 1.41, + "learning_rate": 8.799500234589054e-05, + "loss": 0.0111, + "step": 545250 + }, + { + "epoch": 1.41, + "learning_rate": 8.799111412951907e-05, + "loss": 0.0094, + "step": 545260 + }, + { + "epoch": 1.41, + "learning_rate": 8.798722591314761e-05, + "loss": 0.008, + "step": 545270 + }, + { + "epoch": 1.41, + "learning_rate": 8.798333769677614e-05, + "loss": 0.01, + "step": 545280 + }, + { + "epoch": 1.41, + "learning_rate": 8.797944948040468e-05, + "loss": 0.0107, + "step": 545290 + }, + { + "epoch": 1.41, + "learning_rate": 8.797556126403321e-05, + "loss": 0.0089, + "step": 545300 + }, + { + "epoch": 1.41, + "learning_rate": 8.797167304766175e-05, + "loss": 0.0082, + "step": 545310 + }, + { + "epoch": 1.41, + "learning_rate": 8.796778483129028e-05, + "loss": 0.0137, + "step": 545320 + }, + { + "epoch": 1.41, + "learning_rate": 8.796389661491882e-05, + "loss": 0.0085, + "step": 545330 + }, + { + "epoch": 1.41, + "learning_rate": 8.796000839854735e-05, + "loss": 0.0117, + "step": 545340 + }, + { + "epoch": 1.41, + "learning_rate": 8.795612018217588e-05, + "loss": 0.0121, + "step": 545350 + }, + { + "epoch": 1.41, + "learning_rate": 8.795223196580442e-05, + "loss": 0.0091, + "step": 545360 + }, + { + "epoch": 1.41, + "learning_rate": 8.794834374943295e-05, + "loss": 0.0109, + "step": 545370 + }, + { + "epoch": 1.41, + "learning_rate": 8.794445553306149e-05, + "loss": 0.0104, + "step": 545380 + }, + { + "epoch": 1.41, + "learning_rate": 8.794056731669002e-05, + "loss": 0.0087, + "step": 545390 + }, + { + "epoch": 1.41, + "learning_rate": 8.793667910031857e-05, + "loss": 0.0096, + "step": 545400 + }, + { + "epoch": 1.41, + "learning_rate": 8.79327908839471e-05, + "loss": 0.0085, + "step": 545410 + }, + { + "epoch": 1.41, + "learning_rate": 8.792890266757564e-05, + "loss": 0.0067, + "step": 545420 + }, + { + "epoch": 1.41, + "learning_rate": 8.792501445120417e-05, + "loss": 0.0086, + "step": 545430 + }, + { + "epoch": 1.41, + "learning_rate": 8.792112623483271e-05, + "loss": 0.0092, + "step": 545440 + }, + { + "epoch": 1.41, + "learning_rate": 8.791723801846124e-05, + "loss": 0.0086, + "step": 545450 + }, + { + "epoch": 1.41, + "learning_rate": 8.791334980208978e-05, + "loss": 0.0087, + "step": 545460 + }, + { + "epoch": 1.41, + "learning_rate": 8.790946158571831e-05, + "loss": 0.0082, + "step": 545470 + }, + { + "epoch": 1.41, + "learning_rate": 8.790557336934685e-05, + "loss": 0.0099, + "step": 545480 + }, + { + "epoch": 1.41, + "learning_rate": 8.790168515297538e-05, + "loss": 0.0092, + "step": 545490 + }, + { + "epoch": 1.41, + "learning_rate": 8.789779693660392e-05, + "loss": 0.009, + "step": 545500 + }, + { + "epoch": 1.41, + "learning_rate": 8.789390872023245e-05, + "loss": 0.011, + "step": 545510 + }, + { + "epoch": 1.41, + "learning_rate": 8.789002050386099e-05, + "loss": 0.0088, + "step": 545520 + }, + { + "epoch": 1.41, + "learning_rate": 8.788613228748952e-05, + "loss": 0.0108, + "step": 545530 + }, + { + "epoch": 1.41, + "learning_rate": 8.788224407111806e-05, + "loss": 0.0118, + "step": 545540 + }, + { + "epoch": 1.41, + "learning_rate": 8.787835585474659e-05, + "loss": 0.0091, + "step": 545550 + }, + { + "epoch": 1.41, + "learning_rate": 8.787446763837515e-05, + "loss": 0.008, + "step": 545560 + }, + { + "epoch": 1.41, + "learning_rate": 8.787057942200367e-05, + "loss": 0.0119, + "step": 545570 + }, + { + "epoch": 1.41, + "learning_rate": 8.786669120563222e-05, + "loss": 0.0104, + "step": 545580 + }, + { + "epoch": 1.41, + "learning_rate": 8.786280298926074e-05, + "loss": 0.0102, + "step": 545590 + }, + { + "epoch": 1.41, + "learning_rate": 8.785891477288927e-05, + "loss": 0.0268, + "step": 545600 + }, + { + "epoch": 1.41, + "learning_rate": 8.785502655651781e-05, + "loss": 0.0087, + "step": 545610 + }, + { + "epoch": 1.41, + "learning_rate": 8.785113834014634e-05, + "loss": 0.0102, + "step": 545620 + }, + { + "epoch": 1.41, + "learning_rate": 8.784725012377488e-05, + "loss": 0.0087, + "step": 545630 + }, + { + "epoch": 1.41, + "learning_rate": 8.784336190740341e-05, + "loss": 0.0119, + "step": 545640 + }, + { + "epoch": 1.41, + "learning_rate": 8.783947369103195e-05, + "loss": 0.0097, + "step": 545650 + }, + { + "epoch": 1.41, + "learning_rate": 8.783558547466048e-05, + "loss": 0.0083, + "step": 545660 + }, + { + "epoch": 1.41, + "learning_rate": 8.783169725828902e-05, + "loss": 0.0101, + "step": 545670 + }, + { + "epoch": 1.41, + "learning_rate": 8.782780904191755e-05, + "loss": 0.0115, + "step": 545680 + }, + { + "epoch": 1.41, + "learning_rate": 8.782392082554609e-05, + "loss": 0.0086, + "step": 545690 + }, + { + "epoch": 1.41, + "learning_rate": 8.782003260917462e-05, + "loss": 0.0068, + "step": 545700 + }, + { + "epoch": 1.41, + "learning_rate": 8.781614439280316e-05, + "loss": 0.0078, + "step": 545710 + }, + { + "epoch": 1.41, + "learning_rate": 8.781225617643169e-05, + "loss": 0.0127, + "step": 545720 + }, + { + "epoch": 1.41, + "learning_rate": 8.780836796006025e-05, + "loss": 0.0123, + "step": 545730 + }, + { + "epoch": 1.41, + "learning_rate": 8.780447974368876e-05, + "loss": 0.0111, + "step": 545740 + }, + { + "epoch": 1.41, + "learning_rate": 8.780059152731732e-05, + "loss": 0.0104, + "step": 545750 + }, + { + "epoch": 1.41, + "learning_rate": 8.779670331094584e-05, + "loss": 0.0102, + "step": 545760 + }, + { + "epoch": 1.41, + "learning_rate": 8.779281509457438e-05, + "loss": 0.0095, + "step": 545770 + }, + { + "epoch": 1.41, + "learning_rate": 8.778892687820291e-05, + "loss": 0.0085, + "step": 545780 + }, + { + "epoch": 1.41, + "learning_rate": 8.778503866183145e-05, + "loss": 0.007, + "step": 545790 + }, + { + "epoch": 1.41, + "learning_rate": 8.778115044545998e-05, + "loss": 0.0091, + "step": 545800 + }, + { + "epoch": 1.41, + "learning_rate": 8.777726222908852e-05, + "loss": 0.0095, + "step": 545810 + }, + { + "epoch": 1.41, + "learning_rate": 8.777337401271705e-05, + "loss": 0.0078, + "step": 545820 + }, + { + "epoch": 1.41, + "learning_rate": 8.77694857963456e-05, + "loss": 0.0097, + "step": 545830 + }, + { + "epoch": 1.41, + "learning_rate": 8.776559757997412e-05, + "loss": 0.0088, + "step": 545840 + }, + { + "epoch": 1.41, + "learning_rate": 8.776170936360265e-05, + "loss": 0.0093, + "step": 545850 + }, + { + "epoch": 1.41, + "learning_rate": 8.775782114723119e-05, + "loss": 0.0107, + "step": 545860 + }, + { + "epoch": 1.41, + "learning_rate": 8.775393293085972e-05, + "loss": 0.0086, + "step": 545870 + }, + { + "epoch": 1.41, + "learning_rate": 8.775004471448826e-05, + "loss": 0.0095, + "step": 545880 + }, + { + "epoch": 1.42, + "learning_rate": 8.774615649811679e-05, + "loss": 0.0107, + "step": 545890 + }, + { + "epoch": 1.42, + "learning_rate": 8.774226828174533e-05, + "loss": 0.0106, + "step": 545900 + }, + { + "epoch": 1.42, + "learning_rate": 8.773838006537386e-05, + "loss": 0.0117, + "step": 545910 + }, + { + "epoch": 1.42, + "learning_rate": 8.773449184900241e-05, + "loss": 0.0093, + "step": 545920 + }, + { + "epoch": 1.42, + "learning_rate": 8.773060363263094e-05, + "loss": 0.008, + "step": 545930 + }, + { + "epoch": 1.42, + "learning_rate": 8.772671541625948e-05, + "loss": 0.009, + "step": 545940 + }, + { + "epoch": 1.42, + "learning_rate": 8.772282719988801e-05, + "loss": 0.0123, + "step": 545950 + }, + { + "epoch": 1.42, + "learning_rate": 8.771893898351655e-05, + "loss": 0.0151, + "step": 545960 + }, + { + "epoch": 1.42, + "learning_rate": 8.771505076714508e-05, + "loss": 0.0092, + "step": 545970 + }, + { + "epoch": 1.42, + "learning_rate": 8.771116255077362e-05, + "loss": 0.0125, + "step": 545980 + }, + { + "epoch": 1.42, + "learning_rate": 8.770727433440215e-05, + "loss": 0.0104, + "step": 545990 + }, + { + "epoch": 1.42, + "learning_rate": 8.77033861180307e-05, + "loss": 0.0106, + "step": 546000 + }, + { + "epoch": 1.42, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.0062417564913630486, + "eval_runtime": 107.9696, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 546000 + }, + { + "epoch": 1.42, + "learning_rate": 8.769949790165922e-05, + "loss": 0.0111, + "step": 546010 + }, + { + "epoch": 1.42, + "learning_rate": 8.769560968528776e-05, + "loss": 0.011, + "step": 546020 + }, + { + "epoch": 1.42, + "learning_rate": 8.769172146891629e-05, + "loss": 0.0107, + "step": 546030 + }, + { + "epoch": 1.42, + "learning_rate": 8.768783325254483e-05, + "loss": 0.009, + "step": 546040 + }, + { + "epoch": 1.42, + "learning_rate": 8.768394503617336e-05, + "loss": 0.0074, + "step": 546050 + }, + { + "epoch": 1.42, + "learning_rate": 8.76800568198019e-05, + "loss": 0.011, + "step": 546060 + }, + { + "epoch": 1.42, + "learning_rate": 8.767616860343043e-05, + "loss": 0.0083, + "step": 546070 + }, + { + "epoch": 1.42, + "learning_rate": 8.767228038705899e-05, + "loss": 0.0102, + "step": 546080 + }, + { + "epoch": 1.42, + "learning_rate": 8.76683921706875e-05, + "loss": 0.0097, + "step": 546090 + }, + { + "epoch": 1.42, + "learning_rate": 8.766450395431603e-05, + "loss": 0.0088, + "step": 546100 + }, + { + "epoch": 1.42, + "learning_rate": 8.766061573794458e-05, + "loss": 0.0098, + "step": 546110 + }, + { + "epoch": 1.42, + "learning_rate": 8.765672752157311e-05, + "loss": 0.0142, + "step": 546120 + }, + { + "epoch": 1.42, + "learning_rate": 8.765283930520165e-05, + "loss": 0.0082, + "step": 546130 + }, + { + "epoch": 1.42, + "learning_rate": 8.764895108883018e-05, + "loss": 0.0083, + "step": 546140 + }, + { + "epoch": 1.42, + "learning_rate": 8.764506287245872e-05, + "loss": 0.0102, + "step": 546150 + }, + { + "epoch": 1.42, + "learning_rate": 8.764117465608725e-05, + "loss": 0.0119, + "step": 546160 + }, + { + "epoch": 1.42, + "learning_rate": 8.763728643971579e-05, + "loss": 0.0089, + "step": 546170 + }, + { + "epoch": 1.42, + "learning_rate": 8.763339822334432e-05, + "loss": 0.0088, + "step": 546180 + }, + { + "epoch": 1.42, + "learning_rate": 8.762951000697286e-05, + "loss": 0.0191, + "step": 546190 + }, + { + "epoch": 1.42, + "learning_rate": 8.762562179060139e-05, + "loss": 0.0122, + "step": 546200 + }, + { + "epoch": 1.42, + "learning_rate": 8.762173357422993e-05, + "loss": 0.0108, + "step": 546210 + }, + { + "epoch": 1.42, + "learning_rate": 8.761784535785846e-05, + "loss": 0.0089, + "step": 546220 + }, + { + "epoch": 1.42, + "learning_rate": 8.7613957141487e-05, + "loss": 0.0103, + "step": 546230 + }, + { + "epoch": 1.42, + "learning_rate": 8.761006892511553e-05, + "loss": 0.0117, + "step": 546240 + }, + { + "epoch": 1.42, + "learning_rate": 8.760618070874407e-05, + "loss": 0.0081, + "step": 546250 + }, + { + "epoch": 1.42, + "learning_rate": 8.76022924923726e-05, + "loss": 0.0086, + "step": 546260 + }, + { + "epoch": 1.42, + "learning_rate": 8.759840427600115e-05, + "loss": 0.0092, + "step": 546270 + }, + { + "epoch": 1.42, + "learning_rate": 8.759451605962968e-05, + "loss": 0.0086, + "step": 546280 + }, + { + "epoch": 1.42, + "learning_rate": 8.759062784325822e-05, + "loss": 0.0114, + "step": 546290 + }, + { + "epoch": 1.42, + "learning_rate": 8.758673962688675e-05, + "loss": 0.0112, + "step": 546300 + }, + { + "epoch": 1.42, + "learning_rate": 8.75828514105153e-05, + "loss": 0.0085, + "step": 546310 + }, + { + "epoch": 1.42, + "learning_rate": 8.757896319414382e-05, + "loss": 0.0122, + "step": 546320 + }, + { + "epoch": 1.42, + "learning_rate": 8.757507497777236e-05, + "loss": 0.0078, + "step": 546330 + }, + { + "epoch": 1.42, + "learning_rate": 8.757118676140089e-05, + "loss": 0.0103, + "step": 546340 + }, + { + "epoch": 1.42, + "learning_rate": 8.756729854502942e-05, + "loss": 0.0081, + "step": 546350 + }, + { + "epoch": 1.42, + "learning_rate": 8.756341032865796e-05, + "loss": 0.01, + "step": 546360 + }, + { + "epoch": 1.42, + "learning_rate": 8.755952211228649e-05, + "loss": 0.0113, + "step": 546370 + }, + { + "epoch": 1.42, + "learning_rate": 8.755563389591503e-05, + "loss": 0.0077, + "step": 546380 + }, + { + "epoch": 1.42, + "learning_rate": 8.755174567954356e-05, + "loss": 0.0085, + "step": 546390 + }, + { + "epoch": 1.42, + "learning_rate": 8.75478574631721e-05, + "loss": 0.0131, + "step": 546400 + }, + { + "epoch": 1.42, + "learning_rate": 8.754396924680063e-05, + "loss": 0.0116, + "step": 546410 + }, + { + "epoch": 1.42, + "learning_rate": 8.754008103042917e-05, + "loss": 0.0089, + "step": 546420 + }, + { + "epoch": 1.42, + "learning_rate": 8.75361928140577e-05, + "loss": 0.0098, + "step": 546430 + }, + { + "epoch": 1.42, + "learning_rate": 8.753230459768625e-05, + "loss": 0.0065, + "step": 546440 + }, + { + "epoch": 1.42, + "learning_rate": 8.752841638131477e-05, + "loss": 0.009, + "step": 546450 + }, + { + "epoch": 1.42, + "learning_rate": 8.752452816494332e-05, + "loss": 0.009, + "step": 546460 + }, + { + "epoch": 1.42, + "learning_rate": 8.752063994857185e-05, + "loss": 0.0101, + "step": 546470 + }, + { + "epoch": 1.42, + "learning_rate": 8.75167517322004e-05, + "loss": 0.0093, + "step": 546480 + }, + { + "epoch": 1.42, + "learning_rate": 8.751286351582892e-05, + "loss": 0.0085, + "step": 546490 + }, + { + "epoch": 1.42, + "learning_rate": 8.750897529945746e-05, + "loss": 0.0088, + "step": 546500 + }, + { + "epoch": 1.42, + "learning_rate": 8.750508708308599e-05, + "loss": 0.0091, + "step": 546510 + }, + { + "epoch": 1.42, + "learning_rate": 8.750119886671453e-05, + "loss": 0.0082, + "step": 546520 + }, + { + "epoch": 1.42, + "learning_rate": 8.749731065034306e-05, + "loss": 0.0102, + "step": 546530 + }, + { + "epoch": 1.42, + "learning_rate": 8.74934224339716e-05, + "loss": 0.0089, + "step": 546540 + }, + { + "epoch": 1.42, + "learning_rate": 8.748953421760013e-05, + "loss": 0.0094, + "step": 546550 + }, + { + "epoch": 1.42, + "learning_rate": 8.748564600122867e-05, + "loss": 0.0071, + "step": 546560 + }, + { + "epoch": 1.42, + "learning_rate": 8.74817577848572e-05, + "loss": 0.0082, + "step": 546570 + }, + { + "epoch": 1.42, + "learning_rate": 8.747786956848573e-05, + "loss": 0.0095, + "step": 546580 + }, + { + "epoch": 1.42, + "learning_rate": 8.747398135211427e-05, + "loss": 0.008, + "step": 546590 + }, + { + "epoch": 1.42, + "learning_rate": 8.74700931357428e-05, + "loss": 0.0088, + "step": 546600 + }, + { + "epoch": 1.42, + "learning_rate": 8.746620491937134e-05, + "loss": 0.0109, + "step": 546610 + }, + { + "epoch": 1.42, + "learning_rate": 8.746231670299987e-05, + "loss": 0.0116, + "step": 546620 + }, + { + "epoch": 1.42, + "learning_rate": 8.745842848662842e-05, + "loss": 0.0105, + "step": 546630 + }, + { + "epoch": 1.42, + "learning_rate": 8.745454027025695e-05, + "loss": 0.0088, + "step": 546640 + }, + { + "epoch": 1.42, + "learning_rate": 8.745065205388549e-05, + "loss": 0.0091, + "step": 546650 + }, + { + "epoch": 1.42, + "learning_rate": 8.744676383751402e-05, + "loss": 0.0087, + "step": 546660 + }, + { + "epoch": 1.42, + "learning_rate": 8.744287562114256e-05, + "loss": 0.0093, + "step": 546670 + }, + { + "epoch": 1.42, + "learning_rate": 8.743898740477109e-05, + "loss": 0.014, + "step": 546680 + }, + { + "epoch": 1.42, + "learning_rate": 8.743509918839963e-05, + "loss": 0.0103, + "step": 546690 + }, + { + "epoch": 1.42, + "learning_rate": 8.743121097202816e-05, + "loss": 0.0106, + "step": 546700 + }, + { + "epoch": 1.42, + "learning_rate": 8.74273227556567e-05, + "loss": 0.0077, + "step": 546710 + }, + { + "epoch": 1.42, + "learning_rate": 8.742343453928523e-05, + "loss": 0.0134, + "step": 546720 + }, + { + "epoch": 1.42, + "learning_rate": 8.741954632291377e-05, + "loss": 0.0115, + "step": 546730 + }, + { + "epoch": 1.42, + "learning_rate": 8.74156581065423e-05, + "loss": 0.0125, + "step": 546740 + }, + { + "epoch": 1.42, + "learning_rate": 8.741176989017084e-05, + "loss": 0.0092, + "step": 546750 + }, + { + "epoch": 1.42, + "learning_rate": 8.740788167379937e-05, + "loss": 0.0131, + "step": 546760 + }, + { + "epoch": 1.42, + "learning_rate": 8.740399345742791e-05, + "loss": 0.0104, + "step": 546770 + }, + { + "epoch": 1.42, + "learning_rate": 8.740010524105644e-05, + "loss": 0.0199, + "step": 546780 + }, + { + "epoch": 1.42, + "learning_rate": 8.7396217024685e-05, + "loss": 0.0087, + "step": 546790 + }, + { + "epoch": 1.42, + "learning_rate": 8.739232880831352e-05, + "loss": 0.0074, + "step": 546800 + }, + { + "epoch": 1.42, + "learning_rate": 8.738844059194206e-05, + "loss": 0.009, + "step": 546810 + }, + { + "epoch": 1.42, + "learning_rate": 8.738455237557059e-05, + "loss": 0.0096, + "step": 546820 + }, + { + "epoch": 1.42, + "learning_rate": 8.738066415919912e-05, + "loss": 0.0109, + "step": 546830 + }, + { + "epoch": 1.42, + "learning_rate": 8.737677594282766e-05, + "loss": 0.0083, + "step": 546840 + }, + { + "epoch": 1.42, + "learning_rate": 8.737288772645619e-05, + "loss": 0.0079, + "step": 546850 + }, + { + "epoch": 1.42, + "learning_rate": 8.736899951008473e-05, + "loss": 0.0125, + "step": 546860 + }, + { + "epoch": 1.42, + "learning_rate": 8.736511129371326e-05, + "loss": 0.0096, + "step": 546870 + }, + { + "epoch": 1.42, + "learning_rate": 8.73612230773418e-05, + "loss": 0.0077, + "step": 546880 + }, + { + "epoch": 1.42, + "learning_rate": 8.735733486097033e-05, + "loss": 0.0087, + "step": 546890 + }, + { + "epoch": 1.42, + "learning_rate": 8.735344664459887e-05, + "loss": 0.0093, + "step": 546900 + }, + { + "epoch": 1.42, + "learning_rate": 8.73495584282274e-05, + "loss": 0.0107, + "step": 546910 + }, + { + "epoch": 1.42, + "learning_rate": 8.734567021185594e-05, + "loss": 0.0095, + "step": 546920 + }, + { + "epoch": 1.42, + "learning_rate": 8.734178199548447e-05, + "loss": 0.0086, + "step": 546930 + }, + { + "epoch": 1.42, + "learning_rate": 8.733789377911301e-05, + "loss": 0.01, + "step": 546940 + }, + { + "epoch": 1.42, + "learning_rate": 8.733400556274154e-05, + "loss": 0.0103, + "step": 546950 + }, + { + "epoch": 1.42, + "learning_rate": 8.73301173463701e-05, + "loss": 0.0094, + "step": 546960 + }, + { + "epoch": 1.42, + "learning_rate": 8.732622912999861e-05, + "loss": 0.0065, + "step": 546970 + }, + { + "epoch": 1.42, + "learning_rate": 8.732234091362716e-05, + "loss": 0.0097, + "step": 546980 + }, + { + "epoch": 1.42, + "learning_rate": 8.731845269725569e-05, + "loss": 0.0063, + "step": 546990 + }, + { + "epoch": 1.42, + "learning_rate": 8.731456448088423e-05, + "loss": 0.0099, + "step": 547000 + }, + { + "epoch": 1.42, + "eval_cer": 0.8817166826925096, + "eval_loss": 0.006214640568941832, + "eval_runtime": 107.961, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, + "step": 547000 + }, + { + "epoch": 1.42, + "learning_rate": 8.731067626451276e-05, + "loss": 0.0073, + "step": 547010 + }, + { + "epoch": 1.42, + "learning_rate": 8.73067880481413e-05, + "loss": 0.0112, + "step": 547020 + }, + { + "epoch": 1.42, + "learning_rate": 8.730289983176983e-05, + "loss": 0.0091, + "step": 547030 + }, + { + "epoch": 1.42, + "learning_rate": 8.729901161539837e-05, + "loss": 0.0102, + "step": 547040 + }, + { + "epoch": 1.42, + "learning_rate": 8.72951233990269e-05, + "loss": 0.0082, + "step": 547050 + }, + { + "epoch": 1.42, + "learning_rate": 8.729123518265544e-05, + "loss": 0.013, + "step": 547060 + }, + { + "epoch": 1.42, + "learning_rate": 8.728734696628397e-05, + "loss": 0.0079, + "step": 547070 + }, + { + "epoch": 1.42, + "learning_rate": 8.72834587499125e-05, + "loss": 0.0089, + "step": 547080 + }, + { + "epoch": 1.42, + "learning_rate": 8.727957053354104e-05, + "loss": 0.0096, + "step": 547090 + }, + { + "epoch": 1.42, + "learning_rate": 8.727568231716957e-05, + "loss": 0.0118, + "step": 547100 + }, + { + "epoch": 1.42, + "learning_rate": 8.727179410079811e-05, + "loss": 0.0097, + "step": 547110 + }, + { + "epoch": 1.42, + "learning_rate": 8.726790588442664e-05, + "loss": 0.0093, + "step": 547120 + }, + { + "epoch": 1.42, + "learning_rate": 8.726401766805518e-05, + "loss": 0.009, + "step": 547130 + }, + { + "epoch": 1.42, + "learning_rate": 8.726012945168371e-05, + "loss": 0.0083, + "step": 547140 + }, + { + "epoch": 1.42, + "learning_rate": 8.725624123531226e-05, + "loss": 0.0072, + "step": 547150 + }, + { + "epoch": 1.42, + "learning_rate": 8.725235301894079e-05, + "loss": 0.0117, + "step": 547160 + }, + { + "epoch": 1.42, + "learning_rate": 8.724846480256933e-05, + "loss": 0.0124, + "step": 547170 + }, + { + "epoch": 1.42, + "learning_rate": 8.724457658619786e-05, + "loss": 0.008, + "step": 547180 + }, + { + "epoch": 1.42, + "learning_rate": 8.72406883698264e-05, + "loss": 0.0119, + "step": 547190 + }, + { + "epoch": 1.42, + "learning_rate": 8.723680015345493e-05, + "loss": 0.0103, + "step": 547200 + }, + { + "epoch": 1.42, + "learning_rate": 8.723291193708347e-05, + "loss": 0.0113, + "step": 547210 + }, + { + "epoch": 1.42, + "learning_rate": 8.7229023720712e-05, + "loss": 0.0114, + "step": 547220 + }, + { + "epoch": 1.42, + "learning_rate": 8.722513550434054e-05, + "loss": 0.0084, + "step": 547230 + }, + { + "epoch": 1.42, + "learning_rate": 8.722124728796907e-05, + "loss": 0.0082, + "step": 547240 + }, + { + "epoch": 1.42, + "learning_rate": 8.721735907159761e-05, + "loss": 0.0086, + "step": 547250 + }, + { + "epoch": 1.42, + "learning_rate": 8.721347085522614e-05, + "loss": 0.0113, + "step": 547260 + }, + { + "epoch": 1.42, + "learning_rate": 8.720958263885468e-05, + "loss": 0.0079, + "step": 547270 + }, + { + "epoch": 1.42, + "learning_rate": 8.720569442248321e-05, + "loss": 0.0095, + "step": 547280 + }, + { + "epoch": 1.42, + "learning_rate": 8.720180620611175e-05, + "loss": 0.0095, + "step": 547290 + }, + { + "epoch": 1.42, + "learning_rate": 8.719791798974028e-05, + "loss": 0.0106, + "step": 547300 + }, + { + "epoch": 1.42, + "learning_rate": 8.719402977336883e-05, + "loss": 0.0101, + "step": 547310 + }, + { + "epoch": 1.42, + "learning_rate": 8.719014155699736e-05, + "loss": 0.008, + "step": 547320 + }, + { + "epoch": 1.42, + "learning_rate": 8.718625334062588e-05, + "loss": 0.0106, + "step": 547330 + }, + { + "epoch": 1.42, + "learning_rate": 8.718236512425443e-05, + "loss": 0.0096, + "step": 547340 + }, + { + "epoch": 1.42, + "learning_rate": 8.717847690788296e-05, + "loss": 0.0083, + "step": 547350 + }, + { + "epoch": 1.42, + "learning_rate": 8.71745886915115e-05, + "loss": 0.0095, + "step": 547360 + }, + { + "epoch": 1.42, + "learning_rate": 8.717070047514003e-05, + "loss": 0.0098, + "step": 547370 + }, + { + "epoch": 1.42, + "learning_rate": 8.716681225876857e-05, + "loss": 0.0094, + "step": 547380 + }, + { + "epoch": 1.42, + "learning_rate": 8.71629240423971e-05, + "loss": 0.0106, + "step": 547390 + }, + { + "epoch": 1.42, + "learning_rate": 8.715903582602564e-05, + "loss": 0.01, + "step": 547400 + }, + { + "epoch": 1.42, + "learning_rate": 8.715514760965417e-05, + "loss": 0.012, + "step": 547410 + }, + { + "epoch": 1.42, + "learning_rate": 8.715125939328271e-05, + "loss": 0.0087, + "step": 547420 + }, + { + "epoch": 1.42, + "learning_rate": 8.714737117691124e-05, + "loss": 0.0088, + "step": 547430 + }, + { + "epoch": 1.42, + "learning_rate": 8.714348296053978e-05, + "loss": 0.0103, + "step": 547440 + }, + { + "epoch": 1.42, + "learning_rate": 8.713959474416831e-05, + "loss": 0.0084, + "step": 547450 + }, + { + "epoch": 1.42, + "learning_rate": 8.713570652779685e-05, + "loss": 0.0096, + "step": 547460 + }, + { + "epoch": 1.42, + "learning_rate": 8.713181831142538e-05, + "loss": 0.0077, + "step": 547470 + }, + { + "epoch": 1.42, + "learning_rate": 8.712793009505392e-05, + "loss": 0.0113, + "step": 547480 + }, + { + "epoch": 1.42, + "learning_rate": 8.712404187868245e-05, + "loss": 0.0078, + "step": 547490 + }, + { + "epoch": 1.42, + "learning_rate": 8.7120153662311e-05, + "loss": 0.0079, + "step": 547500 + }, + { + "epoch": 1.42, + "learning_rate": 8.711626544593953e-05, + "loss": 0.0087, + "step": 547510 + }, + { + "epoch": 1.42, + "learning_rate": 8.711237722956807e-05, + "loss": 0.0079, + "step": 547520 + }, + { + "epoch": 1.42, + "learning_rate": 8.71084890131966e-05, + "loss": 0.0136, + "step": 547530 + }, + { + "epoch": 1.42, + "learning_rate": 8.710460079682514e-05, + "loss": 0.0091, + "step": 547540 + }, + { + "epoch": 1.42, + "learning_rate": 8.710071258045367e-05, + "loss": 0.0109, + "step": 547550 + }, + { + "epoch": 1.42, + "learning_rate": 8.709682436408221e-05, + "loss": 0.0087, + "step": 547560 + }, + { + "epoch": 1.42, + "learning_rate": 8.709293614771074e-05, + "loss": 0.0109, + "step": 547570 + }, + { + "epoch": 1.42, + "learning_rate": 8.708904793133927e-05, + "loss": 0.0072, + "step": 547580 + }, + { + "epoch": 1.42, + "learning_rate": 8.708515971496781e-05, + "loss": 0.0115, + "step": 547590 + }, + { + "epoch": 1.42, + "learning_rate": 8.708127149859634e-05, + "loss": 0.0096, + "step": 547600 + }, + { + "epoch": 1.42, + "learning_rate": 8.707738328222488e-05, + "loss": 0.009, + "step": 547610 + }, + { + "epoch": 1.42, + "learning_rate": 8.707349506585341e-05, + "loss": 0.0084, + "step": 547620 + }, + { + "epoch": 1.42, + "learning_rate": 8.706960684948195e-05, + "loss": 0.0081, + "step": 547630 + }, + { + "epoch": 1.42, + "learning_rate": 8.706571863311048e-05, + "loss": 0.0095, + "step": 547640 + }, + { + "epoch": 1.42, + "learning_rate": 8.706183041673902e-05, + "loss": 0.0066, + "step": 547650 + }, + { + "epoch": 1.42, + "learning_rate": 8.705794220036755e-05, + "loss": 0.0114, + "step": 547660 + }, + { + "epoch": 1.42, + "learning_rate": 8.70540539839961e-05, + "loss": 0.0077, + "step": 547670 + }, + { + "epoch": 1.42, + "learning_rate": 8.705016576762462e-05, + "loss": 0.0103, + "step": 547680 + }, + { + "epoch": 1.42, + "learning_rate": 8.704627755125317e-05, + "loss": 0.0098, + "step": 547690 + }, + { + "epoch": 1.42, + "learning_rate": 8.70423893348817e-05, + "loss": 0.0104, + "step": 547700 + }, + { + "epoch": 1.42, + "learning_rate": 8.703850111851024e-05, + "loss": 0.0083, + "step": 547710 + }, + { + "epoch": 1.42, + "learning_rate": 8.703461290213877e-05, + "loss": 0.01, + "step": 547720 + }, + { + "epoch": 1.42, + "learning_rate": 8.703072468576731e-05, + "loss": 0.0084, + "step": 547730 + }, + { + "epoch": 1.42, + "learning_rate": 8.702683646939584e-05, + "loss": 0.0098, + "step": 547740 + }, + { + "epoch": 1.42, + "learning_rate": 8.702294825302438e-05, + "loss": 0.0096, + "step": 547750 + }, + { + "epoch": 1.42, + "learning_rate": 8.701906003665291e-05, + "loss": 0.0101, + "step": 547760 + }, + { + "epoch": 1.42, + "learning_rate": 8.701517182028145e-05, + "loss": 0.012, + "step": 547770 + }, + { + "epoch": 1.42, + "learning_rate": 8.701128360390998e-05, + "loss": 0.0075, + "step": 547780 + }, + { + "epoch": 1.42, + "learning_rate": 8.700739538753852e-05, + "loss": 0.0079, + "step": 547790 + }, + { + "epoch": 1.42, + "learning_rate": 8.700350717116705e-05, + "loss": 0.0074, + "step": 547800 + }, + { + "epoch": 1.42, + "learning_rate": 8.699961895479559e-05, + "loss": 0.0106, + "step": 547810 + }, + { + "epoch": 1.42, + "learning_rate": 8.699573073842412e-05, + "loss": 0.009, + "step": 547820 + }, + { + "epoch": 1.42, + "learning_rate": 8.699184252205265e-05, + "loss": 0.0073, + "step": 547830 + }, + { + "epoch": 1.42, + "learning_rate": 8.698795430568119e-05, + "loss": 0.0093, + "step": 547840 + }, + { + "epoch": 1.42, + "learning_rate": 8.698406608930972e-05, + "loss": 0.0103, + "step": 547850 + }, + { + "epoch": 1.42, + "learning_rate": 8.698017787293827e-05, + "loss": 0.0104, + "step": 547860 + }, + { + "epoch": 1.42, + "learning_rate": 8.69762896565668e-05, + "loss": 0.0068, + "step": 547870 + }, + { + "epoch": 1.42, + "learning_rate": 8.697240144019534e-05, + "loss": 0.0095, + "step": 547880 + }, + { + "epoch": 1.42, + "learning_rate": 8.696851322382387e-05, + "loss": 0.0102, + "step": 547890 + }, + { + "epoch": 1.42, + "learning_rate": 8.696462500745241e-05, + "loss": 0.0087, + "step": 547900 + }, + { + "epoch": 1.42, + "learning_rate": 8.696073679108094e-05, + "loss": 0.0109, + "step": 547910 + }, + { + "epoch": 1.42, + "learning_rate": 8.695684857470948e-05, + "loss": 0.0085, + "step": 547920 + }, + { + "epoch": 1.42, + "learning_rate": 8.695296035833801e-05, + "loss": 0.0107, + "step": 547930 + }, + { + "epoch": 1.42, + "learning_rate": 8.694907214196655e-05, + "loss": 0.0088, + "step": 547940 + }, + { + "epoch": 1.42, + "learning_rate": 8.694518392559508e-05, + "loss": 0.0098, + "step": 547950 + }, + { + "epoch": 1.42, + "learning_rate": 8.694129570922362e-05, + "loss": 0.0084, + "step": 547960 + }, + { + "epoch": 1.42, + "learning_rate": 8.693740749285215e-05, + "loss": 0.0078, + "step": 547970 + }, + { + "epoch": 1.42, + "learning_rate": 8.693351927648069e-05, + "loss": 0.0102, + "step": 547980 + }, + { + "epoch": 1.42, + "learning_rate": 8.692963106010922e-05, + "loss": 0.0094, + "step": 547990 + }, + { + "epoch": 1.42, + "learning_rate": 8.692574284373776e-05, + "loss": 0.0095, + "step": 548000 + }, + { + "epoch": 1.42, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.006283493246883154, + "eval_runtime": 107.9445, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 548000 + }, + { + "epoch": 1.42, + "learning_rate": 8.692185462736629e-05, + "loss": 0.0106, + "step": 548010 + }, + { + "epoch": 1.42, + "learning_rate": 8.691796641099484e-05, + "loss": 0.0085, + "step": 548020 + }, + { + "epoch": 1.42, + "learning_rate": 8.691407819462337e-05, + "loss": 0.01, + "step": 548030 + }, + { + "epoch": 1.42, + "learning_rate": 8.691018997825191e-05, + "loss": 0.0101, + "step": 548040 + }, + { + "epoch": 1.42, + "learning_rate": 8.690630176188044e-05, + "loss": 0.0127, + "step": 548050 + }, + { + "epoch": 1.42, + "learning_rate": 8.690241354550898e-05, + "loss": 0.0071, + "step": 548060 + }, + { + "epoch": 1.42, + "learning_rate": 8.689852532913751e-05, + "loss": 0.0091, + "step": 548070 + }, + { + "epoch": 1.42, + "learning_rate": 8.689463711276604e-05, + "loss": 0.0113, + "step": 548080 + }, + { + "epoch": 1.42, + "learning_rate": 8.689074889639458e-05, + "loss": 0.0084, + "step": 548090 + }, + { + "epoch": 1.42, + "learning_rate": 8.688686068002311e-05, + "loss": 0.0104, + "step": 548100 + }, + { + "epoch": 1.42, + "learning_rate": 8.688297246365165e-05, + "loss": 0.01, + "step": 548110 + }, + { + "epoch": 1.42, + "learning_rate": 8.687908424728018e-05, + "loss": 0.0078, + "step": 548120 + }, + { + "epoch": 1.42, + "learning_rate": 8.687519603090872e-05, + "loss": 0.0088, + "step": 548130 + }, + { + "epoch": 1.42, + "learning_rate": 8.687130781453725e-05, + "loss": 0.0099, + "step": 548140 + }, + { + "epoch": 1.42, + "learning_rate": 8.686741959816579e-05, + "loss": 0.0079, + "step": 548150 + }, + { + "epoch": 1.42, + "learning_rate": 8.686353138179432e-05, + "loss": 0.0109, + "step": 548160 + }, + { + "epoch": 1.42, + "learning_rate": 8.685964316542286e-05, + "loss": 0.0098, + "step": 548170 + }, + { + "epoch": 1.42, + "learning_rate": 8.685575494905139e-05, + "loss": 0.0072, + "step": 548180 + }, + { + "epoch": 1.42, + "learning_rate": 8.685186673267994e-05, + "loss": 0.0092, + "step": 548190 + }, + { + "epoch": 1.42, + "learning_rate": 8.684797851630846e-05, + "loss": 0.0096, + "step": 548200 + }, + { + "epoch": 1.42, + "learning_rate": 8.684409029993701e-05, + "loss": 0.0092, + "step": 548210 + }, + { + "epoch": 1.42, + "learning_rate": 8.684020208356554e-05, + "loss": 0.0115, + "step": 548220 + }, + { + "epoch": 1.42, + "learning_rate": 8.683631386719408e-05, + "loss": 0.0107, + "step": 548230 + }, + { + "epoch": 1.42, + "learning_rate": 8.683242565082261e-05, + "loss": 0.0109, + "step": 548240 + }, + { + "epoch": 1.42, + "learning_rate": 8.682853743445115e-05, + "loss": 0.0086, + "step": 548250 + }, + { + "epoch": 1.42, + "learning_rate": 8.682464921807968e-05, + "loss": 0.0096, + "step": 548260 + }, + { + "epoch": 1.42, + "learning_rate": 8.682076100170822e-05, + "loss": 0.0074, + "step": 548270 + }, + { + "epoch": 1.42, + "learning_rate": 8.681687278533675e-05, + "loss": 0.0073, + "step": 548280 + }, + { + "epoch": 1.42, + "learning_rate": 8.681298456896529e-05, + "loss": 0.0077, + "step": 548290 + }, + { + "epoch": 1.42, + "learning_rate": 8.680909635259382e-05, + "loss": 0.0116, + "step": 548300 + }, + { + "epoch": 1.42, + "learning_rate": 8.680520813622236e-05, + "loss": 0.01, + "step": 548310 + }, + { + "epoch": 1.42, + "learning_rate": 8.680131991985089e-05, + "loss": 0.0115, + "step": 548320 + }, + { + "epoch": 1.42, + "learning_rate": 8.679743170347942e-05, + "loss": 0.0081, + "step": 548330 + }, + { + "epoch": 1.42, + "learning_rate": 8.679354348710796e-05, + "loss": 0.0078, + "step": 548340 + }, + { + "epoch": 1.42, + "learning_rate": 8.678965527073649e-05, + "loss": 0.0105, + "step": 548350 + }, + { + "epoch": 1.42, + "learning_rate": 8.678576705436503e-05, + "loss": 0.008, + "step": 548360 + }, + { + "epoch": 1.42, + "learning_rate": 8.678187883799356e-05, + "loss": 0.0089, + "step": 548370 + }, + { + "epoch": 1.42, + "learning_rate": 8.677799062162211e-05, + "loss": 0.0094, + "step": 548380 + }, + { + "epoch": 1.42, + "learning_rate": 8.677410240525064e-05, + "loss": 0.0071, + "step": 548390 + }, + { + "epoch": 1.42, + "learning_rate": 8.677021418887918e-05, + "loss": 0.0116, + "step": 548400 + }, + { + "epoch": 1.42, + "learning_rate": 8.676632597250771e-05, + "loss": 0.0132, + "step": 548410 + }, + { + "epoch": 1.42, + "learning_rate": 8.676243775613625e-05, + "loss": 0.0079, + "step": 548420 + }, + { + "epoch": 1.42, + "learning_rate": 8.675854953976478e-05, + "loss": 0.0092, + "step": 548430 + }, + { + "epoch": 1.42, + "learning_rate": 8.675466132339332e-05, + "loss": 0.0102, + "step": 548440 + }, + { + "epoch": 1.42, + "learning_rate": 8.675077310702185e-05, + "loss": 0.0074, + "step": 548450 + }, + { + "epoch": 1.42, + "learning_rate": 8.674688489065039e-05, + "loss": 0.0074, + "step": 548460 + }, + { + "epoch": 1.42, + "learning_rate": 8.674299667427892e-05, + "loss": 0.0066, + "step": 548470 + }, + { + "epoch": 1.42, + "learning_rate": 8.673910845790746e-05, + "loss": 0.0122, + "step": 548480 + }, + { + "epoch": 1.42, + "learning_rate": 8.673522024153599e-05, + "loss": 0.0116, + "step": 548490 + }, + { + "epoch": 1.42, + "learning_rate": 8.673133202516453e-05, + "loss": 0.0089, + "step": 548500 + }, + { + "epoch": 1.42, + "learning_rate": 8.672744380879306e-05, + "loss": 0.0077, + "step": 548510 + }, + { + "epoch": 1.42, + "learning_rate": 8.67235555924216e-05, + "loss": 0.0091, + "step": 548520 + }, + { + "epoch": 1.42, + "learning_rate": 8.671966737605013e-05, + "loss": 0.0092, + "step": 548530 + }, + { + "epoch": 1.42, + "learning_rate": 8.671577915967868e-05, + "loss": 0.0119, + "step": 548540 + }, + { + "epoch": 1.42, + "learning_rate": 8.671189094330721e-05, + "loss": 0.0109, + "step": 548550 + }, + { + "epoch": 1.42, + "learning_rate": 8.670800272693575e-05, + "loss": 0.0082, + "step": 548560 + }, + { + "epoch": 1.42, + "learning_rate": 8.670411451056428e-05, + "loss": 0.0091, + "step": 548570 + }, + { + "epoch": 1.42, + "learning_rate": 8.670022629419281e-05, + "loss": 0.0094, + "step": 548580 + }, + { + "epoch": 1.42, + "learning_rate": 8.669633807782135e-05, + "loss": 0.0062, + "step": 548590 + }, + { + "epoch": 1.42, + "learning_rate": 8.669244986144988e-05, + "loss": 0.0109, + "step": 548600 + }, + { + "epoch": 1.42, + "learning_rate": 8.668856164507842e-05, + "loss": 0.0097, + "step": 548610 + }, + { + "epoch": 1.42, + "learning_rate": 8.668467342870695e-05, + "loss": 0.0133, + "step": 548620 + }, + { + "epoch": 1.42, + "learning_rate": 8.668078521233549e-05, + "loss": 0.0092, + "step": 548630 + }, + { + "epoch": 1.42, + "learning_rate": 8.667689699596402e-05, + "loss": 0.0089, + "step": 548640 + }, + { + "epoch": 1.42, + "learning_rate": 8.667300877959256e-05, + "loss": 0.0121, + "step": 548650 + }, + { + "epoch": 1.42, + "learning_rate": 8.666912056322109e-05, + "loss": 0.0088, + "step": 548660 + }, + { + "epoch": 1.42, + "learning_rate": 8.666523234684963e-05, + "loss": 0.0084, + "step": 548670 + }, + { + "epoch": 1.42, + "learning_rate": 8.666134413047816e-05, + "loss": 0.009, + "step": 548680 + }, + { + "epoch": 1.42, + "learning_rate": 8.66574559141067e-05, + "loss": 0.01, + "step": 548690 + }, + { + "epoch": 1.42, + "learning_rate": 8.665356769773523e-05, + "loss": 0.008, + "step": 548700 + }, + { + "epoch": 1.42, + "learning_rate": 8.664967948136377e-05, + "loss": 0.0084, + "step": 548710 + }, + { + "epoch": 1.42, + "learning_rate": 8.66457912649923e-05, + "loss": 0.0077, + "step": 548720 + }, + { + "epoch": 1.42, + "learning_rate": 8.664190304862085e-05, + "loss": 0.0092, + "step": 548730 + }, + { + "epoch": 1.42, + "learning_rate": 8.663801483224938e-05, + "loss": 0.0097, + "step": 548740 + }, + { + "epoch": 1.42, + "learning_rate": 8.663412661587792e-05, + "loss": 0.0091, + "step": 548750 + }, + { + "epoch": 1.42, + "learning_rate": 8.663023839950645e-05, + "loss": 0.0098, + "step": 548760 + }, + { + "epoch": 1.42, + "learning_rate": 8.662635018313499e-05, + "loss": 0.011, + "step": 548770 + }, + { + "epoch": 1.42, + "learning_rate": 8.662246196676352e-05, + "loss": 0.0097, + "step": 548780 + }, + { + "epoch": 1.42, + "learning_rate": 8.661857375039206e-05, + "loss": 0.0137, + "step": 548790 + }, + { + "epoch": 1.42, + "learning_rate": 8.661468553402059e-05, + "loss": 0.0141, + "step": 548800 + }, + { + "epoch": 1.42, + "learning_rate": 8.661079731764913e-05, + "loss": 0.0101, + "step": 548810 + }, + { + "epoch": 1.42, + "learning_rate": 8.660690910127766e-05, + "loss": 0.0089, + "step": 548820 + }, + { + "epoch": 1.42, + "learning_rate": 8.660302088490619e-05, + "loss": 0.0088, + "step": 548830 + }, + { + "epoch": 1.42, + "learning_rate": 8.659913266853473e-05, + "loss": 0.0147, + "step": 548840 + }, + { + "epoch": 1.42, + "learning_rate": 8.659524445216326e-05, + "loss": 0.0114, + "step": 548850 + }, + { + "epoch": 1.42, + "learning_rate": 8.65913562357918e-05, + "loss": 0.0115, + "step": 548860 + }, + { + "epoch": 1.42, + "learning_rate": 8.658746801942033e-05, + "loss": 0.0089, + "step": 548870 + }, + { + "epoch": 1.42, + "learning_rate": 8.658357980304887e-05, + "loss": 0.0095, + "step": 548880 + }, + { + "epoch": 1.42, + "learning_rate": 8.65796915866774e-05, + "loss": 0.0076, + "step": 548890 + }, + { + "epoch": 1.42, + "learning_rate": 8.657580337030595e-05, + "loss": 0.0099, + "step": 548900 + }, + { + "epoch": 1.42, + "learning_rate": 8.657191515393447e-05, + "loss": 0.0092, + "step": 548910 + }, + { + "epoch": 1.42, + "learning_rate": 8.656802693756302e-05, + "loss": 0.0074, + "step": 548920 + }, + { + "epoch": 1.42, + "learning_rate": 8.656413872119155e-05, + "loss": 0.0106, + "step": 548930 + }, + { + "epoch": 1.42, + "learning_rate": 8.656025050482009e-05, + "loss": 0.0095, + "step": 548940 + }, + { + "epoch": 1.42, + "learning_rate": 8.655636228844862e-05, + "loss": 0.0092, + "step": 548950 + }, + { + "epoch": 1.42, + "learning_rate": 8.655247407207716e-05, + "loss": 0.0107, + "step": 548960 + }, + { + "epoch": 1.42, + "learning_rate": 8.654858585570569e-05, + "loss": 0.0085, + "step": 548970 + }, + { + "epoch": 1.42, + "learning_rate": 8.654469763933423e-05, + "loss": 0.0097, + "step": 548980 + }, + { + "epoch": 1.42, + "learning_rate": 8.654080942296276e-05, + "loss": 0.0099, + "step": 548990 + }, + { + "epoch": 1.42, + "learning_rate": 8.65369212065913e-05, + "loss": 0.0107, + "step": 549000 + }, + { + "epoch": 1.42, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.006188477389514446, + "eval_runtime": 107.8567, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 549000 + }, + { + "epoch": 1.42, + "learning_rate": 8.653303299021983e-05, + "loss": 0.01, + "step": 549010 + }, + { + "epoch": 1.42, + "learning_rate": 8.652914477384837e-05, + "loss": 0.0084, + "step": 549020 + }, + { + "epoch": 1.42, + "learning_rate": 8.65252565574769e-05, + "loss": 0.01, + "step": 549030 + }, + { + "epoch": 1.42, + "learning_rate": 8.652136834110544e-05, + "loss": 0.0112, + "step": 549040 + }, + { + "epoch": 1.42, + "learning_rate": 8.651748012473397e-05, + "loss": 0.01, + "step": 549050 + }, + { + "epoch": 1.42, + "learning_rate": 8.65135919083625e-05, + "loss": 0.0092, + "step": 549060 + }, + { + "epoch": 1.42, + "learning_rate": 8.650970369199104e-05, + "loss": 0.0103, + "step": 549070 + }, + { + "epoch": 1.42, + "learning_rate": 8.650581547561957e-05, + "loss": 0.0098, + "step": 549080 + }, + { + "epoch": 1.42, + "learning_rate": 8.650192725924812e-05, + "loss": 0.0072, + "step": 549090 + }, + { + "epoch": 1.42, + "learning_rate": 8.649803904287665e-05, + "loss": 0.0089, + "step": 549100 + }, + { + "epoch": 1.42, + "learning_rate": 8.649415082650519e-05, + "loss": 0.0096, + "step": 549110 + }, + { + "epoch": 1.42, + "learning_rate": 8.649026261013372e-05, + "loss": 0.01, + "step": 549120 + }, + { + "epoch": 1.42, + "learning_rate": 8.648637439376226e-05, + "loss": 0.009, + "step": 549130 + }, + { + "epoch": 1.42, + "learning_rate": 8.648248617739079e-05, + "loss": 0.0091, + "step": 549140 + }, + { + "epoch": 1.42, + "learning_rate": 8.647859796101933e-05, + "loss": 0.0089, + "step": 549150 + }, + { + "epoch": 1.42, + "learning_rate": 8.647470974464786e-05, + "loss": 0.0098, + "step": 549160 + }, + { + "epoch": 1.42, + "learning_rate": 8.64708215282764e-05, + "loss": 0.0068, + "step": 549170 + }, + { + "epoch": 1.42, + "learning_rate": 8.646693331190493e-05, + "loss": 0.0085, + "step": 549180 + }, + { + "epoch": 1.42, + "learning_rate": 8.646304509553347e-05, + "loss": 0.0084, + "step": 549190 + }, + { + "epoch": 1.42, + "learning_rate": 8.6459156879162e-05, + "loss": 0.0089, + "step": 549200 + }, + { + "epoch": 1.42, + "learning_rate": 8.645526866279054e-05, + "loss": 0.0091, + "step": 549210 + }, + { + "epoch": 1.42, + "learning_rate": 8.645138044641907e-05, + "loss": 0.0113, + "step": 549220 + }, + { + "epoch": 1.42, + "learning_rate": 8.644749223004761e-05, + "loss": 0.0084, + "step": 549230 + }, + { + "epoch": 1.42, + "learning_rate": 8.644360401367614e-05, + "loss": 0.0075, + "step": 549240 + }, + { + "epoch": 1.42, + "learning_rate": 8.643971579730469e-05, + "loss": 0.0079, + "step": 549250 + }, + { + "epoch": 1.42, + "learning_rate": 8.643582758093322e-05, + "loss": 0.0107, + "step": 549260 + }, + { + "epoch": 1.42, + "learning_rate": 8.643193936456176e-05, + "loss": 0.0081, + "step": 549270 + }, + { + "epoch": 1.42, + "learning_rate": 8.642805114819029e-05, + "loss": 0.0092, + "step": 549280 + }, + { + "epoch": 1.42, + "learning_rate": 8.642416293181883e-05, + "loss": 0.0089, + "step": 549290 + }, + { + "epoch": 1.42, + "learning_rate": 8.642027471544736e-05, + "loss": 0.0129, + "step": 549300 + }, + { + "epoch": 1.42, + "learning_rate": 8.641638649907589e-05, + "loss": 0.0065, + "step": 549310 + }, + { + "epoch": 1.42, + "learning_rate": 8.641249828270443e-05, + "loss": 0.0107, + "step": 549320 + }, + { + "epoch": 1.42, + "learning_rate": 8.640861006633296e-05, + "loss": 0.0113, + "step": 549330 + }, + { + "epoch": 1.42, + "learning_rate": 8.64047218499615e-05, + "loss": 0.0096, + "step": 549340 + }, + { + "epoch": 1.42, + "learning_rate": 8.640083363359003e-05, + "loss": 0.0103, + "step": 549350 + }, + { + "epoch": 1.42, + "learning_rate": 8.639694541721857e-05, + "loss": 0.0069, + "step": 549360 + }, + { + "epoch": 1.42, + "learning_rate": 8.63930572008471e-05, + "loss": 0.0117, + "step": 549370 + }, + { + "epoch": 1.42, + "learning_rate": 8.638916898447564e-05, + "loss": 0.0109, + "step": 549380 + }, + { + "epoch": 1.42, + "learning_rate": 8.638528076810417e-05, + "loss": 0.0093, + "step": 549390 + }, + { + "epoch": 1.42, + "learning_rate": 8.638139255173271e-05, + "loss": 0.0075, + "step": 549400 + }, + { + "epoch": 1.42, + "learning_rate": 8.637750433536124e-05, + "loss": 0.0101, + "step": 549410 + }, + { + "epoch": 1.42, + "learning_rate": 8.637361611898979e-05, + "loss": 0.0102, + "step": 549420 + }, + { + "epoch": 1.42, + "learning_rate": 8.63697279026183e-05, + "loss": 0.01, + "step": 549430 + }, + { + "epoch": 1.42, + "learning_rate": 8.636583968624686e-05, + "loss": 0.0107, + "step": 549440 + }, + { + "epoch": 1.42, + "learning_rate": 8.636195146987539e-05, + "loss": 0.009, + "step": 549450 + }, + { + "epoch": 1.42, + "learning_rate": 8.635806325350393e-05, + "loss": 0.0103, + "step": 549460 + }, + { + "epoch": 1.42, + "learning_rate": 8.635417503713246e-05, + "loss": 0.0105, + "step": 549470 + }, + { + "epoch": 1.42, + "learning_rate": 8.6350286820761e-05, + "loss": 0.0093, + "step": 549480 + }, + { + "epoch": 1.42, + "learning_rate": 8.634639860438953e-05, + "loss": 0.0101, + "step": 549490 + }, + { + "epoch": 1.42, + "learning_rate": 8.634251038801807e-05, + "loss": 0.0072, + "step": 549500 + }, + { + "epoch": 1.42, + "learning_rate": 8.63386221716466e-05, + "loss": 0.009, + "step": 549510 + }, + { + "epoch": 1.42, + "learning_rate": 8.633473395527514e-05, + "loss": 0.0081, + "step": 549520 + }, + { + "epoch": 1.42, + "learning_rate": 8.633084573890367e-05, + "loss": 0.0098, + "step": 549530 + }, + { + "epoch": 1.42, + "learning_rate": 8.632695752253221e-05, + "loss": 0.0086, + "step": 549540 + }, + { + "epoch": 1.42, + "learning_rate": 8.632306930616074e-05, + "loss": 0.0108, + "step": 549550 + }, + { + "epoch": 1.42, + "learning_rate": 8.631918108978927e-05, + "loss": 0.0096, + "step": 549560 + }, + { + "epoch": 1.42, + "learning_rate": 8.631529287341781e-05, + "loss": 0.0087, + "step": 549570 + }, + { + "epoch": 1.42, + "learning_rate": 8.631140465704634e-05, + "loss": 0.0107, + "step": 549580 + }, + { + "epoch": 1.42, + "learning_rate": 8.630751644067488e-05, + "loss": 0.008, + "step": 549590 + }, + { + "epoch": 1.42, + "learning_rate": 8.63036282243034e-05, + "loss": 0.0087, + "step": 549600 + }, + { + "epoch": 1.42, + "learning_rate": 8.629974000793196e-05, + "loss": 0.0087, + "step": 549610 + }, + { + "epoch": 1.42, + "learning_rate": 8.629585179156049e-05, + "loss": 0.0119, + "step": 549620 + }, + { + "epoch": 1.42, + "learning_rate": 8.629196357518903e-05, + "loss": 0.0106, + "step": 549630 + }, + { + "epoch": 1.42, + "learning_rate": 8.628807535881756e-05, + "loss": 0.0084, + "step": 549640 + }, + { + "epoch": 1.42, + "learning_rate": 8.62841871424461e-05, + "loss": 0.0105, + "step": 549650 + }, + { + "epoch": 1.42, + "learning_rate": 8.628029892607463e-05, + "loss": 0.0084, + "step": 549660 + }, + { + "epoch": 1.42, + "learning_rate": 8.627641070970317e-05, + "loss": 0.007, + "step": 549670 + }, + { + "epoch": 1.42, + "learning_rate": 8.62725224933317e-05, + "loss": 0.0119, + "step": 549680 + }, + { + "epoch": 1.42, + "learning_rate": 8.626863427696024e-05, + "loss": 0.0085, + "step": 549690 + }, + { + "epoch": 1.42, + "learning_rate": 8.626474606058877e-05, + "loss": 0.0094, + "step": 549700 + }, + { + "epoch": 1.42, + "learning_rate": 8.626085784421731e-05, + "loss": 0.0094, + "step": 549710 + }, + { + "epoch": 1.42, + "learning_rate": 8.625696962784584e-05, + "loss": 0.0106, + "step": 549720 + }, + { + "epoch": 1.42, + "learning_rate": 8.625308141147438e-05, + "loss": 0.0103, + "step": 549730 + }, + { + "epoch": 1.43, + "learning_rate": 8.624919319510291e-05, + "loss": 0.0082, + "step": 549740 + }, + { + "epoch": 1.43, + "learning_rate": 8.624530497873145e-05, + "loss": 0.0085, + "step": 549750 + }, + { + "epoch": 1.43, + "learning_rate": 8.624141676235998e-05, + "loss": 0.0079, + "step": 549760 + }, + { + "epoch": 1.43, + "learning_rate": 8.623752854598853e-05, + "loss": 0.0105, + "step": 549770 + }, + { + "epoch": 1.43, + "learning_rate": 8.623364032961706e-05, + "loss": 0.0106, + "step": 549780 + }, + { + "epoch": 1.43, + "learning_rate": 8.62297521132456e-05, + "loss": 0.0078, + "step": 549790 + }, + { + "epoch": 1.43, + "learning_rate": 8.622586389687413e-05, + "loss": 0.0094, + "step": 549800 + }, + { + "epoch": 1.43, + "learning_rate": 8.622197568050266e-05, + "loss": 0.0099, + "step": 549810 + }, + { + "epoch": 1.43, + "learning_rate": 8.62180874641312e-05, + "loss": 0.011, + "step": 549820 + }, + { + "epoch": 1.43, + "learning_rate": 8.621419924775973e-05, + "loss": 0.0088, + "step": 549830 + }, + { + "epoch": 1.43, + "learning_rate": 8.621031103138827e-05, + "loss": 0.0129, + "step": 549840 + }, + { + "epoch": 1.43, + "learning_rate": 8.62064228150168e-05, + "loss": 0.0104, + "step": 549850 + }, + { + "epoch": 1.43, + "learning_rate": 8.620253459864534e-05, + "loss": 0.009, + "step": 549860 + }, + { + "epoch": 1.43, + "learning_rate": 8.619864638227387e-05, + "loss": 0.0105, + "step": 549870 + }, + { + "epoch": 1.43, + "learning_rate": 8.619475816590241e-05, + "loss": 0.01, + "step": 549880 + }, + { + "epoch": 1.43, + "learning_rate": 8.619086994953094e-05, + "loss": 0.009, + "step": 549890 + }, + { + "epoch": 1.43, + "learning_rate": 8.618698173315948e-05, + "loss": 0.008, + "step": 549900 + }, + { + "epoch": 1.43, + "learning_rate": 8.618309351678801e-05, + "loss": 0.0088, + "step": 549910 + }, + { + "epoch": 1.43, + "learning_rate": 8.617920530041655e-05, + "loss": 0.0083, + "step": 549920 + }, + { + "epoch": 1.43, + "learning_rate": 8.617531708404508e-05, + "loss": 0.0108, + "step": 549930 + }, + { + "epoch": 1.43, + "learning_rate": 8.617142886767363e-05, + "loss": 0.0085, + "step": 549940 + }, + { + "epoch": 1.43, + "learning_rate": 8.616754065130215e-05, + "loss": 0.0064, + "step": 549950 + }, + { + "epoch": 1.43, + "learning_rate": 8.61636524349307e-05, + "loss": 0.0099, + "step": 549960 + }, + { + "epoch": 1.43, + "learning_rate": 8.615976421855923e-05, + "loss": 0.0114, + "step": 549970 + }, + { + "epoch": 1.43, + "learning_rate": 8.615587600218777e-05, + "loss": 0.011, + "step": 549980 + }, + { + "epoch": 1.43, + "learning_rate": 8.61519877858163e-05, + "loss": 0.0096, + "step": 549990 + }, + { + "epoch": 1.43, + "learning_rate": 8.614809956944484e-05, + "loss": 0.0107, + "step": 550000 + }, + { + "epoch": 1.43, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.006080552935600281, + "eval_runtime": 107.8759, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 550000 + }, + { + "epoch": 1.43, + "learning_rate": 8.614421135307337e-05, + "loss": 0.0092, + "step": 550010 + }, + { + "epoch": 1.43, + "learning_rate": 8.614032313670191e-05, + "loss": 0.0097, + "step": 550020 + }, + { + "epoch": 1.43, + "learning_rate": 8.613643492033044e-05, + "loss": 0.0081, + "step": 550030 + }, + { + "epoch": 1.43, + "learning_rate": 8.613254670395898e-05, + "loss": 0.01, + "step": 550040 + }, + { + "epoch": 1.43, + "learning_rate": 8.612865848758751e-05, + "loss": 0.0077, + "step": 550050 + }, + { + "epoch": 1.43, + "learning_rate": 8.612477027121604e-05, + "loss": 0.0074, + "step": 550060 + }, + { + "epoch": 1.43, + "learning_rate": 8.612088205484458e-05, + "loss": 0.0066, + "step": 550070 + }, + { + "epoch": 1.43, + "learning_rate": 8.61169938384731e-05, + "loss": 0.0104, + "step": 550080 + }, + { + "epoch": 1.43, + "learning_rate": 8.611310562210165e-05, + "loss": 0.0104, + "step": 550090 + }, + { + "epoch": 1.43, + "learning_rate": 8.610921740573018e-05, + "loss": 0.0126, + "step": 550100 + }, + { + "epoch": 1.43, + "learning_rate": 8.610532918935872e-05, + "loss": 0.0092, + "step": 550110 + }, + { + "epoch": 1.43, + "learning_rate": 8.610144097298725e-05, + "loss": 0.0122, + "step": 550120 + }, + { + "epoch": 1.43, + "learning_rate": 8.60975527566158e-05, + "loss": 0.01, + "step": 550130 + }, + { + "epoch": 1.43, + "learning_rate": 8.609366454024433e-05, + "loss": 0.0125, + "step": 550140 + }, + { + "epoch": 1.43, + "learning_rate": 8.608977632387287e-05, + "loss": 0.0071, + "step": 550150 + }, + { + "epoch": 1.43, + "learning_rate": 8.60858881075014e-05, + "loss": 0.0104, + "step": 550160 + }, + { + "epoch": 1.43, + "learning_rate": 8.608199989112994e-05, + "loss": 0.0079, + "step": 550170 + }, + { + "epoch": 1.43, + "learning_rate": 8.607811167475847e-05, + "loss": 0.0089, + "step": 550180 + }, + { + "epoch": 1.43, + "learning_rate": 8.607422345838701e-05, + "loss": 0.0082, + "step": 550190 + }, + { + "epoch": 1.43, + "learning_rate": 8.607033524201554e-05, + "loss": 0.0075, + "step": 550200 + }, + { + "epoch": 1.43, + "learning_rate": 8.606644702564408e-05, + "loss": 0.0083, + "step": 550210 + }, + { + "epoch": 1.43, + "learning_rate": 8.606255880927261e-05, + "loss": 0.0084, + "step": 550220 + }, + { + "epoch": 1.43, + "learning_rate": 8.605867059290115e-05, + "loss": 0.0073, + "step": 550230 + }, + { + "epoch": 1.43, + "learning_rate": 8.605478237652968e-05, + "loss": 0.0103, + "step": 550240 + }, + { + "epoch": 1.43, + "learning_rate": 8.605089416015822e-05, + "loss": 0.0108, + "step": 550250 + }, + { + "epoch": 1.43, + "learning_rate": 8.604700594378675e-05, + "loss": 0.0094, + "step": 550260 + }, + { + "epoch": 1.43, + "learning_rate": 8.604311772741529e-05, + "loss": 0.0099, + "step": 550270 + }, + { + "epoch": 1.43, + "learning_rate": 8.603922951104382e-05, + "loss": 0.007, + "step": 550280 + }, + { + "epoch": 1.43, + "learning_rate": 8.603534129467237e-05, + "loss": 0.0087, + "step": 550290 + }, + { + "epoch": 1.43, + "learning_rate": 8.603145307830089e-05, + "loss": 0.0073, + "step": 550300 + }, + { + "epoch": 1.43, + "learning_rate": 8.602756486192942e-05, + "loss": 0.0073, + "step": 550310 + }, + { + "epoch": 1.43, + "learning_rate": 8.602367664555797e-05, + "loss": 0.0101, + "step": 550320 + }, + { + "epoch": 1.43, + "learning_rate": 8.60197884291865e-05, + "loss": 0.0083, + "step": 550330 + }, + { + "epoch": 1.43, + "learning_rate": 8.601590021281504e-05, + "loss": 0.0076, + "step": 550340 + }, + { + "epoch": 1.43, + "learning_rate": 8.601201199644357e-05, + "loss": 0.011, + "step": 550350 + }, + { + "epoch": 1.43, + "learning_rate": 8.600812378007211e-05, + "loss": 0.0082, + "step": 550360 + }, + { + "epoch": 1.43, + "learning_rate": 8.600423556370064e-05, + "loss": 0.0117, + "step": 550370 + }, + { + "epoch": 1.43, + "learning_rate": 8.600034734732918e-05, + "loss": 0.0103, + "step": 550380 + }, + { + "epoch": 1.43, + "learning_rate": 8.599645913095771e-05, + "loss": 0.0079, + "step": 550390 + }, + { + "epoch": 1.43, + "learning_rate": 8.599257091458625e-05, + "loss": 0.0072, + "step": 550400 + }, + { + "epoch": 1.43, + "learning_rate": 8.598868269821478e-05, + "loss": 0.0097, + "step": 550410 + }, + { + "epoch": 1.43, + "learning_rate": 8.598479448184332e-05, + "loss": 0.006, + "step": 550420 + }, + { + "epoch": 1.43, + "learning_rate": 8.598090626547185e-05, + "loss": 0.0073, + "step": 550430 + }, + { + "epoch": 1.43, + "learning_rate": 8.597701804910039e-05, + "loss": 0.0084, + "step": 550440 + }, + { + "epoch": 1.43, + "learning_rate": 8.597312983272892e-05, + "loss": 0.0093, + "step": 550450 + }, + { + "epoch": 1.43, + "learning_rate": 8.596924161635746e-05, + "loss": 0.0092, + "step": 550460 + }, + { + "epoch": 1.43, + "learning_rate": 8.596535339998599e-05, + "loss": 0.0116, + "step": 550470 + }, + { + "epoch": 1.43, + "learning_rate": 8.596146518361454e-05, + "loss": 0.0112, + "step": 550480 + }, + { + "epoch": 1.43, + "learning_rate": 8.595757696724307e-05, + "loss": 0.0084, + "step": 550490 + }, + { + "epoch": 1.43, + "learning_rate": 8.595368875087161e-05, + "loss": 0.0118, + "step": 550500 + }, + { + "epoch": 1.43, + "learning_rate": 8.594980053450014e-05, + "loss": 0.0093, + "step": 550510 + }, + { + "epoch": 1.43, + "learning_rate": 8.594591231812868e-05, + "loss": 0.0094, + "step": 550520 + }, + { + "epoch": 1.43, + "learning_rate": 8.594202410175721e-05, + "loss": 0.0123, + "step": 550530 + }, + { + "epoch": 1.43, + "learning_rate": 8.593813588538575e-05, + "loss": 0.0058, + "step": 550540 + }, + { + "epoch": 1.43, + "learning_rate": 8.593424766901428e-05, + "loss": 0.0087, + "step": 550550 + }, + { + "epoch": 1.43, + "learning_rate": 8.593035945264281e-05, + "loss": 0.0087, + "step": 550560 + }, + { + "epoch": 1.43, + "learning_rate": 8.592647123627135e-05, + "loss": 0.0088, + "step": 550570 + }, + { + "epoch": 1.43, + "learning_rate": 8.592258301989988e-05, + "loss": 0.0112, + "step": 550580 + }, + { + "epoch": 1.43, + "learning_rate": 8.591869480352842e-05, + "loss": 0.0118, + "step": 550590 + }, + { + "epoch": 1.43, + "learning_rate": 8.591480658715695e-05, + "loss": 0.0126, + "step": 550600 + }, + { + "epoch": 1.43, + "learning_rate": 8.591091837078549e-05, + "loss": 0.012, + "step": 550610 + }, + { + "epoch": 1.43, + "learning_rate": 8.590703015441402e-05, + "loss": 0.0113, + "step": 550620 + }, + { + "epoch": 1.43, + "learning_rate": 8.590314193804256e-05, + "loss": 0.01, + "step": 550630 + }, + { + "epoch": 1.43, + "learning_rate": 8.589925372167109e-05, + "loss": 0.0106, + "step": 550640 + }, + { + "epoch": 1.43, + "learning_rate": 8.589536550529964e-05, + "loss": 0.0055, + "step": 550650 + }, + { + "epoch": 1.43, + "learning_rate": 8.589147728892816e-05, + "loss": 0.0084, + "step": 550660 + }, + { + "epoch": 1.43, + "learning_rate": 8.588758907255671e-05, + "loss": 0.0084, + "step": 550670 + }, + { + "epoch": 1.43, + "learning_rate": 8.588370085618524e-05, + "loss": 0.0134, + "step": 550680 + }, + { + "epoch": 1.43, + "learning_rate": 8.587981263981378e-05, + "loss": 0.0107, + "step": 550690 + }, + { + "epoch": 1.43, + "learning_rate": 8.587592442344231e-05, + "loss": 0.0105, + "step": 550700 + }, + { + "epoch": 1.43, + "learning_rate": 8.587203620707085e-05, + "loss": 0.0089, + "step": 550710 + }, + { + "epoch": 1.43, + "learning_rate": 8.586814799069938e-05, + "loss": 0.007, + "step": 550720 + }, + { + "epoch": 1.43, + "learning_rate": 8.586425977432792e-05, + "loss": 0.0061, + "step": 550730 + }, + { + "epoch": 1.43, + "learning_rate": 8.586037155795645e-05, + "loss": 0.0105, + "step": 550740 + }, + { + "epoch": 1.43, + "learning_rate": 8.585648334158499e-05, + "loss": 0.0089, + "step": 550750 + }, + { + "epoch": 1.43, + "learning_rate": 8.585259512521352e-05, + "loss": 0.0076, + "step": 550760 + }, + { + "epoch": 1.43, + "learning_rate": 8.584870690884206e-05, + "loss": 0.01, + "step": 550770 + }, + { + "epoch": 1.43, + "learning_rate": 8.584481869247059e-05, + "loss": 0.0103, + "step": 550780 + }, + { + "epoch": 1.43, + "learning_rate": 8.584093047609913e-05, + "loss": 0.008, + "step": 550790 + }, + { + "epoch": 1.43, + "learning_rate": 8.583704225972766e-05, + "loss": 0.0085, + "step": 550800 + }, + { + "epoch": 1.43, + "learning_rate": 8.583315404335619e-05, + "loss": 0.0095, + "step": 550810 + }, + { + "epoch": 1.43, + "learning_rate": 8.582926582698473e-05, + "loss": 0.0122, + "step": 550820 + }, + { + "epoch": 1.43, + "learning_rate": 8.582537761061326e-05, + "loss": 0.0093, + "step": 550830 + }, + { + "epoch": 1.43, + "learning_rate": 8.582148939424181e-05, + "loss": 0.0105, + "step": 550840 + }, + { + "epoch": 1.43, + "learning_rate": 8.581760117787034e-05, + "loss": 0.0056, + "step": 550850 + }, + { + "epoch": 1.43, + "learning_rate": 8.581371296149888e-05, + "loss": 0.0076, + "step": 550860 + }, + { + "epoch": 1.43, + "learning_rate": 8.580982474512741e-05, + "loss": 0.0085, + "step": 550870 + }, + { + "epoch": 1.43, + "learning_rate": 8.580593652875595e-05, + "loss": 0.013, + "step": 550880 + }, + { + "epoch": 1.43, + "learning_rate": 8.580204831238448e-05, + "loss": 0.0103, + "step": 550890 + }, + { + "epoch": 1.43, + "learning_rate": 8.579816009601302e-05, + "loss": 0.0073, + "step": 550900 + }, + { + "epoch": 1.43, + "learning_rate": 8.579427187964155e-05, + "loss": 0.0085, + "step": 550910 + }, + { + "epoch": 1.43, + "learning_rate": 8.579038366327009e-05, + "loss": 0.0095, + "step": 550920 + }, + { + "epoch": 1.43, + "learning_rate": 8.578649544689862e-05, + "loss": 0.0129, + "step": 550930 + }, + { + "epoch": 1.43, + "learning_rate": 8.578260723052716e-05, + "loss": 0.0097, + "step": 550940 + }, + { + "epoch": 1.43, + "learning_rate": 8.577871901415569e-05, + "loss": 0.0073, + "step": 550950 + }, + { + "epoch": 1.43, + "learning_rate": 8.577483079778423e-05, + "loss": 0.0117, + "step": 550960 + }, + { + "epoch": 1.43, + "learning_rate": 8.577094258141276e-05, + "loss": 0.0109, + "step": 550970 + }, + { + "epoch": 1.43, + "learning_rate": 8.57670543650413e-05, + "loss": 0.0121, + "step": 550980 + }, + { + "epoch": 1.43, + "learning_rate": 8.576316614866983e-05, + "loss": 0.0117, + "step": 550990 + }, + { + "epoch": 1.43, + "learning_rate": 8.575927793229838e-05, + "loss": 0.0086, + "step": 551000 + }, + { + "epoch": 1.43, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.006159137934446335, + "eval_runtime": 107.439, + "eval_samples_per_second": 18.615, + "eval_steps_per_second": 4.654, + "step": 551000 + }, + { + "epoch": 1.43, + "learning_rate": 8.575538971592691e-05, + "loss": 0.0098, + "step": 551010 + }, + { + "epoch": 1.43, + "learning_rate": 8.575150149955545e-05, + "loss": 0.0115, + "step": 551020 + }, + { + "epoch": 1.43, + "learning_rate": 8.574761328318398e-05, + "loss": 0.0077, + "step": 551030 + }, + { + "epoch": 1.43, + "learning_rate": 8.574372506681252e-05, + "loss": 0.0074, + "step": 551040 + }, + { + "epoch": 1.43, + "learning_rate": 8.573983685044105e-05, + "loss": 0.0077, + "step": 551050 + }, + { + "epoch": 1.43, + "learning_rate": 8.573594863406958e-05, + "loss": 0.0096, + "step": 551060 + }, + { + "epoch": 1.43, + "learning_rate": 8.573206041769812e-05, + "loss": 0.0116, + "step": 551070 + }, + { + "epoch": 1.43, + "learning_rate": 8.572817220132665e-05, + "loss": 0.0065, + "step": 551080 + }, + { + "epoch": 1.43, + "learning_rate": 8.572428398495519e-05, + "loss": 0.0093, + "step": 551090 + }, + { + "epoch": 1.43, + "learning_rate": 8.572039576858372e-05, + "loss": 0.0123, + "step": 551100 + }, + { + "epoch": 1.43, + "learning_rate": 8.571650755221226e-05, + "loss": 0.0085, + "step": 551110 + }, + { + "epoch": 1.43, + "learning_rate": 8.571261933584079e-05, + "loss": 0.008, + "step": 551120 + }, + { + "epoch": 1.43, + "learning_rate": 8.570873111946933e-05, + "loss": 0.0094, + "step": 551130 + }, + { + "epoch": 1.43, + "learning_rate": 8.570484290309786e-05, + "loss": 0.009, + "step": 551140 + }, + { + "epoch": 1.43, + "learning_rate": 8.57009546867264e-05, + "loss": 0.0069, + "step": 551150 + }, + { + "epoch": 1.43, + "learning_rate": 8.569706647035493e-05, + "loss": 0.0088, + "step": 551160 + }, + { + "epoch": 1.43, + "learning_rate": 8.569317825398348e-05, + "loss": 0.0082, + "step": 551170 + }, + { + "epoch": 1.43, + "learning_rate": 8.5689290037612e-05, + "loss": 0.0089, + "step": 551180 + }, + { + "epoch": 1.43, + "learning_rate": 8.568540182124055e-05, + "loss": 0.0118, + "step": 551190 + }, + { + "epoch": 1.43, + "learning_rate": 8.568151360486908e-05, + "loss": 0.0077, + "step": 551200 + }, + { + "epoch": 1.43, + "learning_rate": 8.567762538849762e-05, + "loss": 0.0094, + "step": 551210 + }, + { + "epoch": 1.43, + "learning_rate": 8.567373717212615e-05, + "loss": 0.0096, + "step": 551220 + }, + { + "epoch": 1.43, + "learning_rate": 8.566984895575469e-05, + "loss": 0.0132, + "step": 551230 + }, + { + "epoch": 1.43, + "learning_rate": 8.566596073938322e-05, + "loss": 0.0083, + "step": 551240 + }, + { + "epoch": 1.43, + "learning_rate": 8.566207252301176e-05, + "loss": 0.0113, + "step": 551250 + }, + { + "epoch": 1.43, + "learning_rate": 8.565818430664029e-05, + "loss": 0.0099, + "step": 551260 + }, + { + "epoch": 1.43, + "learning_rate": 8.565429609026883e-05, + "loss": 0.0111, + "step": 551270 + }, + { + "epoch": 1.43, + "learning_rate": 8.565040787389736e-05, + "loss": 0.0107, + "step": 551280 + }, + { + "epoch": 1.43, + "learning_rate": 8.56465196575259e-05, + "loss": 0.011, + "step": 551290 + }, + { + "epoch": 1.43, + "learning_rate": 8.564263144115443e-05, + "loss": 0.0091, + "step": 551300 + }, + { + "epoch": 1.43, + "learning_rate": 8.563874322478296e-05, + "loss": 0.0091, + "step": 551310 + }, + { + "epoch": 1.43, + "learning_rate": 8.56348550084115e-05, + "loss": 0.0114, + "step": 551320 + }, + { + "epoch": 1.43, + "learning_rate": 8.563096679204003e-05, + "loss": 0.0093, + "step": 551330 + }, + { + "epoch": 1.43, + "learning_rate": 8.562707857566857e-05, + "loss": 0.0113, + "step": 551340 + }, + { + "epoch": 1.43, + "learning_rate": 8.56231903592971e-05, + "loss": 0.0089, + "step": 551350 + }, + { + "epoch": 1.43, + "learning_rate": 8.561930214292565e-05, + "loss": 0.0104, + "step": 551360 + }, + { + "epoch": 1.43, + "learning_rate": 8.561541392655418e-05, + "loss": 0.01, + "step": 551370 + }, + { + "epoch": 1.43, + "learning_rate": 8.561152571018272e-05, + "loss": 0.0102, + "step": 551380 + }, + { + "epoch": 1.43, + "learning_rate": 8.560763749381125e-05, + "loss": 0.0133, + "step": 551390 + }, + { + "epoch": 1.43, + "learning_rate": 8.560374927743979e-05, + "loss": 0.0073, + "step": 551400 + }, + { + "epoch": 1.43, + "learning_rate": 8.559986106106832e-05, + "loss": 0.0101, + "step": 551410 + }, + { + "epoch": 1.43, + "learning_rate": 8.559597284469686e-05, + "loss": 0.0102, + "step": 551420 + }, + { + "epoch": 1.43, + "learning_rate": 8.559208462832539e-05, + "loss": 0.0098, + "step": 551430 + }, + { + "epoch": 1.43, + "learning_rate": 8.558819641195393e-05, + "loss": 0.0095, + "step": 551440 + }, + { + "epoch": 1.43, + "learning_rate": 8.558430819558246e-05, + "loss": 0.0076, + "step": 551450 + }, + { + "epoch": 1.43, + "learning_rate": 8.5580419979211e-05, + "loss": 0.0118, + "step": 551460 + }, + { + "epoch": 1.43, + "learning_rate": 8.557653176283953e-05, + "loss": 0.012, + "step": 551470 + }, + { + "epoch": 1.43, + "learning_rate": 8.557264354646807e-05, + "loss": 0.0097, + "step": 551480 + }, + { + "epoch": 1.43, + "learning_rate": 8.55687553300966e-05, + "loss": 0.0108, + "step": 551490 + }, + { + "epoch": 1.43, + "learning_rate": 8.556486711372514e-05, + "loss": 0.0082, + "step": 551500 + }, + { + "epoch": 1.43, + "learning_rate": 8.556097889735367e-05, + "loss": 0.011, + "step": 551510 + }, + { + "epoch": 1.43, + "learning_rate": 8.555709068098222e-05, + "loss": 0.0082, + "step": 551520 + }, + { + "epoch": 1.43, + "learning_rate": 8.555320246461074e-05, + "loss": 0.0105, + "step": 551530 + }, + { + "epoch": 1.43, + "learning_rate": 8.554931424823929e-05, + "loss": 0.0134, + "step": 551540 + }, + { + "epoch": 1.43, + "learning_rate": 8.554542603186782e-05, + "loss": 0.0073, + "step": 551550 + }, + { + "epoch": 1.43, + "learning_rate": 8.554153781549635e-05, + "loss": 0.0097, + "step": 551560 + }, + { + "epoch": 1.43, + "learning_rate": 8.553764959912489e-05, + "loss": 0.0087, + "step": 551570 + }, + { + "epoch": 1.43, + "learning_rate": 8.553376138275342e-05, + "loss": 0.0105, + "step": 551580 + }, + { + "epoch": 1.43, + "learning_rate": 8.552987316638196e-05, + "loss": 0.01, + "step": 551590 + }, + { + "epoch": 1.43, + "learning_rate": 8.552598495001049e-05, + "loss": 0.0086, + "step": 551600 + }, + { + "epoch": 1.43, + "learning_rate": 8.552209673363903e-05, + "loss": 0.0121, + "step": 551610 + }, + { + "epoch": 1.43, + "learning_rate": 8.551820851726756e-05, + "loss": 0.0089, + "step": 551620 + }, + { + "epoch": 1.43, + "learning_rate": 8.55143203008961e-05, + "loss": 0.0115, + "step": 551630 + }, + { + "epoch": 1.43, + "learning_rate": 8.551043208452463e-05, + "loss": 0.0092, + "step": 551640 + }, + { + "epoch": 1.43, + "learning_rate": 8.550654386815317e-05, + "loss": 0.0106, + "step": 551650 + }, + { + "epoch": 1.43, + "learning_rate": 8.55026556517817e-05, + "loss": 0.008, + "step": 551660 + }, + { + "epoch": 1.43, + "learning_rate": 8.549876743541024e-05, + "loss": 0.0084, + "step": 551670 + }, + { + "epoch": 1.43, + "learning_rate": 8.549487921903877e-05, + "loss": 0.0095, + "step": 551680 + }, + { + "epoch": 1.43, + "learning_rate": 8.549099100266731e-05, + "loss": 0.0096, + "step": 551690 + }, + { + "epoch": 1.43, + "learning_rate": 8.548710278629584e-05, + "loss": 0.0135, + "step": 551700 + }, + { + "epoch": 1.43, + "learning_rate": 8.548321456992439e-05, + "loss": 0.0066, + "step": 551710 + }, + { + "epoch": 1.43, + "learning_rate": 8.547932635355292e-05, + "loss": 0.0073, + "step": 551720 + }, + { + "epoch": 1.43, + "learning_rate": 8.547543813718146e-05, + "loss": 0.0078, + "step": 551730 + }, + { + "epoch": 1.43, + "learning_rate": 8.547154992080999e-05, + "loss": 0.0091, + "step": 551740 + }, + { + "epoch": 1.43, + "learning_rate": 8.546766170443853e-05, + "loss": 0.0143, + "step": 551750 + }, + { + "epoch": 1.43, + "learning_rate": 8.546377348806706e-05, + "loss": 0.0084, + "step": 551760 + }, + { + "epoch": 1.43, + "learning_rate": 8.54598852716956e-05, + "loss": 0.0093, + "step": 551770 + }, + { + "epoch": 1.43, + "learning_rate": 8.545599705532413e-05, + "loss": 0.0104, + "step": 551780 + }, + { + "epoch": 1.43, + "learning_rate": 8.545210883895266e-05, + "loss": 0.0096, + "step": 551790 + }, + { + "epoch": 1.43, + "learning_rate": 8.54482206225812e-05, + "loss": 0.0079, + "step": 551800 + }, + { + "epoch": 1.43, + "learning_rate": 8.544433240620973e-05, + "loss": 0.0104, + "step": 551810 + }, + { + "epoch": 1.43, + "learning_rate": 8.544044418983827e-05, + "loss": 0.0107, + "step": 551820 + }, + { + "epoch": 1.43, + "learning_rate": 8.54365559734668e-05, + "loss": 0.0087, + "step": 551830 + }, + { + "epoch": 1.43, + "learning_rate": 8.543266775709534e-05, + "loss": 0.0112, + "step": 551840 + }, + { + "epoch": 1.43, + "learning_rate": 8.542877954072387e-05, + "loss": 0.0118, + "step": 551850 + }, + { + "epoch": 1.43, + "learning_rate": 8.542489132435241e-05, + "loss": 0.0101, + "step": 551860 + }, + { + "epoch": 1.43, + "learning_rate": 8.542100310798093e-05, + "loss": 0.0114, + "step": 551870 + }, + { + "epoch": 1.43, + "learning_rate": 8.541711489160949e-05, + "loss": 0.0094, + "step": 551880 + }, + { + "epoch": 1.43, + "learning_rate": 8.5413226675238e-05, + "loss": 0.007, + "step": 551890 + }, + { + "epoch": 1.43, + "learning_rate": 8.540933845886656e-05, + "loss": 0.0085, + "step": 551900 + }, + { + "epoch": 1.43, + "learning_rate": 8.540545024249509e-05, + "loss": 0.01, + "step": 551910 + }, + { + "epoch": 1.43, + "learning_rate": 8.540156202612363e-05, + "loss": 0.0112, + "step": 551920 + }, + { + "epoch": 1.43, + "learning_rate": 8.539767380975216e-05, + "loss": 0.0116, + "step": 551930 + }, + { + "epoch": 1.43, + "learning_rate": 8.53937855933807e-05, + "loss": 0.008, + "step": 551940 + }, + { + "epoch": 1.43, + "learning_rate": 8.538989737700923e-05, + "loss": 0.0062, + "step": 551950 + }, + { + "epoch": 1.43, + "learning_rate": 8.538600916063777e-05, + "loss": 0.0082, + "step": 551960 + }, + { + "epoch": 1.43, + "learning_rate": 8.53821209442663e-05, + "loss": 0.0083, + "step": 551970 + }, + { + "epoch": 1.43, + "learning_rate": 8.537823272789484e-05, + "loss": 0.0083, + "step": 551980 + }, + { + "epoch": 1.43, + "learning_rate": 8.537434451152337e-05, + "loss": 0.0107, + "step": 551990 + }, + { + "epoch": 1.43, + "learning_rate": 8.537045629515191e-05, + "loss": 0.0107, + "step": 552000 + }, + { + "epoch": 1.43, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.006157498341053724, + "eval_runtime": 107.7718, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.639, + "step": 552000 + }, + { + "epoch": 1.43, + "learning_rate": 8.536656807878044e-05, + "loss": 0.0084, + "step": 552010 + }, + { + "epoch": 1.43, + "learning_rate": 8.536267986240898e-05, + "loss": 0.0105, + "step": 552020 + }, + { + "epoch": 1.43, + "learning_rate": 8.53587916460375e-05, + "loss": 0.0117, + "step": 552030 + }, + { + "epoch": 1.43, + "learning_rate": 8.535490342966603e-05, + "loss": 0.0115, + "step": 552040 + }, + { + "epoch": 1.43, + "learning_rate": 8.535101521329458e-05, + "loss": 0.0103, + "step": 552050 + }, + { + "epoch": 1.43, + "learning_rate": 8.53471269969231e-05, + "loss": 0.0089, + "step": 552060 + }, + { + "epoch": 1.43, + "learning_rate": 8.534323878055166e-05, + "loss": 0.0092, + "step": 552070 + }, + { + "epoch": 1.43, + "learning_rate": 8.533935056418019e-05, + "loss": 0.0088, + "step": 552080 + }, + { + "epoch": 1.43, + "learning_rate": 8.533546234780873e-05, + "loss": 0.0092, + "step": 552090 + }, + { + "epoch": 1.43, + "learning_rate": 8.533157413143726e-05, + "loss": 0.0091, + "step": 552100 + }, + { + "epoch": 1.43, + "learning_rate": 8.53276859150658e-05, + "loss": 0.0094, + "step": 552110 + }, + { + "epoch": 1.43, + "learning_rate": 8.532379769869433e-05, + "loss": 0.011, + "step": 552120 + }, + { + "epoch": 1.43, + "learning_rate": 8.531990948232287e-05, + "loss": 0.0109, + "step": 552130 + }, + { + "epoch": 1.43, + "learning_rate": 8.53160212659514e-05, + "loss": 0.0068, + "step": 552140 + }, + { + "epoch": 1.43, + "learning_rate": 8.531213304957994e-05, + "loss": 0.0161, + "step": 552150 + }, + { + "epoch": 1.43, + "learning_rate": 8.530824483320847e-05, + "loss": 0.0082, + "step": 552160 + }, + { + "epoch": 1.43, + "learning_rate": 8.530435661683701e-05, + "loss": 0.0102, + "step": 552170 + }, + { + "epoch": 1.43, + "learning_rate": 8.530046840046554e-05, + "loss": 0.0074, + "step": 552180 + }, + { + "epoch": 1.43, + "learning_rate": 8.529658018409408e-05, + "loss": 0.0088, + "step": 552190 + }, + { + "epoch": 1.43, + "learning_rate": 8.52926919677226e-05, + "loss": 0.0137, + "step": 552200 + }, + { + "epoch": 1.43, + "learning_rate": 8.528880375135115e-05, + "loss": 0.0107, + "step": 552210 + }, + { + "epoch": 1.43, + "learning_rate": 8.528491553497968e-05, + "loss": 0.0127, + "step": 552220 + }, + { + "epoch": 1.43, + "learning_rate": 8.528102731860823e-05, + "loss": 0.0092, + "step": 552230 + }, + { + "epoch": 1.43, + "learning_rate": 8.527713910223676e-05, + "loss": 0.0086, + "step": 552240 + }, + { + "epoch": 1.43, + "learning_rate": 8.52732508858653e-05, + "loss": 0.008, + "step": 552250 + }, + { + "epoch": 1.43, + "learning_rate": 8.526936266949383e-05, + "loss": 0.014, + "step": 552260 + }, + { + "epoch": 1.43, + "learning_rate": 8.526547445312237e-05, + "loss": 0.0088, + "step": 552270 + }, + { + "epoch": 1.43, + "learning_rate": 8.52615862367509e-05, + "loss": 0.0113, + "step": 552280 + }, + { + "epoch": 1.43, + "learning_rate": 8.525769802037943e-05, + "loss": 0.0079, + "step": 552290 + }, + { + "epoch": 1.43, + "learning_rate": 8.525380980400797e-05, + "loss": 0.0077, + "step": 552300 + }, + { + "epoch": 1.43, + "learning_rate": 8.52499215876365e-05, + "loss": 0.011, + "step": 552310 + }, + { + "epoch": 1.43, + "learning_rate": 8.524603337126504e-05, + "loss": 0.0127, + "step": 552320 + }, + { + "epoch": 1.43, + "learning_rate": 8.524214515489357e-05, + "loss": 0.0081, + "step": 552330 + }, + { + "epoch": 1.43, + "learning_rate": 8.523825693852211e-05, + "loss": 0.0118, + "step": 552340 + }, + { + "epoch": 1.43, + "learning_rate": 8.523436872215064e-05, + "loss": 0.0105, + "step": 552350 + }, + { + "epoch": 1.43, + "learning_rate": 8.523048050577918e-05, + "loss": 0.0139, + "step": 552360 + }, + { + "epoch": 1.43, + "learning_rate": 8.52265922894077e-05, + "loss": 0.0094, + "step": 552370 + }, + { + "epoch": 1.43, + "learning_rate": 8.522270407303625e-05, + "loss": 0.0091, + "step": 552380 + }, + { + "epoch": 1.43, + "learning_rate": 8.521881585666477e-05, + "loss": 0.0087, + "step": 552390 + }, + { + "epoch": 1.43, + "learning_rate": 8.521492764029333e-05, + "loss": 0.01, + "step": 552400 + }, + { + "epoch": 1.43, + "learning_rate": 8.521103942392184e-05, + "loss": 0.0089, + "step": 552410 + }, + { + "epoch": 1.43, + "learning_rate": 8.52071512075504e-05, + "loss": 0.0095, + "step": 552420 + }, + { + "epoch": 1.43, + "learning_rate": 8.520326299117893e-05, + "loss": 0.0085, + "step": 552430 + }, + { + "epoch": 1.43, + "learning_rate": 8.519937477480747e-05, + "loss": 0.0072, + "step": 552440 + }, + { + "epoch": 1.43, + "learning_rate": 8.5195486558436e-05, + "loss": 0.0071, + "step": 552450 + }, + { + "epoch": 1.43, + "learning_rate": 8.519159834206454e-05, + "loss": 0.0099, + "step": 552460 + }, + { + "epoch": 1.43, + "learning_rate": 8.518771012569307e-05, + "loss": 0.0091, + "step": 552470 + }, + { + "epoch": 1.43, + "learning_rate": 8.518382190932161e-05, + "loss": 0.0091, + "step": 552480 + }, + { + "epoch": 1.43, + "learning_rate": 8.517993369295014e-05, + "loss": 0.0112, + "step": 552490 + }, + { + "epoch": 1.43, + "learning_rate": 8.517604547657868e-05, + "loss": 0.008, + "step": 552500 + }, + { + "epoch": 1.43, + "learning_rate": 8.51721572602072e-05, + "loss": 0.0092, + "step": 552510 + }, + { + "epoch": 1.43, + "learning_rate": 8.516826904383575e-05, + "loss": 0.0075, + "step": 552520 + }, + { + "epoch": 1.43, + "learning_rate": 8.516438082746428e-05, + "loss": 0.0079, + "step": 552530 + }, + { + "epoch": 1.43, + "learning_rate": 8.51604926110928e-05, + "loss": 0.0104, + "step": 552540 + }, + { + "epoch": 1.43, + "learning_rate": 8.515660439472135e-05, + "loss": 0.0069, + "step": 552550 + }, + { + "epoch": 1.43, + "learning_rate": 8.515271617834987e-05, + "loss": 0.0069, + "step": 552560 + }, + { + "epoch": 1.43, + "learning_rate": 8.514882796197842e-05, + "loss": 0.0077, + "step": 552570 + }, + { + "epoch": 1.43, + "learning_rate": 8.514493974560694e-05, + "loss": 0.0099, + "step": 552580 + }, + { + "epoch": 1.43, + "learning_rate": 8.51410515292355e-05, + "loss": 0.0107, + "step": 552590 + }, + { + "epoch": 1.43, + "learning_rate": 8.513716331286403e-05, + "loss": 0.0077, + "step": 552600 + }, + { + "epoch": 1.43, + "learning_rate": 8.513327509649257e-05, + "loss": 0.0085, + "step": 552610 + }, + { + "epoch": 1.43, + "learning_rate": 8.51293868801211e-05, + "loss": 0.0097, + "step": 552620 + }, + { + "epoch": 1.43, + "learning_rate": 8.512549866374964e-05, + "loss": 0.0085, + "step": 552630 + }, + { + "epoch": 1.43, + "learning_rate": 8.512161044737817e-05, + "loss": 0.007, + "step": 552640 + }, + { + "epoch": 1.43, + "learning_rate": 8.511772223100671e-05, + "loss": 0.0083, + "step": 552650 + }, + { + "epoch": 1.43, + "learning_rate": 8.511383401463524e-05, + "loss": 0.0076, + "step": 552660 + }, + { + "epoch": 1.43, + "learning_rate": 8.510994579826378e-05, + "loss": 0.0087, + "step": 552670 + }, + { + "epoch": 1.43, + "learning_rate": 8.51060575818923e-05, + "loss": 0.0086, + "step": 552680 + }, + { + "epoch": 1.43, + "learning_rate": 8.510216936552085e-05, + "loss": 0.0099, + "step": 552690 + }, + { + "epoch": 1.43, + "learning_rate": 8.509828114914938e-05, + "loss": 0.0098, + "step": 552700 + }, + { + "epoch": 1.43, + "learning_rate": 8.509439293277792e-05, + "loss": 0.012, + "step": 552710 + }, + { + "epoch": 1.43, + "learning_rate": 8.509050471640645e-05, + "loss": 0.0128, + "step": 552720 + }, + { + "epoch": 1.43, + "learning_rate": 8.508661650003499e-05, + "loss": 0.0134, + "step": 552730 + }, + { + "epoch": 1.43, + "learning_rate": 8.508272828366352e-05, + "loss": 0.0088, + "step": 552740 + }, + { + "epoch": 1.43, + "learning_rate": 8.507884006729207e-05, + "loss": 0.0073, + "step": 552750 + }, + { + "epoch": 1.43, + "learning_rate": 8.50749518509206e-05, + "loss": 0.0116, + "step": 552760 + }, + { + "epoch": 1.43, + "learning_rate": 8.507106363454914e-05, + "loss": 0.0082, + "step": 552770 + }, + { + "epoch": 1.43, + "learning_rate": 8.506717541817767e-05, + "loss": 0.0089, + "step": 552780 + }, + { + "epoch": 1.43, + "learning_rate": 8.50632872018062e-05, + "loss": 0.0072, + "step": 552790 + }, + { + "epoch": 1.43, + "learning_rate": 8.505939898543474e-05, + "loss": 0.009, + "step": 552800 + }, + { + "epoch": 1.43, + "learning_rate": 8.505551076906327e-05, + "loss": 0.0109, + "step": 552810 + }, + { + "epoch": 1.43, + "learning_rate": 8.505162255269181e-05, + "loss": 0.0078, + "step": 552820 + }, + { + "epoch": 1.43, + "learning_rate": 8.504773433632034e-05, + "loss": 0.0077, + "step": 552830 + }, + { + "epoch": 1.43, + "learning_rate": 8.504384611994888e-05, + "loss": 0.0097, + "step": 552840 + }, + { + "epoch": 1.43, + "learning_rate": 8.50399579035774e-05, + "loss": 0.0114, + "step": 552850 + }, + { + "epoch": 1.43, + "learning_rate": 8.503606968720595e-05, + "loss": 0.0127, + "step": 552860 + }, + { + "epoch": 1.43, + "learning_rate": 8.503218147083448e-05, + "loss": 0.0114, + "step": 552870 + }, + { + "epoch": 1.43, + "learning_rate": 8.502829325446302e-05, + "loss": 0.0103, + "step": 552880 + }, + { + "epoch": 1.43, + "learning_rate": 8.502440503809154e-05, + "loss": 0.0145, + "step": 552890 + }, + { + "epoch": 1.43, + "learning_rate": 8.502051682172009e-05, + "loss": 0.0074, + "step": 552900 + }, + { + "epoch": 1.43, + "learning_rate": 8.501662860534861e-05, + "loss": 0.0068, + "step": 552910 + }, + { + "epoch": 1.43, + "learning_rate": 8.501274038897716e-05, + "loss": 0.0097, + "step": 552920 + }, + { + "epoch": 1.43, + "learning_rate": 8.500885217260568e-05, + "loss": 0.0064, + "step": 552930 + }, + { + "epoch": 1.43, + "learning_rate": 8.500496395623424e-05, + "loss": 0.0119, + "step": 552940 + }, + { + "epoch": 1.43, + "learning_rate": 8.500107573986277e-05, + "loss": 0.0086, + "step": 552950 + }, + { + "epoch": 1.43, + "learning_rate": 8.499718752349131e-05, + "loss": 0.0087, + "step": 552960 + }, + { + "epoch": 1.43, + "learning_rate": 8.499329930711984e-05, + "loss": 0.0083, + "step": 552970 + }, + { + "epoch": 1.43, + "learning_rate": 8.498941109074838e-05, + "loss": 0.0068, + "step": 552980 + }, + { + "epoch": 1.43, + "learning_rate": 8.498552287437691e-05, + "loss": 0.0104, + "step": 552990 + }, + { + "epoch": 1.43, + "learning_rate": 8.498163465800545e-05, + "loss": 0.0112, + "step": 553000 + }, + { + "epoch": 1.43, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.006217279937118292, + "eval_runtime": 107.8256, + "eval_samples_per_second": 18.548, + "eval_steps_per_second": 4.637, + "step": 553000 + }, + { + "epoch": 1.43, + "learning_rate": 8.497774644163398e-05, + "loss": 0.0072, + "step": 553010 + }, + { + "epoch": 1.43, + "learning_rate": 8.497385822526252e-05, + "loss": 0.0102, + "step": 553020 + }, + { + "epoch": 1.43, + "learning_rate": 8.496997000889105e-05, + "loss": 0.008, + "step": 553030 + }, + { + "epoch": 1.43, + "learning_rate": 8.496608179251957e-05, + "loss": 0.0135, + "step": 553040 + }, + { + "epoch": 1.43, + "learning_rate": 8.496219357614812e-05, + "loss": 0.0089, + "step": 553050 + }, + { + "epoch": 1.43, + "learning_rate": 8.495830535977664e-05, + "loss": 0.0102, + "step": 553060 + }, + { + "epoch": 1.43, + "learning_rate": 8.495441714340519e-05, + "loss": 0.0104, + "step": 553070 + }, + { + "epoch": 1.43, + "learning_rate": 8.495052892703371e-05, + "loss": 0.0102, + "step": 553080 + }, + { + "epoch": 1.43, + "learning_rate": 8.494664071066226e-05, + "loss": 0.0101, + "step": 553090 + }, + { + "epoch": 1.43, + "learning_rate": 8.494275249429078e-05, + "loss": 0.0108, + "step": 553100 + }, + { + "epoch": 1.43, + "learning_rate": 8.493886427791934e-05, + "loss": 0.0096, + "step": 553110 + }, + { + "epoch": 1.43, + "learning_rate": 8.493497606154785e-05, + "loss": 0.0088, + "step": 553120 + }, + { + "epoch": 1.43, + "learning_rate": 8.493108784517641e-05, + "loss": 0.0089, + "step": 553130 + }, + { + "epoch": 1.43, + "learning_rate": 8.492719962880494e-05, + "loss": 0.0075, + "step": 553140 + }, + { + "epoch": 1.43, + "learning_rate": 8.492331141243348e-05, + "loss": 0.0105, + "step": 553150 + }, + { + "epoch": 1.43, + "learning_rate": 8.4919423196062e-05, + "loss": 0.0084, + "step": 553160 + }, + { + "epoch": 1.43, + "learning_rate": 8.491553497969055e-05, + "loss": 0.0097, + "step": 553170 + }, + { + "epoch": 1.43, + "learning_rate": 8.491164676331908e-05, + "loss": 0.0108, + "step": 553180 + }, + { + "epoch": 1.43, + "learning_rate": 8.490775854694762e-05, + "loss": 0.0079, + "step": 553190 + }, + { + "epoch": 1.43, + "learning_rate": 8.490387033057615e-05, + "loss": 0.0092, + "step": 553200 + }, + { + "epoch": 1.43, + "learning_rate": 8.489998211420469e-05, + "loss": 0.0116, + "step": 553210 + }, + { + "epoch": 1.43, + "learning_rate": 8.489609389783322e-05, + "loss": 0.01, + "step": 553220 + }, + { + "epoch": 1.43, + "learning_rate": 8.489220568146176e-05, + "loss": 0.0093, + "step": 553230 + }, + { + "epoch": 1.43, + "learning_rate": 8.488831746509029e-05, + "loss": 0.0078, + "step": 553240 + }, + { + "epoch": 1.43, + "learning_rate": 8.488442924871883e-05, + "loss": 0.0085, + "step": 553250 + }, + { + "epoch": 1.43, + "learning_rate": 8.488054103234736e-05, + "loss": 0.0092, + "step": 553260 + }, + { + "epoch": 1.43, + "learning_rate": 8.487665281597591e-05, + "loss": 0.0097, + "step": 553270 + }, + { + "epoch": 1.43, + "learning_rate": 8.487276459960442e-05, + "loss": 0.0109, + "step": 553280 + }, + { + "epoch": 1.43, + "learning_rate": 8.486887638323295e-05, + "loss": 0.0125, + "step": 553290 + }, + { + "epoch": 1.43, + "learning_rate": 8.486498816686151e-05, + "loss": 0.0098, + "step": 553300 + }, + { + "epoch": 1.43, + "learning_rate": 8.486109995049004e-05, + "loss": 0.007, + "step": 553310 + }, + { + "epoch": 1.43, + "learning_rate": 8.485721173411858e-05, + "loss": 0.0086, + "step": 553320 + }, + { + "epoch": 1.43, + "learning_rate": 8.48533235177471e-05, + "loss": 0.0084, + "step": 553330 + }, + { + "epoch": 1.43, + "learning_rate": 8.484943530137565e-05, + "loss": 0.0099, + "step": 553340 + }, + { + "epoch": 1.43, + "learning_rate": 8.484554708500418e-05, + "loss": 0.0097, + "step": 553350 + }, + { + "epoch": 1.43, + "learning_rate": 8.484165886863272e-05, + "loss": 0.0079, + "step": 553360 + }, + { + "epoch": 1.43, + "learning_rate": 8.483777065226125e-05, + "loss": 0.0071, + "step": 553370 + }, + { + "epoch": 1.43, + "learning_rate": 8.483388243588979e-05, + "loss": 0.0095, + "step": 553380 + }, + { + "epoch": 1.43, + "learning_rate": 8.482999421951832e-05, + "loss": 0.0104, + "step": 553390 + }, + { + "epoch": 1.43, + "learning_rate": 8.482610600314686e-05, + "loss": 0.0103, + "step": 553400 + }, + { + "epoch": 1.43, + "learning_rate": 8.482221778677538e-05, + "loss": 0.0107, + "step": 553410 + }, + { + "epoch": 1.43, + "learning_rate": 8.481832957040393e-05, + "loss": 0.009, + "step": 553420 + }, + { + "epoch": 1.43, + "learning_rate": 8.481444135403245e-05, + "loss": 0.0108, + "step": 553430 + }, + { + "epoch": 1.43, + "learning_rate": 8.4810553137661e-05, + "loss": 0.0112, + "step": 553440 + }, + { + "epoch": 1.43, + "learning_rate": 8.480666492128952e-05, + "loss": 0.0101, + "step": 553450 + }, + { + "epoch": 1.43, + "learning_rate": 8.480277670491808e-05, + "loss": 0.0092, + "step": 553460 + }, + { + "epoch": 1.43, + "learning_rate": 8.479888848854661e-05, + "loss": 0.0114, + "step": 553470 + }, + { + "epoch": 1.43, + "learning_rate": 8.479500027217515e-05, + "loss": 0.0121, + "step": 553480 + }, + { + "epoch": 1.43, + "learning_rate": 8.479111205580368e-05, + "loss": 0.0097, + "step": 553490 + }, + { + "epoch": 1.43, + "learning_rate": 8.478722383943222e-05, + "loss": 0.0099, + "step": 553500 + }, + { + "epoch": 1.43, + "learning_rate": 8.478333562306075e-05, + "loss": 0.0102, + "step": 553510 + }, + { + "epoch": 1.43, + "learning_rate": 8.477944740668929e-05, + "loss": 0.0098, + "step": 553520 + }, + { + "epoch": 1.43, + "learning_rate": 8.477555919031782e-05, + "loss": 0.0091, + "step": 553530 + }, + { + "epoch": 1.43, + "learning_rate": 8.477167097394634e-05, + "loss": 0.0121, + "step": 553540 + }, + { + "epoch": 1.43, + "learning_rate": 8.476778275757489e-05, + "loss": 0.0102, + "step": 553550 + }, + { + "epoch": 1.43, + "learning_rate": 8.476389454120341e-05, + "loss": 0.0106, + "step": 553560 + }, + { + "epoch": 1.43, + "learning_rate": 8.476000632483196e-05, + "loss": 0.0115, + "step": 553570 + }, + { + "epoch": 1.43, + "learning_rate": 8.475611810846048e-05, + "loss": 0.0096, + "step": 553580 + }, + { + "epoch": 1.43, + "learning_rate": 8.475222989208903e-05, + "loss": 0.0148, + "step": 553590 + }, + { + "epoch": 1.44, + "learning_rate": 8.474834167571755e-05, + "loss": 0.0072, + "step": 553600 + }, + { + "epoch": 1.44, + "learning_rate": 8.47444534593461e-05, + "loss": 0.0096, + "step": 553610 + }, + { + "epoch": 1.44, + "learning_rate": 8.474056524297462e-05, + "loss": 0.0088, + "step": 553620 + }, + { + "epoch": 1.44, + "learning_rate": 8.473667702660318e-05, + "loss": 0.01, + "step": 553630 + }, + { + "epoch": 1.44, + "learning_rate": 8.47327888102317e-05, + "loss": 0.0087, + "step": 553640 + }, + { + "epoch": 1.44, + "learning_rate": 8.472890059386025e-05, + "loss": 0.0096, + "step": 553650 + }, + { + "epoch": 1.44, + "learning_rate": 8.472501237748878e-05, + "loss": 0.0083, + "step": 553660 + }, + { + "epoch": 1.44, + "learning_rate": 8.472112416111732e-05, + "loss": 0.0094, + "step": 553670 + }, + { + "epoch": 1.44, + "learning_rate": 8.471723594474585e-05, + "loss": 0.0085, + "step": 553680 + }, + { + "epoch": 1.44, + "learning_rate": 8.471334772837439e-05, + "loss": 0.0074, + "step": 553690 + }, + { + "epoch": 1.44, + "learning_rate": 8.470945951200292e-05, + "loss": 0.0126, + "step": 553700 + }, + { + "epoch": 1.44, + "learning_rate": 8.470557129563146e-05, + "loss": 0.0105, + "step": 553710 + }, + { + "epoch": 1.44, + "learning_rate": 8.470168307925999e-05, + "loss": 0.009, + "step": 553720 + }, + { + "epoch": 1.44, + "learning_rate": 8.469779486288853e-05, + "loss": 0.0111, + "step": 553730 + }, + { + "epoch": 1.44, + "learning_rate": 8.469390664651706e-05, + "loss": 0.0104, + "step": 553740 + }, + { + "epoch": 1.44, + "learning_rate": 8.46900184301456e-05, + "loss": 0.0107, + "step": 553750 + }, + { + "epoch": 1.44, + "learning_rate": 8.468613021377413e-05, + "loss": 0.0089, + "step": 553760 + }, + { + "epoch": 1.44, + "learning_rate": 8.468224199740267e-05, + "loss": 0.009, + "step": 553770 + }, + { + "epoch": 1.44, + "learning_rate": 8.46783537810312e-05, + "loss": 0.0103, + "step": 553780 + }, + { + "epoch": 1.44, + "learning_rate": 8.467446556465972e-05, + "loss": 0.0089, + "step": 553790 + }, + { + "epoch": 1.44, + "learning_rate": 8.467057734828826e-05, + "loss": 0.009, + "step": 553800 + }, + { + "epoch": 1.44, + "learning_rate": 8.466668913191679e-05, + "loss": 0.0089, + "step": 553810 + }, + { + "epoch": 1.44, + "learning_rate": 8.466280091554535e-05, + "loss": 0.0089, + "step": 553820 + }, + { + "epoch": 1.44, + "learning_rate": 8.465891269917388e-05, + "loss": 0.0117, + "step": 553830 + }, + { + "epoch": 1.44, + "learning_rate": 8.465502448280242e-05, + "loss": 0.0086, + "step": 553840 + }, + { + "epoch": 1.44, + "learning_rate": 8.465113626643095e-05, + "loss": 0.0087, + "step": 553850 + }, + { + "epoch": 1.44, + "learning_rate": 8.464724805005949e-05, + "loss": 0.0104, + "step": 553860 + }, + { + "epoch": 1.44, + "learning_rate": 8.464335983368802e-05, + "loss": 0.0138, + "step": 553870 + }, + { + "epoch": 1.44, + "learning_rate": 8.463947161731656e-05, + "loss": 0.0101, + "step": 553880 + }, + { + "epoch": 1.44, + "learning_rate": 8.463558340094509e-05, + "loss": 0.0096, + "step": 553890 + }, + { + "epoch": 1.44, + "learning_rate": 8.463169518457363e-05, + "loss": 0.0092, + "step": 553900 + }, + { + "epoch": 1.44, + "learning_rate": 8.462780696820216e-05, + "loss": 0.0113, + "step": 553910 + }, + { + "epoch": 1.44, + "learning_rate": 8.46239187518307e-05, + "loss": 0.0074, + "step": 553920 + }, + { + "epoch": 1.44, + "learning_rate": 8.462003053545922e-05, + "loss": 0.0103, + "step": 553930 + }, + { + "epoch": 1.44, + "learning_rate": 8.461614231908777e-05, + "loss": 0.0106, + "step": 553940 + }, + { + "epoch": 1.44, + "learning_rate": 8.46122541027163e-05, + "loss": 0.0083, + "step": 553950 + }, + { + "epoch": 1.44, + "learning_rate": 8.460836588634484e-05, + "loss": 0.0103, + "step": 553960 + }, + { + "epoch": 1.44, + "learning_rate": 8.460447766997336e-05, + "loss": 0.0074, + "step": 553970 + }, + { + "epoch": 1.44, + "learning_rate": 8.460058945360192e-05, + "loss": 0.0092, + "step": 553980 + }, + { + "epoch": 1.44, + "learning_rate": 8.459670123723045e-05, + "loss": 0.0113, + "step": 553990 + }, + { + "epoch": 1.44, + "learning_rate": 8.459281302085899e-05, + "loss": 0.008, + "step": 554000 + }, + { + "epoch": 1.44, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.006148200016468763, + "eval_runtime": 107.8579, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 554000 + }, + { + "epoch": 1.44, + "learning_rate": 8.458892480448752e-05, + "loss": 0.0101, + "step": 554010 + }, + { + "epoch": 1.44, + "learning_rate": 8.458503658811606e-05, + "loss": 0.0082, + "step": 554020 + }, + { + "epoch": 1.44, + "learning_rate": 8.458114837174459e-05, + "loss": 0.009, + "step": 554030 + }, + { + "epoch": 1.44, + "learning_rate": 8.457726015537312e-05, + "loss": 0.0089, + "step": 554040 + }, + { + "epoch": 1.44, + "learning_rate": 8.457337193900166e-05, + "loss": 0.0101, + "step": 554050 + }, + { + "epoch": 1.44, + "learning_rate": 8.456948372263018e-05, + "loss": 0.0108, + "step": 554060 + }, + { + "epoch": 1.44, + "learning_rate": 8.456559550625873e-05, + "loss": 0.0082, + "step": 554070 + }, + { + "epoch": 1.44, + "learning_rate": 8.456170728988725e-05, + "loss": 0.0076, + "step": 554080 + }, + { + "epoch": 1.44, + "learning_rate": 8.45578190735158e-05, + "loss": 0.0096, + "step": 554090 + }, + { + "epoch": 1.44, + "learning_rate": 8.455393085714432e-05, + "loss": 0.0115, + "step": 554100 + }, + { + "epoch": 1.44, + "learning_rate": 8.455004264077287e-05, + "loss": 0.0086, + "step": 554110 + }, + { + "epoch": 1.44, + "learning_rate": 8.45461544244014e-05, + "loss": 0.009, + "step": 554120 + }, + { + "epoch": 1.44, + "learning_rate": 8.454226620802994e-05, + "loss": 0.007, + "step": 554130 + }, + { + "epoch": 1.44, + "learning_rate": 8.453837799165846e-05, + "loss": 0.0082, + "step": 554140 + }, + { + "epoch": 1.44, + "learning_rate": 8.453448977528702e-05, + "loss": 0.0113, + "step": 554150 + }, + { + "epoch": 1.44, + "learning_rate": 8.453060155891553e-05, + "loss": 0.0081, + "step": 554160 + }, + { + "epoch": 1.44, + "learning_rate": 8.452671334254409e-05, + "loss": 0.0098, + "step": 554170 + }, + { + "epoch": 1.44, + "learning_rate": 8.452282512617262e-05, + "loss": 0.0081, + "step": 554180 + }, + { + "epoch": 1.44, + "learning_rate": 8.451893690980116e-05, + "loss": 0.0109, + "step": 554190 + }, + { + "epoch": 1.44, + "learning_rate": 8.451504869342969e-05, + "loss": 0.0084, + "step": 554200 + }, + { + "epoch": 1.44, + "learning_rate": 8.451116047705823e-05, + "loss": 0.0123, + "step": 554210 + }, + { + "epoch": 1.44, + "learning_rate": 8.450727226068676e-05, + "loss": 0.0092, + "step": 554220 + }, + { + "epoch": 1.44, + "learning_rate": 8.45033840443153e-05, + "loss": 0.0094, + "step": 554230 + }, + { + "epoch": 1.44, + "learning_rate": 8.449949582794383e-05, + "loss": 0.011, + "step": 554240 + }, + { + "epoch": 1.44, + "learning_rate": 8.449560761157237e-05, + "loss": 0.0086, + "step": 554250 + }, + { + "epoch": 1.44, + "learning_rate": 8.44917193952009e-05, + "loss": 0.0087, + "step": 554260 + }, + { + "epoch": 1.44, + "learning_rate": 8.448783117882944e-05, + "loss": 0.0094, + "step": 554270 + }, + { + "epoch": 1.44, + "learning_rate": 8.448394296245797e-05, + "loss": 0.0079, + "step": 554280 + }, + { + "epoch": 1.44, + "learning_rate": 8.44800547460865e-05, + "loss": 0.009, + "step": 554290 + }, + { + "epoch": 1.44, + "learning_rate": 8.447616652971503e-05, + "loss": 0.0109, + "step": 554300 + }, + { + "epoch": 1.44, + "learning_rate": 8.447227831334356e-05, + "loss": 0.01, + "step": 554310 + }, + { + "epoch": 1.44, + "learning_rate": 8.44683900969721e-05, + "loss": 0.0101, + "step": 554320 + }, + { + "epoch": 1.44, + "learning_rate": 8.446450188060063e-05, + "loss": 0.0095, + "step": 554330 + }, + { + "epoch": 1.44, + "learning_rate": 8.446061366422919e-05, + "loss": 0.0103, + "step": 554340 + }, + { + "epoch": 1.44, + "learning_rate": 8.445672544785772e-05, + "loss": 0.0084, + "step": 554350 + }, + { + "epoch": 1.44, + "learning_rate": 8.445283723148626e-05, + "loss": 0.0102, + "step": 554360 + }, + { + "epoch": 1.44, + "learning_rate": 8.444894901511479e-05, + "loss": 0.0097, + "step": 554370 + }, + { + "epoch": 1.44, + "learning_rate": 8.444506079874333e-05, + "loss": 0.0096, + "step": 554380 + }, + { + "epoch": 1.44, + "learning_rate": 8.444117258237186e-05, + "loss": 0.0125, + "step": 554390 + }, + { + "epoch": 1.44, + "learning_rate": 8.44372843660004e-05, + "loss": 0.0109, + "step": 554400 + }, + { + "epoch": 1.44, + "learning_rate": 8.443339614962893e-05, + "loss": 0.0104, + "step": 554410 + }, + { + "epoch": 1.44, + "learning_rate": 8.442950793325747e-05, + "loss": 0.009, + "step": 554420 + }, + { + "epoch": 1.44, + "learning_rate": 8.4425619716886e-05, + "loss": 0.0105, + "step": 554430 + }, + { + "epoch": 1.44, + "learning_rate": 8.442173150051454e-05, + "loss": 0.011, + "step": 554440 + }, + { + "epoch": 1.44, + "learning_rate": 8.441784328414306e-05, + "loss": 0.0111, + "step": 554450 + }, + { + "epoch": 1.44, + "learning_rate": 8.44139550677716e-05, + "loss": 0.0103, + "step": 554460 + }, + { + "epoch": 1.44, + "learning_rate": 8.441006685140013e-05, + "loss": 0.0111, + "step": 554470 + }, + { + "epoch": 1.44, + "learning_rate": 8.440617863502868e-05, + "loss": 0.0122, + "step": 554480 + }, + { + "epoch": 1.44, + "learning_rate": 8.44022904186572e-05, + "loss": 0.0091, + "step": 554490 + }, + { + "epoch": 1.44, + "learning_rate": 8.439840220228576e-05, + "loss": 0.0061, + "step": 554500 + }, + { + "epoch": 1.44, + "learning_rate": 8.439451398591427e-05, + "loss": 0.0129, + "step": 554510 + }, + { + "epoch": 1.44, + "learning_rate": 8.43906257695428e-05, + "loss": 0.0093, + "step": 554520 + }, + { + "epoch": 1.44, + "learning_rate": 8.438673755317136e-05, + "loss": 0.0074, + "step": 554530 + }, + { + "epoch": 1.44, + "learning_rate": 8.438284933679989e-05, + "loss": 0.0105, + "step": 554540 + }, + { + "epoch": 1.44, + "learning_rate": 8.437896112042843e-05, + "loss": 0.0089, + "step": 554550 + }, + { + "epoch": 1.44, + "learning_rate": 8.437507290405695e-05, + "loss": 0.0063, + "step": 554560 + }, + { + "epoch": 1.44, + "learning_rate": 8.43711846876855e-05, + "loss": 0.0091, + "step": 554570 + }, + { + "epoch": 1.44, + "learning_rate": 8.436729647131402e-05, + "loss": 0.0089, + "step": 554580 + }, + { + "epoch": 1.44, + "learning_rate": 8.436340825494257e-05, + "loss": 0.0076, + "step": 554590 + }, + { + "epoch": 1.44, + "learning_rate": 8.43595200385711e-05, + "loss": 0.01, + "step": 554600 + }, + { + "epoch": 1.44, + "learning_rate": 8.435563182219964e-05, + "loss": 0.0064, + "step": 554610 + }, + { + "epoch": 1.44, + "learning_rate": 8.435174360582816e-05, + "loss": 0.0103, + "step": 554620 + }, + { + "epoch": 1.44, + "learning_rate": 8.43478553894567e-05, + "loss": 0.0088, + "step": 554630 + }, + { + "epoch": 1.44, + "learning_rate": 8.434396717308523e-05, + "loss": 0.0097, + "step": 554640 + }, + { + "epoch": 1.44, + "learning_rate": 8.434007895671378e-05, + "loss": 0.0093, + "step": 554650 + }, + { + "epoch": 1.44, + "learning_rate": 8.43361907403423e-05, + "loss": 0.007, + "step": 554660 + }, + { + "epoch": 1.44, + "learning_rate": 8.433230252397085e-05, + "loss": 0.0083, + "step": 554670 + }, + { + "epoch": 1.44, + "learning_rate": 8.432841430759937e-05, + "loss": 0.0093, + "step": 554680 + }, + { + "epoch": 1.44, + "learning_rate": 8.432452609122793e-05, + "loss": 0.012, + "step": 554690 + }, + { + "epoch": 1.44, + "learning_rate": 8.432063787485646e-05, + "loss": 0.01, + "step": 554700 + }, + { + "epoch": 1.44, + "learning_rate": 8.4316749658485e-05, + "loss": 0.011, + "step": 554710 + }, + { + "epoch": 1.44, + "learning_rate": 8.431286144211353e-05, + "loss": 0.0109, + "step": 554720 + }, + { + "epoch": 1.44, + "learning_rate": 8.430897322574207e-05, + "loss": 0.009, + "step": 554730 + }, + { + "epoch": 1.44, + "learning_rate": 8.43050850093706e-05, + "loss": 0.0118, + "step": 554740 + }, + { + "epoch": 1.44, + "learning_rate": 8.430119679299914e-05, + "loss": 0.0063, + "step": 554750 + }, + { + "epoch": 1.44, + "learning_rate": 8.429730857662767e-05, + "loss": 0.0122, + "step": 554760 + }, + { + "epoch": 1.44, + "learning_rate": 8.42934203602562e-05, + "loss": 0.0116, + "step": 554770 + }, + { + "epoch": 1.44, + "learning_rate": 8.428953214388474e-05, + "loss": 0.0104, + "step": 554780 + }, + { + "epoch": 1.44, + "learning_rate": 8.428564392751326e-05, + "loss": 0.0091, + "step": 554790 + }, + { + "epoch": 1.44, + "learning_rate": 8.42817557111418e-05, + "loss": 0.0117, + "step": 554800 + }, + { + "epoch": 1.44, + "learning_rate": 8.427786749477033e-05, + "loss": 0.0087, + "step": 554810 + }, + { + "epoch": 1.44, + "learning_rate": 8.427397927839887e-05, + "loss": 0.0077, + "step": 554820 + }, + { + "epoch": 1.44, + "learning_rate": 8.42700910620274e-05, + "loss": 0.0111, + "step": 554830 + }, + { + "epoch": 1.44, + "learning_rate": 8.426620284565594e-05, + "loss": 0.0117, + "step": 554840 + }, + { + "epoch": 1.44, + "learning_rate": 8.426231462928447e-05, + "loss": 0.0087, + "step": 554850 + }, + { + "epoch": 1.44, + "learning_rate": 8.425842641291303e-05, + "loss": 0.0081, + "step": 554860 + }, + { + "epoch": 1.44, + "learning_rate": 8.425453819654154e-05, + "loss": 0.0069, + "step": 554870 + }, + { + "epoch": 1.44, + "learning_rate": 8.42506499801701e-05, + "loss": 0.01, + "step": 554880 + }, + { + "epoch": 1.44, + "learning_rate": 8.424676176379863e-05, + "loss": 0.009, + "step": 554890 + }, + { + "epoch": 1.44, + "learning_rate": 8.424287354742717e-05, + "loss": 0.0087, + "step": 554900 + }, + { + "epoch": 1.44, + "learning_rate": 8.42389853310557e-05, + "loss": 0.0118, + "step": 554910 + }, + { + "epoch": 1.44, + "learning_rate": 8.423509711468424e-05, + "loss": 0.012, + "step": 554920 + }, + { + "epoch": 1.44, + "learning_rate": 8.423120889831277e-05, + "loss": 0.0122, + "step": 554930 + }, + { + "epoch": 1.44, + "learning_rate": 8.42273206819413e-05, + "loss": 0.0089, + "step": 554940 + }, + { + "epoch": 1.44, + "learning_rate": 8.422343246556983e-05, + "loss": 0.0081, + "step": 554950 + }, + { + "epoch": 1.44, + "learning_rate": 8.421954424919838e-05, + "loss": 0.0078, + "step": 554960 + }, + { + "epoch": 1.44, + "learning_rate": 8.42156560328269e-05, + "loss": 0.0088, + "step": 554970 + }, + { + "epoch": 1.44, + "learning_rate": 8.421176781645545e-05, + "loss": 0.0098, + "step": 554980 + }, + { + "epoch": 1.44, + "learning_rate": 8.420787960008397e-05, + "loss": 0.0105, + "step": 554990 + }, + { + "epoch": 1.44, + "learning_rate": 8.420399138371252e-05, + "loss": 0.0111, + "step": 555000 + }, + { + "epoch": 1.44, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.006103316321969032, + "eval_runtime": 107.9114, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.633, + "step": 555000 + }, + { + "epoch": 1.44, + "learning_rate": 8.420010316734104e-05, + "loss": 0.0099, + "step": 555010 + }, + { + "epoch": 1.44, + "learning_rate": 8.419621495096957e-05, + "loss": 0.0141, + "step": 555020 + }, + { + "epoch": 1.44, + "learning_rate": 8.419232673459811e-05, + "loss": 0.0099, + "step": 555030 + }, + { + "epoch": 1.44, + "learning_rate": 8.418843851822664e-05, + "loss": 0.011, + "step": 555040 + }, + { + "epoch": 1.44, + "learning_rate": 8.41845503018552e-05, + "loss": 0.0092, + "step": 555050 + }, + { + "epoch": 1.44, + "learning_rate": 8.418066208548373e-05, + "loss": 0.0115, + "step": 555060 + }, + { + "epoch": 1.44, + "learning_rate": 8.417677386911227e-05, + "loss": 0.0072, + "step": 555070 + }, + { + "epoch": 1.44, + "learning_rate": 8.41728856527408e-05, + "loss": 0.0097, + "step": 555080 + }, + { + "epoch": 1.44, + "learning_rate": 8.416899743636934e-05, + "loss": 0.0147, + "step": 555090 + }, + { + "epoch": 1.44, + "learning_rate": 8.416510921999786e-05, + "loss": 0.0098, + "step": 555100 + }, + { + "epoch": 1.44, + "learning_rate": 8.41612210036264e-05, + "loss": 0.0087, + "step": 555110 + }, + { + "epoch": 1.44, + "learning_rate": 8.415733278725493e-05, + "loss": 0.0123, + "step": 555120 + }, + { + "epoch": 1.44, + "learning_rate": 8.415344457088348e-05, + "loss": 0.0105, + "step": 555130 + }, + { + "epoch": 1.44, + "learning_rate": 8.4149556354512e-05, + "loss": 0.0105, + "step": 555140 + }, + { + "epoch": 1.44, + "learning_rate": 8.414566813814055e-05, + "loss": 0.0064, + "step": 555150 + }, + { + "epoch": 1.44, + "learning_rate": 8.414177992176907e-05, + "loss": 0.0102, + "step": 555160 + }, + { + "epoch": 1.44, + "learning_rate": 8.413789170539762e-05, + "loss": 0.0081, + "step": 555170 + }, + { + "epoch": 1.44, + "learning_rate": 8.413400348902614e-05, + "loss": 0.0089, + "step": 555180 + }, + { + "epoch": 1.44, + "learning_rate": 8.413011527265469e-05, + "loss": 0.0073, + "step": 555190 + }, + { + "epoch": 1.44, + "learning_rate": 8.412622705628321e-05, + "loss": 0.0066, + "step": 555200 + }, + { + "epoch": 1.44, + "learning_rate": 8.412233883991177e-05, + "loss": 0.0083, + "step": 555210 + }, + { + "epoch": 1.44, + "learning_rate": 8.41184506235403e-05, + "loss": 0.0089, + "step": 555220 + }, + { + "epoch": 1.44, + "learning_rate": 8.411456240716884e-05, + "loss": 0.0106, + "step": 555230 + }, + { + "epoch": 1.44, + "learning_rate": 8.411067419079737e-05, + "loss": 0.0096, + "step": 555240 + }, + { + "epoch": 1.44, + "learning_rate": 8.410678597442591e-05, + "loss": 0.0117, + "step": 555250 + }, + { + "epoch": 1.44, + "learning_rate": 8.410289775805444e-05, + "loss": 0.0155, + "step": 555260 + }, + { + "epoch": 1.44, + "learning_rate": 8.409900954168296e-05, + "loss": 0.0076, + "step": 555270 + }, + { + "epoch": 1.44, + "learning_rate": 8.40951213253115e-05, + "loss": 0.0089, + "step": 555280 + }, + { + "epoch": 1.44, + "learning_rate": 8.409123310894003e-05, + "loss": 0.0072, + "step": 555290 + }, + { + "epoch": 1.44, + "learning_rate": 8.408734489256858e-05, + "loss": 0.0129, + "step": 555300 + }, + { + "epoch": 1.44, + "learning_rate": 8.40834566761971e-05, + "loss": 0.0083, + "step": 555310 + }, + { + "epoch": 1.44, + "learning_rate": 8.407956845982565e-05, + "loss": 0.0095, + "step": 555320 + }, + { + "epoch": 1.44, + "learning_rate": 8.407568024345417e-05, + "loss": 0.0082, + "step": 555330 + }, + { + "epoch": 1.44, + "learning_rate": 8.407179202708271e-05, + "loss": 0.0083, + "step": 555340 + }, + { + "epoch": 1.44, + "learning_rate": 8.406790381071124e-05, + "loss": 0.0091, + "step": 555350 + }, + { + "epoch": 1.44, + "learning_rate": 8.406401559433978e-05, + "loss": 0.0088, + "step": 555360 + }, + { + "epoch": 1.44, + "learning_rate": 8.406012737796831e-05, + "loss": 0.0086, + "step": 555370 + }, + { + "epoch": 1.44, + "learning_rate": 8.405623916159687e-05, + "loss": 0.0105, + "step": 555380 + }, + { + "epoch": 1.44, + "learning_rate": 8.405235094522538e-05, + "loss": 0.012, + "step": 555390 + }, + { + "epoch": 1.44, + "learning_rate": 8.404846272885394e-05, + "loss": 0.0166, + "step": 555400 + }, + { + "epoch": 1.44, + "learning_rate": 8.404457451248247e-05, + "loss": 0.0108, + "step": 555410 + }, + { + "epoch": 1.44, + "learning_rate": 8.404068629611101e-05, + "loss": 0.0075, + "step": 555420 + }, + { + "epoch": 1.44, + "learning_rate": 8.403679807973954e-05, + "loss": 0.0113, + "step": 555430 + }, + { + "epoch": 1.44, + "learning_rate": 8.403290986336808e-05, + "loss": 0.0094, + "step": 555440 + }, + { + "epoch": 1.44, + "learning_rate": 8.40290216469966e-05, + "loss": 0.0097, + "step": 555450 + }, + { + "epoch": 1.44, + "learning_rate": 8.402513343062515e-05, + "loss": 0.0091, + "step": 555460 + }, + { + "epoch": 1.44, + "learning_rate": 8.402124521425367e-05, + "loss": 0.0143, + "step": 555470 + }, + { + "epoch": 1.44, + "learning_rate": 8.401735699788222e-05, + "loss": 0.0082, + "step": 555480 + }, + { + "epoch": 1.44, + "learning_rate": 8.401346878151074e-05, + "loss": 0.0075, + "step": 555490 + }, + { + "epoch": 1.44, + "learning_rate": 8.400958056513929e-05, + "loss": 0.0086, + "step": 555500 + }, + { + "epoch": 1.44, + "learning_rate": 8.400569234876781e-05, + "loss": 0.0095, + "step": 555510 + }, + { + "epoch": 1.44, + "learning_rate": 8.400180413239634e-05, + "loss": 0.0074, + "step": 555520 + }, + { + "epoch": 1.44, + "learning_rate": 8.399791591602488e-05, + "loss": 0.0109, + "step": 555530 + }, + { + "epoch": 1.44, + "learning_rate": 8.399402769965341e-05, + "loss": 0.0109, + "step": 555540 + }, + { + "epoch": 1.44, + "learning_rate": 8.399013948328195e-05, + "loss": 0.0107, + "step": 555550 + }, + { + "epoch": 1.44, + "learning_rate": 8.398625126691048e-05, + "loss": 0.0125, + "step": 555560 + }, + { + "epoch": 1.44, + "learning_rate": 8.398236305053904e-05, + "loss": 0.0089, + "step": 555570 + }, + { + "epoch": 1.44, + "learning_rate": 8.397847483416756e-05, + "loss": 0.0114, + "step": 555580 + }, + { + "epoch": 1.44, + "learning_rate": 8.39745866177961e-05, + "loss": 0.011, + "step": 555590 + }, + { + "epoch": 1.44, + "learning_rate": 8.397069840142463e-05, + "loss": 0.0101, + "step": 555600 + }, + { + "epoch": 1.44, + "learning_rate": 8.396681018505318e-05, + "loss": 0.0087, + "step": 555610 + }, + { + "epoch": 1.44, + "learning_rate": 8.39629219686817e-05, + "loss": 0.0086, + "step": 555620 + }, + { + "epoch": 1.44, + "learning_rate": 8.395903375231025e-05, + "loss": 0.0099, + "step": 555630 + }, + { + "epoch": 1.44, + "learning_rate": 8.395514553593877e-05, + "loss": 0.0092, + "step": 555640 + }, + { + "epoch": 1.44, + "learning_rate": 8.395125731956732e-05, + "loss": 0.0079, + "step": 555650 + }, + { + "epoch": 1.44, + "learning_rate": 8.394736910319584e-05, + "loss": 0.0073, + "step": 555660 + }, + { + "epoch": 1.44, + "learning_rate": 8.394348088682439e-05, + "loss": 0.0096, + "step": 555670 + }, + { + "epoch": 1.44, + "learning_rate": 8.393959267045291e-05, + "loss": 0.0091, + "step": 555680 + }, + { + "epoch": 1.44, + "learning_rate": 8.393570445408146e-05, + "loss": 0.0088, + "step": 555690 + }, + { + "epoch": 1.44, + "learning_rate": 8.393181623770998e-05, + "loss": 0.0103, + "step": 555700 + }, + { + "epoch": 1.44, + "learning_rate": 8.392792802133852e-05, + "loss": 0.01, + "step": 555710 + }, + { + "epoch": 1.44, + "learning_rate": 8.392403980496705e-05, + "loss": 0.0086, + "step": 555720 + }, + { + "epoch": 1.44, + "learning_rate": 8.392015158859561e-05, + "loss": 0.0089, + "step": 555730 + }, + { + "epoch": 1.44, + "learning_rate": 8.391626337222412e-05, + "loss": 0.0134, + "step": 555740 + }, + { + "epoch": 1.44, + "learning_rate": 8.391237515585268e-05, + "loss": 0.007, + "step": 555750 + }, + { + "epoch": 1.44, + "learning_rate": 8.39084869394812e-05, + "loss": 0.0079, + "step": 555760 + }, + { + "epoch": 1.44, + "learning_rate": 8.390459872310973e-05, + "loss": 0.0144, + "step": 555770 + }, + { + "epoch": 1.44, + "learning_rate": 8.390071050673828e-05, + "loss": 0.0109, + "step": 555780 + }, + { + "epoch": 1.44, + "learning_rate": 8.38968222903668e-05, + "loss": 0.0087, + "step": 555790 + }, + { + "epoch": 1.44, + "learning_rate": 8.389293407399535e-05, + "loss": 0.0106, + "step": 555800 + }, + { + "epoch": 1.44, + "learning_rate": 8.388904585762387e-05, + "loss": 0.0087, + "step": 555810 + }, + { + "epoch": 1.44, + "learning_rate": 8.388515764125242e-05, + "loss": 0.0101, + "step": 555820 + }, + { + "epoch": 1.44, + "learning_rate": 8.388126942488094e-05, + "loss": 0.0077, + "step": 555830 + }, + { + "epoch": 1.44, + "learning_rate": 8.387738120850948e-05, + "loss": 0.0102, + "step": 555840 + }, + { + "epoch": 1.44, + "learning_rate": 8.387349299213801e-05, + "loss": 0.0105, + "step": 555850 + }, + { + "epoch": 1.44, + "learning_rate": 8.386960477576655e-05, + "loss": 0.01, + "step": 555860 + }, + { + "epoch": 1.44, + "learning_rate": 8.386571655939508e-05, + "loss": 0.0098, + "step": 555870 + }, + { + "epoch": 1.44, + "learning_rate": 8.386182834302362e-05, + "loss": 0.0077, + "step": 555880 + }, + { + "epoch": 1.44, + "learning_rate": 8.385794012665215e-05, + "loss": 0.0093, + "step": 555890 + }, + { + "epoch": 1.44, + "learning_rate": 8.38540519102807e-05, + "loss": 0.0091, + "step": 555900 + }, + { + "epoch": 1.44, + "learning_rate": 8.385016369390922e-05, + "loss": 0.0122, + "step": 555910 + }, + { + "epoch": 1.44, + "learning_rate": 8.384627547753778e-05, + "loss": 0.0119, + "step": 555920 + }, + { + "epoch": 1.44, + "learning_rate": 8.38423872611663e-05, + "loss": 0.0102, + "step": 555930 + }, + { + "epoch": 1.44, + "learning_rate": 8.383849904479485e-05, + "loss": 0.009, + "step": 555940 + }, + { + "epoch": 1.44, + "learning_rate": 8.383461082842338e-05, + "loss": 0.0084, + "step": 555950 + }, + { + "epoch": 1.44, + "learning_rate": 8.383072261205192e-05, + "loss": 0.0097, + "step": 555960 + }, + { + "epoch": 1.44, + "learning_rate": 8.382683439568044e-05, + "loss": 0.0112, + "step": 555970 + }, + { + "epoch": 1.44, + "learning_rate": 8.382294617930899e-05, + "loss": 0.0072, + "step": 555980 + }, + { + "epoch": 1.44, + "learning_rate": 8.381905796293751e-05, + "loss": 0.0102, + "step": 555990 + }, + { + "epoch": 1.44, + "learning_rate": 8.381516974656606e-05, + "loss": 0.0118, + "step": 556000 + }, + { + "epoch": 1.44, + "eval_cer": 0.88167329394755, + "eval_loss": 0.0062253098003566265, + "eval_runtime": 107.7174, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, + "step": 556000 + }, + { + "epoch": 1.44, + "learning_rate": 8.381128153019458e-05, + "loss": 0.0078, + "step": 556010 + }, + { + "epoch": 1.44, + "learning_rate": 8.380739331382311e-05, + "loss": 0.0055, + "step": 556020 + }, + { + "epoch": 1.44, + "learning_rate": 8.380350509745165e-05, + "loss": 0.0091, + "step": 556030 + }, + { + "epoch": 1.44, + "learning_rate": 8.379961688108018e-05, + "loss": 0.0083, + "step": 556040 + }, + { + "epoch": 1.44, + "learning_rate": 8.379572866470872e-05, + "loss": 0.0068, + "step": 556050 + }, + { + "epoch": 1.44, + "learning_rate": 8.379184044833725e-05, + "loss": 0.0079, + "step": 556060 + }, + { + "epoch": 1.44, + "learning_rate": 8.37879522319658e-05, + "loss": 0.01, + "step": 556070 + }, + { + "epoch": 1.44, + "learning_rate": 8.378406401559432e-05, + "loss": 0.0096, + "step": 556080 + }, + { + "epoch": 1.44, + "learning_rate": 8.378017579922288e-05, + "loss": 0.01, + "step": 556090 + }, + { + "epoch": 1.44, + "learning_rate": 8.377628758285139e-05, + "loss": 0.0123, + "step": 556100 + }, + { + "epoch": 1.44, + "learning_rate": 8.377239936647995e-05, + "loss": 0.0085, + "step": 556110 + }, + { + "epoch": 1.44, + "learning_rate": 8.376851115010847e-05, + "loss": 0.0123, + "step": 556120 + }, + { + "epoch": 1.44, + "learning_rate": 8.376462293373702e-05, + "loss": 0.0097, + "step": 556130 + }, + { + "epoch": 1.44, + "learning_rate": 8.376073471736554e-05, + "loss": 0.0081, + "step": 556140 + }, + { + "epoch": 1.44, + "learning_rate": 8.375684650099409e-05, + "loss": 0.0073, + "step": 556150 + }, + { + "epoch": 1.44, + "learning_rate": 8.375295828462261e-05, + "loss": 0.0097, + "step": 556160 + }, + { + "epoch": 1.44, + "learning_rate": 8.374907006825116e-05, + "loss": 0.0079, + "step": 556170 + }, + { + "epoch": 1.44, + "learning_rate": 8.374518185187968e-05, + "loss": 0.0108, + "step": 556180 + }, + { + "epoch": 1.44, + "learning_rate": 8.374129363550823e-05, + "loss": 0.0098, + "step": 556190 + }, + { + "epoch": 1.44, + "learning_rate": 8.373740541913675e-05, + "loss": 0.0088, + "step": 556200 + }, + { + "epoch": 1.44, + "learning_rate": 8.37335172027653e-05, + "loss": 0.0077, + "step": 556210 + }, + { + "epoch": 1.44, + "learning_rate": 8.372962898639382e-05, + "loss": 0.0088, + "step": 556220 + }, + { + "epoch": 1.44, + "learning_rate": 8.372574077002236e-05, + "loss": 0.0108, + "step": 556230 + }, + { + "epoch": 1.44, + "learning_rate": 8.372185255365089e-05, + "loss": 0.0081, + "step": 556240 + }, + { + "epoch": 1.44, + "learning_rate": 8.371796433727945e-05, + "loss": 0.0083, + "step": 556250 + }, + { + "epoch": 1.44, + "learning_rate": 8.371407612090796e-05, + "loss": 0.0091, + "step": 556260 + }, + { + "epoch": 1.44, + "learning_rate": 8.371018790453649e-05, + "loss": 0.01, + "step": 556270 + }, + { + "epoch": 1.44, + "learning_rate": 8.370629968816505e-05, + "loss": 0.0072, + "step": 556280 + }, + { + "epoch": 1.44, + "learning_rate": 8.370241147179357e-05, + "loss": 0.0139, + "step": 556290 + }, + { + "epoch": 1.44, + "learning_rate": 8.369852325542212e-05, + "loss": 0.0077, + "step": 556300 + }, + { + "epoch": 1.44, + "learning_rate": 8.369463503905064e-05, + "loss": 0.0113, + "step": 556310 + }, + { + "epoch": 1.44, + "learning_rate": 8.369074682267919e-05, + "loss": 0.0094, + "step": 556320 + }, + { + "epoch": 1.44, + "learning_rate": 8.368685860630771e-05, + "loss": 0.0087, + "step": 556330 + }, + { + "epoch": 1.44, + "learning_rate": 8.368297038993626e-05, + "loss": 0.0104, + "step": 556340 + }, + { + "epoch": 1.44, + "learning_rate": 8.367908217356478e-05, + "loss": 0.0107, + "step": 556350 + }, + { + "epoch": 1.44, + "learning_rate": 8.367519395719332e-05, + "loss": 0.0109, + "step": 556360 + }, + { + "epoch": 1.44, + "learning_rate": 8.367130574082185e-05, + "loss": 0.009, + "step": 556370 + }, + { + "epoch": 1.44, + "learning_rate": 8.36674175244504e-05, + "loss": 0.0089, + "step": 556380 + }, + { + "epoch": 1.44, + "learning_rate": 8.366352930807892e-05, + "loss": 0.0084, + "step": 556390 + }, + { + "epoch": 1.44, + "learning_rate": 8.365964109170746e-05, + "loss": 0.0092, + "step": 556400 + }, + { + "epoch": 1.44, + "learning_rate": 8.365575287533599e-05, + "loss": 0.0105, + "step": 556410 + }, + { + "epoch": 1.44, + "learning_rate": 8.365186465896453e-05, + "loss": 0.0082, + "step": 556420 + }, + { + "epoch": 1.44, + "learning_rate": 8.364797644259306e-05, + "loss": 0.0098, + "step": 556430 + }, + { + "epoch": 1.44, + "learning_rate": 8.364408822622162e-05, + "loss": 0.0083, + "step": 556440 + }, + { + "epoch": 1.44, + "learning_rate": 8.364020000985015e-05, + "loss": 0.0075, + "step": 556450 + }, + { + "epoch": 1.44, + "learning_rate": 8.363631179347869e-05, + "loss": 0.0085, + "step": 556460 + }, + { + "epoch": 1.44, + "learning_rate": 8.363242357710722e-05, + "loss": 0.0076, + "step": 556470 + }, + { + "epoch": 1.44, + "learning_rate": 8.362853536073576e-05, + "loss": 0.0094, + "step": 556480 + }, + { + "epoch": 1.44, + "learning_rate": 8.362464714436428e-05, + "loss": 0.0087, + "step": 556490 + }, + { + "epoch": 1.44, + "learning_rate": 8.362075892799283e-05, + "loss": 0.0119, + "step": 556500 + }, + { + "epoch": 1.44, + "learning_rate": 8.361687071162135e-05, + "loss": 0.008, + "step": 556510 + }, + { + "epoch": 1.44, + "learning_rate": 8.361298249524988e-05, + "loss": 0.01, + "step": 556520 + }, + { + "epoch": 1.44, + "learning_rate": 8.360909427887842e-05, + "loss": 0.0096, + "step": 556530 + }, + { + "epoch": 1.44, + "learning_rate": 8.360520606250695e-05, + "loss": 0.0083, + "step": 556540 + }, + { + "epoch": 1.44, + "learning_rate": 8.36013178461355e-05, + "loss": 0.0079, + "step": 556550 + }, + { + "epoch": 1.44, + "learning_rate": 8.359742962976402e-05, + "loss": 0.0091, + "step": 556560 + }, + { + "epoch": 1.44, + "learning_rate": 8.359354141339256e-05, + "loss": 0.0119, + "step": 556570 + }, + { + "epoch": 1.44, + "learning_rate": 8.358965319702109e-05, + "loss": 0.0155, + "step": 556580 + }, + { + "epoch": 1.44, + "learning_rate": 8.358576498064963e-05, + "loss": 0.0092, + "step": 556590 + }, + { + "epoch": 1.44, + "learning_rate": 8.358187676427816e-05, + "loss": 0.0094, + "step": 556600 + }, + { + "epoch": 1.44, + "learning_rate": 8.357798854790672e-05, + "loss": 0.0074, + "step": 556610 + }, + { + "epoch": 1.44, + "learning_rate": 8.357410033153523e-05, + "loss": 0.0097, + "step": 556620 + }, + { + "epoch": 1.44, + "learning_rate": 8.357021211516379e-05, + "loss": 0.0102, + "step": 556630 + }, + { + "epoch": 1.44, + "learning_rate": 8.356632389879231e-05, + "loss": 0.0088, + "step": 556640 + }, + { + "epoch": 1.44, + "learning_rate": 8.356243568242086e-05, + "loss": 0.0113, + "step": 556650 + }, + { + "epoch": 1.44, + "learning_rate": 8.355854746604938e-05, + "loss": 0.0083, + "step": 556660 + }, + { + "epoch": 1.44, + "learning_rate": 8.355465924967793e-05, + "loss": 0.0098, + "step": 556670 + }, + { + "epoch": 1.44, + "learning_rate": 8.355077103330645e-05, + "loss": 0.0105, + "step": 556680 + }, + { + "epoch": 1.44, + "learning_rate": 8.3546882816935e-05, + "loss": 0.0083, + "step": 556690 + }, + { + "epoch": 1.44, + "learning_rate": 8.354299460056352e-05, + "loss": 0.0092, + "step": 556700 + }, + { + "epoch": 1.44, + "learning_rate": 8.353910638419207e-05, + "loss": 0.0078, + "step": 556710 + }, + { + "epoch": 1.44, + "learning_rate": 8.35352181678206e-05, + "loss": 0.0102, + "step": 556720 + }, + { + "epoch": 1.44, + "learning_rate": 8.353132995144914e-05, + "loss": 0.0081, + "step": 556730 + }, + { + "epoch": 1.44, + "learning_rate": 8.352744173507766e-05, + "loss": 0.0096, + "step": 556740 + }, + { + "epoch": 1.44, + "learning_rate": 8.35235535187062e-05, + "loss": 0.0093, + "step": 556750 + }, + { + "epoch": 1.44, + "learning_rate": 8.351966530233473e-05, + "loss": 0.0084, + "step": 556760 + }, + { + "epoch": 1.44, + "learning_rate": 8.351577708596326e-05, + "loss": 0.0073, + "step": 556770 + }, + { + "epoch": 1.44, + "learning_rate": 8.35118888695918e-05, + "loss": 0.0107, + "step": 556780 + }, + { + "epoch": 1.44, + "learning_rate": 8.350800065322033e-05, + "loss": 0.0096, + "step": 556790 + }, + { + "epoch": 1.44, + "learning_rate": 8.350411243684889e-05, + "loss": 0.0098, + "step": 556800 + }, + { + "epoch": 1.44, + "learning_rate": 8.350022422047741e-05, + "loss": 0.0102, + "step": 556810 + }, + { + "epoch": 1.44, + "learning_rate": 8.349633600410596e-05, + "loss": 0.0101, + "step": 556820 + }, + { + "epoch": 1.44, + "learning_rate": 8.349244778773448e-05, + "loss": 0.0079, + "step": 556830 + }, + { + "epoch": 1.44, + "learning_rate": 8.348855957136303e-05, + "loss": 0.0076, + "step": 556840 + }, + { + "epoch": 1.44, + "learning_rate": 8.348467135499155e-05, + "loss": 0.009, + "step": 556850 + }, + { + "epoch": 1.44, + "learning_rate": 8.34807831386201e-05, + "loss": 0.0105, + "step": 556860 + }, + { + "epoch": 1.44, + "learning_rate": 8.347689492224862e-05, + "loss": 0.013, + "step": 556870 + }, + { + "epoch": 1.44, + "learning_rate": 8.347300670587716e-05, + "loss": 0.0076, + "step": 556880 + }, + { + "epoch": 1.44, + "learning_rate": 8.346911848950569e-05, + "loss": 0.0093, + "step": 556890 + }, + { + "epoch": 1.44, + "learning_rate": 8.346523027313423e-05, + "loss": 0.0136, + "step": 556900 + }, + { + "epoch": 1.44, + "learning_rate": 8.346134205676276e-05, + "loss": 0.0113, + "step": 556910 + }, + { + "epoch": 1.44, + "learning_rate": 8.34574538403913e-05, + "loss": 0.0062, + "step": 556920 + }, + { + "epoch": 1.44, + "learning_rate": 8.345356562401983e-05, + "loss": 0.0086, + "step": 556930 + }, + { + "epoch": 1.44, + "learning_rate": 8.344967740764837e-05, + "loss": 0.0096, + "step": 556940 + }, + { + "epoch": 1.44, + "learning_rate": 8.34457891912769e-05, + "loss": 0.0085, + "step": 556950 + }, + { + "epoch": 1.44, + "learning_rate": 8.344190097490546e-05, + "loss": 0.0095, + "step": 556960 + }, + { + "epoch": 1.44, + "learning_rate": 8.343801275853399e-05, + "loss": 0.0108, + "step": 556970 + }, + { + "epoch": 1.44, + "learning_rate": 8.343412454216253e-05, + "loss": 0.0101, + "step": 556980 + }, + { + "epoch": 1.44, + "learning_rate": 8.343023632579106e-05, + "loss": 0.0076, + "step": 556990 + }, + { + "epoch": 1.44, + "learning_rate": 8.342634810941958e-05, + "loss": 0.0101, + "step": 557000 + }, + { + "epoch": 1.44, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.006132596172392368, + "eval_runtime": 107.8337, + "eval_samples_per_second": 18.547, + "eval_steps_per_second": 4.637, + "step": 557000 + }, + { + "epoch": 1.44, + "learning_rate": 8.342245989304812e-05, + "loss": 0.0092, + "step": 557010 + }, + { + "epoch": 1.44, + "learning_rate": 8.341857167667665e-05, + "loss": 0.0075, + "step": 557020 + }, + { + "epoch": 1.44, + "learning_rate": 8.34146834603052e-05, + "loss": 0.0099, + "step": 557030 + }, + { + "epoch": 1.44, + "learning_rate": 8.341079524393372e-05, + "loss": 0.0092, + "step": 557040 + }, + { + "epoch": 1.44, + "learning_rate": 8.340690702756226e-05, + "loss": 0.0095, + "step": 557050 + }, + { + "epoch": 1.44, + "learning_rate": 8.340301881119079e-05, + "loss": 0.0092, + "step": 557060 + }, + { + "epoch": 1.44, + "learning_rate": 8.339913059481933e-05, + "loss": 0.0088, + "step": 557070 + }, + { + "epoch": 1.44, + "learning_rate": 8.339524237844786e-05, + "loss": 0.0068, + "step": 557080 + }, + { + "epoch": 1.44, + "learning_rate": 8.33913541620764e-05, + "loss": 0.0115, + "step": 557090 + }, + { + "epoch": 1.44, + "learning_rate": 8.338746594570493e-05, + "loss": 0.0072, + "step": 557100 + }, + { + "epoch": 1.44, + "learning_rate": 8.338357772933347e-05, + "loss": 0.009, + "step": 557110 + }, + { + "epoch": 1.44, + "learning_rate": 8.3379689512962e-05, + "loss": 0.0086, + "step": 557120 + }, + { + "epoch": 1.44, + "learning_rate": 8.337580129659054e-05, + "loss": 0.0078, + "step": 557130 + }, + { + "epoch": 1.44, + "learning_rate": 8.337191308021907e-05, + "loss": 0.0104, + "step": 557140 + }, + { + "epoch": 1.44, + "learning_rate": 8.336802486384763e-05, + "loss": 0.0111, + "step": 557150 + }, + { + "epoch": 1.44, + "learning_rate": 8.336413664747615e-05, + "loss": 0.0061, + "step": 557160 + }, + { + "epoch": 1.44, + "learning_rate": 8.33602484311047e-05, + "loss": 0.0096, + "step": 557170 + }, + { + "epoch": 1.44, + "learning_rate": 8.335636021473322e-05, + "loss": 0.01, + "step": 557180 + }, + { + "epoch": 1.44, + "learning_rate": 8.335247199836177e-05, + "loss": 0.009, + "step": 557190 + }, + { + "epoch": 1.44, + "learning_rate": 8.33485837819903e-05, + "loss": 0.0111, + "step": 557200 + }, + { + "epoch": 1.44, + "learning_rate": 8.334469556561884e-05, + "loss": 0.0092, + "step": 557210 + }, + { + "epoch": 1.44, + "learning_rate": 8.334080734924736e-05, + "loss": 0.009, + "step": 557220 + }, + { + "epoch": 1.44, + "learning_rate": 8.33369191328759e-05, + "loss": 0.0078, + "step": 557230 + }, + { + "epoch": 1.44, + "learning_rate": 8.333303091650443e-05, + "loss": 0.0087, + "step": 557240 + }, + { + "epoch": 1.44, + "learning_rate": 8.332914270013296e-05, + "loss": 0.0118, + "step": 557250 + }, + { + "epoch": 1.44, + "learning_rate": 8.33252544837615e-05, + "loss": 0.0081, + "step": 557260 + }, + { + "epoch": 1.44, + "learning_rate": 8.332136626739003e-05, + "loss": 0.0064, + "step": 557270 + }, + { + "epoch": 1.44, + "learning_rate": 8.331747805101857e-05, + "loss": 0.011, + "step": 557280 + }, + { + "epoch": 1.44, + "learning_rate": 8.33135898346471e-05, + "loss": 0.0068, + "step": 557290 + }, + { + "epoch": 1.44, + "learning_rate": 8.330970161827564e-05, + "loss": 0.0099, + "step": 557300 + }, + { + "epoch": 1.44, + "learning_rate": 8.330581340190417e-05, + "loss": 0.0126, + "step": 557310 + }, + { + "epoch": 1.44, + "learning_rate": 8.330192518553273e-05, + "loss": 0.009, + "step": 557320 + }, + { + "epoch": 1.44, + "learning_rate": 8.329803696916124e-05, + "loss": 0.0112, + "step": 557330 + }, + { + "epoch": 1.44, + "learning_rate": 8.32941487527898e-05, + "loss": 0.0103, + "step": 557340 + }, + { + "epoch": 1.44, + "learning_rate": 8.329026053641832e-05, + "loss": 0.0117, + "step": 557350 + }, + { + "epoch": 1.44, + "learning_rate": 8.328637232004687e-05, + "loss": 0.0131, + "step": 557360 + }, + { + "epoch": 1.44, + "learning_rate": 8.32824841036754e-05, + "loss": 0.0095, + "step": 557370 + }, + { + "epoch": 1.44, + "learning_rate": 8.327859588730393e-05, + "loss": 0.0081, + "step": 557380 + }, + { + "epoch": 1.44, + "learning_rate": 8.327470767093246e-05, + "loss": 0.0101, + "step": 557390 + }, + { + "epoch": 1.44, + "learning_rate": 8.3270819454561e-05, + "loss": 0.0103, + "step": 557400 + }, + { + "epoch": 1.44, + "learning_rate": 8.326693123818953e-05, + "loss": 0.0085, + "step": 557410 + }, + { + "epoch": 1.44, + "learning_rate": 8.326304302181807e-05, + "loss": 0.0099, + "step": 557420 + }, + { + "epoch": 1.44, + "learning_rate": 8.32591548054466e-05, + "loss": 0.008, + "step": 557430 + }, + { + "epoch": 1.44, + "learning_rate": 8.325526658907514e-05, + "loss": 0.0101, + "step": 557440 + }, + { + "epoch": 1.44, + "learning_rate": 8.325137837270367e-05, + "loss": 0.0071, + "step": 557450 + }, + { + "epoch": 1.45, + "learning_rate": 8.324749015633221e-05, + "loss": 0.0099, + "step": 557460 + }, + { + "epoch": 1.45, + "learning_rate": 8.324360193996074e-05, + "loss": 0.0099, + "step": 557470 + }, + { + "epoch": 1.45, + "learning_rate": 8.32397137235893e-05, + "loss": 0.0108, + "step": 557480 + }, + { + "epoch": 1.45, + "learning_rate": 8.323582550721781e-05, + "loss": 0.0101, + "step": 557490 + }, + { + "epoch": 1.45, + "learning_rate": 8.323193729084634e-05, + "loss": 0.0096, + "step": 557500 + }, + { + "epoch": 1.45, + "learning_rate": 8.32280490744749e-05, + "loss": 0.0115, + "step": 557510 + }, + { + "epoch": 1.45, + "learning_rate": 8.322416085810342e-05, + "loss": 0.0097, + "step": 557520 + }, + { + "epoch": 1.45, + "learning_rate": 8.322027264173196e-05, + "loss": 0.0095, + "step": 557530 + }, + { + "epoch": 1.45, + "learning_rate": 8.321638442536049e-05, + "loss": 0.012, + "step": 557540 + }, + { + "epoch": 1.45, + "learning_rate": 8.321249620898903e-05, + "loss": 0.0119, + "step": 557550 + }, + { + "epoch": 1.45, + "learning_rate": 8.320860799261756e-05, + "loss": 0.0097, + "step": 557560 + }, + { + "epoch": 1.45, + "learning_rate": 8.32047197762461e-05, + "loss": 0.0075, + "step": 557570 + }, + { + "epoch": 1.45, + "learning_rate": 8.320083155987463e-05, + "loss": 0.0097, + "step": 557580 + }, + { + "epoch": 1.45, + "learning_rate": 8.319694334350317e-05, + "loss": 0.0074, + "step": 557590 + }, + { + "epoch": 1.45, + "learning_rate": 8.31930551271317e-05, + "loss": 0.0066, + "step": 557600 + }, + { + "epoch": 1.45, + "learning_rate": 8.318916691076024e-05, + "loss": 0.0068, + "step": 557610 + }, + { + "epoch": 1.45, + "learning_rate": 8.318527869438877e-05, + "loss": 0.0091, + "step": 557620 + }, + { + "epoch": 1.45, + "learning_rate": 8.318139047801731e-05, + "loss": 0.0115, + "step": 557630 + }, + { + "epoch": 1.45, + "learning_rate": 8.317750226164584e-05, + "loss": 0.0086, + "step": 557640 + }, + { + "epoch": 1.45, + "learning_rate": 8.317361404527438e-05, + "loss": 0.0106, + "step": 557650 + }, + { + "epoch": 1.45, + "learning_rate": 8.316972582890291e-05, + "loss": 0.0115, + "step": 557660 + }, + { + "epoch": 1.45, + "learning_rate": 8.316583761253147e-05, + "loss": 0.0067, + "step": 557670 + }, + { + "epoch": 1.45, + "learning_rate": 8.316194939616e-05, + "loss": 0.0105, + "step": 557680 + }, + { + "epoch": 1.45, + "learning_rate": 8.315806117978854e-05, + "loss": 0.0085, + "step": 557690 + }, + { + "epoch": 1.45, + "learning_rate": 8.315417296341706e-05, + "loss": 0.0094, + "step": 557700 + }, + { + "epoch": 1.45, + "learning_rate": 8.31502847470456e-05, + "loss": 0.0076, + "step": 557710 + }, + { + "epoch": 1.45, + "learning_rate": 8.314639653067413e-05, + "loss": 0.012, + "step": 557720 + }, + { + "epoch": 1.45, + "learning_rate": 8.314250831430268e-05, + "loss": 0.0073, + "step": 557730 + }, + { + "epoch": 1.45, + "learning_rate": 8.31386200979312e-05, + "loss": 0.0103, + "step": 557740 + }, + { + "epoch": 1.45, + "learning_rate": 8.313473188155973e-05, + "loss": 0.0106, + "step": 557750 + }, + { + "epoch": 1.45, + "learning_rate": 8.313084366518827e-05, + "loss": 0.0101, + "step": 557760 + }, + { + "epoch": 1.45, + "learning_rate": 8.31269554488168e-05, + "loss": 0.013, + "step": 557770 + }, + { + "epoch": 1.45, + "learning_rate": 8.312306723244534e-05, + "loss": 0.0082, + "step": 557780 + }, + { + "epoch": 1.45, + "learning_rate": 8.311917901607387e-05, + "loss": 0.0079, + "step": 557790 + }, + { + "epoch": 1.45, + "learning_rate": 8.311529079970241e-05, + "loss": 0.0086, + "step": 557800 + }, + { + "epoch": 1.45, + "learning_rate": 8.311140258333094e-05, + "loss": 0.0084, + "step": 557810 + }, + { + "epoch": 1.45, + "learning_rate": 8.310751436695948e-05, + "loss": 0.0107, + "step": 557820 + }, + { + "epoch": 1.45, + "learning_rate": 8.310362615058801e-05, + "loss": 0.0082, + "step": 557830 + }, + { + "epoch": 1.45, + "learning_rate": 8.309973793421657e-05, + "loss": 0.0156, + "step": 557840 + }, + { + "epoch": 1.45, + "learning_rate": 8.309584971784508e-05, + "loss": 0.0092, + "step": 557850 + }, + { + "epoch": 1.45, + "learning_rate": 8.309196150147364e-05, + "loss": 0.0103, + "step": 557860 + }, + { + "epoch": 1.45, + "learning_rate": 8.308807328510216e-05, + "loss": 0.0105, + "step": 557870 + }, + { + "epoch": 1.45, + "learning_rate": 8.30841850687307e-05, + "loss": 0.0112, + "step": 557880 + }, + { + "epoch": 1.45, + "learning_rate": 8.308029685235923e-05, + "loss": 0.0107, + "step": 557890 + }, + { + "epoch": 1.45, + "learning_rate": 8.307640863598777e-05, + "loss": 0.0095, + "step": 557900 + }, + { + "epoch": 1.45, + "learning_rate": 8.30725204196163e-05, + "loss": 0.0071, + "step": 557910 + }, + { + "epoch": 1.45, + "learning_rate": 8.306863220324484e-05, + "loss": 0.0109, + "step": 557920 + }, + { + "epoch": 1.45, + "learning_rate": 8.306474398687337e-05, + "loss": 0.0087, + "step": 557930 + }, + { + "epoch": 1.45, + "learning_rate": 8.306085577050191e-05, + "loss": 0.0073, + "step": 557940 + }, + { + "epoch": 1.45, + "learning_rate": 8.305696755413044e-05, + "loss": 0.011, + "step": 557950 + }, + { + "epoch": 1.45, + "learning_rate": 8.305307933775898e-05, + "loss": 0.0084, + "step": 557960 + }, + { + "epoch": 1.45, + "learning_rate": 8.304919112138751e-05, + "loss": 0.0083, + "step": 557970 + }, + { + "epoch": 1.45, + "learning_rate": 8.304530290501605e-05, + "loss": 0.0092, + "step": 557980 + }, + { + "epoch": 1.45, + "learning_rate": 8.304141468864458e-05, + "loss": 0.0091, + "step": 557990 + }, + { + "epoch": 1.45, + "learning_rate": 8.303752647227311e-05, + "loss": 0.0111, + "step": 558000 + }, + { + "epoch": 1.45, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.006029914598912001, + "eval_runtime": 108.0298, + "eval_samples_per_second": 18.513, + "eval_steps_per_second": 4.628, + "step": 558000 + }, + { + "epoch": 1.45, + "learning_rate": 8.303363825590165e-05, + "loss": 0.01, + "step": 558010 + }, + { + "epoch": 1.45, + "learning_rate": 8.302975003953018e-05, + "loss": 0.0076, + "step": 558020 + }, + { + "epoch": 1.45, + "learning_rate": 8.302586182315873e-05, + "loss": 0.0064, + "step": 558030 + }, + { + "epoch": 1.45, + "learning_rate": 8.302197360678726e-05, + "loss": 0.0121, + "step": 558040 + }, + { + "epoch": 1.45, + "learning_rate": 8.30180853904158e-05, + "loss": 0.0096, + "step": 558050 + }, + { + "epoch": 1.45, + "learning_rate": 8.301419717404433e-05, + "loss": 0.0103, + "step": 558060 + }, + { + "epoch": 1.45, + "learning_rate": 8.301030895767287e-05, + "loss": 0.0098, + "step": 558070 + }, + { + "epoch": 1.45, + "learning_rate": 8.30064207413014e-05, + "loss": 0.0102, + "step": 558080 + }, + { + "epoch": 1.45, + "learning_rate": 8.300253252492994e-05, + "loss": 0.0133, + "step": 558090 + }, + { + "epoch": 1.45, + "learning_rate": 8.299864430855847e-05, + "loss": 0.0112, + "step": 558100 + }, + { + "epoch": 1.45, + "learning_rate": 8.299475609218701e-05, + "loss": 0.0096, + "step": 558110 + }, + { + "epoch": 1.45, + "learning_rate": 8.299086787581554e-05, + "loss": 0.008, + "step": 558120 + }, + { + "epoch": 1.45, + "learning_rate": 8.298697965944408e-05, + "loss": 0.01, + "step": 558130 + }, + { + "epoch": 1.45, + "learning_rate": 8.298309144307261e-05, + "loss": 0.0092, + "step": 558140 + }, + { + "epoch": 1.45, + "learning_rate": 8.297920322670115e-05, + "loss": 0.0093, + "step": 558150 + }, + { + "epoch": 1.45, + "learning_rate": 8.297531501032968e-05, + "loss": 0.0071, + "step": 558160 + }, + { + "epoch": 1.45, + "learning_rate": 8.297142679395822e-05, + "loss": 0.0106, + "step": 558170 + }, + { + "epoch": 1.45, + "learning_rate": 8.296753857758675e-05, + "loss": 0.0068, + "step": 558180 + }, + { + "epoch": 1.45, + "learning_rate": 8.29636503612153e-05, + "loss": 0.0115, + "step": 558190 + }, + { + "epoch": 1.45, + "learning_rate": 8.295976214484383e-05, + "loss": 0.0092, + "step": 558200 + }, + { + "epoch": 1.45, + "learning_rate": 8.295587392847238e-05, + "loss": 0.0094, + "step": 558210 + }, + { + "epoch": 1.45, + "learning_rate": 8.29519857121009e-05, + "loss": 0.0079, + "step": 558220 + }, + { + "epoch": 1.45, + "learning_rate": 8.294809749572945e-05, + "loss": 0.0088, + "step": 558230 + }, + { + "epoch": 1.45, + "learning_rate": 8.294420927935797e-05, + "loss": 0.013, + "step": 558240 + }, + { + "epoch": 1.45, + "learning_rate": 8.29403210629865e-05, + "loss": 0.0098, + "step": 558250 + }, + { + "epoch": 1.45, + "learning_rate": 8.293643284661504e-05, + "loss": 0.0075, + "step": 558260 + }, + { + "epoch": 1.45, + "learning_rate": 8.293254463024357e-05, + "loss": 0.0122, + "step": 558270 + }, + { + "epoch": 1.45, + "learning_rate": 8.292865641387211e-05, + "loss": 0.0093, + "step": 558280 + }, + { + "epoch": 1.45, + "learning_rate": 8.292476819750064e-05, + "loss": 0.0093, + "step": 558290 + }, + { + "epoch": 1.45, + "learning_rate": 8.292087998112918e-05, + "loss": 0.0091, + "step": 558300 + }, + { + "epoch": 1.45, + "learning_rate": 8.291699176475771e-05, + "loss": 0.0084, + "step": 558310 + }, + { + "epoch": 1.45, + "learning_rate": 8.291310354838625e-05, + "loss": 0.0096, + "step": 558320 + }, + { + "epoch": 1.45, + "learning_rate": 8.290921533201478e-05, + "loss": 0.0103, + "step": 558330 + }, + { + "epoch": 1.45, + "learning_rate": 8.290532711564332e-05, + "loss": 0.0057, + "step": 558340 + }, + { + "epoch": 1.45, + "learning_rate": 8.290143889927185e-05, + "loss": 0.0087, + "step": 558350 + }, + { + "epoch": 1.45, + "learning_rate": 8.28975506829004e-05, + "loss": 0.0076, + "step": 558360 + }, + { + "epoch": 1.45, + "learning_rate": 8.289366246652892e-05, + "loss": 0.0091, + "step": 558370 + }, + { + "epoch": 1.45, + "learning_rate": 8.288977425015748e-05, + "loss": 0.0064, + "step": 558380 + }, + { + "epoch": 1.45, + "learning_rate": 8.2885886033786e-05, + "loss": 0.009, + "step": 558390 + }, + { + "epoch": 1.45, + "learning_rate": 8.288199781741455e-05, + "loss": 0.0085, + "step": 558400 + }, + { + "epoch": 1.45, + "learning_rate": 8.287810960104307e-05, + "loss": 0.0108, + "step": 558410 + }, + { + "epoch": 1.45, + "learning_rate": 8.287422138467161e-05, + "loss": 0.0071, + "step": 558420 + }, + { + "epoch": 1.45, + "learning_rate": 8.287033316830014e-05, + "loss": 0.0119, + "step": 558430 + }, + { + "epoch": 1.45, + "learning_rate": 8.286644495192868e-05, + "loss": 0.0081, + "step": 558440 + }, + { + "epoch": 1.45, + "learning_rate": 8.286255673555721e-05, + "loss": 0.0101, + "step": 558450 + }, + { + "epoch": 1.45, + "learning_rate": 8.285866851918575e-05, + "loss": 0.0087, + "step": 558460 + }, + { + "epoch": 1.45, + "learning_rate": 8.285478030281428e-05, + "loss": 0.0136, + "step": 558470 + }, + { + "epoch": 1.45, + "learning_rate": 8.285089208644282e-05, + "loss": 0.0079, + "step": 558480 + }, + { + "epoch": 1.45, + "learning_rate": 8.284700387007135e-05, + "loss": 0.0074, + "step": 558490 + }, + { + "epoch": 1.45, + "learning_rate": 8.284311565369988e-05, + "loss": 0.0068, + "step": 558500 + }, + { + "epoch": 1.45, + "learning_rate": 8.283922743732842e-05, + "loss": 0.0126, + "step": 558510 + }, + { + "epoch": 1.45, + "learning_rate": 8.283533922095695e-05, + "loss": 0.0102, + "step": 558520 + }, + { + "epoch": 1.45, + "learning_rate": 8.283145100458549e-05, + "loss": 0.0128, + "step": 558530 + }, + { + "epoch": 1.45, + "learning_rate": 8.282756278821402e-05, + "loss": 0.01, + "step": 558540 + }, + { + "epoch": 1.45, + "learning_rate": 8.282367457184257e-05, + "loss": 0.0097, + "step": 558550 + }, + { + "epoch": 1.45, + "learning_rate": 8.28197863554711e-05, + "loss": 0.0096, + "step": 558560 + }, + { + "epoch": 1.45, + "learning_rate": 8.281589813909964e-05, + "loss": 0.0105, + "step": 558570 + }, + { + "epoch": 1.45, + "learning_rate": 8.281200992272817e-05, + "loss": 0.0103, + "step": 558580 + }, + { + "epoch": 1.45, + "learning_rate": 8.280812170635671e-05, + "loss": 0.0084, + "step": 558590 + }, + { + "epoch": 1.45, + "learning_rate": 8.280423348998524e-05, + "loss": 0.0076, + "step": 558600 + }, + { + "epoch": 1.45, + "learning_rate": 8.280034527361378e-05, + "loss": 0.0093, + "step": 558610 + }, + { + "epoch": 1.45, + "learning_rate": 8.279645705724231e-05, + "loss": 0.0091, + "step": 558620 + }, + { + "epoch": 1.45, + "learning_rate": 8.279256884087085e-05, + "loss": 0.0119, + "step": 558630 + }, + { + "epoch": 1.45, + "learning_rate": 8.278868062449938e-05, + "loss": 0.0114, + "step": 558640 + }, + { + "epoch": 1.45, + "learning_rate": 8.278479240812792e-05, + "loss": 0.0065, + "step": 558650 + }, + { + "epoch": 1.45, + "learning_rate": 8.278090419175645e-05, + "loss": 0.0089, + "step": 558660 + }, + { + "epoch": 1.45, + "learning_rate": 8.277701597538499e-05, + "loss": 0.0094, + "step": 558670 + }, + { + "epoch": 1.45, + "learning_rate": 8.277312775901352e-05, + "loss": 0.0107, + "step": 558680 + }, + { + "epoch": 1.45, + "learning_rate": 8.276923954264206e-05, + "loss": 0.0071, + "step": 558690 + }, + { + "epoch": 1.45, + "learning_rate": 8.276535132627059e-05, + "loss": 0.0097, + "step": 558700 + }, + { + "epoch": 1.45, + "learning_rate": 8.276146310989915e-05, + "loss": 0.0112, + "step": 558710 + }, + { + "epoch": 1.45, + "learning_rate": 8.275757489352766e-05, + "loss": 0.0107, + "step": 558720 + }, + { + "epoch": 1.45, + "learning_rate": 8.275368667715622e-05, + "loss": 0.0093, + "step": 558730 + }, + { + "epoch": 1.45, + "learning_rate": 8.274979846078474e-05, + "loss": 0.0088, + "step": 558740 + }, + { + "epoch": 1.45, + "learning_rate": 8.274591024441327e-05, + "loss": 0.0094, + "step": 558750 + }, + { + "epoch": 1.45, + "learning_rate": 8.274202202804181e-05, + "loss": 0.0097, + "step": 558760 + }, + { + "epoch": 1.45, + "learning_rate": 8.273813381167034e-05, + "loss": 0.0103, + "step": 558770 + }, + { + "epoch": 1.45, + "learning_rate": 8.273424559529888e-05, + "loss": 0.0086, + "step": 558780 + }, + { + "epoch": 1.45, + "learning_rate": 8.273035737892741e-05, + "loss": 0.0085, + "step": 558790 + }, + { + "epoch": 1.45, + "learning_rate": 8.272646916255595e-05, + "loss": 0.0096, + "step": 558800 + }, + { + "epoch": 1.45, + "learning_rate": 8.272258094618448e-05, + "loss": 0.01, + "step": 558810 + }, + { + "epoch": 1.45, + "learning_rate": 8.271869272981302e-05, + "loss": 0.0118, + "step": 558820 + }, + { + "epoch": 1.45, + "learning_rate": 8.271480451344155e-05, + "loss": 0.0089, + "step": 558830 + }, + { + "epoch": 1.45, + "learning_rate": 8.271091629707009e-05, + "loss": 0.0094, + "step": 558840 + }, + { + "epoch": 1.45, + "learning_rate": 8.270702808069862e-05, + "loss": 0.0073, + "step": 558850 + }, + { + "epoch": 1.45, + "learning_rate": 8.270313986432716e-05, + "loss": 0.0099, + "step": 558860 + }, + { + "epoch": 1.45, + "learning_rate": 8.269925164795569e-05, + "loss": 0.0074, + "step": 558870 + }, + { + "epoch": 1.45, + "learning_rate": 8.269536343158423e-05, + "loss": 0.0088, + "step": 558880 + }, + { + "epoch": 1.45, + "learning_rate": 8.269147521521276e-05, + "loss": 0.0118, + "step": 558890 + }, + { + "epoch": 1.45, + "learning_rate": 8.268758699884132e-05, + "loss": 0.0107, + "step": 558900 + }, + { + "epoch": 1.45, + "learning_rate": 8.268369878246984e-05, + "loss": 0.0125, + "step": 558910 + }, + { + "epoch": 1.45, + "learning_rate": 8.267981056609838e-05, + "loss": 0.0083, + "step": 558920 + }, + { + "epoch": 1.45, + "learning_rate": 8.267592234972691e-05, + "loss": 0.0097, + "step": 558930 + }, + { + "epoch": 1.45, + "learning_rate": 8.267203413335545e-05, + "loss": 0.0075, + "step": 558940 + }, + { + "epoch": 1.45, + "learning_rate": 8.266814591698398e-05, + "loss": 0.0075, + "step": 558950 + }, + { + "epoch": 1.45, + "learning_rate": 8.266425770061252e-05, + "loss": 0.0088, + "step": 558960 + }, + { + "epoch": 1.45, + "learning_rate": 8.266036948424105e-05, + "loss": 0.0107, + "step": 558970 + }, + { + "epoch": 1.45, + "learning_rate": 8.26564812678696e-05, + "loss": 0.0105, + "step": 558980 + }, + { + "epoch": 1.45, + "learning_rate": 8.265259305149812e-05, + "loss": 0.0092, + "step": 558990 + }, + { + "epoch": 1.45, + "learning_rate": 8.264870483512665e-05, + "loss": 0.0097, + "step": 559000 + }, + { + "epoch": 1.45, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.005990092176944017, + "eval_runtime": 107.8601, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 559000 + }, + { + "epoch": 1.45, + "learning_rate": 8.264481661875519e-05, + "loss": 0.0109, + "step": 559010 + }, + { + "epoch": 1.45, + "learning_rate": 8.264092840238372e-05, + "loss": 0.009, + "step": 559020 + }, + { + "epoch": 1.45, + "learning_rate": 8.263704018601226e-05, + "loss": 0.0098, + "step": 559030 + }, + { + "epoch": 1.45, + "learning_rate": 8.263315196964079e-05, + "loss": 0.0119, + "step": 559040 + }, + { + "epoch": 1.45, + "learning_rate": 8.262926375326933e-05, + "loss": 0.0159, + "step": 559050 + }, + { + "epoch": 1.45, + "learning_rate": 8.262537553689786e-05, + "loss": 0.0093, + "step": 559060 + }, + { + "epoch": 1.45, + "learning_rate": 8.262148732052641e-05, + "loss": 0.0106, + "step": 559070 + }, + { + "epoch": 1.45, + "learning_rate": 8.261759910415493e-05, + "loss": 0.0107, + "step": 559080 + }, + { + "epoch": 1.45, + "learning_rate": 8.261371088778348e-05, + "loss": 0.0071, + "step": 559090 + }, + { + "epoch": 1.45, + "learning_rate": 8.260982267141201e-05, + "loss": 0.0106, + "step": 559100 + }, + { + "epoch": 1.45, + "learning_rate": 8.260593445504055e-05, + "loss": 0.0113, + "step": 559110 + }, + { + "epoch": 1.45, + "learning_rate": 8.260204623866908e-05, + "loss": 0.0095, + "step": 559120 + }, + { + "epoch": 1.45, + "learning_rate": 8.259815802229762e-05, + "loss": 0.0113, + "step": 559130 + }, + { + "epoch": 1.45, + "learning_rate": 8.259426980592615e-05, + "loss": 0.0076, + "step": 559140 + }, + { + "epoch": 1.45, + "learning_rate": 8.25903815895547e-05, + "loss": 0.008, + "step": 559150 + }, + { + "epoch": 1.45, + "learning_rate": 8.258649337318322e-05, + "loss": 0.0144, + "step": 559160 + }, + { + "epoch": 1.45, + "learning_rate": 8.258260515681176e-05, + "loss": 0.0069, + "step": 559170 + }, + { + "epoch": 1.45, + "learning_rate": 8.257871694044029e-05, + "loss": 0.0134, + "step": 559180 + }, + { + "epoch": 1.45, + "learning_rate": 8.257482872406883e-05, + "loss": 0.0075, + "step": 559190 + }, + { + "epoch": 1.45, + "learning_rate": 8.257094050769736e-05, + "loss": 0.0177, + "step": 559200 + }, + { + "epoch": 1.45, + "learning_rate": 8.25670522913259e-05, + "loss": 0.0109, + "step": 559210 + }, + { + "epoch": 1.45, + "learning_rate": 8.256316407495443e-05, + "loss": 0.0099, + "step": 559220 + }, + { + "epoch": 1.45, + "learning_rate": 8.255927585858299e-05, + "loss": 0.0108, + "step": 559230 + }, + { + "epoch": 1.45, + "learning_rate": 8.25553876422115e-05, + "loss": 0.0128, + "step": 559240 + }, + { + "epoch": 1.45, + "learning_rate": 8.255149942584003e-05, + "loss": 0.0115, + "step": 559250 + }, + { + "epoch": 1.45, + "learning_rate": 8.254761120946858e-05, + "loss": 0.0088, + "step": 559260 + }, + { + "epoch": 1.45, + "learning_rate": 8.254372299309711e-05, + "loss": 0.0087, + "step": 559270 + }, + { + "epoch": 1.45, + "learning_rate": 8.253983477672565e-05, + "loss": 0.0082, + "step": 559280 + }, + { + "epoch": 1.45, + "learning_rate": 8.253594656035418e-05, + "loss": 0.0082, + "step": 559290 + }, + { + "epoch": 1.45, + "learning_rate": 8.253205834398272e-05, + "loss": 0.0085, + "step": 559300 + }, + { + "epoch": 1.45, + "learning_rate": 8.252817012761125e-05, + "loss": 0.0066, + "step": 559310 + }, + { + "epoch": 1.45, + "learning_rate": 8.252428191123979e-05, + "loss": 0.0076, + "step": 559320 + }, + { + "epoch": 1.45, + "learning_rate": 8.252039369486832e-05, + "loss": 0.0104, + "step": 559330 + }, + { + "epoch": 1.45, + "learning_rate": 8.251650547849686e-05, + "loss": 0.0077, + "step": 559340 + }, + { + "epoch": 1.45, + "learning_rate": 8.251261726212539e-05, + "loss": 0.0102, + "step": 559350 + }, + { + "epoch": 1.45, + "learning_rate": 8.250872904575393e-05, + "loss": 0.0128, + "step": 559360 + }, + { + "epoch": 1.45, + "learning_rate": 8.250484082938246e-05, + "loss": 0.0078, + "step": 559370 + }, + { + "epoch": 1.45, + "learning_rate": 8.2500952613011e-05, + "loss": 0.0086, + "step": 559380 + }, + { + "epoch": 1.45, + "learning_rate": 8.249706439663953e-05, + "loss": 0.0079, + "step": 559390 + }, + { + "epoch": 1.45, + "learning_rate": 8.249317618026807e-05, + "loss": 0.008, + "step": 559400 + }, + { + "epoch": 1.45, + "learning_rate": 8.24892879638966e-05, + "loss": 0.0116, + "step": 559410 + }, + { + "epoch": 1.45, + "learning_rate": 8.248539974752516e-05, + "loss": 0.0104, + "step": 559420 + }, + { + "epoch": 1.45, + "learning_rate": 8.248151153115368e-05, + "loss": 0.0084, + "step": 559430 + }, + { + "epoch": 1.45, + "learning_rate": 8.247762331478222e-05, + "loss": 0.0124, + "step": 559440 + }, + { + "epoch": 1.45, + "learning_rate": 8.247373509841075e-05, + "loss": 0.0099, + "step": 559450 + }, + { + "epoch": 1.45, + "learning_rate": 8.24698468820393e-05, + "loss": 0.0088, + "step": 559460 + }, + { + "epoch": 1.45, + "learning_rate": 8.246595866566782e-05, + "loss": 0.0088, + "step": 559470 + }, + { + "epoch": 1.45, + "learning_rate": 8.246207044929636e-05, + "loss": 0.0095, + "step": 559480 + }, + { + "epoch": 1.45, + "learning_rate": 8.245818223292489e-05, + "loss": 0.0086, + "step": 559490 + }, + { + "epoch": 1.45, + "learning_rate": 8.245429401655342e-05, + "loss": 0.0097, + "step": 559500 + }, + { + "epoch": 1.45, + "learning_rate": 8.245040580018196e-05, + "loss": 0.009, + "step": 559510 + }, + { + "epoch": 1.45, + "learning_rate": 8.244651758381049e-05, + "loss": 0.0099, + "step": 559520 + }, + { + "epoch": 1.45, + "learning_rate": 8.244262936743903e-05, + "loss": 0.0089, + "step": 559530 + }, + { + "epoch": 1.45, + "learning_rate": 8.243874115106756e-05, + "loss": 0.0107, + "step": 559540 + }, + { + "epoch": 1.45, + "learning_rate": 8.24348529346961e-05, + "loss": 0.0093, + "step": 559550 + }, + { + "epoch": 1.45, + "learning_rate": 8.243096471832463e-05, + "loss": 0.0132, + "step": 559560 + }, + { + "epoch": 1.45, + "learning_rate": 8.242707650195317e-05, + "loss": 0.009, + "step": 559570 + }, + { + "epoch": 1.45, + "learning_rate": 8.24231882855817e-05, + "loss": 0.0111, + "step": 559580 + }, + { + "epoch": 1.45, + "learning_rate": 8.241930006921025e-05, + "loss": 0.009, + "step": 559590 + }, + { + "epoch": 1.45, + "learning_rate": 8.241541185283877e-05, + "loss": 0.0088, + "step": 559600 + }, + { + "epoch": 1.45, + "learning_rate": 8.241152363646732e-05, + "loss": 0.0089, + "step": 559610 + }, + { + "epoch": 1.45, + "learning_rate": 8.240763542009585e-05, + "loss": 0.0088, + "step": 559620 + }, + { + "epoch": 1.45, + "learning_rate": 8.24037472037244e-05, + "loss": 0.011, + "step": 559630 + }, + { + "epoch": 1.45, + "learning_rate": 8.239985898735292e-05, + "loss": 0.011, + "step": 559640 + }, + { + "epoch": 1.45, + "learning_rate": 8.239597077098146e-05, + "loss": 0.0095, + "step": 559650 + }, + { + "epoch": 1.45, + "learning_rate": 8.239208255460999e-05, + "loss": 0.0096, + "step": 559660 + }, + { + "epoch": 1.45, + "learning_rate": 8.238819433823853e-05, + "loss": 0.0095, + "step": 559670 + }, + { + "epoch": 1.45, + "learning_rate": 8.238430612186706e-05, + "loss": 0.0077, + "step": 559680 + }, + { + "epoch": 1.45, + "learning_rate": 8.23804179054956e-05, + "loss": 0.0078, + "step": 559690 + }, + { + "epoch": 1.45, + "learning_rate": 8.237652968912413e-05, + "loss": 0.0113, + "step": 559700 + }, + { + "epoch": 1.45, + "learning_rate": 8.237264147275267e-05, + "loss": 0.0083, + "step": 559710 + }, + { + "epoch": 1.45, + "learning_rate": 8.23687532563812e-05, + "loss": 0.0088, + "step": 559720 + }, + { + "epoch": 1.45, + "learning_rate": 8.236486504000973e-05, + "loss": 0.0079, + "step": 559730 + }, + { + "epoch": 1.45, + "learning_rate": 8.236097682363827e-05, + "loss": 0.0086, + "step": 559740 + }, + { + "epoch": 1.45, + "learning_rate": 8.23570886072668e-05, + "loss": 0.0098, + "step": 559750 + }, + { + "epoch": 1.45, + "learning_rate": 8.235320039089534e-05, + "loss": 0.0072, + "step": 559760 + }, + { + "epoch": 1.45, + "learning_rate": 8.234931217452387e-05, + "loss": 0.0094, + "step": 559770 + }, + { + "epoch": 1.45, + "learning_rate": 8.234542395815242e-05, + "loss": 0.0079, + "step": 559780 + }, + { + "epoch": 1.45, + "learning_rate": 8.234153574178095e-05, + "loss": 0.0108, + "step": 559790 + }, + { + "epoch": 1.45, + "learning_rate": 8.23376475254095e-05, + "loss": 0.0085, + "step": 559800 + }, + { + "epoch": 1.45, + "learning_rate": 8.233375930903802e-05, + "loss": 0.0108, + "step": 559810 + }, + { + "epoch": 1.45, + "learning_rate": 8.232987109266656e-05, + "loss": 0.0079, + "step": 559820 + }, + { + "epoch": 1.45, + "learning_rate": 8.232598287629509e-05, + "loss": 0.0085, + "step": 559830 + }, + { + "epoch": 1.45, + "learning_rate": 8.232209465992363e-05, + "loss": 0.0118, + "step": 559840 + }, + { + "epoch": 1.45, + "learning_rate": 8.231820644355216e-05, + "loss": 0.01, + "step": 559850 + }, + { + "epoch": 1.45, + "learning_rate": 8.23143182271807e-05, + "loss": 0.0128, + "step": 559860 + }, + { + "epoch": 1.45, + "learning_rate": 8.231043001080923e-05, + "loss": 0.0101, + "step": 559870 + }, + { + "epoch": 1.45, + "learning_rate": 8.230654179443777e-05, + "loss": 0.0094, + "step": 559880 + }, + { + "epoch": 1.45, + "learning_rate": 8.23026535780663e-05, + "loss": 0.0089, + "step": 559890 + }, + { + "epoch": 1.45, + "learning_rate": 8.229876536169484e-05, + "loss": 0.0091, + "step": 559900 + }, + { + "epoch": 1.45, + "learning_rate": 8.229487714532337e-05, + "loss": 0.0098, + "step": 559910 + }, + { + "epoch": 1.45, + "learning_rate": 8.229098892895191e-05, + "loss": 0.0104, + "step": 559920 + }, + { + "epoch": 1.45, + "learning_rate": 8.228710071258044e-05, + "loss": 0.0096, + "step": 559930 + }, + { + "epoch": 1.45, + "learning_rate": 8.2283212496209e-05, + "loss": 0.0087, + "step": 559940 + }, + { + "epoch": 1.45, + "learning_rate": 8.227932427983751e-05, + "loss": 0.0107, + "step": 559950 + }, + { + "epoch": 1.45, + "learning_rate": 8.227543606346606e-05, + "loss": 0.0071, + "step": 559960 + }, + { + "epoch": 1.45, + "learning_rate": 8.227154784709459e-05, + "loss": 0.009, + "step": 559970 + }, + { + "epoch": 1.45, + "learning_rate": 8.226765963072312e-05, + "loss": 0.0095, + "step": 559980 + }, + { + "epoch": 1.45, + "learning_rate": 8.226377141435166e-05, + "loss": 0.0098, + "step": 559990 + }, + { + "epoch": 1.45, + "learning_rate": 8.225988319798019e-05, + "loss": 0.0105, + "step": 560000 + }, + { + "epoch": 1.45, + "eval_cer": 0.881688689953826, + "eval_loss": 0.00610503600910306, + "eval_runtime": 108.0797, + "eval_samples_per_second": 18.505, + "eval_steps_per_second": 4.626, + "step": 560000 + }, + { + "epoch": 1.45, + "learning_rate": 8.225599498160873e-05, + "loss": 0.0116, + "step": 560010 + }, + { + "epoch": 1.45, + "learning_rate": 8.225210676523726e-05, + "loss": 0.0078, + "step": 560020 + }, + { + "epoch": 1.45, + "learning_rate": 8.22482185488658e-05, + "loss": 0.0082, + "step": 560030 + }, + { + "epoch": 1.45, + "learning_rate": 8.224433033249433e-05, + "loss": 0.0109, + "step": 560040 + }, + { + "epoch": 1.45, + "learning_rate": 8.224044211612287e-05, + "loss": 0.0103, + "step": 560050 + }, + { + "epoch": 1.45, + "learning_rate": 8.22365538997514e-05, + "loss": 0.0057, + "step": 560060 + }, + { + "epoch": 1.45, + "learning_rate": 8.223266568337994e-05, + "loss": 0.0099, + "step": 560070 + }, + { + "epoch": 1.45, + "learning_rate": 8.222877746700847e-05, + "loss": 0.0079, + "step": 560080 + }, + { + "epoch": 1.45, + "learning_rate": 8.222488925063701e-05, + "loss": 0.0088, + "step": 560090 + }, + { + "epoch": 1.45, + "learning_rate": 8.222100103426554e-05, + "loss": 0.0078, + "step": 560100 + }, + { + "epoch": 1.45, + "learning_rate": 8.221711281789408e-05, + "loss": 0.0098, + "step": 560110 + }, + { + "epoch": 1.45, + "learning_rate": 8.221322460152261e-05, + "loss": 0.0107, + "step": 560120 + }, + { + "epoch": 1.45, + "learning_rate": 8.220933638515116e-05, + "loss": 0.0105, + "step": 560130 + }, + { + "epoch": 1.45, + "learning_rate": 8.220544816877969e-05, + "loss": 0.0106, + "step": 560140 + }, + { + "epoch": 1.45, + "learning_rate": 8.220155995240823e-05, + "loss": 0.0103, + "step": 560150 + }, + { + "epoch": 1.45, + "learning_rate": 8.219767173603676e-05, + "loss": 0.0081, + "step": 560160 + }, + { + "epoch": 1.45, + "learning_rate": 8.21937835196653e-05, + "loss": 0.009, + "step": 560170 + }, + { + "epoch": 1.45, + "learning_rate": 8.218989530329383e-05, + "loss": 0.0063, + "step": 560180 + }, + { + "epoch": 1.45, + "learning_rate": 8.218600708692237e-05, + "loss": 0.0121, + "step": 560190 + }, + { + "epoch": 1.45, + "learning_rate": 8.21821188705509e-05, + "loss": 0.0086, + "step": 560200 + }, + { + "epoch": 1.45, + "learning_rate": 8.217823065417944e-05, + "loss": 0.0115, + "step": 560210 + }, + { + "epoch": 1.45, + "learning_rate": 8.217434243780797e-05, + "loss": 0.0084, + "step": 560220 + }, + { + "epoch": 1.45, + "learning_rate": 8.21704542214365e-05, + "loss": 0.009, + "step": 560230 + }, + { + "epoch": 1.45, + "learning_rate": 8.216656600506504e-05, + "loss": 0.0128, + "step": 560240 + }, + { + "epoch": 1.45, + "learning_rate": 8.216267778869357e-05, + "loss": 0.0099, + "step": 560250 + }, + { + "epoch": 1.45, + "learning_rate": 8.215878957232211e-05, + "loss": 0.0088, + "step": 560260 + }, + { + "epoch": 1.45, + "learning_rate": 8.215490135595064e-05, + "loss": 0.0101, + "step": 560270 + }, + { + "epoch": 1.45, + "learning_rate": 8.215101313957918e-05, + "loss": 0.0115, + "step": 560280 + }, + { + "epoch": 1.45, + "learning_rate": 8.214712492320771e-05, + "loss": 0.0094, + "step": 560290 + }, + { + "epoch": 1.45, + "learning_rate": 8.214323670683626e-05, + "loss": 0.0092, + "step": 560300 + }, + { + "epoch": 1.45, + "learning_rate": 8.213934849046478e-05, + "loss": 0.0084, + "step": 560310 + }, + { + "epoch": 1.45, + "learning_rate": 8.213546027409333e-05, + "loss": 0.0128, + "step": 560320 + }, + { + "epoch": 1.45, + "learning_rate": 8.213157205772186e-05, + "loss": 0.0086, + "step": 560330 + }, + { + "epoch": 1.45, + "learning_rate": 8.21276838413504e-05, + "loss": 0.0118, + "step": 560340 + }, + { + "epoch": 1.45, + "learning_rate": 8.212379562497893e-05, + "loss": 0.0113, + "step": 560350 + }, + { + "epoch": 1.45, + "learning_rate": 8.211990740860747e-05, + "loss": 0.0081, + "step": 560360 + }, + { + "epoch": 1.45, + "learning_rate": 8.2116019192236e-05, + "loss": 0.0072, + "step": 560370 + }, + { + "epoch": 1.45, + "learning_rate": 8.211213097586454e-05, + "loss": 0.0073, + "step": 560380 + }, + { + "epoch": 1.45, + "learning_rate": 8.210824275949307e-05, + "loss": 0.0091, + "step": 560390 + }, + { + "epoch": 1.45, + "learning_rate": 8.210435454312161e-05, + "loss": 0.0081, + "step": 560400 + }, + { + "epoch": 1.45, + "learning_rate": 8.210046632675014e-05, + "loss": 0.0091, + "step": 560410 + }, + { + "epoch": 1.45, + "learning_rate": 8.209657811037868e-05, + "loss": 0.0082, + "step": 560420 + }, + { + "epoch": 1.45, + "learning_rate": 8.209268989400721e-05, + "loss": 0.0076, + "step": 560430 + }, + { + "epoch": 1.45, + "learning_rate": 8.208880167763575e-05, + "loss": 0.0092, + "step": 560440 + }, + { + "epoch": 1.45, + "learning_rate": 8.208491346126428e-05, + "loss": 0.0078, + "step": 560450 + }, + { + "epoch": 1.45, + "learning_rate": 8.208102524489283e-05, + "loss": 0.0094, + "step": 560460 + }, + { + "epoch": 1.45, + "learning_rate": 8.207713702852135e-05, + "loss": 0.0074, + "step": 560470 + }, + { + "epoch": 1.45, + "learning_rate": 8.207324881214988e-05, + "loss": 0.0075, + "step": 560480 + }, + { + "epoch": 1.45, + "learning_rate": 8.206936059577843e-05, + "loss": 0.0066, + "step": 560490 + }, + { + "epoch": 1.45, + "learning_rate": 8.206547237940696e-05, + "loss": 0.0115, + "step": 560500 + }, + { + "epoch": 1.45, + "learning_rate": 8.20615841630355e-05, + "loss": 0.0102, + "step": 560510 + }, + { + "epoch": 1.45, + "learning_rate": 8.205769594666403e-05, + "loss": 0.0096, + "step": 560520 + }, + { + "epoch": 1.45, + "learning_rate": 8.205380773029257e-05, + "loss": 0.0088, + "step": 560530 + }, + { + "epoch": 1.45, + "learning_rate": 8.20499195139211e-05, + "loss": 0.0093, + "step": 560540 + }, + { + "epoch": 1.45, + "learning_rate": 8.204603129754964e-05, + "loss": 0.0091, + "step": 560550 + }, + { + "epoch": 1.45, + "learning_rate": 8.204214308117817e-05, + "loss": 0.0073, + "step": 560560 + }, + { + "epoch": 1.45, + "learning_rate": 8.203825486480671e-05, + "loss": 0.0084, + "step": 560570 + }, + { + "epoch": 1.45, + "learning_rate": 8.203436664843524e-05, + "loss": 0.0087, + "step": 560580 + }, + { + "epoch": 1.45, + "learning_rate": 8.203047843206378e-05, + "loss": 0.0111, + "step": 560590 + }, + { + "epoch": 1.45, + "learning_rate": 8.202659021569231e-05, + "loss": 0.0097, + "step": 560600 + }, + { + "epoch": 1.45, + "learning_rate": 8.202270199932085e-05, + "loss": 0.0114, + "step": 560610 + }, + { + "epoch": 1.45, + "learning_rate": 8.201881378294938e-05, + "loss": 0.0099, + "step": 560620 + }, + { + "epoch": 1.45, + "learning_rate": 8.201492556657792e-05, + "loss": 0.009, + "step": 560630 + }, + { + "epoch": 1.45, + "learning_rate": 8.201103735020645e-05, + "loss": 0.0083, + "step": 560640 + }, + { + "epoch": 1.45, + "learning_rate": 8.2007149133835e-05, + "loss": 0.0115, + "step": 560650 + }, + { + "epoch": 1.45, + "learning_rate": 8.200326091746353e-05, + "loss": 0.0107, + "step": 560660 + }, + { + "epoch": 1.45, + "learning_rate": 8.199937270109207e-05, + "loss": 0.0104, + "step": 560670 + }, + { + "epoch": 1.45, + "learning_rate": 8.19954844847206e-05, + "loss": 0.0107, + "step": 560680 + }, + { + "epoch": 1.45, + "learning_rate": 8.199159626834914e-05, + "loss": 0.0084, + "step": 560690 + }, + { + "epoch": 1.45, + "learning_rate": 8.198770805197767e-05, + "loss": 0.0106, + "step": 560700 + }, + { + "epoch": 1.45, + "learning_rate": 8.198381983560621e-05, + "loss": 0.0081, + "step": 560710 + }, + { + "epoch": 1.45, + "learning_rate": 8.197993161923474e-05, + "loss": 0.0105, + "step": 560720 + }, + { + "epoch": 1.45, + "learning_rate": 8.197604340286327e-05, + "loss": 0.0095, + "step": 560730 + }, + { + "epoch": 1.45, + "learning_rate": 8.197215518649181e-05, + "loss": 0.0093, + "step": 560740 + }, + { + "epoch": 1.45, + "learning_rate": 8.196826697012034e-05, + "loss": 0.0103, + "step": 560750 + }, + { + "epoch": 1.45, + "learning_rate": 8.196437875374888e-05, + "loss": 0.011, + "step": 560760 + }, + { + "epoch": 1.45, + "learning_rate": 8.196049053737741e-05, + "loss": 0.0069, + "step": 560770 + }, + { + "epoch": 1.45, + "learning_rate": 8.195660232100595e-05, + "loss": 0.008, + "step": 560780 + }, + { + "epoch": 1.45, + "learning_rate": 8.195271410463448e-05, + "loss": 0.0103, + "step": 560790 + }, + { + "epoch": 1.45, + "learning_rate": 8.194882588826302e-05, + "loss": 0.0089, + "step": 560800 + }, + { + "epoch": 1.45, + "learning_rate": 8.194493767189155e-05, + "loss": 0.0082, + "step": 560810 + }, + { + "epoch": 1.45, + "learning_rate": 8.19410494555201e-05, + "loss": 0.0094, + "step": 560820 + }, + { + "epoch": 1.45, + "learning_rate": 8.193716123914862e-05, + "loss": 0.0105, + "step": 560830 + }, + { + "epoch": 1.45, + "learning_rate": 8.193327302277717e-05, + "loss": 0.0094, + "step": 560840 + }, + { + "epoch": 1.45, + "learning_rate": 8.19293848064057e-05, + "loss": 0.0083, + "step": 560850 + }, + { + "epoch": 1.45, + "learning_rate": 8.192549659003424e-05, + "loss": 0.0086, + "step": 560860 + }, + { + "epoch": 1.45, + "learning_rate": 8.192160837366277e-05, + "loss": 0.0074, + "step": 560870 + }, + { + "epoch": 1.45, + "learning_rate": 8.191772015729131e-05, + "loss": 0.0088, + "step": 560880 + }, + { + "epoch": 1.45, + "learning_rate": 8.191383194091984e-05, + "loss": 0.0111, + "step": 560890 + }, + { + "epoch": 1.45, + "learning_rate": 8.190994372454838e-05, + "loss": 0.0079, + "step": 560900 + }, + { + "epoch": 1.45, + "learning_rate": 8.190605550817691e-05, + "loss": 0.0077, + "step": 560910 + }, + { + "epoch": 1.45, + "learning_rate": 8.190216729180545e-05, + "loss": 0.0104, + "step": 560920 + }, + { + "epoch": 1.45, + "learning_rate": 8.189827907543398e-05, + "loss": 0.0107, + "step": 560930 + }, + { + "epoch": 1.45, + "learning_rate": 8.189439085906252e-05, + "loss": 0.0076, + "step": 560940 + }, + { + "epoch": 1.45, + "learning_rate": 8.189050264269105e-05, + "loss": 0.0085, + "step": 560950 + }, + { + "epoch": 1.45, + "learning_rate": 8.188661442631959e-05, + "loss": 0.009, + "step": 560960 + }, + { + "epoch": 1.45, + "learning_rate": 8.188272620994812e-05, + "loss": 0.0067, + "step": 560970 + }, + { + "epoch": 1.45, + "learning_rate": 8.187883799357665e-05, + "loss": 0.0079, + "step": 560980 + }, + { + "epoch": 1.45, + "learning_rate": 8.187494977720519e-05, + "loss": 0.0074, + "step": 560990 + }, + { + "epoch": 1.45, + "learning_rate": 8.187106156083372e-05, + "loss": 0.0194, + "step": 561000 + }, + { + "epoch": 1.45, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.00594002241268754, + "eval_runtime": 107.9686, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 561000 + }, + { + "epoch": 1.45, + "learning_rate": 8.186717334446227e-05, + "loss": 0.0074, + "step": 561010 + }, + { + "epoch": 1.45, + "learning_rate": 8.18632851280908e-05, + "loss": 0.0106, + "step": 561020 + }, + { + "epoch": 1.45, + "learning_rate": 8.185939691171934e-05, + "loss": 0.0109, + "step": 561030 + }, + { + "epoch": 1.45, + "learning_rate": 8.185550869534787e-05, + "loss": 0.0063, + "step": 561040 + }, + { + "epoch": 1.45, + "learning_rate": 8.185162047897641e-05, + "loss": 0.008, + "step": 561050 + }, + { + "epoch": 1.45, + "learning_rate": 8.184773226260494e-05, + "loss": 0.0083, + "step": 561060 + }, + { + "epoch": 1.45, + "learning_rate": 8.184384404623348e-05, + "loss": 0.0096, + "step": 561070 + }, + { + "epoch": 1.45, + "learning_rate": 8.183995582986201e-05, + "loss": 0.0106, + "step": 561080 + }, + { + "epoch": 1.45, + "learning_rate": 8.183606761349055e-05, + "loss": 0.0096, + "step": 561090 + }, + { + "epoch": 1.45, + "learning_rate": 8.183217939711908e-05, + "loss": 0.0086, + "step": 561100 + }, + { + "epoch": 1.45, + "learning_rate": 8.182829118074762e-05, + "loss": 0.0075, + "step": 561110 + }, + { + "epoch": 1.45, + "learning_rate": 8.182440296437615e-05, + "loss": 0.0101, + "step": 561120 + }, + { + "epoch": 1.45, + "learning_rate": 8.182051474800469e-05, + "loss": 0.0092, + "step": 561130 + }, + { + "epoch": 1.45, + "learning_rate": 8.181662653163322e-05, + "loss": 0.012, + "step": 561140 + }, + { + "epoch": 1.45, + "learning_rate": 8.181273831526176e-05, + "loss": 0.008, + "step": 561150 + }, + { + "epoch": 1.45, + "learning_rate": 8.180885009889029e-05, + "loss": 0.0093, + "step": 561160 + }, + { + "epoch": 1.45, + "learning_rate": 8.180496188251884e-05, + "loss": 0.0136, + "step": 561170 + }, + { + "epoch": 1.45, + "learning_rate": 8.180107366614737e-05, + "loss": 0.0093, + "step": 561180 + }, + { + "epoch": 1.45, + "learning_rate": 8.179718544977591e-05, + "loss": 0.0114, + "step": 561190 + }, + { + "epoch": 1.45, + "learning_rate": 8.179329723340444e-05, + "loss": 0.0107, + "step": 561200 + }, + { + "epoch": 1.45, + "learning_rate": 8.178940901703298e-05, + "loss": 0.0112, + "step": 561210 + }, + { + "epoch": 1.45, + "learning_rate": 8.178552080066151e-05, + "loss": 0.0106, + "step": 561220 + }, + { + "epoch": 1.45, + "learning_rate": 8.178163258429004e-05, + "loss": 0.0086, + "step": 561230 + }, + { + "epoch": 1.45, + "learning_rate": 8.177774436791858e-05, + "loss": 0.0062, + "step": 561240 + }, + { + "epoch": 1.45, + "learning_rate": 8.177385615154711e-05, + "loss": 0.0086, + "step": 561250 + }, + { + "epoch": 1.45, + "learning_rate": 8.176996793517565e-05, + "loss": 0.0074, + "step": 561260 + }, + { + "epoch": 1.45, + "learning_rate": 8.176607971880418e-05, + "loss": 0.0098, + "step": 561270 + }, + { + "epoch": 1.45, + "learning_rate": 8.176219150243272e-05, + "loss": 0.0074, + "step": 561280 + }, + { + "epoch": 1.45, + "learning_rate": 8.175830328606125e-05, + "loss": 0.0121, + "step": 561290 + }, + { + "epoch": 1.45, + "learning_rate": 8.175441506968979e-05, + "loss": 0.0135, + "step": 561300 + }, + { + "epoch": 1.45, + "learning_rate": 8.175052685331832e-05, + "loss": 0.0101, + "step": 561310 + }, + { + "epoch": 1.46, + "learning_rate": 8.174663863694686e-05, + "loss": 0.0126, + "step": 561320 + }, + { + "epoch": 1.46, + "learning_rate": 8.174275042057539e-05, + "loss": 0.0063, + "step": 561330 + }, + { + "epoch": 1.46, + "learning_rate": 8.173886220420393e-05, + "loss": 0.0092, + "step": 561340 + }, + { + "epoch": 1.46, + "learning_rate": 8.173497398783246e-05, + "loss": 0.0087, + "step": 561350 + }, + { + "epoch": 1.46, + "learning_rate": 8.173108577146101e-05, + "loss": 0.0073, + "step": 561360 + }, + { + "epoch": 1.46, + "learning_rate": 8.172719755508954e-05, + "loss": 0.0085, + "step": 561370 + }, + { + "epoch": 1.46, + "learning_rate": 8.172330933871808e-05, + "loss": 0.0089, + "step": 561380 + }, + { + "epoch": 1.46, + "learning_rate": 8.171942112234661e-05, + "loss": 0.0107, + "step": 561390 + }, + { + "epoch": 1.46, + "learning_rate": 8.171553290597515e-05, + "loss": 0.0146, + "step": 561400 + }, + { + "epoch": 1.46, + "learning_rate": 8.171164468960368e-05, + "loss": 0.0086, + "step": 561410 + }, + { + "epoch": 1.46, + "learning_rate": 8.170775647323222e-05, + "loss": 0.0075, + "step": 561420 + }, + { + "epoch": 1.46, + "learning_rate": 8.170386825686075e-05, + "loss": 0.0081, + "step": 561430 + }, + { + "epoch": 1.46, + "learning_rate": 8.169998004048929e-05, + "loss": 0.0096, + "step": 561440 + }, + { + "epoch": 1.46, + "learning_rate": 8.169609182411782e-05, + "loss": 0.0075, + "step": 561450 + }, + { + "epoch": 1.46, + "learning_rate": 8.169220360774636e-05, + "loss": 0.0101, + "step": 561460 + }, + { + "epoch": 1.46, + "learning_rate": 8.168831539137489e-05, + "loss": 0.0119, + "step": 561470 + }, + { + "epoch": 1.46, + "learning_rate": 8.168442717500342e-05, + "loss": 0.0105, + "step": 561480 + }, + { + "epoch": 1.46, + "learning_rate": 8.168053895863196e-05, + "loss": 0.0104, + "step": 561490 + }, + { + "epoch": 1.46, + "learning_rate": 8.167665074226049e-05, + "loss": 0.008, + "step": 561500 + }, + { + "epoch": 1.46, + "learning_rate": 8.167276252588903e-05, + "loss": 0.0084, + "step": 561510 + }, + { + "epoch": 1.46, + "learning_rate": 8.166887430951756e-05, + "loss": 0.0099, + "step": 561520 + }, + { + "epoch": 1.46, + "learning_rate": 8.166498609314611e-05, + "loss": 0.0104, + "step": 561530 + }, + { + "epoch": 1.46, + "learning_rate": 8.166109787677463e-05, + "loss": 0.0078, + "step": 561540 + }, + { + "epoch": 1.46, + "learning_rate": 8.165720966040318e-05, + "loss": 0.011, + "step": 561550 + }, + { + "epoch": 1.46, + "learning_rate": 8.165332144403171e-05, + "loss": 0.0093, + "step": 561560 + }, + { + "epoch": 1.46, + "learning_rate": 8.164943322766025e-05, + "loss": 0.0068, + "step": 561570 + }, + { + "epoch": 1.46, + "learning_rate": 8.164554501128878e-05, + "loss": 0.0086, + "step": 561580 + }, + { + "epoch": 1.46, + "learning_rate": 8.164165679491732e-05, + "loss": 0.0099, + "step": 561590 + }, + { + "epoch": 1.46, + "learning_rate": 8.163776857854585e-05, + "loss": 0.0109, + "step": 561600 + }, + { + "epoch": 1.46, + "learning_rate": 8.163388036217439e-05, + "loss": 0.0092, + "step": 561610 + }, + { + "epoch": 1.46, + "learning_rate": 8.162999214580292e-05, + "loss": 0.008, + "step": 561620 + }, + { + "epoch": 1.46, + "learning_rate": 8.162610392943146e-05, + "loss": 0.0091, + "step": 561630 + }, + { + "epoch": 1.46, + "learning_rate": 8.162221571305999e-05, + "loss": 0.0093, + "step": 561640 + }, + { + "epoch": 1.46, + "learning_rate": 8.161832749668853e-05, + "loss": 0.0085, + "step": 561650 + }, + { + "epoch": 1.46, + "learning_rate": 8.161443928031706e-05, + "loss": 0.0091, + "step": 561660 + }, + { + "epoch": 1.46, + "learning_rate": 8.16105510639456e-05, + "loss": 0.0098, + "step": 561670 + }, + { + "epoch": 1.46, + "learning_rate": 8.160666284757413e-05, + "loss": 0.0097, + "step": 561680 + }, + { + "epoch": 1.46, + "learning_rate": 8.160277463120268e-05, + "loss": 0.0097, + "step": 561690 + }, + { + "epoch": 1.46, + "learning_rate": 8.15988864148312e-05, + "loss": 0.0083, + "step": 561700 + }, + { + "epoch": 1.46, + "learning_rate": 8.159499819845975e-05, + "loss": 0.0099, + "step": 561710 + }, + { + "epoch": 1.46, + "learning_rate": 8.159110998208828e-05, + "loss": 0.0057, + "step": 561720 + }, + { + "epoch": 1.46, + "learning_rate": 8.158722176571681e-05, + "loss": 0.0095, + "step": 561730 + }, + { + "epoch": 1.46, + "learning_rate": 8.158333354934535e-05, + "loss": 0.0082, + "step": 561740 + }, + { + "epoch": 1.46, + "learning_rate": 8.157944533297388e-05, + "loss": 0.0157, + "step": 561750 + }, + { + "epoch": 1.46, + "learning_rate": 8.157555711660242e-05, + "loss": 0.0084, + "step": 561760 + }, + { + "epoch": 1.46, + "learning_rate": 8.157166890023095e-05, + "loss": 0.0089, + "step": 561770 + }, + { + "epoch": 1.46, + "learning_rate": 8.156778068385949e-05, + "loss": 0.0119, + "step": 561780 + }, + { + "epoch": 1.46, + "learning_rate": 8.156389246748802e-05, + "loss": 0.0085, + "step": 561790 + }, + { + "epoch": 1.46, + "learning_rate": 8.156000425111656e-05, + "loss": 0.0094, + "step": 561800 + }, + { + "epoch": 1.46, + "learning_rate": 8.155611603474509e-05, + "loss": 0.01, + "step": 561810 + }, + { + "epoch": 1.46, + "learning_rate": 8.155222781837363e-05, + "loss": 0.0145, + "step": 561820 + }, + { + "epoch": 1.46, + "learning_rate": 8.154833960200216e-05, + "loss": 0.0123, + "step": 561830 + }, + { + "epoch": 1.46, + "learning_rate": 8.15444513856307e-05, + "loss": 0.0089, + "step": 561840 + }, + { + "epoch": 1.46, + "learning_rate": 8.154056316925923e-05, + "loss": 0.0079, + "step": 561850 + }, + { + "epoch": 1.46, + "learning_rate": 8.153667495288777e-05, + "loss": 0.0124, + "step": 561860 + }, + { + "epoch": 1.46, + "learning_rate": 8.15327867365163e-05, + "loss": 0.0088, + "step": 561870 + }, + { + "epoch": 1.46, + "learning_rate": 8.152889852014485e-05, + "loss": 0.0089, + "step": 561880 + }, + { + "epoch": 1.46, + "learning_rate": 8.152501030377338e-05, + "loss": 0.01, + "step": 561890 + }, + { + "epoch": 1.46, + "learning_rate": 8.152112208740192e-05, + "loss": 0.0096, + "step": 561900 + }, + { + "epoch": 1.46, + "learning_rate": 8.151723387103045e-05, + "loss": 0.0091, + "step": 561910 + }, + { + "epoch": 1.46, + "learning_rate": 8.151334565465899e-05, + "loss": 0.0087, + "step": 561920 + }, + { + "epoch": 1.46, + "learning_rate": 8.150945743828752e-05, + "loss": 0.0078, + "step": 561930 + }, + { + "epoch": 1.46, + "learning_rate": 8.150556922191606e-05, + "loss": 0.0103, + "step": 561940 + }, + { + "epoch": 1.46, + "learning_rate": 8.150168100554459e-05, + "loss": 0.0097, + "step": 561950 + }, + { + "epoch": 1.46, + "learning_rate": 8.149779278917313e-05, + "loss": 0.0097, + "step": 561960 + }, + { + "epoch": 1.46, + "learning_rate": 8.149390457280166e-05, + "loss": 0.0135, + "step": 561970 + }, + { + "epoch": 1.46, + "learning_rate": 8.149001635643019e-05, + "loss": 0.0073, + "step": 561980 + }, + { + "epoch": 1.46, + "learning_rate": 8.148612814005873e-05, + "loss": 0.0124, + "step": 561990 + }, + { + "epoch": 1.46, + "learning_rate": 8.148223992368726e-05, + "loss": 0.0098, + "step": 562000 + }, + { + "epoch": 1.46, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.006133432034403086, + "eval_runtime": 107.8225, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 562000 + }, + { + "epoch": 1.46, + "learning_rate": 8.14783517073158e-05, + "loss": 0.0069, + "step": 562010 + }, + { + "epoch": 1.46, + "learning_rate": 8.147446349094433e-05, + "loss": 0.0077, + "step": 562020 + }, + { + "epoch": 1.46, + "learning_rate": 8.147057527457287e-05, + "loss": 0.0082, + "step": 562030 + }, + { + "epoch": 1.46, + "learning_rate": 8.14666870582014e-05, + "loss": 0.0091, + "step": 562040 + }, + { + "epoch": 1.46, + "learning_rate": 8.146279884182995e-05, + "loss": 0.0094, + "step": 562050 + }, + { + "epoch": 1.46, + "learning_rate": 8.145891062545847e-05, + "loss": 0.0081, + "step": 562060 + }, + { + "epoch": 1.46, + "learning_rate": 8.145502240908702e-05, + "loss": 0.0108, + "step": 562070 + }, + { + "epoch": 1.46, + "learning_rate": 8.145113419271555e-05, + "loss": 0.0109, + "step": 562080 + }, + { + "epoch": 1.46, + "learning_rate": 8.144724597634409e-05, + "loss": 0.0117, + "step": 562090 + }, + { + "epoch": 1.46, + "learning_rate": 8.144335775997262e-05, + "loss": 0.0124, + "step": 562100 + }, + { + "epoch": 1.46, + "learning_rate": 8.143946954360116e-05, + "loss": 0.0103, + "step": 562110 + }, + { + "epoch": 1.46, + "learning_rate": 8.143558132722969e-05, + "loss": 0.0073, + "step": 562120 + }, + { + "epoch": 1.46, + "learning_rate": 8.143169311085823e-05, + "loss": 0.0107, + "step": 562130 + }, + { + "epoch": 1.46, + "learning_rate": 8.142780489448676e-05, + "loss": 0.0068, + "step": 562140 + }, + { + "epoch": 1.46, + "learning_rate": 8.14239166781153e-05, + "loss": 0.0067, + "step": 562150 + }, + { + "epoch": 1.46, + "learning_rate": 8.142002846174383e-05, + "loss": 0.0098, + "step": 562160 + }, + { + "epoch": 1.46, + "learning_rate": 8.141614024537237e-05, + "loss": 0.0101, + "step": 562170 + }, + { + "epoch": 1.46, + "learning_rate": 8.14122520290009e-05, + "loss": 0.0093, + "step": 562180 + }, + { + "epoch": 1.46, + "learning_rate": 8.140836381262944e-05, + "loss": 0.011, + "step": 562190 + }, + { + "epoch": 1.46, + "learning_rate": 8.140447559625797e-05, + "loss": 0.0113, + "step": 562200 + }, + { + "epoch": 1.46, + "learning_rate": 8.14005873798865e-05, + "loss": 0.0089, + "step": 562210 + }, + { + "epoch": 1.46, + "learning_rate": 8.139669916351504e-05, + "loss": 0.0093, + "step": 562220 + }, + { + "epoch": 1.46, + "learning_rate": 8.139281094714357e-05, + "loss": 0.0103, + "step": 562230 + }, + { + "epoch": 1.46, + "learning_rate": 8.138892273077212e-05, + "loss": 0.013, + "step": 562240 + }, + { + "epoch": 1.46, + "learning_rate": 8.138503451440065e-05, + "loss": 0.0077, + "step": 562250 + }, + { + "epoch": 1.46, + "learning_rate": 8.138114629802919e-05, + "loss": 0.0087, + "step": 562260 + }, + { + "epoch": 1.46, + "learning_rate": 8.137725808165772e-05, + "loss": 0.0092, + "step": 562270 + }, + { + "epoch": 1.46, + "learning_rate": 8.137336986528626e-05, + "loss": 0.0077, + "step": 562280 + }, + { + "epoch": 1.46, + "learning_rate": 8.136948164891479e-05, + "loss": 0.0088, + "step": 562290 + }, + { + "epoch": 1.46, + "learning_rate": 8.136559343254333e-05, + "loss": 0.0083, + "step": 562300 + }, + { + "epoch": 1.46, + "learning_rate": 8.136170521617186e-05, + "loss": 0.0078, + "step": 562310 + }, + { + "epoch": 1.46, + "learning_rate": 8.13578169998004e-05, + "loss": 0.0097, + "step": 562320 + }, + { + "epoch": 1.46, + "learning_rate": 8.135392878342893e-05, + "loss": 0.0107, + "step": 562330 + }, + { + "epoch": 1.46, + "learning_rate": 8.135004056705747e-05, + "loss": 0.0074, + "step": 562340 + }, + { + "epoch": 1.46, + "learning_rate": 8.1346152350686e-05, + "loss": 0.011, + "step": 562350 + }, + { + "epoch": 1.46, + "learning_rate": 8.134226413431454e-05, + "loss": 0.0067, + "step": 562360 + }, + { + "epoch": 1.46, + "learning_rate": 8.133837591794307e-05, + "loss": 0.0102, + "step": 562370 + }, + { + "epoch": 1.46, + "learning_rate": 8.133448770157161e-05, + "loss": 0.0095, + "step": 562380 + }, + { + "epoch": 1.46, + "learning_rate": 8.133059948520014e-05, + "loss": 0.0129, + "step": 562390 + }, + { + "epoch": 1.46, + "learning_rate": 8.132671126882869e-05, + "loss": 0.008, + "step": 562400 + }, + { + "epoch": 1.46, + "learning_rate": 8.132282305245722e-05, + "loss": 0.0094, + "step": 562410 + }, + { + "epoch": 1.46, + "learning_rate": 8.131893483608576e-05, + "loss": 0.0097, + "step": 562420 + }, + { + "epoch": 1.46, + "learning_rate": 8.131504661971429e-05, + "loss": 0.0136, + "step": 562430 + }, + { + "epoch": 1.46, + "learning_rate": 8.131115840334283e-05, + "loss": 0.0121, + "step": 562440 + }, + { + "epoch": 1.46, + "learning_rate": 8.130727018697136e-05, + "loss": 0.0137, + "step": 562450 + }, + { + "epoch": 1.46, + "learning_rate": 8.130338197059989e-05, + "loss": 0.0098, + "step": 562460 + }, + { + "epoch": 1.46, + "learning_rate": 8.129949375422843e-05, + "loss": 0.0108, + "step": 562470 + }, + { + "epoch": 1.46, + "learning_rate": 8.129560553785696e-05, + "loss": 0.0141, + "step": 562480 + }, + { + "epoch": 1.46, + "learning_rate": 8.12917173214855e-05, + "loss": 0.009, + "step": 562490 + }, + { + "epoch": 1.46, + "learning_rate": 8.128782910511403e-05, + "loss": 0.0071, + "step": 562500 + }, + { + "epoch": 1.46, + "learning_rate": 8.128394088874257e-05, + "loss": 0.0076, + "step": 562510 + }, + { + "epoch": 1.46, + "learning_rate": 8.12800526723711e-05, + "loss": 0.0105, + "step": 562520 + }, + { + "epoch": 1.46, + "learning_rate": 8.127616445599964e-05, + "loss": 0.0068, + "step": 562530 + }, + { + "epoch": 1.46, + "learning_rate": 8.127227623962817e-05, + "loss": 0.0122, + "step": 562540 + }, + { + "epoch": 1.46, + "learning_rate": 8.126838802325671e-05, + "loss": 0.0077, + "step": 562550 + }, + { + "epoch": 1.46, + "learning_rate": 8.126449980688524e-05, + "loss": 0.009, + "step": 562560 + }, + { + "epoch": 1.46, + "learning_rate": 8.126061159051379e-05, + "loss": 0.0085, + "step": 562570 + }, + { + "epoch": 1.46, + "learning_rate": 8.125672337414231e-05, + "loss": 0.0091, + "step": 562580 + }, + { + "epoch": 1.46, + "learning_rate": 8.125283515777086e-05, + "loss": 0.0097, + "step": 562590 + }, + { + "epoch": 1.46, + "learning_rate": 8.124894694139939e-05, + "loss": 0.0098, + "step": 562600 + }, + { + "epoch": 1.46, + "learning_rate": 8.124505872502793e-05, + "loss": 0.0096, + "step": 562610 + }, + { + "epoch": 1.46, + "learning_rate": 8.124117050865646e-05, + "loss": 0.0118, + "step": 562620 + }, + { + "epoch": 1.46, + "learning_rate": 8.1237282292285e-05, + "loss": 0.0098, + "step": 562630 + }, + { + "epoch": 1.46, + "learning_rate": 8.123339407591353e-05, + "loss": 0.0098, + "step": 562640 + }, + { + "epoch": 1.46, + "learning_rate": 8.122950585954207e-05, + "loss": 0.0089, + "step": 562650 + }, + { + "epoch": 1.46, + "learning_rate": 8.12256176431706e-05, + "loss": 0.0087, + "step": 562660 + }, + { + "epoch": 1.46, + "learning_rate": 8.122172942679914e-05, + "loss": 0.0076, + "step": 562670 + }, + { + "epoch": 1.46, + "learning_rate": 8.121784121042767e-05, + "loss": 0.0134, + "step": 562680 + }, + { + "epoch": 1.46, + "learning_rate": 8.121395299405621e-05, + "loss": 0.0098, + "step": 562690 + }, + { + "epoch": 1.46, + "learning_rate": 8.121006477768474e-05, + "loss": 0.009, + "step": 562700 + }, + { + "epoch": 1.46, + "learning_rate": 8.120617656131327e-05, + "loss": 0.0064, + "step": 562710 + }, + { + "epoch": 1.46, + "learning_rate": 8.120228834494181e-05, + "loss": 0.0101, + "step": 562720 + }, + { + "epoch": 1.46, + "learning_rate": 8.119840012857034e-05, + "loss": 0.0161, + "step": 562730 + }, + { + "epoch": 1.46, + "learning_rate": 8.119451191219888e-05, + "loss": 0.0088, + "step": 562740 + }, + { + "epoch": 1.46, + "learning_rate": 8.11906236958274e-05, + "loss": 0.0076, + "step": 562750 + }, + { + "epoch": 1.46, + "learning_rate": 8.118673547945596e-05, + "loss": 0.008, + "step": 562760 + }, + { + "epoch": 1.46, + "learning_rate": 8.118284726308449e-05, + "loss": 0.0068, + "step": 562770 + }, + { + "epoch": 1.46, + "learning_rate": 8.117895904671303e-05, + "loss": 0.0068, + "step": 562780 + }, + { + "epoch": 1.46, + "learning_rate": 8.117507083034156e-05, + "loss": 0.0067, + "step": 562790 + }, + { + "epoch": 1.46, + "learning_rate": 8.11711826139701e-05, + "loss": 0.0074, + "step": 562800 + }, + { + "epoch": 1.46, + "learning_rate": 8.116729439759863e-05, + "loss": 0.0109, + "step": 562810 + }, + { + "epoch": 1.46, + "learning_rate": 8.116340618122717e-05, + "loss": 0.0074, + "step": 562820 + }, + { + "epoch": 1.46, + "learning_rate": 8.11595179648557e-05, + "loss": 0.0101, + "step": 562830 + }, + { + "epoch": 1.46, + "learning_rate": 8.115562974848424e-05, + "loss": 0.007, + "step": 562840 + }, + { + "epoch": 1.46, + "learning_rate": 8.115174153211277e-05, + "loss": 0.0071, + "step": 562850 + }, + { + "epoch": 1.46, + "learning_rate": 8.114785331574131e-05, + "loss": 0.008, + "step": 562860 + }, + { + "epoch": 1.46, + "learning_rate": 8.114396509936984e-05, + "loss": 0.0129, + "step": 562870 + }, + { + "epoch": 1.46, + "learning_rate": 8.114007688299838e-05, + "loss": 0.0087, + "step": 562880 + }, + { + "epoch": 1.46, + "learning_rate": 8.113618866662691e-05, + "loss": 0.008, + "step": 562890 + }, + { + "epoch": 1.46, + "learning_rate": 8.113230045025545e-05, + "loss": 0.0126, + "step": 562900 + }, + { + "epoch": 1.46, + "learning_rate": 8.112841223388398e-05, + "loss": 0.0109, + "step": 562910 + }, + { + "epoch": 1.46, + "learning_rate": 8.112452401751253e-05, + "loss": 0.0058, + "step": 562920 + }, + { + "epoch": 1.46, + "learning_rate": 8.112063580114105e-05, + "loss": 0.0081, + "step": 562930 + }, + { + "epoch": 1.46, + "learning_rate": 8.11167475847696e-05, + "loss": 0.0088, + "step": 562940 + }, + { + "epoch": 1.46, + "learning_rate": 8.111285936839813e-05, + "loss": 0.0087, + "step": 562950 + }, + { + "epoch": 1.46, + "learning_rate": 8.110897115202666e-05, + "loss": 0.0079, + "step": 562960 + }, + { + "epoch": 1.46, + "learning_rate": 8.11050829356552e-05, + "loss": 0.0119, + "step": 562970 + }, + { + "epoch": 1.46, + "learning_rate": 8.110119471928373e-05, + "loss": 0.0105, + "step": 562980 + }, + { + "epoch": 1.46, + "learning_rate": 8.109730650291227e-05, + "loss": 0.0067, + "step": 562990 + }, + { + "epoch": 1.46, + "learning_rate": 8.10934182865408e-05, + "loss": 0.009, + "step": 563000 + }, + { + "epoch": 1.46, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.0060217659920454025, + "eval_runtime": 108.0142, + "eval_samples_per_second": 18.516, + "eval_steps_per_second": 4.629, + "step": 563000 + }, + { + "epoch": 1.46, + "learning_rate": 8.108953007016934e-05, + "loss": 0.0124, + "step": 563010 + }, + { + "epoch": 1.46, + "learning_rate": 8.108564185379787e-05, + "loss": 0.008, + "step": 563020 + }, + { + "epoch": 1.46, + "learning_rate": 8.108175363742641e-05, + "loss": 0.0089, + "step": 563030 + }, + { + "epoch": 1.46, + "learning_rate": 8.107786542105494e-05, + "loss": 0.0234, + "step": 563040 + }, + { + "epoch": 1.46, + "learning_rate": 8.107397720468348e-05, + "loss": 0.0133, + "step": 563050 + }, + { + "epoch": 1.46, + "learning_rate": 8.107008898831201e-05, + "loss": 0.01, + "step": 563060 + }, + { + "epoch": 1.46, + "learning_rate": 8.106620077194055e-05, + "loss": 0.0093, + "step": 563070 + }, + { + "epoch": 1.46, + "learning_rate": 8.106231255556908e-05, + "loss": 0.0098, + "step": 563080 + }, + { + "epoch": 1.46, + "learning_rate": 8.105842433919762e-05, + "loss": 0.0113, + "step": 563090 + }, + { + "epoch": 1.46, + "learning_rate": 8.105453612282615e-05, + "loss": 0.0078, + "step": 563100 + }, + { + "epoch": 1.46, + "learning_rate": 8.10506479064547e-05, + "loss": 0.0089, + "step": 563110 + }, + { + "epoch": 1.46, + "learning_rate": 8.104675969008323e-05, + "loss": 0.0078, + "step": 563120 + }, + { + "epoch": 1.46, + "learning_rate": 8.104287147371177e-05, + "loss": 0.0093, + "step": 563130 + }, + { + "epoch": 1.46, + "learning_rate": 8.10389832573403e-05, + "loss": 0.0079, + "step": 563140 + }, + { + "epoch": 1.46, + "learning_rate": 8.103509504096884e-05, + "loss": 0.0096, + "step": 563150 + }, + { + "epoch": 1.46, + "learning_rate": 8.103120682459737e-05, + "loss": 0.0066, + "step": 563160 + }, + { + "epoch": 1.46, + "learning_rate": 8.102731860822591e-05, + "loss": 0.0116, + "step": 563170 + }, + { + "epoch": 1.46, + "learning_rate": 8.102343039185444e-05, + "loss": 0.0098, + "step": 563180 + }, + { + "epoch": 1.46, + "learning_rate": 8.101954217548298e-05, + "loss": 0.0069, + "step": 563190 + }, + { + "epoch": 1.46, + "learning_rate": 8.101565395911151e-05, + "loss": 0.0133, + "step": 563200 + }, + { + "epoch": 1.46, + "learning_rate": 8.101176574274004e-05, + "loss": 0.0088, + "step": 563210 + }, + { + "epoch": 1.46, + "learning_rate": 8.100787752636858e-05, + "loss": 0.0077, + "step": 563220 + }, + { + "epoch": 1.46, + "learning_rate": 8.10039893099971e-05, + "loss": 0.0091, + "step": 563230 + }, + { + "epoch": 1.46, + "learning_rate": 8.100010109362565e-05, + "loss": 0.0065, + "step": 563240 + }, + { + "epoch": 1.46, + "learning_rate": 8.099621287725418e-05, + "loss": 0.0144, + "step": 563250 + }, + { + "epoch": 1.46, + "learning_rate": 8.099232466088272e-05, + "loss": 0.0108, + "step": 563260 + }, + { + "epoch": 1.46, + "learning_rate": 8.098843644451125e-05, + "loss": 0.007, + "step": 563270 + }, + { + "epoch": 1.46, + "learning_rate": 8.09845482281398e-05, + "loss": 0.0107, + "step": 563280 + }, + { + "epoch": 1.46, + "learning_rate": 8.098066001176832e-05, + "loss": 0.0101, + "step": 563290 + }, + { + "epoch": 1.46, + "learning_rate": 8.097677179539687e-05, + "loss": 0.0063, + "step": 563300 + }, + { + "epoch": 1.46, + "learning_rate": 8.09728835790254e-05, + "loss": 0.0142, + "step": 563310 + }, + { + "epoch": 1.46, + "learning_rate": 8.096899536265394e-05, + "loss": 0.0101, + "step": 563320 + }, + { + "epoch": 1.46, + "learning_rate": 8.096510714628247e-05, + "loss": 0.0114, + "step": 563330 + }, + { + "epoch": 1.46, + "learning_rate": 8.096121892991101e-05, + "loss": 0.0107, + "step": 563340 + }, + { + "epoch": 1.46, + "learning_rate": 8.095733071353954e-05, + "loss": 0.0084, + "step": 563350 + }, + { + "epoch": 1.46, + "learning_rate": 8.095344249716808e-05, + "loss": 0.0093, + "step": 563360 + }, + { + "epoch": 1.46, + "learning_rate": 8.094955428079661e-05, + "loss": 0.0092, + "step": 563370 + }, + { + "epoch": 1.46, + "learning_rate": 8.094566606442515e-05, + "loss": 0.0108, + "step": 563380 + }, + { + "epoch": 1.46, + "learning_rate": 8.094177784805368e-05, + "loss": 0.0098, + "step": 563390 + }, + { + "epoch": 1.46, + "learning_rate": 8.093788963168222e-05, + "loss": 0.0116, + "step": 563400 + }, + { + "epoch": 1.46, + "learning_rate": 8.093400141531075e-05, + "loss": 0.0093, + "step": 563410 + }, + { + "epoch": 1.46, + "learning_rate": 8.093011319893929e-05, + "loss": 0.0089, + "step": 563420 + }, + { + "epoch": 1.46, + "learning_rate": 8.092622498256782e-05, + "loss": 0.0131, + "step": 563430 + }, + { + "epoch": 1.46, + "learning_rate": 8.092233676619637e-05, + "loss": 0.0067, + "step": 563440 + }, + { + "epoch": 1.46, + "learning_rate": 8.091844854982489e-05, + "loss": 0.0089, + "step": 563450 + }, + { + "epoch": 1.46, + "learning_rate": 8.091456033345342e-05, + "loss": 0.0084, + "step": 563460 + }, + { + "epoch": 1.46, + "learning_rate": 8.091067211708197e-05, + "loss": 0.0086, + "step": 563470 + }, + { + "epoch": 1.46, + "learning_rate": 8.09067839007105e-05, + "loss": 0.0082, + "step": 563480 + }, + { + "epoch": 1.46, + "learning_rate": 8.090289568433904e-05, + "loss": 0.0071, + "step": 563490 + }, + { + "epoch": 1.46, + "learning_rate": 8.089900746796757e-05, + "loss": 0.0102, + "step": 563500 + }, + { + "epoch": 1.46, + "learning_rate": 8.089511925159611e-05, + "loss": 0.0121, + "step": 563510 + }, + { + "epoch": 1.46, + "learning_rate": 8.089123103522464e-05, + "loss": 0.0097, + "step": 563520 + }, + { + "epoch": 1.46, + "learning_rate": 8.088734281885318e-05, + "loss": 0.0089, + "step": 563530 + }, + { + "epoch": 1.46, + "learning_rate": 8.088345460248171e-05, + "loss": 0.0103, + "step": 563540 + }, + { + "epoch": 1.46, + "learning_rate": 8.087956638611025e-05, + "loss": 0.0088, + "step": 563550 + }, + { + "epoch": 1.46, + "learning_rate": 8.087567816973878e-05, + "loss": 0.0162, + "step": 563560 + }, + { + "epoch": 1.46, + "learning_rate": 8.087178995336732e-05, + "loss": 0.0101, + "step": 563570 + }, + { + "epoch": 1.46, + "learning_rate": 8.086790173699585e-05, + "loss": 0.0097, + "step": 563580 + }, + { + "epoch": 1.46, + "learning_rate": 8.086401352062439e-05, + "loss": 0.011, + "step": 563590 + }, + { + "epoch": 1.46, + "learning_rate": 8.086012530425292e-05, + "loss": 0.0092, + "step": 563600 + }, + { + "epoch": 1.46, + "learning_rate": 8.085623708788146e-05, + "loss": 0.0093, + "step": 563610 + }, + { + "epoch": 1.46, + "learning_rate": 8.085234887150999e-05, + "loss": 0.0094, + "step": 563620 + }, + { + "epoch": 1.46, + "learning_rate": 8.084846065513854e-05, + "loss": 0.0098, + "step": 563630 + }, + { + "epoch": 1.46, + "learning_rate": 8.084457243876707e-05, + "loss": 0.0108, + "step": 563640 + }, + { + "epoch": 1.46, + "learning_rate": 8.084068422239561e-05, + "loss": 0.0088, + "step": 563650 + }, + { + "epoch": 1.46, + "learning_rate": 8.083679600602414e-05, + "loss": 0.0093, + "step": 563660 + }, + { + "epoch": 1.46, + "learning_rate": 8.083290778965268e-05, + "loss": 0.0124, + "step": 563670 + }, + { + "epoch": 1.46, + "learning_rate": 8.082901957328121e-05, + "loss": 0.0074, + "step": 563680 + }, + { + "epoch": 1.46, + "learning_rate": 8.082513135690975e-05, + "loss": 0.0084, + "step": 563690 + }, + { + "epoch": 1.46, + "learning_rate": 8.082124314053828e-05, + "loss": 0.0104, + "step": 563700 + }, + { + "epoch": 1.46, + "learning_rate": 8.081735492416681e-05, + "loss": 0.0157, + "step": 563710 + }, + { + "epoch": 1.46, + "learning_rate": 8.081346670779535e-05, + "loss": 0.0086, + "step": 563720 + }, + { + "epoch": 1.46, + "learning_rate": 8.080957849142388e-05, + "loss": 0.01, + "step": 563730 + }, + { + "epoch": 1.46, + "learning_rate": 8.080569027505242e-05, + "loss": 0.0095, + "step": 563740 + }, + { + "epoch": 1.46, + "learning_rate": 8.080180205868095e-05, + "loss": 0.0079, + "step": 563750 + }, + { + "epoch": 1.46, + "learning_rate": 8.079791384230949e-05, + "loss": 0.0101, + "step": 563760 + }, + { + "epoch": 1.46, + "learning_rate": 8.079402562593802e-05, + "loss": 0.0098, + "step": 563770 + }, + { + "epoch": 1.46, + "learning_rate": 8.079013740956656e-05, + "loss": 0.0103, + "step": 563780 + }, + { + "epoch": 1.46, + "learning_rate": 8.078624919319509e-05, + "loss": 0.0107, + "step": 563790 + }, + { + "epoch": 1.46, + "learning_rate": 8.078236097682364e-05, + "loss": 0.0101, + "step": 563800 + }, + { + "epoch": 1.46, + "learning_rate": 8.077847276045216e-05, + "loss": 0.0088, + "step": 563810 + }, + { + "epoch": 1.46, + "learning_rate": 8.077458454408071e-05, + "loss": 0.0071, + "step": 563820 + }, + { + "epoch": 1.46, + "learning_rate": 8.077069632770924e-05, + "loss": 0.008, + "step": 563830 + }, + { + "epoch": 1.46, + "learning_rate": 8.076680811133778e-05, + "loss": 0.0118, + "step": 563840 + }, + { + "epoch": 1.46, + "learning_rate": 8.076291989496631e-05, + "loss": 0.0074, + "step": 563850 + }, + { + "epoch": 1.46, + "learning_rate": 8.075903167859485e-05, + "loss": 0.0092, + "step": 563860 + }, + { + "epoch": 1.46, + "learning_rate": 8.075514346222338e-05, + "loss": 0.01, + "step": 563870 + }, + { + "epoch": 1.46, + "learning_rate": 8.075125524585192e-05, + "loss": 0.0095, + "step": 563880 + }, + { + "epoch": 1.46, + "learning_rate": 8.074736702948045e-05, + "loss": 0.0062, + "step": 563890 + }, + { + "epoch": 1.46, + "learning_rate": 8.074347881310899e-05, + "loss": 0.0095, + "step": 563900 + }, + { + "epoch": 1.46, + "learning_rate": 8.073959059673752e-05, + "loss": 0.0093, + "step": 563910 + }, + { + "epoch": 1.46, + "learning_rate": 8.073570238036606e-05, + "loss": 0.0094, + "step": 563920 + }, + { + "epoch": 1.46, + "learning_rate": 8.073181416399459e-05, + "loss": 0.0103, + "step": 563930 + }, + { + "epoch": 1.46, + "learning_rate": 8.072792594762313e-05, + "loss": 0.0082, + "step": 563940 + }, + { + "epoch": 1.46, + "learning_rate": 8.072403773125166e-05, + "loss": 0.0081, + "step": 563950 + }, + { + "epoch": 1.46, + "learning_rate": 8.072014951488019e-05, + "loss": 0.0075, + "step": 563960 + }, + { + "epoch": 1.46, + "learning_rate": 8.071626129850873e-05, + "loss": 0.0085, + "step": 563970 + }, + { + "epoch": 1.46, + "learning_rate": 8.071237308213726e-05, + "loss": 0.0071, + "step": 563980 + }, + { + "epoch": 1.46, + "learning_rate": 8.070848486576581e-05, + "loss": 0.008, + "step": 563990 + }, + { + "epoch": 1.46, + "learning_rate": 8.070459664939434e-05, + "loss": 0.007, + "step": 564000 + }, + { + "epoch": 1.46, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.006286456249654293, + "eval_runtime": 107.8864, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.635, + "step": 564000 + }, + { + "epoch": 1.46, + "learning_rate": 8.070070843302288e-05, + "loss": 0.0086, + "step": 564010 + }, + { + "epoch": 1.46, + "learning_rate": 8.069682021665141e-05, + "loss": 0.0081, + "step": 564020 + }, + { + "epoch": 1.46, + "learning_rate": 8.069293200027995e-05, + "loss": 0.011, + "step": 564030 + }, + { + "epoch": 1.46, + "learning_rate": 8.068904378390848e-05, + "loss": 0.0104, + "step": 564040 + }, + { + "epoch": 1.46, + "learning_rate": 8.068515556753702e-05, + "loss": 0.0084, + "step": 564050 + }, + { + "epoch": 1.46, + "learning_rate": 8.068126735116555e-05, + "loss": 0.0081, + "step": 564060 + }, + { + "epoch": 1.46, + "learning_rate": 8.067737913479409e-05, + "loss": 0.0079, + "step": 564070 + }, + { + "epoch": 1.46, + "learning_rate": 8.067349091842262e-05, + "loss": 0.0101, + "step": 564080 + }, + { + "epoch": 1.46, + "learning_rate": 8.066960270205116e-05, + "loss": 0.007, + "step": 564090 + }, + { + "epoch": 1.46, + "learning_rate": 8.066571448567969e-05, + "loss": 0.0084, + "step": 564100 + }, + { + "epoch": 1.46, + "learning_rate": 8.066182626930823e-05, + "loss": 0.0093, + "step": 564110 + }, + { + "epoch": 1.46, + "learning_rate": 8.065793805293676e-05, + "loss": 0.012, + "step": 564120 + }, + { + "epoch": 1.46, + "learning_rate": 8.06540498365653e-05, + "loss": 0.0105, + "step": 564130 + }, + { + "epoch": 1.46, + "learning_rate": 8.065016162019383e-05, + "loss": 0.0132, + "step": 564140 + }, + { + "epoch": 1.46, + "learning_rate": 8.064627340382238e-05, + "loss": 0.0092, + "step": 564150 + }, + { + "epoch": 1.46, + "learning_rate": 8.06423851874509e-05, + "loss": 0.0096, + "step": 564160 + }, + { + "epoch": 1.46, + "learning_rate": 8.063849697107945e-05, + "loss": 0.0112, + "step": 564170 + }, + { + "epoch": 1.46, + "learning_rate": 8.063460875470798e-05, + "loss": 0.0126, + "step": 564180 + }, + { + "epoch": 1.46, + "learning_rate": 8.063072053833652e-05, + "loss": 0.0096, + "step": 564190 + }, + { + "epoch": 1.46, + "learning_rate": 8.062683232196505e-05, + "loss": 0.0102, + "step": 564200 + }, + { + "epoch": 1.46, + "learning_rate": 8.062294410559358e-05, + "loss": 0.0076, + "step": 564210 + }, + { + "epoch": 1.46, + "learning_rate": 8.061905588922212e-05, + "loss": 0.0092, + "step": 564220 + }, + { + "epoch": 1.46, + "learning_rate": 8.061516767285065e-05, + "loss": 0.0098, + "step": 564230 + }, + { + "epoch": 1.46, + "learning_rate": 8.061127945647919e-05, + "loss": 0.01, + "step": 564240 + }, + { + "epoch": 1.46, + "learning_rate": 8.060739124010772e-05, + "loss": 0.0068, + "step": 564250 + }, + { + "epoch": 1.46, + "learning_rate": 8.060350302373626e-05, + "loss": 0.0084, + "step": 564260 + }, + { + "epoch": 1.46, + "learning_rate": 8.059961480736479e-05, + "loss": 0.0074, + "step": 564270 + }, + { + "epoch": 1.46, + "learning_rate": 8.059572659099333e-05, + "loss": 0.0091, + "step": 564280 + }, + { + "epoch": 1.46, + "learning_rate": 8.059183837462186e-05, + "loss": 0.0109, + "step": 564290 + }, + { + "epoch": 1.46, + "learning_rate": 8.05879501582504e-05, + "loss": 0.01, + "step": 564300 + }, + { + "epoch": 1.46, + "learning_rate": 8.058406194187893e-05, + "loss": 0.0086, + "step": 564310 + }, + { + "epoch": 1.46, + "learning_rate": 8.058017372550747e-05, + "loss": 0.0108, + "step": 564320 + }, + { + "epoch": 1.46, + "learning_rate": 8.0576285509136e-05, + "loss": 0.0087, + "step": 564330 + }, + { + "epoch": 1.46, + "learning_rate": 8.057239729276455e-05, + "loss": 0.0078, + "step": 564340 + }, + { + "epoch": 1.46, + "learning_rate": 8.056850907639308e-05, + "loss": 0.0091, + "step": 564350 + }, + { + "epoch": 1.46, + "learning_rate": 8.056462086002162e-05, + "loss": 0.0077, + "step": 564360 + }, + { + "epoch": 1.46, + "learning_rate": 8.056073264365015e-05, + "loss": 0.0081, + "step": 564370 + }, + { + "epoch": 1.46, + "learning_rate": 8.055684442727869e-05, + "loss": 0.0106, + "step": 564380 + }, + { + "epoch": 1.46, + "learning_rate": 8.055295621090722e-05, + "loss": 0.011, + "step": 564390 + }, + { + "epoch": 1.46, + "learning_rate": 8.054906799453576e-05, + "loss": 0.0091, + "step": 564400 + }, + { + "epoch": 1.46, + "learning_rate": 8.054517977816429e-05, + "loss": 0.0089, + "step": 564410 + }, + { + "epoch": 1.46, + "learning_rate": 8.054129156179283e-05, + "loss": 0.0087, + "step": 564420 + }, + { + "epoch": 1.46, + "learning_rate": 8.053740334542136e-05, + "loss": 0.0088, + "step": 564430 + }, + { + "epoch": 1.46, + "learning_rate": 8.05335151290499e-05, + "loss": 0.008, + "step": 564440 + }, + { + "epoch": 1.46, + "learning_rate": 8.052962691267843e-05, + "loss": 0.0096, + "step": 564450 + }, + { + "epoch": 1.46, + "learning_rate": 8.052573869630696e-05, + "loss": 0.0255, + "step": 564460 + }, + { + "epoch": 1.46, + "learning_rate": 8.05218504799355e-05, + "loss": 0.0087, + "step": 564470 + }, + { + "epoch": 1.46, + "learning_rate": 8.051796226356403e-05, + "loss": 0.0086, + "step": 564480 + }, + { + "epoch": 1.46, + "learning_rate": 8.051407404719257e-05, + "loss": 0.009, + "step": 564490 + }, + { + "epoch": 1.46, + "learning_rate": 8.05101858308211e-05, + "loss": 0.0122, + "step": 564500 + }, + { + "epoch": 1.46, + "learning_rate": 8.050629761444965e-05, + "loss": 0.0061, + "step": 564510 + }, + { + "epoch": 1.46, + "learning_rate": 8.050240939807816e-05, + "loss": 0.008, + "step": 564520 + }, + { + "epoch": 1.46, + "learning_rate": 8.049852118170672e-05, + "loss": 0.0089, + "step": 564530 + }, + { + "epoch": 1.46, + "learning_rate": 8.049463296533525e-05, + "loss": 0.0114, + "step": 564540 + }, + { + "epoch": 1.46, + "learning_rate": 8.049074474896379e-05, + "loss": 0.0078, + "step": 564550 + }, + { + "epoch": 1.46, + "learning_rate": 8.048685653259232e-05, + "loss": 0.0142, + "step": 564560 + }, + { + "epoch": 1.46, + "learning_rate": 8.048296831622086e-05, + "loss": 0.0136, + "step": 564570 + }, + { + "epoch": 1.46, + "learning_rate": 8.047908009984939e-05, + "loss": 0.0092, + "step": 564580 + }, + { + "epoch": 1.46, + "learning_rate": 8.047519188347793e-05, + "loss": 0.0085, + "step": 564590 + }, + { + "epoch": 1.46, + "learning_rate": 8.047130366710646e-05, + "loss": 0.0119, + "step": 564600 + }, + { + "epoch": 1.46, + "learning_rate": 8.0467415450735e-05, + "loss": 0.0089, + "step": 564610 + }, + { + "epoch": 1.46, + "learning_rate": 8.046352723436353e-05, + "loss": 0.0085, + "step": 564620 + }, + { + "epoch": 1.46, + "learning_rate": 8.045963901799207e-05, + "loss": 0.0116, + "step": 564630 + }, + { + "epoch": 1.46, + "learning_rate": 8.04557508016206e-05, + "loss": 0.0074, + "step": 564640 + }, + { + "epoch": 1.46, + "learning_rate": 8.045186258524914e-05, + "loss": 0.0089, + "step": 564650 + }, + { + "epoch": 1.46, + "learning_rate": 8.044797436887767e-05, + "loss": 0.0104, + "step": 564660 + }, + { + "epoch": 1.46, + "learning_rate": 8.044408615250622e-05, + "loss": 0.0127, + "step": 564670 + }, + { + "epoch": 1.46, + "learning_rate": 8.044019793613474e-05, + "loss": 0.0066, + "step": 564680 + }, + { + "epoch": 1.46, + "learning_rate": 8.043630971976329e-05, + "loss": 0.0093, + "step": 564690 + }, + { + "epoch": 1.46, + "learning_rate": 8.043242150339182e-05, + "loss": 0.0102, + "step": 564700 + }, + { + "epoch": 1.46, + "learning_rate": 8.042853328702035e-05, + "loss": 0.0116, + "step": 564710 + }, + { + "epoch": 1.46, + "learning_rate": 8.042464507064889e-05, + "loss": 0.0096, + "step": 564720 + }, + { + "epoch": 1.46, + "learning_rate": 8.042075685427742e-05, + "loss": 0.0097, + "step": 564730 + }, + { + "epoch": 1.46, + "learning_rate": 8.041686863790596e-05, + "loss": 0.0097, + "step": 564740 + }, + { + "epoch": 1.46, + "learning_rate": 8.041298042153449e-05, + "loss": 0.0117, + "step": 564750 + }, + { + "epoch": 1.46, + "learning_rate": 8.040909220516303e-05, + "loss": 0.0089, + "step": 564760 + }, + { + "epoch": 1.46, + "learning_rate": 8.040520398879156e-05, + "loss": 0.0073, + "step": 564770 + }, + { + "epoch": 1.46, + "learning_rate": 8.04013157724201e-05, + "loss": 0.0084, + "step": 564780 + }, + { + "epoch": 1.46, + "learning_rate": 8.039742755604863e-05, + "loss": 0.011, + "step": 564790 + }, + { + "epoch": 1.46, + "learning_rate": 8.039353933967717e-05, + "loss": 0.0105, + "step": 564800 + }, + { + "epoch": 1.46, + "learning_rate": 8.03896511233057e-05, + "loss": 0.0101, + "step": 564810 + }, + { + "epoch": 1.46, + "learning_rate": 8.038576290693424e-05, + "loss": 0.0083, + "step": 564820 + }, + { + "epoch": 1.46, + "learning_rate": 8.038187469056277e-05, + "loss": 0.0068, + "step": 564830 + }, + { + "epoch": 1.46, + "learning_rate": 8.037798647419131e-05, + "loss": 0.0085, + "step": 564840 + }, + { + "epoch": 1.46, + "learning_rate": 8.037409825781984e-05, + "loss": 0.0108, + "step": 564850 + }, + { + "epoch": 1.46, + "learning_rate": 8.037021004144839e-05, + "loss": 0.0075, + "step": 564860 + }, + { + "epoch": 1.46, + "learning_rate": 8.036632182507692e-05, + "loss": 0.0075, + "step": 564870 + }, + { + "epoch": 1.46, + "learning_rate": 8.036243360870546e-05, + "loss": 0.0117, + "step": 564880 + }, + { + "epoch": 1.46, + "learning_rate": 8.035854539233399e-05, + "loss": 0.0097, + "step": 564890 + }, + { + "epoch": 1.46, + "learning_rate": 8.035465717596253e-05, + "loss": 0.0113, + "step": 564900 + }, + { + "epoch": 1.46, + "learning_rate": 8.035076895959106e-05, + "loss": 0.0063, + "step": 564910 + }, + { + "epoch": 1.46, + "learning_rate": 8.03468807432196e-05, + "loss": 0.0097, + "step": 564920 + }, + { + "epoch": 1.46, + "learning_rate": 8.034299252684813e-05, + "loss": 0.0088, + "step": 564930 + }, + { + "epoch": 1.46, + "learning_rate": 8.033910431047666e-05, + "loss": 0.0087, + "step": 564940 + }, + { + "epoch": 1.46, + "learning_rate": 8.03352160941052e-05, + "loss": 0.0112, + "step": 564950 + }, + { + "epoch": 1.46, + "learning_rate": 8.033132787773373e-05, + "loss": 0.0096, + "step": 564960 + }, + { + "epoch": 1.46, + "learning_rate": 8.032743966136227e-05, + "loss": 0.0142, + "step": 564970 + }, + { + "epoch": 1.46, + "learning_rate": 8.03235514449908e-05, + "loss": 0.0092, + "step": 564980 + }, + { + "epoch": 1.46, + "learning_rate": 8.031966322861934e-05, + "loss": 0.0106, + "step": 564990 + }, + { + "epoch": 1.46, + "learning_rate": 8.031577501224787e-05, + "loss": 0.0112, + "step": 565000 + }, + { + "epoch": 1.46, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.006258940789848566, + "eval_runtime": 107.7505, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 565000 + }, + { + "epoch": 1.46, + "learning_rate": 8.031188679587641e-05, + "loss": 0.0104, + "step": 565010 + }, + { + "epoch": 1.46, + "learning_rate": 8.030799857950494e-05, + "loss": 0.0068, + "step": 565020 + }, + { + "epoch": 1.46, + "learning_rate": 8.030411036313349e-05, + "loss": 0.0082, + "step": 565030 + }, + { + "epoch": 1.46, + "learning_rate": 8.0300222146762e-05, + "loss": 0.008, + "step": 565040 + }, + { + "epoch": 1.46, + "learning_rate": 8.029633393039056e-05, + "loss": 0.0085, + "step": 565050 + }, + { + "epoch": 1.46, + "learning_rate": 8.029244571401909e-05, + "loss": 0.011, + "step": 565060 + }, + { + "epoch": 1.46, + "learning_rate": 8.028855749764763e-05, + "loss": 0.0096, + "step": 565070 + }, + { + "epoch": 1.46, + "learning_rate": 8.028466928127616e-05, + "loss": 0.0076, + "step": 565080 + }, + { + "epoch": 1.46, + "learning_rate": 8.02807810649047e-05, + "loss": 0.0087, + "step": 565090 + }, + { + "epoch": 1.46, + "learning_rate": 8.027689284853323e-05, + "loss": 0.0111, + "step": 565100 + }, + { + "epoch": 1.46, + "learning_rate": 8.027300463216177e-05, + "loss": 0.0093, + "step": 565110 + }, + { + "epoch": 1.46, + "learning_rate": 8.02691164157903e-05, + "loss": 0.0122, + "step": 565120 + }, + { + "epoch": 1.46, + "learning_rate": 8.026522819941884e-05, + "loss": 0.0081, + "step": 565130 + }, + { + "epoch": 1.46, + "learning_rate": 8.026133998304737e-05, + "loss": 0.0103, + "step": 565140 + }, + { + "epoch": 1.46, + "learning_rate": 8.025745176667591e-05, + "loss": 0.0084, + "step": 565150 + }, + { + "epoch": 1.46, + "learning_rate": 8.025356355030444e-05, + "loss": 0.0153, + "step": 565160 + }, + { + "epoch": 1.47, + "learning_rate": 8.024967533393298e-05, + "loss": 0.0073, + "step": 565170 + }, + { + "epoch": 1.47, + "learning_rate": 8.02457871175615e-05, + "loss": 0.0101, + "step": 565180 + }, + { + "epoch": 1.47, + "learning_rate": 8.024189890119003e-05, + "loss": 0.009, + "step": 565190 + }, + { + "epoch": 1.47, + "learning_rate": 8.023801068481858e-05, + "loss": 0.0152, + "step": 565200 + }, + { + "epoch": 1.47, + "learning_rate": 8.02341224684471e-05, + "loss": 0.0114, + "step": 565210 + }, + { + "epoch": 1.47, + "learning_rate": 8.023023425207566e-05, + "loss": 0.0083, + "step": 565220 + }, + { + "epoch": 1.47, + "learning_rate": 8.022634603570419e-05, + "loss": 0.0077, + "step": 565230 + }, + { + "epoch": 1.47, + "learning_rate": 8.022245781933273e-05, + "loss": 0.0106, + "step": 565240 + }, + { + "epoch": 1.47, + "learning_rate": 8.021856960296126e-05, + "loss": 0.008, + "step": 565250 + }, + { + "epoch": 1.47, + "learning_rate": 8.02146813865898e-05, + "loss": 0.007, + "step": 565260 + }, + { + "epoch": 1.47, + "learning_rate": 8.021079317021833e-05, + "loss": 0.0068, + "step": 565270 + }, + { + "epoch": 1.47, + "learning_rate": 8.020690495384687e-05, + "loss": 0.0083, + "step": 565280 + }, + { + "epoch": 1.47, + "learning_rate": 8.02030167374754e-05, + "loss": 0.0093, + "step": 565290 + }, + { + "epoch": 1.47, + "learning_rate": 8.019912852110394e-05, + "loss": 0.008, + "step": 565300 + }, + { + "epoch": 1.47, + "learning_rate": 8.019524030473247e-05, + "loss": 0.009, + "step": 565310 + }, + { + "epoch": 1.47, + "learning_rate": 8.019135208836101e-05, + "loss": 0.0085, + "step": 565320 + }, + { + "epoch": 1.47, + "learning_rate": 8.018746387198954e-05, + "loss": 0.0077, + "step": 565330 + }, + { + "epoch": 1.47, + "learning_rate": 8.018357565561808e-05, + "loss": 0.0104, + "step": 565340 + }, + { + "epoch": 1.47, + "learning_rate": 8.01796874392466e-05, + "loss": 0.0061, + "step": 565350 + }, + { + "epoch": 1.47, + "learning_rate": 8.017579922287515e-05, + "loss": 0.0109, + "step": 565360 + }, + { + "epoch": 1.47, + "learning_rate": 8.017191100650368e-05, + "loss": 0.0083, + "step": 565370 + }, + { + "epoch": 1.47, + "learning_rate": 8.016802279013223e-05, + "loss": 0.0099, + "step": 565380 + }, + { + "epoch": 1.47, + "learning_rate": 8.016413457376076e-05, + "loss": 0.0071, + "step": 565390 + }, + { + "epoch": 1.47, + "learning_rate": 8.01602463573893e-05, + "loss": 0.008, + "step": 565400 + }, + { + "epoch": 1.47, + "learning_rate": 8.015635814101783e-05, + "loss": 0.0085, + "step": 565410 + }, + { + "epoch": 1.47, + "learning_rate": 8.015246992464637e-05, + "loss": 0.0092, + "step": 565420 + }, + { + "epoch": 1.47, + "learning_rate": 8.01485817082749e-05, + "loss": 0.0117, + "step": 565430 + }, + { + "epoch": 1.47, + "learning_rate": 8.014469349190343e-05, + "loss": 0.0099, + "step": 565440 + }, + { + "epoch": 1.47, + "learning_rate": 8.014080527553197e-05, + "loss": 0.0082, + "step": 565450 + }, + { + "epoch": 1.47, + "learning_rate": 8.01369170591605e-05, + "loss": 0.0097, + "step": 565460 + }, + { + "epoch": 1.47, + "learning_rate": 8.013302884278904e-05, + "loss": 0.0074, + "step": 565470 + }, + { + "epoch": 1.47, + "learning_rate": 8.012914062641757e-05, + "loss": 0.0077, + "step": 565480 + }, + { + "epoch": 1.47, + "learning_rate": 8.012525241004611e-05, + "loss": 0.0092, + "step": 565490 + }, + { + "epoch": 1.47, + "learning_rate": 8.012136419367464e-05, + "loss": 0.0119, + "step": 565500 + }, + { + "epoch": 1.47, + "learning_rate": 8.011747597730318e-05, + "loss": 0.0094, + "step": 565510 + }, + { + "epoch": 1.47, + "learning_rate": 8.01135877609317e-05, + "loss": 0.0076, + "step": 565520 + }, + { + "epoch": 1.47, + "learning_rate": 8.010969954456025e-05, + "loss": 0.008, + "step": 565530 + }, + { + "epoch": 1.47, + "learning_rate": 8.010581132818877e-05, + "loss": 0.008, + "step": 565540 + }, + { + "epoch": 1.47, + "learning_rate": 8.010192311181732e-05, + "loss": 0.0112, + "step": 565550 + }, + { + "epoch": 1.47, + "learning_rate": 8.009803489544584e-05, + "loss": 0.0133, + "step": 565560 + }, + { + "epoch": 1.47, + "learning_rate": 8.00941466790744e-05, + "loss": 0.0081, + "step": 565570 + }, + { + "epoch": 1.47, + "learning_rate": 8.009025846270293e-05, + "loss": 0.0092, + "step": 565580 + }, + { + "epoch": 1.47, + "learning_rate": 8.008637024633147e-05, + "loss": 0.0108, + "step": 565590 + }, + { + "epoch": 1.47, + "learning_rate": 8.008248202996e-05, + "loss": 0.0103, + "step": 565600 + }, + { + "epoch": 1.47, + "learning_rate": 8.007859381358854e-05, + "loss": 0.0133, + "step": 565610 + }, + { + "epoch": 1.47, + "learning_rate": 8.007470559721707e-05, + "loss": 0.0082, + "step": 565620 + }, + { + "epoch": 1.47, + "learning_rate": 8.007081738084561e-05, + "loss": 0.0064, + "step": 565630 + }, + { + "epoch": 1.47, + "learning_rate": 8.006692916447414e-05, + "loss": 0.0075, + "step": 565640 + }, + { + "epoch": 1.47, + "learning_rate": 8.006304094810268e-05, + "loss": 0.0125, + "step": 565650 + }, + { + "epoch": 1.47, + "learning_rate": 8.005915273173121e-05, + "loss": 0.0075, + "step": 565660 + }, + { + "epoch": 1.47, + "learning_rate": 8.005526451535975e-05, + "loss": 0.0095, + "step": 565670 + }, + { + "epoch": 1.47, + "learning_rate": 8.005137629898828e-05, + "loss": 0.0083, + "step": 565680 + }, + { + "epoch": 1.47, + "learning_rate": 8.00474880826168e-05, + "loss": 0.0075, + "step": 565690 + }, + { + "epoch": 1.47, + "learning_rate": 8.004359986624535e-05, + "loss": 0.0109, + "step": 565700 + }, + { + "epoch": 1.47, + "learning_rate": 8.003971164987387e-05, + "loss": 0.0073, + "step": 565710 + }, + { + "epoch": 1.47, + "learning_rate": 8.003582343350242e-05, + "loss": 0.0091, + "step": 565720 + }, + { + "epoch": 1.47, + "learning_rate": 8.003193521713094e-05, + "loss": 0.0086, + "step": 565730 + }, + { + "epoch": 1.47, + "learning_rate": 8.00280470007595e-05, + "loss": 0.0072, + "step": 565740 + }, + { + "epoch": 1.47, + "learning_rate": 8.002415878438801e-05, + "loss": 0.0096, + "step": 565750 + }, + { + "epoch": 1.47, + "learning_rate": 8.002027056801657e-05, + "loss": 0.0085, + "step": 565760 + }, + { + "epoch": 1.47, + "learning_rate": 8.00163823516451e-05, + "loss": 0.0151, + "step": 565770 + }, + { + "epoch": 1.47, + "learning_rate": 8.001249413527364e-05, + "loss": 0.008, + "step": 565780 + }, + { + "epoch": 1.47, + "learning_rate": 8.000860591890217e-05, + "loss": 0.0119, + "step": 565790 + }, + { + "epoch": 1.47, + "learning_rate": 8.000471770253071e-05, + "loss": 0.0069, + "step": 565800 + }, + { + "epoch": 1.47, + "learning_rate": 8.000082948615924e-05, + "loss": 0.0072, + "step": 565810 + }, + { + "epoch": 1.47, + "learning_rate": 7.999694126978778e-05, + "loss": 0.0115, + "step": 565820 + }, + { + "epoch": 1.47, + "learning_rate": 7.99930530534163e-05, + "loss": 0.0112, + "step": 565830 + }, + { + "epoch": 1.47, + "learning_rate": 7.998916483704485e-05, + "loss": 0.0102, + "step": 565840 + }, + { + "epoch": 1.47, + "learning_rate": 7.998527662067338e-05, + "loss": 0.0099, + "step": 565850 + }, + { + "epoch": 1.47, + "learning_rate": 7.998138840430192e-05, + "loss": 0.0109, + "step": 565860 + }, + { + "epoch": 1.47, + "learning_rate": 7.997750018793045e-05, + "loss": 0.009, + "step": 565870 + }, + { + "epoch": 1.47, + "learning_rate": 7.997361197155899e-05, + "loss": 0.0073, + "step": 565880 + }, + { + "epoch": 1.47, + "learning_rate": 7.996972375518752e-05, + "loss": 0.0078, + "step": 565890 + }, + { + "epoch": 1.47, + "learning_rate": 7.996583553881607e-05, + "loss": 0.0094, + "step": 565900 + }, + { + "epoch": 1.47, + "learning_rate": 7.996194732244459e-05, + "loss": 0.01, + "step": 565910 + }, + { + "epoch": 1.47, + "learning_rate": 7.995805910607314e-05, + "loss": 0.008, + "step": 565920 + }, + { + "epoch": 1.47, + "learning_rate": 7.995417088970167e-05, + "loss": 0.0089, + "step": 565930 + }, + { + "epoch": 1.47, + "learning_rate": 7.99502826733302e-05, + "loss": 0.0096, + "step": 565940 + }, + { + "epoch": 1.47, + "learning_rate": 7.994639445695874e-05, + "loss": 0.0066, + "step": 565950 + }, + { + "epoch": 1.47, + "learning_rate": 7.994250624058727e-05, + "loss": 0.0091, + "step": 565960 + }, + { + "epoch": 1.47, + "learning_rate": 7.993861802421581e-05, + "loss": 0.0095, + "step": 565970 + }, + { + "epoch": 1.47, + "learning_rate": 7.993472980784434e-05, + "loss": 0.0118, + "step": 565980 + }, + { + "epoch": 1.47, + "learning_rate": 7.993084159147288e-05, + "loss": 0.0074, + "step": 565990 + }, + { + "epoch": 1.47, + "learning_rate": 7.99269533751014e-05, + "loss": 0.0098, + "step": 566000 + }, + { + "epoch": 1.47, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.0061110155656933784, + "eval_runtime": 107.9972, + "eval_samples_per_second": 18.519, + "eval_steps_per_second": 4.63, + "step": 566000 + }, + { + "epoch": 1.47, + "learning_rate": 7.992306515872995e-05, + "loss": 0.0099, + "step": 566010 + }, + { + "epoch": 1.47, + "learning_rate": 7.991917694235848e-05, + "loss": 0.0087, + "step": 566020 + }, + { + "epoch": 1.47, + "learning_rate": 7.991528872598702e-05, + "loss": 0.0073, + "step": 566030 + }, + { + "epoch": 1.47, + "learning_rate": 7.991140050961555e-05, + "loss": 0.009, + "step": 566040 + }, + { + "epoch": 1.47, + "learning_rate": 7.990751229324409e-05, + "loss": 0.0072, + "step": 566050 + }, + { + "epoch": 1.47, + "learning_rate": 7.990362407687261e-05, + "loss": 0.0093, + "step": 566060 + }, + { + "epoch": 1.47, + "learning_rate": 7.989973586050116e-05, + "loss": 0.0075, + "step": 566070 + }, + { + "epoch": 1.47, + "learning_rate": 7.989584764412968e-05, + "loss": 0.0098, + "step": 566080 + }, + { + "epoch": 1.47, + "learning_rate": 7.989195942775824e-05, + "loss": 0.0078, + "step": 566090 + }, + { + "epoch": 1.47, + "learning_rate": 7.988807121138677e-05, + "loss": 0.0097, + "step": 566100 + }, + { + "epoch": 1.47, + "learning_rate": 7.988418299501531e-05, + "loss": 0.0089, + "step": 566110 + }, + { + "epoch": 1.47, + "learning_rate": 7.988029477864384e-05, + "loss": 0.0073, + "step": 566120 + }, + { + "epoch": 1.47, + "learning_rate": 7.987640656227238e-05, + "loss": 0.0061, + "step": 566130 + }, + { + "epoch": 1.47, + "learning_rate": 7.987251834590091e-05, + "loss": 0.0097, + "step": 566140 + }, + { + "epoch": 1.47, + "learning_rate": 7.986863012952945e-05, + "loss": 0.0092, + "step": 566150 + }, + { + "epoch": 1.47, + "learning_rate": 7.986474191315798e-05, + "loss": 0.0067, + "step": 566160 + }, + { + "epoch": 1.47, + "learning_rate": 7.986085369678652e-05, + "loss": 0.0098, + "step": 566170 + }, + { + "epoch": 1.47, + "learning_rate": 7.985696548041505e-05, + "loss": 0.0082, + "step": 566180 + }, + { + "epoch": 1.47, + "learning_rate": 7.985307726404357e-05, + "loss": 0.01, + "step": 566190 + }, + { + "epoch": 1.47, + "learning_rate": 7.984918904767212e-05, + "loss": 0.0097, + "step": 566200 + }, + { + "epoch": 1.47, + "learning_rate": 7.984530083130064e-05, + "loss": 0.0085, + "step": 566210 + }, + { + "epoch": 1.47, + "learning_rate": 7.984141261492919e-05, + "loss": 0.0087, + "step": 566220 + }, + { + "epoch": 1.47, + "learning_rate": 7.983752439855771e-05, + "loss": 0.0092, + "step": 566230 + }, + { + "epoch": 1.47, + "learning_rate": 7.983363618218626e-05, + "loss": 0.013, + "step": 566240 + }, + { + "epoch": 1.47, + "learning_rate": 7.982974796581478e-05, + "loss": 0.0089, + "step": 566250 + }, + { + "epoch": 1.47, + "learning_rate": 7.982585974944334e-05, + "loss": 0.0085, + "step": 566260 + }, + { + "epoch": 1.47, + "learning_rate": 7.982197153307185e-05, + "loss": 0.0096, + "step": 566270 + }, + { + "epoch": 1.47, + "learning_rate": 7.981808331670041e-05, + "loss": 0.0068, + "step": 566280 + }, + { + "epoch": 1.47, + "learning_rate": 7.981419510032894e-05, + "loss": 0.0123, + "step": 566290 + }, + { + "epoch": 1.47, + "learning_rate": 7.981030688395748e-05, + "loss": 0.0109, + "step": 566300 + }, + { + "epoch": 1.47, + "learning_rate": 7.9806418667586e-05, + "loss": 0.0105, + "step": 566310 + }, + { + "epoch": 1.47, + "learning_rate": 7.980253045121455e-05, + "loss": 0.0084, + "step": 566320 + }, + { + "epoch": 1.47, + "learning_rate": 7.979864223484308e-05, + "loss": 0.0099, + "step": 566330 + }, + { + "epoch": 1.47, + "learning_rate": 7.979475401847162e-05, + "loss": 0.0105, + "step": 566340 + }, + { + "epoch": 1.47, + "learning_rate": 7.979086580210015e-05, + "loss": 0.0093, + "step": 566350 + }, + { + "epoch": 1.47, + "learning_rate": 7.978697758572869e-05, + "loss": 0.0115, + "step": 566360 + }, + { + "epoch": 1.47, + "learning_rate": 7.978308936935722e-05, + "loss": 0.0128, + "step": 566370 + }, + { + "epoch": 1.47, + "learning_rate": 7.977920115298576e-05, + "loss": 0.0139, + "step": 566380 + }, + { + "epoch": 1.47, + "learning_rate": 7.977531293661429e-05, + "loss": 0.0115, + "step": 566390 + }, + { + "epoch": 1.47, + "learning_rate": 7.977142472024283e-05, + "loss": 0.0091, + "step": 566400 + }, + { + "epoch": 1.47, + "learning_rate": 7.976753650387136e-05, + "loss": 0.0077, + "step": 566410 + }, + { + "epoch": 1.47, + "learning_rate": 7.976364828749991e-05, + "loss": 0.0091, + "step": 566420 + }, + { + "epoch": 1.47, + "learning_rate": 7.975976007112843e-05, + "loss": 0.0091, + "step": 566430 + }, + { + "epoch": 1.47, + "learning_rate": 7.975587185475695e-05, + "loss": 0.0078, + "step": 566440 + }, + { + "epoch": 1.47, + "learning_rate": 7.975198363838551e-05, + "loss": 0.0107, + "step": 566450 + }, + { + "epoch": 1.47, + "learning_rate": 7.974809542201404e-05, + "loss": 0.0077, + "step": 566460 + }, + { + "epoch": 1.47, + "learning_rate": 7.974420720564258e-05, + "loss": 0.0064, + "step": 566470 + }, + { + "epoch": 1.47, + "learning_rate": 7.97403189892711e-05, + "loss": 0.01, + "step": 566480 + }, + { + "epoch": 1.47, + "learning_rate": 7.973643077289965e-05, + "loss": 0.0094, + "step": 566490 + }, + { + "epoch": 1.47, + "learning_rate": 7.973254255652818e-05, + "loss": 0.0075, + "step": 566500 + }, + { + "epoch": 1.47, + "learning_rate": 7.972865434015672e-05, + "loss": 0.0101, + "step": 566510 + }, + { + "epoch": 1.47, + "learning_rate": 7.972476612378525e-05, + "loss": 0.0072, + "step": 566520 + }, + { + "epoch": 1.47, + "learning_rate": 7.972087790741379e-05, + "loss": 0.011, + "step": 566530 + }, + { + "epoch": 1.47, + "learning_rate": 7.971698969104232e-05, + "loss": 0.0093, + "step": 566540 + }, + { + "epoch": 1.47, + "learning_rate": 7.971310147467086e-05, + "loss": 0.0103, + "step": 566550 + }, + { + "epoch": 1.47, + "learning_rate": 7.970921325829939e-05, + "loss": 0.0093, + "step": 566560 + }, + { + "epoch": 1.47, + "learning_rate": 7.970532504192793e-05, + "loss": 0.0095, + "step": 566570 + }, + { + "epoch": 1.47, + "learning_rate": 7.970143682555645e-05, + "loss": 0.0073, + "step": 566580 + }, + { + "epoch": 1.47, + "learning_rate": 7.9697548609185e-05, + "loss": 0.0077, + "step": 566590 + }, + { + "epoch": 1.47, + "learning_rate": 7.969366039281352e-05, + "loss": 0.0074, + "step": 566600 + }, + { + "epoch": 1.47, + "learning_rate": 7.968977217644208e-05, + "loss": 0.0099, + "step": 566610 + }, + { + "epoch": 1.47, + "learning_rate": 7.968588396007061e-05, + "loss": 0.0109, + "step": 566620 + }, + { + "epoch": 1.47, + "learning_rate": 7.968199574369915e-05, + "loss": 0.0112, + "step": 566630 + }, + { + "epoch": 1.47, + "learning_rate": 7.967810752732768e-05, + "loss": 0.0076, + "step": 566640 + }, + { + "epoch": 1.47, + "learning_rate": 7.967421931095622e-05, + "loss": 0.0104, + "step": 566650 + }, + { + "epoch": 1.47, + "learning_rate": 7.967033109458475e-05, + "loss": 0.0079, + "step": 566660 + }, + { + "epoch": 1.47, + "learning_rate": 7.966644287821329e-05, + "loss": 0.0092, + "step": 566670 + }, + { + "epoch": 1.47, + "learning_rate": 7.966255466184182e-05, + "loss": 0.0098, + "step": 566680 + }, + { + "epoch": 1.47, + "learning_rate": 7.965866644547035e-05, + "loss": 0.0097, + "step": 566690 + }, + { + "epoch": 1.47, + "learning_rate": 7.965477822909889e-05, + "loss": 0.0073, + "step": 566700 + }, + { + "epoch": 1.47, + "learning_rate": 7.965089001272741e-05, + "loss": 0.0079, + "step": 566710 + }, + { + "epoch": 1.47, + "learning_rate": 7.964700179635596e-05, + "loss": 0.0096, + "step": 566720 + }, + { + "epoch": 1.47, + "learning_rate": 7.964311357998448e-05, + "loss": 0.0112, + "step": 566730 + }, + { + "epoch": 1.47, + "learning_rate": 7.963922536361303e-05, + "loss": 0.0059, + "step": 566740 + }, + { + "epoch": 1.47, + "learning_rate": 7.963533714724155e-05, + "loss": 0.0072, + "step": 566750 + }, + { + "epoch": 1.47, + "learning_rate": 7.96314489308701e-05, + "loss": 0.0109, + "step": 566760 + }, + { + "epoch": 1.47, + "learning_rate": 7.962756071449862e-05, + "loss": 0.0119, + "step": 566770 + }, + { + "epoch": 1.47, + "learning_rate": 7.962367249812717e-05, + "loss": 0.0085, + "step": 566780 + }, + { + "epoch": 1.47, + "learning_rate": 7.96197842817557e-05, + "loss": 0.0096, + "step": 566790 + }, + { + "epoch": 1.47, + "learning_rate": 7.961589606538425e-05, + "loss": 0.0105, + "step": 566800 + }, + { + "epoch": 1.47, + "learning_rate": 7.961200784901278e-05, + "loss": 0.0085, + "step": 566810 + }, + { + "epoch": 1.47, + "learning_rate": 7.960811963264132e-05, + "loss": 0.0102, + "step": 566820 + }, + { + "epoch": 1.47, + "learning_rate": 7.960423141626985e-05, + "loss": 0.0068, + "step": 566830 + }, + { + "epoch": 1.47, + "learning_rate": 7.960034319989839e-05, + "loss": 0.007, + "step": 566840 + }, + { + "epoch": 1.47, + "learning_rate": 7.959645498352692e-05, + "loss": 0.0095, + "step": 566850 + }, + { + "epoch": 1.47, + "learning_rate": 7.959256676715546e-05, + "loss": 0.0087, + "step": 566860 + }, + { + "epoch": 1.47, + "learning_rate": 7.958867855078399e-05, + "loss": 0.0071, + "step": 566870 + }, + { + "epoch": 1.47, + "learning_rate": 7.958479033441253e-05, + "loss": 0.0062, + "step": 566880 + }, + { + "epoch": 1.47, + "learning_rate": 7.958090211804106e-05, + "loss": 0.008, + "step": 566890 + }, + { + "epoch": 1.47, + "learning_rate": 7.95770139016696e-05, + "loss": 0.0088, + "step": 566900 + }, + { + "epoch": 1.47, + "learning_rate": 7.957312568529813e-05, + "loss": 0.0076, + "step": 566910 + }, + { + "epoch": 1.47, + "learning_rate": 7.956923746892667e-05, + "loss": 0.009, + "step": 566920 + }, + { + "epoch": 1.47, + "learning_rate": 7.95653492525552e-05, + "loss": 0.0105, + "step": 566930 + }, + { + "epoch": 1.47, + "learning_rate": 7.956146103618372e-05, + "loss": 0.01, + "step": 566940 + }, + { + "epoch": 1.47, + "learning_rate": 7.955757281981226e-05, + "loss": 0.0122, + "step": 566950 + }, + { + "epoch": 1.47, + "learning_rate": 7.955368460344079e-05, + "loss": 0.009, + "step": 566960 + }, + { + "epoch": 1.47, + "learning_rate": 7.954979638706935e-05, + "loss": 0.01, + "step": 566970 + }, + { + "epoch": 1.47, + "learning_rate": 7.954590817069788e-05, + "loss": 0.0123, + "step": 566980 + }, + { + "epoch": 1.47, + "learning_rate": 7.954201995432642e-05, + "loss": 0.01, + "step": 566990 + }, + { + "epoch": 1.47, + "learning_rate": 7.953813173795495e-05, + "loss": 0.0095, + "step": 567000 + }, + { + "epoch": 1.47, + "eval_cer": 0.88167329394755, + "eval_loss": 0.006201473996043205, + "eval_runtime": 108.0039, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.629, + "step": 567000 + }, + { + "epoch": 1.47, + "learning_rate": 7.953424352158349e-05, + "loss": 0.0078, + "step": 567010 + }, + { + "epoch": 1.47, + "learning_rate": 7.953035530521202e-05, + "loss": 0.0085, + "step": 567020 + }, + { + "epoch": 1.47, + "learning_rate": 7.952646708884056e-05, + "loss": 0.0086, + "step": 567030 + }, + { + "epoch": 1.47, + "learning_rate": 7.952257887246909e-05, + "loss": 0.0086, + "step": 567040 + }, + { + "epoch": 1.47, + "learning_rate": 7.951869065609763e-05, + "loss": 0.0078, + "step": 567050 + }, + { + "epoch": 1.47, + "learning_rate": 7.951480243972616e-05, + "loss": 0.0105, + "step": 567060 + }, + { + "epoch": 1.47, + "learning_rate": 7.95109142233547e-05, + "loss": 0.0082, + "step": 567070 + }, + { + "epoch": 1.47, + "learning_rate": 7.950702600698322e-05, + "loss": 0.0089, + "step": 567080 + }, + { + "epoch": 1.47, + "learning_rate": 7.950313779061177e-05, + "loss": 0.0104, + "step": 567090 + }, + { + "epoch": 1.47, + "learning_rate": 7.94992495742403e-05, + "loss": 0.0099, + "step": 567100 + }, + { + "epoch": 1.47, + "learning_rate": 7.949536135786884e-05, + "loss": 0.0161, + "step": 567110 + }, + { + "epoch": 1.47, + "learning_rate": 7.949147314149736e-05, + "loss": 0.0083, + "step": 567120 + }, + { + "epoch": 1.47, + "learning_rate": 7.948758492512592e-05, + "loss": 0.0114, + "step": 567130 + }, + { + "epoch": 1.47, + "learning_rate": 7.948369670875443e-05, + "loss": 0.0086, + "step": 567140 + }, + { + "epoch": 1.47, + "learning_rate": 7.947980849238299e-05, + "loss": 0.0095, + "step": 567150 + }, + { + "epoch": 1.47, + "learning_rate": 7.947592027601152e-05, + "loss": 0.0089, + "step": 567160 + }, + { + "epoch": 1.47, + "learning_rate": 7.947203205964006e-05, + "loss": 0.0128, + "step": 567170 + }, + { + "epoch": 1.47, + "learning_rate": 7.946814384326859e-05, + "loss": 0.009, + "step": 567180 + }, + { + "epoch": 1.47, + "learning_rate": 7.946425562689712e-05, + "loss": 0.013, + "step": 567190 + }, + { + "epoch": 1.47, + "learning_rate": 7.946036741052566e-05, + "loss": 0.0078, + "step": 567200 + }, + { + "epoch": 1.47, + "learning_rate": 7.945647919415418e-05, + "loss": 0.009, + "step": 567210 + }, + { + "epoch": 1.47, + "learning_rate": 7.945259097778273e-05, + "loss": 0.0096, + "step": 567220 + }, + { + "epoch": 1.47, + "learning_rate": 7.944870276141125e-05, + "loss": 0.0089, + "step": 567230 + }, + { + "epoch": 1.47, + "learning_rate": 7.94448145450398e-05, + "loss": 0.0103, + "step": 567240 + }, + { + "epoch": 1.47, + "learning_rate": 7.944092632866832e-05, + "loss": 0.0094, + "step": 567250 + }, + { + "epoch": 1.47, + "learning_rate": 7.943703811229687e-05, + "loss": 0.0093, + "step": 567260 + }, + { + "epoch": 1.47, + "learning_rate": 7.94331498959254e-05, + "loss": 0.008, + "step": 567270 + }, + { + "epoch": 1.47, + "learning_rate": 7.942926167955394e-05, + "loss": 0.0095, + "step": 567280 + }, + { + "epoch": 1.47, + "learning_rate": 7.942537346318246e-05, + "loss": 0.0096, + "step": 567290 + }, + { + "epoch": 1.47, + "learning_rate": 7.9421485246811e-05, + "loss": 0.0083, + "step": 567300 + }, + { + "epoch": 1.47, + "learning_rate": 7.941759703043953e-05, + "loss": 0.01, + "step": 567310 + }, + { + "epoch": 1.47, + "learning_rate": 7.941370881406809e-05, + "loss": 0.0095, + "step": 567320 + }, + { + "epoch": 1.47, + "learning_rate": 7.940982059769662e-05, + "loss": 0.0078, + "step": 567330 + }, + { + "epoch": 1.47, + "learning_rate": 7.940593238132516e-05, + "loss": 0.0113, + "step": 567340 + }, + { + "epoch": 1.47, + "learning_rate": 7.940204416495369e-05, + "loss": 0.0099, + "step": 567350 + }, + { + "epoch": 1.47, + "learning_rate": 7.939815594858223e-05, + "loss": 0.0095, + "step": 567360 + }, + { + "epoch": 1.47, + "learning_rate": 7.939426773221076e-05, + "loss": 0.0119, + "step": 567370 + }, + { + "epoch": 1.47, + "learning_rate": 7.93903795158393e-05, + "loss": 0.01, + "step": 567380 + }, + { + "epoch": 1.47, + "learning_rate": 7.938649129946783e-05, + "loss": 0.0097, + "step": 567390 + }, + { + "epoch": 1.47, + "learning_rate": 7.938260308309637e-05, + "loss": 0.0111, + "step": 567400 + }, + { + "epoch": 1.47, + "learning_rate": 7.93787148667249e-05, + "loss": 0.0089, + "step": 567410 + }, + { + "epoch": 1.47, + "learning_rate": 7.937482665035342e-05, + "loss": 0.0105, + "step": 567420 + }, + { + "epoch": 1.47, + "learning_rate": 7.937093843398197e-05, + "loss": 0.0085, + "step": 567430 + }, + { + "epoch": 1.47, + "learning_rate": 7.93670502176105e-05, + "loss": 0.0106, + "step": 567440 + }, + { + "epoch": 1.47, + "learning_rate": 7.936316200123904e-05, + "loss": 0.0121, + "step": 567450 + }, + { + "epoch": 1.47, + "learning_rate": 7.935927378486756e-05, + "loss": 0.0103, + "step": 567460 + }, + { + "epoch": 1.47, + "learning_rate": 7.93553855684961e-05, + "loss": 0.0115, + "step": 567470 + }, + { + "epoch": 1.47, + "learning_rate": 7.935149735212463e-05, + "loss": 0.0093, + "step": 567480 + }, + { + "epoch": 1.47, + "learning_rate": 7.934760913575319e-05, + "loss": 0.0082, + "step": 567490 + }, + { + "epoch": 1.47, + "learning_rate": 7.93437209193817e-05, + "loss": 0.012, + "step": 567500 + }, + { + "epoch": 1.47, + "learning_rate": 7.933983270301026e-05, + "loss": 0.0072, + "step": 567510 + }, + { + "epoch": 1.47, + "learning_rate": 7.933594448663879e-05, + "loss": 0.0072, + "step": 567520 + }, + { + "epoch": 1.47, + "learning_rate": 7.933205627026733e-05, + "loss": 0.0082, + "step": 567530 + }, + { + "epoch": 1.47, + "learning_rate": 7.932816805389586e-05, + "loss": 0.0089, + "step": 567540 + }, + { + "epoch": 1.47, + "learning_rate": 7.93242798375244e-05, + "loss": 0.0104, + "step": 567550 + }, + { + "epoch": 1.47, + "learning_rate": 7.932039162115293e-05, + "loss": 0.009, + "step": 567560 + }, + { + "epoch": 1.47, + "learning_rate": 7.931650340478147e-05, + "loss": 0.01, + "step": 567570 + }, + { + "epoch": 1.47, + "learning_rate": 7.931261518841e-05, + "loss": 0.0069, + "step": 567580 + }, + { + "epoch": 1.47, + "learning_rate": 7.930872697203854e-05, + "loss": 0.0093, + "step": 567590 + }, + { + "epoch": 1.47, + "learning_rate": 7.930483875566706e-05, + "loss": 0.0075, + "step": 567600 + }, + { + "epoch": 1.47, + "learning_rate": 7.93009505392956e-05, + "loss": 0.0081, + "step": 567610 + }, + { + "epoch": 1.47, + "learning_rate": 7.929706232292413e-05, + "loss": 0.0091, + "step": 567620 + }, + { + "epoch": 1.47, + "learning_rate": 7.929317410655268e-05, + "loss": 0.0089, + "step": 567630 + }, + { + "epoch": 1.47, + "learning_rate": 7.92892858901812e-05, + "loss": 0.0081, + "step": 567640 + }, + { + "epoch": 1.47, + "learning_rate": 7.928539767380976e-05, + "loss": 0.0093, + "step": 567650 + }, + { + "epoch": 1.47, + "learning_rate": 7.928150945743827e-05, + "loss": 0.0105, + "step": 567660 + }, + { + "epoch": 1.47, + "learning_rate": 7.92776212410668e-05, + "loss": 0.0104, + "step": 567670 + }, + { + "epoch": 1.47, + "learning_rate": 7.927373302469536e-05, + "loss": 0.0091, + "step": 567680 + }, + { + "epoch": 1.47, + "learning_rate": 7.926984480832389e-05, + "loss": 0.0073, + "step": 567690 + }, + { + "epoch": 1.47, + "learning_rate": 7.926595659195243e-05, + "loss": 0.011, + "step": 567700 + }, + { + "epoch": 1.47, + "learning_rate": 7.926206837558096e-05, + "loss": 0.0114, + "step": 567710 + }, + { + "epoch": 1.47, + "learning_rate": 7.92581801592095e-05, + "loss": 0.0082, + "step": 567720 + }, + { + "epoch": 1.47, + "learning_rate": 7.925429194283802e-05, + "loss": 0.0086, + "step": 567730 + }, + { + "epoch": 1.47, + "learning_rate": 7.925040372646657e-05, + "loss": 0.0101, + "step": 567740 + }, + { + "epoch": 1.47, + "learning_rate": 7.92465155100951e-05, + "loss": 0.0079, + "step": 567750 + }, + { + "epoch": 1.47, + "learning_rate": 7.924262729372364e-05, + "loss": 0.008, + "step": 567760 + }, + { + "epoch": 1.47, + "learning_rate": 7.923873907735216e-05, + "loss": 0.009, + "step": 567770 + }, + { + "epoch": 1.47, + "learning_rate": 7.92348508609807e-05, + "loss": 0.0076, + "step": 567780 + }, + { + "epoch": 1.47, + "learning_rate": 7.923096264460923e-05, + "loss": 0.0098, + "step": 567790 + }, + { + "epoch": 1.47, + "learning_rate": 7.922707442823778e-05, + "loss": 0.0096, + "step": 567800 + }, + { + "epoch": 1.47, + "learning_rate": 7.92231862118663e-05, + "loss": 0.0085, + "step": 567810 + }, + { + "epoch": 1.47, + "learning_rate": 7.921929799549485e-05, + "loss": 0.01, + "step": 567820 + }, + { + "epoch": 1.47, + "learning_rate": 7.921540977912337e-05, + "loss": 0.0091, + "step": 567830 + }, + { + "epoch": 1.47, + "learning_rate": 7.921152156275193e-05, + "loss": 0.0091, + "step": 567840 + }, + { + "epoch": 1.47, + "learning_rate": 7.920763334638046e-05, + "loss": 0.0065, + "step": 567850 + }, + { + "epoch": 1.47, + "learning_rate": 7.9203745130009e-05, + "loss": 0.0121, + "step": 567860 + }, + { + "epoch": 1.47, + "learning_rate": 7.919985691363753e-05, + "loss": 0.0118, + "step": 567870 + }, + { + "epoch": 1.47, + "learning_rate": 7.919596869726607e-05, + "loss": 0.0093, + "step": 567880 + }, + { + "epoch": 1.47, + "learning_rate": 7.91920804808946e-05, + "loss": 0.0082, + "step": 567890 + }, + { + "epoch": 1.47, + "learning_rate": 7.918819226452314e-05, + "loss": 0.0106, + "step": 567900 + }, + { + "epoch": 1.47, + "learning_rate": 7.918430404815167e-05, + "loss": 0.0122, + "step": 567910 + }, + { + "epoch": 1.47, + "learning_rate": 7.91804158317802e-05, + "loss": 0.0091, + "step": 567920 + }, + { + "epoch": 1.47, + "learning_rate": 7.917652761540874e-05, + "loss": 0.0086, + "step": 567930 + }, + { + "epoch": 1.47, + "learning_rate": 7.917263939903726e-05, + "loss": 0.0093, + "step": 567940 + }, + { + "epoch": 1.47, + "learning_rate": 7.91687511826658e-05, + "loss": 0.0095, + "step": 567950 + }, + { + "epoch": 1.47, + "learning_rate": 7.916486296629433e-05, + "loss": 0.0099, + "step": 567960 + }, + { + "epoch": 1.47, + "learning_rate": 7.916097474992288e-05, + "loss": 0.0093, + "step": 567970 + }, + { + "epoch": 1.47, + "learning_rate": 7.91570865335514e-05, + "loss": 0.0104, + "step": 567980 + }, + { + "epoch": 1.47, + "learning_rate": 7.915319831717994e-05, + "loss": 0.0097, + "step": 567990 + }, + { + "epoch": 1.47, + "learning_rate": 7.914931010080847e-05, + "loss": 0.0078, + "step": 568000 + }, + { + "epoch": 1.47, + "eval_cer": 0.8817166826925096, + "eval_loss": 0.00597924692556262, + "eval_runtime": 108.0502, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.627, + "step": 568000 + }, + { + "epoch": 1.47, + "learning_rate": 7.914542188443703e-05, + "loss": 0.0069, + "step": 568010 + }, + { + "epoch": 1.47, + "learning_rate": 7.914153366806554e-05, + "loss": 0.0116, + "step": 568020 + }, + { + "epoch": 1.47, + "learning_rate": 7.91376454516941e-05, + "loss": 0.0092, + "step": 568030 + }, + { + "epoch": 1.47, + "learning_rate": 7.913375723532263e-05, + "loss": 0.008, + "step": 568040 + }, + { + "epoch": 1.47, + "learning_rate": 7.912986901895117e-05, + "loss": 0.0079, + "step": 568050 + }, + { + "epoch": 1.47, + "learning_rate": 7.91259808025797e-05, + "loss": 0.0103, + "step": 568060 + }, + { + "epoch": 1.47, + "learning_rate": 7.912209258620824e-05, + "loss": 0.0118, + "step": 568070 + }, + { + "epoch": 1.47, + "learning_rate": 7.911820436983677e-05, + "loss": 0.0117, + "step": 568080 + }, + { + "epoch": 1.47, + "learning_rate": 7.911431615346531e-05, + "loss": 0.01, + "step": 568090 + }, + { + "epoch": 1.47, + "learning_rate": 7.911042793709384e-05, + "loss": 0.0088, + "step": 568100 + }, + { + "epoch": 1.47, + "learning_rate": 7.910653972072238e-05, + "loss": 0.0087, + "step": 568110 + }, + { + "epoch": 1.47, + "learning_rate": 7.91026515043509e-05, + "loss": 0.0118, + "step": 568120 + }, + { + "epoch": 1.47, + "learning_rate": 7.909876328797945e-05, + "loss": 0.01, + "step": 568130 + }, + { + "epoch": 1.47, + "learning_rate": 7.909487507160797e-05, + "loss": 0.0072, + "step": 568140 + }, + { + "epoch": 1.47, + "learning_rate": 7.909098685523652e-05, + "loss": 0.0112, + "step": 568150 + }, + { + "epoch": 1.47, + "learning_rate": 7.908709863886504e-05, + "loss": 0.0071, + "step": 568160 + }, + { + "epoch": 1.47, + "learning_rate": 7.908321042249357e-05, + "loss": 0.0095, + "step": 568170 + }, + { + "epoch": 1.47, + "learning_rate": 7.907932220612211e-05, + "loss": 0.0101, + "step": 568180 + }, + { + "epoch": 1.47, + "learning_rate": 7.907543398975064e-05, + "loss": 0.0118, + "step": 568190 + }, + { + "epoch": 1.47, + "learning_rate": 7.90715457733792e-05, + "loss": 0.008, + "step": 568200 + }, + { + "epoch": 1.47, + "learning_rate": 7.906765755700773e-05, + "loss": 0.0128, + "step": 568210 + }, + { + "epoch": 1.47, + "learning_rate": 7.906376934063627e-05, + "loss": 0.0096, + "step": 568220 + }, + { + "epoch": 1.47, + "learning_rate": 7.90598811242648e-05, + "loss": 0.0088, + "step": 568230 + }, + { + "epoch": 1.47, + "learning_rate": 7.905599290789334e-05, + "loss": 0.0123, + "step": 568240 + }, + { + "epoch": 1.47, + "learning_rate": 7.905210469152186e-05, + "loss": 0.0081, + "step": 568250 + }, + { + "epoch": 1.47, + "learning_rate": 7.90482164751504e-05, + "loss": 0.0117, + "step": 568260 + }, + { + "epoch": 1.47, + "learning_rate": 7.904432825877893e-05, + "loss": 0.0101, + "step": 568270 + }, + { + "epoch": 1.47, + "learning_rate": 7.904044004240748e-05, + "loss": 0.0088, + "step": 568280 + }, + { + "epoch": 1.47, + "learning_rate": 7.9036551826036e-05, + "loss": 0.0107, + "step": 568290 + }, + { + "epoch": 1.47, + "learning_rate": 7.903266360966455e-05, + "loss": 0.0065, + "step": 568300 + }, + { + "epoch": 1.47, + "learning_rate": 7.902877539329307e-05, + "loss": 0.0075, + "step": 568310 + }, + { + "epoch": 1.47, + "learning_rate": 7.902488717692162e-05, + "loss": 0.0075, + "step": 568320 + }, + { + "epoch": 1.47, + "learning_rate": 7.902099896055014e-05, + "loss": 0.01, + "step": 568330 + }, + { + "epoch": 1.47, + "learning_rate": 7.901711074417869e-05, + "loss": 0.0106, + "step": 568340 + }, + { + "epoch": 1.47, + "learning_rate": 7.901322252780721e-05, + "loss": 0.0072, + "step": 568350 + }, + { + "epoch": 1.47, + "learning_rate": 7.900933431143577e-05, + "loss": 0.0117, + "step": 568360 + }, + { + "epoch": 1.47, + "learning_rate": 7.900544609506428e-05, + "loss": 0.0087, + "step": 568370 + }, + { + "epoch": 1.47, + "learning_rate": 7.900155787869284e-05, + "loss": 0.0088, + "step": 568380 + }, + { + "epoch": 1.47, + "learning_rate": 7.899766966232137e-05, + "loss": 0.0103, + "step": 568390 + }, + { + "epoch": 1.47, + "learning_rate": 7.899378144594991e-05, + "loss": 0.0093, + "step": 568400 + }, + { + "epoch": 1.47, + "learning_rate": 7.898989322957844e-05, + "loss": 0.0096, + "step": 568410 + }, + { + "epoch": 1.47, + "learning_rate": 7.898600501320696e-05, + "loss": 0.0109, + "step": 568420 + }, + { + "epoch": 1.47, + "learning_rate": 7.89821167968355e-05, + "loss": 0.0158, + "step": 568430 + }, + { + "epoch": 1.47, + "learning_rate": 7.897822858046403e-05, + "loss": 0.0086, + "step": 568440 + }, + { + "epoch": 1.47, + "learning_rate": 7.897434036409258e-05, + "loss": 0.009, + "step": 568450 + }, + { + "epoch": 1.47, + "learning_rate": 7.89704521477211e-05, + "loss": 0.0079, + "step": 568460 + }, + { + "epoch": 1.47, + "learning_rate": 7.896656393134965e-05, + "loss": 0.0116, + "step": 568470 + }, + { + "epoch": 1.47, + "learning_rate": 7.896267571497817e-05, + "loss": 0.0095, + "step": 568480 + }, + { + "epoch": 1.47, + "learning_rate": 7.895878749860671e-05, + "loss": 0.0085, + "step": 568490 + }, + { + "epoch": 1.47, + "learning_rate": 7.895489928223524e-05, + "loss": 0.0096, + "step": 568500 + }, + { + "epoch": 1.47, + "learning_rate": 7.895101106586378e-05, + "loss": 0.0153, + "step": 568510 + }, + { + "epoch": 1.47, + "learning_rate": 7.894712284949231e-05, + "loss": 0.0092, + "step": 568520 + }, + { + "epoch": 1.47, + "learning_rate": 7.894323463312085e-05, + "loss": 0.0089, + "step": 568530 + }, + { + "epoch": 1.47, + "learning_rate": 7.893934641674938e-05, + "loss": 0.0098, + "step": 568540 + }, + { + "epoch": 1.47, + "learning_rate": 7.893545820037794e-05, + "loss": 0.0081, + "step": 568550 + }, + { + "epoch": 1.47, + "learning_rate": 7.893156998400647e-05, + "loss": 0.0156, + "step": 568560 + }, + { + "epoch": 1.47, + "learning_rate": 7.892768176763501e-05, + "loss": 0.0088, + "step": 568570 + }, + { + "epoch": 1.47, + "learning_rate": 7.892379355126354e-05, + "loss": 0.0101, + "step": 568580 + }, + { + "epoch": 1.47, + "learning_rate": 7.891990533489208e-05, + "loss": 0.0109, + "step": 568590 + }, + { + "epoch": 1.47, + "learning_rate": 7.89160171185206e-05, + "loss": 0.0112, + "step": 568600 + }, + { + "epoch": 1.47, + "learning_rate": 7.891212890214915e-05, + "loss": 0.0104, + "step": 568610 + }, + { + "epoch": 1.47, + "learning_rate": 7.890824068577767e-05, + "loss": 0.0118, + "step": 568620 + }, + { + "epoch": 1.47, + "learning_rate": 7.890435246940622e-05, + "loss": 0.0127, + "step": 568630 + }, + { + "epoch": 1.47, + "learning_rate": 7.890046425303474e-05, + "loss": 0.0087, + "step": 568640 + }, + { + "epoch": 1.47, + "learning_rate": 7.889657603666329e-05, + "loss": 0.0093, + "step": 568650 + }, + { + "epoch": 1.47, + "learning_rate": 7.889268782029181e-05, + "loss": 0.0078, + "step": 568660 + }, + { + "epoch": 1.47, + "learning_rate": 7.888879960392034e-05, + "loss": 0.0068, + "step": 568670 + }, + { + "epoch": 1.47, + "learning_rate": 7.888491138754888e-05, + "loss": 0.0093, + "step": 568680 + }, + { + "epoch": 1.47, + "learning_rate": 7.888102317117741e-05, + "loss": 0.009, + "step": 568690 + }, + { + "epoch": 1.47, + "learning_rate": 7.887713495480595e-05, + "loss": 0.0089, + "step": 568700 + }, + { + "epoch": 1.47, + "learning_rate": 7.887324673843448e-05, + "loss": 0.0117, + "step": 568710 + }, + { + "epoch": 1.47, + "learning_rate": 7.886935852206304e-05, + "loss": 0.0078, + "step": 568720 + }, + { + "epoch": 1.47, + "learning_rate": 7.886547030569155e-05, + "loss": 0.0112, + "step": 568730 + }, + { + "epoch": 1.47, + "learning_rate": 7.886158208932011e-05, + "loss": 0.0084, + "step": 568740 + }, + { + "epoch": 1.47, + "learning_rate": 7.885769387294863e-05, + "loss": 0.0072, + "step": 568750 + }, + { + "epoch": 1.47, + "learning_rate": 7.885380565657718e-05, + "loss": 0.0104, + "step": 568760 + }, + { + "epoch": 1.47, + "learning_rate": 7.88499174402057e-05, + "loss": 0.0088, + "step": 568770 + }, + { + "epoch": 1.47, + "learning_rate": 7.884602922383425e-05, + "loss": 0.0064, + "step": 568780 + }, + { + "epoch": 1.47, + "learning_rate": 7.884214100746277e-05, + "loss": 0.0078, + "step": 568790 + }, + { + "epoch": 1.47, + "learning_rate": 7.883825279109132e-05, + "loss": 0.011, + "step": 568800 + }, + { + "epoch": 1.47, + "learning_rate": 7.883436457471984e-05, + "loss": 0.0109, + "step": 568810 + }, + { + "epoch": 1.47, + "learning_rate": 7.883047635834839e-05, + "loss": 0.0111, + "step": 568820 + }, + { + "epoch": 1.47, + "learning_rate": 7.882658814197691e-05, + "loss": 0.0079, + "step": 568830 + }, + { + "epoch": 1.47, + "learning_rate": 7.882269992560546e-05, + "loss": 0.0079, + "step": 568840 + }, + { + "epoch": 1.47, + "learning_rate": 7.881881170923398e-05, + "loss": 0.0076, + "step": 568850 + }, + { + "epoch": 1.47, + "learning_rate": 7.881492349286253e-05, + "loss": 0.0084, + "step": 568860 + }, + { + "epoch": 1.47, + "learning_rate": 7.881103527649105e-05, + "loss": 0.0067, + "step": 568870 + }, + { + "epoch": 1.47, + "learning_rate": 7.880714706011961e-05, + "loss": 0.0101, + "step": 568880 + }, + { + "epoch": 1.47, + "learning_rate": 7.880325884374812e-05, + "loss": 0.0073, + "step": 568890 + }, + { + "epoch": 1.47, + "learning_rate": 7.879937062737668e-05, + "loss": 0.0087, + "step": 568900 + }, + { + "epoch": 1.47, + "learning_rate": 7.87954824110052e-05, + "loss": 0.0105, + "step": 568910 + }, + { + "epoch": 1.47, + "learning_rate": 7.879159419463373e-05, + "loss": 0.0071, + "step": 568920 + }, + { + "epoch": 1.47, + "learning_rate": 7.878770597826228e-05, + "loss": 0.0065, + "step": 568930 + }, + { + "epoch": 1.47, + "learning_rate": 7.87838177618908e-05, + "loss": 0.0073, + "step": 568940 + }, + { + "epoch": 1.47, + "learning_rate": 7.877992954551935e-05, + "loss": 0.0064, + "step": 568950 + }, + { + "epoch": 1.47, + "learning_rate": 7.877604132914787e-05, + "loss": 0.0083, + "step": 568960 + }, + { + "epoch": 1.47, + "learning_rate": 7.877215311277642e-05, + "loss": 0.0085, + "step": 568970 + }, + { + "epoch": 1.47, + "learning_rate": 7.876826489640494e-05, + "loss": 0.0077, + "step": 568980 + }, + { + "epoch": 1.47, + "learning_rate": 7.876437668003349e-05, + "loss": 0.0102, + "step": 568990 + }, + { + "epoch": 1.47, + "learning_rate": 7.876048846366201e-05, + "loss": 0.0089, + "step": 569000 + }, + { + "epoch": 1.47, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.006051726173609495, + "eval_runtime": 107.8929, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 569000 + }, + { + "epoch": 1.47, + "learning_rate": 7.875660024729055e-05, + "loss": 0.0087, + "step": 569010 + }, + { + "epoch": 1.47, + "learning_rate": 7.875271203091908e-05, + "loss": 0.0106, + "step": 569020 + }, + { + "epoch": 1.48, + "learning_rate": 7.874882381454762e-05, + "loss": 0.0075, + "step": 569030 + }, + { + "epoch": 1.48, + "learning_rate": 7.874493559817615e-05, + "loss": 0.0093, + "step": 569040 + }, + { + "epoch": 1.48, + "learning_rate": 7.87410473818047e-05, + "loss": 0.0096, + "step": 569050 + }, + { + "epoch": 1.48, + "learning_rate": 7.873715916543322e-05, + "loss": 0.0087, + "step": 569060 + }, + { + "epoch": 1.48, + "learning_rate": 7.873327094906178e-05, + "loss": 0.0067, + "step": 569070 + }, + { + "epoch": 1.48, + "learning_rate": 7.87293827326903e-05, + "loss": 0.01, + "step": 569080 + }, + { + "epoch": 1.48, + "learning_rate": 7.872549451631885e-05, + "loss": 0.0074, + "step": 569090 + }, + { + "epoch": 1.48, + "learning_rate": 7.872160629994738e-05, + "loss": 0.0089, + "step": 569100 + }, + { + "epoch": 1.48, + "learning_rate": 7.871771808357592e-05, + "loss": 0.0098, + "step": 569110 + }, + { + "epoch": 1.48, + "learning_rate": 7.871382986720445e-05, + "loss": 0.0114, + "step": 569120 + }, + { + "epoch": 1.48, + "learning_rate": 7.870994165083299e-05, + "loss": 0.0083, + "step": 569130 + }, + { + "epoch": 1.48, + "learning_rate": 7.870605343446151e-05, + "loss": 0.008, + "step": 569140 + }, + { + "epoch": 1.48, + "learning_rate": 7.870216521809006e-05, + "loss": 0.0102, + "step": 569150 + }, + { + "epoch": 1.48, + "learning_rate": 7.869827700171858e-05, + "loss": 0.0074, + "step": 569160 + }, + { + "epoch": 1.48, + "learning_rate": 7.869438878534711e-05, + "loss": 0.0081, + "step": 569170 + }, + { + "epoch": 1.48, + "learning_rate": 7.869050056897565e-05, + "loss": 0.0106, + "step": 569180 + }, + { + "epoch": 1.48, + "learning_rate": 7.868661235260418e-05, + "loss": 0.0079, + "step": 569190 + }, + { + "epoch": 1.48, + "learning_rate": 7.868272413623272e-05, + "loss": 0.0111, + "step": 569200 + }, + { + "epoch": 1.48, + "learning_rate": 7.867883591986125e-05, + "loss": 0.01, + "step": 569210 + }, + { + "epoch": 1.48, + "learning_rate": 7.86749477034898e-05, + "loss": 0.01, + "step": 569220 + }, + { + "epoch": 1.48, + "learning_rate": 7.867105948711832e-05, + "loss": 0.0107, + "step": 569230 + }, + { + "epoch": 1.48, + "learning_rate": 7.866717127074688e-05, + "loss": 0.0092, + "step": 569240 + }, + { + "epoch": 1.48, + "learning_rate": 7.866328305437539e-05, + "loss": 0.0094, + "step": 569250 + }, + { + "epoch": 1.48, + "learning_rate": 7.865939483800395e-05, + "loss": 0.0126, + "step": 569260 + }, + { + "epoch": 1.48, + "learning_rate": 7.865550662163247e-05, + "loss": 0.0083, + "step": 569270 + }, + { + "epoch": 1.48, + "learning_rate": 7.865161840526102e-05, + "loss": 0.0115, + "step": 569280 + }, + { + "epoch": 1.48, + "learning_rate": 7.864773018888954e-05, + "loss": 0.0093, + "step": 569290 + }, + { + "epoch": 1.48, + "learning_rate": 7.864384197251809e-05, + "loss": 0.0082, + "step": 569300 + }, + { + "epoch": 1.48, + "learning_rate": 7.863995375614661e-05, + "loss": 0.0078, + "step": 569310 + }, + { + "epoch": 1.48, + "learning_rate": 7.863606553977516e-05, + "loss": 0.0093, + "step": 569320 + }, + { + "epoch": 1.48, + "learning_rate": 7.863217732340368e-05, + "loss": 0.0075, + "step": 569330 + }, + { + "epoch": 1.48, + "learning_rate": 7.862828910703223e-05, + "loss": 0.0101, + "step": 569340 + }, + { + "epoch": 1.48, + "learning_rate": 7.862440089066075e-05, + "loss": 0.0082, + "step": 569350 + }, + { + "epoch": 1.48, + "learning_rate": 7.86205126742893e-05, + "loss": 0.0072, + "step": 569360 + }, + { + "epoch": 1.48, + "learning_rate": 7.861662445791782e-05, + "loss": 0.0085, + "step": 569370 + }, + { + "epoch": 1.48, + "learning_rate": 7.861273624154637e-05, + "loss": 0.0109, + "step": 569380 + }, + { + "epoch": 1.48, + "learning_rate": 7.860884802517489e-05, + "loss": 0.0112, + "step": 569390 + }, + { + "epoch": 1.48, + "learning_rate": 7.860495980880345e-05, + "loss": 0.009, + "step": 569400 + }, + { + "epoch": 1.48, + "learning_rate": 7.860107159243196e-05, + "loss": 0.0109, + "step": 569410 + }, + { + "epoch": 1.48, + "learning_rate": 7.859718337606049e-05, + "loss": 0.0117, + "step": 569420 + }, + { + "epoch": 1.48, + "learning_rate": 7.859329515968905e-05, + "loss": 0.0089, + "step": 569430 + }, + { + "epoch": 1.48, + "learning_rate": 7.858940694331757e-05, + "loss": 0.0084, + "step": 569440 + }, + { + "epoch": 1.48, + "learning_rate": 7.858551872694612e-05, + "loss": 0.0086, + "step": 569450 + }, + { + "epoch": 1.48, + "learning_rate": 7.858163051057464e-05, + "loss": 0.0087, + "step": 569460 + }, + { + "epoch": 1.48, + "learning_rate": 7.857774229420319e-05, + "loss": 0.0109, + "step": 569470 + }, + { + "epoch": 1.48, + "learning_rate": 7.857385407783171e-05, + "loss": 0.0078, + "step": 569480 + }, + { + "epoch": 1.48, + "learning_rate": 7.856996586146026e-05, + "loss": 0.0077, + "step": 569490 + }, + { + "epoch": 1.48, + "learning_rate": 7.856607764508878e-05, + "loss": 0.0065, + "step": 569500 + }, + { + "epoch": 1.48, + "learning_rate": 7.856218942871733e-05, + "loss": 0.0102, + "step": 569510 + }, + { + "epoch": 1.48, + "learning_rate": 7.855830121234585e-05, + "loss": 0.0093, + "step": 569520 + }, + { + "epoch": 1.48, + "learning_rate": 7.85544129959744e-05, + "loss": 0.0098, + "step": 569530 + }, + { + "epoch": 1.48, + "learning_rate": 7.855052477960292e-05, + "loss": 0.0083, + "step": 569540 + }, + { + "epoch": 1.48, + "learning_rate": 7.854663656323146e-05, + "loss": 0.0073, + "step": 569550 + }, + { + "epoch": 1.48, + "learning_rate": 7.854274834685999e-05, + "loss": 0.0117, + "step": 569560 + }, + { + "epoch": 1.48, + "learning_rate": 7.853886013048853e-05, + "loss": 0.007, + "step": 569570 + }, + { + "epoch": 1.48, + "learning_rate": 7.853497191411706e-05, + "loss": 0.0083, + "step": 569580 + }, + { + "epoch": 1.48, + "learning_rate": 7.853108369774562e-05, + "loss": 0.0076, + "step": 569590 + }, + { + "epoch": 1.48, + "learning_rate": 7.852719548137415e-05, + "loss": 0.0102, + "step": 569600 + }, + { + "epoch": 1.48, + "learning_rate": 7.852330726500269e-05, + "loss": 0.009, + "step": 569610 + }, + { + "epoch": 1.48, + "learning_rate": 7.851941904863122e-05, + "loss": 0.0093, + "step": 569620 + }, + { + "epoch": 1.48, + "learning_rate": 7.851553083225976e-05, + "loss": 0.0087, + "step": 569630 + }, + { + "epoch": 1.48, + "learning_rate": 7.851164261588829e-05, + "loss": 0.0111, + "step": 569640 + }, + { + "epoch": 1.48, + "learning_rate": 7.850775439951683e-05, + "loss": 0.0095, + "step": 569650 + }, + { + "epoch": 1.48, + "learning_rate": 7.850386618314535e-05, + "loss": 0.0085, + "step": 569660 + }, + { + "epoch": 1.48, + "learning_rate": 7.849997796677388e-05, + "loss": 0.0101, + "step": 569670 + }, + { + "epoch": 1.48, + "learning_rate": 7.849608975040242e-05, + "loss": 0.0085, + "step": 569680 + }, + { + "epoch": 1.48, + "learning_rate": 7.849220153403095e-05, + "loss": 0.0108, + "step": 569690 + }, + { + "epoch": 1.48, + "learning_rate": 7.84883133176595e-05, + "loss": 0.0072, + "step": 569700 + }, + { + "epoch": 1.48, + "learning_rate": 7.848442510128802e-05, + "loss": 0.0086, + "step": 569710 + }, + { + "epoch": 1.48, + "learning_rate": 7.848053688491656e-05, + "loss": 0.008, + "step": 569720 + }, + { + "epoch": 1.48, + "learning_rate": 7.847664866854509e-05, + "loss": 0.0074, + "step": 569730 + }, + { + "epoch": 1.48, + "learning_rate": 7.847276045217363e-05, + "loss": 0.0079, + "step": 569740 + }, + { + "epoch": 1.48, + "learning_rate": 7.846887223580216e-05, + "loss": 0.0128, + "step": 569750 + }, + { + "epoch": 1.48, + "learning_rate": 7.84649840194307e-05, + "loss": 0.0089, + "step": 569760 + }, + { + "epoch": 1.48, + "learning_rate": 7.846109580305923e-05, + "loss": 0.0123, + "step": 569770 + }, + { + "epoch": 1.48, + "learning_rate": 7.845720758668779e-05, + "loss": 0.0082, + "step": 569780 + }, + { + "epoch": 1.48, + "learning_rate": 7.845331937031631e-05, + "loss": 0.0071, + "step": 569790 + }, + { + "epoch": 1.48, + "learning_rate": 7.844943115394486e-05, + "loss": 0.0084, + "step": 569800 + }, + { + "epoch": 1.48, + "learning_rate": 7.844554293757338e-05, + "loss": 0.0109, + "step": 569810 + }, + { + "epoch": 1.48, + "learning_rate": 7.844165472120193e-05, + "loss": 0.009, + "step": 569820 + }, + { + "epoch": 1.48, + "learning_rate": 7.843776650483045e-05, + "loss": 0.0101, + "step": 569830 + }, + { + "epoch": 1.48, + "learning_rate": 7.8433878288459e-05, + "loss": 0.0076, + "step": 569840 + }, + { + "epoch": 1.48, + "learning_rate": 7.842999007208752e-05, + "loss": 0.0137, + "step": 569850 + }, + { + "epoch": 1.48, + "learning_rate": 7.842610185571607e-05, + "loss": 0.0097, + "step": 569860 + }, + { + "epoch": 1.48, + "learning_rate": 7.84222136393446e-05, + "loss": 0.0088, + "step": 569870 + }, + { + "epoch": 1.48, + "learning_rate": 7.841832542297314e-05, + "loss": 0.0079, + "step": 569880 + }, + { + "epoch": 1.48, + "learning_rate": 7.841443720660166e-05, + "loss": 0.0112, + "step": 569890 + }, + { + "epoch": 1.48, + "learning_rate": 7.84105489902302e-05, + "loss": 0.0108, + "step": 569900 + }, + { + "epoch": 1.48, + "learning_rate": 7.840666077385873e-05, + "loss": 0.0071, + "step": 569910 + }, + { + "epoch": 1.48, + "learning_rate": 7.840277255748726e-05, + "loss": 0.0103, + "step": 569920 + }, + { + "epoch": 1.48, + "learning_rate": 7.83988843411158e-05, + "loss": 0.0089, + "step": 569930 + }, + { + "epoch": 1.48, + "learning_rate": 7.839499612474433e-05, + "loss": 0.0106, + "step": 569940 + }, + { + "epoch": 1.48, + "learning_rate": 7.839110790837289e-05, + "loss": 0.0091, + "step": 569950 + }, + { + "epoch": 1.48, + "learning_rate": 7.83872196920014e-05, + "loss": 0.01, + "step": 569960 + }, + { + "epoch": 1.48, + "learning_rate": 7.838333147562996e-05, + "loss": 0.0099, + "step": 569970 + }, + { + "epoch": 1.48, + "learning_rate": 7.837944325925848e-05, + "loss": 0.008, + "step": 569980 + }, + { + "epoch": 1.48, + "learning_rate": 7.837555504288703e-05, + "loss": 0.0091, + "step": 569990 + }, + { + "epoch": 1.48, + "learning_rate": 7.837166682651555e-05, + "loss": 0.009, + "step": 570000 + }, + { + "epoch": 1.48, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.006050651427358389, + "eval_runtime": 107.8737, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 570000 + }, + { + "epoch": 1.48, + "learning_rate": 7.83677786101441e-05, + "loss": 0.0104, + "step": 570010 + }, + { + "epoch": 1.48, + "learning_rate": 7.836389039377262e-05, + "loss": 0.0105, + "step": 570020 + }, + { + "epoch": 1.48, + "learning_rate": 7.836000217740116e-05, + "loss": 0.0102, + "step": 570030 + }, + { + "epoch": 1.48, + "learning_rate": 7.835611396102969e-05, + "loss": 0.0104, + "step": 570040 + }, + { + "epoch": 1.48, + "learning_rate": 7.835222574465823e-05, + "loss": 0.0061, + "step": 570050 + }, + { + "epoch": 1.48, + "learning_rate": 7.834833752828676e-05, + "loss": 0.013, + "step": 570060 + }, + { + "epoch": 1.48, + "learning_rate": 7.83444493119153e-05, + "loss": 0.0066, + "step": 570070 + }, + { + "epoch": 1.48, + "learning_rate": 7.834056109554383e-05, + "loss": 0.0128, + "step": 570080 + }, + { + "epoch": 1.48, + "learning_rate": 7.833667287917237e-05, + "loss": 0.011, + "step": 570090 + }, + { + "epoch": 1.48, + "learning_rate": 7.83327846628009e-05, + "loss": 0.0109, + "step": 570100 + }, + { + "epoch": 1.48, + "learning_rate": 7.832889644642946e-05, + "loss": 0.0106, + "step": 570110 + }, + { + "epoch": 1.48, + "learning_rate": 7.832500823005797e-05, + "loss": 0.0059, + "step": 570120 + }, + { + "epoch": 1.48, + "learning_rate": 7.832112001368653e-05, + "loss": 0.0074, + "step": 570130 + }, + { + "epoch": 1.48, + "learning_rate": 7.831723179731506e-05, + "loss": 0.0123, + "step": 570140 + }, + { + "epoch": 1.48, + "learning_rate": 7.831334358094358e-05, + "loss": 0.0145, + "step": 570150 + }, + { + "epoch": 1.48, + "learning_rate": 7.830945536457212e-05, + "loss": 0.0084, + "step": 570160 + }, + { + "epoch": 1.48, + "learning_rate": 7.830556714820065e-05, + "loss": 0.0082, + "step": 570170 + }, + { + "epoch": 1.48, + "learning_rate": 7.83016789318292e-05, + "loss": 0.01, + "step": 570180 + }, + { + "epoch": 1.48, + "learning_rate": 7.829779071545772e-05, + "loss": 0.0111, + "step": 570190 + }, + { + "epoch": 1.48, + "learning_rate": 7.829390249908626e-05, + "loss": 0.0093, + "step": 570200 + }, + { + "epoch": 1.48, + "learning_rate": 7.829001428271479e-05, + "loss": 0.0084, + "step": 570210 + }, + { + "epoch": 1.48, + "learning_rate": 7.828612606634333e-05, + "loss": 0.0111, + "step": 570220 + }, + { + "epoch": 1.48, + "learning_rate": 7.828223784997186e-05, + "loss": 0.0096, + "step": 570230 + }, + { + "epoch": 1.48, + "learning_rate": 7.82783496336004e-05, + "loss": 0.0079, + "step": 570240 + }, + { + "epoch": 1.48, + "learning_rate": 7.827446141722893e-05, + "loss": 0.0085, + "step": 570250 + }, + { + "epoch": 1.48, + "learning_rate": 7.827057320085747e-05, + "loss": 0.0086, + "step": 570260 + }, + { + "epoch": 1.48, + "learning_rate": 7.8266684984486e-05, + "loss": 0.0063, + "step": 570270 + }, + { + "epoch": 1.48, + "learning_rate": 7.826279676811454e-05, + "loss": 0.0118, + "step": 570280 + }, + { + "epoch": 1.48, + "learning_rate": 7.825890855174307e-05, + "loss": 0.0081, + "step": 570290 + }, + { + "epoch": 1.48, + "learning_rate": 7.825502033537163e-05, + "loss": 0.0079, + "step": 570300 + }, + { + "epoch": 1.48, + "learning_rate": 7.825113211900015e-05, + "loss": 0.0094, + "step": 570310 + }, + { + "epoch": 1.48, + "learning_rate": 7.82472439026287e-05, + "loss": 0.0075, + "step": 570320 + }, + { + "epoch": 1.48, + "learning_rate": 7.824335568625722e-05, + "loss": 0.0141, + "step": 570330 + }, + { + "epoch": 1.48, + "learning_rate": 7.823946746988577e-05, + "loss": 0.011, + "step": 570340 + }, + { + "epoch": 1.48, + "learning_rate": 7.82355792535143e-05, + "loss": 0.009, + "step": 570350 + }, + { + "epoch": 1.48, + "learning_rate": 7.823169103714284e-05, + "loss": 0.0106, + "step": 570360 + }, + { + "epoch": 1.48, + "learning_rate": 7.822780282077136e-05, + "loss": 0.0083, + "step": 570370 + }, + { + "epoch": 1.48, + "learning_rate": 7.82239146043999e-05, + "loss": 0.0077, + "step": 570380 + }, + { + "epoch": 1.48, + "learning_rate": 7.822002638802843e-05, + "loss": 0.0083, + "step": 570390 + }, + { + "epoch": 1.48, + "learning_rate": 7.821613817165696e-05, + "loss": 0.0104, + "step": 570400 + }, + { + "epoch": 1.48, + "learning_rate": 7.82122499552855e-05, + "loss": 0.0152, + "step": 570410 + }, + { + "epoch": 1.48, + "learning_rate": 7.820836173891403e-05, + "loss": 0.0085, + "step": 570420 + }, + { + "epoch": 1.48, + "learning_rate": 7.820447352254257e-05, + "loss": 0.0074, + "step": 570430 + }, + { + "epoch": 1.48, + "learning_rate": 7.82005853061711e-05, + "loss": 0.0083, + "step": 570440 + }, + { + "epoch": 1.48, + "learning_rate": 7.819669708979964e-05, + "loss": 0.0116, + "step": 570450 + }, + { + "epoch": 1.48, + "learning_rate": 7.819280887342817e-05, + "loss": 0.0067, + "step": 570460 + }, + { + "epoch": 1.48, + "learning_rate": 7.818892065705673e-05, + "loss": 0.0104, + "step": 570470 + }, + { + "epoch": 1.48, + "learning_rate": 7.818503244068524e-05, + "loss": 0.0082, + "step": 570480 + }, + { + "epoch": 1.48, + "learning_rate": 7.81811442243138e-05, + "loss": 0.0201, + "step": 570490 + }, + { + "epoch": 1.48, + "learning_rate": 7.817725600794232e-05, + "loss": 0.009, + "step": 570500 + }, + { + "epoch": 1.48, + "learning_rate": 7.817336779157087e-05, + "loss": 0.011, + "step": 570510 + }, + { + "epoch": 1.48, + "learning_rate": 7.81694795751994e-05, + "loss": 0.0107, + "step": 570520 + }, + { + "epoch": 1.48, + "learning_rate": 7.816559135882794e-05, + "loss": 0.0103, + "step": 570530 + }, + { + "epoch": 1.48, + "learning_rate": 7.816170314245646e-05, + "loss": 0.0084, + "step": 570540 + }, + { + "epoch": 1.48, + "learning_rate": 7.8157814926085e-05, + "loss": 0.0079, + "step": 570550 + }, + { + "epoch": 1.48, + "learning_rate": 7.815392670971353e-05, + "loss": 0.0093, + "step": 570560 + }, + { + "epoch": 1.48, + "learning_rate": 7.815003849334207e-05, + "loss": 0.0069, + "step": 570570 + }, + { + "epoch": 1.48, + "learning_rate": 7.81461502769706e-05, + "loss": 0.0109, + "step": 570580 + }, + { + "epoch": 1.48, + "learning_rate": 7.814226206059914e-05, + "loss": 0.0079, + "step": 570590 + }, + { + "epoch": 1.48, + "learning_rate": 7.813837384422767e-05, + "loss": 0.0079, + "step": 570600 + }, + { + "epoch": 1.48, + "learning_rate": 7.813448562785621e-05, + "loss": 0.0115, + "step": 570610 + }, + { + "epoch": 1.48, + "learning_rate": 7.813059741148474e-05, + "loss": 0.0099, + "step": 570620 + }, + { + "epoch": 1.48, + "learning_rate": 7.81267091951133e-05, + "loss": 0.0102, + "step": 570630 + }, + { + "epoch": 1.48, + "learning_rate": 7.812282097874181e-05, + "loss": 0.0087, + "step": 570640 + }, + { + "epoch": 1.48, + "learning_rate": 7.811893276237034e-05, + "loss": 0.0072, + "step": 570650 + }, + { + "epoch": 1.48, + "learning_rate": 7.81150445459989e-05, + "loss": 0.0109, + "step": 570660 + }, + { + "epoch": 1.48, + "learning_rate": 7.811115632962742e-05, + "loss": 0.0069, + "step": 570670 + }, + { + "epoch": 1.48, + "learning_rate": 7.810726811325596e-05, + "loss": 0.0084, + "step": 570680 + }, + { + "epoch": 1.48, + "learning_rate": 7.810337989688449e-05, + "loss": 0.0102, + "step": 570690 + }, + { + "epoch": 1.48, + "learning_rate": 7.809949168051303e-05, + "loss": 0.0088, + "step": 570700 + }, + { + "epoch": 1.48, + "learning_rate": 7.809560346414156e-05, + "loss": 0.0084, + "step": 570710 + }, + { + "epoch": 1.48, + "learning_rate": 7.80917152477701e-05, + "loss": 0.0093, + "step": 570720 + }, + { + "epoch": 1.48, + "learning_rate": 7.808782703139863e-05, + "loss": 0.0099, + "step": 570730 + }, + { + "epoch": 1.48, + "learning_rate": 7.808393881502717e-05, + "loss": 0.0069, + "step": 570740 + }, + { + "epoch": 1.48, + "learning_rate": 7.80800505986557e-05, + "loss": 0.0086, + "step": 570750 + }, + { + "epoch": 1.48, + "learning_rate": 7.807616238228424e-05, + "loss": 0.0118, + "step": 570760 + }, + { + "epoch": 1.48, + "learning_rate": 7.807227416591277e-05, + "loss": 0.0089, + "step": 570770 + }, + { + "epoch": 1.48, + "learning_rate": 7.806838594954131e-05, + "loss": 0.0109, + "step": 570780 + }, + { + "epoch": 1.48, + "learning_rate": 7.806449773316984e-05, + "loss": 0.0107, + "step": 570790 + }, + { + "epoch": 1.48, + "learning_rate": 7.806060951679838e-05, + "loss": 0.0075, + "step": 570800 + }, + { + "epoch": 1.48, + "learning_rate": 7.805672130042691e-05, + "loss": 0.0079, + "step": 570810 + }, + { + "epoch": 1.48, + "learning_rate": 7.805283308405547e-05, + "loss": 0.0081, + "step": 570820 + }, + { + "epoch": 1.48, + "learning_rate": 7.8048944867684e-05, + "loss": 0.0103, + "step": 570830 + }, + { + "epoch": 1.48, + "learning_rate": 7.804505665131254e-05, + "loss": 0.0102, + "step": 570840 + }, + { + "epoch": 1.48, + "learning_rate": 7.804116843494106e-05, + "loss": 0.0076, + "step": 570850 + }, + { + "epoch": 1.48, + "learning_rate": 7.80372802185696e-05, + "loss": 0.0072, + "step": 570860 + }, + { + "epoch": 1.48, + "learning_rate": 7.803339200219813e-05, + "loss": 0.0099, + "step": 570870 + }, + { + "epoch": 1.48, + "learning_rate": 7.802950378582668e-05, + "loss": 0.008, + "step": 570880 + }, + { + "epoch": 1.48, + "learning_rate": 7.80256155694552e-05, + "loss": 0.0068, + "step": 570890 + }, + { + "epoch": 1.48, + "learning_rate": 7.802172735308373e-05, + "loss": 0.0111, + "step": 570900 + }, + { + "epoch": 1.48, + "learning_rate": 7.801783913671227e-05, + "loss": 0.0098, + "step": 570910 + }, + { + "epoch": 1.48, + "learning_rate": 7.80139509203408e-05, + "loss": 0.008, + "step": 570920 + }, + { + "epoch": 1.48, + "learning_rate": 7.801006270396934e-05, + "loss": 0.0091, + "step": 570930 + }, + { + "epoch": 1.48, + "learning_rate": 7.800617448759787e-05, + "loss": 0.0108, + "step": 570940 + }, + { + "epoch": 1.48, + "learning_rate": 7.800228627122641e-05, + "loss": 0.0078, + "step": 570950 + }, + { + "epoch": 1.48, + "learning_rate": 7.799839805485494e-05, + "loss": 0.0094, + "step": 570960 + }, + { + "epoch": 1.48, + "learning_rate": 7.799450983848348e-05, + "loss": 0.0079, + "step": 570970 + }, + { + "epoch": 1.48, + "learning_rate": 7.799062162211201e-05, + "loss": 0.0099, + "step": 570980 + }, + { + "epoch": 1.48, + "learning_rate": 7.798673340574055e-05, + "loss": 0.0118, + "step": 570990 + }, + { + "epoch": 1.48, + "learning_rate": 7.798284518936908e-05, + "loss": 0.0062, + "step": 571000 + }, + { + "epoch": 1.48, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.006170371081680059, + "eval_runtime": 108.0088, + "eval_samples_per_second": 18.517, + "eval_steps_per_second": 4.629, + "step": 571000 + }, + { + "epoch": 1.48, + "learning_rate": 7.797895697299764e-05, + "loss": 0.0086, + "step": 571010 + }, + { + "epoch": 1.48, + "learning_rate": 7.797506875662616e-05, + "loss": 0.0093, + "step": 571020 + }, + { + "epoch": 1.48, + "learning_rate": 7.79711805402547e-05, + "loss": 0.0103, + "step": 571030 + }, + { + "epoch": 1.48, + "learning_rate": 7.796729232388323e-05, + "loss": 0.0106, + "step": 571040 + }, + { + "epoch": 1.48, + "learning_rate": 7.796340410751178e-05, + "loss": 0.008, + "step": 571050 + }, + { + "epoch": 1.48, + "learning_rate": 7.79595158911403e-05, + "loss": 0.0081, + "step": 571060 + }, + { + "epoch": 1.48, + "learning_rate": 7.795562767476884e-05, + "loss": 0.0086, + "step": 571070 + }, + { + "epoch": 1.48, + "learning_rate": 7.795173945839737e-05, + "loss": 0.0071, + "step": 571080 + }, + { + "epoch": 1.48, + "learning_rate": 7.794785124202591e-05, + "loss": 0.0102, + "step": 571090 + }, + { + "epoch": 1.48, + "learning_rate": 7.794396302565444e-05, + "loss": 0.0121, + "step": 571100 + }, + { + "epoch": 1.48, + "learning_rate": 7.794007480928298e-05, + "loss": 0.0103, + "step": 571110 + }, + { + "epoch": 1.48, + "learning_rate": 7.793618659291151e-05, + "loss": 0.0094, + "step": 571120 + }, + { + "epoch": 1.48, + "learning_rate": 7.793229837654005e-05, + "loss": 0.0084, + "step": 571130 + }, + { + "epoch": 1.48, + "learning_rate": 7.792841016016858e-05, + "loss": 0.008, + "step": 571140 + }, + { + "epoch": 1.48, + "learning_rate": 7.792452194379711e-05, + "loss": 0.0111, + "step": 571150 + }, + { + "epoch": 1.48, + "learning_rate": 7.792063372742565e-05, + "loss": 0.0077, + "step": 571160 + }, + { + "epoch": 1.48, + "learning_rate": 7.791674551105418e-05, + "loss": 0.0098, + "step": 571170 + }, + { + "epoch": 1.48, + "learning_rate": 7.791285729468273e-05, + "loss": 0.0077, + "step": 571180 + }, + { + "epoch": 1.48, + "learning_rate": 7.790896907831126e-05, + "loss": 0.0133, + "step": 571190 + }, + { + "epoch": 1.48, + "learning_rate": 7.79050808619398e-05, + "loss": 0.0125, + "step": 571200 + }, + { + "epoch": 1.48, + "learning_rate": 7.790119264556833e-05, + "loss": 0.0082, + "step": 571210 + }, + { + "epoch": 1.48, + "learning_rate": 7.789730442919687e-05, + "loss": 0.0096, + "step": 571220 + }, + { + "epoch": 1.48, + "learning_rate": 7.78934162128254e-05, + "loss": 0.0092, + "step": 571230 + }, + { + "epoch": 1.48, + "learning_rate": 7.788952799645394e-05, + "loss": 0.0121, + "step": 571240 + }, + { + "epoch": 1.48, + "learning_rate": 7.788563978008247e-05, + "loss": 0.008, + "step": 571250 + }, + { + "epoch": 1.48, + "learning_rate": 7.788175156371101e-05, + "loss": 0.0068, + "step": 571260 + }, + { + "epoch": 1.48, + "learning_rate": 7.787786334733954e-05, + "loss": 0.0108, + "step": 571270 + }, + { + "epoch": 1.48, + "learning_rate": 7.787397513096808e-05, + "loss": 0.0093, + "step": 571280 + }, + { + "epoch": 1.48, + "learning_rate": 7.787008691459661e-05, + "loss": 0.0066, + "step": 571290 + }, + { + "epoch": 1.48, + "learning_rate": 7.786619869822515e-05, + "loss": 0.0087, + "step": 571300 + }, + { + "epoch": 1.48, + "learning_rate": 7.786231048185368e-05, + "loss": 0.0087, + "step": 571310 + }, + { + "epoch": 1.48, + "learning_rate": 7.785842226548222e-05, + "loss": 0.0131, + "step": 571320 + }, + { + "epoch": 1.48, + "learning_rate": 7.785453404911075e-05, + "loss": 0.0083, + "step": 571330 + }, + { + "epoch": 1.48, + "learning_rate": 7.78506458327393e-05, + "loss": 0.0093, + "step": 571340 + }, + { + "epoch": 1.48, + "learning_rate": 7.784675761636782e-05, + "loss": 0.0095, + "step": 571350 + }, + { + "epoch": 1.48, + "learning_rate": 7.784286939999638e-05, + "loss": 0.0102, + "step": 571360 + }, + { + "epoch": 1.48, + "learning_rate": 7.78389811836249e-05, + "loss": 0.0107, + "step": 571370 + }, + { + "epoch": 1.48, + "learning_rate": 7.783509296725345e-05, + "loss": 0.0123, + "step": 571380 + }, + { + "epoch": 1.48, + "learning_rate": 7.783120475088197e-05, + "loss": 0.0084, + "step": 571390 + }, + { + "epoch": 1.48, + "learning_rate": 7.78273165345105e-05, + "loss": 0.0082, + "step": 571400 + }, + { + "epoch": 1.48, + "learning_rate": 7.782342831813904e-05, + "loss": 0.0182, + "step": 571410 + }, + { + "epoch": 1.48, + "learning_rate": 7.781954010176757e-05, + "loss": 0.0076, + "step": 571420 + }, + { + "epoch": 1.48, + "learning_rate": 7.781565188539611e-05, + "loss": 0.0089, + "step": 571430 + }, + { + "epoch": 1.48, + "learning_rate": 7.781176366902464e-05, + "loss": 0.0125, + "step": 571440 + }, + { + "epoch": 1.48, + "learning_rate": 7.780787545265318e-05, + "loss": 0.0086, + "step": 571450 + }, + { + "epoch": 1.48, + "learning_rate": 7.780398723628171e-05, + "loss": 0.0097, + "step": 571460 + }, + { + "epoch": 1.48, + "learning_rate": 7.780009901991025e-05, + "loss": 0.0092, + "step": 571470 + }, + { + "epoch": 1.48, + "learning_rate": 7.779621080353878e-05, + "loss": 0.0082, + "step": 571480 + }, + { + "epoch": 1.48, + "learning_rate": 7.779232258716732e-05, + "loss": 0.0075, + "step": 571490 + }, + { + "epoch": 1.48, + "learning_rate": 7.778843437079585e-05, + "loss": 0.0092, + "step": 571500 + }, + { + "epoch": 1.48, + "learning_rate": 7.778454615442439e-05, + "loss": 0.0111, + "step": 571510 + }, + { + "epoch": 1.48, + "learning_rate": 7.778065793805292e-05, + "loss": 0.0129, + "step": 571520 + }, + { + "epoch": 1.48, + "learning_rate": 7.777676972168148e-05, + "loss": 0.0083, + "step": 571530 + }, + { + "epoch": 1.48, + "learning_rate": 7.777288150531e-05, + "loss": 0.0084, + "step": 571540 + }, + { + "epoch": 1.48, + "learning_rate": 7.776899328893855e-05, + "loss": 0.0083, + "step": 571550 + }, + { + "epoch": 1.48, + "learning_rate": 7.776510507256707e-05, + "loss": 0.0067, + "step": 571560 + }, + { + "epoch": 1.48, + "learning_rate": 7.776121685619561e-05, + "loss": 0.0096, + "step": 571570 + }, + { + "epoch": 1.48, + "learning_rate": 7.775732863982414e-05, + "loss": 0.0113, + "step": 571580 + }, + { + "epoch": 1.48, + "learning_rate": 7.775344042345268e-05, + "loss": 0.0091, + "step": 571590 + }, + { + "epoch": 1.48, + "learning_rate": 7.774955220708121e-05, + "loss": 0.0108, + "step": 571600 + }, + { + "epoch": 1.48, + "learning_rate": 7.774566399070975e-05, + "loss": 0.0081, + "step": 571610 + }, + { + "epoch": 1.48, + "learning_rate": 7.774177577433828e-05, + "loss": 0.0122, + "step": 571620 + }, + { + "epoch": 1.48, + "learning_rate": 7.773788755796682e-05, + "loss": 0.0089, + "step": 571630 + }, + { + "epoch": 1.48, + "learning_rate": 7.773399934159535e-05, + "loss": 0.0104, + "step": 571640 + }, + { + "epoch": 1.48, + "learning_rate": 7.773011112522388e-05, + "loss": 0.008, + "step": 571650 + }, + { + "epoch": 1.48, + "learning_rate": 7.772622290885242e-05, + "loss": 0.0086, + "step": 571660 + }, + { + "epoch": 1.48, + "learning_rate": 7.772233469248095e-05, + "loss": 0.0128, + "step": 571670 + }, + { + "epoch": 1.48, + "learning_rate": 7.771844647610949e-05, + "loss": 0.0093, + "step": 571680 + }, + { + "epoch": 1.48, + "learning_rate": 7.771455825973802e-05, + "loss": 0.0087, + "step": 571690 + }, + { + "epoch": 1.48, + "learning_rate": 7.771067004336657e-05, + "loss": 0.0089, + "step": 571700 + }, + { + "epoch": 1.48, + "learning_rate": 7.770678182699509e-05, + "loss": 0.0089, + "step": 571710 + }, + { + "epoch": 1.48, + "learning_rate": 7.770289361062364e-05, + "loss": 0.0084, + "step": 571720 + }, + { + "epoch": 1.48, + "learning_rate": 7.769900539425217e-05, + "loss": 0.0068, + "step": 571730 + }, + { + "epoch": 1.48, + "learning_rate": 7.769511717788071e-05, + "loss": 0.0096, + "step": 571740 + }, + { + "epoch": 1.48, + "learning_rate": 7.769122896150924e-05, + "loss": 0.0157, + "step": 571750 + }, + { + "epoch": 1.48, + "learning_rate": 7.768734074513778e-05, + "loss": 0.0083, + "step": 571760 + }, + { + "epoch": 1.48, + "learning_rate": 7.768345252876631e-05, + "loss": 0.0109, + "step": 571770 + }, + { + "epoch": 1.48, + "learning_rate": 7.767956431239485e-05, + "loss": 0.0095, + "step": 571780 + }, + { + "epoch": 1.48, + "learning_rate": 7.767567609602338e-05, + "loss": 0.0117, + "step": 571790 + }, + { + "epoch": 1.48, + "learning_rate": 7.767178787965192e-05, + "loss": 0.0115, + "step": 571800 + }, + { + "epoch": 1.48, + "learning_rate": 7.766789966328045e-05, + "loss": 0.0079, + "step": 571810 + }, + { + "epoch": 1.48, + "learning_rate": 7.7664011446909e-05, + "loss": 0.011, + "step": 571820 + }, + { + "epoch": 1.48, + "learning_rate": 7.766012323053752e-05, + "loss": 0.0088, + "step": 571830 + }, + { + "epoch": 1.48, + "learning_rate": 7.765623501416606e-05, + "loss": 0.0117, + "step": 571840 + }, + { + "epoch": 1.48, + "learning_rate": 7.765234679779459e-05, + "loss": 0.0091, + "step": 571850 + }, + { + "epoch": 1.48, + "learning_rate": 7.764845858142315e-05, + "loss": 0.0103, + "step": 571860 + }, + { + "epoch": 1.48, + "learning_rate": 7.764457036505166e-05, + "loss": 0.0096, + "step": 571870 + }, + { + "epoch": 1.48, + "learning_rate": 7.764068214868022e-05, + "loss": 0.0082, + "step": 571880 + }, + { + "epoch": 1.48, + "learning_rate": 7.763679393230874e-05, + "loss": 0.0098, + "step": 571890 + }, + { + "epoch": 1.48, + "learning_rate": 7.763290571593727e-05, + "loss": 0.0096, + "step": 571900 + }, + { + "epoch": 1.48, + "learning_rate": 7.762901749956581e-05, + "loss": 0.0112, + "step": 571910 + }, + { + "epoch": 1.48, + "learning_rate": 7.762512928319434e-05, + "loss": 0.0132, + "step": 571920 + }, + { + "epoch": 1.48, + "learning_rate": 7.762124106682288e-05, + "loss": 0.0104, + "step": 571930 + }, + { + "epoch": 1.48, + "learning_rate": 7.761735285045141e-05, + "loss": 0.0088, + "step": 571940 + }, + { + "epoch": 1.48, + "learning_rate": 7.761346463407995e-05, + "loss": 0.012, + "step": 571950 + }, + { + "epoch": 1.48, + "learning_rate": 7.760957641770848e-05, + "loss": 0.0097, + "step": 571960 + }, + { + "epoch": 1.48, + "learning_rate": 7.760568820133702e-05, + "loss": 0.0098, + "step": 571970 + }, + { + "epoch": 1.48, + "learning_rate": 7.760179998496555e-05, + "loss": 0.0113, + "step": 571980 + }, + { + "epoch": 1.48, + "learning_rate": 7.759791176859409e-05, + "loss": 0.0097, + "step": 571990 + }, + { + "epoch": 1.48, + "learning_rate": 7.759402355222262e-05, + "loss": 0.0086, + "step": 572000 + }, + { + "epoch": 1.48, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.006190904416143894, + "eval_runtime": 107.9681, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 572000 + }, + { + "epoch": 1.48, + "learning_rate": 7.759013533585116e-05, + "loss": 0.0098, + "step": 572010 + }, + { + "epoch": 1.48, + "learning_rate": 7.758624711947969e-05, + "loss": 0.0122, + "step": 572020 + }, + { + "epoch": 1.48, + "learning_rate": 7.758235890310823e-05, + "loss": 0.0079, + "step": 572030 + }, + { + "epoch": 1.48, + "learning_rate": 7.757847068673676e-05, + "loss": 0.0092, + "step": 572040 + }, + { + "epoch": 1.48, + "learning_rate": 7.757458247036532e-05, + "loss": 0.0119, + "step": 572050 + }, + { + "epoch": 1.48, + "learning_rate": 7.757069425399384e-05, + "loss": 0.0092, + "step": 572060 + }, + { + "epoch": 1.48, + "learning_rate": 7.756680603762239e-05, + "loss": 0.0084, + "step": 572070 + }, + { + "epoch": 1.48, + "learning_rate": 7.756291782125091e-05, + "loss": 0.0123, + "step": 572080 + }, + { + "epoch": 1.48, + "learning_rate": 7.755902960487945e-05, + "loss": 0.0094, + "step": 572090 + }, + { + "epoch": 1.48, + "learning_rate": 7.755514138850798e-05, + "loss": 0.0118, + "step": 572100 + }, + { + "epoch": 1.48, + "learning_rate": 7.755125317213652e-05, + "loss": 0.0094, + "step": 572110 + }, + { + "epoch": 1.48, + "learning_rate": 7.754736495576505e-05, + "loss": 0.0081, + "step": 572120 + }, + { + "epoch": 1.48, + "learning_rate": 7.75434767393936e-05, + "loss": 0.0109, + "step": 572130 + }, + { + "epoch": 1.48, + "learning_rate": 7.753958852302212e-05, + "loss": 0.0091, + "step": 572140 + }, + { + "epoch": 1.48, + "learning_rate": 7.753570030665065e-05, + "loss": 0.0082, + "step": 572150 + }, + { + "epoch": 1.48, + "learning_rate": 7.753181209027919e-05, + "loss": 0.0111, + "step": 572160 + }, + { + "epoch": 1.48, + "learning_rate": 7.752792387390772e-05, + "loss": 0.0088, + "step": 572170 + }, + { + "epoch": 1.48, + "learning_rate": 7.752403565753626e-05, + "loss": 0.0069, + "step": 572180 + }, + { + "epoch": 1.48, + "learning_rate": 7.752014744116479e-05, + "loss": 0.0127, + "step": 572190 + }, + { + "epoch": 1.48, + "learning_rate": 7.751625922479333e-05, + "loss": 0.0099, + "step": 572200 + }, + { + "epoch": 1.48, + "learning_rate": 7.751237100842186e-05, + "loss": 0.0099, + "step": 572210 + }, + { + "epoch": 1.48, + "learning_rate": 7.750848279205041e-05, + "loss": 0.0074, + "step": 572220 + }, + { + "epoch": 1.48, + "learning_rate": 7.750459457567893e-05, + "loss": 0.0089, + "step": 572230 + }, + { + "epoch": 1.48, + "learning_rate": 7.750070635930748e-05, + "loss": 0.0078, + "step": 572240 + }, + { + "epoch": 1.48, + "learning_rate": 7.749681814293601e-05, + "loss": 0.0085, + "step": 572250 + }, + { + "epoch": 1.48, + "learning_rate": 7.749292992656455e-05, + "loss": 0.0083, + "step": 572260 + }, + { + "epoch": 1.48, + "learning_rate": 7.748904171019308e-05, + "loss": 0.0133, + "step": 572270 + }, + { + "epoch": 1.48, + "learning_rate": 7.748515349382162e-05, + "loss": 0.0107, + "step": 572280 + }, + { + "epoch": 1.48, + "learning_rate": 7.748126527745015e-05, + "loss": 0.0078, + "step": 572290 + }, + { + "epoch": 1.48, + "learning_rate": 7.74773770610787e-05, + "loss": 0.011, + "step": 572300 + }, + { + "epoch": 1.48, + "learning_rate": 7.747348884470722e-05, + "loss": 0.0093, + "step": 572310 + }, + { + "epoch": 1.48, + "learning_rate": 7.746960062833576e-05, + "loss": 0.0106, + "step": 572320 + }, + { + "epoch": 1.48, + "learning_rate": 7.746571241196429e-05, + "loss": 0.0079, + "step": 572330 + }, + { + "epoch": 1.48, + "learning_rate": 7.746182419559283e-05, + "loss": 0.0088, + "step": 572340 + }, + { + "epoch": 1.48, + "learning_rate": 7.745793597922136e-05, + "loss": 0.0088, + "step": 572350 + }, + { + "epoch": 1.48, + "learning_rate": 7.74540477628499e-05, + "loss": 0.0098, + "step": 572360 + }, + { + "epoch": 1.48, + "learning_rate": 7.745015954647843e-05, + "loss": 0.0074, + "step": 572370 + }, + { + "epoch": 1.48, + "learning_rate": 7.744627133010697e-05, + "loss": 0.011, + "step": 572380 + }, + { + "epoch": 1.48, + "learning_rate": 7.74423831137355e-05, + "loss": 0.012, + "step": 572390 + }, + { + "epoch": 1.48, + "learning_rate": 7.743849489736403e-05, + "loss": 0.0093, + "step": 572400 + }, + { + "epoch": 1.48, + "learning_rate": 7.743460668099258e-05, + "loss": 0.0084, + "step": 572410 + }, + { + "epoch": 1.48, + "learning_rate": 7.743071846462111e-05, + "loss": 0.0099, + "step": 572420 + }, + { + "epoch": 1.48, + "learning_rate": 7.742683024824965e-05, + "loss": 0.0094, + "step": 572430 + }, + { + "epoch": 1.48, + "learning_rate": 7.742294203187818e-05, + "loss": 0.0078, + "step": 572440 + }, + { + "epoch": 1.48, + "learning_rate": 7.741905381550672e-05, + "loss": 0.0091, + "step": 572450 + }, + { + "epoch": 1.48, + "learning_rate": 7.741516559913525e-05, + "loss": 0.0075, + "step": 572460 + }, + { + "epoch": 1.48, + "learning_rate": 7.741127738276379e-05, + "loss": 0.0081, + "step": 572470 + }, + { + "epoch": 1.48, + "learning_rate": 7.740738916639232e-05, + "loss": 0.0073, + "step": 572480 + }, + { + "epoch": 1.48, + "learning_rate": 7.740350095002086e-05, + "loss": 0.0093, + "step": 572490 + }, + { + "epoch": 1.48, + "learning_rate": 7.739961273364939e-05, + "loss": 0.0072, + "step": 572500 + }, + { + "epoch": 1.48, + "learning_rate": 7.739572451727793e-05, + "loss": 0.0115, + "step": 572510 + }, + { + "epoch": 1.48, + "learning_rate": 7.739183630090646e-05, + "loss": 0.0118, + "step": 572520 + }, + { + "epoch": 1.48, + "learning_rate": 7.7387948084535e-05, + "loss": 0.011, + "step": 572530 + }, + { + "epoch": 1.48, + "learning_rate": 7.738405986816353e-05, + "loss": 0.011, + "step": 572540 + }, + { + "epoch": 1.48, + "learning_rate": 7.738017165179207e-05, + "loss": 0.0104, + "step": 572550 + }, + { + "epoch": 1.48, + "learning_rate": 7.73762834354206e-05, + "loss": 0.0073, + "step": 572560 + }, + { + "epoch": 1.48, + "learning_rate": 7.737239521904916e-05, + "loss": 0.0079, + "step": 572570 + }, + { + "epoch": 1.48, + "learning_rate": 7.736850700267767e-05, + "loss": 0.0115, + "step": 572580 + }, + { + "epoch": 1.48, + "learning_rate": 7.736461878630623e-05, + "loss": 0.0093, + "step": 572590 + }, + { + "epoch": 1.48, + "learning_rate": 7.736073056993475e-05, + "loss": 0.0083, + "step": 572600 + }, + { + "epoch": 1.48, + "learning_rate": 7.73568423535633e-05, + "loss": 0.0087, + "step": 572610 + }, + { + "epoch": 1.48, + "learning_rate": 7.735295413719182e-05, + "loss": 0.0068, + "step": 572620 + }, + { + "epoch": 1.48, + "learning_rate": 7.734906592082036e-05, + "loss": 0.0107, + "step": 572630 + }, + { + "epoch": 1.48, + "learning_rate": 7.734517770444889e-05, + "loss": 0.0076, + "step": 572640 + }, + { + "epoch": 1.48, + "learning_rate": 7.734128948807742e-05, + "loss": 0.0082, + "step": 572650 + }, + { + "epoch": 1.48, + "learning_rate": 7.733740127170596e-05, + "loss": 0.013, + "step": 572660 + }, + { + "epoch": 1.48, + "learning_rate": 7.733351305533449e-05, + "loss": 0.01, + "step": 572670 + }, + { + "epoch": 1.48, + "learning_rate": 7.732962483896303e-05, + "loss": 0.0097, + "step": 572680 + }, + { + "epoch": 1.48, + "learning_rate": 7.732573662259156e-05, + "loss": 0.0093, + "step": 572690 + }, + { + "epoch": 1.48, + "learning_rate": 7.73218484062201e-05, + "loss": 0.0099, + "step": 572700 + }, + { + "epoch": 1.48, + "learning_rate": 7.731796018984863e-05, + "loss": 0.01, + "step": 572710 + }, + { + "epoch": 1.48, + "learning_rate": 7.731407197347717e-05, + "loss": 0.0119, + "step": 572720 + }, + { + "epoch": 1.48, + "learning_rate": 7.73101837571057e-05, + "loss": 0.0094, + "step": 572730 + }, + { + "epoch": 1.48, + "learning_rate": 7.730629554073424e-05, + "loss": 0.0101, + "step": 572740 + }, + { + "epoch": 1.48, + "learning_rate": 7.730240732436277e-05, + "loss": 0.0097, + "step": 572750 + }, + { + "epoch": 1.48, + "learning_rate": 7.729851910799132e-05, + "loss": 0.0078, + "step": 572760 + }, + { + "epoch": 1.48, + "learning_rate": 7.729463089161985e-05, + "loss": 0.0097, + "step": 572770 + }, + { + "epoch": 1.48, + "learning_rate": 7.72907426752484e-05, + "loss": 0.007, + "step": 572780 + }, + { + "epoch": 1.48, + "learning_rate": 7.728685445887692e-05, + "loss": 0.0091, + "step": 572790 + }, + { + "epoch": 1.48, + "learning_rate": 7.728296624250546e-05, + "loss": 0.0088, + "step": 572800 + }, + { + "epoch": 1.48, + "learning_rate": 7.727907802613399e-05, + "loss": 0.0071, + "step": 572810 + }, + { + "epoch": 1.48, + "learning_rate": 7.727518980976253e-05, + "loss": 0.0098, + "step": 572820 + }, + { + "epoch": 1.48, + "learning_rate": 7.727130159339106e-05, + "loss": 0.0067, + "step": 572830 + }, + { + "epoch": 1.48, + "learning_rate": 7.72674133770196e-05, + "loss": 0.008, + "step": 572840 + }, + { + "epoch": 1.48, + "learning_rate": 7.726352516064813e-05, + "loss": 0.0089, + "step": 572850 + }, + { + "epoch": 1.48, + "learning_rate": 7.725963694427667e-05, + "loss": 0.0088, + "step": 572860 + }, + { + "epoch": 1.48, + "learning_rate": 7.72557487279052e-05, + "loss": 0.0081, + "step": 572870 + }, + { + "epoch": 1.48, + "learning_rate": 7.725186051153373e-05, + "loss": 0.0098, + "step": 572880 + }, + { + "epoch": 1.49, + "learning_rate": 7.724797229516227e-05, + "loss": 0.0083, + "step": 572890 + }, + { + "epoch": 1.49, + "learning_rate": 7.72440840787908e-05, + "loss": 0.009, + "step": 572900 + }, + { + "epoch": 1.49, + "learning_rate": 7.724019586241934e-05, + "loss": 0.01, + "step": 572910 + }, + { + "epoch": 1.49, + "learning_rate": 7.723630764604787e-05, + "loss": 0.0096, + "step": 572920 + }, + { + "epoch": 1.49, + "learning_rate": 7.723241942967642e-05, + "loss": 0.0087, + "step": 572930 + }, + { + "epoch": 1.49, + "learning_rate": 7.722853121330494e-05, + "loss": 0.0075, + "step": 572940 + }, + { + "epoch": 1.49, + "learning_rate": 7.72246429969335e-05, + "loss": 0.0104, + "step": 572950 + }, + { + "epoch": 1.49, + "learning_rate": 7.722075478056202e-05, + "loss": 0.0134, + "step": 572960 + }, + { + "epoch": 1.49, + "learning_rate": 7.721686656419056e-05, + "loss": 0.0076, + "step": 572970 + }, + { + "epoch": 1.49, + "learning_rate": 7.721297834781909e-05, + "loss": 0.0069, + "step": 572980 + }, + { + "epoch": 1.49, + "learning_rate": 7.720909013144763e-05, + "loss": 0.0108, + "step": 572990 + }, + { + "epoch": 1.49, + "learning_rate": 7.720520191507616e-05, + "loss": 0.0096, + "step": 573000 + }, + { + "epoch": 1.49, + "eval_cer": 0.8817026863231677, + "eval_loss": 0.006154380738735199, + "eval_runtime": 107.6789, + "eval_samples_per_second": 18.574, + "eval_steps_per_second": 4.643, + "step": 573000 + }, + { + "epoch": 1.49, + "learning_rate": 7.72013136987047e-05, + "loss": 0.0111, + "step": 573010 + }, + { + "epoch": 1.49, + "learning_rate": 7.719742548233323e-05, + "loss": 0.0092, + "step": 573020 + }, + { + "epoch": 1.49, + "learning_rate": 7.719353726596177e-05, + "loss": 0.0075, + "step": 573030 + }, + { + "epoch": 1.49, + "learning_rate": 7.71896490495903e-05, + "loss": 0.0079, + "step": 573040 + }, + { + "epoch": 1.49, + "learning_rate": 7.718576083321884e-05, + "loss": 0.0084, + "step": 573050 + }, + { + "epoch": 1.49, + "learning_rate": 7.718187261684737e-05, + "loss": 0.0106, + "step": 573060 + }, + { + "epoch": 1.49, + "learning_rate": 7.717798440047591e-05, + "loss": 0.0095, + "step": 573070 + }, + { + "epoch": 1.49, + "learning_rate": 7.717409618410444e-05, + "loss": 0.0066, + "step": 573080 + }, + { + "epoch": 1.49, + "learning_rate": 7.7170207967733e-05, + "loss": 0.0108, + "step": 573090 + }, + { + "epoch": 1.49, + "learning_rate": 7.716631975136151e-05, + "loss": 0.0115, + "step": 573100 + }, + { + "epoch": 1.49, + "learning_rate": 7.716243153499006e-05, + "loss": 0.0089, + "step": 573110 + }, + { + "epoch": 1.49, + "learning_rate": 7.715854331861859e-05, + "loss": 0.0093, + "step": 573120 + }, + { + "epoch": 1.49, + "learning_rate": 7.715465510224712e-05, + "loss": 0.0098, + "step": 573130 + }, + { + "epoch": 1.49, + "learning_rate": 7.715076688587566e-05, + "loss": 0.0074, + "step": 573140 + }, + { + "epoch": 1.49, + "learning_rate": 7.714687866950419e-05, + "loss": 0.008, + "step": 573150 + }, + { + "epoch": 1.49, + "learning_rate": 7.714299045313273e-05, + "loss": 0.0079, + "step": 573160 + }, + { + "epoch": 1.49, + "learning_rate": 7.713910223676126e-05, + "loss": 0.0088, + "step": 573170 + }, + { + "epoch": 1.49, + "learning_rate": 7.71352140203898e-05, + "loss": 0.0081, + "step": 573180 + }, + { + "epoch": 1.49, + "learning_rate": 7.713132580401833e-05, + "loss": 0.0081, + "step": 573190 + }, + { + "epoch": 1.49, + "learning_rate": 7.712743758764687e-05, + "loss": 0.0088, + "step": 573200 + }, + { + "epoch": 1.49, + "learning_rate": 7.71235493712754e-05, + "loss": 0.0074, + "step": 573210 + }, + { + "epoch": 1.49, + "learning_rate": 7.711966115490394e-05, + "loss": 0.0102, + "step": 573220 + }, + { + "epoch": 1.49, + "learning_rate": 7.711577293853247e-05, + "loss": 0.0108, + "step": 573230 + }, + { + "epoch": 1.49, + "learning_rate": 7.711188472216101e-05, + "loss": 0.0089, + "step": 573240 + }, + { + "epoch": 1.49, + "learning_rate": 7.710799650578954e-05, + "loss": 0.0084, + "step": 573250 + }, + { + "epoch": 1.49, + "learning_rate": 7.710410828941808e-05, + "loss": 0.0082, + "step": 573260 + }, + { + "epoch": 1.49, + "learning_rate": 7.710022007304661e-05, + "loss": 0.0136, + "step": 573270 + }, + { + "epoch": 1.49, + "learning_rate": 7.709633185667516e-05, + "loss": 0.0063, + "step": 573280 + }, + { + "epoch": 1.49, + "learning_rate": 7.709244364030369e-05, + "loss": 0.0096, + "step": 573290 + }, + { + "epoch": 1.49, + "learning_rate": 7.708855542393223e-05, + "loss": 0.0096, + "step": 573300 + }, + { + "epoch": 1.49, + "learning_rate": 7.708466720756076e-05, + "loss": 0.0083, + "step": 573310 + }, + { + "epoch": 1.49, + "learning_rate": 7.70807789911893e-05, + "loss": 0.0124, + "step": 573320 + }, + { + "epoch": 1.49, + "learning_rate": 7.707689077481783e-05, + "loss": 0.0119, + "step": 573330 + }, + { + "epoch": 1.49, + "learning_rate": 7.707300255844637e-05, + "loss": 0.0095, + "step": 573340 + }, + { + "epoch": 1.49, + "learning_rate": 7.70691143420749e-05, + "loss": 0.0088, + "step": 573350 + }, + { + "epoch": 1.49, + "learning_rate": 7.706522612570344e-05, + "loss": 0.0073, + "step": 573360 + }, + { + "epoch": 1.49, + "learning_rate": 7.706133790933197e-05, + "loss": 0.0094, + "step": 573370 + }, + { + "epoch": 1.49, + "learning_rate": 7.70574496929605e-05, + "loss": 0.0073, + "step": 573380 + }, + { + "epoch": 1.49, + "learning_rate": 7.705356147658904e-05, + "loss": 0.0089, + "step": 573390 + }, + { + "epoch": 1.49, + "learning_rate": 7.704967326021757e-05, + "loss": 0.01, + "step": 573400 + }, + { + "epoch": 1.49, + "learning_rate": 7.704578504384611e-05, + "loss": 0.0111, + "step": 573410 + }, + { + "epoch": 1.49, + "learning_rate": 7.704189682747464e-05, + "loss": 0.0099, + "step": 573420 + }, + { + "epoch": 1.49, + "learning_rate": 7.703800861110318e-05, + "loss": 0.0121, + "step": 573430 + }, + { + "epoch": 1.49, + "learning_rate": 7.703412039473171e-05, + "loss": 0.0108, + "step": 573440 + }, + { + "epoch": 1.49, + "learning_rate": 7.703023217836026e-05, + "loss": 0.0075, + "step": 573450 + }, + { + "epoch": 1.49, + "learning_rate": 7.702634396198878e-05, + "loss": 0.0115, + "step": 573460 + }, + { + "epoch": 1.49, + "learning_rate": 7.702245574561733e-05, + "loss": 0.0105, + "step": 573470 + }, + { + "epoch": 1.49, + "learning_rate": 7.701856752924586e-05, + "loss": 0.0081, + "step": 573480 + }, + { + "epoch": 1.49, + "learning_rate": 7.70146793128744e-05, + "loss": 0.009, + "step": 573490 + }, + { + "epoch": 1.49, + "learning_rate": 7.701079109650293e-05, + "loss": 0.0075, + "step": 573500 + }, + { + "epoch": 1.49, + "learning_rate": 7.700690288013147e-05, + "loss": 0.0102, + "step": 573510 + }, + { + "epoch": 1.49, + "learning_rate": 7.700301466376e-05, + "loss": 0.0097, + "step": 573520 + }, + { + "epoch": 1.49, + "learning_rate": 7.699912644738854e-05, + "loss": 0.008, + "step": 573530 + }, + { + "epoch": 1.49, + "learning_rate": 7.699523823101707e-05, + "loss": 0.0091, + "step": 573540 + }, + { + "epoch": 1.49, + "learning_rate": 7.699135001464561e-05, + "loss": 0.01, + "step": 573550 + }, + { + "epoch": 1.49, + "learning_rate": 7.698746179827414e-05, + "loss": 0.0097, + "step": 573560 + }, + { + "epoch": 1.49, + "learning_rate": 7.698357358190268e-05, + "loss": 0.0105, + "step": 573570 + }, + { + "epoch": 1.49, + "learning_rate": 7.697968536553121e-05, + "loss": 0.0066, + "step": 573580 + }, + { + "epoch": 1.49, + "learning_rate": 7.697579714915975e-05, + "loss": 0.0099, + "step": 573590 + }, + { + "epoch": 1.49, + "learning_rate": 7.697190893278828e-05, + "loss": 0.0085, + "step": 573600 + }, + { + "epoch": 1.49, + "learning_rate": 7.696802071641684e-05, + "loss": 0.01, + "step": 573610 + }, + { + "epoch": 1.49, + "learning_rate": 7.696413250004535e-05, + "loss": 0.0075, + "step": 573620 + }, + { + "epoch": 1.49, + "learning_rate": 7.696024428367388e-05, + "loss": 0.0119, + "step": 573630 + }, + { + "epoch": 1.49, + "learning_rate": 7.695635606730243e-05, + "loss": 0.0091, + "step": 573640 + }, + { + "epoch": 1.49, + "learning_rate": 7.695246785093096e-05, + "loss": 0.0105, + "step": 573650 + }, + { + "epoch": 1.49, + "learning_rate": 7.69485796345595e-05, + "loss": 0.0093, + "step": 573660 + }, + { + "epoch": 1.49, + "learning_rate": 7.694469141818803e-05, + "loss": 0.0097, + "step": 573670 + }, + { + "epoch": 1.49, + "learning_rate": 7.694080320181657e-05, + "loss": 0.0098, + "step": 573680 + }, + { + "epoch": 1.49, + "learning_rate": 7.69369149854451e-05, + "loss": 0.0124, + "step": 573690 + }, + { + "epoch": 1.49, + "learning_rate": 7.693302676907364e-05, + "loss": 0.008, + "step": 573700 + }, + { + "epoch": 1.49, + "learning_rate": 7.692913855270217e-05, + "loss": 0.0118, + "step": 573710 + }, + { + "epoch": 1.49, + "learning_rate": 7.692525033633071e-05, + "loss": 0.0085, + "step": 573720 + }, + { + "epoch": 1.49, + "learning_rate": 7.692136211995924e-05, + "loss": 0.0097, + "step": 573730 + }, + { + "epoch": 1.49, + "learning_rate": 7.691747390358778e-05, + "loss": 0.0106, + "step": 573740 + }, + { + "epoch": 1.49, + "learning_rate": 7.691358568721631e-05, + "loss": 0.0095, + "step": 573750 + }, + { + "epoch": 1.49, + "learning_rate": 7.690969747084485e-05, + "loss": 0.0084, + "step": 573760 + }, + { + "epoch": 1.49, + "learning_rate": 7.690580925447338e-05, + "loss": 0.008, + "step": 573770 + }, + { + "epoch": 1.49, + "learning_rate": 7.690192103810192e-05, + "loss": 0.0091, + "step": 573780 + }, + { + "epoch": 1.49, + "learning_rate": 7.689803282173045e-05, + "loss": 0.0094, + "step": 573790 + }, + { + "epoch": 1.49, + "learning_rate": 7.6894144605359e-05, + "loss": 0.0104, + "step": 573800 + }, + { + "epoch": 1.49, + "learning_rate": 7.689025638898753e-05, + "loss": 0.0078, + "step": 573810 + }, + { + "epoch": 1.49, + "learning_rate": 7.688636817261607e-05, + "loss": 0.0084, + "step": 573820 + }, + { + "epoch": 1.49, + "learning_rate": 7.68824799562446e-05, + "loss": 0.0086, + "step": 573830 + }, + { + "epoch": 1.49, + "learning_rate": 7.687859173987314e-05, + "loss": 0.0089, + "step": 573840 + }, + { + "epoch": 1.49, + "learning_rate": 7.687470352350167e-05, + "loss": 0.0101, + "step": 573850 + }, + { + "epoch": 1.49, + "learning_rate": 7.687081530713021e-05, + "loss": 0.0128, + "step": 573860 + }, + { + "epoch": 1.49, + "learning_rate": 7.686692709075874e-05, + "loss": 0.0106, + "step": 573870 + }, + { + "epoch": 1.49, + "learning_rate": 7.686303887438727e-05, + "loss": 0.0091, + "step": 573880 + }, + { + "epoch": 1.49, + "learning_rate": 7.685915065801581e-05, + "loss": 0.0067, + "step": 573890 + }, + { + "epoch": 1.49, + "learning_rate": 7.685526244164434e-05, + "loss": 0.0092, + "step": 573900 + }, + { + "epoch": 1.49, + "learning_rate": 7.685137422527288e-05, + "loss": 0.007, + "step": 573910 + }, + { + "epoch": 1.49, + "learning_rate": 7.684748600890141e-05, + "loss": 0.0135, + "step": 573920 + }, + { + "epoch": 1.49, + "learning_rate": 7.684359779252995e-05, + "loss": 0.0087, + "step": 573930 + }, + { + "epoch": 1.49, + "learning_rate": 7.683970957615848e-05, + "loss": 0.0076, + "step": 573940 + }, + { + "epoch": 1.49, + "learning_rate": 7.683582135978702e-05, + "loss": 0.0073, + "step": 573950 + }, + { + "epoch": 1.49, + "learning_rate": 7.683193314341555e-05, + "loss": 0.0088, + "step": 573960 + }, + { + "epoch": 1.49, + "learning_rate": 7.682804492704409e-05, + "loss": 0.0077, + "step": 573970 + }, + { + "epoch": 1.49, + "learning_rate": 7.682415671067262e-05, + "loss": 0.01, + "step": 573980 + }, + { + "epoch": 1.49, + "learning_rate": 7.682026849430117e-05, + "loss": 0.01, + "step": 573990 + }, + { + "epoch": 1.49, + "learning_rate": 7.68163802779297e-05, + "loss": 0.0116, + "step": 574000 + }, + { + "epoch": 1.49, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.0060965148732066154, + "eval_runtime": 107.9458, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 574000 + }, + { + "epoch": 1.49, + "learning_rate": 7.681249206155824e-05, + "loss": 0.0106, + "step": 574010 + }, + { + "epoch": 1.49, + "learning_rate": 7.680860384518677e-05, + "loss": 0.0094, + "step": 574020 + }, + { + "epoch": 1.49, + "learning_rate": 7.680471562881531e-05, + "loss": 0.0074, + "step": 574030 + }, + { + "epoch": 1.49, + "learning_rate": 7.680082741244384e-05, + "loss": 0.0092, + "step": 574040 + }, + { + "epoch": 1.49, + "learning_rate": 7.679693919607238e-05, + "loss": 0.0076, + "step": 574050 + }, + { + "epoch": 1.49, + "learning_rate": 7.679305097970091e-05, + "loss": 0.0072, + "step": 574060 + }, + { + "epoch": 1.49, + "learning_rate": 7.678916276332945e-05, + "loss": 0.0082, + "step": 574070 + }, + { + "epoch": 1.49, + "learning_rate": 7.678527454695798e-05, + "loss": 0.0073, + "step": 574080 + }, + { + "epoch": 1.49, + "learning_rate": 7.678138633058652e-05, + "loss": 0.0082, + "step": 574090 + }, + { + "epoch": 1.49, + "learning_rate": 7.677749811421505e-05, + "loss": 0.0091, + "step": 574100 + }, + { + "epoch": 1.49, + "learning_rate": 7.677360989784359e-05, + "loss": 0.0078, + "step": 574110 + }, + { + "epoch": 1.49, + "learning_rate": 7.676972168147212e-05, + "loss": 0.0093, + "step": 574120 + }, + { + "epoch": 1.49, + "learning_rate": 7.676583346510065e-05, + "loss": 0.007, + "step": 574130 + }, + { + "epoch": 1.49, + "learning_rate": 7.676194524872919e-05, + "loss": 0.0058, + "step": 574140 + }, + { + "epoch": 1.49, + "learning_rate": 7.675805703235772e-05, + "loss": 0.0073, + "step": 574150 + }, + { + "epoch": 1.49, + "learning_rate": 7.675416881598627e-05, + "loss": 0.0054, + "step": 574160 + }, + { + "epoch": 1.49, + "learning_rate": 7.675028059961479e-05, + "loss": 0.008, + "step": 574170 + }, + { + "epoch": 1.49, + "learning_rate": 7.674639238324334e-05, + "loss": 0.0153, + "step": 574180 + }, + { + "epoch": 1.49, + "learning_rate": 7.674250416687187e-05, + "loss": 0.0084, + "step": 574190 + }, + { + "epoch": 1.49, + "learning_rate": 7.673861595050041e-05, + "loss": 0.0071, + "step": 574200 + }, + { + "epoch": 1.49, + "learning_rate": 7.673472773412894e-05, + "loss": 0.0113, + "step": 574210 + }, + { + "epoch": 1.49, + "learning_rate": 7.673083951775748e-05, + "loss": 0.0104, + "step": 574220 + }, + { + "epoch": 1.49, + "learning_rate": 7.672695130138601e-05, + "loss": 0.0096, + "step": 574230 + }, + { + "epoch": 1.49, + "learning_rate": 7.672306308501455e-05, + "loss": 0.0068, + "step": 574240 + }, + { + "epoch": 1.49, + "learning_rate": 7.671917486864308e-05, + "loss": 0.0104, + "step": 574250 + }, + { + "epoch": 1.49, + "learning_rate": 7.671528665227162e-05, + "loss": 0.008, + "step": 574260 + }, + { + "epoch": 1.49, + "learning_rate": 7.671139843590015e-05, + "loss": 0.0077, + "step": 574270 + }, + { + "epoch": 1.49, + "learning_rate": 7.670751021952869e-05, + "loss": 0.0083, + "step": 574280 + }, + { + "epoch": 1.49, + "learning_rate": 7.670362200315722e-05, + "loss": 0.0087, + "step": 574290 + }, + { + "epoch": 1.49, + "learning_rate": 7.669973378678576e-05, + "loss": 0.0081, + "step": 574300 + }, + { + "epoch": 1.49, + "learning_rate": 7.669584557041429e-05, + "loss": 0.0085, + "step": 574310 + }, + { + "epoch": 1.49, + "learning_rate": 7.669195735404284e-05, + "loss": 0.01, + "step": 574320 + }, + { + "epoch": 1.49, + "learning_rate": 7.668806913767136e-05, + "loss": 0.0098, + "step": 574330 + }, + { + "epoch": 1.49, + "learning_rate": 7.668418092129991e-05, + "loss": 0.0098, + "step": 574340 + }, + { + "epoch": 1.49, + "learning_rate": 7.668029270492844e-05, + "loss": 0.0118, + "step": 574350 + }, + { + "epoch": 1.49, + "learning_rate": 7.667640448855698e-05, + "loss": 0.0106, + "step": 574360 + }, + { + "epoch": 1.49, + "learning_rate": 7.667251627218551e-05, + "loss": 0.011, + "step": 574370 + }, + { + "epoch": 1.49, + "learning_rate": 7.666862805581404e-05, + "loss": 0.009, + "step": 574380 + }, + { + "epoch": 1.49, + "learning_rate": 7.666473983944258e-05, + "loss": 0.0081, + "step": 574390 + }, + { + "epoch": 1.49, + "learning_rate": 7.666085162307111e-05, + "loss": 0.0092, + "step": 574400 + }, + { + "epoch": 1.49, + "learning_rate": 7.665696340669965e-05, + "loss": 0.0084, + "step": 574410 + }, + { + "epoch": 1.49, + "learning_rate": 7.665307519032818e-05, + "loss": 0.0078, + "step": 574420 + }, + { + "epoch": 1.49, + "learning_rate": 7.664918697395672e-05, + "loss": 0.0145, + "step": 574430 + }, + { + "epoch": 1.49, + "learning_rate": 7.664529875758525e-05, + "loss": 0.0096, + "step": 574440 + }, + { + "epoch": 1.49, + "learning_rate": 7.664141054121379e-05, + "loss": 0.0086, + "step": 574450 + }, + { + "epoch": 1.49, + "learning_rate": 7.663752232484232e-05, + "loss": 0.0142, + "step": 574460 + }, + { + "epoch": 1.49, + "learning_rate": 7.663363410847086e-05, + "loss": 0.0045, + "step": 574470 + }, + { + "epoch": 1.49, + "learning_rate": 7.662974589209939e-05, + "loss": 0.0107, + "step": 574480 + }, + { + "epoch": 1.49, + "learning_rate": 7.662585767572793e-05, + "loss": 0.007, + "step": 574490 + }, + { + "epoch": 1.49, + "learning_rate": 7.662196945935646e-05, + "loss": 0.0082, + "step": 574500 + }, + { + "epoch": 1.49, + "learning_rate": 7.661808124298501e-05, + "loss": 0.0123, + "step": 574510 + }, + { + "epoch": 1.49, + "learning_rate": 7.661419302661354e-05, + "loss": 0.0106, + "step": 574520 + }, + { + "epoch": 1.49, + "learning_rate": 7.661030481024208e-05, + "loss": 0.0081, + "step": 574530 + }, + { + "epoch": 1.49, + "learning_rate": 7.660641659387061e-05, + "loss": 0.013, + "step": 574540 + }, + { + "epoch": 1.49, + "learning_rate": 7.660252837749915e-05, + "loss": 0.0089, + "step": 574550 + }, + { + "epoch": 1.49, + "learning_rate": 7.659864016112768e-05, + "loss": 0.0091, + "step": 574560 + }, + { + "epoch": 1.49, + "learning_rate": 7.659475194475622e-05, + "loss": 0.0083, + "step": 574570 + }, + { + "epoch": 1.49, + "learning_rate": 7.659086372838475e-05, + "loss": 0.0131, + "step": 574580 + }, + { + "epoch": 1.49, + "learning_rate": 7.658697551201329e-05, + "loss": 0.0108, + "step": 574590 + }, + { + "epoch": 1.49, + "learning_rate": 7.658308729564182e-05, + "loss": 0.0123, + "step": 574600 + }, + { + "epoch": 1.49, + "learning_rate": 7.657919907927036e-05, + "loss": 0.0085, + "step": 574610 + }, + { + "epoch": 1.49, + "learning_rate": 7.657531086289889e-05, + "loss": 0.0112, + "step": 574620 + }, + { + "epoch": 1.49, + "learning_rate": 7.657142264652742e-05, + "loss": 0.0077, + "step": 574630 + }, + { + "epoch": 1.49, + "learning_rate": 7.656753443015596e-05, + "loss": 0.0083, + "step": 574640 + }, + { + "epoch": 1.49, + "learning_rate": 7.656364621378449e-05, + "loss": 0.0137, + "step": 574650 + }, + { + "epoch": 1.49, + "learning_rate": 7.655975799741303e-05, + "loss": 0.009, + "step": 574660 + }, + { + "epoch": 1.49, + "learning_rate": 7.655586978104156e-05, + "loss": 0.0095, + "step": 574670 + }, + { + "epoch": 1.49, + "learning_rate": 7.655198156467011e-05, + "loss": 0.01, + "step": 574680 + }, + { + "epoch": 1.49, + "learning_rate": 7.654809334829863e-05, + "loss": 0.0079, + "step": 574690 + }, + { + "epoch": 1.49, + "learning_rate": 7.654420513192718e-05, + "loss": 0.0066, + "step": 574700 + }, + { + "epoch": 1.49, + "learning_rate": 7.654031691555571e-05, + "loss": 0.0099, + "step": 574710 + }, + { + "epoch": 1.49, + "learning_rate": 7.653642869918425e-05, + "loss": 0.0107, + "step": 574720 + }, + { + "epoch": 1.49, + "learning_rate": 7.653254048281278e-05, + "loss": 0.01, + "step": 574730 + }, + { + "epoch": 1.49, + "learning_rate": 7.652865226644132e-05, + "loss": 0.0086, + "step": 574740 + }, + { + "epoch": 1.49, + "learning_rate": 7.652476405006985e-05, + "loss": 0.0104, + "step": 574750 + }, + { + "epoch": 1.49, + "learning_rate": 7.652087583369839e-05, + "loss": 0.0082, + "step": 574760 + }, + { + "epoch": 1.49, + "learning_rate": 7.651698761732692e-05, + "loss": 0.0101, + "step": 574770 + }, + { + "epoch": 1.49, + "learning_rate": 7.651309940095546e-05, + "loss": 0.0083, + "step": 574780 + }, + { + "epoch": 1.49, + "learning_rate": 7.650921118458399e-05, + "loss": 0.0078, + "step": 574790 + }, + { + "epoch": 1.49, + "learning_rate": 7.650532296821253e-05, + "loss": 0.0118, + "step": 574800 + }, + { + "epoch": 1.49, + "learning_rate": 7.650143475184106e-05, + "loss": 0.0078, + "step": 574810 + }, + { + "epoch": 1.49, + "learning_rate": 7.64975465354696e-05, + "loss": 0.01, + "step": 574820 + }, + { + "epoch": 1.49, + "learning_rate": 7.649365831909813e-05, + "loss": 0.0104, + "step": 574830 + }, + { + "epoch": 1.49, + "learning_rate": 7.648977010272668e-05, + "loss": 0.0073, + "step": 574840 + }, + { + "epoch": 1.49, + "learning_rate": 7.64858818863552e-05, + "loss": 0.0106, + "step": 574850 + }, + { + "epoch": 1.49, + "learning_rate": 7.648199366998375e-05, + "loss": 0.01, + "step": 574860 + }, + { + "epoch": 1.49, + "learning_rate": 7.647810545361228e-05, + "loss": 0.0098, + "step": 574870 + }, + { + "epoch": 1.49, + "learning_rate": 7.647421723724081e-05, + "loss": 0.012, + "step": 574880 + }, + { + "epoch": 1.49, + "learning_rate": 7.647032902086935e-05, + "loss": 0.008, + "step": 574890 + }, + { + "epoch": 1.49, + "learning_rate": 7.646644080449788e-05, + "loss": 0.0121, + "step": 574900 + }, + { + "epoch": 1.49, + "learning_rate": 7.646255258812642e-05, + "loss": 0.0113, + "step": 574910 + }, + { + "epoch": 1.49, + "learning_rate": 7.645866437175495e-05, + "loss": 0.0097, + "step": 574920 + }, + { + "epoch": 1.49, + "learning_rate": 7.645477615538349e-05, + "loss": 0.0106, + "step": 574930 + }, + { + "epoch": 1.49, + "learning_rate": 7.645088793901202e-05, + "loss": 0.0126, + "step": 574940 + }, + { + "epoch": 1.49, + "learning_rate": 7.644699972264056e-05, + "loss": 0.0104, + "step": 574950 + }, + { + "epoch": 1.49, + "learning_rate": 7.644311150626909e-05, + "loss": 0.0105, + "step": 574960 + }, + { + "epoch": 1.49, + "learning_rate": 7.643922328989763e-05, + "loss": 0.0085, + "step": 574970 + }, + { + "epoch": 1.49, + "learning_rate": 7.643533507352616e-05, + "loss": 0.0092, + "step": 574980 + }, + { + "epoch": 1.49, + "learning_rate": 7.64314468571547e-05, + "loss": 0.0085, + "step": 574990 + }, + { + "epoch": 1.49, + "learning_rate": 7.642755864078323e-05, + "loss": 0.0095, + "step": 575000 + }, + { + "epoch": 1.49, + "eval_cer": 0.8817166826925096, + "eval_loss": 0.006032513454556465, + "eval_runtime": 107.7203, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, + "step": 575000 + }, + { + "epoch": 1.49, + "learning_rate": 7.642367042441177e-05, + "loss": 0.0083, + "step": 575010 + }, + { + "epoch": 1.49, + "learning_rate": 7.64197822080403e-05, + "loss": 0.0082, + "step": 575020 + }, + { + "epoch": 1.49, + "learning_rate": 7.641589399166885e-05, + "loss": 0.0099, + "step": 575030 + }, + { + "epoch": 1.49, + "learning_rate": 7.641200577529738e-05, + "loss": 0.0103, + "step": 575040 + }, + { + "epoch": 1.49, + "learning_rate": 7.640811755892592e-05, + "loss": 0.0105, + "step": 575050 + }, + { + "epoch": 1.49, + "learning_rate": 7.640422934255445e-05, + "loss": 0.0097, + "step": 575060 + }, + { + "epoch": 1.49, + "learning_rate": 7.640034112618299e-05, + "loss": 0.0081, + "step": 575070 + }, + { + "epoch": 1.49, + "learning_rate": 7.639645290981152e-05, + "loss": 0.0081, + "step": 575080 + }, + { + "epoch": 1.49, + "learning_rate": 7.639256469344006e-05, + "loss": 0.0082, + "step": 575090 + }, + { + "epoch": 1.49, + "learning_rate": 7.638867647706859e-05, + "loss": 0.0112, + "step": 575100 + }, + { + "epoch": 1.49, + "learning_rate": 7.638478826069713e-05, + "loss": 0.008, + "step": 575110 + }, + { + "epoch": 1.49, + "learning_rate": 7.638090004432566e-05, + "loss": 0.0096, + "step": 575120 + }, + { + "epoch": 1.49, + "learning_rate": 7.637701182795419e-05, + "loss": 0.0087, + "step": 575130 + }, + { + "epoch": 1.49, + "learning_rate": 7.637312361158273e-05, + "loss": 0.0122, + "step": 575140 + }, + { + "epoch": 1.49, + "learning_rate": 7.636923539521126e-05, + "loss": 0.0079, + "step": 575150 + }, + { + "epoch": 1.49, + "learning_rate": 7.63653471788398e-05, + "loss": 0.0107, + "step": 575160 + }, + { + "epoch": 1.49, + "learning_rate": 7.636145896246833e-05, + "loss": 0.0146, + "step": 575170 + }, + { + "epoch": 1.49, + "learning_rate": 7.635757074609687e-05, + "loss": 0.0076, + "step": 575180 + }, + { + "epoch": 1.49, + "learning_rate": 7.63536825297254e-05, + "loss": 0.0082, + "step": 575190 + }, + { + "epoch": 1.49, + "learning_rate": 7.634979431335394e-05, + "loss": 0.0097, + "step": 575200 + }, + { + "epoch": 1.49, + "learning_rate": 7.634590609698247e-05, + "loss": 0.0078, + "step": 575210 + }, + { + "epoch": 1.49, + "learning_rate": 7.634201788061102e-05, + "loss": 0.0093, + "step": 575220 + }, + { + "epoch": 1.49, + "learning_rate": 7.633812966423955e-05, + "loss": 0.0114, + "step": 575230 + }, + { + "epoch": 1.49, + "learning_rate": 7.633424144786809e-05, + "loss": 0.0107, + "step": 575240 + }, + { + "epoch": 1.49, + "learning_rate": 7.633035323149662e-05, + "loss": 0.0094, + "step": 575250 + }, + { + "epoch": 1.49, + "learning_rate": 7.632646501512516e-05, + "loss": 0.0067, + "step": 575260 + }, + { + "epoch": 1.49, + "learning_rate": 7.632257679875369e-05, + "loss": 0.0105, + "step": 575270 + }, + { + "epoch": 1.49, + "learning_rate": 7.631868858238223e-05, + "loss": 0.0098, + "step": 575280 + }, + { + "epoch": 1.49, + "learning_rate": 7.631480036601076e-05, + "loss": 0.009, + "step": 575290 + }, + { + "epoch": 1.49, + "learning_rate": 7.63109121496393e-05, + "loss": 0.0113, + "step": 575300 + }, + { + "epoch": 1.49, + "learning_rate": 7.630702393326783e-05, + "loss": 0.0103, + "step": 575310 + }, + { + "epoch": 1.49, + "learning_rate": 7.630313571689637e-05, + "loss": 0.0175, + "step": 575320 + }, + { + "epoch": 1.49, + "learning_rate": 7.62992475005249e-05, + "loss": 0.01, + "step": 575330 + }, + { + "epoch": 1.49, + "learning_rate": 7.629535928415344e-05, + "loss": 0.0078, + "step": 575340 + }, + { + "epoch": 1.49, + "learning_rate": 7.629147106778197e-05, + "loss": 0.008, + "step": 575350 + }, + { + "epoch": 1.49, + "learning_rate": 7.62875828514105e-05, + "loss": 0.0066, + "step": 575360 + }, + { + "epoch": 1.49, + "learning_rate": 7.628369463503904e-05, + "loss": 0.0091, + "step": 575370 + }, + { + "epoch": 1.49, + "learning_rate": 7.627980641866757e-05, + "loss": 0.0104, + "step": 575380 + }, + { + "epoch": 1.49, + "learning_rate": 7.627591820229612e-05, + "loss": 0.0115, + "step": 575390 + }, + { + "epoch": 1.49, + "learning_rate": 7.627202998592465e-05, + "loss": 0.0073, + "step": 575400 + }, + { + "epoch": 1.49, + "learning_rate": 7.626814176955319e-05, + "loss": 0.0084, + "step": 575410 + }, + { + "epoch": 1.49, + "learning_rate": 7.626425355318172e-05, + "loss": 0.0079, + "step": 575420 + }, + { + "epoch": 1.49, + "learning_rate": 7.626036533681026e-05, + "loss": 0.0067, + "step": 575430 + }, + { + "epoch": 1.49, + "learning_rate": 7.625647712043879e-05, + "loss": 0.007, + "step": 575440 + }, + { + "epoch": 1.49, + "learning_rate": 7.625258890406733e-05, + "loss": 0.0086, + "step": 575450 + }, + { + "epoch": 1.49, + "learning_rate": 7.624870068769586e-05, + "loss": 0.0087, + "step": 575460 + }, + { + "epoch": 1.49, + "learning_rate": 7.62448124713244e-05, + "loss": 0.0099, + "step": 575470 + }, + { + "epoch": 1.49, + "learning_rate": 7.624092425495293e-05, + "loss": 0.0072, + "step": 575480 + }, + { + "epoch": 1.49, + "learning_rate": 7.623703603858147e-05, + "loss": 0.0098, + "step": 575490 + }, + { + "epoch": 1.49, + "learning_rate": 7.623314782221e-05, + "loss": 0.0077, + "step": 575500 + }, + { + "epoch": 1.49, + "learning_rate": 7.622925960583854e-05, + "loss": 0.0083, + "step": 575510 + }, + { + "epoch": 1.49, + "learning_rate": 7.622537138946707e-05, + "loss": 0.0082, + "step": 575520 + }, + { + "epoch": 1.49, + "learning_rate": 7.622148317309561e-05, + "loss": 0.0083, + "step": 575530 + }, + { + "epoch": 1.49, + "learning_rate": 7.621759495672414e-05, + "loss": 0.0094, + "step": 575540 + }, + { + "epoch": 1.49, + "learning_rate": 7.621370674035269e-05, + "loss": 0.0084, + "step": 575550 + }, + { + "epoch": 1.49, + "learning_rate": 7.620981852398121e-05, + "loss": 0.0087, + "step": 575560 + }, + { + "epoch": 1.49, + "learning_rate": 7.620593030760976e-05, + "loss": 0.0089, + "step": 575570 + }, + { + "epoch": 1.49, + "learning_rate": 7.620204209123829e-05, + "loss": 0.0104, + "step": 575580 + }, + { + "epoch": 1.49, + "learning_rate": 7.619815387486683e-05, + "loss": 0.0085, + "step": 575590 + }, + { + "epoch": 1.49, + "learning_rate": 7.619426565849536e-05, + "loss": 0.0093, + "step": 575600 + }, + { + "epoch": 1.49, + "learning_rate": 7.619037744212389e-05, + "loss": 0.0168, + "step": 575610 + }, + { + "epoch": 1.49, + "learning_rate": 7.618648922575243e-05, + "loss": 0.0113, + "step": 575620 + }, + { + "epoch": 1.49, + "learning_rate": 7.618260100938096e-05, + "loss": 0.0076, + "step": 575630 + }, + { + "epoch": 1.49, + "learning_rate": 7.61787127930095e-05, + "loss": 0.0087, + "step": 575640 + }, + { + "epoch": 1.49, + "learning_rate": 7.617482457663803e-05, + "loss": 0.01, + "step": 575650 + }, + { + "epoch": 1.49, + "learning_rate": 7.617093636026657e-05, + "loss": 0.0105, + "step": 575660 + }, + { + "epoch": 1.49, + "learning_rate": 7.61670481438951e-05, + "loss": 0.0082, + "step": 575670 + }, + { + "epoch": 1.49, + "learning_rate": 7.616315992752364e-05, + "loss": 0.0078, + "step": 575680 + }, + { + "epoch": 1.49, + "learning_rate": 7.615927171115217e-05, + "loss": 0.0081, + "step": 575690 + }, + { + "epoch": 1.49, + "learning_rate": 7.615538349478071e-05, + "loss": 0.0055, + "step": 575700 + }, + { + "epoch": 1.49, + "learning_rate": 7.615149527840924e-05, + "loss": 0.0082, + "step": 575710 + }, + { + "epoch": 1.49, + "learning_rate": 7.614760706203778e-05, + "loss": 0.0071, + "step": 575720 + }, + { + "epoch": 1.49, + "learning_rate": 7.614371884566631e-05, + "loss": 0.0088, + "step": 575730 + }, + { + "epoch": 1.49, + "learning_rate": 7.613983062929486e-05, + "loss": 0.0089, + "step": 575740 + }, + { + "epoch": 1.49, + "learning_rate": 7.613594241292339e-05, + "loss": 0.01, + "step": 575750 + }, + { + "epoch": 1.49, + "learning_rate": 7.613205419655193e-05, + "loss": 0.0225, + "step": 575760 + }, + { + "epoch": 1.49, + "learning_rate": 7.612816598018046e-05, + "loss": 0.0091, + "step": 575770 + }, + { + "epoch": 1.49, + "learning_rate": 7.6124277763809e-05, + "loss": 0.0123, + "step": 575780 + }, + { + "epoch": 1.49, + "learning_rate": 7.612038954743753e-05, + "loss": 0.0094, + "step": 575790 + }, + { + "epoch": 1.49, + "learning_rate": 7.611650133106607e-05, + "loss": 0.0098, + "step": 575800 + }, + { + "epoch": 1.49, + "learning_rate": 7.61126131146946e-05, + "loss": 0.0072, + "step": 575810 + }, + { + "epoch": 1.49, + "learning_rate": 7.610872489832314e-05, + "loss": 0.0094, + "step": 575820 + }, + { + "epoch": 1.49, + "learning_rate": 7.610483668195167e-05, + "loss": 0.0077, + "step": 575830 + }, + { + "epoch": 1.49, + "learning_rate": 7.610094846558021e-05, + "loss": 0.0086, + "step": 575840 + }, + { + "epoch": 1.49, + "learning_rate": 7.609706024920874e-05, + "loss": 0.008, + "step": 575850 + }, + { + "epoch": 1.49, + "learning_rate": 7.609317203283727e-05, + "loss": 0.0081, + "step": 575860 + }, + { + "epoch": 1.49, + "learning_rate": 7.608928381646581e-05, + "loss": 0.0065, + "step": 575870 + }, + { + "epoch": 1.49, + "learning_rate": 7.608539560009434e-05, + "loss": 0.0099, + "step": 575880 + }, + { + "epoch": 1.49, + "learning_rate": 7.608150738372288e-05, + "loss": 0.0095, + "step": 575890 + }, + { + "epoch": 1.49, + "learning_rate": 7.60776191673514e-05, + "loss": 0.0117, + "step": 575900 + }, + { + "epoch": 1.49, + "learning_rate": 7.607373095097996e-05, + "loss": 0.0103, + "step": 575910 + }, + { + "epoch": 1.49, + "learning_rate": 7.606984273460848e-05, + "loss": 0.0124, + "step": 575920 + }, + { + "epoch": 1.49, + "learning_rate": 7.606595451823703e-05, + "loss": 0.0111, + "step": 575930 + }, + { + "epoch": 1.49, + "learning_rate": 7.606206630186556e-05, + "loss": 0.0116, + "step": 575940 + }, + { + "epoch": 1.49, + "learning_rate": 7.60581780854941e-05, + "loss": 0.0093, + "step": 575950 + }, + { + "epoch": 1.49, + "learning_rate": 7.605428986912263e-05, + "loss": 0.0079, + "step": 575960 + }, + { + "epoch": 1.49, + "learning_rate": 7.605040165275117e-05, + "loss": 0.0063, + "step": 575970 + }, + { + "epoch": 1.49, + "learning_rate": 7.60465134363797e-05, + "loss": 0.0094, + "step": 575980 + }, + { + "epoch": 1.49, + "learning_rate": 7.604262522000824e-05, + "loss": 0.01, + "step": 575990 + }, + { + "epoch": 1.49, + "learning_rate": 7.603873700363677e-05, + "loss": 0.0092, + "step": 576000 + }, + { + "epoch": 1.49, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.006118689198046923, + "eval_runtime": 107.8667, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, + "step": 576000 + }, + { + "epoch": 1.49, + "learning_rate": 7.603484878726531e-05, + "loss": 0.0081, + "step": 576010 + }, + { + "epoch": 1.49, + "learning_rate": 7.603096057089384e-05, + "loss": 0.012, + "step": 576020 + }, + { + "epoch": 1.49, + "learning_rate": 7.602707235452238e-05, + "loss": 0.0107, + "step": 576030 + }, + { + "epoch": 1.49, + "learning_rate": 7.602318413815091e-05, + "loss": 0.0091, + "step": 576040 + }, + { + "epoch": 1.49, + "learning_rate": 7.601929592177945e-05, + "loss": 0.0082, + "step": 576050 + }, + { + "epoch": 1.49, + "learning_rate": 7.601540770540798e-05, + "loss": 0.0099, + "step": 576060 + }, + { + "epoch": 1.49, + "learning_rate": 7.601151948903653e-05, + "loss": 0.0087, + "step": 576070 + }, + { + "epoch": 1.49, + "learning_rate": 7.600763127266505e-05, + "loss": 0.0082, + "step": 576080 + }, + { + "epoch": 1.49, + "learning_rate": 7.60037430562936e-05, + "loss": 0.0099, + "step": 576090 + }, + { + "epoch": 1.49, + "learning_rate": 7.599985483992213e-05, + "loss": 0.008, + "step": 576100 + }, + { + "epoch": 1.49, + "learning_rate": 7.599596662355066e-05, + "loss": 0.0109, + "step": 576110 + }, + { + "epoch": 1.49, + "learning_rate": 7.59920784071792e-05, + "loss": 0.0103, + "step": 576120 + }, + { + "epoch": 1.49, + "learning_rate": 7.598819019080773e-05, + "loss": 0.0084, + "step": 576130 + }, + { + "epoch": 1.49, + "learning_rate": 7.598430197443627e-05, + "loss": 0.0095, + "step": 576140 + }, + { + "epoch": 1.49, + "learning_rate": 7.59804137580648e-05, + "loss": 0.015, + "step": 576150 + }, + { + "epoch": 1.49, + "learning_rate": 7.597652554169334e-05, + "loss": 0.0118, + "step": 576160 + }, + { + "epoch": 1.49, + "learning_rate": 7.597263732532187e-05, + "loss": 0.0106, + "step": 576170 + }, + { + "epoch": 1.49, + "learning_rate": 7.596874910895041e-05, + "loss": 0.0074, + "step": 576180 + }, + { + "epoch": 1.49, + "learning_rate": 7.596486089257894e-05, + "loss": 0.0069, + "step": 576190 + }, + { + "epoch": 1.49, + "learning_rate": 7.596097267620748e-05, + "loss": 0.0083, + "step": 576200 + }, + { + "epoch": 1.49, + "learning_rate": 7.595708445983601e-05, + "loss": 0.0112, + "step": 576210 + }, + { + "epoch": 1.49, + "learning_rate": 7.595319624346455e-05, + "loss": 0.0083, + "step": 576220 + }, + { + "epoch": 1.49, + "learning_rate": 7.594930802709308e-05, + "loss": 0.0099, + "step": 576230 + }, + { + "epoch": 1.49, + "learning_rate": 7.594541981072162e-05, + "loss": 0.0106, + "step": 576240 + }, + { + "epoch": 1.49, + "learning_rate": 7.594153159435015e-05, + "loss": 0.0072, + "step": 576250 + }, + { + "epoch": 1.49, + "learning_rate": 7.59376433779787e-05, + "loss": 0.0093, + "step": 576260 + }, + { + "epoch": 1.49, + "learning_rate": 7.593375516160723e-05, + "loss": 0.0081, + "step": 576270 + }, + { + "epoch": 1.49, + "learning_rate": 7.592986694523577e-05, + "loss": 0.0089, + "step": 576280 + }, + { + "epoch": 1.49, + "learning_rate": 7.59259787288643e-05, + "loss": 0.0102, + "step": 576290 + }, + { + "epoch": 1.49, + "learning_rate": 7.592209051249284e-05, + "loss": 0.008, + "step": 576300 + }, + { + "epoch": 1.49, + "learning_rate": 7.591820229612137e-05, + "loss": 0.0117, + "step": 576310 + }, + { + "epoch": 1.49, + "learning_rate": 7.591431407974991e-05, + "loss": 0.0074, + "step": 576320 + }, + { + "epoch": 1.49, + "learning_rate": 7.591042586337844e-05, + "loss": 0.0096, + "step": 576330 + }, + { + "epoch": 1.49, + "learning_rate": 7.590653764700698e-05, + "loss": 0.009, + "step": 576340 + }, + { + "epoch": 1.49, + "learning_rate": 7.590264943063551e-05, + "loss": 0.0086, + "step": 576350 + }, + { + "epoch": 1.49, + "learning_rate": 7.589876121426404e-05, + "loss": 0.0097, + "step": 576360 + }, + { + "epoch": 1.49, + "learning_rate": 7.589487299789258e-05, + "loss": 0.0137, + "step": 576370 + }, + { + "epoch": 1.49, + "learning_rate": 7.589098478152111e-05, + "loss": 0.0084, + "step": 576380 + }, + { + "epoch": 1.49, + "learning_rate": 7.588709656514965e-05, + "loss": 0.0094, + "step": 576390 + }, + { + "epoch": 1.49, + "learning_rate": 7.588320834877818e-05, + "loss": 0.0106, + "step": 576400 + }, + { + "epoch": 1.49, + "learning_rate": 7.587932013240672e-05, + "loss": 0.0079, + "step": 576410 + }, + { + "epoch": 1.49, + "learning_rate": 7.587543191603525e-05, + "loss": 0.0081, + "step": 576420 + }, + { + "epoch": 1.49, + "learning_rate": 7.58715436996638e-05, + "loss": 0.0075, + "step": 576430 + }, + { + "epoch": 1.49, + "learning_rate": 7.586765548329232e-05, + "loss": 0.0127, + "step": 576440 + }, + { + "epoch": 1.49, + "learning_rate": 7.586376726692087e-05, + "loss": 0.0078, + "step": 576450 + }, + { + "epoch": 1.49, + "learning_rate": 7.58598790505494e-05, + "loss": 0.0111, + "step": 576460 + }, + { + "epoch": 1.49, + "learning_rate": 7.585599083417794e-05, + "loss": 0.0146, + "step": 576470 + }, + { + "epoch": 1.49, + "learning_rate": 7.585210261780647e-05, + "loss": 0.0079, + "step": 576480 + }, + { + "epoch": 1.49, + "learning_rate": 7.584821440143501e-05, + "loss": 0.0104, + "step": 576490 + }, + { + "epoch": 1.49, + "learning_rate": 7.584432618506354e-05, + "loss": 0.0077, + "step": 576500 + }, + { + "epoch": 1.49, + "learning_rate": 7.584043796869208e-05, + "loss": 0.0091, + "step": 576510 + }, + { + "epoch": 1.49, + "learning_rate": 7.583654975232061e-05, + "loss": 0.0104, + "step": 576520 + }, + { + "epoch": 1.49, + "learning_rate": 7.583266153594915e-05, + "loss": 0.0086, + "step": 576530 + }, + { + "epoch": 1.49, + "learning_rate": 7.582877331957768e-05, + "loss": 0.0085, + "step": 576540 + }, + { + "epoch": 1.49, + "learning_rate": 7.582488510320622e-05, + "loss": 0.0093, + "step": 576550 + }, + { + "epoch": 1.49, + "learning_rate": 7.582099688683475e-05, + "loss": 0.0097, + "step": 576560 + }, + { + "epoch": 1.49, + "learning_rate": 7.581710867046329e-05, + "loss": 0.0063, + "step": 576570 + }, + { + "epoch": 1.49, + "learning_rate": 7.581322045409182e-05, + "loss": 0.0067, + "step": 576580 + }, + { + "epoch": 1.49, + "learning_rate": 7.580933223772036e-05, + "loss": 0.0166, + "step": 576590 + }, + { + "epoch": 1.49, + "learning_rate": 7.580544402134889e-05, + "loss": 0.0083, + "step": 576600 + }, + { + "epoch": 1.49, + "learning_rate": 7.580155580497742e-05, + "loss": 0.0073, + "step": 576610 + }, + { + "epoch": 1.49, + "learning_rate": 7.579766758860597e-05, + "loss": 0.0068, + "step": 576620 + }, + { + "epoch": 1.49, + "learning_rate": 7.57937793722345e-05, + "loss": 0.0076, + "step": 576630 + }, + { + "epoch": 1.49, + "learning_rate": 7.578989115586304e-05, + "loss": 0.0097, + "step": 576640 + }, + { + "epoch": 1.49, + "learning_rate": 7.578600293949157e-05, + "loss": 0.0098, + "step": 576650 + }, + { + "epoch": 1.49, + "learning_rate": 7.578211472312011e-05, + "loss": 0.0097, + "step": 576660 + }, + { + "epoch": 1.49, + "learning_rate": 7.577822650674864e-05, + "loss": 0.0091, + "step": 576670 + }, + { + "epoch": 1.49, + "learning_rate": 7.577433829037718e-05, + "loss": 0.0092, + "step": 576680 + }, + { + "epoch": 1.49, + "learning_rate": 7.577045007400571e-05, + "loss": 0.0087, + "step": 576690 + }, + { + "epoch": 1.49, + "learning_rate": 7.576656185763425e-05, + "loss": 0.0115, + "step": 576700 + }, + { + "epoch": 1.49, + "learning_rate": 7.576267364126278e-05, + "loss": 0.0093, + "step": 576710 + }, + { + "epoch": 1.49, + "learning_rate": 7.575878542489132e-05, + "loss": 0.0079, + "step": 576720 + }, + { + "epoch": 1.49, + "learning_rate": 7.575489720851985e-05, + "loss": 0.0087, + "step": 576730 + }, + { + "epoch": 1.49, + "learning_rate": 7.575100899214839e-05, + "loss": 0.0088, + "step": 576740 + }, + { + "epoch": 1.5, + "learning_rate": 7.574712077577692e-05, + "loss": 0.0105, + "step": 576750 + }, + { + "epoch": 1.5, + "learning_rate": 7.574323255940546e-05, + "loss": 0.0109, + "step": 576760 + }, + { + "epoch": 1.5, + "learning_rate": 7.573934434303399e-05, + "loss": 0.0063, + "step": 576770 + }, + { + "epoch": 1.5, + "learning_rate": 7.573545612666254e-05, + "loss": 0.0092, + "step": 576780 + }, + { + "epoch": 1.5, + "learning_rate": 7.573156791029106e-05, + "loss": 0.006, + "step": 576790 + }, + { + "epoch": 1.5, + "learning_rate": 7.572767969391961e-05, + "loss": 0.0077, + "step": 576800 + }, + { + "epoch": 1.5, + "learning_rate": 7.572379147754814e-05, + "loss": 0.0072, + "step": 576810 + }, + { + "epoch": 1.5, + "learning_rate": 7.571990326117668e-05, + "loss": 0.0111, + "step": 576820 + }, + { + "epoch": 1.5, + "learning_rate": 7.571601504480521e-05, + "loss": 0.0079, + "step": 576830 + }, + { + "epoch": 1.5, + "learning_rate": 7.571212682843375e-05, + "loss": 0.0112, + "step": 576840 + }, + { + "epoch": 1.5, + "learning_rate": 7.570823861206228e-05, + "loss": 0.0097, + "step": 576850 + }, + { + "epoch": 1.5, + "learning_rate": 7.570435039569081e-05, + "loss": 0.0095, + "step": 576860 + }, + { + "epoch": 1.5, + "learning_rate": 7.570046217931935e-05, + "loss": 0.009, + "step": 576870 + }, + { + "epoch": 1.5, + "learning_rate": 7.569657396294788e-05, + "loss": 0.0086, + "step": 576880 + }, + { + "epoch": 1.5, + "learning_rate": 7.569268574657642e-05, + "loss": 0.0092, + "step": 576890 + }, + { + "epoch": 1.5, + "learning_rate": 7.568879753020495e-05, + "loss": 0.006, + "step": 576900 + }, + { + "epoch": 1.5, + "learning_rate": 7.568490931383349e-05, + "loss": 0.0078, + "step": 576910 + }, + { + "epoch": 1.5, + "learning_rate": 7.568102109746202e-05, + "loss": 0.0079, + "step": 576920 + }, + { + "epoch": 1.5, + "learning_rate": 7.567713288109056e-05, + "loss": 0.0094, + "step": 576930 + }, + { + "epoch": 1.5, + "learning_rate": 7.567324466471909e-05, + "loss": 0.0076, + "step": 576940 + }, + { + "epoch": 1.5, + "learning_rate": 7.566935644834763e-05, + "loss": 0.011, + "step": 576950 + }, + { + "epoch": 1.5, + "learning_rate": 7.566546823197616e-05, + "loss": 0.0092, + "step": 576960 + }, + { + "epoch": 1.5, + "learning_rate": 7.566158001560471e-05, + "loss": 0.0076, + "step": 576970 + }, + { + "epoch": 1.5, + "learning_rate": 7.565769179923324e-05, + "loss": 0.0097, + "step": 576980 + }, + { + "epoch": 1.5, + "learning_rate": 7.565380358286178e-05, + "loss": 0.0102, + "step": 576990 + }, + { + "epoch": 1.5, + "learning_rate": 7.564991536649031e-05, + "loss": 0.0079, + "step": 577000 + }, + { + "epoch": 1.5, + "eval_cer": 0.8817180823294437, + "eval_loss": 0.006126715801656246, + "eval_runtime": 107.6241, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, + "step": 577000 + }, + { + "epoch": 1.5, + "learning_rate": 7.564602715011885e-05, + "loss": 0.0096, + "step": 577010 + }, + { + "epoch": 1.5, + "learning_rate": 7.564213893374738e-05, + "loss": 0.0107, + "step": 577020 + }, + { + "epoch": 1.5, + "learning_rate": 7.563825071737592e-05, + "loss": 0.0106, + "step": 577030 + }, + { + "epoch": 1.5, + "learning_rate": 7.563436250100445e-05, + "loss": 0.0128, + "step": 577040 + }, + { + "epoch": 1.5, + "learning_rate": 7.563047428463299e-05, + "loss": 0.0089, + "step": 577050 + }, + { + "epoch": 1.5, + "learning_rate": 7.562658606826152e-05, + "loss": 0.0097, + "step": 577060 + }, + { + "epoch": 1.5, + "learning_rate": 7.562269785189006e-05, + "loss": 0.0099, + "step": 577070 + }, + { + "epoch": 1.5, + "learning_rate": 7.561880963551859e-05, + "loss": 0.0077, + "step": 577080 + }, + { + "epoch": 1.5, + "learning_rate": 7.561492141914713e-05, + "loss": 0.0076, + "step": 577090 + }, + { + "epoch": 1.5, + "learning_rate": 7.561103320277566e-05, + "loss": 0.0075, + "step": 577100 + }, + { + "epoch": 1.5, + "learning_rate": 7.560714498640419e-05, + "loss": 0.0074, + "step": 577110 + }, + { + "epoch": 1.5, + "learning_rate": 7.560325677003273e-05, + "loss": 0.0083, + "step": 577120 + }, + { + "epoch": 1.5, + "learning_rate": 7.559936855366126e-05, + "loss": 0.0102, + "step": 577130 + }, + { + "epoch": 1.5, + "learning_rate": 7.559548033728981e-05, + "loss": 0.0106, + "step": 577140 + }, + { + "epoch": 1.5, + "learning_rate": 7.559159212091833e-05, + "loss": 0.0082, + "step": 577150 + }, + { + "epoch": 1.5, + "learning_rate": 7.558770390454688e-05, + "loss": 0.0078, + "step": 577160 + }, + { + "epoch": 1.5, + "learning_rate": 7.558381568817541e-05, + "loss": 0.0097, + "step": 577170 + }, + { + "epoch": 1.5, + "learning_rate": 7.557992747180395e-05, + "loss": 0.0086, + "step": 577180 + }, + { + "epoch": 1.5, + "learning_rate": 7.557603925543248e-05, + "loss": 0.0122, + "step": 577190 + }, + { + "epoch": 1.5, + "learning_rate": 7.557215103906102e-05, + "loss": 0.0085, + "step": 577200 + }, + { + "epoch": 1.5, + "learning_rate": 7.556826282268955e-05, + "loss": 0.0099, + "step": 577210 + }, + { + "epoch": 1.5, + "learning_rate": 7.556437460631809e-05, + "loss": 0.0092, + "step": 577220 + }, + { + "epoch": 1.5, + "learning_rate": 7.556048638994662e-05, + "loss": 0.007, + "step": 577230 + }, + { + "epoch": 1.5, + "learning_rate": 7.555659817357516e-05, + "loss": 0.0101, + "step": 577240 + }, + { + "epoch": 1.5, + "learning_rate": 7.555270995720369e-05, + "loss": 0.0094, + "step": 577250 + }, + { + "epoch": 1.5, + "learning_rate": 7.554882174083223e-05, + "loss": 0.0087, + "step": 577260 + }, + { + "epoch": 1.5, + "learning_rate": 7.554493352446076e-05, + "loss": 0.0076, + "step": 577270 + }, + { + "epoch": 1.5, + "learning_rate": 7.55410453080893e-05, + "loss": 0.0099, + "step": 577280 + }, + { + "epoch": 1.5, + "learning_rate": 7.553715709171783e-05, + "loss": 0.0126, + "step": 577290 + }, + { + "epoch": 1.5, + "learning_rate": 7.553326887534638e-05, + "loss": 0.0104, + "step": 577300 + }, + { + "epoch": 1.5, + "learning_rate": 7.55293806589749e-05, + "loss": 0.011, + "step": 577310 + }, + { + "epoch": 1.5, + "learning_rate": 7.552549244260345e-05, + "loss": 0.0067, + "step": 577320 + }, + { + "epoch": 1.5, + "learning_rate": 7.552160422623198e-05, + "loss": 0.0155, + "step": 577330 + }, + { + "epoch": 1.5, + "learning_rate": 7.551771600986052e-05, + "loss": 0.0092, + "step": 577340 + }, + { + "epoch": 1.5, + "learning_rate": 7.551382779348905e-05, + "loss": 0.0098, + "step": 577350 + }, + { + "epoch": 1.5, + "learning_rate": 7.550993957711758e-05, + "loss": 0.0089, + "step": 577360 + }, + { + "epoch": 1.5, + "learning_rate": 7.550605136074612e-05, + "loss": 0.0124, + "step": 577370 + }, + { + "epoch": 1.5, + "learning_rate": 7.550216314437465e-05, + "loss": 0.0058, + "step": 577380 + }, + { + "epoch": 1.5, + "learning_rate": 7.549827492800319e-05, + "loss": 0.0097, + "step": 577390 + }, + { + "epoch": 1.5, + "learning_rate": 7.549438671163172e-05, + "loss": 0.0072, + "step": 577400 + }, + { + "epoch": 1.5, + "learning_rate": 7.549049849526026e-05, + "loss": 0.0094, + "step": 577410 + }, + { + "epoch": 1.5, + "learning_rate": 7.548661027888879e-05, + "loss": 0.0113, + "step": 577420 + }, + { + "epoch": 1.5, + "learning_rate": 7.548272206251733e-05, + "loss": 0.0091, + "step": 577430 + }, + { + "epoch": 1.5, + "learning_rate": 7.547883384614586e-05, + "loss": 0.0076, + "step": 577440 + }, + { + "epoch": 1.5, + "learning_rate": 7.54749456297744e-05, + "loss": 0.0062, + "step": 577450 + }, + { + "epoch": 1.5, + "learning_rate": 7.547105741340293e-05, + "loss": 0.0103, + "step": 577460 + }, + { + "epoch": 1.5, + "learning_rate": 7.546716919703147e-05, + "loss": 0.0118, + "step": 577470 + }, + { + "epoch": 1.5, + "learning_rate": 7.546328098066e-05, + "loss": 0.0081, + "step": 577480 + }, + { + "epoch": 1.5, + "learning_rate": 7.545939276428855e-05, + "loss": 0.01, + "step": 577490 + }, + { + "epoch": 1.5, + "learning_rate": 7.545550454791708e-05, + "loss": 0.0127, + "step": 577500 + }, + { + "epoch": 1.5, + "learning_rate": 7.545161633154562e-05, + "loss": 0.0081, + "step": 577510 + }, + { + "epoch": 1.5, + "learning_rate": 7.544772811517415e-05, + "loss": 0.01, + "step": 577520 + }, + { + "epoch": 1.5, + "learning_rate": 7.544383989880269e-05, + "loss": 0.008, + "step": 577530 + }, + { + "epoch": 1.5, + "learning_rate": 7.543995168243122e-05, + "loss": 0.0093, + "step": 577540 + }, + { + "epoch": 1.5, + "learning_rate": 7.543606346605976e-05, + "loss": 0.0064, + "step": 577550 + }, + { + "epoch": 1.5, + "learning_rate": 7.543217524968829e-05, + "loss": 0.0089, + "step": 577560 + }, + { + "epoch": 1.5, + "learning_rate": 7.542828703331683e-05, + "loss": 0.0075, + "step": 577570 + }, + { + "epoch": 1.5, + "learning_rate": 7.542439881694536e-05, + "loss": 0.007, + "step": 577580 + }, + { + "epoch": 1.5, + "learning_rate": 7.54205106005739e-05, + "loss": 0.0085, + "step": 577590 + }, + { + "epoch": 1.5, + "learning_rate": 7.541662238420243e-05, + "loss": 0.0108, + "step": 577600 + }, + { + "epoch": 1.5, + "learning_rate": 7.541273416783096e-05, + "loss": 0.0096, + "step": 577610 + }, + { + "epoch": 1.5, + "learning_rate": 7.54088459514595e-05, + "loss": 0.0083, + "step": 577620 + }, + { + "epoch": 1.5, + "learning_rate": 7.540495773508803e-05, + "loss": 0.0103, + "step": 577630 + }, + { + "epoch": 1.5, + "learning_rate": 7.540106951871657e-05, + "loss": 0.0088, + "step": 577640 + }, + { + "epoch": 1.5, + "learning_rate": 7.53971813023451e-05, + "loss": 0.0081, + "step": 577650 + }, + { + "epoch": 1.5, + "learning_rate": 7.539329308597365e-05, + "loss": 0.0091, + "step": 577660 + }, + { + "epoch": 1.5, + "learning_rate": 7.538940486960217e-05, + "loss": 0.0067, + "step": 577670 + }, + { + "epoch": 1.5, + "learning_rate": 7.538551665323072e-05, + "loss": 0.0053, + "step": 577680 + }, + { + "epoch": 1.5, + "learning_rate": 7.538162843685925e-05, + "loss": 0.0083, + "step": 577690 + }, + { + "epoch": 1.5, + "learning_rate": 7.537774022048779e-05, + "loss": 0.0112, + "step": 577700 + }, + { + "epoch": 1.5, + "learning_rate": 7.537385200411632e-05, + "loss": 0.0101, + "step": 577710 + }, + { + "epoch": 1.5, + "learning_rate": 7.536996378774486e-05, + "loss": 0.007, + "step": 577720 + }, + { + "epoch": 1.5, + "learning_rate": 7.536607557137339e-05, + "loss": 0.0101, + "step": 577730 + }, + { + "epoch": 1.5, + "learning_rate": 7.536218735500193e-05, + "loss": 0.0093, + "step": 577740 + }, + { + "epoch": 1.5, + "learning_rate": 7.535829913863046e-05, + "loss": 0.0074, + "step": 577750 + }, + { + "epoch": 1.5, + "learning_rate": 7.5354410922259e-05, + "loss": 0.0102, + "step": 577760 + }, + { + "epoch": 1.5, + "learning_rate": 7.535052270588753e-05, + "loss": 0.011, + "step": 577770 + }, + { + "epoch": 1.5, + "learning_rate": 7.534663448951607e-05, + "loss": 0.0068, + "step": 577780 + }, + { + "epoch": 1.5, + "learning_rate": 7.53427462731446e-05, + "loss": 0.0099, + "step": 577790 + }, + { + "epoch": 1.5, + "learning_rate": 7.533885805677314e-05, + "loss": 0.0074, + "step": 577800 + }, + { + "epoch": 1.5, + "learning_rate": 7.533496984040167e-05, + "loss": 0.0098, + "step": 577810 + }, + { + "epoch": 1.5, + "learning_rate": 7.533108162403022e-05, + "loss": 0.0105, + "step": 577820 + }, + { + "epoch": 1.5, + "learning_rate": 7.532719340765874e-05, + "loss": 0.0082, + "step": 577830 + }, + { + "epoch": 1.5, + "learning_rate": 7.532330519128729e-05, + "loss": 0.0083, + "step": 577840 + }, + { + "epoch": 1.5, + "learning_rate": 7.531941697491582e-05, + "loss": 0.0087, + "step": 577850 + }, + { + "epoch": 1.5, + "learning_rate": 7.531552875854435e-05, + "loss": 0.0074, + "step": 577860 + }, + { + "epoch": 1.5, + "learning_rate": 7.531164054217289e-05, + "loss": 0.0102, + "step": 577870 + }, + { + "epoch": 1.5, + "learning_rate": 7.530775232580142e-05, + "loss": 0.0104, + "step": 577880 + }, + { + "epoch": 1.5, + "learning_rate": 7.530386410942996e-05, + "loss": 0.0098, + "step": 577890 + }, + { + "epoch": 1.5, + "learning_rate": 7.529997589305849e-05, + "loss": 0.0124, + "step": 577900 + }, + { + "epoch": 1.5, + "learning_rate": 7.529608767668703e-05, + "loss": 0.0099, + "step": 577910 + }, + { + "epoch": 1.5, + "learning_rate": 7.529219946031556e-05, + "loss": 0.0104, + "step": 577920 + }, + { + "epoch": 1.5, + "learning_rate": 7.52883112439441e-05, + "loss": 0.0076, + "step": 577930 + }, + { + "epoch": 1.5, + "learning_rate": 7.528442302757263e-05, + "loss": 0.0065, + "step": 577940 + }, + { + "epoch": 1.5, + "learning_rate": 7.528053481120117e-05, + "loss": 0.0067, + "step": 577950 + }, + { + "epoch": 1.5, + "learning_rate": 7.52766465948297e-05, + "loss": 0.0064, + "step": 577960 + }, + { + "epoch": 1.5, + "learning_rate": 7.527275837845824e-05, + "loss": 0.0084, + "step": 577970 + }, + { + "epoch": 1.5, + "learning_rate": 7.526887016208677e-05, + "loss": 0.0079, + "step": 577980 + }, + { + "epoch": 1.5, + "learning_rate": 7.526498194571531e-05, + "loss": 0.0101, + "step": 577990 + }, + { + "epoch": 1.5, + "learning_rate": 7.526109372934384e-05, + "loss": 0.0082, + "step": 578000 + }, + { + "epoch": 1.5, + "eval_cer": 0.8817096845078387, + "eval_loss": 0.0061296941712498665, + "eval_runtime": 107.7949, + "eval_samples_per_second": 18.554, + "eval_steps_per_second": 4.638, + "step": 578000 + }, + { + "epoch": 1.5, + "learning_rate": 7.525720551297239e-05, + "loss": 0.0082, + "step": 578010 + }, + { + "epoch": 1.5, + "learning_rate": 7.525331729660092e-05, + "loss": 0.0083, + "step": 578020 + }, + { + "epoch": 1.5, + "learning_rate": 7.524942908022946e-05, + "loss": 0.0107, + "step": 578030 + }, + { + "epoch": 1.5, + "learning_rate": 7.524554086385799e-05, + "loss": 0.0096, + "step": 578040 + }, + { + "epoch": 1.5, + "learning_rate": 7.524165264748653e-05, + "loss": 0.0094, + "step": 578050 + }, + { + "epoch": 1.5, + "learning_rate": 7.523776443111506e-05, + "loss": 0.0067, + "step": 578060 + }, + { + "epoch": 1.5, + "learning_rate": 7.52338762147436e-05, + "loss": 0.0082, + "step": 578070 + }, + { + "epoch": 1.5, + "learning_rate": 7.522998799837213e-05, + "loss": 0.0116, + "step": 578080 + }, + { + "epoch": 1.5, + "learning_rate": 7.522609978200066e-05, + "loss": 0.0129, + "step": 578090 + }, + { + "epoch": 1.5, + "learning_rate": 7.52222115656292e-05, + "loss": 0.0099, + "step": 578100 + }, + { + "epoch": 1.5, + "learning_rate": 7.521832334925773e-05, + "loss": 0.0093, + "step": 578110 + }, + { + "epoch": 1.5, + "learning_rate": 7.521443513288627e-05, + "loss": 0.0102, + "step": 578120 + }, + { + "epoch": 1.5, + "learning_rate": 7.52105469165148e-05, + "loss": 0.0098, + "step": 578130 + }, + { + "epoch": 1.5, + "learning_rate": 7.520665870014334e-05, + "loss": 0.0078, + "step": 578140 + }, + { + "epoch": 1.5, + "learning_rate": 7.520277048377187e-05, + "loss": 0.0089, + "step": 578150 + }, + { + "epoch": 1.5, + "learning_rate": 7.519888226740041e-05, + "loss": 0.0081, + "step": 578160 + }, + { + "epoch": 1.5, + "learning_rate": 7.519499405102894e-05, + "loss": 0.0107, + "step": 578170 + }, + { + "epoch": 1.5, + "learning_rate": 7.519110583465748e-05, + "loss": 0.0104, + "step": 578180 + }, + { + "epoch": 1.5, + "learning_rate": 7.5187217618286e-05, + "loss": 0.0084, + "step": 578190 + }, + { + "epoch": 1.5, + "learning_rate": 7.518332940191456e-05, + "loss": 0.0098, + "step": 578200 + }, + { + "epoch": 1.5, + "learning_rate": 7.517944118554309e-05, + "loss": 0.0102, + "step": 578210 + }, + { + "epoch": 1.5, + "learning_rate": 7.517555296917163e-05, + "loss": 0.0077, + "step": 578220 + }, + { + "epoch": 1.5, + "learning_rate": 7.517166475280016e-05, + "loss": 0.0103, + "step": 578230 + }, + { + "epoch": 1.5, + "learning_rate": 7.51677765364287e-05, + "loss": 0.0106, + "step": 578240 + }, + { + "epoch": 1.5, + "learning_rate": 7.516388832005723e-05, + "loss": 0.0095, + "step": 578250 + }, + { + "epoch": 1.5, + "learning_rate": 7.516000010368577e-05, + "loss": 0.009, + "step": 578260 + }, + { + "epoch": 1.5, + "learning_rate": 7.51561118873143e-05, + "loss": 0.0061, + "step": 578270 + }, + { + "epoch": 1.5, + "learning_rate": 7.515222367094284e-05, + "loss": 0.0081, + "step": 578280 + }, + { + "epoch": 1.5, + "learning_rate": 7.514833545457137e-05, + "loss": 0.0132, + "step": 578290 + }, + { + "epoch": 1.5, + "learning_rate": 7.514444723819991e-05, + "loss": 0.0053, + "step": 578300 + }, + { + "epoch": 1.5, + "learning_rate": 7.514055902182844e-05, + "loss": 0.0113, + "step": 578310 + }, + { + "epoch": 1.5, + "learning_rate": 7.513667080545698e-05, + "loss": 0.0084, + "step": 578320 + }, + { + "epoch": 1.5, + "learning_rate": 7.51327825890855e-05, + "loss": 0.0112, + "step": 578330 + }, + { + "epoch": 1.5, + "learning_rate": 7.512889437271403e-05, + "loss": 0.0074, + "step": 578340 + }, + { + "epoch": 1.5, + "learning_rate": 7.512500615634258e-05, + "loss": 0.0129, + "step": 578350 + }, + { + "epoch": 1.5, + "learning_rate": 7.51211179399711e-05, + "loss": 0.0101, + "step": 578360 + }, + { + "epoch": 1.5, + "learning_rate": 7.511722972359966e-05, + "loss": 0.0143, + "step": 578370 + }, + { + "epoch": 1.5, + "learning_rate": 7.511334150722817e-05, + "loss": 0.0086, + "step": 578380 + }, + { + "epoch": 1.5, + "learning_rate": 7.510945329085673e-05, + "loss": 0.0103, + "step": 578390 + }, + { + "epoch": 1.5, + "learning_rate": 7.510556507448526e-05, + "loss": 0.0076, + "step": 578400 + }, + { + "epoch": 1.5, + "learning_rate": 7.51016768581138e-05, + "loss": 0.01, + "step": 578410 + }, + { + "epoch": 1.5, + "learning_rate": 7.509778864174233e-05, + "loss": 0.0125, + "step": 578420 + }, + { + "epoch": 1.5, + "learning_rate": 7.509390042537087e-05, + "loss": 0.0099, + "step": 578430 + }, + { + "epoch": 1.5, + "learning_rate": 7.50900122089994e-05, + "loss": 0.0115, + "step": 578440 + }, + { + "epoch": 1.5, + "learning_rate": 7.508612399262794e-05, + "loss": 0.0089, + "step": 578450 + }, + { + "epoch": 1.5, + "learning_rate": 7.508223577625647e-05, + "loss": 0.0071, + "step": 578460 + }, + { + "epoch": 1.5, + "learning_rate": 7.507834755988501e-05, + "loss": 0.0103, + "step": 578470 + }, + { + "epoch": 1.5, + "learning_rate": 7.507445934351354e-05, + "loss": 0.011, + "step": 578480 + }, + { + "epoch": 1.5, + "learning_rate": 7.507057112714208e-05, + "loss": 0.0139, + "step": 578490 + }, + { + "epoch": 1.5, + "learning_rate": 7.50666829107706e-05, + "loss": 0.0116, + "step": 578500 + }, + { + "epoch": 1.5, + "learning_rate": 7.506279469439915e-05, + "loss": 0.0096, + "step": 578510 + }, + { + "epoch": 1.5, + "learning_rate": 7.505890647802768e-05, + "loss": 0.0083, + "step": 578520 + }, + { + "epoch": 1.5, + "learning_rate": 7.505501826165623e-05, + "loss": 0.0096, + "step": 578530 + }, + { + "epoch": 1.5, + "learning_rate": 7.505113004528475e-05, + "loss": 0.0069, + "step": 578540 + }, + { + "epoch": 1.5, + "learning_rate": 7.50472418289133e-05, + "loss": 0.0074, + "step": 578550 + }, + { + "epoch": 1.5, + "learning_rate": 7.504335361254183e-05, + "loss": 0.0079, + "step": 578560 + }, + { + "epoch": 1.5, + "learning_rate": 7.503946539617037e-05, + "loss": 0.0103, + "step": 578570 + }, + { + "epoch": 1.5, + "learning_rate": 7.50355771797989e-05, + "loss": 0.0107, + "step": 578580 + }, + { + "epoch": 1.5, + "learning_rate": 7.503168896342743e-05, + "loss": 0.0101, + "step": 578590 + }, + { + "epoch": 1.5, + "learning_rate": 7.502780074705597e-05, + "loss": 0.0047, + "step": 578600 + }, + { + "epoch": 1.5, + "learning_rate": 7.50239125306845e-05, + "loss": 0.0092, + "step": 578610 + }, + { + "epoch": 1.5, + "learning_rate": 7.502002431431304e-05, + "loss": 0.0104, + "step": 578620 + }, + { + "epoch": 1.5, + "learning_rate": 7.501613609794157e-05, + "loss": 0.0112, + "step": 578630 + }, + { + "epoch": 1.5, + "learning_rate": 7.501224788157011e-05, + "loss": 0.0071, + "step": 578640 + }, + { + "epoch": 1.5, + "learning_rate": 7.500835966519864e-05, + "loss": 0.0122, + "step": 578650 + }, + { + "epoch": 1.5, + "learning_rate": 7.500447144882718e-05, + "loss": 0.0084, + "step": 578660 + }, + { + "epoch": 1.5, + "learning_rate": 7.50005832324557e-05, + "loss": 0.0098, + "step": 578670 + }, + { + "epoch": 1.5, + "learning_rate": 7.499669501608425e-05, + "loss": 0.008, + "step": 578680 + }, + { + "epoch": 1.5, + "learning_rate": 7.499280679971279e-05, + "loss": 0.008, + "step": 578690 + }, + { + "epoch": 1.5, + "learning_rate": 7.498891858334132e-05, + "loss": 0.0078, + "step": 578700 + }, + { + "epoch": 1.5, + "learning_rate": 7.498503036696984e-05, + "loss": 0.0128, + "step": 578710 + }, + { + "epoch": 1.5, + "learning_rate": 7.498114215059839e-05, + "loss": 0.008, + "step": 578720 + }, + { + "epoch": 1.5, + "learning_rate": 7.497725393422693e-05, + "loss": 0.0081, + "step": 578730 + }, + { + "epoch": 1.5, + "learning_rate": 7.497336571785546e-05, + "loss": 0.0087, + "step": 578740 + }, + { + "epoch": 1.5, + "learning_rate": 7.4969477501484e-05, + "loss": 0.0097, + "step": 578750 + }, + { + "epoch": 1.5, + "learning_rate": 7.496558928511253e-05, + "loss": 0.0129, + "step": 578760 + }, + { + "epoch": 1.5, + "learning_rate": 7.496170106874107e-05, + "loss": 0.0094, + "step": 578770 + }, + { + "epoch": 1.5, + "learning_rate": 7.49578128523696e-05, + "loss": 0.0072, + "step": 578780 + }, + { + "epoch": 1.5, + "learning_rate": 7.495392463599814e-05, + "loss": 0.0078, + "step": 578790 + }, + { + "epoch": 1.5, + "learning_rate": 7.495003641962667e-05, + "loss": 0.0112, + "step": 578800 + }, + { + "epoch": 1.5, + "learning_rate": 7.494614820325521e-05, + "loss": 0.0107, + "step": 578810 + }, + { + "epoch": 1.5, + "learning_rate": 7.494225998688375e-05, + "loss": 0.0084, + "step": 578820 + }, + { + "epoch": 1.5, + "learning_rate": 7.493837177051228e-05, + "loss": 0.0091, + "step": 578830 + }, + { + "epoch": 1.5, + "learning_rate": 7.493448355414082e-05, + "loss": 0.0074, + "step": 578840 + }, + { + "epoch": 1.5, + "learning_rate": 7.493059533776935e-05, + "loss": 0.0096, + "step": 578850 + }, + { + "epoch": 1.5, + "learning_rate": 7.492670712139789e-05, + "loss": 0.0082, + "step": 578860 + }, + { + "epoch": 1.5, + "learning_rate": 7.492281890502642e-05, + "loss": 0.0077, + "step": 578870 + }, + { + "epoch": 1.5, + "learning_rate": 7.491893068865496e-05, + "loss": 0.0072, + "step": 578880 + }, + { + "epoch": 1.5, + "learning_rate": 7.49150424722835e-05, + "loss": 0.0128, + "step": 578890 + }, + { + "epoch": 1.5, + "learning_rate": 7.491115425591203e-05, + "loss": 0.0079, + "step": 578900 + }, + { + "epoch": 1.5, + "learning_rate": 7.490726603954057e-05, + "loss": 0.0068, + "step": 578910 + }, + { + "epoch": 1.5, + "learning_rate": 7.49033778231691e-05, + "loss": 0.0074, + "step": 578920 + }, + { + "epoch": 1.5, + "learning_rate": 7.489948960679764e-05, + "loss": 0.007, + "step": 578930 + }, + { + "epoch": 1.5, + "learning_rate": 7.489560139042617e-05, + "loss": 0.0067, + "step": 578940 + }, + { + "epoch": 1.5, + "learning_rate": 7.489171317405471e-05, + "loss": 0.0077, + "step": 578950 + }, + { + "epoch": 1.5, + "learning_rate": 7.488782495768324e-05, + "loss": 0.0074, + "step": 578960 + }, + { + "epoch": 1.5, + "learning_rate": 7.488393674131176e-05, + "loss": 0.0073, + "step": 578970 + }, + { + "epoch": 1.5, + "learning_rate": 7.48800485249403e-05, + "loss": 0.0092, + "step": 578980 + }, + { + "epoch": 1.5, + "learning_rate": 7.487616030856885e-05, + "loss": 0.0082, + "step": 578990 + }, + { + "epoch": 1.5, + "learning_rate": 7.487227209219738e-05, + "loss": 0.0089, + "step": 579000 + }, + { + "epoch": 1.5, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.006176051218062639, + "eval_runtime": 107.8782, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 579000 + }, + { + "epoch": 1.5, + "learning_rate": 7.486838387582592e-05, + "loss": 0.0083, + "step": 579010 + }, + { + "epoch": 1.5, + "learning_rate": 7.486449565945445e-05, + "loss": 0.0091, + "step": 579020 + }, + { + "epoch": 1.5, + "learning_rate": 7.486060744308299e-05, + "loss": 0.0065, + "step": 579030 + }, + { + "epoch": 1.5, + "learning_rate": 7.485671922671152e-05, + "loss": 0.0124, + "step": 579040 + }, + { + "epoch": 1.5, + "learning_rate": 7.485283101034006e-05, + "loss": 0.0071, + "step": 579050 + }, + { + "epoch": 1.5, + "learning_rate": 7.484894279396859e-05, + "loss": 0.0072, + "step": 579060 + }, + { + "epoch": 1.5, + "learning_rate": 7.484505457759713e-05, + "loss": 0.0085, + "step": 579070 + }, + { + "epoch": 1.5, + "learning_rate": 7.484116636122567e-05, + "loss": 0.0092, + "step": 579080 + }, + { + "epoch": 1.5, + "learning_rate": 7.48372781448542e-05, + "loss": 0.0072, + "step": 579090 + }, + { + "epoch": 1.5, + "learning_rate": 7.483338992848274e-05, + "loss": 0.0103, + "step": 579100 + }, + { + "epoch": 1.5, + "learning_rate": 7.482950171211127e-05, + "loss": 0.0097, + "step": 579110 + }, + { + "epoch": 1.5, + "learning_rate": 7.482561349573981e-05, + "loss": 0.0084, + "step": 579120 + }, + { + "epoch": 1.5, + "learning_rate": 7.482172527936834e-05, + "loss": 0.0086, + "step": 579130 + }, + { + "epoch": 1.5, + "learning_rate": 7.481783706299688e-05, + "loss": 0.0075, + "step": 579140 + }, + { + "epoch": 1.5, + "learning_rate": 7.481394884662542e-05, + "loss": 0.0078, + "step": 579150 + }, + { + "epoch": 1.5, + "learning_rate": 7.481006063025395e-05, + "loss": 0.0096, + "step": 579160 + }, + { + "epoch": 1.5, + "learning_rate": 7.480617241388249e-05, + "loss": 0.0086, + "step": 579170 + }, + { + "epoch": 1.5, + "learning_rate": 7.480228419751102e-05, + "loss": 0.0086, + "step": 579180 + }, + { + "epoch": 1.5, + "learning_rate": 7.479839598113956e-05, + "loss": 0.0108, + "step": 579190 + }, + { + "epoch": 1.5, + "learning_rate": 7.479450776476809e-05, + "loss": 0.0085, + "step": 579200 + }, + { + "epoch": 1.5, + "learning_rate": 7.479061954839662e-05, + "loss": 0.0086, + "step": 579210 + }, + { + "epoch": 1.5, + "learning_rate": 7.478673133202516e-05, + "loss": 0.0112, + "step": 579220 + }, + { + "epoch": 1.5, + "learning_rate": 7.478284311565368e-05, + "loss": 0.0112, + "step": 579230 + }, + { + "epoch": 1.5, + "learning_rate": 7.477895489928223e-05, + "loss": 0.0087, + "step": 579240 + }, + { + "epoch": 1.5, + "learning_rate": 7.477506668291077e-05, + "loss": 0.0075, + "step": 579250 + }, + { + "epoch": 1.5, + "learning_rate": 7.47711784665393e-05, + "loss": 0.0083, + "step": 579260 + }, + { + "epoch": 1.5, + "learning_rate": 7.476729025016784e-05, + "loss": 0.0081, + "step": 579270 + }, + { + "epoch": 1.5, + "learning_rate": 7.476340203379637e-05, + "loss": 0.009, + "step": 579280 + }, + { + "epoch": 1.5, + "learning_rate": 7.475951381742491e-05, + "loss": 0.0097, + "step": 579290 + }, + { + "epoch": 1.5, + "learning_rate": 7.475562560105344e-05, + "loss": 0.0104, + "step": 579300 + }, + { + "epoch": 1.5, + "learning_rate": 7.475173738468198e-05, + "loss": 0.0105, + "step": 579310 + }, + { + "epoch": 1.5, + "learning_rate": 7.47478491683105e-05, + "loss": 0.0089, + "step": 579320 + }, + { + "epoch": 1.5, + "learning_rate": 7.474396095193905e-05, + "loss": 0.017, + "step": 579330 + }, + { + "epoch": 1.5, + "learning_rate": 7.474007273556759e-05, + "loss": 0.0089, + "step": 579340 + }, + { + "epoch": 1.5, + "learning_rate": 7.473618451919612e-05, + "loss": 0.0118, + "step": 579350 + }, + { + "epoch": 1.5, + "learning_rate": 7.473229630282466e-05, + "loss": 0.012, + "step": 579360 + }, + { + "epoch": 1.5, + "learning_rate": 7.472840808645319e-05, + "loss": 0.0076, + "step": 579370 + }, + { + "epoch": 1.5, + "learning_rate": 7.472451987008173e-05, + "loss": 0.0078, + "step": 579380 + }, + { + "epoch": 1.5, + "learning_rate": 7.472063165371026e-05, + "loss": 0.009, + "step": 579390 + }, + { + "epoch": 1.5, + "learning_rate": 7.47167434373388e-05, + "loss": 0.0079, + "step": 579400 + }, + { + "epoch": 1.5, + "learning_rate": 7.471285522096733e-05, + "loss": 0.0083, + "step": 579410 + }, + { + "epoch": 1.5, + "learning_rate": 7.470896700459587e-05, + "loss": 0.0079, + "step": 579420 + }, + { + "epoch": 1.5, + "learning_rate": 7.470507878822441e-05, + "loss": 0.0077, + "step": 579430 + }, + { + "epoch": 1.5, + "learning_rate": 7.470119057185294e-05, + "loss": 0.007, + "step": 579440 + }, + { + "epoch": 1.5, + "learning_rate": 7.469730235548148e-05, + "loss": 0.01, + "step": 579450 + }, + { + "epoch": 1.5, + "learning_rate": 7.469341413911001e-05, + "loss": 0.0088, + "step": 579460 + }, + { + "epoch": 1.5, + "learning_rate": 7.468952592273853e-05, + "loss": 0.0099, + "step": 579470 + }, + { + "epoch": 1.5, + "learning_rate": 7.468563770636708e-05, + "loss": 0.0082, + "step": 579480 + }, + { + "epoch": 1.5, + "learning_rate": 7.46817494899956e-05, + "loss": 0.0084, + "step": 579490 + }, + { + "epoch": 1.5, + "learning_rate": 7.467786127362415e-05, + "loss": 0.0125, + "step": 579500 + }, + { + "epoch": 1.5, + "learning_rate": 7.467397305725267e-05, + "loss": 0.01, + "step": 579510 + }, + { + "epoch": 1.5, + "learning_rate": 7.467008484088122e-05, + "loss": 0.0089, + "step": 579520 + }, + { + "epoch": 1.5, + "learning_rate": 7.466619662450976e-05, + "loss": 0.0093, + "step": 579530 + }, + { + "epoch": 1.5, + "learning_rate": 7.466230840813829e-05, + "loss": 0.0106, + "step": 579540 + }, + { + "epoch": 1.5, + "learning_rate": 7.465842019176683e-05, + "loss": 0.0106, + "step": 579550 + }, + { + "epoch": 1.5, + "learning_rate": 7.465453197539536e-05, + "loss": 0.0071, + "step": 579560 + }, + { + "epoch": 1.5, + "learning_rate": 7.46506437590239e-05, + "loss": 0.0081, + "step": 579570 + }, + { + "epoch": 1.5, + "learning_rate": 7.464675554265243e-05, + "loss": 0.0103, + "step": 579580 + }, + { + "epoch": 1.5, + "learning_rate": 7.464286732628097e-05, + "loss": 0.0089, + "step": 579590 + }, + { + "epoch": 1.5, + "learning_rate": 7.463897910990951e-05, + "loss": 0.0102, + "step": 579600 + }, + { + "epoch": 1.5, + "learning_rate": 7.463509089353804e-05, + "loss": 0.009, + "step": 579610 + }, + { + "epoch": 1.5, + "learning_rate": 7.463120267716658e-05, + "loss": 0.0097, + "step": 579620 + }, + { + "epoch": 1.5, + "learning_rate": 7.46273144607951e-05, + "loss": 0.0155, + "step": 579630 + }, + { + "epoch": 1.5, + "learning_rate": 7.462342624442365e-05, + "loss": 0.0081, + "step": 579640 + }, + { + "epoch": 1.5, + "learning_rate": 7.461953802805218e-05, + "loss": 0.0084, + "step": 579650 + }, + { + "epoch": 1.5, + "learning_rate": 7.461564981168072e-05, + "loss": 0.0107, + "step": 579660 + }, + { + "epoch": 1.5, + "learning_rate": 7.461176159530925e-05, + "loss": 0.008, + "step": 579670 + }, + { + "epoch": 1.5, + "learning_rate": 7.460787337893779e-05, + "loss": 0.0082, + "step": 579680 + }, + { + "epoch": 1.5, + "learning_rate": 7.460398516256633e-05, + "loss": 0.0089, + "step": 579690 + }, + { + "epoch": 1.5, + "learning_rate": 7.460009694619486e-05, + "loss": 0.0089, + "step": 579700 + }, + { + "epoch": 1.5, + "learning_rate": 7.459620872982339e-05, + "loss": 0.0079, + "step": 579710 + }, + { + "epoch": 1.5, + "learning_rate": 7.459232051345193e-05, + "loss": 0.0093, + "step": 579720 + }, + { + "epoch": 1.5, + "learning_rate": 7.458843229708045e-05, + "loss": 0.0082, + "step": 579730 + }, + { + "epoch": 1.5, + "learning_rate": 7.4584544080709e-05, + "loss": 0.0078, + "step": 579740 + }, + { + "epoch": 1.5, + "learning_rate": 7.458065586433752e-05, + "loss": 0.0098, + "step": 579750 + }, + { + "epoch": 1.5, + "learning_rate": 7.457676764796607e-05, + "loss": 0.0076, + "step": 579760 + }, + { + "epoch": 1.5, + "learning_rate": 7.45728794315946e-05, + "loss": 0.0108, + "step": 579770 + }, + { + "epoch": 1.5, + "learning_rate": 7.456899121522314e-05, + "loss": 0.0098, + "step": 579780 + }, + { + "epoch": 1.5, + "learning_rate": 7.456510299885168e-05, + "loss": 0.0086, + "step": 579790 + }, + { + "epoch": 1.5, + "learning_rate": 7.45612147824802e-05, + "loss": 0.0079, + "step": 579800 + }, + { + "epoch": 1.5, + "learning_rate": 7.455732656610875e-05, + "loss": 0.0088, + "step": 579810 + }, + { + "epoch": 1.5, + "learning_rate": 7.455343834973728e-05, + "loss": 0.0101, + "step": 579820 + }, + { + "epoch": 1.5, + "learning_rate": 7.454955013336582e-05, + "loss": 0.0095, + "step": 579830 + }, + { + "epoch": 1.5, + "learning_rate": 7.454566191699435e-05, + "loss": 0.0106, + "step": 579840 + }, + { + "epoch": 1.5, + "learning_rate": 7.454177370062289e-05, + "loss": 0.0086, + "step": 579850 + }, + { + "epoch": 1.5, + "learning_rate": 7.453788548425143e-05, + "loss": 0.0087, + "step": 579860 + }, + { + "epoch": 1.5, + "learning_rate": 7.453399726787996e-05, + "loss": 0.0099, + "step": 579870 + }, + { + "epoch": 1.5, + "learning_rate": 7.45301090515085e-05, + "loss": 0.0082, + "step": 579880 + }, + { + "epoch": 1.5, + "learning_rate": 7.452622083513703e-05, + "loss": 0.0096, + "step": 579890 + }, + { + "epoch": 1.5, + "learning_rate": 7.452233261876557e-05, + "loss": 0.0077, + "step": 579900 + }, + { + "epoch": 1.5, + "learning_rate": 7.45184444023941e-05, + "loss": 0.0092, + "step": 579910 + }, + { + "epoch": 1.5, + "learning_rate": 7.451455618602264e-05, + "loss": 0.0078, + "step": 579920 + }, + { + "epoch": 1.5, + "learning_rate": 7.451066796965117e-05, + "loss": 0.0096, + "step": 579930 + }, + { + "epoch": 1.5, + "learning_rate": 7.450677975327971e-05, + "loss": 0.0094, + "step": 579940 + }, + { + "epoch": 1.5, + "learning_rate": 7.450289153690824e-05, + "loss": 0.0129, + "step": 579950 + }, + { + "epoch": 1.5, + "learning_rate": 7.449900332053678e-05, + "loss": 0.0084, + "step": 579960 + }, + { + "epoch": 1.5, + "learning_rate": 7.44951151041653e-05, + "loss": 0.0095, + "step": 579970 + }, + { + "epoch": 1.5, + "learning_rate": 7.449122688779385e-05, + "loss": 0.0089, + "step": 579980 + }, + { + "epoch": 1.5, + "learning_rate": 7.448733867142237e-05, + "loss": 0.0093, + "step": 579990 + }, + { + "epoch": 1.5, + "learning_rate": 7.448345045505092e-05, + "loss": 0.0111, + "step": 580000 + }, + { + "epoch": 1.5, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.006042073480784893, + "eval_runtime": 107.9383, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 580000 + }, + { + "epoch": 1.5, + "learning_rate": 7.447956223867944e-05, + "loss": 0.0091, + "step": 580010 + }, + { + "epoch": 1.5, + "learning_rate": 7.447567402230799e-05, + "loss": 0.0067, + "step": 580020 + }, + { + "epoch": 1.5, + "learning_rate": 7.447178580593651e-05, + "loss": 0.0122, + "step": 580030 + }, + { + "epoch": 1.5, + "learning_rate": 7.446789758956506e-05, + "loss": 0.0111, + "step": 580040 + }, + { + "epoch": 1.5, + "learning_rate": 7.44640093731936e-05, + "loss": 0.0079, + "step": 580050 + }, + { + "epoch": 1.5, + "learning_rate": 7.446012115682213e-05, + "loss": 0.0108, + "step": 580060 + }, + { + "epoch": 1.5, + "learning_rate": 7.445623294045067e-05, + "loss": 0.0101, + "step": 580070 + }, + { + "epoch": 1.5, + "learning_rate": 7.44523447240792e-05, + "loss": 0.0072, + "step": 580080 + }, + { + "epoch": 1.5, + "learning_rate": 7.444845650770774e-05, + "loss": 0.0108, + "step": 580090 + }, + { + "epoch": 1.5, + "learning_rate": 7.444456829133627e-05, + "loss": 0.0085, + "step": 580100 + }, + { + "epoch": 1.5, + "learning_rate": 7.444068007496481e-05, + "loss": 0.0094, + "step": 580110 + }, + { + "epoch": 1.5, + "learning_rate": 7.443679185859335e-05, + "loss": 0.0098, + "step": 580120 + }, + { + "epoch": 1.5, + "learning_rate": 7.443290364222188e-05, + "loss": 0.0118, + "step": 580130 + }, + { + "epoch": 1.5, + "learning_rate": 7.442901542585042e-05, + "loss": 0.0103, + "step": 580140 + }, + { + "epoch": 1.5, + "learning_rate": 7.442512720947895e-05, + "loss": 0.0059, + "step": 580150 + }, + { + "epoch": 1.5, + "learning_rate": 7.442123899310749e-05, + "loss": 0.0095, + "step": 580160 + }, + { + "epoch": 1.5, + "learning_rate": 7.441735077673602e-05, + "loss": 0.0103, + "step": 580170 + }, + { + "epoch": 1.5, + "learning_rate": 7.441346256036456e-05, + "loss": 0.009, + "step": 580180 + }, + { + "epoch": 1.5, + "learning_rate": 7.440957434399309e-05, + "loss": 0.0072, + "step": 580190 + }, + { + "epoch": 1.5, + "learning_rate": 7.440568612762161e-05, + "loss": 0.0067, + "step": 580200 + }, + { + "epoch": 1.5, + "learning_rate": 7.440179791125016e-05, + "loss": 0.0069, + "step": 580210 + }, + { + "epoch": 1.5, + "learning_rate": 7.43979096948787e-05, + "loss": 0.0085, + "step": 580220 + }, + { + "epoch": 1.5, + "learning_rate": 7.439402147850723e-05, + "loss": 0.0114, + "step": 580230 + }, + { + "epoch": 1.5, + "learning_rate": 7.439013326213577e-05, + "loss": 0.0084, + "step": 580240 + }, + { + "epoch": 1.5, + "learning_rate": 7.43862450457643e-05, + "loss": 0.0084, + "step": 580250 + }, + { + "epoch": 1.5, + "learning_rate": 7.438235682939284e-05, + "loss": 0.011, + "step": 580260 + }, + { + "epoch": 1.5, + "learning_rate": 7.437846861302136e-05, + "loss": 0.0135, + "step": 580270 + }, + { + "epoch": 1.5, + "learning_rate": 7.43745803966499e-05, + "loss": 0.0093, + "step": 580280 + }, + { + "epoch": 1.5, + "learning_rate": 7.437069218027843e-05, + "loss": 0.0082, + "step": 580290 + }, + { + "epoch": 1.5, + "learning_rate": 7.436680396390698e-05, + "loss": 0.0083, + "step": 580300 + }, + { + "epoch": 1.5, + "learning_rate": 7.436291574753552e-05, + "loss": 0.009, + "step": 580310 + }, + { + "epoch": 1.5, + "learning_rate": 7.435902753116405e-05, + "loss": 0.0115, + "step": 580320 + }, + { + "epoch": 1.5, + "learning_rate": 7.435513931479259e-05, + "loss": 0.0088, + "step": 580330 + }, + { + "epoch": 1.5, + "learning_rate": 7.435125109842112e-05, + "loss": 0.0093, + "step": 580340 + }, + { + "epoch": 1.5, + "learning_rate": 7.434736288204966e-05, + "loss": 0.0084, + "step": 580350 + }, + { + "epoch": 1.5, + "learning_rate": 7.434347466567819e-05, + "loss": 0.0124, + "step": 580360 + }, + { + "epoch": 1.5, + "learning_rate": 7.433958644930673e-05, + "loss": 0.0078, + "step": 580370 + }, + { + "epoch": 1.5, + "learning_rate": 7.433569823293527e-05, + "loss": 0.0063, + "step": 580380 + }, + { + "epoch": 1.5, + "learning_rate": 7.43318100165638e-05, + "loss": 0.0073, + "step": 580390 + }, + { + "epoch": 1.5, + "learning_rate": 7.432792180019234e-05, + "loss": 0.0091, + "step": 580400 + }, + { + "epoch": 1.5, + "learning_rate": 7.432403358382087e-05, + "loss": 0.0141, + "step": 580410 + }, + { + "epoch": 1.5, + "learning_rate": 7.432014536744941e-05, + "loss": 0.0065, + "step": 580420 + }, + { + "epoch": 1.5, + "learning_rate": 7.431625715107794e-05, + "loss": 0.0084, + "step": 580430 + }, + { + "epoch": 1.5, + "learning_rate": 7.431236893470648e-05, + "loss": 0.0106, + "step": 580440 + }, + { + "epoch": 1.5, + "learning_rate": 7.4308480718335e-05, + "loss": 0.0084, + "step": 580450 + }, + { + "epoch": 1.5, + "learning_rate": 7.430459250196353e-05, + "loss": 0.0089, + "step": 580460 + }, + { + "epoch": 1.5, + "learning_rate": 7.430070428559208e-05, + "loss": 0.0065, + "step": 580470 + }, + { + "epoch": 1.5, + "learning_rate": 7.429681606922062e-05, + "loss": 0.0083, + "step": 580480 + }, + { + "epoch": 1.5, + "learning_rate": 7.429292785284915e-05, + "loss": 0.0095, + "step": 580490 + }, + { + "epoch": 1.5, + "learning_rate": 7.428903963647769e-05, + "loss": 0.007, + "step": 580500 + }, + { + "epoch": 1.5, + "learning_rate": 7.428515142010621e-05, + "loss": 0.012, + "step": 580510 + }, + { + "epoch": 1.5, + "learning_rate": 7.428126320373476e-05, + "loss": 0.0097, + "step": 580520 + }, + { + "epoch": 1.5, + "learning_rate": 7.427737498736328e-05, + "loss": 0.0121, + "step": 580530 + }, + { + "epoch": 1.5, + "learning_rate": 7.427348677099183e-05, + "loss": 0.0061, + "step": 580540 + }, + { + "epoch": 1.5, + "learning_rate": 7.426959855462035e-05, + "loss": 0.0087, + "step": 580550 + }, + { + "epoch": 1.5, + "learning_rate": 7.42657103382489e-05, + "loss": 0.0079, + "step": 580560 + }, + { + "epoch": 1.5, + "learning_rate": 7.426182212187744e-05, + "loss": 0.0084, + "step": 580570 + }, + { + "epoch": 1.5, + "learning_rate": 7.425793390550597e-05, + "loss": 0.0093, + "step": 580580 + }, + { + "epoch": 1.5, + "learning_rate": 7.425404568913451e-05, + "loss": 0.0064, + "step": 580590 + }, + { + "epoch": 1.5, + "learning_rate": 7.425015747276304e-05, + "loss": 0.0079, + "step": 580600 + }, + { + "epoch": 1.51, + "learning_rate": 7.424626925639158e-05, + "loss": 0.0112, + "step": 580610 + }, + { + "epoch": 1.51, + "learning_rate": 7.42423810400201e-05, + "loss": 0.0089, + "step": 580620 + }, + { + "epoch": 1.51, + "learning_rate": 7.423849282364865e-05, + "loss": 0.007, + "step": 580630 + }, + { + "epoch": 1.51, + "learning_rate": 7.423460460727719e-05, + "loss": 0.0126, + "step": 580640 + }, + { + "epoch": 1.51, + "learning_rate": 7.423071639090572e-05, + "loss": 0.0095, + "step": 580650 + }, + { + "epoch": 1.51, + "learning_rate": 7.422682817453426e-05, + "loss": 0.0099, + "step": 580660 + }, + { + "epoch": 1.51, + "learning_rate": 7.422293995816279e-05, + "loss": 0.009, + "step": 580670 + }, + { + "epoch": 1.51, + "learning_rate": 7.421905174179133e-05, + "loss": 0.0124, + "step": 580680 + }, + { + "epoch": 1.51, + "learning_rate": 7.421516352541986e-05, + "loss": 0.0077, + "step": 580690 + }, + { + "epoch": 1.51, + "learning_rate": 7.421127530904838e-05, + "loss": 0.0082, + "step": 580700 + }, + { + "epoch": 1.51, + "learning_rate": 7.420738709267693e-05, + "loss": 0.009, + "step": 580710 + }, + { + "epoch": 1.51, + "learning_rate": 7.420349887630545e-05, + "loss": 0.0066, + "step": 580720 + }, + { + "epoch": 1.51, + "learning_rate": 7.4199610659934e-05, + "loss": 0.0089, + "step": 580730 + }, + { + "epoch": 1.51, + "learning_rate": 7.419572244356254e-05, + "loss": 0.0088, + "step": 580740 + }, + { + "epoch": 1.51, + "learning_rate": 7.419183422719107e-05, + "loss": 0.0072, + "step": 580750 + }, + { + "epoch": 1.51, + "learning_rate": 7.41879460108196e-05, + "loss": 0.0067, + "step": 580760 + }, + { + "epoch": 1.51, + "learning_rate": 7.418405779444813e-05, + "loss": 0.016, + "step": 580770 + }, + { + "epoch": 1.51, + "learning_rate": 7.418016957807668e-05, + "loss": 0.0096, + "step": 580780 + }, + { + "epoch": 1.51, + "learning_rate": 7.41762813617052e-05, + "loss": 0.0072, + "step": 580790 + }, + { + "epoch": 1.51, + "learning_rate": 7.417239314533375e-05, + "loss": 0.0068, + "step": 580800 + }, + { + "epoch": 1.51, + "learning_rate": 7.416850492896227e-05, + "loss": 0.009, + "step": 580810 + }, + { + "epoch": 1.51, + "learning_rate": 7.416461671259082e-05, + "loss": 0.0072, + "step": 580820 + }, + { + "epoch": 1.51, + "learning_rate": 7.416072849621936e-05, + "loss": 0.007, + "step": 580830 + }, + { + "epoch": 1.51, + "learning_rate": 7.415684027984789e-05, + "loss": 0.0064, + "step": 580840 + }, + { + "epoch": 1.51, + "learning_rate": 7.415295206347643e-05, + "loss": 0.0076, + "step": 580850 + }, + { + "epoch": 1.51, + "learning_rate": 7.414906384710496e-05, + "loss": 0.0074, + "step": 580860 + }, + { + "epoch": 1.51, + "learning_rate": 7.41451756307335e-05, + "loss": 0.0077, + "step": 580870 + }, + { + "epoch": 1.51, + "learning_rate": 7.414128741436202e-05, + "loss": 0.008, + "step": 580880 + }, + { + "epoch": 1.51, + "learning_rate": 7.413739919799057e-05, + "loss": 0.0118, + "step": 580890 + }, + { + "epoch": 1.51, + "learning_rate": 7.41335109816191e-05, + "loss": 0.0074, + "step": 580900 + }, + { + "epoch": 1.51, + "learning_rate": 7.412962276524764e-05, + "loss": 0.0087, + "step": 580910 + }, + { + "epoch": 1.51, + "learning_rate": 7.412573454887618e-05, + "loss": 0.0089, + "step": 580920 + }, + { + "epoch": 1.51, + "learning_rate": 7.41218463325047e-05, + "loss": 0.0067, + "step": 580930 + }, + { + "epoch": 1.51, + "learning_rate": 7.411795811613325e-05, + "loss": 0.0078, + "step": 580940 + }, + { + "epoch": 1.51, + "learning_rate": 7.411406989976178e-05, + "loss": 0.012, + "step": 580950 + }, + { + "epoch": 1.51, + "learning_rate": 7.41101816833903e-05, + "loss": 0.0102, + "step": 580960 + }, + { + "epoch": 1.51, + "learning_rate": 7.410629346701885e-05, + "loss": 0.0107, + "step": 580970 + }, + { + "epoch": 1.51, + "learning_rate": 7.410240525064737e-05, + "loss": 0.0096, + "step": 580980 + }, + { + "epoch": 1.51, + "learning_rate": 7.409851703427592e-05, + "loss": 0.0086, + "step": 580990 + }, + { + "epoch": 1.51, + "learning_rate": 7.409462881790444e-05, + "loss": 0.0095, + "step": 581000 + }, + { + "epoch": 1.51, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.006130463909357786, + "eval_runtime": 107.9133, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 581000 + }, + { + "epoch": 1.51, + "learning_rate": 7.409074060153298e-05, + "loss": 0.0092, + "step": 581010 + }, + { + "epoch": 1.51, + "learning_rate": 7.408685238516153e-05, + "loss": 0.0081, + "step": 581020 + }, + { + "epoch": 1.51, + "learning_rate": 7.408296416879005e-05, + "loss": 0.0084, + "step": 581030 + }, + { + "epoch": 1.51, + "learning_rate": 7.40790759524186e-05, + "loss": 0.0077, + "step": 581040 + }, + { + "epoch": 1.51, + "learning_rate": 7.407518773604712e-05, + "loss": 0.0099, + "step": 581050 + }, + { + "epoch": 1.51, + "learning_rate": 7.407129951967567e-05, + "loss": 0.0105, + "step": 581060 + }, + { + "epoch": 1.51, + "learning_rate": 7.40674113033042e-05, + "loss": 0.0101, + "step": 581070 + }, + { + "epoch": 1.51, + "learning_rate": 7.406352308693274e-05, + "loss": 0.0085, + "step": 581080 + }, + { + "epoch": 1.51, + "learning_rate": 7.405963487056128e-05, + "loss": 0.007, + "step": 581090 + }, + { + "epoch": 1.51, + "learning_rate": 7.40557466541898e-05, + "loss": 0.0099, + "step": 581100 + }, + { + "epoch": 1.51, + "learning_rate": 7.405185843781835e-05, + "loss": 0.0115, + "step": 581110 + }, + { + "epoch": 1.51, + "learning_rate": 7.404797022144688e-05, + "loss": 0.0129, + "step": 581120 + }, + { + "epoch": 1.51, + "learning_rate": 7.404408200507542e-05, + "loss": 0.01, + "step": 581130 + }, + { + "epoch": 1.51, + "learning_rate": 7.404019378870394e-05, + "loss": 0.0075, + "step": 581140 + }, + { + "epoch": 1.51, + "learning_rate": 7.403630557233249e-05, + "loss": 0.0096, + "step": 581150 + }, + { + "epoch": 1.51, + "learning_rate": 7.403241735596101e-05, + "loss": 0.0088, + "step": 581160 + }, + { + "epoch": 1.51, + "learning_rate": 7.402852913958956e-05, + "loss": 0.0075, + "step": 581170 + }, + { + "epoch": 1.51, + "learning_rate": 7.40246409232181e-05, + "loss": 0.0079, + "step": 581180 + }, + { + "epoch": 1.51, + "learning_rate": 7.402075270684663e-05, + "loss": 0.0056, + "step": 581190 + }, + { + "epoch": 1.51, + "learning_rate": 7.401686449047515e-05, + "loss": 0.0067, + "step": 581200 + }, + { + "epoch": 1.51, + "learning_rate": 7.40129762741037e-05, + "loss": 0.0081, + "step": 581210 + }, + { + "epoch": 1.51, + "learning_rate": 7.400908805773222e-05, + "loss": 0.0089, + "step": 581220 + }, + { + "epoch": 1.51, + "learning_rate": 7.400519984136077e-05, + "loss": 0.008, + "step": 581230 + }, + { + "epoch": 1.51, + "learning_rate": 7.40013116249893e-05, + "loss": 0.0093, + "step": 581240 + }, + { + "epoch": 1.51, + "learning_rate": 7.399742340861784e-05, + "loss": 0.0111, + "step": 581250 + }, + { + "epoch": 1.51, + "learning_rate": 7.399353519224636e-05, + "loss": 0.0082, + "step": 581260 + }, + { + "epoch": 1.51, + "learning_rate": 7.39896469758749e-05, + "loss": 0.011, + "step": 581270 + }, + { + "epoch": 1.51, + "learning_rate": 7.398575875950345e-05, + "loss": 0.0084, + "step": 581280 + }, + { + "epoch": 1.51, + "learning_rate": 7.398187054313197e-05, + "loss": 0.0079, + "step": 581290 + }, + { + "epoch": 1.51, + "learning_rate": 7.397798232676052e-05, + "loss": 0.0071, + "step": 581300 + }, + { + "epoch": 1.51, + "learning_rate": 7.397409411038904e-05, + "loss": 0.008, + "step": 581310 + }, + { + "epoch": 1.51, + "learning_rate": 7.397020589401759e-05, + "loss": 0.0105, + "step": 581320 + }, + { + "epoch": 1.51, + "learning_rate": 7.396631767764611e-05, + "loss": 0.0103, + "step": 581330 + }, + { + "epoch": 1.51, + "learning_rate": 7.396242946127466e-05, + "loss": 0.0086, + "step": 581340 + }, + { + "epoch": 1.51, + "learning_rate": 7.39585412449032e-05, + "loss": 0.013, + "step": 581350 + }, + { + "epoch": 1.51, + "learning_rate": 7.395465302853173e-05, + "loss": 0.0053, + "step": 581360 + }, + { + "epoch": 1.51, + "learning_rate": 7.395076481216027e-05, + "loss": 0.01, + "step": 581370 + }, + { + "epoch": 1.51, + "learning_rate": 7.39468765957888e-05, + "loss": 0.0086, + "step": 581380 + }, + { + "epoch": 1.51, + "learning_rate": 7.394298837941734e-05, + "loss": 0.0096, + "step": 581390 + }, + { + "epoch": 1.51, + "learning_rate": 7.393910016304586e-05, + "loss": 0.0101, + "step": 581400 + }, + { + "epoch": 1.51, + "learning_rate": 7.39352119466744e-05, + "loss": 0.0098, + "step": 581410 + }, + { + "epoch": 1.51, + "learning_rate": 7.393132373030293e-05, + "loss": 0.009, + "step": 581420 + }, + { + "epoch": 1.51, + "learning_rate": 7.392743551393148e-05, + "loss": 0.0098, + "step": 581430 + }, + { + "epoch": 1.51, + "learning_rate": 7.392354729756e-05, + "loss": 0.0072, + "step": 581440 + }, + { + "epoch": 1.51, + "learning_rate": 7.391965908118855e-05, + "loss": 0.0113, + "step": 581450 + }, + { + "epoch": 1.51, + "learning_rate": 7.391577086481707e-05, + "loss": 0.0097, + "step": 581460 + }, + { + "epoch": 1.51, + "learning_rate": 7.391188264844562e-05, + "loss": 0.0079, + "step": 581470 + }, + { + "epoch": 1.51, + "learning_rate": 7.390799443207414e-05, + "loss": 0.0105, + "step": 581480 + }, + { + "epoch": 1.51, + "learning_rate": 7.390410621570269e-05, + "loss": 0.0078, + "step": 581490 + }, + { + "epoch": 1.51, + "learning_rate": 7.390021799933121e-05, + "loss": 0.0101, + "step": 581500 + }, + { + "epoch": 1.51, + "learning_rate": 7.389632978295976e-05, + "loss": 0.0097, + "step": 581510 + }, + { + "epoch": 1.51, + "learning_rate": 7.389244156658828e-05, + "loss": 0.0103, + "step": 581520 + }, + { + "epoch": 1.51, + "learning_rate": 7.388855335021682e-05, + "loss": 0.0088, + "step": 581530 + }, + { + "epoch": 1.51, + "learning_rate": 7.388466513384537e-05, + "loss": 0.0114, + "step": 581540 + }, + { + "epoch": 1.51, + "learning_rate": 7.38807769174739e-05, + "loss": 0.0116, + "step": 581550 + }, + { + "epoch": 1.51, + "learning_rate": 7.387688870110244e-05, + "loss": 0.0072, + "step": 581560 + }, + { + "epoch": 1.51, + "learning_rate": 7.387300048473096e-05, + "loss": 0.0072, + "step": 581570 + }, + { + "epoch": 1.51, + "learning_rate": 7.38691122683595e-05, + "loss": 0.0083, + "step": 581580 + }, + { + "epoch": 1.51, + "learning_rate": 7.386522405198803e-05, + "loss": 0.0087, + "step": 581590 + }, + { + "epoch": 1.51, + "learning_rate": 7.386133583561658e-05, + "loss": 0.0081, + "step": 581600 + }, + { + "epoch": 1.51, + "learning_rate": 7.385744761924512e-05, + "loss": 0.0075, + "step": 581610 + }, + { + "epoch": 1.51, + "learning_rate": 7.385355940287365e-05, + "loss": 0.0087, + "step": 581620 + }, + { + "epoch": 1.51, + "learning_rate": 7.384967118650219e-05, + "loss": 0.0077, + "step": 581630 + }, + { + "epoch": 1.51, + "learning_rate": 7.384578297013072e-05, + "loss": 0.0077, + "step": 581640 + }, + { + "epoch": 1.51, + "learning_rate": 7.384189475375926e-05, + "loss": 0.0125, + "step": 581650 + }, + { + "epoch": 1.51, + "learning_rate": 7.383800653738778e-05, + "loss": 0.009, + "step": 581660 + }, + { + "epoch": 1.51, + "learning_rate": 7.383411832101633e-05, + "loss": 0.0082, + "step": 581670 + }, + { + "epoch": 1.51, + "learning_rate": 7.383023010464485e-05, + "loss": 0.0092, + "step": 581680 + }, + { + "epoch": 1.51, + "learning_rate": 7.382634188827338e-05, + "loss": 0.0087, + "step": 581690 + }, + { + "epoch": 1.51, + "learning_rate": 7.382245367190192e-05, + "loss": 0.0087, + "step": 581700 + }, + { + "epoch": 1.51, + "learning_rate": 7.381856545553047e-05, + "loss": 0.0099, + "step": 581710 + }, + { + "epoch": 1.51, + "learning_rate": 7.3814677239159e-05, + "loss": 0.0077, + "step": 581720 + }, + { + "epoch": 1.51, + "learning_rate": 7.381078902278754e-05, + "loss": 0.0096, + "step": 581730 + }, + { + "epoch": 1.51, + "learning_rate": 7.380690080641606e-05, + "loss": 0.0149, + "step": 581740 + }, + { + "epoch": 1.51, + "learning_rate": 7.38030125900446e-05, + "loss": 0.0088, + "step": 581750 + }, + { + "epoch": 1.51, + "learning_rate": 7.379912437367313e-05, + "loss": 0.0083, + "step": 581760 + }, + { + "epoch": 1.51, + "learning_rate": 7.379523615730168e-05, + "loss": 0.0085, + "step": 581770 + }, + { + "epoch": 1.51, + "learning_rate": 7.37913479409302e-05, + "loss": 0.0088, + "step": 581780 + }, + { + "epoch": 1.51, + "learning_rate": 7.378745972455874e-05, + "loss": 0.0077, + "step": 581790 + }, + { + "epoch": 1.51, + "learning_rate": 7.378357150818729e-05, + "loss": 0.0076, + "step": 581800 + }, + { + "epoch": 1.51, + "learning_rate": 7.377968329181581e-05, + "loss": 0.0089, + "step": 581810 + }, + { + "epoch": 1.51, + "learning_rate": 7.377579507544436e-05, + "loss": 0.01, + "step": 581820 + }, + { + "epoch": 1.51, + "learning_rate": 7.377190685907288e-05, + "loss": 0.0105, + "step": 581830 + }, + { + "epoch": 1.51, + "learning_rate": 7.376801864270143e-05, + "loss": 0.009, + "step": 581840 + }, + { + "epoch": 1.51, + "learning_rate": 7.376413042632995e-05, + "loss": 0.0093, + "step": 581850 + }, + { + "epoch": 1.51, + "learning_rate": 7.37602422099585e-05, + "loss": 0.0082, + "step": 581860 + }, + { + "epoch": 1.51, + "learning_rate": 7.375635399358704e-05, + "loss": 0.0081, + "step": 581870 + }, + { + "epoch": 1.51, + "learning_rate": 7.375246577721557e-05, + "loss": 0.0127, + "step": 581880 + }, + { + "epoch": 1.51, + "learning_rate": 7.374857756084411e-05, + "loss": 0.0079, + "step": 581890 + }, + { + "epoch": 1.51, + "learning_rate": 7.374468934447264e-05, + "loss": 0.0075, + "step": 581900 + }, + { + "epoch": 1.51, + "learning_rate": 7.374080112810118e-05, + "loss": 0.0081, + "step": 581910 + }, + { + "epoch": 1.51, + "learning_rate": 7.37369129117297e-05, + "loss": 0.0109, + "step": 581920 + }, + { + "epoch": 1.51, + "learning_rate": 7.373302469535825e-05, + "loss": 0.0111, + "step": 581930 + }, + { + "epoch": 1.51, + "learning_rate": 7.372913647898677e-05, + "loss": 0.0075, + "step": 581940 + }, + { + "epoch": 1.51, + "learning_rate": 7.37252482626153e-05, + "loss": 0.0059, + "step": 581950 + }, + { + "epoch": 1.51, + "learning_rate": 7.372136004624384e-05, + "loss": 0.0086, + "step": 581960 + }, + { + "epoch": 1.51, + "learning_rate": 7.371747182987239e-05, + "loss": 0.0079, + "step": 581970 + }, + { + "epoch": 1.51, + "learning_rate": 7.371358361350091e-05, + "loss": 0.0095, + "step": 581980 + }, + { + "epoch": 1.51, + "learning_rate": 7.370969539712946e-05, + "loss": 0.0096, + "step": 581990 + }, + { + "epoch": 1.51, + "learning_rate": 7.370580718075798e-05, + "loss": 0.0091, + "step": 582000 + }, + { + "epoch": 1.51, + "eval_cer": 0.8816984874123652, + "eval_loss": 0.005966072902083397, + "eval_runtime": 107.7983, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 582000 + }, + { + "epoch": 1.51, + "learning_rate": 7.370191896438653e-05, + "loss": 0.0067, + "step": 582010 + }, + { + "epoch": 1.51, + "learning_rate": 7.369803074801505e-05, + "loss": 0.0095, + "step": 582020 + }, + { + "epoch": 1.51, + "learning_rate": 7.36941425316436e-05, + "loss": 0.0106, + "step": 582030 + }, + { + "epoch": 1.51, + "learning_rate": 7.369025431527212e-05, + "loss": 0.0067, + "step": 582040 + }, + { + "epoch": 1.51, + "learning_rate": 7.368636609890066e-05, + "loss": 0.0088, + "step": 582050 + }, + { + "epoch": 1.51, + "learning_rate": 7.36824778825292e-05, + "loss": 0.0091, + "step": 582060 + }, + { + "epoch": 1.51, + "learning_rate": 7.367858966615773e-05, + "loss": 0.007, + "step": 582070 + }, + { + "epoch": 1.51, + "learning_rate": 7.367470144978628e-05, + "loss": 0.0081, + "step": 582080 + }, + { + "epoch": 1.51, + "learning_rate": 7.36708132334148e-05, + "loss": 0.009, + "step": 582090 + }, + { + "epoch": 1.51, + "learning_rate": 7.366692501704335e-05, + "loss": 0.0081, + "step": 582100 + }, + { + "epoch": 1.51, + "learning_rate": 7.366303680067187e-05, + "loss": 0.0117, + "step": 582110 + }, + { + "epoch": 1.51, + "learning_rate": 7.365914858430042e-05, + "loss": 0.0154, + "step": 582120 + }, + { + "epoch": 1.51, + "learning_rate": 7.365526036792896e-05, + "loss": 0.0077, + "step": 582130 + }, + { + "epoch": 1.51, + "learning_rate": 7.365137215155749e-05, + "loss": 0.0125, + "step": 582140 + }, + { + "epoch": 1.51, + "learning_rate": 7.364748393518603e-05, + "loss": 0.0095, + "step": 582150 + }, + { + "epoch": 1.51, + "learning_rate": 7.364359571881456e-05, + "loss": 0.0084, + "step": 582160 + }, + { + "epoch": 1.51, + "learning_rate": 7.36397075024431e-05, + "loss": 0.0114, + "step": 582170 + }, + { + "epoch": 1.51, + "learning_rate": 7.363581928607162e-05, + "loss": 0.0091, + "step": 582180 + }, + { + "epoch": 1.51, + "learning_rate": 7.363193106970015e-05, + "loss": 0.0094, + "step": 582190 + }, + { + "epoch": 1.51, + "learning_rate": 7.36280428533287e-05, + "loss": 0.0084, + "step": 582200 + }, + { + "epoch": 1.51, + "learning_rate": 7.362415463695722e-05, + "loss": 0.0077, + "step": 582210 + }, + { + "epoch": 1.51, + "learning_rate": 7.362026642058576e-05, + "loss": 0.0115, + "step": 582220 + }, + { + "epoch": 1.51, + "learning_rate": 7.36163782042143e-05, + "loss": 0.0077, + "step": 582230 + }, + { + "epoch": 1.51, + "learning_rate": 7.361248998784283e-05, + "loss": 0.0084, + "step": 582240 + }, + { + "epoch": 1.51, + "learning_rate": 7.360860177147138e-05, + "loss": 0.0096, + "step": 582250 + }, + { + "epoch": 1.51, + "learning_rate": 7.36047135550999e-05, + "loss": 0.0094, + "step": 582260 + }, + { + "epoch": 1.51, + "learning_rate": 7.360082533872845e-05, + "loss": 0.0094, + "step": 582270 + }, + { + "epoch": 1.51, + "learning_rate": 7.359693712235697e-05, + "loss": 0.0102, + "step": 582280 + }, + { + "epoch": 1.51, + "learning_rate": 7.359304890598552e-05, + "loss": 0.009, + "step": 582290 + }, + { + "epoch": 1.51, + "learning_rate": 7.358916068961404e-05, + "loss": 0.0085, + "step": 582300 + }, + { + "epoch": 1.51, + "learning_rate": 7.358527247324258e-05, + "loss": 0.0082, + "step": 582310 + }, + { + "epoch": 1.51, + "learning_rate": 7.358138425687113e-05, + "loss": 0.0071, + "step": 582320 + }, + { + "epoch": 1.51, + "learning_rate": 7.357749604049965e-05, + "loss": 0.0092, + "step": 582330 + }, + { + "epoch": 1.51, + "learning_rate": 7.35736078241282e-05, + "loss": 0.008, + "step": 582340 + }, + { + "epoch": 1.51, + "learning_rate": 7.356971960775672e-05, + "loss": 0.0087, + "step": 582350 + }, + { + "epoch": 1.51, + "learning_rate": 7.356583139138527e-05, + "loss": 0.0098, + "step": 582360 + }, + { + "epoch": 1.51, + "learning_rate": 7.35619431750138e-05, + "loss": 0.014, + "step": 582370 + }, + { + "epoch": 1.51, + "learning_rate": 7.355805495864234e-05, + "loss": 0.0084, + "step": 582380 + }, + { + "epoch": 1.51, + "learning_rate": 7.355416674227086e-05, + "loss": 0.0109, + "step": 582390 + }, + { + "epoch": 1.51, + "learning_rate": 7.35502785258994e-05, + "loss": 0.0088, + "step": 582400 + }, + { + "epoch": 1.51, + "learning_rate": 7.354639030952795e-05, + "loss": 0.0062, + "step": 582410 + }, + { + "epoch": 1.51, + "learning_rate": 7.354250209315647e-05, + "loss": 0.0123, + "step": 582420 + }, + { + "epoch": 1.51, + "learning_rate": 7.353861387678502e-05, + "loss": 0.0072, + "step": 582430 + }, + { + "epoch": 1.51, + "learning_rate": 7.353472566041354e-05, + "loss": 0.0082, + "step": 582440 + }, + { + "epoch": 1.51, + "learning_rate": 7.353083744404207e-05, + "loss": 0.0096, + "step": 582450 + }, + { + "epoch": 1.51, + "learning_rate": 7.352694922767061e-05, + "loss": 0.0072, + "step": 582460 + }, + { + "epoch": 1.51, + "learning_rate": 7.352306101129914e-05, + "loss": 0.0103, + "step": 582470 + }, + { + "epoch": 1.51, + "learning_rate": 7.351917279492768e-05, + "loss": 0.0074, + "step": 582480 + }, + { + "epoch": 1.51, + "learning_rate": 7.351528457855621e-05, + "loss": 0.0107, + "step": 582490 + }, + { + "epoch": 1.51, + "learning_rate": 7.351139636218475e-05, + "loss": 0.0102, + "step": 582500 + }, + { + "epoch": 1.51, + "learning_rate": 7.35075081458133e-05, + "loss": 0.0119, + "step": 582510 + }, + { + "epoch": 1.51, + "learning_rate": 7.350361992944182e-05, + "loss": 0.0106, + "step": 582520 + }, + { + "epoch": 1.51, + "learning_rate": 7.349973171307037e-05, + "loss": 0.0122, + "step": 582530 + }, + { + "epoch": 1.51, + "learning_rate": 7.34958434966989e-05, + "loss": 0.0079, + "step": 582540 + }, + { + "epoch": 1.51, + "learning_rate": 7.349195528032743e-05, + "loss": 0.0105, + "step": 582550 + }, + { + "epoch": 1.51, + "learning_rate": 7.348806706395596e-05, + "loss": 0.0077, + "step": 582560 + }, + { + "epoch": 1.51, + "learning_rate": 7.34841788475845e-05, + "loss": 0.0088, + "step": 582570 + }, + { + "epoch": 1.51, + "learning_rate": 7.348029063121305e-05, + "loss": 0.0125, + "step": 582580 + }, + { + "epoch": 1.51, + "learning_rate": 7.347640241484157e-05, + "loss": 0.0098, + "step": 582590 + }, + { + "epoch": 1.51, + "learning_rate": 7.347251419847012e-05, + "loss": 0.009, + "step": 582600 + }, + { + "epoch": 1.51, + "learning_rate": 7.346862598209864e-05, + "loss": 0.0103, + "step": 582610 + }, + { + "epoch": 1.51, + "learning_rate": 7.346473776572719e-05, + "loss": 0.0095, + "step": 582620 + }, + { + "epoch": 1.51, + "learning_rate": 7.346084954935571e-05, + "loss": 0.0131, + "step": 582630 + }, + { + "epoch": 1.51, + "learning_rate": 7.345696133298426e-05, + "loss": 0.0091, + "step": 582640 + }, + { + "epoch": 1.51, + "learning_rate": 7.345307311661278e-05, + "loss": 0.0085, + "step": 582650 + }, + { + "epoch": 1.51, + "learning_rate": 7.344918490024133e-05, + "loss": 0.0118, + "step": 582660 + }, + { + "epoch": 1.51, + "learning_rate": 7.344529668386987e-05, + "loss": 0.0108, + "step": 582670 + }, + { + "epoch": 1.51, + "learning_rate": 7.34414084674984e-05, + "loss": 0.0072, + "step": 582680 + }, + { + "epoch": 1.51, + "learning_rate": 7.343752025112692e-05, + "loss": 0.0091, + "step": 582690 + }, + { + "epoch": 1.51, + "learning_rate": 7.343363203475546e-05, + "loss": 0.0092, + "step": 582700 + }, + { + "epoch": 1.51, + "learning_rate": 7.342974381838399e-05, + "loss": 0.0089, + "step": 582710 + }, + { + "epoch": 1.51, + "learning_rate": 7.342585560201253e-05, + "loss": 0.0125, + "step": 582720 + }, + { + "epoch": 1.51, + "learning_rate": 7.342196738564106e-05, + "loss": 0.0094, + "step": 582730 + }, + { + "epoch": 1.51, + "learning_rate": 7.34180791692696e-05, + "loss": 0.0111, + "step": 582740 + }, + { + "epoch": 1.51, + "learning_rate": 7.341419095289813e-05, + "loss": 0.0087, + "step": 582750 + }, + { + "epoch": 1.51, + "learning_rate": 7.341030273652667e-05, + "loss": 0.0098, + "step": 582760 + }, + { + "epoch": 1.51, + "learning_rate": 7.340641452015522e-05, + "loss": 0.0096, + "step": 582770 + }, + { + "epoch": 1.51, + "learning_rate": 7.340252630378374e-05, + "loss": 0.0106, + "step": 582780 + }, + { + "epoch": 1.51, + "learning_rate": 7.339863808741229e-05, + "loss": 0.0088, + "step": 582790 + }, + { + "epoch": 1.51, + "learning_rate": 7.339474987104081e-05, + "loss": 0.0092, + "step": 582800 + }, + { + "epoch": 1.51, + "learning_rate": 7.339086165466935e-05, + "loss": 0.0123, + "step": 582810 + }, + { + "epoch": 1.51, + "learning_rate": 7.338697343829788e-05, + "loss": 0.0087, + "step": 582820 + }, + { + "epoch": 1.51, + "learning_rate": 7.338308522192642e-05, + "loss": 0.0084, + "step": 582830 + }, + { + "epoch": 1.51, + "learning_rate": 7.337919700555497e-05, + "loss": 0.01, + "step": 582840 + }, + { + "epoch": 1.51, + "learning_rate": 7.33753087891835e-05, + "loss": 0.0109, + "step": 582850 + }, + { + "epoch": 1.51, + "learning_rate": 7.337142057281204e-05, + "loss": 0.0096, + "step": 582860 + }, + { + "epoch": 1.51, + "learning_rate": 7.336753235644056e-05, + "loss": 0.0089, + "step": 582870 + }, + { + "epoch": 1.51, + "learning_rate": 7.33636441400691e-05, + "loss": 0.0084, + "step": 582880 + }, + { + "epoch": 1.51, + "learning_rate": 7.335975592369763e-05, + "loss": 0.0099, + "step": 582890 + }, + { + "epoch": 1.51, + "learning_rate": 7.335586770732618e-05, + "loss": 0.0097, + "step": 582900 + }, + { + "epoch": 1.51, + "learning_rate": 7.33519794909547e-05, + "loss": 0.0125, + "step": 582910 + }, + { + "epoch": 1.51, + "learning_rate": 7.334809127458325e-05, + "loss": 0.0141, + "step": 582920 + }, + { + "epoch": 1.51, + "learning_rate": 7.334420305821177e-05, + "loss": 0.0101, + "step": 582930 + }, + { + "epoch": 1.51, + "learning_rate": 7.334031484184031e-05, + "loss": 0.0112, + "step": 582940 + }, + { + "epoch": 1.51, + "learning_rate": 7.333642662546884e-05, + "loss": 0.0087, + "step": 582950 + }, + { + "epoch": 1.51, + "learning_rate": 7.333253840909738e-05, + "loss": 0.0066, + "step": 582960 + }, + { + "epoch": 1.51, + "learning_rate": 7.332865019272591e-05, + "loss": 0.0103, + "step": 582970 + }, + { + "epoch": 1.51, + "learning_rate": 7.332476197635445e-05, + "loss": 0.0082, + "step": 582980 + }, + { + "epoch": 1.51, + "learning_rate": 7.332087375998298e-05, + "loss": 0.0098, + "step": 582990 + }, + { + "epoch": 1.51, + "learning_rate": 7.331698554361152e-05, + "loss": 0.0098, + "step": 583000 + }, + { + "epoch": 1.51, + "eval_cer": 0.8817138834186412, + "eval_loss": 0.006150657311081886, + "eval_runtime": 107.9428, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 583000 + }, + { + "epoch": 1.51, + "learning_rate": 7.331309732724005e-05, + "loss": 0.0065, + "step": 583010 + }, + { + "epoch": 1.51, + "learning_rate": 7.33092091108686e-05, + "loss": 0.008, + "step": 583020 + }, + { + "epoch": 1.51, + "learning_rate": 7.330532089449714e-05, + "loss": 0.0059, + "step": 583030 + }, + { + "epoch": 1.51, + "learning_rate": 7.330143267812566e-05, + "loss": 0.0095, + "step": 583040 + }, + { + "epoch": 1.51, + "learning_rate": 7.32975444617542e-05, + "loss": 0.0068, + "step": 583050 + }, + { + "epoch": 1.51, + "learning_rate": 7.329365624538273e-05, + "loss": 0.0082, + "step": 583060 + }, + { + "epoch": 1.51, + "learning_rate": 7.328976802901127e-05, + "loss": 0.0079, + "step": 583070 + }, + { + "epoch": 1.51, + "learning_rate": 7.32858798126398e-05, + "loss": 0.0099, + "step": 583080 + }, + { + "epoch": 1.51, + "learning_rate": 7.328199159626834e-05, + "loss": 0.007, + "step": 583090 + }, + { + "epoch": 1.51, + "learning_rate": 7.327810337989689e-05, + "loss": 0.0097, + "step": 583100 + }, + { + "epoch": 1.51, + "learning_rate": 7.327421516352541e-05, + "loss": 0.0099, + "step": 583110 + }, + { + "epoch": 1.51, + "learning_rate": 7.327032694715396e-05, + "loss": 0.0077, + "step": 583120 + }, + { + "epoch": 1.51, + "learning_rate": 7.326643873078248e-05, + "loss": 0.0092, + "step": 583130 + }, + { + "epoch": 1.51, + "learning_rate": 7.326255051441103e-05, + "loss": 0.0084, + "step": 583140 + }, + { + "epoch": 1.51, + "learning_rate": 7.325866229803955e-05, + "loss": 0.0085, + "step": 583150 + }, + { + "epoch": 1.51, + "learning_rate": 7.32547740816681e-05, + "loss": 0.0082, + "step": 583160 + }, + { + "epoch": 1.51, + "learning_rate": 7.325088586529662e-05, + "loss": 0.0101, + "step": 583170 + }, + { + "epoch": 1.51, + "learning_rate": 7.324699764892515e-05, + "loss": 0.0075, + "step": 583180 + }, + { + "epoch": 1.51, + "learning_rate": 7.324310943255369e-05, + "loss": 0.0116, + "step": 583190 + }, + { + "epoch": 1.51, + "learning_rate": 7.323922121618223e-05, + "loss": 0.009, + "step": 583200 + }, + { + "epoch": 1.51, + "learning_rate": 7.323533299981076e-05, + "loss": 0.0056, + "step": 583210 + }, + { + "epoch": 1.51, + "learning_rate": 7.32314447834393e-05, + "loss": 0.0114, + "step": 583220 + }, + { + "epoch": 1.51, + "learning_rate": 7.322755656706783e-05, + "loss": 0.0083, + "step": 583230 + }, + { + "epoch": 1.51, + "learning_rate": 7.322366835069637e-05, + "loss": 0.0115, + "step": 583240 + }, + { + "epoch": 1.51, + "learning_rate": 7.32197801343249e-05, + "loss": 0.0096, + "step": 583250 + }, + { + "epoch": 1.51, + "learning_rate": 7.321589191795344e-05, + "loss": 0.008, + "step": 583260 + }, + { + "epoch": 1.51, + "learning_rate": 7.321200370158197e-05, + "loss": 0.0084, + "step": 583270 + }, + { + "epoch": 1.51, + "learning_rate": 7.320811548521051e-05, + "loss": 0.0067, + "step": 583280 + }, + { + "epoch": 1.51, + "learning_rate": 7.320422726883906e-05, + "loss": 0.0091, + "step": 583290 + }, + { + "epoch": 1.51, + "learning_rate": 7.320033905246758e-05, + "loss": 0.008, + "step": 583300 + }, + { + "epoch": 1.51, + "learning_rate": 7.319645083609613e-05, + "loss": 0.0098, + "step": 583310 + }, + { + "epoch": 1.51, + "learning_rate": 7.319256261972465e-05, + "loss": 0.0079, + "step": 583320 + }, + { + "epoch": 1.51, + "learning_rate": 7.31886744033532e-05, + "loss": 0.0084, + "step": 583330 + }, + { + "epoch": 1.51, + "learning_rate": 7.318478618698172e-05, + "loss": 0.008, + "step": 583340 + }, + { + "epoch": 1.51, + "learning_rate": 7.318089797061026e-05, + "loss": 0.0083, + "step": 583350 + }, + { + "epoch": 1.51, + "learning_rate": 7.31770097542388e-05, + "loss": 0.0106, + "step": 583360 + }, + { + "epoch": 1.51, + "learning_rate": 7.317312153786733e-05, + "loss": 0.0087, + "step": 583370 + }, + { + "epoch": 1.51, + "learning_rate": 7.316923332149588e-05, + "loss": 0.0115, + "step": 583380 + }, + { + "epoch": 1.51, + "learning_rate": 7.31653451051244e-05, + "loss": 0.0094, + "step": 583390 + }, + { + "epoch": 1.51, + "learning_rate": 7.316145688875295e-05, + "loss": 0.008, + "step": 583400 + }, + { + "epoch": 1.51, + "learning_rate": 7.315756867238147e-05, + "loss": 0.0083, + "step": 583410 + }, + { + "epoch": 1.51, + "learning_rate": 7.315368045601002e-05, + "loss": 0.0093, + "step": 583420 + }, + { + "epoch": 1.51, + "learning_rate": 7.314979223963854e-05, + "loss": 0.0099, + "step": 583430 + }, + { + "epoch": 1.51, + "learning_rate": 7.314590402326707e-05, + "loss": 0.0085, + "step": 583440 + }, + { + "epoch": 1.51, + "learning_rate": 7.314201580689561e-05, + "loss": 0.007, + "step": 583450 + }, + { + "epoch": 1.51, + "learning_rate": 7.313812759052415e-05, + "loss": 0.0091, + "step": 583460 + }, + { + "epoch": 1.51, + "learning_rate": 7.313423937415268e-05, + "loss": 0.0107, + "step": 583470 + }, + { + "epoch": 1.51, + "learning_rate": 7.313035115778122e-05, + "loss": 0.0088, + "step": 583480 + }, + { + "epoch": 1.51, + "learning_rate": 7.312646294140975e-05, + "loss": 0.0084, + "step": 583490 + }, + { + "epoch": 1.51, + "learning_rate": 7.31225747250383e-05, + "loss": 0.0106, + "step": 583500 + }, + { + "epoch": 1.51, + "learning_rate": 7.311868650866682e-05, + "loss": 0.0073, + "step": 583510 + }, + { + "epoch": 1.51, + "learning_rate": 7.311479829229536e-05, + "loss": 0.0107, + "step": 583520 + }, + { + "epoch": 1.51, + "learning_rate": 7.311091007592389e-05, + "loss": 0.0141, + "step": 583530 + }, + { + "epoch": 1.51, + "learning_rate": 7.310702185955243e-05, + "loss": 0.0075, + "step": 583540 + }, + { + "epoch": 1.51, + "learning_rate": 7.310313364318098e-05, + "loss": 0.0106, + "step": 583550 + }, + { + "epoch": 1.51, + "learning_rate": 7.30992454268095e-05, + "loss": 0.0068, + "step": 583560 + }, + { + "epoch": 1.51, + "learning_rate": 7.309535721043805e-05, + "loss": 0.0123, + "step": 583570 + }, + { + "epoch": 1.51, + "learning_rate": 7.309146899406657e-05, + "loss": 0.0105, + "step": 583580 + }, + { + "epoch": 1.51, + "learning_rate": 7.308758077769511e-05, + "loss": 0.011, + "step": 583590 + }, + { + "epoch": 1.51, + "learning_rate": 7.308369256132364e-05, + "loss": 0.0063, + "step": 583600 + }, + { + "epoch": 1.51, + "learning_rate": 7.307980434495218e-05, + "loss": 0.0071, + "step": 583610 + }, + { + "epoch": 1.51, + "learning_rate": 7.307591612858071e-05, + "loss": 0.0108, + "step": 583620 + }, + { + "epoch": 1.51, + "learning_rate": 7.307202791220925e-05, + "loss": 0.0079, + "step": 583630 + }, + { + "epoch": 1.51, + "learning_rate": 7.30681396958378e-05, + "loss": 0.0087, + "step": 583640 + }, + { + "epoch": 1.51, + "learning_rate": 7.306425147946632e-05, + "loss": 0.0081, + "step": 583650 + }, + { + "epoch": 1.51, + "learning_rate": 7.306036326309487e-05, + "loss": 0.0069, + "step": 583660 + }, + { + "epoch": 1.51, + "learning_rate": 7.30564750467234e-05, + "loss": 0.0091, + "step": 583670 + }, + { + "epoch": 1.51, + "learning_rate": 7.305258683035192e-05, + "loss": 0.0091, + "step": 583680 + }, + { + "epoch": 1.51, + "learning_rate": 7.304869861398046e-05, + "loss": 0.0055, + "step": 583690 + }, + { + "epoch": 1.51, + "learning_rate": 7.304481039760899e-05, + "loss": 0.0112, + "step": 583700 + }, + { + "epoch": 1.51, + "learning_rate": 7.304092218123753e-05, + "loss": 0.0117, + "step": 583710 + }, + { + "epoch": 1.51, + "learning_rate": 7.303703396486606e-05, + "loss": 0.0099, + "step": 583720 + }, + { + "epoch": 1.51, + "learning_rate": 7.30331457484946e-05, + "loss": 0.0086, + "step": 583730 + }, + { + "epoch": 1.51, + "learning_rate": 7.302925753212314e-05, + "loss": 0.0101, + "step": 583740 + }, + { + "epoch": 1.51, + "learning_rate": 7.302536931575167e-05, + "loss": 0.0081, + "step": 583750 + }, + { + "epoch": 1.51, + "learning_rate": 7.302148109938021e-05, + "loss": 0.009, + "step": 583760 + }, + { + "epoch": 1.51, + "learning_rate": 7.301759288300874e-05, + "loss": 0.0091, + "step": 583770 + }, + { + "epoch": 1.51, + "learning_rate": 7.301370466663728e-05, + "loss": 0.0079, + "step": 583780 + }, + { + "epoch": 1.51, + "learning_rate": 7.300981645026581e-05, + "loss": 0.013, + "step": 583790 + }, + { + "epoch": 1.51, + "learning_rate": 7.300592823389435e-05, + "loss": 0.0082, + "step": 583800 + }, + { + "epoch": 1.51, + "learning_rate": 7.30020400175229e-05, + "loss": 0.0085, + "step": 583810 + }, + { + "epoch": 1.51, + "learning_rate": 7.299815180115142e-05, + "loss": 0.0085, + "step": 583820 + }, + { + "epoch": 1.51, + "learning_rate": 7.299426358477996e-05, + "loss": 0.0095, + "step": 583830 + }, + { + "epoch": 1.51, + "learning_rate": 7.299037536840849e-05, + "loss": 0.0101, + "step": 583840 + }, + { + "epoch": 1.51, + "learning_rate": 7.298648715203703e-05, + "loss": 0.0078, + "step": 583850 + }, + { + "epoch": 1.51, + "learning_rate": 7.298259893566556e-05, + "loss": 0.0068, + "step": 583860 + }, + { + "epoch": 1.51, + "learning_rate": 7.29787107192941e-05, + "loss": 0.0076, + "step": 583870 + }, + { + "epoch": 1.51, + "learning_rate": 7.297482250292263e-05, + "loss": 0.0088, + "step": 583880 + }, + { + "epoch": 1.51, + "learning_rate": 7.297093428655117e-05, + "loss": 0.0085, + "step": 583890 + }, + { + "epoch": 1.51, + "learning_rate": 7.296704607017972e-05, + "loss": 0.0099, + "step": 583900 + }, + { + "epoch": 1.51, + "learning_rate": 7.296315785380824e-05, + "loss": 0.008, + "step": 583910 + }, + { + "epoch": 1.51, + "learning_rate": 7.295926963743677e-05, + "loss": 0.0084, + "step": 583920 + }, + { + "epoch": 1.51, + "learning_rate": 7.295538142106531e-05, + "loss": 0.0087, + "step": 583930 + }, + { + "epoch": 1.51, + "learning_rate": 7.295149320469384e-05, + "loss": 0.0108, + "step": 583940 + }, + { + "epoch": 1.51, + "learning_rate": 7.294760498832238e-05, + "loss": 0.0093, + "step": 583950 + }, + { + "epoch": 1.51, + "learning_rate": 7.294371677195091e-05, + "loss": 0.0062, + "step": 583960 + }, + { + "epoch": 1.51, + "learning_rate": 7.293982855557945e-05, + "loss": 0.0097, + "step": 583970 + }, + { + "epoch": 1.51, + "learning_rate": 7.293594033920798e-05, + "loss": 0.0104, + "step": 583980 + }, + { + "epoch": 1.51, + "learning_rate": 7.293205212283652e-05, + "loss": 0.0079, + "step": 583990 + }, + { + "epoch": 1.51, + "learning_rate": 7.292816390646506e-05, + "loss": 0.0078, + "step": 584000 + }, + { + "epoch": 1.51, + "eval_cer": 0.8816970877754311, + "eval_loss": 0.005978405941277742, + "eval_runtime": 107.7544, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 584000 + }, + { + "epoch": 1.51, + "learning_rate": 7.292427569009359e-05, + "loss": 0.0067, + "step": 584010 + }, + { + "epoch": 1.51, + "learning_rate": 7.292038747372213e-05, + "loss": 0.0088, + "step": 584020 + }, + { + "epoch": 1.51, + "learning_rate": 7.291649925735066e-05, + "loss": 0.0101, + "step": 584030 + }, + { + "epoch": 1.51, + "learning_rate": 7.29126110409792e-05, + "loss": 0.0079, + "step": 584040 + }, + { + "epoch": 1.51, + "learning_rate": 7.290872282460773e-05, + "loss": 0.006, + "step": 584050 + }, + { + "epoch": 1.51, + "learning_rate": 7.290483460823627e-05, + "loss": 0.0091, + "step": 584060 + }, + { + "epoch": 1.51, + "learning_rate": 7.290094639186482e-05, + "loss": 0.0114, + "step": 584070 + }, + { + "epoch": 1.51, + "learning_rate": 7.289705817549334e-05, + "loss": 0.0074, + "step": 584080 + }, + { + "epoch": 1.51, + "learning_rate": 7.289316995912188e-05, + "loss": 0.0103, + "step": 584090 + }, + { + "epoch": 1.51, + "learning_rate": 7.288928174275041e-05, + "loss": 0.0088, + "step": 584100 + }, + { + "epoch": 1.51, + "learning_rate": 7.288539352637895e-05, + "loss": 0.0098, + "step": 584110 + }, + { + "epoch": 1.51, + "learning_rate": 7.288150531000748e-05, + "loss": 0.0108, + "step": 584120 + }, + { + "epoch": 1.51, + "learning_rate": 7.287761709363602e-05, + "loss": 0.0087, + "step": 584130 + }, + { + "epoch": 1.51, + "learning_rate": 7.287372887726455e-05, + "loss": 0.0097, + "step": 584140 + }, + { + "epoch": 1.51, + "learning_rate": 7.28698406608931e-05, + "loss": 0.0136, + "step": 584150 + }, + { + "epoch": 1.51, + "learning_rate": 7.286595244452164e-05, + "loss": 0.0118, + "step": 584160 + }, + { + "epoch": 1.51, + "learning_rate": 7.286206422815016e-05, + "loss": 0.0105, + "step": 584170 + }, + { + "epoch": 1.51, + "learning_rate": 7.285817601177869e-05, + "loss": 0.0099, + "step": 584180 + }, + { + "epoch": 1.51, + "learning_rate": 7.285428779540723e-05, + "loss": 0.0084, + "step": 584190 + }, + { + "epoch": 1.51, + "learning_rate": 7.285039957903576e-05, + "loss": 0.0097, + "step": 584200 + }, + { + "epoch": 1.51, + "learning_rate": 7.28465113626643e-05, + "loss": 0.0071, + "step": 584210 + }, + { + "epoch": 1.51, + "learning_rate": 7.284262314629283e-05, + "loss": 0.009, + "step": 584220 + }, + { + "epoch": 1.51, + "learning_rate": 7.283873492992137e-05, + "loss": 0.0107, + "step": 584230 + }, + { + "epoch": 1.51, + "learning_rate": 7.28348467135499e-05, + "loss": 0.0072, + "step": 584240 + }, + { + "epoch": 1.51, + "learning_rate": 7.283095849717844e-05, + "loss": 0.0063, + "step": 584250 + }, + { + "epoch": 1.51, + "learning_rate": 7.282707028080698e-05, + "loss": 0.0077, + "step": 584260 + }, + { + "epoch": 1.51, + "learning_rate": 7.282318206443551e-05, + "loss": 0.0104, + "step": 584270 + }, + { + "epoch": 1.51, + "learning_rate": 7.281929384806405e-05, + "loss": 0.0063, + "step": 584280 + }, + { + "epoch": 1.51, + "learning_rate": 7.281540563169258e-05, + "loss": 0.0085, + "step": 584290 + }, + { + "epoch": 1.51, + "learning_rate": 7.281151741532112e-05, + "loss": 0.0079, + "step": 584300 + }, + { + "epoch": 1.51, + "learning_rate": 7.280762919894965e-05, + "loss": 0.0105, + "step": 584310 + }, + { + "epoch": 1.51, + "learning_rate": 7.28037409825782e-05, + "loss": 0.0098, + "step": 584320 + }, + { + "epoch": 1.51, + "learning_rate": 7.279985276620674e-05, + "loss": 0.0069, + "step": 584330 + }, + { + "epoch": 1.51, + "learning_rate": 7.279596454983526e-05, + "loss": 0.0097, + "step": 584340 + }, + { + "epoch": 1.51, + "learning_rate": 7.27920763334638e-05, + "loss": 0.0106, + "step": 584350 + }, + { + "epoch": 1.51, + "learning_rate": 7.278818811709233e-05, + "loss": 0.011, + "step": 584360 + }, + { + "epoch": 1.51, + "learning_rate": 7.278429990072087e-05, + "loss": 0.0084, + "step": 584370 + }, + { + "epoch": 1.51, + "learning_rate": 7.27804116843494e-05, + "loss": 0.0147, + "step": 584380 + }, + { + "epoch": 1.51, + "learning_rate": 7.277652346797794e-05, + "loss": 0.0115, + "step": 584390 + }, + { + "epoch": 1.51, + "learning_rate": 7.277263525160647e-05, + "loss": 0.0066, + "step": 584400 + }, + { + "epoch": 1.51, + "learning_rate": 7.276874703523501e-05, + "loss": 0.0099, + "step": 584410 + }, + { + "epoch": 1.51, + "learning_rate": 7.276485881886354e-05, + "loss": 0.0098, + "step": 584420 + }, + { + "epoch": 1.51, + "learning_rate": 7.276097060249208e-05, + "loss": 0.0096, + "step": 584430 + }, + { + "epoch": 1.51, + "learning_rate": 7.275708238612061e-05, + "loss": 0.0122, + "step": 584440 + }, + { + "epoch": 1.51, + "learning_rate": 7.275319416974915e-05, + "loss": 0.0071, + "step": 584450 + }, + { + "epoch": 1.52, + "learning_rate": 7.274930595337768e-05, + "loss": 0.0097, + "step": 584460 + }, + { + "epoch": 1.52, + "learning_rate": 7.274541773700622e-05, + "loss": 0.0084, + "step": 584470 + }, + { + "epoch": 1.52, + "learning_rate": 7.274152952063475e-05, + "loss": 0.007, + "step": 584480 + }, + { + "epoch": 1.52, + "learning_rate": 7.273764130426329e-05, + "loss": 0.0108, + "step": 584490 + }, + { + "epoch": 1.52, + "learning_rate": 7.273375308789182e-05, + "loss": 0.0087, + "step": 584500 + }, + { + "epoch": 1.52, + "learning_rate": 7.272986487152036e-05, + "loss": 0.0084, + "step": 584510 + }, + { + "epoch": 1.52, + "learning_rate": 7.27259766551489e-05, + "loss": 0.0094, + "step": 584520 + }, + { + "epoch": 1.52, + "learning_rate": 7.272208843877743e-05, + "loss": 0.0076, + "step": 584530 + }, + { + "epoch": 1.52, + "learning_rate": 7.271820022240597e-05, + "loss": 0.0103, + "step": 584540 + }, + { + "epoch": 1.52, + "learning_rate": 7.27143120060345e-05, + "loss": 0.0062, + "step": 584550 + }, + { + "epoch": 1.52, + "learning_rate": 7.271042378966304e-05, + "loss": 0.0115, + "step": 584560 + }, + { + "epoch": 1.52, + "learning_rate": 7.270653557329157e-05, + "loss": 0.0091, + "step": 584570 + }, + { + "epoch": 1.52, + "learning_rate": 7.270264735692011e-05, + "loss": 0.008, + "step": 584580 + }, + { + "epoch": 1.52, + "learning_rate": 7.269875914054866e-05, + "loss": 0.008, + "step": 584590 + }, + { + "epoch": 1.52, + "learning_rate": 7.269487092417718e-05, + "loss": 0.0107, + "step": 584600 + }, + { + "epoch": 1.52, + "learning_rate": 7.269098270780572e-05, + "loss": 0.0069, + "step": 584610 + }, + { + "epoch": 1.52, + "learning_rate": 7.268709449143425e-05, + "loss": 0.008, + "step": 584620 + }, + { + "epoch": 1.52, + "learning_rate": 7.26832062750628e-05, + "loss": 0.0088, + "step": 584630 + }, + { + "epoch": 1.52, + "learning_rate": 7.267931805869132e-05, + "loss": 0.0081, + "step": 584640 + }, + { + "epoch": 1.52, + "learning_rate": 7.267542984231986e-05, + "loss": 0.0096, + "step": 584650 + }, + { + "epoch": 1.52, + "learning_rate": 7.267154162594839e-05, + "loss": 0.0083, + "step": 584660 + }, + { + "epoch": 1.52, + "learning_rate": 7.266765340957692e-05, + "loss": 0.0074, + "step": 584670 + }, + { + "epoch": 1.52, + "learning_rate": 7.266376519320546e-05, + "loss": 0.0108, + "step": 584680 + }, + { + "epoch": 1.52, + "learning_rate": 7.2659876976834e-05, + "loss": 0.0108, + "step": 584690 + }, + { + "epoch": 1.52, + "learning_rate": 7.265598876046253e-05, + "loss": 0.008, + "step": 584700 + }, + { + "epoch": 1.52, + "learning_rate": 7.265210054409107e-05, + "loss": 0.0072, + "step": 584710 + }, + { + "epoch": 1.52, + "learning_rate": 7.26482123277196e-05, + "loss": 0.0087, + "step": 584720 + }, + { + "epoch": 1.52, + "learning_rate": 7.264432411134814e-05, + "loss": 0.009, + "step": 584730 + }, + { + "epoch": 1.52, + "learning_rate": 7.264043589497667e-05, + "loss": 0.0101, + "step": 584740 + }, + { + "epoch": 1.52, + "learning_rate": 7.263654767860521e-05, + "loss": 0.0107, + "step": 584750 + }, + { + "epoch": 1.52, + "learning_rate": 7.263265946223374e-05, + "loss": 0.0085, + "step": 584760 + }, + { + "epoch": 1.52, + "learning_rate": 7.262877124586228e-05, + "loss": 0.0083, + "step": 584770 + }, + { + "epoch": 1.52, + "learning_rate": 7.262488302949082e-05, + "loss": 0.0076, + "step": 584780 + }, + { + "epoch": 1.52, + "learning_rate": 7.262099481311935e-05, + "loss": 0.0098, + "step": 584790 + }, + { + "epoch": 1.52, + "learning_rate": 7.26171065967479e-05, + "loss": 0.01, + "step": 584800 + }, + { + "epoch": 1.52, + "learning_rate": 7.261321838037642e-05, + "loss": 0.0114, + "step": 584810 + }, + { + "epoch": 1.52, + "learning_rate": 7.260933016400496e-05, + "loss": 0.0107, + "step": 584820 + }, + { + "epoch": 1.52, + "learning_rate": 7.260544194763349e-05, + "loss": 0.0069, + "step": 584830 + }, + { + "epoch": 1.52, + "learning_rate": 7.260155373126203e-05, + "loss": 0.0089, + "step": 584840 + }, + { + "epoch": 1.52, + "learning_rate": 7.259766551489058e-05, + "loss": 0.0081, + "step": 584850 + }, + { + "epoch": 1.52, + "learning_rate": 7.25937772985191e-05, + "loss": 0.0084, + "step": 584860 + }, + { + "epoch": 1.52, + "learning_rate": 7.258988908214764e-05, + "loss": 0.0066, + "step": 584870 + }, + { + "epoch": 1.52, + "learning_rate": 7.258600086577617e-05, + "loss": 0.0095, + "step": 584880 + }, + { + "epoch": 1.52, + "learning_rate": 7.258211264940471e-05, + "loss": 0.0082, + "step": 584890 + }, + { + "epoch": 1.52, + "learning_rate": 7.257822443303324e-05, + "loss": 0.0075, + "step": 584900 + }, + { + "epoch": 1.52, + "learning_rate": 7.257433621666178e-05, + "loss": 0.0085, + "step": 584910 + }, + { + "epoch": 1.52, + "learning_rate": 7.257044800029031e-05, + "loss": 0.0103, + "step": 584920 + }, + { + "epoch": 1.52, + "learning_rate": 7.256655978391884e-05, + "loss": 0.0093, + "step": 584930 + }, + { + "epoch": 1.52, + "learning_rate": 7.256267156754738e-05, + "loss": 0.0077, + "step": 584940 + }, + { + "epoch": 1.52, + "learning_rate": 7.255878335117592e-05, + "loss": 0.0093, + "step": 584950 + }, + { + "epoch": 1.52, + "learning_rate": 7.255489513480445e-05, + "loss": 0.0099, + "step": 584960 + }, + { + "epoch": 1.52, + "learning_rate": 7.2551006918433e-05, + "loss": 0.0077, + "step": 584970 + }, + { + "epoch": 1.52, + "learning_rate": 7.254711870206152e-05, + "loss": 0.0113, + "step": 584980 + }, + { + "epoch": 1.52, + "learning_rate": 7.254323048569006e-05, + "loss": 0.0101, + "step": 584990 + }, + { + "epoch": 1.52, + "learning_rate": 7.253934226931859e-05, + "loss": 0.0061, + "step": 585000 + }, + { + "epoch": 1.52, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.005952306557446718, + "eval_runtime": 107.7504, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 585000 + }, + { + "epoch": 1.52, + "learning_rate": 7.253545405294713e-05, + "loss": 0.0096, + "step": 585010 + }, + { + "epoch": 1.52, + "learning_rate": 7.253156583657566e-05, + "loss": 0.0086, + "step": 585020 + }, + { + "epoch": 1.52, + "learning_rate": 7.25276776202042e-05, + "loss": 0.0089, + "step": 585030 + }, + { + "epoch": 1.52, + "learning_rate": 7.252378940383274e-05, + "loss": 0.0108, + "step": 585040 + }, + { + "epoch": 1.52, + "learning_rate": 7.251990118746127e-05, + "loss": 0.0072, + "step": 585050 + }, + { + "epoch": 1.52, + "learning_rate": 7.251601297108981e-05, + "loss": 0.0099, + "step": 585060 + }, + { + "epoch": 1.52, + "learning_rate": 7.251212475471834e-05, + "loss": 0.0077, + "step": 585070 + }, + { + "epoch": 1.52, + "learning_rate": 7.250823653834688e-05, + "loss": 0.0095, + "step": 585080 + }, + { + "epoch": 1.52, + "learning_rate": 7.250434832197541e-05, + "loss": 0.0149, + "step": 585090 + }, + { + "epoch": 1.52, + "learning_rate": 7.250046010560395e-05, + "loss": 0.0096, + "step": 585100 + }, + { + "epoch": 1.52, + "learning_rate": 7.249657188923248e-05, + "loss": 0.0089, + "step": 585110 + }, + { + "epoch": 1.52, + "learning_rate": 7.249268367286102e-05, + "loss": 0.0077, + "step": 585120 + }, + { + "epoch": 1.52, + "learning_rate": 7.248879545648956e-05, + "loss": 0.0105, + "step": 585130 + }, + { + "epoch": 1.52, + "learning_rate": 7.248490724011809e-05, + "loss": 0.0066, + "step": 585140 + }, + { + "epoch": 1.52, + "learning_rate": 7.248101902374663e-05, + "loss": 0.0102, + "step": 585150 + }, + { + "epoch": 1.52, + "learning_rate": 7.247713080737516e-05, + "loss": 0.0099, + "step": 585160 + }, + { + "epoch": 1.52, + "learning_rate": 7.247324259100369e-05, + "loss": 0.0085, + "step": 585170 + }, + { + "epoch": 1.52, + "learning_rate": 7.246935437463223e-05, + "loss": 0.0082, + "step": 585180 + }, + { + "epoch": 1.52, + "learning_rate": 7.246546615826076e-05, + "loss": 0.0094, + "step": 585190 + }, + { + "epoch": 1.52, + "learning_rate": 7.24615779418893e-05, + "loss": 0.0105, + "step": 585200 + }, + { + "epoch": 1.52, + "learning_rate": 7.245768972551783e-05, + "loss": 0.0089, + "step": 585210 + }, + { + "epoch": 1.52, + "learning_rate": 7.245380150914637e-05, + "loss": 0.0086, + "step": 585220 + }, + { + "epoch": 1.52, + "learning_rate": 7.244991329277491e-05, + "loss": 0.0088, + "step": 585230 + }, + { + "epoch": 1.52, + "learning_rate": 7.244602507640344e-05, + "loss": 0.0082, + "step": 585240 + }, + { + "epoch": 1.52, + "learning_rate": 7.244213686003198e-05, + "loss": 0.0081, + "step": 585250 + }, + { + "epoch": 1.52, + "learning_rate": 7.243824864366051e-05, + "loss": 0.0092, + "step": 585260 + }, + { + "epoch": 1.52, + "learning_rate": 7.243436042728905e-05, + "loss": 0.0097, + "step": 585270 + }, + { + "epoch": 1.52, + "learning_rate": 7.243047221091758e-05, + "loss": 0.0089, + "step": 585280 + }, + { + "epoch": 1.52, + "learning_rate": 7.242658399454612e-05, + "loss": 0.0067, + "step": 585290 + }, + { + "epoch": 1.52, + "learning_rate": 7.242269577817466e-05, + "loss": 0.0098, + "step": 585300 + }, + { + "epoch": 1.52, + "learning_rate": 7.241880756180319e-05, + "loss": 0.0077, + "step": 585310 + }, + { + "epoch": 1.52, + "learning_rate": 7.241491934543173e-05, + "loss": 0.0077, + "step": 585320 + }, + { + "epoch": 1.52, + "learning_rate": 7.241103112906026e-05, + "loss": 0.0072, + "step": 585330 + }, + { + "epoch": 1.52, + "learning_rate": 7.24071429126888e-05, + "loss": 0.0103, + "step": 585340 + }, + { + "epoch": 1.52, + "learning_rate": 7.240325469631733e-05, + "loss": 0.0079, + "step": 585350 + }, + { + "epoch": 1.52, + "learning_rate": 7.239936647994587e-05, + "loss": 0.0108, + "step": 585360 + }, + { + "epoch": 1.52, + "learning_rate": 7.23954782635744e-05, + "loss": 0.0086, + "step": 585370 + }, + { + "epoch": 1.52, + "learning_rate": 7.239159004720294e-05, + "loss": 0.0102, + "step": 585380 + }, + { + "epoch": 1.52, + "learning_rate": 7.238770183083148e-05, + "loss": 0.0098, + "step": 585390 + }, + { + "epoch": 1.52, + "learning_rate": 7.238381361446001e-05, + "loss": 0.0084, + "step": 585400 + }, + { + "epoch": 1.52, + "learning_rate": 7.237992539808854e-05, + "loss": 0.0104, + "step": 585410 + }, + { + "epoch": 1.52, + "learning_rate": 7.237603718171708e-05, + "loss": 0.0109, + "step": 585420 + }, + { + "epoch": 1.52, + "learning_rate": 7.237214896534561e-05, + "loss": 0.0096, + "step": 585430 + }, + { + "epoch": 1.52, + "learning_rate": 7.236826074897415e-05, + "loss": 0.009, + "step": 585440 + }, + { + "epoch": 1.52, + "learning_rate": 7.236437253260268e-05, + "loss": 0.0111, + "step": 585450 + }, + { + "epoch": 1.52, + "learning_rate": 7.236048431623122e-05, + "loss": 0.0096, + "step": 585460 + }, + { + "epoch": 1.52, + "learning_rate": 7.235659609985975e-05, + "loss": 0.0097, + "step": 585470 + }, + { + "epoch": 1.52, + "learning_rate": 7.235270788348829e-05, + "loss": 0.0084, + "step": 585480 + }, + { + "epoch": 1.52, + "learning_rate": 7.234881966711683e-05, + "loss": 0.0084, + "step": 585490 + }, + { + "epoch": 1.52, + "learning_rate": 7.234493145074536e-05, + "loss": 0.0095, + "step": 585500 + }, + { + "epoch": 1.52, + "learning_rate": 7.23410432343739e-05, + "loss": 0.0088, + "step": 585510 + }, + { + "epoch": 1.52, + "learning_rate": 7.233715501800243e-05, + "loss": 0.0137, + "step": 585520 + }, + { + "epoch": 1.52, + "learning_rate": 7.233326680163097e-05, + "loss": 0.0078, + "step": 585530 + }, + { + "epoch": 1.52, + "learning_rate": 7.23293785852595e-05, + "loss": 0.0075, + "step": 585540 + }, + { + "epoch": 1.52, + "learning_rate": 7.232549036888804e-05, + "loss": 0.0079, + "step": 585550 + }, + { + "epoch": 1.52, + "learning_rate": 7.232160215251658e-05, + "loss": 0.0106, + "step": 585560 + }, + { + "epoch": 1.52, + "learning_rate": 7.231771393614511e-05, + "loss": 0.0071, + "step": 585570 + }, + { + "epoch": 1.52, + "learning_rate": 7.231382571977365e-05, + "loss": 0.0087, + "step": 585580 + }, + { + "epoch": 1.52, + "learning_rate": 7.230993750340218e-05, + "loss": 0.0087, + "step": 585590 + }, + { + "epoch": 1.52, + "learning_rate": 7.230604928703072e-05, + "loss": 0.0079, + "step": 585600 + }, + { + "epoch": 1.52, + "learning_rate": 7.230216107065925e-05, + "loss": 0.0116, + "step": 585610 + }, + { + "epoch": 1.52, + "learning_rate": 7.22982728542878e-05, + "loss": 0.0077, + "step": 585620 + }, + { + "epoch": 1.52, + "learning_rate": 7.229438463791632e-05, + "loss": 0.0097, + "step": 585630 + }, + { + "epoch": 1.52, + "learning_rate": 7.229049642154486e-05, + "loss": 0.011, + "step": 585640 + }, + { + "epoch": 1.52, + "learning_rate": 7.22866082051734e-05, + "loss": 0.0067, + "step": 585650 + }, + { + "epoch": 1.52, + "learning_rate": 7.228271998880193e-05, + "loss": 0.0138, + "step": 585660 + }, + { + "epoch": 1.52, + "learning_rate": 7.227883177243046e-05, + "loss": 0.0072, + "step": 585670 + }, + { + "epoch": 1.52, + "learning_rate": 7.2274943556059e-05, + "loss": 0.0081, + "step": 585680 + }, + { + "epoch": 1.52, + "learning_rate": 7.227105533968753e-05, + "loss": 0.01, + "step": 585690 + }, + { + "epoch": 1.52, + "learning_rate": 7.226716712331607e-05, + "loss": 0.0085, + "step": 585700 + }, + { + "epoch": 1.52, + "learning_rate": 7.22632789069446e-05, + "loss": 0.0078, + "step": 585710 + }, + { + "epoch": 1.52, + "learning_rate": 7.225939069057314e-05, + "loss": 0.0088, + "step": 585720 + }, + { + "epoch": 1.52, + "learning_rate": 7.225550247420167e-05, + "loss": 0.0093, + "step": 585730 + }, + { + "epoch": 1.52, + "learning_rate": 7.225161425783021e-05, + "loss": 0.0094, + "step": 585740 + }, + { + "epoch": 1.52, + "learning_rate": 7.224772604145875e-05, + "loss": 0.0071, + "step": 585750 + }, + { + "epoch": 1.52, + "learning_rate": 7.224383782508728e-05, + "loss": 0.0073, + "step": 585760 + }, + { + "epoch": 1.52, + "learning_rate": 7.223994960871582e-05, + "loss": 0.0066, + "step": 585770 + }, + { + "epoch": 1.52, + "learning_rate": 7.223606139234435e-05, + "loss": 0.0104, + "step": 585780 + }, + { + "epoch": 1.52, + "learning_rate": 7.223217317597289e-05, + "loss": 0.0094, + "step": 585790 + }, + { + "epoch": 1.52, + "learning_rate": 7.222828495960142e-05, + "loss": 0.0119, + "step": 585800 + }, + { + "epoch": 1.52, + "learning_rate": 7.222439674322996e-05, + "loss": 0.0117, + "step": 585810 + }, + { + "epoch": 1.52, + "learning_rate": 7.22205085268585e-05, + "loss": 0.0064, + "step": 585820 + }, + { + "epoch": 1.52, + "learning_rate": 7.221662031048703e-05, + "loss": 0.0093, + "step": 585830 + }, + { + "epoch": 1.52, + "learning_rate": 7.221273209411557e-05, + "loss": 0.0088, + "step": 585840 + }, + { + "epoch": 1.52, + "learning_rate": 7.22088438777441e-05, + "loss": 0.0079, + "step": 585850 + }, + { + "epoch": 1.52, + "learning_rate": 7.220495566137264e-05, + "loss": 0.0099, + "step": 585860 + }, + { + "epoch": 1.52, + "learning_rate": 7.220106744500117e-05, + "loss": 0.013, + "step": 585870 + }, + { + "epoch": 1.52, + "learning_rate": 7.219717922862971e-05, + "loss": 0.0079, + "step": 585880 + }, + { + "epoch": 1.52, + "learning_rate": 7.219329101225824e-05, + "loss": 0.0071, + "step": 585890 + }, + { + "epoch": 1.52, + "learning_rate": 7.218940279588678e-05, + "loss": 0.0066, + "step": 585900 + }, + { + "epoch": 1.52, + "learning_rate": 7.218551457951531e-05, + "loss": 0.0099, + "step": 585910 + }, + { + "epoch": 1.52, + "learning_rate": 7.218162636314385e-05, + "loss": 0.0086, + "step": 585920 + }, + { + "epoch": 1.52, + "learning_rate": 7.217773814677238e-05, + "loss": 0.0111, + "step": 585930 + }, + { + "epoch": 1.52, + "learning_rate": 7.217384993040092e-05, + "loss": 0.0096, + "step": 585940 + }, + { + "epoch": 1.52, + "learning_rate": 7.216996171402945e-05, + "loss": 0.0075, + "step": 585950 + }, + { + "epoch": 1.52, + "learning_rate": 7.216607349765799e-05, + "loss": 0.0094, + "step": 585960 + }, + { + "epoch": 1.52, + "learning_rate": 7.216218528128652e-05, + "loss": 0.0109, + "step": 585970 + }, + { + "epoch": 1.52, + "learning_rate": 7.215829706491506e-05, + "loss": 0.0094, + "step": 585980 + }, + { + "epoch": 1.52, + "learning_rate": 7.215440884854359e-05, + "loss": 0.0109, + "step": 585990 + }, + { + "epoch": 1.52, + "learning_rate": 7.215052063217213e-05, + "loss": 0.0127, + "step": 586000 + }, + { + "epoch": 1.52, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.00595942372456193, + "eval_runtime": 107.8725, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 586000 + }, + { + "epoch": 1.52, + "learning_rate": 7.214663241580067e-05, + "loss": 0.012, + "step": 586010 + }, + { + "epoch": 1.52, + "learning_rate": 7.21427441994292e-05, + "loss": 0.0105, + "step": 586020 + }, + { + "epoch": 1.52, + "learning_rate": 7.213885598305774e-05, + "loss": 0.0072, + "step": 586030 + }, + { + "epoch": 1.52, + "learning_rate": 7.213496776668627e-05, + "loss": 0.0095, + "step": 586040 + }, + { + "epoch": 1.52, + "learning_rate": 7.213107955031481e-05, + "loss": 0.0085, + "step": 586050 + }, + { + "epoch": 1.52, + "learning_rate": 7.212719133394334e-05, + "loss": 0.0105, + "step": 586060 + }, + { + "epoch": 1.52, + "learning_rate": 7.212330311757188e-05, + "loss": 0.0073, + "step": 586070 + }, + { + "epoch": 1.52, + "learning_rate": 7.211941490120042e-05, + "loss": 0.0124, + "step": 586080 + }, + { + "epoch": 1.52, + "learning_rate": 7.211552668482895e-05, + "loss": 0.0099, + "step": 586090 + }, + { + "epoch": 1.52, + "learning_rate": 7.21116384684575e-05, + "loss": 0.01, + "step": 586100 + }, + { + "epoch": 1.52, + "learning_rate": 7.210775025208602e-05, + "loss": 0.0098, + "step": 586110 + }, + { + "epoch": 1.52, + "learning_rate": 7.210386203571456e-05, + "loss": 0.0087, + "step": 586120 + }, + { + "epoch": 1.52, + "learning_rate": 7.209997381934309e-05, + "loss": 0.0084, + "step": 586130 + }, + { + "epoch": 1.52, + "learning_rate": 7.209608560297163e-05, + "loss": 0.009, + "step": 586140 + }, + { + "epoch": 1.52, + "learning_rate": 7.209219738660016e-05, + "loss": 0.0082, + "step": 586150 + }, + { + "epoch": 1.52, + "learning_rate": 7.208830917022869e-05, + "loss": 0.0079, + "step": 586160 + }, + { + "epoch": 1.52, + "learning_rate": 7.208442095385723e-05, + "loss": 0.0081, + "step": 586170 + }, + { + "epoch": 1.52, + "learning_rate": 7.208053273748577e-05, + "loss": 0.0109, + "step": 586180 + }, + { + "epoch": 1.52, + "learning_rate": 7.20766445211143e-05, + "loss": 0.0092, + "step": 586190 + }, + { + "epoch": 1.52, + "learning_rate": 7.207275630474284e-05, + "loss": 0.0087, + "step": 586200 + }, + { + "epoch": 1.52, + "learning_rate": 7.206886808837137e-05, + "loss": 0.0111, + "step": 586210 + }, + { + "epoch": 1.52, + "learning_rate": 7.206497987199991e-05, + "loss": 0.008, + "step": 586220 + }, + { + "epoch": 1.52, + "learning_rate": 7.206109165562844e-05, + "loss": 0.0098, + "step": 586230 + }, + { + "epoch": 1.52, + "learning_rate": 7.205720343925698e-05, + "loss": 0.0104, + "step": 586240 + }, + { + "epoch": 1.52, + "learning_rate": 7.205331522288551e-05, + "loss": 0.0077, + "step": 586250 + }, + { + "epoch": 1.52, + "learning_rate": 7.204942700651405e-05, + "loss": 0.007, + "step": 586260 + }, + { + "epoch": 1.52, + "learning_rate": 7.204553879014259e-05, + "loss": 0.0084, + "step": 586270 + }, + { + "epoch": 1.52, + "learning_rate": 7.204165057377112e-05, + "loss": 0.0119, + "step": 586280 + }, + { + "epoch": 1.52, + "learning_rate": 7.203776235739966e-05, + "loss": 0.0086, + "step": 586290 + }, + { + "epoch": 1.52, + "learning_rate": 7.203387414102819e-05, + "loss": 0.0082, + "step": 586300 + }, + { + "epoch": 1.52, + "learning_rate": 7.202998592465673e-05, + "loss": 0.0094, + "step": 586310 + }, + { + "epoch": 1.52, + "learning_rate": 7.202609770828526e-05, + "loss": 0.0083, + "step": 586320 + }, + { + "epoch": 1.52, + "learning_rate": 7.20222094919138e-05, + "loss": 0.0079, + "step": 586330 + }, + { + "epoch": 1.52, + "learning_rate": 7.201832127554234e-05, + "loss": 0.009, + "step": 586340 + }, + { + "epoch": 1.52, + "learning_rate": 7.201443305917087e-05, + "loss": 0.0097, + "step": 586350 + }, + { + "epoch": 1.52, + "learning_rate": 7.201054484279941e-05, + "loss": 0.011, + "step": 586360 + }, + { + "epoch": 1.52, + "learning_rate": 7.200665662642794e-05, + "loss": 0.0077, + "step": 586370 + }, + { + "epoch": 1.52, + "learning_rate": 7.200276841005648e-05, + "loss": 0.011, + "step": 586380 + }, + { + "epoch": 1.52, + "learning_rate": 7.199888019368501e-05, + "loss": 0.0123, + "step": 586390 + }, + { + "epoch": 1.52, + "learning_rate": 7.199499197731355e-05, + "loss": 0.0103, + "step": 586400 + }, + { + "epoch": 1.52, + "learning_rate": 7.199110376094208e-05, + "loss": 0.0101, + "step": 586410 + }, + { + "epoch": 1.52, + "learning_rate": 7.198721554457061e-05, + "loss": 0.0076, + "step": 586420 + }, + { + "epoch": 1.52, + "learning_rate": 7.198332732819915e-05, + "loss": 0.0074, + "step": 586430 + }, + { + "epoch": 1.52, + "learning_rate": 7.197943911182769e-05, + "loss": 0.0091, + "step": 586440 + }, + { + "epoch": 1.52, + "learning_rate": 7.197555089545622e-05, + "loss": 0.0105, + "step": 586450 + }, + { + "epoch": 1.52, + "learning_rate": 7.197166267908476e-05, + "loss": 0.0084, + "step": 586460 + }, + { + "epoch": 1.52, + "learning_rate": 7.196777446271329e-05, + "loss": 0.011, + "step": 586470 + }, + { + "epoch": 1.52, + "learning_rate": 7.196388624634183e-05, + "loss": 0.0094, + "step": 586480 + }, + { + "epoch": 1.52, + "learning_rate": 7.195999802997036e-05, + "loss": 0.0099, + "step": 586490 + }, + { + "epoch": 1.52, + "learning_rate": 7.19561098135989e-05, + "loss": 0.0069, + "step": 586500 + }, + { + "epoch": 1.52, + "learning_rate": 7.195222159722743e-05, + "loss": 0.0051, + "step": 586510 + }, + { + "epoch": 1.52, + "learning_rate": 7.194833338085597e-05, + "loss": 0.0112, + "step": 586520 + }, + { + "epoch": 1.52, + "learning_rate": 7.194444516448451e-05, + "loss": 0.0072, + "step": 586530 + }, + { + "epoch": 1.52, + "learning_rate": 7.194055694811304e-05, + "loss": 0.0081, + "step": 586540 + }, + { + "epoch": 1.52, + "learning_rate": 7.193666873174158e-05, + "loss": 0.009, + "step": 586550 + }, + { + "epoch": 1.52, + "learning_rate": 7.193278051537011e-05, + "loss": 0.0067, + "step": 586560 + }, + { + "epoch": 1.52, + "learning_rate": 7.192889229899865e-05, + "loss": 0.0102, + "step": 586570 + }, + { + "epoch": 1.52, + "learning_rate": 7.192500408262718e-05, + "loss": 0.0101, + "step": 586580 + }, + { + "epoch": 1.52, + "learning_rate": 7.192111586625572e-05, + "loss": 0.0109, + "step": 586590 + }, + { + "epoch": 1.52, + "learning_rate": 7.191722764988425e-05, + "loss": 0.0105, + "step": 586600 + }, + { + "epoch": 1.52, + "learning_rate": 7.191333943351279e-05, + "loss": 0.008, + "step": 586610 + }, + { + "epoch": 1.52, + "learning_rate": 7.190945121714133e-05, + "loss": 0.0091, + "step": 586620 + }, + { + "epoch": 1.52, + "learning_rate": 7.190556300076986e-05, + "loss": 0.0071, + "step": 586630 + }, + { + "epoch": 1.52, + "learning_rate": 7.19016747843984e-05, + "loss": 0.0107, + "step": 586640 + }, + { + "epoch": 1.52, + "learning_rate": 7.189778656802693e-05, + "loss": 0.0094, + "step": 586650 + }, + { + "epoch": 1.52, + "learning_rate": 7.189389835165546e-05, + "loss": 0.0085, + "step": 586660 + }, + { + "epoch": 1.52, + "learning_rate": 7.1890010135284e-05, + "loss": 0.0076, + "step": 586670 + }, + { + "epoch": 1.52, + "learning_rate": 7.188612191891253e-05, + "loss": 0.0056, + "step": 586680 + }, + { + "epoch": 1.52, + "learning_rate": 7.188223370254107e-05, + "loss": 0.0087, + "step": 586690 + }, + { + "epoch": 1.52, + "learning_rate": 7.18783454861696e-05, + "loss": 0.0075, + "step": 586700 + }, + { + "epoch": 1.52, + "learning_rate": 7.187445726979814e-05, + "loss": 0.0092, + "step": 586710 + }, + { + "epoch": 1.52, + "learning_rate": 7.187056905342668e-05, + "loss": 0.0088, + "step": 586720 + }, + { + "epoch": 1.52, + "learning_rate": 7.186668083705521e-05, + "loss": 0.0088, + "step": 586730 + }, + { + "epoch": 1.52, + "learning_rate": 7.186279262068375e-05, + "loss": 0.0113, + "step": 586740 + }, + { + "epoch": 1.52, + "learning_rate": 7.185890440431228e-05, + "loss": 0.0084, + "step": 586750 + }, + { + "epoch": 1.52, + "learning_rate": 7.185501618794082e-05, + "loss": 0.0093, + "step": 586760 + }, + { + "epoch": 1.52, + "learning_rate": 7.185112797156935e-05, + "loss": 0.0122, + "step": 586770 + }, + { + "epoch": 1.52, + "learning_rate": 7.184723975519789e-05, + "loss": 0.0075, + "step": 586780 + }, + { + "epoch": 1.52, + "learning_rate": 7.184335153882643e-05, + "loss": 0.0109, + "step": 586790 + }, + { + "epoch": 1.52, + "learning_rate": 7.183946332245496e-05, + "loss": 0.0095, + "step": 586800 + }, + { + "epoch": 1.52, + "learning_rate": 7.18355751060835e-05, + "loss": 0.0073, + "step": 586810 + }, + { + "epoch": 1.52, + "learning_rate": 7.183168688971203e-05, + "loss": 0.0073, + "step": 586820 + }, + { + "epoch": 1.52, + "learning_rate": 7.182779867334057e-05, + "loss": 0.0086, + "step": 586830 + }, + { + "epoch": 1.52, + "learning_rate": 7.18239104569691e-05, + "loss": 0.0108, + "step": 586840 + }, + { + "epoch": 1.52, + "learning_rate": 7.182002224059764e-05, + "loss": 0.0095, + "step": 586850 + }, + { + "epoch": 1.52, + "learning_rate": 7.181613402422617e-05, + "loss": 0.0105, + "step": 586860 + }, + { + "epoch": 1.52, + "learning_rate": 7.181224580785471e-05, + "loss": 0.0088, + "step": 586870 + }, + { + "epoch": 1.52, + "learning_rate": 7.180835759148325e-05, + "loss": 0.0072, + "step": 586880 + }, + { + "epoch": 1.52, + "learning_rate": 7.180446937511178e-05, + "loss": 0.0083, + "step": 586890 + }, + { + "epoch": 1.52, + "learning_rate": 7.180058115874031e-05, + "loss": 0.0062, + "step": 586900 + }, + { + "epoch": 1.52, + "learning_rate": 7.179669294236885e-05, + "loss": 0.008, + "step": 586910 + }, + { + "epoch": 1.52, + "learning_rate": 7.179280472599738e-05, + "loss": 0.0079, + "step": 586920 + }, + { + "epoch": 1.52, + "learning_rate": 7.178891650962592e-05, + "loss": 0.0082, + "step": 586930 + }, + { + "epoch": 1.52, + "learning_rate": 7.178502829325445e-05, + "loss": 0.0083, + "step": 586940 + }, + { + "epoch": 1.52, + "learning_rate": 7.178114007688299e-05, + "loss": 0.0106, + "step": 586950 + }, + { + "epoch": 1.52, + "learning_rate": 7.177725186051152e-05, + "loss": 0.0068, + "step": 586960 + }, + { + "epoch": 1.52, + "learning_rate": 7.177336364414006e-05, + "loss": 0.0101, + "step": 586970 + }, + { + "epoch": 1.52, + "learning_rate": 7.17694754277686e-05, + "loss": 0.0086, + "step": 586980 + }, + { + "epoch": 1.52, + "learning_rate": 7.176558721139713e-05, + "loss": 0.0077, + "step": 586990 + }, + { + "epoch": 1.52, + "learning_rate": 7.176169899502567e-05, + "loss": 0.0087, + "step": 587000 + }, + { + "epoch": 1.52, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.005926743149757385, + "eval_runtime": 107.8399, + "eval_samples_per_second": 18.546, + "eval_steps_per_second": 4.637, + "step": 587000 + }, + { + "epoch": 1.52, + "learning_rate": 7.17578107786542e-05, + "loss": 0.0067, + "step": 587010 + }, + { + "epoch": 1.52, + "learning_rate": 7.175392256228274e-05, + "loss": 0.0066, + "step": 587020 + }, + { + "epoch": 1.52, + "learning_rate": 7.175003434591127e-05, + "loss": 0.0083, + "step": 587030 + }, + { + "epoch": 1.52, + "learning_rate": 7.174614612953981e-05, + "loss": 0.0089, + "step": 587040 + }, + { + "epoch": 1.52, + "learning_rate": 7.174225791316835e-05, + "loss": 0.0086, + "step": 587050 + }, + { + "epoch": 1.52, + "learning_rate": 7.173836969679688e-05, + "loss": 0.0098, + "step": 587060 + }, + { + "epoch": 1.52, + "learning_rate": 7.173448148042542e-05, + "loss": 0.0083, + "step": 587070 + }, + { + "epoch": 1.52, + "learning_rate": 7.173059326405395e-05, + "loss": 0.0081, + "step": 587080 + }, + { + "epoch": 1.52, + "learning_rate": 7.172670504768249e-05, + "loss": 0.0077, + "step": 587090 + }, + { + "epoch": 1.52, + "learning_rate": 7.172281683131102e-05, + "loss": 0.0076, + "step": 587100 + }, + { + "epoch": 1.52, + "learning_rate": 7.171892861493956e-05, + "loss": 0.0078, + "step": 587110 + }, + { + "epoch": 1.52, + "learning_rate": 7.171504039856809e-05, + "loss": 0.0098, + "step": 587120 + }, + { + "epoch": 1.52, + "learning_rate": 7.171115218219663e-05, + "loss": 0.0099, + "step": 587130 + }, + { + "epoch": 1.52, + "learning_rate": 7.170726396582517e-05, + "loss": 0.0083, + "step": 587140 + }, + { + "epoch": 1.52, + "learning_rate": 7.17033757494537e-05, + "loss": 0.0122, + "step": 587150 + }, + { + "epoch": 1.52, + "learning_rate": 7.169948753308223e-05, + "loss": 0.0062, + "step": 587160 + }, + { + "epoch": 1.52, + "learning_rate": 7.169559931671077e-05, + "loss": 0.0128, + "step": 587170 + }, + { + "epoch": 1.52, + "learning_rate": 7.16917111003393e-05, + "loss": 0.0076, + "step": 587180 + }, + { + "epoch": 1.52, + "learning_rate": 7.168782288396784e-05, + "loss": 0.009, + "step": 587190 + }, + { + "epoch": 1.52, + "learning_rate": 7.168393466759637e-05, + "loss": 0.0081, + "step": 587200 + }, + { + "epoch": 1.52, + "learning_rate": 7.168004645122491e-05, + "loss": 0.0068, + "step": 587210 + }, + { + "epoch": 1.52, + "learning_rate": 7.167615823485344e-05, + "loss": 0.0053, + "step": 587220 + }, + { + "epoch": 1.52, + "learning_rate": 7.167227001848198e-05, + "loss": 0.0084, + "step": 587230 + }, + { + "epoch": 1.52, + "learning_rate": 7.166838180211052e-05, + "loss": 0.0099, + "step": 587240 + }, + { + "epoch": 1.52, + "learning_rate": 7.166449358573905e-05, + "loss": 0.0076, + "step": 587250 + }, + { + "epoch": 1.52, + "learning_rate": 7.166060536936759e-05, + "loss": 0.0056, + "step": 587260 + }, + { + "epoch": 1.52, + "learning_rate": 7.165671715299612e-05, + "loss": 0.01, + "step": 587270 + }, + { + "epoch": 1.52, + "learning_rate": 7.165282893662466e-05, + "loss": 0.0085, + "step": 587280 + }, + { + "epoch": 1.52, + "learning_rate": 7.164894072025319e-05, + "loss": 0.0107, + "step": 587290 + }, + { + "epoch": 1.52, + "learning_rate": 7.164505250388173e-05, + "loss": 0.0087, + "step": 587300 + }, + { + "epoch": 1.52, + "learning_rate": 7.164116428751027e-05, + "loss": 0.0093, + "step": 587310 + }, + { + "epoch": 1.52, + "learning_rate": 7.16372760711388e-05, + "loss": 0.0106, + "step": 587320 + }, + { + "epoch": 1.52, + "learning_rate": 7.163338785476734e-05, + "loss": 0.0064, + "step": 587330 + }, + { + "epoch": 1.52, + "learning_rate": 7.162949963839587e-05, + "loss": 0.006, + "step": 587340 + }, + { + "epoch": 1.52, + "learning_rate": 7.162561142202441e-05, + "loss": 0.0085, + "step": 587350 + }, + { + "epoch": 1.52, + "learning_rate": 7.162172320565294e-05, + "loss": 0.0097, + "step": 587360 + }, + { + "epoch": 1.52, + "learning_rate": 7.161783498928148e-05, + "loss": 0.0076, + "step": 587370 + }, + { + "epoch": 1.52, + "learning_rate": 7.161394677291001e-05, + "loss": 0.0073, + "step": 587380 + }, + { + "epoch": 1.52, + "learning_rate": 7.161005855653855e-05, + "loss": 0.008, + "step": 587390 + }, + { + "epoch": 1.52, + "learning_rate": 7.160617034016708e-05, + "loss": 0.0081, + "step": 587400 + }, + { + "epoch": 1.52, + "learning_rate": 7.160228212379562e-05, + "loss": 0.0074, + "step": 587410 + }, + { + "epoch": 1.52, + "learning_rate": 7.159839390742415e-05, + "loss": 0.0083, + "step": 587420 + }, + { + "epoch": 1.52, + "learning_rate": 7.159450569105269e-05, + "loss": 0.007, + "step": 587430 + }, + { + "epoch": 1.52, + "learning_rate": 7.159061747468122e-05, + "loss": 0.0093, + "step": 587440 + }, + { + "epoch": 1.52, + "learning_rate": 7.158672925830976e-05, + "loss": 0.0098, + "step": 587450 + }, + { + "epoch": 1.52, + "learning_rate": 7.158284104193829e-05, + "loss": 0.0112, + "step": 587460 + }, + { + "epoch": 1.52, + "learning_rate": 7.157895282556683e-05, + "loss": 0.0095, + "step": 587470 + }, + { + "epoch": 1.52, + "learning_rate": 7.157506460919536e-05, + "loss": 0.0111, + "step": 587480 + }, + { + "epoch": 1.52, + "learning_rate": 7.15711763928239e-05, + "loss": 0.008, + "step": 587490 + }, + { + "epoch": 1.52, + "learning_rate": 7.156728817645244e-05, + "loss": 0.0089, + "step": 587500 + }, + { + "epoch": 1.52, + "learning_rate": 7.156339996008097e-05, + "loss": 0.014, + "step": 587510 + }, + { + "epoch": 1.52, + "learning_rate": 7.155951174370951e-05, + "loss": 0.0091, + "step": 587520 + }, + { + "epoch": 1.52, + "learning_rate": 7.155562352733804e-05, + "loss": 0.0098, + "step": 587530 + }, + { + "epoch": 1.52, + "learning_rate": 7.155173531096658e-05, + "loss": 0.0089, + "step": 587540 + }, + { + "epoch": 1.52, + "learning_rate": 7.154784709459511e-05, + "loss": 0.0064, + "step": 587550 + }, + { + "epoch": 1.52, + "learning_rate": 7.154395887822365e-05, + "loss": 0.0088, + "step": 587560 + }, + { + "epoch": 1.52, + "learning_rate": 7.154007066185219e-05, + "loss": 0.01, + "step": 587570 + }, + { + "epoch": 1.52, + "learning_rate": 7.153618244548072e-05, + "loss": 0.0077, + "step": 587580 + }, + { + "epoch": 1.52, + "learning_rate": 7.153229422910926e-05, + "loss": 0.0119, + "step": 587590 + }, + { + "epoch": 1.52, + "learning_rate": 7.152840601273779e-05, + "loss": 0.0074, + "step": 587600 + }, + { + "epoch": 1.52, + "learning_rate": 7.152451779636633e-05, + "loss": 0.011, + "step": 587610 + }, + { + "epoch": 1.52, + "learning_rate": 7.152062957999486e-05, + "loss": 0.0099, + "step": 587620 + }, + { + "epoch": 1.52, + "learning_rate": 7.15167413636234e-05, + "loss": 0.0106, + "step": 587630 + }, + { + "epoch": 1.52, + "learning_rate": 7.151285314725193e-05, + "loss": 0.0051, + "step": 587640 + }, + { + "epoch": 1.52, + "learning_rate": 7.150896493088046e-05, + "loss": 0.008, + "step": 587650 + }, + { + "epoch": 1.52, + "learning_rate": 7.1505076714509e-05, + "loss": 0.0082, + "step": 587660 + }, + { + "epoch": 1.52, + "learning_rate": 7.150118849813754e-05, + "loss": 0.0077, + "step": 587670 + }, + { + "epoch": 1.52, + "learning_rate": 7.149730028176607e-05, + "loss": 0.0085, + "step": 587680 + }, + { + "epoch": 1.52, + "learning_rate": 7.149341206539461e-05, + "loss": 0.0106, + "step": 587690 + }, + { + "epoch": 1.52, + "learning_rate": 7.148952384902314e-05, + "loss": 0.0093, + "step": 587700 + }, + { + "epoch": 1.52, + "learning_rate": 7.148563563265168e-05, + "loss": 0.0095, + "step": 587710 + }, + { + "epoch": 1.52, + "learning_rate": 7.148174741628021e-05, + "loss": 0.0083, + "step": 587720 + }, + { + "epoch": 1.52, + "learning_rate": 7.147785919990875e-05, + "loss": 0.0107, + "step": 587730 + }, + { + "epoch": 1.52, + "learning_rate": 7.147397098353728e-05, + "loss": 0.0107, + "step": 587740 + }, + { + "epoch": 1.52, + "learning_rate": 7.147008276716582e-05, + "loss": 0.0074, + "step": 587750 + }, + { + "epoch": 1.52, + "learning_rate": 7.146619455079436e-05, + "loss": 0.0099, + "step": 587760 + }, + { + "epoch": 1.52, + "learning_rate": 7.146230633442289e-05, + "loss": 0.0085, + "step": 587770 + }, + { + "epoch": 1.52, + "learning_rate": 7.145841811805143e-05, + "loss": 0.0082, + "step": 587780 + }, + { + "epoch": 1.52, + "learning_rate": 7.145452990167996e-05, + "loss": 0.0057, + "step": 587790 + }, + { + "epoch": 1.52, + "learning_rate": 7.14506416853085e-05, + "loss": 0.0094, + "step": 587800 + }, + { + "epoch": 1.52, + "learning_rate": 7.144675346893703e-05, + "loss": 0.0097, + "step": 587810 + }, + { + "epoch": 1.52, + "learning_rate": 7.144286525256557e-05, + "loss": 0.0097, + "step": 587820 + }, + { + "epoch": 1.52, + "learning_rate": 7.14389770361941e-05, + "loss": 0.0082, + "step": 587830 + }, + { + "epoch": 1.52, + "learning_rate": 7.143508881982264e-05, + "loss": 0.0084, + "step": 587840 + }, + { + "epoch": 1.52, + "learning_rate": 7.143120060345118e-05, + "loss": 0.0083, + "step": 587850 + }, + { + "epoch": 1.52, + "learning_rate": 7.142731238707971e-05, + "loss": 0.011, + "step": 587860 + }, + { + "epoch": 1.52, + "learning_rate": 7.142342417070825e-05, + "loss": 0.0067, + "step": 587870 + }, + { + "epoch": 1.52, + "learning_rate": 7.141953595433678e-05, + "loss": 0.0086, + "step": 587880 + }, + { + "epoch": 1.52, + "learning_rate": 7.141564773796531e-05, + "loss": 0.0069, + "step": 587890 + }, + { + "epoch": 1.52, + "learning_rate": 7.141175952159385e-05, + "loss": 0.0067, + "step": 587900 + }, + { + "epoch": 1.52, + "learning_rate": 7.140787130522238e-05, + "loss": 0.0092, + "step": 587910 + }, + { + "epoch": 1.52, + "learning_rate": 7.140398308885092e-05, + "loss": 0.0094, + "step": 587920 + }, + { + "epoch": 1.52, + "learning_rate": 7.140009487247945e-05, + "loss": 0.0091, + "step": 587930 + }, + { + "epoch": 1.52, + "learning_rate": 7.139620665610799e-05, + "loss": 0.0113, + "step": 587940 + }, + { + "epoch": 1.52, + "learning_rate": 7.139231843973653e-05, + "loss": 0.0109, + "step": 587950 + }, + { + "epoch": 1.52, + "learning_rate": 7.138843022336506e-05, + "loss": 0.0082, + "step": 587960 + }, + { + "epoch": 1.52, + "learning_rate": 7.13845420069936e-05, + "loss": 0.0096, + "step": 587970 + }, + { + "epoch": 1.52, + "learning_rate": 7.138065379062213e-05, + "loss": 0.0102, + "step": 587980 + }, + { + "epoch": 1.52, + "learning_rate": 7.137676557425067e-05, + "loss": 0.0073, + "step": 587990 + }, + { + "epoch": 1.52, + "learning_rate": 7.13728773578792e-05, + "loss": 0.0072, + "step": 588000 + }, + { + "epoch": 1.52, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.005772036034613848, + "eval_runtime": 107.6593, + "eval_samples_per_second": 18.577, + "eval_steps_per_second": 4.644, + "step": 588000 + }, + { + "epoch": 1.52, + "learning_rate": 7.136898914150774e-05, + "loss": 0.0073, + "step": 588010 + }, + { + "epoch": 1.52, + "learning_rate": 7.136510092513628e-05, + "loss": 0.0102, + "step": 588020 + }, + { + "epoch": 1.52, + "learning_rate": 7.136121270876481e-05, + "loss": 0.01, + "step": 588030 + }, + { + "epoch": 1.52, + "learning_rate": 7.135732449239335e-05, + "loss": 0.0083, + "step": 588040 + }, + { + "epoch": 1.52, + "learning_rate": 7.135343627602188e-05, + "loss": 0.0085, + "step": 588050 + }, + { + "epoch": 1.52, + "learning_rate": 7.134954805965042e-05, + "loss": 0.0091, + "step": 588060 + }, + { + "epoch": 1.52, + "learning_rate": 7.134565984327895e-05, + "loss": 0.0075, + "step": 588070 + }, + { + "epoch": 1.52, + "learning_rate": 7.134177162690749e-05, + "loss": 0.012, + "step": 588080 + }, + { + "epoch": 1.52, + "learning_rate": 7.133788341053602e-05, + "loss": 0.0109, + "step": 588090 + }, + { + "epoch": 1.52, + "learning_rate": 7.133399519416456e-05, + "loss": 0.008, + "step": 588100 + }, + { + "epoch": 1.52, + "learning_rate": 7.13301069777931e-05, + "loss": 0.0073, + "step": 588110 + }, + { + "epoch": 1.52, + "learning_rate": 7.132621876142163e-05, + "loss": 0.0095, + "step": 588120 + }, + { + "epoch": 1.52, + "learning_rate": 7.132233054505017e-05, + "loss": 0.0098, + "step": 588130 + }, + { + "epoch": 1.52, + "learning_rate": 7.13184423286787e-05, + "loss": 0.0066, + "step": 588140 + }, + { + "epoch": 1.52, + "learning_rate": 7.131455411230723e-05, + "loss": 0.0087, + "step": 588150 + }, + { + "epoch": 1.52, + "learning_rate": 7.131066589593577e-05, + "loss": 0.0102, + "step": 588160 + }, + { + "epoch": 1.52, + "learning_rate": 7.13067776795643e-05, + "loss": 0.009, + "step": 588170 + }, + { + "epoch": 1.52, + "learning_rate": 7.130288946319284e-05, + "loss": 0.009, + "step": 588180 + }, + { + "epoch": 1.52, + "learning_rate": 7.129900124682137e-05, + "loss": 0.0106, + "step": 588190 + }, + { + "epoch": 1.52, + "learning_rate": 7.129511303044991e-05, + "loss": 0.0092, + "step": 588200 + }, + { + "epoch": 1.52, + "learning_rate": 7.129122481407845e-05, + "loss": 0.0107, + "step": 588210 + }, + { + "epoch": 1.52, + "learning_rate": 7.128733659770698e-05, + "loss": 0.0101, + "step": 588220 + }, + { + "epoch": 1.52, + "learning_rate": 7.128344838133552e-05, + "loss": 0.0085, + "step": 588230 + }, + { + "epoch": 1.52, + "learning_rate": 7.127956016496405e-05, + "loss": 0.0088, + "step": 588240 + }, + { + "epoch": 1.52, + "learning_rate": 7.127567194859259e-05, + "loss": 0.0109, + "step": 588250 + }, + { + "epoch": 1.52, + "learning_rate": 7.127178373222112e-05, + "loss": 0.0128, + "step": 588260 + }, + { + "epoch": 1.52, + "learning_rate": 7.126789551584966e-05, + "loss": 0.0127, + "step": 588270 + }, + { + "epoch": 1.52, + "learning_rate": 7.12640072994782e-05, + "loss": 0.01, + "step": 588280 + }, + { + "epoch": 1.52, + "learning_rate": 7.126011908310673e-05, + "loss": 0.0104, + "step": 588290 + }, + { + "epoch": 1.52, + "learning_rate": 7.125623086673527e-05, + "loss": 0.0087, + "step": 588300 + }, + { + "epoch": 1.52, + "learning_rate": 7.12523426503638e-05, + "loss": 0.0088, + "step": 588310 + }, + { + "epoch": 1.53, + "learning_rate": 7.124845443399234e-05, + "loss": 0.0105, + "step": 588320 + }, + { + "epoch": 1.53, + "learning_rate": 7.124456621762087e-05, + "loss": 0.0089, + "step": 588330 + }, + { + "epoch": 1.53, + "learning_rate": 7.124067800124941e-05, + "loss": 0.0115, + "step": 588340 + }, + { + "epoch": 1.53, + "learning_rate": 7.123678978487794e-05, + "loss": 0.0087, + "step": 588350 + }, + { + "epoch": 1.53, + "learning_rate": 7.123290156850648e-05, + "loss": 0.0081, + "step": 588360 + }, + { + "epoch": 1.53, + "learning_rate": 7.122901335213502e-05, + "loss": 0.0085, + "step": 588370 + }, + { + "epoch": 1.53, + "learning_rate": 7.122512513576355e-05, + "loss": 0.0085, + "step": 588380 + }, + { + "epoch": 1.53, + "learning_rate": 7.122123691939208e-05, + "loss": 0.009, + "step": 588390 + }, + { + "epoch": 1.53, + "learning_rate": 7.121734870302062e-05, + "loss": 0.0114, + "step": 588400 + }, + { + "epoch": 1.53, + "learning_rate": 7.121346048664915e-05, + "loss": 0.0095, + "step": 588410 + }, + { + "epoch": 1.53, + "learning_rate": 7.120957227027769e-05, + "loss": 0.01, + "step": 588420 + }, + { + "epoch": 1.53, + "learning_rate": 7.120568405390622e-05, + "loss": 0.0076, + "step": 588430 + }, + { + "epoch": 1.53, + "learning_rate": 7.120179583753476e-05, + "loss": 0.0082, + "step": 588440 + }, + { + "epoch": 1.53, + "learning_rate": 7.119790762116329e-05, + "loss": 0.0108, + "step": 588450 + }, + { + "epoch": 1.53, + "learning_rate": 7.119401940479183e-05, + "loss": 0.0098, + "step": 588460 + }, + { + "epoch": 1.53, + "learning_rate": 7.119013118842037e-05, + "loss": 0.0084, + "step": 588470 + }, + { + "epoch": 1.53, + "learning_rate": 7.11862429720489e-05, + "loss": 0.0099, + "step": 588480 + }, + { + "epoch": 1.53, + "learning_rate": 7.118235475567744e-05, + "loss": 0.01, + "step": 588490 + }, + { + "epoch": 1.53, + "learning_rate": 7.117846653930597e-05, + "loss": 0.0101, + "step": 588500 + }, + { + "epoch": 1.53, + "learning_rate": 7.117457832293451e-05, + "loss": 0.0079, + "step": 588510 + }, + { + "epoch": 1.53, + "learning_rate": 7.117069010656304e-05, + "loss": 0.0058, + "step": 588520 + }, + { + "epoch": 1.53, + "learning_rate": 7.116680189019158e-05, + "loss": 0.0134, + "step": 588530 + }, + { + "epoch": 1.53, + "learning_rate": 7.116291367382012e-05, + "loss": 0.0091, + "step": 588540 + }, + { + "epoch": 1.53, + "learning_rate": 7.115902545744865e-05, + "loss": 0.0085, + "step": 588550 + }, + { + "epoch": 1.53, + "learning_rate": 7.115513724107719e-05, + "loss": 0.0084, + "step": 588560 + }, + { + "epoch": 1.53, + "learning_rate": 7.115124902470572e-05, + "loss": 0.0075, + "step": 588570 + }, + { + "epoch": 1.53, + "learning_rate": 7.114736080833426e-05, + "loss": 0.0078, + "step": 588580 + }, + { + "epoch": 1.53, + "learning_rate": 7.114347259196279e-05, + "loss": 0.0089, + "step": 588590 + }, + { + "epoch": 1.53, + "learning_rate": 7.113958437559133e-05, + "loss": 0.0082, + "step": 588600 + }, + { + "epoch": 1.53, + "learning_rate": 7.113569615921986e-05, + "loss": 0.0069, + "step": 588610 + }, + { + "epoch": 1.53, + "learning_rate": 7.11318079428484e-05, + "loss": 0.0094, + "step": 588620 + }, + { + "epoch": 1.53, + "learning_rate": 7.112791972647694e-05, + "loss": 0.0062, + "step": 588630 + }, + { + "epoch": 1.53, + "learning_rate": 7.112403151010547e-05, + "loss": 0.0082, + "step": 588640 + }, + { + "epoch": 1.53, + "learning_rate": 7.1120143293734e-05, + "loss": 0.0076, + "step": 588650 + }, + { + "epoch": 1.53, + "learning_rate": 7.111625507736254e-05, + "loss": 0.0116, + "step": 588660 + }, + { + "epoch": 1.53, + "learning_rate": 7.111236686099107e-05, + "loss": 0.0103, + "step": 588670 + }, + { + "epoch": 1.53, + "learning_rate": 7.110847864461961e-05, + "loss": 0.0076, + "step": 588680 + }, + { + "epoch": 1.53, + "learning_rate": 7.110459042824814e-05, + "loss": 0.009, + "step": 588690 + }, + { + "epoch": 1.53, + "learning_rate": 7.110070221187668e-05, + "loss": 0.0096, + "step": 588700 + }, + { + "epoch": 1.53, + "learning_rate": 7.109681399550521e-05, + "loss": 0.0142, + "step": 588710 + }, + { + "epoch": 1.53, + "learning_rate": 7.109292577913375e-05, + "loss": 0.0097, + "step": 588720 + }, + { + "epoch": 1.53, + "learning_rate": 7.108903756276229e-05, + "loss": 0.0092, + "step": 588730 + }, + { + "epoch": 1.53, + "learning_rate": 7.108514934639082e-05, + "loss": 0.0084, + "step": 588740 + }, + { + "epoch": 1.53, + "learning_rate": 7.108126113001936e-05, + "loss": 0.01, + "step": 588750 + }, + { + "epoch": 1.53, + "learning_rate": 7.107737291364789e-05, + "loss": 0.0096, + "step": 588760 + }, + { + "epoch": 1.53, + "learning_rate": 7.107348469727643e-05, + "loss": 0.012, + "step": 588770 + }, + { + "epoch": 1.53, + "learning_rate": 7.106959648090496e-05, + "loss": 0.0073, + "step": 588780 + }, + { + "epoch": 1.53, + "learning_rate": 7.10657082645335e-05, + "loss": 0.0054, + "step": 588790 + }, + { + "epoch": 1.53, + "learning_rate": 7.106182004816204e-05, + "loss": 0.0073, + "step": 588800 + }, + { + "epoch": 1.53, + "learning_rate": 7.105793183179057e-05, + "loss": 0.006, + "step": 588810 + }, + { + "epoch": 1.53, + "learning_rate": 7.105404361541911e-05, + "loss": 0.0078, + "step": 588820 + }, + { + "epoch": 1.53, + "learning_rate": 7.105015539904764e-05, + "loss": 0.0078, + "step": 588830 + }, + { + "epoch": 1.53, + "learning_rate": 7.104626718267618e-05, + "loss": 0.0106, + "step": 588840 + }, + { + "epoch": 1.53, + "learning_rate": 7.104237896630471e-05, + "loss": 0.0063, + "step": 588850 + }, + { + "epoch": 1.53, + "learning_rate": 7.103849074993325e-05, + "loss": 0.0089, + "step": 588860 + }, + { + "epoch": 1.53, + "learning_rate": 7.103460253356178e-05, + "loss": 0.0072, + "step": 588870 + }, + { + "epoch": 1.53, + "learning_rate": 7.103071431719032e-05, + "loss": 0.0077, + "step": 588880 + }, + { + "epoch": 1.53, + "learning_rate": 7.102682610081885e-05, + "loss": 0.0099, + "step": 588890 + }, + { + "epoch": 1.53, + "learning_rate": 7.102293788444739e-05, + "loss": 0.0113, + "step": 588900 + }, + { + "epoch": 1.53, + "learning_rate": 7.101904966807592e-05, + "loss": 0.0072, + "step": 588910 + }, + { + "epoch": 1.53, + "learning_rate": 7.101516145170446e-05, + "loss": 0.0084, + "step": 588920 + }, + { + "epoch": 1.53, + "learning_rate": 7.101127323533299e-05, + "loss": 0.0075, + "step": 588930 + }, + { + "epoch": 1.53, + "learning_rate": 7.100738501896153e-05, + "loss": 0.0065, + "step": 588940 + }, + { + "epoch": 1.53, + "learning_rate": 7.100349680259006e-05, + "loss": 0.0094, + "step": 588950 + }, + { + "epoch": 1.53, + "learning_rate": 7.09996085862186e-05, + "loss": 0.0102, + "step": 588960 + }, + { + "epoch": 1.53, + "learning_rate": 7.099572036984713e-05, + "loss": 0.0079, + "step": 588970 + }, + { + "epoch": 1.53, + "learning_rate": 7.099183215347567e-05, + "loss": 0.0096, + "step": 588980 + }, + { + "epoch": 1.53, + "learning_rate": 7.098794393710421e-05, + "loss": 0.0073, + "step": 588990 + }, + { + "epoch": 1.53, + "learning_rate": 7.098405572073274e-05, + "loss": 0.0068, + "step": 589000 + }, + { + "epoch": 1.53, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.005820184480398893, + "eval_runtime": 107.9961, + "eval_samples_per_second": 18.519, + "eval_steps_per_second": 4.63, + "step": 589000 + }, + { + "epoch": 1.53, + "learning_rate": 7.098016750436128e-05, + "loss": 0.0064, + "step": 589010 + }, + { + "epoch": 1.53, + "learning_rate": 7.097627928798981e-05, + "loss": 0.0086, + "step": 589020 + }, + { + "epoch": 1.53, + "learning_rate": 7.097239107161835e-05, + "loss": 0.008, + "step": 589030 + }, + { + "epoch": 1.53, + "learning_rate": 7.096850285524688e-05, + "loss": 0.0094, + "step": 589040 + }, + { + "epoch": 1.53, + "learning_rate": 7.096461463887542e-05, + "loss": 0.0073, + "step": 589050 + }, + { + "epoch": 1.53, + "learning_rate": 7.096072642250396e-05, + "loss": 0.0142, + "step": 589060 + }, + { + "epoch": 1.53, + "learning_rate": 7.095683820613249e-05, + "loss": 0.0084, + "step": 589070 + }, + { + "epoch": 1.53, + "learning_rate": 7.095294998976103e-05, + "loss": 0.0076, + "step": 589080 + }, + { + "epoch": 1.53, + "learning_rate": 7.094906177338956e-05, + "loss": 0.0078, + "step": 589090 + }, + { + "epoch": 1.53, + "learning_rate": 7.09451735570181e-05, + "loss": 0.0094, + "step": 589100 + }, + { + "epoch": 1.53, + "learning_rate": 7.094128534064663e-05, + "loss": 0.0074, + "step": 589110 + }, + { + "epoch": 1.53, + "learning_rate": 7.093739712427517e-05, + "loss": 0.0142, + "step": 589120 + }, + { + "epoch": 1.53, + "learning_rate": 7.09335089079037e-05, + "loss": 0.0066, + "step": 589130 + }, + { + "epoch": 1.53, + "learning_rate": 7.092962069153223e-05, + "loss": 0.0106, + "step": 589140 + }, + { + "epoch": 1.53, + "learning_rate": 7.092573247516077e-05, + "loss": 0.0081, + "step": 589150 + }, + { + "epoch": 1.53, + "learning_rate": 7.092184425878931e-05, + "loss": 0.0085, + "step": 589160 + }, + { + "epoch": 1.53, + "learning_rate": 7.091795604241784e-05, + "loss": 0.0114, + "step": 589170 + }, + { + "epoch": 1.53, + "learning_rate": 7.091406782604638e-05, + "loss": 0.0101, + "step": 589180 + }, + { + "epoch": 1.53, + "learning_rate": 7.091017960967491e-05, + "loss": 0.0094, + "step": 589190 + }, + { + "epoch": 1.53, + "learning_rate": 7.090629139330345e-05, + "loss": 0.009, + "step": 589200 + }, + { + "epoch": 1.53, + "learning_rate": 7.090240317693198e-05, + "loss": 0.0079, + "step": 589210 + }, + { + "epoch": 1.53, + "learning_rate": 7.089851496056052e-05, + "loss": 0.009, + "step": 589220 + }, + { + "epoch": 1.53, + "learning_rate": 7.089462674418905e-05, + "loss": 0.0084, + "step": 589230 + }, + { + "epoch": 1.53, + "learning_rate": 7.089073852781759e-05, + "loss": 0.007, + "step": 589240 + }, + { + "epoch": 1.53, + "learning_rate": 7.088685031144613e-05, + "loss": 0.0106, + "step": 589250 + }, + { + "epoch": 1.53, + "learning_rate": 7.088296209507466e-05, + "loss": 0.0076, + "step": 589260 + }, + { + "epoch": 1.53, + "learning_rate": 7.08790738787032e-05, + "loss": 0.0071, + "step": 589270 + }, + { + "epoch": 1.53, + "learning_rate": 7.087518566233173e-05, + "loss": 0.0111, + "step": 589280 + }, + { + "epoch": 1.53, + "learning_rate": 7.087129744596027e-05, + "loss": 0.0084, + "step": 589290 + }, + { + "epoch": 1.53, + "learning_rate": 7.08674092295888e-05, + "loss": 0.0091, + "step": 589300 + }, + { + "epoch": 1.53, + "learning_rate": 7.086352101321734e-05, + "loss": 0.0081, + "step": 589310 + }, + { + "epoch": 1.53, + "learning_rate": 7.085963279684587e-05, + "loss": 0.0078, + "step": 589320 + }, + { + "epoch": 1.53, + "learning_rate": 7.085574458047441e-05, + "loss": 0.0081, + "step": 589330 + }, + { + "epoch": 1.53, + "learning_rate": 7.085185636410295e-05, + "loss": 0.0079, + "step": 589340 + }, + { + "epoch": 1.53, + "learning_rate": 7.084796814773148e-05, + "loss": 0.01, + "step": 589350 + }, + { + "epoch": 1.53, + "learning_rate": 7.084407993136002e-05, + "loss": 0.01, + "step": 589360 + }, + { + "epoch": 1.53, + "learning_rate": 7.084019171498855e-05, + "loss": 0.0074, + "step": 589370 + }, + { + "epoch": 1.53, + "learning_rate": 7.083630349861708e-05, + "loss": 0.0079, + "step": 589380 + }, + { + "epoch": 1.53, + "learning_rate": 7.083241528224562e-05, + "loss": 0.0068, + "step": 589390 + }, + { + "epoch": 1.53, + "learning_rate": 7.082852706587415e-05, + "loss": 0.0089, + "step": 589400 + }, + { + "epoch": 1.53, + "learning_rate": 7.082463884950269e-05, + "loss": 0.0104, + "step": 589410 + }, + { + "epoch": 1.53, + "learning_rate": 7.082075063313122e-05, + "loss": 0.0091, + "step": 589420 + }, + { + "epoch": 1.53, + "learning_rate": 7.081686241675976e-05, + "loss": 0.0103, + "step": 589430 + }, + { + "epoch": 1.53, + "learning_rate": 7.08129742003883e-05, + "loss": 0.0067, + "step": 589440 + }, + { + "epoch": 1.53, + "learning_rate": 7.080908598401683e-05, + "loss": 0.0116, + "step": 589450 + }, + { + "epoch": 1.53, + "learning_rate": 7.080519776764537e-05, + "loss": 0.0074, + "step": 589460 + }, + { + "epoch": 1.53, + "learning_rate": 7.08013095512739e-05, + "loss": 0.0109, + "step": 589470 + }, + { + "epoch": 1.53, + "learning_rate": 7.079742133490244e-05, + "loss": 0.0071, + "step": 589480 + }, + { + "epoch": 1.53, + "learning_rate": 7.079353311853097e-05, + "loss": 0.007, + "step": 589490 + }, + { + "epoch": 1.53, + "learning_rate": 7.078964490215951e-05, + "loss": 0.0106, + "step": 589500 + }, + { + "epoch": 1.53, + "learning_rate": 7.078575668578805e-05, + "loss": 0.0099, + "step": 589510 + }, + { + "epoch": 1.53, + "learning_rate": 7.078186846941658e-05, + "loss": 0.0084, + "step": 589520 + }, + { + "epoch": 1.53, + "learning_rate": 7.077798025304512e-05, + "loss": 0.0093, + "step": 589530 + }, + { + "epoch": 1.53, + "learning_rate": 7.077409203667365e-05, + "loss": 0.0095, + "step": 589540 + }, + { + "epoch": 1.53, + "learning_rate": 7.077020382030219e-05, + "loss": 0.0108, + "step": 589550 + }, + { + "epoch": 1.53, + "learning_rate": 7.076631560393072e-05, + "loss": 0.007, + "step": 589560 + }, + { + "epoch": 1.53, + "learning_rate": 7.076242738755926e-05, + "loss": 0.0076, + "step": 589570 + }, + { + "epoch": 1.53, + "learning_rate": 7.075853917118779e-05, + "loss": 0.0095, + "step": 589580 + }, + { + "epoch": 1.53, + "learning_rate": 7.075465095481633e-05, + "loss": 0.0085, + "step": 589590 + }, + { + "epoch": 1.53, + "learning_rate": 7.075076273844487e-05, + "loss": 0.0077, + "step": 589600 + }, + { + "epoch": 1.53, + "learning_rate": 7.07468745220734e-05, + "loss": 0.0069, + "step": 589610 + }, + { + "epoch": 1.53, + "learning_rate": 7.074298630570194e-05, + "loss": 0.0112, + "step": 589620 + }, + { + "epoch": 1.53, + "learning_rate": 7.073909808933047e-05, + "loss": 0.0063, + "step": 589630 + }, + { + "epoch": 1.53, + "learning_rate": 7.0735209872959e-05, + "loss": 0.0073, + "step": 589640 + }, + { + "epoch": 1.53, + "learning_rate": 7.073132165658754e-05, + "loss": 0.0102, + "step": 589650 + }, + { + "epoch": 1.53, + "learning_rate": 7.072743344021607e-05, + "loss": 0.009, + "step": 589660 + }, + { + "epoch": 1.53, + "learning_rate": 7.072354522384461e-05, + "loss": 0.0111, + "step": 589670 + }, + { + "epoch": 1.53, + "learning_rate": 7.071965700747314e-05, + "loss": 0.0068, + "step": 589680 + }, + { + "epoch": 1.53, + "learning_rate": 7.071576879110168e-05, + "loss": 0.011, + "step": 589690 + }, + { + "epoch": 1.53, + "learning_rate": 7.071188057473022e-05, + "loss": 0.0068, + "step": 589700 + }, + { + "epoch": 1.53, + "learning_rate": 7.070799235835875e-05, + "loss": 0.0071, + "step": 589710 + }, + { + "epoch": 1.53, + "learning_rate": 7.070410414198729e-05, + "loss": 0.0061, + "step": 589720 + }, + { + "epoch": 1.53, + "learning_rate": 7.070021592561582e-05, + "loss": 0.0073, + "step": 589730 + }, + { + "epoch": 1.53, + "learning_rate": 7.069632770924436e-05, + "loss": 0.0095, + "step": 589740 + }, + { + "epoch": 1.53, + "learning_rate": 7.069243949287289e-05, + "loss": 0.007, + "step": 589750 + }, + { + "epoch": 1.53, + "learning_rate": 7.068855127650143e-05, + "loss": 0.0069, + "step": 589760 + }, + { + "epoch": 1.53, + "learning_rate": 7.068466306012997e-05, + "loss": 0.0078, + "step": 589770 + }, + { + "epoch": 1.53, + "learning_rate": 7.06807748437585e-05, + "loss": 0.0086, + "step": 589780 + }, + { + "epoch": 1.53, + "learning_rate": 7.067688662738704e-05, + "loss": 0.0077, + "step": 589790 + }, + { + "epoch": 1.53, + "learning_rate": 7.067299841101557e-05, + "loss": 0.0092, + "step": 589800 + }, + { + "epoch": 1.53, + "learning_rate": 7.066911019464411e-05, + "loss": 0.0073, + "step": 589810 + }, + { + "epoch": 1.53, + "learning_rate": 7.066522197827264e-05, + "loss": 0.0069, + "step": 589820 + }, + { + "epoch": 1.53, + "learning_rate": 7.066133376190118e-05, + "loss": 0.0099, + "step": 589830 + }, + { + "epoch": 1.53, + "learning_rate": 7.065744554552971e-05, + "loss": 0.0104, + "step": 589840 + }, + { + "epoch": 1.53, + "learning_rate": 7.065355732915825e-05, + "loss": 0.0075, + "step": 589850 + }, + { + "epoch": 1.53, + "learning_rate": 7.064966911278679e-05, + "loss": 0.0094, + "step": 589860 + }, + { + "epoch": 1.53, + "learning_rate": 7.064578089641532e-05, + "loss": 0.0102, + "step": 589870 + }, + { + "epoch": 1.53, + "learning_rate": 7.064189268004385e-05, + "loss": 0.0118, + "step": 589880 + }, + { + "epoch": 1.53, + "learning_rate": 7.063800446367239e-05, + "loss": 0.0098, + "step": 589890 + }, + { + "epoch": 1.53, + "learning_rate": 7.063411624730092e-05, + "loss": 0.0099, + "step": 589900 + }, + { + "epoch": 1.53, + "learning_rate": 7.063022803092946e-05, + "loss": 0.0079, + "step": 589910 + }, + { + "epoch": 1.53, + "learning_rate": 7.062633981455799e-05, + "loss": 0.0091, + "step": 589920 + }, + { + "epoch": 1.53, + "learning_rate": 7.062245159818653e-05, + "loss": 0.0128, + "step": 589930 + }, + { + "epoch": 1.53, + "learning_rate": 7.061856338181506e-05, + "loss": 0.0097, + "step": 589940 + }, + { + "epoch": 1.53, + "learning_rate": 7.06146751654436e-05, + "loss": 0.0087, + "step": 589950 + }, + { + "epoch": 1.53, + "learning_rate": 7.061078694907214e-05, + "loss": 0.0097, + "step": 589960 + }, + { + "epoch": 1.53, + "learning_rate": 7.060689873270067e-05, + "loss": 0.0106, + "step": 589970 + }, + { + "epoch": 1.53, + "learning_rate": 7.060301051632921e-05, + "loss": 0.0069, + "step": 589980 + }, + { + "epoch": 1.53, + "learning_rate": 7.059912229995774e-05, + "loss": 0.0085, + "step": 589990 + }, + { + "epoch": 1.53, + "learning_rate": 7.059523408358628e-05, + "loss": 0.0081, + "step": 590000 + }, + { + "epoch": 1.53, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.00574450334534049, + "eval_runtime": 108.0014, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.63, + "step": 590000 + }, + { + "epoch": 1.53, + "learning_rate": 7.059134586721481e-05, + "loss": 0.0084, + "step": 590010 + }, + { + "epoch": 1.53, + "learning_rate": 7.058745765084335e-05, + "loss": 0.01, + "step": 590020 + }, + { + "epoch": 1.53, + "learning_rate": 7.058356943447189e-05, + "loss": 0.0102, + "step": 590030 + }, + { + "epoch": 1.53, + "learning_rate": 7.057968121810042e-05, + "loss": 0.0081, + "step": 590040 + }, + { + "epoch": 1.53, + "learning_rate": 7.057579300172896e-05, + "loss": 0.0124, + "step": 590050 + }, + { + "epoch": 1.53, + "learning_rate": 7.057190478535749e-05, + "loss": 0.0137, + "step": 590060 + }, + { + "epoch": 1.53, + "learning_rate": 7.056801656898603e-05, + "loss": 0.009, + "step": 590070 + }, + { + "epoch": 1.53, + "learning_rate": 7.056412835261456e-05, + "loss": 0.0064, + "step": 590080 + }, + { + "epoch": 1.53, + "learning_rate": 7.05602401362431e-05, + "loss": 0.0078, + "step": 590090 + }, + { + "epoch": 1.53, + "learning_rate": 7.055635191987163e-05, + "loss": 0.0068, + "step": 590100 + }, + { + "epoch": 1.53, + "learning_rate": 7.055246370350017e-05, + "loss": 0.0091, + "step": 590110 + }, + { + "epoch": 1.53, + "learning_rate": 7.054857548712871e-05, + "loss": 0.008, + "step": 590120 + }, + { + "epoch": 1.53, + "learning_rate": 7.054468727075724e-05, + "loss": 0.0081, + "step": 590130 + }, + { + "epoch": 1.53, + "learning_rate": 7.054079905438577e-05, + "loss": 0.0121, + "step": 590140 + }, + { + "epoch": 1.53, + "learning_rate": 7.053691083801431e-05, + "loss": 0.0103, + "step": 590150 + }, + { + "epoch": 1.53, + "learning_rate": 7.053302262164284e-05, + "loss": 0.0079, + "step": 590160 + }, + { + "epoch": 1.53, + "learning_rate": 7.052913440527138e-05, + "loss": 0.0068, + "step": 590170 + }, + { + "epoch": 1.53, + "learning_rate": 7.052524618889991e-05, + "loss": 0.0065, + "step": 590180 + }, + { + "epoch": 1.53, + "learning_rate": 7.052135797252845e-05, + "loss": 0.0063, + "step": 590190 + }, + { + "epoch": 1.53, + "learning_rate": 7.051746975615698e-05, + "loss": 0.0056, + "step": 590200 + }, + { + "epoch": 1.53, + "learning_rate": 7.051358153978552e-05, + "loss": 0.0091, + "step": 590210 + }, + { + "epoch": 1.53, + "learning_rate": 7.050969332341406e-05, + "loss": 0.0107, + "step": 590220 + }, + { + "epoch": 1.53, + "learning_rate": 7.050580510704259e-05, + "loss": 0.008, + "step": 590230 + }, + { + "epoch": 1.53, + "learning_rate": 7.050191689067113e-05, + "loss": 0.0095, + "step": 590240 + }, + { + "epoch": 1.53, + "learning_rate": 7.049802867429966e-05, + "loss": 0.0084, + "step": 590250 + }, + { + "epoch": 1.53, + "learning_rate": 7.04941404579282e-05, + "loss": 0.006, + "step": 590260 + }, + { + "epoch": 1.53, + "learning_rate": 7.049025224155673e-05, + "loss": 0.0099, + "step": 590270 + }, + { + "epoch": 1.53, + "learning_rate": 7.048636402518527e-05, + "loss": 0.008, + "step": 590280 + }, + { + "epoch": 1.53, + "learning_rate": 7.048247580881381e-05, + "loss": 0.0084, + "step": 590290 + }, + { + "epoch": 1.53, + "learning_rate": 7.047858759244234e-05, + "loss": 0.0076, + "step": 590300 + }, + { + "epoch": 1.53, + "learning_rate": 7.047469937607088e-05, + "loss": 0.007, + "step": 590310 + }, + { + "epoch": 1.53, + "learning_rate": 7.047081115969941e-05, + "loss": 0.0108, + "step": 590320 + }, + { + "epoch": 1.53, + "learning_rate": 7.046692294332795e-05, + "loss": 0.008, + "step": 590330 + }, + { + "epoch": 1.53, + "learning_rate": 7.046303472695648e-05, + "loss": 0.0091, + "step": 590340 + }, + { + "epoch": 1.53, + "learning_rate": 7.045914651058502e-05, + "loss": 0.011, + "step": 590350 + }, + { + "epoch": 1.53, + "learning_rate": 7.045525829421355e-05, + "loss": 0.0078, + "step": 590360 + }, + { + "epoch": 1.53, + "learning_rate": 7.045137007784208e-05, + "loss": 0.0079, + "step": 590370 + }, + { + "epoch": 1.53, + "learning_rate": 7.044748186147062e-05, + "loss": 0.0069, + "step": 590380 + }, + { + "epoch": 1.53, + "learning_rate": 7.044359364509916e-05, + "loss": 0.0089, + "step": 590390 + }, + { + "epoch": 1.53, + "learning_rate": 7.043970542872769e-05, + "loss": 0.0075, + "step": 590400 + }, + { + "epoch": 1.53, + "learning_rate": 7.043581721235623e-05, + "loss": 0.0084, + "step": 590410 + }, + { + "epoch": 1.53, + "learning_rate": 7.043192899598476e-05, + "loss": 0.0068, + "step": 590420 + }, + { + "epoch": 1.53, + "learning_rate": 7.04280407796133e-05, + "loss": 0.0082, + "step": 590430 + }, + { + "epoch": 1.53, + "learning_rate": 7.042415256324183e-05, + "loss": 0.0078, + "step": 590440 + }, + { + "epoch": 1.53, + "learning_rate": 7.042026434687037e-05, + "loss": 0.007, + "step": 590450 + }, + { + "epoch": 1.53, + "learning_rate": 7.04163761304989e-05, + "loss": 0.0081, + "step": 590460 + }, + { + "epoch": 1.53, + "learning_rate": 7.041248791412744e-05, + "loss": 0.0079, + "step": 590470 + }, + { + "epoch": 1.53, + "learning_rate": 7.040859969775598e-05, + "loss": 0.0104, + "step": 590480 + }, + { + "epoch": 1.53, + "learning_rate": 7.040471148138451e-05, + "loss": 0.0084, + "step": 590490 + }, + { + "epoch": 1.53, + "learning_rate": 7.040082326501305e-05, + "loss": 0.0087, + "step": 590500 + }, + { + "epoch": 1.53, + "learning_rate": 7.039693504864158e-05, + "loss": 0.01, + "step": 590510 + }, + { + "epoch": 1.53, + "learning_rate": 7.039304683227012e-05, + "loss": 0.0123, + "step": 590520 + }, + { + "epoch": 1.53, + "learning_rate": 7.038915861589865e-05, + "loss": 0.0095, + "step": 590530 + }, + { + "epoch": 1.53, + "learning_rate": 7.038527039952719e-05, + "loss": 0.0092, + "step": 590540 + }, + { + "epoch": 1.53, + "learning_rate": 7.038138218315573e-05, + "loss": 0.01, + "step": 590550 + }, + { + "epoch": 1.53, + "learning_rate": 7.037749396678426e-05, + "loss": 0.0068, + "step": 590560 + }, + { + "epoch": 1.53, + "learning_rate": 7.03736057504128e-05, + "loss": 0.0077, + "step": 590570 + }, + { + "epoch": 1.53, + "learning_rate": 7.036971753404133e-05, + "loss": 0.0074, + "step": 590580 + }, + { + "epoch": 1.53, + "learning_rate": 7.036582931766987e-05, + "loss": 0.0154, + "step": 590590 + }, + { + "epoch": 1.53, + "learning_rate": 7.03619411012984e-05, + "loss": 0.008, + "step": 590600 + }, + { + "epoch": 1.53, + "learning_rate": 7.035805288492694e-05, + "loss": 0.0092, + "step": 590610 + }, + { + "epoch": 1.53, + "learning_rate": 7.035416466855547e-05, + "loss": 0.0089, + "step": 590620 + }, + { + "epoch": 1.53, + "learning_rate": 7.0350276452184e-05, + "loss": 0.0087, + "step": 590630 + }, + { + "epoch": 1.53, + "learning_rate": 7.034638823581254e-05, + "loss": 0.0074, + "step": 590640 + }, + { + "epoch": 1.53, + "learning_rate": 7.034250001944108e-05, + "loss": 0.007, + "step": 590650 + }, + { + "epoch": 1.53, + "learning_rate": 7.033861180306961e-05, + "loss": 0.0087, + "step": 590660 + }, + { + "epoch": 1.53, + "learning_rate": 7.033472358669815e-05, + "loss": 0.0099, + "step": 590670 + }, + { + "epoch": 1.53, + "learning_rate": 7.033083537032668e-05, + "loss": 0.0096, + "step": 590680 + }, + { + "epoch": 1.53, + "learning_rate": 7.032694715395522e-05, + "loss": 0.0073, + "step": 590690 + }, + { + "epoch": 1.53, + "learning_rate": 7.032305893758375e-05, + "loss": 0.0076, + "step": 590700 + }, + { + "epoch": 1.53, + "learning_rate": 7.031917072121229e-05, + "loss": 0.0084, + "step": 590710 + }, + { + "epoch": 1.53, + "learning_rate": 7.031528250484082e-05, + "loss": 0.0101, + "step": 590720 + }, + { + "epoch": 1.53, + "learning_rate": 7.031139428846936e-05, + "loss": 0.0082, + "step": 590730 + }, + { + "epoch": 1.53, + "learning_rate": 7.03075060720979e-05, + "loss": 0.0093, + "step": 590740 + }, + { + "epoch": 1.53, + "learning_rate": 7.030361785572643e-05, + "loss": 0.0078, + "step": 590750 + }, + { + "epoch": 1.53, + "learning_rate": 7.029972963935497e-05, + "loss": 0.0095, + "step": 590760 + }, + { + "epoch": 1.53, + "learning_rate": 7.02958414229835e-05, + "loss": 0.0076, + "step": 590770 + }, + { + "epoch": 1.53, + "learning_rate": 7.029195320661204e-05, + "loss": 0.0093, + "step": 590780 + }, + { + "epoch": 1.53, + "learning_rate": 7.028806499024057e-05, + "loss": 0.0082, + "step": 590790 + }, + { + "epoch": 1.53, + "learning_rate": 7.028417677386911e-05, + "loss": 0.008, + "step": 590800 + }, + { + "epoch": 1.53, + "learning_rate": 7.028028855749764e-05, + "loss": 0.0083, + "step": 590810 + }, + { + "epoch": 1.53, + "learning_rate": 7.027640034112618e-05, + "loss": 0.0088, + "step": 590820 + }, + { + "epoch": 1.53, + "learning_rate": 7.027251212475472e-05, + "loss": 0.0083, + "step": 590830 + }, + { + "epoch": 1.53, + "learning_rate": 7.026862390838325e-05, + "loss": 0.0076, + "step": 590840 + }, + { + "epoch": 1.53, + "learning_rate": 7.026473569201179e-05, + "loss": 0.0143, + "step": 590850 + }, + { + "epoch": 1.53, + "learning_rate": 7.026084747564032e-05, + "loss": 0.0069, + "step": 590860 + }, + { + "epoch": 1.53, + "learning_rate": 7.025695925926885e-05, + "loss": 0.0093, + "step": 590870 + }, + { + "epoch": 1.53, + "learning_rate": 7.025307104289739e-05, + "loss": 0.0114, + "step": 590880 + }, + { + "epoch": 1.53, + "learning_rate": 7.024918282652592e-05, + "loss": 0.0079, + "step": 590890 + }, + { + "epoch": 1.53, + "learning_rate": 7.024529461015446e-05, + "loss": 0.0087, + "step": 590900 + }, + { + "epoch": 1.53, + "learning_rate": 7.024140639378299e-05, + "loss": 0.0063, + "step": 590910 + }, + { + "epoch": 1.53, + "learning_rate": 7.023751817741153e-05, + "loss": 0.01, + "step": 590920 + }, + { + "epoch": 1.53, + "learning_rate": 7.023362996104007e-05, + "loss": 0.0136, + "step": 590930 + }, + { + "epoch": 1.53, + "learning_rate": 7.02297417446686e-05, + "loss": 0.0104, + "step": 590940 + }, + { + "epoch": 1.53, + "learning_rate": 7.022585352829714e-05, + "loss": 0.0082, + "step": 590950 + }, + { + "epoch": 1.53, + "learning_rate": 7.022196531192567e-05, + "loss": 0.0086, + "step": 590960 + }, + { + "epoch": 1.53, + "learning_rate": 7.021807709555421e-05, + "loss": 0.0063, + "step": 590970 + }, + { + "epoch": 1.53, + "learning_rate": 7.021418887918274e-05, + "loss": 0.0106, + "step": 590980 + }, + { + "epoch": 1.53, + "learning_rate": 7.021030066281128e-05, + "loss": 0.0096, + "step": 590990 + }, + { + "epoch": 1.53, + "learning_rate": 7.020641244643982e-05, + "loss": 0.01, + "step": 591000 + }, + { + "epoch": 1.53, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.005933051463216543, + "eval_runtime": 107.84, + "eval_samples_per_second": 18.546, + "eval_steps_per_second": 4.636, + "step": 591000 + }, + { + "epoch": 1.53, + "learning_rate": 7.020252423006835e-05, + "loss": 0.0103, + "step": 591010 + }, + { + "epoch": 1.53, + "learning_rate": 7.019863601369689e-05, + "loss": 0.0126, + "step": 591020 + }, + { + "epoch": 1.53, + "learning_rate": 7.019474779732542e-05, + "loss": 0.0116, + "step": 591030 + }, + { + "epoch": 1.53, + "learning_rate": 7.019085958095396e-05, + "loss": 0.0085, + "step": 591040 + }, + { + "epoch": 1.53, + "learning_rate": 7.018697136458249e-05, + "loss": 0.0079, + "step": 591050 + }, + { + "epoch": 1.53, + "learning_rate": 7.018308314821103e-05, + "loss": 0.0072, + "step": 591060 + }, + { + "epoch": 1.53, + "learning_rate": 7.017919493183956e-05, + "loss": 0.0087, + "step": 591070 + }, + { + "epoch": 1.53, + "learning_rate": 7.01753067154681e-05, + "loss": 0.0087, + "step": 591080 + }, + { + "epoch": 1.53, + "learning_rate": 7.017141849909664e-05, + "loss": 0.01, + "step": 591090 + }, + { + "epoch": 1.53, + "learning_rate": 7.016753028272517e-05, + "loss": 0.006, + "step": 591100 + }, + { + "epoch": 1.53, + "learning_rate": 7.016364206635371e-05, + "loss": 0.0097, + "step": 591110 + }, + { + "epoch": 1.53, + "learning_rate": 7.015975384998224e-05, + "loss": 0.0086, + "step": 591120 + }, + { + "epoch": 1.53, + "learning_rate": 7.015586563361077e-05, + "loss": 0.0075, + "step": 591130 + }, + { + "epoch": 1.53, + "learning_rate": 7.015197741723931e-05, + "loss": 0.0086, + "step": 591140 + }, + { + "epoch": 1.53, + "learning_rate": 7.014808920086784e-05, + "loss": 0.0095, + "step": 591150 + }, + { + "epoch": 1.53, + "learning_rate": 7.014420098449638e-05, + "loss": 0.0101, + "step": 591160 + }, + { + "epoch": 1.53, + "learning_rate": 7.01403127681249e-05, + "loss": 0.0116, + "step": 591170 + }, + { + "epoch": 1.53, + "learning_rate": 7.013642455175345e-05, + "loss": 0.0065, + "step": 591180 + }, + { + "epoch": 1.53, + "learning_rate": 7.013253633538199e-05, + "loss": 0.0086, + "step": 591190 + }, + { + "epoch": 1.53, + "learning_rate": 7.012864811901052e-05, + "loss": 0.0135, + "step": 591200 + }, + { + "epoch": 1.53, + "learning_rate": 7.012475990263906e-05, + "loss": 0.0086, + "step": 591210 + }, + { + "epoch": 1.53, + "learning_rate": 7.012087168626759e-05, + "loss": 0.0079, + "step": 591220 + }, + { + "epoch": 1.53, + "learning_rate": 7.011698346989613e-05, + "loss": 0.0099, + "step": 591230 + }, + { + "epoch": 1.53, + "learning_rate": 7.011309525352466e-05, + "loss": 0.0096, + "step": 591240 + }, + { + "epoch": 1.53, + "learning_rate": 7.01092070371532e-05, + "loss": 0.011, + "step": 591250 + }, + { + "epoch": 1.53, + "learning_rate": 7.010531882078174e-05, + "loss": 0.0095, + "step": 591260 + }, + { + "epoch": 1.53, + "learning_rate": 7.010143060441027e-05, + "loss": 0.0082, + "step": 591270 + }, + { + "epoch": 1.53, + "learning_rate": 7.009754238803881e-05, + "loss": 0.0078, + "step": 591280 + }, + { + "epoch": 1.53, + "learning_rate": 7.009365417166734e-05, + "loss": 0.0068, + "step": 591290 + }, + { + "epoch": 1.53, + "learning_rate": 7.008976595529588e-05, + "loss": 0.0073, + "step": 591300 + }, + { + "epoch": 1.53, + "learning_rate": 7.008587773892441e-05, + "loss": 0.0083, + "step": 591310 + }, + { + "epoch": 1.53, + "learning_rate": 7.008198952255295e-05, + "loss": 0.0121, + "step": 591320 + }, + { + "epoch": 1.53, + "learning_rate": 7.007810130618148e-05, + "loss": 0.0091, + "step": 591330 + }, + { + "epoch": 1.53, + "learning_rate": 7.007421308981002e-05, + "loss": 0.008, + "step": 591340 + }, + { + "epoch": 1.53, + "learning_rate": 7.007032487343856e-05, + "loss": 0.008, + "step": 591350 + }, + { + "epoch": 1.53, + "learning_rate": 7.006643665706709e-05, + "loss": 0.0081, + "step": 591360 + }, + { + "epoch": 1.53, + "learning_rate": 7.006254844069562e-05, + "loss": 0.0063, + "step": 591370 + }, + { + "epoch": 1.53, + "learning_rate": 7.005866022432416e-05, + "loss": 0.0093, + "step": 591380 + }, + { + "epoch": 1.53, + "learning_rate": 7.005477200795269e-05, + "loss": 0.0091, + "step": 591390 + }, + { + "epoch": 1.53, + "learning_rate": 7.005088379158123e-05, + "loss": 0.0063, + "step": 591400 + }, + { + "epoch": 1.53, + "learning_rate": 7.004699557520976e-05, + "loss": 0.0089, + "step": 591410 + }, + { + "epoch": 1.53, + "learning_rate": 7.00431073588383e-05, + "loss": 0.0077, + "step": 591420 + }, + { + "epoch": 1.53, + "learning_rate": 7.003921914246683e-05, + "loss": 0.0092, + "step": 591430 + }, + { + "epoch": 1.53, + "learning_rate": 7.003533092609537e-05, + "loss": 0.009, + "step": 591440 + }, + { + "epoch": 1.53, + "learning_rate": 7.003144270972391e-05, + "loss": 0.0084, + "step": 591450 + }, + { + "epoch": 1.53, + "learning_rate": 7.002755449335244e-05, + "loss": 0.0064, + "step": 591460 + }, + { + "epoch": 1.53, + "learning_rate": 7.002366627698098e-05, + "loss": 0.011, + "step": 591470 + }, + { + "epoch": 1.53, + "learning_rate": 7.00197780606095e-05, + "loss": 0.01, + "step": 591480 + }, + { + "epoch": 1.53, + "learning_rate": 7.001588984423805e-05, + "loss": 0.0081, + "step": 591490 + }, + { + "epoch": 1.53, + "learning_rate": 7.001200162786658e-05, + "loss": 0.0131, + "step": 591500 + }, + { + "epoch": 1.53, + "learning_rate": 7.000811341149512e-05, + "loss": 0.0087, + "step": 591510 + }, + { + "epoch": 1.53, + "learning_rate": 7.000422519512366e-05, + "loss": 0.0075, + "step": 591520 + }, + { + "epoch": 1.53, + "learning_rate": 7.000033697875219e-05, + "loss": 0.0076, + "step": 591530 + }, + { + "epoch": 1.53, + "learning_rate": 6.999644876238073e-05, + "loss": 0.0092, + "step": 591540 + }, + { + "epoch": 1.53, + "learning_rate": 6.999256054600926e-05, + "loss": 0.0091, + "step": 591550 + }, + { + "epoch": 1.53, + "learning_rate": 6.99886723296378e-05, + "loss": 0.0088, + "step": 591560 + }, + { + "epoch": 1.53, + "learning_rate": 6.998478411326633e-05, + "loss": 0.0106, + "step": 591570 + }, + { + "epoch": 1.53, + "learning_rate": 6.998089589689487e-05, + "loss": 0.0076, + "step": 591580 + }, + { + "epoch": 1.53, + "learning_rate": 6.99770076805234e-05, + "loss": 0.0085, + "step": 591590 + }, + { + "epoch": 1.53, + "learning_rate": 6.997311946415194e-05, + "loss": 0.0096, + "step": 591600 + }, + { + "epoch": 1.53, + "learning_rate": 6.996923124778048e-05, + "loss": 0.0083, + "step": 591610 + }, + { + "epoch": 1.53, + "learning_rate": 6.996534303140901e-05, + "loss": 0.0087, + "step": 591620 + }, + { + "epoch": 1.53, + "learning_rate": 6.996145481503754e-05, + "loss": 0.0091, + "step": 591630 + }, + { + "epoch": 1.53, + "learning_rate": 6.995756659866608e-05, + "loss": 0.0078, + "step": 591640 + }, + { + "epoch": 1.53, + "learning_rate": 6.99536783822946e-05, + "loss": 0.0072, + "step": 591650 + }, + { + "epoch": 1.53, + "learning_rate": 6.994979016592315e-05, + "loss": 0.0107, + "step": 591660 + }, + { + "epoch": 1.53, + "learning_rate": 6.994590194955168e-05, + "loss": 0.0097, + "step": 591670 + }, + { + "epoch": 1.53, + "learning_rate": 6.994201373318022e-05, + "loss": 0.0069, + "step": 591680 + }, + { + "epoch": 1.53, + "learning_rate": 6.993812551680875e-05, + "loss": 0.0095, + "step": 591690 + }, + { + "epoch": 1.53, + "learning_rate": 6.993423730043729e-05, + "loss": 0.0084, + "step": 591700 + }, + { + "epoch": 1.53, + "learning_rate": 6.993034908406583e-05, + "loss": 0.0085, + "step": 591710 + }, + { + "epoch": 1.53, + "learning_rate": 6.992646086769436e-05, + "loss": 0.0102, + "step": 591720 + }, + { + "epoch": 1.53, + "learning_rate": 6.99225726513229e-05, + "loss": 0.0085, + "step": 591730 + }, + { + "epoch": 1.53, + "learning_rate": 6.991868443495143e-05, + "loss": 0.0144, + "step": 591740 + }, + { + "epoch": 1.53, + "learning_rate": 6.991479621857997e-05, + "loss": 0.0082, + "step": 591750 + }, + { + "epoch": 1.53, + "learning_rate": 6.99109080022085e-05, + "loss": 0.0079, + "step": 591760 + }, + { + "epoch": 1.53, + "learning_rate": 6.990701978583704e-05, + "loss": 0.0098, + "step": 591770 + }, + { + "epoch": 1.53, + "learning_rate": 6.990313156946558e-05, + "loss": 0.0086, + "step": 591780 + }, + { + "epoch": 1.53, + "learning_rate": 6.989924335309411e-05, + "loss": 0.007, + "step": 591790 + }, + { + "epoch": 1.53, + "learning_rate": 6.989535513672265e-05, + "loss": 0.0078, + "step": 591800 + }, + { + "epoch": 1.53, + "learning_rate": 6.989146692035118e-05, + "loss": 0.0091, + "step": 591810 + }, + { + "epoch": 1.53, + "learning_rate": 6.988757870397972e-05, + "loss": 0.0099, + "step": 591820 + }, + { + "epoch": 1.53, + "learning_rate": 6.988369048760825e-05, + "loss": 0.009, + "step": 591830 + }, + { + "epoch": 1.53, + "learning_rate": 6.987980227123679e-05, + "loss": 0.0097, + "step": 591840 + }, + { + "epoch": 1.53, + "learning_rate": 6.987591405486532e-05, + "loss": 0.0064, + "step": 591850 + }, + { + "epoch": 1.53, + "learning_rate": 6.987202583849385e-05, + "loss": 0.0081, + "step": 591860 + }, + { + "epoch": 1.53, + "learning_rate": 6.986813762212239e-05, + "loss": 0.0092, + "step": 591870 + }, + { + "epoch": 1.53, + "learning_rate": 6.986424940575093e-05, + "loss": 0.0082, + "step": 591880 + }, + { + "epoch": 1.53, + "learning_rate": 6.986036118937946e-05, + "loss": 0.0058, + "step": 591890 + }, + { + "epoch": 1.53, + "learning_rate": 6.9856472973008e-05, + "loss": 0.0081, + "step": 591900 + }, + { + "epoch": 1.53, + "learning_rate": 6.985258475663653e-05, + "loss": 0.0086, + "step": 591910 + }, + { + "epoch": 1.53, + "learning_rate": 6.984869654026507e-05, + "loss": 0.0119, + "step": 591920 + }, + { + "epoch": 1.53, + "learning_rate": 6.98448083238936e-05, + "loss": 0.0073, + "step": 591930 + }, + { + "epoch": 1.53, + "learning_rate": 6.984092010752214e-05, + "loss": 0.0086, + "step": 591940 + }, + { + "epoch": 1.53, + "learning_rate": 6.983703189115067e-05, + "loss": 0.0077, + "step": 591950 + }, + { + "epoch": 1.53, + "learning_rate": 6.983314367477921e-05, + "loss": 0.0094, + "step": 591960 + }, + { + "epoch": 1.53, + "learning_rate": 6.982925545840775e-05, + "loss": 0.0079, + "step": 591970 + }, + { + "epoch": 1.53, + "learning_rate": 6.982536724203628e-05, + "loss": 0.0083, + "step": 591980 + }, + { + "epoch": 1.53, + "learning_rate": 6.982147902566482e-05, + "loss": 0.0066, + "step": 591990 + }, + { + "epoch": 1.53, + "learning_rate": 6.981759080929335e-05, + "loss": 0.0081, + "step": 592000 + }, + { + "epoch": 1.53, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.005928897298872471, + "eval_runtime": 107.9324, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, + "step": 592000 + }, + { + "epoch": 1.53, + "learning_rate": 6.981370259292189e-05, + "loss": 0.0095, + "step": 592010 + }, + { + "epoch": 1.53, + "learning_rate": 6.980981437655042e-05, + "loss": 0.0064, + "step": 592020 + }, + { + "epoch": 1.53, + "learning_rate": 6.980592616017896e-05, + "loss": 0.0112, + "step": 592030 + }, + { + "epoch": 1.53, + "learning_rate": 6.980203794380749e-05, + "loss": 0.0104, + "step": 592040 + }, + { + "epoch": 1.53, + "learning_rate": 6.979814972743603e-05, + "loss": 0.0116, + "step": 592050 + }, + { + "epoch": 1.53, + "learning_rate": 6.979426151106457e-05, + "loss": 0.0121, + "step": 592060 + }, + { + "epoch": 1.53, + "learning_rate": 6.97903732946931e-05, + "loss": 0.0094, + "step": 592070 + }, + { + "epoch": 1.53, + "learning_rate": 6.978648507832164e-05, + "loss": 0.0101, + "step": 592080 + }, + { + "epoch": 1.53, + "learning_rate": 6.978259686195017e-05, + "loss": 0.01, + "step": 592090 + }, + { + "epoch": 1.53, + "learning_rate": 6.977870864557871e-05, + "loss": 0.0109, + "step": 592100 + }, + { + "epoch": 1.53, + "learning_rate": 6.977482042920724e-05, + "loss": 0.0072, + "step": 592110 + }, + { + "epoch": 1.53, + "learning_rate": 6.977093221283576e-05, + "loss": 0.0096, + "step": 592120 + }, + { + "epoch": 1.53, + "learning_rate": 6.97670439964643e-05, + "loss": 0.0061, + "step": 592130 + }, + { + "epoch": 1.53, + "learning_rate": 6.976315578009283e-05, + "loss": 0.0069, + "step": 592140 + }, + { + "epoch": 1.53, + "learning_rate": 6.975926756372138e-05, + "loss": 0.0105, + "step": 592150 + }, + { + "epoch": 1.53, + "learning_rate": 6.975537934734992e-05, + "loss": 0.0084, + "step": 592160 + }, + { + "epoch": 1.53, + "learning_rate": 6.975149113097845e-05, + "loss": 0.0093, + "step": 592170 + }, + { + "epoch": 1.54, + "learning_rate": 6.974760291460699e-05, + "loss": 0.012, + "step": 592180 + }, + { + "epoch": 1.54, + "learning_rate": 6.974371469823552e-05, + "loss": 0.0095, + "step": 592190 + }, + { + "epoch": 1.54, + "learning_rate": 6.973982648186406e-05, + "loss": 0.0072, + "step": 592200 + }, + { + "epoch": 1.54, + "learning_rate": 6.973593826549259e-05, + "loss": 0.0086, + "step": 592210 + }, + { + "epoch": 1.54, + "learning_rate": 6.973205004912113e-05, + "loss": 0.0076, + "step": 592220 + }, + { + "epoch": 1.54, + "learning_rate": 6.972816183274967e-05, + "loss": 0.0077, + "step": 592230 + }, + { + "epoch": 1.54, + "learning_rate": 6.97242736163782e-05, + "loss": 0.0083, + "step": 592240 + }, + { + "epoch": 1.54, + "learning_rate": 6.972038540000674e-05, + "loss": 0.0066, + "step": 592250 + }, + { + "epoch": 1.54, + "learning_rate": 6.971649718363527e-05, + "loss": 0.0124, + "step": 592260 + }, + { + "epoch": 1.54, + "learning_rate": 6.971260896726381e-05, + "loss": 0.0065, + "step": 592270 + }, + { + "epoch": 1.54, + "learning_rate": 6.970872075089234e-05, + "loss": 0.0107, + "step": 592280 + }, + { + "epoch": 1.54, + "learning_rate": 6.970483253452088e-05, + "loss": 0.0088, + "step": 592290 + }, + { + "epoch": 1.54, + "learning_rate": 6.97009443181494e-05, + "loss": 0.0082, + "step": 592300 + }, + { + "epoch": 1.54, + "learning_rate": 6.969705610177795e-05, + "loss": 0.0063, + "step": 592310 + }, + { + "epoch": 1.54, + "learning_rate": 6.969316788540649e-05, + "loss": 0.0105, + "step": 592320 + }, + { + "epoch": 1.54, + "learning_rate": 6.968927966903502e-05, + "loss": 0.0101, + "step": 592330 + }, + { + "epoch": 1.54, + "learning_rate": 6.968539145266356e-05, + "loss": 0.0093, + "step": 592340 + }, + { + "epoch": 1.54, + "learning_rate": 6.968150323629209e-05, + "loss": 0.0088, + "step": 592350 + }, + { + "epoch": 1.54, + "learning_rate": 6.967761501992062e-05, + "loss": 0.0084, + "step": 592360 + }, + { + "epoch": 1.54, + "learning_rate": 6.967372680354916e-05, + "loss": 0.0081, + "step": 592370 + }, + { + "epoch": 1.54, + "learning_rate": 6.966983858717768e-05, + "loss": 0.0081, + "step": 592380 + }, + { + "epoch": 1.54, + "learning_rate": 6.966595037080623e-05, + "loss": 0.0095, + "step": 592390 + }, + { + "epoch": 1.54, + "learning_rate": 6.966206215443475e-05, + "loss": 0.009, + "step": 592400 + }, + { + "epoch": 1.54, + "learning_rate": 6.96581739380633e-05, + "loss": 0.0082, + "step": 592410 + }, + { + "epoch": 1.54, + "learning_rate": 6.965428572169184e-05, + "loss": 0.0089, + "step": 592420 + }, + { + "epoch": 1.54, + "learning_rate": 6.965039750532037e-05, + "loss": 0.0102, + "step": 592430 + }, + { + "epoch": 1.54, + "learning_rate": 6.964650928894891e-05, + "loss": 0.0099, + "step": 592440 + }, + { + "epoch": 1.54, + "learning_rate": 6.964262107257744e-05, + "loss": 0.0073, + "step": 592450 + }, + { + "epoch": 1.54, + "learning_rate": 6.963873285620598e-05, + "loss": 0.0073, + "step": 592460 + }, + { + "epoch": 1.54, + "learning_rate": 6.96348446398345e-05, + "loss": 0.0102, + "step": 592470 + }, + { + "epoch": 1.54, + "learning_rate": 6.963095642346305e-05, + "loss": 0.0074, + "step": 592480 + }, + { + "epoch": 1.54, + "learning_rate": 6.962706820709159e-05, + "loss": 0.0111, + "step": 592490 + }, + { + "epoch": 1.54, + "learning_rate": 6.962317999072012e-05, + "loss": 0.0092, + "step": 592500 + }, + { + "epoch": 1.54, + "learning_rate": 6.961929177434866e-05, + "loss": 0.0087, + "step": 592510 + }, + { + "epoch": 1.54, + "learning_rate": 6.961540355797719e-05, + "loss": 0.0086, + "step": 592520 + }, + { + "epoch": 1.54, + "learning_rate": 6.961151534160573e-05, + "loss": 0.0115, + "step": 592530 + }, + { + "epoch": 1.54, + "learning_rate": 6.960762712523426e-05, + "loss": 0.0103, + "step": 592540 + }, + { + "epoch": 1.54, + "learning_rate": 6.96037389088628e-05, + "loss": 0.0085, + "step": 592550 + }, + { + "epoch": 1.54, + "learning_rate": 6.959985069249133e-05, + "loss": 0.0094, + "step": 592560 + }, + { + "epoch": 1.54, + "learning_rate": 6.959596247611987e-05, + "loss": 0.0092, + "step": 592570 + }, + { + "epoch": 1.54, + "learning_rate": 6.959207425974841e-05, + "loss": 0.0086, + "step": 592580 + }, + { + "epoch": 1.54, + "learning_rate": 6.958818604337694e-05, + "loss": 0.0081, + "step": 592590 + }, + { + "epoch": 1.54, + "learning_rate": 6.958429782700548e-05, + "loss": 0.0073, + "step": 592600 + }, + { + "epoch": 1.54, + "learning_rate": 6.958040961063401e-05, + "loss": 0.0089, + "step": 592610 + }, + { + "epoch": 1.54, + "learning_rate": 6.957652139426254e-05, + "loss": 0.0095, + "step": 592620 + }, + { + "epoch": 1.54, + "learning_rate": 6.957263317789108e-05, + "loss": 0.0122, + "step": 592630 + }, + { + "epoch": 1.54, + "learning_rate": 6.95687449615196e-05, + "loss": 0.0066, + "step": 592640 + }, + { + "epoch": 1.54, + "learning_rate": 6.956485674514815e-05, + "loss": 0.0066, + "step": 592650 + }, + { + "epoch": 1.54, + "learning_rate": 6.956096852877667e-05, + "loss": 0.008, + "step": 592660 + }, + { + "epoch": 1.54, + "learning_rate": 6.955708031240522e-05, + "loss": 0.0091, + "step": 592670 + }, + { + "epoch": 1.54, + "learning_rate": 6.955319209603376e-05, + "loss": 0.0131, + "step": 592680 + }, + { + "epoch": 1.54, + "learning_rate": 6.954930387966229e-05, + "loss": 0.0122, + "step": 592690 + }, + { + "epoch": 1.54, + "learning_rate": 6.954541566329083e-05, + "loss": 0.0087, + "step": 592700 + }, + { + "epoch": 1.54, + "learning_rate": 6.954152744691936e-05, + "loss": 0.0077, + "step": 592710 + }, + { + "epoch": 1.54, + "learning_rate": 6.95376392305479e-05, + "loss": 0.0089, + "step": 592720 + }, + { + "epoch": 1.54, + "learning_rate": 6.953375101417643e-05, + "loss": 0.0119, + "step": 592730 + }, + { + "epoch": 1.54, + "learning_rate": 6.952986279780497e-05, + "loss": 0.0085, + "step": 592740 + }, + { + "epoch": 1.54, + "learning_rate": 6.952597458143351e-05, + "loss": 0.0106, + "step": 592750 + }, + { + "epoch": 1.54, + "learning_rate": 6.952208636506204e-05, + "loss": 0.0112, + "step": 592760 + }, + { + "epoch": 1.54, + "learning_rate": 6.951819814869058e-05, + "loss": 0.0101, + "step": 592770 + }, + { + "epoch": 1.54, + "learning_rate": 6.95143099323191e-05, + "loss": 0.0065, + "step": 592780 + }, + { + "epoch": 1.54, + "learning_rate": 6.951042171594765e-05, + "loss": 0.0111, + "step": 592790 + }, + { + "epoch": 1.54, + "learning_rate": 6.950653349957618e-05, + "loss": 0.0096, + "step": 592800 + }, + { + "epoch": 1.54, + "learning_rate": 6.950264528320472e-05, + "loss": 0.0102, + "step": 592810 + }, + { + "epoch": 1.54, + "learning_rate": 6.949875706683325e-05, + "loss": 0.0092, + "step": 592820 + }, + { + "epoch": 1.54, + "learning_rate": 6.949486885046179e-05, + "loss": 0.0087, + "step": 592830 + }, + { + "epoch": 1.54, + "learning_rate": 6.949098063409033e-05, + "loss": 0.0071, + "step": 592840 + }, + { + "epoch": 1.54, + "learning_rate": 6.948709241771886e-05, + "loss": 0.0097, + "step": 592850 + }, + { + "epoch": 1.54, + "learning_rate": 6.948320420134739e-05, + "loss": 0.0092, + "step": 592860 + }, + { + "epoch": 1.54, + "learning_rate": 6.947931598497593e-05, + "loss": 0.0072, + "step": 592870 + }, + { + "epoch": 1.54, + "learning_rate": 6.947542776860446e-05, + "loss": 0.01, + "step": 592880 + }, + { + "epoch": 1.54, + "learning_rate": 6.9471539552233e-05, + "loss": 0.0086, + "step": 592890 + }, + { + "epoch": 1.54, + "learning_rate": 6.946765133586152e-05, + "loss": 0.0111, + "step": 592900 + }, + { + "epoch": 1.54, + "learning_rate": 6.946376311949007e-05, + "loss": 0.0086, + "step": 592910 + }, + { + "epoch": 1.54, + "learning_rate": 6.94598749031186e-05, + "loss": 0.0079, + "step": 592920 + }, + { + "epoch": 1.54, + "learning_rate": 6.945598668674714e-05, + "loss": 0.0092, + "step": 592930 + }, + { + "epoch": 1.54, + "learning_rate": 6.945209847037568e-05, + "loss": 0.0083, + "step": 592940 + }, + { + "epoch": 1.54, + "learning_rate": 6.94482102540042e-05, + "loss": 0.007, + "step": 592950 + }, + { + "epoch": 1.54, + "learning_rate": 6.944432203763275e-05, + "loss": 0.0095, + "step": 592960 + }, + { + "epoch": 1.54, + "learning_rate": 6.944043382126128e-05, + "loss": 0.0082, + "step": 592970 + }, + { + "epoch": 1.54, + "learning_rate": 6.943654560488982e-05, + "loss": 0.0108, + "step": 592980 + }, + { + "epoch": 1.54, + "learning_rate": 6.943265738851835e-05, + "loss": 0.0056, + "step": 592990 + }, + { + "epoch": 1.54, + "learning_rate": 6.942876917214689e-05, + "loss": 0.0097, + "step": 593000 + }, + { + "epoch": 1.54, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.005945616401731968, + "eval_runtime": 107.8905, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 593000 + }, + { + "epoch": 1.54, + "learning_rate": 6.942488095577543e-05, + "loss": 0.0064, + "step": 593010 + }, + { + "epoch": 1.54, + "learning_rate": 6.942099273940396e-05, + "loss": 0.0081, + "step": 593020 + }, + { + "epoch": 1.54, + "learning_rate": 6.94171045230325e-05, + "loss": 0.0092, + "step": 593030 + }, + { + "epoch": 1.54, + "learning_rate": 6.941321630666103e-05, + "loss": 0.0071, + "step": 593040 + }, + { + "epoch": 1.54, + "learning_rate": 6.940932809028957e-05, + "loss": 0.0106, + "step": 593050 + }, + { + "epoch": 1.54, + "learning_rate": 6.94054398739181e-05, + "loss": 0.0057, + "step": 593060 + }, + { + "epoch": 1.54, + "learning_rate": 6.940155165754664e-05, + "loss": 0.0082, + "step": 593070 + }, + { + "epoch": 1.54, + "learning_rate": 6.939766344117517e-05, + "loss": 0.0079, + "step": 593080 + }, + { + "epoch": 1.54, + "learning_rate": 6.939377522480371e-05, + "loss": 0.0103, + "step": 593090 + }, + { + "epoch": 1.54, + "learning_rate": 6.938988700843224e-05, + "loss": 0.0127, + "step": 593100 + }, + { + "epoch": 1.54, + "learning_rate": 6.938599879206078e-05, + "loss": 0.0101, + "step": 593110 + }, + { + "epoch": 1.54, + "learning_rate": 6.93821105756893e-05, + "loss": 0.0083, + "step": 593120 + }, + { + "epoch": 1.54, + "learning_rate": 6.937822235931785e-05, + "loss": 0.01, + "step": 593130 + }, + { + "epoch": 1.54, + "learning_rate": 6.937433414294638e-05, + "loss": 0.0094, + "step": 593140 + }, + { + "epoch": 1.54, + "learning_rate": 6.937044592657492e-05, + "loss": 0.0083, + "step": 593150 + }, + { + "epoch": 1.54, + "learning_rate": 6.936655771020344e-05, + "loss": 0.0083, + "step": 593160 + }, + { + "epoch": 1.54, + "learning_rate": 6.936266949383199e-05, + "loss": 0.0082, + "step": 593170 + }, + { + "epoch": 1.54, + "learning_rate": 6.935878127746051e-05, + "loss": 0.0111, + "step": 593180 + }, + { + "epoch": 1.54, + "learning_rate": 6.935489306108906e-05, + "loss": 0.0075, + "step": 593190 + }, + { + "epoch": 1.54, + "learning_rate": 6.93510048447176e-05, + "loss": 0.0087, + "step": 593200 + }, + { + "epoch": 1.54, + "learning_rate": 6.934711662834613e-05, + "loss": 0.0093, + "step": 593210 + }, + { + "epoch": 1.54, + "learning_rate": 6.934322841197467e-05, + "loss": 0.0092, + "step": 593220 + }, + { + "epoch": 1.54, + "learning_rate": 6.93393401956032e-05, + "loss": 0.0109, + "step": 593230 + }, + { + "epoch": 1.54, + "learning_rate": 6.933545197923174e-05, + "loss": 0.0087, + "step": 593240 + }, + { + "epoch": 1.54, + "learning_rate": 6.933156376286027e-05, + "loss": 0.0133, + "step": 593250 + }, + { + "epoch": 1.54, + "learning_rate": 6.932767554648881e-05, + "loss": 0.0086, + "step": 593260 + }, + { + "epoch": 1.54, + "learning_rate": 6.932378733011735e-05, + "loss": 0.0096, + "step": 593270 + }, + { + "epoch": 1.54, + "learning_rate": 6.931989911374588e-05, + "loss": 0.0121, + "step": 593280 + }, + { + "epoch": 1.54, + "learning_rate": 6.931601089737442e-05, + "loss": 0.0064, + "step": 593290 + }, + { + "epoch": 1.54, + "learning_rate": 6.931212268100295e-05, + "loss": 0.0093, + "step": 593300 + }, + { + "epoch": 1.54, + "learning_rate": 6.930823446463149e-05, + "loss": 0.0101, + "step": 593310 + }, + { + "epoch": 1.54, + "learning_rate": 6.930434624826002e-05, + "loss": 0.0074, + "step": 593320 + }, + { + "epoch": 1.54, + "learning_rate": 6.930045803188856e-05, + "loss": 0.0088, + "step": 593330 + }, + { + "epoch": 1.54, + "learning_rate": 6.929656981551709e-05, + "loss": 0.0114, + "step": 593340 + }, + { + "epoch": 1.54, + "learning_rate": 6.929268159914561e-05, + "loss": 0.0087, + "step": 593350 + }, + { + "epoch": 1.54, + "learning_rate": 6.928879338277416e-05, + "loss": 0.0106, + "step": 593360 + }, + { + "epoch": 1.54, + "learning_rate": 6.92849051664027e-05, + "loss": 0.0085, + "step": 593370 + }, + { + "epoch": 1.54, + "learning_rate": 6.928101695003123e-05, + "loss": 0.008, + "step": 593380 + }, + { + "epoch": 1.54, + "learning_rate": 6.927712873365977e-05, + "loss": 0.0099, + "step": 593390 + }, + { + "epoch": 1.54, + "learning_rate": 6.92732405172883e-05, + "loss": 0.0051, + "step": 593400 + }, + { + "epoch": 1.54, + "learning_rate": 6.926935230091684e-05, + "loss": 0.0081, + "step": 593410 + }, + { + "epoch": 1.54, + "learning_rate": 6.926546408454536e-05, + "loss": 0.0094, + "step": 593420 + }, + { + "epoch": 1.54, + "learning_rate": 6.92615758681739e-05, + "loss": 0.0084, + "step": 593430 + }, + { + "epoch": 1.54, + "learning_rate": 6.925768765180243e-05, + "loss": 0.0081, + "step": 593440 + }, + { + "epoch": 1.54, + "learning_rate": 6.925379943543098e-05, + "loss": 0.0124, + "step": 593450 + }, + { + "epoch": 1.54, + "learning_rate": 6.924991121905952e-05, + "loss": 0.0123, + "step": 593460 + }, + { + "epoch": 1.54, + "learning_rate": 6.924602300268805e-05, + "loss": 0.0086, + "step": 593470 + }, + { + "epoch": 1.54, + "learning_rate": 6.924213478631659e-05, + "loss": 0.0087, + "step": 593480 + }, + { + "epoch": 1.54, + "learning_rate": 6.923824656994512e-05, + "loss": 0.0085, + "step": 593490 + }, + { + "epoch": 1.54, + "learning_rate": 6.923435835357366e-05, + "loss": 0.0096, + "step": 593500 + }, + { + "epoch": 1.54, + "learning_rate": 6.923047013720219e-05, + "loss": 0.0092, + "step": 593510 + }, + { + "epoch": 1.54, + "learning_rate": 6.922658192083073e-05, + "loss": 0.0075, + "step": 593520 + }, + { + "epoch": 1.54, + "learning_rate": 6.922269370445925e-05, + "loss": 0.0164, + "step": 593530 + }, + { + "epoch": 1.54, + "learning_rate": 6.92188054880878e-05, + "loss": 0.0095, + "step": 593540 + }, + { + "epoch": 1.54, + "learning_rate": 6.921491727171634e-05, + "loss": 0.0092, + "step": 593550 + }, + { + "epoch": 1.54, + "learning_rate": 6.921102905534487e-05, + "loss": 0.0093, + "step": 593560 + }, + { + "epoch": 1.54, + "learning_rate": 6.920714083897341e-05, + "loss": 0.0098, + "step": 593570 + }, + { + "epoch": 1.54, + "learning_rate": 6.920325262260194e-05, + "loss": 0.0083, + "step": 593580 + }, + { + "epoch": 1.54, + "learning_rate": 6.919936440623048e-05, + "loss": 0.0093, + "step": 593590 + }, + { + "epoch": 1.54, + "learning_rate": 6.9195476189859e-05, + "loss": 0.0077, + "step": 593600 + }, + { + "epoch": 1.54, + "learning_rate": 6.919158797348753e-05, + "loss": 0.0072, + "step": 593610 + }, + { + "epoch": 1.54, + "learning_rate": 6.918769975711608e-05, + "loss": 0.0059, + "step": 593620 + }, + { + "epoch": 1.54, + "learning_rate": 6.91838115407446e-05, + "loss": 0.0083, + "step": 593630 + }, + { + "epoch": 1.54, + "learning_rate": 6.917992332437315e-05, + "loss": 0.0089, + "step": 593640 + }, + { + "epoch": 1.54, + "learning_rate": 6.917603510800169e-05, + "loss": 0.0134, + "step": 593650 + }, + { + "epoch": 1.54, + "learning_rate": 6.917214689163021e-05, + "loss": 0.0103, + "step": 593660 + }, + { + "epoch": 1.54, + "learning_rate": 6.916825867525876e-05, + "loss": 0.0091, + "step": 593670 + }, + { + "epoch": 1.54, + "learning_rate": 6.916437045888728e-05, + "loss": 0.009, + "step": 593680 + }, + { + "epoch": 1.54, + "learning_rate": 6.916048224251583e-05, + "loss": 0.0152, + "step": 593690 + }, + { + "epoch": 1.54, + "learning_rate": 6.915659402614435e-05, + "loss": 0.0065, + "step": 593700 + }, + { + "epoch": 1.54, + "learning_rate": 6.91527058097729e-05, + "loss": 0.0097, + "step": 593710 + }, + { + "epoch": 1.54, + "learning_rate": 6.914881759340144e-05, + "loss": 0.0055, + "step": 593720 + }, + { + "epoch": 1.54, + "learning_rate": 6.914492937702997e-05, + "loss": 0.0092, + "step": 593730 + }, + { + "epoch": 1.54, + "learning_rate": 6.914104116065851e-05, + "loss": 0.0078, + "step": 593740 + }, + { + "epoch": 1.54, + "learning_rate": 6.913715294428704e-05, + "loss": 0.0104, + "step": 593750 + }, + { + "epoch": 1.54, + "learning_rate": 6.913326472791558e-05, + "loss": 0.0102, + "step": 593760 + }, + { + "epoch": 1.54, + "learning_rate": 6.91293765115441e-05, + "loss": 0.01, + "step": 593770 + }, + { + "epoch": 1.54, + "learning_rate": 6.912548829517265e-05, + "loss": 0.0116, + "step": 593780 + }, + { + "epoch": 1.54, + "learning_rate": 6.912160007880117e-05, + "loss": 0.0076, + "step": 593790 + }, + { + "epoch": 1.54, + "learning_rate": 6.911771186242972e-05, + "loss": 0.0088, + "step": 593800 + }, + { + "epoch": 1.54, + "learning_rate": 6.911382364605826e-05, + "loss": 0.0087, + "step": 593810 + }, + { + "epoch": 1.54, + "learning_rate": 6.910993542968679e-05, + "loss": 0.0101, + "step": 593820 + }, + { + "epoch": 1.54, + "learning_rate": 6.910604721331533e-05, + "loss": 0.0073, + "step": 593830 + }, + { + "epoch": 1.54, + "learning_rate": 6.910215899694386e-05, + "loss": 0.0077, + "step": 593840 + }, + { + "epoch": 1.54, + "learning_rate": 6.909827078057238e-05, + "loss": 0.0114, + "step": 593850 + }, + { + "epoch": 1.54, + "learning_rate": 6.909438256420093e-05, + "loss": 0.0112, + "step": 593860 + }, + { + "epoch": 1.54, + "learning_rate": 6.909049434782945e-05, + "loss": 0.0084, + "step": 593870 + }, + { + "epoch": 1.54, + "learning_rate": 6.9086606131458e-05, + "loss": 0.0097, + "step": 593880 + }, + { + "epoch": 1.54, + "learning_rate": 6.908271791508652e-05, + "loss": 0.0084, + "step": 593890 + }, + { + "epoch": 1.54, + "learning_rate": 6.907882969871507e-05, + "loss": 0.0096, + "step": 593900 + }, + { + "epoch": 1.54, + "learning_rate": 6.907494148234361e-05, + "loss": 0.0086, + "step": 593910 + }, + { + "epoch": 1.54, + "learning_rate": 6.907105326597213e-05, + "loss": 0.0095, + "step": 593920 + }, + { + "epoch": 1.54, + "learning_rate": 6.906716504960068e-05, + "loss": 0.0108, + "step": 593930 + }, + { + "epoch": 1.54, + "learning_rate": 6.90632768332292e-05, + "loss": 0.0118, + "step": 593940 + }, + { + "epoch": 1.54, + "learning_rate": 6.905938861685775e-05, + "loss": 0.0102, + "step": 593950 + }, + { + "epoch": 1.54, + "learning_rate": 6.905550040048627e-05, + "loss": 0.0088, + "step": 593960 + }, + { + "epoch": 1.54, + "learning_rate": 6.905161218411482e-05, + "loss": 0.01, + "step": 593970 + }, + { + "epoch": 1.54, + "learning_rate": 6.904772396774336e-05, + "loss": 0.0103, + "step": 593980 + }, + { + "epoch": 1.54, + "learning_rate": 6.904383575137189e-05, + "loss": 0.0097, + "step": 593990 + }, + { + "epoch": 1.54, + "learning_rate": 6.903994753500043e-05, + "loss": 0.0116, + "step": 594000 + }, + { + "epoch": 1.54, + "eval_cer": 0.8816998870492994, + "eval_loss": 0.005914547014981508, + "eval_runtime": 107.9749, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, + "step": 594000 + }, + { + "epoch": 1.54, + "learning_rate": 6.903605931862896e-05, + "loss": 0.0106, + "step": 594010 + }, + { + "epoch": 1.54, + "learning_rate": 6.90321711022575e-05, + "loss": 0.0092, + "step": 594020 + }, + { + "epoch": 1.54, + "learning_rate": 6.902828288588603e-05, + "loss": 0.0096, + "step": 594030 + }, + { + "epoch": 1.54, + "learning_rate": 6.902439466951457e-05, + "loss": 0.0105, + "step": 594040 + }, + { + "epoch": 1.54, + "learning_rate": 6.90205064531431e-05, + "loss": 0.007, + "step": 594050 + }, + { + "epoch": 1.54, + "learning_rate": 6.901661823677164e-05, + "loss": 0.0112, + "step": 594060 + }, + { + "epoch": 1.54, + "learning_rate": 6.901273002040018e-05, + "loss": 0.0127, + "step": 594070 + }, + { + "epoch": 1.54, + "learning_rate": 6.90088418040287e-05, + "loss": 0.0065, + "step": 594080 + }, + { + "epoch": 1.54, + "learning_rate": 6.900495358765725e-05, + "loss": 0.0097, + "step": 594090 + }, + { + "epoch": 1.54, + "learning_rate": 6.900106537128578e-05, + "loss": 0.0066, + "step": 594100 + }, + { + "epoch": 1.54, + "learning_rate": 6.89971771549143e-05, + "loss": 0.0091, + "step": 594110 + }, + { + "epoch": 1.54, + "learning_rate": 6.899328893854285e-05, + "loss": 0.0085, + "step": 594120 + }, + { + "epoch": 1.54, + "learning_rate": 6.898940072217137e-05, + "loss": 0.0102, + "step": 594130 + }, + { + "epoch": 1.54, + "learning_rate": 6.898551250579992e-05, + "loss": 0.0107, + "step": 594140 + }, + { + "epoch": 1.54, + "learning_rate": 6.898162428942844e-05, + "loss": 0.0077, + "step": 594150 + }, + { + "epoch": 1.54, + "learning_rate": 6.897773607305699e-05, + "loss": 0.0098, + "step": 594160 + }, + { + "epoch": 1.54, + "learning_rate": 6.897384785668553e-05, + "loss": 0.008, + "step": 594170 + }, + { + "epoch": 1.54, + "learning_rate": 6.896995964031405e-05, + "loss": 0.0097, + "step": 594180 + }, + { + "epoch": 1.54, + "learning_rate": 6.89660714239426e-05, + "loss": 0.0102, + "step": 594190 + }, + { + "epoch": 1.54, + "learning_rate": 6.896218320757112e-05, + "loss": 0.0081, + "step": 594200 + }, + { + "epoch": 1.54, + "learning_rate": 6.895829499119967e-05, + "loss": 0.0085, + "step": 594210 + }, + { + "epoch": 1.54, + "learning_rate": 6.89544067748282e-05, + "loss": 0.0092, + "step": 594220 + }, + { + "epoch": 1.54, + "learning_rate": 6.895051855845674e-05, + "loss": 0.0117, + "step": 594230 + }, + { + "epoch": 1.54, + "learning_rate": 6.894663034208528e-05, + "loss": 0.0099, + "step": 594240 + }, + { + "epoch": 1.54, + "learning_rate": 6.89427421257138e-05, + "loss": 0.0089, + "step": 594250 + }, + { + "epoch": 1.54, + "learning_rate": 6.893885390934235e-05, + "loss": 0.0103, + "step": 594260 + }, + { + "epoch": 1.54, + "learning_rate": 6.893496569297088e-05, + "loss": 0.0095, + "step": 594270 + }, + { + "epoch": 1.54, + "learning_rate": 6.893107747659942e-05, + "loss": 0.0085, + "step": 594280 + }, + { + "epoch": 1.54, + "learning_rate": 6.892718926022795e-05, + "loss": 0.009, + "step": 594290 + }, + { + "epoch": 1.54, + "learning_rate": 6.892330104385649e-05, + "loss": 0.0076, + "step": 594300 + }, + { + "epoch": 1.54, + "learning_rate": 6.891941282748501e-05, + "loss": 0.0089, + "step": 594310 + }, + { + "epoch": 1.54, + "learning_rate": 6.891552461111356e-05, + "loss": 0.0081, + "step": 594320 + }, + { + "epoch": 1.54, + "learning_rate": 6.89116363947421e-05, + "loss": 0.008, + "step": 594330 + }, + { + "epoch": 1.54, + "learning_rate": 6.890774817837063e-05, + "loss": 0.0087, + "step": 594340 + }, + { + "epoch": 1.54, + "learning_rate": 6.890385996199915e-05, + "loss": 0.0076, + "step": 594350 + }, + { + "epoch": 1.54, + "learning_rate": 6.88999717456277e-05, + "loss": 0.0084, + "step": 594360 + }, + { + "epoch": 1.54, + "learning_rate": 6.889608352925622e-05, + "loss": 0.0066, + "step": 594370 + }, + { + "epoch": 1.54, + "learning_rate": 6.889219531288477e-05, + "loss": 0.0069, + "step": 594380 + }, + { + "epoch": 1.54, + "learning_rate": 6.88883070965133e-05, + "loss": 0.0095, + "step": 594390 + }, + { + "epoch": 1.54, + "learning_rate": 6.888441888014184e-05, + "loss": 0.011, + "step": 594400 + }, + { + "epoch": 1.54, + "learning_rate": 6.888053066377036e-05, + "loss": 0.0088, + "step": 594410 + }, + { + "epoch": 1.54, + "learning_rate": 6.88766424473989e-05, + "loss": 0.0075, + "step": 594420 + }, + { + "epoch": 1.54, + "learning_rate": 6.887275423102745e-05, + "loss": 0.0104, + "step": 594430 + }, + { + "epoch": 1.54, + "learning_rate": 6.886886601465597e-05, + "loss": 0.0104, + "step": 594440 + }, + { + "epoch": 1.54, + "learning_rate": 6.886497779828452e-05, + "loss": 0.0115, + "step": 594450 + }, + { + "epoch": 1.54, + "learning_rate": 6.886108958191304e-05, + "loss": 0.0064, + "step": 594460 + }, + { + "epoch": 1.54, + "learning_rate": 6.885720136554159e-05, + "loss": 0.0068, + "step": 594470 + }, + { + "epoch": 1.54, + "learning_rate": 6.885331314917011e-05, + "loss": 0.0101, + "step": 594480 + }, + { + "epoch": 1.54, + "learning_rate": 6.884942493279866e-05, + "loss": 0.0094, + "step": 594490 + }, + { + "epoch": 1.54, + "learning_rate": 6.88455367164272e-05, + "loss": 0.0076, + "step": 594500 + }, + { + "epoch": 1.54, + "learning_rate": 6.884164850005573e-05, + "loss": 0.0081, + "step": 594510 + }, + { + "epoch": 1.54, + "learning_rate": 6.883776028368427e-05, + "loss": 0.0069, + "step": 594520 + }, + { + "epoch": 1.54, + "learning_rate": 6.88338720673128e-05, + "loss": 0.0085, + "step": 594530 + }, + { + "epoch": 1.54, + "learning_rate": 6.882998385094134e-05, + "loss": 0.0106, + "step": 594540 + }, + { + "epoch": 1.54, + "learning_rate": 6.882609563456987e-05, + "loss": 0.0061, + "step": 594550 + }, + { + "epoch": 1.54, + "learning_rate": 6.88222074181984e-05, + "loss": 0.007, + "step": 594560 + }, + { + "epoch": 1.54, + "learning_rate": 6.881831920182693e-05, + "loss": 0.007, + "step": 594570 + }, + { + "epoch": 1.54, + "learning_rate": 6.881443098545548e-05, + "loss": 0.0069, + "step": 594580 + }, + { + "epoch": 1.54, + "learning_rate": 6.8810542769084e-05, + "loss": 0.0089, + "step": 594590 + }, + { + "epoch": 1.54, + "learning_rate": 6.880665455271255e-05, + "loss": 0.0087, + "step": 594600 + }, + { + "epoch": 1.54, + "learning_rate": 6.880276633634107e-05, + "loss": 0.0068, + "step": 594610 + }, + { + "epoch": 1.54, + "learning_rate": 6.879887811996962e-05, + "loss": 0.0087, + "step": 594620 + }, + { + "epoch": 1.54, + "learning_rate": 6.879498990359814e-05, + "loss": 0.0076, + "step": 594630 + }, + { + "epoch": 1.54, + "learning_rate": 6.879110168722669e-05, + "loss": 0.0127, + "step": 594640 + }, + { + "epoch": 1.54, + "learning_rate": 6.878721347085521e-05, + "loss": 0.0077, + "step": 594650 + }, + { + "epoch": 1.54, + "learning_rate": 6.878332525448376e-05, + "loss": 0.0098, + "step": 594660 + }, + { + "epoch": 1.54, + "learning_rate": 6.877943703811228e-05, + "loss": 0.0108, + "step": 594670 + }, + { + "epoch": 1.54, + "learning_rate": 6.877554882174083e-05, + "loss": 0.0116, + "step": 594680 + }, + { + "epoch": 1.54, + "learning_rate": 6.877166060536937e-05, + "loss": 0.008, + "step": 594690 + }, + { + "epoch": 1.54, + "learning_rate": 6.87677723889979e-05, + "loss": 0.008, + "step": 594700 + }, + { + "epoch": 1.54, + "learning_rate": 6.876388417262644e-05, + "loss": 0.0081, + "step": 594710 + }, + { + "epoch": 1.54, + "learning_rate": 6.875999595625496e-05, + "loss": 0.008, + "step": 594720 + }, + { + "epoch": 1.54, + "learning_rate": 6.87561077398835e-05, + "loss": 0.0114, + "step": 594730 + }, + { + "epoch": 1.54, + "learning_rate": 6.875221952351203e-05, + "loss": 0.013, + "step": 594740 + }, + { + "epoch": 1.54, + "learning_rate": 6.874833130714058e-05, + "loss": 0.0096, + "step": 594750 + }, + { + "epoch": 1.54, + "learning_rate": 6.87444430907691e-05, + "loss": 0.0097, + "step": 594760 + }, + { + "epoch": 1.54, + "learning_rate": 6.874055487439765e-05, + "loss": 0.009, + "step": 594770 + }, + { + "epoch": 1.54, + "learning_rate": 6.873666665802619e-05, + "loss": 0.0091, + "step": 594780 + }, + { + "epoch": 1.54, + "learning_rate": 6.873277844165472e-05, + "loss": 0.0112, + "step": 594790 + }, + { + "epoch": 1.54, + "learning_rate": 6.872889022528326e-05, + "loss": 0.0087, + "step": 594800 + }, + { + "epoch": 1.54, + "learning_rate": 6.872500200891179e-05, + "loss": 0.0097, + "step": 594810 + }, + { + "epoch": 1.54, + "learning_rate": 6.872111379254033e-05, + "loss": 0.0074, + "step": 594820 + }, + { + "epoch": 1.54, + "learning_rate": 6.871722557616885e-05, + "loss": 0.0073, + "step": 594830 + }, + { + "epoch": 1.54, + "learning_rate": 6.871333735979738e-05, + "loss": 0.0084, + "step": 594840 + }, + { + "epoch": 1.54, + "learning_rate": 6.870944914342592e-05, + "loss": 0.0092, + "step": 594850 + }, + { + "epoch": 1.54, + "learning_rate": 6.870556092705447e-05, + "loss": 0.0085, + "step": 594860 + }, + { + "epoch": 1.54, + "learning_rate": 6.8701672710683e-05, + "loss": 0.0087, + "step": 594870 + }, + { + "epoch": 1.54, + "learning_rate": 6.869778449431154e-05, + "loss": 0.0081, + "step": 594880 + }, + { + "epoch": 1.54, + "learning_rate": 6.869389627794006e-05, + "loss": 0.0125, + "step": 594890 + }, + { + "epoch": 1.54, + "learning_rate": 6.86900080615686e-05, + "loss": 0.0067, + "step": 594900 + }, + { + "epoch": 1.54, + "learning_rate": 6.868611984519713e-05, + "loss": 0.0081, + "step": 594910 + }, + { + "epoch": 1.54, + "learning_rate": 6.868223162882568e-05, + "loss": 0.0075, + "step": 594920 + }, + { + "epoch": 1.54, + "learning_rate": 6.86783434124542e-05, + "loss": 0.0082, + "step": 594930 + }, + { + "epoch": 1.54, + "learning_rate": 6.867445519608275e-05, + "loss": 0.0108, + "step": 594940 + }, + { + "epoch": 1.54, + "learning_rate": 6.867056697971129e-05, + "loss": 0.01, + "step": 594950 + }, + { + "epoch": 1.54, + "learning_rate": 6.866667876333981e-05, + "loss": 0.008, + "step": 594960 + }, + { + "epoch": 1.54, + "learning_rate": 6.866279054696836e-05, + "loss": 0.0106, + "step": 594970 + }, + { + "epoch": 1.54, + "learning_rate": 6.865890233059688e-05, + "loss": 0.0073, + "step": 594980 + }, + { + "epoch": 1.54, + "learning_rate": 6.865501411422543e-05, + "loss": 0.0084, + "step": 594990 + }, + { + "epoch": 1.54, + "learning_rate": 6.865112589785395e-05, + "loss": 0.0088, + "step": 595000 + }, + { + "epoch": 1.54, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.00575125589966774, + "eval_runtime": 107.7066, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 595000 + }, + { + "epoch": 1.54, + "learning_rate": 6.86472376814825e-05, + "loss": 0.0097, + "step": 595010 + }, + { + "epoch": 1.54, + "learning_rate": 6.864334946511102e-05, + "loss": 0.0103, + "step": 595020 + }, + { + "epoch": 1.54, + "learning_rate": 6.863946124873957e-05, + "loss": 0.0075, + "step": 595030 + }, + { + "epoch": 1.54, + "learning_rate": 6.863557303236811e-05, + "loss": 0.0106, + "step": 595040 + }, + { + "epoch": 1.54, + "learning_rate": 6.863168481599664e-05, + "loss": 0.0073, + "step": 595050 + }, + { + "epoch": 1.54, + "learning_rate": 6.862779659962518e-05, + "loss": 0.0096, + "step": 595060 + }, + { + "epoch": 1.54, + "learning_rate": 6.86239083832537e-05, + "loss": 0.0079, + "step": 595070 + }, + { + "epoch": 1.54, + "learning_rate": 6.862002016688225e-05, + "loss": 0.0099, + "step": 595080 + }, + { + "epoch": 1.54, + "learning_rate": 6.861613195051077e-05, + "loss": 0.0102, + "step": 595090 + }, + { + "epoch": 1.54, + "learning_rate": 6.86122437341393e-05, + "loss": 0.0099, + "step": 595100 + }, + { + "epoch": 1.54, + "learning_rate": 6.860835551776784e-05, + "loss": 0.0104, + "step": 595110 + }, + { + "epoch": 1.54, + "learning_rate": 6.860446730139637e-05, + "loss": 0.0082, + "step": 595120 + }, + { + "epoch": 1.54, + "learning_rate": 6.860057908502491e-05, + "loss": 0.0119, + "step": 595130 + }, + { + "epoch": 1.54, + "learning_rate": 6.859669086865346e-05, + "loss": 0.0094, + "step": 595140 + }, + { + "epoch": 1.54, + "learning_rate": 6.859280265228198e-05, + "loss": 0.0089, + "step": 595150 + }, + { + "epoch": 1.54, + "learning_rate": 6.858891443591053e-05, + "loss": 0.0084, + "step": 595160 + }, + { + "epoch": 1.54, + "learning_rate": 6.858502621953905e-05, + "loss": 0.0074, + "step": 595170 + }, + { + "epoch": 1.54, + "learning_rate": 6.85811380031676e-05, + "loss": 0.0075, + "step": 595180 + }, + { + "epoch": 1.54, + "learning_rate": 6.857724978679612e-05, + "loss": 0.0088, + "step": 595190 + }, + { + "epoch": 1.54, + "learning_rate": 6.857336157042466e-05, + "loss": 0.0099, + "step": 595200 + }, + { + "epoch": 1.54, + "learning_rate": 6.85694733540532e-05, + "loss": 0.0072, + "step": 595210 + }, + { + "epoch": 1.54, + "learning_rate": 6.856558513768173e-05, + "loss": 0.0102, + "step": 595220 + }, + { + "epoch": 1.54, + "learning_rate": 6.856169692131028e-05, + "loss": 0.0087, + "step": 595230 + }, + { + "epoch": 1.54, + "learning_rate": 6.85578087049388e-05, + "loss": 0.0096, + "step": 595240 + }, + { + "epoch": 1.54, + "learning_rate": 6.855392048856735e-05, + "loss": 0.0062, + "step": 595250 + }, + { + "epoch": 1.54, + "learning_rate": 6.855003227219587e-05, + "loss": 0.0071, + "step": 595260 + }, + { + "epoch": 1.54, + "learning_rate": 6.854614405582442e-05, + "loss": 0.0102, + "step": 595270 + }, + { + "epoch": 1.54, + "learning_rate": 6.854225583945294e-05, + "loss": 0.0072, + "step": 595280 + }, + { + "epoch": 1.54, + "learning_rate": 6.853836762308149e-05, + "loss": 0.0109, + "step": 595290 + }, + { + "epoch": 1.54, + "learning_rate": 6.853447940671003e-05, + "loss": 0.0068, + "step": 595300 + }, + { + "epoch": 1.54, + "learning_rate": 6.853059119033856e-05, + "loss": 0.0086, + "step": 595310 + }, + { + "epoch": 1.54, + "learning_rate": 6.85267029739671e-05, + "loss": 0.0069, + "step": 595320 + }, + { + "epoch": 1.54, + "learning_rate": 6.852281475759562e-05, + "loss": 0.009, + "step": 595330 + }, + { + "epoch": 1.54, + "learning_rate": 6.851892654122415e-05, + "loss": 0.0105, + "step": 595340 + }, + { + "epoch": 1.54, + "learning_rate": 6.85150383248527e-05, + "loss": 0.0125, + "step": 595350 + }, + { + "epoch": 1.54, + "learning_rate": 6.851115010848122e-05, + "loss": 0.0134, + "step": 595360 + }, + { + "epoch": 1.54, + "learning_rate": 6.850726189210976e-05, + "loss": 0.0078, + "step": 595370 + }, + { + "epoch": 1.54, + "learning_rate": 6.850337367573829e-05, + "loss": 0.0073, + "step": 595380 + }, + { + "epoch": 1.54, + "learning_rate": 6.849948545936683e-05, + "loss": 0.0107, + "step": 595390 + }, + { + "epoch": 1.54, + "learning_rate": 6.849559724299538e-05, + "loss": 0.0077, + "step": 595400 + }, + { + "epoch": 1.54, + "learning_rate": 6.84917090266239e-05, + "loss": 0.0087, + "step": 595410 + }, + { + "epoch": 1.54, + "learning_rate": 6.848782081025245e-05, + "loss": 0.0123, + "step": 595420 + }, + { + "epoch": 1.54, + "learning_rate": 6.848393259388097e-05, + "loss": 0.0123, + "step": 595430 + }, + { + "epoch": 1.54, + "learning_rate": 6.848004437750952e-05, + "loss": 0.009, + "step": 595440 + }, + { + "epoch": 1.54, + "learning_rate": 6.847615616113804e-05, + "loss": 0.0078, + "step": 595450 + }, + { + "epoch": 1.54, + "learning_rate": 6.847226794476658e-05, + "loss": 0.0102, + "step": 595460 + }, + { + "epoch": 1.54, + "learning_rate": 6.846837972839513e-05, + "loss": 0.0129, + "step": 595470 + }, + { + "epoch": 1.54, + "learning_rate": 6.846449151202365e-05, + "loss": 0.0089, + "step": 595480 + }, + { + "epoch": 1.54, + "learning_rate": 6.84606032956522e-05, + "loss": 0.0082, + "step": 595490 + }, + { + "epoch": 1.54, + "learning_rate": 6.845671507928072e-05, + "loss": 0.0076, + "step": 595500 + }, + { + "epoch": 1.54, + "learning_rate": 6.845282686290927e-05, + "loss": 0.0088, + "step": 595510 + }, + { + "epoch": 1.54, + "learning_rate": 6.84489386465378e-05, + "loss": 0.0066, + "step": 595520 + }, + { + "epoch": 1.54, + "learning_rate": 6.844505043016634e-05, + "loss": 0.0121, + "step": 595530 + }, + { + "epoch": 1.54, + "learning_rate": 6.844116221379486e-05, + "loss": 0.0085, + "step": 595540 + }, + { + "epoch": 1.54, + "learning_rate": 6.84372739974234e-05, + "loss": 0.0081, + "step": 595550 + }, + { + "epoch": 1.54, + "learning_rate": 6.843338578105195e-05, + "loss": 0.0086, + "step": 595560 + }, + { + "epoch": 1.54, + "learning_rate": 6.842949756468048e-05, + "loss": 0.0086, + "step": 595570 + }, + { + "epoch": 1.54, + "learning_rate": 6.8425609348309e-05, + "loss": 0.0074, + "step": 595580 + }, + { + "epoch": 1.54, + "learning_rate": 6.842172113193754e-05, + "loss": 0.0114, + "step": 595590 + }, + { + "epoch": 1.54, + "learning_rate": 6.841783291556607e-05, + "loss": 0.0068, + "step": 595600 + }, + { + "epoch": 1.54, + "learning_rate": 6.841394469919461e-05, + "loss": 0.0085, + "step": 595610 + }, + { + "epoch": 1.54, + "learning_rate": 6.841005648282314e-05, + "loss": 0.0113, + "step": 595620 + }, + { + "epoch": 1.54, + "learning_rate": 6.840616826645168e-05, + "loss": 0.0079, + "step": 595630 + }, + { + "epoch": 1.54, + "learning_rate": 6.840228005008021e-05, + "loss": 0.0092, + "step": 595640 + }, + { + "epoch": 1.54, + "learning_rate": 6.839839183370875e-05, + "loss": 0.0084, + "step": 595650 + }, + { + "epoch": 1.54, + "learning_rate": 6.83945036173373e-05, + "loss": 0.0102, + "step": 595660 + }, + { + "epoch": 1.54, + "learning_rate": 6.839061540096582e-05, + "loss": 0.0078, + "step": 595670 + }, + { + "epoch": 1.54, + "learning_rate": 6.838672718459437e-05, + "loss": 0.0094, + "step": 595680 + }, + { + "epoch": 1.54, + "learning_rate": 6.83828389682229e-05, + "loss": 0.0067, + "step": 595690 + }, + { + "epoch": 1.54, + "learning_rate": 6.837895075185144e-05, + "loss": 0.0102, + "step": 595700 + }, + { + "epoch": 1.54, + "learning_rate": 6.837506253547996e-05, + "loss": 0.0094, + "step": 595710 + }, + { + "epoch": 1.54, + "learning_rate": 6.83711743191085e-05, + "loss": 0.0121, + "step": 595720 + }, + { + "epoch": 1.54, + "learning_rate": 6.836728610273705e-05, + "loss": 0.0079, + "step": 595730 + }, + { + "epoch": 1.54, + "learning_rate": 6.836339788636557e-05, + "loss": 0.0098, + "step": 595740 + }, + { + "epoch": 1.54, + "learning_rate": 6.835950966999412e-05, + "loss": 0.0081, + "step": 595750 + }, + { + "epoch": 1.54, + "learning_rate": 6.835562145362264e-05, + "loss": 0.0089, + "step": 595760 + }, + { + "epoch": 1.54, + "learning_rate": 6.835173323725119e-05, + "loss": 0.008, + "step": 595770 + }, + { + "epoch": 1.54, + "learning_rate": 6.834784502087971e-05, + "loss": 0.0113, + "step": 595780 + }, + { + "epoch": 1.54, + "learning_rate": 6.834395680450826e-05, + "loss": 0.0076, + "step": 595790 + }, + { + "epoch": 1.54, + "learning_rate": 6.834006858813678e-05, + "loss": 0.0111, + "step": 595800 + }, + { + "epoch": 1.54, + "learning_rate": 6.833618037176533e-05, + "loss": 0.0098, + "step": 595810 + }, + { + "epoch": 1.54, + "learning_rate": 6.833229215539387e-05, + "loss": 0.0073, + "step": 595820 + }, + { + "epoch": 1.54, + "learning_rate": 6.83284039390224e-05, + "loss": 0.0106, + "step": 595830 + }, + { + "epoch": 1.54, + "learning_rate": 6.832451572265092e-05, + "loss": 0.0079, + "step": 595840 + }, + { + "epoch": 1.54, + "learning_rate": 6.832062750627946e-05, + "loss": 0.0094, + "step": 595850 + }, + { + "epoch": 1.54, + "learning_rate": 6.831673928990799e-05, + "loss": 0.008, + "step": 595860 + }, + { + "epoch": 1.54, + "learning_rate": 6.831285107353653e-05, + "loss": 0.0096, + "step": 595870 + }, + { + "epoch": 1.54, + "learning_rate": 6.830896285716506e-05, + "loss": 0.0088, + "step": 595880 + }, + { + "epoch": 1.54, + "learning_rate": 6.83050746407936e-05, + "loss": 0.0074, + "step": 595890 + }, + { + "epoch": 1.54, + "learning_rate": 6.830118642442213e-05, + "loss": 0.0089, + "step": 595900 + }, + { + "epoch": 1.54, + "learning_rate": 6.829729820805067e-05, + "loss": 0.0083, + "step": 595910 + }, + { + "epoch": 1.54, + "learning_rate": 6.829340999167922e-05, + "loss": 0.0075, + "step": 595920 + }, + { + "epoch": 1.54, + "learning_rate": 6.828952177530774e-05, + "loss": 0.0122, + "step": 595930 + }, + { + "epoch": 1.54, + "learning_rate": 6.828563355893629e-05, + "loss": 0.0076, + "step": 595940 + }, + { + "epoch": 1.54, + "learning_rate": 6.828174534256481e-05, + "loss": 0.0128, + "step": 595950 + }, + { + "epoch": 1.54, + "learning_rate": 6.827785712619336e-05, + "loss": 0.0115, + "step": 595960 + }, + { + "epoch": 1.54, + "learning_rate": 6.827396890982188e-05, + "loss": 0.0104, + "step": 595970 + }, + { + "epoch": 1.54, + "learning_rate": 6.827008069345042e-05, + "loss": 0.0097, + "step": 595980 + }, + { + "epoch": 1.54, + "learning_rate": 6.826619247707897e-05, + "loss": 0.0117, + "step": 595990 + }, + { + "epoch": 1.54, + "learning_rate": 6.82623042607075e-05, + "loss": 0.0064, + "step": 596000 + }, + { + "epoch": 1.54, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.006005590315908194, + "eval_runtime": 107.81, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, + "step": 596000 + }, + { + "epoch": 1.54, + "learning_rate": 6.825841604433604e-05, + "loss": 0.0122, + "step": 596010 + }, + { + "epoch": 1.54, + "learning_rate": 6.825452782796456e-05, + "loss": 0.0077, + "step": 596020 + }, + { + "epoch": 1.54, + "learning_rate": 6.82506396115931e-05, + "loss": 0.0084, + "step": 596030 + }, + { + "epoch": 1.55, + "learning_rate": 6.824675139522163e-05, + "loss": 0.0092, + "step": 596040 + }, + { + "epoch": 1.55, + "learning_rate": 6.824286317885018e-05, + "loss": 0.0072, + "step": 596050 + }, + { + "epoch": 1.55, + "learning_rate": 6.82389749624787e-05, + "loss": 0.0078, + "step": 596060 + }, + { + "epoch": 1.55, + "learning_rate": 6.823508674610725e-05, + "loss": 0.0072, + "step": 596070 + }, + { + "epoch": 1.55, + "learning_rate": 6.823119852973577e-05, + "loss": 0.0068, + "step": 596080 + }, + { + "epoch": 1.55, + "learning_rate": 6.822731031336432e-05, + "loss": 0.0079, + "step": 596090 + }, + { + "epoch": 1.55, + "learning_rate": 6.822342209699284e-05, + "loss": 0.0055, + "step": 596100 + }, + { + "epoch": 1.55, + "learning_rate": 6.821953388062138e-05, + "loss": 0.0095, + "step": 596110 + }, + { + "epoch": 1.55, + "learning_rate": 6.821564566424991e-05, + "loss": 0.0084, + "step": 596120 + }, + { + "epoch": 1.55, + "learning_rate": 6.821175744787845e-05, + "loss": 0.009, + "step": 596130 + }, + { + "epoch": 1.55, + "learning_rate": 6.820786923150698e-05, + "loss": 0.0127, + "step": 596140 + }, + { + "epoch": 1.55, + "learning_rate": 6.820398101513552e-05, + "loss": 0.0086, + "step": 596150 + }, + { + "epoch": 1.55, + "learning_rate": 6.820009279876405e-05, + "loss": 0.0088, + "step": 596160 + }, + { + "epoch": 1.55, + "learning_rate": 6.81962045823926e-05, + "loss": 0.0083, + "step": 596170 + }, + { + "epoch": 1.55, + "learning_rate": 6.819231636602114e-05, + "loss": 0.0101, + "step": 596180 + }, + { + "epoch": 1.55, + "learning_rate": 6.818842814964966e-05, + "loss": 0.0065, + "step": 596190 + }, + { + "epoch": 1.55, + "learning_rate": 6.81845399332782e-05, + "loss": 0.0073, + "step": 596200 + }, + { + "epoch": 1.55, + "learning_rate": 6.818065171690673e-05, + "loss": 0.0064, + "step": 596210 + }, + { + "epoch": 1.55, + "learning_rate": 6.817676350053528e-05, + "loss": 0.0075, + "step": 596220 + }, + { + "epoch": 1.55, + "learning_rate": 6.81728752841638e-05, + "loss": 0.0079, + "step": 596230 + }, + { + "epoch": 1.55, + "learning_rate": 6.816898706779234e-05, + "loss": 0.0119, + "step": 596240 + }, + { + "epoch": 1.55, + "learning_rate": 6.816509885142087e-05, + "loss": 0.0071, + "step": 596250 + }, + { + "epoch": 1.55, + "learning_rate": 6.816121063504941e-05, + "loss": 0.0103, + "step": 596260 + }, + { + "epoch": 1.55, + "learning_rate": 6.815732241867796e-05, + "loss": 0.0089, + "step": 596270 + }, + { + "epoch": 1.55, + "learning_rate": 6.815343420230648e-05, + "loss": 0.0074, + "step": 596280 + }, + { + "epoch": 1.55, + "learning_rate": 6.814954598593503e-05, + "loss": 0.0081, + "step": 596290 + }, + { + "epoch": 1.55, + "learning_rate": 6.814565776956355e-05, + "loss": 0.0096, + "step": 596300 + }, + { + "epoch": 1.55, + "learning_rate": 6.81417695531921e-05, + "loss": 0.009, + "step": 596310 + }, + { + "epoch": 1.55, + "learning_rate": 6.813788133682062e-05, + "loss": 0.0083, + "step": 596320 + }, + { + "epoch": 1.55, + "learning_rate": 6.813399312044915e-05, + "loss": 0.0118, + "step": 596330 + }, + { + "epoch": 1.55, + "learning_rate": 6.81301049040777e-05, + "loss": 0.0116, + "step": 596340 + }, + { + "epoch": 1.55, + "learning_rate": 6.812621668770622e-05, + "loss": 0.0097, + "step": 596350 + }, + { + "epoch": 1.55, + "learning_rate": 6.812232847133476e-05, + "loss": 0.0096, + "step": 596360 + }, + { + "epoch": 1.55, + "learning_rate": 6.81184402549633e-05, + "loss": 0.0092, + "step": 596370 + }, + { + "epoch": 1.55, + "learning_rate": 6.811455203859183e-05, + "loss": 0.0074, + "step": 596380 + }, + { + "epoch": 1.55, + "learning_rate": 6.811066382222037e-05, + "loss": 0.0068, + "step": 596390 + }, + { + "epoch": 1.55, + "learning_rate": 6.81067756058489e-05, + "loss": 0.0078, + "step": 596400 + }, + { + "epoch": 1.55, + "learning_rate": 6.810288738947744e-05, + "loss": 0.0087, + "step": 596410 + }, + { + "epoch": 1.55, + "learning_rate": 6.809899917310597e-05, + "loss": 0.0071, + "step": 596420 + }, + { + "epoch": 1.55, + "learning_rate": 6.809511095673451e-05, + "loss": 0.0092, + "step": 596430 + }, + { + "epoch": 1.55, + "learning_rate": 6.809122274036306e-05, + "loss": 0.0062, + "step": 596440 + }, + { + "epoch": 1.55, + "learning_rate": 6.808733452399158e-05, + "loss": 0.0075, + "step": 596450 + }, + { + "epoch": 1.55, + "learning_rate": 6.808344630762013e-05, + "loss": 0.0094, + "step": 596460 + }, + { + "epoch": 1.55, + "learning_rate": 6.807955809124865e-05, + "loss": 0.0073, + "step": 596470 + }, + { + "epoch": 1.55, + "learning_rate": 6.80756698748772e-05, + "loss": 0.0089, + "step": 596480 + }, + { + "epoch": 1.55, + "learning_rate": 6.807178165850572e-05, + "loss": 0.0089, + "step": 596490 + }, + { + "epoch": 1.55, + "learning_rate": 6.806789344213426e-05, + "loss": 0.0103, + "step": 596500 + }, + { + "epoch": 1.55, + "learning_rate": 6.806400522576279e-05, + "loss": 0.0103, + "step": 596510 + }, + { + "epoch": 1.55, + "learning_rate": 6.806011700939133e-05, + "loss": 0.0122, + "step": 596520 + }, + { + "epoch": 1.55, + "learning_rate": 6.805622879301988e-05, + "loss": 0.0083, + "step": 596530 + }, + { + "epoch": 1.55, + "learning_rate": 6.80523405766484e-05, + "loss": 0.0087, + "step": 596540 + }, + { + "epoch": 1.55, + "learning_rate": 6.804845236027695e-05, + "loss": 0.0068, + "step": 596550 + }, + { + "epoch": 1.55, + "learning_rate": 6.804456414390547e-05, + "loss": 0.0097, + "step": 596560 + }, + { + "epoch": 1.55, + "learning_rate": 6.804067592753402e-05, + "loss": 0.008, + "step": 596570 + }, + { + "epoch": 1.55, + "learning_rate": 6.803678771116254e-05, + "loss": 0.0071, + "step": 596580 + }, + { + "epoch": 1.55, + "learning_rate": 6.803289949479107e-05, + "loss": 0.0068, + "step": 596590 + }, + { + "epoch": 1.55, + "learning_rate": 6.802901127841961e-05, + "loss": 0.0121, + "step": 596600 + }, + { + "epoch": 1.55, + "learning_rate": 6.802512306204814e-05, + "loss": 0.0076, + "step": 596610 + }, + { + "epoch": 1.55, + "learning_rate": 6.802123484567668e-05, + "loss": 0.006, + "step": 596620 + }, + { + "epoch": 1.55, + "learning_rate": 6.801734662930522e-05, + "loss": 0.0086, + "step": 596630 + }, + { + "epoch": 1.55, + "learning_rate": 6.801345841293375e-05, + "loss": 0.0087, + "step": 596640 + }, + { + "epoch": 1.55, + "learning_rate": 6.80095701965623e-05, + "loss": 0.0073, + "step": 596650 + }, + { + "epoch": 1.55, + "learning_rate": 6.800568198019082e-05, + "loss": 0.0113, + "step": 596660 + }, + { + "epoch": 1.55, + "learning_rate": 6.800179376381936e-05, + "loss": 0.0076, + "step": 596670 + }, + { + "epoch": 1.55, + "learning_rate": 6.799790554744789e-05, + "loss": 0.009, + "step": 596680 + }, + { + "epoch": 1.55, + "learning_rate": 6.799401733107643e-05, + "loss": 0.0094, + "step": 596690 + }, + { + "epoch": 1.55, + "learning_rate": 6.799012911470498e-05, + "loss": 0.0085, + "step": 596700 + }, + { + "epoch": 1.55, + "learning_rate": 6.79862408983335e-05, + "loss": 0.0098, + "step": 596710 + }, + { + "epoch": 1.55, + "learning_rate": 6.798235268196205e-05, + "loss": 0.0095, + "step": 596720 + }, + { + "epoch": 1.55, + "learning_rate": 6.797846446559057e-05, + "loss": 0.0095, + "step": 596730 + }, + { + "epoch": 1.55, + "learning_rate": 6.797457624921911e-05, + "loss": 0.0083, + "step": 596740 + }, + { + "epoch": 1.55, + "learning_rate": 6.797068803284764e-05, + "loss": 0.0062, + "step": 596750 + }, + { + "epoch": 1.55, + "learning_rate": 6.796679981647618e-05, + "loss": 0.0091, + "step": 596760 + }, + { + "epoch": 1.55, + "learning_rate": 6.796291160010471e-05, + "loss": 0.0069, + "step": 596770 + }, + { + "epoch": 1.55, + "learning_rate": 6.795902338373325e-05, + "loss": 0.0094, + "step": 596780 + }, + { + "epoch": 1.55, + "learning_rate": 6.79551351673618e-05, + "loss": 0.0081, + "step": 596790 + }, + { + "epoch": 1.55, + "learning_rate": 6.795124695099032e-05, + "loss": 0.009, + "step": 596800 + }, + { + "epoch": 1.55, + "learning_rate": 6.794735873461887e-05, + "loss": 0.0093, + "step": 596810 + }, + { + "epoch": 1.55, + "learning_rate": 6.79434705182474e-05, + "loss": 0.0067, + "step": 596820 + }, + { + "epoch": 1.55, + "learning_rate": 6.793958230187592e-05, + "loss": 0.0082, + "step": 596830 + }, + { + "epoch": 1.55, + "learning_rate": 6.793569408550446e-05, + "loss": 0.0103, + "step": 596840 + }, + { + "epoch": 1.55, + "learning_rate": 6.793180586913299e-05, + "loss": 0.0093, + "step": 596850 + }, + { + "epoch": 1.55, + "learning_rate": 6.792791765276153e-05, + "loss": 0.0096, + "step": 596860 + }, + { + "epoch": 1.55, + "learning_rate": 6.792402943639006e-05, + "loss": 0.0091, + "step": 596870 + }, + { + "epoch": 1.55, + "learning_rate": 6.79201412200186e-05, + "loss": 0.0125, + "step": 596880 + }, + { + "epoch": 1.55, + "learning_rate": 6.791625300364714e-05, + "loss": 0.0071, + "step": 596890 + }, + { + "epoch": 1.55, + "learning_rate": 6.791236478727567e-05, + "loss": 0.0081, + "step": 596900 + }, + { + "epoch": 1.55, + "learning_rate": 6.790847657090421e-05, + "loss": 0.0102, + "step": 596910 + }, + { + "epoch": 1.55, + "learning_rate": 6.790458835453274e-05, + "loss": 0.0071, + "step": 596920 + }, + { + "epoch": 1.55, + "learning_rate": 6.790070013816128e-05, + "loss": 0.0104, + "step": 596930 + }, + { + "epoch": 1.55, + "learning_rate": 6.789681192178981e-05, + "loss": 0.0085, + "step": 596940 + }, + { + "epoch": 1.55, + "learning_rate": 6.789292370541835e-05, + "loss": 0.0073, + "step": 596950 + }, + { + "epoch": 1.55, + "learning_rate": 6.78890354890469e-05, + "loss": 0.0075, + "step": 596960 + }, + { + "epoch": 1.55, + "learning_rate": 6.788514727267542e-05, + "loss": 0.0075, + "step": 596970 + }, + { + "epoch": 1.55, + "learning_rate": 6.788125905630397e-05, + "loss": 0.0116, + "step": 596980 + }, + { + "epoch": 1.55, + "learning_rate": 6.78773708399325e-05, + "loss": 0.0095, + "step": 596990 + }, + { + "epoch": 1.55, + "learning_rate": 6.787348262356103e-05, + "loss": 0.0082, + "step": 597000 + }, + { + "epoch": 1.55, + "eval_cer": 0.8817082848709045, + "eval_loss": 0.005668503697961569, + "eval_runtime": 107.8595, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 597000 + }, + { + "epoch": 1.55, + "learning_rate": 6.786959440718956e-05, + "loss": 0.0091, + "step": 597010 + }, + { + "epoch": 1.55, + "learning_rate": 6.78657061908181e-05, + "loss": 0.0097, + "step": 597020 + }, + { + "epoch": 1.55, + "learning_rate": 6.786181797444663e-05, + "loss": 0.0084, + "step": 597030 + }, + { + "epoch": 1.55, + "learning_rate": 6.785792975807517e-05, + "loss": 0.008, + "step": 597040 + }, + { + "epoch": 1.55, + "learning_rate": 6.785404154170372e-05, + "loss": 0.0099, + "step": 597050 + }, + { + "epoch": 1.55, + "learning_rate": 6.785015332533224e-05, + "loss": 0.01, + "step": 597060 + }, + { + "epoch": 1.55, + "learning_rate": 6.784626510896077e-05, + "loss": 0.0072, + "step": 597070 + }, + { + "epoch": 1.55, + "learning_rate": 6.784237689258931e-05, + "loss": 0.005, + "step": 597080 + }, + { + "epoch": 1.55, + "learning_rate": 6.783848867621784e-05, + "loss": 0.0111, + "step": 597090 + }, + { + "epoch": 1.55, + "learning_rate": 6.783460045984638e-05, + "loss": 0.0082, + "step": 597100 + }, + { + "epoch": 1.55, + "learning_rate": 6.783071224347491e-05, + "loss": 0.0086, + "step": 597110 + }, + { + "epoch": 1.55, + "learning_rate": 6.782682402710345e-05, + "loss": 0.0094, + "step": 597120 + }, + { + "epoch": 1.55, + "learning_rate": 6.782293581073198e-05, + "loss": 0.0088, + "step": 597130 + }, + { + "epoch": 1.55, + "learning_rate": 6.781904759436052e-05, + "loss": 0.016, + "step": 597140 + }, + { + "epoch": 1.55, + "learning_rate": 6.781515937798906e-05, + "loss": 0.009, + "step": 597150 + }, + { + "epoch": 1.55, + "learning_rate": 6.781127116161759e-05, + "loss": 0.0077, + "step": 597160 + }, + { + "epoch": 1.55, + "learning_rate": 6.780738294524613e-05, + "loss": 0.0085, + "step": 597170 + }, + { + "epoch": 1.55, + "learning_rate": 6.780349472887466e-05, + "loss": 0.0093, + "step": 597180 + }, + { + "epoch": 1.55, + "learning_rate": 6.77996065125032e-05, + "loss": 0.0097, + "step": 597190 + }, + { + "epoch": 1.55, + "learning_rate": 6.779571829613173e-05, + "loss": 0.0094, + "step": 597200 + }, + { + "epoch": 1.55, + "learning_rate": 6.779183007976027e-05, + "loss": 0.0069, + "step": 597210 + }, + { + "epoch": 1.55, + "learning_rate": 6.778794186338882e-05, + "loss": 0.0129, + "step": 597220 + }, + { + "epoch": 1.55, + "learning_rate": 6.778405364701734e-05, + "loss": 0.0085, + "step": 597230 + }, + { + "epoch": 1.55, + "learning_rate": 6.778016543064589e-05, + "loss": 0.008, + "step": 597240 + }, + { + "epoch": 1.55, + "learning_rate": 6.777627721427441e-05, + "loss": 0.0093, + "step": 597250 + }, + { + "epoch": 1.55, + "learning_rate": 6.777238899790295e-05, + "loss": 0.0085, + "step": 597260 + }, + { + "epoch": 1.55, + "learning_rate": 6.776850078153148e-05, + "loss": 0.0115, + "step": 597270 + }, + { + "epoch": 1.55, + "learning_rate": 6.776461256516002e-05, + "loss": 0.0093, + "step": 597280 + }, + { + "epoch": 1.55, + "learning_rate": 6.776072434878855e-05, + "loss": 0.0075, + "step": 597290 + }, + { + "epoch": 1.55, + "learning_rate": 6.77568361324171e-05, + "loss": 0.0121, + "step": 597300 + }, + { + "epoch": 1.55, + "learning_rate": 6.775294791604564e-05, + "loss": 0.0109, + "step": 597310 + }, + { + "epoch": 1.55, + "learning_rate": 6.774905969967416e-05, + "loss": 0.0087, + "step": 597320 + }, + { + "epoch": 1.55, + "learning_rate": 6.774517148330269e-05, + "loss": 0.0115, + "step": 597330 + }, + { + "epoch": 1.55, + "learning_rate": 6.774128326693123e-05, + "loss": 0.0103, + "step": 597340 + }, + { + "epoch": 1.55, + "learning_rate": 6.773739505055976e-05, + "loss": 0.0075, + "step": 597350 + }, + { + "epoch": 1.55, + "learning_rate": 6.77335068341883e-05, + "loss": 0.0076, + "step": 597360 + }, + { + "epoch": 1.55, + "learning_rate": 6.772961861781683e-05, + "loss": 0.0096, + "step": 597370 + }, + { + "epoch": 1.55, + "learning_rate": 6.772573040144537e-05, + "loss": 0.0091, + "step": 597380 + }, + { + "epoch": 1.55, + "learning_rate": 6.77218421850739e-05, + "loss": 0.0077, + "step": 597390 + }, + { + "epoch": 1.55, + "learning_rate": 6.771795396870244e-05, + "loss": 0.0099, + "step": 597400 + }, + { + "epoch": 1.55, + "learning_rate": 6.771406575233098e-05, + "loss": 0.0102, + "step": 597410 + }, + { + "epoch": 1.55, + "learning_rate": 6.771017753595951e-05, + "loss": 0.0094, + "step": 597420 + }, + { + "epoch": 1.55, + "learning_rate": 6.770628931958805e-05, + "loss": 0.0089, + "step": 597430 + }, + { + "epoch": 1.55, + "learning_rate": 6.770240110321658e-05, + "loss": 0.0107, + "step": 597440 + }, + { + "epoch": 1.55, + "learning_rate": 6.769851288684512e-05, + "loss": 0.0089, + "step": 597450 + }, + { + "epoch": 1.55, + "learning_rate": 6.769462467047365e-05, + "loss": 0.0108, + "step": 597460 + }, + { + "epoch": 1.55, + "learning_rate": 6.76907364541022e-05, + "loss": 0.0104, + "step": 597470 + }, + { + "epoch": 1.55, + "learning_rate": 6.768684823773074e-05, + "loss": 0.0071, + "step": 597480 + }, + { + "epoch": 1.55, + "learning_rate": 6.768296002135926e-05, + "loss": 0.0083, + "step": 597490 + }, + { + "epoch": 1.55, + "learning_rate": 6.76790718049878e-05, + "loss": 0.0103, + "step": 597500 + }, + { + "epoch": 1.55, + "learning_rate": 6.767518358861633e-05, + "loss": 0.0076, + "step": 597510 + }, + { + "epoch": 1.55, + "learning_rate": 6.767129537224487e-05, + "loss": 0.009, + "step": 597520 + }, + { + "epoch": 1.55, + "learning_rate": 6.76674071558734e-05, + "loss": 0.0076, + "step": 597530 + }, + { + "epoch": 1.55, + "learning_rate": 6.766351893950194e-05, + "loss": 0.0077, + "step": 597540 + }, + { + "epoch": 1.55, + "learning_rate": 6.765963072313047e-05, + "loss": 0.0115, + "step": 597550 + }, + { + "epoch": 1.55, + "learning_rate": 6.765574250675901e-05, + "loss": 0.007, + "step": 597560 + }, + { + "epoch": 1.55, + "learning_rate": 6.765185429038754e-05, + "loss": 0.0071, + "step": 597570 + }, + { + "epoch": 1.55, + "learning_rate": 6.764796607401608e-05, + "loss": 0.0104, + "step": 597580 + }, + { + "epoch": 1.55, + "learning_rate": 6.764407785764461e-05, + "loss": 0.0079, + "step": 597590 + }, + { + "epoch": 1.55, + "learning_rate": 6.764018964127315e-05, + "loss": 0.0083, + "step": 597600 + }, + { + "epoch": 1.55, + "learning_rate": 6.763630142490168e-05, + "loss": 0.0088, + "step": 597610 + }, + { + "epoch": 1.55, + "learning_rate": 6.763241320853022e-05, + "loss": 0.0072, + "step": 597620 + }, + { + "epoch": 1.55, + "learning_rate": 6.762852499215875e-05, + "loss": 0.0077, + "step": 597630 + }, + { + "epoch": 1.55, + "learning_rate": 6.762463677578729e-05, + "loss": 0.0093, + "step": 597640 + }, + { + "epoch": 1.55, + "learning_rate": 6.762074855941582e-05, + "loss": 0.0071, + "step": 597650 + }, + { + "epoch": 1.55, + "learning_rate": 6.761686034304436e-05, + "loss": 0.0099, + "step": 597660 + }, + { + "epoch": 1.55, + "learning_rate": 6.76129721266729e-05, + "loss": 0.0099, + "step": 597670 + }, + { + "epoch": 1.55, + "learning_rate": 6.760908391030143e-05, + "loss": 0.0137, + "step": 597680 + }, + { + "epoch": 1.55, + "learning_rate": 6.760519569392997e-05, + "loss": 0.0099, + "step": 597690 + }, + { + "epoch": 1.55, + "learning_rate": 6.76013074775585e-05, + "loss": 0.0097, + "step": 597700 + }, + { + "epoch": 1.55, + "learning_rate": 6.759741926118704e-05, + "loss": 0.0085, + "step": 597710 + }, + { + "epoch": 1.55, + "learning_rate": 6.759353104481557e-05, + "loss": 0.0075, + "step": 597720 + }, + { + "epoch": 1.55, + "learning_rate": 6.758964282844411e-05, + "loss": 0.0085, + "step": 597730 + }, + { + "epoch": 1.55, + "learning_rate": 6.758575461207264e-05, + "loss": 0.0082, + "step": 597740 + }, + { + "epoch": 1.55, + "learning_rate": 6.758186639570118e-05, + "loss": 0.009, + "step": 597750 + }, + { + "epoch": 1.55, + "learning_rate": 6.757797817932973e-05, + "loss": 0.0088, + "step": 597760 + }, + { + "epoch": 1.55, + "learning_rate": 6.757408996295825e-05, + "loss": 0.0091, + "step": 597770 + }, + { + "epoch": 1.55, + "learning_rate": 6.75702017465868e-05, + "loss": 0.0074, + "step": 597780 + }, + { + "epoch": 1.55, + "learning_rate": 6.756631353021532e-05, + "loss": 0.0085, + "step": 597790 + }, + { + "epoch": 1.55, + "learning_rate": 6.756242531384386e-05, + "loss": 0.0077, + "step": 597800 + }, + { + "epoch": 1.55, + "learning_rate": 6.755853709747239e-05, + "loss": 0.0087, + "step": 597810 + }, + { + "epoch": 1.55, + "learning_rate": 6.755464888110092e-05, + "loss": 0.0093, + "step": 597820 + }, + { + "epoch": 1.55, + "learning_rate": 6.755076066472946e-05, + "loss": 0.0114, + "step": 597830 + }, + { + "epoch": 1.55, + "learning_rate": 6.754687244835799e-05, + "loss": 0.0076, + "step": 597840 + }, + { + "epoch": 1.55, + "learning_rate": 6.754298423198653e-05, + "loss": 0.0081, + "step": 597850 + }, + { + "epoch": 1.55, + "learning_rate": 6.753909601561507e-05, + "loss": 0.0066, + "step": 597860 + }, + { + "epoch": 1.55, + "learning_rate": 6.75352077992436e-05, + "loss": 0.0067, + "step": 597870 + }, + { + "epoch": 1.55, + "learning_rate": 6.753131958287214e-05, + "loss": 0.0106, + "step": 597880 + }, + { + "epoch": 1.55, + "learning_rate": 6.752743136650067e-05, + "loss": 0.0092, + "step": 597890 + }, + { + "epoch": 1.55, + "learning_rate": 6.752354315012921e-05, + "loss": 0.0083, + "step": 597900 + }, + { + "epoch": 1.55, + "learning_rate": 6.751965493375774e-05, + "loss": 0.0082, + "step": 597910 + }, + { + "epoch": 1.55, + "learning_rate": 6.751576671738628e-05, + "loss": 0.0097, + "step": 597920 + }, + { + "epoch": 1.55, + "learning_rate": 6.751187850101482e-05, + "loss": 0.0093, + "step": 597930 + }, + { + "epoch": 1.55, + "learning_rate": 6.750799028464335e-05, + "loss": 0.0105, + "step": 597940 + }, + { + "epoch": 1.55, + "learning_rate": 6.75041020682719e-05, + "loss": 0.0084, + "step": 597950 + }, + { + "epoch": 1.55, + "learning_rate": 6.750021385190042e-05, + "loss": 0.0066, + "step": 597960 + }, + { + "epoch": 1.55, + "learning_rate": 6.749632563552896e-05, + "loss": 0.0056, + "step": 597970 + }, + { + "epoch": 1.55, + "learning_rate": 6.749243741915749e-05, + "loss": 0.0096, + "step": 597980 + }, + { + "epoch": 1.55, + "learning_rate": 6.748854920278603e-05, + "loss": 0.0092, + "step": 597990 + }, + { + "epoch": 1.55, + "learning_rate": 6.748466098641456e-05, + "loss": 0.0084, + "step": 598000 + }, + { + "epoch": 1.55, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.005743164103478193, + "eval_runtime": 107.8556, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 598000 + }, + { + "epoch": 1.55, + "learning_rate": 6.74807727700431e-05, + "loss": 0.0088, + "step": 598010 + }, + { + "epoch": 1.55, + "learning_rate": 6.747688455367164e-05, + "loss": 0.0096, + "step": 598020 + }, + { + "epoch": 1.55, + "learning_rate": 6.747299633730017e-05, + "loss": 0.0087, + "step": 598030 + }, + { + "epoch": 1.55, + "learning_rate": 6.746910812092871e-05, + "loss": 0.0078, + "step": 598040 + }, + { + "epoch": 1.55, + "learning_rate": 6.746521990455724e-05, + "loss": 0.0102, + "step": 598050 + }, + { + "epoch": 1.55, + "learning_rate": 6.746133168818578e-05, + "loss": 0.0082, + "step": 598060 + }, + { + "epoch": 1.55, + "learning_rate": 6.745744347181431e-05, + "loss": 0.0084, + "step": 598070 + }, + { + "epoch": 1.55, + "learning_rate": 6.745355525544284e-05, + "loss": 0.0091, + "step": 598080 + }, + { + "epoch": 1.55, + "learning_rate": 6.744966703907138e-05, + "loss": 0.0083, + "step": 598090 + }, + { + "epoch": 1.55, + "learning_rate": 6.744577882269991e-05, + "loss": 0.0124, + "step": 598100 + }, + { + "epoch": 1.55, + "learning_rate": 6.744189060632845e-05, + "loss": 0.0096, + "step": 598110 + }, + { + "epoch": 1.55, + "learning_rate": 6.7438002389957e-05, + "loss": 0.0068, + "step": 598120 + }, + { + "epoch": 1.55, + "learning_rate": 6.743411417358552e-05, + "loss": 0.009, + "step": 598130 + }, + { + "epoch": 1.55, + "learning_rate": 6.743022595721406e-05, + "loss": 0.0118, + "step": 598140 + }, + { + "epoch": 1.55, + "learning_rate": 6.742633774084259e-05, + "loss": 0.0095, + "step": 598150 + }, + { + "epoch": 1.55, + "learning_rate": 6.742244952447113e-05, + "loss": 0.0091, + "step": 598160 + }, + { + "epoch": 1.55, + "learning_rate": 6.741856130809966e-05, + "loss": 0.0113, + "step": 598170 + }, + { + "epoch": 1.55, + "learning_rate": 6.74146730917282e-05, + "loss": 0.0085, + "step": 598180 + }, + { + "epoch": 1.55, + "learning_rate": 6.741078487535674e-05, + "loss": 0.009, + "step": 598190 + }, + { + "epoch": 1.55, + "learning_rate": 6.740689665898527e-05, + "loss": 0.0117, + "step": 598200 + }, + { + "epoch": 1.55, + "learning_rate": 6.740300844261381e-05, + "loss": 0.0108, + "step": 598210 + }, + { + "epoch": 1.55, + "learning_rate": 6.739912022624234e-05, + "loss": 0.0073, + "step": 598220 + }, + { + "epoch": 1.55, + "learning_rate": 6.739523200987088e-05, + "loss": 0.0077, + "step": 598230 + }, + { + "epoch": 1.55, + "learning_rate": 6.739134379349941e-05, + "loss": 0.0071, + "step": 598240 + }, + { + "epoch": 1.55, + "learning_rate": 6.738745557712795e-05, + "loss": 0.0083, + "step": 598250 + }, + { + "epoch": 1.55, + "learning_rate": 6.738356736075648e-05, + "loss": 0.0106, + "step": 598260 + }, + { + "epoch": 1.55, + "learning_rate": 6.737967914438502e-05, + "loss": 0.0122, + "step": 598270 + }, + { + "epoch": 1.55, + "learning_rate": 6.737579092801356e-05, + "loss": 0.0135, + "step": 598280 + }, + { + "epoch": 1.55, + "learning_rate": 6.737190271164209e-05, + "loss": 0.0074, + "step": 598290 + }, + { + "epoch": 1.55, + "learning_rate": 6.736801449527063e-05, + "loss": 0.0068, + "step": 598300 + }, + { + "epoch": 1.55, + "learning_rate": 6.736412627889916e-05, + "loss": 0.0078, + "step": 598310 + }, + { + "epoch": 1.55, + "learning_rate": 6.736023806252769e-05, + "loss": 0.0116, + "step": 598320 + }, + { + "epoch": 1.55, + "learning_rate": 6.735634984615623e-05, + "loss": 0.0076, + "step": 598330 + }, + { + "epoch": 1.55, + "learning_rate": 6.735246162978476e-05, + "loss": 0.0107, + "step": 598340 + }, + { + "epoch": 1.55, + "learning_rate": 6.73485734134133e-05, + "loss": 0.0072, + "step": 598350 + }, + { + "epoch": 1.55, + "learning_rate": 6.734468519704183e-05, + "loss": 0.0096, + "step": 598360 + }, + { + "epoch": 1.55, + "learning_rate": 6.734079698067037e-05, + "loss": 0.0116, + "step": 598370 + }, + { + "epoch": 1.55, + "learning_rate": 6.733690876429891e-05, + "loss": 0.0118, + "step": 598380 + }, + { + "epoch": 1.55, + "learning_rate": 6.733302054792744e-05, + "loss": 0.0073, + "step": 598390 + }, + { + "epoch": 1.55, + "learning_rate": 6.732913233155598e-05, + "loss": 0.0094, + "step": 598400 + }, + { + "epoch": 1.55, + "learning_rate": 6.732524411518451e-05, + "loss": 0.0083, + "step": 598410 + }, + { + "epoch": 1.55, + "learning_rate": 6.732135589881305e-05, + "loss": 0.0092, + "step": 598420 + }, + { + "epoch": 1.55, + "learning_rate": 6.731746768244158e-05, + "loss": 0.0091, + "step": 598430 + }, + { + "epoch": 1.55, + "learning_rate": 6.731357946607012e-05, + "loss": 0.0132, + "step": 598440 + }, + { + "epoch": 1.55, + "learning_rate": 6.730969124969866e-05, + "loss": 0.0083, + "step": 598450 + }, + { + "epoch": 1.55, + "learning_rate": 6.730580303332719e-05, + "loss": 0.0097, + "step": 598460 + }, + { + "epoch": 1.55, + "learning_rate": 6.730191481695573e-05, + "loss": 0.0086, + "step": 598470 + }, + { + "epoch": 1.55, + "learning_rate": 6.729802660058426e-05, + "loss": 0.0115, + "step": 598480 + }, + { + "epoch": 1.55, + "learning_rate": 6.72941383842128e-05, + "loss": 0.0094, + "step": 598490 + }, + { + "epoch": 1.55, + "learning_rate": 6.729025016784133e-05, + "loss": 0.009, + "step": 598500 + }, + { + "epoch": 1.55, + "learning_rate": 6.728636195146987e-05, + "loss": 0.0087, + "step": 598510 + }, + { + "epoch": 1.55, + "learning_rate": 6.72824737350984e-05, + "loss": 0.0075, + "step": 598520 + }, + { + "epoch": 1.55, + "learning_rate": 6.727858551872694e-05, + "loss": 0.0088, + "step": 598530 + }, + { + "epoch": 1.55, + "learning_rate": 6.727469730235548e-05, + "loss": 0.0098, + "step": 598540 + }, + { + "epoch": 1.55, + "learning_rate": 6.727080908598401e-05, + "loss": 0.0133, + "step": 598550 + }, + { + "epoch": 1.55, + "learning_rate": 6.726692086961254e-05, + "loss": 0.0083, + "step": 598560 + }, + { + "epoch": 1.55, + "learning_rate": 6.726303265324108e-05, + "loss": 0.0066, + "step": 598570 + }, + { + "epoch": 1.55, + "learning_rate": 6.725914443686961e-05, + "loss": 0.0095, + "step": 598580 + }, + { + "epoch": 1.55, + "learning_rate": 6.725525622049815e-05, + "loss": 0.0102, + "step": 598590 + }, + { + "epoch": 1.55, + "learning_rate": 6.725136800412668e-05, + "loss": 0.0114, + "step": 598600 + }, + { + "epoch": 1.55, + "learning_rate": 6.724747978775522e-05, + "loss": 0.0077, + "step": 598610 + }, + { + "epoch": 1.55, + "learning_rate": 6.724359157138375e-05, + "loss": 0.0076, + "step": 598620 + }, + { + "epoch": 1.55, + "learning_rate": 6.723970335501229e-05, + "loss": 0.0092, + "step": 598630 + }, + { + "epoch": 1.55, + "learning_rate": 6.723581513864083e-05, + "loss": 0.0097, + "step": 598640 + }, + { + "epoch": 1.55, + "learning_rate": 6.723192692226936e-05, + "loss": 0.0081, + "step": 598650 + }, + { + "epoch": 1.55, + "learning_rate": 6.72280387058979e-05, + "loss": 0.0099, + "step": 598660 + }, + { + "epoch": 1.55, + "learning_rate": 6.722415048952643e-05, + "loss": 0.0105, + "step": 598670 + }, + { + "epoch": 1.55, + "learning_rate": 6.722026227315497e-05, + "loss": 0.0103, + "step": 598680 + }, + { + "epoch": 1.55, + "learning_rate": 6.72163740567835e-05, + "loss": 0.007, + "step": 598690 + }, + { + "epoch": 1.55, + "learning_rate": 6.721248584041204e-05, + "loss": 0.0073, + "step": 598700 + }, + { + "epoch": 1.55, + "learning_rate": 6.720859762404058e-05, + "loss": 0.0077, + "step": 598710 + }, + { + "epoch": 1.55, + "learning_rate": 6.720470940766911e-05, + "loss": 0.0091, + "step": 598720 + }, + { + "epoch": 1.55, + "learning_rate": 6.720082119129765e-05, + "loss": 0.0082, + "step": 598730 + }, + { + "epoch": 1.55, + "learning_rate": 6.719693297492618e-05, + "loss": 0.0102, + "step": 598740 + }, + { + "epoch": 1.55, + "learning_rate": 6.719304475855472e-05, + "loss": 0.0079, + "step": 598750 + }, + { + "epoch": 1.55, + "learning_rate": 6.718915654218325e-05, + "loss": 0.0085, + "step": 598760 + }, + { + "epoch": 1.55, + "learning_rate": 6.71852683258118e-05, + "loss": 0.0099, + "step": 598770 + }, + { + "epoch": 1.55, + "learning_rate": 6.718138010944032e-05, + "loss": 0.0075, + "step": 598780 + }, + { + "epoch": 1.55, + "learning_rate": 6.717749189306886e-05, + "loss": 0.0074, + "step": 598790 + }, + { + "epoch": 1.55, + "learning_rate": 6.71736036766974e-05, + "loss": 0.0107, + "step": 598800 + }, + { + "epoch": 1.55, + "learning_rate": 6.716971546032593e-05, + "loss": 0.0078, + "step": 598810 + }, + { + "epoch": 1.55, + "learning_rate": 6.716582724395446e-05, + "loss": 0.0078, + "step": 598820 + }, + { + "epoch": 1.55, + "learning_rate": 6.7161939027583e-05, + "loss": 0.0097, + "step": 598830 + }, + { + "epoch": 1.55, + "learning_rate": 6.715805081121153e-05, + "loss": 0.01, + "step": 598840 + }, + { + "epoch": 1.55, + "learning_rate": 6.715416259484007e-05, + "loss": 0.0053, + "step": 598850 + }, + { + "epoch": 1.55, + "learning_rate": 6.71502743784686e-05, + "loss": 0.0083, + "step": 598860 + }, + { + "epoch": 1.55, + "learning_rate": 6.714638616209714e-05, + "loss": 0.0096, + "step": 598870 + }, + { + "epoch": 1.55, + "learning_rate": 6.714249794572567e-05, + "loss": 0.0084, + "step": 598880 + }, + { + "epoch": 1.55, + "learning_rate": 6.713860972935421e-05, + "loss": 0.0073, + "step": 598890 + }, + { + "epoch": 1.55, + "learning_rate": 6.713472151298275e-05, + "loss": 0.0142, + "step": 598900 + }, + { + "epoch": 1.55, + "learning_rate": 6.713083329661128e-05, + "loss": 0.0083, + "step": 598910 + }, + { + "epoch": 1.55, + "learning_rate": 6.712694508023982e-05, + "loss": 0.0108, + "step": 598920 + }, + { + "epoch": 1.55, + "learning_rate": 6.712305686386835e-05, + "loss": 0.0088, + "step": 598930 + }, + { + "epoch": 1.55, + "learning_rate": 6.711916864749689e-05, + "loss": 0.0088, + "step": 598940 + }, + { + "epoch": 1.55, + "learning_rate": 6.711528043112542e-05, + "loss": 0.0081, + "step": 598950 + }, + { + "epoch": 1.55, + "learning_rate": 6.711139221475396e-05, + "loss": 0.0073, + "step": 598960 + }, + { + "epoch": 1.55, + "learning_rate": 6.710750399838249e-05, + "loss": 0.0096, + "step": 598970 + }, + { + "epoch": 1.55, + "learning_rate": 6.710361578201103e-05, + "loss": 0.0088, + "step": 598980 + }, + { + "epoch": 1.55, + "learning_rate": 6.709972756563957e-05, + "loss": 0.0084, + "step": 598990 + }, + { + "epoch": 1.55, + "learning_rate": 6.70958393492681e-05, + "loss": 0.0112, + "step": 599000 + }, + { + "epoch": 1.55, + "eval_cer": 0.881704085960102, + "eval_loss": 0.005739094223827124, + "eval_runtime": 107.7697, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.64, + "step": 599000 + }, + { + "epoch": 1.55, + "learning_rate": 6.709195113289664e-05, + "loss": 0.0065, + "step": 599010 + }, + { + "epoch": 1.55, + "learning_rate": 6.708806291652517e-05, + "loss": 0.0084, + "step": 599020 + }, + { + "epoch": 1.55, + "learning_rate": 6.708417470015371e-05, + "loss": 0.0085, + "step": 599030 + }, + { + "epoch": 1.55, + "learning_rate": 6.708028648378224e-05, + "loss": 0.0077, + "step": 599040 + }, + { + "epoch": 1.55, + "learning_rate": 6.707639826741078e-05, + "loss": 0.0118, + "step": 599050 + }, + { + "epoch": 1.55, + "learning_rate": 6.707251005103931e-05, + "loss": 0.008, + "step": 599060 + }, + { + "epoch": 1.55, + "learning_rate": 6.706862183466785e-05, + "loss": 0.0112, + "step": 599070 + }, + { + "epoch": 1.55, + "learning_rate": 6.706473361829638e-05, + "loss": 0.0076, + "step": 599080 + }, + { + "epoch": 1.55, + "learning_rate": 6.706084540192492e-05, + "loss": 0.0082, + "step": 599090 + }, + { + "epoch": 1.55, + "learning_rate": 6.705695718555345e-05, + "loss": 0.012, + "step": 599100 + }, + { + "epoch": 1.55, + "learning_rate": 6.705306896918199e-05, + "loss": 0.0068, + "step": 599110 + }, + { + "epoch": 1.55, + "learning_rate": 6.704918075281052e-05, + "loss": 0.0095, + "step": 599120 + }, + { + "epoch": 1.55, + "learning_rate": 6.704529253643906e-05, + "loss": 0.0082, + "step": 599130 + }, + { + "epoch": 1.55, + "learning_rate": 6.704140432006759e-05, + "loss": 0.0098, + "step": 599140 + }, + { + "epoch": 1.55, + "learning_rate": 6.703751610369613e-05, + "loss": 0.0087, + "step": 599150 + }, + { + "epoch": 1.55, + "learning_rate": 6.703362788732467e-05, + "loss": 0.0081, + "step": 599160 + }, + { + "epoch": 1.55, + "learning_rate": 6.70297396709532e-05, + "loss": 0.007, + "step": 599170 + }, + { + "epoch": 1.55, + "learning_rate": 6.702585145458174e-05, + "loss": 0.0097, + "step": 599180 + }, + { + "epoch": 1.55, + "learning_rate": 6.702196323821027e-05, + "loss": 0.008, + "step": 599190 + }, + { + "epoch": 1.55, + "learning_rate": 6.701807502183881e-05, + "loss": 0.0105, + "step": 599200 + }, + { + "epoch": 1.55, + "learning_rate": 6.701418680546734e-05, + "loss": 0.0087, + "step": 599210 + }, + { + "epoch": 1.55, + "learning_rate": 6.701029858909588e-05, + "loss": 0.0122, + "step": 599220 + }, + { + "epoch": 1.55, + "learning_rate": 6.700641037272441e-05, + "loss": 0.0083, + "step": 599230 + }, + { + "epoch": 1.55, + "learning_rate": 6.700252215635295e-05, + "loss": 0.0099, + "step": 599240 + }, + { + "epoch": 1.55, + "learning_rate": 6.69986339399815e-05, + "loss": 0.0188, + "step": 599250 + }, + { + "epoch": 1.55, + "learning_rate": 6.699474572361002e-05, + "loss": 0.0099, + "step": 599260 + }, + { + "epoch": 1.55, + "learning_rate": 6.699085750723856e-05, + "loss": 0.0088, + "step": 599270 + }, + { + "epoch": 1.55, + "learning_rate": 6.698696929086709e-05, + "loss": 0.0106, + "step": 599280 + }, + { + "epoch": 1.55, + "learning_rate": 6.698308107449563e-05, + "loss": 0.0096, + "step": 599290 + }, + { + "epoch": 1.55, + "learning_rate": 6.697919285812416e-05, + "loss": 0.0082, + "step": 599300 + }, + { + "epoch": 1.55, + "learning_rate": 6.697530464175269e-05, + "loss": 0.0108, + "step": 599310 + }, + { + "epoch": 1.55, + "learning_rate": 6.697141642538123e-05, + "loss": 0.0085, + "step": 599320 + }, + { + "epoch": 1.55, + "learning_rate": 6.696752820900976e-05, + "loss": 0.0092, + "step": 599330 + }, + { + "epoch": 1.55, + "learning_rate": 6.69636399926383e-05, + "loss": 0.0109, + "step": 599340 + }, + { + "epoch": 1.55, + "learning_rate": 6.695975177626684e-05, + "loss": 0.0089, + "step": 599350 + }, + { + "epoch": 1.55, + "learning_rate": 6.695586355989537e-05, + "loss": 0.009, + "step": 599360 + }, + { + "epoch": 1.55, + "learning_rate": 6.695197534352391e-05, + "loss": 0.0098, + "step": 599370 + }, + { + "epoch": 1.55, + "learning_rate": 6.694808712715244e-05, + "loss": 0.0071, + "step": 599380 + }, + { + "epoch": 1.55, + "learning_rate": 6.694419891078098e-05, + "loss": 0.0101, + "step": 599390 + }, + { + "epoch": 1.55, + "learning_rate": 6.694031069440951e-05, + "loss": 0.0071, + "step": 599400 + }, + { + "epoch": 1.55, + "learning_rate": 6.693642247803805e-05, + "loss": 0.0089, + "step": 599410 + }, + { + "epoch": 1.55, + "learning_rate": 6.69325342616666e-05, + "loss": 0.0098, + "step": 599420 + }, + { + "epoch": 1.55, + "learning_rate": 6.692864604529512e-05, + "loss": 0.0073, + "step": 599430 + }, + { + "epoch": 1.55, + "learning_rate": 6.692475782892366e-05, + "loss": 0.0079, + "step": 599440 + }, + { + "epoch": 1.55, + "learning_rate": 6.692086961255219e-05, + "loss": 0.0134, + "step": 599450 + }, + { + "epoch": 1.55, + "learning_rate": 6.691698139618073e-05, + "loss": 0.0066, + "step": 599460 + }, + { + "epoch": 1.55, + "learning_rate": 6.691309317980926e-05, + "loss": 0.0067, + "step": 599470 + }, + { + "epoch": 1.55, + "learning_rate": 6.69092049634378e-05, + "loss": 0.0087, + "step": 599480 + }, + { + "epoch": 1.55, + "learning_rate": 6.690531674706633e-05, + "loss": 0.0085, + "step": 599490 + }, + { + "epoch": 1.55, + "learning_rate": 6.690142853069487e-05, + "loss": 0.0096, + "step": 599500 + }, + { + "epoch": 1.55, + "learning_rate": 6.689754031432341e-05, + "loss": 0.0118, + "step": 599510 + }, + { + "epoch": 1.55, + "learning_rate": 6.689365209795194e-05, + "loss": 0.0102, + "step": 599520 + }, + { + "epoch": 1.55, + "learning_rate": 6.688976388158048e-05, + "loss": 0.0079, + "step": 599530 + }, + { + "epoch": 1.55, + "learning_rate": 6.688587566520901e-05, + "loss": 0.0082, + "step": 599540 + }, + { + "epoch": 1.55, + "learning_rate": 6.688198744883754e-05, + "loss": 0.0094, + "step": 599550 + }, + { + "epoch": 1.55, + "learning_rate": 6.687809923246608e-05, + "loss": 0.0134, + "step": 599560 + }, + { + "epoch": 1.55, + "learning_rate": 6.687421101609461e-05, + "loss": 0.0088, + "step": 599570 + }, + { + "epoch": 1.55, + "learning_rate": 6.687032279972315e-05, + "loss": 0.0068, + "step": 599580 + }, + { + "epoch": 1.55, + "learning_rate": 6.686643458335168e-05, + "loss": 0.0087, + "step": 599590 + }, + { + "epoch": 1.55, + "learning_rate": 6.686254636698022e-05, + "loss": 0.0071, + "step": 599600 + }, + { + "epoch": 1.55, + "learning_rate": 6.685865815060876e-05, + "loss": 0.014, + "step": 599610 + }, + { + "epoch": 1.55, + "learning_rate": 6.685476993423729e-05, + "loss": 0.0076, + "step": 599620 + }, + { + "epoch": 1.55, + "learning_rate": 6.685088171786583e-05, + "loss": 0.0071, + "step": 599630 + }, + { + "epoch": 1.55, + "learning_rate": 6.684699350149436e-05, + "loss": 0.0113, + "step": 599640 + }, + { + "epoch": 1.55, + "learning_rate": 6.68431052851229e-05, + "loss": 0.0092, + "step": 599650 + }, + { + "epoch": 1.55, + "learning_rate": 6.683921706875143e-05, + "loss": 0.0128, + "step": 599660 + }, + { + "epoch": 1.55, + "learning_rate": 6.683532885237997e-05, + "loss": 0.0106, + "step": 599670 + }, + { + "epoch": 1.55, + "learning_rate": 6.683144063600851e-05, + "loss": 0.0065, + "step": 599680 + }, + { + "epoch": 1.55, + "learning_rate": 6.682755241963704e-05, + "loss": 0.0067, + "step": 599690 + }, + { + "epoch": 1.55, + "learning_rate": 6.682366420326558e-05, + "loss": 0.0109, + "step": 599700 + }, + { + "epoch": 1.55, + "learning_rate": 6.681977598689411e-05, + "loss": 0.0079, + "step": 599710 + }, + { + "epoch": 1.55, + "learning_rate": 6.681588777052265e-05, + "loss": 0.0082, + "step": 599720 + }, + { + "epoch": 1.55, + "learning_rate": 6.681199955415118e-05, + "loss": 0.0092, + "step": 599730 + }, + { + "epoch": 1.55, + "learning_rate": 6.680811133777972e-05, + "loss": 0.0078, + "step": 599740 + }, + { + "epoch": 1.55, + "learning_rate": 6.680422312140825e-05, + "loss": 0.0088, + "step": 599750 + }, + { + "epoch": 1.55, + "learning_rate": 6.680033490503679e-05, + "loss": 0.0063, + "step": 599760 + }, + { + "epoch": 1.55, + "learning_rate": 6.679644668866533e-05, + "loss": 0.0087, + "step": 599770 + }, + { + "epoch": 1.55, + "learning_rate": 6.679255847229386e-05, + "loss": 0.0092, + "step": 599780 + }, + { + "epoch": 1.55, + "learning_rate": 6.67886702559224e-05, + "loss": 0.009, + "step": 599790 + }, + { + "epoch": 1.55, + "learning_rate": 6.678478203955093e-05, + "loss": 0.0072, + "step": 599800 + }, + { + "epoch": 1.55, + "learning_rate": 6.678089382317946e-05, + "loss": 0.0078, + "step": 599810 + }, + { + "epoch": 1.55, + "learning_rate": 6.6777005606808e-05, + "loss": 0.008, + "step": 599820 + }, + { + "epoch": 1.55, + "learning_rate": 6.677311739043653e-05, + "loss": 0.0087, + "step": 599830 + }, + { + "epoch": 1.55, + "learning_rate": 6.676922917406507e-05, + "loss": 0.0121, + "step": 599840 + }, + { + "epoch": 1.55, + "learning_rate": 6.67653409576936e-05, + "loss": 0.0079, + "step": 599850 + }, + { + "epoch": 1.55, + "learning_rate": 6.676145274132214e-05, + "loss": 0.0091, + "step": 599860 + }, + { + "epoch": 1.55, + "learning_rate": 6.675756452495068e-05, + "loss": 0.0075, + "step": 599870 + }, + { + "epoch": 1.55, + "learning_rate": 6.675367630857921e-05, + "loss": 0.0072, + "step": 599880 + }, + { + "epoch": 1.56, + "learning_rate": 6.674978809220775e-05, + "loss": 0.0102, + "step": 599890 + }, + { + "epoch": 1.56, + "learning_rate": 6.674589987583628e-05, + "loss": 0.0079, + "step": 599900 + }, + { + "epoch": 1.56, + "learning_rate": 6.674201165946482e-05, + "loss": 0.0082, + "step": 599910 + }, + { + "epoch": 1.56, + "learning_rate": 6.673812344309335e-05, + "loss": 0.0095, + "step": 599920 + }, + { + "epoch": 1.56, + "learning_rate": 6.673423522672189e-05, + "loss": 0.0092, + "step": 599930 + }, + { + "epoch": 1.56, + "learning_rate": 6.673034701035043e-05, + "loss": 0.0092, + "step": 599940 + }, + { + "epoch": 1.56, + "learning_rate": 6.672645879397896e-05, + "loss": 0.0078, + "step": 599950 + }, + { + "epoch": 1.56, + "learning_rate": 6.67225705776075e-05, + "loss": 0.0104, + "step": 599960 + }, + { + "epoch": 1.56, + "learning_rate": 6.671868236123603e-05, + "loss": 0.0087, + "step": 599970 + }, + { + "epoch": 1.56, + "learning_rate": 6.671479414486457e-05, + "loss": 0.0091, + "step": 599980 + }, + { + "epoch": 1.56, + "learning_rate": 6.67109059284931e-05, + "loss": 0.0086, + "step": 599990 + }, + { + "epoch": 1.56, + "learning_rate": 6.670701771212164e-05, + "loss": 0.0143, + "step": 600000 + }, + { + "epoch": 1.56, + "eval_cer": 0.88167329394755, + "eval_loss": 0.005724812392145395, + "eval_runtime": 107.7634, + "eval_samples_per_second": 18.559, + "eval_steps_per_second": 4.64, + "step": 600000 + }, + { + "epoch": 1.56, + "learning_rate": 6.670312949575017e-05, + "loss": 0.0087, + "step": 600010 + }, + { + "epoch": 1.56, + "learning_rate": 6.669924127937871e-05, + "loss": 0.0082, + "step": 600020 + }, + { + "epoch": 1.56, + "learning_rate": 6.669535306300725e-05, + "loss": 0.0091, + "step": 600030 + }, + { + "epoch": 1.56, + "learning_rate": 6.669146484663578e-05, + "loss": 0.009, + "step": 600040 + }, + { + "epoch": 1.56, + "learning_rate": 6.668757663026431e-05, + "loss": 0.0082, + "step": 600050 + }, + { + "epoch": 1.56, + "learning_rate": 6.668368841389285e-05, + "loss": 0.0089, + "step": 600060 + }, + { + "epoch": 1.56, + "learning_rate": 6.667980019752138e-05, + "loss": 0.01, + "step": 600070 + }, + { + "epoch": 1.56, + "learning_rate": 6.667591198114992e-05, + "loss": 0.0091, + "step": 600080 + }, + { + "epoch": 1.56, + "learning_rate": 6.667202376477845e-05, + "loss": 0.0097, + "step": 600090 + }, + { + "epoch": 1.56, + "learning_rate": 6.666813554840699e-05, + "loss": 0.0077, + "step": 600100 + }, + { + "epoch": 1.56, + "learning_rate": 6.666424733203552e-05, + "loss": 0.0079, + "step": 600110 + }, + { + "epoch": 1.56, + "learning_rate": 6.666035911566406e-05, + "loss": 0.0107, + "step": 600120 + }, + { + "epoch": 1.56, + "learning_rate": 6.66564708992926e-05, + "loss": 0.0074, + "step": 600130 + }, + { + "epoch": 1.56, + "learning_rate": 6.665258268292113e-05, + "loss": 0.008, + "step": 600140 + }, + { + "epoch": 1.56, + "learning_rate": 6.664869446654967e-05, + "loss": 0.0108, + "step": 600150 + }, + { + "epoch": 1.56, + "learning_rate": 6.66448062501782e-05, + "loss": 0.0075, + "step": 600160 + }, + { + "epoch": 1.56, + "learning_rate": 6.664091803380674e-05, + "loss": 0.007, + "step": 600170 + }, + { + "epoch": 1.56, + "learning_rate": 6.663702981743527e-05, + "loss": 0.0065, + "step": 600180 + }, + { + "epoch": 1.56, + "learning_rate": 6.663314160106381e-05, + "loss": 0.0062, + "step": 600190 + }, + { + "epoch": 1.56, + "learning_rate": 6.662925338469235e-05, + "loss": 0.0082, + "step": 600200 + }, + { + "epoch": 1.56, + "learning_rate": 6.662536516832088e-05, + "loss": 0.008, + "step": 600210 + }, + { + "epoch": 1.56, + "learning_rate": 6.662147695194942e-05, + "loss": 0.0093, + "step": 600220 + }, + { + "epoch": 1.56, + "learning_rate": 6.661758873557795e-05, + "loss": 0.0108, + "step": 600230 + }, + { + "epoch": 1.56, + "learning_rate": 6.661370051920649e-05, + "loss": 0.011, + "step": 600240 + }, + { + "epoch": 1.56, + "learning_rate": 6.660981230283502e-05, + "loss": 0.0079, + "step": 600250 + }, + { + "epoch": 1.56, + "learning_rate": 6.660592408646356e-05, + "loss": 0.0108, + "step": 600260 + }, + { + "epoch": 1.56, + "learning_rate": 6.660203587009209e-05, + "loss": 0.0105, + "step": 600270 + }, + { + "epoch": 1.56, + "learning_rate": 6.659814765372063e-05, + "loss": 0.0119, + "step": 600280 + }, + { + "epoch": 1.56, + "learning_rate": 6.659425943734917e-05, + "loss": 0.0065, + "step": 600290 + }, + { + "epoch": 1.56, + "learning_rate": 6.65903712209777e-05, + "loss": 0.0105, + "step": 600300 + }, + { + "epoch": 1.56, + "learning_rate": 6.658648300460623e-05, + "loss": 0.0068, + "step": 600310 + }, + { + "epoch": 1.56, + "learning_rate": 6.658259478823477e-05, + "loss": 0.0079, + "step": 600320 + }, + { + "epoch": 1.56, + "learning_rate": 6.65787065718633e-05, + "loss": 0.0062, + "step": 600330 + }, + { + "epoch": 1.56, + "learning_rate": 6.657481835549184e-05, + "loss": 0.0082, + "step": 600340 + }, + { + "epoch": 1.56, + "learning_rate": 6.657093013912037e-05, + "loss": 0.008, + "step": 600350 + }, + { + "epoch": 1.56, + "learning_rate": 6.656704192274891e-05, + "loss": 0.0094, + "step": 600360 + }, + { + "epoch": 1.56, + "learning_rate": 6.656315370637744e-05, + "loss": 0.0088, + "step": 600370 + }, + { + "epoch": 1.56, + "learning_rate": 6.655926549000598e-05, + "loss": 0.0056, + "step": 600380 + }, + { + "epoch": 1.56, + "learning_rate": 6.655537727363452e-05, + "loss": 0.008, + "step": 600390 + }, + { + "epoch": 1.56, + "learning_rate": 6.655148905726305e-05, + "loss": 0.0077, + "step": 600400 + }, + { + "epoch": 1.56, + "learning_rate": 6.654760084089159e-05, + "loss": 0.0078, + "step": 600410 + }, + { + "epoch": 1.56, + "learning_rate": 6.654371262452012e-05, + "loss": 0.0121, + "step": 600420 + }, + { + "epoch": 1.56, + "learning_rate": 6.653982440814866e-05, + "loss": 0.0121, + "step": 600430 + }, + { + "epoch": 1.56, + "learning_rate": 6.653593619177719e-05, + "loss": 0.0083, + "step": 600440 + }, + { + "epoch": 1.56, + "learning_rate": 6.653204797540573e-05, + "loss": 0.0074, + "step": 600450 + }, + { + "epoch": 1.56, + "learning_rate": 6.652815975903426e-05, + "loss": 0.01, + "step": 600460 + }, + { + "epoch": 1.56, + "learning_rate": 6.65242715426628e-05, + "loss": 0.009, + "step": 600470 + }, + { + "epoch": 1.56, + "learning_rate": 6.652038332629134e-05, + "loss": 0.0098, + "step": 600480 + }, + { + "epoch": 1.56, + "learning_rate": 6.651649510991987e-05, + "loss": 0.0093, + "step": 600490 + }, + { + "epoch": 1.56, + "learning_rate": 6.651260689354841e-05, + "loss": 0.0069, + "step": 600500 + }, + { + "epoch": 1.56, + "learning_rate": 6.650871867717694e-05, + "loss": 0.0128, + "step": 600510 + }, + { + "epoch": 1.56, + "learning_rate": 6.650483046080548e-05, + "loss": 0.0101, + "step": 600520 + }, + { + "epoch": 1.56, + "learning_rate": 6.650094224443401e-05, + "loss": 0.0082, + "step": 600530 + }, + { + "epoch": 1.56, + "learning_rate": 6.649705402806255e-05, + "loss": 0.009, + "step": 600540 + }, + { + "epoch": 1.56, + "learning_rate": 6.649316581169108e-05, + "loss": 0.0088, + "step": 600550 + }, + { + "epoch": 1.56, + "learning_rate": 6.648927759531961e-05, + "loss": 0.0079, + "step": 600560 + }, + { + "epoch": 1.56, + "learning_rate": 6.648538937894815e-05, + "loss": 0.0088, + "step": 600570 + }, + { + "epoch": 1.56, + "learning_rate": 6.648150116257669e-05, + "loss": 0.0119, + "step": 600580 + }, + { + "epoch": 1.56, + "learning_rate": 6.647761294620522e-05, + "loss": 0.011, + "step": 600590 + }, + { + "epoch": 1.56, + "learning_rate": 6.647372472983376e-05, + "loss": 0.0096, + "step": 600600 + }, + { + "epoch": 1.56, + "learning_rate": 6.646983651346229e-05, + "loss": 0.0096, + "step": 600610 + }, + { + "epoch": 1.56, + "learning_rate": 6.646594829709083e-05, + "loss": 0.0112, + "step": 600620 + }, + { + "epoch": 1.56, + "learning_rate": 6.646206008071936e-05, + "loss": 0.01, + "step": 600630 + }, + { + "epoch": 1.56, + "learning_rate": 6.64581718643479e-05, + "loss": 0.008, + "step": 600640 + }, + { + "epoch": 1.56, + "learning_rate": 6.645428364797644e-05, + "loss": 0.0132, + "step": 600650 + }, + { + "epoch": 1.56, + "learning_rate": 6.645039543160497e-05, + "loss": 0.0124, + "step": 600660 + }, + { + "epoch": 1.56, + "learning_rate": 6.644650721523351e-05, + "loss": 0.0085, + "step": 600670 + }, + { + "epoch": 1.56, + "learning_rate": 6.644261899886204e-05, + "loss": 0.0087, + "step": 600680 + }, + { + "epoch": 1.56, + "learning_rate": 6.643873078249058e-05, + "loss": 0.007, + "step": 600690 + }, + { + "epoch": 1.56, + "learning_rate": 6.643484256611911e-05, + "loss": 0.0091, + "step": 600700 + }, + { + "epoch": 1.56, + "learning_rate": 6.643095434974765e-05, + "loss": 0.01, + "step": 600710 + }, + { + "epoch": 1.56, + "learning_rate": 6.642706613337618e-05, + "loss": 0.0101, + "step": 600720 + }, + { + "epoch": 1.56, + "learning_rate": 6.642317791700472e-05, + "loss": 0.009, + "step": 600730 + }, + { + "epoch": 1.56, + "learning_rate": 6.641928970063326e-05, + "loss": 0.0071, + "step": 600740 + }, + { + "epoch": 1.56, + "learning_rate": 6.641540148426179e-05, + "loss": 0.0078, + "step": 600750 + }, + { + "epoch": 1.56, + "learning_rate": 6.641151326789033e-05, + "loss": 0.0092, + "step": 600760 + }, + { + "epoch": 1.56, + "learning_rate": 6.640762505151886e-05, + "loss": 0.0087, + "step": 600770 + }, + { + "epoch": 1.56, + "learning_rate": 6.64037368351474e-05, + "loss": 0.0089, + "step": 600780 + }, + { + "epoch": 1.56, + "learning_rate": 6.639984861877593e-05, + "loss": 0.0089, + "step": 600790 + }, + { + "epoch": 1.56, + "learning_rate": 6.639596040240446e-05, + "loss": 0.0158, + "step": 600800 + }, + { + "epoch": 1.56, + "learning_rate": 6.6392072186033e-05, + "loss": 0.0106, + "step": 600810 + }, + { + "epoch": 1.56, + "learning_rate": 6.638818396966153e-05, + "loss": 0.0124, + "step": 600820 + }, + { + "epoch": 1.56, + "learning_rate": 6.638429575329007e-05, + "loss": 0.0094, + "step": 600830 + }, + { + "epoch": 1.56, + "learning_rate": 6.638040753691861e-05, + "loss": 0.0108, + "step": 600840 + }, + { + "epoch": 1.56, + "learning_rate": 6.637651932054714e-05, + "loss": 0.0098, + "step": 600850 + }, + { + "epoch": 1.56, + "learning_rate": 6.637263110417568e-05, + "loss": 0.0073, + "step": 600860 + }, + { + "epoch": 1.56, + "learning_rate": 6.636874288780421e-05, + "loss": 0.0097, + "step": 600870 + }, + { + "epoch": 1.56, + "learning_rate": 6.636485467143275e-05, + "loss": 0.0109, + "step": 600880 + }, + { + "epoch": 1.56, + "learning_rate": 6.636096645506128e-05, + "loss": 0.0088, + "step": 600890 + }, + { + "epoch": 1.56, + "learning_rate": 6.635707823868982e-05, + "loss": 0.0098, + "step": 600900 + }, + { + "epoch": 1.56, + "learning_rate": 6.635319002231836e-05, + "loss": 0.0078, + "step": 600910 + }, + { + "epoch": 1.56, + "learning_rate": 6.634930180594689e-05, + "loss": 0.0076, + "step": 600920 + }, + { + "epoch": 1.56, + "learning_rate": 6.634541358957543e-05, + "loss": 0.0075, + "step": 600930 + }, + { + "epoch": 1.56, + "learning_rate": 6.634152537320396e-05, + "loss": 0.0098, + "step": 600940 + }, + { + "epoch": 1.56, + "learning_rate": 6.63376371568325e-05, + "loss": 0.0087, + "step": 600950 + }, + { + "epoch": 1.56, + "learning_rate": 6.633374894046103e-05, + "loss": 0.007, + "step": 600960 + }, + { + "epoch": 1.56, + "learning_rate": 6.632986072408957e-05, + "loss": 0.0064, + "step": 600970 + }, + { + "epoch": 1.56, + "learning_rate": 6.63259725077181e-05, + "loss": 0.0097, + "step": 600980 + }, + { + "epoch": 1.56, + "learning_rate": 6.632208429134664e-05, + "loss": 0.0065, + "step": 600990 + }, + { + "epoch": 1.56, + "learning_rate": 6.631819607497518e-05, + "loss": 0.0124, + "step": 601000 + }, + { + "epoch": 1.56, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.005832574795931578, + "eval_runtime": 107.8162, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.638, + "step": 601000 + }, + { + "epoch": 1.56, + "learning_rate": 6.631430785860371e-05, + "loss": 0.0098, + "step": 601010 + }, + { + "epoch": 1.56, + "learning_rate": 6.631041964223225e-05, + "loss": 0.0111, + "step": 601020 + }, + { + "epoch": 1.56, + "learning_rate": 6.630653142586078e-05, + "loss": 0.0087, + "step": 601030 + }, + { + "epoch": 1.56, + "learning_rate": 6.630264320948931e-05, + "loss": 0.0086, + "step": 601040 + }, + { + "epoch": 1.56, + "learning_rate": 6.629875499311785e-05, + "loss": 0.0123, + "step": 601050 + }, + { + "epoch": 1.56, + "learning_rate": 6.629486677674638e-05, + "loss": 0.0113, + "step": 601060 + }, + { + "epoch": 1.56, + "learning_rate": 6.629097856037492e-05, + "loss": 0.0111, + "step": 601070 + }, + { + "epoch": 1.56, + "learning_rate": 6.628709034400345e-05, + "loss": 0.01, + "step": 601080 + }, + { + "epoch": 1.56, + "learning_rate": 6.628320212763199e-05, + "loss": 0.0083, + "step": 601090 + }, + { + "epoch": 1.56, + "learning_rate": 6.627931391126053e-05, + "loss": 0.0084, + "step": 601100 + }, + { + "epoch": 1.56, + "learning_rate": 6.627542569488906e-05, + "loss": 0.0065, + "step": 601110 + }, + { + "epoch": 1.56, + "learning_rate": 6.62715374785176e-05, + "loss": 0.0061, + "step": 601120 + }, + { + "epoch": 1.56, + "learning_rate": 6.626764926214613e-05, + "loss": 0.0102, + "step": 601130 + }, + { + "epoch": 1.56, + "learning_rate": 6.626376104577467e-05, + "loss": 0.0075, + "step": 601140 + }, + { + "epoch": 1.56, + "learning_rate": 6.62598728294032e-05, + "loss": 0.0083, + "step": 601150 + }, + { + "epoch": 1.56, + "learning_rate": 6.625598461303174e-05, + "loss": 0.008, + "step": 601160 + }, + { + "epoch": 1.56, + "learning_rate": 6.625209639666028e-05, + "loss": 0.01, + "step": 601170 + }, + { + "epoch": 1.56, + "learning_rate": 6.624820818028881e-05, + "loss": 0.0061, + "step": 601180 + }, + { + "epoch": 1.56, + "learning_rate": 6.624431996391735e-05, + "loss": 0.0123, + "step": 601190 + }, + { + "epoch": 1.56, + "learning_rate": 6.624043174754588e-05, + "loss": 0.0075, + "step": 601200 + }, + { + "epoch": 1.56, + "learning_rate": 6.623654353117442e-05, + "loss": 0.0097, + "step": 601210 + }, + { + "epoch": 1.56, + "learning_rate": 6.623265531480295e-05, + "loss": 0.0089, + "step": 601220 + }, + { + "epoch": 1.56, + "learning_rate": 6.622876709843149e-05, + "loss": 0.0095, + "step": 601230 + }, + { + "epoch": 1.56, + "learning_rate": 6.622487888206002e-05, + "loss": 0.0077, + "step": 601240 + }, + { + "epoch": 1.56, + "learning_rate": 6.622099066568856e-05, + "loss": 0.0075, + "step": 601250 + }, + { + "epoch": 1.56, + "learning_rate": 6.62171024493171e-05, + "loss": 0.0133, + "step": 601260 + }, + { + "epoch": 1.56, + "learning_rate": 6.621321423294563e-05, + "loss": 0.0081, + "step": 601270 + }, + { + "epoch": 1.56, + "learning_rate": 6.620932601657417e-05, + "loss": 0.0083, + "step": 601280 + }, + { + "epoch": 1.56, + "learning_rate": 6.62054378002027e-05, + "loss": 0.0116, + "step": 601290 + }, + { + "epoch": 1.56, + "learning_rate": 6.620154958383123e-05, + "loss": 0.0101, + "step": 601300 + }, + { + "epoch": 1.56, + "learning_rate": 6.619766136745977e-05, + "loss": 0.0072, + "step": 601310 + }, + { + "epoch": 1.56, + "learning_rate": 6.61937731510883e-05, + "loss": 0.0084, + "step": 601320 + }, + { + "epoch": 1.56, + "learning_rate": 6.618988493471684e-05, + "loss": 0.0081, + "step": 601330 + }, + { + "epoch": 1.56, + "learning_rate": 6.618599671834537e-05, + "loss": 0.0105, + "step": 601340 + }, + { + "epoch": 1.56, + "learning_rate": 6.618210850197391e-05, + "loss": 0.0088, + "step": 601350 + }, + { + "epoch": 1.56, + "learning_rate": 6.617822028560245e-05, + "loss": 0.0083, + "step": 601360 + }, + { + "epoch": 1.56, + "learning_rate": 6.617433206923098e-05, + "loss": 0.0077, + "step": 601370 + }, + { + "epoch": 1.56, + "learning_rate": 6.617044385285952e-05, + "loss": 0.0097, + "step": 601380 + }, + { + "epoch": 1.56, + "learning_rate": 6.616655563648805e-05, + "loss": 0.0105, + "step": 601390 + }, + { + "epoch": 1.56, + "learning_rate": 6.616266742011659e-05, + "loss": 0.0101, + "step": 601400 + }, + { + "epoch": 1.56, + "learning_rate": 6.615877920374512e-05, + "loss": 0.0087, + "step": 601410 + }, + { + "epoch": 1.56, + "learning_rate": 6.615489098737366e-05, + "loss": 0.0107, + "step": 601420 + }, + { + "epoch": 1.56, + "learning_rate": 6.61510027710022e-05, + "loss": 0.0099, + "step": 601430 + }, + { + "epoch": 1.56, + "learning_rate": 6.614711455463073e-05, + "loss": 0.0076, + "step": 601440 + }, + { + "epoch": 1.56, + "learning_rate": 6.614322633825927e-05, + "loss": 0.0069, + "step": 601450 + }, + { + "epoch": 1.56, + "learning_rate": 6.61393381218878e-05, + "loss": 0.0065, + "step": 601460 + }, + { + "epoch": 1.56, + "learning_rate": 6.613544990551634e-05, + "loss": 0.0108, + "step": 601470 + }, + { + "epoch": 1.56, + "learning_rate": 6.613156168914487e-05, + "loss": 0.0078, + "step": 601480 + }, + { + "epoch": 1.56, + "learning_rate": 6.612767347277341e-05, + "loss": 0.0104, + "step": 601490 + }, + { + "epoch": 1.56, + "learning_rate": 6.612378525640194e-05, + "loss": 0.0084, + "step": 601500 + }, + { + "epoch": 1.56, + "learning_rate": 6.611989704003048e-05, + "loss": 0.0081, + "step": 601510 + }, + { + "epoch": 1.56, + "learning_rate": 6.611600882365902e-05, + "loss": 0.0097, + "step": 601520 + }, + { + "epoch": 1.56, + "learning_rate": 6.611212060728755e-05, + "loss": 0.0078, + "step": 601530 + }, + { + "epoch": 1.56, + "learning_rate": 6.610823239091608e-05, + "loss": 0.0094, + "step": 601540 + }, + { + "epoch": 1.56, + "learning_rate": 6.610434417454462e-05, + "loss": 0.0078, + "step": 601550 + }, + { + "epoch": 1.56, + "learning_rate": 6.610045595817315e-05, + "loss": 0.009, + "step": 601560 + }, + { + "epoch": 1.56, + "learning_rate": 6.609656774180169e-05, + "loss": 0.0087, + "step": 601570 + }, + { + "epoch": 1.56, + "learning_rate": 6.609267952543022e-05, + "loss": 0.0075, + "step": 601580 + }, + { + "epoch": 1.56, + "learning_rate": 6.608879130905876e-05, + "loss": 0.0071, + "step": 601590 + }, + { + "epoch": 1.56, + "learning_rate": 6.608490309268729e-05, + "loss": 0.0077, + "step": 601600 + }, + { + "epoch": 1.56, + "learning_rate": 6.608101487631583e-05, + "loss": 0.0088, + "step": 601610 + }, + { + "epoch": 1.56, + "learning_rate": 6.607712665994437e-05, + "loss": 0.0073, + "step": 601620 + }, + { + "epoch": 1.56, + "learning_rate": 6.60732384435729e-05, + "loss": 0.0099, + "step": 601630 + }, + { + "epoch": 1.56, + "learning_rate": 6.606935022720144e-05, + "loss": 0.0121, + "step": 601640 + }, + { + "epoch": 1.56, + "learning_rate": 6.606546201082997e-05, + "loss": 0.0078, + "step": 601650 + }, + { + "epoch": 1.56, + "learning_rate": 6.606157379445851e-05, + "loss": 0.0079, + "step": 601660 + }, + { + "epoch": 1.56, + "learning_rate": 6.605768557808704e-05, + "loss": 0.0097, + "step": 601670 + }, + { + "epoch": 1.56, + "learning_rate": 6.605379736171558e-05, + "loss": 0.0083, + "step": 601680 + }, + { + "epoch": 1.56, + "learning_rate": 6.604990914534412e-05, + "loss": 0.0093, + "step": 601690 + }, + { + "epoch": 1.56, + "learning_rate": 6.604602092897265e-05, + "loss": 0.0095, + "step": 601700 + }, + { + "epoch": 1.56, + "learning_rate": 6.604213271260119e-05, + "loss": 0.0134, + "step": 601710 + }, + { + "epoch": 1.56, + "learning_rate": 6.603824449622972e-05, + "loss": 0.0096, + "step": 601720 + }, + { + "epoch": 1.56, + "learning_rate": 6.603435627985826e-05, + "loss": 0.0075, + "step": 601730 + }, + { + "epoch": 1.56, + "learning_rate": 6.603046806348679e-05, + "loss": 0.0077, + "step": 601740 + }, + { + "epoch": 1.56, + "learning_rate": 6.602657984711533e-05, + "loss": 0.0071, + "step": 601750 + }, + { + "epoch": 1.56, + "learning_rate": 6.602269163074386e-05, + "loss": 0.0073, + "step": 601760 + }, + { + "epoch": 1.56, + "learning_rate": 6.60188034143724e-05, + "loss": 0.0092, + "step": 601770 + }, + { + "epoch": 1.56, + "learning_rate": 6.601491519800094e-05, + "loss": 0.0067, + "step": 601780 + }, + { + "epoch": 1.56, + "learning_rate": 6.601102698162947e-05, + "loss": 0.0103, + "step": 601790 + }, + { + "epoch": 1.56, + "learning_rate": 6.6007138765258e-05, + "loss": 0.0107, + "step": 601800 + }, + { + "epoch": 1.56, + "learning_rate": 6.600325054888654e-05, + "loss": 0.009, + "step": 601810 + }, + { + "epoch": 1.56, + "learning_rate": 6.599936233251507e-05, + "loss": 0.0071, + "step": 601820 + }, + { + "epoch": 1.56, + "learning_rate": 6.599547411614361e-05, + "loss": 0.0101, + "step": 601830 + }, + { + "epoch": 1.56, + "learning_rate": 6.599158589977214e-05, + "loss": 0.007, + "step": 601840 + }, + { + "epoch": 1.56, + "learning_rate": 6.598769768340068e-05, + "loss": 0.0064, + "step": 601850 + }, + { + "epoch": 1.56, + "learning_rate": 6.598380946702921e-05, + "loss": 0.0088, + "step": 601860 + }, + { + "epoch": 1.56, + "learning_rate": 6.597992125065775e-05, + "loss": 0.0098, + "step": 601870 + }, + { + "epoch": 1.56, + "learning_rate": 6.597603303428629e-05, + "loss": 0.0095, + "step": 601880 + }, + { + "epoch": 1.56, + "learning_rate": 6.597214481791482e-05, + "loss": 0.01, + "step": 601890 + }, + { + "epoch": 1.56, + "learning_rate": 6.596825660154336e-05, + "loss": 0.0119, + "step": 601900 + }, + { + "epoch": 1.56, + "learning_rate": 6.596436838517189e-05, + "loss": 0.0071, + "step": 601910 + }, + { + "epoch": 1.56, + "learning_rate": 6.596048016880043e-05, + "loss": 0.0076, + "step": 601920 + }, + { + "epoch": 1.56, + "learning_rate": 6.595659195242896e-05, + "loss": 0.0066, + "step": 601930 + }, + { + "epoch": 1.56, + "learning_rate": 6.59527037360575e-05, + "loss": 0.006, + "step": 601940 + }, + { + "epoch": 1.56, + "learning_rate": 6.594881551968603e-05, + "loss": 0.01, + "step": 601950 + }, + { + "epoch": 1.56, + "learning_rate": 6.594492730331457e-05, + "loss": 0.0086, + "step": 601960 + }, + { + "epoch": 1.56, + "learning_rate": 6.594103908694311e-05, + "loss": 0.0081, + "step": 601970 + }, + { + "epoch": 1.56, + "learning_rate": 6.593715087057164e-05, + "loss": 0.0072, + "step": 601980 + }, + { + "epoch": 1.56, + "learning_rate": 6.593326265420018e-05, + "loss": 0.0094, + "step": 601990 + }, + { + "epoch": 1.56, + "learning_rate": 6.592937443782871e-05, + "loss": 0.0099, + "step": 602000 + }, + { + "epoch": 1.56, + "eval_cer": 0.8817208816033121, + "eval_loss": 0.005837557837367058, + "eval_runtime": 107.7975, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 602000 + }, + { + "epoch": 1.56, + "learning_rate": 6.592548622145725e-05, + "loss": 0.0063, + "step": 602010 + }, + { + "epoch": 1.56, + "learning_rate": 6.592159800508578e-05, + "loss": 0.0104, + "step": 602020 + }, + { + "epoch": 1.56, + "learning_rate": 6.591770978871432e-05, + "loss": 0.0086, + "step": 602030 + }, + { + "epoch": 1.56, + "learning_rate": 6.591382157234285e-05, + "loss": 0.0066, + "step": 602040 + }, + { + "epoch": 1.56, + "learning_rate": 6.590993335597138e-05, + "loss": 0.0067, + "step": 602050 + }, + { + "epoch": 1.56, + "learning_rate": 6.590604513959992e-05, + "loss": 0.0074, + "step": 602060 + }, + { + "epoch": 1.56, + "learning_rate": 6.590215692322846e-05, + "loss": 0.011, + "step": 602070 + }, + { + "epoch": 1.56, + "learning_rate": 6.589826870685699e-05, + "loss": 0.0068, + "step": 602080 + }, + { + "epoch": 1.56, + "learning_rate": 6.589438049048553e-05, + "loss": 0.0078, + "step": 602090 + }, + { + "epoch": 1.56, + "learning_rate": 6.589049227411406e-05, + "loss": 0.0103, + "step": 602100 + }, + { + "epoch": 1.56, + "learning_rate": 6.58866040577426e-05, + "loss": 0.0112, + "step": 602110 + }, + { + "epoch": 1.56, + "learning_rate": 6.588271584137113e-05, + "loss": 0.0069, + "step": 602120 + }, + { + "epoch": 1.56, + "learning_rate": 6.587882762499967e-05, + "loss": 0.0076, + "step": 602130 + }, + { + "epoch": 1.56, + "learning_rate": 6.587493940862821e-05, + "loss": 0.0092, + "step": 602140 + }, + { + "epoch": 1.56, + "learning_rate": 6.587105119225674e-05, + "loss": 0.0118, + "step": 602150 + }, + { + "epoch": 1.56, + "learning_rate": 6.586716297588528e-05, + "loss": 0.013, + "step": 602160 + }, + { + "epoch": 1.56, + "learning_rate": 6.586327475951381e-05, + "loss": 0.0072, + "step": 602170 + }, + { + "epoch": 1.56, + "learning_rate": 6.585938654314235e-05, + "loss": 0.0082, + "step": 602180 + }, + { + "epoch": 1.56, + "learning_rate": 6.585549832677088e-05, + "loss": 0.0095, + "step": 602190 + }, + { + "epoch": 1.56, + "learning_rate": 6.585161011039942e-05, + "loss": 0.0088, + "step": 602200 + }, + { + "epoch": 1.56, + "learning_rate": 6.584772189402795e-05, + "loss": 0.0056, + "step": 602210 + }, + { + "epoch": 1.56, + "learning_rate": 6.584383367765649e-05, + "loss": 0.0086, + "step": 602220 + }, + { + "epoch": 1.56, + "learning_rate": 6.583994546128503e-05, + "loss": 0.0081, + "step": 602230 + }, + { + "epoch": 1.56, + "learning_rate": 6.583605724491356e-05, + "loss": 0.0093, + "step": 602240 + }, + { + "epoch": 1.56, + "learning_rate": 6.58321690285421e-05, + "loss": 0.0087, + "step": 602250 + }, + { + "epoch": 1.56, + "learning_rate": 6.582828081217063e-05, + "loss": 0.0085, + "step": 602260 + }, + { + "epoch": 1.56, + "learning_rate": 6.582439259579917e-05, + "loss": 0.0095, + "step": 602270 + }, + { + "epoch": 1.56, + "learning_rate": 6.58205043794277e-05, + "loss": 0.0097, + "step": 602280 + }, + { + "epoch": 1.56, + "learning_rate": 6.581661616305623e-05, + "loss": 0.0081, + "step": 602290 + }, + { + "epoch": 1.56, + "learning_rate": 6.581272794668477e-05, + "loss": 0.008, + "step": 602300 + }, + { + "epoch": 1.56, + "learning_rate": 6.58088397303133e-05, + "loss": 0.0082, + "step": 602310 + }, + { + "epoch": 1.56, + "learning_rate": 6.580495151394184e-05, + "loss": 0.0102, + "step": 602320 + }, + { + "epoch": 1.56, + "learning_rate": 6.580106329757038e-05, + "loss": 0.0092, + "step": 602330 + }, + { + "epoch": 1.56, + "learning_rate": 6.579717508119891e-05, + "loss": 0.0069, + "step": 602340 + }, + { + "epoch": 1.56, + "learning_rate": 6.579328686482745e-05, + "loss": 0.0093, + "step": 602350 + }, + { + "epoch": 1.56, + "learning_rate": 6.578939864845598e-05, + "loss": 0.0068, + "step": 602360 + }, + { + "epoch": 1.56, + "learning_rate": 6.578551043208452e-05, + "loss": 0.0105, + "step": 602370 + }, + { + "epoch": 1.56, + "learning_rate": 6.578162221571305e-05, + "loss": 0.0087, + "step": 602380 + }, + { + "epoch": 1.56, + "learning_rate": 6.577773399934159e-05, + "loss": 0.0084, + "step": 602390 + }, + { + "epoch": 1.56, + "learning_rate": 6.577384578297013e-05, + "loss": 0.008, + "step": 602400 + }, + { + "epoch": 1.56, + "learning_rate": 6.576995756659866e-05, + "loss": 0.0096, + "step": 602410 + }, + { + "epoch": 1.56, + "learning_rate": 6.57660693502272e-05, + "loss": 0.0142, + "step": 602420 + }, + { + "epoch": 1.56, + "learning_rate": 6.576218113385573e-05, + "loss": 0.0094, + "step": 602430 + }, + { + "epoch": 1.56, + "learning_rate": 6.575829291748427e-05, + "loss": 0.0077, + "step": 602440 + }, + { + "epoch": 1.56, + "learning_rate": 6.57544047011128e-05, + "loss": 0.0091, + "step": 602450 + }, + { + "epoch": 1.56, + "learning_rate": 6.575051648474134e-05, + "loss": 0.0113, + "step": 602460 + }, + { + "epoch": 1.56, + "learning_rate": 6.574662826836987e-05, + "loss": 0.0102, + "step": 602470 + }, + { + "epoch": 1.56, + "learning_rate": 6.574274005199841e-05, + "loss": 0.0086, + "step": 602480 + }, + { + "epoch": 1.56, + "learning_rate": 6.573885183562695e-05, + "loss": 0.0086, + "step": 602490 + }, + { + "epoch": 1.56, + "learning_rate": 6.573496361925548e-05, + "loss": 0.0062, + "step": 602500 + }, + { + "epoch": 1.56, + "learning_rate": 6.573107540288402e-05, + "loss": 0.0085, + "step": 602510 + }, + { + "epoch": 1.56, + "learning_rate": 6.572718718651255e-05, + "loss": 0.0078, + "step": 602520 + }, + { + "epoch": 1.56, + "learning_rate": 6.572329897014108e-05, + "loss": 0.0067, + "step": 602530 + }, + { + "epoch": 1.56, + "learning_rate": 6.571941075376962e-05, + "loss": 0.0092, + "step": 602540 + }, + { + "epoch": 1.56, + "learning_rate": 6.571552253739815e-05, + "loss": 0.0078, + "step": 602550 + }, + { + "epoch": 1.56, + "learning_rate": 6.571163432102669e-05, + "loss": 0.0066, + "step": 602560 + }, + { + "epoch": 1.56, + "learning_rate": 6.570774610465522e-05, + "loss": 0.0103, + "step": 602570 + }, + { + "epoch": 1.56, + "learning_rate": 6.570385788828376e-05, + "loss": 0.0101, + "step": 602580 + }, + { + "epoch": 1.56, + "learning_rate": 6.56999696719123e-05, + "loss": 0.0081, + "step": 602590 + }, + { + "epoch": 1.56, + "learning_rate": 6.569608145554083e-05, + "loss": 0.0068, + "step": 602600 + }, + { + "epoch": 1.56, + "learning_rate": 6.569219323916937e-05, + "loss": 0.0084, + "step": 602610 + }, + { + "epoch": 1.56, + "learning_rate": 6.56883050227979e-05, + "loss": 0.01, + "step": 602620 + }, + { + "epoch": 1.56, + "learning_rate": 6.568441680642644e-05, + "loss": 0.0064, + "step": 602630 + }, + { + "epoch": 1.56, + "learning_rate": 6.568052859005497e-05, + "loss": 0.0087, + "step": 602640 + }, + { + "epoch": 1.56, + "learning_rate": 6.567664037368351e-05, + "loss": 0.0111, + "step": 602650 + }, + { + "epoch": 1.56, + "learning_rate": 6.567275215731205e-05, + "loss": 0.0072, + "step": 602660 + }, + { + "epoch": 1.56, + "learning_rate": 6.566886394094058e-05, + "loss": 0.0126, + "step": 602670 + }, + { + "epoch": 1.56, + "learning_rate": 6.566497572456912e-05, + "loss": 0.0094, + "step": 602680 + }, + { + "epoch": 1.56, + "learning_rate": 6.566108750819765e-05, + "loss": 0.0078, + "step": 602690 + }, + { + "epoch": 1.56, + "learning_rate": 6.565719929182619e-05, + "loss": 0.0101, + "step": 602700 + }, + { + "epoch": 1.56, + "learning_rate": 6.565331107545472e-05, + "loss": 0.008, + "step": 602710 + }, + { + "epoch": 1.56, + "learning_rate": 6.564942285908326e-05, + "loss": 0.0092, + "step": 602720 + }, + { + "epoch": 1.56, + "learning_rate": 6.564553464271179e-05, + "loss": 0.0085, + "step": 602730 + }, + { + "epoch": 1.56, + "learning_rate": 6.564164642634033e-05, + "loss": 0.0111, + "step": 602740 + }, + { + "epoch": 1.56, + "learning_rate": 6.563775820996887e-05, + "loss": 0.0061, + "step": 602750 + }, + { + "epoch": 1.56, + "learning_rate": 6.56338699935974e-05, + "loss": 0.008, + "step": 602760 + }, + { + "epoch": 1.56, + "learning_rate": 6.562998177722594e-05, + "loss": 0.0063, + "step": 602770 + }, + { + "epoch": 1.56, + "learning_rate": 6.562609356085447e-05, + "loss": 0.0057, + "step": 602780 + }, + { + "epoch": 1.56, + "learning_rate": 6.5622205344483e-05, + "loss": 0.0087, + "step": 602790 + }, + { + "epoch": 1.56, + "learning_rate": 6.561831712811154e-05, + "loss": 0.0088, + "step": 602800 + }, + { + "epoch": 1.56, + "learning_rate": 6.561442891174007e-05, + "loss": 0.0102, + "step": 602810 + }, + { + "epoch": 1.56, + "learning_rate": 6.561054069536861e-05, + "loss": 0.012, + "step": 602820 + }, + { + "epoch": 1.56, + "learning_rate": 6.560665247899714e-05, + "loss": 0.0084, + "step": 602830 + }, + { + "epoch": 1.56, + "learning_rate": 6.560276426262568e-05, + "loss": 0.0079, + "step": 602840 + }, + { + "epoch": 1.56, + "learning_rate": 6.559887604625422e-05, + "loss": 0.009, + "step": 602850 + }, + { + "epoch": 1.56, + "learning_rate": 6.559498782988275e-05, + "loss": 0.0085, + "step": 602860 + }, + { + "epoch": 1.56, + "learning_rate": 6.559109961351129e-05, + "loss": 0.0114, + "step": 602870 + }, + { + "epoch": 1.56, + "learning_rate": 6.558721139713982e-05, + "loss": 0.0096, + "step": 602880 + }, + { + "epoch": 1.56, + "learning_rate": 6.558332318076836e-05, + "loss": 0.0084, + "step": 602890 + }, + { + "epoch": 1.56, + "learning_rate": 6.557943496439689e-05, + "loss": 0.0115, + "step": 602900 + }, + { + "epoch": 1.56, + "learning_rate": 6.557554674802543e-05, + "loss": 0.0069, + "step": 602910 + }, + { + "epoch": 1.56, + "learning_rate": 6.557165853165397e-05, + "loss": 0.0104, + "step": 602920 + }, + { + "epoch": 1.56, + "learning_rate": 6.55677703152825e-05, + "loss": 0.0089, + "step": 602930 + }, + { + "epoch": 1.56, + "learning_rate": 6.556388209891104e-05, + "loss": 0.0081, + "step": 602940 + }, + { + "epoch": 1.56, + "learning_rate": 6.555999388253957e-05, + "loss": 0.0067, + "step": 602950 + }, + { + "epoch": 1.56, + "learning_rate": 6.555610566616811e-05, + "loss": 0.0093, + "step": 602960 + }, + { + "epoch": 1.56, + "learning_rate": 6.555221744979664e-05, + "loss": 0.0086, + "step": 602970 + }, + { + "epoch": 1.56, + "learning_rate": 6.554832923342518e-05, + "loss": 0.0063, + "step": 602980 + }, + { + "epoch": 1.56, + "learning_rate": 6.554444101705371e-05, + "loss": 0.0088, + "step": 602990 + }, + { + "epoch": 1.56, + "learning_rate": 6.554055280068225e-05, + "loss": 0.0106, + "step": 603000 + }, + { + "epoch": 1.56, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.005703043192625046, + "eval_runtime": 107.9387, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 603000 + }, + { + "epoch": 1.56, + "learning_rate": 6.553666458431079e-05, + "loss": 0.0093, + "step": 603010 + }, + { + "epoch": 1.56, + "learning_rate": 6.553277636793932e-05, + "loss": 0.0096, + "step": 603020 + }, + { + "epoch": 1.56, + "learning_rate": 6.552888815156785e-05, + "loss": 0.01, + "step": 603030 + }, + { + "epoch": 1.56, + "learning_rate": 6.552499993519639e-05, + "loss": 0.0116, + "step": 603040 + }, + { + "epoch": 1.56, + "learning_rate": 6.552111171882492e-05, + "loss": 0.011, + "step": 603050 + }, + { + "epoch": 1.56, + "learning_rate": 6.551722350245346e-05, + "loss": 0.0083, + "step": 603060 + }, + { + "epoch": 1.56, + "learning_rate": 6.551333528608199e-05, + "loss": 0.009, + "step": 603070 + }, + { + "epoch": 1.56, + "learning_rate": 6.550944706971053e-05, + "loss": 0.0116, + "step": 603080 + }, + { + "epoch": 1.56, + "learning_rate": 6.550555885333906e-05, + "loss": 0.0072, + "step": 603090 + }, + { + "epoch": 1.56, + "learning_rate": 6.55016706369676e-05, + "loss": 0.0077, + "step": 603100 + }, + { + "epoch": 1.56, + "learning_rate": 6.549778242059614e-05, + "loss": 0.008, + "step": 603110 + }, + { + "epoch": 1.56, + "learning_rate": 6.549389420422467e-05, + "loss": 0.0132, + "step": 603120 + }, + { + "epoch": 1.56, + "learning_rate": 6.549000598785321e-05, + "loss": 0.0094, + "step": 603130 + }, + { + "epoch": 1.56, + "learning_rate": 6.548611777148174e-05, + "loss": 0.0091, + "step": 603140 + }, + { + "epoch": 1.56, + "learning_rate": 6.548222955511028e-05, + "loss": 0.0097, + "step": 603150 + }, + { + "epoch": 1.56, + "learning_rate": 6.547834133873881e-05, + "loss": 0.0079, + "step": 603160 + }, + { + "epoch": 1.56, + "learning_rate": 6.547445312236735e-05, + "loss": 0.01, + "step": 603170 + }, + { + "epoch": 1.56, + "learning_rate": 6.547056490599588e-05, + "loss": 0.0101, + "step": 603180 + }, + { + "epoch": 1.56, + "learning_rate": 6.546667668962442e-05, + "loss": 0.0098, + "step": 603190 + }, + { + "epoch": 1.56, + "learning_rate": 6.546278847325296e-05, + "loss": 0.0079, + "step": 603200 + }, + { + "epoch": 1.56, + "learning_rate": 6.545890025688149e-05, + "loss": 0.0103, + "step": 603210 + }, + { + "epoch": 1.56, + "learning_rate": 6.545501204051003e-05, + "loss": 0.0077, + "step": 603220 + }, + { + "epoch": 1.56, + "learning_rate": 6.545112382413856e-05, + "loss": 0.0092, + "step": 603230 + }, + { + "epoch": 1.56, + "learning_rate": 6.54472356077671e-05, + "loss": 0.0085, + "step": 603240 + }, + { + "epoch": 1.56, + "learning_rate": 6.544334739139563e-05, + "loss": 0.0058, + "step": 603250 + }, + { + "epoch": 1.56, + "learning_rate": 6.543945917502417e-05, + "loss": 0.0074, + "step": 603260 + }, + { + "epoch": 1.56, + "learning_rate": 6.543557095865271e-05, + "loss": 0.0076, + "step": 603270 + }, + { + "epoch": 1.56, + "learning_rate": 6.543168274228124e-05, + "loss": 0.0091, + "step": 603280 + }, + { + "epoch": 1.56, + "learning_rate": 6.542779452590977e-05, + "loss": 0.0113, + "step": 603290 + }, + { + "epoch": 1.56, + "learning_rate": 6.542390630953831e-05, + "loss": 0.008, + "step": 603300 + }, + { + "epoch": 1.56, + "learning_rate": 6.542001809316684e-05, + "loss": 0.0099, + "step": 603310 + }, + { + "epoch": 1.56, + "learning_rate": 6.541612987679538e-05, + "loss": 0.012, + "step": 603320 + }, + { + "epoch": 1.56, + "learning_rate": 6.541224166042391e-05, + "loss": 0.0093, + "step": 603330 + }, + { + "epoch": 1.56, + "learning_rate": 6.540835344405245e-05, + "loss": 0.0082, + "step": 603340 + }, + { + "epoch": 1.56, + "learning_rate": 6.540446522768098e-05, + "loss": 0.0074, + "step": 603350 + }, + { + "epoch": 1.56, + "learning_rate": 6.540057701130952e-05, + "loss": 0.0072, + "step": 603360 + }, + { + "epoch": 1.56, + "learning_rate": 6.539668879493806e-05, + "loss": 0.0072, + "step": 603370 + }, + { + "epoch": 1.56, + "learning_rate": 6.539280057856659e-05, + "loss": 0.0062, + "step": 603380 + }, + { + "epoch": 1.56, + "learning_rate": 6.538891236219513e-05, + "loss": 0.007, + "step": 603390 + }, + { + "epoch": 1.56, + "learning_rate": 6.538502414582366e-05, + "loss": 0.0099, + "step": 603400 + }, + { + "epoch": 1.56, + "learning_rate": 6.53811359294522e-05, + "loss": 0.0091, + "step": 603410 + }, + { + "epoch": 1.56, + "learning_rate": 6.537724771308073e-05, + "loss": 0.0061, + "step": 603420 + }, + { + "epoch": 1.56, + "learning_rate": 6.537335949670927e-05, + "loss": 0.0082, + "step": 603430 + }, + { + "epoch": 1.56, + "learning_rate": 6.53694712803378e-05, + "loss": 0.0073, + "step": 603440 + }, + { + "epoch": 1.56, + "learning_rate": 6.536558306396634e-05, + "loss": 0.0079, + "step": 603450 + }, + { + "epoch": 1.56, + "learning_rate": 6.536169484759488e-05, + "loss": 0.0112, + "step": 603460 + }, + { + "epoch": 1.56, + "learning_rate": 6.535780663122341e-05, + "loss": 0.0101, + "step": 603470 + }, + { + "epoch": 1.56, + "learning_rate": 6.535391841485195e-05, + "loss": 0.0089, + "step": 603480 + }, + { + "epoch": 1.56, + "learning_rate": 6.535003019848048e-05, + "loss": 0.0096, + "step": 603490 + }, + { + "epoch": 1.56, + "learning_rate": 6.534614198210902e-05, + "loss": 0.0066, + "step": 603500 + }, + { + "epoch": 1.56, + "learning_rate": 6.534225376573755e-05, + "loss": 0.0087, + "step": 603510 + }, + { + "epoch": 1.56, + "learning_rate": 6.533836554936608e-05, + "loss": 0.0075, + "step": 603520 + }, + { + "epoch": 1.56, + "learning_rate": 6.533447733299462e-05, + "loss": 0.0098, + "step": 603530 + }, + { + "epoch": 1.56, + "learning_rate": 6.533058911662315e-05, + "loss": 0.0079, + "step": 603540 + }, + { + "epoch": 1.56, + "learning_rate": 6.532670090025169e-05, + "loss": 0.0102, + "step": 603550 + }, + { + "epoch": 1.56, + "learning_rate": 6.532281268388023e-05, + "loss": 0.0108, + "step": 603560 + }, + { + "epoch": 1.56, + "learning_rate": 6.531892446750876e-05, + "loss": 0.0078, + "step": 603570 + }, + { + "epoch": 1.56, + "learning_rate": 6.53150362511373e-05, + "loss": 0.0098, + "step": 603580 + }, + { + "epoch": 1.56, + "learning_rate": 6.531114803476583e-05, + "loss": 0.0082, + "step": 603590 + }, + { + "epoch": 1.56, + "learning_rate": 6.530725981839437e-05, + "loss": 0.0072, + "step": 603600 + }, + { + "epoch": 1.56, + "learning_rate": 6.53033716020229e-05, + "loss": 0.0086, + "step": 603610 + }, + { + "epoch": 1.56, + "learning_rate": 6.529948338565144e-05, + "loss": 0.006, + "step": 603620 + }, + { + "epoch": 1.56, + "learning_rate": 6.529559516927998e-05, + "loss": 0.0064, + "step": 603630 + }, + { + "epoch": 1.56, + "learning_rate": 6.529170695290851e-05, + "loss": 0.01, + "step": 603640 + }, + { + "epoch": 1.56, + "learning_rate": 6.528781873653705e-05, + "loss": 0.006, + "step": 603650 + }, + { + "epoch": 1.56, + "learning_rate": 6.528393052016558e-05, + "loss": 0.0105, + "step": 603660 + }, + { + "epoch": 1.56, + "learning_rate": 6.528004230379412e-05, + "loss": 0.0127, + "step": 603670 + }, + { + "epoch": 1.56, + "learning_rate": 6.527615408742265e-05, + "loss": 0.0078, + "step": 603680 + }, + { + "epoch": 1.56, + "learning_rate": 6.527226587105119e-05, + "loss": 0.0077, + "step": 603690 + }, + { + "epoch": 1.56, + "learning_rate": 6.526837765467972e-05, + "loss": 0.0075, + "step": 603700 + }, + { + "epoch": 1.56, + "learning_rate": 6.526448943830826e-05, + "loss": 0.0091, + "step": 603710 + }, + { + "epoch": 1.56, + "learning_rate": 6.52606012219368e-05, + "loss": 0.0106, + "step": 603720 + }, + { + "epoch": 1.56, + "learning_rate": 6.525671300556533e-05, + "loss": 0.0073, + "step": 603730 + }, + { + "epoch": 1.56, + "learning_rate": 6.525282478919387e-05, + "loss": 0.0079, + "step": 603740 + }, + { + "epoch": 1.57, + "learning_rate": 6.52489365728224e-05, + "loss": 0.0097, + "step": 603750 + }, + { + "epoch": 1.57, + "learning_rate": 6.524504835645094e-05, + "loss": 0.0102, + "step": 603760 + }, + { + "epoch": 1.57, + "learning_rate": 6.524116014007947e-05, + "loss": 0.0089, + "step": 603770 + }, + { + "epoch": 1.57, + "learning_rate": 6.5237271923708e-05, + "loss": 0.0085, + "step": 603780 + }, + { + "epoch": 1.57, + "learning_rate": 6.523338370733654e-05, + "loss": 0.0058, + "step": 603790 + }, + { + "epoch": 1.57, + "learning_rate": 6.522949549096507e-05, + "loss": 0.0075, + "step": 603800 + }, + { + "epoch": 1.57, + "learning_rate": 6.522560727459361e-05, + "loss": 0.0123, + "step": 603810 + }, + { + "epoch": 1.57, + "learning_rate": 6.522171905822215e-05, + "loss": 0.0083, + "step": 603820 + }, + { + "epoch": 1.57, + "learning_rate": 6.521783084185068e-05, + "loss": 0.0099, + "step": 603830 + }, + { + "epoch": 1.57, + "learning_rate": 6.521394262547922e-05, + "loss": 0.0064, + "step": 603840 + }, + { + "epoch": 1.57, + "learning_rate": 6.521005440910775e-05, + "loss": 0.008, + "step": 603850 + }, + { + "epoch": 1.57, + "learning_rate": 6.520616619273629e-05, + "loss": 0.01, + "step": 603860 + }, + { + "epoch": 1.57, + "learning_rate": 6.520227797636482e-05, + "loss": 0.0113, + "step": 603870 + }, + { + "epoch": 1.57, + "learning_rate": 6.519838975999336e-05, + "loss": 0.0079, + "step": 603880 + }, + { + "epoch": 1.57, + "learning_rate": 6.51945015436219e-05, + "loss": 0.0084, + "step": 603890 + }, + { + "epoch": 1.57, + "learning_rate": 6.519061332725043e-05, + "loss": 0.0073, + "step": 603900 + }, + { + "epoch": 1.57, + "learning_rate": 6.518672511087897e-05, + "loss": 0.0081, + "step": 603910 + }, + { + "epoch": 1.57, + "learning_rate": 6.51828368945075e-05, + "loss": 0.0092, + "step": 603920 + }, + { + "epoch": 1.57, + "learning_rate": 6.517894867813604e-05, + "loss": 0.0129, + "step": 603930 + }, + { + "epoch": 1.57, + "learning_rate": 6.517506046176457e-05, + "loss": 0.0075, + "step": 603940 + }, + { + "epoch": 1.57, + "learning_rate": 6.517117224539311e-05, + "loss": 0.0062, + "step": 603950 + }, + { + "epoch": 1.57, + "learning_rate": 6.516728402902164e-05, + "loss": 0.0077, + "step": 603960 + }, + { + "epoch": 1.57, + "learning_rate": 6.516339581265018e-05, + "loss": 0.0072, + "step": 603970 + }, + { + "epoch": 1.57, + "learning_rate": 6.515950759627872e-05, + "loss": 0.0118, + "step": 603980 + }, + { + "epoch": 1.57, + "learning_rate": 6.515561937990725e-05, + "loss": 0.0097, + "step": 603990 + }, + { + "epoch": 1.57, + "learning_rate": 6.515173116353579e-05, + "loss": 0.0073, + "step": 604000 + }, + { + "epoch": 1.57, + "eval_cer": 0.8817110841447728, + "eval_loss": 0.005707249511033297, + "eval_runtime": 107.7161, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, + "step": 604000 + }, + { + "epoch": 1.57, + "learning_rate": 6.514784294716432e-05, + "loss": 0.0092, + "step": 604010 + }, + { + "epoch": 1.57, + "learning_rate": 6.514395473079285e-05, + "loss": 0.0114, + "step": 604020 + }, + { + "epoch": 1.57, + "learning_rate": 6.514006651442139e-05, + "loss": 0.008, + "step": 604030 + }, + { + "epoch": 1.57, + "learning_rate": 6.513617829804992e-05, + "loss": 0.0076, + "step": 604040 + }, + { + "epoch": 1.57, + "learning_rate": 6.513229008167846e-05, + "loss": 0.0082, + "step": 604050 + }, + { + "epoch": 1.57, + "learning_rate": 6.512840186530699e-05, + "loss": 0.0106, + "step": 604060 + }, + { + "epoch": 1.57, + "learning_rate": 6.512451364893553e-05, + "loss": 0.0069, + "step": 604070 + }, + { + "epoch": 1.57, + "learning_rate": 6.512062543256407e-05, + "loss": 0.0091, + "step": 604080 + }, + { + "epoch": 1.57, + "learning_rate": 6.51167372161926e-05, + "loss": 0.0106, + "step": 604090 + }, + { + "epoch": 1.57, + "learning_rate": 6.511284899982114e-05, + "loss": 0.0103, + "step": 604100 + }, + { + "epoch": 1.57, + "learning_rate": 6.510896078344967e-05, + "loss": 0.007, + "step": 604110 + }, + { + "epoch": 1.57, + "learning_rate": 6.510507256707821e-05, + "loss": 0.0099, + "step": 604120 + }, + { + "epoch": 1.57, + "learning_rate": 6.510118435070674e-05, + "loss": 0.0082, + "step": 604130 + }, + { + "epoch": 1.57, + "learning_rate": 6.509729613433528e-05, + "loss": 0.0073, + "step": 604140 + }, + { + "epoch": 1.57, + "learning_rate": 6.509340791796382e-05, + "loss": 0.0098, + "step": 604150 + }, + { + "epoch": 1.57, + "learning_rate": 6.508951970159235e-05, + "loss": 0.0075, + "step": 604160 + }, + { + "epoch": 1.57, + "learning_rate": 6.508563148522089e-05, + "loss": 0.0104, + "step": 604170 + }, + { + "epoch": 1.57, + "learning_rate": 6.508174326884942e-05, + "loss": 0.0075, + "step": 604180 + }, + { + "epoch": 1.57, + "learning_rate": 6.507785505247796e-05, + "loss": 0.0068, + "step": 604190 + }, + { + "epoch": 1.57, + "learning_rate": 6.507396683610649e-05, + "loss": 0.0065, + "step": 604200 + }, + { + "epoch": 1.57, + "learning_rate": 6.507007861973503e-05, + "loss": 0.0076, + "step": 604210 + }, + { + "epoch": 1.57, + "learning_rate": 6.506619040336356e-05, + "loss": 0.0071, + "step": 604220 + }, + { + "epoch": 1.57, + "learning_rate": 6.50623021869921e-05, + "loss": 0.0079, + "step": 604230 + }, + { + "epoch": 1.57, + "learning_rate": 6.505841397062064e-05, + "loss": 0.0113, + "step": 604240 + }, + { + "epoch": 1.57, + "learning_rate": 6.505452575424917e-05, + "loss": 0.0107, + "step": 604250 + }, + { + "epoch": 1.57, + "learning_rate": 6.505063753787771e-05, + "loss": 0.0104, + "step": 604260 + }, + { + "epoch": 1.57, + "learning_rate": 6.504674932150624e-05, + "loss": 0.0076, + "step": 604270 + }, + { + "epoch": 1.57, + "learning_rate": 6.504286110513477e-05, + "loss": 0.0116, + "step": 604280 + }, + { + "epoch": 1.57, + "learning_rate": 6.503897288876331e-05, + "loss": 0.0079, + "step": 604290 + }, + { + "epoch": 1.57, + "learning_rate": 6.503508467239184e-05, + "loss": 0.0081, + "step": 604300 + }, + { + "epoch": 1.57, + "learning_rate": 6.503119645602038e-05, + "loss": 0.0093, + "step": 604310 + }, + { + "epoch": 1.57, + "learning_rate": 6.50273082396489e-05, + "loss": 0.0114, + "step": 604320 + }, + { + "epoch": 1.57, + "learning_rate": 6.502342002327745e-05, + "loss": 0.0088, + "step": 604330 + }, + { + "epoch": 1.57, + "learning_rate": 6.501953180690599e-05, + "loss": 0.0112, + "step": 604340 + }, + { + "epoch": 1.57, + "learning_rate": 6.501564359053452e-05, + "loss": 0.0077, + "step": 604350 + }, + { + "epoch": 1.57, + "learning_rate": 6.501175537416306e-05, + "loss": 0.0091, + "step": 604360 + }, + { + "epoch": 1.57, + "learning_rate": 6.500786715779159e-05, + "loss": 0.0114, + "step": 604370 + }, + { + "epoch": 1.57, + "learning_rate": 6.500397894142013e-05, + "loss": 0.0074, + "step": 604380 + }, + { + "epoch": 1.57, + "learning_rate": 6.500009072504866e-05, + "loss": 0.0107, + "step": 604390 + }, + { + "epoch": 1.57, + "learning_rate": 6.49962025086772e-05, + "loss": 0.0096, + "step": 604400 + }, + { + "epoch": 1.57, + "learning_rate": 6.499231429230574e-05, + "loss": 0.0122, + "step": 604410 + }, + { + "epoch": 1.57, + "learning_rate": 6.498842607593427e-05, + "loss": 0.0082, + "step": 604420 + }, + { + "epoch": 1.57, + "learning_rate": 6.498453785956281e-05, + "loss": 0.0051, + "step": 604430 + }, + { + "epoch": 1.57, + "learning_rate": 6.498064964319134e-05, + "loss": 0.0089, + "step": 604440 + }, + { + "epoch": 1.57, + "learning_rate": 6.497676142681988e-05, + "loss": 0.0103, + "step": 604450 + }, + { + "epoch": 1.57, + "learning_rate": 6.497287321044841e-05, + "loss": 0.0063, + "step": 604460 + }, + { + "epoch": 1.57, + "learning_rate": 6.496898499407695e-05, + "loss": 0.0094, + "step": 604470 + }, + { + "epoch": 1.57, + "learning_rate": 6.496509677770548e-05, + "loss": 0.0092, + "step": 604480 + }, + { + "epoch": 1.57, + "learning_rate": 6.496120856133402e-05, + "loss": 0.0058, + "step": 604490 + }, + { + "epoch": 1.57, + "learning_rate": 6.495732034496256e-05, + "loss": 0.01, + "step": 604500 + }, + { + "epoch": 1.57, + "learning_rate": 6.495343212859109e-05, + "loss": 0.0087, + "step": 604510 + }, + { + "epoch": 1.57, + "learning_rate": 6.494954391221962e-05, + "loss": 0.0089, + "step": 604520 + }, + { + "epoch": 1.57, + "learning_rate": 6.494565569584816e-05, + "loss": 0.0108, + "step": 604530 + }, + { + "epoch": 1.57, + "learning_rate": 6.494176747947669e-05, + "loss": 0.0077, + "step": 604540 + }, + { + "epoch": 1.57, + "learning_rate": 6.493787926310523e-05, + "loss": 0.01, + "step": 604550 + }, + { + "epoch": 1.57, + "learning_rate": 6.493399104673376e-05, + "loss": 0.0098, + "step": 604560 + }, + { + "epoch": 1.57, + "learning_rate": 6.49301028303623e-05, + "loss": 0.0083, + "step": 604570 + }, + { + "epoch": 1.57, + "learning_rate": 6.492621461399083e-05, + "loss": 0.0095, + "step": 604580 + }, + { + "epoch": 1.57, + "learning_rate": 6.492232639761937e-05, + "loss": 0.0068, + "step": 604590 + }, + { + "epoch": 1.57, + "learning_rate": 6.491843818124791e-05, + "loss": 0.0123, + "step": 604600 + }, + { + "epoch": 1.57, + "learning_rate": 6.491454996487644e-05, + "loss": 0.0084, + "step": 604610 + }, + { + "epoch": 1.57, + "learning_rate": 6.491066174850498e-05, + "loss": 0.0064, + "step": 604620 + }, + { + "epoch": 1.57, + "learning_rate": 6.490677353213351e-05, + "loss": 0.0074, + "step": 604630 + }, + { + "epoch": 1.57, + "learning_rate": 6.490288531576205e-05, + "loss": 0.0075, + "step": 604640 + }, + { + "epoch": 1.57, + "learning_rate": 6.489899709939058e-05, + "loss": 0.0099, + "step": 604650 + }, + { + "epoch": 1.57, + "learning_rate": 6.489510888301912e-05, + "loss": 0.0072, + "step": 604660 + }, + { + "epoch": 1.57, + "learning_rate": 6.489122066664765e-05, + "loss": 0.0096, + "step": 604670 + }, + { + "epoch": 1.57, + "learning_rate": 6.488733245027619e-05, + "loss": 0.0082, + "step": 604680 + }, + { + "epoch": 1.57, + "learning_rate": 6.488344423390473e-05, + "loss": 0.0089, + "step": 604690 + }, + { + "epoch": 1.57, + "learning_rate": 6.487955601753326e-05, + "loss": 0.0087, + "step": 604700 + }, + { + "epoch": 1.57, + "learning_rate": 6.48756678011618e-05, + "loss": 0.0096, + "step": 604710 + }, + { + "epoch": 1.57, + "learning_rate": 6.487177958479033e-05, + "loss": 0.0085, + "step": 604720 + }, + { + "epoch": 1.57, + "learning_rate": 6.486789136841887e-05, + "loss": 0.0083, + "step": 604730 + }, + { + "epoch": 1.57, + "learning_rate": 6.48640031520474e-05, + "loss": 0.0089, + "step": 604740 + }, + { + "epoch": 1.57, + "learning_rate": 6.486011493567594e-05, + "loss": 0.0073, + "step": 604750 + }, + { + "epoch": 1.57, + "learning_rate": 6.485622671930447e-05, + "loss": 0.0088, + "step": 604760 + }, + { + "epoch": 1.57, + "learning_rate": 6.4852338502933e-05, + "loss": 0.0091, + "step": 604770 + }, + { + "epoch": 1.57, + "learning_rate": 6.484845028656154e-05, + "loss": 0.0067, + "step": 604780 + }, + { + "epoch": 1.57, + "learning_rate": 6.484456207019008e-05, + "loss": 0.0061, + "step": 604790 + }, + { + "epoch": 1.57, + "learning_rate": 6.48406738538186e-05, + "loss": 0.0115, + "step": 604800 + }, + { + "epoch": 1.57, + "learning_rate": 6.483678563744715e-05, + "loss": 0.0086, + "step": 604810 + }, + { + "epoch": 1.57, + "learning_rate": 6.483289742107568e-05, + "loss": 0.009, + "step": 604820 + }, + { + "epoch": 1.57, + "learning_rate": 6.482900920470422e-05, + "loss": 0.0137, + "step": 604830 + }, + { + "epoch": 1.57, + "learning_rate": 6.482512098833275e-05, + "loss": 0.0081, + "step": 604840 + }, + { + "epoch": 1.57, + "learning_rate": 6.482123277196129e-05, + "loss": 0.011, + "step": 604850 + }, + { + "epoch": 1.57, + "learning_rate": 6.481734455558983e-05, + "loss": 0.0094, + "step": 604860 + }, + { + "epoch": 1.57, + "learning_rate": 6.481345633921836e-05, + "loss": 0.0067, + "step": 604870 + }, + { + "epoch": 1.57, + "learning_rate": 6.48095681228469e-05, + "loss": 0.0082, + "step": 604880 + }, + { + "epoch": 1.57, + "learning_rate": 6.480567990647543e-05, + "loss": 0.0106, + "step": 604890 + }, + { + "epoch": 1.57, + "learning_rate": 6.480179169010397e-05, + "loss": 0.0076, + "step": 604900 + }, + { + "epoch": 1.57, + "learning_rate": 6.47979034737325e-05, + "loss": 0.0091, + "step": 604910 + }, + { + "epoch": 1.57, + "learning_rate": 6.479401525736104e-05, + "loss": 0.0078, + "step": 604920 + }, + { + "epoch": 1.57, + "learning_rate": 6.479012704098957e-05, + "loss": 0.0114, + "step": 604930 + }, + { + "epoch": 1.57, + "learning_rate": 6.478623882461811e-05, + "loss": 0.008, + "step": 604940 + }, + { + "epoch": 1.57, + "learning_rate": 6.478235060824665e-05, + "loss": 0.0084, + "step": 604950 + }, + { + "epoch": 1.57, + "learning_rate": 6.477846239187518e-05, + "loss": 0.0072, + "step": 604960 + }, + { + "epoch": 1.57, + "learning_rate": 6.477457417550372e-05, + "loss": 0.0094, + "step": 604970 + }, + { + "epoch": 1.57, + "learning_rate": 6.477068595913225e-05, + "loss": 0.008, + "step": 604980 + }, + { + "epoch": 1.57, + "learning_rate": 6.476679774276079e-05, + "loss": 0.0077, + "step": 604990 + }, + { + "epoch": 1.57, + "learning_rate": 6.476290952638932e-05, + "loss": 0.0078, + "step": 605000 + }, + { + "epoch": 1.57, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.005784572102129459, + "eval_runtime": 107.7017, + "eval_samples_per_second": 18.57, + "eval_steps_per_second": 4.642, + "step": 605000 + }, + { + "epoch": 1.57, + "learning_rate": 6.475902131001785e-05, + "loss": 0.0078, + "step": 605010 + }, + { + "epoch": 1.57, + "learning_rate": 6.475513309364639e-05, + "loss": 0.0067, + "step": 605020 + }, + { + "epoch": 1.57, + "learning_rate": 6.475124487727491e-05, + "loss": 0.007, + "step": 605030 + }, + { + "epoch": 1.57, + "learning_rate": 6.474735666090346e-05, + "loss": 0.009, + "step": 605040 + }, + { + "epoch": 1.57, + "learning_rate": 6.4743468444532e-05, + "loss": 0.0076, + "step": 605050 + }, + { + "epoch": 1.57, + "learning_rate": 6.473958022816053e-05, + "loss": 0.01, + "step": 605060 + }, + { + "epoch": 1.57, + "learning_rate": 6.473569201178907e-05, + "loss": 0.0085, + "step": 605070 + }, + { + "epoch": 1.57, + "learning_rate": 6.47318037954176e-05, + "loss": 0.0084, + "step": 605080 + }, + { + "epoch": 1.57, + "learning_rate": 6.472791557904614e-05, + "loss": 0.0078, + "step": 605090 + }, + { + "epoch": 1.57, + "learning_rate": 6.472402736267467e-05, + "loss": 0.0083, + "step": 605100 + }, + { + "epoch": 1.57, + "learning_rate": 6.472013914630321e-05, + "loss": 0.0079, + "step": 605110 + }, + { + "epoch": 1.57, + "learning_rate": 6.471625092993175e-05, + "loss": 0.0086, + "step": 605120 + }, + { + "epoch": 1.57, + "learning_rate": 6.471236271356028e-05, + "loss": 0.0067, + "step": 605130 + }, + { + "epoch": 1.57, + "learning_rate": 6.470847449718882e-05, + "loss": 0.0073, + "step": 605140 + }, + { + "epoch": 1.57, + "learning_rate": 6.470458628081735e-05, + "loss": 0.0085, + "step": 605150 + }, + { + "epoch": 1.57, + "learning_rate": 6.470069806444589e-05, + "loss": 0.0082, + "step": 605160 + }, + { + "epoch": 1.57, + "learning_rate": 6.469680984807442e-05, + "loss": 0.0125, + "step": 605170 + }, + { + "epoch": 1.57, + "learning_rate": 6.469292163170296e-05, + "loss": 0.009, + "step": 605180 + }, + { + "epoch": 1.57, + "learning_rate": 6.468903341533149e-05, + "loss": 0.0085, + "step": 605190 + }, + { + "epoch": 1.57, + "learning_rate": 6.468514519896003e-05, + "loss": 0.0081, + "step": 605200 + }, + { + "epoch": 1.57, + "learning_rate": 6.468125698258857e-05, + "loss": 0.0104, + "step": 605210 + }, + { + "epoch": 1.57, + "learning_rate": 6.46773687662171e-05, + "loss": 0.0112, + "step": 605220 + }, + { + "epoch": 1.57, + "learning_rate": 6.467348054984564e-05, + "loss": 0.009, + "step": 605230 + }, + { + "epoch": 1.57, + "learning_rate": 6.466959233347417e-05, + "loss": 0.0094, + "step": 605240 + }, + { + "epoch": 1.57, + "learning_rate": 6.466570411710271e-05, + "loss": 0.0083, + "step": 605250 + }, + { + "epoch": 1.57, + "learning_rate": 6.466181590073124e-05, + "loss": 0.0089, + "step": 605260 + }, + { + "epoch": 1.57, + "learning_rate": 6.465792768435977e-05, + "loss": 0.0104, + "step": 605270 + }, + { + "epoch": 1.57, + "learning_rate": 6.465403946798831e-05, + "loss": 0.0098, + "step": 605280 + }, + { + "epoch": 1.57, + "learning_rate": 6.465015125161683e-05, + "loss": 0.0129, + "step": 605290 + }, + { + "epoch": 1.57, + "learning_rate": 6.464626303524538e-05, + "loss": 0.0141, + "step": 605300 + }, + { + "epoch": 1.57, + "learning_rate": 6.464237481887392e-05, + "loss": 0.0125, + "step": 605310 + }, + { + "epoch": 1.57, + "learning_rate": 6.463848660250245e-05, + "loss": 0.0098, + "step": 605320 + }, + { + "epoch": 1.57, + "learning_rate": 6.463459838613099e-05, + "loss": 0.0082, + "step": 605330 + }, + { + "epoch": 1.57, + "learning_rate": 6.463071016975952e-05, + "loss": 0.0075, + "step": 605340 + }, + { + "epoch": 1.57, + "learning_rate": 6.462682195338806e-05, + "loss": 0.0107, + "step": 605350 + }, + { + "epoch": 1.57, + "learning_rate": 6.462293373701659e-05, + "loss": 0.009, + "step": 605360 + }, + { + "epoch": 1.57, + "learning_rate": 6.461904552064513e-05, + "loss": 0.0107, + "step": 605370 + }, + { + "epoch": 1.57, + "learning_rate": 6.461515730427367e-05, + "loss": 0.0097, + "step": 605380 + }, + { + "epoch": 1.57, + "learning_rate": 6.46112690879022e-05, + "loss": 0.0064, + "step": 605390 + }, + { + "epoch": 1.57, + "learning_rate": 6.460738087153074e-05, + "loss": 0.0078, + "step": 605400 + }, + { + "epoch": 1.57, + "learning_rate": 6.460349265515927e-05, + "loss": 0.0075, + "step": 605410 + }, + { + "epoch": 1.57, + "learning_rate": 6.459960443878781e-05, + "loss": 0.0063, + "step": 605420 + }, + { + "epoch": 1.57, + "learning_rate": 6.459571622241634e-05, + "loss": 0.0074, + "step": 605430 + }, + { + "epoch": 1.57, + "learning_rate": 6.459182800604488e-05, + "loss": 0.0067, + "step": 605440 + }, + { + "epoch": 1.57, + "learning_rate": 6.45879397896734e-05, + "loss": 0.0059, + "step": 605450 + }, + { + "epoch": 1.57, + "learning_rate": 6.458405157330195e-05, + "loss": 0.0086, + "step": 605460 + }, + { + "epoch": 1.57, + "learning_rate": 6.458016335693049e-05, + "loss": 0.0071, + "step": 605470 + }, + { + "epoch": 1.57, + "learning_rate": 6.457627514055902e-05, + "loss": 0.0095, + "step": 605480 + }, + { + "epoch": 1.57, + "learning_rate": 6.457238692418756e-05, + "loss": 0.0079, + "step": 605490 + }, + { + "epoch": 1.57, + "learning_rate": 6.456849870781609e-05, + "loss": 0.0077, + "step": 605500 + }, + { + "epoch": 1.57, + "learning_rate": 6.456461049144462e-05, + "loss": 0.0108, + "step": 605510 + }, + { + "epoch": 1.57, + "learning_rate": 6.456072227507316e-05, + "loss": 0.0084, + "step": 605520 + }, + { + "epoch": 1.57, + "learning_rate": 6.455683405870169e-05, + "loss": 0.0071, + "step": 605530 + }, + { + "epoch": 1.57, + "learning_rate": 6.455294584233023e-05, + "loss": 0.0067, + "step": 605540 + }, + { + "epoch": 1.57, + "learning_rate": 6.454905762595875e-05, + "loss": 0.0092, + "step": 605550 + }, + { + "epoch": 1.57, + "learning_rate": 6.45451694095873e-05, + "loss": 0.0092, + "step": 605560 + }, + { + "epoch": 1.57, + "learning_rate": 6.454128119321584e-05, + "loss": 0.0067, + "step": 605570 + }, + { + "epoch": 1.57, + "learning_rate": 6.453739297684437e-05, + "loss": 0.0087, + "step": 605580 + }, + { + "epoch": 1.57, + "learning_rate": 6.453350476047291e-05, + "loss": 0.0061, + "step": 605590 + }, + { + "epoch": 1.57, + "learning_rate": 6.452961654410144e-05, + "loss": 0.0069, + "step": 605600 + }, + { + "epoch": 1.57, + "learning_rate": 6.452572832772998e-05, + "loss": 0.0095, + "step": 605610 + }, + { + "epoch": 1.57, + "learning_rate": 6.45218401113585e-05, + "loss": 0.0079, + "step": 605620 + }, + { + "epoch": 1.57, + "learning_rate": 6.451795189498705e-05, + "loss": 0.0102, + "step": 605630 + }, + { + "epoch": 1.57, + "learning_rate": 6.451406367861559e-05, + "loss": 0.0091, + "step": 605640 + }, + { + "epoch": 1.57, + "learning_rate": 6.451017546224412e-05, + "loss": 0.0077, + "step": 605650 + }, + { + "epoch": 1.57, + "learning_rate": 6.450628724587266e-05, + "loss": 0.0062, + "step": 605660 + }, + { + "epoch": 1.57, + "learning_rate": 6.450239902950119e-05, + "loss": 0.0074, + "step": 605670 + }, + { + "epoch": 1.57, + "learning_rate": 6.449851081312973e-05, + "loss": 0.0054, + "step": 605680 + }, + { + "epoch": 1.57, + "learning_rate": 6.449462259675826e-05, + "loss": 0.0062, + "step": 605690 + }, + { + "epoch": 1.57, + "learning_rate": 6.44907343803868e-05, + "loss": 0.0061, + "step": 605700 + }, + { + "epoch": 1.57, + "learning_rate": 6.448684616401533e-05, + "loss": 0.0076, + "step": 605710 + }, + { + "epoch": 1.57, + "learning_rate": 6.448295794764387e-05, + "loss": 0.0095, + "step": 605720 + }, + { + "epoch": 1.57, + "learning_rate": 6.447906973127241e-05, + "loss": 0.0094, + "step": 605730 + }, + { + "epoch": 1.57, + "learning_rate": 6.447518151490094e-05, + "loss": 0.0061, + "step": 605740 + }, + { + "epoch": 1.57, + "learning_rate": 6.447129329852948e-05, + "loss": 0.0073, + "step": 605750 + }, + { + "epoch": 1.57, + "learning_rate": 6.446740508215801e-05, + "loss": 0.0101, + "step": 605760 + }, + { + "epoch": 1.57, + "learning_rate": 6.446351686578654e-05, + "loss": 0.0081, + "step": 605770 + }, + { + "epoch": 1.57, + "learning_rate": 6.445962864941508e-05, + "loss": 0.0133, + "step": 605780 + }, + { + "epoch": 1.57, + "learning_rate": 6.44557404330436e-05, + "loss": 0.0083, + "step": 605790 + }, + { + "epoch": 1.57, + "learning_rate": 6.445185221667215e-05, + "loss": 0.0091, + "step": 605800 + }, + { + "epoch": 1.57, + "learning_rate": 6.444796400030067e-05, + "loss": 0.0079, + "step": 605810 + }, + { + "epoch": 1.57, + "learning_rate": 6.444407578392922e-05, + "loss": 0.0078, + "step": 605820 + }, + { + "epoch": 1.57, + "learning_rate": 6.444018756755776e-05, + "loss": 0.0076, + "step": 605830 + }, + { + "epoch": 1.57, + "learning_rate": 6.443629935118629e-05, + "loss": 0.0098, + "step": 605840 + }, + { + "epoch": 1.57, + "learning_rate": 6.443241113481483e-05, + "loss": 0.0159, + "step": 605850 + }, + { + "epoch": 1.57, + "learning_rate": 6.442852291844336e-05, + "loss": 0.0102, + "step": 605860 + }, + { + "epoch": 1.57, + "learning_rate": 6.44246347020719e-05, + "loss": 0.0093, + "step": 605870 + }, + { + "epoch": 1.57, + "learning_rate": 6.442074648570043e-05, + "loss": 0.0074, + "step": 605880 + }, + { + "epoch": 1.57, + "learning_rate": 6.441685826932897e-05, + "loss": 0.0086, + "step": 605890 + }, + { + "epoch": 1.57, + "learning_rate": 6.441297005295751e-05, + "loss": 0.0106, + "step": 605900 + }, + { + "epoch": 1.57, + "learning_rate": 6.440908183658604e-05, + "loss": 0.0108, + "step": 605910 + }, + { + "epoch": 1.57, + "learning_rate": 6.440519362021458e-05, + "loss": 0.0086, + "step": 605920 + }, + { + "epoch": 1.57, + "learning_rate": 6.44013054038431e-05, + "loss": 0.0082, + "step": 605930 + }, + { + "epoch": 1.57, + "learning_rate": 6.439741718747165e-05, + "loss": 0.0092, + "step": 605940 + }, + { + "epoch": 1.57, + "learning_rate": 6.439352897110018e-05, + "loss": 0.0116, + "step": 605950 + }, + { + "epoch": 1.57, + "learning_rate": 6.438964075472872e-05, + "loss": 0.0117, + "step": 605960 + }, + { + "epoch": 1.57, + "learning_rate": 6.438575253835725e-05, + "loss": 0.008, + "step": 605970 + }, + { + "epoch": 1.57, + "learning_rate": 6.438186432198579e-05, + "loss": 0.0118, + "step": 605980 + }, + { + "epoch": 1.57, + "learning_rate": 6.437797610561433e-05, + "loss": 0.0124, + "step": 605990 + }, + { + "epoch": 1.57, + "learning_rate": 6.437408788924286e-05, + "loss": 0.0088, + "step": 606000 + }, + { + "epoch": 1.57, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.005717435386031866, + "eval_runtime": 107.7826, + "eval_samples_per_second": 18.556, + "eval_steps_per_second": 4.639, + "step": 606000 + }, + { + "epoch": 1.57, + "learning_rate": 6.437019967287139e-05, + "loss": 0.0095, + "step": 606010 + }, + { + "epoch": 1.57, + "learning_rate": 6.436631145649993e-05, + "loss": 0.0098, + "step": 606020 + }, + { + "epoch": 1.57, + "learning_rate": 6.436242324012846e-05, + "loss": 0.0092, + "step": 606030 + }, + { + "epoch": 1.57, + "learning_rate": 6.4358535023757e-05, + "loss": 0.0089, + "step": 606040 + }, + { + "epoch": 1.57, + "learning_rate": 6.435464680738553e-05, + "loss": 0.01, + "step": 606050 + }, + { + "epoch": 1.57, + "learning_rate": 6.435075859101407e-05, + "loss": 0.0067, + "step": 606060 + }, + { + "epoch": 1.57, + "learning_rate": 6.43468703746426e-05, + "loss": 0.0085, + "step": 606070 + }, + { + "epoch": 1.57, + "learning_rate": 6.434298215827114e-05, + "loss": 0.0066, + "step": 606080 + }, + { + "epoch": 1.57, + "learning_rate": 6.433909394189968e-05, + "loss": 0.0086, + "step": 606090 + }, + { + "epoch": 1.57, + "learning_rate": 6.43352057255282e-05, + "loss": 0.0092, + "step": 606100 + }, + { + "epoch": 1.57, + "learning_rate": 6.433131750915675e-05, + "loss": 0.0096, + "step": 606110 + }, + { + "epoch": 1.57, + "learning_rate": 6.432742929278528e-05, + "loss": 0.0081, + "step": 606120 + }, + { + "epoch": 1.57, + "learning_rate": 6.432354107641382e-05, + "loss": 0.0097, + "step": 606130 + }, + { + "epoch": 1.57, + "learning_rate": 6.431965286004235e-05, + "loss": 0.0066, + "step": 606140 + }, + { + "epoch": 1.57, + "learning_rate": 6.431576464367089e-05, + "loss": 0.011, + "step": 606150 + }, + { + "epoch": 1.57, + "learning_rate": 6.431187642729942e-05, + "loss": 0.0066, + "step": 606160 + }, + { + "epoch": 1.57, + "learning_rate": 6.430798821092796e-05, + "loss": 0.0097, + "step": 606170 + }, + { + "epoch": 1.57, + "learning_rate": 6.43040999945565e-05, + "loss": 0.0073, + "step": 606180 + }, + { + "epoch": 1.57, + "learning_rate": 6.430021177818503e-05, + "loss": 0.0103, + "step": 606190 + }, + { + "epoch": 1.57, + "learning_rate": 6.429632356181357e-05, + "loss": 0.0079, + "step": 606200 + }, + { + "epoch": 1.57, + "learning_rate": 6.42924353454421e-05, + "loss": 0.0087, + "step": 606210 + }, + { + "epoch": 1.57, + "learning_rate": 6.428854712907064e-05, + "loss": 0.0102, + "step": 606220 + }, + { + "epoch": 1.57, + "learning_rate": 6.428465891269917e-05, + "loss": 0.0059, + "step": 606230 + }, + { + "epoch": 1.57, + "learning_rate": 6.428077069632771e-05, + "loss": 0.0071, + "step": 606240 + }, + { + "epoch": 1.57, + "learning_rate": 6.427688247995624e-05, + "loss": 0.0075, + "step": 606250 + }, + { + "epoch": 1.57, + "learning_rate": 6.427299426358476e-05, + "loss": 0.0086, + "step": 606260 + }, + { + "epoch": 1.57, + "learning_rate": 6.42691060472133e-05, + "loss": 0.0089, + "step": 606270 + }, + { + "epoch": 1.57, + "learning_rate": 6.426521783084185e-05, + "loss": 0.0061, + "step": 606280 + }, + { + "epoch": 1.57, + "learning_rate": 6.426132961447038e-05, + "loss": 0.0081, + "step": 606290 + }, + { + "epoch": 1.57, + "learning_rate": 6.425744139809892e-05, + "loss": 0.0093, + "step": 606300 + }, + { + "epoch": 1.57, + "learning_rate": 6.425355318172744e-05, + "loss": 0.0096, + "step": 606310 + }, + { + "epoch": 1.57, + "learning_rate": 6.424966496535599e-05, + "loss": 0.0099, + "step": 606320 + }, + { + "epoch": 1.57, + "learning_rate": 6.424577674898451e-05, + "loss": 0.0082, + "step": 606330 + }, + { + "epoch": 1.57, + "learning_rate": 6.424188853261306e-05, + "loss": 0.0069, + "step": 606340 + }, + { + "epoch": 1.57, + "learning_rate": 6.42380003162416e-05, + "loss": 0.0077, + "step": 606350 + }, + { + "epoch": 1.57, + "learning_rate": 6.423411209987013e-05, + "loss": 0.01, + "step": 606360 + }, + { + "epoch": 1.57, + "learning_rate": 6.423022388349867e-05, + "loss": 0.0076, + "step": 606370 + }, + { + "epoch": 1.57, + "learning_rate": 6.42263356671272e-05, + "loss": 0.0077, + "step": 606380 + }, + { + "epoch": 1.57, + "learning_rate": 6.422244745075574e-05, + "loss": 0.0088, + "step": 606390 + }, + { + "epoch": 1.57, + "learning_rate": 6.421855923438427e-05, + "loss": 0.0103, + "step": 606400 + }, + { + "epoch": 1.57, + "learning_rate": 6.421467101801281e-05, + "loss": 0.0085, + "step": 606410 + }, + { + "epoch": 1.57, + "learning_rate": 6.421078280164134e-05, + "loss": 0.0108, + "step": 606420 + }, + { + "epoch": 1.57, + "learning_rate": 6.420689458526988e-05, + "loss": 0.0055, + "step": 606430 + }, + { + "epoch": 1.57, + "learning_rate": 6.420300636889842e-05, + "loss": 0.0097, + "step": 606440 + }, + { + "epoch": 1.57, + "learning_rate": 6.419911815252695e-05, + "loss": 0.0083, + "step": 606450 + }, + { + "epoch": 1.57, + "learning_rate": 6.419522993615549e-05, + "loss": 0.0073, + "step": 606460 + }, + { + "epoch": 1.57, + "learning_rate": 6.419134171978402e-05, + "loss": 0.0103, + "step": 606470 + }, + { + "epoch": 1.57, + "learning_rate": 6.418745350341256e-05, + "loss": 0.0075, + "step": 606480 + }, + { + "epoch": 1.57, + "learning_rate": 6.418356528704109e-05, + "loss": 0.0084, + "step": 606490 + }, + { + "epoch": 1.57, + "learning_rate": 6.417967707066961e-05, + "loss": 0.0083, + "step": 606500 + }, + { + "epoch": 1.57, + "learning_rate": 6.417578885429816e-05, + "loss": 0.0073, + "step": 606510 + }, + { + "epoch": 1.57, + "learning_rate": 6.417190063792668e-05, + "loss": 0.0129, + "step": 606520 + }, + { + "epoch": 1.57, + "learning_rate": 6.416801242155523e-05, + "loss": 0.0072, + "step": 606530 + }, + { + "epoch": 1.57, + "learning_rate": 6.416412420518377e-05, + "loss": 0.0082, + "step": 606540 + }, + { + "epoch": 1.57, + "learning_rate": 6.41602359888123e-05, + "loss": 0.009, + "step": 606550 + }, + { + "epoch": 1.57, + "learning_rate": 6.415634777244084e-05, + "loss": 0.0065, + "step": 606560 + }, + { + "epoch": 1.57, + "learning_rate": 6.415245955606936e-05, + "loss": 0.0121, + "step": 606570 + }, + { + "epoch": 1.57, + "learning_rate": 6.41485713396979e-05, + "loss": 0.0091, + "step": 606580 + }, + { + "epoch": 1.57, + "learning_rate": 6.414468312332643e-05, + "loss": 0.0092, + "step": 606590 + }, + { + "epoch": 1.57, + "learning_rate": 6.414079490695498e-05, + "loss": 0.009, + "step": 606600 + }, + { + "epoch": 1.57, + "learning_rate": 6.413690669058352e-05, + "loss": 0.0097, + "step": 606610 + }, + { + "epoch": 1.57, + "learning_rate": 6.413301847421205e-05, + "loss": 0.0162, + "step": 606620 + }, + { + "epoch": 1.57, + "learning_rate": 6.412913025784059e-05, + "loss": 0.0067, + "step": 606630 + }, + { + "epoch": 1.57, + "learning_rate": 6.412524204146912e-05, + "loss": 0.0081, + "step": 606640 + }, + { + "epoch": 1.57, + "learning_rate": 6.412135382509766e-05, + "loss": 0.0074, + "step": 606650 + }, + { + "epoch": 1.57, + "learning_rate": 6.411746560872619e-05, + "loss": 0.011, + "step": 606660 + }, + { + "epoch": 1.57, + "learning_rate": 6.411357739235473e-05, + "loss": 0.0106, + "step": 606670 + }, + { + "epoch": 1.57, + "learning_rate": 6.410968917598326e-05, + "loss": 0.0088, + "step": 606680 + }, + { + "epoch": 1.57, + "learning_rate": 6.41058009596118e-05, + "loss": 0.0097, + "step": 606690 + }, + { + "epoch": 1.57, + "learning_rate": 6.410191274324034e-05, + "loss": 0.0089, + "step": 606700 + }, + { + "epoch": 1.57, + "learning_rate": 6.409802452686887e-05, + "loss": 0.0089, + "step": 606710 + }, + { + "epoch": 1.57, + "learning_rate": 6.409413631049741e-05, + "loss": 0.0081, + "step": 606720 + }, + { + "epoch": 1.57, + "learning_rate": 6.409024809412594e-05, + "loss": 0.0072, + "step": 606730 + }, + { + "epoch": 1.57, + "learning_rate": 6.408635987775448e-05, + "loss": 0.0108, + "step": 606740 + }, + { + "epoch": 1.57, + "learning_rate": 6.4082471661383e-05, + "loss": 0.0078, + "step": 606750 + }, + { + "epoch": 1.57, + "learning_rate": 6.407858344501153e-05, + "loss": 0.0079, + "step": 606760 + }, + { + "epoch": 1.57, + "learning_rate": 6.407469522864008e-05, + "loss": 0.0107, + "step": 606770 + }, + { + "epoch": 1.57, + "learning_rate": 6.40708070122686e-05, + "loss": 0.0111, + "step": 606780 + }, + { + "epoch": 1.57, + "learning_rate": 6.406691879589715e-05, + "loss": 0.008, + "step": 606790 + }, + { + "epoch": 1.57, + "learning_rate": 6.406303057952569e-05, + "loss": 0.0095, + "step": 606800 + }, + { + "epoch": 1.57, + "learning_rate": 6.405914236315422e-05, + "loss": 0.008, + "step": 606810 + }, + { + "epoch": 1.57, + "learning_rate": 6.405525414678276e-05, + "loss": 0.0088, + "step": 606820 + }, + { + "epoch": 1.57, + "learning_rate": 6.405136593041128e-05, + "loss": 0.0105, + "step": 606830 + }, + { + "epoch": 1.57, + "learning_rate": 6.404747771403983e-05, + "loss": 0.0061, + "step": 606840 + }, + { + "epoch": 1.57, + "learning_rate": 6.404358949766835e-05, + "loss": 0.0109, + "step": 606850 + }, + { + "epoch": 1.57, + "learning_rate": 6.40397012812969e-05, + "loss": 0.0089, + "step": 606860 + }, + { + "epoch": 1.57, + "learning_rate": 6.403581306492544e-05, + "loss": 0.0093, + "step": 606870 + }, + { + "epoch": 1.57, + "learning_rate": 6.403192484855397e-05, + "loss": 0.011, + "step": 606880 + }, + { + "epoch": 1.57, + "learning_rate": 6.402803663218251e-05, + "loss": 0.0101, + "step": 606890 + }, + { + "epoch": 1.57, + "learning_rate": 6.402414841581104e-05, + "loss": 0.0097, + "step": 606900 + }, + { + "epoch": 1.57, + "learning_rate": 6.402026019943958e-05, + "loss": 0.0097, + "step": 606910 + }, + { + "epoch": 1.57, + "learning_rate": 6.40163719830681e-05, + "loss": 0.0096, + "step": 606920 + }, + { + "epoch": 1.57, + "learning_rate": 6.401248376669665e-05, + "loss": 0.0086, + "step": 606930 + }, + { + "epoch": 1.57, + "learning_rate": 6.400859555032518e-05, + "loss": 0.0077, + "step": 606940 + }, + { + "epoch": 1.57, + "learning_rate": 6.400470733395372e-05, + "loss": 0.01, + "step": 606950 + }, + { + "epoch": 1.57, + "learning_rate": 6.400081911758226e-05, + "loss": 0.0292, + "step": 606960 + }, + { + "epoch": 1.57, + "learning_rate": 6.399693090121079e-05, + "loss": 0.0104, + "step": 606970 + }, + { + "epoch": 1.57, + "learning_rate": 6.399304268483933e-05, + "loss": 0.0074, + "step": 606980 + }, + { + "epoch": 1.57, + "learning_rate": 6.398915446846786e-05, + "loss": 0.0117, + "step": 606990 + }, + { + "epoch": 1.57, + "learning_rate": 6.398526625209638e-05, + "loss": 0.0089, + "step": 607000 + }, + { + "epoch": 1.57, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.00562703050673008, + "eval_runtime": 107.9194, + "eval_samples_per_second": 18.532, + "eval_steps_per_second": 4.633, + "step": 607000 + }, + { + "epoch": 1.57, + "learning_rate": 6.398137803572493e-05, + "loss": 0.0116, + "step": 607010 + }, + { + "epoch": 1.57, + "learning_rate": 6.397748981935345e-05, + "loss": 0.0076, + "step": 607020 + }, + { + "epoch": 1.57, + "learning_rate": 6.3973601602982e-05, + "loss": 0.0134, + "step": 607030 + }, + { + "epoch": 1.57, + "learning_rate": 6.396971338661052e-05, + "loss": 0.0097, + "step": 607040 + }, + { + "epoch": 1.57, + "learning_rate": 6.396582517023907e-05, + "loss": 0.0113, + "step": 607050 + }, + { + "epoch": 1.57, + "learning_rate": 6.396193695386761e-05, + "loss": 0.0079, + "step": 607060 + }, + { + "epoch": 1.57, + "learning_rate": 6.395804873749614e-05, + "loss": 0.0114, + "step": 607070 + }, + { + "epoch": 1.57, + "learning_rate": 6.395416052112468e-05, + "loss": 0.0079, + "step": 607080 + }, + { + "epoch": 1.57, + "learning_rate": 6.39502723047532e-05, + "loss": 0.0101, + "step": 607090 + }, + { + "epoch": 1.57, + "learning_rate": 6.394638408838175e-05, + "loss": 0.0067, + "step": 607100 + }, + { + "epoch": 1.57, + "learning_rate": 6.394249587201027e-05, + "loss": 0.0082, + "step": 607110 + }, + { + "epoch": 1.57, + "learning_rate": 6.393860765563882e-05, + "loss": 0.0103, + "step": 607120 + }, + { + "epoch": 1.57, + "learning_rate": 6.393471943926736e-05, + "loss": 0.0074, + "step": 607130 + }, + { + "epoch": 1.57, + "learning_rate": 6.393083122289589e-05, + "loss": 0.0105, + "step": 607140 + }, + { + "epoch": 1.57, + "learning_rate": 6.392694300652443e-05, + "loss": 0.0072, + "step": 607150 + }, + { + "epoch": 1.57, + "learning_rate": 6.392305479015296e-05, + "loss": 0.008, + "step": 607160 + }, + { + "epoch": 1.57, + "learning_rate": 6.39191665737815e-05, + "loss": 0.0087, + "step": 607170 + }, + { + "epoch": 1.57, + "learning_rate": 6.391527835741003e-05, + "loss": 0.0067, + "step": 607180 + }, + { + "epoch": 1.57, + "learning_rate": 6.391139014103857e-05, + "loss": 0.008, + "step": 607190 + }, + { + "epoch": 1.57, + "learning_rate": 6.39075019246671e-05, + "loss": 0.0083, + "step": 607200 + }, + { + "epoch": 1.57, + "learning_rate": 6.390361370829564e-05, + "loss": 0.0104, + "step": 607210 + }, + { + "epoch": 1.57, + "learning_rate": 6.389972549192418e-05, + "loss": 0.0082, + "step": 607220 + }, + { + "epoch": 1.57, + "learning_rate": 6.38958372755527e-05, + "loss": 0.0093, + "step": 607230 + }, + { + "epoch": 1.57, + "learning_rate": 6.389194905918125e-05, + "loss": 0.0092, + "step": 607240 + }, + { + "epoch": 1.57, + "learning_rate": 6.388806084280978e-05, + "loss": 0.0085, + "step": 607250 + }, + { + "epoch": 1.57, + "learning_rate": 6.38841726264383e-05, + "loss": 0.0104, + "step": 607260 + }, + { + "epoch": 1.57, + "learning_rate": 6.388028441006685e-05, + "loss": 0.0073, + "step": 607270 + }, + { + "epoch": 1.57, + "learning_rate": 6.387639619369537e-05, + "loss": 0.0078, + "step": 607280 + }, + { + "epoch": 1.57, + "learning_rate": 6.387250797732392e-05, + "loss": 0.0078, + "step": 607290 + }, + { + "epoch": 1.57, + "learning_rate": 6.386861976095244e-05, + "loss": 0.0093, + "step": 607300 + }, + { + "epoch": 1.57, + "learning_rate": 6.386473154458099e-05, + "loss": 0.0088, + "step": 607310 + }, + { + "epoch": 1.57, + "learning_rate": 6.386084332820953e-05, + "loss": 0.0074, + "step": 607320 + }, + { + "epoch": 1.57, + "learning_rate": 6.385695511183806e-05, + "loss": 0.009, + "step": 607330 + }, + { + "epoch": 1.57, + "learning_rate": 6.38530668954666e-05, + "loss": 0.0093, + "step": 607340 + }, + { + "epoch": 1.57, + "learning_rate": 6.384917867909512e-05, + "loss": 0.0075, + "step": 607350 + }, + { + "epoch": 1.57, + "learning_rate": 6.384529046272367e-05, + "loss": 0.0088, + "step": 607360 + }, + { + "epoch": 1.57, + "learning_rate": 6.38414022463522e-05, + "loss": 0.0109, + "step": 607370 + }, + { + "epoch": 1.57, + "learning_rate": 6.383751402998074e-05, + "loss": 0.0113, + "step": 607380 + }, + { + "epoch": 1.57, + "learning_rate": 6.383362581360926e-05, + "loss": 0.008, + "step": 607390 + }, + { + "epoch": 1.57, + "learning_rate": 6.38297375972378e-05, + "loss": 0.0072, + "step": 607400 + }, + { + "epoch": 1.57, + "learning_rate": 6.382584938086635e-05, + "loss": 0.0079, + "step": 607410 + }, + { + "epoch": 1.57, + "learning_rate": 6.382196116449488e-05, + "loss": 0.0074, + "step": 607420 + }, + { + "epoch": 1.57, + "learning_rate": 6.381807294812342e-05, + "loss": 0.0095, + "step": 607430 + }, + { + "epoch": 1.57, + "learning_rate": 6.381418473175195e-05, + "loss": 0.01, + "step": 607440 + }, + { + "epoch": 1.57, + "learning_rate": 6.381029651538049e-05, + "loss": 0.0077, + "step": 607450 + }, + { + "epoch": 1.57, + "learning_rate": 6.380640829900902e-05, + "loss": 0.0067, + "step": 607460 + }, + { + "epoch": 1.57, + "learning_rate": 6.380252008263756e-05, + "loss": 0.0076, + "step": 607470 + }, + { + "epoch": 1.57, + "learning_rate": 6.37986318662661e-05, + "loss": 0.0075, + "step": 607480 + }, + { + "epoch": 1.57, + "learning_rate": 6.379474364989461e-05, + "loss": 0.0074, + "step": 607490 + }, + { + "epoch": 1.57, + "learning_rate": 6.379085543352315e-05, + "loss": 0.007, + "step": 607500 + }, + { + "epoch": 1.57, + "learning_rate": 6.37869672171517e-05, + "loss": 0.0075, + "step": 607510 + }, + { + "epoch": 1.57, + "learning_rate": 6.378307900078022e-05, + "loss": 0.0108, + "step": 607520 + }, + { + "epoch": 1.57, + "learning_rate": 6.377919078440877e-05, + "loss": 0.0067, + "step": 607530 + }, + { + "epoch": 1.57, + "learning_rate": 6.37753025680373e-05, + "loss": 0.01, + "step": 607540 + }, + { + "epoch": 1.57, + "learning_rate": 6.377141435166584e-05, + "loss": 0.0115, + "step": 607550 + }, + { + "epoch": 1.57, + "learning_rate": 6.376752613529436e-05, + "loss": 0.0072, + "step": 607560 + }, + { + "epoch": 1.57, + "learning_rate": 6.37636379189229e-05, + "loss": 0.0065, + "step": 607570 + }, + { + "epoch": 1.57, + "learning_rate": 6.375974970255145e-05, + "loss": 0.011, + "step": 607580 + }, + { + "epoch": 1.57, + "learning_rate": 6.375586148617998e-05, + "loss": 0.0087, + "step": 607590 + }, + { + "epoch": 1.57, + "learning_rate": 6.375197326980852e-05, + "loss": 0.0091, + "step": 607600 + }, + { + "epoch": 1.58, + "learning_rate": 6.374808505343704e-05, + "loss": 0.0111, + "step": 607610 + }, + { + "epoch": 1.58, + "learning_rate": 6.374419683706559e-05, + "loss": 0.0079, + "step": 607620 + }, + { + "epoch": 1.58, + "learning_rate": 6.374030862069411e-05, + "loss": 0.0089, + "step": 607630 + }, + { + "epoch": 1.58, + "learning_rate": 6.373642040432266e-05, + "loss": 0.0104, + "step": 607640 + }, + { + "epoch": 1.58, + "learning_rate": 6.373253218795118e-05, + "loss": 0.0083, + "step": 607650 + }, + { + "epoch": 1.58, + "learning_rate": 6.372864397157973e-05, + "loss": 0.0099, + "step": 607660 + }, + { + "epoch": 1.58, + "learning_rate": 6.372475575520827e-05, + "loss": 0.0081, + "step": 607670 + }, + { + "epoch": 1.58, + "learning_rate": 6.37208675388368e-05, + "loss": 0.0065, + "step": 607680 + }, + { + "epoch": 1.58, + "learning_rate": 6.371697932246534e-05, + "loss": 0.0099, + "step": 607690 + }, + { + "epoch": 1.58, + "learning_rate": 6.371309110609387e-05, + "loss": 0.0094, + "step": 607700 + }, + { + "epoch": 1.58, + "learning_rate": 6.370920288972241e-05, + "loss": 0.0085, + "step": 607710 + }, + { + "epoch": 1.58, + "learning_rate": 6.370531467335093e-05, + "loss": 0.0085, + "step": 607720 + }, + { + "epoch": 1.58, + "learning_rate": 6.370142645697948e-05, + "loss": 0.0126, + "step": 607730 + }, + { + "epoch": 1.58, + "learning_rate": 6.3697538240608e-05, + "loss": 0.0096, + "step": 607740 + }, + { + "epoch": 1.58, + "learning_rate": 6.369365002423653e-05, + "loss": 0.0065, + "step": 607750 + }, + { + "epoch": 1.58, + "learning_rate": 6.368976180786507e-05, + "loss": 0.007, + "step": 607760 + }, + { + "epoch": 1.58, + "learning_rate": 6.368587359149362e-05, + "loss": 0.0064, + "step": 607770 + }, + { + "epoch": 1.58, + "learning_rate": 6.368198537512214e-05, + "loss": 0.0093, + "step": 607780 + }, + { + "epoch": 1.58, + "learning_rate": 6.367809715875069e-05, + "loss": 0.0093, + "step": 607790 + }, + { + "epoch": 1.58, + "learning_rate": 6.367420894237921e-05, + "loss": 0.0072, + "step": 607800 + }, + { + "epoch": 1.58, + "learning_rate": 6.367032072600776e-05, + "loss": 0.0105, + "step": 607810 + }, + { + "epoch": 1.58, + "learning_rate": 6.366643250963628e-05, + "loss": 0.0072, + "step": 607820 + }, + { + "epoch": 1.58, + "learning_rate": 6.366254429326483e-05, + "loss": 0.0067, + "step": 607830 + }, + { + "epoch": 1.58, + "learning_rate": 6.365865607689337e-05, + "loss": 0.0075, + "step": 607840 + }, + { + "epoch": 1.58, + "learning_rate": 6.36547678605219e-05, + "loss": 0.0075, + "step": 607850 + }, + { + "epoch": 1.58, + "learning_rate": 6.365087964415044e-05, + "loss": 0.0102, + "step": 607860 + }, + { + "epoch": 1.58, + "learning_rate": 6.364699142777896e-05, + "loss": 0.0088, + "step": 607870 + }, + { + "epoch": 1.58, + "learning_rate": 6.36431032114075e-05, + "loss": 0.0076, + "step": 607880 + }, + { + "epoch": 1.58, + "learning_rate": 6.363921499503603e-05, + "loss": 0.0075, + "step": 607890 + }, + { + "epoch": 1.58, + "learning_rate": 6.363532677866458e-05, + "loss": 0.0095, + "step": 607900 + }, + { + "epoch": 1.58, + "learning_rate": 6.36314385622931e-05, + "loss": 0.0078, + "step": 607910 + }, + { + "epoch": 1.58, + "learning_rate": 6.362755034592165e-05, + "loss": 0.0077, + "step": 607920 + }, + { + "epoch": 1.58, + "learning_rate": 6.362366212955019e-05, + "loss": 0.0079, + "step": 607930 + }, + { + "epoch": 1.58, + "learning_rate": 6.361977391317872e-05, + "loss": 0.0069, + "step": 607940 + }, + { + "epoch": 1.58, + "learning_rate": 6.361588569680726e-05, + "loss": 0.0073, + "step": 607950 + }, + { + "epoch": 1.58, + "learning_rate": 6.361199748043579e-05, + "loss": 0.0083, + "step": 607960 + }, + { + "epoch": 1.58, + "learning_rate": 6.360810926406433e-05, + "loss": 0.011, + "step": 607970 + }, + { + "epoch": 1.58, + "learning_rate": 6.360422104769285e-05, + "loss": 0.0072, + "step": 607980 + }, + { + "epoch": 1.58, + "learning_rate": 6.360033283132138e-05, + "loss": 0.0073, + "step": 607990 + }, + { + "epoch": 1.58, + "learning_rate": 6.359644461494992e-05, + "loss": 0.0085, + "step": 608000 + }, + { + "epoch": 1.58, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.00566211948171258, + "eval_runtime": 107.9004, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, + "step": 608000 + }, + { + "epoch": 1.58, + "learning_rate": 6.359255639857845e-05, + "loss": 0.0093, + "step": 608010 + }, + { + "epoch": 1.58, + "learning_rate": 6.3588668182207e-05, + "loss": 0.0104, + "step": 608020 + }, + { + "epoch": 1.58, + "learning_rate": 6.358477996583554e-05, + "loss": 0.0075, + "step": 608030 + }, + { + "epoch": 1.58, + "learning_rate": 6.358089174946406e-05, + "loss": 0.0093, + "step": 608040 + }, + { + "epoch": 1.58, + "learning_rate": 6.35770035330926e-05, + "loss": 0.0088, + "step": 608050 + }, + { + "epoch": 1.58, + "learning_rate": 6.357311531672113e-05, + "loss": 0.0116, + "step": 608060 + }, + { + "epoch": 1.58, + "learning_rate": 6.356922710034968e-05, + "loss": 0.0075, + "step": 608070 + }, + { + "epoch": 1.58, + "learning_rate": 6.35653388839782e-05, + "loss": 0.0087, + "step": 608080 + }, + { + "epoch": 1.58, + "learning_rate": 6.356145066760675e-05, + "loss": 0.0078, + "step": 608090 + }, + { + "epoch": 1.58, + "learning_rate": 6.355756245123529e-05, + "loss": 0.0079, + "step": 608100 + }, + { + "epoch": 1.58, + "learning_rate": 6.355367423486381e-05, + "loss": 0.0094, + "step": 608110 + }, + { + "epoch": 1.58, + "learning_rate": 6.354978601849236e-05, + "loss": 0.0062, + "step": 608120 + }, + { + "epoch": 1.58, + "learning_rate": 6.354589780212088e-05, + "loss": 0.0075, + "step": 608130 + }, + { + "epoch": 1.58, + "learning_rate": 6.354200958574943e-05, + "loss": 0.0066, + "step": 608140 + }, + { + "epoch": 1.58, + "learning_rate": 6.353812136937795e-05, + "loss": 0.0077, + "step": 608150 + }, + { + "epoch": 1.58, + "learning_rate": 6.35342331530065e-05, + "loss": 0.0084, + "step": 608160 + }, + { + "epoch": 1.58, + "learning_rate": 6.353034493663502e-05, + "loss": 0.0091, + "step": 608170 + }, + { + "epoch": 1.58, + "learning_rate": 6.352645672026357e-05, + "loss": 0.0101, + "step": 608180 + }, + { + "epoch": 1.58, + "learning_rate": 6.352256850389211e-05, + "loss": 0.008, + "step": 608190 + }, + { + "epoch": 1.58, + "learning_rate": 6.351868028752064e-05, + "loss": 0.0082, + "step": 608200 + }, + { + "epoch": 1.58, + "learning_rate": 6.351479207114918e-05, + "loss": 0.0056, + "step": 608210 + }, + { + "epoch": 1.58, + "learning_rate": 6.35109038547777e-05, + "loss": 0.0082, + "step": 608220 + }, + { + "epoch": 1.58, + "learning_rate": 6.350701563840625e-05, + "loss": 0.0096, + "step": 608230 + }, + { + "epoch": 1.58, + "learning_rate": 6.350312742203477e-05, + "loss": 0.0103, + "step": 608240 + }, + { + "epoch": 1.58, + "learning_rate": 6.34992392056633e-05, + "loss": 0.0067, + "step": 608250 + }, + { + "epoch": 1.58, + "learning_rate": 6.349535098929184e-05, + "loss": 0.0069, + "step": 608260 + }, + { + "epoch": 1.58, + "learning_rate": 6.349146277292037e-05, + "loss": 0.0072, + "step": 608270 + }, + { + "epoch": 1.58, + "learning_rate": 6.348757455654891e-05, + "loss": 0.0074, + "step": 608280 + }, + { + "epoch": 1.58, + "learning_rate": 6.348368634017746e-05, + "loss": 0.0101, + "step": 608290 + }, + { + "epoch": 1.58, + "learning_rate": 6.347979812380598e-05, + "loss": 0.0082, + "step": 608300 + }, + { + "epoch": 1.58, + "learning_rate": 6.347590990743453e-05, + "loss": 0.0149, + "step": 608310 + }, + { + "epoch": 1.58, + "learning_rate": 6.347202169106305e-05, + "loss": 0.0079, + "step": 608320 + }, + { + "epoch": 1.58, + "learning_rate": 6.34681334746916e-05, + "loss": 0.0097, + "step": 608330 + }, + { + "epoch": 1.58, + "learning_rate": 6.346424525832012e-05, + "loss": 0.0074, + "step": 608340 + }, + { + "epoch": 1.58, + "learning_rate": 6.346035704194867e-05, + "loss": 0.008, + "step": 608350 + }, + { + "epoch": 1.58, + "learning_rate": 6.345646882557721e-05, + "loss": 0.0067, + "step": 608360 + }, + { + "epoch": 1.58, + "learning_rate": 6.345258060920573e-05, + "loss": 0.0087, + "step": 608370 + }, + { + "epoch": 1.58, + "learning_rate": 6.344869239283428e-05, + "loss": 0.0135, + "step": 608380 + }, + { + "epoch": 1.58, + "learning_rate": 6.34448041764628e-05, + "loss": 0.0079, + "step": 608390 + }, + { + "epoch": 1.58, + "learning_rate": 6.344091596009135e-05, + "loss": 0.0115, + "step": 608400 + }, + { + "epoch": 1.58, + "learning_rate": 6.343702774371987e-05, + "loss": 0.0098, + "step": 608410 + }, + { + "epoch": 1.58, + "learning_rate": 6.343313952734842e-05, + "loss": 0.0106, + "step": 608420 + }, + { + "epoch": 1.58, + "learning_rate": 6.342925131097694e-05, + "loss": 0.0091, + "step": 608430 + }, + { + "epoch": 1.58, + "learning_rate": 6.342536309460549e-05, + "loss": 0.0094, + "step": 608440 + }, + { + "epoch": 1.58, + "learning_rate": 6.342147487823403e-05, + "loss": 0.0104, + "step": 608450 + }, + { + "epoch": 1.58, + "learning_rate": 6.341758666186256e-05, + "loss": 0.0076, + "step": 608460 + }, + { + "epoch": 1.58, + "learning_rate": 6.34136984454911e-05, + "loss": 0.008, + "step": 608470 + }, + { + "epoch": 1.58, + "learning_rate": 6.340981022911963e-05, + "loss": 0.0115, + "step": 608480 + }, + { + "epoch": 1.58, + "learning_rate": 6.340592201274815e-05, + "loss": 0.0095, + "step": 608490 + }, + { + "epoch": 1.58, + "learning_rate": 6.34020337963767e-05, + "loss": 0.0061, + "step": 608500 + }, + { + "epoch": 1.58, + "learning_rate": 6.339814558000522e-05, + "loss": 0.0105, + "step": 608510 + }, + { + "epoch": 1.58, + "learning_rate": 6.339425736363376e-05, + "loss": 0.0063, + "step": 608520 + }, + { + "epoch": 1.58, + "learning_rate": 6.339036914726229e-05, + "loss": 0.0085, + "step": 608530 + }, + { + "epoch": 1.58, + "learning_rate": 6.338648093089083e-05, + "loss": 0.0102, + "step": 608540 + }, + { + "epoch": 1.58, + "learning_rate": 6.338259271451938e-05, + "loss": 0.0076, + "step": 608550 + }, + { + "epoch": 1.58, + "learning_rate": 6.33787044981479e-05, + "loss": 0.01, + "step": 608560 + }, + { + "epoch": 1.58, + "learning_rate": 6.337481628177645e-05, + "loss": 0.0069, + "step": 608570 + }, + { + "epoch": 1.58, + "learning_rate": 6.337092806540497e-05, + "loss": 0.0078, + "step": 608580 + }, + { + "epoch": 1.58, + "learning_rate": 6.336703984903352e-05, + "loss": 0.0099, + "step": 608590 + }, + { + "epoch": 1.58, + "learning_rate": 6.336315163266204e-05, + "loss": 0.0074, + "step": 608600 + }, + { + "epoch": 1.58, + "learning_rate": 6.335926341629059e-05, + "loss": 0.0066, + "step": 608610 + }, + { + "epoch": 1.58, + "learning_rate": 6.335537519991913e-05, + "loss": 0.0099, + "step": 608620 + }, + { + "epoch": 1.58, + "learning_rate": 6.335148698354765e-05, + "loss": 0.0069, + "step": 608630 + }, + { + "epoch": 1.58, + "learning_rate": 6.33475987671762e-05, + "loss": 0.0099, + "step": 608640 + }, + { + "epoch": 1.58, + "learning_rate": 6.334371055080472e-05, + "loss": 0.0067, + "step": 608650 + }, + { + "epoch": 1.58, + "learning_rate": 6.333982233443327e-05, + "loss": 0.0074, + "step": 608660 + }, + { + "epoch": 1.58, + "learning_rate": 6.33359341180618e-05, + "loss": 0.0087, + "step": 608670 + }, + { + "epoch": 1.58, + "learning_rate": 6.333204590169034e-05, + "loss": 0.0087, + "step": 608680 + }, + { + "epoch": 1.58, + "learning_rate": 6.332815768531886e-05, + "loss": 0.0127, + "step": 608690 + }, + { + "epoch": 1.58, + "learning_rate": 6.33242694689474e-05, + "loss": 0.0119, + "step": 608700 + }, + { + "epoch": 1.58, + "learning_rate": 6.332038125257595e-05, + "loss": 0.0083, + "step": 608710 + }, + { + "epoch": 1.58, + "learning_rate": 6.331649303620448e-05, + "loss": 0.0081, + "step": 608720 + }, + { + "epoch": 1.58, + "learning_rate": 6.3312604819833e-05, + "loss": 0.007, + "step": 608730 + }, + { + "epoch": 1.58, + "learning_rate": 6.330871660346155e-05, + "loss": 0.007, + "step": 608740 + }, + { + "epoch": 1.58, + "learning_rate": 6.330482838709007e-05, + "loss": 0.0093, + "step": 608750 + }, + { + "epoch": 1.58, + "learning_rate": 6.330094017071861e-05, + "loss": 0.0086, + "step": 608760 + }, + { + "epoch": 1.58, + "learning_rate": 6.329705195434714e-05, + "loss": 0.0089, + "step": 608770 + }, + { + "epoch": 1.58, + "learning_rate": 6.329316373797568e-05, + "loss": 0.0134, + "step": 608780 + }, + { + "epoch": 1.58, + "learning_rate": 6.328927552160421e-05, + "loss": 0.0069, + "step": 608790 + }, + { + "epoch": 1.58, + "learning_rate": 6.328538730523275e-05, + "loss": 0.008, + "step": 608800 + }, + { + "epoch": 1.58, + "learning_rate": 6.32814990888613e-05, + "loss": 0.0083, + "step": 608810 + }, + { + "epoch": 1.58, + "learning_rate": 6.327761087248982e-05, + "loss": 0.0086, + "step": 608820 + }, + { + "epoch": 1.58, + "learning_rate": 6.327372265611837e-05, + "loss": 0.0087, + "step": 608830 + }, + { + "epoch": 1.58, + "learning_rate": 6.32698344397469e-05, + "loss": 0.0118, + "step": 608840 + }, + { + "epoch": 1.58, + "learning_rate": 6.326594622337544e-05, + "loss": 0.0106, + "step": 608850 + }, + { + "epoch": 1.58, + "learning_rate": 6.326205800700396e-05, + "loss": 0.0078, + "step": 608860 + }, + { + "epoch": 1.58, + "learning_rate": 6.32581697906325e-05, + "loss": 0.0082, + "step": 608870 + }, + { + "epoch": 1.58, + "learning_rate": 6.325428157426103e-05, + "loss": 0.0062, + "step": 608880 + }, + { + "epoch": 1.58, + "learning_rate": 6.325039335788957e-05, + "loss": 0.0092, + "step": 608890 + }, + { + "epoch": 1.58, + "learning_rate": 6.324650514151812e-05, + "loss": 0.0085, + "step": 608900 + }, + { + "epoch": 1.58, + "learning_rate": 6.324261692514664e-05, + "loss": 0.0095, + "step": 608910 + }, + { + "epoch": 1.58, + "learning_rate": 6.323872870877519e-05, + "loss": 0.0161, + "step": 608920 + }, + { + "epoch": 1.58, + "learning_rate": 6.323484049240371e-05, + "loss": 0.0093, + "step": 608930 + }, + { + "epoch": 1.58, + "learning_rate": 6.323095227603226e-05, + "loss": 0.0085, + "step": 608940 + }, + { + "epoch": 1.58, + "learning_rate": 6.322706405966078e-05, + "loss": 0.0085, + "step": 608950 + }, + { + "epoch": 1.58, + "learning_rate": 6.322317584328933e-05, + "loss": 0.0081, + "step": 608960 + }, + { + "epoch": 1.58, + "learning_rate": 6.321928762691787e-05, + "loss": 0.006, + "step": 608970 + }, + { + "epoch": 1.58, + "learning_rate": 6.321539941054638e-05, + "loss": 0.01, + "step": 608980 + }, + { + "epoch": 1.58, + "learning_rate": 6.321151119417492e-05, + "loss": 0.006, + "step": 608990 + }, + { + "epoch": 1.58, + "learning_rate": 6.320762297780347e-05, + "loss": 0.0114, + "step": 609000 + }, + { + "epoch": 1.58, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.005694786552339792, + "eval_runtime": 107.9833, + "eval_samples_per_second": 18.521, + "eval_steps_per_second": 4.63, + "step": 609000 + }, + { + "epoch": 1.58, + "learning_rate": 6.320373476143199e-05, + "loss": 0.0093, + "step": 609010 + }, + { + "epoch": 1.58, + "learning_rate": 6.319984654506053e-05, + "loss": 0.0085, + "step": 609020 + }, + { + "epoch": 1.58, + "learning_rate": 6.319595832868906e-05, + "loss": 0.0108, + "step": 609030 + }, + { + "epoch": 1.58, + "learning_rate": 6.31920701123176e-05, + "loss": 0.0069, + "step": 609040 + }, + { + "epoch": 1.58, + "learning_rate": 6.318818189594613e-05, + "loss": 0.0056, + "step": 609050 + }, + { + "epoch": 1.58, + "learning_rate": 6.318429367957467e-05, + "loss": 0.0079, + "step": 609060 + }, + { + "epoch": 1.58, + "learning_rate": 6.318040546320322e-05, + "loss": 0.0079, + "step": 609070 + }, + { + "epoch": 1.58, + "learning_rate": 6.317651724683174e-05, + "loss": 0.0078, + "step": 609080 + }, + { + "epoch": 1.58, + "learning_rate": 6.317262903046029e-05, + "loss": 0.0129, + "step": 609090 + }, + { + "epoch": 1.58, + "learning_rate": 6.316874081408881e-05, + "loss": 0.0087, + "step": 609100 + }, + { + "epoch": 1.58, + "learning_rate": 6.316485259771736e-05, + "loss": 0.008, + "step": 609110 + }, + { + "epoch": 1.58, + "learning_rate": 6.316096438134588e-05, + "loss": 0.0079, + "step": 609120 + }, + { + "epoch": 1.58, + "learning_rate": 6.315707616497442e-05, + "loss": 0.0104, + "step": 609130 + }, + { + "epoch": 1.58, + "learning_rate": 6.315318794860295e-05, + "loss": 0.0074, + "step": 609140 + }, + { + "epoch": 1.58, + "learning_rate": 6.31492997322315e-05, + "loss": 0.0069, + "step": 609150 + }, + { + "epoch": 1.58, + "learning_rate": 6.314541151586004e-05, + "loss": 0.0095, + "step": 609160 + }, + { + "epoch": 1.58, + "learning_rate": 6.314152329948856e-05, + "loss": 0.0094, + "step": 609170 + }, + { + "epoch": 1.58, + "learning_rate": 6.31376350831171e-05, + "loss": 0.0081, + "step": 609180 + }, + { + "epoch": 1.58, + "learning_rate": 6.313374686674563e-05, + "loss": 0.0087, + "step": 609190 + }, + { + "epoch": 1.58, + "learning_rate": 6.312985865037418e-05, + "loss": 0.0069, + "step": 609200 + }, + { + "epoch": 1.58, + "learning_rate": 6.31259704340027e-05, + "loss": 0.0088, + "step": 609210 + }, + { + "epoch": 1.58, + "learning_rate": 6.312208221763125e-05, + "loss": 0.0069, + "step": 609220 + }, + { + "epoch": 1.58, + "learning_rate": 6.311819400125977e-05, + "loss": 0.0083, + "step": 609230 + }, + { + "epoch": 1.58, + "learning_rate": 6.31143057848883e-05, + "loss": 0.0057, + "step": 609240 + }, + { + "epoch": 1.58, + "learning_rate": 6.311041756851684e-05, + "loss": 0.0091, + "step": 609250 + }, + { + "epoch": 1.58, + "learning_rate": 6.310652935214538e-05, + "loss": 0.0085, + "step": 609260 + }, + { + "epoch": 1.58, + "learning_rate": 6.310264113577391e-05, + "loss": 0.0078, + "step": 609270 + }, + { + "epoch": 1.58, + "learning_rate": 6.309875291940245e-05, + "loss": 0.0067, + "step": 609280 + }, + { + "epoch": 1.58, + "learning_rate": 6.309486470303098e-05, + "loss": 0.0065, + "step": 609290 + }, + { + "epoch": 1.58, + "learning_rate": 6.309097648665952e-05, + "loss": 0.0079, + "step": 609300 + }, + { + "epoch": 1.58, + "learning_rate": 6.308708827028805e-05, + "loss": 0.0086, + "step": 609310 + }, + { + "epoch": 1.58, + "learning_rate": 6.30832000539166e-05, + "loss": 0.0082, + "step": 609320 + }, + { + "epoch": 1.58, + "learning_rate": 6.307931183754514e-05, + "loss": 0.0085, + "step": 609330 + }, + { + "epoch": 1.58, + "learning_rate": 6.307542362117366e-05, + "loss": 0.0072, + "step": 609340 + }, + { + "epoch": 1.58, + "learning_rate": 6.30715354048022e-05, + "loss": 0.0059, + "step": 609350 + }, + { + "epoch": 1.58, + "learning_rate": 6.306764718843073e-05, + "loss": 0.0105, + "step": 609360 + }, + { + "epoch": 1.58, + "learning_rate": 6.306375897205928e-05, + "loss": 0.0061, + "step": 609370 + }, + { + "epoch": 1.58, + "learning_rate": 6.30598707556878e-05, + "loss": 0.0107, + "step": 609380 + }, + { + "epoch": 1.58, + "learning_rate": 6.305598253931634e-05, + "loss": 0.0069, + "step": 609390 + }, + { + "epoch": 1.58, + "learning_rate": 6.305209432294487e-05, + "loss": 0.0093, + "step": 609400 + }, + { + "epoch": 1.58, + "learning_rate": 6.304820610657341e-05, + "loss": 0.0071, + "step": 609410 + }, + { + "epoch": 1.58, + "learning_rate": 6.304431789020196e-05, + "loss": 0.0089, + "step": 609420 + }, + { + "epoch": 1.58, + "learning_rate": 6.304042967383048e-05, + "loss": 0.0087, + "step": 609430 + }, + { + "epoch": 1.58, + "learning_rate": 6.303654145745903e-05, + "loss": 0.01, + "step": 609440 + }, + { + "epoch": 1.58, + "learning_rate": 6.303265324108755e-05, + "loss": 0.0092, + "step": 609450 + }, + { + "epoch": 1.58, + "learning_rate": 6.30287650247161e-05, + "loss": 0.0066, + "step": 609460 + }, + { + "epoch": 1.58, + "learning_rate": 6.302487680834462e-05, + "loss": 0.0083, + "step": 609470 + }, + { + "epoch": 1.58, + "learning_rate": 6.302098859197315e-05, + "loss": 0.0084, + "step": 609480 + }, + { + "epoch": 1.58, + "learning_rate": 6.30171003756017e-05, + "loss": 0.01, + "step": 609490 + }, + { + "epoch": 1.58, + "learning_rate": 6.301321215923022e-05, + "loss": 0.0096, + "step": 609500 + }, + { + "epoch": 1.58, + "learning_rate": 6.300932394285876e-05, + "loss": 0.0078, + "step": 609510 + }, + { + "epoch": 1.58, + "learning_rate": 6.30054357264873e-05, + "loss": 0.0108, + "step": 609520 + }, + { + "epoch": 1.58, + "learning_rate": 6.300154751011583e-05, + "loss": 0.0085, + "step": 609530 + }, + { + "epoch": 1.58, + "learning_rate": 6.299765929374437e-05, + "loss": 0.0094, + "step": 609540 + }, + { + "epoch": 1.58, + "learning_rate": 6.29937710773729e-05, + "loss": 0.0098, + "step": 609550 + }, + { + "epoch": 1.58, + "learning_rate": 6.298988286100144e-05, + "loss": 0.0078, + "step": 609560 + }, + { + "epoch": 1.58, + "learning_rate": 6.298599464462997e-05, + "loss": 0.0143, + "step": 609570 + }, + { + "epoch": 1.58, + "learning_rate": 6.298210642825851e-05, + "loss": 0.0069, + "step": 609580 + }, + { + "epoch": 1.58, + "learning_rate": 6.297821821188706e-05, + "loss": 0.0091, + "step": 609590 + }, + { + "epoch": 1.58, + "learning_rate": 6.297432999551558e-05, + "loss": 0.007, + "step": 609600 + }, + { + "epoch": 1.58, + "learning_rate": 6.297044177914413e-05, + "loss": 0.0113, + "step": 609610 + }, + { + "epoch": 1.58, + "learning_rate": 6.296655356277265e-05, + "loss": 0.0108, + "step": 609620 + }, + { + "epoch": 1.58, + "learning_rate": 6.29626653464012e-05, + "loss": 0.0111, + "step": 609630 + }, + { + "epoch": 1.58, + "learning_rate": 6.295877713002972e-05, + "loss": 0.0092, + "step": 609640 + }, + { + "epoch": 1.58, + "learning_rate": 6.295488891365826e-05, + "loss": 0.0096, + "step": 609650 + }, + { + "epoch": 1.58, + "learning_rate": 6.295100069728679e-05, + "loss": 0.0084, + "step": 609660 + }, + { + "epoch": 1.58, + "learning_rate": 6.294711248091533e-05, + "loss": 0.0084, + "step": 609670 + }, + { + "epoch": 1.58, + "learning_rate": 6.294322426454388e-05, + "loss": 0.0065, + "step": 609680 + }, + { + "epoch": 1.58, + "learning_rate": 6.29393360481724e-05, + "loss": 0.0062, + "step": 609690 + }, + { + "epoch": 1.58, + "learning_rate": 6.293544783180095e-05, + "loss": 0.0087, + "step": 609700 + }, + { + "epoch": 1.58, + "learning_rate": 6.293155961542947e-05, + "loss": 0.009, + "step": 609710 + }, + { + "epoch": 1.58, + "learning_rate": 6.292767139905802e-05, + "loss": 0.0075, + "step": 609720 + }, + { + "epoch": 1.58, + "learning_rate": 6.292378318268654e-05, + "loss": 0.0063, + "step": 609730 + }, + { + "epoch": 1.58, + "learning_rate": 6.291989496631507e-05, + "loss": 0.0054, + "step": 609740 + }, + { + "epoch": 1.58, + "learning_rate": 6.291600674994361e-05, + "loss": 0.0105, + "step": 609750 + }, + { + "epoch": 1.58, + "learning_rate": 6.291211853357214e-05, + "loss": 0.008, + "step": 609760 + }, + { + "epoch": 1.58, + "learning_rate": 6.290823031720068e-05, + "loss": 0.0063, + "step": 609770 + }, + { + "epoch": 1.58, + "learning_rate": 6.290434210082922e-05, + "loss": 0.0085, + "step": 609780 + }, + { + "epoch": 1.58, + "learning_rate": 6.290045388445775e-05, + "loss": 0.0074, + "step": 609790 + }, + { + "epoch": 1.58, + "learning_rate": 6.28965656680863e-05, + "loss": 0.0081, + "step": 609800 + }, + { + "epoch": 1.58, + "learning_rate": 6.289267745171482e-05, + "loss": 0.0069, + "step": 609810 + }, + { + "epoch": 1.58, + "learning_rate": 6.288878923534336e-05, + "loss": 0.0093, + "step": 609820 + }, + { + "epoch": 1.58, + "learning_rate": 6.288490101897189e-05, + "loss": 0.0061, + "step": 609830 + }, + { + "epoch": 1.58, + "learning_rate": 6.288101280260043e-05, + "loss": 0.0077, + "step": 609840 + }, + { + "epoch": 1.58, + "learning_rate": 6.287712458622898e-05, + "loss": 0.0091, + "step": 609850 + }, + { + "epoch": 1.58, + "learning_rate": 6.28732363698575e-05, + "loss": 0.0086, + "step": 609860 + }, + { + "epoch": 1.58, + "learning_rate": 6.286934815348605e-05, + "loss": 0.0097, + "step": 609870 + }, + { + "epoch": 1.58, + "learning_rate": 6.286545993711457e-05, + "loss": 0.0081, + "step": 609880 + }, + { + "epoch": 1.58, + "learning_rate": 6.286157172074312e-05, + "loss": 0.0089, + "step": 609890 + }, + { + "epoch": 1.58, + "learning_rate": 6.285768350437164e-05, + "loss": 0.0091, + "step": 609900 + }, + { + "epoch": 1.58, + "learning_rate": 6.285379528800018e-05, + "loss": 0.0071, + "step": 609910 + }, + { + "epoch": 1.58, + "learning_rate": 6.284990707162871e-05, + "loss": 0.0076, + "step": 609920 + }, + { + "epoch": 1.58, + "learning_rate": 6.284601885525725e-05, + "loss": 0.0086, + "step": 609930 + }, + { + "epoch": 1.58, + "learning_rate": 6.28421306388858e-05, + "loss": 0.0063, + "step": 609940 + }, + { + "epoch": 1.58, + "learning_rate": 6.283824242251432e-05, + "loss": 0.0101, + "step": 609950 + }, + { + "epoch": 1.58, + "learning_rate": 6.283435420614287e-05, + "loss": 0.0117, + "step": 609960 + }, + { + "epoch": 1.58, + "learning_rate": 6.28304659897714e-05, + "loss": 0.0076, + "step": 609970 + }, + { + "epoch": 1.58, + "learning_rate": 6.282657777339992e-05, + "loss": 0.0063, + "step": 609980 + }, + { + "epoch": 1.58, + "learning_rate": 6.282268955702846e-05, + "loss": 0.0114, + "step": 609990 + }, + { + "epoch": 1.58, + "learning_rate": 6.281880134065699e-05, + "loss": 0.0159, + "step": 610000 + }, + { + "epoch": 1.58, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.005619341507554054, + "eval_runtime": 107.799, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 610000 + }, + { + "epoch": 1.58, + "learning_rate": 6.281491312428553e-05, + "loss": 0.0054, + "step": 610010 + }, + { + "epoch": 1.58, + "learning_rate": 6.281102490791406e-05, + "loss": 0.008, + "step": 610020 + }, + { + "epoch": 1.58, + "learning_rate": 6.28071366915426e-05, + "loss": 0.0133, + "step": 610030 + }, + { + "epoch": 1.58, + "learning_rate": 6.280324847517114e-05, + "loss": 0.0086, + "step": 610040 + }, + { + "epoch": 1.58, + "learning_rate": 6.279936025879967e-05, + "loss": 0.0084, + "step": 610050 + }, + { + "epoch": 1.58, + "learning_rate": 6.279547204242821e-05, + "loss": 0.0081, + "step": 610060 + }, + { + "epoch": 1.58, + "learning_rate": 6.279158382605674e-05, + "loss": 0.0099, + "step": 610070 + }, + { + "epoch": 1.58, + "learning_rate": 6.278769560968528e-05, + "loss": 0.0092, + "step": 610080 + }, + { + "epoch": 1.58, + "learning_rate": 6.278380739331381e-05, + "loss": 0.0096, + "step": 610090 + }, + { + "epoch": 1.58, + "learning_rate": 6.277991917694235e-05, + "loss": 0.0092, + "step": 610100 + }, + { + "epoch": 1.58, + "learning_rate": 6.27760309605709e-05, + "loss": 0.0076, + "step": 610110 + }, + { + "epoch": 1.58, + "learning_rate": 6.277214274419942e-05, + "loss": 0.009, + "step": 610120 + }, + { + "epoch": 1.58, + "learning_rate": 6.276825452782797e-05, + "loss": 0.0109, + "step": 610130 + }, + { + "epoch": 1.58, + "learning_rate": 6.27643663114565e-05, + "loss": 0.0092, + "step": 610140 + }, + { + "epoch": 1.58, + "learning_rate": 6.276047809508504e-05, + "loss": 0.0126, + "step": 610150 + }, + { + "epoch": 1.58, + "learning_rate": 6.275658987871356e-05, + "loss": 0.0071, + "step": 610160 + }, + { + "epoch": 1.58, + "learning_rate": 6.27527016623421e-05, + "loss": 0.007, + "step": 610170 + }, + { + "epoch": 1.58, + "learning_rate": 6.274881344597063e-05, + "loss": 0.0106, + "step": 610180 + }, + { + "epoch": 1.58, + "learning_rate": 6.274492522959917e-05, + "loss": 0.0088, + "step": 610190 + }, + { + "epoch": 1.58, + "learning_rate": 6.274103701322772e-05, + "loss": 0.0074, + "step": 610200 + }, + { + "epoch": 1.58, + "learning_rate": 6.273714879685624e-05, + "loss": 0.0089, + "step": 610210 + }, + { + "epoch": 1.58, + "learning_rate": 6.273326058048477e-05, + "loss": 0.0062, + "step": 610220 + }, + { + "epoch": 1.58, + "learning_rate": 6.272937236411331e-05, + "loss": 0.0096, + "step": 610230 + }, + { + "epoch": 1.58, + "learning_rate": 6.272548414774184e-05, + "loss": 0.0094, + "step": 610240 + }, + { + "epoch": 1.58, + "learning_rate": 6.272159593137038e-05, + "loss": 0.0086, + "step": 610250 + }, + { + "epoch": 1.58, + "learning_rate": 6.271770771499891e-05, + "loss": 0.0115, + "step": 610260 + }, + { + "epoch": 1.58, + "learning_rate": 6.271381949862745e-05, + "loss": 0.0091, + "step": 610270 + }, + { + "epoch": 1.58, + "learning_rate": 6.270993128225598e-05, + "loss": 0.0082, + "step": 610280 + }, + { + "epoch": 1.58, + "learning_rate": 6.270604306588452e-05, + "loss": 0.0095, + "step": 610290 + }, + { + "epoch": 1.58, + "learning_rate": 6.270215484951306e-05, + "loss": 0.0085, + "step": 610300 + }, + { + "epoch": 1.58, + "learning_rate": 6.269826663314159e-05, + "loss": 0.0124, + "step": 610310 + }, + { + "epoch": 1.58, + "learning_rate": 6.269437841677013e-05, + "loss": 0.0123, + "step": 610320 + }, + { + "epoch": 1.58, + "learning_rate": 6.269049020039866e-05, + "loss": 0.0128, + "step": 610330 + }, + { + "epoch": 1.58, + "learning_rate": 6.26866019840272e-05, + "loss": 0.0088, + "step": 610340 + }, + { + "epoch": 1.58, + "learning_rate": 6.268271376765573e-05, + "loss": 0.0073, + "step": 610350 + }, + { + "epoch": 1.58, + "learning_rate": 6.267882555128427e-05, + "loss": 0.0092, + "step": 610360 + }, + { + "epoch": 1.58, + "learning_rate": 6.26749373349128e-05, + "loss": 0.0102, + "step": 610370 + }, + { + "epoch": 1.58, + "learning_rate": 6.267104911854134e-05, + "loss": 0.0076, + "step": 610380 + }, + { + "epoch": 1.58, + "learning_rate": 6.266716090216989e-05, + "loss": 0.0093, + "step": 610390 + }, + { + "epoch": 1.58, + "learning_rate": 6.266327268579841e-05, + "loss": 0.0075, + "step": 610400 + }, + { + "epoch": 1.58, + "learning_rate": 6.265938446942696e-05, + "loss": 0.0152, + "step": 610410 + }, + { + "epoch": 1.58, + "learning_rate": 6.265549625305548e-05, + "loss": 0.009, + "step": 610420 + }, + { + "epoch": 1.58, + "learning_rate": 6.265160803668402e-05, + "loss": 0.0072, + "step": 610430 + }, + { + "epoch": 1.58, + "learning_rate": 6.264771982031255e-05, + "loss": 0.007, + "step": 610440 + }, + { + "epoch": 1.58, + "learning_rate": 6.26438316039411e-05, + "loss": 0.0064, + "step": 610450 + }, + { + "epoch": 1.58, + "learning_rate": 6.263994338756964e-05, + "loss": 0.0089, + "step": 610460 + }, + { + "epoch": 1.58, + "learning_rate": 6.263605517119815e-05, + "loss": 0.0094, + "step": 610470 + }, + { + "epoch": 1.58, + "learning_rate": 6.263216695482669e-05, + "loss": 0.0082, + "step": 610480 + }, + { + "epoch": 1.58, + "learning_rate": 6.262827873845523e-05, + "loss": 0.0086, + "step": 610490 + }, + { + "epoch": 1.58, + "learning_rate": 6.262439052208376e-05, + "loss": 0.0066, + "step": 610500 + }, + { + "epoch": 1.58, + "learning_rate": 6.26205023057123e-05, + "loss": 0.0078, + "step": 610510 + }, + { + "epoch": 1.58, + "learning_rate": 6.261661408934083e-05, + "loss": 0.0087, + "step": 610520 + }, + { + "epoch": 1.58, + "learning_rate": 6.261272587296937e-05, + "loss": 0.0086, + "step": 610530 + }, + { + "epoch": 1.58, + "learning_rate": 6.26088376565979e-05, + "loss": 0.0095, + "step": 610540 + }, + { + "epoch": 1.58, + "learning_rate": 6.260494944022644e-05, + "loss": 0.0066, + "step": 610550 + }, + { + "epoch": 1.58, + "learning_rate": 6.260106122385498e-05, + "loss": 0.0108, + "step": 610560 + }, + { + "epoch": 1.58, + "learning_rate": 6.259717300748351e-05, + "loss": 0.0086, + "step": 610570 + }, + { + "epoch": 1.58, + "learning_rate": 6.259328479111205e-05, + "loss": 0.0117, + "step": 610580 + }, + { + "epoch": 1.58, + "learning_rate": 6.258939657474058e-05, + "loss": 0.0083, + "step": 610590 + }, + { + "epoch": 1.58, + "learning_rate": 6.258550835836912e-05, + "loss": 0.0061, + "step": 610600 + }, + { + "epoch": 1.58, + "learning_rate": 6.258162014199765e-05, + "loss": 0.009, + "step": 610610 + }, + { + "epoch": 1.58, + "learning_rate": 6.25777319256262e-05, + "loss": 0.0106, + "step": 610620 + }, + { + "epoch": 1.58, + "learning_rate": 6.257384370925472e-05, + "loss": 0.0094, + "step": 610630 + }, + { + "epoch": 1.58, + "learning_rate": 6.256995549288326e-05, + "loss": 0.0073, + "step": 610640 + }, + { + "epoch": 1.58, + "learning_rate": 6.25660672765118e-05, + "loss": 0.0112, + "step": 610650 + }, + { + "epoch": 1.58, + "learning_rate": 6.256217906014033e-05, + "loss": 0.0087, + "step": 610660 + }, + { + "epoch": 1.58, + "learning_rate": 6.255829084376887e-05, + "loss": 0.0085, + "step": 610670 + }, + { + "epoch": 1.58, + "learning_rate": 6.25544026273974e-05, + "loss": 0.0092, + "step": 610680 + }, + { + "epoch": 1.58, + "learning_rate": 6.255051441102594e-05, + "loss": 0.0099, + "step": 610690 + }, + { + "epoch": 1.58, + "learning_rate": 6.254662619465447e-05, + "loss": 0.0099, + "step": 610700 + }, + { + "epoch": 1.58, + "learning_rate": 6.254273797828301e-05, + "loss": 0.0095, + "step": 610710 + }, + { + "epoch": 1.58, + "learning_rate": 6.253884976191154e-05, + "loss": 0.0078, + "step": 610720 + }, + { + "epoch": 1.58, + "learning_rate": 6.253496154554007e-05, + "loss": 0.0085, + "step": 610730 + }, + { + "epoch": 1.58, + "learning_rate": 6.253107332916861e-05, + "loss": 0.0076, + "step": 610740 + }, + { + "epoch": 1.58, + "learning_rate": 6.252718511279715e-05, + "loss": 0.0088, + "step": 610750 + }, + { + "epoch": 1.58, + "learning_rate": 6.252329689642568e-05, + "loss": 0.0074, + "step": 610760 + }, + { + "epoch": 1.58, + "learning_rate": 6.251940868005422e-05, + "loss": 0.0068, + "step": 610770 + }, + { + "epoch": 1.58, + "learning_rate": 6.251552046368275e-05, + "loss": 0.0082, + "step": 610780 + }, + { + "epoch": 1.58, + "learning_rate": 6.25116322473113e-05, + "loss": 0.0078, + "step": 610790 + }, + { + "epoch": 1.58, + "learning_rate": 6.250774403093982e-05, + "loss": 0.008, + "step": 610800 + }, + { + "epoch": 1.58, + "learning_rate": 6.250385581456836e-05, + "loss": 0.0127, + "step": 610810 + }, + { + "epoch": 1.58, + "learning_rate": 6.24999675981969e-05, + "loss": 0.009, + "step": 610820 + }, + { + "epoch": 1.58, + "learning_rate": 6.249607938182543e-05, + "loss": 0.0092, + "step": 610830 + }, + { + "epoch": 1.58, + "learning_rate": 6.249219116545397e-05, + "loss": 0.0073, + "step": 610840 + }, + { + "epoch": 1.58, + "learning_rate": 6.24883029490825e-05, + "loss": 0.0109, + "step": 610850 + }, + { + "epoch": 1.58, + "learning_rate": 6.248441473271104e-05, + "loss": 0.0071, + "step": 610860 + }, + { + "epoch": 1.58, + "learning_rate": 6.248052651633957e-05, + "loss": 0.0081, + "step": 610870 + }, + { + "epoch": 1.58, + "learning_rate": 6.247663829996811e-05, + "loss": 0.0107, + "step": 610880 + }, + { + "epoch": 1.58, + "learning_rate": 6.247275008359664e-05, + "loss": 0.0085, + "step": 610890 + }, + { + "epoch": 1.58, + "learning_rate": 6.246886186722518e-05, + "loss": 0.0065, + "step": 610900 + }, + { + "epoch": 1.58, + "learning_rate": 6.246497365085373e-05, + "loss": 0.0081, + "step": 610910 + }, + { + "epoch": 1.58, + "learning_rate": 6.246108543448225e-05, + "loss": 0.0102, + "step": 610920 + }, + { + "epoch": 1.58, + "learning_rate": 6.24571972181108e-05, + "loss": 0.0111, + "step": 610930 + }, + { + "epoch": 1.58, + "learning_rate": 6.245330900173932e-05, + "loss": 0.0108, + "step": 610940 + }, + { + "epoch": 1.58, + "learning_rate": 6.244942078536786e-05, + "loss": 0.0114, + "step": 610950 + }, + { + "epoch": 1.58, + "learning_rate": 6.244553256899639e-05, + "loss": 0.0094, + "step": 610960 + }, + { + "epoch": 1.58, + "learning_rate": 6.244164435262492e-05, + "loss": 0.0092, + "step": 610970 + }, + { + "epoch": 1.58, + "learning_rate": 6.243775613625346e-05, + "loss": 0.0064, + "step": 610980 + }, + { + "epoch": 1.58, + "learning_rate": 6.243386791988199e-05, + "loss": 0.0104, + "step": 610990 + }, + { + "epoch": 1.58, + "learning_rate": 6.242997970351053e-05, + "loss": 0.0091, + "step": 611000 + }, + { + "epoch": 1.58, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.005523571744561195, + "eval_runtime": 107.8962, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, + "step": 611000 + }, + { + "epoch": 1.58, + "learning_rate": 6.242609148713907e-05, + "loss": 0.0079, + "step": 611010 + }, + { + "epoch": 1.58, + "learning_rate": 6.24222032707676e-05, + "loss": 0.0078, + "step": 611020 + }, + { + "epoch": 1.58, + "learning_rate": 6.241831505439614e-05, + "loss": 0.0083, + "step": 611030 + }, + { + "epoch": 1.58, + "learning_rate": 6.241442683802467e-05, + "loss": 0.0077, + "step": 611040 + }, + { + "epoch": 1.58, + "learning_rate": 6.241053862165321e-05, + "loss": 0.0089, + "step": 611050 + }, + { + "epoch": 1.58, + "learning_rate": 6.240665040528174e-05, + "loss": 0.0097, + "step": 611060 + }, + { + "epoch": 1.58, + "learning_rate": 6.240276218891028e-05, + "loss": 0.0075, + "step": 611070 + }, + { + "epoch": 1.58, + "learning_rate": 6.239887397253882e-05, + "loss": 0.0077, + "step": 611080 + }, + { + "epoch": 1.58, + "learning_rate": 6.239498575616735e-05, + "loss": 0.0078, + "step": 611090 + }, + { + "epoch": 1.58, + "learning_rate": 6.23910975397959e-05, + "loss": 0.0093, + "step": 611100 + }, + { + "epoch": 1.58, + "learning_rate": 6.238720932342442e-05, + "loss": 0.0083, + "step": 611110 + }, + { + "epoch": 1.58, + "learning_rate": 6.238332110705296e-05, + "loss": 0.0104, + "step": 611120 + }, + { + "epoch": 1.58, + "learning_rate": 6.237943289068149e-05, + "loss": 0.0045, + "step": 611130 + }, + { + "epoch": 1.58, + "learning_rate": 6.237554467431003e-05, + "loss": 0.0143, + "step": 611140 + }, + { + "epoch": 1.58, + "learning_rate": 6.237165645793856e-05, + "loss": 0.0081, + "step": 611150 + }, + { + "epoch": 1.58, + "learning_rate": 6.23677682415671e-05, + "loss": 0.0083, + "step": 611160 + }, + { + "epoch": 1.58, + "learning_rate": 6.236388002519565e-05, + "loss": 0.0076, + "step": 611170 + }, + { + "epoch": 1.58, + "learning_rate": 6.235999180882417e-05, + "loss": 0.0093, + "step": 611180 + }, + { + "epoch": 1.58, + "learning_rate": 6.235610359245271e-05, + "loss": 0.008, + "step": 611190 + }, + { + "epoch": 1.58, + "learning_rate": 6.235221537608124e-05, + "loss": 0.0112, + "step": 611200 + }, + { + "epoch": 1.58, + "learning_rate": 6.234832715970978e-05, + "loss": 0.0109, + "step": 611210 + }, + { + "epoch": 1.58, + "learning_rate": 6.234443894333831e-05, + "loss": 0.0107, + "step": 611220 + }, + { + "epoch": 1.58, + "learning_rate": 6.234055072696684e-05, + "loss": 0.0097, + "step": 611230 + }, + { + "epoch": 1.58, + "learning_rate": 6.233666251059538e-05, + "loss": 0.0085, + "step": 611240 + }, + { + "epoch": 1.58, + "learning_rate": 6.233277429422391e-05, + "loss": 0.0059, + "step": 611250 + }, + { + "epoch": 1.58, + "learning_rate": 6.232888607785245e-05, + "loss": 0.0079, + "step": 611260 + }, + { + "epoch": 1.58, + "learning_rate": 6.2324997861481e-05, + "loss": 0.006, + "step": 611270 + }, + { + "epoch": 1.58, + "learning_rate": 6.232110964510952e-05, + "loss": 0.0128, + "step": 611280 + }, + { + "epoch": 1.58, + "learning_rate": 6.231722142873806e-05, + "loss": 0.0096, + "step": 611290 + }, + { + "epoch": 1.58, + "learning_rate": 6.231333321236659e-05, + "loss": 0.0078, + "step": 611300 + }, + { + "epoch": 1.58, + "learning_rate": 6.230944499599513e-05, + "loss": 0.0096, + "step": 611310 + }, + { + "epoch": 1.58, + "learning_rate": 6.230555677962366e-05, + "loss": 0.0096, + "step": 611320 + }, + { + "epoch": 1.58, + "learning_rate": 6.23016685632522e-05, + "loss": 0.0116, + "step": 611330 + }, + { + "epoch": 1.58, + "learning_rate": 6.229778034688074e-05, + "loss": 0.0077, + "step": 611340 + }, + { + "epoch": 1.58, + "learning_rate": 6.229389213050927e-05, + "loss": 0.0073, + "step": 611350 + }, + { + "epoch": 1.58, + "learning_rate": 6.229000391413781e-05, + "loss": 0.0107, + "step": 611360 + }, + { + "epoch": 1.58, + "learning_rate": 6.228611569776634e-05, + "loss": 0.0068, + "step": 611370 + }, + { + "epoch": 1.58, + "learning_rate": 6.228222748139488e-05, + "loss": 0.0069, + "step": 611380 + }, + { + "epoch": 1.58, + "learning_rate": 6.227833926502341e-05, + "loss": 0.0126, + "step": 611390 + }, + { + "epoch": 1.58, + "learning_rate": 6.227445104865195e-05, + "loss": 0.0084, + "step": 611400 + }, + { + "epoch": 1.58, + "learning_rate": 6.227056283228048e-05, + "loss": 0.0109, + "step": 611410 + }, + { + "epoch": 1.58, + "learning_rate": 6.226667461590902e-05, + "loss": 0.0094, + "step": 611420 + }, + { + "epoch": 1.58, + "learning_rate": 6.226278639953757e-05, + "loss": 0.007, + "step": 611430 + }, + { + "epoch": 1.58, + "learning_rate": 6.225889818316609e-05, + "loss": 0.0073, + "step": 611440 + }, + { + "epoch": 1.58, + "learning_rate": 6.225500996679463e-05, + "loss": 0.0074, + "step": 611450 + }, + { + "epoch": 1.58, + "learning_rate": 6.225112175042316e-05, + "loss": 0.0082, + "step": 611460 + }, + { + "epoch": 1.59, + "learning_rate": 6.224723353405169e-05, + "loss": 0.0115, + "step": 611470 + }, + { + "epoch": 1.59, + "learning_rate": 6.224334531768023e-05, + "loss": 0.0088, + "step": 611480 + }, + { + "epoch": 1.59, + "learning_rate": 6.223945710130876e-05, + "loss": 0.0082, + "step": 611490 + }, + { + "epoch": 1.59, + "learning_rate": 6.22355688849373e-05, + "loss": 0.0101, + "step": 611500 + }, + { + "epoch": 1.59, + "learning_rate": 6.223168066856583e-05, + "loss": 0.0069, + "step": 611510 + }, + { + "epoch": 1.59, + "learning_rate": 6.222779245219437e-05, + "loss": 0.0074, + "step": 611520 + }, + { + "epoch": 1.59, + "learning_rate": 6.222390423582291e-05, + "loss": 0.0074, + "step": 611530 + }, + { + "epoch": 1.59, + "learning_rate": 6.222001601945144e-05, + "loss": 0.0077, + "step": 611540 + }, + { + "epoch": 1.59, + "learning_rate": 6.221612780307998e-05, + "loss": 0.0082, + "step": 611550 + }, + { + "epoch": 1.59, + "learning_rate": 6.221223958670851e-05, + "loss": 0.0082, + "step": 611560 + }, + { + "epoch": 1.59, + "learning_rate": 6.220835137033705e-05, + "loss": 0.0081, + "step": 611570 + }, + { + "epoch": 1.59, + "learning_rate": 6.220446315396558e-05, + "loss": 0.0085, + "step": 611580 + }, + { + "epoch": 1.59, + "learning_rate": 6.220057493759412e-05, + "loss": 0.0087, + "step": 611590 + }, + { + "epoch": 1.59, + "learning_rate": 6.219668672122265e-05, + "loss": 0.009, + "step": 611600 + }, + { + "epoch": 1.59, + "learning_rate": 6.219279850485119e-05, + "loss": 0.0072, + "step": 611610 + }, + { + "epoch": 1.59, + "learning_rate": 6.218891028847973e-05, + "loss": 0.0067, + "step": 611620 + }, + { + "epoch": 1.59, + "learning_rate": 6.218502207210826e-05, + "loss": 0.0068, + "step": 611630 + }, + { + "epoch": 1.59, + "learning_rate": 6.21811338557368e-05, + "loss": 0.0115, + "step": 611640 + }, + { + "epoch": 1.59, + "learning_rate": 6.217724563936533e-05, + "loss": 0.0055, + "step": 611650 + }, + { + "epoch": 1.59, + "learning_rate": 6.217335742299387e-05, + "loss": 0.0091, + "step": 611660 + }, + { + "epoch": 1.59, + "learning_rate": 6.21694692066224e-05, + "loss": 0.0078, + "step": 611670 + }, + { + "epoch": 1.59, + "learning_rate": 6.216558099025094e-05, + "loss": 0.0076, + "step": 611680 + }, + { + "epoch": 1.59, + "learning_rate": 6.216169277387949e-05, + "loss": 0.0092, + "step": 611690 + }, + { + "epoch": 1.59, + "learning_rate": 6.215780455750801e-05, + "loss": 0.0108, + "step": 611700 + }, + { + "epoch": 1.59, + "learning_rate": 6.215391634113654e-05, + "loss": 0.0119, + "step": 611710 + }, + { + "epoch": 1.59, + "learning_rate": 6.215002812476508e-05, + "loss": 0.014, + "step": 611720 + }, + { + "epoch": 1.59, + "learning_rate": 6.214613990839361e-05, + "loss": 0.0077, + "step": 611730 + }, + { + "epoch": 1.59, + "learning_rate": 6.214225169202215e-05, + "loss": 0.0078, + "step": 611740 + }, + { + "epoch": 1.59, + "learning_rate": 6.213836347565068e-05, + "loss": 0.0082, + "step": 611750 + }, + { + "epoch": 1.59, + "learning_rate": 6.213447525927922e-05, + "loss": 0.0105, + "step": 611760 + }, + { + "epoch": 1.59, + "learning_rate": 6.213058704290775e-05, + "loss": 0.0096, + "step": 611770 + }, + { + "epoch": 1.59, + "learning_rate": 6.212669882653629e-05, + "loss": 0.0079, + "step": 611780 + }, + { + "epoch": 1.59, + "learning_rate": 6.212281061016483e-05, + "loss": 0.0074, + "step": 611790 + }, + { + "epoch": 1.59, + "learning_rate": 6.211892239379336e-05, + "loss": 0.0082, + "step": 611800 + }, + { + "epoch": 1.59, + "learning_rate": 6.21150341774219e-05, + "loss": 0.0099, + "step": 611810 + }, + { + "epoch": 1.59, + "learning_rate": 6.211114596105043e-05, + "loss": 0.0073, + "step": 611820 + }, + { + "epoch": 1.59, + "learning_rate": 6.210725774467897e-05, + "loss": 0.008, + "step": 611830 + }, + { + "epoch": 1.59, + "learning_rate": 6.21033695283075e-05, + "loss": 0.0094, + "step": 611840 + }, + { + "epoch": 1.59, + "learning_rate": 6.209948131193604e-05, + "loss": 0.0084, + "step": 611850 + }, + { + "epoch": 1.59, + "learning_rate": 6.209559309556457e-05, + "loss": 0.008, + "step": 611860 + }, + { + "epoch": 1.59, + "learning_rate": 6.209170487919311e-05, + "loss": 0.0094, + "step": 611870 + }, + { + "epoch": 1.59, + "learning_rate": 6.208781666282165e-05, + "loss": 0.0101, + "step": 611880 + }, + { + "epoch": 1.59, + "learning_rate": 6.208392844645018e-05, + "loss": 0.0052, + "step": 611890 + }, + { + "epoch": 1.59, + "learning_rate": 6.208004023007872e-05, + "loss": 0.0068, + "step": 611900 + }, + { + "epoch": 1.59, + "learning_rate": 6.207615201370725e-05, + "loss": 0.0136, + "step": 611910 + }, + { + "epoch": 1.59, + "learning_rate": 6.20722637973358e-05, + "loss": 0.0086, + "step": 611920 + }, + { + "epoch": 1.59, + "learning_rate": 6.206837558096432e-05, + "loss": 0.0099, + "step": 611930 + }, + { + "epoch": 1.59, + "learning_rate": 6.206448736459286e-05, + "loss": 0.0076, + "step": 611940 + }, + { + "epoch": 1.59, + "learning_rate": 6.20605991482214e-05, + "loss": 0.0138, + "step": 611950 + }, + { + "epoch": 1.59, + "learning_rate": 6.205671093184992e-05, + "loss": 0.0099, + "step": 611960 + }, + { + "epoch": 1.59, + "learning_rate": 6.205282271547846e-05, + "loss": 0.0095, + "step": 611970 + }, + { + "epoch": 1.59, + "learning_rate": 6.2048934499107e-05, + "loss": 0.0111, + "step": 611980 + }, + { + "epoch": 1.59, + "learning_rate": 6.204504628273553e-05, + "loss": 0.0091, + "step": 611990 + }, + { + "epoch": 1.59, + "learning_rate": 6.204115806636407e-05, + "loss": 0.0058, + "step": 612000 + }, + { + "epoch": 1.59, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.005586665123701096, + "eval_runtime": 107.9859, + "eval_samples_per_second": 18.521, + "eval_steps_per_second": 4.63, + "step": 612000 + }, + { + "epoch": 1.59, + "learning_rate": 6.20372698499926e-05, + "loss": 0.0136, + "step": 612010 + }, + { + "epoch": 1.59, + "learning_rate": 6.203338163362114e-05, + "loss": 0.0122, + "step": 612020 + }, + { + "epoch": 1.59, + "learning_rate": 6.202949341724967e-05, + "loss": 0.0098, + "step": 612030 + }, + { + "epoch": 1.59, + "learning_rate": 6.202560520087821e-05, + "loss": 0.0118, + "step": 612040 + }, + { + "epoch": 1.59, + "learning_rate": 6.202171698450675e-05, + "loss": 0.0087, + "step": 612050 + }, + { + "epoch": 1.59, + "learning_rate": 6.201782876813528e-05, + "loss": 0.0096, + "step": 612060 + }, + { + "epoch": 1.59, + "learning_rate": 6.201394055176382e-05, + "loss": 0.0073, + "step": 612070 + }, + { + "epoch": 1.59, + "learning_rate": 6.201005233539235e-05, + "loss": 0.0076, + "step": 612080 + }, + { + "epoch": 1.59, + "learning_rate": 6.200616411902089e-05, + "loss": 0.0095, + "step": 612090 + }, + { + "epoch": 1.59, + "learning_rate": 6.200227590264942e-05, + "loss": 0.0048, + "step": 612100 + }, + { + "epoch": 1.59, + "learning_rate": 6.199838768627796e-05, + "loss": 0.0101, + "step": 612110 + }, + { + "epoch": 1.59, + "learning_rate": 6.199449946990649e-05, + "loss": 0.0068, + "step": 612120 + }, + { + "epoch": 1.59, + "learning_rate": 6.199061125353503e-05, + "loss": 0.0105, + "step": 612130 + }, + { + "epoch": 1.59, + "learning_rate": 6.198672303716357e-05, + "loss": 0.0054, + "step": 612140 + }, + { + "epoch": 1.59, + "learning_rate": 6.19828348207921e-05, + "loss": 0.0082, + "step": 612150 + }, + { + "epoch": 1.59, + "learning_rate": 6.197894660442064e-05, + "loss": 0.0099, + "step": 612160 + }, + { + "epoch": 1.59, + "learning_rate": 6.197505838804917e-05, + "loss": 0.0066, + "step": 612170 + }, + { + "epoch": 1.59, + "learning_rate": 6.197117017167771e-05, + "loss": 0.0073, + "step": 612180 + }, + { + "epoch": 1.59, + "learning_rate": 6.196728195530624e-05, + "loss": 0.0098, + "step": 612190 + }, + { + "epoch": 1.59, + "learning_rate": 6.196339373893478e-05, + "loss": 0.0091, + "step": 612200 + }, + { + "epoch": 1.59, + "learning_rate": 6.195950552256331e-05, + "loss": 0.0114, + "step": 612210 + }, + { + "epoch": 1.59, + "learning_rate": 6.195561730619184e-05, + "loss": 0.0092, + "step": 612220 + }, + { + "epoch": 1.59, + "learning_rate": 6.195172908982038e-05, + "loss": 0.0078, + "step": 612230 + }, + { + "epoch": 1.59, + "learning_rate": 6.194784087344892e-05, + "loss": 0.0098, + "step": 612240 + }, + { + "epoch": 1.59, + "learning_rate": 6.194395265707745e-05, + "loss": 0.0085, + "step": 612250 + }, + { + "epoch": 1.59, + "learning_rate": 6.194006444070599e-05, + "loss": 0.0072, + "step": 612260 + }, + { + "epoch": 1.59, + "learning_rate": 6.193617622433452e-05, + "loss": 0.0096, + "step": 612270 + }, + { + "epoch": 1.59, + "learning_rate": 6.193228800796306e-05, + "loss": 0.0098, + "step": 612280 + }, + { + "epoch": 1.59, + "learning_rate": 6.192839979159159e-05, + "loss": 0.0094, + "step": 612290 + }, + { + "epoch": 1.59, + "learning_rate": 6.192451157522013e-05, + "loss": 0.0096, + "step": 612300 + }, + { + "epoch": 1.59, + "learning_rate": 6.192062335884867e-05, + "loss": 0.0078, + "step": 612310 + }, + { + "epoch": 1.59, + "learning_rate": 6.19167351424772e-05, + "loss": 0.0105, + "step": 612320 + }, + { + "epoch": 1.59, + "learning_rate": 6.191284692610574e-05, + "loss": 0.0084, + "step": 612330 + }, + { + "epoch": 1.59, + "learning_rate": 6.190895870973427e-05, + "loss": 0.008, + "step": 612340 + }, + { + "epoch": 1.59, + "learning_rate": 6.190507049336281e-05, + "loss": 0.0098, + "step": 612350 + }, + { + "epoch": 1.59, + "learning_rate": 6.190118227699134e-05, + "loss": 0.0088, + "step": 612360 + }, + { + "epoch": 1.59, + "learning_rate": 6.189729406061988e-05, + "loss": 0.0072, + "step": 612370 + }, + { + "epoch": 1.59, + "learning_rate": 6.189340584424841e-05, + "loss": 0.0077, + "step": 612380 + }, + { + "epoch": 1.59, + "learning_rate": 6.188951762787695e-05, + "loss": 0.0069, + "step": 612390 + }, + { + "epoch": 1.59, + "learning_rate": 6.18856294115055e-05, + "loss": 0.0092, + "step": 612400 + }, + { + "epoch": 1.59, + "learning_rate": 6.188174119513402e-05, + "loss": 0.0088, + "step": 612410 + }, + { + "epoch": 1.59, + "learning_rate": 6.187785297876256e-05, + "loss": 0.0103, + "step": 612420 + }, + { + "epoch": 1.59, + "learning_rate": 6.187396476239109e-05, + "loss": 0.0075, + "step": 612430 + }, + { + "epoch": 1.59, + "learning_rate": 6.187007654601963e-05, + "loss": 0.0085, + "step": 612440 + }, + { + "epoch": 1.59, + "learning_rate": 6.186618832964816e-05, + "loss": 0.006, + "step": 612450 + }, + { + "epoch": 1.59, + "learning_rate": 6.186230011327669e-05, + "loss": 0.0086, + "step": 612460 + }, + { + "epoch": 1.59, + "learning_rate": 6.185841189690523e-05, + "loss": 0.0096, + "step": 612470 + }, + { + "epoch": 1.59, + "learning_rate": 6.185452368053376e-05, + "loss": 0.0077, + "step": 612480 + }, + { + "epoch": 1.59, + "learning_rate": 6.18506354641623e-05, + "loss": 0.009, + "step": 612490 + }, + { + "epoch": 1.59, + "learning_rate": 6.184674724779084e-05, + "loss": 0.012, + "step": 612500 + }, + { + "epoch": 1.59, + "learning_rate": 6.184285903141937e-05, + "loss": 0.0099, + "step": 612510 + }, + { + "epoch": 1.59, + "learning_rate": 6.183897081504791e-05, + "loss": 0.0106, + "step": 612520 + }, + { + "epoch": 1.59, + "learning_rate": 6.183508259867644e-05, + "loss": 0.009, + "step": 612530 + }, + { + "epoch": 1.59, + "learning_rate": 6.183119438230498e-05, + "loss": 0.0086, + "step": 612540 + }, + { + "epoch": 1.59, + "learning_rate": 6.182730616593351e-05, + "loss": 0.0094, + "step": 612550 + }, + { + "epoch": 1.59, + "learning_rate": 6.182341794956205e-05, + "loss": 0.0087, + "step": 612560 + }, + { + "epoch": 1.59, + "learning_rate": 6.18195297331906e-05, + "loss": 0.0058, + "step": 612570 + }, + { + "epoch": 1.59, + "learning_rate": 6.181564151681912e-05, + "loss": 0.0101, + "step": 612580 + }, + { + "epoch": 1.59, + "learning_rate": 6.181175330044766e-05, + "loss": 0.0099, + "step": 612590 + }, + { + "epoch": 1.59, + "learning_rate": 6.180786508407619e-05, + "loss": 0.0074, + "step": 612600 + }, + { + "epoch": 1.59, + "learning_rate": 6.180397686770473e-05, + "loss": 0.0088, + "step": 612610 + }, + { + "epoch": 1.59, + "learning_rate": 6.180008865133326e-05, + "loss": 0.0061, + "step": 612620 + }, + { + "epoch": 1.59, + "learning_rate": 6.17962004349618e-05, + "loss": 0.0073, + "step": 612630 + }, + { + "epoch": 1.59, + "learning_rate": 6.179231221859033e-05, + "loss": 0.007, + "step": 612640 + }, + { + "epoch": 1.59, + "learning_rate": 6.178842400221887e-05, + "loss": 0.008, + "step": 612650 + }, + { + "epoch": 1.59, + "learning_rate": 6.178453578584741e-05, + "loss": 0.0075, + "step": 612660 + }, + { + "epoch": 1.59, + "learning_rate": 6.178064756947594e-05, + "loss": 0.0088, + "step": 612670 + }, + { + "epoch": 1.59, + "learning_rate": 6.177675935310448e-05, + "loss": 0.0093, + "step": 612680 + }, + { + "epoch": 1.59, + "learning_rate": 6.177287113673301e-05, + "loss": 0.0071, + "step": 612690 + }, + { + "epoch": 1.59, + "learning_rate": 6.176898292036154e-05, + "loss": 0.0088, + "step": 612700 + }, + { + "epoch": 1.59, + "learning_rate": 6.176509470399008e-05, + "loss": 0.012, + "step": 612710 + }, + { + "epoch": 1.59, + "learning_rate": 6.176120648761861e-05, + "loss": 0.0116, + "step": 612720 + }, + { + "epoch": 1.59, + "learning_rate": 6.175731827124715e-05, + "loss": 0.0076, + "step": 612730 + }, + { + "epoch": 1.59, + "learning_rate": 6.175343005487568e-05, + "loss": 0.0057, + "step": 612740 + }, + { + "epoch": 1.59, + "learning_rate": 6.174954183850422e-05, + "loss": 0.0081, + "step": 612750 + }, + { + "epoch": 1.59, + "learning_rate": 6.174565362213276e-05, + "loss": 0.0091, + "step": 612760 + }, + { + "epoch": 1.59, + "learning_rate": 6.174176540576129e-05, + "loss": 0.008, + "step": 612770 + }, + { + "epoch": 1.59, + "learning_rate": 6.173787718938983e-05, + "loss": 0.014, + "step": 612780 + }, + { + "epoch": 1.59, + "learning_rate": 6.173398897301836e-05, + "loss": 0.0104, + "step": 612790 + }, + { + "epoch": 1.59, + "learning_rate": 6.17301007566469e-05, + "loss": 0.0062, + "step": 612800 + }, + { + "epoch": 1.59, + "learning_rate": 6.172621254027543e-05, + "loss": 0.0081, + "step": 612810 + }, + { + "epoch": 1.59, + "learning_rate": 6.172232432390397e-05, + "loss": 0.0105, + "step": 612820 + }, + { + "epoch": 1.59, + "learning_rate": 6.171843610753251e-05, + "loss": 0.0088, + "step": 612830 + }, + { + "epoch": 1.59, + "learning_rate": 6.171454789116104e-05, + "loss": 0.0114, + "step": 612840 + }, + { + "epoch": 1.59, + "learning_rate": 6.171065967478958e-05, + "loss": 0.0074, + "step": 612850 + }, + { + "epoch": 1.59, + "learning_rate": 6.170677145841811e-05, + "loss": 0.0075, + "step": 612860 + }, + { + "epoch": 1.59, + "learning_rate": 6.170288324204665e-05, + "loss": 0.0071, + "step": 612870 + }, + { + "epoch": 1.59, + "learning_rate": 6.169899502567518e-05, + "loss": 0.0063, + "step": 612880 + }, + { + "epoch": 1.59, + "learning_rate": 6.169510680930372e-05, + "loss": 0.0077, + "step": 612890 + }, + { + "epoch": 1.59, + "learning_rate": 6.169121859293225e-05, + "loss": 0.008, + "step": 612900 + }, + { + "epoch": 1.59, + "learning_rate": 6.168733037656079e-05, + "loss": 0.0101, + "step": 612910 + }, + { + "epoch": 1.59, + "learning_rate": 6.168344216018933e-05, + "loss": 0.0094, + "step": 612920 + }, + { + "epoch": 1.59, + "learning_rate": 6.167955394381786e-05, + "loss": 0.009, + "step": 612930 + }, + { + "epoch": 1.59, + "learning_rate": 6.16756657274464e-05, + "loss": 0.0103, + "step": 612940 + }, + { + "epoch": 1.59, + "learning_rate": 6.167177751107493e-05, + "loss": 0.0084, + "step": 612950 + }, + { + "epoch": 1.59, + "learning_rate": 6.166788929470346e-05, + "loss": 0.01, + "step": 612960 + }, + { + "epoch": 1.59, + "learning_rate": 6.1664001078332e-05, + "loss": 0.0084, + "step": 612970 + }, + { + "epoch": 1.59, + "learning_rate": 6.166011286196053e-05, + "loss": 0.012, + "step": 612980 + }, + { + "epoch": 1.59, + "learning_rate": 6.165622464558907e-05, + "loss": 0.007, + "step": 612990 + }, + { + "epoch": 1.59, + "learning_rate": 6.16523364292176e-05, + "loss": 0.007, + "step": 613000 + }, + { + "epoch": 1.59, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.005634871311485767, + "eval_runtime": 107.6649, + "eval_samples_per_second": 18.576, + "eval_steps_per_second": 4.644, + "step": 613000 + }, + { + "epoch": 1.59, + "learning_rate": 6.164844821284614e-05, + "loss": 0.0105, + "step": 613010 + }, + { + "epoch": 1.59, + "learning_rate": 6.164455999647468e-05, + "loss": 0.009, + "step": 613020 + }, + { + "epoch": 1.59, + "learning_rate": 6.164067178010321e-05, + "loss": 0.0083, + "step": 613030 + }, + { + "epoch": 1.59, + "learning_rate": 6.163678356373175e-05, + "loss": 0.011, + "step": 613040 + }, + { + "epoch": 1.59, + "learning_rate": 6.163289534736028e-05, + "loss": 0.0064, + "step": 613050 + }, + { + "epoch": 1.59, + "learning_rate": 6.162900713098882e-05, + "loss": 0.0091, + "step": 613060 + }, + { + "epoch": 1.59, + "learning_rate": 6.162511891461735e-05, + "loss": 0.0101, + "step": 613070 + }, + { + "epoch": 1.59, + "learning_rate": 6.162123069824589e-05, + "loss": 0.009, + "step": 613080 + }, + { + "epoch": 1.59, + "learning_rate": 6.161734248187442e-05, + "loss": 0.0073, + "step": 613090 + }, + { + "epoch": 1.59, + "learning_rate": 6.161345426550296e-05, + "loss": 0.008, + "step": 613100 + }, + { + "epoch": 1.59, + "learning_rate": 6.16095660491315e-05, + "loss": 0.0082, + "step": 613110 + }, + { + "epoch": 1.59, + "learning_rate": 6.160567783276003e-05, + "loss": 0.0091, + "step": 613120 + }, + { + "epoch": 1.59, + "learning_rate": 6.160178961638857e-05, + "loss": 0.0062, + "step": 613130 + }, + { + "epoch": 1.59, + "learning_rate": 6.15979014000171e-05, + "loss": 0.0068, + "step": 613140 + }, + { + "epoch": 1.59, + "learning_rate": 6.159401318364564e-05, + "loss": 0.0103, + "step": 613150 + }, + { + "epoch": 1.59, + "learning_rate": 6.159012496727417e-05, + "loss": 0.0078, + "step": 613160 + }, + { + "epoch": 1.59, + "learning_rate": 6.158623675090271e-05, + "loss": 0.0053, + "step": 613170 + }, + { + "epoch": 1.59, + "learning_rate": 6.158234853453125e-05, + "loss": 0.0098, + "step": 613180 + }, + { + "epoch": 1.59, + "learning_rate": 6.157846031815978e-05, + "loss": 0.0104, + "step": 613190 + }, + { + "epoch": 1.59, + "learning_rate": 6.157457210178831e-05, + "loss": 0.0099, + "step": 613200 + }, + { + "epoch": 1.59, + "learning_rate": 6.157068388541685e-05, + "loss": 0.0092, + "step": 613210 + }, + { + "epoch": 1.59, + "learning_rate": 6.156679566904538e-05, + "loss": 0.0081, + "step": 613220 + }, + { + "epoch": 1.59, + "learning_rate": 6.156290745267392e-05, + "loss": 0.0067, + "step": 613230 + }, + { + "epoch": 1.59, + "learning_rate": 6.155901923630245e-05, + "loss": 0.0151, + "step": 613240 + }, + { + "epoch": 1.59, + "learning_rate": 6.155513101993099e-05, + "loss": 0.011, + "step": 613250 + }, + { + "epoch": 1.59, + "learning_rate": 6.155124280355952e-05, + "loss": 0.0072, + "step": 613260 + }, + { + "epoch": 1.59, + "learning_rate": 6.154735458718806e-05, + "loss": 0.0106, + "step": 613270 + }, + { + "epoch": 1.59, + "learning_rate": 6.15434663708166e-05, + "loss": 0.0071, + "step": 613280 + }, + { + "epoch": 1.59, + "learning_rate": 6.153957815444513e-05, + "loss": 0.0106, + "step": 613290 + }, + { + "epoch": 1.59, + "learning_rate": 6.153568993807367e-05, + "loss": 0.0097, + "step": 613300 + }, + { + "epoch": 1.59, + "learning_rate": 6.15318017217022e-05, + "loss": 0.0076, + "step": 613310 + }, + { + "epoch": 1.59, + "learning_rate": 6.152791350533074e-05, + "loss": 0.0089, + "step": 613320 + }, + { + "epoch": 1.59, + "learning_rate": 6.152402528895927e-05, + "loss": 0.0075, + "step": 613330 + }, + { + "epoch": 1.59, + "learning_rate": 6.152013707258781e-05, + "loss": 0.0086, + "step": 613340 + }, + { + "epoch": 1.59, + "learning_rate": 6.151624885621634e-05, + "loss": 0.009, + "step": 613350 + }, + { + "epoch": 1.59, + "learning_rate": 6.151236063984488e-05, + "loss": 0.0087, + "step": 613360 + }, + { + "epoch": 1.59, + "learning_rate": 6.150847242347342e-05, + "loss": 0.0066, + "step": 613370 + }, + { + "epoch": 1.59, + "learning_rate": 6.150458420710195e-05, + "loss": 0.0069, + "step": 613380 + }, + { + "epoch": 1.59, + "learning_rate": 6.150069599073049e-05, + "loss": 0.009, + "step": 613390 + }, + { + "epoch": 1.59, + "learning_rate": 6.149680777435902e-05, + "loss": 0.0073, + "step": 613400 + }, + { + "epoch": 1.59, + "learning_rate": 6.149291955798756e-05, + "loss": 0.0087, + "step": 613410 + }, + { + "epoch": 1.59, + "learning_rate": 6.148903134161609e-05, + "loss": 0.0078, + "step": 613420 + }, + { + "epoch": 1.59, + "learning_rate": 6.148514312524463e-05, + "loss": 0.0061, + "step": 613430 + }, + { + "epoch": 1.59, + "learning_rate": 6.148125490887317e-05, + "loss": 0.0083, + "step": 613440 + }, + { + "epoch": 1.59, + "learning_rate": 6.147736669250169e-05, + "loss": 0.0068, + "step": 613450 + }, + { + "epoch": 1.59, + "learning_rate": 6.147347847613023e-05, + "loss": 0.009, + "step": 613460 + }, + { + "epoch": 1.59, + "learning_rate": 6.146959025975877e-05, + "loss": 0.007, + "step": 613470 + }, + { + "epoch": 1.59, + "learning_rate": 6.14657020433873e-05, + "loss": 0.0053, + "step": 613480 + }, + { + "epoch": 1.59, + "learning_rate": 6.146181382701584e-05, + "loss": 0.0077, + "step": 613490 + }, + { + "epoch": 1.59, + "learning_rate": 6.145792561064437e-05, + "loss": 0.0061, + "step": 613500 + }, + { + "epoch": 1.59, + "learning_rate": 6.145403739427291e-05, + "loss": 0.0091, + "step": 613510 + }, + { + "epoch": 1.59, + "learning_rate": 6.145014917790144e-05, + "loss": 0.0097, + "step": 613520 + }, + { + "epoch": 1.59, + "learning_rate": 6.144626096152998e-05, + "loss": 0.009, + "step": 613530 + }, + { + "epoch": 1.59, + "learning_rate": 6.144237274515852e-05, + "loss": 0.0067, + "step": 613540 + }, + { + "epoch": 1.59, + "learning_rate": 6.143848452878705e-05, + "loss": 0.0084, + "step": 613550 + }, + { + "epoch": 1.59, + "learning_rate": 6.143459631241559e-05, + "loss": 0.0114, + "step": 613560 + }, + { + "epoch": 1.59, + "learning_rate": 6.143070809604412e-05, + "loss": 0.0098, + "step": 613570 + }, + { + "epoch": 1.59, + "learning_rate": 6.142681987967266e-05, + "loss": 0.0088, + "step": 613580 + }, + { + "epoch": 1.59, + "learning_rate": 6.142293166330119e-05, + "loss": 0.0093, + "step": 613590 + }, + { + "epoch": 1.59, + "learning_rate": 6.141904344692973e-05, + "loss": 0.0065, + "step": 613600 + }, + { + "epoch": 1.59, + "learning_rate": 6.141515523055826e-05, + "loss": 0.0072, + "step": 613610 + }, + { + "epoch": 1.59, + "learning_rate": 6.14112670141868e-05, + "loss": 0.0084, + "step": 613620 + }, + { + "epoch": 1.59, + "learning_rate": 6.140737879781534e-05, + "loss": 0.0122, + "step": 613630 + }, + { + "epoch": 1.59, + "learning_rate": 6.140349058144387e-05, + "loss": 0.0079, + "step": 613640 + }, + { + "epoch": 1.59, + "learning_rate": 6.139960236507241e-05, + "loss": 0.0081, + "step": 613650 + }, + { + "epoch": 1.59, + "learning_rate": 6.139571414870094e-05, + "loss": 0.0095, + "step": 613660 + }, + { + "epoch": 1.59, + "learning_rate": 6.139182593232948e-05, + "loss": 0.009, + "step": 613670 + }, + { + "epoch": 1.59, + "learning_rate": 6.138793771595801e-05, + "loss": 0.008, + "step": 613680 + }, + { + "epoch": 1.59, + "learning_rate": 6.138404949958655e-05, + "loss": 0.009, + "step": 613690 + }, + { + "epoch": 1.59, + "learning_rate": 6.138016128321508e-05, + "loss": 0.0077, + "step": 613700 + }, + { + "epoch": 1.59, + "learning_rate": 6.137627306684361e-05, + "loss": 0.0079, + "step": 613710 + }, + { + "epoch": 1.59, + "learning_rate": 6.137238485047215e-05, + "loss": 0.006, + "step": 613720 + }, + { + "epoch": 1.59, + "learning_rate": 6.136849663410069e-05, + "loss": 0.0101, + "step": 613730 + }, + { + "epoch": 1.59, + "learning_rate": 6.136460841772922e-05, + "loss": 0.0102, + "step": 613740 + }, + { + "epoch": 1.59, + "learning_rate": 6.136072020135776e-05, + "loss": 0.0083, + "step": 613750 + }, + { + "epoch": 1.59, + "learning_rate": 6.135683198498629e-05, + "loss": 0.0115, + "step": 613760 + }, + { + "epoch": 1.59, + "learning_rate": 6.135294376861483e-05, + "loss": 0.0085, + "step": 613770 + }, + { + "epoch": 1.59, + "learning_rate": 6.134905555224336e-05, + "loss": 0.0094, + "step": 613780 + }, + { + "epoch": 1.59, + "learning_rate": 6.13451673358719e-05, + "loss": 0.0071, + "step": 613790 + }, + { + "epoch": 1.59, + "learning_rate": 6.134127911950044e-05, + "loss": 0.0083, + "step": 613800 + }, + { + "epoch": 1.59, + "learning_rate": 6.133739090312897e-05, + "loss": 0.0094, + "step": 613810 + }, + { + "epoch": 1.59, + "learning_rate": 6.133350268675751e-05, + "loss": 0.0086, + "step": 613820 + }, + { + "epoch": 1.59, + "learning_rate": 6.132961447038604e-05, + "loss": 0.0086, + "step": 613830 + }, + { + "epoch": 1.59, + "learning_rate": 6.132572625401458e-05, + "loss": 0.0083, + "step": 613840 + }, + { + "epoch": 1.59, + "learning_rate": 6.132183803764311e-05, + "loss": 0.0097, + "step": 613850 + }, + { + "epoch": 1.59, + "learning_rate": 6.131794982127165e-05, + "loss": 0.0088, + "step": 613860 + }, + { + "epoch": 1.59, + "learning_rate": 6.131406160490018e-05, + "loss": 0.0074, + "step": 613870 + }, + { + "epoch": 1.59, + "learning_rate": 6.131017338852872e-05, + "loss": 0.0073, + "step": 613880 + }, + { + "epoch": 1.59, + "learning_rate": 6.130628517215726e-05, + "loss": 0.009, + "step": 613890 + }, + { + "epoch": 1.59, + "learning_rate": 6.130239695578579e-05, + "loss": 0.0102, + "step": 613900 + }, + { + "epoch": 1.59, + "learning_rate": 6.129850873941433e-05, + "loss": 0.009, + "step": 613910 + }, + { + "epoch": 1.59, + "learning_rate": 6.129462052304286e-05, + "loss": 0.0085, + "step": 613920 + }, + { + "epoch": 1.59, + "learning_rate": 6.12907323066714e-05, + "loss": 0.0079, + "step": 613930 + }, + { + "epoch": 1.59, + "learning_rate": 6.128684409029993e-05, + "loss": 0.0121, + "step": 613940 + }, + { + "epoch": 1.59, + "learning_rate": 6.128295587392846e-05, + "loss": 0.0083, + "step": 613950 + }, + { + "epoch": 1.59, + "learning_rate": 6.1279067657557e-05, + "loss": 0.0103, + "step": 613960 + }, + { + "epoch": 1.59, + "learning_rate": 6.127517944118553e-05, + "loss": 0.0076, + "step": 613970 + }, + { + "epoch": 1.59, + "learning_rate": 6.127129122481407e-05, + "loss": 0.0086, + "step": 613980 + }, + { + "epoch": 1.59, + "learning_rate": 6.126740300844261e-05, + "loss": 0.0134, + "step": 613990 + }, + { + "epoch": 1.59, + "learning_rate": 6.126351479207114e-05, + "loss": 0.0076, + "step": 614000 + }, + { + "epoch": 1.59, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.005931103602051735, + "eval_runtime": 107.8086, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, + "step": 614000 + }, + { + "epoch": 1.59, + "learning_rate": 6.125962657569968e-05, + "loss": 0.0103, + "step": 614010 + }, + { + "epoch": 1.59, + "learning_rate": 6.125573835932821e-05, + "loss": 0.0106, + "step": 614020 + }, + { + "epoch": 1.59, + "learning_rate": 6.125185014295675e-05, + "loss": 0.0114, + "step": 614030 + }, + { + "epoch": 1.59, + "learning_rate": 6.124796192658528e-05, + "loss": 0.0078, + "step": 614040 + }, + { + "epoch": 1.59, + "learning_rate": 6.124407371021382e-05, + "loss": 0.0077, + "step": 614050 + }, + { + "epoch": 1.59, + "learning_rate": 6.124018549384236e-05, + "loss": 0.0098, + "step": 614060 + }, + { + "epoch": 1.59, + "learning_rate": 6.123629727747089e-05, + "loss": 0.0072, + "step": 614070 + }, + { + "epoch": 1.59, + "learning_rate": 6.123240906109943e-05, + "loss": 0.0098, + "step": 614080 + }, + { + "epoch": 1.59, + "learning_rate": 6.122852084472796e-05, + "loss": 0.0097, + "step": 614090 + }, + { + "epoch": 1.59, + "learning_rate": 6.12246326283565e-05, + "loss": 0.0079, + "step": 614100 + }, + { + "epoch": 1.59, + "learning_rate": 6.122074441198503e-05, + "loss": 0.0093, + "step": 614110 + }, + { + "epoch": 1.59, + "learning_rate": 6.121685619561357e-05, + "loss": 0.0078, + "step": 614120 + }, + { + "epoch": 1.59, + "learning_rate": 6.12129679792421e-05, + "loss": 0.0077, + "step": 614130 + }, + { + "epoch": 1.59, + "learning_rate": 6.120907976287064e-05, + "loss": 0.0096, + "step": 614140 + }, + { + "epoch": 1.59, + "learning_rate": 6.120519154649918e-05, + "loss": 0.0106, + "step": 614150 + }, + { + "epoch": 1.59, + "learning_rate": 6.120130333012771e-05, + "loss": 0.0078, + "step": 614160 + }, + { + "epoch": 1.59, + "learning_rate": 6.119741511375625e-05, + "loss": 0.0093, + "step": 614170 + }, + { + "epoch": 1.59, + "learning_rate": 6.119352689738478e-05, + "loss": 0.0077, + "step": 614180 + }, + { + "epoch": 1.59, + "learning_rate": 6.118963868101331e-05, + "loss": 0.0069, + "step": 614190 + }, + { + "epoch": 1.59, + "learning_rate": 6.118575046464185e-05, + "loss": 0.0099, + "step": 614200 + }, + { + "epoch": 1.59, + "learning_rate": 6.118186224827038e-05, + "loss": 0.0117, + "step": 614210 + }, + { + "epoch": 1.59, + "learning_rate": 6.117797403189892e-05, + "loss": 0.0098, + "step": 614220 + }, + { + "epoch": 1.59, + "learning_rate": 6.117408581552745e-05, + "loss": 0.0094, + "step": 614230 + }, + { + "epoch": 1.59, + "learning_rate": 6.117019759915599e-05, + "loss": 0.0108, + "step": 614240 + }, + { + "epoch": 1.59, + "learning_rate": 6.116630938278453e-05, + "loss": 0.0068, + "step": 614250 + }, + { + "epoch": 1.59, + "learning_rate": 6.116242116641306e-05, + "loss": 0.0085, + "step": 614260 + }, + { + "epoch": 1.59, + "learning_rate": 6.11585329500416e-05, + "loss": 0.0095, + "step": 614270 + }, + { + "epoch": 1.59, + "learning_rate": 6.115464473367013e-05, + "loss": 0.0077, + "step": 614280 + }, + { + "epoch": 1.59, + "learning_rate": 6.115075651729867e-05, + "loss": 0.0062, + "step": 614290 + }, + { + "epoch": 1.59, + "learning_rate": 6.11468683009272e-05, + "loss": 0.0064, + "step": 614300 + }, + { + "epoch": 1.59, + "learning_rate": 6.114298008455574e-05, + "loss": 0.0068, + "step": 614310 + }, + { + "epoch": 1.59, + "learning_rate": 6.113909186818428e-05, + "loss": 0.0117, + "step": 614320 + }, + { + "epoch": 1.59, + "learning_rate": 6.113520365181281e-05, + "loss": 0.0107, + "step": 614330 + }, + { + "epoch": 1.59, + "learning_rate": 6.113131543544135e-05, + "loss": 0.0084, + "step": 614340 + }, + { + "epoch": 1.59, + "learning_rate": 6.112742721906988e-05, + "loss": 0.0123, + "step": 614350 + }, + { + "epoch": 1.59, + "learning_rate": 6.112353900269842e-05, + "loss": 0.0085, + "step": 614360 + }, + { + "epoch": 1.59, + "learning_rate": 6.111965078632695e-05, + "loss": 0.0066, + "step": 614370 + }, + { + "epoch": 1.59, + "learning_rate": 6.111576256995549e-05, + "loss": 0.0102, + "step": 614380 + }, + { + "epoch": 1.59, + "learning_rate": 6.111187435358402e-05, + "loss": 0.0122, + "step": 614390 + }, + { + "epoch": 1.59, + "learning_rate": 6.110798613721256e-05, + "loss": 0.0078, + "step": 614400 + }, + { + "epoch": 1.59, + "learning_rate": 6.11040979208411e-05, + "loss": 0.0114, + "step": 614410 + }, + { + "epoch": 1.59, + "learning_rate": 6.110020970446963e-05, + "loss": 0.0114, + "step": 614420 + }, + { + "epoch": 1.59, + "learning_rate": 6.109632148809817e-05, + "loss": 0.008, + "step": 614430 + }, + { + "epoch": 1.59, + "learning_rate": 6.10924332717267e-05, + "loss": 0.0075, + "step": 614440 + }, + { + "epoch": 1.59, + "learning_rate": 6.108854505535523e-05, + "loss": 0.0079, + "step": 614450 + }, + { + "epoch": 1.59, + "learning_rate": 6.108465683898377e-05, + "loss": 0.0096, + "step": 614460 + }, + { + "epoch": 1.59, + "learning_rate": 6.10807686226123e-05, + "loss": 0.0088, + "step": 614470 + }, + { + "epoch": 1.59, + "learning_rate": 6.107688040624084e-05, + "loss": 0.0077, + "step": 614480 + }, + { + "epoch": 1.59, + "learning_rate": 6.107299218986937e-05, + "loss": 0.0087, + "step": 614490 + }, + { + "epoch": 1.59, + "learning_rate": 6.106910397349791e-05, + "loss": 0.0086, + "step": 614500 + }, + { + "epoch": 1.59, + "learning_rate": 6.106521575712645e-05, + "loss": 0.0063, + "step": 614510 + }, + { + "epoch": 1.59, + "learning_rate": 6.106132754075498e-05, + "loss": 0.0071, + "step": 614520 + }, + { + "epoch": 1.59, + "learning_rate": 6.105743932438352e-05, + "loss": 0.01, + "step": 614530 + }, + { + "epoch": 1.59, + "learning_rate": 6.105355110801205e-05, + "loss": 0.0073, + "step": 614540 + }, + { + "epoch": 1.59, + "learning_rate": 6.104966289164059e-05, + "loss": 0.0057, + "step": 614550 + }, + { + "epoch": 1.59, + "learning_rate": 6.104577467526912e-05, + "loss": 0.0092, + "step": 614560 + }, + { + "epoch": 1.59, + "learning_rate": 6.104188645889766e-05, + "loss": 0.0073, + "step": 614570 + }, + { + "epoch": 1.59, + "learning_rate": 6.103799824252619e-05, + "loss": 0.008, + "step": 614580 + }, + { + "epoch": 1.59, + "learning_rate": 6.103411002615473e-05, + "loss": 0.0098, + "step": 614590 + }, + { + "epoch": 1.59, + "learning_rate": 6.1030221809783265e-05, + "loss": 0.0099, + "step": 614600 + }, + { + "epoch": 1.59, + "learning_rate": 6.10263335934118e-05, + "loss": 0.0106, + "step": 614610 + }, + { + "epoch": 1.59, + "learning_rate": 6.1022445377040335e-05, + "loss": 0.0082, + "step": 614620 + }, + { + "epoch": 1.59, + "learning_rate": 6.101855716066888e-05, + "loss": 0.0092, + "step": 614630 + }, + { + "epoch": 1.59, + "learning_rate": 6.101466894429741e-05, + "loss": 0.0119, + "step": 614640 + }, + { + "epoch": 1.59, + "learning_rate": 6.1010780727925946e-05, + "loss": 0.0078, + "step": 614650 + }, + { + "epoch": 1.59, + "learning_rate": 6.100689251155448e-05, + "loss": 0.0062, + "step": 614660 + }, + { + "epoch": 1.59, + "learning_rate": 6.1003004295183016e-05, + "loss": 0.0072, + "step": 614670 + }, + { + "epoch": 1.59, + "learning_rate": 6.099911607881155e-05, + "loss": 0.0082, + "step": 614680 + }, + { + "epoch": 1.59, + "learning_rate": 6.099522786244008e-05, + "loss": 0.0071, + "step": 614690 + }, + { + "epoch": 1.59, + "learning_rate": 6.0991339646068614e-05, + "loss": 0.01, + "step": 614700 + }, + { + "epoch": 1.59, + "learning_rate": 6.098745142969715e-05, + "loss": 0.0099, + "step": 614710 + }, + { + "epoch": 1.59, + "learning_rate": 6.0983563213325684e-05, + "loss": 0.0071, + "step": 614720 + }, + { + "epoch": 1.59, + "learning_rate": 6.0979674996954225e-05, + "loss": 0.008, + "step": 614730 + }, + { + "epoch": 1.59, + "learning_rate": 6.097578678058276e-05, + "loss": 0.01, + "step": 614740 + }, + { + "epoch": 1.59, + "learning_rate": 6.0971898564211295e-05, + "loss": 0.0061, + "step": 614750 + }, + { + "epoch": 1.59, + "learning_rate": 6.096801034783983e-05, + "loss": 0.0093, + "step": 614760 + }, + { + "epoch": 1.59, + "learning_rate": 6.0964122131468365e-05, + "loss": 0.0079, + "step": 614770 + }, + { + "epoch": 1.59, + "learning_rate": 6.09602339150969e-05, + "loss": 0.0086, + "step": 614780 + }, + { + "epoch": 1.59, + "learning_rate": 6.0956345698725434e-05, + "loss": 0.0074, + "step": 614790 + }, + { + "epoch": 1.59, + "learning_rate": 6.095245748235397e-05, + "loss": 0.0099, + "step": 614800 + }, + { + "epoch": 1.59, + "learning_rate": 6.094856926598251e-05, + "loss": 0.007, + "step": 614810 + }, + { + "epoch": 1.59, + "learning_rate": 6.0944681049611046e-05, + "loss": 0.0092, + "step": 614820 + }, + { + "epoch": 1.59, + "learning_rate": 6.094079283323958e-05, + "loss": 0.0077, + "step": 614830 + }, + { + "epoch": 1.59, + "learning_rate": 6.0936904616868116e-05, + "loss": 0.0094, + "step": 614840 + }, + { + "epoch": 1.59, + "learning_rate": 6.093301640049665e-05, + "loss": 0.0082, + "step": 614850 + }, + { + "epoch": 1.59, + "learning_rate": 6.0929128184125185e-05, + "loss": 0.0089, + "step": 614860 + }, + { + "epoch": 1.59, + "learning_rate": 6.092523996775372e-05, + "loss": 0.007, + "step": 614870 + }, + { + "epoch": 1.59, + "learning_rate": 6.0921351751382255e-05, + "loss": 0.0066, + "step": 614880 + }, + { + "epoch": 1.59, + "learning_rate": 6.0917463535010797e-05, + "loss": 0.0063, + "step": 614890 + }, + { + "epoch": 1.59, + "learning_rate": 6.091357531863933e-05, + "loss": 0.0097, + "step": 614900 + }, + { + "epoch": 1.59, + "learning_rate": 6.0909687102267866e-05, + "loss": 0.0083, + "step": 614910 + }, + { + "epoch": 1.59, + "learning_rate": 6.09057988858964e-05, + "loss": 0.009, + "step": 614920 + }, + { + "epoch": 1.59, + "learning_rate": 6.0901910669524936e-05, + "loss": 0.0089, + "step": 614930 + }, + { + "epoch": 1.59, + "learning_rate": 6.0898022453153464e-05, + "loss": 0.0085, + "step": 614940 + }, + { + "epoch": 1.59, + "learning_rate": 6.0894134236782e-05, + "loss": 0.006, + "step": 614950 + }, + { + "epoch": 1.59, + "learning_rate": 6.0890246020410534e-05, + "loss": 0.01, + "step": 614960 + }, + { + "epoch": 1.59, + "learning_rate": 6.088635780403907e-05, + "loss": 0.0076, + "step": 614970 + }, + { + "epoch": 1.59, + "learning_rate": 6.0882469587667604e-05, + "loss": 0.0088, + "step": 614980 + }, + { + "epoch": 1.59, + "learning_rate": 6.0878581371296145e-05, + "loss": 0.0089, + "step": 614990 + }, + { + "epoch": 1.59, + "learning_rate": 6.087469315492468e-05, + "loss": 0.0113, + "step": 615000 + }, + { + "epoch": 1.59, + "eval_cer": 0.8816998870492994, + "eval_loss": 0.005477694794535637, + "eval_runtime": 107.7529, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 615000 + }, + { + "epoch": 1.59, + "learning_rate": 6.0870804938553215e-05, + "loss": 0.0063, + "step": 615010 + }, + { + "epoch": 1.59, + "learning_rate": 6.086691672218175e-05, + "loss": 0.0062, + "step": 615020 + }, + { + "epoch": 1.59, + "learning_rate": 6.0863028505810285e-05, + "loss": 0.0091, + "step": 615030 + }, + { + "epoch": 1.59, + "learning_rate": 6.085914028943882e-05, + "loss": 0.0098, + "step": 615040 + }, + { + "epoch": 1.59, + "learning_rate": 6.0855252073067354e-05, + "loss": 0.008, + "step": 615050 + }, + { + "epoch": 1.59, + "learning_rate": 6.085136385669589e-05, + "loss": 0.0072, + "step": 615060 + }, + { + "epoch": 1.59, + "learning_rate": 6.084747564032443e-05, + "loss": 0.0098, + "step": 615070 + }, + { + "epoch": 1.59, + "learning_rate": 6.0843587423952966e-05, + "loss": 0.011, + "step": 615080 + }, + { + "epoch": 1.59, + "learning_rate": 6.08396992075815e-05, + "loss": 0.0052, + "step": 615090 + }, + { + "epoch": 1.59, + "learning_rate": 6.0835810991210035e-05, + "loss": 0.0065, + "step": 615100 + }, + { + "epoch": 1.59, + "learning_rate": 6.083192277483857e-05, + "loss": 0.0088, + "step": 615110 + }, + { + "epoch": 1.59, + "learning_rate": 6.0828034558467105e-05, + "loss": 0.0105, + "step": 615120 + }, + { + "epoch": 1.59, + "learning_rate": 6.082414634209564e-05, + "loss": 0.0106, + "step": 615130 + }, + { + "epoch": 1.59, + "learning_rate": 6.0820258125724175e-05, + "loss": 0.0065, + "step": 615140 + }, + { + "epoch": 1.59, + "learning_rate": 6.0816369909352717e-05, + "loss": 0.0066, + "step": 615150 + }, + { + "epoch": 1.59, + "learning_rate": 6.081248169298125e-05, + "loss": 0.0093, + "step": 615160 + }, + { + "epoch": 1.59, + "learning_rate": 6.0808593476609786e-05, + "loss": 0.0078, + "step": 615170 + }, + { + "epoch": 1.59, + "learning_rate": 6.080470526023832e-05, + "loss": 0.0065, + "step": 615180 + }, + { + "epoch": 1.59, + "learning_rate": 6.080081704386685e-05, + "loss": 0.0079, + "step": 615190 + }, + { + "epoch": 1.59, + "learning_rate": 6.0796928827495384e-05, + "loss": 0.0088, + "step": 615200 + }, + { + "epoch": 1.59, + "learning_rate": 6.079304061112392e-05, + "loss": 0.0069, + "step": 615210 + }, + { + "epoch": 1.59, + "learning_rate": 6.0789152394752454e-05, + "loss": 0.0065, + "step": 615220 + }, + { + "epoch": 1.59, + "learning_rate": 6.078526417838099e-05, + "loss": 0.0085, + "step": 615230 + }, + { + "epoch": 1.59, + "learning_rate": 6.0781375962009524e-05, + "loss": 0.0074, + "step": 615240 + }, + { + "epoch": 1.59, + "learning_rate": 6.0777487745638065e-05, + "loss": 0.0092, + "step": 615250 + }, + { + "epoch": 1.59, + "learning_rate": 6.07735995292666e-05, + "loss": 0.01, + "step": 615260 + }, + { + "epoch": 1.59, + "learning_rate": 6.0769711312895135e-05, + "loss": 0.0086, + "step": 615270 + }, + { + "epoch": 1.59, + "learning_rate": 6.076582309652367e-05, + "loss": 0.0072, + "step": 615280 + }, + { + "epoch": 1.59, + "learning_rate": 6.0761934880152205e-05, + "loss": 0.0087, + "step": 615290 + }, + { + "epoch": 1.59, + "learning_rate": 6.075804666378074e-05, + "loss": 0.0074, + "step": 615300 + }, + { + "epoch": 1.59, + "learning_rate": 6.0754158447409274e-05, + "loss": 0.0066, + "step": 615310 + }, + { + "epoch": 1.59, + "learning_rate": 6.075027023103781e-05, + "loss": 0.0087, + "step": 615320 + }, + { + "epoch": 1.6, + "learning_rate": 6.074638201466635e-05, + "loss": 0.0086, + "step": 615330 + }, + { + "epoch": 1.6, + "learning_rate": 6.0742493798294886e-05, + "loss": 0.0074, + "step": 615340 + }, + { + "epoch": 1.6, + "learning_rate": 6.073860558192342e-05, + "loss": 0.0052, + "step": 615350 + }, + { + "epoch": 1.6, + "learning_rate": 6.0734717365551955e-05, + "loss": 0.0111, + "step": 615360 + }, + { + "epoch": 1.6, + "learning_rate": 6.073082914918049e-05, + "loss": 0.008, + "step": 615370 + }, + { + "epoch": 1.6, + "learning_rate": 6.0726940932809025e-05, + "loss": 0.0087, + "step": 615380 + }, + { + "epoch": 1.6, + "learning_rate": 6.072305271643756e-05, + "loss": 0.0076, + "step": 615390 + }, + { + "epoch": 1.6, + "learning_rate": 6.0719164500066095e-05, + "loss": 0.0098, + "step": 615400 + }, + { + "epoch": 1.6, + "learning_rate": 6.0715276283694637e-05, + "loss": 0.0078, + "step": 615410 + }, + { + "epoch": 1.6, + "learning_rate": 6.071138806732317e-05, + "loss": 0.0088, + "step": 615420 + }, + { + "epoch": 1.6, + "learning_rate": 6.07074998509517e-05, + "loss": 0.0083, + "step": 615430 + }, + { + "epoch": 1.6, + "learning_rate": 6.0703611634580234e-05, + "loss": 0.0088, + "step": 615440 + }, + { + "epoch": 1.6, + "learning_rate": 6.069972341820877e-05, + "loss": 0.0092, + "step": 615450 + }, + { + "epoch": 1.6, + "learning_rate": 6.0695835201837304e-05, + "loss": 0.0086, + "step": 615460 + }, + { + "epoch": 1.6, + "learning_rate": 6.069194698546584e-05, + "loss": 0.0081, + "step": 615470 + }, + { + "epoch": 1.6, + "learning_rate": 6.0688058769094374e-05, + "loss": 0.0061, + "step": 615480 + }, + { + "epoch": 1.6, + "learning_rate": 6.068417055272291e-05, + "loss": 0.0073, + "step": 615490 + }, + { + "epoch": 1.6, + "learning_rate": 6.0680282336351443e-05, + "loss": 0.0115, + "step": 615500 + }, + { + "epoch": 1.6, + "learning_rate": 6.0676394119979985e-05, + "loss": 0.0085, + "step": 615510 + }, + { + "epoch": 1.6, + "learning_rate": 6.067250590360852e-05, + "loss": 0.0094, + "step": 615520 + }, + { + "epoch": 1.6, + "learning_rate": 6.0668617687237055e-05, + "loss": 0.007, + "step": 615530 + }, + { + "epoch": 1.6, + "learning_rate": 6.066472947086559e-05, + "loss": 0.0063, + "step": 615540 + }, + { + "epoch": 1.6, + "learning_rate": 6.0660841254494125e-05, + "loss": 0.0104, + "step": 615550 + }, + { + "epoch": 1.6, + "learning_rate": 6.065695303812266e-05, + "loss": 0.0089, + "step": 615560 + }, + { + "epoch": 1.6, + "learning_rate": 6.0653064821751194e-05, + "loss": 0.0068, + "step": 615570 + }, + { + "epoch": 1.6, + "learning_rate": 6.064917660537973e-05, + "loss": 0.0073, + "step": 615580 + }, + { + "epoch": 1.6, + "learning_rate": 6.064528838900827e-05, + "loss": 0.0061, + "step": 615590 + }, + { + "epoch": 1.6, + "learning_rate": 6.0641400172636806e-05, + "loss": 0.0087, + "step": 615600 + }, + { + "epoch": 1.6, + "learning_rate": 6.063751195626534e-05, + "loss": 0.0094, + "step": 615610 + }, + { + "epoch": 1.6, + "learning_rate": 6.0633623739893875e-05, + "loss": 0.0099, + "step": 615620 + }, + { + "epoch": 1.6, + "learning_rate": 6.062973552352241e-05, + "loss": 0.0093, + "step": 615630 + }, + { + "epoch": 1.6, + "learning_rate": 6.0625847307150945e-05, + "loss": 0.0075, + "step": 615640 + }, + { + "epoch": 1.6, + "learning_rate": 6.062195909077948e-05, + "loss": 0.0108, + "step": 615650 + }, + { + "epoch": 1.6, + "learning_rate": 6.0618070874408015e-05, + "loss": 0.0081, + "step": 615660 + }, + { + "epoch": 1.6, + "learning_rate": 6.061418265803655e-05, + "loss": 0.0099, + "step": 615670 + }, + { + "epoch": 1.6, + "learning_rate": 6.061029444166508e-05, + "loss": 0.0074, + "step": 615680 + }, + { + "epoch": 1.6, + "learning_rate": 6.060640622529362e-05, + "loss": 0.0049, + "step": 615690 + }, + { + "epoch": 1.6, + "learning_rate": 6.0602518008922154e-05, + "loss": 0.0095, + "step": 615700 + }, + { + "epoch": 1.6, + "learning_rate": 6.059862979255069e-05, + "loss": 0.009, + "step": 615710 + }, + { + "epoch": 1.6, + "learning_rate": 6.0594741576179224e-05, + "loss": 0.0054, + "step": 615720 + }, + { + "epoch": 1.6, + "learning_rate": 6.059085335980776e-05, + "loss": 0.0083, + "step": 615730 + }, + { + "epoch": 1.6, + "learning_rate": 6.0586965143436294e-05, + "loss": 0.0097, + "step": 615740 + }, + { + "epoch": 1.6, + "learning_rate": 6.058307692706483e-05, + "loss": 0.0113, + "step": 615750 + }, + { + "epoch": 1.6, + "learning_rate": 6.0579188710693363e-05, + "loss": 0.0083, + "step": 615760 + }, + { + "epoch": 1.6, + "learning_rate": 6.0575300494321905e-05, + "loss": 0.0096, + "step": 615770 + }, + { + "epoch": 1.6, + "learning_rate": 6.057141227795044e-05, + "loss": 0.0096, + "step": 615780 + }, + { + "epoch": 1.6, + "learning_rate": 6.0567524061578975e-05, + "loss": 0.0079, + "step": 615790 + }, + { + "epoch": 1.6, + "learning_rate": 6.056363584520751e-05, + "loss": 0.0086, + "step": 615800 + }, + { + "epoch": 1.6, + "learning_rate": 6.0559747628836045e-05, + "loss": 0.0103, + "step": 615810 + }, + { + "epoch": 1.6, + "learning_rate": 6.055585941246458e-05, + "loss": 0.0109, + "step": 615820 + }, + { + "epoch": 1.6, + "learning_rate": 6.0551971196093114e-05, + "loss": 0.0074, + "step": 615830 + }, + { + "epoch": 1.6, + "learning_rate": 6.054808297972165e-05, + "loss": 0.0094, + "step": 615840 + }, + { + "epoch": 1.6, + "learning_rate": 6.0544194763350184e-05, + "loss": 0.0105, + "step": 615850 + }, + { + "epoch": 1.6, + "learning_rate": 6.0540306546978726e-05, + "loss": 0.0078, + "step": 615860 + }, + { + "epoch": 1.6, + "learning_rate": 6.053641833060726e-05, + "loss": 0.0108, + "step": 615870 + }, + { + "epoch": 1.6, + "learning_rate": 6.0532530114235795e-05, + "loss": 0.0067, + "step": 615880 + }, + { + "epoch": 1.6, + "learning_rate": 6.052864189786433e-05, + "loss": 0.0079, + "step": 615890 + }, + { + "epoch": 1.6, + "learning_rate": 6.0524753681492865e-05, + "loss": 0.008, + "step": 615900 + }, + { + "epoch": 1.6, + "learning_rate": 6.05208654651214e-05, + "loss": 0.0072, + "step": 615910 + }, + { + "epoch": 1.6, + "learning_rate": 6.0516977248749935e-05, + "loss": 0.0078, + "step": 615920 + }, + { + "epoch": 1.6, + "learning_rate": 6.051308903237846e-05, + "loss": 0.0079, + "step": 615930 + }, + { + "epoch": 1.6, + "learning_rate": 6.0509200816007e-05, + "loss": 0.0079, + "step": 615940 + }, + { + "epoch": 1.6, + "learning_rate": 6.050531259963553e-05, + "loss": 0.0113, + "step": 615950 + }, + { + "epoch": 1.6, + "learning_rate": 6.0501424383264074e-05, + "loss": 0.0073, + "step": 615960 + }, + { + "epoch": 1.6, + "learning_rate": 6.049753616689261e-05, + "loss": 0.0085, + "step": 615970 + }, + { + "epoch": 1.6, + "learning_rate": 6.0493647950521144e-05, + "loss": 0.0081, + "step": 615980 + }, + { + "epoch": 1.6, + "learning_rate": 6.048975973414968e-05, + "loss": 0.0078, + "step": 615990 + }, + { + "epoch": 1.6, + "learning_rate": 6.0485871517778214e-05, + "loss": 0.0076, + "step": 616000 + }, + { + "epoch": 1.6, + "eval_cer": 0.8817124837817071, + "eval_loss": 0.005670115817338228, + "eval_runtime": 107.9064, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, + "step": 616000 + }, + { + "epoch": 1.6, + "learning_rate": 6.048198330140675e-05, + "loss": 0.0088, + "step": 616010 + }, + { + "epoch": 1.6, + "learning_rate": 6.0478095085035283e-05, + "loss": 0.0101, + "step": 616020 + }, + { + "epoch": 1.6, + "learning_rate": 6.047420686866382e-05, + "loss": 0.0117, + "step": 616030 + }, + { + "epoch": 1.6, + "learning_rate": 6.047031865229236e-05, + "loss": 0.0092, + "step": 616040 + }, + { + "epoch": 1.6, + "learning_rate": 6.0466430435920895e-05, + "loss": 0.0069, + "step": 616050 + }, + { + "epoch": 1.6, + "learning_rate": 6.046254221954943e-05, + "loss": 0.0073, + "step": 616060 + }, + { + "epoch": 1.6, + "learning_rate": 6.0458654003177964e-05, + "loss": 0.0078, + "step": 616070 + }, + { + "epoch": 1.6, + "learning_rate": 6.04547657868065e-05, + "loss": 0.0061, + "step": 616080 + }, + { + "epoch": 1.6, + "learning_rate": 6.0450877570435034e-05, + "loss": 0.0103, + "step": 616090 + }, + { + "epoch": 1.6, + "learning_rate": 6.044698935406357e-05, + "loss": 0.0096, + "step": 616100 + }, + { + "epoch": 1.6, + "learning_rate": 6.0443101137692104e-05, + "loss": 0.0094, + "step": 616110 + }, + { + "epoch": 1.6, + "learning_rate": 6.0439212921320646e-05, + "loss": 0.0089, + "step": 616120 + }, + { + "epoch": 1.6, + "learning_rate": 6.043532470494918e-05, + "loss": 0.0084, + "step": 616130 + }, + { + "epoch": 1.6, + "learning_rate": 6.0431436488577715e-05, + "loss": 0.007, + "step": 616140 + }, + { + "epoch": 1.6, + "learning_rate": 6.042754827220625e-05, + "loss": 0.01, + "step": 616150 + }, + { + "epoch": 1.6, + "learning_rate": 6.0423660055834785e-05, + "loss": 0.0065, + "step": 616160 + }, + { + "epoch": 1.6, + "learning_rate": 6.041977183946332e-05, + "loss": 0.0095, + "step": 616170 + }, + { + "epoch": 1.6, + "learning_rate": 6.041588362309185e-05, + "loss": 0.0111, + "step": 616180 + }, + { + "epoch": 1.6, + "learning_rate": 6.041199540672038e-05, + "loss": 0.0068, + "step": 616190 + }, + { + "epoch": 1.6, + "learning_rate": 6.040810719034892e-05, + "loss": 0.0094, + "step": 616200 + }, + { + "epoch": 1.6, + "learning_rate": 6.040421897397745e-05, + "loss": 0.0101, + "step": 616210 + }, + { + "epoch": 1.6, + "learning_rate": 6.0400330757605994e-05, + "loss": 0.0109, + "step": 616220 + }, + { + "epoch": 1.6, + "learning_rate": 6.039644254123453e-05, + "loss": 0.0077, + "step": 616230 + }, + { + "epoch": 1.6, + "learning_rate": 6.0392554324863064e-05, + "loss": 0.0078, + "step": 616240 + }, + { + "epoch": 1.6, + "learning_rate": 6.03886661084916e-05, + "loss": 0.0073, + "step": 616250 + }, + { + "epoch": 1.6, + "learning_rate": 6.0384777892120134e-05, + "loss": 0.0078, + "step": 616260 + }, + { + "epoch": 1.6, + "learning_rate": 6.038088967574867e-05, + "loss": 0.0075, + "step": 616270 + }, + { + "epoch": 1.6, + "learning_rate": 6.03770014593772e-05, + "loss": 0.0061, + "step": 616280 + }, + { + "epoch": 1.6, + "learning_rate": 6.037311324300574e-05, + "loss": 0.0093, + "step": 616290 + }, + { + "epoch": 1.6, + "learning_rate": 6.036922502663428e-05, + "loss": 0.0123, + "step": 616300 + }, + { + "epoch": 1.6, + "learning_rate": 6.0365336810262815e-05, + "loss": 0.0088, + "step": 616310 + }, + { + "epoch": 1.6, + "learning_rate": 6.036144859389135e-05, + "loss": 0.0078, + "step": 616320 + }, + { + "epoch": 1.6, + "learning_rate": 6.0357560377519884e-05, + "loss": 0.0074, + "step": 616330 + }, + { + "epoch": 1.6, + "learning_rate": 6.035367216114842e-05, + "loss": 0.011, + "step": 616340 + }, + { + "epoch": 1.6, + "learning_rate": 6.0349783944776954e-05, + "loss": 0.0108, + "step": 616350 + }, + { + "epoch": 1.6, + "learning_rate": 6.034589572840549e-05, + "loss": 0.0074, + "step": 616360 + }, + { + "epoch": 1.6, + "learning_rate": 6.0342007512034024e-05, + "loss": 0.008, + "step": 616370 + }, + { + "epoch": 1.6, + "learning_rate": 6.0338119295662566e-05, + "loss": 0.0075, + "step": 616380 + }, + { + "epoch": 1.6, + "learning_rate": 6.03342310792911e-05, + "loss": 0.0084, + "step": 616390 + }, + { + "epoch": 1.6, + "learning_rate": 6.0330342862919635e-05, + "loss": 0.0098, + "step": 616400 + }, + { + "epoch": 1.6, + "learning_rate": 6.032645464654817e-05, + "loss": 0.0101, + "step": 616410 + }, + { + "epoch": 1.6, + "learning_rate": 6.0322566430176705e-05, + "loss": 0.0086, + "step": 616420 + }, + { + "epoch": 1.6, + "learning_rate": 6.031867821380523e-05, + "loss": 0.009, + "step": 616430 + }, + { + "epoch": 1.6, + "learning_rate": 6.031478999743377e-05, + "loss": 0.01, + "step": 616440 + }, + { + "epoch": 1.6, + "learning_rate": 6.03109017810623e-05, + "loss": 0.0097, + "step": 616450 + }, + { + "epoch": 1.6, + "learning_rate": 6.030701356469084e-05, + "loss": 0.0109, + "step": 616460 + }, + { + "epoch": 1.6, + "learning_rate": 6.030312534831937e-05, + "loss": 0.0091, + "step": 616470 + }, + { + "epoch": 1.6, + "learning_rate": 6.0299237131947914e-05, + "loss": 0.0078, + "step": 616480 + }, + { + "epoch": 1.6, + "learning_rate": 6.029534891557645e-05, + "loss": 0.0101, + "step": 616490 + }, + { + "epoch": 1.6, + "learning_rate": 6.0291460699204984e-05, + "loss": 0.0109, + "step": 616500 + }, + { + "epoch": 1.6, + "learning_rate": 6.028757248283352e-05, + "loss": 0.0084, + "step": 616510 + }, + { + "epoch": 1.6, + "learning_rate": 6.0283684266462054e-05, + "loss": 0.0109, + "step": 616520 + }, + { + "epoch": 1.6, + "learning_rate": 6.027979605009059e-05, + "loss": 0.0083, + "step": 616530 + }, + { + "epoch": 1.6, + "learning_rate": 6.027590783371912e-05, + "loss": 0.0071, + "step": 616540 + }, + { + "epoch": 1.6, + "learning_rate": 6.027201961734766e-05, + "loss": 0.0109, + "step": 616550 + }, + { + "epoch": 1.6, + "learning_rate": 6.02681314009762e-05, + "loss": 0.0101, + "step": 616560 + }, + { + "epoch": 1.6, + "learning_rate": 6.0264243184604735e-05, + "loss": 0.0083, + "step": 616570 + }, + { + "epoch": 1.6, + "learning_rate": 6.026035496823327e-05, + "loss": 0.0076, + "step": 616580 + }, + { + "epoch": 1.6, + "learning_rate": 6.0256466751861804e-05, + "loss": 0.008, + "step": 616590 + }, + { + "epoch": 1.6, + "learning_rate": 6.025257853549034e-05, + "loss": 0.0107, + "step": 616600 + }, + { + "epoch": 1.6, + "learning_rate": 6.0248690319118874e-05, + "loss": 0.0078, + "step": 616610 + }, + { + "epoch": 1.6, + "learning_rate": 6.024480210274741e-05, + "loss": 0.0076, + "step": 616620 + }, + { + "epoch": 1.6, + "learning_rate": 6.0240913886375944e-05, + "loss": 0.0094, + "step": 616630 + }, + { + "epoch": 1.6, + "learning_rate": 6.0237025670004485e-05, + "loss": 0.0086, + "step": 616640 + }, + { + "epoch": 1.6, + "learning_rate": 6.023313745363302e-05, + "loss": 0.0069, + "step": 616650 + }, + { + "epoch": 1.6, + "learning_rate": 6.0229249237261555e-05, + "loss": 0.0088, + "step": 616660 + }, + { + "epoch": 1.6, + "learning_rate": 6.022536102089008e-05, + "loss": 0.0084, + "step": 616670 + }, + { + "epoch": 1.6, + "learning_rate": 6.022147280451862e-05, + "loss": 0.008, + "step": 616680 + }, + { + "epoch": 1.6, + "learning_rate": 6.021758458814715e-05, + "loss": 0.0092, + "step": 616690 + }, + { + "epoch": 1.6, + "learning_rate": 6.021369637177569e-05, + "loss": 0.0075, + "step": 616700 + }, + { + "epoch": 1.6, + "learning_rate": 6.020980815540422e-05, + "loss": 0.0086, + "step": 616710 + }, + { + "epoch": 1.6, + "learning_rate": 6.020591993903276e-05, + "loss": 0.0063, + "step": 616720 + }, + { + "epoch": 1.6, + "learning_rate": 6.020203172266129e-05, + "loss": 0.0093, + "step": 616730 + }, + { + "epoch": 1.6, + "learning_rate": 6.0198143506289834e-05, + "loss": 0.0119, + "step": 616740 + }, + { + "epoch": 1.6, + "learning_rate": 6.019425528991837e-05, + "loss": 0.0067, + "step": 616750 + }, + { + "epoch": 1.6, + "learning_rate": 6.0190367073546904e-05, + "loss": 0.0097, + "step": 616760 + }, + { + "epoch": 1.6, + "learning_rate": 6.018647885717544e-05, + "loss": 0.007, + "step": 616770 + }, + { + "epoch": 1.6, + "learning_rate": 6.0182590640803974e-05, + "loss": 0.0084, + "step": 616780 + }, + { + "epoch": 1.6, + "learning_rate": 6.017870242443251e-05, + "loss": 0.0105, + "step": 616790 + }, + { + "epoch": 1.6, + "learning_rate": 6.017481420806104e-05, + "loss": 0.0094, + "step": 616800 + }, + { + "epoch": 1.6, + "learning_rate": 6.017092599168958e-05, + "loss": 0.0088, + "step": 616810 + }, + { + "epoch": 1.6, + "learning_rate": 6.016703777531812e-05, + "loss": 0.0092, + "step": 616820 + }, + { + "epoch": 1.6, + "learning_rate": 6.0163149558946655e-05, + "loss": 0.0064, + "step": 616830 + }, + { + "epoch": 1.6, + "learning_rate": 6.015926134257519e-05, + "loss": 0.0075, + "step": 616840 + }, + { + "epoch": 1.6, + "learning_rate": 6.0155373126203724e-05, + "loss": 0.009, + "step": 616850 + }, + { + "epoch": 1.6, + "learning_rate": 6.015148490983226e-05, + "loss": 0.0083, + "step": 616860 + }, + { + "epoch": 1.6, + "learning_rate": 6.0147596693460794e-05, + "loss": 0.0081, + "step": 616870 + }, + { + "epoch": 1.6, + "learning_rate": 6.014370847708933e-05, + "loss": 0.0093, + "step": 616880 + }, + { + "epoch": 1.6, + "learning_rate": 6.0139820260717864e-05, + "loss": 0.008, + "step": 616890 + }, + { + "epoch": 1.6, + "learning_rate": 6.0135932044346405e-05, + "loss": 0.0084, + "step": 616900 + }, + { + "epoch": 1.6, + "learning_rate": 6.013204382797494e-05, + "loss": 0.0085, + "step": 616910 + }, + { + "epoch": 1.6, + "learning_rate": 6.012815561160347e-05, + "loss": 0.0088, + "step": 616920 + }, + { + "epoch": 1.6, + "learning_rate": 6.0124267395232e-05, + "loss": 0.0076, + "step": 616930 + }, + { + "epoch": 1.6, + "learning_rate": 6.012037917886054e-05, + "loss": 0.0061, + "step": 616940 + }, + { + "epoch": 1.6, + "learning_rate": 6.011649096248907e-05, + "loss": 0.0088, + "step": 616950 + }, + { + "epoch": 1.6, + "learning_rate": 6.011260274611761e-05, + "loss": 0.0097, + "step": 616960 + }, + { + "epoch": 1.6, + "learning_rate": 6.010871452974614e-05, + "loss": 0.0108, + "step": 616970 + }, + { + "epoch": 1.6, + "learning_rate": 6.010482631337468e-05, + "loss": 0.0058, + "step": 616980 + }, + { + "epoch": 1.6, + "learning_rate": 6.010093809700321e-05, + "loss": 0.0095, + "step": 616990 + }, + { + "epoch": 1.6, + "learning_rate": 6.0097049880631754e-05, + "loss": 0.007, + "step": 617000 + }, + { + "epoch": 1.6, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.005568648222833872, + "eval_runtime": 107.8731, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 617000 + }, + { + "epoch": 1.6, + "learning_rate": 6.009316166426029e-05, + "loss": 0.0089, + "step": 617010 + }, + { + "epoch": 1.6, + "learning_rate": 6.0089273447888824e-05, + "loss": 0.0068, + "step": 617020 + }, + { + "epoch": 1.6, + "learning_rate": 6.008538523151736e-05, + "loss": 0.0102, + "step": 617030 + }, + { + "epoch": 1.6, + "learning_rate": 6.0081497015145893e-05, + "loss": 0.0088, + "step": 617040 + }, + { + "epoch": 1.6, + "learning_rate": 6.007760879877443e-05, + "loss": 0.0097, + "step": 617050 + }, + { + "epoch": 1.6, + "learning_rate": 6.007372058240296e-05, + "loss": 0.0086, + "step": 617060 + }, + { + "epoch": 1.6, + "learning_rate": 6.00698323660315e-05, + "loss": 0.0093, + "step": 617070 + }, + { + "epoch": 1.6, + "learning_rate": 6.006594414966004e-05, + "loss": 0.01, + "step": 617080 + }, + { + "epoch": 1.6, + "learning_rate": 6.0062055933288575e-05, + "loss": 0.0075, + "step": 617090 + }, + { + "epoch": 1.6, + "learning_rate": 6.005816771691711e-05, + "loss": 0.0076, + "step": 617100 + }, + { + "epoch": 1.6, + "learning_rate": 6.0054279500545644e-05, + "loss": 0.0062, + "step": 617110 + }, + { + "epoch": 1.6, + "learning_rate": 6.005039128417418e-05, + "loss": 0.0093, + "step": 617120 + }, + { + "epoch": 1.6, + "learning_rate": 6.0046503067802714e-05, + "loss": 0.011, + "step": 617130 + }, + { + "epoch": 1.6, + "learning_rate": 6.004261485143125e-05, + "loss": 0.0099, + "step": 617140 + }, + { + "epoch": 1.6, + "learning_rate": 6.0038726635059784e-05, + "loss": 0.0084, + "step": 617150 + }, + { + "epoch": 1.6, + "learning_rate": 6.003483841868832e-05, + "loss": 0.0084, + "step": 617160 + }, + { + "epoch": 1.6, + "learning_rate": 6.003095020231685e-05, + "loss": 0.0087, + "step": 617170 + }, + { + "epoch": 1.6, + "learning_rate": 6.002706198594539e-05, + "loss": 0.0097, + "step": 617180 + }, + { + "epoch": 1.6, + "learning_rate": 6.002317376957392e-05, + "loss": 0.0061, + "step": 617190 + }, + { + "epoch": 1.6, + "learning_rate": 6.001928555320246e-05, + "loss": 0.0093, + "step": 617200 + }, + { + "epoch": 1.6, + "learning_rate": 6.001539733683099e-05, + "loss": 0.0128, + "step": 617210 + }, + { + "epoch": 1.6, + "learning_rate": 6.001150912045953e-05, + "loss": 0.008, + "step": 617220 + }, + { + "epoch": 1.6, + "learning_rate": 6.000762090408806e-05, + "loss": 0.008, + "step": 617230 + }, + { + "epoch": 1.6, + "learning_rate": 6.00037326877166e-05, + "loss": 0.0093, + "step": 617240 + }, + { + "epoch": 1.6, + "learning_rate": 5.999984447134513e-05, + "loss": 0.0071, + "step": 617250 + }, + { + "epoch": 1.6, + "learning_rate": 5.999595625497367e-05, + "loss": 0.0077, + "step": 617260 + }, + { + "epoch": 1.6, + "learning_rate": 5.999206803860221e-05, + "loss": 0.009, + "step": 617270 + }, + { + "epoch": 1.6, + "learning_rate": 5.9988179822230744e-05, + "loss": 0.0076, + "step": 617280 + }, + { + "epoch": 1.6, + "learning_rate": 5.998429160585928e-05, + "loss": 0.0085, + "step": 617290 + }, + { + "epoch": 1.6, + "learning_rate": 5.9980403389487813e-05, + "loss": 0.0086, + "step": 617300 + }, + { + "epoch": 1.6, + "learning_rate": 5.997651517311635e-05, + "loss": 0.0101, + "step": 617310 + }, + { + "epoch": 1.6, + "learning_rate": 5.997262695674488e-05, + "loss": 0.0074, + "step": 617320 + }, + { + "epoch": 1.6, + "learning_rate": 5.996873874037342e-05, + "loss": 0.0055, + "step": 617330 + }, + { + "epoch": 1.6, + "learning_rate": 5.996485052400195e-05, + "loss": 0.0065, + "step": 617340 + }, + { + "epoch": 1.6, + "learning_rate": 5.9960962307630495e-05, + "loss": 0.0102, + "step": 617350 + }, + { + "epoch": 1.6, + "learning_rate": 5.995707409125903e-05, + "loss": 0.0088, + "step": 617360 + }, + { + "epoch": 1.6, + "learning_rate": 5.9953185874887564e-05, + "loss": 0.0099, + "step": 617370 + }, + { + "epoch": 1.6, + "learning_rate": 5.99492976585161e-05, + "loss": 0.0079, + "step": 617380 + }, + { + "epoch": 1.6, + "learning_rate": 5.9945409442144634e-05, + "loss": 0.007, + "step": 617390 + }, + { + "epoch": 1.6, + "learning_rate": 5.994152122577317e-05, + "loss": 0.0109, + "step": 617400 + }, + { + "epoch": 1.6, + "learning_rate": 5.9937633009401704e-05, + "loss": 0.0078, + "step": 617410 + }, + { + "epoch": 1.6, + "learning_rate": 5.993374479303023e-05, + "loss": 0.0072, + "step": 617420 + }, + { + "epoch": 1.6, + "learning_rate": 5.992985657665877e-05, + "loss": 0.0101, + "step": 617430 + }, + { + "epoch": 1.6, + "learning_rate": 5.99259683602873e-05, + "loss": 0.0066, + "step": 617440 + }, + { + "epoch": 1.6, + "learning_rate": 5.992208014391584e-05, + "loss": 0.0092, + "step": 617450 + }, + { + "epoch": 1.6, + "learning_rate": 5.991819192754438e-05, + "loss": 0.0076, + "step": 617460 + }, + { + "epoch": 1.6, + "learning_rate": 5.991430371117291e-05, + "loss": 0.0096, + "step": 617470 + }, + { + "epoch": 1.6, + "learning_rate": 5.991041549480145e-05, + "loss": 0.0077, + "step": 617480 + }, + { + "epoch": 1.6, + "learning_rate": 5.990652727842998e-05, + "loss": 0.0078, + "step": 617490 + }, + { + "epoch": 1.6, + "learning_rate": 5.990263906205852e-05, + "loss": 0.0091, + "step": 617500 + }, + { + "epoch": 1.6, + "learning_rate": 5.989875084568705e-05, + "loss": 0.0106, + "step": 617510 + }, + { + "epoch": 1.6, + "learning_rate": 5.989486262931559e-05, + "loss": 0.0077, + "step": 617520 + }, + { + "epoch": 1.6, + "learning_rate": 5.989097441294413e-05, + "loss": 0.0088, + "step": 617530 + }, + { + "epoch": 1.6, + "learning_rate": 5.9887086196572664e-05, + "loss": 0.009, + "step": 617540 + }, + { + "epoch": 1.6, + "learning_rate": 5.98831979802012e-05, + "loss": 0.0078, + "step": 617550 + }, + { + "epoch": 1.6, + "learning_rate": 5.987930976382973e-05, + "loss": 0.0076, + "step": 617560 + }, + { + "epoch": 1.6, + "learning_rate": 5.987542154745827e-05, + "loss": 0.0103, + "step": 617570 + }, + { + "epoch": 1.6, + "learning_rate": 5.98715333310868e-05, + "loss": 0.0095, + "step": 617580 + }, + { + "epoch": 1.6, + "learning_rate": 5.986764511471534e-05, + "loss": 0.0105, + "step": 617590 + }, + { + "epoch": 1.6, + "learning_rate": 5.986375689834387e-05, + "loss": 0.008, + "step": 617600 + }, + { + "epoch": 1.6, + "learning_rate": 5.9859868681972414e-05, + "loss": 0.0098, + "step": 617610 + }, + { + "epoch": 1.6, + "learning_rate": 5.985598046560095e-05, + "loss": 0.0094, + "step": 617620 + }, + { + "epoch": 1.6, + "learning_rate": 5.9852092249229484e-05, + "loss": 0.009, + "step": 617630 + }, + { + "epoch": 1.6, + "learning_rate": 5.984820403285802e-05, + "loss": 0.0077, + "step": 617640 + }, + { + "epoch": 1.6, + "learning_rate": 5.9844315816486554e-05, + "loss": 0.0092, + "step": 617650 + }, + { + "epoch": 1.6, + "learning_rate": 5.984042760011509e-05, + "loss": 0.0082, + "step": 617660 + }, + { + "epoch": 1.6, + "learning_rate": 5.983653938374362e-05, + "loss": 0.0067, + "step": 617670 + }, + { + "epoch": 1.6, + "learning_rate": 5.983265116737215e-05, + "loss": 0.0103, + "step": 617680 + }, + { + "epoch": 1.6, + "learning_rate": 5.9828762951000687e-05, + "loss": 0.0077, + "step": 617690 + }, + { + "epoch": 1.6, + "learning_rate": 5.982487473462922e-05, + "loss": 0.0082, + "step": 617700 + }, + { + "epoch": 1.6, + "learning_rate": 5.982098651825776e-05, + "loss": 0.0089, + "step": 617710 + }, + { + "epoch": 1.6, + "learning_rate": 5.98170983018863e-05, + "loss": 0.0077, + "step": 617720 + }, + { + "epoch": 1.6, + "learning_rate": 5.981321008551483e-05, + "loss": 0.0094, + "step": 617730 + }, + { + "epoch": 1.6, + "learning_rate": 5.980932186914337e-05, + "loss": 0.0096, + "step": 617740 + }, + { + "epoch": 1.6, + "learning_rate": 5.98054336527719e-05, + "loss": 0.0086, + "step": 617750 + }, + { + "epoch": 1.6, + "learning_rate": 5.980154543640044e-05, + "loss": 0.0071, + "step": 617760 + }, + { + "epoch": 1.6, + "learning_rate": 5.979765722002897e-05, + "loss": 0.0104, + "step": 617770 + }, + { + "epoch": 1.6, + "learning_rate": 5.979376900365751e-05, + "loss": 0.0065, + "step": 617780 + }, + { + "epoch": 1.6, + "learning_rate": 5.978988078728605e-05, + "loss": 0.0069, + "step": 617790 + }, + { + "epoch": 1.6, + "learning_rate": 5.9785992570914584e-05, + "loss": 0.0084, + "step": 617800 + }, + { + "epoch": 1.6, + "learning_rate": 5.978210435454312e-05, + "loss": 0.0066, + "step": 617810 + }, + { + "epoch": 1.6, + "learning_rate": 5.977821613817165e-05, + "loss": 0.0074, + "step": 617820 + }, + { + "epoch": 1.6, + "learning_rate": 5.977432792180019e-05, + "loss": 0.007, + "step": 617830 + }, + { + "epoch": 1.6, + "learning_rate": 5.977043970542872e-05, + "loss": 0.0089, + "step": 617840 + }, + { + "epoch": 1.6, + "learning_rate": 5.976655148905726e-05, + "loss": 0.0098, + "step": 617850 + }, + { + "epoch": 1.6, + "learning_rate": 5.976266327268579e-05, + "loss": 0.0124, + "step": 617860 + }, + { + "epoch": 1.6, + "learning_rate": 5.9758775056314334e-05, + "loss": 0.0098, + "step": 617870 + }, + { + "epoch": 1.6, + "learning_rate": 5.975488683994287e-05, + "loss": 0.0074, + "step": 617880 + }, + { + "epoch": 1.6, + "learning_rate": 5.9750998623571404e-05, + "loss": 0.0098, + "step": 617890 + }, + { + "epoch": 1.6, + "learning_rate": 5.974711040719994e-05, + "loss": 0.0075, + "step": 617900 + }, + { + "epoch": 1.6, + "learning_rate": 5.974322219082847e-05, + "loss": 0.0065, + "step": 617910 + }, + { + "epoch": 1.6, + "learning_rate": 5.9739333974457e-05, + "loss": 0.007, + "step": 617920 + }, + { + "epoch": 1.6, + "learning_rate": 5.973544575808554e-05, + "loss": 0.0089, + "step": 617930 + }, + { + "epoch": 1.6, + "learning_rate": 5.973155754171407e-05, + "loss": 0.009, + "step": 617940 + }, + { + "epoch": 1.6, + "learning_rate": 5.9727669325342607e-05, + "loss": 0.0083, + "step": 617950 + }, + { + "epoch": 1.6, + "learning_rate": 5.972378110897114e-05, + "loss": 0.0075, + "step": 617960 + }, + { + "epoch": 1.6, + "learning_rate": 5.971989289259968e-05, + "loss": 0.0096, + "step": 617970 + }, + { + "epoch": 1.6, + "learning_rate": 5.971600467622822e-05, + "loss": 0.0105, + "step": 617980 + }, + { + "epoch": 1.6, + "learning_rate": 5.971211645985675e-05, + "loss": 0.0084, + "step": 617990 + }, + { + "epoch": 1.6, + "learning_rate": 5.970822824348529e-05, + "loss": 0.0095, + "step": 618000 + }, + { + "epoch": 1.6, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.0055539365857839584, + "eval_runtime": 107.9153, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 618000 + }, + { + "epoch": 1.6, + "learning_rate": 5.970434002711382e-05, + "loss": 0.0072, + "step": 618010 + }, + { + "epoch": 1.6, + "learning_rate": 5.970045181074236e-05, + "loss": 0.0086, + "step": 618020 + }, + { + "epoch": 1.6, + "learning_rate": 5.969656359437089e-05, + "loss": 0.0121, + "step": 618030 + }, + { + "epoch": 1.6, + "learning_rate": 5.969267537799943e-05, + "loss": 0.0078, + "step": 618040 + }, + { + "epoch": 1.6, + "learning_rate": 5.968878716162797e-05, + "loss": 0.0083, + "step": 618050 + }, + { + "epoch": 1.6, + "learning_rate": 5.9684898945256504e-05, + "loss": 0.0115, + "step": 618060 + }, + { + "epoch": 1.6, + "learning_rate": 5.968101072888504e-05, + "loss": 0.0074, + "step": 618070 + }, + { + "epoch": 1.6, + "learning_rate": 5.967712251251357e-05, + "loss": 0.0129, + "step": 618080 + }, + { + "epoch": 1.6, + "learning_rate": 5.967323429614211e-05, + "loss": 0.0113, + "step": 618090 + }, + { + "epoch": 1.6, + "learning_rate": 5.966934607977064e-05, + "loss": 0.0076, + "step": 618100 + }, + { + "epoch": 1.6, + "learning_rate": 5.966545786339918e-05, + "loss": 0.0101, + "step": 618110 + }, + { + "epoch": 1.6, + "learning_rate": 5.966156964702771e-05, + "loss": 0.0092, + "step": 618120 + }, + { + "epoch": 1.6, + "learning_rate": 5.9657681430656254e-05, + "loss": 0.0085, + "step": 618130 + }, + { + "epoch": 1.6, + "learning_rate": 5.965379321428479e-05, + "loss": 0.0084, + "step": 618140 + }, + { + "epoch": 1.6, + "learning_rate": 5.9649904997913324e-05, + "loss": 0.0091, + "step": 618150 + }, + { + "epoch": 1.6, + "learning_rate": 5.964601678154185e-05, + "loss": 0.0066, + "step": 618160 + }, + { + "epoch": 1.6, + "learning_rate": 5.964212856517039e-05, + "loss": 0.01, + "step": 618170 + }, + { + "epoch": 1.6, + "learning_rate": 5.963824034879892e-05, + "loss": 0.0082, + "step": 618180 + }, + { + "epoch": 1.6, + "learning_rate": 5.963435213242746e-05, + "loss": 0.0091, + "step": 618190 + }, + { + "epoch": 1.6, + "learning_rate": 5.963046391605599e-05, + "loss": 0.0084, + "step": 618200 + }, + { + "epoch": 1.6, + "learning_rate": 5.9626575699684526e-05, + "loss": 0.0076, + "step": 618210 + }, + { + "epoch": 1.6, + "learning_rate": 5.962268748331306e-05, + "loss": 0.0075, + "step": 618220 + }, + { + "epoch": 1.6, + "learning_rate": 5.96187992669416e-05, + "loss": 0.0098, + "step": 618230 + }, + { + "epoch": 1.6, + "learning_rate": 5.961491105057014e-05, + "loss": 0.0083, + "step": 618240 + }, + { + "epoch": 1.6, + "learning_rate": 5.961102283419867e-05, + "loss": 0.0082, + "step": 618250 + }, + { + "epoch": 1.6, + "learning_rate": 5.960713461782721e-05, + "loss": 0.0113, + "step": 618260 + }, + { + "epoch": 1.6, + "learning_rate": 5.960324640145574e-05, + "loss": 0.0068, + "step": 618270 + }, + { + "epoch": 1.6, + "learning_rate": 5.959935818508428e-05, + "loss": 0.0077, + "step": 618280 + }, + { + "epoch": 1.6, + "learning_rate": 5.959546996871281e-05, + "loss": 0.0111, + "step": 618290 + }, + { + "epoch": 1.6, + "learning_rate": 5.959158175234135e-05, + "loss": 0.0094, + "step": 618300 + }, + { + "epoch": 1.6, + "learning_rate": 5.958769353596989e-05, + "loss": 0.0091, + "step": 618310 + }, + { + "epoch": 1.6, + "learning_rate": 5.9583805319598424e-05, + "loss": 0.0081, + "step": 618320 + }, + { + "epoch": 1.6, + "learning_rate": 5.957991710322696e-05, + "loss": 0.0052, + "step": 618330 + }, + { + "epoch": 1.6, + "learning_rate": 5.957602888685549e-05, + "loss": 0.0104, + "step": 618340 + }, + { + "epoch": 1.6, + "learning_rate": 5.957214067048403e-05, + "loss": 0.0099, + "step": 618350 + }, + { + "epoch": 1.6, + "learning_rate": 5.956825245411256e-05, + "loss": 0.0088, + "step": 618360 + }, + { + "epoch": 1.6, + "learning_rate": 5.95643642377411e-05, + "loss": 0.0078, + "step": 618370 + }, + { + "epoch": 1.6, + "learning_rate": 5.956047602136963e-05, + "loss": 0.0089, + "step": 618380 + }, + { + "epoch": 1.6, + "learning_rate": 5.9556587804998174e-05, + "loss": 0.0087, + "step": 618390 + }, + { + "epoch": 1.6, + "learning_rate": 5.955269958862671e-05, + "loss": 0.0103, + "step": 618400 + }, + { + "epoch": 1.6, + "learning_rate": 5.954881137225524e-05, + "loss": 0.0135, + "step": 618410 + }, + { + "epoch": 1.6, + "learning_rate": 5.954492315588377e-05, + "loss": 0.0093, + "step": 618420 + }, + { + "epoch": 1.6, + "learning_rate": 5.954103493951231e-05, + "loss": 0.0088, + "step": 618430 + }, + { + "epoch": 1.6, + "learning_rate": 5.953714672314084e-05, + "loss": 0.0119, + "step": 618440 + }, + { + "epoch": 1.6, + "learning_rate": 5.953325850676938e-05, + "loss": 0.0099, + "step": 618450 + }, + { + "epoch": 1.6, + "learning_rate": 5.952937029039791e-05, + "loss": 0.0079, + "step": 618460 + }, + { + "epoch": 1.6, + "learning_rate": 5.9525482074026446e-05, + "loss": 0.0093, + "step": 618470 + }, + { + "epoch": 1.6, + "learning_rate": 5.952159385765498e-05, + "loss": 0.009, + "step": 618480 + }, + { + "epoch": 1.6, + "learning_rate": 5.951770564128352e-05, + "loss": 0.0087, + "step": 618490 + }, + { + "epoch": 1.6, + "learning_rate": 5.951381742491206e-05, + "loss": 0.0079, + "step": 618500 + }, + { + "epoch": 1.6, + "learning_rate": 5.950992920854059e-05, + "loss": 0.0064, + "step": 618510 + }, + { + "epoch": 1.6, + "learning_rate": 5.950604099216913e-05, + "loss": 0.0111, + "step": 618520 + }, + { + "epoch": 1.6, + "learning_rate": 5.950215277579766e-05, + "loss": 0.0067, + "step": 618530 + }, + { + "epoch": 1.6, + "learning_rate": 5.94982645594262e-05, + "loss": 0.0102, + "step": 618540 + }, + { + "epoch": 1.6, + "learning_rate": 5.949437634305473e-05, + "loss": 0.0096, + "step": 618550 + }, + { + "epoch": 1.6, + "learning_rate": 5.949048812668327e-05, + "loss": 0.0113, + "step": 618560 + }, + { + "epoch": 1.6, + "learning_rate": 5.94865999103118e-05, + "loss": 0.0067, + "step": 618570 + }, + { + "epoch": 1.6, + "learning_rate": 5.9482711693940343e-05, + "loss": 0.0106, + "step": 618580 + }, + { + "epoch": 1.6, + "learning_rate": 5.947882347756888e-05, + "loss": 0.0092, + "step": 618590 + }, + { + "epoch": 1.6, + "learning_rate": 5.947493526119741e-05, + "loss": 0.006, + "step": 618600 + }, + { + "epoch": 1.6, + "learning_rate": 5.947104704482595e-05, + "loss": 0.0072, + "step": 618610 + }, + { + "epoch": 1.6, + "learning_rate": 5.946715882845448e-05, + "loss": 0.0108, + "step": 618620 + }, + { + "epoch": 1.6, + "learning_rate": 5.946327061208302e-05, + "loss": 0.0078, + "step": 618630 + }, + { + "epoch": 1.6, + "learning_rate": 5.945938239571155e-05, + "loss": 0.0095, + "step": 618640 + }, + { + "epoch": 1.6, + "learning_rate": 5.945549417934009e-05, + "loss": 0.0093, + "step": 618650 + }, + { + "epoch": 1.6, + "learning_rate": 5.9451605962968616e-05, + "loss": 0.0077, + "step": 618660 + }, + { + "epoch": 1.6, + "learning_rate": 5.944771774659715e-05, + "loss": 0.0074, + "step": 618670 + }, + { + "epoch": 1.6, + "learning_rate": 5.944382953022569e-05, + "loss": 0.0059, + "step": 618680 + }, + { + "epoch": 1.6, + "learning_rate": 5.943994131385423e-05, + "loss": 0.0068, + "step": 618690 + }, + { + "epoch": 1.6, + "learning_rate": 5.943605309748276e-05, + "loss": 0.0096, + "step": 618700 + }, + { + "epoch": 1.6, + "learning_rate": 5.94321648811113e-05, + "loss": 0.0083, + "step": 618710 + }, + { + "epoch": 1.6, + "learning_rate": 5.942827666473983e-05, + "loss": 0.0106, + "step": 618720 + }, + { + "epoch": 1.6, + "learning_rate": 5.9424388448368366e-05, + "loss": 0.0064, + "step": 618730 + }, + { + "epoch": 1.6, + "learning_rate": 5.94205002319969e-05, + "loss": 0.0083, + "step": 618740 + }, + { + "epoch": 1.6, + "learning_rate": 5.9416612015625436e-05, + "loss": 0.0068, + "step": 618750 + }, + { + "epoch": 1.6, + "learning_rate": 5.941272379925398e-05, + "loss": 0.0071, + "step": 618760 + }, + { + "epoch": 1.6, + "learning_rate": 5.940883558288251e-05, + "loss": 0.01, + "step": 618770 + }, + { + "epoch": 1.6, + "learning_rate": 5.940494736651105e-05, + "loss": 0.0072, + "step": 618780 + }, + { + "epoch": 1.6, + "learning_rate": 5.940105915013958e-05, + "loss": 0.011, + "step": 618790 + }, + { + "epoch": 1.6, + "learning_rate": 5.939717093376812e-05, + "loss": 0.0114, + "step": 618800 + }, + { + "epoch": 1.6, + "learning_rate": 5.939328271739665e-05, + "loss": 0.0091, + "step": 618810 + }, + { + "epoch": 1.6, + "learning_rate": 5.938939450102519e-05, + "loss": 0.0084, + "step": 618820 + }, + { + "epoch": 1.6, + "learning_rate": 5.938550628465372e-05, + "loss": 0.0078, + "step": 618830 + }, + { + "epoch": 1.6, + "learning_rate": 5.9381618068282263e-05, + "loss": 0.0085, + "step": 618840 + }, + { + "epoch": 1.6, + "learning_rate": 5.93777298519108e-05, + "loss": 0.0094, + "step": 618850 + }, + { + "epoch": 1.6, + "learning_rate": 5.937384163553933e-05, + "loss": 0.0069, + "step": 618860 + }, + { + "epoch": 1.6, + "learning_rate": 5.936995341916787e-05, + "loss": 0.0095, + "step": 618870 + }, + { + "epoch": 1.6, + "learning_rate": 5.93660652027964e-05, + "loss": 0.0068, + "step": 618880 + }, + { + "epoch": 1.6, + "learning_rate": 5.936217698642494e-05, + "loss": 0.0075, + "step": 618890 + }, + { + "epoch": 1.6, + "learning_rate": 5.935828877005347e-05, + "loss": 0.0106, + "step": 618900 + }, + { + "epoch": 1.6, + "learning_rate": 5.9354400553682e-05, + "loss": 0.0097, + "step": 618910 + }, + { + "epoch": 1.6, + "learning_rate": 5.9350512337310536e-05, + "loss": 0.0115, + "step": 618920 + }, + { + "epoch": 1.6, + "learning_rate": 5.934662412093907e-05, + "loss": 0.0099, + "step": 618930 + }, + { + "epoch": 1.6, + "learning_rate": 5.934273590456761e-05, + "loss": 0.01, + "step": 618940 + }, + { + "epoch": 1.6, + "learning_rate": 5.933884768819615e-05, + "loss": 0.0067, + "step": 618950 + }, + { + "epoch": 1.6, + "learning_rate": 5.933495947182468e-05, + "loss": 0.0072, + "step": 618960 + }, + { + "epoch": 1.6, + "learning_rate": 5.933107125545322e-05, + "loss": 0.0076, + "step": 618970 + }, + { + "epoch": 1.6, + "learning_rate": 5.932718303908175e-05, + "loss": 0.0057, + "step": 618980 + }, + { + "epoch": 1.6, + "learning_rate": 5.9323294822710286e-05, + "loss": 0.0091, + "step": 618990 + }, + { + "epoch": 1.6, + "learning_rate": 5.931940660633882e-05, + "loss": 0.0083, + "step": 619000 + }, + { + "epoch": 1.6, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.005528622306883335, + "eval_runtime": 107.7525, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 619000 + }, + { + "epoch": 1.6, + "learning_rate": 5.9315518389967356e-05, + "loss": 0.0105, + "step": 619010 + }, + { + "epoch": 1.6, + "learning_rate": 5.93116301735959e-05, + "loss": 0.0101, + "step": 619020 + }, + { + "epoch": 1.6, + "learning_rate": 5.930774195722443e-05, + "loss": 0.0105, + "step": 619030 + }, + { + "epoch": 1.6, + "learning_rate": 5.930385374085297e-05, + "loss": 0.0083, + "step": 619040 + }, + { + "epoch": 1.6, + "learning_rate": 5.92999655244815e-05, + "loss": 0.0111, + "step": 619050 + }, + { + "epoch": 1.6, + "learning_rate": 5.929607730811004e-05, + "loss": 0.0077, + "step": 619060 + }, + { + "epoch": 1.6, + "learning_rate": 5.929218909173857e-05, + "loss": 0.0093, + "step": 619070 + }, + { + "epoch": 1.6, + "learning_rate": 5.928830087536711e-05, + "loss": 0.008, + "step": 619080 + }, + { + "epoch": 1.6, + "learning_rate": 5.928441265899564e-05, + "loss": 0.0089, + "step": 619090 + }, + { + "epoch": 1.6, + "learning_rate": 5.928052444262418e-05, + "loss": 0.0103, + "step": 619100 + }, + { + "epoch": 1.6, + "learning_rate": 5.927663622625272e-05, + "loss": 0.007, + "step": 619110 + }, + { + "epoch": 1.6, + "learning_rate": 5.927274800988125e-05, + "loss": 0.0106, + "step": 619120 + }, + { + "epoch": 1.6, + "learning_rate": 5.926885979350979e-05, + "loss": 0.0085, + "step": 619130 + }, + { + "epoch": 1.6, + "learning_rate": 5.926497157713832e-05, + "loss": 0.0086, + "step": 619140 + }, + { + "epoch": 1.6, + "learning_rate": 5.926108336076686e-05, + "loss": 0.006, + "step": 619150 + }, + { + "epoch": 1.6, + "learning_rate": 5.9257195144395386e-05, + "loss": 0.0073, + "step": 619160 + }, + { + "epoch": 1.6, + "learning_rate": 5.925330692802392e-05, + "loss": 0.006, + "step": 619170 + }, + { + "epoch": 1.61, + "learning_rate": 5.9249418711652455e-05, + "loss": 0.0092, + "step": 619180 + }, + { + "epoch": 1.61, + "learning_rate": 5.924553049528099e-05, + "loss": 0.0096, + "step": 619190 + }, + { + "epoch": 1.61, + "learning_rate": 5.924164227890953e-05, + "loss": 0.0078, + "step": 619200 + }, + { + "epoch": 1.61, + "learning_rate": 5.923775406253807e-05, + "loss": 0.0095, + "step": 619210 + }, + { + "epoch": 1.61, + "learning_rate": 5.92338658461666e-05, + "loss": 0.0091, + "step": 619220 + }, + { + "epoch": 1.61, + "learning_rate": 5.9229977629795137e-05, + "loss": 0.0084, + "step": 619230 + }, + { + "epoch": 1.61, + "learning_rate": 5.922608941342367e-05, + "loss": 0.008, + "step": 619240 + }, + { + "epoch": 1.61, + "learning_rate": 5.9222201197052206e-05, + "loss": 0.0123, + "step": 619250 + }, + { + "epoch": 1.61, + "learning_rate": 5.921831298068074e-05, + "loss": 0.0085, + "step": 619260 + }, + { + "epoch": 1.61, + "learning_rate": 5.9214424764309276e-05, + "loss": 0.0098, + "step": 619270 + }, + { + "epoch": 1.61, + "learning_rate": 5.921053654793782e-05, + "loss": 0.0083, + "step": 619280 + }, + { + "epoch": 1.61, + "learning_rate": 5.920664833156635e-05, + "loss": 0.011, + "step": 619290 + }, + { + "epoch": 1.61, + "learning_rate": 5.920276011519489e-05, + "loss": 0.0088, + "step": 619300 + }, + { + "epoch": 1.61, + "learning_rate": 5.919887189882342e-05, + "loss": 0.0082, + "step": 619310 + }, + { + "epoch": 1.61, + "learning_rate": 5.919498368245196e-05, + "loss": 0.0109, + "step": 619320 + }, + { + "epoch": 1.61, + "learning_rate": 5.919109546608049e-05, + "loss": 0.0107, + "step": 619330 + }, + { + "epoch": 1.61, + "learning_rate": 5.918720724970903e-05, + "loss": 0.0053, + "step": 619340 + }, + { + "epoch": 1.61, + "learning_rate": 5.918331903333756e-05, + "loss": 0.0061, + "step": 619350 + }, + { + "epoch": 1.61, + "learning_rate": 5.91794308169661e-05, + "loss": 0.008, + "step": 619360 + }, + { + "epoch": 1.61, + "learning_rate": 5.917554260059464e-05, + "loss": 0.0088, + "step": 619370 + }, + { + "epoch": 1.61, + "learning_rate": 5.917165438422317e-05, + "loss": 0.012, + "step": 619380 + }, + { + "epoch": 1.61, + "learning_rate": 5.916776616785171e-05, + "loss": 0.0085, + "step": 619390 + }, + { + "epoch": 1.61, + "learning_rate": 5.9163877951480236e-05, + "loss": 0.0091, + "step": 619400 + }, + { + "epoch": 1.61, + "learning_rate": 5.915998973510877e-05, + "loss": 0.0129, + "step": 619410 + }, + { + "epoch": 1.61, + "learning_rate": 5.9156101518737306e-05, + "loss": 0.0103, + "step": 619420 + }, + { + "epoch": 1.61, + "learning_rate": 5.915221330236584e-05, + "loss": 0.0088, + "step": 619430 + }, + { + "epoch": 1.61, + "learning_rate": 5.9148325085994375e-05, + "loss": 0.0084, + "step": 619440 + }, + { + "epoch": 1.61, + "learning_rate": 5.914443686962291e-05, + "loss": 0.009, + "step": 619450 + }, + { + "epoch": 1.61, + "learning_rate": 5.914054865325145e-05, + "loss": 0.011, + "step": 619460 + }, + { + "epoch": 1.61, + "learning_rate": 5.913666043687999e-05, + "loss": 0.0068, + "step": 619470 + }, + { + "epoch": 1.61, + "learning_rate": 5.913277222050852e-05, + "loss": 0.0109, + "step": 619480 + }, + { + "epoch": 1.61, + "learning_rate": 5.9128884004137057e-05, + "loss": 0.0089, + "step": 619490 + }, + { + "epoch": 1.61, + "learning_rate": 5.912499578776559e-05, + "loss": 0.0096, + "step": 619500 + }, + { + "epoch": 1.61, + "learning_rate": 5.9121107571394126e-05, + "loss": 0.0106, + "step": 619510 + }, + { + "epoch": 1.61, + "learning_rate": 5.911721935502266e-05, + "loss": 0.0089, + "step": 619520 + }, + { + "epoch": 1.61, + "learning_rate": 5.9113331138651196e-05, + "loss": 0.0117, + "step": 619530 + }, + { + "epoch": 1.61, + "learning_rate": 5.910944292227974e-05, + "loss": 0.0087, + "step": 619540 + }, + { + "epoch": 1.61, + "learning_rate": 5.910555470590827e-05, + "loss": 0.0085, + "step": 619550 + }, + { + "epoch": 1.61, + "learning_rate": 5.910166648953681e-05, + "loss": 0.0087, + "step": 619560 + }, + { + "epoch": 1.61, + "learning_rate": 5.909777827316534e-05, + "loss": 0.0078, + "step": 619570 + }, + { + "epoch": 1.61, + "learning_rate": 5.909389005679388e-05, + "loss": 0.0061, + "step": 619580 + }, + { + "epoch": 1.61, + "learning_rate": 5.909000184042241e-05, + "loss": 0.0081, + "step": 619590 + }, + { + "epoch": 1.61, + "learning_rate": 5.908611362405095e-05, + "loss": 0.0114, + "step": 619600 + }, + { + "epoch": 1.61, + "learning_rate": 5.908222540767948e-05, + "loss": 0.0086, + "step": 619610 + }, + { + "epoch": 1.61, + "learning_rate": 5.907833719130802e-05, + "loss": 0.0108, + "step": 619620 + }, + { + "epoch": 1.61, + "learning_rate": 5.907444897493656e-05, + "loss": 0.0077, + "step": 619630 + }, + { + "epoch": 1.61, + "learning_rate": 5.907056075856509e-05, + "loss": 0.0091, + "step": 619640 + }, + { + "epoch": 1.61, + "learning_rate": 5.906667254219362e-05, + "loss": 0.0087, + "step": 619650 + }, + { + "epoch": 1.61, + "learning_rate": 5.9062784325822156e-05, + "loss": 0.0086, + "step": 619660 + }, + { + "epoch": 1.61, + "learning_rate": 5.905889610945069e-05, + "loss": 0.0076, + "step": 619670 + }, + { + "epoch": 1.61, + "learning_rate": 5.9055007893079226e-05, + "loss": 0.0091, + "step": 619680 + }, + { + "epoch": 1.61, + "learning_rate": 5.905111967670776e-05, + "loss": 0.0111, + "step": 619690 + }, + { + "epoch": 1.61, + "learning_rate": 5.9047231460336295e-05, + "loss": 0.0091, + "step": 619700 + }, + { + "epoch": 1.61, + "learning_rate": 5.904334324396483e-05, + "loss": 0.0087, + "step": 619710 + }, + { + "epoch": 1.61, + "learning_rate": 5.903945502759337e-05, + "loss": 0.0068, + "step": 619720 + }, + { + "epoch": 1.61, + "learning_rate": 5.903556681122191e-05, + "loss": 0.0055, + "step": 619730 + }, + { + "epoch": 1.61, + "learning_rate": 5.903167859485044e-05, + "loss": 0.0089, + "step": 619740 + }, + { + "epoch": 1.61, + "learning_rate": 5.9027790378478976e-05, + "loss": 0.0101, + "step": 619750 + }, + { + "epoch": 1.61, + "learning_rate": 5.902390216210751e-05, + "loss": 0.0072, + "step": 619760 + }, + { + "epoch": 1.61, + "learning_rate": 5.9020013945736046e-05, + "loss": 0.0119, + "step": 619770 + }, + { + "epoch": 1.61, + "learning_rate": 5.901612572936458e-05, + "loss": 0.0073, + "step": 619780 + }, + { + "epoch": 1.61, + "learning_rate": 5.9012237512993116e-05, + "loss": 0.0083, + "step": 619790 + }, + { + "epoch": 1.61, + "learning_rate": 5.900834929662166e-05, + "loss": 0.0072, + "step": 619800 + }, + { + "epoch": 1.61, + "learning_rate": 5.900446108025019e-05, + "loss": 0.0057, + "step": 619810 + }, + { + "epoch": 1.61, + "learning_rate": 5.900057286387873e-05, + "loss": 0.0092, + "step": 619820 + }, + { + "epoch": 1.61, + "learning_rate": 5.899668464750726e-05, + "loss": 0.009, + "step": 619830 + }, + { + "epoch": 1.61, + "learning_rate": 5.89927964311358e-05, + "loss": 0.0101, + "step": 619840 + }, + { + "epoch": 1.61, + "learning_rate": 5.898890821476433e-05, + "loss": 0.0097, + "step": 619850 + }, + { + "epoch": 1.61, + "learning_rate": 5.898501999839287e-05, + "loss": 0.0103, + "step": 619860 + }, + { + "epoch": 1.61, + "learning_rate": 5.89811317820214e-05, + "loss": 0.0081, + "step": 619870 + }, + { + "epoch": 1.61, + "learning_rate": 5.8977243565649936e-05, + "loss": 0.0081, + "step": 619880 + }, + { + "epoch": 1.61, + "learning_rate": 5.897335534927848e-05, + "loss": 0.0082, + "step": 619890 + }, + { + "epoch": 1.61, + "learning_rate": 5.8969467132907006e-05, + "loss": 0.0057, + "step": 619900 + }, + { + "epoch": 1.61, + "learning_rate": 5.896557891653554e-05, + "loss": 0.0075, + "step": 619910 + }, + { + "epoch": 1.61, + "learning_rate": 5.8961690700164076e-05, + "loss": 0.0074, + "step": 619920 + }, + { + "epoch": 1.61, + "learning_rate": 5.895780248379261e-05, + "loss": 0.0076, + "step": 619930 + }, + { + "epoch": 1.61, + "learning_rate": 5.8953914267421146e-05, + "loss": 0.0077, + "step": 619940 + }, + { + "epoch": 1.61, + "learning_rate": 5.895002605104968e-05, + "loss": 0.0094, + "step": 619950 + }, + { + "epoch": 1.61, + "learning_rate": 5.8946137834678215e-05, + "loss": 0.0114, + "step": 619960 + }, + { + "epoch": 1.61, + "learning_rate": 5.894224961830675e-05, + "loss": 0.01, + "step": 619970 + }, + { + "epoch": 1.61, + "learning_rate": 5.8938361401935285e-05, + "loss": 0.0067, + "step": 619980 + }, + { + "epoch": 1.61, + "learning_rate": 5.893447318556383e-05, + "loss": 0.0074, + "step": 619990 + }, + { + "epoch": 1.61, + "learning_rate": 5.893058496919236e-05, + "loss": 0.0073, + "step": 620000 + }, + { + "epoch": 1.61, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.00557528343051672, + "eval_runtime": 107.8677, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, + "step": 620000 + }, + { + "epoch": 1.61, + "learning_rate": 5.8926696752820896e-05, + "loss": 0.0118, + "step": 620010 + }, + { + "epoch": 1.61, + "learning_rate": 5.892280853644943e-05, + "loss": 0.0103, + "step": 620020 + }, + { + "epoch": 1.61, + "learning_rate": 5.8918920320077966e-05, + "loss": 0.0076, + "step": 620030 + }, + { + "epoch": 1.61, + "learning_rate": 5.89150321037065e-05, + "loss": 0.0097, + "step": 620040 + }, + { + "epoch": 1.61, + "learning_rate": 5.8911143887335036e-05, + "loss": 0.0078, + "step": 620050 + }, + { + "epoch": 1.61, + "learning_rate": 5.890725567096357e-05, + "loss": 0.0137, + "step": 620060 + }, + { + "epoch": 1.61, + "learning_rate": 5.890336745459211e-05, + "loss": 0.009, + "step": 620070 + }, + { + "epoch": 1.61, + "learning_rate": 5.889947923822065e-05, + "loss": 0.0091, + "step": 620080 + }, + { + "epoch": 1.61, + "learning_rate": 5.889559102184918e-05, + "loss": 0.0088, + "step": 620090 + }, + { + "epoch": 1.61, + "learning_rate": 5.889170280547772e-05, + "loss": 0.0084, + "step": 620100 + }, + { + "epoch": 1.61, + "learning_rate": 5.888781458910625e-05, + "loss": 0.0085, + "step": 620110 + }, + { + "epoch": 1.61, + "learning_rate": 5.888392637273479e-05, + "loss": 0.0066, + "step": 620120 + }, + { + "epoch": 1.61, + "learning_rate": 5.888003815636332e-05, + "loss": 0.0092, + "step": 620130 + }, + { + "epoch": 1.61, + "learning_rate": 5.8876149939991856e-05, + "loss": 0.0133, + "step": 620140 + }, + { + "epoch": 1.61, + "learning_rate": 5.8872261723620384e-05, + "loss": 0.0087, + "step": 620150 + }, + { + "epoch": 1.61, + "learning_rate": 5.886837350724892e-05, + "loss": 0.0111, + "step": 620160 + }, + { + "epoch": 1.61, + "learning_rate": 5.886448529087746e-05, + "loss": 0.0097, + "step": 620170 + }, + { + "epoch": 1.61, + "learning_rate": 5.8860597074505996e-05, + "loss": 0.0101, + "step": 620180 + }, + { + "epoch": 1.61, + "learning_rate": 5.885670885813453e-05, + "loss": 0.0055, + "step": 620190 + }, + { + "epoch": 1.61, + "learning_rate": 5.8852820641763066e-05, + "loss": 0.0084, + "step": 620200 + }, + { + "epoch": 1.61, + "learning_rate": 5.88489324253916e-05, + "loss": 0.0096, + "step": 620210 + }, + { + "epoch": 1.61, + "learning_rate": 5.8845044209020135e-05, + "loss": 0.0065, + "step": 620220 + }, + { + "epoch": 1.61, + "learning_rate": 5.884115599264867e-05, + "loss": 0.0062, + "step": 620230 + }, + { + "epoch": 1.61, + "learning_rate": 5.8837267776277205e-05, + "loss": 0.0087, + "step": 620240 + }, + { + "epoch": 1.61, + "learning_rate": 5.883337955990575e-05, + "loss": 0.0071, + "step": 620250 + }, + { + "epoch": 1.61, + "learning_rate": 5.882949134353428e-05, + "loss": 0.0092, + "step": 620260 + }, + { + "epoch": 1.61, + "learning_rate": 5.8825603127162816e-05, + "loss": 0.0068, + "step": 620270 + }, + { + "epoch": 1.61, + "learning_rate": 5.882171491079135e-05, + "loss": 0.0128, + "step": 620280 + }, + { + "epoch": 1.61, + "learning_rate": 5.8817826694419886e-05, + "loss": 0.0084, + "step": 620290 + }, + { + "epoch": 1.61, + "learning_rate": 5.881393847804842e-05, + "loss": 0.0074, + "step": 620300 + }, + { + "epoch": 1.61, + "learning_rate": 5.8810050261676956e-05, + "loss": 0.0078, + "step": 620310 + }, + { + "epoch": 1.61, + "learning_rate": 5.880616204530549e-05, + "loss": 0.0074, + "step": 620320 + }, + { + "epoch": 1.61, + "learning_rate": 5.880227382893403e-05, + "loss": 0.0103, + "step": 620330 + }, + { + "epoch": 1.61, + "learning_rate": 5.879838561256257e-05, + "loss": 0.0063, + "step": 620340 + }, + { + "epoch": 1.61, + "learning_rate": 5.87944973961911e-05, + "loss": 0.0093, + "step": 620350 + }, + { + "epoch": 1.61, + "learning_rate": 5.879060917981964e-05, + "loss": 0.0082, + "step": 620360 + }, + { + "epoch": 1.61, + "learning_rate": 5.878672096344817e-05, + "loss": 0.0145, + "step": 620370 + }, + { + "epoch": 1.61, + "learning_rate": 5.878283274707671e-05, + "loss": 0.0089, + "step": 620380 + }, + { + "epoch": 1.61, + "learning_rate": 5.877894453070524e-05, + "loss": 0.0078, + "step": 620390 + }, + { + "epoch": 1.61, + "learning_rate": 5.877505631433377e-05, + "loss": 0.0116, + "step": 620400 + }, + { + "epoch": 1.61, + "learning_rate": 5.8771168097962304e-05, + "loss": 0.0096, + "step": 620410 + }, + { + "epoch": 1.61, + "learning_rate": 5.876727988159084e-05, + "loss": 0.0077, + "step": 620420 + }, + { + "epoch": 1.61, + "learning_rate": 5.876339166521938e-05, + "loss": 0.0127, + "step": 620430 + }, + { + "epoch": 1.61, + "learning_rate": 5.8759503448847916e-05, + "loss": 0.0114, + "step": 620440 + }, + { + "epoch": 1.61, + "learning_rate": 5.875561523247645e-05, + "loss": 0.008, + "step": 620450 + }, + { + "epoch": 1.61, + "learning_rate": 5.8751727016104986e-05, + "loss": 0.0085, + "step": 620460 + }, + { + "epoch": 1.61, + "learning_rate": 5.874783879973352e-05, + "loss": 0.0093, + "step": 620470 + }, + { + "epoch": 1.61, + "learning_rate": 5.8743950583362055e-05, + "loss": 0.0071, + "step": 620480 + }, + { + "epoch": 1.61, + "learning_rate": 5.874006236699059e-05, + "loss": 0.0112, + "step": 620490 + }, + { + "epoch": 1.61, + "learning_rate": 5.8736174150619125e-05, + "loss": 0.0073, + "step": 620500 + }, + { + "epoch": 1.61, + "learning_rate": 5.8732285934247667e-05, + "loss": 0.0083, + "step": 620510 + }, + { + "epoch": 1.61, + "learning_rate": 5.87283977178762e-05, + "loss": 0.0072, + "step": 620520 + }, + { + "epoch": 1.61, + "learning_rate": 5.8724509501504736e-05, + "loss": 0.0088, + "step": 620530 + }, + { + "epoch": 1.61, + "learning_rate": 5.872062128513327e-05, + "loss": 0.0111, + "step": 620540 + }, + { + "epoch": 1.61, + "learning_rate": 5.8716733068761806e-05, + "loss": 0.0079, + "step": 620550 + }, + { + "epoch": 1.61, + "learning_rate": 5.871284485239034e-05, + "loss": 0.008, + "step": 620560 + }, + { + "epoch": 1.61, + "learning_rate": 5.8708956636018876e-05, + "loss": 0.011, + "step": 620570 + }, + { + "epoch": 1.61, + "learning_rate": 5.870506841964741e-05, + "loss": 0.0089, + "step": 620580 + }, + { + "epoch": 1.61, + "learning_rate": 5.870118020327595e-05, + "loss": 0.0079, + "step": 620590 + }, + { + "epoch": 1.61, + "learning_rate": 5.869729198690449e-05, + "loss": 0.007, + "step": 620600 + }, + { + "epoch": 1.61, + "learning_rate": 5.869340377053302e-05, + "loss": 0.0081, + "step": 620610 + }, + { + "epoch": 1.61, + "learning_rate": 5.868951555416156e-05, + "loss": 0.009, + "step": 620620 + }, + { + "epoch": 1.61, + "learning_rate": 5.868562733779009e-05, + "loss": 0.006, + "step": 620630 + }, + { + "epoch": 1.61, + "learning_rate": 5.868173912141862e-05, + "loss": 0.0086, + "step": 620640 + }, + { + "epoch": 1.61, + "learning_rate": 5.8677850905047155e-05, + "loss": 0.0079, + "step": 620650 + }, + { + "epoch": 1.61, + "learning_rate": 5.867396268867569e-05, + "loss": 0.0091, + "step": 620660 + }, + { + "epoch": 1.61, + "learning_rate": 5.8670074472304224e-05, + "loss": 0.0074, + "step": 620670 + }, + { + "epoch": 1.61, + "learning_rate": 5.866618625593276e-05, + "loss": 0.007, + "step": 620680 + }, + { + "epoch": 1.61, + "learning_rate": 5.86622980395613e-05, + "loss": 0.0083, + "step": 620690 + }, + { + "epoch": 1.61, + "learning_rate": 5.8658409823189836e-05, + "loss": 0.0077, + "step": 620700 + }, + { + "epoch": 1.61, + "learning_rate": 5.865452160681837e-05, + "loss": 0.0073, + "step": 620710 + }, + { + "epoch": 1.61, + "learning_rate": 5.8650633390446905e-05, + "loss": 0.01, + "step": 620720 + }, + { + "epoch": 1.61, + "learning_rate": 5.864674517407544e-05, + "loss": 0.0075, + "step": 620730 + }, + { + "epoch": 1.61, + "learning_rate": 5.8642856957703975e-05, + "loss": 0.0091, + "step": 620740 + }, + { + "epoch": 1.61, + "learning_rate": 5.863896874133251e-05, + "loss": 0.0065, + "step": 620750 + }, + { + "epoch": 1.61, + "learning_rate": 5.8635080524961045e-05, + "loss": 0.0104, + "step": 620760 + }, + { + "epoch": 1.61, + "learning_rate": 5.8631192308589587e-05, + "loss": 0.009, + "step": 620770 + }, + { + "epoch": 1.61, + "learning_rate": 5.862730409221812e-05, + "loss": 0.0056, + "step": 620780 + }, + { + "epoch": 1.61, + "learning_rate": 5.8623415875846656e-05, + "loss": 0.0079, + "step": 620790 + }, + { + "epoch": 1.61, + "learning_rate": 5.861952765947519e-05, + "loss": 0.0081, + "step": 620800 + }, + { + "epoch": 1.61, + "learning_rate": 5.8615639443103726e-05, + "loss": 0.0074, + "step": 620810 + }, + { + "epoch": 1.61, + "learning_rate": 5.861175122673226e-05, + "loss": 0.0121, + "step": 620820 + }, + { + "epoch": 1.61, + "learning_rate": 5.8607863010360796e-05, + "loss": 0.0066, + "step": 620830 + }, + { + "epoch": 1.61, + "learning_rate": 5.860397479398933e-05, + "loss": 0.0104, + "step": 620840 + }, + { + "epoch": 1.61, + "learning_rate": 5.860008657761787e-05, + "loss": 0.0101, + "step": 620850 + }, + { + "epoch": 1.61, + "learning_rate": 5.859619836124641e-05, + "loss": 0.0079, + "step": 620860 + }, + { + "epoch": 1.61, + "learning_rate": 5.859231014487494e-05, + "loss": 0.008, + "step": 620870 + }, + { + "epoch": 1.61, + "learning_rate": 5.858842192850348e-05, + "loss": 0.0092, + "step": 620880 + }, + { + "epoch": 1.61, + "learning_rate": 5.8584533712132005e-05, + "loss": 0.0093, + "step": 620890 + }, + { + "epoch": 1.61, + "learning_rate": 5.858064549576054e-05, + "loss": 0.0102, + "step": 620900 + }, + { + "epoch": 1.61, + "learning_rate": 5.8576757279389075e-05, + "loss": 0.0069, + "step": 620910 + }, + { + "epoch": 1.61, + "learning_rate": 5.857286906301761e-05, + "loss": 0.0114, + "step": 620920 + }, + { + "epoch": 1.61, + "learning_rate": 5.8568980846646144e-05, + "loss": 0.0072, + "step": 620930 + }, + { + "epoch": 1.61, + "learning_rate": 5.856509263027468e-05, + "loss": 0.0072, + "step": 620940 + }, + { + "epoch": 1.61, + "learning_rate": 5.856120441390322e-05, + "loss": 0.0082, + "step": 620950 + }, + { + "epoch": 1.61, + "learning_rate": 5.8557316197531756e-05, + "loss": 0.0101, + "step": 620960 + }, + { + "epoch": 1.61, + "learning_rate": 5.855342798116029e-05, + "loss": 0.01, + "step": 620970 + }, + { + "epoch": 1.61, + "learning_rate": 5.8549539764788825e-05, + "loss": 0.0083, + "step": 620980 + }, + { + "epoch": 1.61, + "learning_rate": 5.854565154841736e-05, + "loss": 0.0074, + "step": 620990 + }, + { + "epoch": 1.61, + "learning_rate": 5.8541763332045895e-05, + "loss": 0.0092, + "step": 621000 + }, + { + "epoch": 1.61, + "eval_cer": 0.881704085960102, + "eval_loss": 0.0054284194484353065, + "eval_runtime": 107.746, + "eval_samples_per_second": 18.562, + "eval_steps_per_second": 4.641, + "step": 621000 + }, + { + "epoch": 1.61, + "learning_rate": 5.853787511567443e-05, + "loss": 0.0138, + "step": 621010 + }, + { + "epoch": 1.61, + "learning_rate": 5.8533986899302965e-05, + "loss": 0.0113, + "step": 621020 + }, + { + "epoch": 1.61, + "learning_rate": 5.8530098682931507e-05, + "loss": 0.0077, + "step": 621030 + }, + { + "epoch": 1.61, + "learning_rate": 5.852621046656004e-05, + "loss": 0.0081, + "step": 621040 + }, + { + "epoch": 1.61, + "learning_rate": 5.8522322250188576e-05, + "loss": 0.008, + "step": 621050 + }, + { + "epoch": 1.61, + "learning_rate": 5.851843403381711e-05, + "loss": 0.0094, + "step": 621060 + }, + { + "epoch": 1.61, + "learning_rate": 5.8514545817445646e-05, + "loss": 0.0089, + "step": 621070 + }, + { + "epoch": 1.61, + "learning_rate": 5.851065760107418e-05, + "loss": 0.0103, + "step": 621080 + }, + { + "epoch": 1.61, + "learning_rate": 5.8506769384702716e-05, + "loss": 0.0078, + "step": 621090 + }, + { + "epoch": 1.61, + "learning_rate": 5.850288116833125e-05, + "loss": 0.0051, + "step": 621100 + }, + { + "epoch": 1.61, + "learning_rate": 5.849899295195979e-05, + "loss": 0.0089, + "step": 621110 + }, + { + "epoch": 1.61, + "learning_rate": 5.849510473558833e-05, + "loss": 0.0083, + "step": 621120 + }, + { + "epoch": 1.61, + "learning_rate": 5.849121651921686e-05, + "loss": 0.0077, + "step": 621130 + }, + { + "epoch": 1.61, + "learning_rate": 5.848732830284539e-05, + "loss": 0.0076, + "step": 621140 + }, + { + "epoch": 1.61, + "learning_rate": 5.8483440086473925e-05, + "loss": 0.0088, + "step": 621150 + }, + { + "epoch": 1.61, + "learning_rate": 5.847955187010246e-05, + "loss": 0.0105, + "step": 621160 + }, + { + "epoch": 1.61, + "learning_rate": 5.8475663653730995e-05, + "loss": 0.0077, + "step": 621170 + }, + { + "epoch": 1.61, + "learning_rate": 5.847177543735953e-05, + "loss": 0.0082, + "step": 621180 + }, + { + "epoch": 1.61, + "learning_rate": 5.8467887220988064e-05, + "loss": 0.0091, + "step": 621190 + }, + { + "epoch": 1.61, + "learning_rate": 5.84639990046166e-05, + "loss": 0.0103, + "step": 621200 + }, + { + "epoch": 1.61, + "learning_rate": 5.846011078824514e-05, + "loss": 0.0123, + "step": 621210 + }, + { + "epoch": 1.61, + "learning_rate": 5.8456222571873676e-05, + "loss": 0.0088, + "step": 621220 + }, + { + "epoch": 1.61, + "learning_rate": 5.845233435550221e-05, + "loss": 0.0067, + "step": 621230 + }, + { + "epoch": 1.61, + "learning_rate": 5.8448446139130745e-05, + "loss": 0.0099, + "step": 621240 + }, + { + "epoch": 1.61, + "learning_rate": 5.844455792275928e-05, + "loss": 0.0075, + "step": 621250 + }, + { + "epoch": 1.61, + "learning_rate": 5.8440669706387815e-05, + "loss": 0.0109, + "step": 621260 + }, + { + "epoch": 1.61, + "learning_rate": 5.843678149001635e-05, + "loss": 0.0086, + "step": 621270 + }, + { + "epoch": 1.61, + "learning_rate": 5.8432893273644885e-05, + "loss": 0.0079, + "step": 621280 + }, + { + "epoch": 1.61, + "learning_rate": 5.8429005057273426e-05, + "loss": 0.0073, + "step": 621290 + }, + { + "epoch": 1.61, + "learning_rate": 5.842511684090196e-05, + "loss": 0.0109, + "step": 621300 + }, + { + "epoch": 1.61, + "learning_rate": 5.8421228624530496e-05, + "loss": 0.0105, + "step": 621310 + }, + { + "epoch": 1.61, + "learning_rate": 5.841734040815903e-05, + "loss": 0.0084, + "step": 621320 + }, + { + "epoch": 1.61, + "learning_rate": 5.8413452191787566e-05, + "loss": 0.0074, + "step": 621330 + }, + { + "epoch": 1.61, + "learning_rate": 5.84095639754161e-05, + "loss": 0.0066, + "step": 621340 + }, + { + "epoch": 1.61, + "learning_rate": 5.8405675759044636e-05, + "loss": 0.0099, + "step": 621350 + }, + { + "epoch": 1.61, + "learning_rate": 5.840178754267317e-05, + "loss": 0.0106, + "step": 621360 + }, + { + "epoch": 1.61, + "learning_rate": 5.8397899326301705e-05, + "loss": 0.0089, + "step": 621370 + }, + { + "epoch": 1.61, + "learning_rate": 5.839401110993025e-05, + "loss": 0.0095, + "step": 621380 + }, + { + "epoch": 1.61, + "learning_rate": 5.8390122893558775e-05, + "loss": 0.0075, + "step": 621390 + }, + { + "epoch": 1.61, + "learning_rate": 5.838623467718731e-05, + "loss": 0.0111, + "step": 621400 + }, + { + "epoch": 1.61, + "learning_rate": 5.8382346460815845e-05, + "loss": 0.006, + "step": 621410 + }, + { + "epoch": 1.61, + "learning_rate": 5.837845824444438e-05, + "loss": 0.0074, + "step": 621420 + }, + { + "epoch": 1.61, + "learning_rate": 5.8374570028072915e-05, + "loss": 0.0074, + "step": 621430 + }, + { + "epoch": 1.61, + "learning_rate": 5.837068181170145e-05, + "loss": 0.0079, + "step": 621440 + }, + { + "epoch": 1.61, + "learning_rate": 5.8366793595329984e-05, + "loss": 0.0101, + "step": 621450 + }, + { + "epoch": 1.61, + "learning_rate": 5.836290537895852e-05, + "loss": 0.009, + "step": 621460 + }, + { + "epoch": 1.61, + "learning_rate": 5.8359017162587054e-05, + "loss": 0.0066, + "step": 621470 + }, + { + "epoch": 1.61, + "learning_rate": 5.8355128946215596e-05, + "loss": 0.0106, + "step": 621480 + }, + { + "epoch": 1.61, + "learning_rate": 5.835124072984413e-05, + "loss": 0.0084, + "step": 621490 + }, + { + "epoch": 1.61, + "learning_rate": 5.8347352513472665e-05, + "loss": 0.0092, + "step": 621500 + }, + { + "epoch": 1.61, + "learning_rate": 5.83434642971012e-05, + "loss": 0.0077, + "step": 621510 + }, + { + "epoch": 1.61, + "learning_rate": 5.8339576080729735e-05, + "loss": 0.0076, + "step": 621520 + }, + { + "epoch": 1.61, + "learning_rate": 5.833568786435827e-05, + "loss": 0.0085, + "step": 621530 + }, + { + "epoch": 1.61, + "learning_rate": 5.8331799647986805e-05, + "loss": 0.009, + "step": 621540 + }, + { + "epoch": 1.61, + "learning_rate": 5.832791143161534e-05, + "loss": 0.0077, + "step": 621550 + }, + { + "epoch": 1.61, + "learning_rate": 5.832402321524388e-05, + "loss": 0.0066, + "step": 621560 + }, + { + "epoch": 1.61, + "learning_rate": 5.8320134998872416e-05, + "loss": 0.0072, + "step": 621570 + }, + { + "epoch": 1.61, + "learning_rate": 5.831624678250095e-05, + "loss": 0.0097, + "step": 621580 + }, + { + "epoch": 1.61, + "learning_rate": 5.8312358566129486e-05, + "loss": 0.0096, + "step": 621590 + }, + { + "epoch": 1.61, + "learning_rate": 5.830847034975802e-05, + "loss": 0.0071, + "step": 621600 + }, + { + "epoch": 1.61, + "learning_rate": 5.8304582133386556e-05, + "loss": 0.0076, + "step": 621610 + }, + { + "epoch": 1.61, + "learning_rate": 5.830069391701509e-05, + "loss": 0.007, + "step": 621620 + }, + { + "epoch": 1.61, + "learning_rate": 5.8296805700643625e-05, + "loss": 0.0081, + "step": 621630 + }, + { + "epoch": 1.61, + "learning_rate": 5.829291748427215e-05, + "loss": 0.0075, + "step": 621640 + }, + { + "epoch": 1.61, + "learning_rate": 5.828902926790069e-05, + "loss": 0.0106, + "step": 621650 + }, + { + "epoch": 1.61, + "learning_rate": 5.828514105152923e-05, + "loss": 0.0085, + "step": 621660 + }, + { + "epoch": 1.61, + "learning_rate": 5.8281252835157765e-05, + "loss": 0.0078, + "step": 621670 + }, + { + "epoch": 1.61, + "learning_rate": 5.82773646187863e-05, + "loss": 0.007, + "step": 621680 + }, + { + "epoch": 1.61, + "learning_rate": 5.8273476402414834e-05, + "loss": 0.0078, + "step": 621690 + }, + { + "epoch": 1.61, + "learning_rate": 5.826958818604337e-05, + "loss": 0.0097, + "step": 621700 + }, + { + "epoch": 1.61, + "learning_rate": 5.8265699969671904e-05, + "loss": 0.0073, + "step": 621710 + }, + { + "epoch": 1.61, + "learning_rate": 5.826181175330044e-05, + "loss": 0.0082, + "step": 621720 + }, + { + "epoch": 1.61, + "learning_rate": 5.8257923536928974e-05, + "loss": 0.0089, + "step": 621730 + }, + { + "epoch": 1.61, + "learning_rate": 5.8254035320557516e-05, + "loss": 0.0079, + "step": 621740 + }, + { + "epoch": 1.61, + "learning_rate": 5.825014710418605e-05, + "loss": 0.0114, + "step": 621750 + }, + { + "epoch": 1.61, + "learning_rate": 5.8246258887814585e-05, + "loss": 0.008, + "step": 621760 + }, + { + "epoch": 1.61, + "learning_rate": 5.824237067144312e-05, + "loss": 0.0098, + "step": 621770 + }, + { + "epoch": 1.61, + "learning_rate": 5.8238482455071655e-05, + "loss": 0.0062, + "step": 621780 + }, + { + "epoch": 1.61, + "learning_rate": 5.823459423870019e-05, + "loss": 0.0113, + "step": 621790 + }, + { + "epoch": 1.61, + "learning_rate": 5.8230706022328725e-05, + "loss": 0.0068, + "step": 621800 + }, + { + "epoch": 1.61, + "learning_rate": 5.822681780595726e-05, + "loss": 0.0098, + "step": 621810 + }, + { + "epoch": 1.61, + "learning_rate": 5.82229295895858e-05, + "loss": 0.0122, + "step": 621820 + }, + { + "epoch": 1.61, + "learning_rate": 5.8219041373214336e-05, + "loss": 0.0097, + "step": 621830 + }, + { + "epoch": 1.61, + "learning_rate": 5.821515315684287e-05, + "loss": 0.0074, + "step": 621840 + }, + { + "epoch": 1.61, + "learning_rate": 5.8211264940471406e-05, + "loss": 0.0069, + "step": 621850 + }, + { + "epoch": 1.61, + "learning_rate": 5.820737672409994e-05, + "loss": 0.007, + "step": 621860 + }, + { + "epoch": 1.61, + "learning_rate": 5.8203488507728476e-05, + "loss": 0.008, + "step": 621870 + }, + { + "epoch": 1.61, + "learning_rate": 5.8199600291357004e-05, + "loss": 0.0098, + "step": 621880 + }, + { + "epoch": 1.61, + "learning_rate": 5.819571207498554e-05, + "loss": 0.0065, + "step": 621890 + }, + { + "epoch": 1.61, + "learning_rate": 5.819182385861407e-05, + "loss": 0.0085, + "step": 621900 + }, + { + "epoch": 1.61, + "learning_rate": 5.818793564224261e-05, + "loss": 0.0075, + "step": 621910 + }, + { + "epoch": 1.61, + "learning_rate": 5.818404742587115e-05, + "loss": 0.0083, + "step": 621920 + }, + { + "epoch": 1.61, + "learning_rate": 5.8180159209499685e-05, + "loss": 0.0083, + "step": 621930 + }, + { + "epoch": 1.61, + "learning_rate": 5.817627099312822e-05, + "loss": 0.0085, + "step": 621940 + }, + { + "epoch": 1.61, + "learning_rate": 5.8172382776756754e-05, + "loss": 0.0088, + "step": 621950 + }, + { + "epoch": 1.61, + "learning_rate": 5.816849456038529e-05, + "loss": 0.0122, + "step": 621960 + }, + { + "epoch": 1.61, + "learning_rate": 5.8164606344013824e-05, + "loss": 0.006, + "step": 621970 + }, + { + "epoch": 1.61, + "learning_rate": 5.816071812764236e-05, + "loss": 0.0066, + "step": 621980 + }, + { + "epoch": 1.61, + "learning_rate": 5.8156829911270894e-05, + "loss": 0.0066, + "step": 621990 + }, + { + "epoch": 1.61, + "learning_rate": 5.8152941694899436e-05, + "loss": 0.0106, + "step": 622000 + }, + { + "epoch": 1.61, + "eval_cer": 0.881688689953826, + "eval_loss": 0.005423935130238533, + "eval_runtime": 108.0541, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 622000 + }, + { + "epoch": 1.61, + "learning_rate": 5.814905347852797e-05, + "loss": 0.0078, + "step": 622010 + }, + { + "epoch": 1.61, + "learning_rate": 5.8145165262156505e-05, + "loss": 0.0088, + "step": 622020 + }, + { + "epoch": 1.61, + "learning_rate": 5.814127704578504e-05, + "loss": 0.0119, + "step": 622030 + }, + { + "epoch": 1.61, + "learning_rate": 5.8137388829413575e-05, + "loss": 0.0068, + "step": 622040 + }, + { + "epoch": 1.61, + "learning_rate": 5.813350061304211e-05, + "loss": 0.0105, + "step": 622050 + }, + { + "epoch": 1.61, + "learning_rate": 5.8129612396670645e-05, + "loss": 0.0076, + "step": 622060 + }, + { + "epoch": 1.61, + "learning_rate": 5.812572418029918e-05, + "loss": 0.0064, + "step": 622070 + }, + { + "epoch": 1.61, + "learning_rate": 5.812183596392772e-05, + "loss": 0.0074, + "step": 622080 + }, + { + "epoch": 1.61, + "learning_rate": 5.8117947747556256e-05, + "loss": 0.0076, + "step": 622090 + }, + { + "epoch": 1.61, + "learning_rate": 5.811405953118479e-05, + "loss": 0.008, + "step": 622100 + }, + { + "epoch": 1.61, + "learning_rate": 5.8110171314813326e-05, + "loss": 0.0067, + "step": 622110 + }, + { + "epoch": 1.61, + "learning_rate": 5.810628309844186e-05, + "loss": 0.008, + "step": 622120 + }, + { + "epoch": 1.61, + "learning_rate": 5.810239488207039e-05, + "loss": 0.0111, + "step": 622130 + }, + { + "epoch": 1.61, + "learning_rate": 5.8098506665698924e-05, + "loss": 0.0098, + "step": 622140 + }, + { + "epoch": 1.61, + "learning_rate": 5.809461844932746e-05, + "loss": 0.0081, + "step": 622150 + }, + { + "epoch": 1.61, + "learning_rate": 5.809073023295599e-05, + "loss": 0.0096, + "step": 622160 + }, + { + "epoch": 1.61, + "learning_rate": 5.808684201658453e-05, + "loss": 0.0102, + "step": 622170 + }, + { + "epoch": 1.61, + "learning_rate": 5.808295380021307e-05, + "loss": 0.0111, + "step": 622180 + }, + { + "epoch": 1.61, + "learning_rate": 5.8079065583841605e-05, + "loss": 0.0095, + "step": 622190 + }, + { + "epoch": 1.61, + "learning_rate": 5.807517736747014e-05, + "loss": 0.0067, + "step": 622200 + }, + { + "epoch": 1.61, + "learning_rate": 5.8071289151098674e-05, + "loss": 0.0108, + "step": 622210 + }, + { + "epoch": 1.61, + "learning_rate": 5.806740093472721e-05, + "loss": 0.0091, + "step": 622220 + }, + { + "epoch": 1.61, + "learning_rate": 5.8063512718355744e-05, + "loss": 0.0111, + "step": 622230 + }, + { + "epoch": 1.61, + "learning_rate": 5.805962450198428e-05, + "loss": 0.007, + "step": 622240 + }, + { + "epoch": 1.61, + "learning_rate": 5.8055736285612814e-05, + "loss": 0.007, + "step": 622250 + }, + { + "epoch": 1.61, + "learning_rate": 5.8051848069241355e-05, + "loss": 0.0073, + "step": 622260 + }, + { + "epoch": 1.61, + "learning_rate": 5.804795985286989e-05, + "loss": 0.0107, + "step": 622270 + }, + { + "epoch": 1.61, + "learning_rate": 5.8044071636498425e-05, + "loss": 0.0088, + "step": 622280 + }, + { + "epoch": 1.61, + "learning_rate": 5.804018342012696e-05, + "loss": 0.0092, + "step": 622290 + }, + { + "epoch": 1.61, + "learning_rate": 5.8036295203755495e-05, + "loss": 0.0081, + "step": 622300 + }, + { + "epoch": 1.61, + "learning_rate": 5.803240698738403e-05, + "loss": 0.0098, + "step": 622310 + }, + { + "epoch": 1.61, + "learning_rate": 5.8028518771012565e-05, + "loss": 0.0094, + "step": 622320 + }, + { + "epoch": 1.61, + "learning_rate": 5.80246305546411e-05, + "loss": 0.008, + "step": 622330 + }, + { + "epoch": 1.61, + "learning_rate": 5.802074233826964e-05, + "loss": 0.008, + "step": 622340 + }, + { + "epoch": 1.61, + "learning_rate": 5.8016854121898176e-05, + "loss": 0.0089, + "step": 622350 + }, + { + "epoch": 1.61, + "learning_rate": 5.801296590552671e-05, + "loss": 0.0118, + "step": 622360 + }, + { + "epoch": 1.61, + "learning_rate": 5.8009077689155246e-05, + "loss": 0.0084, + "step": 622370 + }, + { + "epoch": 1.61, + "learning_rate": 5.8005189472783774e-05, + "loss": 0.0078, + "step": 622380 + }, + { + "epoch": 1.61, + "learning_rate": 5.800130125641231e-05, + "loss": 0.0075, + "step": 622390 + }, + { + "epoch": 1.61, + "learning_rate": 5.7997413040040844e-05, + "loss": 0.0072, + "step": 622400 + }, + { + "epoch": 1.61, + "learning_rate": 5.799352482366938e-05, + "loss": 0.0077, + "step": 622410 + }, + { + "epoch": 1.61, + "learning_rate": 5.798963660729791e-05, + "loss": 0.0105, + "step": 622420 + }, + { + "epoch": 1.61, + "learning_rate": 5.798574839092645e-05, + "loss": 0.0069, + "step": 622430 + }, + { + "epoch": 1.61, + "learning_rate": 5.798186017455499e-05, + "loss": 0.0078, + "step": 622440 + }, + { + "epoch": 1.61, + "learning_rate": 5.7977971958183525e-05, + "loss": 0.0107, + "step": 622450 + }, + { + "epoch": 1.61, + "learning_rate": 5.797408374181206e-05, + "loss": 0.0093, + "step": 622460 + }, + { + "epoch": 1.61, + "learning_rate": 5.7970195525440594e-05, + "loss": 0.0062, + "step": 622470 + }, + { + "epoch": 1.61, + "learning_rate": 5.796630730906913e-05, + "loss": 0.0117, + "step": 622480 + }, + { + "epoch": 1.61, + "learning_rate": 5.7962419092697664e-05, + "loss": 0.0114, + "step": 622490 + }, + { + "epoch": 1.61, + "learning_rate": 5.79585308763262e-05, + "loss": 0.0085, + "step": 622500 + }, + { + "epoch": 1.61, + "learning_rate": 5.7954642659954734e-05, + "loss": 0.0102, + "step": 622510 + }, + { + "epoch": 1.61, + "learning_rate": 5.7950754443583275e-05, + "loss": 0.0084, + "step": 622520 + }, + { + "epoch": 1.61, + "learning_rate": 5.794686622721181e-05, + "loss": 0.0068, + "step": 622530 + }, + { + "epoch": 1.61, + "learning_rate": 5.7942978010840345e-05, + "loss": 0.0067, + "step": 622540 + }, + { + "epoch": 1.61, + "learning_rate": 5.793908979446888e-05, + "loss": 0.0083, + "step": 622550 + }, + { + "epoch": 1.61, + "learning_rate": 5.7935201578097415e-05, + "loss": 0.0086, + "step": 622560 + }, + { + "epoch": 1.61, + "learning_rate": 5.793131336172595e-05, + "loss": 0.0076, + "step": 622570 + }, + { + "epoch": 1.61, + "learning_rate": 5.7927425145354485e-05, + "loss": 0.0134, + "step": 622580 + }, + { + "epoch": 1.61, + "learning_rate": 5.792353692898302e-05, + "loss": 0.0087, + "step": 622590 + }, + { + "epoch": 1.61, + "learning_rate": 5.791964871261156e-05, + "loss": 0.0081, + "step": 622600 + }, + { + "epoch": 1.61, + "learning_rate": 5.7915760496240096e-05, + "loss": 0.0081, + "step": 622610 + }, + { + "epoch": 1.61, + "learning_rate": 5.791187227986863e-05, + "loss": 0.0095, + "step": 622620 + }, + { + "epoch": 1.61, + "learning_rate": 5.790798406349716e-05, + "loss": 0.0106, + "step": 622630 + }, + { + "epoch": 1.61, + "learning_rate": 5.7904095847125694e-05, + "loss": 0.0081, + "step": 622640 + }, + { + "epoch": 1.61, + "learning_rate": 5.790020763075423e-05, + "loss": 0.0103, + "step": 622650 + }, + { + "epoch": 1.61, + "learning_rate": 5.7896319414382763e-05, + "loss": 0.0089, + "step": 622660 + }, + { + "epoch": 1.61, + "learning_rate": 5.78924311980113e-05, + "loss": 0.0093, + "step": 622670 + }, + { + "epoch": 1.61, + "learning_rate": 5.788854298163983e-05, + "loss": 0.0089, + "step": 622680 + }, + { + "epoch": 1.61, + "learning_rate": 5.788465476526837e-05, + "loss": 0.0077, + "step": 622690 + }, + { + "epoch": 1.61, + "learning_rate": 5.788076654889691e-05, + "loss": 0.009, + "step": 622700 + }, + { + "epoch": 1.61, + "learning_rate": 5.7876878332525445e-05, + "loss": 0.0092, + "step": 622710 + }, + { + "epoch": 1.61, + "learning_rate": 5.787299011615398e-05, + "loss": 0.0102, + "step": 622720 + }, + { + "epoch": 1.61, + "learning_rate": 5.7869101899782514e-05, + "loss": 0.008, + "step": 622730 + }, + { + "epoch": 1.61, + "learning_rate": 5.786521368341105e-05, + "loss": 0.0103, + "step": 622740 + }, + { + "epoch": 1.61, + "learning_rate": 5.7861325467039584e-05, + "loss": 0.0077, + "step": 622750 + }, + { + "epoch": 1.61, + "learning_rate": 5.785743725066812e-05, + "loss": 0.0078, + "step": 622760 + }, + { + "epoch": 1.61, + "learning_rate": 5.7853549034296654e-05, + "loss": 0.0061, + "step": 622770 + }, + { + "epoch": 1.61, + "learning_rate": 5.784966081792519e-05, + "loss": 0.009, + "step": 622780 + }, + { + "epoch": 1.61, + "learning_rate": 5.784577260155373e-05, + "loss": 0.0089, + "step": 622790 + }, + { + "epoch": 1.61, + "learning_rate": 5.7841884385182265e-05, + "loss": 0.0091, + "step": 622800 + }, + { + "epoch": 1.61, + "learning_rate": 5.78379961688108e-05, + "loss": 0.0089, + "step": 622810 + }, + { + "epoch": 1.61, + "learning_rate": 5.7834107952439335e-05, + "loss": 0.0089, + "step": 622820 + }, + { + "epoch": 1.61, + "learning_rate": 5.783021973606787e-05, + "loss": 0.0081, + "step": 622830 + }, + { + "epoch": 1.61, + "learning_rate": 5.7826331519696405e-05, + "loss": 0.0074, + "step": 622840 + }, + { + "epoch": 1.61, + "learning_rate": 5.782244330332494e-05, + "loss": 0.0061, + "step": 622850 + }, + { + "epoch": 1.61, + "learning_rate": 5.7818555086953474e-05, + "loss": 0.0078, + "step": 622860 + }, + { + "epoch": 1.61, + "learning_rate": 5.7814666870582016e-05, + "loss": 0.0088, + "step": 622870 + }, + { + "epoch": 1.61, + "learning_rate": 5.781077865421054e-05, + "loss": 0.0097, + "step": 622880 + }, + { + "epoch": 1.61, + "learning_rate": 5.780689043783908e-05, + "loss": 0.0079, + "step": 622890 + }, + { + "epoch": 1.61, + "learning_rate": 5.7803002221467614e-05, + "loss": 0.0072, + "step": 622900 + }, + { + "epoch": 1.61, + "learning_rate": 5.779911400509615e-05, + "loss": 0.0087, + "step": 622910 + }, + { + "epoch": 1.61, + "learning_rate": 5.7795225788724683e-05, + "loss": 0.0079, + "step": 622920 + }, + { + "epoch": 1.61, + "learning_rate": 5.779133757235322e-05, + "loss": 0.0117, + "step": 622930 + }, + { + "epoch": 1.61, + "learning_rate": 5.778744935598175e-05, + "loss": 0.0119, + "step": 622940 + }, + { + "epoch": 1.61, + "learning_rate": 5.778356113961029e-05, + "loss": 0.008, + "step": 622950 + }, + { + "epoch": 1.61, + "learning_rate": 5.777967292323882e-05, + "loss": 0.0098, + "step": 622960 + }, + { + "epoch": 1.61, + "learning_rate": 5.7775784706867365e-05, + "loss": 0.0075, + "step": 622970 + }, + { + "epoch": 1.61, + "learning_rate": 5.77718964904959e-05, + "loss": 0.0073, + "step": 622980 + }, + { + "epoch": 1.61, + "learning_rate": 5.7768008274124434e-05, + "loss": 0.0078, + "step": 622990 + }, + { + "epoch": 1.61, + "learning_rate": 5.776412005775297e-05, + "loss": 0.0109, + "step": 623000 + }, + { + "epoch": 1.61, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.005499746184796095, + "eval_runtime": 107.9534, + "eval_samples_per_second": 18.527, + "eval_steps_per_second": 4.632, + "step": 623000 + }, + { + "epoch": 1.61, + "learning_rate": 5.7760231841381504e-05, + "loss": 0.0086, + "step": 623010 + }, + { + "epoch": 1.61, + "learning_rate": 5.775634362501004e-05, + "loss": 0.0082, + "step": 623020 + }, + { + "epoch": 1.61, + "learning_rate": 5.7752455408638574e-05, + "loss": 0.0082, + "step": 623030 + }, + { + "epoch": 1.62, + "learning_rate": 5.774856719226711e-05, + "loss": 0.0071, + "step": 623040 + }, + { + "epoch": 1.62, + "learning_rate": 5.774467897589565e-05, + "loss": 0.0083, + "step": 623050 + }, + { + "epoch": 1.62, + "learning_rate": 5.7740790759524185e-05, + "loss": 0.0066, + "step": 623060 + }, + { + "epoch": 1.62, + "learning_rate": 5.773690254315272e-05, + "loss": 0.0068, + "step": 623070 + }, + { + "epoch": 1.62, + "learning_rate": 5.7733014326781255e-05, + "loss": 0.009, + "step": 623080 + }, + { + "epoch": 1.62, + "learning_rate": 5.772912611040979e-05, + "loss": 0.014, + "step": 623090 + }, + { + "epoch": 1.62, + "learning_rate": 5.7725237894038324e-05, + "loss": 0.0103, + "step": 623100 + }, + { + "epoch": 1.62, + "learning_rate": 5.772134967766686e-05, + "loss": 0.0091, + "step": 623110 + }, + { + "epoch": 1.62, + "learning_rate": 5.771746146129539e-05, + "loss": 0.0086, + "step": 623120 + }, + { + "epoch": 1.62, + "learning_rate": 5.771357324492392e-05, + "loss": 0.0074, + "step": 623130 + }, + { + "epoch": 1.62, + "learning_rate": 5.770968502855246e-05, + "loss": 0.0116, + "step": 623140 + }, + { + "epoch": 1.62, + "learning_rate": 5.7705796812181e-05, + "loss": 0.009, + "step": 623150 + }, + { + "epoch": 1.62, + "learning_rate": 5.7701908595809534e-05, + "loss": 0.0077, + "step": 623160 + }, + { + "epoch": 1.62, + "learning_rate": 5.769802037943807e-05, + "loss": 0.0091, + "step": 623170 + }, + { + "epoch": 1.62, + "learning_rate": 5.76941321630666e-05, + "loss": 0.0083, + "step": 623180 + }, + { + "epoch": 1.62, + "learning_rate": 5.769024394669514e-05, + "loss": 0.0073, + "step": 623190 + }, + { + "epoch": 1.62, + "learning_rate": 5.768635573032367e-05, + "loss": 0.008, + "step": 623200 + }, + { + "epoch": 1.62, + "learning_rate": 5.768246751395221e-05, + "loss": 0.0081, + "step": 623210 + }, + { + "epoch": 1.62, + "learning_rate": 5.767857929758074e-05, + "loss": 0.0084, + "step": 623220 + }, + { + "epoch": 1.62, + "learning_rate": 5.7674691081209284e-05, + "loss": 0.0079, + "step": 623230 + }, + { + "epoch": 1.62, + "learning_rate": 5.767080286483782e-05, + "loss": 0.008, + "step": 623240 + }, + { + "epoch": 1.62, + "learning_rate": 5.7666914648466354e-05, + "loss": 0.0077, + "step": 623250 + }, + { + "epoch": 1.62, + "learning_rate": 5.766302643209489e-05, + "loss": 0.0094, + "step": 623260 + }, + { + "epoch": 1.62, + "learning_rate": 5.7659138215723424e-05, + "loss": 0.0063, + "step": 623270 + }, + { + "epoch": 1.62, + "learning_rate": 5.765524999935196e-05, + "loss": 0.0072, + "step": 623280 + }, + { + "epoch": 1.62, + "learning_rate": 5.7651361782980494e-05, + "loss": 0.0103, + "step": 623290 + }, + { + "epoch": 1.62, + "learning_rate": 5.764747356660903e-05, + "loss": 0.0076, + "step": 623300 + }, + { + "epoch": 1.62, + "learning_rate": 5.764358535023757e-05, + "loss": 0.007, + "step": 623310 + }, + { + "epoch": 1.62, + "learning_rate": 5.7639697133866105e-05, + "loss": 0.0072, + "step": 623320 + }, + { + "epoch": 1.62, + "learning_rate": 5.763580891749464e-05, + "loss": 0.0093, + "step": 623330 + }, + { + "epoch": 1.62, + "learning_rate": 5.7631920701123175e-05, + "loss": 0.0074, + "step": 623340 + }, + { + "epoch": 1.62, + "learning_rate": 5.762803248475171e-05, + "loss": 0.0091, + "step": 623350 + }, + { + "epoch": 1.62, + "learning_rate": 5.7624144268380244e-05, + "loss": 0.0105, + "step": 623360 + }, + { + "epoch": 1.62, + "learning_rate": 5.762025605200877e-05, + "loss": 0.0089, + "step": 623370 + }, + { + "epoch": 1.62, + "learning_rate": 5.761636783563731e-05, + "loss": 0.0077, + "step": 623380 + }, + { + "epoch": 1.62, + "learning_rate": 5.761247961926584e-05, + "loss": 0.0088, + "step": 623390 + }, + { + "epoch": 1.62, + "learning_rate": 5.760859140289438e-05, + "loss": 0.0073, + "step": 623400 + }, + { + "epoch": 1.62, + "learning_rate": 5.760470318652292e-05, + "loss": 0.0065, + "step": 623410 + }, + { + "epoch": 1.62, + "learning_rate": 5.7600814970151454e-05, + "loss": 0.0081, + "step": 623420 + }, + { + "epoch": 1.62, + "learning_rate": 5.759692675377999e-05, + "loss": 0.0087, + "step": 623430 + }, + { + "epoch": 1.62, + "learning_rate": 5.759303853740852e-05, + "loss": 0.0083, + "step": 623440 + }, + { + "epoch": 1.62, + "learning_rate": 5.758915032103706e-05, + "loss": 0.0062, + "step": 623450 + }, + { + "epoch": 1.62, + "learning_rate": 5.758526210466559e-05, + "loss": 0.0067, + "step": 623460 + }, + { + "epoch": 1.62, + "learning_rate": 5.758137388829413e-05, + "loss": 0.0103, + "step": 623470 + }, + { + "epoch": 1.62, + "learning_rate": 5.757748567192266e-05, + "loss": 0.0081, + "step": 623480 + }, + { + "epoch": 1.62, + "learning_rate": 5.7573597455551204e-05, + "loss": 0.0085, + "step": 623490 + }, + { + "epoch": 1.62, + "learning_rate": 5.756970923917974e-05, + "loss": 0.0081, + "step": 623500 + }, + { + "epoch": 1.62, + "learning_rate": 5.7565821022808274e-05, + "loss": 0.0087, + "step": 623510 + }, + { + "epoch": 1.62, + "learning_rate": 5.756193280643681e-05, + "loss": 0.0072, + "step": 623520 + }, + { + "epoch": 1.62, + "learning_rate": 5.7558044590065344e-05, + "loss": 0.0079, + "step": 623530 + }, + { + "epoch": 1.62, + "learning_rate": 5.755415637369388e-05, + "loss": 0.01, + "step": 623540 + }, + { + "epoch": 1.62, + "learning_rate": 5.7550268157322414e-05, + "loss": 0.0073, + "step": 623550 + }, + { + "epoch": 1.62, + "learning_rate": 5.754637994095095e-05, + "loss": 0.0109, + "step": 623560 + }, + { + "epoch": 1.62, + "learning_rate": 5.754249172457949e-05, + "loss": 0.0079, + "step": 623570 + }, + { + "epoch": 1.62, + "learning_rate": 5.7538603508208025e-05, + "loss": 0.0076, + "step": 623580 + }, + { + "epoch": 1.62, + "learning_rate": 5.753471529183656e-05, + "loss": 0.0074, + "step": 623590 + }, + { + "epoch": 1.62, + "learning_rate": 5.7530827075465095e-05, + "loss": 0.0081, + "step": 623600 + }, + { + "epoch": 1.62, + "learning_rate": 5.752693885909363e-05, + "loss": 0.0077, + "step": 623610 + }, + { + "epoch": 1.62, + "learning_rate": 5.752305064272216e-05, + "loss": 0.0074, + "step": 623620 + }, + { + "epoch": 1.62, + "learning_rate": 5.751916242635069e-05, + "loss": 0.0095, + "step": 623630 + }, + { + "epoch": 1.62, + "learning_rate": 5.751527420997923e-05, + "loss": 0.0078, + "step": 623640 + }, + { + "epoch": 1.62, + "learning_rate": 5.751138599360776e-05, + "loss": 0.0088, + "step": 623650 + }, + { + "epoch": 1.62, + "learning_rate": 5.75074977772363e-05, + "loss": 0.0084, + "step": 623660 + }, + { + "epoch": 1.62, + "learning_rate": 5.750360956086484e-05, + "loss": 0.0079, + "step": 623670 + }, + { + "epoch": 1.62, + "learning_rate": 5.7499721344493374e-05, + "loss": 0.0081, + "step": 623680 + }, + { + "epoch": 1.62, + "learning_rate": 5.749583312812191e-05, + "loss": 0.0074, + "step": 623690 + }, + { + "epoch": 1.62, + "learning_rate": 5.749194491175044e-05, + "loss": 0.0081, + "step": 623700 + }, + { + "epoch": 1.62, + "learning_rate": 5.748805669537898e-05, + "loss": 0.0131, + "step": 623710 + }, + { + "epoch": 1.62, + "learning_rate": 5.748416847900751e-05, + "loss": 0.0096, + "step": 623720 + }, + { + "epoch": 1.62, + "learning_rate": 5.748028026263605e-05, + "loss": 0.0059, + "step": 623730 + }, + { + "epoch": 1.62, + "learning_rate": 5.747639204626458e-05, + "loss": 0.0076, + "step": 623740 + }, + { + "epoch": 1.62, + "learning_rate": 5.7472503829893124e-05, + "loss": 0.0079, + "step": 623750 + }, + { + "epoch": 1.62, + "learning_rate": 5.746861561352166e-05, + "loss": 0.0092, + "step": 623760 + }, + { + "epoch": 1.62, + "learning_rate": 5.7464727397150194e-05, + "loss": 0.0093, + "step": 623770 + }, + { + "epoch": 1.62, + "learning_rate": 5.746083918077873e-05, + "loss": 0.0097, + "step": 623780 + }, + { + "epoch": 1.62, + "learning_rate": 5.7456950964407264e-05, + "loss": 0.0114, + "step": 623790 + }, + { + "epoch": 1.62, + "learning_rate": 5.74530627480358e-05, + "loss": 0.0065, + "step": 623800 + }, + { + "epoch": 1.62, + "learning_rate": 5.7449174531664334e-05, + "loss": 0.0091, + "step": 623810 + }, + { + "epoch": 1.62, + "learning_rate": 5.744528631529287e-05, + "loss": 0.0065, + "step": 623820 + }, + { + "epoch": 1.62, + "learning_rate": 5.744139809892141e-05, + "loss": 0.0074, + "step": 623830 + }, + { + "epoch": 1.62, + "learning_rate": 5.7437509882549945e-05, + "loss": 0.0114, + "step": 623840 + }, + { + "epoch": 1.62, + "learning_rate": 5.743362166617848e-05, + "loss": 0.0092, + "step": 623850 + }, + { + "epoch": 1.62, + "learning_rate": 5.7429733449807015e-05, + "loss": 0.0086, + "step": 623860 + }, + { + "epoch": 1.62, + "learning_rate": 5.742584523343554e-05, + "loss": 0.0078, + "step": 623870 + }, + { + "epoch": 1.62, + "learning_rate": 5.742195701706408e-05, + "loss": 0.0085, + "step": 623880 + }, + { + "epoch": 1.62, + "learning_rate": 5.741806880069261e-05, + "loss": 0.0085, + "step": 623890 + }, + { + "epoch": 1.62, + "learning_rate": 5.741418058432115e-05, + "loss": 0.0086, + "step": 623900 + }, + { + "epoch": 1.62, + "learning_rate": 5.741029236794968e-05, + "loss": 0.0097, + "step": 623910 + }, + { + "epoch": 1.62, + "learning_rate": 5.740640415157822e-05, + "loss": 0.0068, + "step": 623920 + }, + { + "epoch": 1.62, + "learning_rate": 5.740251593520676e-05, + "loss": 0.01, + "step": 623930 + }, + { + "epoch": 1.62, + "learning_rate": 5.7398627718835294e-05, + "loss": 0.0072, + "step": 623940 + }, + { + "epoch": 1.62, + "learning_rate": 5.739473950246383e-05, + "loss": 0.0094, + "step": 623950 + }, + { + "epoch": 1.62, + "learning_rate": 5.739085128609236e-05, + "loss": 0.0081, + "step": 623960 + }, + { + "epoch": 1.62, + "learning_rate": 5.73869630697209e-05, + "loss": 0.0083, + "step": 623970 + }, + { + "epoch": 1.62, + "learning_rate": 5.738307485334943e-05, + "loss": 0.0067, + "step": 623980 + }, + { + "epoch": 1.62, + "learning_rate": 5.737918663697797e-05, + "loss": 0.0101, + "step": 623990 + }, + { + "epoch": 1.62, + "learning_rate": 5.73752984206065e-05, + "loss": 0.0086, + "step": 624000 + }, + { + "epoch": 1.62, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.005575355142354965, + "eval_runtime": 107.7874, + "eval_samples_per_second": 18.555, + "eval_steps_per_second": 4.639, + "step": 624000 + }, + { + "epoch": 1.62, + "learning_rate": 5.7371410204235044e-05, + "loss": 0.009, + "step": 624010 + }, + { + "epoch": 1.62, + "learning_rate": 5.736752198786358e-05, + "loss": 0.0066, + "step": 624020 + }, + { + "epoch": 1.62, + "learning_rate": 5.7363633771492114e-05, + "loss": 0.007, + "step": 624030 + }, + { + "epoch": 1.62, + "learning_rate": 5.735974555512065e-05, + "loss": 0.0092, + "step": 624040 + }, + { + "epoch": 1.62, + "learning_rate": 5.7355857338749184e-05, + "loss": 0.0092, + "step": 624050 + }, + { + "epoch": 1.62, + "learning_rate": 5.735196912237772e-05, + "loss": 0.0084, + "step": 624060 + }, + { + "epoch": 1.62, + "learning_rate": 5.7348080906006253e-05, + "loss": 0.01, + "step": 624070 + }, + { + "epoch": 1.62, + "learning_rate": 5.734419268963479e-05, + "loss": 0.0102, + "step": 624080 + }, + { + "epoch": 1.62, + "learning_rate": 5.734030447326332e-05, + "loss": 0.0083, + "step": 624090 + }, + { + "epoch": 1.62, + "learning_rate": 5.7336416256891865e-05, + "loss": 0.008, + "step": 624100 + }, + { + "epoch": 1.62, + "learning_rate": 5.73325280405204e-05, + "loss": 0.0078, + "step": 624110 + }, + { + "epoch": 1.62, + "learning_rate": 5.732863982414893e-05, + "loss": 0.0085, + "step": 624120 + }, + { + "epoch": 1.62, + "learning_rate": 5.732475160777746e-05, + "loss": 0.0147, + "step": 624130 + }, + { + "epoch": 1.62, + "learning_rate": 5.7320863391406e-05, + "loss": 0.0068, + "step": 624140 + }, + { + "epoch": 1.62, + "learning_rate": 5.731697517503453e-05, + "loss": 0.0066, + "step": 624150 + }, + { + "epoch": 1.62, + "learning_rate": 5.731308695866307e-05, + "loss": 0.0069, + "step": 624160 + }, + { + "epoch": 1.62, + "learning_rate": 5.73091987422916e-05, + "loss": 0.0062, + "step": 624170 + }, + { + "epoch": 1.62, + "learning_rate": 5.730531052592014e-05, + "loss": 0.0082, + "step": 624180 + }, + { + "epoch": 1.62, + "learning_rate": 5.730142230954867e-05, + "loss": 0.0081, + "step": 624190 + }, + { + "epoch": 1.62, + "learning_rate": 5.7297534093177213e-05, + "loss": 0.0077, + "step": 624200 + }, + { + "epoch": 1.62, + "learning_rate": 5.729364587680575e-05, + "loss": 0.0093, + "step": 624210 + }, + { + "epoch": 1.62, + "learning_rate": 5.728975766043428e-05, + "loss": 0.0082, + "step": 624220 + }, + { + "epoch": 1.62, + "learning_rate": 5.728586944406282e-05, + "loss": 0.0086, + "step": 624230 + }, + { + "epoch": 1.62, + "learning_rate": 5.728198122769135e-05, + "loss": 0.007, + "step": 624240 + }, + { + "epoch": 1.62, + "learning_rate": 5.727809301131989e-05, + "loss": 0.0077, + "step": 624250 + }, + { + "epoch": 1.62, + "learning_rate": 5.727420479494842e-05, + "loss": 0.0093, + "step": 624260 + }, + { + "epoch": 1.62, + "learning_rate": 5.727031657857696e-05, + "loss": 0.0084, + "step": 624270 + }, + { + "epoch": 1.62, + "learning_rate": 5.72664283622055e-05, + "loss": 0.0063, + "step": 624280 + }, + { + "epoch": 1.62, + "learning_rate": 5.7262540145834034e-05, + "loss": 0.0108, + "step": 624290 + }, + { + "epoch": 1.62, + "learning_rate": 5.725865192946257e-05, + "loss": 0.0064, + "step": 624300 + }, + { + "epoch": 1.62, + "learning_rate": 5.7254763713091104e-05, + "loss": 0.0064, + "step": 624310 + }, + { + "epoch": 1.62, + "learning_rate": 5.725087549671964e-05, + "loss": 0.0088, + "step": 624320 + }, + { + "epoch": 1.62, + "learning_rate": 5.7246987280348173e-05, + "loss": 0.0121, + "step": 624330 + }, + { + "epoch": 1.62, + "learning_rate": 5.724309906397671e-05, + "loss": 0.0069, + "step": 624340 + }, + { + "epoch": 1.62, + "learning_rate": 5.723921084760524e-05, + "loss": 0.008, + "step": 624350 + }, + { + "epoch": 1.62, + "learning_rate": 5.7235322631233785e-05, + "loss": 0.0102, + "step": 624360 + }, + { + "epoch": 1.62, + "learning_rate": 5.7231434414862306e-05, + "loss": 0.0089, + "step": 624370 + }, + { + "epoch": 1.62, + "learning_rate": 5.722754619849085e-05, + "loss": 0.0068, + "step": 624380 + }, + { + "epoch": 1.62, + "learning_rate": 5.722365798211938e-05, + "loss": 0.0054, + "step": 624390 + }, + { + "epoch": 1.62, + "learning_rate": 5.721976976574792e-05, + "loss": 0.0098, + "step": 624400 + }, + { + "epoch": 1.62, + "learning_rate": 5.721588154937645e-05, + "loss": 0.008, + "step": 624410 + }, + { + "epoch": 1.62, + "learning_rate": 5.721199333300499e-05, + "loss": 0.0055, + "step": 624420 + }, + { + "epoch": 1.62, + "learning_rate": 5.720810511663352e-05, + "loss": 0.01, + "step": 624430 + }, + { + "epoch": 1.62, + "learning_rate": 5.720421690026206e-05, + "loss": 0.0097, + "step": 624440 + }, + { + "epoch": 1.62, + "learning_rate": 5.720032868389059e-05, + "loss": 0.0083, + "step": 624450 + }, + { + "epoch": 1.62, + "learning_rate": 5.7196440467519133e-05, + "loss": 0.0075, + "step": 624460 + }, + { + "epoch": 1.62, + "learning_rate": 5.719255225114767e-05, + "loss": 0.0081, + "step": 624470 + }, + { + "epoch": 1.62, + "learning_rate": 5.71886640347762e-05, + "loss": 0.0076, + "step": 624480 + }, + { + "epoch": 1.62, + "learning_rate": 5.718477581840474e-05, + "loss": 0.008, + "step": 624490 + }, + { + "epoch": 1.62, + "learning_rate": 5.718088760203327e-05, + "loss": 0.0094, + "step": 624500 + }, + { + "epoch": 1.62, + "learning_rate": 5.717699938566181e-05, + "loss": 0.0105, + "step": 624510 + }, + { + "epoch": 1.62, + "learning_rate": 5.717311116929034e-05, + "loss": 0.01, + "step": 624520 + }, + { + "epoch": 1.62, + "learning_rate": 5.716922295291888e-05, + "loss": 0.0138, + "step": 624530 + }, + { + "epoch": 1.62, + "learning_rate": 5.716533473654742e-05, + "loss": 0.0067, + "step": 624540 + }, + { + "epoch": 1.62, + "learning_rate": 5.7161446520175954e-05, + "loss": 0.0093, + "step": 624550 + }, + { + "epoch": 1.62, + "learning_rate": 5.715755830380449e-05, + "loss": 0.0064, + "step": 624560 + }, + { + "epoch": 1.62, + "learning_rate": 5.7153670087433024e-05, + "loss": 0.0076, + "step": 624570 + }, + { + "epoch": 1.62, + "learning_rate": 5.714978187106156e-05, + "loss": 0.0084, + "step": 624580 + }, + { + "epoch": 1.62, + "learning_rate": 5.714589365469009e-05, + "loss": 0.0071, + "step": 624590 + }, + { + "epoch": 1.62, + "learning_rate": 5.714200543831863e-05, + "loss": 0.0091, + "step": 624600 + }, + { + "epoch": 1.62, + "learning_rate": 5.7138117221947156e-05, + "loss": 0.0095, + "step": 624610 + }, + { + "epoch": 1.62, + "learning_rate": 5.713422900557569e-05, + "loss": 0.0089, + "step": 624620 + }, + { + "epoch": 1.62, + "learning_rate": 5.7130340789204226e-05, + "loss": 0.0162, + "step": 624630 + }, + { + "epoch": 1.62, + "learning_rate": 5.712645257283277e-05, + "loss": 0.0081, + "step": 624640 + }, + { + "epoch": 1.62, + "learning_rate": 5.71225643564613e-05, + "loss": 0.0082, + "step": 624650 + }, + { + "epoch": 1.62, + "learning_rate": 5.711867614008984e-05, + "loss": 0.0107, + "step": 624660 + }, + { + "epoch": 1.62, + "learning_rate": 5.711478792371837e-05, + "loss": 0.0083, + "step": 624670 + }, + { + "epoch": 1.62, + "learning_rate": 5.711089970734691e-05, + "loss": 0.0125, + "step": 624680 + }, + { + "epoch": 1.62, + "learning_rate": 5.710701149097544e-05, + "loss": 0.0063, + "step": 624690 + }, + { + "epoch": 1.62, + "learning_rate": 5.710312327460398e-05, + "loss": 0.0076, + "step": 624700 + }, + { + "epoch": 1.62, + "learning_rate": 5.709923505823251e-05, + "loss": 0.0071, + "step": 624710 + }, + { + "epoch": 1.62, + "learning_rate": 5.709534684186105e-05, + "loss": 0.0071, + "step": 624720 + }, + { + "epoch": 1.62, + "learning_rate": 5.709145862548959e-05, + "loss": 0.0085, + "step": 624730 + }, + { + "epoch": 1.62, + "learning_rate": 5.708757040911812e-05, + "loss": 0.0081, + "step": 624740 + }, + { + "epoch": 1.62, + "learning_rate": 5.708368219274666e-05, + "loss": 0.0096, + "step": 624750 + }, + { + "epoch": 1.62, + "learning_rate": 5.707979397637519e-05, + "loss": 0.0113, + "step": 624760 + }, + { + "epoch": 1.62, + "learning_rate": 5.707590576000373e-05, + "loss": 0.0063, + "step": 624770 + }, + { + "epoch": 1.62, + "learning_rate": 5.707201754363226e-05, + "loss": 0.009, + "step": 624780 + }, + { + "epoch": 1.62, + "learning_rate": 5.70681293272608e-05, + "loss": 0.0099, + "step": 624790 + }, + { + "epoch": 1.62, + "learning_rate": 5.706424111088934e-05, + "loss": 0.0077, + "step": 624800 + }, + { + "epoch": 1.62, + "learning_rate": 5.7060352894517874e-05, + "loss": 0.0074, + "step": 624810 + }, + { + "epoch": 1.62, + "learning_rate": 5.705646467814641e-05, + "loss": 0.0066, + "step": 624820 + }, + { + "epoch": 1.62, + "learning_rate": 5.7052576461774944e-05, + "loss": 0.0067, + "step": 624830 + }, + { + "epoch": 1.62, + "learning_rate": 5.704868824540348e-05, + "loss": 0.0087, + "step": 624840 + }, + { + "epoch": 1.62, + "learning_rate": 5.704480002903201e-05, + "loss": 0.0103, + "step": 624850 + }, + { + "epoch": 1.62, + "learning_rate": 5.704091181266054e-05, + "loss": 0.0077, + "step": 624860 + }, + { + "epoch": 1.62, + "learning_rate": 5.7037023596289076e-05, + "loss": 0.008, + "step": 624870 + }, + { + "epoch": 1.62, + "learning_rate": 5.703313537991761e-05, + "loss": 0.0111, + "step": 624880 + }, + { + "epoch": 1.62, + "learning_rate": 5.7029247163546146e-05, + "loss": 0.0079, + "step": 624890 + }, + { + "epoch": 1.62, + "learning_rate": 5.702535894717469e-05, + "loss": 0.0094, + "step": 624900 + }, + { + "epoch": 1.62, + "learning_rate": 5.702147073080322e-05, + "loss": 0.007, + "step": 624910 + }, + { + "epoch": 1.62, + "learning_rate": 5.701758251443176e-05, + "loss": 0.0106, + "step": 624920 + }, + { + "epoch": 1.62, + "learning_rate": 5.701369429806029e-05, + "loss": 0.0079, + "step": 624930 + }, + { + "epoch": 1.62, + "learning_rate": 5.700980608168883e-05, + "loss": 0.0099, + "step": 624940 + }, + { + "epoch": 1.62, + "learning_rate": 5.700591786531736e-05, + "loss": 0.0075, + "step": 624950 + }, + { + "epoch": 1.62, + "learning_rate": 5.70020296489459e-05, + "loss": 0.0094, + "step": 624960 + }, + { + "epoch": 1.62, + "learning_rate": 5.699814143257443e-05, + "loss": 0.0082, + "step": 624970 + }, + { + "epoch": 1.62, + "learning_rate": 5.699425321620297e-05, + "loss": 0.0117, + "step": 624980 + }, + { + "epoch": 1.62, + "learning_rate": 5.699036499983151e-05, + "loss": 0.0079, + "step": 624990 + }, + { + "epoch": 1.62, + "learning_rate": 5.698647678346004e-05, + "loss": 0.0066, + "step": 625000 + }, + { + "epoch": 1.62, + "eval_cer": 0.8816481004827348, + "eval_loss": 0.005520543083548546, + "eval_runtime": 107.9384, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 625000 + }, + { + "epoch": 1.62, + "learning_rate": 5.698258856708858e-05, + "loss": 0.0059, + "step": 625010 + }, + { + "epoch": 1.62, + "learning_rate": 5.697870035071711e-05, + "loss": 0.0106, + "step": 625020 + }, + { + "epoch": 1.62, + "learning_rate": 5.697481213434565e-05, + "loss": 0.0072, + "step": 625030 + }, + { + "epoch": 1.62, + "learning_rate": 5.697092391797418e-05, + "loss": 0.0103, + "step": 625040 + }, + { + "epoch": 1.62, + "learning_rate": 5.696703570160272e-05, + "loss": 0.0078, + "step": 625050 + }, + { + "epoch": 1.62, + "learning_rate": 5.696314748523126e-05, + "loss": 0.0076, + "step": 625060 + }, + { + "epoch": 1.62, + "learning_rate": 5.6959259268859794e-05, + "loss": 0.0113, + "step": 625070 + }, + { + "epoch": 1.62, + "learning_rate": 5.695537105248833e-05, + "loss": 0.0071, + "step": 625080 + }, + { + "epoch": 1.62, + "learning_rate": 5.6951482836116864e-05, + "loss": 0.0064, + "step": 625090 + }, + { + "epoch": 1.62, + "learning_rate": 5.69475946197454e-05, + "loss": 0.0098, + "step": 625100 + }, + { + "epoch": 1.62, + "learning_rate": 5.6943706403373927e-05, + "loss": 0.006, + "step": 625110 + }, + { + "epoch": 1.62, + "learning_rate": 5.693981818700246e-05, + "loss": 0.0066, + "step": 625120 + }, + { + "epoch": 1.62, + "learning_rate": 5.6935929970630996e-05, + "loss": 0.0082, + "step": 625130 + }, + { + "epoch": 1.62, + "learning_rate": 5.693204175425953e-05, + "loss": 0.0094, + "step": 625140 + }, + { + "epoch": 1.62, + "learning_rate": 5.6928153537888066e-05, + "loss": 0.0076, + "step": 625150 + }, + { + "epoch": 1.62, + "learning_rate": 5.692426532151661e-05, + "loss": 0.0084, + "step": 625160 + }, + { + "epoch": 1.62, + "learning_rate": 5.692037710514514e-05, + "loss": 0.0077, + "step": 625170 + }, + { + "epoch": 1.62, + "learning_rate": 5.691648888877368e-05, + "loss": 0.0073, + "step": 625180 + }, + { + "epoch": 1.62, + "learning_rate": 5.691260067240221e-05, + "loss": 0.0129, + "step": 625190 + }, + { + "epoch": 1.62, + "learning_rate": 5.690871245603075e-05, + "loss": 0.0085, + "step": 625200 + }, + { + "epoch": 1.62, + "learning_rate": 5.690482423965928e-05, + "loss": 0.0077, + "step": 625210 + }, + { + "epoch": 1.62, + "learning_rate": 5.690093602328782e-05, + "loss": 0.0081, + "step": 625220 + }, + { + "epoch": 1.62, + "learning_rate": 5.689704780691635e-05, + "loss": 0.0062, + "step": 625230 + }, + { + "epoch": 1.62, + "learning_rate": 5.689315959054489e-05, + "loss": 0.0093, + "step": 625240 + }, + { + "epoch": 1.62, + "learning_rate": 5.688927137417343e-05, + "loss": 0.0094, + "step": 625250 + }, + { + "epoch": 1.62, + "learning_rate": 5.688538315780196e-05, + "loss": 0.0081, + "step": 625260 + }, + { + "epoch": 1.62, + "learning_rate": 5.68814949414305e-05, + "loss": 0.011, + "step": 625270 + }, + { + "epoch": 1.62, + "learning_rate": 5.687760672505903e-05, + "loss": 0.0108, + "step": 625280 + }, + { + "epoch": 1.62, + "learning_rate": 5.687371850868757e-05, + "loss": 0.006, + "step": 625290 + }, + { + "epoch": 1.62, + "learning_rate": 5.68698302923161e-05, + "loss": 0.0094, + "step": 625300 + }, + { + "epoch": 1.62, + "learning_rate": 5.686594207594464e-05, + "loss": 0.0092, + "step": 625310 + }, + { + "epoch": 1.62, + "learning_rate": 5.686205385957318e-05, + "loss": 0.0076, + "step": 625320 + }, + { + "epoch": 1.62, + "learning_rate": 5.6858165643201714e-05, + "loss": 0.0075, + "step": 625330 + }, + { + "epoch": 1.62, + "learning_rate": 5.685427742683025e-05, + "loss": 0.0092, + "step": 625340 + }, + { + "epoch": 1.62, + "learning_rate": 5.6850389210458784e-05, + "loss": 0.0108, + "step": 625350 + }, + { + "epoch": 1.62, + "learning_rate": 5.684650099408731e-05, + "loss": 0.0077, + "step": 625360 + }, + { + "epoch": 1.62, + "learning_rate": 5.6842612777715846e-05, + "loss": 0.0066, + "step": 625370 + }, + { + "epoch": 1.62, + "learning_rate": 5.683872456134438e-05, + "loss": 0.008, + "step": 625380 + }, + { + "epoch": 1.62, + "learning_rate": 5.6834836344972916e-05, + "loss": 0.008, + "step": 625390 + }, + { + "epoch": 1.62, + "learning_rate": 5.683094812860145e-05, + "loss": 0.0083, + "step": 625400 + }, + { + "epoch": 1.62, + "learning_rate": 5.6827059912229986e-05, + "loss": 0.0083, + "step": 625410 + }, + { + "epoch": 1.62, + "learning_rate": 5.682317169585853e-05, + "loss": 0.0059, + "step": 625420 + }, + { + "epoch": 1.62, + "learning_rate": 5.681928347948706e-05, + "loss": 0.0104, + "step": 625430 + }, + { + "epoch": 1.62, + "learning_rate": 5.68153952631156e-05, + "loss": 0.0092, + "step": 625440 + }, + { + "epoch": 1.62, + "learning_rate": 5.681150704674413e-05, + "loss": 0.0083, + "step": 625450 + }, + { + "epoch": 1.62, + "learning_rate": 5.680761883037267e-05, + "loss": 0.0087, + "step": 625460 + }, + { + "epoch": 1.62, + "learning_rate": 5.68037306140012e-05, + "loss": 0.0101, + "step": 625470 + }, + { + "epoch": 1.62, + "learning_rate": 5.679984239762974e-05, + "loss": 0.0125, + "step": 625480 + }, + { + "epoch": 1.62, + "learning_rate": 5.679595418125827e-05, + "loss": 0.0112, + "step": 625490 + }, + { + "epoch": 1.62, + "learning_rate": 5.6792065964886806e-05, + "loss": 0.0086, + "step": 625500 + }, + { + "epoch": 1.62, + "learning_rate": 5.678817774851535e-05, + "loss": 0.0085, + "step": 625510 + }, + { + "epoch": 1.62, + "learning_rate": 5.678428953214388e-05, + "loss": 0.0091, + "step": 625520 + }, + { + "epoch": 1.62, + "learning_rate": 5.678040131577242e-05, + "loss": 0.0115, + "step": 625530 + }, + { + "epoch": 1.62, + "learning_rate": 5.677651309940095e-05, + "loss": 0.0069, + "step": 625540 + }, + { + "epoch": 1.62, + "learning_rate": 5.677262488302949e-05, + "loss": 0.0089, + "step": 625550 + }, + { + "epoch": 1.62, + "learning_rate": 5.676873666665802e-05, + "loss": 0.0077, + "step": 625560 + }, + { + "epoch": 1.62, + "learning_rate": 5.676484845028656e-05, + "loss": 0.0092, + "step": 625570 + }, + { + "epoch": 1.62, + "learning_rate": 5.676096023391509e-05, + "loss": 0.006, + "step": 625580 + }, + { + "epoch": 1.62, + "learning_rate": 5.6757072017543634e-05, + "loss": 0.0142, + "step": 625590 + }, + { + "epoch": 1.62, + "learning_rate": 5.675318380117217e-05, + "loss": 0.0089, + "step": 625600 + }, + { + "epoch": 1.62, + "learning_rate": 5.67492955848007e-05, + "loss": 0.0096, + "step": 625610 + }, + { + "epoch": 1.62, + "learning_rate": 5.674540736842923e-05, + "loss": 0.0086, + "step": 625620 + }, + { + "epoch": 1.62, + "learning_rate": 5.6741519152057766e-05, + "loss": 0.009, + "step": 625630 + }, + { + "epoch": 1.62, + "learning_rate": 5.67376309356863e-05, + "loss": 0.0078, + "step": 625640 + }, + { + "epoch": 1.62, + "learning_rate": 5.6733742719314836e-05, + "loss": 0.0091, + "step": 625650 + }, + { + "epoch": 1.62, + "learning_rate": 5.672985450294337e-05, + "loss": 0.0122, + "step": 625660 + }, + { + "epoch": 1.62, + "learning_rate": 5.6725966286571906e-05, + "loss": 0.0074, + "step": 625670 + }, + { + "epoch": 1.62, + "learning_rate": 5.672207807020044e-05, + "loss": 0.0077, + "step": 625680 + }, + { + "epoch": 1.62, + "learning_rate": 5.671818985382898e-05, + "loss": 0.0078, + "step": 625690 + }, + { + "epoch": 1.62, + "learning_rate": 5.671430163745752e-05, + "loss": 0.0084, + "step": 625700 + }, + { + "epoch": 1.62, + "learning_rate": 5.671041342108605e-05, + "loss": 0.0098, + "step": 625710 + }, + { + "epoch": 1.62, + "learning_rate": 5.670652520471459e-05, + "loss": 0.0101, + "step": 625720 + }, + { + "epoch": 1.62, + "learning_rate": 5.670263698834312e-05, + "loss": 0.0089, + "step": 625730 + }, + { + "epoch": 1.62, + "learning_rate": 5.669874877197166e-05, + "loss": 0.0087, + "step": 625740 + }, + { + "epoch": 1.62, + "learning_rate": 5.669486055560019e-05, + "loss": 0.0059, + "step": 625750 + }, + { + "epoch": 1.62, + "learning_rate": 5.6690972339228726e-05, + "loss": 0.0068, + "step": 625760 + }, + { + "epoch": 1.62, + "learning_rate": 5.668708412285727e-05, + "loss": 0.0054, + "step": 625770 + }, + { + "epoch": 1.62, + "learning_rate": 5.66831959064858e-05, + "loss": 0.0091, + "step": 625780 + }, + { + "epoch": 1.62, + "learning_rate": 5.667930769011434e-05, + "loss": 0.008, + "step": 625790 + }, + { + "epoch": 1.62, + "learning_rate": 5.667541947374287e-05, + "loss": 0.0105, + "step": 625800 + }, + { + "epoch": 1.62, + "learning_rate": 5.667153125737141e-05, + "loss": 0.0079, + "step": 625810 + }, + { + "epoch": 1.62, + "learning_rate": 5.666764304099994e-05, + "loss": 0.0074, + "step": 625820 + }, + { + "epoch": 1.62, + "learning_rate": 5.666375482462848e-05, + "loss": 0.0097, + "step": 625830 + }, + { + "epoch": 1.62, + "learning_rate": 5.665986660825701e-05, + "loss": 0.0079, + "step": 625840 + }, + { + "epoch": 1.62, + "learning_rate": 5.665597839188554e-05, + "loss": 0.008, + "step": 625850 + }, + { + "epoch": 1.62, + "learning_rate": 5.6652090175514075e-05, + "loss": 0.0087, + "step": 625860 + }, + { + "epoch": 1.62, + "learning_rate": 5.664820195914262e-05, + "loss": 0.0084, + "step": 625870 + }, + { + "epoch": 1.62, + "learning_rate": 5.664431374277115e-05, + "loss": 0.0077, + "step": 625880 + }, + { + "epoch": 1.62, + "learning_rate": 5.6640425526399686e-05, + "loss": 0.0117, + "step": 625890 + }, + { + "epoch": 1.62, + "learning_rate": 5.663653731002822e-05, + "loss": 0.0089, + "step": 625900 + }, + { + "epoch": 1.62, + "learning_rate": 5.6632649093656756e-05, + "loss": 0.0127, + "step": 625910 + }, + { + "epoch": 1.62, + "learning_rate": 5.662876087728529e-05, + "loss": 0.0082, + "step": 625920 + }, + { + "epoch": 1.62, + "learning_rate": 5.6624872660913826e-05, + "loss": 0.0057, + "step": 625930 + }, + { + "epoch": 1.62, + "learning_rate": 5.662098444454236e-05, + "loss": 0.008, + "step": 625940 + }, + { + "epoch": 1.62, + "learning_rate": 5.66170962281709e-05, + "loss": 0.0093, + "step": 625950 + }, + { + "epoch": 1.62, + "learning_rate": 5.661320801179944e-05, + "loss": 0.008, + "step": 625960 + }, + { + "epoch": 1.62, + "learning_rate": 5.660931979542797e-05, + "loss": 0.0085, + "step": 625970 + }, + { + "epoch": 1.62, + "learning_rate": 5.660543157905651e-05, + "loss": 0.0102, + "step": 625980 + }, + { + "epoch": 1.62, + "learning_rate": 5.660154336268504e-05, + "loss": 0.0139, + "step": 625990 + }, + { + "epoch": 1.62, + "learning_rate": 5.659765514631358e-05, + "loss": 0.0084, + "step": 626000 + }, + { + "epoch": 1.62, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.005688130855560303, + "eval_runtime": 107.8597, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 626000 + }, + { + "epoch": 1.62, + "learning_rate": 5.659376692994211e-05, + "loss": 0.0085, + "step": 626010 + }, + { + "epoch": 1.62, + "learning_rate": 5.6589878713570646e-05, + "loss": 0.0101, + "step": 626020 + }, + { + "epoch": 1.62, + "learning_rate": 5.658599049719919e-05, + "loss": 0.009, + "step": 626030 + }, + { + "epoch": 1.62, + "learning_rate": 5.658210228082772e-05, + "loss": 0.0052, + "step": 626040 + }, + { + "epoch": 1.62, + "learning_rate": 5.657821406445626e-05, + "loss": 0.0077, + "step": 626050 + }, + { + "epoch": 1.62, + "learning_rate": 5.657432584808479e-05, + "loss": 0.0085, + "step": 626060 + }, + { + "epoch": 1.62, + "learning_rate": 5.657043763171333e-05, + "loss": 0.0052, + "step": 626070 + }, + { + "epoch": 1.62, + "learning_rate": 5.656654941534186e-05, + "loss": 0.01, + "step": 626080 + }, + { + "epoch": 1.62, + "learning_rate": 5.65626611989704e-05, + "loss": 0.0099, + "step": 626090 + }, + { + "epoch": 1.62, + "learning_rate": 5.6558772982598925e-05, + "loss": 0.0107, + "step": 626100 + }, + { + "epoch": 1.62, + "learning_rate": 5.655488476622746e-05, + "loss": 0.0086, + "step": 626110 + }, + { + "epoch": 1.62, + "learning_rate": 5.6550996549855995e-05, + "loss": 0.008, + "step": 626120 + }, + { + "epoch": 1.62, + "learning_rate": 5.6547108333484537e-05, + "loss": 0.0096, + "step": 626130 + }, + { + "epoch": 1.62, + "learning_rate": 5.654322011711307e-05, + "loss": 0.0107, + "step": 626140 + }, + { + "epoch": 1.62, + "learning_rate": 5.6539331900741606e-05, + "loss": 0.0083, + "step": 626150 + }, + { + "epoch": 1.62, + "learning_rate": 5.653544368437014e-05, + "loss": 0.0085, + "step": 626160 + }, + { + "epoch": 1.62, + "learning_rate": 5.6531555467998676e-05, + "loss": 0.0068, + "step": 626170 + }, + { + "epoch": 1.62, + "learning_rate": 5.652766725162721e-05, + "loss": 0.0076, + "step": 626180 + }, + { + "epoch": 1.62, + "learning_rate": 5.6523779035255746e-05, + "loss": 0.0074, + "step": 626190 + }, + { + "epoch": 1.62, + "learning_rate": 5.651989081888428e-05, + "loss": 0.0066, + "step": 626200 + }, + { + "epoch": 1.62, + "learning_rate": 5.651600260251282e-05, + "loss": 0.0061, + "step": 626210 + }, + { + "epoch": 1.62, + "learning_rate": 5.651211438614136e-05, + "loss": 0.0073, + "step": 626220 + }, + { + "epoch": 1.62, + "learning_rate": 5.650822616976989e-05, + "loss": 0.0098, + "step": 626230 + }, + { + "epoch": 1.62, + "learning_rate": 5.650433795339843e-05, + "loss": 0.0093, + "step": 626240 + }, + { + "epoch": 1.62, + "learning_rate": 5.650044973702696e-05, + "loss": 0.0099, + "step": 626250 + }, + { + "epoch": 1.62, + "learning_rate": 5.6496561520655497e-05, + "loss": 0.0086, + "step": 626260 + }, + { + "epoch": 1.62, + "learning_rate": 5.649267330428403e-05, + "loss": 0.0073, + "step": 626270 + }, + { + "epoch": 1.62, + "learning_rate": 5.6488785087912566e-05, + "loss": 0.007, + "step": 626280 + }, + { + "epoch": 1.62, + "learning_rate": 5.648489687154111e-05, + "loss": 0.0084, + "step": 626290 + }, + { + "epoch": 1.62, + "learning_rate": 5.648100865516964e-05, + "loss": 0.0077, + "step": 626300 + }, + { + "epoch": 1.62, + "learning_rate": 5.647712043879818e-05, + "loss": 0.0085, + "step": 626310 + }, + { + "epoch": 1.62, + "learning_rate": 5.647323222242671e-05, + "loss": 0.0093, + "step": 626320 + }, + { + "epoch": 1.62, + "learning_rate": 5.646934400605525e-05, + "loss": 0.0083, + "step": 626330 + }, + { + "epoch": 1.62, + "learning_rate": 5.646545578968378e-05, + "loss": 0.0087, + "step": 626340 + }, + { + "epoch": 1.62, + "learning_rate": 5.646156757331231e-05, + "loss": 0.007, + "step": 626350 + }, + { + "epoch": 1.62, + "learning_rate": 5.6457679356940845e-05, + "loss": 0.0112, + "step": 626360 + }, + { + "epoch": 1.62, + "learning_rate": 5.645379114056938e-05, + "loss": 0.0135, + "step": 626370 + }, + { + "epoch": 1.62, + "learning_rate": 5.6449902924197915e-05, + "loss": 0.0081, + "step": 626380 + }, + { + "epoch": 1.62, + "learning_rate": 5.6446014707826457e-05, + "loss": 0.0095, + "step": 626390 + }, + { + "epoch": 1.62, + "learning_rate": 5.644212649145499e-05, + "loss": 0.0093, + "step": 626400 + }, + { + "epoch": 1.62, + "learning_rate": 5.6438238275083526e-05, + "loss": 0.008, + "step": 626410 + }, + { + "epoch": 1.62, + "learning_rate": 5.643435005871206e-05, + "loss": 0.0082, + "step": 626420 + }, + { + "epoch": 1.62, + "learning_rate": 5.6430461842340596e-05, + "loss": 0.0059, + "step": 626430 + }, + { + "epoch": 1.62, + "learning_rate": 5.642657362596913e-05, + "loss": 0.0056, + "step": 626440 + }, + { + "epoch": 1.62, + "learning_rate": 5.6422685409597666e-05, + "loss": 0.009, + "step": 626450 + }, + { + "epoch": 1.62, + "learning_rate": 5.64187971932262e-05, + "loss": 0.0098, + "step": 626460 + }, + { + "epoch": 1.62, + "learning_rate": 5.641490897685474e-05, + "loss": 0.0096, + "step": 626470 + }, + { + "epoch": 1.62, + "learning_rate": 5.641102076048328e-05, + "loss": 0.0078, + "step": 626480 + }, + { + "epoch": 1.62, + "learning_rate": 5.640713254411181e-05, + "loss": 0.0091, + "step": 626490 + }, + { + "epoch": 1.62, + "learning_rate": 5.640324432774035e-05, + "loss": 0.0073, + "step": 626500 + }, + { + "epoch": 1.62, + "learning_rate": 5.639935611136888e-05, + "loss": 0.007, + "step": 626510 + }, + { + "epoch": 1.62, + "learning_rate": 5.6395467894997417e-05, + "loss": 0.0084, + "step": 626520 + }, + { + "epoch": 1.62, + "learning_rate": 5.639157967862595e-05, + "loss": 0.011, + "step": 626530 + }, + { + "epoch": 1.62, + "learning_rate": 5.6387691462254486e-05, + "loss": 0.0089, + "step": 626540 + }, + { + "epoch": 1.62, + "learning_rate": 5.638380324588303e-05, + "loss": 0.0063, + "step": 626550 + }, + { + "epoch": 1.62, + "learning_rate": 5.637991502951156e-05, + "loss": 0.0067, + "step": 626560 + }, + { + "epoch": 1.62, + "learning_rate": 5.63760268131401e-05, + "loss": 0.0097, + "step": 626570 + }, + { + "epoch": 1.62, + "learning_rate": 5.637213859676863e-05, + "loss": 0.0078, + "step": 626580 + }, + { + "epoch": 1.62, + "learning_rate": 5.636825038039717e-05, + "loss": 0.0075, + "step": 626590 + }, + { + "epoch": 1.62, + "learning_rate": 5.6364362164025695e-05, + "loss": 0.0067, + "step": 626600 + }, + { + "epoch": 1.62, + "learning_rate": 5.636047394765423e-05, + "loss": 0.0109, + "step": 626610 + }, + { + "epoch": 1.62, + "learning_rate": 5.6356585731282765e-05, + "loss": 0.0077, + "step": 626620 + }, + { + "epoch": 1.62, + "learning_rate": 5.63526975149113e-05, + "loss": 0.0084, + "step": 626630 + }, + { + "epoch": 1.62, + "learning_rate": 5.6348809298539835e-05, + "loss": 0.0067, + "step": 626640 + }, + { + "epoch": 1.62, + "learning_rate": 5.6344921082168377e-05, + "loss": 0.0096, + "step": 626650 + }, + { + "epoch": 1.62, + "learning_rate": 5.634103286579691e-05, + "loss": 0.0086, + "step": 626660 + }, + { + "epoch": 1.62, + "learning_rate": 5.6337144649425446e-05, + "loss": 0.0111, + "step": 626670 + }, + { + "epoch": 1.62, + "learning_rate": 5.633325643305398e-05, + "loss": 0.0099, + "step": 626680 + }, + { + "epoch": 1.62, + "learning_rate": 5.6329368216682516e-05, + "loss": 0.0078, + "step": 626690 + }, + { + "epoch": 1.62, + "learning_rate": 5.632548000031105e-05, + "loss": 0.0094, + "step": 626700 + }, + { + "epoch": 1.62, + "learning_rate": 5.6321591783939586e-05, + "loss": 0.0106, + "step": 626710 + }, + { + "epoch": 1.62, + "learning_rate": 5.631770356756812e-05, + "loss": 0.0066, + "step": 626720 + }, + { + "epoch": 1.62, + "learning_rate": 5.631381535119666e-05, + "loss": 0.0079, + "step": 626730 + }, + { + "epoch": 1.62, + "learning_rate": 5.63099271348252e-05, + "loss": 0.0077, + "step": 626740 + }, + { + "epoch": 1.62, + "learning_rate": 5.630603891845373e-05, + "loss": 0.0068, + "step": 626750 + }, + { + "epoch": 1.62, + "learning_rate": 5.630215070208227e-05, + "loss": 0.0105, + "step": 626760 + }, + { + "epoch": 1.62, + "learning_rate": 5.62982624857108e-05, + "loss": 0.0064, + "step": 626770 + }, + { + "epoch": 1.62, + "learning_rate": 5.6294374269339336e-05, + "loss": 0.0075, + "step": 626780 + }, + { + "epoch": 1.62, + "learning_rate": 5.629048605296787e-05, + "loss": 0.0054, + "step": 626790 + }, + { + "epoch": 1.62, + "learning_rate": 5.6286597836596406e-05, + "loss": 0.0065, + "step": 626800 + }, + { + "epoch": 1.62, + "learning_rate": 5.628270962022495e-05, + "loss": 0.0088, + "step": 626810 + }, + { + "epoch": 1.62, + "learning_rate": 5.627882140385348e-05, + "loss": 0.0093, + "step": 626820 + }, + { + "epoch": 1.62, + "learning_rate": 5.627493318748202e-05, + "loss": 0.0099, + "step": 626830 + }, + { + "epoch": 1.62, + "learning_rate": 5.627104497111055e-05, + "loss": 0.0059, + "step": 626840 + }, + { + "epoch": 1.62, + "learning_rate": 5.626715675473908e-05, + "loss": 0.0104, + "step": 626850 + }, + { + "epoch": 1.62, + "learning_rate": 5.6263268538367615e-05, + "loss": 0.0059, + "step": 626860 + }, + { + "epoch": 1.62, + "learning_rate": 5.625938032199615e-05, + "loss": 0.0086, + "step": 626870 + }, + { + "epoch": 1.62, + "learning_rate": 5.6255492105624685e-05, + "loss": 0.0075, + "step": 626880 + }, + { + "epoch": 1.62, + "learning_rate": 5.625160388925322e-05, + "loss": 0.0072, + "step": 626890 + }, + { + "epoch": 1.63, + "learning_rate": 5.6247715672881755e-05, + "loss": 0.0076, + "step": 626900 + }, + { + "epoch": 1.63, + "learning_rate": 5.6243827456510296e-05, + "loss": 0.009, + "step": 626910 + }, + { + "epoch": 1.63, + "learning_rate": 5.623993924013883e-05, + "loss": 0.0095, + "step": 626920 + }, + { + "epoch": 1.63, + "learning_rate": 5.6236051023767366e-05, + "loss": 0.0078, + "step": 626930 + }, + { + "epoch": 1.63, + "learning_rate": 5.62321628073959e-05, + "loss": 0.0099, + "step": 626940 + }, + { + "epoch": 1.63, + "learning_rate": 5.6228274591024436e-05, + "loss": 0.0083, + "step": 626950 + }, + { + "epoch": 1.63, + "learning_rate": 5.622438637465297e-05, + "loss": 0.0089, + "step": 626960 + }, + { + "epoch": 1.63, + "learning_rate": 5.6220498158281506e-05, + "loss": 0.0104, + "step": 626970 + }, + { + "epoch": 1.63, + "learning_rate": 5.621660994191004e-05, + "loss": 0.0067, + "step": 626980 + }, + { + "epoch": 1.63, + "learning_rate": 5.6212721725538575e-05, + "loss": 0.0085, + "step": 626990 + }, + { + "epoch": 1.63, + "learning_rate": 5.620883350916712e-05, + "loss": 0.0098, + "step": 627000 + }, + { + "epoch": 1.63, + "eval_cer": 0.8816397026611297, + "eval_loss": 0.005602034740149975, + "eval_runtime": 108.0184, + "eval_samples_per_second": 18.515, + "eval_steps_per_second": 4.629, + "step": 627000 + }, + { + "epoch": 1.63, + "learning_rate": 5.620494529279565e-05, + "loss": 0.0061, + "step": 627010 + }, + { + "epoch": 1.63, + "learning_rate": 5.620105707642419e-05, + "loss": 0.0078, + "step": 627020 + }, + { + "epoch": 1.63, + "learning_rate": 5.619716886005272e-05, + "loss": 0.0106, + "step": 627030 + }, + { + "epoch": 1.63, + "learning_rate": 5.6193280643681256e-05, + "loss": 0.0078, + "step": 627040 + }, + { + "epoch": 1.63, + "learning_rate": 5.618939242730979e-05, + "loss": 0.0089, + "step": 627050 + }, + { + "epoch": 1.63, + "learning_rate": 5.6185504210938326e-05, + "loss": 0.0101, + "step": 627060 + }, + { + "epoch": 1.63, + "learning_rate": 5.618161599456686e-05, + "loss": 0.0119, + "step": 627070 + }, + { + "epoch": 1.63, + "learning_rate": 5.61777277781954e-05, + "loss": 0.0078, + "step": 627080 + }, + { + "epoch": 1.63, + "learning_rate": 5.6173839561823924e-05, + "loss": 0.0101, + "step": 627090 + }, + { + "epoch": 1.63, + "learning_rate": 5.6169951345452466e-05, + "loss": 0.0102, + "step": 627100 + }, + { + "epoch": 1.63, + "learning_rate": 5.6166063129081e-05, + "loss": 0.0077, + "step": 627110 + }, + { + "epoch": 1.63, + "learning_rate": 5.6162174912709535e-05, + "loss": 0.006, + "step": 627120 + }, + { + "epoch": 1.63, + "learning_rate": 5.615828669633807e-05, + "loss": 0.0085, + "step": 627130 + }, + { + "epoch": 1.63, + "learning_rate": 5.6154398479966605e-05, + "loss": 0.0094, + "step": 627140 + }, + { + "epoch": 1.63, + "learning_rate": 5.615051026359514e-05, + "loss": 0.0098, + "step": 627150 + }, + { + "epoch": 1.63, + "learning_rate": 5.6146622047223675e-05, + "loss": 0.0084, + "step": 627160 + }, + { + "epoch": 1.63, + "learning_rate": 5.614273383085221e-05, + "loss": 0.0066, + "step": 627170 + }, + { + "epoch": 1.63, + "learning_rate": 5.613884561448075e-05, + "loss": 0.0079, + "step": 627180 + }, + { + "epoch": 1.63, + "learning_rate": 5.6134957398109286e-05, + "loss": 0.0091, + "step": 627190 + }, + { + "epoch": 1.63, + "learning_rate": 5.613106918173782e-05, + "loss": 0.0128, + "step": 627200 + }, + { + "epoch": 1.63, + "learning_rate": 5.6127180965366356e-05, + "loss": 0.0069, + "step": 627210 + }, + { + "epoch": 1.63, + "learning_rate": 5.612329274899489e-05, + "loss": 0.0072, + "step": 627220 + }, + { + "epoch": 1.63, + "learning_rate": 5.6119404532623426e-05, + "loss": 0.0093, + "step": 627230 + }, + { + "epoch": 1.63, + "learning_rate": 5.611551631625196e-05, + "loss": 0.0054, + "step": 627240 + }, + { + "epoch": 1.63, + "learning_rate": 5.6111628099880495e-05, + "loss": 0.0094, + "step": 627250 + }, + { + "epoch": 1.63, + "learning_rate": 5.610773988350904e-05, + "loss": 0.008, + "step": 627260 + }, + { + "epoch": 1.63, + "learning_rate": 5.610385166713757e-05, + "loss": 0.008, + "step": 627270 + }, + { + "epoch": 1.63, + "learning_rate": 5.609996345076611e-05, + "loss": 0.0096, + "step": 627280 + }, + { + "epoch": 1.63, + "learning_rate": 5.609607523439464e-05, + "loss": 0.006, + "step": 627290 + }, + { + "epoch": 1.63, + "learning_rate": 5.6092187018023176e-05, + "loss": 0.009, + "step": 627300 + }, + { + "epoch": 1.63, + "learning_rate": 5.608829880165171e-05, + "loss": 0.008, + "step": 627310 + }, + { + "epoch": 1.63, + "learning_rate": 5.6084410585280246e-05, + "loss": 0.0092, + "step": 627320 + }, + { + "epoch": 1.63, + "learning_rate": 5.608052236890878e-05, + "loss": 0.0071, + "step": 627330 + }, + { + "epoch": 1.63, + "learning_rate": 5.607663415253731e-05, + "loss": 0.0089, + "step": 627340 + }, + { + "epoch": 1.63, + "learning_rate": 5.6072745936165844e-05, + "loss": 0.0067, + "step": 627350 + }, + { + "epoch": 1.63, + "learning_rate": 5.6068857719794386e-05, + "loss": 0.0076, + "step": 627360 + }, + { + "epoch": 1.63, + "learning_rate": 5.606496950342292e-05, + "loss": 0.007, + "step": 627370 + }, + { + "epoch": 1.63, + "learning_rate": 5.6061081287051455e-05, + "loss": 0.0075, + "step": 627380 + }, + { + "epoch": 1.63, + "learning_rate": 5.605719307067999e-05, + "loss": 0.0107, + "step": 627390 + }, + { + "epoch": 1.63, + "learning_rate": 5.6053304854308525e-05, + "loss": 0.0076, + "step": 627400 + }, + { + "epoch": 1.63, + "learning_rate": 5.604941663793706e-05, + "loss": 0.0101, + "step": 627410 + }, + { + "epoch": 1.63, + "learning_rate": 5.6045528421565595e-05, + "loss": 0.012, + "step": 627420 + }, + { + "epoch": 1.63, + "learning_rate": 5.604164020519413e-05, + "loss": 0.0103, + "step": 627430 + }, + { + "epoch": 1.63, + "learning_rate": 5.603775198882267e-05, + "loss": 0.0092, + "step": 627440 + }, + { + "epoch": 1.63, + "learning_rate": 5.6033863772451206e-05, + "loss": 0.0075, + "step": 627450 + }, + { + "epoch": 1.63, + "learning_rate": 5.602997555607974e-05, + "loss": 0.0082, + "step": 627460 + }, + { + "epoch": 1.63, + "learning_rate": 5.6026087339708276e-05, + "loss": 0.0096, + "step": 627470 + }, + { + "epoch": 1.63, + "learning_rate": 5.602219912333681e-05, + "loss": 0.0078, + "step": 627480 + }, + { + "epoch": 1.63, + "learning_rate": 5.6018310906965346e-05, + "loss": 0.0095, + "step": 627490 + }, + { + "epoch": 1.63, + "learning_rate": 5.601442269059388e-05, + "loss": 0.0093, + "step": 627500 + }, + { + "epoch": 1.63, + "learning_rate": 5.6010534474222415e-05, + "loss": 0.0088, + "step": 627510 + }, + { + "epoch": 1.63, + "learning_rate": 5.600664625785096e-05, + "loss": 0.0083, + "step": 627520 + }, + { + "epoch": 1.63, + "learning_rate": 5.600275804147949e-05, + "loss": 0.0078, + "step": 627530 + }, + { + "epoch": 1.63, + "learning_rate": 5.5998869825108027e-05, + "loss": 0.0063, + "step": 627540 + }, + { + "epoch": 1.63, + "learning_rate": 5.599498160873656e-05, + "loss": 0.0095, + "step": 627550 + }, + { + "epoch": 1.63, + "learning_rate": 5.5991093392365096e-05, + "loss": 0.0105, + "step": 627560 + }, + { + "epoch": 1.63, + "learning_rate": 5.598720517599363e-05, + "loss": 0.0078, + "step": 627570 + }, + { + "epoch": 1.63, + "learning_rate": 5.5983316959622166e-05, + "loss": 0.0075, + "step": 627580 + }, + { + "epoch": 1.63, + "learning_rate": 5.5979428743250694e-05, + "loss": 0.0083, + "step": 627590 + }, + { + "epoch": 1.63, + "learning_rate": 5.597554052687923e-05, + "loss": 0.007, + "step": 627600 + }, + { + "epoch": 1.63, + "learning_rate": 5.5971652310507764e-05, + "loss": 0.0123, + "step": 627610 + }, + { + "epoch": 1.63, + "learning_rate": 5.5967764094136306e-05, + "loss": 0.0078, + "step": 627620 + }, + { + "epoch": 1.63, + "learning_rate": 5.596387587776484e-05, + "loss": 0.0089, + "step": 627630 + }, + { + "epoch": 1.63, + "learning_rate": 5.5959987661393375e-05, + "loss": 0.0096, + "step": 627640 + }, + { + "epoch": 1.63, + "learning_rate": 5.595609944502191e-05, + "loss": 0.0083, + "step": 627650 + }, + { + "epoch": 1.63, + "learning_rate": 5.5952211228650445e-05, + "loss": 0.0067, + "step": 627660 + }, + { + "epoch": 1.63, + "learning_rate": 5.594832301227898e-05, + "loss": 0.008, + "step": 627670 + }, + { + "epoch": 1.63, + "learning_rate": 5.5944434795907515e-05, + "loss": 0.0088, + "step": 627680 + }, + { + "epoch": 1.63, + "learning_rate": 5.594054657953605e-05, + "loss": 0.0074, + "step": 627690 + }, + { + "epoch": 1.63, + "learning_rate": 5.593665836316459e-05, + "loss": 0.0082, + "step": 627700 + }, + { + "epoch": 1.63, + "learning_rate": 5.5932770146793126e-05, + "loss": 0.0082, + "step": 627710 + }, + { + "epoch": 1.63, + "learning_rate": 5.592888193042166e-05, + "loss": 0.0091, + "step": 627720 + }, + { + "epoch": 1.63, + "learning_rate": 5.5924993714050196e-05, + "loss": 0.0075, + "step": 627730 + }, + { + "epoch": 1.63, + "learning_rate": 5.592110549767873e-05, + "loss": 0.0077, + "step": 627740 + }, + { + "epoch": 1.63, + "learning_rate": 5.5917217281307265e-05, + "loss": 0.0074, + "step": 627750 + }, + { + "epoch": 1.63, + "learning_rate": 5.59133290649358e-05, + "loss": 0.0089, + "step": 627760 + }, + { + "epoch": 1.63, + "learning_rate": 5.5909440848564335e-05, + "loss": 0.0122, + "step": 627770 + }, + { + "epoch": 1.63, + "learning_rate": 5.590555263219288e-05, + "loss": 0.0095, + "step": 627780 + }, + { + "epoch": 1.63, + "learning_rate": 5.590166441582141e-05, + "loss": 0.0077, + "step": 627790 + }, + { + "epoch": 1.63, + "learning_rate": 5.5897776199449947e-05, + "loss": 0.0096, + "step": 627800 + }, + { + "epoch": 1.63, + "learning_rate": 5.589388798307848e-05, + "loss": 0.0084, + "step": 627810 + }, + { + "epoch": 1.63, + "learning_rate": 5.5889999766707016e-05, + "loss": 0.0073, + "step": 627820 + }, + { + "epoch": 1.63, + "learning_rate": 5.588611155033555e-05, + "loss": 0.0102, + "step": 627830 + }, + { + "epoch": 1.63, + "learning_rate": 5.588222333396408e-05, + "loss": 0.0075, + "step": 627840 + }, + { + "epoch": 1.63, + "learning_rate": 5.5878335117592614e-05, + "loss": 0.0079, + "step": 627850 + }, + { + "epoch": 1.63, + "learning_rate": 5.587444690122115e-05, + "loss": 0.008, + "step": 627860 + }, + { + "epoch": 1.63, + "learning_rate": 5.5870558684849684e-05, + "loss": 0.0082, + "step": 627870 + }, + { + "epoch": 1.63, + "learning_rate": 5.5866670468478225e-05, + "loss": 0.0103, + "step": 627880 + }, + { + "epoch": 1.63, + "learning_rate": 5.586278225210676e-05, + "loss": 0.0093, + "step": 627890 + }, + { + "epoch": 1.63, + "learning_rate": 5.5858894035735295e-05, + "loss": 0.0079, + "step": 627900 + }, + { + "epoch": 1.63, + "learning_rate": 5.585500581936383e-05, + "loss": 0.0078, + "step": 627910 + }, + { + "epoch": 1.63, + "learning_rate": 5.5851117602992365e-05, + "loss": 0.0073, + "step": 627920 + }, + { + "epoch": 1.63, + "learning_rate": 5.58472293866209e-05, + "loss": 0.0083, + "step": 627930 + }, + { + "epoch": 1.63, + "learning_rate": 5.5843341170249435e-05, + "loss": 0.0078, + "step": 627940 + }, + { + "epoch": 1.63, + "learning_rate": 5.583945295387797e-05, + "loss": 0.0079, + "step": 627950 + }, + { + "epoch": 1.63, + "learning_rate": 5.583556473750651e-05, + "loss": 0.0077, + "step": 627960 + }, + { + "epoch": 1.63, + "learning_rate": 5.5831676521135046e-05, + "loss": 0.0098, + "step": 627970 + }, + { + "epoch": 1.63, + "learning_rate": 5.582778830476358e-05, + "loss": 0.01, + "step": 627980 + }, + { + "epoch": 1.63, + "learning_rate": 5.5823900088392116e-05, + "loss": 0.0097, + "step": 627990 + }, + { + "epoch": 1.63, + "learning_rate": 5.582001187202065e-05, + "loss": 0.0107, + "step": 628000 + }, + { + "epoch": 1.63, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.005415888503193855, + "eval_runtime": 107.942, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 628000 + }, + { + "epoch": 1.63, + "learning_rate": 5.5816123655649185e-05, + "loss": 0.0066, + "step": 628010 + }, + { + "epoch": 1.63, + "learning_rate": 5.581223543927772e-05, + "loss": 0.0096, + "step": 628020 + }, + { + "epoch": 1.63, + "learning_rate": 5.5808347222906255e-05, + "loss": 0.01, + "step": 628030 + }, + { + "epoch": 1.63, + "learning_rate": 5.58044590065348e-05, + "loss": 0.0069, + "step": 628040 + }, + { + "epoch": 1.63, + "learning_rate": 5.580057079016333e-05, + "loss": 0.008, + "step": 628050 + }, + { + "epoch": 1.63, + "learning_rate": 5.5796682573791867e-05, + "loss": 0.0089, + "step": 628060 + }, + { + "epoch": 1.63, + "learning_rate": 5.57927943574204e-05, + "loss": 0.0079, + "step": 628070 + }, + { + "epoch": 1.63, + "learning_rate": 5.5788906141048936e-05, + "loss": 0.0094, + "step": 628080 + }, + { + "epoch": 1.63, + "learning_rate": 5.5785017924677464e-05, + "loss": 0.0086, + "step": 628090 + }, + { + "epoch": 1.63, + "learning_rate": 5.5781129708306e-05, + "loss": 0.0074, + "step": 628100 + }, + { + "epoch": 1.63, + "learning_rate": 5.5777241491934534e-05, + "loss": 0.0072, + "step": 628110 + }, + { + "epoch": 1.63, + "learning_rate": 5.577335327556307e-05, + "loss": 0.0085, + "step": 628120 + }, + { + "epoch": 1.63, + "learning_rate": 5.5769465059191604e-05, + "loss": 0.0078, + "step": 628130 + }, + { + "epoch": 1.63, + "learning_rate": 5.5765576842820145e-05, + "loss": 0.0063, + "step": 628140 + }, + { + "epoch": 1.63, + "learning_rate": 5.576168862644868e-05, + "loss": 0.0079, + "step": 628150 + }, + { + "epoch": 1.63, + "learning_rate": 5.5757800410077215e-05, + "loss": 0.0067, + "step": 628160 + }, + { + "epoch": 1.63, + "learning_rate": 5.575391219370575e-05, + "loss": 0.0094, + "step": 628170 + }, + { + "epoch": 1.63, + "learning_rate": 5.5750023977334285e-05, + "loss": 0.007, + "step": 628180 + }, + { + "epoch": 1.63, + "learning_rate": 5.574613576096282e-05, + "loss": 0.0094, + "step": 628190 + }, + { + "epoch": 1.63, + "learning_rate": 5.5742247544591355e-05, + "loss": 0.0077, + "step": 628200 + }, + { + "epoch": 1.63, + "learning_rate": 5.573835932821989e-05, + "loss": 0.0088, + "step": 628210 + }, + { + "epoch": 1.63, + "learning_rate": 5.573447111184843e-05, + "loss": 0.0098, + "step": 628220 + }, + { + "epoch": 1.63, + "learning_rate": 5.5730582895476966e-05, + "loss": 0.0094, + "step": 628230 + }, + { + "epoch": 1.63, + "learning_rate": 5.57266946791055e-05, + "loss": 0.0088, + "step": 628240 + }, + { + "epoch": 1.63, + "learning_rate": 5.5722806462734036e-05, + "loss": 0.0065, + "step": 628250 + }, + { + "epoch": 1.63, + "learning_rate": 5.571891824636257e-05, + "loss": 0.0085, + "step": 628260 + }, + { + "epoch": 1.63, + "learning_rate": 5.5715030029991105e-05, + "loss": 0.0094, + "step": 628270 + }, + { + "epoch": 1.63, + "learning_rate": 5.571114181361964e-05, + "loss": 0.0104, + "step": 628280 + }, + { + "epoch": 1.63, + "learning_rate": 5.5707253597248175e-05, + "loss": 0.0071, + "step": 628290 + }, + { + "epoch": 1.63, + "learning_rate": 5.570336538087671e-05, + "loss": 0.007, + "step": 628300 + }, + { + "epoch": 1.63, + "learning_rate": 5.569947716450525e-05, + "loss": 0.007, + "step": 628310 + }, + { + "epoch": 1.63, + "learning_rate": 5.5695588948133786e-05, + "loss": 0.0076, + "step": 628320 + }, + { + "epoch": 1.63, + "learning_rate": 5.569170073176232e-05, + "loss": 0.0098, + "step": 628330 + }, + { + "epoch": 1.63, + "learning_rate": 5.568781251539085e-05, + "loss": 0.0093, + "step": 628340 + }, + { + "epoch": 1.63, + "learning_rate": 5.5683924299019384e-05, + "loss": 0.0082, + "step": 628350 + }, + { + "epoch": 1.63, + "learning_rate": 5.568003608264792e-05, + "loss": 0.0088, + "step": 628360 + }, + { + "epoch": 1.63, + "learning_rate": 5.5676147866276454e-05, + "loss": 0.0067, + "step": 628370 + }, + { + "epoch": 1.63, + "learning_rate": 5.567225964990499e-05, + "loss": 0.0092, + "step": 628380 + }, + { + "epoch": 1.63, + "learning_rate": 5.5668371433533524e-05, + "loss": 0.0096, + "step": 628390 + }, + { + "epoch": 1.63, + "learning_rate": 5.566448321716206e-05, + "loss": 0.0073, + "step": 628400 + }, + { + "epoch": 1.63, + "learning_rate": 5.56605950007906e-05, + "loss": 0.0064, + "step": 628410 + }, + { + "epoch": 1.63, + "learning_rate": 5.5656706784419135e-05, + "loss": 0.0087, + "step": 628420 + }, + { + "epoch": 1.63, + "learning_rate": 5.565281856804767e-05, + "loss": 0.0079, + "step": 628430 + }, + { + "epoch": 1.63, + "learning_rate": 5.5648930351676205e-05, + "loss": 0.0079, + "step": 628440 + }, + { + "epoch": 1.63, + "learning_rate": 5.564504213530474e-05, + "loss": 0.0054, + "step": 628450 + }, + { + "epoch": 1.63, + "learning_rate": 5.5641153918933275e-05, + "loss": 0.0097, + "step": 628460 + }, + { + "epoch": 1.63, + "learning_rate": 5.563726570256181e-05, + "loss": 0.0101, + "step": 628470 + }, + { + "epoch": 1.63, + "learning_rate": 5.5633377486190344e-05, + "loss": 0.0095, + "step": 628480 + }, + { + "epoch": 1.63, + "learning_rate": 5.5629489269818886e-05, + "loss": 0.0109, + "step": 628490 + }, + { + "epoch": 1.63, + "learning_rate": 5.562560105344742e-05, + "loss": 0.0073, + "step": 628500 + }, + { + "epoch": 1.63, + "learning_rate": 5.5621712837075956e-05, + "loss": 0.0075, + "step": 628510 + }, + { + "epoch": 1.63, + "learning_rate": 5.561782462070449e-05, + "loss": 0.0079, + "step": 628520 + }, + { + "epoch": 1.63, + "learning_rate": 5.5613936404333025e-05, + "loss": 0.009, + "step": 628530 + }, + { + "epoch": 1.63, + "learning_rate": 5.561004818796156e-05, + "loss": 0.0064, + "step": 628540 + }, + { + "epoch": 1.63, + "learning_rate": 5.5606159971590095e-05, + "loss": 0.0081, + "step": 628550 + }, + { + "epoch": 1.63, + "learning_rate": 5.560227175521863e-05, + "loss": 0.0069, + "step": 628560 + }, + { + "epoch": 1.63, + "learning_rate": 5.559838353884717e-05, + "loss": 0.0097, + "step": 628570 + }, + { + "epoch": 1.63, + "learning_rate": 5.559449532247569e-05, + "loss": 0.0073, + "step": 628580 + }, + { + "epoch": 1.63, + "learning_rate": 5.5590607106104235e-05, + "loss": 0.0092, + "step": 628590 + }, + { + "epoch": 1.63, + "learning_rate": 5.558671888973277e-05, + "loss": 0.0125, + "step": 628600 + }, + { + "epoch": 1.63, + "learning_rate": 5.5582830673361304e-05, + "loss": 0.0113, + "step": 628610 + }, + { + "epoch": 1.63, + "learning_rate": 5.557894245698984e-05, + "loss": 0.007, + "step": 628620 + }, + { + "epoch": 1.63, + "learning_rate": 5.5575054240618374e-05, + "loss": 0.0075, + "step": 628630 + }, + { + "epoch": 1.63, + "learning_rate": 5.557116602424691e-05, + "loss": 0.0076, + "step": 628640 + }, + { + "epoch": 1.63, + "learning_rate": 5.5567277807875444e-05, + "loss": 0.0061, + "step": 628650 + }, + { + "epoch": 1.63, + "learning_rate": 5.556338959150398e-05, + "loss": 0.0088, + "step": 628660 + }, + { + "epoch": 1.63, + "learning_rate": 5.555950137513252e-05, + "loss": 0.009, + "step": 628670 + }, + { + "epoch": 1.63, + "learning_rate": 5.5555613158761055e-05, + "loss": 0.0064, + "step": 628680 + }, + { + "epoch": 1.63, + "learning_rate": 5.555172494238959e-05, + "loss": 0.0126, + "step": 628690 + }, + { + "epoch": 1.63, + "learning_rate": 5.5547836726018125e-05, + "loss": 0.0083, + "step": 628700 + }, + { + "epoch": 1.63, + "learning_rate": 5.554394850964666e-05, + "loss": 0.007, + "step": 628710 + }, + { + "epoch": 1.63, + "learning_rate": 5.5540060293275194e-05, + "loss": 0.0082, + "step": 628720 + }, + { + "epoch": 1.63, + "learning_rate": 5.553617207690373e-05, + "loss": 0.0054, + "step": 628730 + }, + { + "epoch": 1.63, + "learning_rate": 5.5532283860532264e-05, + "loss": 0.007, + "step": 628740 + }, + { + "epoch": 1.63, + "learning_rate": 5.5528395644160806e-05, + "loss": 0.0143, + "step": 628750 + }, + { + "epoch": 1.63, + "learning_rate": 5.552450742778934e-05, + "loss": 0.0075, + "step": 628760 + }, + { + "epoch": 1.63, + "learning_rate": 5.5520619211417876e-05, + "loss": 0.0079, + "step": 628770 + }, + { + "epoch": 1.63, + "learning_rate": 5.551673099504641e-05, + "loss": 0.0079, + "step": 628780 + }, + { + "epoch": 1.63, + "learning_rate": 5.5512842778674945e-05, + "loss": 0.0084, + "step": 628790 + }, + { + "epoch": 1.63, + "learning_rate": 5.550895456230348e-05, + "loss": 0.0073, + "step": 628800 + }, + { + "epoch": 1.63, + "learning_rate": 5.5505066345932015e-05, + "loss": 0.0091, + "step": 628810 + }, + { + "epoch": 1.63, + "learning_rate": 5.550117812956055e-05, + "loss": 0.007, + "step": 628820 + }, + { + "epoch": 1.63, + "learning_rate": 5.549728991318908e-05, + "loss": 0.0088, + "step": 628830 + }, + { + "epoch": 1.63, + "learning_rate": 5.549340169681761e-05, + "loss": 0.0068, + "step": 628840 + }, + { + "epoch": 1.63, + "learning_rate": 5.5489513480446154e-05, + "loss": 0.0087, + "step": 628850 + }, + { + "epoch": 1.63, + "learning_rate": 5.548562526407469e-05, + "loss": 0.0072, + "step": 628860 + }, + { + "epoch": 1.63, + "learning_rate": 5.5481737047703224e-05, + "loss": 0.0082, + "step": 628870 + }, + { + "epoch": 1.63, + "learning_rate": 5.547784883133176e-05, + "loss": 0.0058, + "step": 628880 + }, + { + "epoch": 1.63, + "learning_rate": 5.5473960614960294e-05, + "loss": 0.0063, + "step": 628890 + }, + { + "epoch": 1.63, + "learning_rate": 5.547007239858883e-05, + "loss": 0.0077, + "step": 628900 + }, + { + "epoch": 1.63, + "learning_rate": 5.5466184182217364e-05, + "loss": 0.0073, + "step": 628910 + }, + { + "epoch": 1.63, + "learning_rate": 5.54622959658459e-05, + "loss": 0.0096, + "step": 628920 + }, + { + "epoch": 1.63, + "learning_rate": 5.545840774947444e-05, + "loss": 0.0103, + "step": 628930 + }, + { + "epoch": 1.63, + "learning_rate": 5.5454519533102975e-05, + "loss": 0.0075, + "step": 628940 + }, + { + "epoch": 1.63, + "learning_rate": 5.545063131673151e-05, + "loss": 0.0082, + "step": 628950 + }, + { + "epoch": 1.63, + "learning_rate": 5.5446743100360045e-05, + "loss": 0.0089, + "step": 628960 + }, + { + "epoch": 1.63, + "learning_rate": 5.544285488398858e-05, + "loss": 0.0086, + "step": 628970 + }, + { + "epoch": 1.63, + "learning_rate": 5.5438966667617114e-05, + "loss": 0.0067, + "step": 628980 + }, + { + "epoch": 1.63, + "learning_rate": 5.543507845124565e-05, + "loss": 0.0101, + "step": 628990 + }, + { + "epoch": 1.63, + "learning_rate": 5.5431190234874184e-05, + "loss": 0.0123, + "step": 629000 + }, + { + "epoch": 1.63, + "eval_cer": 0.8816522993935373, + "eval_loss": 0.005537708289921284, + "eval_runtime": 107.8233, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 629000 + }, + { + "epoch": 1.63, + "learning_rate": 5.5427302018502726e-05, + "loss": 0.0107, + "step": 629010 + }, + { + "epoch": 1.63, + "learning_rate": 5.542341380213126e-05, + "loss": 0.0085, + "step": 629020 + }, + { + "epoch": 1.63, + "learning_rate": 5.5419525585759796e-05, + "loss": 0.0109, + "step": 629030 + }, + { + "epoch": 1.63, + "learning_rate": 5.541563736938833e-05, + "loss": 0.0099, + "step": 629040 + }, + { + "epoch": 1.63, + "learning_rate": 5.5411749153016865e-05, + "loss": 0.0118, + "step": 629050 + }, + { + "epoch": 1.63, + "learning_rate": 5.54078609366454e-05, + "loss": 0.0122, + "step": 629060 + }, + { + "epoch": 1.63, + "learning_rate": 5.5403972720273935e-05, + "loss": 0.0075, + "step": 629070 + }, + { + "epoch": 1.63, + "learning_rate": 5.540008450390246e-05, + "loss": 0.0108, + "step": 629080 + }, + { + "epoch": 1.63, + "learning_rate": 5.5396196287531e-05, + "loss": 0.0087, + "step": 629090 + }, + { + "epoch": 1.63, + "learning_rate": 5.539230807115953e-05, + "loss": 0.0069, + "step": 629100 + }, + { + "epoch": 1.63, + "learning_rate": 5.5388419854788074e-05, + "loss": 0.0104, + "step": 629110 + }, + { + "epoch": 1.63, + "learning_rate": 5.538453163841661e-05, + "loss": 0.0085, + "step": 629120 + }, + { + "epoch": 1.63, + "learning_rate": 5.5380643422045144e-05, + "loss": 0.0107, + "step": 629130 + }, + { + "epoch": 1.63, + "learning_rate": 5.537675520567368e-05, + "loss": 0.0102, + "step": 629140 + }, + { + "epoch": 1.63, + "learning_rate": 5.5372866989302214e-05, + "loss": 0.0089, + "step": 629150 + }, + { + "epoch": 1.63, + "learning_rate": 5.536897877293075e-05, + "loss": 0.0075, + "step": 629160 + }, + { + "epoch": 1.63, + "learning_rate": 5.5365090556559284e-05, + "loss": 0.014, + "step": 629170 + }, + { + "epoch": 1.63, + "learning_rate": 5.536120234018782e-05, + "loss": 0.0115, + "step": 629180 + }, + { + "epoch": 1.63, + "learning_rate": 5.535731412381636e-05, + "loss": 0.0078, + "step": 629190 + }, + { + "epoch": 1.63, + "learning_rate": 5.5353425907444895e-05, + "loss": 0.008, + "step": 629200 + }, + { + "epoch": 1.63, + "learning_rate": 5.534953769107343e-05, + "loss": 0.0062, + "step": 629210 + }, + { + "epoch": 1.63, + "learning_rate": 5.5345649474701965e-05, + "loss": 0.0081, + "step": 629220 + }, + { + "epoch": 1.63, + "learning_rate": 5.53417612583305e-05, + "loss": 0.0095, + "step": 629230 + }, + { + "epoch": 1.63, + "learning_rate": 5.5337873041959034e-05, + "loss": 0.009, + "step": 629240 + }, + { + "epoch": 1.63, + "learning_rate": 5.533398482558757e-05, + "loss": 0.009, + "step": 629250 + }, + { + "epoch": 1.63, + "learning_rate": 5.5330096609216104e-05, + "loss": 0.0097, + "step": 629260 + }, + { + "epoch": 1.63, + "learning_rate": 5.5326208392844646e-05, + "loss": 0.0071, + "step": 629270 + }, + { + "epoch": 1.63, + "learning_rate": 5.532232017647318e-05, + "loss": 0.0073, + "step": 629280 + }, + { + "epoch": 1.63, + "learning_rate": 5.5318431960101715e-05, + "loss": 0.0099, + "step": 629290 + }, + { + "epoch": 1.63, + "learning_rate": 5.531454374373025e-05, + "loss": 0.0076, + "step": 629300 + }, + { + "epoch": 1.63, + "learning_rate": 5.5310655527358785e-05, + "loss": 0.0086, + "step": 629310 + }, + { + "epoch": 1.63, + "learning_rate": 5.530676731098732e-05, + "loss": 0.0096, + "step": 629320 + }, + { + "epoch": 1.63, + "learning_rate": 5.530287909461585e-05, + "loss": 0.009, + "step": 629330 + }, + { + "epoch": 1.63, + "learning_rate": 5.529899087824438e-05, + "loss": 0.0081, + "step": 629340 + }, + { + "epoch": 1.63, + "learning_rate": 5.529510266187292e-05, + "loss": 0.0083, + "step": 629350 + }, + { + "epoch": 1.63, + "learning_rate": 5.529121444550145e-05, + "loss": 0.0069, + "step": 629360 + }, + { + "epoch": 1.63, + "learning_rate": 5.5287326229129994e-05, + "loss": 0.0098, + "step": 629370 + }, + { + "epoch": 1.63, + "learning_rate": 5.528343801275853e-05, + "loss": 0.0065, + "step": 629380 + }, + { + "epoch": 1.63, + "learning_rate": 5.5279549796387064e-05, + "loss": 0.0094, + "step": 629390 + }, + { + "epoch": 1.63, + "learning_rate": 5.52756615800156e-05, + "loss": 0.0086, + "step": 629400 + }, + { + "epoch": 1.63, + "learning_rate": 5.5271773363644134e-05, + "loss": 0.01, + "step": 629410 + }, + { + "epoch": 1.63, + "learning_rate": 5.526788514727267e-05, + "loss": 0.0088, + "step": 629420 + }, + { + "epoch": 1.63, + "learning_rate": 5.5263996930901204e-05, + "loss": 0.0096, + "step": 629430 + }, + { + "epoch": 1.63, + "learning_rate": 5.526010871452974e-05, + "loss": 0.0103, + "step": 629440 + }, + { + "epoch": 1.63, + "learning_rate": 5.525622049815828e-05, + "loss": 0.0106, + "step": 629450 + }, + { + "epoch": 1.63, + "learning_rate": 5.5252332281786815e-05, + "loss": 0.0066, + "step": 629460 + }, + { + "epoch": 1.63, + "learning_rate": 5.524844406541535e-05, + "loss": 0.008, + "step": 629470 + }, + { + "epoch": 1.63, + "learning_rate": 5.5244555849043885e-05, + "loss": 0.0084, + "step": 629480 + }, + { + "epoch": 1.63, + "learning_rate": 5.524066763267242e-05, + "loss": 0.0091, + "step": 629490 + }, + { + "epoch": 1.63, + "learning_rate": 5.5236779416300954e-05, + "loss": 0.009, + "step": 629500 + }, + { + "epoch": 1.63, + "learning_rate": 5.523289119992949e-05, + "loss": 0.0076, + "step": 629510 + }, + { + "epoch": 1.63, + "learning_rate": 5.5229002983558024e-05, + "loss": 0.0087, + "step": 629520 + }, + { + "epoch": 1.63, + "learning_rate": 5.5225114767186566e-05, + "loss": 0.0076, + "step": 629530 + }, + { + "epoch": 1.63, + "learning_rate": 5.52212265508151e-05, + "loss": 0.0073, + "step": 629540 + }, + { + "epoch": 1.63, + "learning_rate": 5.5217338334443635e-05, + "loss": 0.0076, + "step": 629550 + }, + { + "epoch": 1.63, + "learning_rate": 5.521345011807217e-05, + "loss": 0.0088, + "step": 629560 + }, + { + "epoch": 1.63, + "learning_rate": 5.5209561901700705e-05, + "loss": 0.0089, + "step": 629570 + }, + { + "epoch": 1.63, + "learning_rate": 5.520567368532923e-05, + "loss": 0.008, + "step": 629580 + }, + { + "epoch": 1.63, + "learning_rate": 5.520178546895777e-05, + "loss": 0.0069, + "step": 629590 + }, + { + "epoch": 1.63, + "learning_rate": 5.51978972525863e-05, + "loss": 0.0101, + "step": 629600 + }, + { + "epoch": 1.63, + "learning_rate": 5.519400903621484e-05, + "loss": 0.0094, + "step": 629610 + }, + { + "epoch": 1.63, + "learning_rate": 5.519012081984337e-05, + "loss": 0.0102, + "step": 629620 + }, + { + "epoch": 1.63, + "learning_rate": 5.5186232603471914e-05, + "loss": 0.0107, + "step": 629630 + }, + { + "epoch": 1.63, + "learning_rate": 5.518234438710045e-05, + "loss": 0.0071, + "step": 629640 + }, + { + "epoch": 1.63, + "learning_rate": 5.5178456170728984e-05, + "loss": 0.008, + "step": 629650 + }, + { + "epoch": 1.63, + "learning_rate": 5.517456795435752e-05, + "loss": 0.0081, + "step": 629660 + }, + { + "epoch": 1.63, + "learning_rate": 5.5170679737986054e-05, + "loss": 0.0099, + "step": 629670 + }, + { + "epoch": 1.63, + "learning_rate": 5.516679152161459e-05, + "loss": 0.0074, + "step": 629680 + }, + { + "epoch": 1.63, + "learning_rate": 5.5162903305243123e-05, + "loss": 0.0078, + "step": 629690 + }, + { + "epoch": 1.63, + "learning_rate": 5.515901508887166e-05, + "loss": 0.0103, + "step": 629700 + }, + { + "epoch": 1.63, + "learning_rate": 5.515512687250019e-05, + "loss": 0.0089, + "step": 629710 + }, + { + "epoch": 1.63, + "learning_rate": 5.5151238656128735e-05, + "loss": 0.0092, + "step": 629720 + }, + { + "epoch": 1.63, + "learning_rate": 5.514735043975727e-05, + "loss": 0.009, + "step": 629730 + }, + { + "epoch": 1.63, + "learning_rate": 5.5143462223385805e-05, + "loss": 0.0097, + "step": 629740 + }, + { + "epoch": 1.63, + "learning_rate": 5.513957400701434e-05, + "loss": 0.0109, + "step": 629750 + }, + { + "epoch": 1.63, + "learning_rate": 5.5135685790642874e-05, + "loss": 0.0083, + "step": 629760 + }, + { + "epoch": 1.63, + "learning_rate": 5.513179757427141e-05, + "loss": 0.0106, + "step": 629770 + }, + { + "epoch": 1.63, + "learning_rate": 5.5127909357899944e-05, + "loss": 0.0077, + "step": 629780 + }, + { + "epoch": 1.63, + "learning_rate": 5.512402114152848e-05, + "loss": 0.0075, + "step": 629790 + }, + { + "epoch": 1.63, + "learning_rate": 5.512013292515702e-05, + "loss": 0.008, + "step": 629800 + }, + { + "epoch": 1.63, + "learning_rate": 5.5116244708785555e-05, + "loss": 0.0086, + "step": 629810 + }, + { + "epoch": 1.63, + "learning_rate": 5.5112356492414083e-05, + "loss": 0.0099, + "step": 629820 + }, + { + "epoch": 1.63, + "learning_rate": 5.510846827604262e-05, + "loss": 0.0072, + "step": 629830 + }, + { + "epoch": 1.63, + "learning_rate": 5.510458005967115e-05, + "loss": 0.0093, + "step": 629840 + }, + { + "epoch": 1.63, + "learning_rate": 5.510069184329969e-05, + "loss": 0.0085, + "step": 629850 + }, + { + "epoch": 1.63, + "learning_rate": 5.509680362692822e-05, + "loss": 0.0097, + "step": 629860 + }, + { + "epoch": 1.63, + "learning_rate": 5.509291541055676e-05, + "loss": 0.0116, + "step": 629870 + }, + { + "epoch": 1.63, + "learning_rate": 5.508902719418529e-05, + "loss": 0.0092, + "step": 629880 + }, + { + "epoch": 1.63, + "learning_rate": 5.508513897781383e-05, + "loss": 0.0086, + "step": 629890 + }, + { + "epoch": 1.63, + "learning_rate": 5.508125076144237e-05, + "loss": 0.0073, + "step": 629900 + }, + { + "epoch": 1.63, + "learning_rate": 5.5077362545070904e-05, + "loss": 0.008, + "step": 629910 + }, + { + "epoch": 1.63, + "learning_rate": 5.507347432869944e-05, + "loss": 0.0069, + "step": 629920 + }, + { + "epoch": 1.63, + "learning_rate": 5.5069586112327974e-05, + "loss": 0.0096, + "step": 629930 + }, + { + "epoch": 1.63, + "learning_rate": 5.506569789595651e-05, + "loss": 0.0081, + "step": 629940 + }, + { + "epoch": 1.63, + "learning_rate": 5.5061809679585043e-05, + "loss": 0.0102, + "step": 629950 + }, + { + "epoch": 1.63, + "learning_rate": 5.505792146321358e-05, + "loss": 0.0071, + "step": 629960 + }, + { + "epoch": 1.63, + "learning_rate": 5.505403324684211e-05, + "loss": 0.0083, + "step": 629970 + }, + { + "epoch": 1.63, + "learning_rate": 5.5050145030470655e-05, + "loss": 0.0082, + "step": 629980 + }, + { + "epoch": 1.63, + "learning_rate": 5.504625681409919e-05, + "loss": 0.0109, + "step": 629990 + }, + { + "epoch": 1.63, + "learning_rate": 5.5042368597727725e-05, + "loss": 0.0115, + "step": 630000 + }, + { + "epoch": 1.63, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.005582030396908522, + "eval_runtime": 107.8577, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 630000 + }, + { + "epoch": 1.63, + "learning_rate": 5.503848038135626e-05, + "loss": 0.0085, + "step": 630010 + }, + { + "epoch": 1.63, + "learning_rate": 5.5034592164984794e-05, + "loss": 0.0082, + "step": 630020 + }, + { + "epoch": 1.63, + "learning_rate": 5.503070394861333e-05, + "loss": 0.0082, + "step": 630030 + }, + { + "epoch": 1.63, + "learning_rate": 5.5026815732241864e-05, + "loss": 0.007, + "step": 630040 + }, + { + "epoch": 1.63, + "learning_rate": 5.50229275158704e-05, + "loss": 0.01, + "step": 630050 + }, + { + "epoch": 1.63, + "learning_rate": 5.501903929949894e-05, + "loss": 0.0066, + "step": 630060 + }, + { + "epoch": 1.63, + "learning_rate": 5.501515108312746e-05, + "loss": 0.0118, + "step": 630070 + }, + { + "epoch": 1.63, + "learning_rate": 5.5011262866756003e-05, + "loss": 0.0174, + "step": 630080 + }, + { + "epoch": 1.63, + "learning_rate": 5.500737465038454e-05, + "loss": 0.008, + "step": 630090 + }, + { + "epoch": 1.63, + "learning_rate": 5.500348643401307e-05, + "loss": 0.0092, + "step": 630100 + }, + { + "epoch": 1.63, + "learning_rate": 5.499959821764161e-05, + "loss": 0.0082, + "step": 630110 + }, + { + "epoch": 1.63, + "learning_rate": 5.499571000127014e-05, + "loss": 0.0089, + "step": 630120 + }, + { + "epoch": 1.63, + "learning_rate": 5.499182178489868e-05, + "loss": 0.0064, + "step": 630130 + }, + { + "epoch": 1.63, + "learning_rate": 5.498793356852721e-05, + "loss": 0.0072, + "step": 630140 + }, + { + "epoch": 1.63, + "learning_rate": 5.498404535215575e-05, + "loss": 0.0085, + "step": 630150 + }, + { + "epoch": 1.63, + "learning_rate": 5.498015713578429e-05, + "loss": 0.0095, + "step": 630160 + }, + { + "epoch": 1.63, + "learning_rate": 5.4976268919412824e-05, + "loss": 0.0072, + "step": 630170 + }, + { + "epoch": 1.63, + "learning_rate": 5.497238070304136e-05, + "loss": 0.0097, + "step": 630180 + }, + { + "epoch": 1.63, + "learning_rate": 5.4968492486669894e-05, + "loss": 0.0106, + "step": 630190 + }, + { + "epoch": 1.63, + "learning_rate": 5.496460427029843e-05, + "loss": 0.0113, + "step": 630200 + }, + { + "epoch": 1.63, + "learning_rate": 5.496071605392696e-05, + "loss": 0.0092, + "step": 630210 + }, + { + "epoch": 1.63, + "learning_rate": 5.49568278375555e-05, + "loss": 0.007, + "step": 630220 + }, + { + "epoch": 1.63, + "learning_rate": 5.495293962118403e-05, + "loss": 0.0088, + "step": 630230 + }, + { + "epoch": 1.63, + "learning_rate": 5.4949051404812575e-05, + "loss": 0.0059, + "step": 630240 + }, + { + "epoch": 1.63, + "learning_rate": 5.494516318844111e-05, + "loss": 0.0103, + "step": 630250 + }, + { + "epoch": 1.63, + "learning_rate": 5.4941274972069644e-05, + "loss": 0.0084, + "step": 630260 + }, + { + "epoch": 1.63, + "learning_rate": 5.493738675569818e-05, + "loss": 0.007, + "step": 630270 + }, + { + "epoch": 1.63, + "learning_rate": 5.4933498539326714e-05, + "loss": 0.0057, + "step": 630280 + }, + { + "epoch": 1.63, + "learning_rate": 5.492961032295525e-05, + "loss": 0.0079, + "step": 630290 + }, + { + "epoch": 1.63, + "learning_rate": 5.4925722106583784e-05, + "loss": 0.0083, + "step": 630300 + }, + { + "epoch": 1.63, + "learning_rate": 5.492183389021232e-05, + "loss": 0.0088, + "step": 630310 + }, + { + "epoch": 1.63, + "learning_rate": 5.491794567384085e-05, + "loss": 0.0098, + "step": 630320 + }, + { + "epoch": 1.63, + "learning_rate": 5.491405745746938e-05, + "loss": 0.0083, + "step": 630330 + }, + { + "epoch": 1.63, + "learning_rate": 5.491016924109792e-05, + "loss": 0.0072, + "step": 630340 + }, + { + "epoch": 1.63, + "learning_rate": 5.490628102472646e-05, + "loss": 0.0079, + "step": 630350 + }, + { + "epoch": 1.63, + "learning_rate": 5.490239280835499e-05, + "loss": 0.01, + "step": 630360 + }, + { + "epoch": 1.63, + "learning_rate": 5.489850459198353e-05, + "loss": 0.0101, + "step": 630370 + }, + { + "epoch": 1.63, + "learning_rate": 5.489461637561206e-05, + "loss": 0.0073, + "step": 630380 + }, + { + "epoch": 1.63, + "learning_rate": 5.48907281592406e-05, + "loss": 0.0078, + "step": 630390 + }, + { + "epoch": 1.63, + "learning_rate": 5.488683994286913e-05, + "loss": 0.0113, + "step": 630400 + }, + { + "epoch": 1.63, + "learning_rate": 5.488295172649767e-05, + "loss": 0.0072, + "step": 630410 + }, + { + "epoch": 1.63, + "learning_rate": 5.487906351012621e-05, + "loss": 0.0091, + "step": 630420 + }, + { + "epoch": 1.63, + "learning_rate": 5.4875175293754744e-05, + "loss": 0.0085, + "step": 630430 + }, + { + "epoch": 1.63, + "learning_rate": 5.487128707738328e-05, + "loss": 0.0086, + "step": 630440 + }, + { + "epoch": 1.63, + "learning_rate": 5.4867398861011814e-05, + "loss": 0.0097, + "step": 630450 + }, + { + "epoch": 1.63, + "learning_rate": 5.486351064464035e-05, + "loss": 0.0075, + "step": 630460 + }, + { + "epoch": 1.63, + "learning_rate": 5.485962242826888e-05, + "loss": 0.0087, + "step": 630470 + }, + { + "epoch": 1.63, + "learning_rate": 5.485573421189742e-05, + "loss": 0.0077, + "step": 630480 + }, + { + "epoch": 1.63, + "learning_rate": 5.485184599552595e-05, + "loss": 0.0074, + "step": 630490 + }, + { + "epoch": 1.63, + "learning_rate": 5.4847957779154495e-05, + "loss": 0.0088, + "step": 630500 + }, + { + "epoch": 1.63, + "learning_rate": 5.484406956278303e-05, + "loss": 0.007, + "step": 630510 + }, + { + "epoch": 1.63, + "learning_rate": 5.4840181346411564e-05, + "loss": 0.0098, + "step": 630520 + }, + { + "epoch": 1.63, + "learning_rate": 5.48362931300401e-05, + "loss": 0.0074, + "step": 630530 + }, + { + "epoch": 1.63, + "learning_rate": 5.4832404913668634e-05, + "loss": 0.0066, + "step": 630540 + }, + { + "epoch": 1.63, + "learning_rate": 5.482851669729717e-05, + "loss": 0.0088, + "step": 630550 + }, + { + "epoch": 1.63, + "learning_rate": 5.4824628480925704e-05, + "loss": 0.0056, + "step": 630560 + }, + { + "epoch": 1.63, + "learning_rate": 5.482074026455423e-05, + "loss": 0.0084, + "step": 630570 + }, + { + "epoch": 1.63, + "learning_rate": 5.481685204818277e-05, + "loss": 0.0119, + "step": 630580 + }, + { + "epoch": 1.63, + "learning_rate": 5.48129638318113e-05, + "loss": 0.0084, + "step": 630590 + }, + { + "epoch": 1.63, + "learning_rate": 5.480907561543984e-05, + "loss": 0.0074, + "step": 630600 + }, + { + "epoch": 1.63, + "learning_rate": 5.480518739906838e-05, + "loss": 0.0078, + "step": 630610 + }, + { + "epoch": 1.63, + "learning_rate": 5.480129918269691e-05, + "loss": 0.0095, + "step": 630620 + }, + { + "epoch": 1.63, + "learning_rate": 5.479741096632545e-05, + "loss": 0.0076, + "step": 630630 + }, + { + "epoch": 1.63, + "learning_rate": 5.479352274995398e-05, + "loss": 0.0051, + "step": 630640 + }, + { + "epoch": 1.63, + "learning_rate": 5.478963453358252e-05, + "loss": 0.0073, + "step": 630650 + }, + { + "epoch": 1.63, + "learning_rate": 5.478574631721105e-05, + "loss": 0.01, + "step": 630660 + }, + { + "epoch": 1.63, + "learning_rate": 5.478185810083959e-05, + "loss": 0.0072, + "step": 630670 + }, + { + "epoch": 1.63, + "learning_rate": 5.477796988446813e-05, + "loss": 0.0103, + "step": 630680 + }, + { + "epoch": 1.63, + "learning_rate": 5.4774081668096664e-05, + "loss": 0.0044, + "step": 630690 + }, + { + "epoch": 1.63, + "learning_rate": 5.47701934517252e-05, + "loss": 0.0072, + "step": 630700 + }, + { + "epoch": 1.63, + "learning_rate": 5.4766305235353734e-05, + "loss": 0.0088, + "step": 630710 + }, + { + "epoch": 1.63, + "learning_rate": 5.476241701898227e-05, + "loss": 0.0092, + "step": 630720 + }, + { + "epoch": 1.63, + "learning_rate": 5.47585288026108e-05, + "loss": 0.0097, + "step": 630730 + }, + { + "epoch": 1.63, + "learning_rate": 5.475464058623934e-05, + "loss": 0.0075, + "step": 630740 + }, + { + "epoch": 1.63, + "learning_rate": 5.475075236986787e-05, + "loss": 0.0076, + "step": 630750 + }, + { + "epoch": 1.64, + "learning_rate": 5.4746864153496415e-05, + "loss": 0.0091, + "step": 630760 + }, + { + "epoch": 1.64, + "learning_rate": 5.474297593712495e-05, + "loss": 0.0126, + "step": 630770 + }, + { + "epoch": 1.64, + "learning_rate": 5.4739087720753484e-05, + "loss": 0.0083, + "step": 630780 + }, + { + "epoch": 1.64, + "learning_rate": 5.473519950438202e-05, + "loss": 0.0119, + "step": 630790 + }, + { + "epoch": 1.64, + "learning_rate": 5.4731311288010554e-05, + "loss": 0.009, + "step": 630800 + }, + { + "epoch": 1.64, + "learning_rate": 5.472742307163909e-05, + "loss": 0.0091, + "step": 630810 + }, + { + "epoch": 1.64, + "learning_rate": 5.472353485526762e-05, + "loss": 0.0099, + "step": 630820 + }, + { + "epoch": 1.64, + "learning_rate": 5.471964663889615e-05, + "loss": 0.0069, + "step": 630830 + }, + { + "epoch": 1.64, + "learning_rate": 5.471575842252469e-05, + "loss": 0.0143, + "step": 630840 + }, + { + "epoch": 1.64, + "learning_rate": 5.471187020615322e-05, + "loss": 0.0071, + "step": 630850 + }, + { + "epoch": 1.64, + "learning_rate": 5.470798198978176e-05, + "loss": 0.0123, + "step": 630860 + }, + { + "epoch": 1.64, + "learning_rate": 5.47040937734103e-05, + "loss": 0.0072, + "step": 630870 + }, + { + "epoch": 1.64, + "learning_rate": 5.470020555703883e-05, + "loss": 0.0073, + "step": 630880 + }, + { + "epoch": 1.64, + "learning_rate": 5.469631734066737e-05, + "loss": 0.0088, + "step": 630890 + }, + { + "epoch": 1.64, + "learning_rate": 5.46924291242959e-05, + "loss": 0.01, + "step": 630900 + }, + { + "epoch": 1.64, + "learning_rate": 5.468854090792444e-05, + "loss": 0.0102, + "step": 630910 + }, + { + "epoch": 1.64, + "learning_rate": 5.468465269155297e-05, + "loss": 0.0104, + "step": 630920 + }, + { + "epoch": 1.64, + "learning_rate": 5.468076447518151e-05, + "loss": 0.0091, + "step": 630930 + }, + { + "epoch": 1.64, + "learning_rate": 5.467687625881005e-05, + "loss": 0.0088, + "step": 630940 + }, + { + "epoch": 1.64, + "learning_rate": 5.4672988042438584e-05, + "loss": 0.008, + "step": 630950 + }, + { + "epoch": 1.64, + "learning_rate": 5.466909982606712e-05, + "loss": 0.0078, + "step": 630960 + }, + { + "epoch": 1.64, + "learning_rate": 5.4665211609695654e-05, + "loss": 0.0062, + "step": 630970 + }, + { + "epoch": 1.64, + "learning_rate": 5.466132339332419e-05, + "loss": 0.0098, + "step": 630980 + }, + { + "epoch": 1.64, + "learning_rate": 5.465743517695272e-05, + "loss": 0.0073, + "step": 630990 + }, + { + "epoch": 1.64, + "learning_rate": 5.465354696058126e-05, + "loss": 0.0064, + "step": 631000 + }, + { + "epoch": 1.64, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.0054400768131017685, + "eval_runtime": 107.7582, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, + "step": 631000 + }, + { + "epoch": 1.64, + "learning_rate": 5.464965874420979e-05, + "loss": 0.0078, + "step": 631010 + }, + { + "epoch": 1.64, + "learning_rate": 5.464577052783833e-05, + "loss": 0.0093, + "step": 631020 + }, + { + "epoch": 1.64, + "learning_rate": 5.464188231146687e-05, + "loss": 0.0082, + "step": 631030 + }, + { + "epoch": 1.64, + "learning_rate": 5.4637994095095404e-05, + "loss": 0.0068, + "step": 631040 + }, + { + "epoch": 1.64, + "learning_rate": 5.463410587872394e-05, + "loss": 0.0077, + "step": 631050 + }, + { + "epoch": 1.64, + "learning_rate": 5.463021766235247e-05, + "loss": 0.0074, + "step": 631060 + }, + { + "epoch": 1.64, + "learning_rate": 5.4626329445981e-05, + "loss": 0.008, + "step": 631070 + }, + { + "epoch": 1.64, + "learning_rate": 5.462244122960954e-05, + "loss": 0.0093, + "step": 631080 + }, + { + "epoch": 1.64, + "learning_rate": 5.461855301323807e-05, + "loss": 0.0074, + "step": 631090 + }, + { + "epoch": 1.64, + "learning_rate": 5.461466479686661e-05, + "loss": 0.0087, + "step": 631100 + }, + { + "epoch": 1.64, + "learning_rate": 5.461077658049514e-05, + "loss": 0.0095, + "step": 631110 + }, + { + "epoch": 1.64, + "learning_rate": 5.460688836412368e-05, + "loss": 0.0087, + "step": 631120 + }, + { + "epoch": 1.64, + "learning_rate": 5.460300014775222e-05, + "loss": 0.0066, + "step": 631130 + }, + { + "epoch": 1.64, + "learning_rate": 5.459911193138075e-05, + "loss": 0.0076, + "step": 631140 + }, + { + "epoch": 1.64, + "learning_rate": 5.459522371500929e-05, + "loss": 0.0087, + "step": 631150 + }, + { + "epoch": 1.64, + "learning_rate": 5.459133549863782e-05, + "loss": 0.0122, + "step": 631160 + }, + { + "epoch": 1.64, + "learning_rate": 5.458744728226636e-05, + "loss": 0.0104, + "step": 631170 + }, + { + "epoch": 1.64, + "learning_rate": 5.458355906589489e-05, + "loss": 0.0079, + "step": 631180 + }, + { + "epoch": 1.64, + "learning_rate": 5.457967084952343e-05, + "loss": 0.0062, + "step": 631190 + }, + { + "epoch": 1.64, + "learning_rate": 5.457578263315196e-05, + "loss": 0.0081, + "step": 631200 + }, + { + "epoch": 1.64, + "learning_rate": 5.4571894416780504e-05, + "loss": 0.0112, + "step": 631210 + }, + { + "epoch": 1.64, + "learning_rate": 5.456800620040904e-05, + "loss": 0.0104, + "step": 631220 + }, + { + "epoch": 1.64, + "learning_rate": 5.4564117984037573e-05, + "loss": 0.0129, + "step": 631230 + }, + { + "epoch": 1.64, + "learning_rate": 5.456022976766611e-05, + "loss": 0.0067, + "step": 631240 + }, + { + "epoch": 1.64, + "learning_rate": 5.455634155129464e-05, + "loss": 0.0105, + "step": 631250 + }, + { + "epoch": 1.64, + "learning_rate": 5.455245333492318e-05, + "loss": 0.0095, + "step": 631260 + }, + { + "epoch": 1.64, + "learning_rate": 5.454856511855171e-05, + "loss": 0.0077, + "step": 631270 + }, + { + "epoch": 1.64, + "learning_rate": 5.454467690218025e-05, + "loss": 0.0075, + "step": 631280 + }, + { + "epoch": 1.64, + "learning_rate": 5.454078868580879e-05, + "loss": 0.0071, + "step": 631290 + }, + { + "epoch": 1.64, + "learning_rate": 5.4536900469437324e-05, + "loss": 0.0075, + "step": 631300 + }, + { + "epoch": 1.64, + "learning_rate": 5.453301225306585e-05, + "loss": 0.0094, + "step": 631310 + }, + { + "epoch": 1.64, + "learning_rate": 5.452912403669439e-05, + "loss": 0.0076, + "step": 631320 + }, + { + "epoch": 1.64, + "learning_rate": 5.452523582032292e-05, + "loss": 0.0107, + "step": 631330 + }, + { + "epoch": 1.64, + "learning_rate": 5.452134760395146e-05, + "loss": 0.0088, + "step": 631340 + }, + { + "epoch": 1.64, + "learning_rate": 5.451745938757999e-05, + "loss": 0.0072, + "step": 631350 + }, + { + "epoch": 1.64, + "learning_rate": 5.451357117120853e-05, + "loss": 0.0092, + "step": 631360 + }, + { + "epoch": 1.64, + "learning_rate": 5.450968295483706e-05, + "loss": 0.0059, + "step": 631370 + }, + { + "epoch": 1.64, + "learning_rate": 5.4505794738465596e-05, + "loss": 0.0082, + "step": 631380 + }, + { + "epoch": 1.64, + "learning_rate": 5.450190652209414e-05, + "loss": 0.009, + "step": 631390 + }, + { + "epoch": 1.64, + "learning_rate": 5.449801830572267e-05, + "loss": 0.0098, + "step": 631400 + }, + { + "epoch": 1.64, + "learning_rate": 5.449413008935121e-05, + "loss": 0.0109, + "step": 631410 + }, + { + "epoch": 1.64, + "learning_rate": 5.449024187297974e-05, + "loss": 0.0115, + "step": 631420 + }, + { + "epoch": 1.64, + "learning_rate": 5.448635365660828e-05, + "loss": 0.0081, + "step": 631430 + }, + { + "epoch": 1.64, + "learning_rate": 5.448246544023681e-05, + "loss": 0.0086, + "step": 631440 + }, + { + "epoch": 1.64, + "learning_rate": 5.447857722386535e-05, + "loss": 0.0124, + "step": 631450 + }, + { + "epoch": 1.64, + "learning_rate": 5.447468900749388e-05, + "loss": 0.0078, + "step": 631460 + }, + { + "epoch": 1.64, + "learning_rate": 5.4470800791122424e-05, + "loss": 0.0094, + "step": 631470 + }, + { + "epoch": 1.64, + "learning_rate": 5.446691257475096e-05, + "loss": 0.0068, + "step": 631480 + }, + { + "epoch": 1.64, + "learning_rate": 5.4463024358379493e-05, + "loss": 0.0062, + "step": 631490 + }, + { + "epoch": 1.64, + "learning_rate": 5.445913614200803e-05, + "loss": 0.0087, + "step": 631500 + }, + { + "epoch": 1.64, + "learning_rate": 5.445524792563656e-05, + "loss": 0.0088, + "step": 631510 + }, + { + "epoch": 1.64, + "learning_rate": 5.44513597092651e-05, + "loss": 0.0071, + "step": 631520 + }, + { + "epoch": 1.64, + "learning_rate": 5.444747149289363e-05, + "loss": 0.009, + "step": 631530 + }, + { + "epoch": 1.64, + "learning_rate": 5.444358327652217e-05, + "loss": 0.0128, + "step": 631540 + }, + { + "epoch": 1.64, + "learning_rate": 5.443969506015071e-05, + "loss": 0.0095, + "step": 631550 + }, + { + "epoch": 1.64, + "learning_rate": 5.443580684377923e-05, + "loss": 0.0053, + "step": 631560 + }, + { + "epoch": 1.64, + "learning_rate": 5.443191862740777e-05, + "loss": 0.0072, + "step": 631570 + }, + { + "epoch": 1.64, + "learning_rate": 5.442803041103631e-05, + "loss": 0.0115, + "step": 631580 + }, + { + "epoch": 1.64, + "learning_rate": 5.442414219466484e-05, + "loss": 0.0083, + "step": 631590 + }, + { + "epoch": 1.64, + "learning_rate": 5.442025397829338e-05, + "loss": 0.0062, + "step": 631600 + }, + { + "epoch": 1.64, + "learning_rate": 5.441636576192191e-05, + "loss": 0.0095, + "step": 631610 + }, + { + "epoch": 1.64, + "learning_rate": 5.441247754555045e-05, + "loss": 0.0097, + "step": 631620 + }, + { + "epoch": 1.64, + "learning_rate": 5.440858932917898e-05, + "loss": 0.008, + "step": 631630 + }, + { + "epoch": 1.64, + "learning_rate": 5.4404701112807516e-05, + "loss": 0.0069, + "step": 631640 + }, + { + "epoch": 1.64, + "learning_rate": 5.440081289643606e-05, + "loss": 0.0069, + "step": 631650 + }, + { + "epoch": 1.64, + "learning_rate": 5.439692468006459e-05, + "loss": 0.0072, + "step": 631660 + }, + { + "epoch": 1.64, + "learning_rate": 5.439303646369313e-05, + "loss": 0.0071, + "step": 631670 + }, + { + "epoch": 1.64, + "learning_rate": 5.438914824732166e-05, + "loss": 0.0095, + "step": 631680 + }, + { + "epoch": 1.64, + "learning_rate": 5.43852600309502e-05, + "loss": 0.0078, + "step": 631690 + }, + { + "epoch": 1.64, + "learning_rate": 5.438137181457873e-05, + "loss": 0.0073, + "step": 631700 + }, + { + "epoch": 1.64, + "learning_rate": 5.437748359820727e-05, + "loss": 0.0075, + "step": 631710 + }, + { + "epoch": 1.64, + "learning_rate": 5.43735953818358e-05, + "loss": 0.0094, + "step": 631720 + }, + { + "epoch": 1.64, + "learning_rate": 5.4369707165464344e-05, + "loss": 0.006, + "step": 631730 + }, + { + "epoch": 1.64, + "learning_rate": 5.436581894909288e-05, + "loss": 0.0081, + "step": 631740 + }, + { + "epoch": 1.64, + "learning_rate": 5.436193073272141e-05, + "loss": 0.0059, + "step": 631750 + }, + { + "epoch": 1.64, + "learning_rate": 5.435804251634995e-05, + "loss": 0.0067, + "step": 631760 + }, + { + "epoch": 1.64, + "learning_rate": 5.435415429997848e-05, + "loss": 0.0117, + "step": 631770 + }, + { + "epoch": 1.64, + "learning_rate": 5.435026608360702e-05, + "loss": 0.0079, + "step": 631780 + }, + { + "epoch": 1.64, + "learning_rate": 5.434637786723555e-05, + "loss": 0.0081, + "step": 631790 + }, + { + "epoch": 1.64, + "learning_rate": 5.434248965086409e-05, + "loss": 0.009, + "step": 631800 + }, + { + "epoch": 1.64, + "learning_rate": 5.4338601434492616e-05, + "loss": 0.0085, + "step": 631810 + }, + { + "epoch": 1.64, + "learning_rate": 5.433471321812115e-05, + "loss": 0.0067, + "step": 631820 + }, + { + "epoch": 1.64, + "learning_rate": 5.433082500174969e-05, + "loss": 0.0077, + "step": 631830 + }, + { + "epoch": 1.64, + "learning_rate": 5.432693678537823e-05, + "loss": 0.0078, + "step": 631840 + }, + { + "epoch": 1.64, + "learning_rate": 5.432304856900676e-05, + "loss": 0.0097, + "step": 631850 + }, + { + "epoch": 1.64, + "learning_rate": 5.43191603526353e-05, + "loss": 0.01, + "step": 631860 + }, + { + "epoch": 1.64, + "learning_rate": 5.431527213626383e-05, + "loss": 0.009, + "step": 631870 + }, + { + "epoch": 1.64, + "learning_rate": 5.4311383919892367e-05, + "loss": 0.0064, + "step": 631880 + }, + { + "epoch": 1.64, + "learning_rate": 5.43074957035209e-05, + "loss": 0.008, + "step": 631890 + }, + { + "epoch": 1.64, + "learning_rate": 5.4303607487149436e-05, + "loss": 0.0066, + "step": 631900 + }, + { + "epoch": 1.64, + "learning_rate": 5.429971927077798e-05, + "loss": 0.0056, + "step": 631910 + }, + { + "epoch": 1.64, + "learning_rate": 5.429583105440651e-05, + "loss": 0.0093, + "step": 631920 + }, + { + "epoch": 1.64, + "learning_rate": 5.429194283803505e-05, + "loss": 0.0099, + "step": 631930 + }, + { + "epoch": 1.64, + "learning_rate": 5.428805462166358e-05, + "loss": 0.0087, + "step": 631940 + }, + { + "epoch": 1.64, + "learning_rate": 5.428416640529212e-05, + "loss": 0.0073, + "step": 631950 + }, + { + "epoch": 1.64, + "learning_rate": 5.428027818892065e-05, + "loss": 0.0068, + "step": 631960 + }, + { + "epoch": 1.64, + "learning_rate": 5.427638997254919e-05, + "loss": 0.0083, + "step": 631970 + }, + { + "epoch": 1.64, + "learning_rate": 5.427250175617772e-05, + "loss": 0.006, + "step": 631980 + }, + { + "epoch": 1.64, + "learning_rate": 5.4268613539806264e-05, + "loss": 0.0083, + "step": 631990 + }, + { + "epoch": 1.64, + "learning_rate": 5.42647253234348e-05, + "loss": 0.0084, + "step": 632000 + }, + { + "epoch": 1.64, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.005452393088489771, + "eval_runtime": 107.8252, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 632000 + }, + { + "epoch": 1.64, + "learning_rate": 5.426083710706333e-05, + "loss": 0.0071, + "step": 632010 + }, + { + "epoch": 1.64, + "learning_rate": 5.425694889069187e-05, + "loss": 0.0097, + "step": 632020 + }, + { + "epoch": 1.64, + "learning_rate": 5.42530606743204e-05, + "loss": 0.0083, + "step": 632030 + }, + { + "epoch": 1.64, + "learning_rate": 5.424917245794894e-05, + "loss": 0.0072, + "step": 632040 + }, + { + "epoch": 1.64, + "learning_rate": 5.424528424157747e-05, + "loss": 0.0069, + "step": 632050 + }, + { + "epoch": 1.64, + "learning_rate": 5.4241396025206e-05, + "loss": 0.007, + "step": 632060 + }, + { + "epoch": 1.64, + "learning_rate": 5.4237507808834536e-05, + "loss": 0.0086, + "step": 632070 + }, + { + "epoch": 1.64, + "learning_rate": 5.423361959246307e-05, + "loss": 0.008, + "step": 632080 + }, + { + "epoch": 1.64, + "learning_rate": 5.422973137609161e-05, + "loss": 0.0063, + "step": 632090 + }, + { + "epoch": 1.64, + "learning_rate": 5.422584315972015e-05, + "loss": 0.0073, + "step": 632100 + }, + { + "epoch": 1.64, + "learning_rate": 5.422195494334868e-05, + "loss": 0.0111, + "step": 632110 + }, + { + "epoch": 1.64, + "learning_rate": 5.421806672697722e-05, + "loss": 0.0084, + "step": 632120 + }, + { + "epoch": 1.64, + "learning_rate": 5.421417851060575e-05, + "loss": 0.0102, + "step": 632130 + }, + { + "epoch": 1.64, + "learning_rate": 5.4210290294234287e-05, + "loss": 0.0074, + "step": 632140 + }, + { + "epoch": 1.64, + "learning_rate": 5.420640207786282e-05, + "loss": 0.007, + "step": 632150 + }, + { + "epoch": 1.64, + "learning_rate": 5.4202513861491356e-05, + "loss": 0.0102, + "step": 632160 + }, + { + "epoch": 1.64, + "learning_rate": 5.41986256451199e-05, + "loss": 0.008, + "step": 632170 + }, + { + "epoch": 1.64, + "learning_rate": 5.419473742874843e-05, + "loss": 0.0083, + "step": 632180 + }, + { + "epoch": 1.64, + "learning_rate": 5.419084921237697e-05, + "loss": 0.0083, + "step": 632190 + }, + { + "epoch": 1.64, + "learning_rate": 5.41869609960055e-05, + "loss": 0.0073, + "step": 632200 + }, + { + "epoch": 1.64, + "learning_rate": 5.418307277963404e-05, + "loss": 0.009, + "step": 632210 + }, + { + "epoch": 1.64, + "learning_rate": 5.417918456326257e-05, + "loss": 0.0077, + "step": 632220 + }, + { + "epoch": 1.64, + "learning_rate": 5.417529634689111e-05, + "loss": 0.0081, + "step": 632230 + }, + { + "epoch": 1.64, + "learning_rate": 5.417140813051964e-05, + "loss": 0.0047, + "step": 632240 + }, + { + "epoch": 1.64, + "learning_rate": 5.4167519914148184e-05, + "loss": 0.0086, + "step": 632250 + }, + { + "epoch": 1.64, + "learning_rate": 5.416363169777672e-05, + "loss": 0.0054, + "step": 632260 + }, + { + "epoch": 1.64, + "learning_rate": 5.415974348140525e-05, + "loss": 0.0091, + "step": 632270 + }, + { + "epoch": 1.64, + "learning_rate": 5.415585526503379e-05, + "loss": 0.0054, + "step": 632280 + }, + { + "epoch": 1.64, + "learning_rate": 5.415196704866232e-05, + "loss": 0.006, + "step": 632290 + }, + { + "epoch": 1.64, + "learning_rate": 5.414807883229085e-05, + "loss": 0.0068, + "step": 632300 + }, + { + "epoch": 1.64, + "learning_rate": 5.4144190615919386e-05, + "loss": 0.0062, + "step": 632310 + }, + { + "epoch": 1.64, + "learning_rate": 5.414030239954792e-05, + "loss": 0.0098, + "step": 632320 + }, + { + "epoch": 1.64, + "learning_rate": 5.4136414183176456e-05, + "loss": 0.0068, + "step": 632330 + }, + { + "epoch": 1.64, + "learning_rate": 5.413252596680499e-05, + "loss": 0.0095, + "step": 632340 + }, + { + "epoch": 1.64, + "learning_rate": 5.412863775043353e-05, + "loss": 0.0091, + "step": 632350 + }, + { + "epoch": 1.64, + "learning_rate": 5.412474953406207e-05, + "loss": 0.0076, + "step": 632360 + }, + { + "epoch": 1.64, + "learning_rate": 5.41208613176906e-05, + "loss": 0.0106, + "step": 632370 + }, + { + "epoch": 1.64, + "learning_rate": 5.411697310131914e-05, + "loss": 0.0082, + "step": 632380 + }, + { + "epoch": 1.64, + "learning_rate": 5.411308488494767e-05, + "loss": 0.0068, + "step": 632390 + }, + { + "epoch": 1.64, + "learning_rate": 5.4109196668576206e-05, + "loss": 0.0085, + "step": 632400 + }, + { + "epoch": 1.64, + "learning_rate": 5.410530845220474e-05, + "loss": 0.0086, + "step": 632410 + }, + { + "epoch": 1.64, + "learning_rate": 5.4101420235833276e-05, + "loss": 0.0086, + "step": 632420 + }, + { + "epoch": 1.64, + "learning_rate": 5.409753201946182e-05, + "loss": 0.0065, + "step": 632430 + }, + { + "epoch": 1.64, + "learning_rate": 5.409364380309035e-05, + "loss": 0.0061, + "step": 632440 + }, + { + "epoch": 1.64, + "learning_rate": 5.408975558671889e-05, + "loss": 0.0082, + "step": 632450 + }, + { + "epoch": 1.64, + "learning_rate": 5.408586737034742e-05, + "loss": 0.0061, + "step": 632460 + }, + { + "epoch": 1.64, + "learning_rate": 5.408197915397596e-05, + "loss": 0.0067, + "step": 632470 + }, + { + "epoch": 1.64, + "learning_rate": 5.407809093760449e-05, + "loss": 0.0067, + "step": 632480 + }, + { + "epoch": 1.64, + "learning_rate": 5.407420272123303e-05, + "loss": 0.0084, + "step": 632490 + }, + { + "epoch": 1.64, + "learning_rate": 5.407031450486156e-05, + "loss": 0.0081, + "step": 632500 + }, + { + "epoch": 1.64, + "learning_rate": 5.40664262884901e-05, + "loss": 0.0088, + "step": 632510 + }, + { + "epoch": 1.64, + "learning_rate": 5.406253807211864e-05, + "loss": 0.0089, + "step": 632520 + }, + { + "epoch": 1.64, + "learning_rate": 5.405864985574717e-05, + "loss": 0.0075, + "step": 632530 + }, + { + "epoch": 1.64, + "learning_rate": 5.405476163937571e-05, + "loss": 0.0084, + "step": 632540 + }, + { + "epoch": 1.64, + "learning_rate": 5.4050873423004236e-05, + "loss": 0.0091, + "step": 632550 + }, + { + "epoch": 1.64, + "learning_rate": 5.404698520663277e-05, + "loss": 0.0109, + "step": 632560 + }, + { + "epoch": 1.64, + "learning_rate": 5.4043096990261306e-05, + "loss": 0.0078, + "step": 632570 + }, + { + "epoch": 1.64, + "learning_rate": 5.403920877388984e-05, + "loss": 0.0096, + "step": 632580 + }, + { + "epoch": 1.64, + "learning_rate": 5.4035320557518376e-05, + "loss": 0.0085, + "step": 632590 + }, + { + "epoch": 1.64, + "learning_rate": 5.403143234114691e-05, + "loss": 0.007, + "step": 632600 + }, + { + "epoch": 1.64, + "learning_rate": 5.4027544124775445e-05, + "loss": 0.008, + "step": 632610 + }, + { + "epoch": 1.64, + "learning_rate": 5.402365590840399e-05, + "loss": 0.0095, + "step": 632620 + }, + { + "epoch": 1.64, + "learning_rate": 5.401976769203252e-05, + "loss": 0.0091, + "step": 632630 + }, + { + "epoch": 1.64, + "learning_rate": 5.401587947566106e-05, + "loss": 0.0099, + "step": 632640 + }, + { + "epoch": 1.64, + "learning_rate": 5.401199125928959e-05, + "loss": 0.01, + "step": 632650 + }, + { + "epoch": 1.64, + "learning_rate": 5.4008103042918126e-05, + "loss": 0.0054, + "step": 632660 + }, + { + "epoch": 1.64, + "learning_rate": 5.400421482654666e-05, + "loss": 0.015, + "step": 632670 + }, + { + "epoch": 1.64, + "learning_rate": 5.4000326610175196e-05, + "loss": 0.0087, + "step": 632680 + }, + { + "epoch": 1.64, + "learning_rate": 5.399643839380373e-05, + "loss": 0.0092, + "step": 632690 + }, + { + "epoch": 1.64, + "learning_rate": 5.399255017743227e-05, + "loss": 0.0107, + "step": 632700 + }, + { + "epoch": 1.64, + "learning_rate": 5.398866196106081e-05, + "loss": 0.0077, + "step": 632710 + }, + { + "epoch": 1.64, + "learning_rate": 5.398477374468934e-05, + "loss": 0.0086, + "step": 632720 + }, + { + "epoch": 1.64, + "learning_rate": 5.398088552831788e-05, + "loss": 0.0075, + "step": 632730 + }, + { + "epoch": 1.64, + "learning_rate": 5.397699731194641e-05, + "loss": 0.0094, + "step": 632740 + }, + { + "epoch": 1.64, + "learning_rate": 5.397310909557495e-05, + "loss": 0.0114, + "step": 632750 + }, + { + "epoch": 1.64, + "learning_rate": 5.396922087920348e-05, + "loss": 0.0091, + "step": 632760 + }, + { + "epoch": 1.64, + "learning_rate": 5.396533266283202e-05, + "loss": 0.0109, + "step": 632770 + }, + { + "epoch": 1.64, + "learning_rate": 5.396144444646056e-05, + "loss": 0.0069, + "step": 632780 + }, + { + "epoch": 1.64, + "learning_rate": 5.395755623008909e-05, + "loss": 0.0063, + "step": 632790 + }, + { + "epoch": 1.64, + "learning_rate": 5.395366801371762e-05, + "loss": 0.0088, + "step": 632800 + }, + { + "epoch": 1.64, + "learning_rate": 5.3949779797346156e-05, + "loss": 0.0087, + "step": 632810 + }, + { + "epoch": 1.64, + "learning_rate": 5.394589158097469e-05, + "loss": 0.009, + "step": 632820 + }, + { + "epoch": 1.64, + "learning_rate": 5.3942003364603226e-05, + "loss": 0.008, + "step": 632830 + }, + { + "epoch": 1.64, + "learning_rate": 5.393811514823176e-05, + "loss": 0.0078, + "step": 632840 + }, + { + "epoch": 1.64, + "learning_rate": 5.3934226931860296e-05, + "loss": 0.0069, + "step": 632850 + }, + { + "epoch": 1.64, + "learning_rate": 5.393033871548883e-05, + "loss": 0.0085, + "step": 632860 + }, + { + "epoch": 1.64, + "learning_rate": 5.3926450499117365e-05, + "loss": 0.0123, + "step": 632870 + }, + { + "epoch": 1.64, + "learning_rate": 5.392256228274591e-05, + "loss": 0.0078, + "step": 632880 + }, + { + "epoch": 1.64, + "learning_rate": 5.391867406637444e-05, + "loss": 0.0075, + "step": 632890 + }, + { + "epoch": 1.64, + "learning_rate": 5.391478585000298e-05, + "loss": 0.008, + "step": 632900 + }, + { + "epoch": 1.64, + "learning_rate": 5.391089763363151e-05, + "loss": 0.0068, + "step": 632910 + }, + { + "epoch": 1.64, + "learning_rate": 5.3907009417260046e-05, + "loss": 0.0087, + "step": 632920 + }, + { + "epoch": 1.64, + "learning_rate": 5.390312120088858e-05, + "loss": 0.0086, + "step": 632930 + }, + { + "epoch": 1.64, + "learning_rate": 5.3899232984517116e-05, + "loss": 0.0061, + "step": 632940 + }, + { + "epoch": 1.64, + "learning_rate": 5.389534476814565e-05, + "loss": 0.0111, + "step": 632950 + }, + { + "epoch": 1.64, + "learning_rate": 5.389145655177419e-05, + "loss": 0.0106, + "step": 632960 + }, + { + "epoch": 1.64, + "learning_rate": 5.388756833540273e-05, + "loss": 0.0109, + "step": 632970 + }, + { + "epoch": 1.64, + "learning_rate": 5.388368011903126e-05, + "loss": 0.014, + "step": 632980 + }, + { + "epoch": 1.64, + "learning_rate": 5.38797919026598e-05, + "loss": 0.0063, + "step": 632990 + }, + { + "epoch": 1.64, + "learning_rate": 5.387590368628833e-05, + "loss": 0.0107, + "step": 633000 + }, + { + "epoch": 1.64, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.005239309277385473, + "eval_runtime": 107.9136, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 633000 + }, + { + "epoch": 1.64, + "learning_rate": 5.387201546991687e-05, + "loss": 0.0074, + "step": 633010 + }, + { + "epoch": 1.64, + "learning_rate": 5.38681272535454e-05, + "loss": 0.0081, + "step": 633020 + }, + { + "epoch": 1.64, + "learning_rate": 5.386423903717394e-05, + "loss": 0.0056, + "step": 633030 + }, + { + "epoch": 1.64, + "learning_rate": 5.386035082080248e-05, + "loss": 0.01, + "step": 633040 + }, + { + "epoch": 1.64, + "learning_rate": 5.3856462604431e-05, + "loss": 0.0107, + "step": 633050 + }, + { + "epoch": 1.64, + "learning_rate": 5.385257438805954e-05, + "loss": 0.0072, + "step": 633060 + }, + { + "epoch": 1.64, + "learning_rate": 5.3848686171688076e-05, + "loss": 0.01, + "step": 633070 + }, + { + "epoch": 1.64, + "learning_rate": 5.384479795531661e-05, + "loss": 0.0072, + "step": 633080 + }, + { + "epoch": 1.64, + "learning_rate": 5.3840909738945146e-05, + "loss": 0.0103, + "step": 633090 + }, + { + "epoch": 1.64, + "learning_rate": 5.383702152257368e-05, + "loss": 0.0077, + "step": 633100 + }, + { + "epoch": 1.64, + "learning_rate": 5.3833133306202216e-05, + "loss": 0.0078, + "step": 633110 + }, + { + "epoch": 1.64, + "learning_rate": 5.382924508983075e-05, + "loss": 0.0083, + "step": 633120 + }, + { + "epoch": 1.64, + "learning_rate": 5.3825356873459285e-05, + "loss": 0.0091, + "step": 633130 + }, + { + "epoch": 1.64, + "learning_rate": 5.382146865708783e-05, + "loss": 0.0098, + "step": 633140 + }, + { + "epoch": 1.64, + "learning_rate": 5.381758044071636e-05, + "loss": 0.0065, + "step": 633150 + }, + { + "epoch": 1.64, + "learning_rate": 5.3813692224344897e-05, + "loss": 0.0062, + "step": 633160 + }, + { + "epoch": 1.64, + "learning_rate": 5.380980400797343e-05, + "loss": 0.0055, + "step": 633170 + }, + { + "epoch": 1.64, + "learning_rate": 5.3805915791601966e-05, + "loss": 0.0078, + "step": 633180 + }, + { + "epoch": 1.64, + "learning_rate": 5.38020275752305e-05, + "loss": 0.0099, + "step": 633190 + }, + { + "epoch": 1.64, + "learning_rate": 5.3798139358859036e-05, + "loss": 0.0086, + "step": 633200 + }, + { + "epoch": 1.64, + "learning_rate": 5.379425114248757e-05, + "loss": 0.0091, + "step": 633210 + }, + { + "epoch": 1.64, + "learning_rate": 5.379036292611611e-05, + "loss": 0.0101, + "step": 633220 + }, + { + "epoch": 1.64, + "learning_rate": 5.378647470974465e-05, + "loss": 0.0073, + "step": 633230 + }, + { + "epoch": 1.64, + "learning_rate": 5.378258649337318e-05, + "loss": 0.0053, + "step": 633240 + }, + { + "epoch": 1.64, + "learning_rate": 5.377869827700172e-05, + "loss": 0.0066, + "step": 633250 + }, + { + "epoch": 1.64, + "learning_rate": 5.377481006063025e-05, + "loss": 0.01, + "step": 633260 + }, + { + "epoch": 1.64, + "learning_rate": 5.377092184425879e-05, + "loss": 0.0068, + "step": 633270 + }, + { + "epoch": 1.64, + "learning_rate": 5.376703362788732e-05, + "loss": 0.0086, + "step": 633280 + }, + { + "epoch": 1.64, + "learning_rate": 5.3763145411515857e-05, + "loss": 0.0089, + "step": 633290 + }, + { + "epoch": 1.64, + "learning_rate": 5.3759257195144385e-05, + "loss": 0.0091, + "step": 633300 + }, + { + "epoch": 1.64, + "learning_rate": 5.375536897877292e-05, + "loss": 0.009, + "step": 633310 + }, + { + "epoch": 1.64, + "learning_rate": 5.375148076240146e-05, + "loss": 0.0089, + "step": 633320 + }, + { + "epoch": 1.64, + "learning_rate": 5.3747592546029996e-05, + "loss": 0.0088, + "step": 633330 + }, + { + "epoch": 1.64, + "learning_rate": 5.374370432965853e-05, + "loss": 0.0126, + "step": 633340 + }, + { + "epoch": 1.64, + "learning_rate": 5.3739816113287066e-05, + "loss": 0.0063, + "step": 633350 + }, + { + "epoch": 1.64, + "learning_rate": 5.37359278969156e-05, + "loss": 0.0114, + "step": 633360 + }, + { + "epoch": 1.64, + "learning_rate": 5.3732039680544135e-05, + "loss": 0.0104, + "step": 633370 + }, + { + "epoch": 1.64, + "learning_rate": 5.372815146417267e-05, + "loss": 0.0086, + "step": 633380 + }, + { + "epoch": 1.64, + "learning_rate": 5.3724263247801205e-05, + "loss": 0.0068, + "step": 633390 + }, + { + "epoch": 1.64, + "learning_rate": 5.372037503142975e-05, + "loss": 0.0074, + "step": 633400 + }, + { + "epoch": 1.64, + "learning_rate": 5.371648681505828e-05, + "loss": 0.0074, + "step": 633410 + }, + { + "epoch": 1.64, + "learning_rate": 5.3712598598686817e-05, + "loss": 0.0074, + "step": 633420 + }, + { + "epoch": 1.64, + "learning_rate": 5.370871038231535e-05, + "loss": 0.0075, + "step": 633430 + }, + { + "epoch": 1.64, + "learning_rate": 5.3704822165943886e-05, + "loss": 0.0058, + "step": 633440 + }, + { + "epoch": 1.64, + "learning_rate": 5.370093394957242e-05, + "loss": 0.0077, + "step": 633450 + }, + { + "epoch": 1.64, + "learning_rate": 5.3697045733200956e-05, + "loss": 0.0075, + "step": 633460 + }, + { + "epoch": 1.64, + "learning_rate": 5.369315751682949e-05, + "loss": 0.0102, + "step": 633470 + }, + { + "epoch": 1.64, + "learning_rate": 5.368926930045803e-05, + "loss": 0.0066, + "step": 633480 + }, + { + "epoch": 1.64, + "learning_rate": 5.368538108408657e-05, + "loss": 0.0093, + "step": 633490 + }, + { + "epoch": 1.64, + "learning_rate": 5.36814928677151e-05, + "loss": 0.0073, + "step": 633500 + }, + { + "epoch": 1.64, + "learning_rate": 5.367760465134364e-05, + "loss": 0.0106, + "step": 633510 + }, + { + "epoch": 1.64, + "learning_rate": 5.367371643497217e-05, + "loss": 0.007, + "step": 633520 + }, + { + "epoch": 1.64, + "learning_rate": 5.366982821860071e-05, + "loss": 0.0086, + "step": 633530 + }, + { + "epoch": 1.64, + "learning_rate": 5.366594000222924e-05, + "loss": 0.0073, + "step": 633540 + }, + { + "epoch": 1.64, + "learning_rate": 5.366205178585777e-05, + "loss": 0.0085, + "step": 633550 + }, + { + "epoch": 1.64, + "learning_rate": 5.3658163569486305e-05, + "loss": 0.0064, + "step": 633560 + }, + { + "epoch": 1.64, + "learning_rate": 5.365427535311484e-05, + "loss": 0.0091, + "step": 633570 + }, + { + "epoch": 1.64, + "learning_rate": 5.365038713674338e-05, + "loss": 0.0092, + "step": 633580 + }, + { + "epoch": 1.64, + "learning_rate": 5.3646498920371916e-05, + "loss": 0.009, + "step": 633590 + }, + { + "epoch": 1.64, + "learning_rate": 5.364261070400045e-05, + "loss": 0.0071, + "step": 633600 + }, + { + "epoch": 1.64, + "learning_rate": 5.3638722487628986e-05, + "loss": 0.0084, + "step": 633610 + }, + { + "epoch": 1.64, + "learning_rate": 5.363483427125752e-05, + "loss": 0.0106, + "step": 633620 + }, + { + "epoch": 1.64, + "learning_rate": 5.3630946054886055e-05, + "loss": 0.0083, + "step": 633630 + }, + { + "epoch": 1.64, + "learning_rate": 5.362705783851459e-05, + "loss": 0.0094, + "step": 633640 + }, + { + "epoch": 1.64, + "learning_rate": 5.3623169622143125e-05, + "loss": 0.0088, + "step": 633650 + }, + { + "epoch": 1.64, + "learning_rate": 5.361928140577167e-05, + "loss": 0.0106, + "step": 633660 + }, + { + "epoch": 1.64, + "learning_rate": 5.36153931894002e-05, + "loss": 0.0099, + "step": 633670 + }, + { + "epoch": 1.64, + "learning_rate": 5.3611504973028737e-05, + "loss": 0.0075, + "step": 633680 + }, + { + "epoch": 1.64, + "learning_rate": 5.360761675665727e-05, + "loss": 0.0083, + "step": 633690 + }, + { + "epoch": 1.64, + "learning_rate": 5.3603728540285806e-05, + "loss": 0.0049, + "step": 633700 + }, + { + "epoch": 1.64, + "learning_rate": 5.359984032391434e-05, + "loss": 0.0085, + "step": 633710 + }, + { + "epoch": 1.64, + "learning_rate": 5.3595952107542876e-05, + "loss": 0.0125, + "step": 633720 + }, + { + "epoch": 1.64, + "learning_rate": 5.359206389117141e-05, + "loss": 0.0073, + "step": 633730 + }, + { + "epoch": 1.64, + "learning_rate": 5.358817567479995e-05, + "loss": 0.0078, + "step": 633740 + }, + { + "epoch": 1.64, + "learning_rate": 5.358428745842849e-05, + "loss": 0.0082, + "step": 633750 + }, + { + "epoch": 1.64, + "learning_rate": 5.358039924205702e-05, + "loss": 0.0072, + "step": 633760 + }, + { + "epoch": 1.64, + "learning_rate": 5.357651102568556e-05, + "loss": 0.0084, + "step": 633770 + }, + { + "epoch": 1.64, + "learning_rate": 5.357262280931409e-05, + "loss": 0.0077, + "step": 633780 + }, + { + "epoch": 1.64, + "learning_rate": 5.356873459294262e-05, + "loss": 0.0088, + "step": 633790 + }, + { + "epoch": 1.64, + "learning_rate": 5.3564846376571155e-05, + "loss": 0.0102, + "step": 633800 + }, + { + "epoch": 1.64, + "learning_rate": 5.356095816019969e-05, + "loss": 0.0063, + "step": 633810 + }, + { + "epoch": 1.64, + "learning_rate": 5.3557069943828225e-05, + "loss": 0.0085, + "step": 633820 + }, + { + "epoch": 1.64, + "learning_rate": 5.355318172745676e-05, + "loss": 0.0092, + "step": 633830 + }, + { + "epoch": 1.64, + "learning_rate": 5.35492935110853e-05, + "loss": 0.0067, + "step": 633840 + }, + { + "epoch": 1.64, + "learning_rate": 5.3545405294713836e-05, + "loss": 0.0093, + "step": 633850 + }, + { + "epoch": 1.64, + "learning_rate": 5.354151707834237e-05, + "loss": 0.0088, + "step": 633860 + }, + { + "epoch": 1.64, + "learning_rate": 5.3537628861970906e-05, + "loss": 0.0092, + "step": 633870 + }, + { + "epoch": 1.64, + "learning_rate": 5.353374064559944e-05, + "loss": 0.0087, + "step": 633880 + }, + { + "epoch": 1.64, + "learning_rate": 5.3529852429227975e-05, + "loss": 0.0081, + "step": 633890 + }, + { + "epoch": 1.64, + "learning_rate": 5.352596421285651e-05, + "loss": 0.0095, + "step": 633900 + }, + { + "epoch": 1.64, + "learning_rate": 5.3522075996485045e-05, + "loss": 0.0103, + "step": 633910 + }, + { + "epoch": 1.64, + "learning_rate": 5.351818778011358e-05, + "loss": 0.0113, + "step": 633920 + }, + { + "epoch": 1.64, + "learning_rate": 5.351429956374212e-05, + "loss": 0.0094, + "step": 633930 + }, + { + "epoch": 1.64, + "learning_rate": 5.3510411347370656e-05, + "loss": 0.0062, + "step": 633940 + }, + { + "epoch": 1.64, + "learning_rate": 5.350652313099919e-05, + "loss": 0.0096, + "step": 633950 + }, + { + "epoch": 1.64, + "learning_rate": 5.3502634914627726e-05, + "loss": 0.0088, + "step": 633960 + }, + { + "epoch": 1.64, + "learning_rate": 5.349874669825626e-05, + "loss": 0.0079, + "step": 633970 + }, + { + "epoch": 1.64, + "learning_rate": 5.3494858481884796e-05, + "loss": 0.0102, + "step": 633980 + }, + { + "epoch": 1.64, + "learning_rate": 5.349097026551333e-05, + "loss": 0.0083, + "step": 633990 + }, + { + "epoch": 1.64, + "learning_rate": 5.3487082049141866e-05, + "loss": 0.0062, + "step": 634000 + }, + { + "epoch": 1.64, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.005355716682970524, + "eval_runtime": 107.9589, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.631, + "step": 634000 + }, + { + "epoch": 1.64, + "learning_rate": 5.348319383277041e-05, + "loss": 0.0087, + "step": 634010 + }, + { + "epoch": 1.64, + "learning_rate": 5.347930561639894e-05, + "loss": 0.0063, + "step": 634020 + }, + { + "epoch": 1.64, + "learning_rate": 5.347541740002748e-05, + "loss": 0.0094, + "step": 634030 + }, + { + "epoch": 1.64, + "learning_rate": 5.3471529183656005e-05, + "loss": 0.0075, + "step": 634040 + }, + { + "epoch": 1.64, + "learning_rate": 5.346764096728454e-05, + "loss": 0.0092, + "step": 634050 + }, + { + "epoch": 1.64, + "learning_rate": 5.3463752750913075e-05, + "loss": 0.0074, + "step": 634060 + }, + { + "epoch": 1.64, + "learning_rate": 5.345986453454161e-05, + "loss": 0.0064, + "step": 634070 + }, + { + "epoch": 1.64, + "learning_rate": 5.3455976318170145e-05, + "loss": 0.0109, + "step": 634080 + }, + { + "epoch": 1.64, + "learning_rate": 5.345208810179868e-05, + "loss": 0.0085, + "step": 634090 + }, + { + "epoch": 1.64, + "learning_rate": 5.3448199885427214e-05, + "loss": 0.0068, + "step": 634100 + }, + { + "epoch": 1.64, + "learning_rate": 5.3444311669055756e-05, + "loss": 0.0077, + "step": 634110 + }, + { + "epoch": 1.64, + "learning_rate": 5.344042345268429e-05, + "loss": 0.0069, + "step": 634120 + }, + { + "epoch": 1.64, + "learning_rate": 5.3436535236312826e-05, + "loss": 0.0074, + "step": 634130 + }, + { + "epoch": 1.64, + "learning_rate": 5.343264701994136e-05, + "loss": 0.0082, + "step": 634140 + }, + { + "epoch": 1.64, + "learning_rate": 5.3428758803569895e-05, + "loss": 0.0094, + "step": 634150 + }, + { + "epoch": 1.64, + "learning_rate": 5.342487058719843e-05, + "loss": 0.0087, + "step": 634160 + }, + { + "epoch": 1.64, + "learning_rate": 5.3420982370826965e-05, + "loss": 0.0088, + "step": 634170 + }, + { + "epoch": 1.64, + "learning_rate": 5.34170941544555e-05, + "loss": 0.0067, + "step": 634180 + }, + { + "epoch": 1.64, + "learning_rate": 5.341320593808404e-05, + "loss": 0.0072, + "step": 634190 + }, + { + "epoch": 1.64, + "learning_rate": 5.3409317721712576e-05, + "loss": 0.0078, + "step": 634200 + }, + { + "epoch": 1.64, + "learning_rate": 5.340542950534111e-05, + "loss": 0.0075, + "step": 634210 + }, + { + "epoch": 1.64, + "learning_rate": 5.3401541288969646e-05, + "loss": 0.0077, + "step": 634220 + }, + { + "epoch": 1.64, + "learning_rate": 5.339765307259818e-05, + "loss": 0.0111, + "step": 634230 + }, + { + "epoch": 1.64, + "learning_rate": 5.3393764856226716e-05, + "loss": 0.0064, + "step": 634240 + }, + { + "epoch": 1.64, + "learning_rate": 5.338987663985525e-05, + "loss": 0.0086, + "step": 634250 + }, + { + "epoch": 1.64, + "learning_rate": 5.3385988423483786e-05, + "loss": 0.0087, + "step": 634260 + }, + { + "epoch": 1.64, + "learning_rate": 5.338210020711233e-05, + "loss": 0.0061, + "step": 634270 + }, + { + "epoch": 1.64, + "learning_rate": 5.337821199074086e-05, + "loss": 0.0072, + "step": 634280 + }, + { + "epoch": 1.64, + "learning_rate": 5.337432377436939e-05, + "loss": 0.0116, + "step": 634290 + }, + { + "epoch": 1.64, + "learning_rate": 5.3370435557997925e-05, + "loss": 0.0079, + "step": 634300 + }, + { + "epoch": 1.64, + "learning_rate": 5.336654734162646e-05, + "loss": 0.0079, + "step": 634310 + }, + { + "epoch": 1.64, + "learning_rate": 5.3362659125254995e-05, + "loss": 0.0053, + "step": 634320 + }, + { + "epoch": 1.64, + "learning_rate": 5.335877090888353e-05, + "loss": 0.0057, + "step": 634330 + }, + { + "epoch": 1.64, + "learning_rate": 5.3354882692512064e-05, + "loss": 0.0114, + "step": 634340 + }, + { + "epoch": 1.64, + "learning_rate": 5.33509944761406e-05, + "loss": 0.0073, + "step": 634350 + }, + { + "epoch": 1.64, + "learning_rate": 5.3347106259769134e-05, + "loss": 0.0075, + "step": 634360 + }, + { + "epoch": 1.64, + "learning_rate": 5.3343218043397676e-05, + "loss": 0.0073, + "step": 634370 + }, + { + "epoch": 1.64, + "learning_rate": 5.333932982702621e-05, + "loss": 0.0109, + "step": 634380 + }, + { + "epoch": 1.64, + "learning_rate": 5.3335441610654746e-05, + "loss": 0.0083, + "step": 634390 + }, + { + "epoch": 1.64, + "learning_rate": 5.333155339428328e-05, + "loss": 0.0078, + "step": 634400 + }, + { + "epoch": 1.64, + "learning_rate": 5.3327665177911815e-05, + "loss": 0.0087, + "step": 634410 + }, + { + "epoch": 1.64, + "learning_rate": 5.332377696154035e-05, + "loss": 0.0108, + "step": 634420 + }, + { + "epoch": 1.64, + "learning_rate": 5.3319888745168885e-05, + "loss": 0.0116, + "step": 634430 + }, + { + "epoch": 1.64, + "learning_rate": 5.331600052879742e-05, + "loss": 0.0072, + "step": 634440 + }, + { + "epoch": 1.64, + "learning_rate": 5.331211231242596e-05, + "loss": 0.0112, + "step": 634450 + }, + { + "epoch": 1.64, + "learning_rate": 5.3308224096054496e-05, + "loss": 0.0097, + "step": 634460 + }, + { + "epoch": 1.64, + "learning_rate": 5.330433587968303e-05, + "loss": 0.0081, + "step": 634470 + }, + { + "epoch": 1.64, + "learning_rate": 5.3300447663311566e-05, + "loss": 0.0066, + "step": 634480 + }, + { + "epoch": 1.64, + "learning_rate": 5.32965594469401e-05, + "loss": 0.008, + "step": 634490 + }, + { + "epoch": 1.64, + "learning_rate": 5.3292671230568636e-05, + "loss": 0.01, + "step": 634500 + }, + { + "epoch": 1.64, + "learning_rate": 5.328878301419717e-05, + "loss": 0.0096, + "step": 634510 + }, + { + "epoch": 1.64, + "learning_rate": 5.3284894797825706e-05, + "loss": 0.0083, + "step": 634520 + }, + { + "epoch": 1.64, + "learning_rate": 5.328100658145425e-05, + "loss": 0.0104, + "step": 634530 + }, + { + "epoch": 1.64, + "learning_rate": 5.327711836508277e-05, + "loss": 0.0097, + "step": 634540 + }, + { + "epoch": 1.64, + "learning_rate": 5.327323014871131e-05, + "loss": 0.0067, + "step": 634550 + }, + { + "epoch": 1.64, + "learning_rate": 5.3269341932339845e-05, + "loss": 0.0109, + "step": 634560 + }, + { + "epoch": 1.64, + "learning_rate": 5.326545371596838e-05, + "loss": 0.0095, + "step": 634570 + }, + { + "epoch": 1.64, + "learning_rate": 5.3261565499596915e-05, + "loss": 0.0126, + "step": 634580 + }, + { + "epoch": 1.64, + "learning_rate": 5.325767728322545e-05, + "loss": 0.0077, + "step": 634590 + }, + { + "epoch": 1.64, + "learning_rate": 5.3253789066853984e-05, + "loss": 0.0112, + "step": 634600 + }, + { + "epoch": 1.64, + "learning_rate": 5.324990085048252e-05, + "loss": 0.0087, + "step": 634610 + }, + { + "epoch": 1.65, + "learning_rate": 5.3246012634111054e-05, + "loss": 0.0089, + "step": 634620 + }, + { + "epoch": 1.65, + "learning_rate": 5.3242124417739596e-05, + "loss": 0.006, + "step": 634630 + }, + { + "epoch": 1.65, + "learning_rate": 5.323823620136813e-05, + "loss": 0.0074, + "step": 634640 + }, + { + "epoch": 1.65, + "learning_rate": 5.3234347984996666e-05, + "loss": 0.0076, + "step": 634650 + }, + { + "epoch": 1.65, + "learning_rate": 5.32304597686252e-05, + "loss": 0.0068, + "step": 634660 + }, + { + "epoch": 1.65, + "learning_rate": 5.3226571552253735e-05, + "loss": 0.0085, + "step": 634670 + }, + { + "epoch": 1.65, + "learning_rate": 5.322268333588227e-05, + "loss": 0.0099, + "step": 634680 + }, + { + "epoch": 1.65, + "learning_rate": 5.3218795119510805e-05, + "loss": 0.0096, + "step": 634690 + }, + { + "epoch": 1.65, + "learning_rate": 5.321490690313934e-05, + "loss": 0.0089, + "step": 634700 + }, + { + "epoch": 1.65, + "learning_rate": 5.321101868676788e-05, + "loss": 0.0081, + "step": 634710 + }, + { + "epoch": 1.65, + "learning_rate": 5.3207130470396416e-05, + "loss": 0.0085, + "step": 634720 + }, + { + "epoch": 1.65, + "learning_rate": 5.320324225402495e-05, + "loss": 0.0101, + "step": 634730 + }, + { + "epoch": 1.65, + "learning_rate": 5.3199354037653486e-05, + "loss": 0.0083, + "step": 634740 + }, + { + "epoch": 1.65, + "learning_rate": 5.319546582128202e-05, + "loss": 0.0068, + "step": 634750 + }, + { + "epoch": 1.65, + "learning_rate": 5.3191577604910556e-05, + "loss": 0.0117, + "step": 634760 + }, + { + "epoch": 1.65, + "learning_rate": 5.318768938853909e-05, + "loss": 0.0104, + "step": 634770 + }, + { + "epoch": 1.65, + "learning_rate": 5.3183801172167625e-05, + "loss": 0.0065, + "step": 634780 + }, + { + "epoch": 1.65, + "learning_rate": 5.3179912955796154e-05, + "loss": 0.0112, + "step": 634790 + }, + { + "epoch": 1.65, + "learning_rate": 5.317602473942469e-05, + "loss": 0.0105, + "step": 634800 + }, + { + "epoch": 1.65, + "learning_rate": 5.317213652305323e-05, + "loss": 0.0068, + "step": 634810 + }, + { + "epoch": 1.65, + "learning_rate": 5.3168248306681765e-05, + "loss": 0.0074, + "step": 634820 + }, + { + "epoch": 1.65, + "learning_rate": 5.31643600903103e-05, + "loss": 0.0082, + "step": 634830 + }, + { + "epoch": 1.65, + "learning_rate": 5.3160471873938835e-05, + "loss": 0.008, + "step": 634840 + }, + { + "epoch": 1.65, + "learning_rate": 5.315658365756737e-05, + "loss": 0.0069, + "step": 634850 + }, + { + "epoch": 1.65, + "learning_rate": 5.3152695441195904e-05, + "loss": 0.0074, + "step": 634860 + }, + { + "epoch": 1.65, + "learning_rate": 5.314880722482444e-05, + "loss": 0.0077, + "step": 634870 + }, + { + "epoch": 1.65, + "learning_rate": 5.3144919008452974e-05, + "loss": 0.009, + "step": 634880 + }, + { + "epoch": 1.65, + "learning_rate": 5.3141030792081516e-05, + "loss": 0.0125, + "step": 634890 + }, + { + "epoch": 1.65, + "learning_rate": 5.313714257571005e-05, + "loss": 0.0087, + "step": 634900 + }, + { + "epoch": 1.65, + "learning_rate": 5.3133254359338585e-05, + "loss": 0.009, + "step": 634910 + }, + { + "epoch": 1.65, + "learning_rate": 5.312936614296712e-05, + "loss": 0.0077, + "step": 634920 + }, + { + "epoch": 1.65, + "learning_rate": 5.3125477926595655e-05, + "loss": 0.0085, + "step": 634930 + }, + { + "epoch": 1.65, + "learning_rate": 5.312158971022419e-05, + "loss": 0.0093, + "step": 634940 + }, + { + "epoch": 1.65, + "learning_rate": 5.3117701493852725e-05, + "loss": 0.0077, + "step": 634950 + }, + { + "epoch": 1.65, + "learning_rate": 5.311381327748126e-05, + "loss": 0.007, + "step": 634960 + }, + { + "epoch": 1.65, + "learning_rate": 5.31099250611098e-05, + "loss": 0.0056, + "step": 634970 + }, + { + "epoch": 1.65, + "learning_rate": 5.3106036844738336e-05, + "loss": 0.0117, + "step": 634980 + }, + { + "epoch": 1.65, + "learning_rate": 5.310214862836687e-05, + "loss": 0.0078, + "step": 634990 + }, + { + "epoch": 1.65, + "learning_rate": 5.3098260411995406e-05, + "loss": 0.0047, + "step": 635000 + }, + { + "epoch": 1.65, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.005286786239594221, + "eval_runtime": 107.9393, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 635000 + }, + { + "epoch": 1.65, + "learning_rate": 5.309437219562394e-05, + "loss": 0.0077, + "step": 635010 + }, + { + "epoch": 1.65, + "learning_rate": 5.3090483979252476e-05, + "loss": 0.0082, + "step": 635020 + }, + { + "epoch": 1.65, + "learning_rate": 5.3086595762881004e-05, + "loss": 0.0077, + "step": 635030 + }, + { + "epoch": 1.65, + "learning_rate": 5.308270754650954e-05, + "loss": 0.0109, + "step": 635040 + }, + { + "epoch": 1.65, + "learning_rate": 5.3078819330138074e-05, + "loss": 0.0085, + "step": 635050 + }, + { + "epoch": 1.65, + "learning_rate": 5.307493111376661e-05, + "loss": 0.0095, + "step": 635060 + }, + { + "epoch": 1.65, + "learning_rate": 5.307104289739515e-05, + "loss": 0.01, + "step": 635070 + }, + { + "epoch": 1.65, + "learning_rate": 5.3067154681023685e-05, + "loss": 0.0074, + "step": 635080 + }, + { + "epoch": 1.65, + "learning_rate": 5.306326646465222e-05, + "loss": 0.0093, + "step": 635090 + }, + { + "epoch": 1.65, + "learning_rate": 5.3059378248280755e-05, + "loss": 0.0082, + "step": 635100 + }, + { + "epoch": 1.65, + "learning_rate": 5.305549003190929e-05, + "loss": 0.0091, + "step": 635110 + }, + { + "epoch": 1.65, + "learning_rate": 5.3051601815537824e-05, + "loss": 0.0084, + "step": 635120 + }, + { + "epoch": 1.65, + "learning_rate": 5.304771359916636e-05, + "loss": 0.0093, + "step": 635130 + }, + { + "epoch": 1.65, + "learning_rate": 5.3043825382794894e-05, + "loss": 0.0081, + "step": 635140 + }, + { + "epoch": 1.65, + "learning_rate": 5.3039937166423436e-05, + "loss": 0.0084, + "step": 635150 + }, + { + "epoch": 1.65, + "learning_rate": 5.303604895005197e-05, + "loss": 0.0082, + "step": 635160 + }, + { + "epoch": 1.65, + "learning_rate": 5.3032160733680505e-05, + "loss": 0.0072, + "step": 635170 + }, + { + "epoch": 1.65, + "learning_rate": 5.302827251730904e-05, + "loss": 0.0101, + "step": 635180 + }, + { + "epoch": 1.65, + "learning_rate": 5.3024384300937575e-05, + "loss": 0.0076, + "step": 635190 + }, + { + "epoch": 1.65, + "learning_rate": 5.302049608456611e-05, + "loss": 0.0084, + "step": 635200 + }, + { + "epoch": 1.65, + "learning_rate": 5.3016607868194645e-05, + "loss": 0.0073, + "step": 635210 + }, + { + "epoch": 1.65, + "learning_rate": 5.301271965182318e-05, + "loss": 0.0092, + "step": 635220 + }, + { + "epoch": 1.65, + "learning_rate": 5.3008831435451715e-05, + "loss": 0.0096, + "step": 635230 + }, + { + "epoch": 1.65, + "learning_rate": 5.3004943219080256e-05, + "loss": 0.0088, + "step": 635240 + }, + { + "epoch": 1.65, + "learning_rate": 5.300105500270879e-05, + "loss": 0.0075, + "step": 635250 + }, + { + "epoch": 1.65, + "learning_rate": 5.2997166786337326e-05, + "loss": 0.0079, + "step": 635260 + }, + { + "epoch": 1.65, + "learning_rate": 5.299327856996586e-05, + "loss": 0.0076, + "step": 635270 + }, + { + "epoch": 1.65, + "learning_rate": 5.298939035359439e-05, + "loss": 0.0071, + "step": 635280 + }, + { + "epoch": 1.65, + "learning_rate": 5.2985502137222924e-05, + "loss": 0.0135, + "step": 635290 + }, + { + "epoch": 1.65, + "learning_rate": 5.298161392085146e-05, + "loss": 0.0078, + "step": 635300 + }, + { + "epoch": 1.65, + "learning_rate": 5.2977725704479993e-05, + "loss": 0.0108, + "step": 635310 + }, + { + "epoch": 1.65, + "learning_rate": 5.297383748810853e-05, + "loss": 0.0077, + "step": 635320 + }, + { + "epoch": 1.65, + "learning_rate": 5.296994927173707e-05, + "loss": 0.0091, + "step": 635330 + }, + { + "epoch": 1.65, + "learning_rate": 5.2966061055365605e-05, + "loss": 0.0081, + "step": 635340 + }, + { + "epoch": 1.65, + "learning_rate": 5.296217283899414e-05, + "loss": 0.0097, + "step": 635350 + }, + { + "epoch": 1.65, + "learning_rate": 5.2958284622622675e-05, + "loss": 0.0085, + "step": 635360 + }, + { + "epoch": 1.65, + "learning_rate": 5.295439640625121e-05, + "loss": 0.0081, + "step": 635370 + }, + { + "epoch": 1.65, + "learning_rate": 5.2950508189879744e-05, + "loss": 0.0059, + "step": 635380 + }, + { + "epoch": 1.65, + "learning_rate": 5.294661997350828e-05, + "loss": 0.0081, + "step": 635390 + }, + { + "epoch": 1.65, + "learning_rate": 5.2942731757136814e-05, + "loss": 0.0095, + "step": 635400 + }, + { + "epoch": 1.65, + "learning_rate": 5.293884354076535e-05, + "loss": 0.0081, + "step": 635410 + }, + { + "epoch": 1.65, + "learning_rate": 5.293495532439389e-05, + "loss": 0.0092, + "step": 635420 + }, + { + "epoch": 1.65, + "learning_rate": 5.2931067108022425e-05, + "loss": 0.009, + "step": 635430 + }, + { + "epoch": 1.65, + "learning_rate": 5.292717889165096e-05, + "loss": 0.0156, + "step": 635440 + }, + { + "epoch": 1.65, + "learning_rate": 5.2923290675279495e-05, + "loss": 0.0079, + "step": 635450 + }, + { + "epoch": 1.65, + "learning_rate": 5.291940245890803e-05, + "loss": 0.0083, + "step": 635460 + }, + { + "epoch": 1.65, + "learning_rate": 5.2915514242536565e-05, + "loss": 0.0086, + "step": 635470 + }, + { + "epoch": 1.65, + "learning_rate": 5.29116260261651e-05, + "loss": 0.0078, + "step": 635480 + }, + { + "epoch": 1.65, + "learning_rate": 5.2907737809793635e-05, + "loss": 0.0094, + "step": 635490 + }, + { + "epoch": 1.65, + "learning_rate": 5.2903849593422176e-05, + "loss": 0.0072, + "step": 635500 + }, + { + "epoch": 1.65, + "learning_rate": 5.289996137705071e-05, + "loss": 0.0099, + "step": 635510 + }, + { + "epoch": 1.65, + "learning_rate": 5.2896073160679246e-05, + "loss": 0.0067, + "step": 635520 + }, + { + "epoch": 1.65, + "learning_rate": 5.2892184944307774e-05, + "loss": 0.0061, + "step": 635530 + }, + { + "epoch": 1.65, + "learning_rate": 5.288829672793631e-05, + "loss": 0.0086, + "step": 635540 + }, + { + "epoch": 1.65, + "learning_rate": 5.2884408511564844e-05, + "loss": 0.0077, + "step": 635550 + }, + { + "epoch": 1.65, + "learning_rate": 5.288052029519338e-05, + "loss": 0.008, + "step": 635560 + }, + { + "epoch": 1.65, + "learning_rate": 5.2876632078821913e-05, + "loss": 0.0067, + "step": 635570 + }, + { + "epoch": 1.65, + "learning_rate": 5.287274386245045e-05, + "loss": 0.0095, + "step": 635580 + }, + { + "epoch": 1.65, + "learning_rate": 5.286885564607898e-05, + "loss": 0.0089, + "step": 635590 + }, + { + "epoch": 1.65, + "learning_rate": 5.2864967429707525e-05, + "loss": 0.0099, + "step": 635600 + }, + { + "epoch": 1.65, + "learning_rate": 5.286107921333606e-05, + "loss": 0.0069, + "step": 635610 + }, + { + "epoch": 1.65, + "learning_rate": 5.2857190996964595e-05, + "loss": 0.0073, + "step": 635620 + }, + { + "epoch": 1.65, + "learning_rate": 5.285330278059313e-05, + "loss": 0.0079, + "step": 635630 + }, + { + "epoch": 1.65, + "learning_rate": 5.2849414564221664e-05, + "loss": 0.0076, + "step": 635640 + }, + { + "epoch": 1.65, + "learning_rate": 5.28455263478502e-05, + "loss": 0.008, + "step": 635650 + }, + { + "epoch": 1.65, + "learning_rate": 5.2841638131478734e-05, + "loss": 0.0072, + "step": 635660 + }, + { + "epoch": 1.65, + "learning_rate": 5.283774991510727e-05, + "loss": 0.0115, + "step": 635670 + }, + { + "epoch": 1.65, + "learning_rate": 5.283386169873581e-05, + "loss": 0.0081, + "step": 635680 + }, + { + "epoch": 1.65, + "learning_rate": 5.2829973482364345e-05, + "loss": 0.0091, + "step": 635690 + }, + { + "epoch": 1.65, + "learning_rate": 5.282608526599288e-05, + "loss": 0.0097, + "step": 635700 + }, + { + "epoch": 1.65, + "learning_rate": 5.2822197049621415e-05, + "loss": 0.0061, + "step": 635710 + }, + { + "epoch": 1.65, + "learning_rate": 5.281830883324995e-05, + "loss": 0.0062, + "step": 635720 + }, + { + "epoch": 1.65, + "learning_rate": 5.2814420616878485e-05, + "loss": 0.0073, + "step": 635730 + }, + { + "epoch": 1.65, + "learning_rate": 5.281053240050702e-05, + "loss": 0.0094, + "step": 635740 + }, + { + "epoch": 1.65, + "learning_rate": 5.2806644184135554e-05, + "loss": 0.0077, + "step": 635750 + }, + { + "epoch": 1.65, + "learning_rate": 5.2802755967764096e-05, + "loss": 0.0094, + "step": 635760 + }, + { + "epoch": 1.65, + "learning_rate": 5.279886775139263e-05, + "loss": 0.0086, + "step": 635770 + }, + { + "epoch": 1.65, + "learning_rate": 5.279497953502116e-05, + "loss": 0.0078, + "step": 635780 + }, + { + "epoch": 1.65, + "learning_rate": 5.2791091318649694e-05, + "loss": 0.0123, + "step": 635790 + }, + { + "epoch": 1.65, + "learning_rate": 5.278720310227823e-05, + "loss": 0.0065, + "step": 635800 + }, + { + "epoch": 1.65, + "learning_rate": 5.2783314885906764e-05, + "loss": 0.0051, + "step": 635810 + }, + { + "epoch": 1.65, + "learning_rate": 5.27794266695353e-05, + "loss": 0.0077, + "step": 635820 + }, + { + "epoch": 1.65, + "learning_rate": 5.277553845316383e-05, + "loss": 0.0092, + "step": 635830 + }, + { + "epoch": 1.65, + "learning_rate": 5.277165023679237e-05, + "loss": 0.008, + "step": 635840 + }, + { + "epoch": 1.65, + "learning_rate": 5.27677620204209e-05, + "loss": 0.0092, + "step": 635850 + }, + { + "epoch": 1.65, + "learning_rate": 5.2763873804049445e-05, + "loss": 0.0079, + "step": 635860 + }, + { + "epoch": 1.65, + "learning_rate": 5.275998558767798e-05, + "loss": 0.0101, + "step": 635870 + }, + { + "epoch": 1.65, + "learning_rate": 5.2756097371306514e-05, + "loss": 0.0087, + "step": 635880 + }, + { + "epoch": 1.65, + "learning_rate": 5.275220915493505e-05, + "loss": 0.0096, + "step": 635890 + }, + { + "epoch": 1.65, + "learning_rate": 5.2748320938563584e-05, + "loss": 0.008, + "step": 635900 + }, + { + "epoch": 1.65, + "learning_rate": 5.274443272219212e-05, + "loss": 0.0102, + "step": 635910 + }, + { + "epoch": 1.65, + "learning_rate": 5.2740544505820654e-05, + "loss": 0.0115, + "step": 635920 + }, + { + "epoch": 1.65, + "learning_rate": 5.273665628944919e-05, + "loss": 0.0074, + "step": 635930 + }, + { + "epoch": 1.65, + "learning_rate": 5.273276807307773e-05, + "loss": 0.008, + "step": 635940 + }, + { + "epoch": 1.65, + "learning_rate": 5.2728879856706265e-05, + "loss": 0.0084, + "step": 635950 + }, + { + "epoch": 1.65, + "learning_rate": 5.27249916403348e-05, + "loss": 0.0092, + "step": 635960 + }, + { + "epoch": 1.65, + "learning_rate": 5.2721103423963335e-05, + "loss": 0.0104, + "step": 635970 + }, + { + "epoch": 1.65, + "learning_rate": 5.271721520759187e-05, + "loss": 0.011, + "step": 635980 + }, + { + "epoch": 1.65, + "learning_rate": 5.2713326991220405e-05, + "loss": 0.0051, + "step": 635990 + }, + { + "epoch": 1.65, + "learning_rate": 5.270943877484894e-05, + "loss": 0.0082, + "step": 636000 + }, + { + "epoch": 1.65, + "eval_cer": 0.8817012866862336, + "eval_loss": 0.005146949551999569, + "eval_runtime": 108.0488, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.628, + "step": 636000 + }, + { + "epoch": 1.65, + "learning_rate": 5.2705550558477474e-05, + "loss": 0.0081, + "step": 636010 + }, + { + "epoch": 1.65, + "learning_rate": 5.2701662342106016e-05, + "loss": 0.0068, + "step": 636020 + }, + { + "epoch": 1.65, + "learning_rate": 5.269777412573454e-05, + "loss": 0.0096, + "step": 636030 + }, + { + "epoch": 1.65, + "learning_rate": 5.269388590936308e-05, + "loss": 0.0072, + "step": 636040 + }, + { + "epoch": 1.65, + "learning_rate": 5.2689997692991614e-05, + "loss": 0.0082, + "step": 636050 + }, + { + "epoch": 1.65, + "learning_rate": 5.268610947662015e-05, + "loss": 0.0062, + "step": 636060 + }, + { + "epoch": 1.65, + "learning_rate": 5.2682221260248684e-05, + "loss": 0.0086, + "step": 636070 + }, + { + "epoch": 1.65, + "learning_rate": 5.267833304387722e-05, + "loss": 0.0073, + "step": 636080 + }, + { + "epoch": 1.65, + "learning_rate": 5.267444482750575e-05, + "loss": 0.0081, + "step": 636090 + }, + { + "epoch": 1.65, + "learning_rate": 5.267055661113429e-05, + "loss": 0.0093, + "step": 636100 + }, + { + "epoch": 1.65, + "learning_rate": 5.266666839476282e-05, + "loss": 0.0101, + "step": 636110 + }, + { + "epoch": 1.65, + "learning_rate": 5.2662780178391365e-05, + "loss": 0.0071, + "step": 636120 + }, + { + "epoch": 1.65, + "learning_rate": 5.26588919620199e-05, + "loss": 0.0057, + "step": 636130 + }, + { + "epoch": 1.65, + "learning_rate": 5.2655003745648434e-05, + "loss": 0.0091, + "step": 636140 + }, + { + "epoch": 1.65, + "learning_rate": 5.265111552927697e-05, + "loss": 0.01, + "step": 636150 + }, + { + "epoch": 1.65, + "learning_rate": 5.2647227312905504e-05, + "loss": 0.0081, + "step": 636160 + }, + { + "epoch": 1.65, + "learning_rate": 5.264333909653404e-05, + "loss": 0.0059, + "step": 636170 + }, + { + "epoch": 1.65, + "learning_rate": 5.2639450880162574e-05, + "loss": 0.0093, + "step": 636180 + }, + { + "epoch": 1.65, + "learning_rate": 5.263556266379111e-05, + "loss": 0.006, + "step": 636190 + }, + { + "epoch": 1.65, + "learning_rate": 5.263167444741965e-05, + "loss": 0.0081, + "step": 636200 + }, + { + "epoch": 1.65, + "learning_rate": 5.2627786231048185e-05, + "loss": 0.0089, + "step": 636210 + }, + { + "epoch": 1.65, + "learning_rate": 5.262389801467672e-05, + "loss": 0.0068, + "step": 636220 + }, + { + "epoch": 1.65, + "learning_rate": 5.2620009798305255e-05, + "loss": 0.0052, + "step": 636230 + }, + { + "epoch": 1.65, + "learning_rate": 5.261612158193379e-05, + "loss": 0.0122, + "step": 636240 + }, + { + "epoch": 1.65, + "learning_rate": 5.2612233365562325e-05, + "loss": 0.0116, + "step": 636250 + }, + { + "epoch": 1.65, + "learning_rate": 5.260834514919086e-05, + "loss": 0.0093, + "step": 636260 + }, + { + "epoch": 1.65, + "learning_rate": 5.260445693281939e-05, + "loss": 0.0076, + "step": 636270 + }, + { + "epoch": 1.65, + "learning_rate": 5.260056871644792e-05, + "loss": 0.0065, + "step": 636280 + }, + { + "epoch": 1.65, + "learning_rate": 5.259668050007646e-05, + "loss": 0.0101, + "step": 636290 + }, + { + "epoch": 1.65, + "learning_rate": 5.2592792283705e-05, + "loss": 0.0089, + "step": 636300 + }, + { + "epoch": 1.65, + "learning_rate": 5.2588904067333534e-05, + "loss": 0.0082, + "step": 636310 + }, + { + "epoch": 1.65, + "learning_rate": 5.258501585096207e-05, + "loss": 0.008, + "step": 636320 + }, + { + "epoch": 1.65, + "learning_rate": 5.2581127634590604e-05, + "loss": 0.008, + "step": 636330 + }, + { + "epoch": 1.65, + "learning_rate": 5.257723941821914e-05, + "loss": 0.0094, + "step": 636340 + }, + { + "epoch": 1.65, + "learning_rate": 5.257335120184767e-05, + "loss": 0.0066, + "step": 636350 + }, + { + "epoch": 1.65, + "learning_rate": 5.256946298547621e-05, + "loss": 0.0068, + "step": 636360 + }, + { + "epoch": 1.65, + "learning_rate": 5.256557476910474e-05, + "loss": 0.0062, + "step": 636370 + }, + { + "epoch": 1.65, + "learning_rate": 5.2561686552733285e-05, + "loss": 0.0061, + "step": 636380 + }, + { + "epoch": 1.65, + "learning_rate": 5.255779833636182e-05, + "loss": 0.0073, + "step": 636390 + }, + { + "epoch": 1.65, + "learning_rate": 5.2553910119990354e-05, + "loss": 0.0099, + "step": 636400 + }, + { + "epoch": 1.65, + "learning_rate": 5.255002190361889e-05, + "loss": 0.0073, + "step": 636410 + }, + { + "epoch": 1.65, + "learning_rate": 5.2546133687247424e-05, + "loss": 0.007, + "step": 636420 + }, + { + "epoch": 1.65, + "learning_rate": 5.254224547087596e-05, + "loss": 0.0106, + "step": 636430 + }, + { + "epoch": 1.65, + "learning_rate": 5.2538357254504494e-05, + "loss": 0.0073, + "step": 636440 + }, + { + "epoch": 1.65, + "learning_rate": 5.253446903813303e-05, + "loss": 0.0075, + "step": 636450 + }, + { + "epoch": 1.65, + "learning_rate": 5.253058082176157e-05, + "loss": 0.0101, + "step": 636460 + }, + { + "epoch": 1.65, + "learning_rate": 5.2526692605390105e-05, + "loss": 0.0088, + "step": 636470 + }, + { + "epoch": 1.65, + "learning_rate": 5.252280438901864e-05, + "loss": 0.0092, + "step": 636480 + }, + { + "epoch": 1.65, + "learning_rate": 5.2518916172647175e-05, + "loss": 0.0093, + "step": 636490 + }, + { + "epoch": 1.65, + "learning_rate": 5.251502795627571e-05, + "loss": 0.0067, + "step": 636500 + }, + { + "epoch": 1.65, + "learning_rate": 5.2511139739904245e-05, + "loss": 0.0104, + "step": 636510 + }, + { + "epoch": 1.65, + "learning_rate": 5.250725152353277e-05, + "loss": 0.009, + "step": 636520 + }, + { + "epoch": 1.65, + "learning_rate": 5.250336330716131e-05, + "loss": 0.0063, + "step": 636530 + }, + { + "epoch": 1.65, + "learning_rate": 5.249947509078984e-05, + "loss": 0.0066, + "step": 636540 + }, + { + "epoch": 1.65, + "learning_rate": 5.249558687441838e-05, + "loss": 0.007, + "step": 636550 + }, + { + "epoch": 1.65, + "learning_rate": 5.249169865804692e-05, + "loss": 0.0054, + "step": 636560 + }, + { + "epoch": 1.65, + "learning_rate": 5.2487810441675454e-05, + "loss": 0.0054, + "step": 636570 + }, + { + "epoch": 1.65, + "learning_rate": 5.248392222530399e-05, + "loss": 0.0087, + "step": 636580 + }, + { + "epoch": 1.65, + "learning_rate": 5.2480034008932524e-05, + "loss": 0.0083, + "step": 636590 + }, + { + "epoch": 1.65, + "learning_rate": 5.247614579256106e-05, + "loss": 0.0087, + "step": 636600 + }, + { + "epoch": 1.65, + "learning_rate": 5.247225757618959e-05, + "loss": 0.0098, + "step": 636610 + }, + { + "epoch": 1.65, + "learning_rate": 5.246836935981813e-05, + "loss": 0.0087, + "step": 636620 + }, + { + "epoch": 1.65, + "learning_rate": 5.246448114344666e-05, + "loss": 0.0092, + "step": 636630 + }, + { + "epoch": 1.65, + "learning_rate": 5.2460592927075205e-05, + "loss": 0.0113, + "step": 636640 + }, + { + "epoch": 1.65, + "learning_rate": 5.245670471070374e-05, + "loss": 0.0069, + "step": 636650 + }, + { + "epoch": 1.65, + "learning_rate": 5.2452816494332274e-05, + "loss": 0.0068, + "step": 636660 + }, + { + "epoch": 1.65, + "learning_rate": 5.244892827796081e-05, + "loss": 0.0112, + "step": 636670 + }, + { + "epoch": 1.65, + "learning_rate": 5.2445040061589344e-05, + "loss": 0.0094, + "step": 636680 + }, + { + "epoch": 1.65, + "learning_rate": 5.244115184521788e-05, + "loss": 0.0073, + "step": 636690 + }, + { + "epoch": 1.65, + "learning_rate": 5.2437263628846414e-05, + "loss": 0.0083, + "step": 636700 + }, + { + "epoch": 1.65, + "learning_rate": 5.243337541247495e-05, + "loss": 0.0085, + "step": 636710 + }, + { + "epoch": 1.65, + "learning_rate": 5.2429487196103483e-05, + "loss": 0.0088, + "step": 636720 + }, + { + "epoch": 1.65, + "learning_rate": 5.2425598979732025e-05, + "loss": 0.0111, + "step": 636730 + }, + { + "epoch": 1.65, + "learning_rate": 5.242171076336056e-05, + "loss": 0.0058, + "step": 636740 + }, + { + "epoch": 1.65, + "learning_rate": 5.2417822546989095e-05, + "loss": 0.0103, + "step": 636750 + }, + { + "epoch": 1.65, + "learning_rate": 5.241393433061763e-05, + "loss": 0.0072, + "step": 636760 + }, + { + "epoch": 1.65, + "learning_rate": 5.241004611424616e-05, + "loss": 0.0069, + "step": 636770 + }, + { + "epoch": 1.65, + "learning_rate": 5.240615789787469e-05, + "loss": 0.0105, + "step": 636780 + }, + { + "epoch": 1.65, + "learning_rate": 5.240226968150323e-05, + "loss": 0.009, + "step": 636790 + }, + { + "epoch": 1.65, + "learning_rate": 5.239838146513176e-05, + "loss": 0.0099, + "step": 636800 + }, + { + "epoch": 1.65, + "learning_rate": 5.23944932487603e-05, + "loss": 0.0075, + "step": 636810 + }, + { + "epoch": 1.65, + "learning_rate": 5.239060503238883e-05, + "loss": 0.0113, + "step": 636820 + }, + { + "epoch": 1.65, + "learning_rate": 5.2386716816017374e-05, + "loss": 0.0067, + "step": 636830 + }, + { + "epoch": 1.65, + "learning_rate": 5.238282859964591e-05, + "loss": 0.0096, + "step": 636840 + }, + { + "epoch": 1.65, + "learning_rate": 5.2378940383274443e-05, + "loss": 0.0085, + "step": 636850 + }, + { + "epoch": 1.65, + "learning_rate": 5.237505216690298e-05, + "loss": 0.0096, + "step": 636860 + }, + { + "epoch": 1.65, + "learning_rate": 5.237116395053151e-05, + "loss": 0.0099, + "step": 636870 + }, + { + "epoch": 1.65, + "learning_rate": 5.236727573416005e-05, + "loss": 0.0082, + "step": 636880 + }, + { + "epoch": 1.65, + "learning_rate": 5.236338751778858e-05, + "loss": 0.0096, + "step": 636890 + }, + { + "epoch": 1.65, + "learning_rate": 5.235949930141712e-05, + "loss": 0.0076, + "step": 636900 + }, + { + "epoch": 1.65, + "learning_rate": 5.235561108504566e-05, + "loss": 0.0057, + "step": 636910 + }, + { + "epoch": 1.65, + "learning_rate": 5.2351722868674194e-05, + "loss": 0.0095, + "step": 636920 + }, + { + "epoch": 1.65, + "learning_rate": 5.234783465230273e-05, + "loss": 0.0089, + "step": 636930 + }, + { + "epoch": 1.65, + "learning_rate": 5.2343946435931264e-05, + "loss": 0.0064, + "step": 636940 + }, + { + "epoch": 1.65, + "learning_rate": 5.23400582195598e-05, + "loss": 0.007, + "step": 636950 + }, + { + "epoch": 1.65, + "learning_rate": 5.2336170003188334e-05, + "loss": 0.0055, + "step": 636960 + }, + { + "epoch": 1.65, + "learning_rate": 5.233228178681687e-05, + "loss": 0.0091, + "step": 636970 + }, + { + "epoch": 1.65, + "learning_rate": 5.2328393570445403e-05, + "loss": 0.007, + "step": 636980 + }, + { + "epoch": 1.65, + "learning_rate": 5.2324505354073945e-05, + "loss": 0.0087, + "step": 636990 + }, + { + "epoch": 1.65, + "learning_rate": 5.232061713770248e-05, + "loss": 0.0057, + "step": 637000 + }, + { + "epoch": 1.65, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.005305544938892126, + "eval_runtime": 107.7801, + "eval_samples_per_second": 18.556, + "eval_steps_per_second": 4.639, + "step": 637000 + }, + { + "epoch": 1.65, + "learning_rate": 5.2316728921331015e-05, + "loss": 0.0079, + "step": 637010 + }, + { + "epoch": 1.65, + "learning_rate": 5.231284070495954e-05, + "loss": 0.0086, + "step": 637020 + }, + { + "epoch": 1.65, + "learning_rate": 5.230895248858808e-05, + "loss": 0.0111, + "step": 637030 + }, + { + "epoch": 1.65, + "learning_rate": 5.230506427221661e-05, + "loss": 0.0082, + "step": 637040 + }, + { + "epoch": 1.65, + "learning_rate": 5.230117605584515e-05, + "loss": 0.0091, + "step": 637050 + }, + { + "epoch": 1.65, + "learning_rate": 5.229728783947368e-05, + "loss": 0.009, + "step": 637060 + }, + { + "epoch": 1.65, + "learning_rate": 5.229339962310222e-05, + "loss": 0.007, + "step": 637070 + }, + { + "epoch": 1.65, + "learning_rate": 5.228951140673075e-05, + "loss": 0.0087, + "step": 637080 + }, + { + "epoch": 1.65, + "learning_rate": 5.2285623190359294e-05, + "loss": 0.0097, + "step": 637090 + }, + { + "epoch": 1.65, + "learning_rate": 5.228173497398783e-05, + "loss": 0.008, + "step": 637100 + }, + { + "epoch": 1.65, + "learning_rate": 5.2277846757616363e-05, + "loss": 0.0085, + "step": 637110 + }, + { + "epoch": 1.65, + "learning_rate": 5.22739585412449e-05, + "loss": 0.0104, + "step": 637120 + }, + { + "epoch": 1.65, + "learning_rate": 5.227007032487343e-05, + "loss": 0.0109, + "step": 637130 + }, + { + "epoch": 1.65, + "learning_rate": 5.226618210850197e-05, + "loss": 0.0112, + "step": 637140 + }, + { + "epoch": 1.65, + "learning_rate": 5.22622938921305e-05, + "loss": 0.0107, + "step": 637150 + }, + { + "epoch": 1.65, + "learning_rate": 5.225840567575904e-05, + "loss": 0.0074, + "step": 637160 + }, + { + "epoch": 1.65, + "learning_rate": 5.225451745938758e-05, + "loss": 0.0085, + "step": 637170 + }, + { + "epoch": 1.65, + "learning_rate": 5.2250629243016114e-05, + "loss": 0.0066, + "step": 637180 + }, + { + "epoch": 1.65, + "learning_rate": 5.224674102664465e-05, + "loss": 0.0101, + "step": 637190 + }, + { + "epoch": 1.65, + "learning_rate": 5.2242852810273184e-05, + "loss": 0.0096, + "step": 637200 + }, + { + "epoch": 1.65, + "learning_rate": 5.223896459390172e-05, + "loss": 0.0089, + "step": 637210 + }, + { + "epoch": 1.65, + "learning_rate": 5.2235076377530254e-05, + "loss": 0.0085, + "step": 637220 + }, + { + "epoch": 1.65, + "learning_rate": 5.223118816115879e-05, + "loss": 0.0113, + "step": 637230 + }, + { + "epoch": 1.65, + "learning_rate": 5.222729994478732e-05, + "loss": 0.0092, + "step": 637240 + }, + { + "epoch": 1.65, + "learning_rate": 5.2223411728415865e-05, + "loss": 0.0066, + "step": 637250 + }, + { + "epoch": 1.65, + "learning_rate": 5.22195235120444e-05, + "loss": 0.0077, + "step": 637260 + }, + { + "epoch": 1.65, + "learning_rate": 5.221563529567293e-05, + "loss": 0.0107, + "step": 637270 + }, + { + "epoch": 1.65, + "learning_rate": 5.221174707930146e-05, + "loss": 0.0096, + "step": 637280 + }, + { + "epoch": 1.65, + "learning_rate": 5.220785886293e-05, + "loss": 0.0089, + "step": 637290 + }, + { + "epoch": 1.65, + "learning_rate": 5.220397064655853e-05, + "loss": 0.0078, + "step": 637300 + }, + { + "epoch": 1.65, + "learning_rate": 5.220008243018707e-05, + "loss": 0.0108, + "step": 637310 + }, + { + "epoch": 1.65, + "learning_rate": 5.21961942138156e-05, + "loss": 0.0069, + "step": 637320 + }, + { + "epoch": 1.65, + "learning_rate": 5.219230599744414e-05, + "loss": 0.0065, + "step": 637330 + }, + { + "epoch": 1.65, + "learning_rate": 5.218841778107267e-05, + "loss": 0.0089, + "step": 637340 + }, + { + "epoch": 1.65, + "learning_rate": 5.2184529564701214e-05, + "loss": 0.0074, + "step": 637350 + }, + { + "epoch": 1.65, + "learning_rate": 5.218064134832975e-05, + "loss": 0.0083, + "step": 637360 + }, + { + "epoch": 1.65, + "learning_rate": 5.217675313195828e-05, + "loss": 0.006, + "step": 637370 + }, + { + "epoch": 1.65, + "learning_rate": 5.217286491558682e-05, + "loss": 0.0094, + "step": 637380 + }, + { + "epoch": 1.65, + "learning_rate": 5.216897669921535e-05, + "loss": 0.0094, + "step": 637390 + }, + { + "epoch": 1.65, + "learning_rate": 5.216508848284389e-05, + "loss": 0.0087, + "step": 637400 + }, + { + "epoch": 1.65, + "learning_rate": 5.216120026647242e-05, + "loss": 0.0071, + "step": 637410 + }, + { + "epoch": 1.65, + "learning_rate": 5.215731205010096e-05, + "loss": 0.0096, + "step": 637420 + }, + { + "epoch": 1.65, + "learning_rate": 5.21534238337295e-05, + "loss": 0.0111, + "step": 637430 + }, + { + "epoch": 1.65, + "learning_rate": 5.2149535617358034e-05, + "loss": 0.0074, + "step": 637440 + }, + { + "epoch": 1.65, + "learning_rate": 5.214564740098657e-05, + "loss": 0.0079, + "step": 637450 + }, + { + "epoch": 1.65, + "learning_rate": 5.2141759184615104e-05, + "loss": 0.0085, + "step": 637460 + }, + { + "epoch": 1.65, + "learning_rate": 5.213787096824364e-05, + "loss": 0.0077, + "step": 637470 + }, + { + "epoch": 1.65, + "learning_rate": 5.2133982751872174e-05, + "loss": 0.0079, + "step": 637480 + }, + { + "epoch": 1.65, + "learning_rate": 5.213009453550071e-05, + "loss": 0.0062, + "step": 637490 + }, + { + "epoch": 1.65, + "learning_rate": 5.212620631912924e-05, + "loss": 0.0083, + "step": 637500 + }, + { + "epoch": 1.65, + "learning_rate": 5.212231810275777e-05, + "loss": 0.0082, + "step": 637510 + }, + { + "epoch": 1.65, + "learning_rate": 5.2118429886386306e-05, + "loss": 0.0082, + "step": 637520 + }, + { + "epoch": 1.65, + "learning_rate": 5.211454167001485e-05, + "loss": 0.0126, + "step": 637530 + }, + { + "epoch": 1.65, + "learning_rate": 5.211065345364338e-05, + "loss": 0.0067, + "step": 637540 + }, + { + "epoch": 1.65, + "learning_rate": 5.210676523727192e-05, + "loss": 0.0061, + "step": 637550 + }, + { + "epoch": 1.65, + "learning_rate": 5.210287702090045e-05, + "loss": 0.0086, + "step": 637560 + }, + { + "epoch": 1.65, + "learning_rate": 5.209898880452899e-05, + "loss": 0.0059, + "step": 637570 + }, + { + "epoch": 1.65, + "learning_rate": 5.209510058815752e-05, + "loss": 0.0083, + "step": 637580 + }, + { + "epoch": 1.65, + "learning_rate": 5.209121237178606e-05, + "loss": 0.0056, + "step": 637590 + }, + { + "epoch": 1.65, + "learning_rate": 5.208732415541459e-05, + "loss": 0.0091, + "step": 637600 + }, + { + "epoch": 1.65, + "learning_rate": 5.2083435939043134e-05, + "loss": 0.0107, + "step": 637610 + }, + { + "epoch": 1.65, + "learning_rate": 5.207954772267167e-05, + "loss": 0.0101, + "step": 637620 + }, + { + "epoch": 1.65, + "learning_rate": 5.20756595063002e-05, + "loss": 0.0087, + "step": 637630 + }, + { + "epoch": 1.65, + "learning_rate": 5.207177128992874e-05, + "loss": 0.0075, + "step": 637640 + }, + { + "epoch": 1.65, + "learning_rate": 5.206788307355727e-05, + "loss": 0.0078, + "step": 637650 + }, + { + "epoch": 1.65, + "learning_rate": 5.206399485718581e-05, + "loss": 0.0071, + "step": 637660 + }, + { + "epoch": 1.65, + "learning_rate": 5.206010664081434e-05, + "loss": 0.0099, + "step": 637670 + }, + { + "epoch": 1.65, + "learning_rate": 5.205621842444288e-05, + "loss": 0.0091, + "step": 637680 + }, + { + "epoch": 1.65, + "learning_rate": 5.205233020807142e-05, + "loss": 0.0078, + "step": 637690 + }, + { + "epoch": 1.65, + "learning_rate": 5.2048441991699954e-05, + "loss": 0.0089, + "step": 637700 + }, + { + "epoch": 1.65, + "learning_rate": 5.204455377532849e-05, + "loss": 0.0074, + "step": 637710 + }, + { + "epoch": 1.65, + "learning_rate": 5.2040665558957024e-05, + "loss": 0.0094, + "step": 637720 + }, + { + "epoch": 1.65, + "learning_rate": 5.203677734258556e-05, + "loss": 0.0101, + "step": 637730 + }, + { + "epoch": 1.65, + "learning_rate": 5.2032889126214094e-05, + "loss": 0.0082, + "step": 637740 + }, + { + "epoch": 1.65, + "learning_rate": 5.202900090984263e-05, + "loss": 0.0073, + "step": 637750 + }, + { + "epoch": 1.65, + "learning_rate": 5.2025112693471157e-05, + "loss": 0.0108, + "step": 637760 + }, + { + "epoch": 1.65, + "learning_rate": 5.202122447709969e-05, + "loss": 0.0075, + "step": 637770 + }, + { + "epoch": 1.65, + "learning_rate": 5.2017336260728226e-05, + "loss": 0.013, + "step": 637780 + }, + { + "epoch": 1.65, + "learning_rate": 5.201344804435677e-05, + "loss": 0.008, + "step": 637790 + }, + { + "epoch": 1.65, + "learning_rate": 5.20095598279853e-05, + "loss": 0.008, + "step": 637800 + }, + { + "epoch": 1.65, + "learning_rate": 5.200567161161384e-05, + "loss": 0.008, + "step": 637810 + }, + { + "epoch": 1.65, + "learning_rate": 5.200178339524237e-05, + "loss": 0.0081, + "step": 637820 + }, + { + "epoch": 1.65, + "learning_rate": 5.199789517887091e-05, + "loss": 0.0094, + "step": 637830 + }, + { + "epoch": 1.65, + "learning_rate": 5.199400696249944e-05, + "loss": 0.0061, + "step": 637840 + }, + { + "epoch": 1.65, + "learning_rate": 5.199011874612798e-05, + "loss": 0.0084, + "step": 637850 + }, + { + "epoch": 1.65, + "learning_rate": 5.198623052975651e-05, + "loss": 0.0109, + "step": 637860 + }, + { + "epoch": 1.65, + "learning_rate": 5.1982342313385054e-05, + "loss": 0.0083, + "step": 637870 + }, + { + "epoch": 1.65, + "learning_rate": 5.197845409701359e-05, + "loss": 0.0097, + "step": 637880 + }, + { + "epoch": 1.65, + "learning_rate": 5.197456588064212e-05, + "loss": 0.0085, + "step": 637890 + }, + { + "epoch": 1.65, + "learning_rate": 5.197067766427066e-05, + "loss": 0.0057, + "step": 637900 + }, + { + "epoch": 1.65, + "learning_rate": 5.196678944789919e-05, + "loss": 0.0068, + "step": 637910 + }, + { + "epoch": 1.65, + "learning_rate": 5.196290123152773e-05, + "loss": 0.0088, + "step": 637920 + }, + { + "epoch": 1.65, + "learning_rate": 5.195901301515626e-05, + "loss": 0.0098, + "step": 637930 + }, + { + "epoch": 1.65, + "learning_rate": 5.19551247987848e-05, + "loss": 0.0075, + "step": 637940 + }, + { + "epoch": 1.65, + "learning_rate": 5.195123658241334e-05, + "loss": 0.0078, + "step": 637950 + }, + { + "epoch": 1.65, + "learning_rate": 5.1947348366041874e-05, + "loss": 0.0079, + "step": 637960 + }, + { + "epoch": 1.65, + "learning_rate": 5.194346014967041e-05, + "loss": 0.0081, + "step": 637970 + }, + { + "epoch": 1.65, + "learning_rate": 5.1939571933298944e-05, + "loss": 0.0074, + "step": 637980 + }, + { + "epoch": 1.65, + "learning_rate": 5.193568371692748e-05, + "loss": 0.0083, + "step": 637990 + }, + { + "epoch": 1.65, + "learning_rate": 5.1931795500556014e-05, + "loss": 0.01, + "step": 638000 + }, + { + "epoch": 1.65, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.005293059162795544, + "eval_runtime": 107.9559, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.632, + "step": 638000 + }, + { + "epoch": 1.65, + "learning_rate": 5.192790728418454e-05, + "loss": 0.0094, + "step": 638010 + }, + { + "epoch": 1.65, + "learning_rate": 5.1924019067813076e-05, + "loss": 0.0091, + "step": 638020 + }, + { + "epoch": 1.65, + "learning_rate": 5.192013085144161e-05, + "loss": 0.0063, + "step": 638030 + }, + { + "epoch": 1.65, + "learning_rate": 5.1916242635070146e-05, + "loss": 0.0101, + "step": 638040 + }, + { + "epoch": 1.65, + "learning_rate": 5.191235441869869e-05, + "loss": 0.0066, + "step": 638050 + }, + { + "epoch": 1.65, + "learning_rate": 5.190846620232722e-05, + "loss": 0.0069, + "step": 638060 + }, + { + "epoch": 1.65, + "learning_rate": 5.190457798595576e-05, + "loss": 0.011, + "step": 638070 + }, + { + "epoch": 1.65, + "learning_rate": 5.190068976958429e-05, + "loss": 0.0091, + "step": 638080 + }, + { + "epoch": 1.65, + "learning_rate": 5.189680155321283e-05, + "loss": 0.0091, + "step": 638090 + }, + { + "epoch": 1.65, + "learning_rate": 5.189291333684136e-05, + "loss": 0.0068, + "step": 638100 + }, + { + "epoch": 1.65, + "learning_rate": 5.18890251204699e-05, + "loss": 0.0094, + "step": 638110 + }, + { + "epoch": 1.65, + "learning_rate": 5.188513690409843e-05, + "loss": 0.0064, + "step": 638120 + }, + { + "epoch": 1.65, + "learning_rate": 5.188124868772697e-05, + "loss": 0.011, + "step": 638130 + }, + { + "epoch": 1.65, + "learning_rate": 5.187736047135551e-05, + "loss": 0.0071, + "step": 638140 + }, + { + "epoch": 1.65, + "learning_rate": 5.187347225498404e-05, + "loss": 0.0097, + "step": 638150 + }, + { + "epoch": 1.65, + "learning_rate": 5.186958403861258e-05, + "loss": 0.0101, + "step": 638160 + }, + { + "epoch": 1.65, + "learning_rate": 5.186569582224111e-05, + "loss": 0.0078, + "step": 638170 + }, + { + "epoch": 1.65, + "learning_rate": 5.186180760586965e-05, + "loss": 0.0084, + "step": 638180 + }, + { + "epoch": 1.65, + "learning_rate": 5.185791938949818e-05, + "loss": 0.0065, + "step": 638190 + }, + { + "epoch": 1.65, + "learning_rate": 5.185403117312672e-05, + "loss": 0.01, + "step": 638200 + }, + { + "epoch": 1.65, + "learning_rate": 5.185014295675525e-05, + "loss": 0.0067, + "step": 638210 + }, + { + "epoch": 1.65, + "learning_rate": 5.1846254740383794e-05, + "loss": 0.0074, + "step": 638220 + }, + { + "epoch": 1.65, + "learning_rate": 5.184236652401233e-05, + "loss": 0.0072, + "step": 638230 + }, + { + "epoch": 1.65, + "learning_rate": 5.1838478307640864e-05, + "loss": 0.0067, + "step": 638240 + }, + { + "epoch": 1.65, + "learning_rate": 5.18345900912694e-05, + "loss": 0.01, + "step": 638250 + }, + { + "epoch": 1.65, + "learning_rate": 5.183070187489793e-05, + "loss": 0.009, + "step": 638260 + }, + { + "epoch": 1.65, + "learning_rate": 5.182681365852646e-05, + "loss": 0.0091, + "step": 638270 + }, + { + "epoch": 1.65, + "learning_rate": 5.1822925442154996e-05, + "loss": 0.007, + "step": 638280 + }, + { + "epoch": 1.65, + "learning_rate": 5.181903722578353e-05, + "loss": 0.0109, + "step": 638290 + }, + { + "epoch": 1.65, + "learning_rate": 5.1815149009412066e-05, + "loss": 0.0067, + "step": 638300 + }, + { + "epoch": 1.65, + "learning_rate": 5.18112607930406e-05, + "loss": 0.0089, + "step": 638310 + }, + { + "epoch": 1.65, + "learning_rate": 5.180737257666914e-05, + "loss": 0.0067, + "step": 638320 + }, + { + "epoch": 1.65, + "learning_rate": 5.180348436029768e-05, + "loss": 0.009, + "step": 638330 + }, + { + "epoch": 1.65, + "learning_rate": 5.179959614392621e-05, + "loss": 0.0072, + "step": 638340 + }, + { + "epoch": 1.65, + "learning_rate": 5.179570792755475e-05, + "loss": 0.0096, + "step": 638350 + }, + { + "epoch": 1.65, + "learning_rate": 5.179181971118328e-05, + "loss": 0.0081, + "step": 638360 + }, + { + "epoch": 1.65, + "learning_rate": 5.178793149481182e-05, + "loss": 0.0094, + "step": 638370 + }, + { + "epoch": 1.65, + "learning_rate": 5.178404327844035e-05, + "loss": 0.0099, + "step": 638380 + }, + { + "epoch": 1.65, + "learning_rate": 5.178015506206889e-05, + "loss": 0.0095, + "step": 638390 + }, + { + "epoch": 1.65, + "learning_rate": 5.177626684569743e-05, + "loss": 0.0066, + "step": 638400 + }, + { + "epoch": 1.65, + "learning_rate": 5.177237862932596e-05, + "loss": 0.0101, + "step": 638410 + }, + { + "epoch": 1.65, + "learning_rate": 5.17684904129545e-05, + "loss": 0.0077, + "step": 638420 + }, + { + "epoch": 1.65, + "learning_rate": 5.176460219658303e-05, + "loss": 0.009, + "step": 638430 + }, + { + "epoch": 1.65, + "learning_rate": 5.176071398021157e-05, + "loss": 0.0076, + "step": 638440 + }, + { + "epoch": 1.65, + "learning_rate": 5.17568257638401e-05, + "loss": 0.0085, + "step": 638450 + }, + { + "epoch": 1.65, + "learning_rate": 5.175293754746864e-05, + "loss": 0.0069, + "step": 638460 + }, + { + "epoch": 1.66, + "learning_rate": 5.174904933109717e-05, + "loss": 0.0078, + "step": 638470 + }, + { + "epoch": 1.66, + "learning_rate": 5.1745161114725714e-05, + "loss": 0.0062, + "step": 638480 + }, + { + "epoch": 1.66, + "learning_rate": 5.174127289835425e-05, + "loss": 0.0068, + "step": 638490 + }, + { + "epoch": 1.66, + "learning_rate": 5.1737384681982784e-05, + "loss": 0.0088, + "step": 638500 + }, + { + "epoch": 1.66, + "learning_rate": 5.173349646561131e-05, + "loss": 0.0079, + "step": 638510 + }, + { + "epoch": 1.66, + "learning_rate": 5.172960824923985e-05, + "loss": 0.0069, + "step": 638520 + }, + { + "epoch": 1.66, + "learning_rate": 5.172572003286838e-05, + "loss": 0.0098, + "step": 638530 + }, + { + "epoch": 1.66, + "learning_rate": 5.1721831816496916e-05, + "loss": 0.0057, + "step": 638540 + }, + { + "epoch": 1.66, + "learning_rate": 5.171794360012545e-05, + "loss": 0.0101, + "step": 638550 + }, + { + "epoch": 1.66, + "learning_rate": 5.1714055383753986e-05, + "loss": 0.0111, + "step": 638560 + }, + { + "epoch": 1.66, + "learning_rate": 5.171016716738252e-05, + "loss": 0.0077, + "step": 638570 + }, + { + "epoch": 1.66, + "learning_rate": 5.170627895101106e-05, + "loss": 0.0082, + "step": 638580 + }, + { + "epoch": 1.66, + "learning_rate": 5.17023907346396e-05, + "loss": 0.0118, + "step": 638590 + }, + { + "epoch": 1.66, + "learning_rate": 5.169850251826813e-05, + "loss": 0.0143, + "step": 638600 + }, + { + "epoch": 1.66, + "learning_rate": 5.169461430189667e-05, + "loss": 0.0069, + "step": 638610 + }, + { + "epoch": 1.66, + "learning_rate": 5.16907260855252e-05, + "loss": 0.0069, + "step": 638620 + }, + { + "epoch": 1.66, + "learning_rate": 5.168683786915374e-05, + "loss": 0.008, + "step": 638630 + }, + { + "epoch": 1.66, + "learning_rate": 5.168294965278227e-05, + "loss": 0.0063, + "step": 638640 + }, + { + "epoch": 1.66, + "learning_rate": 5.167906143641081e-05, + "loss": 0.0067, + "step": 638650 + }, + { + "epoch": 1.66, + "learning_rate": 5.167517322003935e-05, + "loss": 0.0081, + "step": 638660 + }, + { + "epoch": 1.66, + "learning_rate": 5.167128500366788e-05, + "loss": 0.0059, + "step": 638670 + }, + { + "epoch": 1.66, + "learning_rate": 5.166739678729642e-05, + "loss": 0.0086, + "step": 638680 + }, + { + "epoch": 1.66, + "learning_rate": 5.166350857092495e-05, + "loss": 0.0094, + "step": 638690 + }, + { + "epoch": 1.66, + "learning_rate": 5.165962035455349e-05, + "loss": 0.009, + "step": 638700 + }, + { + "epoch": 1.66, + "learning_rate": 5.165573213818202e-05, + "loss": 0.0095, + "step": 638710 + }, + { + "epoch": 1.66, + "learning_rate": 5.165184392181056e-05, + "loss": 0.007, + "step": 638720 + }, + { + "epoch": 1.66, + "learning_rate": 5.164795570543909e-05, + "loss": 0.0072, + "step": 638730 + }, + { + "epoch": 1.66, + "learning_rate": 5.1644067489067634e-05, + "loss": 0.0076, + "step": 638740 + }, + { + "epoch": 1.66, + "learning_rate": 5.164017927269617e-05, + "loss": 0.0077, + "step": 638750 + }, + { + "epoch": 1.66, + "learning_rate": 5.16362910563247e-05, + "loss": 0.0129, + "step": 638760 + }, + { + "epoch": 1.66, + "learning_rate": 5.163240283995323e-05, + "loss": 0.0085, + "step": 638770 + }, + { + "epoch": 1.66, + "learning_rate": 5.1628514623581767e-05, + "loss": 0.0098, + "step": 638780 + }, + { + "epoch": 1.66, + "learning_rate": 5.16246264072103e-05, + "loss": 0.0072, + "step": 638790 + }, + { + "epoch": 1.66, + "learning_rate": 5.1620738190838836e-05, + "loss": 0.0076, + "step": 638800 + }, + { + "epoch": 1.66, + "learning_rate": 5.161684997446737e-05, + "loss": 0.0099, + "step": 638810 + }, + { + "epoch": 1.66, + "learning_rate": 5.1612961758095906e-05, + "loss": 0.0073, + "step": 638820 + }, + { + "epoch": 1.66, + "learning_rate": 5.160907354172444e-05, + "loss": 0.0073, + "step": 638830 + }, + { + "epoch": 1.66, + "learning_rate": 5.160518532535298e-05, + "loss": 0.0087, + "step": 638840 + }, + { + "epoch": 1.66, + "learning_rate": 5.160129710898152e-05, + "loss": 0.0086, + "step": 638850 + }, + { + "epoch": 1.66, + "learning_rate": 5.159740889261005e-05, + "loss": 0.0084, + "step": 638860 + }, + { + "epoch": 1.66, + "learning_rate": 5.159352067623859e-05, + "loss": 0.0068, + "step": 638870 + }, + { + "epoch": 1.66, + "learning_rate": 5.158963245986712e-05, + "loss": 0.0067, + "step": 638880 + }, + { + "epoch": 1.66, + "learning_rate": 5.158574424349566e-05, + "loss": 0.0073, + "step": 638890 + }, + { + "epoch": 1.66, + "learning_rate": 5.158185602712419e-05, + "loss": 0.0137, + "step": 638900 + }, + { + "epoch": 1.66, + "learning_rate": 5.1577967810752727e-05, + "loss": 0.0084, + "step": 638910 + }, + { + "epoch": 1.66, + "learning_rate": 5.157407959438127e-05, + "loss": 0.009, + "step": 638920 + }, + { + "epoch": 1.66, + "learning_rate": 5.15701913780098e-05, + "loss": 0.0068, + "step": 638930 + }, + { + "epoch": 1.66, + "learning_rate": 5.156630316163834e-05, + "loss": 0.0098, + "step": 638940 + }, + { + "epoch": 1.66, + "learning_rate": 5.156241494526687e-05, + "loss": 0.0076, + "step": 638950 + }, + { + "epoch": 1.66, + "learning_rate": 5.155852672889541e-05, + "loss": 0.0055, + "step": 638960 + }, + { + "epoch": 1.66, + "learning_rate": 5.155463851252394e-05, + "loss": 0.0105, + "step": 638970 + }, + { + "epoch": 1.66, + "learning_rate": 5.155075029615248e-05, + "loss": 0.0071, + "step": 638980 + }, + { + "epoch": 1.66, + "learning_rate": 5.154686207978101e-05, + "loss": 0.0101, + "step": 638990 + }, + { + "epoch": 1.66, + "learning_rate": 5.154297386340954e-05, + "loss": 0.0095, + "step": 639000 + }, + { + "epoch": 1.66, + "eval_cer": 0.8816564983043399, + "eval_loss": 0.005335902329534292, + "eval_runtime": 107.8798, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 639000 + }, + { + "epoch": 1.66, + "learning_rate": 5.1539085647038075e-05, + "loss": 0.0056, + "step": 639010 + }, + { + "epoch": 1.66, + "learning_rate": 5.153519743066662e-05, + "loss": 0.0079, + "step": 639020 + }, + { + "epoch": 1.66, + "learning_rate": 5.153130921429515e-05, + "loss": 0.0089, + "step": 639030 + }, + { + "epoch": 1.66, + "learning_rate": 5.1527420997923687e-05, + "loss": 0.0075, + "step": 639040 + }, + { + "epoch": 1.66, + "learning_rate": 5.152353278155222e-05, + "loss": 0.0065, + "step": 639050 + }, + { + "epoch": 1.66, + "learning_rate": 5.1519644565180756e-05, + "loss": 0.0092, + "step": 639060 + }, + { + "epoch": 1.66, + "learning_rate": 5.151575634880929e-05, + "loss": 0.0095, + "step": 639070 + }, + { + "epoch": 1.66, + "learning_rate": 5.1511868132437826e-05, + "loss": 0.0112, + "step": 639080 + }, + { + "epoch": 1.66, + "learning_rate": 5.150797991606636e-05, + "loss": 0.0095, + "step": 639090 + }, + { + "epoch": 1.66, + "learning_rate": 5.15040916996949e-05, + "loss": 0.0078, + "step": 639100 + }, + { + "epoch": 1.66, + "learning_rate": 5.150020348332344e-05, + "loss": 0.011, + "step": 639110 + }, + { + "epoch": 1.66, + "learning_rate": 5.149631526695197e-05, + "loss": 0.0076, + "step": 639120 + }, + { + "epoch": 1.66, + "learning_rate": 5.149242705058051e-05, + "loss": 0.0079, + "step": 639130 + }, + { + "epoch": 1.66, + "learning_rate": 5.148853883420904e-05, + "loss": 0.0061, + "step": 639140 + }, + { + "epoch": 1.66, + "learning_rate": 5.148465061783758e-05, + "loss": 0.0065, + "step": 639150 + }, + { + "epoch": 1.66, + "learning_rate": 5.148076240146611e-05, + "loss": 0.0067, + "step": 639160 + }, + { + "epoch": 1.66, + "learning_rate": 5.1476874185094647e-05, + "loss": 0.0093, + "step": 639170 + }, + { + "epoch": 1.66, + "learning_rate": 5.147298596872319e-05, + "loss": 0.0065, + "step": 639180 + }, + { + "epoch": 1.66, + "learning_rate": 5.146909775235172e-05, + "loss": 0.0067, + "step": 639190 + }, + { + "epoch": 1.66, + "learning_rate": 5.146520953598026e-05, + "loss": 0.0074, + "step": 639200 + }, + { + "epoch": 1.66, + "learning_rate": 5.146132131960879e-05, + "loss": 0.0065, + "step": 639210 + }, + { + "epoch": 1.66, + "learning_rate": 5.145743310323733e-05, + "loss": 0.0093, + "step": 639220 + }, + { + "epoch": 1.66, + "learning_rate": 5.145354488686586e-05, + "loss": 0.0079, + "step": 639230 + }, + { + "epoch": 1.66, + "learning_rate": 5.14496566704944e-05, + "loss": 0.0083, + "step": 639240 + }, + { + "epoch": 1.66, + "learning_rate": 5.1445768454122925e-05, + "loss": 0.0073, + "step": 639250 + }, + { + "epoch": 1.66, + "learning_rate": 5.144188023775146e-05, + "loss": 0.0101, + "step": 639260 + }, + { + "epoch": 1.66, + "learning_rate": 5.1437992021379995e-05, + "loss": 0.0081, + "step": 639270 + }, + { + "epoch": 1.66, + "learning_rate": 5.143410380500854e-05, + "loss": 0.008, + "step": 639280 + }, + { + "epoch": 1.66, + "learning_rate": 5.143021558863707e-05, + "loss": 0.0099, + "step": 639290 + }, + { + "epoch": 1.66, + "learning_rate": 5.1426327372265607e-05, + "loss": 0.0084, + "step": 639300 + }, + { + "epoch": 1.66, + "learning_rate": 5.142243915589414e-05, + "loss": 0.0057, + "step": 639310 + }, + { + "epoch": 1.66, + "learning_rate": 5.1418550939522676e-05, + "loss": 0.0068, + "step": 639320 + }, + { + "epoch": 1.66, + "learning_rate": 5.141466272315121e-05, + "loss": 0.012, + "step": 639330 + }, + { + "epoch": 1.66, + "learning_rate": 5.1410774506779746e-05, + "loss": 0.0088, + "step": 639340 + }, + { + "epoch": 1.66, + "learning_rate": 5.140688629040828e-05, + "loss": 0.009, + "step": 639350 + }, + { + "epoch": 1.66, + "learning_rate": 5.140299807403682e-05, + "loss": 0.0092, + "step": 639360 + }, + { + "epoch": 1.66, + "learning_rate": 5.139910985766536e-05, + "loss": 0.0081, + "step": 639370 + }, + { + "epoch": 1.66, + "learning_rate": 5.139522164129389e-05, + "loss": 0.0096, + "step": 639380 + }, + { + "epoch": 1.66, + "learning_rate": 5.139133342492243e-05, + "loss": 0.0085, + "step": 639390 + }, + { + "epoch": 1.66, + "learning_rate": 5.138744520855096e-05, + "loss": 0.0064, + "step": 639400 + }, + { + "epoch": 1.66, + "learning_rate": 5.13835569921795e-05, + "loss": 0.0085, + "step": 639410 + }, + { + "epoch": 1.66, + "learning_rate": 5.137966877580803e-05, + "loss": 0.0106, + "step": 639420 + }, + { + "epoch": 1.66, + "learning_rate": 5.1375780559436566e-05, + "loss": 0.0118, + "step": 639430 + }, + { + "epoch": 1.66, + "learning_rate": 5.13718923430651e-05, + "loss": 0.0062, + "step": 639440 + }, + { + "epoch": 1.66, + "learning_rate": 5.136800412669364e-05, + "loss": 0.0066, + "step": 639450 + }, + { + "epoch": 1.66, + "learning_rate": 5.136411591032218e-05, + "loss": 0.0094, + "step": 639460 + }, + { + "epoch": 1.66, + "learning_rate": 5.136022769395071e-05, + "loss": 0.0073, + "step": 639470 + }, + { + "epoch": 1.66, + "learning_rate": 5.135633947757925e-05, + "loss": 0.0073, + "step": 639480 + }, + { + "epoch": 1.66, + "learning_rate": 5.135245126120778e-05, + "loss": 0.0093, + "step": 639490 + }, + { + "epoch": 1.66, + "learning_rate": 5.134856304483631e-05, + "loss": 0.0068, + "step": 639500 + }, + { + "epoch": 1.66, + "learning_rate": 5.1344674828464845e-05, + "loss": 0.0087, + "step": 639510 + }, + { + "epoch": 1.66, + "learning_rate": 5.134078661209338e-05, + "loss": 0.0064, + "step": 639520 + }, + { + "epoch": 1.66, + "learning_rate": 5.1336898395721915e-05, + "loss": 0.0092, + "step": 639530 + }, + { + "epoch": 1.66, + "learning_rate": 5.133301017935046e-05, + "loss": 0.0077, + "step": 639540 + }, + { + "epoch": 1.66, + "learning_rate": 5.132912196297899e-05, + "loss": 0.0098, + "step": 639550 + }, + { + "epoch": 1.66, + "learning_rate": 5.1325233746607526e-05, + "loss": 0.0072, + "step": 639560 + }, + { + "epoch": 1.66, + "learning_rate": 5.132134553023606e-05, + "loss": 0.0072, + "step": 639570 + }, + { + "epoch": 1.66, + "learning_rate": 5.1317457313864596e-05, + "loss": 0.0096, + "step": 639580 + }, + { + "epoch": 1.66, + "learning_rate": 5.131356909749313e-05, + "loss": 0.0048, + "step": 639590 + }, + { + "epoch": 1.66, + "learning_rate": 5.1309680881121666e-05, + "loss": 0.0069, + "step": 639600 + }, + { + "epoch": 1.66, + "learning_rate": 5.13057926647502e-05, + "loss": 0.0092, + "step": 639610 + }, + { + "epoch": 1.66, + "learning_rate": 5.1301904448378736e-05, + "loss": 0.0125, + "step": 639620 + }, + { + "epoch": 1.66, + "learning_rate": 5.129801623200728e-05, + "loss": 0.008, + "step": 639630 + }, + { + "epoch": 1.66, + "learning_rate": 5.129412801563581e-05, + "loss": 0.0072, + "step": 639640 + }, + { + "epoch": 1.66, + "learning_rate": 5.129023979926435e-05, + "loss": 0.0103, + "step": 639650 + }, + { + "epoch": 1.66, + "learning_rate": 5.128635158289288e-05, + "loss": 0.0077, + "step": 639660 + }, + { + "epoch": 1.66, + "learning_rate": 5.128246336652142e-05, + "loss": 0.01, + "step": 639670 + }, + { + "epoch": 1.66, + "learning_rate": 5.127857515014995e-05, + "loss": 0.0075, + "step": 639680 + }, + { + "epoch": 1.66, + "learning_rate": 5.1274686933778486e-05, + "loss": 0.009, + "step": 639690 + }, + { + "epoch": 1.66, + "learning_rate": 5.127079871740702e-05, + "loss": 0.0087, + "step": 639700 + }, + { + "epoch": 1.66, + "learning_rate": 5.126691050103556e-05, + "loss": 0.0072, + "step": 639710 + }, + { + "epoch": 1.66, + "learning_rate": 5.12630222846641e-05, + "loss": 0.0075, + "step": 639720 + }, + { + "epoch": 1.66, + "learning_rate": 5.125913406829263e-05, + "loss": 0.007, + "step": 639730 + }, + { + "epoch": 1.66, + "learning_rate": 5.125524585192117e-05, + "loss": 0.0083, + "step": 639740 + }, + { + "epoch": 1.66, + "learning_rate": 5.1251357635549696e-05, + "loss": 0.0079, + "step": 639750 + }, + { + "epoch": 1.66, + "learning_rate": 5.124746941917823e-05, + "loss": 0.0042, + "step": 639760 + }, + { + "epoch": 1.66, + "learning_rate": 5.1243581202806765e-05, + "loss": 0.0068, + "step": 639770 + }, + { + "epoch": 1.66, + "learning_rate": 5.12396929864353e-05, + "loss": 0.009, + "step": 639780 + }, + { + "epoch": 1.66, + "learning_rate": 5.1235804770063835e-05, + "loss": 0.0104, + "step": 639790 + }, + { + "epoch": 1.66, + "learning_rate": 5.123191655369237e-05, + "loss": 0.0099, + "step": 639800 + }, + { + "epoch": 1.66, + "learning_rate": 5.122802833732091e-05, + "loss": 0.007, + "step": 639810 + }, + { + "epoch": 1.66, + "learning_rate": 5.1224140120949446e-05, + "loss": 0.0111, + "step": 639820 + }, + { + "epoch": 1.66, + "learning_rate": 5.122025190457798e-05, + "loss": 0.0068, + "step": 639830 + }, + { + "epoch": 1.66, + "learning_rate": 5.1216363688206516e-05, + "loss": 0.0097, + "step": 639840 + }, + { + "epoch": 1.66, + "learning_rate": 5.121247547183505e-05, + "loss": 0.0075, + "step": 639850 + }, + { + "epoch": 1.66, + "learning_rate": 5.1208587255463586e-05, + "loss": 0.0094, + "step": 639860 + }, + { + "epoch": 1.66, + "learning_rate": 5.120469903909212e-05, + "loss": 0.0103, + "step": 639870 + }, + { + "epoch": 1.66, + "learning_rate": 5.1200810822720656e-05, + "loss": 0.0095, + "step": 639880 + }, + { + "epoch": 1.66, + "learning_rate": 5.11969226063492e-05, + "loss": 0.0069, + "step": 639890 + }, + { + "epoch": 1.66, + "learning_rate": 5.119303438997773e-05, + "loss": 0.0076, + "step": 639900 + }, + { + "epoch": 1.66, + "learning_rate": 5.118914617360627e-05, + "loss": 0.0105, + "step": 639910 + }, + { + "epoch": 1.66, + "learning_rate": 5.11852579572348e-05, + "loss": 0.0092, + "step": 639920 + }, + { + "epoch": 1.66, + "learning_rate": 5.118136974086334e-05, + "loss": 0.0116, + "step": 639930 + }, + { + "epoch": 1.66, + "learning_rate": 5.117748152449187e-05, + "loss": 0.0077, + "step": 639940 + }, + { + "epoch": 1.66, + "learning_rate": 5.1173593308120406e-05, + "loss": 0.013, + "step": 639950 + }, + { + "epoch": 1.66, + "learning_rate": 5.116970509174894e-05, + "loss": 0.0077, + "step": 639960 + }, + { + "epoch": 1.66, + "learning_rate": 5.116581687537748e-05, + "loss": 0.0085, + "step": 639970 + }, + { + "epoch": 1.66, + "learning_rate": 5.116192865900602e-05, + "loss": 0.0098, + "step": 639980 + }, + { + "epoch": 1.66, + "learning_rate": 5.115804044263455e-05, + "loss": 0.0072, + "step": 639990 + }, + { + "epoch": 1.66, + "learning_rate": 5.115415222626308e-05, + "loss": 0.008, + "step": 640000 + }, + { + "epoch": 1.66, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.005218719597905874, + "eval_runtime": 107.9407, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 640000 + }, + { + "epoch": 1.66, + "learning_rate": 5.1150264009891616e-05, + "loss": 0.0117, + "step": 640010 + }, + { + "epoch": 1.66, + "learning_rate": 5.114637579352015e-05, + "loss": 0.0093, + "step": 640020 + }, + { + "epoch": 1.66, + "learning_rate": 5.1142487577148685e-05, + "loss": 0.0089, + "step": 640030 + }, + { + "epoch": 1.66, + "learning_rate": 5.113859936077722e-05, + "loss": 0.0073, + "step": 640040 + }, + { + "epoch": 1.66, + "learning_rate": 5.1134711144405755e-05, + "loss": 0.0078, + "step": 640050 + }, + { + "epoch": 1.66, + "learning_rate": 5.113082292803429e-05, + "loss": 0.0091, + "step": 640060 + }, + { + "epoch": 1.66, + "learning_rate": 5.112693471166283e-05, + "loss": 0.0061, + "step": 640070 + }, + { + "epoch": 1.66, + "learning_rate": 5.1123046495291366e-05, + "loss": 0.0078, + "step": 640080 + }, + { + "epoch": 1.66, + "learning_rate": 5.11191582789199e-05, + "loss": 0.007, + "step": 640090 + }, + { + "epoch": 1.66, + "learning_rate": 5.1115270062548436e-05, + "loss": 0.011, + "step": 640100 + }, + { + "epoch": 1.66, + "learning_rate": 5.111138184617697e-05, + "loss": 0.0079, + "step": 640110 + }, + { + "epoch": 1.66, + "learning_rate": 5.1107493629805506e-05, + "loss": 0.0063, + "step": 640120 + }, + { + "epoch": 1.66, + "learning_rate": 5.110360541343404e-05, + "loss": 0.0076, + "step": 640130 + }, + { + "epoch": 1.66, + "learning_rate": 5.1099717197062576e-05, + "loss": 0.0075, + "step": 640140 + }, + { + "epoch": 1.66, + "learning_rate": 5.109582898069112e-05, + "loss": 0.0055, + "step": 640150 + }, + { + "epoch": 1.66, + "learning_rate": 5.109194076431965e-05, + "loss": 0.0074, + "step": 640160 + }, + { + "epoch": 1.66, + "learning_rate": 5.108805254794819e-05, + "loss": 0.0072, + "step": 640170 + }, + { + "epoch": 1.66, + "learning_rate": 5.108416433157672e-05, + "loss": 0.0078, + "step": 640180 + }, + { + "epoch": 1.66, + "learning_rate": 5.1080276115205257e-05, + "loss": 0.0106, + "step": 640190 + }, + { + "epoch": 1.66, + "learning_rate": 5.107638789883379e-05, + "loss": 0.0065, + "step": 640200 + }, + { + "epoch": 1.66, + "learning_rate": 5.1072499682462326e-05, + "loss": 0.01, + "step": 640210 + }, + { + "epoch": 1.66, + "learning_rate": 5.106861146609086e-05, + "loss": 0.0101, + "step": 640220 + }, + { + "epoch": 1.66, + "learning_rate": 5.10647232497194e-05, + "loss": 0.0089, + "step": 640230 + }, + { + "epoch": 1.66, + "learning_rate": 5.1060835033347924e-05, + "loss": 0.0092, + "step": 640240 + }, + { + "epoch": 1.66, + "learning_rate": 5.1056946816976466e-05, + "loss": 0.0071, + "step": 640250 + }, + { + "epoch": 1.66, + "learning_rate": 5.1053058600605e-05, + "loss": 0.0084, + "step": 640260 + }, + { + "epoch": 1.66, + "learning_rate": 5.1049170384233536e-05, + "loss": 0.0083, + "step": 640270 + }, + { + "epoch": 1.66, + "learning_rate": 5.104528216786207e-05, + "loss": 0.0112, + "step": 640280 + }, + { + "epoch": 1.66, + "learning_rate": 5.1041393951490605e-05, + "loss": 0.0114, + "step": 640290 + }, + { + "epoch": 1.66, + "learning_rate": 5.103750573511914e-05, + "loss": 0.0088, + "step": 640300 + }, + { + "epoch": 1.66, + "learning_rate": 5.1033617518747675e-05, + "loss": 0.0112, + "step": 640310 + }, + { + "epoch": 1.66, + "learning_rate": 5.102972930237621e-05, + "loss": 0.0069, + "step": 640320 + }, + { + "epoch": 1.66, + "learning_rate": 5.102584108600475e-05, + "loss": 0.0083, + "step": 640330 + }, + { + "epoch": 1.66, + "learning_rate": 5.1021952869633286e-05, + "loss": 0.0101, + "step": 640340 + }, + { + "epoch": 1.66, + "learning_rate": 5.101806465326182e-05, + "loss": 0.0082, + "step": 640350 + }, + { + "epoch": 1.66, + "learning_rate": 5.1014176436890356e-05, + "loss": 0.0089, + "step": 640360 + }, + { + "epoch": 1.66, + "learning_rate": 5.101028822051889e-05, + "loss": 0.0114, + "step": 640370 + }, + { + "epoch": 1.66, + "learning_rate": 5.1006400004147426e-05, + "loss": 0.0085, + "step": 640380 + }, + { + "epoch": 1.66, + "learning_rate": 5.100251178777596e-05, + "loss": 0.0129, + "step": 640390 + }, + { + "epoch": 1.66, + "learning_rate": 5.0998623571404495e-05, + "loss": 0.0101, + "step": 640400 + }, + { + "epoch": 1.66, + "learning_rate": 5.099473535503304e-05, + "loss": 0.0124, + "step": 640410 + }, + { + "epoch": 1.66, + "learning_rate": 5.099084713866157e-05, + "loss": 0.0064, + "step": 640420 + }, + { + "epoch": 1.66, + "learning_rate": 5.098695892229011e-05, + "loss": 0.0084, + "step": 640430 + }, + { + "epoch": 1.66, + "learning_rate": 5.098307070591864e-05, + "loss": 0.0068, + "step": 640440 + }, + { + "epoch": 1.66, + "learning_rate": 5.0979182489547177e-05, + "loss": 0.0079, + "step": 640450 + }, + { + "epoch": 1.66, + "learning_rate": 5.097529427317571e-05, + "loss": 0.0069, + "step": 640460 + }, + { + "epoch": 1.66, + "learning_rate": 5.0971406056804246e-05, + "loss": 0.0082, + "step": 640470 + }, + { + "epoch": 1.66, + "learning_rate": 5.096751784043278e-05, + "loss": 0.0062, + "step": 640480 + }, + { + "epoch": 1.66, + "learning_rate": 5.096362962406131e-05, + "loss": 0.0109, + "step": 640490 + }, + { + "epoch": 1.66, + "learning_rate": 5.0959741407689844e-05, + "loss": 0.0134, + "step": 640500 + }, + { + "epoch": 1.66, + "learning_rate": 5.0955853191318386e-05, + "loss": 0.009, + "step": 640510 + }, + { + "epoch": 1.66, + "learning_rate": 5.095196497494692e-05, + "loss": 0.0061, + "step": 640520 + }, + { + "epoch": 1.66, + "learning_rate": 5.0948076758575455e-05, + "loss": 0.0109, + "step": 640530 + }, + { + "epoch": 1.66, + "learning_rate": 5.094418854220399e-05, + "loss": 0.0103, + "step": 640540 + }, + { + "epoch": 1.66, + "learning_rate": 5.0940300325832525e-05, + "loss": 0.0069, + "step": 640550 + }, + { + "epoch": 1.66, + "learning_rate": 5.093641210946106e-05, + "loss": 0.0064, + "step": 640560 + }, + { + "epoch": 1.66, + "learning_rate": 5.0932523893089595e-05, + "loss": 0.0067, + "step": 640570 + }, + { + "epoch": 1.66, + "learning_rate": 5.092863567671813e-05, + "loss": 0.0088, + "step": 640580 + }, + { + "epoch": 1.66, + "learning_rate": 5.092474746034667e-05, + "loss": 0.011, + "step": 640590 + }, + { + "epoch": 1.66, + "learning_rate": 5.0920859243975206e-05, + "loss": 0.0072, + "step": 640600 + }, + { + "epoch": 1.66, + "learning_rate": 5.091697102760374e-05, + "loss": 0.0089, + "step": 640610 + }, + { + "epoch": 1.66, + "learning_rate": 5.0913082811232276e-05, + "loss": 0.0065, + "step": 640620 + }, + { + "epoch": 1.66, + "learning_rate": 5.090919459486081e-05, + "loss": 0.0067, + "step": 640630 + }, + { + "epoch": 1.66, + "learning_rate": 5.0905306378489346e-05, + "loss": 0.0073, + "step": 640640 + }, + { + "epoch": 1.66, + "learning_rate": 5.090141816211788e-05, + "loss": 0.0075, + "step": 640650 + }, + { + "epoch": 1.66, + "learning_rate": 5.0897529945746415e-05, + "loss": 0.0068, + "step": 640660 + }, + { + "epoch": 1.66, + "learning_rate": 5.089364172937496e-05, + "loss": 0.0091, + "step": 640670 + }, + { + "epoch": 1.66, + "learning_rate": 5.088975351300349e-05, + "loss": 0.009, + "step": 640680 + }, + { + "epoch": 1.66, + "learning_rate": 5.088586529663203e-05, + "loss": 0.0082, + "step": 640690 + }, + { + "epoch": 1.66, + "learning_rate": 5.088197708026056e-05, + "loss": 0.0081, + "step": 640700 + }, + { + "epoch": 1.66, + "learning_rate": 5.0878088863889097e-05, + "loss": 0.006, + "step": 640710 + }, + { + "epoch": 1.66, + "learning_rate": 5.087420064751763e-05, + "loss": 0.0098, + "step": 640720 + }, + { + "epoch": 1.66, + "learning_rate": 5.0870312431146166e-05, + "loss": 0.0089, + "step": 640730 + }, + { + "epoch": 1.66, + "learning_rate": 5.0866424214774694e-05, + "loss": 0.0115, + "step": 640740 + }, + { + "epoch": 1.66, + "learning_rate": 5.086253599840323e-05, + "loss": 0.0078, + "step": 640750 + }, + { + "epoch": 1.66, + "learning_rate": 5.0858647782031764e-05, + "loss": 0.0092, + "step": 640760 + }, + { + "epoch": 1.66, + "learning_rate": 5.0854759565660306e-05, + "loss": 0.0066, + "step": 640770 + }, + { + "epoch": 1.66, + "learning_rate": 5.085087134928884e-05, + "loss": 0.0098, + "step": 640780 + }, + { + "epoch": 1.66, + "learning_rate": 5.0846983132917375e-05, + "loss": 0.0084, + "step": 640790 + }, + { + "epoch": 1.66, + "learning_rate": 5.084309491654591e-05, + "loss": 0.0051, + "step": 640800 + }, + { + "epoch": 1.66, + "learning_rate": 5.0839206700174445e-05, + "loss": 0.0105, + "step": 640810 + }, + { + "epoch": 1.66, + "learning_rate": 5.083531848380298e-05, + "loss": 0.0091, + "step": 640820 + }, + { + "epoch": 1.66, + "learning_rate": 5.0831430267431515e-05, + "loss": 0.0119, + "step": 640830 + }, + { + "epoch": 1.66, + "learning_rate": 5.082754205106005e-05, + "loss": 0.0094, + "step": 640840 + }, + { + "epoch": 1.66, + "learning_rate": 5.082365383468859e-05, + "loss": 0.008, + "step": 640850 + }, + { + "epoch": 1.66, + "learning_rate": 5.0819765618317126e-05, + "loss": 0.0085, + "step": 640860 + }, + { + "epoch": 1.66, + "learning_rate": 5.081587740194566e-05, + "loss": 0.0086, + "step": 640870 + }, + { + "epoch": 1.66, + "learning_rate": 5.0811989185574196e-05, + "loss": 0.0129, + "step": 640880 + }, + { + "epoch": 1.66, + "learning_rate": 5.080810096920273e-05, + "loss": 0.0087, + "step": 640890 + }, + { + "epoch": 1.66, + "learning_rate": 5.0804212752831266e-05, + "loss": 0.0064, + "step": 640900 + }, + { + "epoch": 1.66, + "learning_rate": 5.08003245364598e-05, + "loss": 0.0064, + "step": 640910 + }, + { + "epoch": 1.66, + "learning_rate": 5.0796436320088335e-05, + "loss": 0.0071, + "step": 640920 + }, + { + "epoch": 1.66, + "learning_rate": 5.079254810371687e-05, + "loss": 0.0069, + "step": 640930 + }, + { + "epoch": 1.66, + "learning_rate": 5.078865988734541e-05, + "loss": 0.0095, + "step": 640940 + }, + { + "epoch": 1.66, + "learning_rate": 5.078477167097395e-05, + "loss": 0.01, + "step": 640950 + }, + { + "epoch": 1.66, + "learning_rate": 5.078088345460248e-05, + "loss": 0.0091, + "step": 640960 + }, + { + "epoch": 1.66, + "learning_rate": 5.0776995238231016e-05, + "loss": 0.0103, + "step": 640970 + }, + { + "epoch": 1.66, + "learning_rate": 5.077310702185955e-05, + "loss": 0.0057, + "step": 640980 + }, + { + "epoch": 1.66, + "learning_rate": 5.076921880548808e-05, + "loss": 0.0085, + "step": 640990 + }, + { + "epoch": 1.66, + "learning_rate": 5.0765330589116614e-05, + "loss": 0.0097, + "step": 641000 + }, + { + "epoch": 1.66, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.005241747945547104, + "eval_runtime": 107.7049, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 641000 + }, + { + "epoch": 1.66, + "learning_rate": 5.076144237274515e-05, + "loss": 0.0089, + "step": 641010 + }, + { + "epoch": 1.66, + "learning_rate": 5.0757554156373684e-05, + "loss": 0.0068, + "step": 641020 + }, + { + "epoch": 1.66, + "learning_rate": 5.075366594000222e-05, + "loss": 0.0067, + "step": 641030 + }, + { + "epoch": 1.66, + "learning_rate": 5.074977772363076e-05, + "loss": 0.0076, + "step": 641040 + }, + { + "epoch": 1.66, + "learning_rate": 5.0745889507259295e-05, + "loss": 0.0081, + "step": 641050 + }, + { + "epoch": 1.66, + "learning_rate": 5.074200129088783e-05, + "loss": 0.0069, + "step": 641060 + }, + { + "epoch": 1.66, + "learning_rate": 5.0738113074516365e-05, + "loss": 0.0076, + "step": 641070 + }, + { + "epoch": 1.66, + "learning_rate": 5.07342248581449e-05, + "loss": 0.0095, + "step": 641080 + }, + { + "epoch": 1.66, + "learning_rate": 5.0730336641773435e-05, + "loss": 0.0071, + "step": 641090 + }, + { + "epoch": 1.66, + "learning_rate": 5.072644842540197e-05, + "loss": 0.0086, + "step": 641100 + }, + { + "epoch": 1.66, + "learning_rate": 5.0722560209030505e-05, + "loss": 0.0108, + "step": 641110 + }, + { + "epoch": 1.66, + "learning_rate": 5.0718671992659046e-05, + "loss": 0.0111, + "step": 641120 + }, + { + "epoch": 1.66, + "learning_rate": 5.071478377628758e-05, + "loss": 0.0088, + "step": 641130 + }, + { + "epoch": 1.66, + "learning_rate": 5.0710895559916116e-05, + "loss": 0.0073, + "step": 641140 + }, + { + "epoch": 1.66, + "learning_rate": 5.070700734354465e-05, + "loss": 0.0096, + "step": 641150 + }, + { + "epoch": 1.66, + "learning_rate": 5.0703119127173186e-05, + "loss": 0.0077, + "step": 641160 + }, + { + "epoch": 1.66, + "learning_rate": 5.069923091080172e-05, + "loss": 0.0072, + "step": 641170 + }, + { + "epoch": 1.66, + "learning_rate": 5.0695342694430255e-05, + "loss": 0.0106, + "step": 641180 + }, + { + "epoch": 1.66, + "learning_rate": 5.069145447805879e-05, + "loss": 0.0117, + "step": 641190 + }, + { + "epoch": 1.66, + "learning_rate": 5.068756626168733e-05, + "loss": 0.0076, + "step": 641200 + }, + { + "epoch": 1.66, + "learning_rate": 5.068367804531587e-05, + "loss": 0.0066, + "step": 641210 + }, + { + "epoch": 1.66, + "learning_rate": 5.06797898289444e-05, + "loss": 0.0082, + "step": 641220 + }, + { + "epoch": 1.66, + "learning_rate": 5.0675901612572936e-05, + "loss": 0.0092, + "step": 641230 + }, + { + "epoch": 1.66, + "learning_rate": 5.0672013396201465e-05, + "loss": 0.0096, + "step": 641240 + }, + { + "epoch": 1.66, + "learning_rate": 5.066812517983e-05, + "loss": 0.0099, + "step": 641250 + }, + { + "epoch": 1.66, + "learning_rate": 5.0664236963458534e-05, + "loss": 0.0086, + "step": 641260 + }, + { + "epoch": 1.66, + "learning_rate": 5.066034874708707e-05, + "loss": 0.0079, + "step": 641270 + }, + { + "epoch": 1.66, + "learning_rate": 5.0656460530715604e-05, + "loss": 0.0078, + "step": 641280 + }, + { + "epoch": 1.66, + "learning_rate": 5.065257231434414e-05, + "loss": 0.0082, + "step": 641290 + }, + { + "epoch": 1.66, + "learning_rate": 5.064868409797268e-05, + "loss": 0.0074, + "step": 641300 + }, + { + "epoch": 1.66, + "learning_rate": 5.0644795881601215e-05, + "loss": 0.0094, + "step": 641310 + }, + { + "epoch": 1.66, + "learning_rate": 5.064090766522975e-05, + "loss": 0.0081, + "step": 641320 + }, + { + "epoch": 1.66, + "learning_rate": 5.0637019448858285e-05, + "loss": 0.009, + "step": 641330 + }, + { + "epoch": 1.66, + "learning_rate": 5.063313123248682e-05, + "loss": 0.0102, + "step": 641340 + }, + { + "epoch": 1.66, + "learning_rate": 5.0629243016115355e-05, + "loss": 0.0084, + "step": 641350 + }, + { + "epoch": 1.66, + "learning_rate": 5.062535479974389e-05, + "loss": 0.007, + "step": 641360 + }, + { + "epoch": 1.66, + "learning_rate": 5.0621466583372424e-05, + "loss": 0.007, + "step": 641370 + }, + { + "epoch": 1.66, + "learning_rate": 5.0617578367000966e-05, + "loss": 0.0084, + "step": 641380 + }, + { + "epoch": 1.66, + "learning_rate": 5.06136901506295e-05, + "loss": 0.011, + "step": 641390 + }, + { + "epoch": 1.66, + "learning_rate": 5.0609801934258036e-05, + "loss": 0.0075, + "step": 641400 + }, + { + "epoch": 1.66, + "learning_rate": 5.060591371788657e-05, + "loss": 0.0072, + "step": 641410 + }, + { + "epoch": 1.66, + "learning_rate": 5.0602025501515106e-05, + "loss": 0.0097, + "step": 641420 + }, + { + "epoch": 1.66, + "learning_rate": 5.059813728514364e-05, + "loss": 0.0058, + "step": 641430 + }, + { + "epoch": 1.66, + "learning_rate": 5.0594249068772175e-05, + "loss": 0.0142, + "step": 641440 + }, + { + "epoch": 1.66, + "learning_rate": 5.059036085240071e-05, + "loss": 0.0063, + "step": 641450 + }, + { + "epoch": 1.66, + "learning_rate": 5.058647263602925e-05, + "loss": 0.0084, + "step": 641460 + }, + { + "epoch": 1.66, + "learning_rate": 5.058258441965779e-05, + "loss": 0.0083, + "step": 641470 + }, + { + "epoch": 1.66, + "learning_rate": 5.0578696203286315e-05, + "loss": 0.01, + "step": 641480 + }, + { + "epoch": 1.66, + "learning_rate": 5.057480798691485e-05, + "loss": 0.0073, + "step": 641490 + }, + { + "epoch": 1.66, + "learning_rate": 5.0570919770543384e-05, + "loss": 0.0076, + "step": 641500 + }, + { + "epoch": 1.66, + "learning_rate": 5.056703155417192e-05, + "loss": 0.0098, + "step": 641510 + }, + { + "epoch": 1.66, + "learning_rate": 5.0563143337800454e-05, + "loss": 0.0086, + "step": 641520 + }, + { + "epoch": 1.66, + "learning_rate": 5.055925512142899e-05, + "loss": 0.0095, + "step": 641530 + }, + { + "epoch": 1.66, + "learning_rate": 5.0555366905057524e-05, + "loss": 0.0082, + "step": 641540 + }, + { + "epoch": 1.66, + "learning_rate": 5.055147868868606e-05, + "loss": 0.008, + "step": 641550 + }, + { + "epoch": 1.66, + "learning_rate": 5.05475904723146e-05, + "loss": 0.0061, + "step": 641560 + }, + { + "epoch": 1.66, + "learning_rate": 5.0543702255943135e-05, + "loss": 0.0095, + "step": 641570 + }, + { + "epoch": 1.66, + "learning_rate": 5.053981403957167e-05, + "loss": 0.0083, + "step": 641580 + }, + { + "epoch": 1.66, + "learning_rate": 5.0535925823200205e-05, + "loss": 0.0065, + "step": 641590 + }, + { + "epoch": 1.66, + "learning_rate": 5.053203760682874e-05, + "loss": 0.0087, + "step": 641600 + }, + { + "epoch": 1.66, + "learning_rate": 5.0528149390457275e-05, + "loss": 0.0067, + "step": 641610 + }, + { + "epoch": 1.66, + "learning_rate": 5.052426117408581e-05, + "loss": 0.0113, + "step": 641620 + }, + { + "epoch": 1.66, + "learning_rate": 5.0520372957714344e-05, + "loss": 0.0102, + "step": 641630 + }, + { + "epoch": 1.66, + "learning_rate": 5.0516484741342886e-05, + "loss": 0.0072, + "step": 641640 + }, + { + "epoch": 1.66, + "learning_rate": 5.051259652497142e-05, + "loss": 0.0094, + "step": 641650 + }, + { + "epoch": 1.66, + "learning_rate": 5.0508708308599956e-05, + "loss": 0.0094, + "step": 641660 + }, + { + "epoch": 1.66, + "learning_rate": 5.050482009222849e-05, + "loss": 0.006, + "step": 641670 + }, + { + "epoch": 1.66, + "learning_rate": 5.0500931875857026e-05, + "loss": 0.0073, + "step": 641680 + }, + { + "epoch": 1.66, + "learning_rate": 5.049704365948556e-05, + "loss": 0.0079, + "step": 641690 + }, + { + "epoch": 1.66, + "learning_rate": 5.0493155443114095e-05, + "loss": 0.0133, + "step": 641700 + }, + { + "epoch": 1.66, + "learning_rate": 5.048926722674263e-05, + "loss": 0.0065, + "step": 641710 + }, + { + "epoch": 1.66, + "learning_rate": 5.048537901037117e-05, + "loss": 0.0087, + "step": 641720 + }, + { + "epoch": 1.66, + "learning_rate": 5.048149079399969e-05, + "loss": 0.0079, + "step": 641730 + }, + { + "epoch": 1.66, + "learning_rate": 5.0477602577628235e-05, + "loss": 0.0109, + "step": 641740 + }, + { + "epoch": 1.66, + "learning_rate": 5.047371436125677e-05, + "loss": 0.0125, + "step": 641750 + }, + { + "epoch": 1.66, + "learning_rate": 5.0469826144885304e-05, + "loss": 0.0116, + "step": 641760 + }, + { + "epoch": 1.66, + "learning_rate": 5.046593792851384e-05, + "loss": 0.0076, + "step": 641770 + }, + { + "epoch": 1.66, + "learning_rate": 5.0462049712142374e-05, + "loss": 0.0071, + "step": 641780 + }, + { + "epoch": 1.66, + "learning_rate": 5.045816149577091e-05, + "loss": 0.0097, + "step": 641790 + }, + { + "epoch": 1.66, + "learning_rate": 5.0454273279399444e-05, + "loss": 0.0125, + "step": 641800 + }, + { + "epoch": 1.66, + "learning_rate": 5.045038506302798e-05, + "loss": 0.0068, + "step": 641810 + }, + { + "epoch": 1.66, + "learning_rate": 5.044649684665652e-05, + "loss": 0.0093, + "step": 641820 + }, + { + "epoch": 1.66, + "learning_rate": 5.0442608630285055e-05, + "loss": 0.0088, + "step": 641830 + }, + { + "epoch": 1.66, + "learning_rate": 5.043872041391359e-05, + "loss": 0.0097, + "step": 641840 + }, + { + "epoch": 1.66, + "learning_rate": 5.0434832197542125e-05, + "loss": 0.0081, + "step": 641850 + }, + { + "epoch": 1.66, + "learning_rate": 5.043094398117066e-05, + "loss": 0.0073, + "step": 641860 + }, + { + "epoch": 1.66, + "learning_rate": 5.0427055764799195e-05, + "loss": 0.0079, + "step": 641870 + }, + { + "epoch": 1.66, + "learning_rate": 5.042316754842773e-05, + "loss": 0.0069, + "step": 641880 + }, + { + "epoch": 1.66, + "learning_rate": 5.0419279332056264e-05, + "loss": 0.0106, + "step": 641890 + }, + { + "epoch": 1.66, + "learning_rate": 5.0415391115684806e-05, + "loss": 0.0072, + "step": 641900 + }, + { + "epoch": 1.66, + "learning_rate": 5.041150289931334e-05, + "loss": 0.0096, + "step": 641910 + }, + { + "epoch": 1.66, + "learning_rate": 5.0407614682941876e-05, + "loss": 0.0075, + "step": 641920 + }, + { + "epoch": 1.66, + "learning_rate": 5.040372646657041e-05, + "loss": 0.0094, + "step": 641930 + }, + { + "epoch": 1.66, + "learning_rate": 5.0399838250198945e-05, + "loss": 0.0093, + "step": 641940 + }, + { + "epoch": 1.66, + "learning_rate": 5.039595003382748e-05, + "loss": 0.0104, + "step": 641950 + }, + { + "epoch": 1.66, + "learning_rate": 5.0392061817456015e-05, + "loss": 0.0093, + "step": 641960 + }, + { + "epoch": 1.66, + "learning_rate": 5.038817360108455e-05, + "loss": 0.0069, + "step": 641970 + }, + { + "epoch": 1.66, + "learning_rate": 5.038428538471308e-05, + "loss": 0.0076, + "step": 641980 + }, + { + "epoch": 1.66, + "learning_rate": 5.038039716834161e-05, + "loss": 0.006, + "step": 641990 + }, + { + "epoch": 1.66, + "learning_rate": 5.0376508951970155e-05, + "loss": 0.0082, + "step": 642000 + }, + { + "epoch": 1.66, + "eval_cer": 0.88167329394755, + "eval_loss": 0.005268983077257872, + "eval_runtime": 107.7603, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, + "step": 642000 + }, + { + "epoch": 1.66, + "learning_rate": 5.037262073559869e-05, + "loss": 0.0058, + "step": 642010 + }, + { + "epoch": 1.66, + "learning_rate": 5.0368732519227224e-05, + "loss": 0.0084, + "step": 642020 + }, + { + "epoch": 1.66, + "learning_rate": 5.036484430285576e-05, + "loss": 0.0084, + "step": 642030 + }, + { + "epoch": 1.66, + "learning_rate": 5.0360956086484294e-05, + "loss": 0.0079, + "step": 642040 + }, + { + "epoch": 1.66, + "learning_rate": 5.035706787011283e-05, + "loss": 0.0053, + "step": 642050 + }, + { + "epoch": 1.66, + "learning_rate": 5.0353179653741364e-05, + "loss": 0.0094, + "step": 642060 + }, + { + "epoch": 1.66, + "learning_rate": 5.03492914373699e-05, + "loss": 0.0087, + "step": 642070 + }, + { + "epoch": 1.66, + "learning_rate": 5.034540322099844e-05, + "loss": 0.0054, + "step": 642080 + }, + { + "epoch": 1.66, + "learning_rate": 5.0341515004626975e-05, + "loss": 0.0093, + "step": 642090 + }, + { + "epoch": 1.66, + "learning_rate": 5.033762678825551e-05, + "loss": 0.01, + "step": 642100 + }, + { + "epoch": 1.66, + "learning_rate": 5.0333738571884045e-05, + "loss": 0.0093, + "step": 642110 + }, + { + "epoch": 1.66, + "learning_rate": 5.032985035551258e-05, + "loss": 0.0092, + "step": 642120 + }, + { + "epoch": 1.66, + "learning_rate": 5.0325962139141115e-05, + "loss": 0.0097, + "step": 642130 + }, + { + "epoch": 1.66, + "learning_rate": 5.032207392276965e-05, + "loss": 0.0107, + "step": 642140 + }, + { + "epoch": 1.66, + "learning_rate": 5.0318185706398184e-05, + "loss": 0.0076, + "step": 642150 + }, + { + "epoch": 1.66, + "learning_rate": 5.0314297490026726e-05, + "loss": 0.0069, + "step": 642160 + }, + { + "epoch": 1.66, + "learning_rate": 5.031040927365526e-05, + "loss": 0.008, + "step": 642170 + }, + { + "epoch": 1.66, + "learning_rate": 5.0306521057283796e-05, + "loss": 0.009, + "step": 642180 + }, + { + "epoch": 1.66, + "learning_rate": 5.030263284091233e-05, + "loss": 0.0072, + "step": 642190 + }, + { + "epoch": 1.66, + "learning_rate": 5.0298744624540865e-05, + "loss": 0.0061, + "step": 642200 + }, + { + "epoch": 1.66, + "learning_rate": 5.02948564081694e-05, + "loss": 0.0086, + "step": 642210 + }, + { + "epoch": 1.66, + "learning_rate": 5.0290968191797935e-05, + "loss": 0.0089, + "step": 642220 + }, + { + "epoch": 1.66, + "learning_rate": 5.028707997542646e-05, + "loss": 0.0101, + "step": 642230 + }, + { + "epoch": 1.66, + "learning_rate": 5.0283191759055e-05, + "loss": 0.0102, + "step": 642240 + }, + { + "epoch": 1.66, + "learning_rate": 5.027930354268353e-05, + "loss": 0.0075, + "step": 642250 + }, + { + "epoch": 1.66, + "learning_rate": 5.0275415326312075e-05, + "loss": 0.0084, + "step": 642260 + }, + { + "epoch": 1.66, + "learning_rate": 5.027152710994061e-05, + "loss": 0.0081, + "step": 642270 + }, + { + "epoch": 1.66, + "learning_rate": 5.0267638893569144e-05, + "loss": 0.0093, + "step": 642280 + }, + { + "epoch": 1.66, + "learning_rate": 5.026375067719768e-05, + "loss": 0.0071, + "step": 642290 + }, + { + "epoch": 1.66, + "learning_rate": 5.0259862460826214e-05, + "loss": 0.0099, + "step": 642300 + }, + { + "epoch": 1.66, + "learning_rate": 5.025597424445475e-05, + "loss": 0.0084, + "step": 642310 + }, + { + "epoch": 1.66, + "learning_rate": 5.0252086028083284e-05, + "loss": 0.0108, + "step": 642320 + }, + { + "epoch": 1.67, + "learning_rate": 5.024819781171182e-05, + "loss": 0.0072, + "step": 642330 + }, + { + "epoch": 1.67, + "learning_rate": 5.0244309595340353e-05, + "loss": 0.0065, + "step": 642340 + }, + { + "epoch": 1.67, + "learning_rate": 5.0240421378968895e-05, + "loss": 0.0097, + "step": 642350 + }, + { + "epoch": 1.67, + "learning_rate": 5.023653316259743e-05, + "loss": 0.0092, + "step": 642360 + }, + { + "epoch": 1.67, + "learning_rate": 5.0232644946225965e-05, + "loss": 0.0076, + "step": 642370 + }, + { + "epoch": 1.67, + "learning_rate": 5.02287567298545e-05, + "loss": 0.0078, + "step": 642380 + }, + { + "epoch": 1.67, + "learning_rate": 5.0224868513483035e-05, + "loss": 0.0065, + "step": 642390 + }, + { + "epoch": 1.67, + "learning_rate": 5.022098029711157e-05, + "loss": 0.0093, + "step": 642400 + }, + { + "epoch": 1.67, + "learning_rate": 5.0217092080740104e-05, + "loss": 0.0082, + "step": 642410 + }, + { + "epoch": 1.67, + "learning_rate": 5.021320386436864e-05, + "loss": 0.0093, + "step": 642420 + }, + { + "epoch": 1.67, + "learning_rate": 5.020931564799718e-05, + "loss": 0.0093, + "step": 642430 + }, + { + "epoch": 1.67, + "learning_rate": 5.0205427431625716e-05, + "loss": 0.0078, + "step": 642440 + }, + { + "epoch": 1.67, + "learning_rate": 5.020153921525425e-05, + "loss": 0.0059, + "step": 642450 + }, + { + "epoch": 1.67, + "learning_rate": 5.0197650998882785e-05, + "loss": 0.0073, + "step": 642460 + }, + { + "epoch": 1.67, + "learning_rate": 5.019376278251132e-05, + "loss": 0.0066, + "step": 642470 + }, + { + "epoch": 1.67, + "learning_rate": 5.018987456613985e-05, + "loss": 0.0085, + "step": 642480 + }, + { + "epoch": 1.67, + "learning_rate": 5.018598634976838e-05, + "loss": 0.0075, + "step": 642490 + }, + { + "epoch": 1.67, + "learning_rate": 5.018209813339692e-05, + "loss": 0.0069, + "step": 642500 + }, + { + "epoch": 1.67, + "learning_rate": 5.017820991702545e-05, + "loss": 0.0107, + "step": 642510 + }, + { + "epoch": 1.67, + "learning_rate": 5.017432170065399e-05, + "loss": 0.0081, + "step": 642520 + }, + { + "epoch": 1.67, + "learning_rate": 5.017043348428253e-05, + "loss": 0.0086, + "step": 642530 + }, + { + "epoch": 1.67, + "learning_rate": 5.0166545267911064e-05, + "loss": 0.009, + "step": 642540 + }, + { + "epoch": 1.67, + "learning_rate": 5.01626570515396e-05, + "loss": 0.0073, + "step": 642550 + }, + { + "epoch": 1.67, + "learning_rate": 5.0158768835168134e-05, + "loss": 0.0059, + "step": 642560 + }, + { + "epoch": 1.67, + "learning_rate": 5.015488061879667e-05, + "loss": 0.006, + "step": 642570 + }, + { + "epoch": 1.67, + "learning_rate": 5.0150992402425204e-05, + "loss": 0.0085, + "step": 642580 + }, + { + "epoch": 1.67, + "learning_rate": 5.014710418605374e-05, + "loss": 0.011, + "step": 642590 + }, + { + "epoch": 1.67, + "learning_rate": 5.0143215969682273e-05, + "loss": 0.009, + "step": 642600 + }, + { + "epoch": 1.67, + "learning_rate": 5.0139327753310815e-05, + "loss": 0.0083, + "step": 642610 + }, + { + "epoch": 1.67, + "learning_rate": 5.013543953693935e-05, + "loss": 0.007, + "step": 642620 + }, + { + "epoch": 1.67, + "learning_rate": 5.0131551320567885e-05, + "loss": 0.0089, + "step": 642630 + }, + { + "epoch": 1.67, + "learning_rate": 5.012766310419642e-05, + "loss": 0.0066, + "step": 642640 + }, + { + "epoch": 1.67, + "learning_rate": 5.0123774887824955e-05, + "loss": 0.0098, + "step": 642650 + }, + { + "epoch": 1.67, + "learning_rate": 5.011988667145349e-05, + "loss": 0.0065, + "step": 642660 + }, + { + "epoch": 1.67, + "learning_rate": 5.0115998455082024e-05, + "loss": 0.0075, + "step": 642670 + }, + { + "epoch": 1.67, + "learning_rate": 5.011211023871056e-05, + "loss": 0.0077, + "step": 642680 + }, + { + "epoch": 1.67, + "learning_rate": 5.01082220223391e-05, + "loss": 0.0071, + "step": 642690 + }, + { + "epoch": 1.67, + "learning_rate": 5.0104333805967636e-05, + "loss": 0.0101, + "step": 642700 + }, + { + "epoch": 1.67, + "learning_rate": 5.010044558959617e-05, + "loss": 0.008, + "step": 642710 + }, + { + "epoch": 1.67, + "learning_rate": 5.0096557373224705e-05, + "loss": 0.0091, + "step": 642720 + }, + { + "epoch": 1.67, + "learning_rate": 5.0092669156853233e-05, + "loss": 0.0062, + "step": 642730 + }, + { + "epoch": 1.67, + "learning_rate": 5.008878094048177e-05, + "loss": 0.0068, + "step": 642740 + }, + { + "epoch": 1.67, + "learning_rate": 5.00848927241103e-05, + "loss": 0.0098, + "step": 642750 + }, + { + "epoch": 1.67, + "learning_rate": 5.008100450773884e-05, + "loss": 0.0067, + "step": 642760 + }, + { + "epoch": 1.67, + "learning_rate": 5.007711629136737e-05, + "loss": 0.0061, + "step": 642770 + }, + { + "epoch": 1.67, + "learning_rate": 5.007322807499591e-05, + "loss": 0.0076, + "step": 642780 + }, + { + "epoch": 1.67, + "learning_rate": 5.006933985862445e-05, + "loss": 0.0069, + "step": 642790 + }, + { + "epoch": 1.67, + "learning_rate": 5.0065451642252984e-05, + "loss": 0.0075, + "step": 642800 + }, + { + "epoch": 1.67, + "learning_rate": 5.006156342588152e-05, + "loss": 0.0077, + "step": 642810 + }, + { + "epoch": 1.67, + "learning_rate": 5.0057675209510054e-05, + "loss": 0.0087, + "step": 642820 + }, + { + "epoch": 1.67, + "learning_rate": 5.005378699313859e-05, + "loss": 0.0063, + "step": 642830 + }, + { + "epoch": 1.67, + "learning_rate": 5.0049898776767124e-05, + "loss": 0.0059, + "step": 642840 + }, + { + "epoch": 1.67, + "learning_rate": 5.004601056039566e-05, + "loss": 0.0103, + "step": 642850 + }, + { + "epoch": 1.67, + "learning_rate": 5.004212234402419e-05, + "loss": 0.0102, + "step": 642860 + }, + { + "epoch": 1.67, + "learning_rate": 5.0038234127652735e-05, + "loss": 0.0089, + "step": 642870 + }, + { + "epoch": 1.67, + "learning_rate": 5.003434591128127e-05, + "loss": 0.0111, + "step": 642880 + }, + { + "epoch": 1.67, + "learning_rate": 5.0030457694909805e-05, + "loss": 0.0094, + "step": 642890 + }, + { + "epoch": 1.67, + "learning_rate": 5.002656947853834e-05, + "loss": 0.0084, + "step": 642900 + }, + { + "epoch": 1.67, + "learning_rate": 5.0022681262166874e-05, + "loss": 0.0088, + "step": 642910 + }, + { + "epoch": 1.67, + "learning_rate": 5.001879304579541e-05, + "loss": 0.0093, + "step": 642920 + }, + { + "epoch": 1.67, + "learning_rate": 5.0014904829423944e-05, + "loss": 0.0057, + "step": 642930 + }, + { + "epoch": 1.67, + "learning_rate": 5.001101661305248e-05, + "loss": 0.0081, + "step": 642940 + }, + { + "epoch": 1.67, + "learning_rate": 5.000712839668102e-05, + "loss": 0.0087, + "step": 642950 + }, + { + "epoch": 1.67, + "learning_rate": 5.0003240180309556e-05, + "loss": 0.0082, + "step": 642960 + }, + { + "epoch": 1.67, + "learning_rate": 4.9999351963938084e-05, + "loss": 0.0099, + "step": 642970 + }, + { + "epoch": 1.67, + "learning_rate": 4.999546374756662e-05, + "loss": 0.0076, + "step": 642980 + }, + { + "epoch": 1.67, + "learning_rate": 4.999157553119515e-05, + "loss": 0.0067, + "step": 642990 + }, + { + "epoch": 1.67, + "learning_rate": 4.998768731482369e-05, + "loss": 0.0089, + "step": 643000 + }, + { + "epoch": 1.67, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.005269117187708616, + "eval_runtime": 107.7748, + "eval_samples_per_second": 18.557, + "eval_steps_per_second": 4.639, + "step": 643000 + }, + { + "epoch": 1.67, + "learning_rate": 4.998379909845222e-05, + "loss": 0.0094, + "step": 643010 + }, + { + "epoch": 1.67, + "learning_rate": 4.997991088208076e-05, + "loss": 0.0074, + "step": 643020 + }, + { + "epoch": 1.67, + "learning_rate": 4.997602266570929e-05, + "loss": 0.0074, + "step": 643030 + }, + { + "epoch": 1.67, + "learning_rate": 4.997213444933783e-05, + "loss": 0.0068, + "step": 643040 + }, + { + "epoch": 1.67, + "learning_rate": 4.996824623296637e-05, + "loss": 0.0079, + "step": 643050 + }, + { + "epoch": 1.67, + "learning_rate": 4.9964358016594904e-05, + "loss": 0.0081, + "step": 643060 + }, + { + "epoch": 1.67, + "learning_rate": 4.996046980022344e-05, + "loss": 0.0068, + "step": 643070 + }, + { + "epoch": 1.67, + "learning_rate": 4.9956581583851974e-05, + "loss": 0.0061, + "step": 643080 + }, + { + "epoch": 1.67, + "learning_rate": 4.995269336748051e-05, + "loss": 0.0071, + "step": 643090 + }, + { + "epoch": 1.67, + "learning_rate": 4.9948805151109044e-05, + "loss": 0.0065, + "step": 643100 + }, + { + "epoch": 1.67, + "learning_rate": 4.994491693473758e-05, + "loss": 0.0091, + "step": 643110 + }, + { + "epoch": 1.67, + "learning_rate": 4.994102871836611e-05, + "loss": 0.0063, + "step": 643120 + }, + { + "epoch": 1.67, + "learning_rate": 4.9937140501994655e-05, + "loss": 0.007, + "step": 643130 + }, + { + "epoch": 1.67, + "learning_rate": 4.993325228562319e-05, + "loss": 0.0081, + "step": 643140 + }, + { + "epoch": 1.67, + "learning_rate": 4.9929364069251725e-05, + "loss": 0.0089, + "step": 643150 + }, + { + "epoch": 1.67, + "learning_rate": 4.992547585288026e-05, + "loss": 0.0076, + "step": 643160 + }, + { + "epoch": 1.67, + "learning_rate": 4.9921587636508794e-05, + "loss": 0.0091, + "step": 643170 + }, + { + "epoch": 1.67, + "learning_rate": 4.991769942013733e-05, + "loss": 0.008, + "step": 643180 + }, + { + "epoch": 1.67, + "learning_rate": 4.9913811203765864e-05, + "loss": 0.0102, + "step": 643190 + }, + { + "epoch": 1.67, + "learning_rate": 4.99099229873944e-05, + "loss": 0.0088, + "step": 643200 + }, + { + "epoch": 1.67, + "learning_rate": 4.990603477102294e-05, + "loss": 0.0099, + "step": 643210 + }, + { + "epoch": 1.67, + "learning_rate": 4.990214655465146e-05, + "loss": 0.0084, + "step": 643220 + }, + { + "epoch": 1.67, + "learning_rate": 4.9898258338280004e-05, + "loss": 0.0096, + "step": 643230 + }, + { + "epoch": 1.67, + "learning_rate": 4.989437012190854e-05, + "loss": 0.008, + "step": 643240 + }, + { + "epoch": 1.67, + "learning_rate": 4.989048190553707e-05, + "loss": 0.007, + "step": 643250 + }, + { + "epoch": 1.67, + "learning_rate": 4.988659368916561e-05, + "loss": 0.0081, + "step": 643260 + }, + { + "epoch": 1.67, + "learning_rate": 4.988270547279414e-05, + "loss": 0.0076, + "step": 643270 + }, + { + "epoch": 1.67, + "learning_rate": 4.987881725642268e-05, + "loss": 0.0072, + "step": 643280 + }, + { + "epoch": 1.67, + "learning_rate": 4.987492904005121e-05, + "loss": 0.0091, + "step": 643290 + }, + { + "epoch": 1.67, + "learning_rate": 4.987104082367975e-05, + "loss": 0.0083, + "step": 643300 + }, + { + "epoch": 1.67, + "learning_rate": 4.986715260730829e-05, + "loss": 0.0062, + "step": 643310 + }, + { + "epoch": 1.67, + "learning_rate": 4.9863264390936824e-05, + "loss": 0.0097, + "step": 643320 + }, + { + "epoch": 1.67, + "learning_rate": 4.985937617456536e-05, + "loss": 0.0065, + "step": 643330 + }, + { + "epoch": 1.67, + "learning_rate": 4.9855487958193894e-05, + "loss": 0.0084, + "step": 643340 + }, + { + "epoch": 1.67, + "learning_rate": 4.985159974182243e-05, + "loss": 0.0134, + "step": 643350 + }, + { + "epoch": 1.67, + "learning_rate": 4.9847711525450964e-05, + "loss": 0.0078, + "step": 643360 + }, + { + "epoch": 1.67, + "learning_rate": 4.98438233090795e-05, + "loss": 0.0089, + "step": 643370 + }, + { + "epoch": 1.67, + "learning_rate": 4.983993509270803e-05, + "loss": 0.0065, + "step": 643380 + }, + { + "epoch": 1.67, + "learning_rate": 4.9836046876336575e-05, + "loss": 0.0093, + "step": 643390 + }, + { + "epoch": 1.67, + "learning_rate": 4.983215865996511e-05, + "loss": 0.0088, + "step": 643400 + }, + { + "epoch": 1.67, + "learning_rate": 4.9828270443593645e-05, + "loss": 0.007, + "step": 643410 + }, + { + "epoch": 1.67, + "learning_rate": 4.982438222722218e-05, + "loss": 0.0082, + "step": 643420 + }, + { + "epoch": 1.67, + "learning_rate": 4.9820494010850714e-05, + "loss": 0.0096, + "step": 643430 + }, + { + "epoch": 1.67, + "learning_rate": 4.981660579447925e-05, + "loss": 0.0069, + "step": 643440 + }, + { + "epoch": 1.67, + "learning_rate": 4.9812717578107784e-05, + "loss": 0.0121, + "step": 643450 + }, + { + "epoch": 1.67, + "learning_rate": 4.980882936173632e-05, + "loss": 0.007, + "step": 643460 + }, + { + "epoch": 1.67, + "learning_rate": 4.980494114536485e-05, + "loss": 0.0076, + "step": 643470 + }, + { + "epoch": 1.67, + "learning_rate": 4.980105292899338e-05, + "loss": 0.0138, + "step": 643480 + }, + { + "epoch": 1.67, + "learning_rate": 4.9797164712621924e-05, + "loss": 0.0055, + "step": 643490 + }, + { + "epoch": 1.67, + "learning_rate": 4.979327649625046e-05, + "loss": 0.0076, + "step": 643500 + }, + { + "epoch": 1.67, + "learning_rate": 4.978938827987899e-05, + "loss": 0.0081, + "step": 643510 + }, + { + "epoch": 1.67, + "learning_rate": 4.978550006350753e-05, + "loss": 0.0076, + "step": 643520 + }, + { + "epoch": 1.67, + "learning_rate": 4.978161184713606e-05, + "loss": 0.0095, + "step": 643530 + }, + { + "epoch": 1.67, + "learning_rate": 4.97777236307646e-05, + "loss": 0.0078, + "step": 643540 + }, + { + "epoch": 1.67, + "learning_rate": 4.977383541439313e-05, + "loss": 0.0088, + "step": 643550 + }, + { + "epoch": 1.67, + "learning_rate": 4.976994719802167e-05, + "loss": 0.0108, + "step": 643560 + }, + { + "epoch": 1.67, + "learning_rate": 4.976605898165021e-05, + "loss": 0.0098, + "step": 643570 + }, + { + "epoch": 1.67, + "learning_rate": 4.9762170765278744e-05, + "loss": 0.0069, + "step": 643580 + }, + { + "epoch": 1.67, + "learning_rate": 4.975828254890728e-05, + "loss": 0.0063, + "step": 643590 + }, + { + "epoch": 1.67, + "learning_rate": 4.9754394332535814e-05, + "loss": 0.0109, + "step": 643600 + }, + { + "epoch": 1.67, + "learning_rate": 4.975050611616435e-05, + "loss": 0.0052, + "step": 643610 + }, + { + "epoch": 1.67, + "learning_rate": 4.9746617899792884e-05, + "loss": 0.0084, + "step": 643620 + }, + { + "epoch": 1.67, + "learning_rate": 4.974272968342142e-05, + "loss": 0.0074, + "step": 643630 + }, + { + "epoch": 1.67, + "learning_rate": 4.973884146704995e-05, + "loss": 0.0073, + "step": 643640 + }, + { + "epoch": 1.67, + "learning_rate": 4.973495325067849e-05, + "loss": 0.0069, + "step": 643650 + }, + { + "epoch": 1.67, + "learning_rate": 4.973106503430703e-05, + "loss": 0.0096, + "step": 643660 + }, + { + "epoch": 1.67, + "learning_rate": 4.9727176817935565e-05, + "loss": 0.0077, + "step": 643670 + }, + { + "epoch": 1.67, + "learning_rate": 4.97232886015641e-05, + "loss": 0.0096, + "step": 643680 + }, + { + "epoch": 1.67, + "learning_rate": 4.9719400385192634e-05, + "loss": 0.0076, + "step": 643690 + }, + { + "epoch": 1.67, + "learning_rate": 4.971551216882117e-05, + "loss": 0.0085, + "step": 643700 + }, + { + "epoch": 1.67, + "learning_rate": 4.9711623952449704e-05, + "loss": 0.0104, + "step": 643710 + }, + { + "epoch": 1.67, + "learning_rate": 4.970773573607823e-05, + "loss": 0.0094, + "step": 643720 + }, + { + "epoch": 1.67, + "learning_rate": 4.970384751970677e-05, + "loss": 0.0073, + "step": 643730 + }, + { + "epoch": 1.67, + "learning_rate": 4.96999593033353e-05, + "loss": 0.0062, + "step": 643740 + }, + { + "epoch": 1.67, + "learning_rate": 4.969607108696384e-05, + "loss": 0.0097, + "step": 643750 + }, + { + "epoch": 1.67, + "learning_rate": 4.969218287059238e-05, + "loss": 0.0074, + "step": 643760 + }, + { + "epoch": 1.67, + "learning_rate": 4.968829465422091e-05, + "loss": 0.0089, + "step": 643770 + }, + { + "epoch": 1.67, + "learning_rate": 4.968440643784945e-05, + "loss": 0.0062, + "step": 643780 + }, + { + "epoch": 1.67, + "learning_rate": 4.968051822147798e-05, + "loss": 0.009, + "step": 643790 + }, + { + "epoch": 1.67, + "learning_rate": 4.967663000510652e-05, + "loss": 0.0099, + "step": 643800 + }, + { + "epoch": 1.67, + "learning_rate": 4.967274178873505e-05, + "loss": 0.008, + "step": 643810 + }, + { + "epoch": 1.67, + "learning_rate": 4.966885357236359e-05, + "loss": 0.0062, + "step": 643820 + }, + { + "epoch": 1.67, + "learning_rate": 4.966496535599212e-05, + "loss": 0.0079, + "step": 643830 + }, + { + "epoch": 1.67, + "learning_rate": 4.9661077139620664e-05, + "loss": 0.0076, + "step": 643840 + }, + { + "epoch": 1.67, + "learning_rate": 4.96571889232492e-05, + "loss": 0.0086, + "step": 643850 + }, + { + "epoch": 1.67, + "learning_rate": 4.9653300706877734e-05, + "loss": 0.0073, + "step": 643860 + }, + { + "epoch": 1.67, + "learning_rate": 4.964941249050627e-05, + "loss": 0.0073, + "step": 643870 + }, + { + "epoch": 1.67, + "learning_rate": 4.9645524274134803e-05, + "loss": 0.0073, + "step": 643880 + }, + { + "epoch": 1.67, + "learning_rate": 4.964163605776334e-05, + "loss": 0.0076, + "step": 643890 + }, + { + "epoch": 1.67, + "learning_rate": 4.963774784139187e-05, + "loss": 0.0059, + "step": 643900 + }, + { + "epoch": 1.67, + "learning_rate": 4.963385962502041e-05, + "loss": 0.008, + "step": 643910 + }, + { + "epoch": 1.67, + "learning_rate": 4.962997140864895e-05, + "loss": 0.0107, + "step": 643920 + }, + { + "epoch": 1.67, + "learning_rate": 4.9626083192277485e-05, + "loss": 0.0067, + "step": 643930 + }, + { + "epoch": 1.67, + "learning_rate": 4.962219497590602e-05, + "loss": 0.0072, + "step": 643940 + }, + { + "epoch": 1.67, + "learning_rate": 4.9618306759534554e-05, + "loss": 0.0092, + "step": 643950 + }, + { + "epoch": 1.67, + "learning_rate": 4.961441854316309e-05, + "loss": 0.0069, + "step": 643960 + }, + { + "epoch": 1.67, + "learning_rate": 4.961053032679162e-05, + "loss": 0.008, + "step": 643970 + }, + { + "epoch": 1.67, + "learning_rate": 4.960664211042015e-05, + "loss": 0.0088, + "step": 643980 + }, + { + "epoch": 1.67, + "learning_rate": 4.960275389404869e-05, + "loss": 0.0077, + "step": 643990 + }, + { + "epoch": 1.67, + "learning_rate": 4.959886567767722e-05, + "loss": 0.0075, + "step": 644000 + }, + { + "epoch": 1.67, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.005179722793400288, + "eval_runtime": 107.801, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 644000 + }, + { + "epoch": 1.67, + "learning_rate": 4.959497746130576e-05, + "loss": 0.0078, + "step": 644010 + }, + { + "epoch": 1.67, + "learning_rate": 4.95910892449343e-05, + "loss": 0.0082, + "step": 644020 + }, + { + "epoch": 1.67, + "learning_rate": 4.958720102856283e-05, + "loss": 0.0074, + "step": 644030 + }, + { + "epoch": 1.67, + "learning_rate": 4.958331281219137e-05, + "loss": 0.0083, + "step": 644040 + }, + { + "epoch": 1.67, + "learning_rate": 4.95794245958199e-05, + "loss": 0.0081, + "step": 644050 + }, + { + "epoch": 1.67, + "learning_rate": 4.957553637944844e-05, + "loss": 0.0077, + "step": 644060 + }, + { + "epoch": 1.67, + "learning_rate": 4.957164816307697e-05, + "loss": 0.0063, + "step": 644070 + }, + { + "epoch": 1.67, + "learning_rate": 4.956775994670551e-05, + "loss": 0.0093, + "step": 644080 + }, + { + "epoch": 1.67, + "learning_rate": 4.956387173033404e-05, + "loss": 0.0118, + "step": 644090 + }, + { + "epoch": 1.67, + "learning_rate": 4.9559983513962584e-05, + "loss": 0.008, + "step": 644100 + }, + { + "epoch": 1.67, + "learning_rate": 4.955609529759112e-05, + "loss": 0.0088, + "step": 644110 + }, + { + "epoch": 1.67, + "learning_rate": 4.9552207081219654e-05, + "loss": 0.0103, + "step": 644120 + }, + { + "epoch": 1.67, + "learning_rate": 4.954831886484819e-05, + "loss": 0.0083, + "step": 644130 + }, + { + "epoch": 1.67, + "learning_rate": 4.9544430648476723e-05, + "loss": 0.0086, + "step": 644140 + }, + { + "epoch": 1.67, + "learning_rate": 4.954054243210526e-05, + "loss": 0.0134, + "step": 644150 + }, + { + "epoch": 1.67, + "learning_rate": 4.953665421573379e-05, + "loss": 0.0079, + "step": 644160 + }, + { + "epoch": 1.67, + "learning_rate": 4.953276599936233e-05, + "loss": 0.0072, + "step": 644170 + }, + { + "epoch": 1.67, + "learning_rate": 4.952887778299087e-05, + "loss": 0.011, + "step": 644180 + }, + { + "epoch": 1.67, + "learning_rate": 4.9524989566619405e-05, + "loss": 0.0056, + "step": 644190 + }, + { + "epoch": 1.67, + "learning_rate": 4.952110135024794e-05, + "loss": 0.0078, + "step": 644200 + }, + { + "epoch": 1.67, + "learning_rate": 4.951721313387647e-05, + "loss": 0.0088, + "step": 644210 + }, + { + "epoch": 1.67, + "learning_rate": 4.9513324917505e-05, + "loss": 0.0066, + "step": 644220 + }, + { + "epoch": 1.67, + "learning_rate": 4.950943670113354e-05, + "loss": 0.0073, + "step": 644230 + }, + { + "epoch": 1.67, + "learning_rate": 4.950554848476207e-05, + "loss": 0.0098, + "step": 644240 + }, + { + "epoch": 1.67, + "learning_rate": 4.950166026839061e-05, + "loss": 0.0113, + "step": 644250 + }, + { + "epoch": 1.67, + "learning_rate": 4.949777205201914e-05, + "loss": 0.0104, + "step": 644260 + }, + { + "epoch": 1.67, + "learning_rate": 4.949388383564768e-05, + "loss": 0.0078, + "step": 644270 + }, + { + "epoch": 1.67, + "learning_rate": 4.948999561927622e-05, + "loss": 0.0079, + "step": 644280 + }, + { + "epoch": 1.67, + "learning_rate": 4.948610740290475e-05, + "loss": 0.0087, + "step": 644290 + }, + { + "epoch": 1.67, + "learning_rate": 4.948221918653329e-05, + "loss": 0.0085, + "step": 644300 + }, + { + "epoch": 1.67, + "learning_rate": 4.947833097016182e-05, + "loss": 0.007, + "step": 644310 + }, + { + "epoch": 1.67, + "learning_rate": 4.947444275379036e-05, + "loss": 0.0067, + "step": 644320 + }, + { + "epoch": 1.67, + "learning_rate": 4.947055453741889e-05, + "loss": 0.01, + "step": 644330 + }, + { + "epoch": 1.67, + "learning_rate": 4.946666632104743e-05, + "loss": 0.0076, + "step": 644340 + }, + { + "epoch": 1.67, + "learning_rate": 4.946277810467596e-05, + "loss": 0.0081, + "step": 644350 + }, + { + "epoch": 1.67, + "learning_rate": 4.9458889888304504e-05, + "loss": 0.0101, + "step": 644360 + }, + { + "epoch": 1.67, + "learning_rate": 4.945500167193304e-05, + "loss": 0.0096, + "step": 644370 + }, + { + "epoch": 1.67, + "learning_rate": 4.9451113455561574e-05, + "loss": 0.0083, + "step": 644380 + }, + { + "epoch": 1.67, + "learning_rate": 4.944722523919011e-05, + "loss": 0.0078, + "step": 644390 + }, + { + "epoch": 1.67, + "learning_rate": 4.944333702281864e-05, + "loss": 0.0079, + "step": 644400 + }, + { + "epoch": 1.67, + "learning_rate": 4.943944880644718e-05, + "loss": 0.0077, + "step": 644410 + }, + { + "epoch": 1.67, + "learning_rate": 4.943556059007571e-05, + "loss": 0.0061, + "step": 644420 + }, + { + "epoch": 1.67, + "learning_rate": 4.943167237370425e-05, + "loss": 0.009, + "step": 644430 + }, + { + "epoch": 1.67, + "learning_rate": 4.942778415733279e-05, + "loss": 0.0077, + "step": 644440 + }, + { + "epoch": 1.67, + "learning_rate": 4.9423895940961324e-05, + "loss": 0.0075, + "step": 644450 + }, + { + "epoch": 1.67, + "learning_rate": 4.942000772458985e-05, + "loss": 0.0102, + "step": 644460 + }, + { + "epoch": 1.67, + "learning_rate": 4.941611950821839e-05, + "loss": 0.0058, + "step": 644470 + }, + { + "epoch": 1.67, + "learning_rate": 4.941223129184692e-05, + "loss": 0.0084, + "step": 644480 + }, + { + "epoch": 1.67, + "learning_rate": 4.940834307547546e-05, + "loss": 0.0079, + "step": 644490 + }, + { + "epoch": 1.67, + "learning_rate": 4.940445485910399e-05, + "loss": 0.0115, + "step": 644500 + }, + { + "epoch": 1.67, + "learning_rate": 4.940056664273253e-05, + "loss": 0.0077, + "step": 644510 + }, + { + "epoch": 1.67, + "learning_rate": 4.939667842636106e-05, + "loss": 0.0117, + "step": 644520 + }, + { + "epoch": 1.67, + "learning_rate": 4.9392790209989597e-05, + "loss": 0.0054, + "step": 644530 + }, + { + "epoch": 1.67, + "learning_rate": 4.938890199361814e-05, + "loss": 0.0057, + "step": 644540 + }, + { + "epoch": 1.67, + "learning_rate": 4.938501377724667e-05, + "loss": 0.0082, + "step": 644550 + }, + { + "epoch": 1.67, + "learning_rate": 4.938112556087521e-05, + "loss": 0.0073, + "step": 644560 + }, + { + "epoch": 1.67, + "learning_rate": 4.937723734450374e-05, + "loss": 0.01, + "step": 644570 + }, + { + "epoch": 1.67, + "learning_rate": 4.937334912813228e-05, + "loss": 0.0062, + "step": 644580 + }, + { + "epoch": 1.67, + "learning_rate": 4.936946091176081e-05, + "loss": 0.0058, + "step": 644590 + }, + { + "epoch": 1.67, + "learning_rate": 4.936557269538935e-05, + "loss": 0.0084, + "step": 644600 + }, + { + "epoch": 1.67, + "learning_rate": 4.936168447901788e-05, + "loss": 0.0102, + "step": 644610 + }, + { + "epoch": 1.67, + "learning_rate": 4.9357796262646424e-05, + "loss": 0.0082, + "step": 644620 + }, + { + "epoch": 1.67, + "learning_rate": 4.935390804627496e-05, + "loss": 0.0095, + "step": 644630 + }, + { + "epoch": 1.67, + "learning_rate": 4.9350019829903494e-05, + "loss": 0.0077, + "step": 644640 + }, + { + "epoch": 1.67, + "learning_rate": 4.934613161353203e-05, + "loss": 0.0095, + "step": 644650 + }, + { + "epoch": 1.67, + "learning_rate": 4.934224339716056e-05, + "loss": 0.0078, + "step": 644660 + }, + { + "epoch": 1.67, + "learning_rate": 4.93383551807891e-05, + "loss": 0.007, + "step": 644670 + }, + { + "epoch": 1.67, + "learning_rate": 4.933446696441763e-05, + "loss": 0.0079, + "step": 644680 + }, + { + "epoch": 1.67, + "learning_rate": 4.933057874804617e-05, + "loss": 0.0102, + "step": 644690 + }, + { + "epoch": 1.67, + "learning_rate": 4.932669053167471e-05, + "loss": 0.0082, + "step": 644700 + }, + { + "epoch": 1.67, + "learning_rate": 4.932280231530323e-05, + "loss": 0.007, + "step": 644710 + }, + { + "epoch": 1.67, + "learning_rate": 4.931891409893177e-05, + "loss": 0.0103, + "step": 644720 + }, + { + "epoch": 1.67, + "learning_rate": 4.931502588256031e-05, + "loss": 0.0093, + "step": 644730 + }, + { + "epoch": 1.67, + "learning_rate": 4.931113766618884e-05, + "loss": 0.0077, + "step": 644740 + }, + { + "epoch": 1.67, + "learning_rate": 4.930724944981738e-05, + "loss": 0.0067, + "step": 644750 + }, + { + "epoch": 1.67, + "learning_rate": 4.930336123344591e-05, + "loss": 0.0113, + "step": 644760 + }, + { + "epoch": 1.67, + "learning_rate": 4.929947301707445e-05, + "loss": 0.0062, + "step": 644770 + }, + { + "epoch": 1.67, + "learning_rate": 4.929558480070298e-05, + "loss": 0.0081, + "step": 644780 + }, + { + "epoch": 1.67, + "learning_rate": 4.9291696584331517e-05, + "loss": 0.0166, + "step": 644790 + }, + { + "epoch": 1.67, + "learning_rate": 4.928780836796006e-05, + "loss": 0.0076, + "step": 644800 + }, + { + "epoch": 1.67, + "learning_rate": 4.928392015158859e-05, + "loss": 0.0115, + "step": 644810 + }, + { + "epoch": 1.67, + "learning_rate": 4.928003193521713e-05, + "loss": 0.0126, + "step": 644820 + }, + { + "epoch": 1.67, + "learning_rate": 4.927614371884566e-05, + "loss": 0.008, + "step": 644830 + }, + { + "epoch": 1.67, + "learning_rate": 4.92722555024742e-05, + "loss": 0.0057, + "step": 644840 + }, + { + "epoch": 1.67, + "learning_rate": 4.926836728610273e-05, + "loss": 0.0086, + "step": 644850 + }, + { + "epoch": 1.67, + "learning_rate": 4.926447906973127e-05, + "loss": 0.0077, + "step": 644860 + }, + { + "epoch": 1.67, + "learning_rate": 4.92605908533598e-05, + "loss": 0.0099, + "step": 644870 + }, + { + "epoch": 1.67, + "learning_rate": 4.9256702636988344e-05, + "loss": 0.0087, + "step": 644880 + }, + { + "epoch": 1.67, + "learning_rate": 4.925281442061688e-05, + "loss": 0.0075, + "step": 644890 + }, + { + "epoch": 1.67, + "learning_rate": 4.9248926204245414e-05, + "loss": 0.0089, + "step": 644900 + }, + { + "epoch": 1.67, + "learning_rate": 4.924503798787395e-05, + "loss": 0.0074, + "step": 644910 + }, + { + "epoch": 1.67, + "learning_rate": 4.924114977150248e-05, + "loss": 0.0161, + "step": 644920 + }, + { + "epoch": 1.67, + "learning_rate": 4.923726155513102e-05, + "loss": 0.0085, + "step": 644930 + }, + { + "epoch": 1.67, + "learning_rate": 4.923337333875955e-05, + "loss": 0.0082, + "step": 644940 + }, + { + "epoch": 1.67, + "learning_rate": 4.922948512238809e-05, + "loss": 0.0105, + "step": 644950 + }, + { + "epoch": 1.67, + "learning_rate": 4.9225596906016616e-05, + "loss": 0.0071, + "step": 644960 + }, + { + "epoch": 1.67, + "learning_rate": 4.922170868964515e-05, + "loss": 0.006, + "step": 644970 + }, + { + "epoch": 1.67, + "learning_rate": 4.921782047327369e-05, + "loss": 0.0082, + "step": 644980 + }, + { + "epoch": 1.67, + "learning_rate": 4.921393225690223e-05, + "loss": 0.0102, + "step": 644990 + }, + { + "epoch": 1.67, + "learning_rate": 4.921004404053076e-05, + "loss": 0.0078, + "step": 645000 + }, + { + "epoch": 1.67, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.0051052626222372055, + "eval_runtime": 107.7487, + "eval_samples_per_second": 18.562, + "eval_steps_per_second": 4.64, + "step": 645000 + }, + { + "epoch": 1.67, + "learning_rate": 4.92061558241593e-05, + "loss": 0.0079, + "step": 645010 + }, + { + "epoch": 1.67, + "learning_rate": 4.920226760778783e-05, + "loss": 0.0077, + "step": 645020 + }, + { + "epoch": 1.67, + "learning_rate": 4.919837939141637e-05, + "loss": 0.0115, + "step": 645030 + }, + { + "epoch": 1.67, + "learning_rate": 4.91944911750449e-05, + "loss": 0.0078, + "step": 645040 + }, + { + "epoch": 1.67, + "learning_rate": 4.9190602958673436e-05, + "loss": 0.0093, + "step": 645050 + }, + { + "epoch": 1.67, + "learning_rate": 4.918671474230198e-05, + "loss": 0.0077, + "step": 645060 + }, + { + "epoch": 1.67, + "learning_rate": 4.918282652593051e-05, + "loss": 0.0088, + "step": 645070 + }, + { + "epoch": 1.67, + "learning_rate": 4.917893830955905e-05, + "loss": 0.0091, + "step": 645080 + }, + { + "epoch": 1.67, + "learning_rate": 4.917505009318758e-05, + "loss": 0.0081, + "step": 645090 + }, + { + "epoch": 1.67, + "learning_rate": 4.917116187681612e-05, + "loss": 0.0059, + "step": 645100 + }, + { + "epoch": 1.67, + "learning_rate": 4.916727366044465e-05, + "loss": 0.0067, + "step": 645110 + }, + { + "epoch": 1.67, + "learning_rate": 4.916338544407319e-05, + "loss": 0.0077, + "step": 645120 + }, + { + "epoch": 1.67, + "learning_rate": 4.915949722770172e-05, + "loss": 0.0088, + "step": 645130 + }, + { + "epoch": 1.67, + "learning_rate": 4.915560901133026e-05, + "loss": 0.0095, + "step": 645140 + }, + { + "epoch": 1.67, + "learning_rate": 4.91517207949588e-05, + "loss": 0.0082, + "step": 645150 + }, + { + "epoch": 1.67, + "learning_rate": 4.9147832578587334e-05, + "loss": 0.0071, + "step": 645160 + }, + { + "epoch": 1.67, + "learning_rate": 4.914394436221587e-05, + "loss": 0.0083, + "step": 645170 + }, + { + "epoch": 1.67, + "learning_rate": 4.91400561458444e-05, + "loss": 0.0095, + "step": 645180 + }, + { + "epoch": 1.67, + "learning_rate": 4.913616792947294e-05, + "loss": 0.0072, + "step": 645190 + }, + { + "epoch": 1.67, + "learning_rate": 4.913227971310147e-05, + "loss": 0.0095, + "step": 645200 + }, + { + "epoch": 1.67, + "learning_rate": 4.912839149673e-05, + "loss": 0.0074, + "step": 645210 + }, + { + "epoch": 1.67, + "learning_rate": 4.9124503280358536e-05, + "loss": 0.0066, + "step": 645220 + }, + { + "epoch": 1.67, + "learning_rate": 4.912061506398707e-05, + "loss": 0.0083, + "step": 645230 + }, + { + "epoch": 1.67, + "learning_rate": 4.9116726847615606e-05, + "loss": 0.0066, + "step": 645240 + }, + { + "epoch": 1.67, + "learning_rate": 4.911283863124415e-05, + "loss": 0.0093, + "step": 645250 + }, + { + "epoch": 1.67, + "learning_rate": 4.910895041487268e-05, + "loss": 0.0089, + "step": 645260 + }, + { + "epoch": 1.67, + "learning_rate": 4.910506219850122e-05, + "loss": 0.0092, + "step": 645270 + }, + { + "epoch": 1.67, + "learning_rate": 4.910117398212975e-05, + "loss": 0.0069, + "step": 645280 + }, + { + "epoch": 1.67, + "learning_rate": 4.909728576575829e-05, + "loss": 0.006, + "step": 645290 + }, + { + "epoch": 1.67, + "learning_rate": 4.909339754938682e-05, + "loss": 0.0116, + "step": 645300 + }, + { + "epoch": 1.67, + "learning_rate": 4.9089509333015356e-05, + "loss": 0.0071, + "step": 645310 + }, + { + "epoch": 1.67, + "learning_rate": 4.908562111664389e-05, + "loss": 0.0073, + "step": 645320 + }, + { + "epoch": 1.67, + "learning_rate": 4.908173290027243e-05, + "loss": 0.0071, + "step": 645330 + }, + { + "epoch": 1.67, + "learning_rate": 4.907784468390097e-05, + "loss": 0.0105, + "step": 645340 + }, + { + "epoch": 1.67, + "learning_rate": 4.90739564675295e-05, + "loss": 0.0085, + "step": 645350 + }, + { + "epoch": 1.67, + "learning_rate": 4.907006825115804e-05, + "loss": 0.0121, + "step": 645360 + }, + { + "epoch": 1.67, + "learning_rate": 4.906618003478657e-05, + "loss": 0.0091, + "step": 645370 + }, + { + "epoch": 1.67, + "learning_rate": 4.906229181841511e-05, + "loss": 0.0113, + "step": 645380 + }, + { + "epoch": 1.67, + "learning_rate": 4.905840360204364e-05, + "loss": 0.005, + "step": 645390 + }, + { + "epoch": 1.67, + "learning_rate": 4.905451538567218e-05, + "loss": 0.0053, + "step": 645400 + }, + { + "epoch": 1.67, + "learning_rate": 4.905062716930072e-05, + "loss": 0.0073, + "step": 645410 + }, + { + "epoch": 1.67, + "learning_rate": 4.9046738952929253e-05, + "loss": 0.0077, + "step": 645420 + }, + { + "epoch": 1.67, + "learning_rate": 4.904285073655779e-05, + "loss": 0.0098, + "step": 645430 + }, + { + "epoch": 1.67, + "learning_rate": 4.903896252018632e-05, + "loss": 0.0079, + "step": 645440 + }, + { + "epoch": 1.67, + "learning_rate": 4.903507430381485e-05, + "loss": 0.0073, + "step": 645450 + }, + { + "epoch": 1.67, + "learning_rate": 4.9031186087443386e-05, + "loss": 0.011, + "step": 645460 + }, + { + "epoch": 1.67, + "learning_rate": 4.902729787107192e-05, + "loss": 0.0096, + "step": 645470 + }, + { + "epoch": 1.67, + "learning_rate": 4.9023409654700456e-05, + "loss": 0.0093, + "step": 645480 + }, + { + "epoch": 1.67, + "learning_rate": 4.901952143832899e-05, + "loss": 0.0094, + "step": 645490 + }, + { + "epoch": 1.67, + "learning_rate": 4.9015633221957526e-05, + "loss": 0.0066, + "step": 645500 + }, + { + "epoch": 1.67, + "learning_rate": 4.901174500558607e-05, + "loss": 0.0096, + "step": 645510 + }, + { + "epoch": 1.67, + "learning_rate": 4.90078567892146e-05, + "loss": 0.0108, + "step": 645520 + }, + { + "epoch": 1.67, + "learning_rate": 4.900396857284314e-05, + "loss": 0.0064, + "step": 645530 + }, + { + "epoch": 1.67, + "learning_rate": 4.900008035647167e-05, + "loss": 0.008, + "step": 645540 + }, + { + "epoch": 1.67, + "learning_rate": 4.899619214010021e-05, + "loss": 0.0066, + "step": 645550 + }, + { + "epoch": 1.67, + "learning_rate": 4.899230392372874e-05, + "loss": 0.0106, + "step": 645560 + }, + { + "epoch": 1.67, + "learning_rate": 4.8988415707357276e-05, + "loss": 0.0079, + "step": 645570 + }, + { + "epoch": 1.67, + "learning_rate": 4.898452749098581e-05, + "loss": 0.0137, + "step": 645580 + }, + { + "epoch": 1.67, + "learning_rate": 4.898063927461435e-05, + "loss": 0.0101, + "step": 645590 + }, + { + "epoch": 1.67, + "learning_rate": 4.897675105824289e-05, + "loss": 0.0089, + "step": 645600 + }, + { + "epoch": 1.67, + "learning_rate": 4.897286284187142e-05, + "loss": 0.0107, + "step": 645610 + }, + { + "epoch": 1.67, + "learning_rate": 4.896897462549996e-05, + "loss": 0.0096, + "step": 645620 + }, + { + "epoch": 1.67, + "learning_rate": 4.896508640912849e-05, + "loss": 0.0106, + "step": 645630 + }, + { + "epoch": 1.67, + "learning_rate": 4.896119819275703e-05, + "loss": 0.0104, + "step": 645640 + }, + { + "epoch": 1.67, + "learning_rate": 4.895730997638556e-05, + "loss": 0.007, + "step": 645650 + }, + { + "epoch": 1.67, + "learning_rate": 4.89534217600141e-05, + "loss": 0.008, + "step": 645660 + }, + { + "epoch": 1.67, + "learning_rate": 4.894953354364264e-05, + "loss": 0.0065, + "step": 645670 + }, + { + "epoch": 1.67, + "learning_rate": 4.8945645327271173e-05, + "loss": 0.0074, + "step": 645680 + }, + { + "epoch": 1.67, + "learning_rate": 4.894175711089971e-05, + "loss": 0.0074, + "step": 645690 + }, + { + "epoch": 1.67, + "learning_rate": 4.8937868894528236e-05, + "loss": 0.0103, + "step": 645700 + }, + { + "epoch": 1.67, + "learning_rate": 4.893398067815677e-05, + "loss": 0.0105, + "step": 645710 + }, + { + "epoch": 1.67, + "learning_rate": 4.8930092461785306e-05, + "loss": 0.0081, + "step": 645720 + }, + { + "epoch": 1.67, + "learning_rate": 4.892620424541384e-05, + "loss": 0.0086, + "step": 645730 + }, + { + "epoch": 1.67, + "learning_rate": 4.8922316029042376e-05, + "loss": 0.0065, + "step": 645740 + }, + { + "epoch": 1.67, + "learning_rate": 4.891842781267091e-05, + "loss": 0.0073, + "step": 645750 + }, + { + "epoch": 1.67, + "learning_rate": 4.8914539596299446e-05, + "loss": 0.0071, + "step": 645760 + }, + { + "epoch": 1.67, + "learning_rate": 4.891065137992799e-05, + "loss": 0.008, + "step": 645770 + }, + { + "epoch": 1.67, + "learning_rate": 4.890676316355652e-05, + "loss": 0.0079, + "step": 645780 + }, + { + "epoch": 1.67, + "learning_rate": 4.890287494718506e-05, + "loss": 0.0071, + "step": 645790 + }, + { + "epoch": 1.67, + "learning_rate": 4.889898673081359e-05, + "loss": 0.0069, + "step": 645800 + }, + { + "epoch": 1.67, + "learning_rate": 4.8895098514442127e-05, + "loss": 0.0073, + "step": 645810 + }, + { + "epoch": 1.67, + "learning_rate": 4.889121029807066e-05, + "loss": 0.0092, + "step": 645820 + }, + { + "epoch": 1.67, + "learning_rate": 4.8887322081699196e-05, + "loss": 0.0088, + "step": 645830 + }, + { + "epoch": 1.67, + "learning_rate": 4.888343386532773e-05, + "loss": 0.0066, + "step": 645840 + }, + { + "epoch": 1.67, + "learning_rate": 4.887954564895627e-05, + "loss": 0.008, + "step": 645850 + }, + { + "epoch": 1.67, + "learning_rate": 4.887565743258481e-05, + "loss": 0.0072, + "step": 645860 + }, + { + "epoch": 1.67, + "learning_rate": 4.887176921621334e-05, + "loss": 0.0087, + "step": 645870 + }, + { + "epoch": 1.67, + "learning_rate": 4.886788099984188e-05, + "loss": 0.0065, + "step": 645880 + }, + { + "epoch": 1.67, + "learning_rate": 4.886399278347041e-05, + "loss": 0.0088, + "step": 645890 + }, + { + "epoch": 1.67, + "learning_rate": 4.886010456709895e-05, + "loss": 0.0083, + "step": 645900 + }, + { + "epoch": 1.67, + "learning_rate": 4.885621635072748e-05, + "loss": 0.0084, + "step": 645910 + }, + { + "epoch": 1.67, + "learning_rate": 4.885232813435602e-05, + "loss": 0.0076, + "step": 645920 + }, + { + "epoch": 1.67, + "learning_rate": 4.884843991798456e-05, + "loss": 0.0154, + "step": 645930 + }, + { + "epoch": 1.67, + "learning_rate": 4.884455170161309e-05, + "loss": 0.0092, + "step": 645940 + }, + { + "epoch": 1.67, + "learning_rate": 4.884066348524162e-05, + "loss": 0.0093, + "step": 645950 + }, + { + "epoch": 1.67, + "learning_rate": 4.8836775268870156e-05, + "loss": 0.0099, + "step": 645960 + }, + { + "epoch": 1.67, + "learning_rate": 4.883288705249869e-05, + "loss": 0.0086, + "step": 645970 + }, + { + "epoch": 1.67, + "learning_rate": 4.8828998836127226e-05, + "loss": 0.012, + "step": 645980 + }, + { + "epoch": 1.67, + "learning_rate": 4.882511061975576e-05, + "loss": 0.0079, + "step": 645990 + }, + { + "epoch": 1.67, + "learning_rate": 4.8821222403384296e-05, + "loss": 0.0097, + "step": 646000 + }, + { + "epoch": 1.67, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.00513434037566185, + "eval_runtime": 108.0024, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.63, + "step": 646000 + }, + { + "epoch": 1.67, + "learning_rate": 4.881733418701283e-05, + "loss": 0.0096, + "step": 646010 + }, + { + "epoch": 1.67, + "learning_rate": 4.8813445970641365e-05, + "loss": 0.0062, + "step": 646020 + }, + { + "epoch": 1.67, + "learning_rate": 4.880955775426991e-05, + "loss": 0.0069, + "step": 646030 + }, + { + "epoch": 1.67, + "learning_rate": 4.880566953789844e-05, + "loss": 0.0081, + "step": 646040 + }, + { + "epoch": 1.67, + "learning_rate": 4.880178132152698e-05, + "loss": 0.0072, + "step": 646050 + }, + { + "epoch": 1.67, + "learning_rate": 4.879789310515551e-05, + "loss": 0.0086, + "step": 646060 + }, + { + "epoch": 1.67, + "learning_rate": 4.8794004888784047e-05, + "loss": 0.0078, + "step": 646070 + }, + { + "epoch": 1.67, + "learning_rate": 4.879011667241258e-05, + "loss": 0.008, + "step": 646080 + }, + { + "epoch": 1.67, + "learning_rate": 4.8786228456041116e-05, + "loss": 0.0066, + "step": 646090 + }, + { + "epoch": 1.67, + "learning_rate": 4.878234023966965e-05, + "loss": 0.0088, + "step": 646100 + }, + { + "epoch": 1.67, + "learning_rate": 4.877845202329819e-05, + "loss": 0.0111, + "step": 646110 + }, + { + "epoch": 1.67, + "learning_rate": 4.877456380692673e-05, + "loss": 0.01, + "step": 646120 + }, + { + "epoch": 1.67, + "learning_rate": 4.877067559055526e-05, + "loss": 0.0059, + "step": 646130 + }, + { + "epoch": 1.67, + "learning_rate": 4.87667873741838e-05, + "loss": 0.0075, + "step": 646140 + }, + { + "epoch": 1.67, + "learning_rate": 4.876289915781233e-05, + "loss": 0.0065, + "step": 646150 + }, + { + "epoch": 1.67, + "learning_rate": 4.875901094144087e-05, + "loss": 0.0077, + "step": 646160 + }, + { + "epoch": 1.67, + "learning_rate": 4.87551227250694e-05, + "loss": 0.0091, + "step": 646170 + }, + { + "epoch": 1.67, + "learning_rate": 4.875123450869794e-05, + "loss": 0.0078, + "step": 646180 + }, + { + "epoch": 1.68, + "learning_rate": 4.874734629232648e-05, + "loss": 0.0069, + "step": 646190 + }, + { + "epoch": 1.68, + "learning_rate": 4.8743458075955e-05, + "loss": 0.0086, + "step": 646200 + }, + { + "epoch": 1.68, + "learning_rate": 4.873956985958354e-05, + "loss": 0.0088, + "step": 646210 + }, + { + "epoch": 1.68, + "learning_rate": 4.8735681643212076e-05, + "loss": 0.0069, + "step": 646220 + }, + { + "epoch": 1.68, + "learning_rate": 4.873179342684061e-05, + "loss": 0.0062, + "step": 646230 + }, + { + "epoch": 1.68, + "learning_rate": 4.8727905210469146e-05, + "loss": 0.0074, + "step": 646240 + }, + { + "epoch": 1.68, + "learning_rate": 4.872401699409768e-05, + "loss": 0.0087, + "step": 646250 + }, + { + "epoch": 1.68, + "learning_rate": 4.8720128777726216e-05, + "loss": 0.009, + "step": 646260 + }, + { + "epoch": 1.68, + "learning_rate": 4.871624056135475e-05, + "loss": 0.007, + "step": 646270 + }, + { + "epoch": 1.68, + "learning_rate": 4.8712352344983285e-05, + "loss": 0.0067, + "step": 646280 + }, + { + "epoch": 1.68, + "learning_rate": 4.870846412861183e-05, + "loss": 0.0073, + "step": 646290 + }, + { + "epoch": 1.68, + "learning_rate": 4.870457591224036e-05, + "loss": 0.0075, + "step": 646300 + }, + { + "epoch": 1.68, + "learning_rate": 4.87006876958689e-05, + "loss": 0.0091, + "step": 646310 + }, + { + "epoch": 1.68, + "learning_rate": 4.869679947949743e-05, + "loss": 0.0071, + "step": 646320 + }, + { + "epoch": 1.68, + "learning_rate": 4.8692911263125967e-05, + "loss": 0.0062, + "step": 646330 + }, + { + "epoch": 1.68, + "learning_rate": 4.86890230467545e-05, + "loss": 0.007, + "step": 646340 + }, + { + "epoch": 1.68, + "learning_rate": 4.8685134830383036e-05, + "loss": 0.0074, + "step": 646350 + }, + { + "epoch": 1.68, + "learning_rate": 4.868124661401157e-05, + "loss": 0.0067, + "step": 646360 + }, + { + "epoch": 1.68, + "learning_rate": 4.867735839764011e-05, + "loss": 0.0102, + "step": 646370 + }, + { + "epoch": 1.68, + "learning_rate": 4.867347018126865e-05, + "loss": 0.0073, + "step": 646380 + }, + { + "epoch": 1.68, + "learning_rate": 4.866958196489718e-05, + "loss": 0.0073, + "step": 646390 + }, + { + "epoch": 1.68, + "learning_rate": 4.866569374852572e-05, + "loss": 0.008, + "step": 646400 + }, + { + "epoch": 1.68, + "learning_rate": 4.866180553215425e-05, + "loss": 0.0067, + "step": 646410 + }, + { + "epoch": 1.68, + "learning_rate": 4.865791731578279e-05, + "loss": 0.0099, + "step": 646420 + }, + { + "epoch": 1.68, + "learning_rate": 4.865402909941132e-05, + "loss": 0.0083, + "step": 646430 + }, + { + "epoch": 1.68, + "learning_rate": 4.865014088303986e-05, + "loss": 0.0078, + "step": 646440 + }, + { + "epoch": 1.68, + "learning_rate": 4.8646252666668385e-05, + "loss": 0.0087, + "step": 646450 + }, + { + "epoch": 1.68, + "learning_rate": 4.864236445029692e-05, + "loss": 0.0091, + "step": 646460 + }, + { + "epoch": 1.68, + "learning_rate": 4.863847623392546e-05, + "loss": 0.0087, + "step": 646470 + }, + { + "epoch": 1.68, + "learning_rate": 4.8634588017553996e-05, + "loss": 0.0084, + "step": 646480 + }, + { + "epoch": 1.68, + "learning_rate": 4.863069980118253e-05, + "loss": 0.0061, + "step": 646490 + }, + { + "epoch": 1.68, + "learning_rate": 4.8626811584811066e-05, + "loss": 0.0118, + "step": 646500 + }, + { + "epoch": 1.68, + "learning_rate": 4.86229233684396e-05, + "loss": 0.0082, + "step": 646510 + }, + { + "epoch": 1.68, + "learning_rate": 4.8619035152068136e-05, + "loss": 0.0065, + "step": 646520 + }, + { + "epoch": 1.68, + "learning_rate": 4.861514693569667e-05, + "loss": 0.0082, + "step": 646530 + }, + { + "epoch": 1.68, + "learning_rate": 4.8611258719325205e-05, + "loss": 0.0077, + "step": 646540 + }, + { + "epoch": 1.68, + "learning_rate": 4.860737050295374e-05, + "loss": 0.0085, + "step": 646550 + }, + { + "epoch": 1.68, + "learning_rate": 4.860348228658228e-05, + "loss": 0.0105, + "step": 646560 + }, + { + "epoch": 1.68, + "learning_rate": 4.859959407021082e-05, + "loss": 0.0079, + "step": 646570 + }, + { + "epoch": 1.68, + "learning_rate": 4.859570585383935e-05, + "loss": 0.0111, + "step": 646580 + }, + { + "epoch": 1.68, + "learning_rate": 4.8591817637467886e-05, + "loss": 0.0097, + "step": 646590 + }, + { + "epoch": 1.68, + "learning_rate": 4.858792942109642e-05, + "loss": 0.0113, + "step": 646600 + }, + { + "epoch": 1.68, + "learning_rate": 4.8584041204724956e-05, + "loss": 0.0079, + "step": 646610 + }, + { + "epoch": 1.68, + "learning_rate": 4.858015298835349e-05, + "loss": 0.0093, + "step": 646620 + }, + { + "epoch": 1.68, + "learning_rate": 4.8576264771982026e-05, + "loss": 0.013, + "step": 646630 + }, + { + "epoch": 1.68, + "learning_rate": 4.857237655561057e-05, + "loss": 0.0096, + "step": 646640 + }, + { + "epoch": 1.68, + "learning_rate": 4.85684883392391e-05, + "loss": 0.0065, + "step": 646650 + }, + { + "epoch": 1.68, + "learning_rate": 4.856460012286764e-05, + "loss": 0.0073, + "step": 646660 + }, + { + "epoch": 1.68, + "learning_rate": 4.856071190649617e-05, + "loss": 0.0089, + "step": 646670 + }, + { + "epoch": 1.68, + "learning_rate": 4.855682369012471e-05, + "loss": 0.0086, + "step": 646680 + }, + { + "epoch": 1.68, + "learning_rate": 4.8552935473753235e-05, + "loss": 0.0058, + "step": 646690 + }, + { + "epoch": 1.68, + "learning_rate": 4.854904725738177e-05, + "loss": 0.0084, + "step": 646700 + }, + { + "epoch": 1.68, + "learning_rate": 4.8545159041010305e-05, + "loss": 0.006, + "step": 646710 + }, + { + "epoch": 1.68, + "learning_rate": 4.854127082463884e-05, + "loss": 0.0105, + "step": 646720 + }, + { + "epoch": 1.68, + "learning_rate": 4.8537382608267375e-05, + "loss": 0.0111, + "step": 646730 + }, + { + "epoch": 1.68, + "learning_rate": 4.8533494391895916e-05, + "loss": 0.0105, + "step": 646740 + }, + { + "epoch": 1.68, + "learning_rate": 4.852960617552445e-05, + "loss": 0.0096, + "step": 646750 + }, + { + "epoch": 1.68, + "learning_rate": 4.8525717959152986e-05, + "loss": 0.0081, + "step": 646760 + }, + { + "epoch": 1.68, + "learning_rate": 4.852182974278152e-05, + "loss": 0.0071, + "step": 646770 + }, + { + "epoch": 1.68, + "learning_rate": 4.8517941526410056e-05, + "loss": 0.007, + "step": 646780 + }, + { + "epoch": 1.68, + "learning_rate": 4.851405331003859e-05, + "loss": 0.0089, + "step": 646790 + }, + { + "epoch": 1.68, + "learning_rate": 4.8510165093667125e-05, + "loss": 0.0102, + "step": 646800 + }, + { + "epoch": 1.68, + "learning_rate": 4.850627687729566e-05, + "loss": 0.0081, + "step": 646810 + }, + { + "epoch": 1.68, + "learning_rate": 4.85023886609242e-05, + "loss": 0.0137, + "step": 646820 + }, + { + "epoch": 1.68, + "learning_rate": 4.849850044455274e-05, + "loss": 0.0087, + "step": 646830 + }, + { + "epoch": 1.68, + "learning_rate": 4.849461222818127e-05, + "loss": 0.0066, + "step": 646840 + }, + { + "epoch": 1.68, + "learning_rate": 4.8490724011809806e-05, + "loss": 0.0064, + "step": 646850 + }, + { + "epoch": 1.68, + "learning_rate": 4.848683579543834e-05, + "loss": 0.0087, + "step": 646860 + }, + { + "epoch": 1.68, + "learning_rate": 4.8482947579066876e-05, + "loss": 0.0064, + "step": 646870 + }, + { + "epoch": 1.68, + "learning_rate": 4.847905936269541e-05, + "loss": 0.0093, + "step": 646880 + }, + { + "epoch": 1.68, + "learning_rate": 4.8475171146323946e-05, + "loss": 0.0102, + "step": 646890 + }, + { + "epoch": 1.68, + "learning_rate": 4.847128292995249e-05, + "loss": 0.0076, + "step": 646900 + }, + { + "epoch": 1.68, + "learning_rate": 4.846739471358102e-05, + "loss": 0.008, + "step": 646910 + }, + { + "epoch": 1.68, + "learning_rate": 4.846350649720956e-05, + "loss": 0.006, + "step": 646920 + }, + { + "epoch": 1.68, + "learning_rate": 4.845961828083809e-05, + "loss": 0.0076, + "step": 646930 + }, + { + "epoch": 1.68, + "learning_rate": 4.845573006446662e-05, + "loss": 0.0104, + "step": 646940 + }, + { + "epoch": 1.68, + "learning_rate": 4.8451841848095155e-05, + "loss": 0.0089, + "step": 646950 + }, + { + "epoch": 1.68, + "learning_rate": 4.844795363172369e-05, + "loss": 0.0071, + "step": 646960 + }, + { + "epoch": 1.68, + "learning_rate": 4.8444065415352225e-05, + "loss": 0.008, + "step": 646970 + }, + { + "epoch": 1.68, + "learning_rate": 4.844017719898076e-05, + "loss": 0.0091, + "step": 646980 + }, + { + "epoch": 1.68, + "learning_rate": 4.8436288982609294e-05, + "loss": 0.0118, + "step": 646990 + }, + { + "epoch": 1.68, + "learning_rate": 4.8432400766237836e-05, + "loss": 0.0079, + "step": 647000 + }, + { + "epoch": 1.68, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.005205851048231125, + "eval_runtime": 107.5257, + "eval_samples_per_second": 18.6, + "eval_steps_per_second": 4.65, + "step": 647000 + }, + { + "epoch": 1.68, + "learning_rate": 4.842851254986637e-05, + "loss": 0.0118, + "step": 647010 + }, + { + "epoch": 1.68, + "learning_rate": 4.8424624333494906e-05, + "loss": 0.0064, + "step": 647020 + }, + { + "epoch": 1.68, + "learning_rate": 4.842073611712344e-05, + "loss": 0.0095, + "step": 647030 + }, + { + "epoch": 1.68, + "learning_rate": 4.8416847900751976e-05, + "loss": 0.009, + "step": 647040 + }, + { + "epoch": 1.68, + "learning_rate": 4.841295968438051e-05, + "loss": 0.0079, + "step": 647050 + }, + { + "epoch": 1.68, + "learning_rate": 4.8409071468009045e-05, + "loss": 0.0088, + "step": 647060 + }, + { + "epoch": 1.68, + "learning_rate": 4.840518325163758e-05, + "loss": 0.0096, + "step": 647070 + }, + { + "epoch": 1.68, + "learning_rate": 4.840129503526612e-05, + "loss": 0.0128, + "step": 647080 + }, + { + "epoch": 1.68, + "learning_rate": 4.839740681889466e-05, + "loss": 0.0104, + "step": 647090 + }, + { + "epoch": 1.68, + "learning_rate": 4.839351860252319e-05, + "loss": 0.0089, + "step": 647100 + }, + { + "epoch": 1.68, + "learning_rate": 4.8389630386151726e-05, + "loss": 0.0077, + "step": 647110 + }, + { + "epoch": 1.68, + "learning_rate": 4.838574216978026e-05, + "loss": 0.0066, + "step": 647120 + }, + { + "epoch": 1.68, + "learning_rate": 4.8381853953408796e-05, + "loss": 0.0098, + "step": 647130 + }, + { + "epoch": 1.68, + "learning_rate": 4.837796573703733e-05, + "loss": 0.0071, + "step": 647140 + }, + { + "epoch": 1.68, + "learning_rate": 4.8374077520665866e-05, + "loss": 0.0069, + "step": 647150 + }, + { + "epoch": 1.68, + "learning_rate": 4.837018930429441e-05, + "loss": 0.0086, + "step": 647160 + }, + { + "epoch": 1.68, + "learning_rate": 4.836630108792294e-05, + "loss": 0.0093, + "step": 647170 + }, + { + "epoch": 1.68, + "learning_rate": 4.836241287155148e-05, + "loss": 0.0062, + "step": 647180 + }, + { + "epoch": 1.68, + "learning_rate": 4.8358524655180005e-05, + "loss": 0.0067, + "step": 647190 + }, + { + "epoch": 1.68, + "learning_rate": 4.835463643880854e-05, + "loss": 0.0095, + "step": 647200 + }, + { + "epoch": 1.68, + "learning_rate": 4.8350748222437075e-05, + "loss": 0.0076, + "step": 647210 + }, + { + "epoch": 1.68, + "learning_rate": 4.834686000606561e-05, + "loss": 0.0103, + "step": 647220 + }, + { + "epoch": 1.68, + "learning_rate": 4.8342971789694145e-05, + "loss": 0.0051, + "step": 647230 + }, + { + "epoch": 1.68, + "learning_rate": 4.833908357332268e-05, + "loss": 0.0103, + "step": 647240 + }, + { + "epoch": 1.68, + "learning_rate": 4.8335195356951214e-05, + "loss": 0.0092, + "step": 647250 + }, + { + "epoch": 1.68, + "learning_rate": 4.8331307140579756e-05, + "loss": 0.0065, + "step": 647260 + }, + { + "epoch": 1.68, + "learning_rate": 4.832741892420829e-05, + "loss": 0.0091, + "step": 647270 + }, + { + "epoch": 1.68, + "learning_rate": 4.8323530707836826e-05, + "loss": 0.0082, + "step": 647280 + }, + { + "epoch": 1.68, + "learning_rate": 4.831964249146536e-05, + "loss": 0.0076, + "step": 647290 + }, + { + "epoch": 1.68, + "learning_rate": 4.8315754275093896e-05, + "loss": 0.0073, + "step": 647300 + }, + { + "epoch": 1.68, + "learning_rate": 4.831186605872243e-05, + "loss": 0.0102, + "step": 647310 + }, + { + "epoch": 1.68, + "learning_rate": 4.8307977842350965e-05, + "loss": 0.0077, + "step": 647320 + }, + { + "epoch": 1.68, + "learning_rate": 4.83040896259795e-05, + "loss": 0.0096, + "step": 647330 + }, + { + "epoch": 1.68, + "learning_rate": 4.830020140960804e-05, + "loss": 0.006, + "step": 647340 + }, + { + "epoch": 1.68, + "learning_rate": 4.8296313193236577e-05, + "loss": 0.0075, + "step": 647350 + }, + { + "epoch": 1.68, + "learning_rate": 4.829242497686511e-05, + "loss": 0.0086, + "step": 647360 + }, + { + "epoch": 1.68, + "learning_rate": 4.8288536760493646e-05, + "loss": 0.0098, + "step": 647370 + }, + { + "epoch": 1.68, + "learning_rate": 4.828464854412218e-05, + "loss": 0.0067, + "step": 647380 + }, + { + "epoch": 1.68, + "learning_rate": 4.8280760327750716e-05, + "loss": 0.0094, + "step": 647390 + }, + { + "epoch": 1.68, + "learning_rate": 4.827687211137925e-05, + "loss": 0.0084, + "step": 647400 + }, + { + "epoch": 1.68, + "learning_rate": 4.8272983895007786e-05, + "loss": 0.0081, + "step": 647410 + }, + { + "epoch": 1.68, + "learning_rate": 4.826909567863633e-05, + "loss": 0.009, + "step": 647420 + }, + { + "epoch": 1.68, + "learning_rate": 4.826520746226486e-05, + "loss": 0.0072, + "step": 647430 + }, + { + "epoch": 1.68, + "learning_rate": 4.826131924589339e-05, + "loss": 0.0096, + "step": 647440 + }, + { + "epoch": 1.68, + "learning_rate": 4.8257431029521925e-05, + "loss": 0.0067, + "step": 647450 + }, + { + "epoch": 1.68, + "learning_rate": 4.825354281315046e-05, + "loss": 0.0104, + "step": 647460 + }, + { + "epoch": 1.68, + "learning_rate": 4.8249654596778995e-05, + "loss": 0.0077, + "step": 647470 + }, + { + "epoch": 1.68, + "learning_rate": 4.824576638040753e-05, + "loss": 0.0092, + "step": 647480 + }, + { + "epoch": 1.68, + "learning_rate": 4.8241878164036065e-05, + "loss": 0.0062, + "step": 647490 + }, + { + "epoch": 1.68, + "learning_rate": 4.82379899476646e-05, + "loss": 0.0106, + "step": 647500 + }, + { + "epoch": 1.68, + "learning_rate": 4.8234101731293134e-05, + "loss": 0.0102, + "step": 647510 + }, + { + "epoch": 1.68, + "learning_rate": 4.8230213514921676e-05, + "loss": 0.0083, + "step": 647520 + }, + { + "epoch": 1.68, + "learning_rate": 4.822632529855021e-05, + "loss": 0.0086, + "step": 647530 + }, + { + "epoch": 1.68, + "learning_rate": 4.8222437082178746e-05, + "loss": 0.008, + "step": 647540 + }, + { + "epoch": 1.68, + "learning_rate": 4.821854886580728e-05, + "loss": 0.0074, + "step": 647550 + }, + { + "epoch": 1.68, + "learning_rate": 4.8214660649435815e-05, + "loss": 0.0086, + "step": 647560 + }, + { + "epoch": 1.68, + "learning_rate": 4.821077243306435e-05, + "loss": 0.0058, + "step": 647570 + }, + { + "epoch": 1.68, + "learning_rate": 4.8206884216692885e-05, + "loss": 0.0073, + "step": 647580 + }, + { + "epoch": 1.68, + "learning_rate": 4.820299600032142e-05, + "loss": 0.007, + "step": 647590 + }, + { + "epoch": 1.68, + "learning_rate": 4.819910778394996e-05, + "loss": 0.0065, + "step": 647600 + }, + { + "epoch": 1.68, + "learning_rate": 4.8195219567578497e-05, + "loss": 0.0098, + "step": 647610 + }, + { + "epoch": 1.68, + "learning_rate": 4.819133135120703e-05, + "loss": 0.0091, + "step": 647620 + }, + { + "epoch": 1.68, + "learning_rate": 4.8187443134835566e-05, + "loss": 0.0065, + "step": 647630 + }, + { + "epoch": 1.68, + "learning_rate": 4.81835549184641e-05, + "loss": 0.008, + "step": 647640 + }, + { + "epoch": 1.68, + "learning_rate": 4.8179666702092636e-05, + "loss": 0.01, + "step": 647650 + }, + { + "epoch": 1.68, + "learning_rate": 4.817577848572117e-05, + "loss": 0.0079, + "step": 647660 + }, + { + "epoch": 1.68, + "learning_rate": 4.8171890269349706e-05, + "loss": 0.008, + "step": 647670 + }, + { + "epoch": 1.68, + "learning_rate": 4.816800205297825e-05, + "loss": 0.0092, + "step": 647680 + }, + { + "epoch": 1.68, + "learning_rate": 4.816411383660677e-05, + "loss": 0.0066, + "step": 647690 + }, + { + "epoch": 1.68, + "learning_rate": 4.816022562023531e-05, + "loss": 0.0083, + "step": 647700 + }, + { + "epoch": 1.68, + "learning_rate": 4.8156337403863845e-05, + "loss": 0.0077, + "step": 647710 + }, + { + "epoch": 1.68, + "learning_rate": 4.815244918749238e-05, + "loss": 0.0073, + "step": 647720 + }, + { + "epoch": 1.68, + "learning_rate": 4.8148560971120915e-05, + "loss": 0.0123, + "step": 647730 + }, + { + "epoch": 1.68, + "learning_rate": 4.814467275474945e-05, + "loss": 0.0081, + "step": 647740 + }, + { + "epoch": 1.68, + "learning_rate": 4.8140784538377985e-05, + "loss": 0.0084, + "step": 647750 + }, + { + "epoch": 1.68, + "learning_rate": 4.813689632200652e-05, + "loss": 0.0065, + "step": 647760 + }, + { + "epoch": 1.68, + "learning_rate": 4.8133008105635054e-05, + "loss": 0.0111, + "step": 647770 + }, + { + "epoch": 1.68, + "learning_rate": 4.8129119889263596e-05, + "loss": 0.0078, + "step": 647780 + }, + { + "epoch": 1.68, + "learning_rate": 4.812523167289213e-05, + "loss": 0.0067, + "step": 647790 + }, + { + "epoch": 1.68, + "learning_rate": 4.8121343456520666e-05, + "loss": 0.0077, + "step": 647800 + }, + { + "epoch": 1.68, + "learning_rate": 4.81174552401492e-05, + "loss": 0.0071, + "step": 647810 + }, + { + "epoch": 1.68, + "learning_rate": 4.8113567023777735e-05, + "loss": 0.008, + "step": 647820 + }, + { + "epoch": 1.68, + "learning_rate": 4.810967880740627e-05, + "loss": 0.0071, + "step": 647830 + }, + { + "epoch": 1.68, + "learning_rate": 4.8105790591034805e-05, + "loss": 0.0053, + "step": 647840 + }, + { + "epoch": 1.68, + "learning_rate": 4.810190237466334e-05, + "loss": 0.0072, + "step": 647850 + }, + { + "epoch": 1.68, + "learning_rate": 4.8098014158291875e-05, + "loss": 0.0102, + "step": 647860 + }, + { + "epoch": 1.68, + "learning_rate": 4.8094125941920416e-05, + "loss": 0.0065, + "step": 647870 + }, + { + "epoch": 1.68, + "learning_rate": 4.809023772554895e-05, + "loss": 0.0132, + "step": 647880 + }, + { + "epoch": 1.68, + "learning_rate": 4.8086349509177486e-05, + "loss": 0.0079, + "step": 647890 + }, + { + "epoch": 1.68, + "learning_rate": 4.808246129280602e-05, + "loss": 0.0074, + "step": 647900 + }, + { + "epoch": 1.68, + "learning_rate": 4.8078573076434556e-05, + "loss": 0.0086, + "step": 647910 + }, + { + "epoch": 1.68, + "learning_rate": 4.807468486006309e-05, + "loss": 0.0088, + "step": 647920 + }, + { + "epoch": 1.68, + "learning_rate": 4.8070796643691626e-05, + "loss": 0.0074, + "step": 647930 + }, + { + "epoch": 1.68, + "learning_rate": 4.8066908427320154e-05, + "loss": 0.0075, + "step": 647940 + }, + { + "epoch": 1.68, + "learning_rate": 4.806302021094869e-05, + "loss": 0.0086, + "step": 647950 + }, + { + "epoch": 1.68, + "learning_rate": 4.8059131994577223e-05, + "loss": 0.0109, + "step": 647960 + }, + { + "epoch": 1.68, + "learning_rate": 4.8055243778205765e-05, + "loss": 0.0097, + "step": 647970 + }, + { + "epoch": 1.68, + "learning_rate": 4.80513555618343e-05, + "loss": 0.0074, + "step": 647980 + }, + { + "epoch": 1.68, + "learning_rate": 4.8047467345462835e-05, + "loss": 0.0073, + "step": 647990 + }, + { + "epoch": 1.68, + "learning_rate": 4.804357912909137e-05, + "loss": 0.0071, + "step": 648000 + }, + { + "epoch": 1.68, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.005112422164529562, + "eval_runtime": 107.9114, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.633, + "step": 648000 + }, + { + "epoch": 1.68, + "learning_rate": 4.8039690912719905e-05, + "loss": 0.0072, + "step": 648010 + }, + { + "epoch": 1.68, + "learning_rate": 4.803580269634844e-05, + "loss": 0.0086, + "step": 648020 + }, + { + "epoch": 1.68, + "learning_rate": 4.8031914479976974e-05, + "loss": 0.01, + "step": 648030 + }, + { + "epoch": 1.68, + "learning_rate": 4.802802626360551e-05, + "loss": 0.0065, + "step": 648040 + }, + { + "epoch": 1.68, + "learning_rate": 4.802413804723405e-05, + "loss": 0.0096, + "step": 648050 + }, + { + "epoch": 1.68, + "learning_rate": 4.8020249830862586e-05, + "loss": 0.0089, + "step": 648060 + }, + { + "epoch": 1.68, + "learning_rate": 4.801636161449112e-05, + "loss": 0.0082, + "step": 648070 + }, + { + "epoch": 1.68, + "learning_rate": 4.8012473398119655e-05, + "loss": 0.0069, + "step": 648080 + }, + { + "epoch": 1.68, + "learning_rate": 4.800858518174819e-05, + "loss": 0.0098, + "step": 648090 + }, + { + "epoch": 1.68, + "learning_rate": 4.8004696965376725e-05, + "loss": 0.015, + "step": 648100 + }, + { + "epoch": 1.68, + "learning_rate": 4.800080874900526e-05, + "loss": 0.0063, + "step": 648110 + }, + { + "epoch": 1.68, + "learning_rate": 4.7996920532633795e-05, + "loss": 0.0086, + "step": 648120 + }, + { + "epoch": 1.68, + "learning_rate": 4.7993032316262336e-05, + "loss": 0.0083, + "step": 648130 + }, + { + "epoch": 1.68, + "learning_rate": 4.798914409989087e-05, + "loss": 0.0081, + "step": 648140 + }, + { + "epoch": 1.68, + "learning_rate": 4.7985255883519406e-05, + "loss": 0.0072, + "step": 648150 + }, + { + "epoch": 1.68, + "learning_rate": 4.798136766714794e-05, + "loss": 0.0069, + "step": 648160 + }, + { + "epoch": 1.68, + "learning_rate": 4.7977479450776476e-05, + "loss": 0.0074, + "step": 648170 + }, + { + "epoch": 1.68, + "learning_rate": 4.7973591234405004e-05, + "loss": 0.0064, + "step": 648180 + }, + { + "epoch": 1.68, + "learning_rate": 4.796970301803354e-05, + "loss": 0.0075, + "step": 648190 + }, + { + "epoch": 1.68, + "learning_rate": 4.7965814801662074e-05, + "loss": 0.0087, + "step": 648200 + }, + { + "epoch": 1.68, + "learning_rate": 4.796192658529061e-05, + "loss": 0.0072, + "step": 648210 + }, + { + "epoch": 1.68, + "learning_rate": 4.7958038368919143e-05, + "loss": 0.0076, + "step": 648220 + }, + { + "epoch": 1.68, + "learning_rate": 4.7954150152547685e-05, + "loss": 0.0081, + "step": 648230 + }, + { + "epoch": 1.68, + "learning_rate": 4.795026193617622e-05, + "loss": 0.0081, + "step": 648240 + }, + { + "epoch": 1.68, + "learning_rate": 4.7946373719804755e-05, + "loss": 0.0087, + "step": 648250 + }, + { + "epoch": 1.68, + "learning_rate": 4.794248550343329e-05, + "loss": 0.0072, + "step": 648260 + }, + { + "epoch": 1.68, + "learning_rate": 4.7938597287061825e-05, + "loss": 0.0098, + "step": 648270 + }, + { + "epoch": 1.68, + "learning_rate": 4.793470907069036e-05, + "loss": 0.0089, + "step": 648280 + }, + { + "epoch": 1.68, + "learning_rate": 4.7930820854318894e-05, + "loss": 0.0092, + "step": 648290 + }, + { + "epoch": 1.68, + "learning_rate": 4.792693263794743e-05, + "loss": 0.0091, + "step": 648300 + }, + { + "epoch": 1.68, + "learning_rate": 4.792304442157597e-05, + "loss": 0.0078, + "step": 648310 + }, + { + "epoch": 1.68, + "learning_rate": 4.7919156205204506e-05, + "loss": 0.0083, + "step": 648320 + }, + { + "epoch": 1.68, + "learning_rate": 4.791526798883304e-05, + "loss": 0.0079, + "step": 648330 + }, + { + "epoch": 1.68, + "learning_rate": 4.7911379772461575e-05, + "loss": 0.0105, + "step": 648340 + }, + { + "epoch": 1.68, + "learning_rate": 4.790749155609011e-05, + "loss": 0.0091, + "step": 648350 + }, + { + "epoch": 1.68, + "learning_rate": 4.7903603339718645e-05, + "loss": 0.0098, + "step": 648360 + }, + { + "epoch": 1.68, + "learning_rate": 4.789971512334718e-05, + "loss": 0.0079, + "step": 648370 + }, + { + "epoch": 1.68, + "learning_rate": 4.7895826906975715e-05, + "loss": 0.0081, + "step": 648380 + }, + { + "epoch": 1.68, + "learning_rate": 4.7891938690604256e-05, + "loss": 0.0078, + "step": 648390 + }, + { + "epoch": 1.68, + "learning_rate": 4.788805047423279e-05, + "loss": 0.0062, + "step": 648400 + }, + { + "epoch": 1.68, + "learning_rate": 4.7884162257861326e-05, + "loss": 0.0052, + "step": 648410 + }, + { + "epoch": 1.68, + "learning_rate": 4.788027404148986e-05, + "loss": 0.0061, + "step": 648420 + }, + { + "epoch": 1.68, + "learning_rate": 4.787638582511839e-05, + "loss": 0.0087, + "step": 648430 + }, + { + "epoch": 1.68, + "learning_rate": 4.7872497608746924e-05, + "loss": 0.0091, + "step": 648440 + }, + { + "epoch": 1.68, + "learning_rate": 4.786860939237546e-05, + "loss": 0.0087, + "step": 648450 + }, + { + "epoch": 1.68, + "learning_rate": 4.7864721176003994e-05, + "loss": 0.0077, + "step": 648460 + }, + { + "epoch": 1.68, + "learning_rate": 4.786083295963253e-05, + "loss": 0.0104, + "step": 648470 + }, + { + "epoch": 1.68, + "learning_rate": 4.785694474326106e-05, + "loss": 0.006, + "step": 648480 + }, + { + "epoch": 1.68, + "learning_rate": 4.7853056526889605e-05, + "loss": 0.0055, + "step": 648490 + }, + { + "epoch": 1.68, + "learning_rate": 4.784916831051814e-05, + "loss": 0.0076, + "step": 648500 + }, + { + "epoch": 1.68, + "learning_rate": 4.7845280094146675e-05, + "loss": 0.0082, + "step": 648510 + }, + { + "epoch": 1.68, + "learning_rate": 4.784139187777521e-05, + "loss": 0.01, + "step": 648520 + }, + { + "epoch": 1.68, + "learning_rate": 4.7837503661403744e-05, + "loss": 0.006, + "step": 648530 + }, + { + "epoch": 1.68, + "learning_rate": 4.783361544503228e-05, + "loss": 0.0073, + "step": 648540 + }, + { + "epoch": 1.68, + "learning_rate": 4.7829727228660814e-05, + "loss": 0.0088, + "step": 648550 + }, + { + "epoch": 1.68, + "learning_rate": 4.782583901228935e-05, + "loss": 0.0069, + "step": 648560 + }, + { + "epoch": 1.68, + "learning_rate": 4.782195079591789e-05, + "loss": 0.0095, + "step": 648570 + }, + { + "epoch": 1.68, + "learning_rate": 4.7818062579546426e-05, + "loss": 0.0089, + "step": 648580 + }, + { + "epoch": 1.68, + "learning_rate": 4.781417436317496e-05, + "loss": 0.0072, + "step": 648590 + }, + { + "epoch": 1.68, + "learning_rate": 4.7810286146803495e-05, + "loss": 0.0092, + "step": 648600 + }, + { + "epoch": 1.68, + "learning_rate": 4.780639793043203e-05, + "loss": 0.006, + "step": 648610 + }, + { + "epoch": 1.68, + "learning_rate": 4.7802509714060565e-05, + "loss": 0.0084, + "step": 648620 + }, + { + "epoch": 1.68, + "learning_rate": 4.77986214976891e-05, + "loss": 0.0087, + "step": 648630 + }, + { + "epoch": 1.68, + "learning_rate": 4.7794733281317635e-05, + "loss": 0.008, + "step": 648640 + }, + { + "epoch": 1.68, + "learning_rate": 4.7790845064946176e-05, + "loss": 0.0091, + "step": 648650 + }, + { + "epoch": 1.68, + "learning_rate": 4.778695684857471e-05, + "loss": 0.0063, + "step": 648660 + }, + { + "epoch": 1.68, + "learning_rate": 4.7783068632203246e-05, + "loss": 0.0082, + "step": 648670 + }, + { + "epoch": 1.68, + "learning_rate": 4.7779180415831774e-05, + "loss": 0.009, + "step": 648680 + }, + { + "epoch": 1.68, + "learning_rate": 4.777529219946031e-05, + "loss": 0.0078, + "step": 648690 + }, + { + "epoch": 1.68, + "learning_rate": 4.7771403983088844e-05, + "loss": 0.0113, + "step": 648700 + }, + { + "epoch": 1.68, + "learning_rate": 4.776751576671738e-05, + "loss": 0.0104, + "step": 648710 + }, + { + "epoch": 1.68, + "learning_rate": 4.7763627550345914e-05, + "loss": 0.0085, + "step": 648720 + }, + { + "epoch": 1.68, + "learning_rate": 4.775973933397445e-05, + "loss": 0.0077, + "step": 648730 + }, + { + "epoch": 1.68, + "learning_rate": 4.775585111760298e-05, + "loss": 0.0074, + "step": 648740 + }, + { + "epoch": 1.68, + "learning_rate": 4.7751962901231525e-05, + "loss": 0.007, + "step": 648750 + }, + { + "epoch": 1.68, + "learning_rate": 4.774807468486006e-05, + "loss": 0.0108, + "step": 648760 + }, + { + "epoch": 1.68, + "learning_rate": 4.7744186468488595e-05, + "loss": 0.0083, + "step": 648770 + }, + { + "epoch": 1.68, + "learning_rate": 4.774029825211713e-05, + "loss": 0.0077, + "step": 648780 + }, + { + "epoch": 1.68, + "learning_rate": 4.7736410035745664e-05, + "loss": 0.0085, + "step": 648790 + }, + { + "epoch": 1.68, + "learning_rate": 4.77325218193742e-05, + "loss": 0.0076, + "step": 648800 + }, + { + "epoch": 1.68, + "learning_rate": 4.7728633603002734e-05, + "loss": 0.0089, + "step": 648810 + }, + { + "epoch": 1.68, + "learning_rate": 4.772474538663127e-05, + "loss": 0.007, + "step": 648820 + }, + { + "epoch": 1.68, + "learning_rate": 4.772085717025981e-05, + "loss": 0.008, + "step": 648830 + }, + { + "epoch": 1.68, + "learning_rate": 4.7716968953888345e-05, + "loss": 0.0081, + "step": 648840 + }, + { + "epoch": 1.68, + "learning_rate": 4.771308073751688e-05, + "loss": 0.0065, + "step": 648850 + }, + { + "epoch": 1.68, + "learning_rate": 4.7709192521145415e-05, + "loss": 0.0101, + "step": 648860 + }, + { + "epoch": 1.68, + "learning_rate": 4.770530430477395e-05, + "loss": 0.0068, + "step": 648870 + }, + { + "epoch": 1.68, + "learning_rate": 4.7701416088402485e-05, + "loss": 0.008, + "step": 648880 + }, + { + "epoch": 1.68, + "learning_rate": 4.769752787203102e-05, + "loss": 0.0102, + "step": 648890 + }, + { + "epoch": 1.68, + "learning_rate": 4.7693639655659555e-05, + "loss": 0.0078, + "step": 648900 + }, + { + "epoch": 1.68, + "learning_rate": 4.7689751439288096e-05, + "loss": 0.0075, + "step": 648910 + }, + { + "epoch": 1.68, + "learning_rate": 4.768586322291663e-05, + "loss": 0.0105, + "step": 648920 + }, + { + "epoch": 1.68, + "learning_rate": 4.768197500654516e-05, + "loss": 0.0078, + "step": 648930 + }, + { + "epoch": 1.68, + "learning_rate": 4.7678086790173694e-05, + "loss": 0.0103, + "step": 648940 + }, + { + "epoch": 1.68, + "learning_rate": 4.767419857380223e-05, + "loss": 0.006, + "step": 648950 + }, + { + "epoch": 1.68, + "learning_rate": 4.7670310357430764e-05, + "loss": 0.0122, + "step": 648960 + }, + { + "epoch": 1.68, + "learning_rate": 4.76664221410593e-05, + "loss": 0.0097, + "step": 648970 + }, + { + "epoch": 1.68, + "learning_rate": 4.7662533924687834e-05, + "loss": 0.0078, + "step": 648980 + }, + { + "epoch": 1.68, + "learning_rate": 4.765864570831637e-05, + "loss": 0.0069, + "step": 648990 + }, + { + "epoch": 1.68, + "learning_rate": 4.76547574919449e-05, + "loss": 0.0087, + "step": 649000 + }, + { + "epoch": 1.68, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.005129742436110973, + "eval_runtime": 108.1719, + "eval_samples_per_second": 18.489, + "eval_steps_per_second": 4.622, + "step": 649000 + }, + { + "epoch": 1.68, + "learning_rate": 4.7650869275573445e-05, + "loss": 0.0078, + "step": 649010 + }, + { + "epoch": 1.68, + "learning_rate": 4.764698105920198e-05, + "loss": 0.0075, + "step": 649020 + }, + { + "epoch": 1.68, + "learning_rate": 4.7643092842830515e-05, + "loss": 0.011, + "step": 649030 + }, + { + "epoch": 1.68, + "learning_rate": 4.763920462645905e-05, + "loss": 0.0101, + "step": 649040 + }, + { + "epoch": 1.68, + "learning_rate": 4.7635316410087584e-05, + "loss": 0.0108, + "step": 649050 + }, + { + "epoch": 1.68, + "learning_rate": 4.763142819371612e-05, + "loss": 0.0073, + "step": 649060 + }, + { + "epoch": 1.68, + "learning_rate": 4.7627539977344654e-05, + "loss": 0.0096, + "step": 649070 + }, + { + "epoch": 1.68, + "learning_rate": 4.762365176097319e-05, + "loss": 0.0075, + "step": 649080 + }, + { + "epoch": 1.68, + "learning_rate": 4.761976354460173e-05, + "loss": 0.0068, + "step": 649090 + }, + { + "epoch": 1.68, + "learning_rate": 4.7615875328230265e-05, + "loss": 0.0105, + "step": 649100 + }, + { + "epoch": 1.68, + "learning_rate": 4.76119871118588e-05, + "loss": 0.0086, + "step": 649110 + }, + { + "epoch": 1.68, + "learning_rate": 4.7608098895487335e-05, + "loss": 0.0071, + "step": 649120 + }, + { + "epoch": 1.68, + "learning_rate": 4.760421067911587e-05, + "loss": 0.0119, + "step": 649130 + }, + { + "epoch": 1.68, + "learning_rate": 4.7600322462744405e-05, + "loss": 0.01, + "step": 649140 + }, + { + "epoch": 1.68, + "learning_rate": 4.759643424637294e-05, + "loss": 0.0113, + "step": 649150 + }, + { + "epoch": 1.68, + "learning_rate": 4.7592546030001475e-05, + "loss": 0.0089, + "step": 649160 + }, + { + "epoch": 1.68, + "learning_rate": 4.758865781363001e-05, + "loss": 0.0074, + "step": 649170 + }, + { + "epoch": 1.68, + "learning_rate": 4.758476959725854e-05, + "loss": 0.0062, + "step": 649180 + }, + { + "epoch": 1.68, + "learning_rate": 4.758088138088708e-05, + "loss": 0.0085, + "step": 649190 + }, + { + "epoch": 1.68, + "learning_rate": 4.7576993164515614e-05, + "loss": 0.0088, + "step": 649200 + }, + { + "epoch": 1.68, + "learning_rate": 4.757310494814415e-05, + "loss": 0.0096, + "step": 649210 + }, + { + "epoch": 1.68, + "learning_rate": 4.7569216731772684e-05, + "loss": 0.0075, + "step": 649220 + }, + { + "epoch": 1.68, + "learning_rate": 4.756532851540122e-05, + "loss": 0.0093, + "step": 649230 + }, + { + "epoch": 1.68, + "learning_rate": 4.7561440299029754e-05, + "loss": 0.0046, + "step": 649240 + }, + { + "epoch": 1.68, + "learning_rate": 4.755755208265829e-05, + "loss": 0.0091, + "step": 649250 + }, + { + "epoch": 1.68, + "learning_rate": 4.755366386628682e-05, + "loss": 0.0071, + "step": 649260 + }, + { + "epoch": 1.68, + "learning_rate": 4.7549775649915365e-05, + "loss": 0.007, + "step": 649270 + }, + { + "epoch": 1.68, + "learning_rate": 4.75458874335439e-05, + "loss": 0.0075, + "step": 649280 + }, + { + "epoch": 1.68, + "learning_rate": 4.7541999217172435e-05, + "loss": 0.0093, + "step": 649290 + }, + { + "epoch": 1.68, + "learning_rate": 4.753811100080097e-05, + "loss": 0.0118, + "step": 649300 + }, + { + "epoch": 1.68, + "learning_rate": 4.7534222784429504e-05, + "loss": 0.0089, + "step": 649310 + }, + { + "epoch": 1.68, + "learning_rate": 4.753033456805804e-05, + "loss": 0.0098, + "step": 649320 + }, + { + "epoch": 1.68, + "learning_rate": 4.7526446351686574e-05, + "loss": 0.0091, + "step": 649330 + }, + { + "epoch": 1.68, + "learning_rate": 4.752255813531511e-05, + "loss": 0.0076, + "step": 649340 + }, + { + "epoch": 1.68, + "learning_rate": 4.7518669918943644e-05, + "loss": 0.0047, + "step": 649350 + }, + { + "epoch": 1.68, + "learning_rate": 4.7514781702572185e-05, + "loss": 0.0074, + "step": 649360 + }, + { + "epoch": 1.68, + "learning_rate": 4.751089348620072e-05, + "loss": 0.009, + "step": 649370 + }, + { + "epoch": 1.68, + "learning_rate": 4.7507005269829255e-05, + "loss": 0.0057, + "step": 649380 + }, + { + "epoch": 1.68, + "learning_rate": 4.750311705345779e-05, + "loss": 0.0095, + "step": 649390 + }, + { + "epoch": 1.68, + "learning_rate": 4.7499228837086325e-05, + "loss": 0.009, + "step": 649400 + }, + { + "epoch": 1.68, + "learning_rate": 4.749534062071486e-05, + "loss": 0.01, + "step": 649410 + }, + { + "epoch": 1.68, + "learning_rate": 4.749145240434339e-05, + "loss": 0.0081, + "step": 649420 + }, + { + "epoch": 1.68, + "learning_rate": 4.748756418797192e-05, + "loss": 0.0065, + "step": 649430 + }, + { + "epoch": 1.68, + "learning_rate": 4.748367597160046e-05, + "loss": 0.0085, + "step": 649440 + }, + { + "epoch": 1.68, + "learning_rate": 4.747978775522899e-05, + "loss": 0.0091, + "step": 649450 + }, + { + "epoch": 1.68, + "learning_rate": 4.7475899538857534e-05, + "loss": 0.0082, + "step": 649460 + }, + { + "epoch": 1.68, + "learning_rate": 4.747201132248607e-05, + "loss": 0.0059, + "step": 649470 + }, + { + "epoch": 1.68, + "learning_rate": 4.7468123106114604e-05, + "loss": 0.007, + "step": 649480 + }, + { + "epoch": 1.68, + "learning_rate": 4.746423488974314e-05, + "loss": 0.0083, + "step": 649490 + }, + { + "epoch": 1.68, + "learning_rate": 4.7460346673371673e-05, + "loss": 0.0099, + "step": 649500 + }, + { + "epoch": 1.68, + "learning_rate": 4.745645845700021e-05, + "loss": 0.0088, + "step": 649510 + }, + { + "epoch": 1.68, + "learning_rate": 4.745257024062874e-05, + "loss": 0.0068, + "step": 649520 + }, + { + "epoch": 1.68, + "learning_rate": 4.744868202425728e-05, + "loss": 0.0074, + "step": 649530 + }, + { + "epoch": 1.68, + "learning_rate": 4.744479380788582e-05, + "loss": 0.0073, + "step": 649540 + }, + { + "epoch": 1.68, + "learning_rate": 4.7440905591514355e-05, + "loss": 0.0068, + "step": 649550 + }, + { + "epoch": 1.68, + "learning_rate": 4.743701737514289e-05, + "loss": 0.0061, + "step": 649560 + }, + { + "epoch": 1.68, + "learning_rate": 4.7433129158771424e-05, + "loss": 0.0092, + "step": 649570 + }, + { + "epoch": 1.68, + "learning_rate": 4.742924094239996e-05, + "loss": 0.0095, + "step": 649580 + }, + { + "epoch": 1.68, + "learning_rate": 4.7425352726028494e-05, + "loss": 0.0086, + "step": 649590 + }, + { + "epoch": 1.68, + "learning_rate": 4.742146450965703e-05, + "loss": 0.007, + "step": 649600 + }, + { + "epoch": 1.68, + "learning_rate": 4.7417576293285564e-05, + "loss": 0.0077, + "step": 649610 + }, + { + "epoch": 1.68, + "learning_rate": 4.7413688076914105e-05, + "loss": 0.0069, + "step": 649620 + }, + { + "epoch": 1.68, + "learning_rate": 4.740979986054264e-05, + "loss": 0.009, + "step": 649630 + }, + { + "epoch": 1.68, + "learning_rate": 4.7405911644171175e-05, + "loss": 0.0098, + "step": 649640 + }, + { + "epoch": 1.68, + "learning_rate": 4.740202342779971e-05, + "loss": 0.0068, + "step": 649650 + }, + { + "epoch": 1.68, + "learning_rate": 4.7398135211428245e-05, + "loss": 0.0086, + "step": 649660 + }, + { + "epoch": 1.68, + "learning_rate": 4.739424699505677e-05, + "loss": 0.0092, + "step": 649670 + }, + { + "epoch": 1.68, + "learning_rate": 4.739035877868531e-05, + "loss": 0.0065, + "step": 649680 + }, + { + "epoch": 1.68, + "learning_rate": 4.738647056231384e-05, + "loss": 0.0088, + "step": 649690 + }, + { + "epoch": 1.68, + "learning_rate": 4.738258234594238e-05, + "loss": 0.0077, + "step": 649700 + }, + { + "epoch": 1.68, + "learning_rate": 4.737869412957091e-05, + "loss": 0.0094, + "step": 649710 + }, + { + "epoch": 1.68, + "learning_rate": 4.7374805913199454e-05, + "loss": 0.0065, + "step": 649720 + }, + { + "epoch": 1.68, + "learning_rate": 4.737091769682799e-05, + "loss": 0.0069, + "step": 649730 + }, + { + "epoch": 1.68, + "learning_rate": 4.7367029480456524e-05, + "loss": 0.0087, + "step": 649740 + }, + { + "epoch": 1.68, + "learning_rate": 4.736314126408506e-05, + "loss": 0.0068, + "step": 649750 + }, + { + "epoch": 1.68, + "learning_rate": 4.7359253047713593e-05, + "loss": 0.0105, + "step": 649760 + }, + { + "epoch": 1.68, + "learning_rate": 4.735536483134213e-05, + "loss": 0.0073, + "step": 649770 + }, + { + "epoch": 1.68, + "learning_rate": 4.735147661497066e-05, + "loss": 0.0084, + "step": 649780 + }, + { + "epoch": 1.68, + "learning_rate": 4.73475883985992e-05, + "loss": 0.0108, + "step": 649790 + }, + { + "epoch": 1.68, + "learning_rate": 4.734370018222774e-05, + "loss": 0.0072, + "step": 649800 + }, + { + "epoch": 1.68, + "learning_rate": 4.7339811965856274e-05, + "loss": 0.0082, + "step": 649810 + }, + { + "epoch": 1.68, + "learning_rate": 4.733592374948481e-05, + "loss": 0.0063, + "step": 649820 + }, + { + "epoch": 1.68, + "learning_rate": 4.7332035533113344e-05, + "loss": 0.0086, + "step": 649830 + }, + { + "epoch": 1.68, + "learning_rate": 4.732814731674188e-05, + "loss": 0.0069, + "step": 649840 + }, + { + "epoch": 1.68, + "learning_rate": 4.7324259100370414e-05, + "loss": 0.0059, + "step": 649850 + }, + { + "epoch": 1.68, + "learning_rate": 4.732037088399895e-05, + "loss": 0.0108, + "step": 649860 + }, + { + "epoch": 1.68, + "learning_rate": 4.7316482667627484e-05, + "loss": 0.0069, + "step": 649870 + }, + { + "epoch": 1.68, + "learning_rate": 4.7312594451256025e-05, + "loss": 0.0091, + "step": 649880 + }, + { + "epoch": 1.68, + "learning_rate": 4.730870623488456e-05, + "loss": 0.0103, + "step": 649890 + }, + { + "epoch": 1.68, + "learning_rate": 4.7304818018513095e-05, + "loss": 0.0065, + "step": 649900 + }, + { + "epoch": 1.68, + "learning_rate": 4.730092980214163e-05, + "loss": 0.0075, + "step": 649910 + }, + { + "epoch": 1.68, + "learning_rate": 4.729704158577016e-05, + "loss": 0.0082, + "step": 649920 + }, + { + "epoch": 1.68, + "learning_rate": 4.729315336939869e-05, + "loss": 0.0057, + "step": 649930 + }, + { + "epoch": 1.68, + "learning_rate": 4.728926515302723e-05, + "loss": 0.0083, + "step": 649940 + }, + { + "epoch": 1.68, + "learning_rate": 4.728537693665576e-05, + "loss": 0.007, + "step": 649950 + }, + { + "epoch": 1.68, + "learning_rate": 4.72814887202843e-05, + "loss": 0.011, + "step": 649960 + }, + { + "epoch": 1.68, + "learning_rate": 4.727760050391283e-05, + "loss": 0.0097, + "step": 649970 + }, + { + "epoch": 1.68, + "learning_rate": 4.7273712287541374e-05, + "loss": 0.0079, + "step": 649980 + }, + { + "epoch": 1.68, + "learning_rate": 4.726982407116991e-05, + "loss": 0.0071, + "step": 649990 + }, + { + "epoch": 1.68, + "learning_rate": 4.7265935854798444e-05, + "loss": 0.0083, + "step": 650000 + }, + { + "epoch": 1.68, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.005187535658478737, + "eval_runtime": 107.9437, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 650000 + }, + { + "epoch": 1.68, + "learning_rate": 4.726204763842698e-05, + "loss": 0.0114, + "step": 650010 + }, + { + "epoch": 1.68, + "learning_rate": 4.725815942205551e-05, + "loss": 0.0081, + "step": 650020 + }, + { + "epoch": 1.68, + "learning_rate": 4.725427120568405e-05, + "loss": 0.0079, + "step": 650030 + }, + { + "epoch": 1.68, + "learning_rate": 4.725038298931258e-05, + "loss": 0.0084, + "step": 650040 + }, + { + "epoch": 1.69, + "learning_rate": 4.724649477294112e-05, + "loss": 0.0077, + "step": 650050 + }, + { + "epoch": 1.69, + "learning_rate": 4.724260655656966e-05, + "loss": 0.0075, + "step": 650060 + }, + { + "epoch": 1.69, + "learning_rate": 4.7238718340198194e-05, + "loss": 0.0078, + "step": 650070 + }, + { + "epoch": 1.69, + "learning_rate": 4.723483012382673e-05, + "loss": 0.007, + "step": 650080 + }, + { + "epoch": 1.69, + "learning_rate": 4.7230941907455264e-05, + "loss": 0.0063, + "step": 650090 + }, + { + "epoch": 1.69, + "learning_rate": 4.72270536910838e-05, + "loss": 0.0066, + "step": 650100 + }, + { + "epoch": 1.69, + "learning_rate": 4.7223165474712334e-05, + "loss": 0.0096, + "step": 650110 + }, + { + "epoch": 1.69, + "learning_rate": 4.721927725834087e-05, + "loss": 0.0072, + "step": 650120 + }, + { + "epoch": 1.69, + "learning_rate": 4.7215389041969404e-05, + "loss": 0.0092, + "step": 650130 + }, + { + "epoch": 1.69, + "learning_rate": 4.7211500825597945e-05, + "loss": 0.0079, + "step": 650140 + }, + { + "epoch": 1.69, + "learning_rate": 4.720761260922648e-05, + "loss": 0.0083, + "step": 650150 + }, + { + "epoch": 1.69, + "learning_rate": 4.7203724392855015e-05, + "loss": 0.006, + "step": 650160 + }, + { + "epoch": 1.69, + "learning_rate": 4.719983617648354e-05, + "loss": 0.0087, + "step": 650170 + }, + { + "epoch": 1.69, + "learning_rate": 4.719594796011208e-05, + "loss": 0.008, + "step": 650180 + }, + { + "epoch": 1.69, + "learning_rate": 4.719205974374061e-05, + "loss": 0.0084, + "step": 650190 + }, + { + "epoch": 1.69, + "learning_rate": 4.718817152736915e-05, + "loss": 0.007, + "step": 650200 + }, + { + "epoch": 1.69, + "learning_rate": 4.718428331099768e-05, + "loss": 0.008, + "step": 650210 + }, + { + "epoch": 1.69, + "learning_rate": 4.718039509462622e-05, + "loss": 0.0051, + "step": 650220 + }, + { + "epoch": 1.69, + "learning_rate": 4.717650687825475e-05, + "loss": 0.0061, + "step": 650230 + }, + { + "epoch": 1.69, + "learning_rate": 4.7172618661883294e-05, + "loss": 0.0069, + "step": 650240 + }, + { + "epoch": 1.69, + "learning_rate": 4.716873044551183e-05, + "loss": 0.0098, + "step": 650250 + }, + { + "epoch": 1.69, + "learning_rate": 4.7164842229140364e-05, + "loss": 0.0097, + "step": 650260 + }, + { + "epoch": 1.69, + "learning_rate": 4.71609540127689e-05, + "loss": 0.0064, + "step": 650270 + }, + { + "epoch": 1.69, + "learning_rate": 4.715706579639743e-05, + "loss": 0.0068, + "step": 650280 + }, + { + "epoch": 1.69, + "learning_rate": 4.715317758002597e-05, + "loss": 0.0071, + "step": 650290 + }, + { + "epoch": 1.69, + "learning_rate": 4.71492893636545e-05, + "loss": 0.0078, + "step": 650300 + }, + { + "epoch": 1.69, + "learning_rate": 4.714540114728304e-05, + "loss": 0.0069, + "step": 650310 + }, + { + "epoch": 1.69, + "learning_rate": 4.714151293091158e-05, + "loss": 0.0061, + "step": 650320 + }, + { + "epoch": 1.69, + "learning_rate": 4.7137624714540114e-05, + "loss": 0.0087, + "step": 650330 + }, + { + "epoch": 1.69, + "learning_rate": 4.713373649816865e-05, + "loss": 0.0084, + "step": 650340 + }, + { + "epoch": 1.69, + "learning_rate": 4.7129848281797184e-05, + "loss": 0.0097, + "step": 650350 + }, + { + "epoch": 1.69, + "learning_rate": 4.712596006542572e-05, + "loss": 0.0088, + "step": 650360 + }, + { + "epoch": 1.69, + "learning_rate": 4.7122071849054254e-05, + "loss": 0.0075, + "step": 650370 + }, + { + "epoch": 1.69, + "learning_rate": 4.711818363268279e-05, + "loss": 0.0148, + "step": 650380 + }, + { + "epoch": 1.69, + "learning_rate": 4.7114295416311324e-05, + "loss": 0.009, + "step": 650390 + }, + { + "epoch": 1.69, + "learning_rate": 4.7110407199939865e-05, + "loss": 0.007, + "step": 650400 + }, + { + "epoch": 1.69, + "learning_rate": 4.71065189835684e-05, + "loss": 0.0107, + "step": 650410 + }, + { + "epoch": 1.69, + "learning_rate": 4.710263076719693e-05, + "loss": 0.0081, + "step": 650420 + }, + { + "epoch": 1.69, + "learning_rate": 4.709874255082546e-05, + "loss": 0.0098, + "step": 650430 + }, + { + "epoch": 1.69, + "learning_rate": 4.7094854334454e-05, + "loss": 0.0068, + "step": 650440 + }, + { + "epoch": 1.69, + "learning_rate": 4.709096611808253e-05, + "loss": 0.0089, + "step": 650450 + }, + { + "epoch": 1.69, + "learning_rate": 4.708707790171107e-05, + "loss": 0.0069, + "step": 650460 + }, + { + "epoch": 1.69, + "learning_rate": 4.70831896853396e-05, + "loss": 0.0114, + "step": 650470 + }, + { + "epoch": 1.69, + "learning_rate": 4.707930146896814e-05, + "loss": 0.0114, + "step": 650480 + }, + { + "epoch": 1.69, + "learning_rate": 4.707541325259667e-05, + "loss": 0.006, + "step": 650490 + }, + { + "epoch": 1.69, + "learning_rate": 4.7071525036225214e-05, + "loss": 0.0085, + "step": 650500 + }, + { + "epoch": 1.69, + "learning_rate": 4.706763681985375e-05, + "loss": 0.007, + "step": 650510 + }, + { + "epoch": 1.69, + "learning_rate": 4.7063748603482284e-05, + "loss": 0.0071, + "step": 650520 + }, + { + "epoch": 1.69, + "learning_rate": 4.705986038711082e-05, + "loss": 0.0068, + "step": 650530 + }, + { + "epoch": 1.69, + "learning_rate": 4.705597217073935e-05, + "loss": 0.0069, + "step": 650540 + }, + { + "epoch": 1.69, + "learning_rate": 4.705208395436789e-05, + "loss": 0.0092, + "step": 650550 + }, + { + "epoch": 1.69, + "learning_rate": 4.704819573799642e-05, + "loss": 0.0067, + "step": 650560 + }, + { + "epoch": 1.69, + "learning_rate": 4.704430752162496e-05, + "loss": 0.0093, + "step": 650570 + }, + { + "epoch": 1.69, + "learning_rate": 4.70404193052535e-05, + "loss": 0.0075, + "step": 650580 + }, + { + "epoch": 1.69, + "learning_rate": 4.7036531088882034e-05, + "loss": 0.01, + "step": 650590 + }, + { + "epoch": 1.69, + "learning_rate": 4.703264287251057e-05, + "loss": 0.0083, + "step": 650600 + }, + { + "epoch": 1.69, + "learning_rate": 4.7028754656139104e-05, + "loss": 0.0104, + "step": 650610 + }, + { + "epoch": 1.69, + "learning_rate": 4.702486643976764e-05, + "loss": 0.007, + "step": 650620 + }, + { + "epoch": 1.69, + "learning_rate": 4.7020978223396174e-05, + "loss": 0.0077, + "step": 650630 + }, + { + "epoch": 1.69, + "learning_rate": 4.701709000702471e-05, + "loss": 0.0107, + "step": 650640 + }, + { + "epoch": 1.69, + "learning_rate": 4.7013201790653244e-05, + "loss": 0.0072, + "step": 650650 + }, + { + "epoch": 1.69, + "learning_rate": 4.700931357428177e-05, + "loss": 0.0075, + "step": 650660 + }, + { + "epoch": 1.69, + "learning_rate": 4.7005425357910306e-05, + "loss": 0.007, + "step": 650670 + }, + { + "epoch": 1.69, + "learning_rate": 4.700153714153885e-05, + "loss": 0.0068, + "step": 650680 + }, + { + "epoch": 1.69, + "learning_rate": 4.699764892516738e-05, + "loss": 0.0077, + "step": 650690 + }, + { + "epoch": 1.69, + "learning_rate": 4.699376070879592e-05, + "loss": 0.0077, + "step": 650700 + }, + { + "epoch": 1.69, + "learning_rate": 4.698987249242445e-05, + "loss": 0.0056, + "step": 650710 + }, + { + "epoch": 1.69, + "learning_rate": 4.698598427605299e-05, + "loss": 0.0075, + "step": 650720 + }, + { + "epoch": 1.69, + "learning_rate": 4.698209605968152e-05, + "loss": 0.0101, + "step": 650730 + }, + { + "epoch": 1.69, + "learning_rate": 4.697820784331006e-05, + "loss": 0.0078, + "step": 650740 + }, + { + "epoch": 1.69, + "learning_rate": 4.697431962693859e-05, + "loss": 0.0061, + "step": 650750 + }, + { + "epoch": 1.69, + "learning_rate": 4.697043141056713e-05, + "loss": 0.0095, + "step": 650760 + }, + { + "epoch": 1.69, + "learning_rate": 4.696654319419567e-05, + "loss": 0.0092, + "step": 650770 + }, + { + "epoch": 1.69, + "learning_rate": 4.6962654977824203e-05, + "loss": 0.0086, + "step": 650780 + }, + { + "epoch": 1.69, + "learning_rate": 4.695876676145274e-05, + "loss": 0.0071, + "step": 650790 + }, + { + "epoch": 1.69, + "learning_rate": 4.695487854508127e-05, + "loss": 0.0059, + "step": 650800 + }, + { + "epoch": 1.69, + "learning_rate": 4.695099032870981e-05, + "loss": 0.0058, + "step": 650810 + }, + { + "epoch": 1.69, + "learning_rate": 4.694710211233834e-05, + "loss": 0.006, + "step": 650820 + }, + { + "epoch": 1.69, + "learning_rate": 4.694321389596688e-05, + "loss": 0.0072, + "step": 650830 + }, + { + "epoch": 1.69, + "learning_rate": 4.693932567959541e-05, + "loss": 0.0079, + "step": 650840 + }, + { + "epoch": 1.69, + "learning_rate": 4.6935437463223954e-05, + "loss": 0.0063, + "step": 650850 + }, + { + "epoch": 1.69, + "learning_rate": 4.693154924685249e-05, + "loss": 0.0065, + "step": 650860 + }, + { + "epoch": 1.69, + "learning_rate": 4.6927661030481024e-05, + "loss": 0.0097, + "step": 650870 + }, + { + "epoch": 1.69, + "learning_rate": 4.692377281410956e-05, + "loss": 0.0133, + "step": 650880 + }, + { + "epoch": 1.69, + "learning_rate": 4.6919884597738094e-05, + "loss": 0.0077, + "step": 650890 + }, + { + "epoch": 1.69, + "learning_rate": 4.691599638136663e-05, + "loss": 0.0061, + "step": 650900 + }, + { + "epoch": 1.69, + "learning_rate": 4.691210816499516e-05, + "loss": 0.0107, + "step": 650910 + }, + { + "epoch": 1.69, + "learning_rate": 4.690821994862369e-05, + "loss": 0.0074, + "step": 650920 + }, + { + "epoch": 1.69, + "learning_rate": 4.6904331732252226e-05, + "loss": 0.0071, + "step": 650930 + }, + { + "epoch": 1.69, + "learning_rate": 4.690044351588076e-05, + "loss": 0.0094, + "step": 650940 + }, + { + "epoch": 1.69, + "learning_rate": 4.68965552995093e-05, + "loss": 0.0073, + "step": 650950 + }, + { + "epoch": 1.69, + "learning_rate": 4.689266708313784e-05, + "loss": 0.0078, + "step": 650960 + }, + { + "epoch": 1.69, + "learning_rate": 4.688877886676637e-05, + "loss": 0.0072, + "step": 650970 + }, + { + "epoch": 1.69, + "learning_rate": 4.688489065039491e-05, + "loss": 0.0104, + "step": 650980 + }, + { + "epoch": 1.69, + "learning_rate": 4.688100243402344e-05, + "loss": 0.0054, + "step": 650990 + }, + { + "epoch": 1.69, + "learning_rate": 4.687711421765198e-05, + "loss": 0.0129, + "step": 651000 + }, + { + "epoch": 1.69, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.005368160083889961, + "eval_runtime": 107.9578, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.631, + "step": 651000 + }, + { + "epoch": 1.69, + "learning_rate": 4.687322600128051e-05, + "loss": 0.0092, + "step": 651010 + }, + { + "epoch": 1.69, + "learning_rate": 4.686933778490905e-05, + "loss": 0.0078, + "step": 651020 + }, + { + "epoch": 1.69, + "learning_rate": 4.686544956853759e-05, + "loss": 0.0087, + "step": 651030 + }, + { + "epoch": 1.69, + "learning_rate": 4.6861561352166123e-05, + "loss": 0.0068, + "step": 651040 + }, + { + "epoch": 1.69, + "learning_rate": 4.685767313579466e-05, + "loss": 0.01, + "step": 651050 + }, + { + "epoch": 1.69, + "learning_rate": 4.685378491942319e-05, + "loss": 0.0064, + "step": 651060 + }, + { + "epoch": 1.69, + "learning_rate": 4.684989670305173e-05, + "loss": 0.0075, + "step": 651070 + }, + { + "epoch": 1.69, + "learning_rate": 4.684600848668026e-05, + "loss": 0.0065, + "step": 651080 + }, + { + "epoch": 1.69, + "learning_rate": 4.68421202703088e-05, + "loss": 0.0101, + "step": 651090 + }, + { + "epoch": 1.69, + "learning_rate": 4.683823205393733e-05, + "loss": 0.0084, + "step": 651100 + }, + { + "epoch": 1.69, + "learning_rate": 4.6834343837565874e-05, + "loss": 0.009, + "step": 651110 + }, + { + "epoch": 1.69, + "learning_rate": 4.683045562119441e-05, + "loss": 0.0075, + "step": 651120 + }, + { + "epoch": 1.69, + "learning_rate": 4.6826567404822944e-05, + "loss": 0.0075, + "step": 651130 + }, + { + "epoch": 1.69, + "learning_rate": 4.682267918845148e-05, + "loss": 0.0069, + "step": 651140 + }, + { + "epoch": 1.69, + "learning_rate": 4.6818790972080014e-05, + "loss": 0.0074, + "step": 651150 + }, + { + "epoch": 1.69, + "learning_rate": 4.681490275570854e-05, + "loss": 0.0084, + "step": 651160 + }, + { + "epoch": 1.69, + "learning_rate": 4.681101453933708e-05, + "loss": 0.0063, + "step": 651170 + }, + { + "epoch": 1.69, + "learning_rate": 4.680712632296561e-05, + "loss": 0.0085, + "step": 651180 + }, + { + "epoch": 1.69, + "learning_rate": 4.6803238106594146e-05, + "loss": 0.0082, + "step": 651190 + }, + { + "epoch": 1.69, + "learning_rate": 4.679934989022268e-05, + "loss": 0.0093, + "step": 651200 + }, + { + "epoch": 1.69, + "learning_rate": 4.679546167385122e-05, + "loss": 0.0075, + "step": 651210 + }, + { + "epoch": 1.69, + "learning_rate": 4.679157345747976e-05, + "loss": 0.0092, + "step": 651220 + }, + { + "epoch": 1.69, + "learning_rate": 4.678768524110829e-05, + "loss": 0.0096, + "step": 651230 + }, + { + "epoch": 1.69, + "learning_rate": 4.678379702473683e-05, + "loss": 0.0074, + "step": 651240 + }, + { + "epoch": 1.69, + "learning_rate": 4.677990880836536e-05, + "loss": 0.0065, + "step": 651250 + }, + { + "epoch": 1.69, + "learning_rate": 4.67760205919939e-05, + "loss": 0.0066, + "step": 651260 + }, + { + "epoch": 1.69, + "learning_rate": 4.677213237562243e-05, + "loss": 0.0131, + "step": 651270 + }, + { + "epoch": 1.69, + "learning_rate": 4.676824415925097e-05, + "loss": 0.0083, + "step": 651280 + }, + { + "epoch": 1.69, + "learning_rate": 4.676435594287951e-05, + "loss": 0.0095, + "step": 651290 + }, + { + "epoch": 1.69, + "learning_rate": 4.6760467726508043e-05, + "loss": 0.0104, + "step": 651300 + }, + { + "epoch": 1.69, + "learning_rate": 4.675657951013658e-05, + "loss": 0.0086, + "step": 651310 + }, + { + "epoch": 1.69, + "learning_rate": 4.675269129376511e-05, + "loss": 0.0067, + "step": 651320 + }, + { + "epoch": 1.69, + "learning_rate": 4.674880307739365e-05, + "loss": 0.0071, + "step": 651330 + }, + { + "epoch": 1.69, + "learning_rate": 4.674491486102218e-05, + "loss": 0.0087, + "step": 651340 + }, + { + "epoch": 1.69, + "learning_rate": 4.674102664465072e-05, + "loss": 0.0088, + "step": 651350 + }, + { + "epoch": 1.69, + "learning_rate": 4.673713842827925e-05, + "loss": 0.0083, + "step": 651360 + }, + { + "epoch": 1.69, + "learning_rate": 4.6733250211907794e-05, + "loss": 0.0078, + "step": 651370 + }, + { + "epoch": 1.69, + "learning_rate": 4.672936199553633e-05, + "loss": 0.0057, + "step": 651380 + }, + { + "epoch": 1.69, + "learning_rate": 4.6725473779164864e-05, + "loss": 0.0085, + "step": 651390 + }, + { + "epoch": 1.69, + "learning_rate": 4.67215855627934e-05, + "loss": 0.0116, + "step": 651400 + }, + { + "epoch": 1.69, + "learning_rate": 4.671769734642193e-05, + "loss": 0.0077, + "step": 651410 + }, + { + "epoch": 1.69, + "learning_rate": 4.671380913005046e-05, + "loss": 0.0081, + "step": 651420 + }, + { + "epoch": 1.69, + "learning_rate": 4.6709920913678997e-05, + "loss": 0.0068, + "step": 651430 + }, + { + "epoch": 1.69, + "learning_rate": 4.670603269730753e-05, + "loss": 0.0095, + "step": 651440 + }, + { + "epoch": 1.69, + "learning_rate": 4.6702144480936066e-05, + "loss": 0.006, + "step": 651450 + }, + { + "epoch": 1.69, + "learning_rate": 4.66982562645646e-05, + "loss": 0.0084, + "step": 651460 + }, + { + "epoch": 1.69, + "learning_rate": 4.669436804819314e-05, + "loss": 0.0055, + "step": 651470 + }, + { + "epoch": 1.69, + "learning_rate": 4.669047983182168e-05, + "loss": 0.0068, + "step": 651480 + }, + { + "epoch": 1.69, + "learning_rate": 4.668659161545021e-05, + "loss": 0.0065, + "step": 651490 + }, + { + "epoch": 1.69, + "learning_rate": 4.668270339907875e-05, + "loss": 0.0071, + "step": 651500 + }, + { + "epoch": 1.69, + "learning_rate": 4.667881518270728e-05, + "loss": 0.0099, + "step": 651510 + }, + { + "epoch": 1.69, + "learning_rate": 4.667492696633582e-05, + "loss": 0.0067, + "step": 651520 + }, + { + "epoch": 1.69, + "learning_rate": 4.667103874996435e-05, + "loss": 0.0072, + "step": 651530 + }, + { + "epoch": 1.69, + "learning_rate": 4.666715053359289e-05, + "loss": 0.0083, + "step": 651540 + }, + { + "epoch": 1.69, + "learning_rate": 4.666326231722143e-05, + "loss": 0.0073, + "step": 651550 + }, + { + "epoch": 1.69, + "learning_rate": 4.665937410084996e-05, + "loss": 0.0083, + "step": 651560 + }, + { + "epoch": 1.69, + "learning_rate": 4.66554858844785e-05, + "loss": 0.0078, + "step": 651570 + }, + { + "epoch": 1.69, + "learning_rate": 4.665159766810703e-05, + "loss": 0.0078, + "step": 651580 + }, + { + "epoch": 1.69, + "learning_rate": 4.664770945173557e-05, + "loss": 0.0073, + "step": 651590 + }, + { + "epoch": 1.69, + "learning_rate": 4.66438212353641e-05, + "loss": 0.0086, + "step": 651600 + }, + { + "epoch": 1.69, + "learning_rate": 4.663993301899264e-05, + "loss": 0.0079, + "step": 651610 + }, + { + "epoch": 1.69, + "learning_rate": 4.663604480262117e-05, + "loss": 0.0086, + "step": 651620 + }, + { + "epoch": 1.69, + "learning_rate": 4.6632156586249714e-05, + "loss": 0.0096, + "step": 651630 + }, + { + "epoch": 1.69, + "learning_rate": 4.662826836987825e-05, + "loss": 0.0097, + "step": 651640 + }, + { + "epoch": 1.69, + "learning_rate": 4.6624380153506784e-05, + "loss": 0.0078, + "step": 651650 + }, + { + "epoch": 1.69, + "learning_rate": 4.662049193713531e-05, + "loss": 0.0074, + "step": 651660 + }, + { + "epoch": 1.69, + "learning_rate": 4.661660372076385e-05, + "loss": 0.0067, + "step": 651670 + }, + { + "epoch": 1.69, + "learning_rate": 4.661271550439238e-05, + "loss": 0.0073, + "step": 651680 + }, + { + "epoch": 1.69, + "learning_rate": 4.6608827288020917e-05, + "loss": 0.0085, + "step": 651690 + }, + { + "epoch": 1.69, + "learning_rate": 4.660493907164945e-05, + "loss": 0.009, + "step": 651700 + }, + { + "epoch": 1.69, + "learning_rate": 4.6601050855277986e-05, + "loss": 0.009, + "step": 651710 + }, + { + "epoch": 1.69, + "learning_rate": 4.659716263890652e-05, + "loss": 0.0172, + "step": 651720 + }, + { + "epoch": 1.69, + "learning_rate": 4.659327442253506e-05, + "loss": 0.0089, + "step": 651730 + }, + { + "epoch": 1.69, + "learning_rate": 4.65893862061636e-05, + "loss": 0.008, + "step": 651740 + }, + { + "epoch": 1.69, + "learning_rate": 4.658549798979213e-05, + "loss": 0.0073, + "step": 651750 + }, + { + "epoch": 1.69, + "learning_rate": 4.658160977342067e-05, + "loss": 0.0106, + "step": 651760 + }, + { + "epoch": 1.69, + "learning_rate": 4.65777215570492e-05, + "loss": 0.0056, + "step": 651770 + }, + { + "epoch": 1.69, + "learning_rate": 4.657383334067774e-05, + "loss": 0.0108, + "step": 651780 + }, + { + "epoch": 1.69, + "learning_rate": 4.656994512430627e-05, + "loss": 0.0078, + "step": 651790 + }, + { + "epoch": 1.69, + "learning_rate": 4.656605690793481e-05, + "loss": 0.0071, + "step": 651800 + }, + { + "epoch": 1.69, + "learning_rate": 4.656216869156335e-05, + "loss": 0.0093, + "step": 651810 + }, + { + "epoch": 1.69, + "learning_rate": 4.655828047519188e-05, + "loss": 0.0058, + "step": 651820 + }, + { + "epoch": 1.69, + "learning_rate": 4.655439225882042e-05, + "loss": 0.0078, + "step": 651830 + }, + { + "epoch": 1.69, + "learning_rate": 4.655050404244895e-05, + "loss": 0.0069, + "step": 651840 + }, + { + "epoch": 1.69, + "learning_rate": 4.654661582607749e-05, + "loss": 0.0073, + "step": 651850 + }, + { + "epoch": 1.69, + "learning_rate": 4.654272760970602e-05, + "loss": 0.0084, + "step": 651860 + }, + { + "epoch": 1.69, + "learning_rate": 4.653883939333456e-05, + "loss": 0.0109, + "step": 651870 + }, + { + "epoch": 1.69, + "learning_rate": 4.653495117696309e-05, + "loss": 0.0059, + "step": 651880 + }, + { + "epoch": 1.69, + "learning_rate": 4.6531062960591634e-05, + "loss": 0.0099, + "step": 651890 + }, + { + "epoch": 1.69, + "learning_rate": 4.652717474422017e-05, + "loss": 0.0065, + "step": 651900 + }, + { + "epoch": 1.69, + "learning_rate": 4.65232865278487e-05, + "loss": 0.0069, + "step": 651910 + }, + { + "epoch": 1.69, + "learning_rate": 4.651939831147723e-05, + "loss": 0.0065, + "step": 651920 + }, + { + "epoch": 1.69, + "learning_rate": 4.651551009510577e-05, + "loss": 0.005, + "step": 651930 + }, + { + "epoch": 1.69, + "learning_rate": 4.65116218787343e-05, + "loss": 0.0102, + "step": 651940 + }, + { + "epoch": 1.69, + "learning_rate": 4.6507733662362837e-05, + "loss": 0.0101, + "step": 651950 + }, + { + "epoch": 1.69, + "learning_rate": 4.650384544599137e-05, + "loss": 0.0082, + "step": 651960 + }, + { + "epoch": 1.69, + "learning_rate": 4.6499957229619906e-05, + "loss": 0.0069, + "step": 651970 + }, + { + "epoch": 1.69, + "learning_rate": 4.649606901324844e-05, + "loss": 0.0092, + "step": 651980 + }, + { + "epoch": 1.69, + "learning_rate": 4.649218079687698e-05, + "loss": 0.0107, + "step": 651990 + }, + { + "epoch": 1.69, + "learning_rate": 4.648829258050552e-05, + "loss": 0.0075, + "step": 652000 + }, + { + "epoch": 1.69, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.005205278750509024, + "eval_runtime": 107.7051, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 652000 + }, + { + "epoch": 1.69, + "learning_rate": 4.648440436413405e-05, + "loss": 0.0078, + "step": 652010 + }, + { + "epoch": 1.69, + "learning_rate": 4.648051614776259e-05, + "loss": 0.0067, + "step": 652020 + }, + { + "epoch": 1.69, + "learning_rate": 4.647662793139112e-05, + "loss": 0.006, + "step": 652030 + }, + { + "epoch": 1.69, + "learning_rate": 4.647273971501966e-05, + "loss": 0.008, + "step": 652040 + }, + { + "epoch": 1.69, + "learning_rate": 4.646885149864819e-05, + "loss": 0.0059, + "step": 652050 + }, + { + "epoch": 1.69, + "learning_rate": 4.646496328227673e-05, + "loss": 0.0106, + "step": 652060 + }, + { + "epoch": 1.69, + "learning_rate": 4.646107506590526e-05, + "loss": 0.0094, + "step": 652070 + }, + { + "epoch": 1.69, + "learning_rate": 4.64571868495338e-05, + "loss": 0.0065, + "step": 652080 + }, + { + "epoch": 1.69, + "learning_rate": 4.645329863316234e-05, + "loss": 0.0079, + "step": 652090 + }, + { + "epoch": 1.69, + "learning_rate": 4.644941041679087e-05, + "loss": 0.0106, + "step": 652100 + }, + { + "epoch": 1.69, + "learning_rate": 4.644552220041941e-05, + "loss": 0.0062, + "step": 652110 + }, + { + "epoch": 1.69, + "learning_rate": 4.644163398404794e-05, + "loss": 0.0108, + "step": 652120 + }, + { + "epoch": 1.69, + "learning_rate": 4.643774576767648e-05, + "loss": 0.0106, + "step": 652130 + }, + { + "epoch": 1.69, + "learning_rate": 4.643385755130501e-05, + "loss": 0.0082, + "step": 652140 + }, + { + "epoch": 1.69, + "learning_rate": 4.642996933493354e-05, + "loss": 0.007, + "step": 652150 + }, + { + "epoch": 1.69, + "learning_rate": 4.6426081118562075e-05, + "loss": 0.0086, + "step": 652160 + }, + { + "epoch": 1.69, + "learning_rate": 4.642219290219061e-05, + "loss": 0.0094, + "step": 652170 + }, + { + "epoch": 1.69, + "learning_rate": 4.641830468581915e-05, + "loss": 0.0074, + "step": 652180 + }, + { + "epoch": 1.69, + "learning_rate": 4.641441646944769e-05, + "loss": 0.0099, + "step": 652190 + }, + { + "epoch": 1.69, + "learning_rate": 4.641052825307622e-05, + "loss": 0.0079, + "step": 652200 + }, + { + "epoch": 1.69, + "learning_rate": 4.6406640036704756e-05, + "loss": 0.0072, + "step": 652210 + }, + { + "epoch": 1.69, + "learning_rate": 4.640275182033329e-05, + "loss": 0.0085, + "step": 652220 + }, + { + "epoch": 1.69, + "learning_rate": 4.6398863603961826e-05, + "loss": 0.0102, + "step": 652230 + }, + { + "epoch": 1.69, + "learning_rate": 4.639497538759036e-05, + "loss": 0.0097, + "step": 652240 + }, + { + "epoch": 1.69, + "learning_rate": 4.6391087171218896e-05, + "loss": 0.0092, + "step": 652250 + }, + { + "epoch": 1.69, + "learning_rate": 4.638719895484744e-05, + "loss": 0.0064, + "step": 652260 + }, + { + "epoch": 1.69, + "learning_rate": 4.638331073847597e-05, + "loss": 0.0073, + "step": 652270 + }, + { + "epoch": 1.69, + "learning_rate": 4.637942252210451e-05, + "loss": 0.0085, + "step": 652280 + }, + { + "epoch": 1.69, + "learning_rate": 4.637553430573304e-05, + "loss": 0.0071, + "step": 652290 + }, + { + "epoch": 1.69, + "learning_rate": 4.637164608936158e-05, + "loss": 0.0101, + "step": 652300 + }, + { + "epoch": 1.69, + "learning_rate": 4.636775787299011e-05, + "loss": 0.0087, + "step": 652310 + }, + { + "epoch": 1.69, + "learning_rate": 4.636386965661865e-05, + "loss": 0.0098, + "step": 652320 + }, + { + "epoch": 1.69, + "learning_rate": 4.635998144024718e-05, + "loss": 0.0087, + "step": 652330 + }, + { + "epoch": 1.69, + "learning_rate": 4.635609322387572e-05, + "loss": 0.0095, + "step": 652340 + }, + { + "epoch": 1.69, + "learning_rate": 4.635220500750426e-05, + "loss": 0.0076, + "step": 652350 + }, + { + "epoch": 1.69, + "learning_rate": 4.634831679113279e-05, + "loss": 0.0093, + "step": 652360 + }, + { + "epoch": 1.69, + "learning_rate": 4.634442857476133e-05, + "loss": 0.0085, + "step": 652370 + }, + { + "epoch": 1.69, + "learning_rate": 4.634054035838986e-05, + "loss": 0.0066, + "step": 652380 + }, + { + "epoch": 1.69, + "learning_rate": 4.63366521420184e-05, + "loss": 0.0079, + "step": 652390 + }, + { + "epoch": 1.69, + "learning_rate": 4.6332763925646926e-05, + "loss": 0.0072, + "step": 652400 + }, + { + "epoch": 1.69, + "learning_rate": 4.632887570927546e-05, + "loss": 0.0078, + "step": 652410 + }, + { + "epoch": 1.69, + "learning_rate": 4.6324987492903995e-05, + "loss": 0.0066, + "step": 652420 + }, + { + "epoch": 1.69, + "learning_rate": 4.632109927653253e-05, + "loss": 0.0079, + "step": 652430 + }, + { + "epoch": 1.69, + "learning_rate": 4.631721106016107e-05, + "loss": 0.0089, + "step": 652440 + }, + { + "epoch": 1.69, + "learning_rate": 4.631332284378961e-05, + "loss": 0.0055, + "step": 652450 + }, + { + "epoch": 1.69, + "learning_rate": 4.630943462741814e-05, + "loss": 0.0065, + "step": 652460 + }, + { + "epoch": 1.69, + "learning_rate": 4.6305546411046676e-05, + "loss": 0.008, + "step": 652470 + }, + { + "epoch": 1.69, + "learning_rate": 4.630165819467521e-05, + "loss": 0.0098, + "step": 652480 + }, + { + "epoch": 1.69, + "learning_rate": 4.6297769978303746e-05, + "loss": 0.008, + "step": 652490 + }, + { + "epoch": 1.69, + "learning_rate": 4.629388176193228e-05, + "loss": 0.0081, + "step": 652500 + }, + { + "epoch": 1.69, + "learning_rate": 4.6289993545560816e-05, + "loss": 0.0089, + "step": 652510 + }, + { + "epoch": 1.69, + "learning_rate": 4.628610532918936e-05, + "loss": 0.007, + "step": 652520 + }, + { + "epoch": 1.69, + "learning_rate": 4.628221711281789e-05, + "loss": 0.0074, + "step": 652530 + }, + { + "epoch": 1.69, + "learning_rate": 4.627832889644643e-05, + "loss": 0.0095, + "step": 652540 + }, + { + "epoch": 1.69, + "learning_rate": 4.627444068007496e-05, + "loss": 0.008, + "step": 652550 + }, + { + "epoch": 1.69, + "learning_rate": 4.62705524637035e-05, + "loss": 0.0094, + "step": 652560 + }, + { + "epoch": 1.69, + "learning_rate": 4.626666424733203e-05, + "loss": 0.0076, + "step": 652570 + }, + { + "epoch": 1.69, + "learning_rate": 4.626277603096057e-05, + "loss": 0.0091, + "step": 652580 + }, + { + "epoch": 1.69, + "learning_rate": 4.62588878145891e-05, + "loss": 0.0092, + "step": 652590 + }, + { + "epoch": 1.69, + "learning_rate": 4.625499959821764e-05, + "loss": 0.0066, + "step": 652600 + }, + { + "epoch": 1.69, + "learning_rate": 4.625111138184618e-05, + "loss": 0.0097, + "step": 652610 + }, + { + "epoch": 1.69, + "learning_rate": 4.624722316547471e-05, + "loss": 0.0085, + "step": 652620 + }, + { + "epoch": 1.69, + "learning_rate": 4.624333494910325e-05, + "loss": 0.0082, + "step": 652630 + }, + { + "epoch": 1.69, + "learning_rate": 4.623944673273178e-05, + "loss": 0.0066, + "step": 652640 + }, + { + "epoch": 1.69, + "learning_rate": 4.623555851636031e-05, + "loss": 0.0097, + "step": 652650 + }, + { + "epoch": 1.69, + "learning_rate": 4.6231670299988846e-05, + "loss": 0.0087, + "step": 652660 + }, + { + "epoch": 1.69, + "learning_rate": 4.622778208361738e-05, + "loss": 0.0073, + "step": 652670 + }, + { + "epoch": 1.69, + "learning_rate": 4.6223893867245915e-05, + "loss": 0.0087, + "step": 652680 + }, + { + "epoch": 1.69, + "learning_rate": 4.622000565087445e-05, + "loss": 0.0238, + "step": 652690 + }, + { + "epoch": 1.69, + "learning_rate": 4.621611743450299e-05, + "loss": 0.0074, + "step": 652700 + }, + { + "epoch": 1.69, + "learning_rate": 4.621222921813153e-05, + "loss": 0.006, + "step": 652710 + }, + { + "epoch": 1.69, + "learning_rate": 4.620834100176006e-05, + "loss": 0.0086, + "step": 652720 + }, + { + "epoch": 1.69, + "learning_rate": 4.6204452785388596e-05, + "loss": 0.0056, + "step": 652730 + }, + { + "epoch": 1.69, + "learning_rate": 4.620056456901713e-05, + "loss": 0.0058, + "step": 652740 + }, + { + "epoch": 1.69, + "learning_rate": 4.6196676352645666e-05, + "loss": 0.0083, + "step": 652750 + }, + { + "epoch": 1.69, + "learning_rate": 4.61927881362742e-05, + "loss": 0.0066, + "step": 652760 + }, + { + "epoch": 1.69, + "learning_rate": 4.6188899919902736e-05, + "loss": 0.0089, + "step": 652770 + }, + { + "epoch": 1.69, + "learning_rate": 4.618501170353128e-05, + "loss": 0.0073, + "step": 652780 + }, + { + "epoch": 1.69, + "learning_rate": 4.618112348715981e-05, + "loss": 0.0097, + "step": 652790 + }, + { + "epoch": 1.69, + "learning_rate": 4.617723527078835e-05, + "loss": 0.0105, + "step": 652800 + }, + { + "epoch": 1.69, + "learning_rate": 4.617334705441688e-05, + "loss": 0.0066, + "step": 652810 + }, + { + "epoch": 1.69, + "learning_rate": 4.616945883804542e-05, + "loss": 0.0067, + "step": 652820 + }, + { + "epoch": 1.69, + "learning_rate": 4.616557062167395e-05, + "loss": 0.0076, + "step": 652830 + }, + { + "epoch": 1.69, + "learning_rate": 4.6161682405302487e-05, + "loss": 0.0098, + "step": 652840 + }, + { + "epoch": 1.69, + "learning_rate": 4.615779418893102e-05, + "loss": 0.005, + "step": 652850 + }, + { + "epoch": 1.69, + "learning_rate": 4.615390597255956e-05, + "loss": 0.0088, + "step": 652860 + }, + { + "epoch": 1.69, + "learning_rate": 4.61500177561881e-05, + "loss": 0.0077, + "step": 652870 + }, + { + "epoch": 1.69, + "learning_rate": 4.614612953981663e-05, + "loss": 0.0068, + "step": 652880 + }, + { + "epoch": 1.69, + "learning_rate": 4.614224132344517e-05, + "loss": 0.0073, + "step": 652890 + }, + { + "epoch": 1.69, + "learning_rate": 4.6138353107073696e-05, + "loss": 0.015, + "step": 652900 + }, + { + "epoch": 1.69, + "learning_rate": 4.613446489070223e-05, + "loss": 0.0102, + "step": 652910 + }, + { + "epoch": 1.69, + "learning_rate": 4.6130576674330766e-05, + "loss": 0.0074, + "step": 652920 + }, + { + "epoch": 1.69, + "learning_rate": 4.61266884579593e-05, + "loss": 0.0083, + "step": 652930 + }, + { + "epoch": 1.69, + "learning_rate": 4.6122800241587835e-05, + "loss": 0.0094, + "step": 652940 + }, + { + "epoch": 1.69, + "learning_rate": 4.611891202521637e-05, + "loss": 0.0086, + "step": 652950 + }, + { + "epoch": 1.69, + "learning_rate": 4.611502380884491e-05, + "loss": 0.0087, + "step": 652960 + }, + { + "epoch": 1.69, + "learning_rate": 4.6111135592473447e-05, + "loss": 0.0111, + "step": 652970 + }, + { + "epoch": 1.69, + "learning_rate": 4.610724737610198e-05, + "loss": 0.0075, + "step": 652980 + }, + { + "epoch": 1.69, + "learning_rate": 4.6103359159730516e-05, + "loss": 0.0063, + "step": 652990 + }, + { + "epoch": 1.69, + "learning_rate": 4.609947094335905e-05, + "loss": 0.0068, + "step": 653000 + }, + { + "epoch": 1.69, + "eval_cer": 0.8816914892276944, + "eval_loss": 0.005161790177226067, + "eval_runtime": 107.7473, + "eval_samples_per_second": 18.562, + "eval_steps_per_second": 4.64, + "step": 653000 + }, + { + "epoch": 1.69, + "learning_rate": 4.6095582726987586e-05, + "loss": 0.0063, + "step": 653010 + }, + { + "epoch": 1.69, + "learning_rate": 4.609169451061612e-05, + "loss": 0.0101, + "step": 653020 + }, + { + "epoch": 1.69, + "learning_rate": 4.6087806294244656e-05, + "loss": 0.0066, + "step": 653030 + }, + { + "epoch": 1.69, + "learning_rate": 4.60839180778732e-05, + "loss": 0.0091, + "step": 653040 + }, + { + "epoch": 1.69, + "learning_rate": 4.608002986150173e-05, + "loss": 0.0058, + "step": 653050 + }, + { + "epoch": 1.69, + "learning_rate": 4.607614164513027e-05, + "loss": 0.0062, + "step": 653060 + }, + { + "epoch": 1.69, + "learning_rate": 4.60722534287588e-05, + "loss": 0.0063, + "step": 653070 + }, + { + "epoch": 1.69, + "learning_rate": 4.606836521238734e-05, + "loss": 0.0061, + "step": 653080 + }, + { + "epoch": 1.69, + "learning_rate": 4.606447699601587e-05, + "loss": 0.0077, + "step": 653090 + }, + { + "epoch": 1.69, + "learning_rate": 4.6060588779644407e-05, + "loss": 0.0068, + "step": 653100 + }, + { + "epoch": 1.69, + "learning_rate": 4.605670056327294e-05, + "loss": 0.008, + "step": 653110 + }, + { + "epoch": 1.69, + "learning_rate": 4.605281234690148e-05, + "loss": 0.0088, + "step": 653120 + }, + { + "epoch": 1.69, + "learning_rate": 4.604892413053002e-05, + "loss": 0.0079, + "step": 653130 + }, + { + "epoch": 1.69, + "learning_rate": 4.604503591415855e-05, + "loss": 0.0091, + "step": 653140 + }, + { + "epoch": 1.69, + "learning_rate": 4.604114769778708e-05, + "loss": 0.0069, + "step": 653150 + }, + { + "epoch": 1.69, + "learning_rate": 4.6037259481415616e-05, + "loss": 0.0067, + "step": 653160 + }, + { + "epoch": 1.69, + "learning_rate": 4.603337126504415e-05, + "loss": 0.0056, + "step": 653170 + }, + { + "epoch": 1.69, + "learning_rate": 4.6029483048672685e-05, + "loss": 0.0088, + "step": 653180 + }, + { + "epoch": 1.69, + "learning_rate": 4.602559483230122e-05, + "loss": 0.0099, + "step": 653190 + }, + { + "epoch": 1.69, + "learning_rate": 4.6021706615929755e-05, + "loss": 0.0092, + "step": 653200 + }, + { + "epoch": 1.69, + "learning_rate": 4.601781839955829e-05, + "loss": 0.0074, + "step": 653210 + }, + { + "epoch": 1.69, + "learning_rate": 4.601393018318683e-05, + "loss": 0.0071, + "step": 653220 + }, + { + "epoch": 1.69, + "learning_rate": 4.6010041966815367e-05, + "loss": 0.0062, + "step": 653230 + }, + { + "epoch": 1.69, + "learning_rate": 4.60061537504439e-05, + "loss": 0.0068, + "step": 653240 + }, + { + "epoch": 1.69, + "learning_rate": 4.6002265534072436e-05, + "loss": 0.0066, + "step": 653250 + }, + { + "epoch": 1.69, + "learning_rate": 4.599837731770097e-05, + "loss": 0.0079, + "step": 653260 + }, + { + "epoch": 1.69, + "learning_rate": 4.5994489101329506e-05, + "loss": 0.0069, + "step": 653270 + }, + { + "epoch": 1.69, + "learning_rate": 4.599060088495804e-05, + "loss": 0.0081, + "step": 653280 + }, + { + "epoch": 1.69, + "learning_rate": 4.5986712668586576e-05, + "loss": 0.0095, + "step": 653290 + }, + { + "epoch": 1.69, + "learning_rate": 4.598282445221512e-05, + "loss": 0.0076, + "step": 653300 + }, + { + "epoch": 1.69, + "learning_rate": 4.597893623584365e-05, + "loss": 0.0078, + "step": 653310 + }, + { + "epoch": 1.69, + "learning_rate": 4.597504801947219e-05, + "loss": 0.0105, + "step": 653320 + }, + { + "epoch": 1.69, + "learning_rate": 4.597115980310072e-05, + "loss": 0.0091, + "step": 653330 + }, + { + "epoch": 1.69, + "learning_rate": 4.596727158672926e-05, + "loss": 0.008, + "step": 653340 + }, + { + "epoch": 1.69, + "learning_rate": 4.596338337035779e-05, + "loss": 0.0096, + "step": 653350 + }, + { + "epoch": 1.69, + "learning_rate": 4.5959495153986327e-05, + "loss": 0.0059, + "step": 653360 + }, + { + "epoch": 1.69, + "learning_rate": 4.595560693761486e-05, + "loss": 0.0088, + "step": 653370 + }, + { + "epoch": 1.69, + "learning_rate": 4.5951718721243396e-05, + "loss": 0.0102, + "step": 653380 + }, + { + "epoch": 1.69, + "learning_rate": 4.5947830504871924e-05, + "loss": 0.008, + "step": 653390 + }, + { + "epoch": 1.69, + "learning_rate": 4.5943942288500466e-05, + "loss": 0.0108, + "step": 653400 + }, + { + "epoch": 1.69, + "learning_rate": 4.5940054072129e-05, + "loss": 0.0095, + "step": 653410 + }, + { + "epoch": 1.69, + "learning_rate": 4.5936165855757536e-05, + "loss": 0.0067, + "step": 653420 + }, + { + "epoch": 1.69, + "learning_rate": 4.593227763938607e-05, + "loss": 0.0068, + "step": 653430 + }, + { + "epoch": 1.69, + "learning_rate": 4.5928389423014605e-05, + "loss": 0.007, + "step": 653440 + }, + { + "epoch": 1.69, + "learning_rate": 4.592450120664314e-05, + "loss": 0.0088, + "step": 653450 + }, + { + "epoch": 1.69, + "learning_rate": 4.5920612990271675e-05, + "loss": 0.0074, + "step": 653460 + }, + { + "epoch": 1.69, + "learning_rate": 4.591672477390021e-05, + "loss": 0.009, + "step": 653470 + }, + { + "epoch": 1.69, + "learning_rate": 4.5912836557528745e-05, + "loss": 0.0096, + "step": 653480 + }, + { + "epoch": 1.69, + "learning_rate": 4.5908948341157286e-05, + "loss": 0.0065, + "step": 653490 + }, + { + "epoch": 1.69, + "learning_rate": 4.590506012478582e-05, + "loss": 0.0113, + "step": 653500 + }, + { + "epoch": 1.69, + "learning_rate": 4.5901171908414356e-05, + "loss": 0.008, + "step": 653510 + }, + { + "epoch": 1.69, + "learning_rate": 4.589728369204289e-05, + "loss": 0.016, + "step": 653520 + }, + { + "epoch": 1.69, + "learning_rate": 4.5893395475671426e-05, + "loss": 0.0124, + "step": 653530 + }, + { + "epoch": 1.69, + "learning_rate": 4.588950725929996e-05, + "loss": 0.0067, + "step": 653540 + }, + { + "epoch": 1.69, + "learning_rate": 4.5885619042928496e-05, + "loss": 0.007, + "step": 653550 + }, + { + "epoch": 1.69, + "learning_rate": 4.588173082655703e-05, + "loss": 0.0067, + "step": 653560 + }, + { + "epoch": 1.69, + "learning_rate": 4.587784261018557e-05, + "loss": 0.0059, + "step": 653570 + }, + { + "epoch": 1.69, + "learning_rate": 4.587395439381411e-05, + "loss": 0.0102, + "step": 653580 + }, + { + "epoch": 1.69, + "learning_rate": 4.587006617744264e-05, + "loss": 0.0063, + "step": 653590 + }, + { + "epoch": 1.69, + "learning_rate": 4.586617796107118e-05, + "loss": 0.0085, + "step": 653600 + }, + { + "epoch": 1.69, + "learning_rate": 4.586228974469971e-05, + "loss": 0.0076, + "step": 653610 + }, + { + "epoch": 1.69, + "learning_rate": 4.5858401528328246e-05, + "loss": 0.0067, + "step": 653620 + }, + { + "epoch": 1.69, + "learning_rate": 4.585451331195678e-05, + "loss": 0.0063, + "step": 653630 + }, + { + "epoch": 1.69, + "learning_rate": 4.585062509558531e-05, + "loss": 0.0096, + "step": 653640 + }, + { + "epoch": 1.69, + "learning_rate": 4.5846736879213844e-05, + "loss": 0.0069, + "step": 653650 + }, + { + "epoch": 1.69, + "learning_rate": 4.584284866284238e-05, + "loss": 0.0082, + "step": 653660 + }, + { + "epoch": 1.69, + "learning_rate": 4.583896044647092e-05, + "loss": 0.0073, + "step": 653670 + }, + { + "epoch": 1.69, + "learning_rate": 4.5835072230099456e-05, + "loss": 0.0074, + "step": 653680 + }, + { + "epoch": 1.69, + "learning_rate": 4.583118401372799e-05, + "loss": 0.0074, + "step": 653690 + }, + { + "epoch": 1.69, + "learning_rate": 4.5827295797356525e-05, + "loss": 0.011, + "step": 653700 + }, + { + "epoch": 1.69, + "learning_rate": 4.582340758098506e-05, + "loss": 0.0091, + "step": 653710 + }, + { + "epoch": 1.69, + "learning_rate": 4.5819519364613595e-05, + "loss": 0.0077, + "step": 653720 + }, + { + "epoch": 1.69, + "learning_rate": 4.581563114824213e-05, + "loss": 0.0116, + "step": 653730 + }, + { + "epoch": 1.69, + "learning_rate": 4.5811742931870665e-05, + "loss": 0.0073, + "step": 653740 + }, + { + "epoch": 1.69, + "learning_rate": 4.5807854715499206e-05, + "loss": 0.0087, + "step": 653750 + }, + { + "epoch": 1.69, + "learning_rate": 4.580396649912774e-05, + "loss": 0.0074, + "step": 653760 + }, + { + "epoch": 1.69, + "learning_rate": 4.5800078282756276e-05, + "loss": 0.0062, + "step": 653770 + }, + { + "epoch": 1.69, + "learning_rate": 4.579619006638481e-05, + "loss": 0.0095, + "step": 653780 + }, + { + "epoch": 1.69, + "learning_rate": 4.5792301850013346e-05, + "loss": 0.0141, + "step": 653790 + }, + { + "epoch": 1.69, + "learning_rate": 4.578841363364188e-05, + "loss": 0.0087, + "step": 653800 + }, + { + "epoch": 1.69, + "learning_rate": 4.5784525417270416e-05, + "loss": 0.0103, + "step": 653810 + }, + { + "epoch": 1.69, + "learning_rate": 4.578063720089895e-05, + "loss": 0.0082, + "step": 653820 + }, + { + "epoch": 1.69, + "learning_rate": 4.577674898452749e-05, + "loss": 0.0088, + "step": 653830 + }, + { + "epoch": 1.69, + "learning_rate": 4.577286076815603e-05, + "loss": 0.0064, + "step": 653840 + }, + { + "epoch": 1.69, + "learning_rate": 4.576897255178456e-05, + "loss": 0.0059, + "step": 653850 + }, + { + "epoch": 1.69, + "learning_rate": 4.57650843354131e-05, + "loss": 0.0089, + "step": 653860 + }, + { + "epoch": 1.69, + "learning_rate": 4.576119611904163e-05, + "loss": 0.0063, + "step": 653870 + }, + { + "epoch": 1.69, + "learning_rate": 4.5757307902670166e-05, + "loss": 0.0091, + "step": 653880 + }, + { + "epoch": 1.69, + "learning_rate": 4.5753419686298695e-05, + "loss": 0.007, + "step": 653890 + }, + { + "epoch": 1.7, + "learning_rate": 4.574953146992723e-05, + "loss": 0.01, + "step": 653900 + }, + { + "epoch": 1.7, + "learning_rate": 4.5745643253555764e-05, + "loss": 0.0067, + "step": 653910 + }, + { + "epoch": 1.7, + "learning_rate": 4.57417550371843e-05, + "loss": 0.0088, + "step": 653920 + }, + { + "epoch": 1.7, + "learning_rate": 4.573786682081284e-05, + "loss": 0.0107, + "step": 653930 + }, + { + "epoch": 1.7, + "learning_rate": 4.5733978604441376e-05, + "loss": 0.0094, + "step": 653940 + }, + { + "epoch": 1.7, + "learning_rate": 4.573009038806991e-05, + "loss": 0.0098, + "step": 653950 + }, + { + "epoch": 1.7, + "learning_rate": 4.5726202171698445e-05, + "loss": 0.0083, + "step": 653960 + }, + { + "epoch": 1.7, + "learning_rate": 4.572231395532698e-05, + "loss": 0.0073, + "step": 653970 + }, + { + "epoch": 1.7, + "learning_rate": 4.5718425738955515e-05, + "loss": 0.0077, + "step": 653980 + }, + { + "epoch": 1.7, + "learning_rate": 4.571453752258405e-05, + "loss": 0.0092, + "step": 653990 + }, + { + "epoch": 1.7, + "learning_rate": 4.5710649306212585e-05, + "loss": 0.0054, + "step": 654000 + }, + { + "epoch": 1.7, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.005244317930191755, + "eval_runtime": 108.0147, + "eval_samples_per_second": 18.516, + "eval_steps_per_second": 4.629, + "step": 654000 + }, + { + "epoch": 1.7, + "learning_rate": 4.5706761089841126e-05, + "loss": 0.0084, + "step": 654010 + }, + { + "epoch": 1.7, + "learning_rate": 4.570287287346966e-05, + "loss": 0.0106, + "step": 654020 + }, + { + "epoch": 1.7, + "learning_rate": 4.5698984657098196e-05, + "loss": 0.0073, + "step": 654030 + }, + { + "epoch": 1.7, + "learning_rate": 4.569509644072673e-05, + "loss": 0.01, + "step": 654040 + }, + { + "epoch": 1.7, + "learning_rate": 4.5691208224355266e-05, + "loss": 0.0078, + "step": 654050 + }, + { + "epoch": 1.7, + "learning_rate": 4.56873200079838e-05, + "loss": 0.0067, + "step": 654060 + }, + { + "epoch": 1.7, + "learning_rate": 4.5683431791612336e-05, + "loss": 0.0083, + "step": 654070 + }, + { + "epoch": 1.7, + "learning_rate": 4.567954357524087e-05, + "loss": 0.0069, + "step": 654080 + }, + { + "epoch": 1.7, + "learning_rate": 4.567565535886941e-05, + "loss": 0.0073, + "step": 654090 + }, + { + "epoch": 1.7, + "learning_rate": 4.567176714249795e-05, + "loss": 0.0076, + "step": 654100 + }, + { + "epoch": 1.7, + "learning_rate": 4.566787892612648e-05, + "loss": 0.0071, + "step": 654110 + }, + { + "epoch": 1.7, + "learning_rate": 4.566399070975502e-05, + "loss": 0.0059, + "step": 654120 + }, + { + "epoch": 1.7, + "learning_rate": 4.566010249338355e-05, + "loss": 0.007, + "step": 654130 + }, + { + "epoch": 1.7, + "learning_rate": 4.565621427701208e-05, + "loss": 0.0114, + "step": 654140 + }, + { + "epoch": 1.7, + "learning_rate": 4.5652326060640614e-05, + "loss": 0.0121, + "step": 654150 + }, + { + "epoch": 1.7, + "learning_rate": 4.564843784426915e-05, + "loss": 0.0132, + "step": 654160 + }, + { + "epoch": 1.7, + "learning_rate": 4.5644549627897684e-05, + "loss": 0.0075, + "step": 654170 + }, + { + "epoch": 1.7, + "learning_rate": 4.564066141152622e-05, + "loss": 0.0062, + "step": 654180 + }, + { + "epoch": 1.7, + "learning_rate": 4.563677319515476e-05, + "loss": 0.0089, + "step": 654190 + }, + { + "epoch": 1.7, + "learning_rate": 4.5632884978783296e-05, + "loss": 0.007, + "step": 654200 + }, + { + "epoch": 1.7, + "learning_rate": 4.562899676241183e-05, + "loss": 0.0076, + "step": 654210 + }, + { + "epoch": 1.7, + "learning_rate": 4.5625108546040365e-05, + "loss": 0.0086, + "step": 654220 + }, + { + "epoch": 1.7, + "learning_rate": 4.56212203296689e-05, + "loss": 0.0073, + "step": 654230 + }, + { + "epoch": 1.7, + "learning_rate": 4.5617332113297435e-05, + "loss": 0.008, + "step": 654240 + }, + { + "epoch": 1.7, + "learning_rate": 4.561344389692597e-05, + "loss": 0.0103, + "step": 654250 + }, + { + "epoch": 1.7, + "learning_rate": 4.5609555680554505e-05, + "loss": 0.0099, + "step": 654260 + }, + { + "epoch": 1.7, + "learning_rate": 4.5605667464183046e-05, + "loss": 0.0115, + "step": 654270 + }, + { + "epoch": 1.7, + "learning_rate": 4.560177924781158e-05, + "loss": 0.0068, + "step": 654280 + }, + { + "epoch": 1.7, + "learning_rate": 4.5597891031440116e-05, + "loss": 0.0109, + "step": 654290 + }, + { + "epoch": 1.7, + "learning_rate": 4.559400281506865e-05, + "loss": 0.0084, + "step": 654300 + }, + { + "epoch": 1.7, + "learning_rate": 4.5590114598697186e-05, + "loss": 0.008, + "step": 654310 + }, + { + "epoch": 1.7, + "learning_rate": 4.558622638232572e-05, + "loss": 0.0051, + "step": 654320 + }, + { + "epoch": 1.7, + "learning_rate": 4.5582338165954256e-05, + "loss": 0.0066, + "step": 654330 + }, + { + "epoch": 1.7, + "learning_rate": 4.557844994958279e-05, + "loss": 0.007, + "step": 654340 + }, + { + "epoch": 1.7, + "learning_rate": 4.557456173321133e-05, + "loss": 0.0099, + "step": 654350 + }, + { + "epoch": 1.7, + "learning_rate": 4.557067351683987e-05, + "loss": 0.0096, + "step": 654360 + }, + { + "epoch": 1.7, + "learning_rate": 4.55667853004684e-05, + "loss": 0.0087, + "step": 654370 + }, + { + "epoch": 1.7, + "learning_rate": 4.5562897084096937e-05, + "loss": 0.0083, + "step": 654380 + }, + { + "epoch": 1.7, + "learning_rate": 4.5559008867725465e-05, + "loss": 0.007, + "step": 654390 + }, + { + "epoch": 1.7, + "learning_rate": 4.5555120651354e-05, + "loss": 0.008, + "step": 654400 + }, + { + "epoch": 1.7, + "learning_rate": 4.5551232434982534e-05, + "loss": 0.0076, + "step": 654410 + }, + { + "epoch": 1.7, + "learning_rate": 4.554734421861107e-05, + "loss": 0.0086, + "step": 654420 + }, + { + "epoch": 1.7, + "learning_rate": 4.5543456002239604e-05, + "loss": 0.0075, + "step": 654430 + }, + { + "epoch": 1.7, + "learning_rate": 4.553956778586814e-05, + "loss": 0.008, + "step": 654440 + }, + { + "epoch": 1.7, + "learning_rate": 4.553567956949668e-05, + "loss": 0.0083, + "step": 654450 + }, + { + "epoch": 1.7, + "learning_rate": 4.5531791353125215e-05, + "loss": 0.0081, + "step": 654460 + }, + { + "epoch": 1.7, + "learning_rate": 4.552790313675375e-05, + "loss": 0.0081, + "step": 654470 + }, + { + "epoch": 1.7, + "learning_rate": 4.5524014920382285e-05, + "loss": 0.0061, + "step": 654480 + }, + { + "epoch": 1.7, + "learning_rate": 4.552012670401082e-05, + "loss": 0.006, + "step": 654490 + }, + { + "epoch": 1.7, + "learning_rate": 4.5516238487639355e-05, + "loss": 0.0084, + "step": 654500 + }, + { + "epoch": 1.7, + "learning_rate": 4.551235027126789e-05, + "loss": 0.021, + "step": 654510 + }, + { + "epoch": 1.7, + "learning_rate": 4.5508462054896425e-05, + "loss": 0.0095, + "step": 654520 + }, + { + "epoch": 1.7, + "learning_rate": 4.5504573838524966e-05, + "loss": 0.0079, + "step": 654530 + }, + { + "epoch": 1.7, + "learning_rate": 4.55006856221535e-05, + "loss": 0.009, + "step": 654540 + }, + { + "epoch": 1.7, + "learning_rate": 4.5496797405782036e-05, + "loss": 0.0087, + "step": 654550 + }, + { + "epoch": 1.7, + "learning_rate": 4.549290918941057e-05, + "loss": 0.0086, + "step": 654560 + }, + { + "epoch": 1.7, + "learning_rate": 4.5489020973039106e-05, + "loss": 0.0086, + "step": 654570 + }, + { + "epoch": 1.7, + "learning_rate": 4.548513275666764e-05, + "loss": 0.0083, + "step": 654580 + }, + { + "epoch": 1.7, + "learning_rate": 4.5481244540296175e-05, + "loss": 0.009, + "step": 654590 + }, + { + "epoch": 1.7, + "learning_rate": 4.547735632392471e-05, + "loss": 0.0079, + "step": 654600 + }, + { + "epoch": 1.7, + "learning_rate": 4.547346810755325e-05, + "loss": 0.009, + "step": 654610 + }, + { + "epoch": 1.7, + "learning_rate": 4.546957989118179e-05, + "loss": 0.008, + "step": 654620 + }, + { + "epoch": 1.7, + "learning_rate": 4.5465691674810315e-05, + "loss": 0.0064, + "step": 654630 + }, + { + "epoch": 1.7, + "learning_rate": 4.546180345843885e-05, + "loss": 0.0067, + "step": 654640 + }, + { + "epoch": 1.7, + "learning_rate": 4.5457915242067385e-05, + "loss": 0.0076, + "step": 654650 + }, + { + "epoch": 1.7, + "learning_rate": 4.545402702569592e-05, + "loss": 0.0073, + "step": 654660 + }, + { + "epoch": 1.7, + "learning_rate": 4.5450138809324454e-05, + "loss": 0.0107, + "step": 654670 + }, + { + "epoch": 1.7, + "learning_rate": 4.544625059295299e-05, + "loss": 0.0063, + "step": 654680 + }, + { + "epoch": 1.7, + "learning_rate": 4.5442362376581524e-05, + "loss": 0.012, + "step": 654690 + }, + { + "epoch": 1.7, + "learning_rate": 4.543847416021006e-05, + "loss": 0.0091, + "step": 654700 + }, + { + "epoch": 1.7, + "learning_rate": 4.54345859438386e-05, + "loss": 0.0075, + "step": 654710 + }, + { + "epoch": 1.7, + "learning_rate": 4.5430697727467135e-05, + "loss": 0.0065, + "step": 654720 + }, + { + "epoch": 1.7, + "learning_rate": 4.542680951109567e-05, + "loss": 0.0049, + "step": 654730 + }, + { + "epoch": 1.7, + "learning_rate": 4.5422921294724205e-05, + "loss": 0.0061, + "step": 654740 + }, + { + "epoch": 1.7, + "learning_rate": 4.541903307835274e-05, + "loss": 0.0066, + "step": 654750 + }, + { + "epoch": 1.7, + "learning_rate": 4.5415144861981275e-05, + "loss": 0.0056, + "step": 654760 + }, + { + "epoch": 1.7, + "learning_rate": 4.541125664560981e-05, + "loss": 0.0086, + "step": 654770 + }, + { + "epoch": 1.7, + "learning_rate": 4.5407368429238345e-05, + "loss": 0.0113, + "step": 654780 + }, + { + "epoch": 1.7, + "learning_rate": 4.5403480212866886e-05, + "loss": 0.0059, + "step": 654790 + }, + { + "epoch": 1.7, + "learning_rate": 4.539959199649542e-05, + "loss": 0.0081, + "step": 654800 + }, + { + "epoch": 1.7, + "learning_rate": 4.5395703780123956e-05, + "loss": 0.0075, + "step": 654810 + }, + { + "epoch": 1.7, + "learning_rate": 4.539181556375249e-05, + "loss": 0.0087, + "step": 654820 + }, + { + "epoch": 1.7, + "learning_rate": 4.5387927347381026e-05, + "loss": 0.0084, + "step": 654830 + }, + { + "epoch": 1.7, + "learning_rate": 4.538403913100956e-05, + "loss": 0.0104, + "step": 654840 + }, + { + "epoch": 1.7, + "learning_rate": 4.5380150914638095e-05, + "loss": 0.009, + "step": 654850 + }, + { + "epoch": 1.7, + "learning_rate": 4.537626269826663e-05, + "loss": 0.0071, + "step": 654860 + }, + { + "epoch": 1.7, + "learning_rate": 4.5372374481895165e-05, + "loss": 0.0059, + "step": 654870 + }, + { + "epoch": 1.7, + "learning_rate": 4.536848626552369e-05, + "loss": 0.0089, + "step": 654880 + }, + { + "epoch": 1.7, + "learning_rate": 4.5364598049152235e-05, + "loss": 0.0066, + "step": 654890 + }, + { + "epoch": 1.7, + "learning_rate": 4.536070983278077e-05, + "loss": 0.007, + "step": 654900 + }, + { + "epoch": 1.7, + "learning_rate": 4.5356821616409305e-05, + "loss": 0.0095, + "step": 654910 + }, + { + "epoch": 1.7, + "learning_rate": 4.535293340003784e-05, + "loss": 0.0072, + "step": 654920 + }, + { + "epoch": 1.7, + "learning_rate": 4.5349045183666374e-05, + "loss": 0.0093, + "step": 654930 + }, + { + "epoch": 1.7, + "learning_rate": 4.534515696729491e-05, + "loss": 0.0076, + "step": 654940 + }, + { + "epoch": 1.7, + "learning_rate": 4.5341268750923444e-05, + "loss": 0.009, + "step": 654950 + }, + { + "epoch": 1.7, + "learning_rate": 4.533738053455198e-05, + "loss": 0.0092, + "step": 654960 + }, + { + "epoch": 1.7, + "learning_rate": 4.5333492318180514e-05, + "loss": 0.0094, + "step": 654970 + }, + { + "epoch": 1.7, + "learning_rate": 4.5329604101809055e-05, + "loss": 0.0062, + "step": 654980 + }, + { + "epoch": 1.7, + "learning_rate": 4.532571588543759e-05, + "loss": 0.0063, + "step": 654990 + }, + { + "epoch": 1.7, + "learning_rate": 4.5321827669066125e-05, + "loss": 0.0078, + "step": 655000 + }, + { + "epoch": 1.7, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.005221130792051554, + "eval_runtime": 107.696, + "eval_samples_per_second": 18.571, + "eval_steps_per_second": 4.643, + "step": 655000 + }, + { + "epoch": 1.7, + "learning_rate": 4.531793945269466e-05, + "loss": 0.0087, + "step": 655010 + }, + { + "epoch": 1.7, + "learning_rate": 4.5314051236323195e-05, + "loss": 0.0102, + "step": 655020 + }, + { + "epoch": 1.7, + "learning_rate": 4.531016301995173e-05, + "loss": 0.0071, + "step": 655030 + }, + { + "epoch": 1.7, + "learning_rate": 4.5306274803580265e-05, + "loss": 0.0068, + "step": 655040 + }, + { + "epoch": 1.7, + "learning_rate": 4.53023865872088e-05, + "loss": 0.008, + "step": 655050 + }, + { + "epoch": 1.7, + "learning_rate": 4.529849837083734e-05, + "loss": 0.0071, + "step": 655060 + }, + { + "epoch": 1.7, + "learning_rate": 4.5294610154465876e-05, + "loss": 0.0084, + "step": 655070 + }, + { + "epoch": 1.7, + "learning_rate": 4.529072193809441e-05, + "loss": 0.0103, + "step": 655080 + }, + { + "epoch": 1.7, + "learning_rate": 4.5286833721722946e-05, + "loss": 0.0092, + "step": 655090 + }, + { + "epoch": 1.7, + "learning_rate": 4.528294550535148e-05, + "loss": 0.0084, + "step": 655100 + }, + { + "epoch": 1.7, + "learning_rate": 4.5279057288980015e-05, + "loss": 0.0067, + "step": 655110 + }, + { + "epoch": 1.7, + "learning_rate": 4.527516907260855e-05, + "loss": 0.0064, + "step": 655120 + }, + { + "epoch": 1.7, + "learning_rate": 4.527128085623708e-05, + "loss": 0.0105, + "step": 655130 + }, + { + "epoch": 1.7, + "learning_rate": 4.526739263986561e-05, + "loss": 0.01, + "step": 655140 + }, + { + "epoch": 1.7, + "learning_rate": 4.526350442349415e-05, + "loss": 0.009, + "step": 655150 + }, + { + "epoch": 1.7, + "learning_rate": 4.525961620712269e-05, + "loss": 0.0073, + "step": 655160 + }, + { + "epoch": 1.7, + "learning_rate": 4.5255727990751225e-05, + "loss": 0.009, + "step": 655170 + }, + { + "epoch": 1.7, + "learning_rate": 4.525183977437976e-05, + "loss": 0.0097, + "step": 655180 + }, + { + "epoch": 1.7, + "learning_rate": 4.5247951558008294e-05, + "loss": 0.0064, + "step": 655190 + }, + { + "epoch": 1.7, + "learning_rate": 4.524406334163683e-05, + "loss": 0.0065, + "step": 655200 + }, + { + "epoch": 1.7, + "learning_rate": 4.5240175125265364e-05, + "loss": 0.0081, + "step": 655210 + }, + { + "epoch": 1.7, + "learning_rate": 4.52362869088939e-05, + "loss": 0.0057, + "step": 655220 + }, + { + "epoch": 1.7, + "learning_rate": 4.5232398692522434e-05, + "loss": 0.0081, + "step": 655230 + }, + { + "epoch": 1.7, + "learning_rate": 4.5228510476150975e-05, + "loss": 0.0086, + "step": 655240 + }, + { + "epoch": 1.7, + "learning_rate": 4.522462225977951e-05, + "loss": 0.0075, + "step": 655250 + }, + { + "epoch": 1.7, + "learning_rate": 4.5220734043408045e-05, + "loss": 0.0073, + "step": 655260 + }, + { + "epoch": 1.7, + "learning_rate": 4.521684582703658e-05, + "loss": 0.009, + "step": 655270 + }, + { + "epoch": 1.7, + "learning_rate": 4.5212957610665115e-05, + "loss": 0.0094, + "step": 655280 + }, + { + "epoch": 1.7, + "learning_rate": 4.520906939429365e-05, + "loss": 0.0066, + "step": 655290 + }, + { + "epoch": 1.7, + "learning_rate": 4.5205181177922185e-05, + "loss": 0.0072, + "step": 655300 + }, + { + "epoch": 1.7, + "learning_rate": 4.520129296155072e-05, + "loss": 0.0073, + "step": 655310 + }, + { + "epoch": 1.7, + "learning_rate": 4.519740474517926e-05, + "loss": 0.0071, + "step": 655320 + }, + { + "epoch": 1.7, + "learning_rate": 4.5193516528807796e-05, + "loss": 0.0129, + "step": 655330 + }, + { + "epoch": 1.7, + "learning_rate": 4.518962831243633e-05, + "loss": 0.0079, + "step": 655340 + }, + { + "epoch": 1.7, + "learning_rate": 4.5185740096064866e-05, + "loss": 0.0096, + "step": 655350 + }, + { + "epoch": 1.7, + "learning_rate": 4.51818518796934e-05, + "loss": 0.0091, + "step": 655360 + }, + { + "epoch": 1.7, + "learning_rate": 4.5177963663321935e-05, + "loss": 0.0076, + "step": 655370 + }, + { + "epoch": 1.7, + "learning_rate": 4.5174075446950463e-05, + "loss": 0.0073, + "step": 655380 + }, + { + "epoch": 1.7, + "learning_rate": 4.5170187230579e-05, + "loss": 0.0103, + "step": 655390 + }, + { + "epoch": 1.7, + "learning_rate": 4.516629901420753e-05, + "loss": 0.0085, + "step": 655400 + }, + { + "epoch": 1.7, + "learning_rate": 4.516241079783607e-05, + "loss": 0.0087, + "step": 655410 + }, + { + "epoch": 1.7, + "learning_rate": 4.515852258146461e-05, + "loss": 0.0089, + "step": 655420 + }, + { + "epoch": 1.7, + "learning_rate": 4.5154634365093144e-05, + "loss": 0.0088, + "step": 655430 + }, + { + "epoch": 1.7, + "learning_rate": 4.515074614872168e-05, + "loss": 0.008, + "step": 655440 + }, + { + "epoch": 1.7, + "learning_rate": 4.5146857932350214e-05, + "loss": 0.0072, + "step": 655450 + }, + { + "epoch": 1.7, + "learning_rate": 4.514296971597875e-05, + "loss": 0.0082, + "step": 655460 + }, + { + "epoch": 1.7, + "learning_rate": 4.5139081499607284e-05, + "loss": 0.0073, + "step": 655470 + }, + { + "epoch": 1.7, + "learning_rate": 4.513519328323582e-05, + "loss": 0.0059, + "step": 655480 + }, + { + "epoch": 1.7, + "learning_rate": 4.5131305066864354e-05, + "loss": 0.0068, + "step": 655490 + }, + { + "epoch": 1.7, + "learning_rate": 4.5127416850492895e-05, + "loss": 0.0081, + "step": 655500 + }, + { + "epoch": 1.7, + "learning_rate": 4.512352863412143e-05, + "loss": 0.0079, + "step": 655510 + }, + { + "epoch": 1.7, + "learning_rate": 4.5119640417749965e-05, + "loss": 0.0086, + "step": 655520 + }, + { + "epoch": 1.7, + "learning_rate": 4.51157522013785e-05, + "loss": 0.0064, + "step": 655530 + }, + { + "epoch": 1.7, + "learning_rate": 4.5111863985007035e-05, + "loss": 0.0074, + "step": 655540 + }, + { + "epoch": 1.7, + "learning_rate": 4.510797576863557e-05, + "loss": 0.0053, + "step": 655550 + }, + { + "epoch": 1.7, + "learning_rate": 4.5104087552264104e-05, + "loss": 0.0095, + "step": 655560 + }, + { + "epoch": 1.7, + "learning_rate": 4.510019933589264e-05, + "loss": 0.0096, + "step": 655570 + }, + { + "epoch": 1.7, + "learning_rate": 4.509631111952118e-05, + "loss": 0.0096, + "step": 655580 + }, + { + "epoch": 1.7, + "learning_rate": 4.5092422903149716e-05, + "loss": 0.0063, + "step": 655590 + }, + { + "epoch": 1.7, + "learning_rate": 4.508853468677825e-05, + "loss": 0.0087, + "step": 655600 + }, + { + "epoch": 1.7, + "learning_rate": 4.5084646470406786e-05, + "loss": 0.0111, + "step": 655610 + }, + { + "epoch": 1.7, + "learning_rate": 4.508075825403532e-05, + "loss": 0.0079, + "step": 655620 + }, + { + "epoch": 1.7, + "learning_rate": 4.507687003766385e-05, + "loss": 0.0125, + "step": 655630 + }, + { + "epoch": 1.7, + "learning_rate": 4.507298182129238e-05, + "loss": 0.008, + "step": 655640 + }, + { + "epoch": 1.7, + "learning_rate": 4.506909360492092e-05, + "loss": 0.0094, + "step": 655650 + }, + { + "epoch": 1.7, + "learning_rate": 4.506520538854945e-05, + "loss": 0.007, + "step": 655660 + }, + { + "epoch": 1.7, + "learning_rate": 4.506131717217799e-05, + "loss": 0.0065, + "step": 655670 + }, + { + "epoch": 1.7, + "learning_rate": 4.505742895580653e-05, + "loss": 0.008, + "step": 655680 + }, + { + "epoch": 1.7, + "learning_rate": 4.5053540739435064e-05, + "loss": 0.0079, + "step": 655690 + }, + { + "epoch": 1.7, + "learning_rate": 4.50496525230636e-05, + "loss": 0.0087, + "step": 655700 + }, + { + "epoch": 1.7, + "learning_rate": 4.5045764306692134e-05, + "loss": 0.0073, + "step": 655710 + }, + { + "epoch": 1.7, + "learning_rate": 4.504187609032067e-05, + "loss": 0.0083, + "step": 655720 + }, + { + "epoch": 1.7, + "learning_rate": 4.5037987873949204e-05, + "loss": 0.0072, + "step": 655730 + }, + { + "epoch": 1.7, + "learning_rate": 4.503409965757774e-05, + "loss": 0.0066, + "step": 655740 + }, + { + "epoch": 1.7, + "learning_rate": 4.5030211441206274e-05, + "loss": 0.0057, + "step": 655750 + }, + { + "epoch": 1.7, + "learning_rate": 4.5026323224834815e-05, + "loss": 0.0082, + "step": 655760 + }, + { + "epoch": 1.7, + "learning_rate": 4.502243500846335e-05, + "loss": 0.0109, + "step": 655770 + }, + { + "epoch": 1.7, + "learning_rate": 4.5018546792091885e-05, + "loss": 0.0073, + "step": 655780 + }, + { + "epoch": 1.7, + "learning_rate": 4.501465857572042e-05, + "loss": 0.0084, + "step": 655790 + }, + { + "epoch": 1.7, + "learning_rate": 4.5010770359348955e-05, + "loss": 0.0063, + "step": 655800 + }, + { + "epoch": 1.7, + "learning_rate": 4.500688214297749e-05, + "loss": 0.0091, + "step": 655810 + }, + { + "epoch": 1.7, + "learning_rate": 4.5002993926606024e-05, + "loss": 0.008, + "step": 655820 + }, + { + "epoch": 1.7, + "learning_rate": 4.499910571023456e-05, + "loss": 0.0094, + "step": 655830 + }, + { + "epoch": 1.7, + "learning_rate": 4.49952174938631e-05, + "loss": 0.0081, + "step": 655840 + }, + { + "epoch": 1.7, + "learning_rate": 4.4991329277491636e-05, + "loss": 0.0076, + "step": 655850 + }, + { + "epoch": 1.7, + "learning_rate": 4.498744106112017e-05, + "loss": 0.0107, + "step": 655860 + }, + { + "epoch": 1.7, + "learning_rate": 4.49835528447487e-05, + "loss": 0.0063, + "step": 655870 + }, + { + "epoch": 1.7, + "learning_rate": 4.4979664628377234e-05, + "loss": 0.0065, + "step": 655880 + }, + { + "epoch": 1.7, + "learning_rate": 4.497577641200577e-05, + "loss": 0.0093, + "step": 655890 + }, + { + "epoch": 1.7, + "learning_rate": 4.49718881956343e-05, + "loss": 0.0065, + "step": 655900 + }, + { + "epoch": 1.7, + "learning_rate": 4.496799997926284e-05, + "loss": 0.006, + "step": 655910 + }, + { + "epoch": 1.7, + "learning_rate": 4.496411176289137e-05, + "loss": 0.0066, + "step": 655920 + }, + { + "epoch": 1.7, + "learning_rate": 4.496022354651991e-05, + "loss": 0.0081, + "step": 655930 + }, + { + "epoch": 1.7, + "learning_rate": 4.495633533014845e-05, + "loss": 0.009, + "step": 655940 + }, + { + "epoch": 1.7, + "learning_rate": 4.4952447113776984e-05, + "loss": 0.0114, + "step": 655950 + }, + { + "epoch": 1.7, + "learning_rate": 4.494855889740552e-05, + "loss": 0.0075, + "step": 655960 + }, + { + "epoch": 1.7, + "learning_rate": 4.4944670681034054e-05, + "loss": 0.0069, + "step": 655970 + }, + { + "epoch": 1.7, + "learning_rate": 4.494078246466259e-05, + "loss": 0.0083, + "step": 655980 + }, + { + "epoch": 1.7, + "learning_rate": 4.4936894248291124e-05, + "loss": 0.0066, + "step": 655990 + }, + { + "epoch": 1.7, + "learning_rate": 4.493300603191966e-05, + "loss": 0.0096, + "step": 656000 + }, + { + "epoch": 1.7, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.005197363439947367, + "eval_runtime": 108.0429, + "eval_samples_per_second": 18.511, + "eval_steps_per_second": 4.628, + "step": 656000 + }, + { + "epoch": 1.7, + "learning_rate": 4.4929117815548194e-05, + "loss": 0.0084, + "step": 656010 + }, + { + "epoch": 1.7, + "learning_rate": 4.4925229599176735e-05, + "loss": 0.0082, + "step": 656020 + }, + { + "epoch": 1.7, + "learning_rate": 4.492134138280527e-05, + "loss": 0.0084, + "step": 656030 + }, + { + "epoch": 1.7, + "learning_rate": 4.4917453166433805e-05, + "loss": 0.0106, + "step": 656040 + }, + { + "epoch": 1.7, + "learning_rate": 4.491356495006234e-05, + "loss": 0.0129, + "step": 656050 + }, + { + "epoch": 1.7, + "learning_rate": 4.4909676733690875e-05, + "loss": 0.0082, + "step": 656060 + }, + { + "epoch": 1.7, + "learning_rate": 4.490578851731941e-05, + "loss": 0.0083, + "step": 656070 + }, + { + "epoch": 1.7, + "learning_rate": 4.4901900300947944e-05, + "loss": 0.0063, + "step": 656080 + }, + { + "epoch": 1.7, + "learning_rate": 4.489801208457648e-05, + "loss": 0.0063, + "step": 656090 + }, + { + "epoch": 1.7, + "learning_rate": 4.489412386820502e-05, + "loss": 0.0079, + "step": 656100 + }, + { + "epoch": 1.7, + "learning_rate": 4.4890235651833556e-05, + "loss": 0.009, + "step": 656110 + }, + { + "epoch": 1.7, + "learning_rate": 4.4886347435462084e-05, + "loss": 0.0081, + "step": 656120 + }, + { + "epoch": 1.7, + "learning_rate": 4.488245921909062e-05, + "loss": 0.0082, + "step": 656130 + }, + { + "epoch": 1.7, + "learning_rate": 4.4878571002719154e-05, + "loss": 0.0072, + "step": 656140 + }, + { + "epoch": 1.7, + "learning_rate": 4.487468278634769e-05, + "loss": 0.0064, + "step": 656150 + }, + { + "epoch": 1.7, + "learning_rate": 4.487079456997622e-05, + "loss": 0.0084, + "step": 656160 + }, + { + "epoch": 1.7, + "learning_rate": 4.486690635360476e-05, + "loss": 0.0073, + "step": 656170 + }, + { + "epoch": 1.7, + "learning_rate": 4.486301813723329e-05, + "loss": 0.0073, + "step": 656180 + }, + { + "epoch": 1.7, + "learning_rate": 4.485912992086183e-05, + "loss": 0.0068, + "step": 656190 + }, + { + "epoch": 1.7, + "learning_rate": 4.485524170449037e-05, + "loss": 0.0085, + "step": 656200 + }, + { + "epoch": 1.7, + "learning_rate": 4.4851353488118904e-05, + "loss": 0.0084, + "step": 656210 + }, + { + "epoch": 1.7, + "learning_rate": 4.484746527174744e-05, + "loss": 0.01, + "step": 656220 + }, + { + "epoch": 1.7, + "learning_rate": 4.4843577055375974e-05, + "loss": 0.01, + "step": 656230 + }, + { + "epoch": 1.7, + "learning_rate": 4.483968883900451e-05, + "loss": 0.0112, + "step": 656240 + }, + { + "epoch": 1.7, + "learning_rate": 4.4835800622633044e-05, + "loss": 0.0089, + "step": 656250 + }, + { + "epoch": 1.7, + "learning_rate": 4.483191240626158e-05, + "loss": 0.0076, + "step": 656260 + }, + { + "epoch": 1.7, + "learning_rate": 4.4828024189890114e-05, + "loss": 0.0071, + "step": 656270 + }, + { + "epoch": 1.7, + "learning_rate": 4.482413597351865e-05, + "loss": 0.0071, + "step": 656280 + }, + { + "epoch": 1.7, + "learning_rate": 4.482024775714719e-05, + "loss": 0.0071, + "step": 656290 + }, + { + "epoch": 1.7, + "learning_rate": 4.4816359540775725e-05, + "loss": 0.009, + "step": 656300 + }, + { + "epoch": 1.7, + "learning_rate": 4.481247132440426e-05, + "loss": 0.006, + "step": 656310 + }, + { + "epoch": 1.7, + "learning_rate": 4.4808583108032795e-05, + "loss": 0.0074, + "step": 656320 + }, + { + "epoch": 1.7, + "learning_rate": 4.480469489166133e-05, + "loss": 0.0066, + "step": 656330 + }, + { + "epoch": 1.7, + "learning_rate": 4.4800806675289864e-05, + "loss": 0.0083, + "step": 656340 + }, + { + "epoch": 1.7, + "learning_rate": 4.47969184589184e-05, + "loss": 0.0073, + "step": 656350 + }, + { + "epoch": 1.7, + "learning_rate": 4.4793030242546934e-05, + "loss": 0.0077, + "step": 656360 + }, + { + "epoch": 1.7, + "learning_rate": 4.478914202617546e-05, + "loss": 0.0079, + "step": 656370 + }, + { + "epoch": 1.7, + "learning_rate": 4.4785253809804e-05, + "loss": 0.0081, + "step": 656380 + }, + { + "epoch": 1.7, + "learning_rate": 4.478136559343254e-05, + "loss": 0.0058, + "step": 656390 + }, + { + "epoch": 1.7, + "learning_rate": 4.4777477377061073e-05, + "loss": 0.008, + "step": 656400 + }, + { + "epoch": 1.7, + "learning_rate": 4.477358916068961e-05, + "loss": 0.0086, + "step": 656410 + }, + { + "epoch": 1.7, + "learning_rate": 4.476970094431814e-05, + "loss": 0.0074, + "step": 656420 + }, + { + "epoch": 1.7, + "learning_rate": 4.476581272794668e-05, + "loss": 0.0082, + "step": 656430 + }, + { + "epoch": 1.7, + "learning_rate": 4.476192451157521e-05, + "loss": 0.0081, + "step": 656440 + }, + { + "epoch": 1.7, + "learning_rate": 4.475803629520375e-05, + "loss": 0.0084, + "step": 656450 + }, + { + "epoch": 1.7, + "learning_rate": 4.475414807883228e-05, + "loss": 0.007, + "step": 656460 + }, + { + "epoch": 1.7, + "learning_rate": 4.4750259862460824e-05, + "loss": 0.0102, + "step": 656470 + }, + { + "epoch": 1.7, + "learning_rate": 4.474637164608936e-05, + "loss": 0.0085, + "step": 656480 + }, + { + "epoch": 1.7, + "learning_rate": 4.4742483429717894e-05, + "loss": 0.0056, + "step": 656490 + }, + { + "epoch": 1.7, + "learning_rate": 4.473859521334643e-05, + "loss": 0.0064, + "step": 656500 + }, + { + "epoch": 1.7, + "learning_rate": 4.4734706996974964e-05, + "loss": 0.0079, + "step": 656510 + }, + { + "epoch": 1.7, + "learning_rate": 4.47308187806035e-05, + "loss": 0.0096, + "step": 656520 + }, + { + "epoch": 1.7, + "learning_rate": 4.4726930564232033e-05, + "loss": 0.0067, + "step": 656530 + }, + { + "epoch": 1.7, + "learning_rate": 4.472304234786057e-05, + "loss": 0.0097, + "step": 656540 + }, + { + "epoch": 1.7, + "learning_rate": 4.471915413148911e-05, + "loss": 0.011, + "step": 656550 + }, + { + "epoch": 1.7, + "learning_rate": 4.4715265915117645e-05, + "loss": 0.0078, + "step": 656560 + }, + { + "epoch": 1.7, + "learning_rate": 4.471137769874618e-05, + "loss": 0.011, + "step": 656570 + }, + { + "epoch": 1.7, + "learning_rate": 4.4707489482374715e-05, + "loss": 0.0091, + "step": 656580 + }, + { + "epoch": 1.7, + "learning_rate": 4.470360126600325e-05, + "loss": 0.0065, + "step": 656590 + }, + { + "epoch": 1.7, + "learning_rate": 4.4699713049631784e-05, + "loss": 0.0075, + "step": 656600 + }, + { + "epoch": 1.7, + "learning_rate": 4.469582483326032e-05, + "loss": 0.0106, + "step": 656610 + }, + { + "epoch": 1.7, + "learning_rate": 4.469193661688885e-05, + "loss": 0.006, + "step": 656620 + }, + { + "epoch": 1.7, + "learning_rate": 4.468804840051738e-05, + "loss": 0.0093, + "step": 656630 + }, + { + "epoch": 1.7, + "learning_rate": 4.468416018414592e-05, + "loss": 0.0091, + "step": 656640 + }, + { + "epoch": 1.7, + "learning_rate": 4.468027196777446e-05, + "loss": 0.0072, + "step": 656650 + }, + { + "epoch": 1.7, + "learning_rate": 4.4676383751402993e-05, + "loss": 0.0072, + "step": 656660 + }, + { + "epoch": 1.7, + "learning_rate": 4.467249553503153e-05, + "loss": 0.0095, + "step": 656670 + }, + { + "epoch": 1.7, + "learning_rate": 4.466860731866006e-05, + "loss": 0.0078, + "step": 656680 + }, + { + "epoch": 1.7, + "learning_rate": 4.46647191022886e-05, + "loss": 0.01, + "step": 656690 + }, + { + "epoch": 1.7, + "learning_rate": 4.466083088591713e-05, + "loss": 0.0089, + "step": 656700 + }, + { + "epoch": 1.7, + "learning_rate": 4.465694266954567e-05, + "loss": 0.0069, + "step": 656710 + }, + { + "epoch": 1.7, + "learning_rate": 4.46530544531742e-05, + "loss": 0.0092, + "step": 656720 + }, + { + "epoch": 1.7, + "learning_rate": 4.4649166236802744e-05, + "loss": 0.0063, + "step": 656730 + }, + { + "epoch": 1.7, + "learning_rate": 4.464527802043128e-05, + "loss": 0.0085, + "step": 656740 + }, + { + "epoch": 1.7, + "learning_rate": 4.4641389804059814e-05, + "loss": 0.0105, + "step": 656750 + }, + { + "epoch": 1.7, + "learning_rate": 4.463750158768835e-05, + "loss": 0.0085, + "step": 656760 + }, + { + "epoch": 1.7, + "learning_rate": 4.4633613371316884e-05, + "loss": 0.0069, + "step": 656770 + }, + { + "epoch": 1.7, + "learning_rate": 4.462972515494542e-05, + "loss": 0.0074, + "step": 656780 + }, + { + "epoch": 1.7, + "learning_rate": 4.4625836938573953e-05, + "loss": 0.007, + "step": 656790 + }, + { + "epoch": 1.7, + "learning_rate": 4.462194872220249e-05, + "loss": 0.0091, + "step": 656800 + }, + { + "epoch": 1.7, + "learning_rate": 4.461806050583103e-05, + "loss": 0.0091, + "step": 656810 + }, + { + "epoch": 1.7, + "learning_rate": 4.4614172289459565e-05, + "loss": 0.0097, + "step": 656820 + }, + { + "epoch": 1.7, + "learning_rate": 4.46102840730881e-05, + "loss": 0.0075, + "step": 656830 + }, + { + "epoch": 1.7, + "learning_rate": 4.4606395856716635e-05, + "loss": 0.0091, + "step": 656840 + }, + { + "epoch": 1.7, + "learning_rate": 4.460250764034517e-05, + "loss": 0.0073, + "step": 656850 + }, + { + "epoch": 1.7, + "learning_rate": 4.4598619423973704e-05, + "loss": 0.0072, + "step": 656860 + }, + { + "epoch": 1.7, + "learning_rate": 4.459473120760223e-05, + "loss": 0.0087, + "step": 656870 + }, + { + "epoch": 1.7, + "learning_rate": 4.459084299123077e-05, + "loss": 0.0072, + "step": 656880 + }, + { + "epoch": 1.7, + "learning_rate": 4.45869547748593e-05, + "loss": 0.0194, + "step": 656890 + }, + { + "epoch": 1.7, + "learning_rate": 4.458306655848784e-05, + "loss": 0.0083, + "step": 656900 + }, + { + "epoch": 1.7, + "learning_rate": 4.457917834211638e-05, + "loss": 0.0087, + "step": 656910 + }, + { + "epoch": 1.7, + "learning_rate": 4.4575290125744913e-05, + "loss": 0.0066, + "step": 656920 + }, + { + "epoch": 1.7, + "learning_rate": 4.457140190937345e-05, + "loss": 0.0118, + "step": 656930 + }, + { + "epoch": 1.7, + "learning_rate": 4.456751369300198e-05, + "loss": 0.0075, + "step": 656940 + }, + { + "epoch": 1.7, + "learning_rate": 4.456362547663052e-05, + "loss": 0.0077, + "step": 656950 + }, + { + "epoch": 1.7, + "learning_rate": 4.455973726025905e-05, + "loss": 0.0065, + "step": 656960 + }, + { + "epoch": 1.7, + "learning_rate": 4.455584904388759e-05, + "loss": 0.0065, + "step": 656970 + }, + { + "epoch": 1.7, + "learning_rate": 4.455196082751612e-05, + "loss": 0.0091, + "step": 656980 + }, + { + "epoch": 1.7, + "learning_rate": 4.4548072611144664e-05, + "loss": 0.0074, + "step": 656990 + }, + { + "epoch": 1.7, + "learning_rate": 4.45441843947732e-05, + "loss": 0.0077, + "step": 657000 + }, + { + "epoch": 1.7, + "eval_cer": 0.88167329394755, + "eval_loss": 0.005158776883035898, + "eval_runtime": 108.0407, + "eval_samples_per_second": 18.512, + "eval_steps_per_second": 4.628, + "step": 657000 + }, + { + "epoch": 1.7, + "learning_rate": 4.4540296178401734e-05, + "loss": 0.0071, + "step": 657010 + }, + { + "epoch": 1.7, + "learning_rate": 4.453640796203027e-05, + "loss": 0.009, + "step": 657020 + }, + { + "epoch": 1.7, + "learning_rate": 4.4532519745658804e-05, + "loss": 0.0086, + "step": 657030 + }, + { + "epoch": 1.7, + "learning_rate": 4.452863152928734e-05, + "loss": 0.0072, + "step": 657040 + }, + { + "epoch": 1.7, + "learning_rate": 4.452474331291587e-05, + "loss": 0.0076, + "step": 657050 + }, + { + "epoch": 1.7, + "learning_rate": 4.452085509654441e-05, + "loss": 0.0076, + "step": 657060 + }, + { + "epoch": 1.7, + "learning_rate": 4.451696688017295e-05, + "loss": 0.0077, + "step": 657070 + }, + { + "epoch": 1.7, + "learning_rate": 4.4513078663801485e-05, + "loss": 0.0086, + "step": 657080 + }, + { + "epoch": 1.7, + "learning_rate": 4.450919044743002e-05, + "loss": 0.0084, + "step": 657090 + }, + { + "epoch": 1.7, + "learning_rate": 4.4505302231058554e-05, + "loss": 0.0084, + "step": 657100 + }, + { + "epoch": 1.7, + "learning_rate": 4.450141401468709e-05, + "loss": 0.0069, + "step": 657110 + }, + { + "epoch": 1.7, + "learning_rate": 4.449752579831562e-05, + "loss": 0.0087, + "step": 657120 + }, + { + "epoch": 1.7, + "learning_rate": 4.449363758194415e-05, + "loss": 0.0064, + "step": 657130 + }, + { + "epoch": 1.7, + "learning_rate": 4.448974936557269e-05, + "loss": 0.0075, + "step": 657140 + }, + { + "epoch": 1.7, + "learning_rate": 4.448586114920122e-05, + "loss": 0.0068, + "step": 657150 + }, + { + "epoch": 1.7, + "learning_rate": 4.448197293282976e-05, + "loss": 0.005, + "step": 657160 + }, + { + "epoch": 1.7, + "learning_rate": 4.44780847164583e-05, + "loss": 0.0065, + "step": 657170 + }, + { + "epoch": 1.7, + "learning_rate": 4.447419650008683e-05, + "loss": 0.0055, + "step": 657180 + }, + { + "epoch": 1.7, + "learning_rate": 4.447030828371537e-05, + "loss": 0.0076, + "step": 657190 + }, + { + "epoch": 1.7, + "learning_rate": 4.44664200673439e-05, + "loss": 0.0071, + "step": 657200 + }, + { + "epoch": 1.7, + "learning_rate": 4.446253185097244e-05, + "loss": 0.0091, + "step": 657210 + }, + { + "epoch": 1.7, + "learning_rate": 4.445864363460097e-05, + "loss": 0.0081, + "step": 657220 + }, + { + "epoch": 1.7, + "learning_rate": 4.445475541822951e-05, + "loss": 0.0071, + "step": 657230 + }, + { + "epoch": 1.7, + "learning_rate": 4.445086720185804e-05, + "loss": 0.0075, + "step": 657240 + }, + { + "epoch": 1.7, + "learning_rate": 4.4446978985486584e-05, + "loss": 0.0071, + "step": 657250 + }, + { + "epoch": 1.7, + "learning_rate": 4.444309076911512e-05, + "loss": 0.0072, + "step": 657260 + }, + { + "epoch": 1.7, + "learning_rate": 4.4439202552743654e-05, + "loss": 0.0067, + "step": 657270 + }, + { + "epoch": 1.7, + "learning_rate": 4.443531433637219e-05, + "loss": 0.0091, + "step": 657280 + }, + { + "epoch": 1.7, + "learning_rate": 4.4431426120000724e-05, + "loss": 0.0049, + "step": 657290 + }, + { + "epoch": 1.7, + "learning_rate": 4.442753790362926e-05, + "loss": 0.0081, + "step": 657300 + }, + { + "epoch": 1.7, + "learning_rate": 4.442364968725779e-05, + "loss": 0.0089, + "step": 657310 + }, + { + "epoch": 1.7, + "learning_rate": 4.441976147088633e-05, + "loss": 0.0072, + "step": 657320 + }, + { + "epoch": 1.7, + "learning_rate": 4.441587325451487e-05, + "loss": 0.0074, + "step": 657330 + }, + { + "epoch": 1.7, + "learning_rate": 4.4411985038143405e-05, + "loss": 0.0117, + "step": 657340 + }, + { + "epoch": 1.7, + "learning_rate": 4.440809682177194e-05, + "loss": 0.0105, + "step": 657350 + }, + { + "epoch": 1.7, + "learning_rate": 4.440420860540047e-05, + "loss": 0.0095, + "step": 657360 + }, + { + "epoch": 1.7, + "learning_rate": 4.4400320389029e-05, + "loss": 0.0099, + "step": 657370 + }, + { + "epoch": 1.7, + "learning_rate": 4.439643217265754e-05, + "loss": 0.0086, + "step": 657380 + }, + { + "epoch": 1.7, + "learning_rate": 4.439254395628607e-05, + "loss": 0.0096, + "step": 657390 + }, + { + "epoch": 1.7, + "learning_rate": 4.438865573991461e-05, + "loss": 0.0093, + "step": 657400 + }, + { + "epoch": 1.7, + "learning_rate": 4.438476752354314e-05, + "loss": 0.0109, + "step": 657410 + }, + { + "epoch": 1.7, + "learning_rate": 4.438087930717168e-05, + "loss": 0.0068, + "step": 657420 + }, + { + "epoch": 1.7, + "learning_rate": 4.437699109080022e-05, + "loss": 0.0092, + "step": 657430 + }, + { + "epoch": 1.7, + "learning_rate": 4.437310287442875e-05, + "loss": 0.007, + "step": 657440 + }, + { + "epoch": 1.7, + "learning_rate": 4.436921465805729e-05, + "loss": 0.0087, + "step": 657450 + }, + { + "epoch": 1.7, + "learning_rate": 4.436532644168582e-05, + "loss": 0.0088, + "step": 657460 + }, + { + "epoch": 1.7, + "learning_rate": 4.436143822531436e-05, + "loss": 0.0093, + "step": 657470 + }, + { + "epoch": 1.7, + "learning_rate": 4.435755000894289e-05, + "loss": 0.0061, + "step": 657480 + }, + { + "epoch": 1.7, + "learning_rate": 4.435366179257143e-05, + "loss": 0.0064, + "step": 657490 + }, + { + "epoch": 1.7, + "learning_rate": 4.434977357619996e-05, + "loss": 0.0065, + "step": 657500 + }, + { + "epoch": 1.7, + "learning_rate": 4.4345885359828504e-05, + "loss": 0.0087, + "step": 657510 + }, + { + "epoch": 1.7, + "learning_rate": 4.434199714345704e-05, + "loss": 0.0079, + "step": 657520 + }, + { + "epoch": 1.7, + "learning_rate": 4.4338108927085574e-05, + "loss": 0.0066, + "step": 657530 + }, + { + "epoch": 1.7, + "learning_rate": 4.433422071071411e-05, + "loss": 0.0064, + "step": 657540 + }, + { + "epoch": 1.7, + "learning_rate": 4.4330332494342644e-05, + "loss": 0.0076, + "step": 657550 + }, + { + "epoch": 1.7, + "learning_rate": 4.432644427797118e-05, + "loss": 0.0079, + "step": 657560 + }, + { + "epoch": 1.7, + "learning_rate": 4.432255606159971e-05, + "loss": 0.0079, + "step": 657570 + }, + { + "epoch": 1.7, + "learning_rate": 4.431866784522825e-05, + "loss": 0.0094, + "step": 657580 + }, + { + "epoch": 1.7, + "learning_rate": 4.431477962885678e-05, + "loss": 0.0097, + "step": 657590 + }, + { + "epoch": 1.7, + "learning_rate": 4.4310891412485325e-05, + "loss": 0.0083, + "step": 657600 + }, + { + "epoch": 1.7, + "learning_rate": 4.430700319611385e-05, + "loss": 0.0064, + "step": 657610 + }, + { + "epoch": 1.7, + "learning_rate": 4.430311497974239e-05, + "loss": 0.0055, + "step": 657620 + }, + { + "epoch": 1.7, + "learning_rate": 4.429922676337092e-05, + "loss": 0.0077, + "step": 657630 + }, + { + "epoch": 1.7, + "learning_rate": 4.429533854699946e-05, + "loss": 0.01, + "step": 657640 + }, + { + "epoch": 1.7, + "learning_rate": 4.429145033062799e-05, + "loss": 0.0083, + "step": 657650 + }, + { + "epoch": 1.7, + "learning_rate": 4.428756211425653e-05, + "loss": 0.0127, + "step": 657660 + }, + { + "epoch": 1.7, + "learning_rate": 4.428367389788506e-05, + "loss": 0.0044, + "step": 657670 + }, + { + "epoch": 1.7, + "learning_rate": 4.42797856815136e-05, + "loss": 0.0121, + "step": 657680 + }, + { + "epoch": 1.7, + "learning_rate": 4.427589746514213e-05, + "loss": 0.0115, + "step": 657690 + }, + { + "epoch": 1.7, + "learning_rate": 4.427200924877067e-05, + "loss": 0.0074, + "step": 657700 + }, + { + "epoch": 1.7, + "learning_rate": 4.426812103239921e-05, + "loss": 0.0078, + "step": 657710 + }, + { + "epoch": 1.7, + "learning_rate": 4.426423281602774e-05, + "loss": 0.008, + "step": 657720 + }, + { + "epoch": 1.7, + "learning_rate": 4.426034459965628e-05, + "loss": 0.0081, + "step": 657730 + }, + { + "epoch": 1.7, + "learning_rate": 4.425645638328481e-05, + "loss": 0.0083, + "step": 657740 + }, + { + "epoch": 1.7, + "learning_rate": 4.425256816691335e-05, + "loss": 0.0075, + "step": 657750 + }, + { + "epoch": 1.71, + "learning_rate": 4.424867995054188e-05, + "loss": 0.0087, + "step": 657760 + }, + { + "epoch": 1.71, + "learning_rate": 4.424479173417042e-05, + "loss": 0.0071, + "step": 657770 + }, + { + "epoch": 1.71, + "learning_rate": 4.424090351779896e-05, + "loss": 0.0076, + "step": 657780 + }, + { + "epoch": 1.71, + "learning_rate": 4.4237015301427494e-05, + "loss": 0.0051, + "step": 657790 + }, + { + "epoch": 1.71, + "learning_rate": 4.423312708505603e-05, + "loss": 0.0073, + "step": 657800 + }, + { + "epoch": 1.71, + "learning_rate": 4.4229238868684564e-05, + "loss": 0.0078, + "step": 657810 + }, + { + "epoch": 1.71, + "learning_rate": 4.42253506523131e-05, + "loss": 0.01, + "step": 657820 + }, + { + "epoch": 1.71, + "learning_rate": 4.422146243594163e-05, + "loss": 0.0079, + "step": 657830 + }, + { + "epoch": 1.71, + "learning_rate": 4.421757421957017e-05, + "loss": 0.0078, + "step": 657840 + }, + { + "epoch": 1.71, + "learning_rate": 4.42136860031987e-05, + "loss": 0.0078, + "step": 657850 + }, + { + "epoch": 1.71, + "learning_rate": 4.420979778682723e-05, + "loss": 0.0075, + "step": 657860 + }, + { + "epoch": 1.71, + "learning_rate": 4.4205909570455766e-05, + "loss": 0.0052, + "step": 657870 + }, + { + "epoch": 1.71, + "learning_rate": 4.420202135408431e-05, + "loss": 0.009, + "step": 657880 + }, + { + "epoch": 1.71, + "learning_rate": 4.419813313771284e-05, + "loss": 0.0052, + "step": 657890 + }, + { + "epoch": 1.71, + "learning_rate": 4.419424492134138e-05, + "loss": 0.0072, + "step": 657900 + }, + { + "epoch": 1.71, + "learning_rate": 4.419035670496991e-05, + "loss": 0.0088, + "step": 657910 + }, + { + "epoch": 1.71, + "learning_rate": 4.418646848859845e-05, + "loss": 0.007, + "step": 657920 + }, + { + "epoch": 1.71, + "learning_rate": 4.418258027222698e-05, + "loss": 0.0118, + "step": 657930 + }, + { + "epoch": 1.71, + "learning_rate": 4.417869205585552e-05, + "loss": 0.0083, + "step": 657940 + }, + { + "epoch": 1.71, + "learning_rate": 4.417480383948405e-05, + "loss": 0.0106, + "step": 657950 + }, + { + "epoch": 1.71, + "learning_rate": 4.417091562311259e-05, + "loss": 0.0069, + "step": 657960 + }, + { + "epoch": 1.71, + "learning_rate": 4.416702740674113e-05, + "loss": 0.0052, + "step": 657970 + }, + { + "epoch": 1.71, + "learning_rate": 4.416313919036966e-05, + "loss": 0.0084, + "step": 657980 + }, + { + "epoch": 1.71, + "learning_rate": 4.41592509739982e-05, + "loss": 0.0079, + "step": 657990 + }, + { + "epoch": 1.71, + "learning_rate": 4.415536275762673e-05, + "loss": 0.0094, + "step": 658000 + }, + { + "epoch": 1.71, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.005186532158404589, + "eval_runtime": 107.9432, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 658000 + }, + { + "epoch": 1.71, + "learning_rate": 4.415147454125527e-05, + "loss": 0.008, + "step": 658010 + }, + { + "epoch": 1.71, + "learning_rate": 4.41475863248838e-05, + "loss": 0.0104, + "step": 658020 + }, + { + "epoch": 1.71, + "learning_rate": 4.414369810851234e-05, + "loss": 0.0098, + "step": 658030 + }, + { + "epoch": 1.71, + "learning_rate": 4.413980989214088e-05, + "loss": 0.0079, + "step": 658040 + }, + { + "epoch": 1.71, + "learning_rate": 4.4135921675769414e-05, + "loss": 0.0062, + "step": 658050 + }, + { + "epoch": 1.71, + "learning_rate": 4.413203345939795e-05, + "loss": 0.0086, + "step": 658060 + }, + { + "epoch": 1.71, + "learning_rate": 4.4128145243026483e-05, + "loss": 0.0085, + "step": 658070 + }, + { + "epoch": 1.71, + "learning_rate": 4.412425702665502e-05, + "loss": 0.0074, + "step": 658080 + }, + { + "epoch": 1.71, + "learning_rate": 4.412036881028355e-05, + "loss": 0.0091, + "step": 658090 + }, + { + "epoch": 1.71, + "learning_rate": 4.411648059391209e-05, + "loss": 0.0085, + "step": 658100 + }, + { + "epoch": 1.71, + "learning_rate": 4.4112592377540616e-05, + "loss": 0.0089, + "step": 658110 + }, + { + "epoch": 1.71, + "learning_rate": 4.410870416116915e-05, + "loss": 0.0066, + "step": 658120 + }, + { + "epoch": 1.71, + "learning_rate": 4.4104815944797686e-05, + "loss": 0.0118, + "step": 658130 + }, + { + "epoch": 1.71, + "learning_rate": 4.410092772842623e-05, + "loss": 0.0075, + "step": 658140 + }, + { + "epoch": 1.71, + "learning_rate": 4.409703951205476e-05, + "loss": 0.0087, + "step": 658150 + }, + { + "epoch": 1.71, + "learning_rate": 4.40931512956833e-05, + "loss": 0.0066, + "step": 658160 + }, + { + "epoch": 1.71, + "learning_rate": 4.408926307931183e-05, + "loss": 0.0065, + "step": 658170 + }, + { + "epoch": 1.71, + "learning_rate": 4.408537486294037e-05, + "loss": 0.0097, + "step": 658180 + }, + { + "epoch": 1.71, + "learning_rate": 4.40814866465689e-05, + "loss": 0.0082, + "step": 658190 + }, + { + "epoch": 1.71, + "learning_rate": 4.407759843019744e-05, + "loss": 0.0081, + "step": 658200 + }, + { + "epoch": 1.71, + "learning_rate": 4.407371021382597e-05, + "loss": 0.0067, + "step": 658210 + }, + { + "epoch": 1.71, + "learning_rate": 4.406982199745451e-05, + "loss": 0.0059, + "step": 658220 + }, + { + "epoch": 1.71, + "learning_rate": 4.406593378108305e-05, + "loss": 0.0065, + "step": 658230 + }, + { + "epoch": 1.71, + "learning_rate": 4.406204556471158e-05, + "loss": 0.0103, + "step": 658240 + }, + { + "epoch": 1.71, + "learning_rate": 4.405815734834012e-05, + "loss": 0.0078, + "step": 658250 + }, + { + "epoch": 1.71, + "learning_rate": 4.405426913196865e-05, + "loss": 0.0082, + "step": 658260 + }, + { + "epoch": 1.71, + "learning_rate": 4.405038091559719e-05, + "loss": 0.0068, + "step": 658270 + }, + { + "epoch": 1.71, + "learning_rate": 4.404649269922572e-05, + "loss": 0.0086, + "step": 658280 + }, + { + "epoch": 1.71, + "learning_rate": 4.404260448285426e-05, + "loss": 0.0072, + "step": 658290 + }, + { + "epoch": 1.71, + "learning_rate": 4.40387162664828e-05, + "loss": 0.01, + "step": 658300 + }, + { + "epoch": 1.71, + "learning_rate": 4.4034828050111334e-05, + "loss": 0.01, + "step": 658310 + }, + { + "epoch": 1.71, + "learning_rate": 4.403093983373987e-05, + "loss": 0.0062, + "step": 658320 + }, + { + "epoch": 1.71, + "learning_rate": 4.4027051617368403e-05, + "loss": 0.0063, + "step": 658330 + }, + { + "epoch": 1.71, + "learning_rate": 4.402316340099694e-05, + "loss": 0.0064, + "step": 658340 + }, + { + "epoch": 1.71, + "learning_rate": 4.401927518462547e-05, + "loss": 0.0093, + "step": 658350 + }, + { + "epoch": 1.71, + "learning_rate": 4.4015386968254e-05, + "loss": 0.0116, + "step": 658360 + }, + { + "epoch": 1.71, + "learning_rate": 4.4011498751882536e-05, + "loss": 0.0067, + "step": 658370 + }, + { + "epoch": 1.71, + "learning_rate": 4.400761053551107e-05, + "loss": 0.0086, + "step": 658380 + }, + { + "epoch": 1.71, + "learning_rate": 4.4003722319139606e-05, + "loss": 0.0084, + "step": 658390 + }, + { + "epoch": 1.71, + "learning_rate": 4.399983410276815e-05, + "loss": 0.0075, + "step": 658400 + }, + { + "epoch": 1.71, + "learning_rate": 4.399594588639668e-05, + "loss": 0.0108, + "step": 658410 + }, + { + "epoch": 1.71, + "learning_rate": 4.399205767002522e-05, + "loss": 0.0089, + "step": 658420 + }, + { + "epoch": 1.71, + "learning_rate": 4.398816945365375e-05, + "loss": 0.0088, + "step": 658430 + }, + { + "epoch": 1.71, + "learning_rate": 4.398428123728229e-05, + "loss": 0.0087, + "step": 658440 + }, + { + "epoch": 1.71, + "learning_rate": 4.398039302091082e-05, + "loss": 0.0075, + "step": 658450 + }, + { + "epoch": 1.71, + "learning_rate": 4.3976504804539357e-05, + "loss": 0.0105, + "step": 658460 + }, + { + "epoch": 1.71, + "learning_rate": 4.397261658816789e-05, + "loss": 0.0085, + "step": 658470 + }, + { + "epoch": 1.71, + "learning_rate": 4.396872837179643e-05, + "loss": 0.0058, + "step": 658480 + }, + { + "epoch": 1.71, + "learning_rate": 4.396484015542497e-05, + "loss": 0.0088, + "step": 658490 + }, + { + "epoch": 1.71, + "learning_rate": 4.39609519390535e-05, + "loss": 0.0089, + "step": 658500 + }, + { + "epoch": 1.71, + "learning_rate": 4.395706372268204e-05, + "loss": 0.0093, + "step": 658510 + }, + { + "epoch": 1.71, + "learning_rate": 4.395317550631057e-05, + "loss": 0.007, + "step": 658520 + }, + { + "epoch": 1.71, + "learning_rate": 4.394928728993911e-05, + "loss": 0.0086, + "step": 658530 + }, + { + "epoch": 1.71, + "learning_rate": 4.394539907356764e-05, + "loss": 0.0076, + "step": 658540 + }, + { + "epoch": 1.71, + "learning_rate": 4.394151085719618e-05, + "loss": 0.0097, + "step": 658550 + }, + { + "epoch": 1.71, + "learning_rate": 4.393762264082472e-05, + "loss": 0.0084, + "step": 658560 + }, + { + "epoch": 1.71, + "learning_rate": 4.3933734424453254e-05, + "loss": 0.0083, + "step": 658570 + }, + { + "epoch": 1.71, + "learning_rate": 4.392984620808179e-05, + "loss": 0.0089, + "step": 658580 + }, + { + "epoch": 1.71, + "learning_rate": 4.392595799171032e-05, + "loss": 0.0079, + "step": 658590 + }, + { + "epoch": 1.71, + "learning_rate": 4.392206977533885e-05, + "loss": 0.009, + "step": 658600 + }, + { + "epoch": 1.71, + "learning_rate": 4.3918181558967386e-05, + "loss": 0.0093, + "step": 658610 + }, + { + "epoch": 1.71, + "learning_rate": 4.391429334259592e-05, + "loss": 0.0055, + "step": 658620 + }, + { + "epoch": 1.71, + "learning_rate": 4.3910405126224456e-05, + "loss": 0.0071, + "step": 658630 + }, + { + "epoch": 1.71, + "learning_rate": 4.390651690985299e-05, + "loss": 0.008, + "step": 658640 + }, + { + "epoch": 1.71, + "learning_rate": 4.3902628693481526e-05, + "loss": 0.0067, + "step": 658650 + }, + { + "epoch": 1.71, + "learning_rate": 4.389874047711007e-05, + "loss": 0.0071, + "step": 658660 + }, + { + "epoch": 1.71, + "learning_rate": 4.38948522607386e-05, + "loss": 0.0084, + "step": 658670 + }, + { + "epoch": 1.71, + "learning_rate": 4.389096404436714e-05, + "loss": 0.009, + "step": 658680 + }, + { + "epoch": 1.71, + "learning_rate": 4.388707582799567e-05, + "loss": 0.0098, + "step": 658690 + }, + { + "epoch": 1.71, + "learning_rate": 4.388318761162421e-05, + "loss": 0.0104, + "step": 658700 + }, + { + "epoch": 1.71, + "learning_rate": 4.387929939525274e-05, + "loss": 0.0071, + "step": 658710 + }, + { + "epoch": 1.71, + "learning_rate": 4.3875411178881277e-05, + "loss": 0.0084, + "step": 658720 + }, + { + "epoch": 1.71, + "learning_rate": 4.387152296250981e-05, + "loss": 0.0095, + "step": 658730 + }, + { + "epoch": 1.71, + "learning_rate": 4.386763474613835e-05, + "loss": 0.0073, + "step": 658740 + }, + { + "epoch": 1.71, + "learning_rate": 4.386374652976689e-05, + "loss": 0.0096, + "step": 658750 + }, + { + "epoch": 1.71, + "learning_rate": 4.385985831339542e-05, + "loss": 0.0076, + "step": 658760 + }, + { + "epoch": 1.71, + "learning_rate": 4.385597009702396e-05, + "loss": 0.0161, + "step": 658770 + }, + { + "epoch": 1.71, + "learning_rate": 4.385208188065249e-05, + "loss": 0.0053, + "step": 658780 + }, + { + "epoch": 1.71, + "learning_rate": 4.384819366428103e-05, + "loss": 0.0045, + "step": 658790 + }, + { + "epoch": 1.71, + "learning_rate": 4.384430544790956e-05, + "loss": 0.0085, + "step": 658800 + }, + { + "epoch": 1.71, + "learning_rate": 4.38404172315381e-05, + "loss": 0.0075, + "step": 658810 + }, + { + "epoch": 1.71, + "learning_rate": 4.383652901516664e-05, + "loss": 0.0061, + "step": 658820 + }, + { + "epoch": 1.71, + "learning_rate": 4.3832640798795174e-05, + "loss": 0.0075, + "step": 658830 + }, + { + "epoch": 1.71, + "learning_rate": 4.382875258242371e-05, + "loss": 0.0071, + "step": 658840 + }, + { + "epoch": 1.71, + "learning_rate": 4.3824864366052237e-05, + "loss": 0.0085, + "step": 658850 + }, + { + "epoch": 1.71, + "learning_rate": 4.382097614968077e-05, + "loss": 0.0079, + "step": 658860 + }, + { + "epoch": 1.71, + "learning_rate": 4.3817087933309306e-05, + "loss": 0.0124, + "step": 658870 + }, + { + "epoch": 1.71, + "learning_rate": 4.381319971693784e-05, + "loss": 0.0067, + "step": 658880 + }, + { + "epoch": 1.71, + "learning_rate": 4.3809311500566376e-05, + "loss": 0.0085, + "step": 658890 + }, + { + "epoch": 1.71, + "learning_rate": 4.380542328419491e-05, + "loss": 0.0088, + "step": 658900 + }, + { + "epoch": 1.71, + "learning_rate": 4.3801535067823446e-05, + "loss": 0.0088, + "step": 658910 + }, + { + "epoch": 1.71, + "learning_rate": 4.379764685145199e-05, + "loss": 0.0067, + "step": 658920 + }, + { + "epoch": 1.71, + "learning_rate": 4.379375863508052e-05, + "loss": 0.0096, + "step": 658930 + }, + { + "epoch": 1.71, + "learning_rate": 4.378987041870906e-05, + "loss": 0.0081, + "step": 658940 + }, + { + "epoch": 1.71, + "learning_rate": 4.378598220233759e-05, + "loss": 0.0097, + "step": 658950 + }, + { + "epoch": 1.71, + "learning_rate": 4.378209398596613e-05, + "loss": 0.0077, + "step": 658960 + }, + { + "epoch": 1.71, + "learning_rate": 4.377820576959466e-05, + "loss": 0.0076, + "step": 658970 + }, + { + "epoch": 1.71, + "learning_rate": 4.3774317553223197e-05, + "loss": 0.0086, + "step": 658980 + }, + { + "epoch": 1.71, + "learning_rate": 4.377042933685173e-05, + "loss": 0.0084, + "step": 658990 + }, + { + "epoch": 1.71, + "learning_rate": 4.3766541120480266e-05, + "loss": 0.0061, + "step": 659000 + }, + { + "epoch": 1.71, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.005243065766990185, + "eval_runtime": 107.9368, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 659000 + }, + { + "epoch": 1.71, + "learning_rate": 4.376265290410881e-05, + "loss": 0.0086, + "step": 659010 + }, + { + "epoch": 1.71, + "learning_rate": 4.375876468773734e-05, + "loss": 0.0087, + "step": 659020 + }, + { + "epoch": 1.71, + "learning_rate": 4.375487647136588e-05, + "loss": 0.0077, + "step": 659030 + }, + { + "epoch": 1.71, + "learning_rate": 4.375098825499441e-05, + "loss": 0.0067, + "step": 659040 + }, + { + "epoch": 1.71, + "learning_rate": 4.374710003862295e-05, + "loss": 0.0092, + "step": 659050 + }, + { + "epoch": 1.71, + "learning_rate": 4.374321182225148e-05, + "loss": 0.0118, + "step": 659060 + }, + { + "epoch": 1.71, + "learning_rate": 4.373932360588002e-05, + "loss": 0.0092, + "step": 659070 + }, + { + "epoch": 1.71, + "learning_rate": 4.373543538950855e-05, + "loss": 0.0084, + "step": 659080 + }, + { + "epoch": 1.71, + "learning_rate": 4.3731547173137094e-05, + "loss": 0.006, + "step": 659090 + }, + { + "epoch": 1.71, + "learning_rate": 4.372765895676562e-05, + "loss": 0.0103, + "step": 659100 + }, + { + "epoch": 1.71, + "learning_rate": 4.3723770740394156e-05, + "loss": 0.0094, + "step": 659110 + }, + { + "epoch": 1.71, + "learning_rate": 4.371988252402269e-05, + "loss": 0.0075, + "step": 659120 + }, + { + "epoch": 1.71, + "learning_rate": 4.3715994307651226e-05, + "loss": 0.0087, + "step": 659130 + }, + { + "epoch": 1.71, + "learning_rate": 4.371210609127976e-05, + "loss": 0.0069, + "step": 659140 + }, + { + "epoch": 1.71, + "learning_rate": 4.3708217874908296e-05, + "loss": 0.0079, + "step": 659150 + }, + { + "epoch": 1.71, + "learning_rate": 4.370432965853683e-05, + "loss": 0.0077, + "step": 659160 + }, + { + "epoch": 1.71, + "learning_rate": 4.3700441442165366e-05, + "loss": 0.0073, + "step": 659170 + }, + { + "epoch": 1.71, + "learning_rate": 4.36965532257939e-05, + "loss": 0.0071, + "step": 659180 + }, + { + "epoch": 1.71, + "learning_rate": 4.369266500942244e-05, + "loss": 0.0088, + "step": 659190 + }, + { + "epoch": 1.71, + "learning_rate": 4.368877679305098e-05, + "loss": 0.0073, + "step": 659200 + }, + { + "epoch": 1.71, + "learning_rate": 4.368488857667951e-05, + "loss": 0.0076, + "step": 659210 + }, + { + "epoch": 1.71, + "learning_rate": 4.368100036030805e-05, + "loss": 0.0075, + "step": 659220 + }, + { + "epoch": 1.71, + "learning_rate": 4.367711214393658e-05, + "loss": 0.0052, + "step": 659230 + }, + { + "epoch": 1.71, + "learning_rate": 4.3673223927565116e-05, + "loss": 0.007, + "step": 659240 + }, + { + "epoch": 1.71, + "learning_rate": 4.366933571119365e-05, + "loss": 0.0071, + "step": 659250 + }, + { + "epoch": 1.71, + "learning_rate": 4.3665447494822186e-05, + "loss": 0.01, + "step": 659260 + }, + { + "epoch": 1.71, + "learning_rate": 4.366155927845073e-05, + "loss": 0.0105, + "step": 659270 + }, + { + "epoch": 1.71, + "learning_rate": 4.365767106207926e-05, + "loss": 0.0097, + "step": 659280 + }, + { + "epoch": 1.71, + "learning_rate": 4.36537828457078e-05, + "loss": 0.0069, + "step": 659290 + }, + { + "epoch": 1.71, + "learning_rate": 4.364989462933633e-05, + "loss": 0.0101, + "step": 659300 + }, + { + "epoch": 1.71, + "learning_rate": 4.364600641296487e-05, + "loss": 0.0072, + "step": 659310 + }, + { + "epoch": 1.71, + "learning_rate": 4.36421181965934e-05, + "loss": 0.0081, + "step": 659320 + }, + { + "epoch": 1.71, + "learning_rate": 4.363822998022194e-05, + "loss": 0.0092, + "step": 659330 + }, + { + "epoch": 1.71, + "learning_rate": 4.363434176385047e-05, + "loss": 0.0073, + "step": 659340 + }, + { + "epoch": 1.71, + "learning_rate": 4.3630453547479e-05, + "loss": 0.0106, + "step": 659350 + }, + { + "epoch": 1.71, + "learning_rate": 4.3626565331107535e-05, + "loss": 0.01, + "step": 659360 + }, + { + "epoch": 1.71, + "learning_rate": 4.3622677114736076e-05, + "loss": 0.009, + "step": 659370 + }, + { + "epoch": 1.71, + "learning_rate": 4.361878889836461e-05, + "loss": 0.0073, + "step": 659380 + }, + { + "epoch": 1.71, + "learning_rate": 4.3614900681993146e-05, + "loss": 0.0062, + "step": 659390 + }, + { + "epoch": 1.71, + "learning_rate": 4.361101246562168e-05, + "loss": 0.006, + "step": 659400 + }, + { + "epoch": 1.71, + "learning_rate": 4.3607124249250216e-05, + "loss": 0.0108, + "step": 659410 + }, + { + "epoch": 1.71, + "learning_rate": 4.360323603287875e-05, + "loss": 0.0106, + "step": 659420 + }, + { + "epoch": 1.71, + "learning_rate": 4.3599347816507286e-05, + "loss": 0.0079, + "step": 659430 + }, + { + "epoch": 1.71, + "learning_rate": 4.359545960013582e-05, + "loss": 0.0084, + "step": 659440 + }, + { + "epoch": 1.71, + "learning_rate": 4.359157138376436e-05, + "loss": 0.007, + "step": 659450 + }, + { + "epoch": 1.71, + "learning_rate": 4.35876831673929e-05, + "loss": 0.0111, + "step": 659460 + }, + { + "epoch": 1.71, + "learning_rate": 4.358379495102143e-05, + "loss": 0.0093, + "step": 659470 + }, + { + "epoch": 1.71, + "learning_rate": 4.357990673464997e-05, + "loss": 0.0067, + "step": 659480 + }, + { + "epoch": 1.71, + "learning_rate": 4.35760185182785e-05, + "loss": 0.0056, + "step": 659490 + }, + { + "epoch": 1.71, + "learning_rate": 4.3572130301907036e-05, + "loss": 0.0118, + "step": 659500 + }, + { + "epoch": 1.71, + "learning_rate": 4.356824208553557e-05, + "loss": 0.007, + "step": 659510 + }, + { + "epoch": 1.71, + "learning_rate": 4.3564353869164106e-05, + "loss": 0.0071, + "step": 659520 + }, + { + "epoch": 1.71, + "learning_rate": 4.356046565279265e-05, + "loss": 0.0078, + "step": 659530 + }, + { + "epoch": 1.71, + "learning_rate": 4.355657743642118e-05, + "loss": 0.0085, + "step": 659540 + }, + { + "epoch": 1.71, + "learning_rate": 4.355268922004972e-05, + "loss": 0.0059, + "step": 659550 + }, + { + "epoch": 1.71, + "learning_rate": 4.354880100367825e-05, + "loss": 0.007, + "step": 659560 + }, + { + "epoch": 1.71, + "learning_rate": 4.354491278730679e-05, + "loss": 0.0092, + "step": 659570 + }, + { + "epoch": 1.71, + "learning_rate": 4.354102457093532e-05, + "loss": 0.0065, + "step": 659580 + }, + { + "epoch": 1.71, + "learning_rate": 4.353713635456386e-05, + "loss": 0.0062, + "step": 659590 + }, + { + "epoch": 1.71, + "learning_rate": 4.3533248138192385e-05, + "loss": 0.0078, + "step": 659600 + }, + { + "epoch": 1.71, + "learning_rate": 4.352935992182092e-05, + "loss": 0.0084, + "step": 659610 + }, + { + "epoch": 1.71, + "learning_rate": 4.3525471705449455e-05, + "loss": 0.0063, + "step": 659620 + }, + { + "epoch": 1.71, + "learning_rate": 4.3521583489077996e-05, + "loss": 0.0066, + "step": 659630 + }, + { + "epoch": 1.71, + "learning_rate": 4.351769527270653e-05, + "loss": 0.0079, + "step": 659640 + }, + { + "epoch": 1.71, + "learning_rate": 4.3513807056335066e-05, + "loss": 0.0072, + "step": 659650 + }, + { + "epoch": 1.71, + "learning_rate": 4.35099188399636e-05, + "loss": 0.0094, + "step": 659660 + }, + { + "epoch": 1.71, + "learning_rate": 4.3506030623592136e-05, + "loss": 0.0099, + "step": 659670 + }, + { + "epoch": 1.71, + "learning_rate": 4.350214240722067e-05, + "loss": 0.0067, + "step": 659680 + }, + { + "epoch": 1.71, + "learning_rate": 4.3498254190849206e-05, + "loss": 0.0061, + "step": 659690 + }, + { + "epoch": 1.71, + "learning_rate": 4.349436597447774e-05, + "loss": 0.0077, + "step": 659700 + }, + { + "epoch": 1.71, + "learning_rate": 4.349047775810628e-05, + "loss": 0.0064, + "step": 659710 + }, + { + "epoch": 1.71, + "learning_rate": 4.348658954173482e-05, + "loss": 0.0092, + "step": 659720 + }, + { + "epoch": 1.71, + "learning_rate": 4.348270132536335e-05, + "loss": 0.0106, + "step": 659730 + }, + { + "epoch": 1.71, + "learning_rate": 4.347881310899189e-05, + "loss": 0.0062, + "step": 659740 + }, + { + "epoch": 1.71, + "learning_rate": 4.347492489262042e-05, + "loss": 0.0062, + "step": 659750 + }, + { + "epoch": 1.71, + "learning_rate": 4.3471036676248956e-05, + "loss": 0.0106, + "step": 659760 + }, + { + "epoch": 1.71, + "learning_rate": 4.346714845987749e-05, + "loss": 0.0101, + "step": 659770 + }, + { + "epoch": 1.71, + "learning_rate": 4.3463260243506026e-05, + "loss": 0.0134, + "step": 659780 + }, + { + "epoch": 1.71, + "learning_rate": 4.345937202713457e-05, + "loss": 0.0098, + "step": 659790 + }, + { + "epoch": 1.71, + "learning_rate": 4.34554838107631e-05, + "loss": 0.0066, + "step": 659800 + }, + { + "epoch": 1.71, + "learning_rate": 4.345159559439164e-05, + "loss": 0.0066, + "step": 659810 + }, + { + "epoch": 1.71, + "learning_rate": 4.344770737802017e-05, + "loss": 0.0081, + "step": 659820 + }, + { + "epoch": 1.71, + "learning_rate": 4.344381916164871e-05, + "loss": 0.0122, + "step": 659830 + }, + { + "epoch": 1.71, + "learning_rate": 4.3439930945277235e-05, + "loss": 0.0075, + "step": 659840 + }, + { + "epoch": 1.71, + "learning_rate": 4.343604272890577e-05, + "loss": 0.0104, + "step": 659850 + }, + { + "epoch": 1.71, + "learning_rate": 4.3432154512534305e-05, + "loss": 0.0087, + "step": 659860 + }, + { + "epoch": 1.71, + "learning_rate": 4.342826629616284e-05, + "loss": 0.0069, + "step": 659870 + }, + { + "epoch": 1.71, + "learning_rate": 4.3424378079791375e-05, + "loss": 0.0073, + "step": 659880 + }, + { + "epoch": 1.71, + "learning_rate": 4.3420489863419916e-05, + "loss": 0.0097, + "step": 659890 + }, + { + "epoch": 1.71, + "learning_rate": 4.341660164704845e-05, + "loss": 0.0087, + "step": 659900 + }, + { + "epoch": 1.71, + "learning_rate": 4.3412713430676986e-05, + "loss": 0.0085, + "step": 659910 + }, + { + "epoch": 1.71, + "learning_rate": 4.340882521430552e-05, + "loss": 0.0067, + "step": 659920 + }, + { + "epoch": 1.71, + "learning_rate": 4.3404936997934056e-05, + "loss": 0.0059, + "step": 659930 + }, + { + "epoch": 1.71, + "learning_rate": 4.340104878156259e-05, + "loss": 0.0091, + "step": 659940 + }, + { + "epoch": 1.71, + "learning_rate": 4.3397160565191126e-05, + "loss": 0.0076, + "step": 659950 + }, + { + "epoch": 1.71, + "learning_rate": 4.339327234881966e-05, + "loss": 0.0087, + "step": 659960 + }, + { + "epoch": 1.71, + "learning_rate": 4.33893841324482e-05, + "loss": 0.0078, + "step": 659970 + }, + { + "epoch": 1.71, + "learning_rate": 4.338549591607674e-05, + "loss": 0.0074, + "step": 659980 + }, + { + "epoch": 1.71, + "learning_rate": 4.338160769970527e-05, + "loss": 0.0069, + "step": 659990 + }, + { + "epoch": 1.71, + "learning_rate": 4.3377719483333807e-05, + "loss": 0.0097, + "step": 660000 + }, + { + "epoch": 1.71, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.0051537686958909035, + "eval_runtime": 107.9648, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, + "step": 660000 + }, + { + "epoch": 1.71, + "learning_rate": 4.337383126696234e-05, + "loss": 0.0066, + "step": 660010 + }, + { + "epoch": 1.71, + "learning_rate": 4.3369943050590876e-05, + "loss": 0.0065, + "step": 660020 + }, + { + "epoch": 1.71, + "learning_rate": 4.336605483421941e-05, + "loss": 0.0064, + "step": 660030 + }, + { + "epoch": 1.71, + "learning_rate": 4.3362166617847946e-05, + "loss": 0.0087, + "step": 660040 + }, + { + "epoch": 1.71, + "learning_rate": 4.335827840147649e-05, + "loss": 0.007, + "step": 660050 + }, + { + "epoch": 1.71, + "learning_rate": 4.335439018510502e-05, + "loss": 0.0065, + "step": 660060 + }, + { + "epoch": 1.71, + "learning_rate": 4.335050196873356e-05, + "loss": 0.0113, + "step": 660070 + }, + { + "epoch": 1.71, + "learning_rate": 4.334661375236209e-05, + "loss": 0.0077, + "step": 660080 + }, + { + "epoch": 1.71, + "learning_rate": 4.334272553599062e-05, + "loss": 0.0071, + "step": 660090 + }, + { + "epoch": 1.71, + "learning_rate": 4.3338837319619155e-05, + "loss": 0.0101, + "step": 660100 + }, + { + "epoch": 1.71, + "learning_rate": 4.333494910324769e-05, + "loss": 0.0076, + "step": 660110 + }, + { + "epoch": 1.71, + "learning_rate": 4.3331060886876225e-05, + "loss": 0.0088, + "step": 660120 + }, + { + "epoch": 1.71, + "learning_rate": 4.332717267050476e-05, + "loss": 0.0061, + "step": 660130 + }, + { + "epoch": 1.71, + "learning_rate": 4.3323284454133295e-05, + "loss": 0.0086, + "step": 660140 + }, + { + "epoch": 1.71, + "learning_rate": 4.3319396237761836e-05, + "loss": 0.0088, + "step": 660150 + }, + { + "epoch": 1.71, + "learning_rate": 4.331550802139037e-05, + "loss": 0.0071, + "step": 660160 + }, + { + "epoch": 1.71, + "learning_rate": 4.3311619805018906e-05, + "loss": 0.0083, + "step": 660170 + }, + { + "epoch": 1.71, + "learning_rate": 4.330773158864744e-05, + "loss": 0.0078, + "step": 660180 + }, + { + "epoch": 1.71, + "learning_rate": 4.3303843372275976e-05, + "loss": 0.0087, + "step": 660190 + }, + { + "epoch": 1.71, + "learning_rate": 4.329995515590451e-05, + "loss": 0.0096, + "step": 660200 + }, + { + "epoch": 1.71, + "learning_rate": 4.3296066939533045e-05, + "loss": 0.0108, + "step": 660210 + }, + { + "epoch": 1.71, + "learning_rate": 4.329217872316158e-05, + "loss": 0.0069, + "step": 660220 + }, + { + "epoch": 1.71, + "learning_rate": 4.328829050679012e-05, + "loss": 0.0098, + "step": 660230 + }, + { + "epoch": 1.71, + "learning_rate": 4.328440229041866e-05, + "loss": 0.0055, + "step": 660240 + }, + { + "epoch": 1.71, + "learning_rate": 4.328051407404719e-05, + "loss": 0.01, + "step": 660250 + }, + { + "epoch": 1.71, + "learning_rate": 4.3276625857675727e-05, + "loss": 0.0088, + "step": 660260 + }, + { + "epoch": 1.71, + "learning_rate": 4.327273764130426e-05, + "loss": 0.008, + "step": 660270 + }, + { + "epoch": 1.71, + "learning_rate": 4.3268849424932796e-05, + "loss": 0.0082, + "step": 660280 + }, + { + "epoch": 1.71, + "learning_rate": 4.326496120856133e-05, + "loss": 0.0102, + "step": 660290 + }, + { + "epoch": 1.71, + "learning_rate": 4.3261072992189866e-05, + "loss": 0.0062, + "step": 660300 + }, + { + "epoch": 1.71, + "learning_rate": 4.325718477581841e-05, + "loss": 0.0135, + "step": 660310 + }, + { + "epoch": 1.71, + "learning_rate": 4.325329655944694e-05, + "loss": 0.0046, + "step": 660320 + }, + { + "epoch": 1.71, + "learning_rate": 4.324940834307548e-05, + "loss": 0.0062, + "step": 660330 + }, + { + "epoch": 1.71, + "learning_rate": 4.3245520126704005e-05, + "loss": 0.0073, + "step": 660340 + }, + { + "epoch": 1.71, + "learning_rate": 4.324163191033254e-05, + "loss": 0.0085, + "step": 660350 + }, + { + "epoch": 1.71, + "learning_rate": 4.3237743693961075e-05, + "loss": 0.0071, + "step": 660360 + }, + { + "epoch": 1.71, + "learning_rate": 4.323385547758961e-05, + "loss": 0.0105, + "step": 660370 + }, + { + "epoch": 1.71, + "learning_rate": 4.3229967261218145e-05, + "loss": 0.0088, + "step": 660380 + }, + { + "epoch": 1.71, + "learning_rate": 4.322607904484668e-05, + "loss": 0.0059, + "step": 660390 + }, + { + "epoch": 1.71, + "learning_rate": 4.3222190828475215e-05, + "loss": 0.0088, + "step": 660400 + }, + { + "epoch": 1.71, + "learning_rate": 4.3218302612103756e-05, + "loss": 0.0087, + "step": 660410 + }, + { + "epoch": 1.71, + "learning_rate": 4.321441439573229e-05, + "loss": 0.0088, + "step": 660420 + }, + { + "epoch": 1.71, + "learning_rate": 4.3210526179360826e-05, + "loss": 0.0091, + "step": 660430 + }, + { + "epoch": 1.71, + "learning_rate": 4.320663796298936e-05, + "loss": 0.008, + "step": 660440 + }, + { + "epoch": 1.71, + "learning_rate": 4.3202749746617896e-05, + "loss": 0.009, + "step": 660450 + }, + { + "epoch": 1.71, + "learning_rate": 4.319886153024643e-05, + "loss": 0.0101, + "step": 660460 + }, + { + "epoch": 1.71, + "learning_rate": 4.3194973313874965e-05, + "loss": 0.0087, + "step": 660470 + }, + { + "epoch": 1.71, + "learning_rate": 4.31910850975035e-05, + "loss": 0.0075, + "step": 660480 + }, + { + "epoch": 1.71, + "learning_rate": 4.3187196881132035e-05, + "loss": 0.0079, + "step": 660490 + }, + { + "epoch": 1.71, + "learning_rate": 4.318330866476058e-05, + "loss": 0.0095, + "step": 660500 + }, + { + "epoch": 1.71, + "learning_rate": 4.317942044838911e-05, + "loss": 0.0079, + "step": 660510 + }, + { + "epoch": 1.71, + "learning_rate": 4.3175532232017646e-05, + "loss": 0.007, + "step": 660520 + }, + { + "epoch": 1.71, + "learning_rate": 4.317164401564618e-05, + "loss": 0.007, + "step": 660530 + }, + { + "epoch": 1.71, + "learning_rate": 4.3167755799274716e-05, + "loss": 0.0093, + "step": 660540 + }, + { + "epoch": 1.71, + "learning_rate": 4.316386758290325e-05, + "loss": 0.0091, + "step": 660550 + }, + { + "epoch": 1.71, + "learning_rate": 4.3159979366531786e-05, + "loss": 0.0077, + "step": 660560 + }, + { + "epoch": 1.71, + "learning_rate": 4.315609115016032e-05, + "loss": 0.0099, + "step": 660570 + }, + { + "epoch": 1.71, + "learning_rate": 4.315220293378886e-05, + "loss": 0.0096, + "step": 660580 + }, + { + "epoch": 1.71, + "learning_rate": 4.3148314717417384e-05, + "loss": 0.0073, + "step": 660590 + }, + { + "epoch": 1.71, + "learning_rate": 4.3144426501045925e-05, + "loss": 0.0118, + "step": 660600 + }, + { + "epoch": 1.71, + "learning_rate": 4.314053828467446e-05, + "loss": 0.0062, + "step": 660610 + }, + { + "epoch": 1.71, + "learning_rate": 4.3136650068302995e-05, + "loss": 0.0119, + "step": 660620 + }, + { + "epoch": 1.71, + "learning_rate": 4.313276185193153e-05, + "loss": 0.008, + "step": 660630 + }, + { + "epoch": 1.71, + "learning_rate": 4.3128873635560065e-05, + "loss": 0.0062, + "step": 660640 + }, + { + "epoch": 1.71, + "learning_rate": 4.31249854191886e-05, + "loss": 0.0092, + "step": 660650 + }, + { + "epoch": 1.71, + "learning_rate": 4.3121097202817135e-05, + "loss": 0.0085, + "step": 660660 + }, + { + "epoch": 1.71, + "learning_rate": 4.311720898644567e-05, + "loss": 0.0105, + "step": 660670 + }, + { + "epoch": 1.71, + "learning_rate": 4.311332077007421e-05, + "loss": 0.008, + "step": 660680 + }, + { + "epoch": 1.71, + "learning_rate": 4.3109432553702746e-05, + "loss": 0.0077, + "step": 660690 + }, + { + "epoch": 1.71, + "learning_rate": 4.310554433733128e-05, + "loss": 0.0054, + "step": 660700 + }, + { + "epoch": 1.71, + "learning_rate": 4.3101656120959816e-05, + "loss": 0.009, + "step": 660710 + }, + { + "epoch": 1.71, + "learning_rate": 4.309776790458835e-05, + "loss": 0.0066, + "step": 660720 + }, + { + "epoch": 1.71, + "learning_rate": 4.3093879688216885e-05, + "loss": 0.0061, + "step": 660730 + }, + { + "epoch": 1.71, + "learning_rate": 4.308999147184542e-05, + "loss": 0.0084, + "step": 660740 + }, + { + "epoch": 1.71, + "learning_rate": 4.3086103255473955e-05, + "loss": 0.0053, + "step": 660750 + }, + { + "epoch": 1.71, + "learning_rate": 4.30822150391025e-05, + "loss": 0.0086, + "step": 660760 + }, + { + "epoch": 1.71, + "learning_rate": 4.307832682273103e-05, + "loss": 0.0064, + "step": 660770 + }, + { + "epoch": 1.71, + "learning_rate": 4.3074438606359566e-05, + "loss": 0.0059, + "step": 660780 + }, + { + "epoch": 1.71, + "learning_rate": 4.30705503899881e-05, + "loss": 0.0068, + "step": 660790 + }, + { + "epoch": 1.71, + "learning_rate": 4.3066662173616636e-05, + "loss": 0.0086, + "step": 660800 + }, + { + "epoch": 1.71, + "learning_rate": 4.306277395724517e-05, + "loss": 0.008, + "step": 660810 + }, + { + "epoch": 1.71, + "learning_rate": 4.3058885740873706e-05, + "loss": 0.0052, + "step": 660820 + }, + { + "epoch": 1.71, + "learning_rate": 4.305499752450224e-05, + "loss": 0.0066, + "step": 660830 + }, + { + "epoch": 1.71, + "learning_rate": 4.305110930813077e-05, + "loss": 0.0075, + "step": 660840 + }, + { + "epoch": 1.71, + "learning_rate": 4.3047221091759304e-05, + "loss": 0.0103, + "step": 660850 + }, + { + "epoch": 1.71, + "learning_rate": 4.3043332875387845e-05, + "loss": 0.0078, + "step": 660860 + }, + { + "epoch": 1.71, + "learning_rate": 4.303944465901638e-05, + "loss": 0.0104, + "step": 660870 + }, + { + "epoch": 1.71, + "learning_rate": 4.3035556442644915e-05, + "loss": 0.01, + "step": 660880 + }, + { + "epoch": 1.71, + "learning_rate": 4.303166822627345e-05, + "loss": 0.0065, + "step": 660890 + }, + { + "epoch": 1.71, + "learning_rate": 4.3027780009901985e-05, + "loss": 0.0069, + "step": 660900 + }, + { + "epoch": 1.71, + "learning_rate": 4.302389179353052e-05, + "loss": 0.01, + "step": 660910 + }, + { + "epoch": 1.71, + "learning_rate": 4.3020003577159055e-05, + "loss": 0.0084, + "step": 660920 + }, + { + "epoch": 1.71, + "learning_rate": 4.301611536078759e-05, + "loss": 0.0097, + "step": 660930 + }, + { + "epoch": 1.71, + "learning_rate": 4.301222714441613e-05, + "loss": 0.0082, + "step": 660940 + }, + { + "epoch": 1.71, + "learning_rate": 4.3008338928044666e-05, + "loss": 0.0066, + "step": 660950 + }, + { + "epoch": 1.71, + "learning_rate": 4.30044507116732e-05, + "loss": 0.0079, + "step": 660960 + }, + { + "epoch": 1.71, + "learning_rate": 4.3000562495301736e-05, + "loss": 0.0077, + "step": 660970 + }, + { + "epoch": 1.71, + "learning_rate": 4.299667427893027e-05, + "loss": 0.0068, + "step": 660980 + }, + { + "epoch": 1.71, + "learning_rate": 4.2992786062558805e-05, + "loss": 0.0069, + "step": 660990 + }, + { + "epoch": 1.71, + "learning_rate": 4.298889784618734e-05, + "loss": 0.0074, + "step": 661000 + }, + { + "epoch": 1.71, + "eval_cer": 0.8816522993935373, + "eval_loss": 0.00525335967540741, + "eval_runtime": 107.9903, + "eval_samples_per_second": 18.52, + "eval_steps_per_second": 4.63, + "step": 661000 + }, + { + "epoch": 1.71, + "learning_rate": 4.2985009629815875e-05, + "loss": 0.009, + "step": 661010 + }, + { + "epoch": 1.71, + "learning_rate": 4.298112141344442e-05, + "loss": 0.0088, + "step": 661020 + }, + { + "epoch": 1.71, + "learning_rate": 4.297723319707295e-05, + "loss": 0.0087, + "step": 661030 + }, + { + "epoch": 1.71, + "learning_rate": 4.2973344980701486e-05, + "loss": 0.008, + "step": 661040 + }, + { + "epoch": 1.71, + "learning_rate": 4.296945676433002e-05, + "loss": 0.0101, + "step": 661050 + }, + { + "epoch": 1.71, + "learning_rate": 4.2965568547958556e-05, + "loss": 0.0077, + "step": 661060 + }, + { + "epoch": 1.71, + "learning_rate": 4.296168033158709e-05, + "loss": 0.0077, + "step": 661070 + }, + { + "epoch": 1.71, + "learning_rate": 4.2957792115215626e-05, + "loss": 0.0066, + "step": 661080 + }, + { + "epoch": 1.71, + "learning_rate": 4.2953903898844154e-05, + "loss": 0.0085, + "step": 661090 + }, + { + "epoch": 1.71, + "learning_rate": 4.295001568247269e-05, + "loss": 0.0092, + "step": 661100 + }, + { + "epoch": 1.71, + "learning_rate": 4.2946127466101224e-05, + "loss": 0.0099, + "step": 661110 + }, + { + "epoch": 1.71, + "learning_rate": 4.2942239249729765e-05, + "loss": 0.009, + "step": 661120 + }, + { + "epoch": 1.71, + "learning_rate": 4.29383510333583e-05, + "loss": 0.0052, + "step": 661130 + }, + { + "epoch": 1.71, + "learning_rate": 4.2934462816986835e-05, + "loss": 0.0055, + "step": 661140 + }, + { + "epoch": 1.71, + "learning_rate": 4.293057460061537e-05, + "loss": 0.0074, + "step": 661150 + }, + { + "epoch": 1.71, + "learning_rate": 4.2926686384243905e-05, + "loss": 0.0071, + "step": 661160 + }, + { + "epoch": 1.71, + "learning_rate": 4.292279816787244e-05, + "loss": 0.0083, + "step": 661170 + }, + { + "epoch": 1.71, + "learning_rate": 4.2918909951500974e-05, + "loss": 0.0076, + "step": 661180 + }, + { + "epoch": 1.71, + "learning_rate": 4.291502173512951e-05, + "loss": 0.0081, + "step": 661190 + }, + { + "epoch": 1.71, + "learning_rate": 4.291113351875805e-05, + "loss": 0.007, + "step": 661200 + }, + { + "epoch": 1.71, + "learning_rate": 4.2907245302386586e-05, + "loss": 0.007, + "step": 661210 + }, + { + "epoch": 1.71, + "learning_rate": 4.290335708601512e-05, + "loss": 0.008, + "step": 661220 + }, + { + "epoch": 1.71, + "learning_rate": 4.2899468869643656e-05, + "loss": 0.0085, + "step": 661230 + }, + { + "epoch": 1.71, + "learning_rate": 4.289558065327219e-05, + "loss": 0.0077, + "step": 661240 + }, + { + "epoch": 1.71, + "learning_rate": 4.2891692436900725e-05, + "loss": 0.0084, + "step": 661250 + }, + { + "epoch": 1.71, + "learning_rate": 4.288780422052926e-05, + "loss": 0.0071, + "step": 661260 + }, + { + "epoch": 1.71, + "learning_rate": 4.2883916004157795e-05, + "loss": 0.0083, + "step": 661270 + }, + { + "epoch": 1.71, + "learning_rate": 4.288002778778634e-05, + "loss": 0.0063, + "step": 661280 + }, + { + "epoch": 1.71, + "learning_rate": 4.287613957141487e-05, + "loss": 0.0081, + "step": 661290 + }, + { + "epoch": 1.71, + "learning_rate": 4.2872251355043406e-05, + "loss": 0.0093, + "step": 661300 + }, + { + "epoch": 1.71, + "learning_rate": 4.286836313867194e-05, + "loss": 0.0107, + "step": 661310 + }, + { + "epoch": 1.71, + "learning_rate": 4.2864474922300476e-05, + "loss": 0.0067, + "step": 661320 + }, + { + "epoch": 1.71, + "learning_rate": 4.2860586705929004e-05, + "loss": 0.0068, + "step": 661330 + }, + { + "epoch": 1.71, + "learning_rate": 4.285669848955754e-05, + "loss": 0.0075, + "step": 661340 + }, + { + "epoch": 1.71, + "learning_rate": 4.2852810273186074e-05, + "loss": 0.0091, + "step": 661350 + }, + { + "epoch": 1.71, + "learning_rate": 4.284892205681461e-05, + "loss": 0.0098, + "step": 661360 + }, + { + "epoch": 1.71, + "learning_rate": 4.2845033840443144e-05, + "loss": 0.0078, + "step": 661370 + }, + { + "epoch": 1.71, + "learning_rate": 4.2841145624071685e-05, + "loss": 0.0068, + "step": 661380 + }, + { + "epoch": 1.71, + "learning_rate": 4.283725740770022e-05, + "loss": 0.0111, + "step": 661390 + }, + { + "epoch": 1.71, + "learning_rate": 4.2833369191328755e-05, + "loss": 0.0091, + "step": 661400 + }, + { + "epoch": 1.71, + "learning_rate": 4.282948097495729e-05, + "loss": 0.0073, + "step": 661410 + }, + { + "epoch": 1.71, + "learning_rate": 4.2825592758585825e-05, + "loss": 0.0123, + "step": 661420 + }, + { + "epoch": 1.71, + "learning_rate": 4.282170454221436e-05, + "loss": 0.0076, + "step": 661430 + }, + { + "epoch": 1.71, + "learning_rate": 4.2817816325842894e-05, + "loss": 0.0112, + "step": 661440 + }, + { + "epoch": 1.71, + "learning_rate": 4.281392810947143e-05, + "loss": 0.009, + "step": 661450 + }, + { + "epoch": 1.71, + "learning_rate": 4.281003989309997e-05, + "loss": 0.0074, + "step": 661460 + }, + { + "epoch": 1.71, + "learning_rate": 4.2806151676728506e-05, + "loss": 0.0068, + "step": 661470 + }, + { + "epoch": 1.71, + "learning_rate": 4.280226346035704e-05, + "loss": 0.0092, + "step": 661480 + }, + { + "epoch": 1.71, + "learning_rate": 4.2798375243985575e-05, + "loss": 0.0087, + "step": 661490 + }, + { + "epoch": 1.71, + "learning_rate": 4.279448702761411e-05, + "loss": 0.0092, + "step": 661500 + }, + { + "epoch": 1.71, + "learning_rate": 4.2790598811242645e-05, + "loss": 0.0075, + "step": 661510 + }, + { + "epoch": 1.71, + "learning_rate": 4.278671059487118e-05, + "loss": 0.0062, + "step": 661520 + }, + { + "epoch": 1.71, + "learning_rate": 4.2782822378499715e-05, + "loss": 0.0097, + "step": 661530 + }, + { + "epoch": 1.71, + "learning_rate": 4.2778934162128257e-05, + "loss": 0.0074, + "step": 661540 + }, + { + "epoch": 1.71, + "learning_rate": 4.277504594575679e-05, + "loss": 0.0102, + "step": 661550 + }, + { + "epoch": 1.71, + "learning_rate": 4.2771157729385326e-05, + "loss": 0.0073, + "step": 661560 + }, + { + "epoch": 1.71, + "learning_rate": 4.276726951301386e-05, + "loss": 0.0077, + "step": 661570 + }, + { + "epoch": 1.71, + "learning_rate": 4.276338129664239e-05, + "loss": 0.0098, + "step": 661580 + }, + { + "epoch": 1.71, + "learning_rate": 4.2759493080270924e-05, + "loss": 0.0097, + "step": 661590 + }, + { + "epoch": 1.71, + "learning_rate": 4.275560486389946e-05, + "loss": 0.0088, + "step": 661600 + }, + { + "epoch": 1.71, + "learning_rate": 4.2751716647527994e-05, + "loss": 0.0112, + "step": 661610 + }, + { + "epoch": 1.72, + "learning_rate": 4.274782843115653e-05, + "loss": 0.0084, + "step": 661620 + }, + { + "epoch": 1.72, + "learning_rate": 4.2743940214785064e-05, + "loss": 0.0118, + "step": 661630 + }, + { + "epoch": 1.72, + "learning_rate": 4.2740051998413605e-05, + "loss": 0.0085, + "step": 661640 + }, + { + "epoch": 1.72, + "learning_rate": 4.273616378204214e-05, + "loss": 0.0084, + "step": 661650 + }, + { + "epoch": 1.72, + "learning_rate": 4.2732275565670675e-05, + "loss": 0.0079, + "step": 661660 + }, + { + "epoch": 1.72, + "learning_rate": 4.272838734929921e-05, + "loss": 0.0086, + "step": 661670 + }, + { + "epoch": 1.72, + "learning_rate": 4.2724499132927745e-05, + "loss": 0.0065, + "step": 661680 + }, + { + "epoch": 1.72, + "learning_rate": 4.272061091655628e-05, + "loss": 0.0075, + "step": 661690 + }, + { + "epoch": 1.72, + "learning_rate": 4.2716722700184814e-05, + "loss": 0.0053, + "step": 661700 + }, + { + "epoch": 1.72, + "learning_rate": 4.271283448381335e-05, + "loss": 0.0083, + "step": 661710 + }, + { + "epoch": 1.72, + "learning_rate": 4.270894626744189e-05, + "loss": 0.0063, + "step": 661720 + }, + { + "epoch": 1.72, + "learning_rate": 4.2705058051070426e-05, + "loss": 0.0065, + "step": 661730 + }, + { + "epoch": 1.72, + "learning_rate": 4.270116983469896e-05, + "loss": 0.009, + "step": 661740 + }, + { + "epoch": 1.72, + "learning_rate": 4.2697281618327495e-05, + "loss": 0.0095, + "step": 661750 + }, + { + "epoch": 1.72, + "learning_rate": 4.269339340195603e-05, + "loss": 0.0092, + "step": 661760 + }, + { + "epoch": 1.72, + "learning_rate": 4.2689505185584565e-05, + "loss": 0.0064, + "step": 661770 + }, + { + "epoch": 1.72, + "learning_rate": 4.26856169692131e-05, + "loss": 0.0095, + "step": 661780 + }, + { + "epoch": 1.72, + "learning_rate": 4.2681728752841635e-05, + "loss": 0.0085, + "step": 661790 + }, + { + "epoch": 1.72, + "learning_rate": 4.267784053647017e-05, + "loss": 0.0084, + "step": 661800 + }, + { + "epoch": 1.72, + "learning_rate": 4.267395232009871e-05, + "loss": 0.0075, + "step": 661810 + }, + { + "epoch": 1.72, + "learning_rate": 4.2670064103727246e-05, + "loss": 0.0096, + "step": 661820 + }, + { + "epoch": 1.72, + "learning_rate": 4.2666175887355774e-05, + "loss": 0.0082, + "step": 661830 + }, + { + "epoch": 1.72, + "learning_rate": 4.266228767098431e-05, + "loss": 0.0093, + "step": 661840 + }, + { + "epoch": 1.72, + "learning_rate": 4.2658399454612844e-05, + "loss": 0.0069, + "step": 661850 + }, + { + "epoch": 1.72, + "learning_rate": 4.265451123824138e-05, + "loss": 0.0079, + "step": 661860 + }, + { + "epoch": 1.72, + "learning_rate": 4.2650623021869914e-05, + "loss": 0.0069, + "step": 661870 + }, + { + "epoch": 1.72, + "learning_rate": 4.264673480549845e-05, + "loss": 0.0101, + "step": 661880 + }, + { + "epoch": 1.72, + "learning_rate": 4.2642846589126984e-05, + "loss": 0.0065, + "step": 661890 + }, + { + "epoch": 1.72, + "learning_rate": 4.263895837275552e-05, + "loss": 0.0068, + "step": 661900 + }, + { + "epoch": 1.72, + "learning_rate": 4.263507015638406e-05, + "loss": 0.008, + "step": 661910 + }, + { + "epoch": 1.72, + "learning_rate": 4.2631181940012595e-05, + "loss": 0.0102, + "step": 661920 + }, + { + "epoch": 1.72, + "learning_rate": 4.262729372364113e-05, + "loss": 0.0067, + "step": 661930 + }, + { + "epoch": 1.72, + "learning_rate": 4.2623405507269665e-05, + "loss": 0.0091, + "step": 661940 + }, + { + "epoch": 1.72, + "learning_rate": 4.26195172908982e-05, + "loss": 0.009, + "step": 661950 + }, + { + "epoch": 1.72, + "learning_rate": 4.2615629074526734e-05, + "loss": 0.0065, + "step": 661960 + }, + { + "epoch": 1.72, + "learning_rate": 4.261174085815527e-05, + "loss": 0.0078, + "step": 661970 + }, + { + "epoch": 1.72, + "learning_rate": 4.2607852641783804e-05, + "loss": 0.0074, + "step": 661980 + }, + { + "epoch": 1.72, + "learning_rate": 4.2603964425412346e-05, + "loss": 0.0072, + "step": 661990 + }, + { + "epoch": 1.72, + "learning_rate": 4.260007620904088e-05, + "loss": 0.0109, + "step": 662000 + }, + { + "epoch": 1.72, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.005079487804323435, + "eval_runtime": 107.8535, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 662000 + }, + { + "epoch": 1.72, + "learning_rate": 4.2596187992669415e-05, + "loss": 0.0105, + "step": 662010 + }, + { + "epoch": 1.72, + "learning_rate": 4.259229977629795e-05, + "loss": 0.0075, + "step": 662020 + }, + { + "epoch": 1.72, + "learning_rate": 4.2588411559926485e-05, + "loss": 0.0106, + "step": 662030 + }, + { + "epoch": 1.72, + "learning_rate": 4.258452334355502e-05, + "loss": 0.0101, + "step": 662040 + }, + { + "epoch": 1.72, + "learning_rate": 4.2580635127183555e-05, + "loss": 0.0072, + "step": 662050 + }, + { + "epoch": 1.72, + "learning_rate": 4.257674691081209e-05, + "loss": 0.0161, + "step": 662060 + }, + { + "epoch": 1.72, + "learning_rate": 4.257285869444063e-05, + "loss": 0.0093, + "step": 662070 + }, + { + "epoch": 1.72, + "learning_rate": 4.256897047806915e-05, + "loss": 0.0073, + "step": 662080 + }, + { + "epoch": 1.72, + "learning_rate": 4.2565082261697694e-05, + "loss": 0.0066, + "step": 662090 + }, + { + "epoch": 1.72, + "learning_rate": 4.256119404532623e-05, + "loss": 0.0104, + "step": 662100 + }, + { + "epoch": 1.72, + "learning_rate": 4.2557305828954764e-05, + "loss": 0.0092, + "step": 662110 + }, + { + "epoch": 1.72, + "learning_rate": 4.25534176125833e-05, + "loss": 0.0059, + "step": 662120 + }, + { + "epoch": 1.72, + "learning_rate": 4.2549529396211834e-05, + "loss": 0.0074, + "step": 662130 + }, + { + "epoch": 1.72, + "learning_rate": 4.254564117984037e-05, + "loss": 0.0056, + "step": 662140 + }, + { + "epoch": 1.72, + "learning_rate": 4.2541752963468903e-05, + "loss": 0.006, + "step": 662150 + }, + { + "epoch": 1.72, + "learning_rate": 4.253786474709744e-05, + "loss": 0.0084, + "step": 662160 + }, + { + "epoch": 1.72, + "learning_rate": 4.253397653072598e-05, + "loss": 0.0105, + "step": 662170 + }, + { + "epoch": 1.72, + "learning_rate": 4.2530088314354515e-05, + "loss": 0.0074, + "step": 662180 + }, + { + "epoch": 1.72, + "learning_rate": 4.252620009798305e-05, + "loss": 0.0071, + "step": 662190 + }, + { + "epoch": 1.72, + "learning_rate": 4.2522311881611585e-05, + "loss": 0.0071, + "step": 662200 + }, + { + "epoch": 1.72, + "learning_rate": 4.251842366524012e-05, + "loss": 0.0081, + "step": 662210 + }, + { + "epoch": 1.72, + "learning_rate": 4.2514535448868654e-05, + "loss": 0.011, + "step": 662220 + }, + { + "epoch": 1.72, + "learning_rate": 4.251064723249719e-05, + "loss": 0.0068, + "step": 662230 + }, + { + "epoch": 1.72, + "learning_rate": 4.2506759016125724e-05, + "loss": 0.0077, + "step": 662240 + }, + { + "epoch": 1.72, + "learning_rate": 4.2502870799754266e-05, + "loss": 0.0075, + "step": 662250 + }, + { + "epoch": 1.72, + "learning_rate": 4.24989825833828e-05, + "loss": 0.0133, + "step": 662260 + }, + { + "epoch": 1.72, + "learning_rate": 4.2495094367011335e-05, + "loss": 0.0097, + "step": 662270 + }, + { + "epoch": 1.72, + "learning_rate": 4.249120615063987e-05, + "loss": 0.0068, + "step": 662280 + }, + { + "epoch": 1.72, + "learning_rate": 4.2487317934268405e-05, + "loss": 0.0074, + "step": 662290 + }, + { + "epoch": 1.72, + "learning_rate": 4.248342971789694e-05, + "loss": 0.0097, + "step": 662300 + }, + { + "epoch": 1.72, + "learning_rate": 4.2479541501525475e-05, + "loss": 0.0097, + "step": 662310 + }, + { + "epoch": 1.72, + "learning_rate": 4.247565328515401e-05, + "loss": 0.0087, + "step": 662320 + }, + { + "epoch": 1.72, + "learning_rate": 4.247176506878254e-05, + "loss": 0.0072, + "step": 662330 + }, + { + "epoch": 1.72, + "learning_rate": 4.246787685241107e-05, + "loss": 0.0096, + "step": 662340 + }, + { + "epoch": 1.72, + "learning_rate": 4.2463988636039614e-05, + "loss": 0.0101, + "step": 662350 + }, + { + "epoch": 1.72, + "learning_rate": 4.246010041966815e-05, + "loss": 0.0097, + "step": 662360 + }, + { + "epoch": 1.72, + "learning_rate": 4.2456212203296684e-05, + "loss": 0.0095, + "step": 662370 + }, + { + "epoch": 1.72, + "learning_rate": 4.245232398692522e-05, + "loss": 0.0082, + "step": 662380 + }, + { + "epoch": 1.72, + "learning_rate": 4.2448435770553754e-05, + "loss": 0.0076, + "step": 662390 + }, + { + "epoch": 1.72, + "learning_rate": 4.244454755418229e-05, + "loss": 0.0064, + "step": 662400 + }, + { + "epoch": 1.72, + "learning_rate": 4.2440659337810823e-05, + "loss": 0.0087, + "step": 662410 + }, + { + "epoch": 1.72, + "learning_rate": 4.243677112143936e-05, + "loss": 0.0062, + "step": 662420 + }, + { + "epoch": 1.72, + "learning_rate": 4.24328829050679e-05, + "loss": 0.0069, + "step": 662430 + }, + { + "epoch": 1.72, + "learning_rate": 4.2428994688696435e-05, + "loss": 0.0068, + "step": 662440 + }, + { + "epoch": 1.72, + "learning_rate": 4.242510647232497e-05, + "loss": 0.0128, + "step": 662450 + }, + { + "epoch": 1.72, + "learning_rate": 4.2421218255953504e-05, + "loss": 0.0079, + "step": 662460 + }, + { + "epoch": 1.72, + "learning_rate": 4.241733003958204e-05, + "loss": 0.0082, + "step": 662470 + }, + { + "epoch": 1.72, + "learning_rate": 4.2413441823210574e-05, + "loss": 0.0094, + "step": 662480 + }, + { + "epoch": 1.72, + "learning_rate": 4.240955360683911e-05, + "loss": 0.01, + "step": 662490 + }, + { + "epoch": 1.72, + "learning_rate": 4.2405665390467644e-05, + "loss": 0.0105, + "step": 662500 + }, + { + "epoch": 1.72, + "learning_rate": 4.2401777174096186e-05, + "loss": 0.0085, + "step": 662510 + }, + { + "epoch": 1.72, + "learning_rate": 4.239788895772472e-05, + "loss": 0.0051, + "step": 662520 + }, + { + "epoch": 1.72, + "learning_rate": 4.2394000741353255e-05, + "loss": 0.0067, + "step": 662530 + }, + { + "epoch": 1.72, + "learning_rate": 4.239011252498179e-05, + "loss": 0.007, + "step": 662540 + }, + { + "epoch": 1.72, + "learning_rate": 4.2386224308610325e-05, + "loss": 0.0081, + "step": 662550 + }, + { + "epoch": 1.72, + "learning_rate": 4.238233609223886e-05, + "loss": 0.0098, + "step": 662560 + }, + { + "epoch": 1.72, + "learning_rate": 4.237844787586739e-05, + "loss": 0.0078, + "step": 662570 + }, + { + "epoch": 1.72, + "learning_rate": 4.237455965949592e-05, + "loss": 0.0059, + "step": 662580 + }, + { + "epoch": 1.72, + "learning_rate": 4.237067144312446e-05, + "loss": 0.0078, + "step": 662590 + }, + { + "epoch": 1.72, + "learning_rate": 4.236678322675299e-05, + "loss": 0.0082, + "step": 662600 + }, + { + "epoch": 1.72, + "learning_rate": 4.2362895010381534e-05, + "loss": 0.008, + "step": 662610 + }, + { + "epoch": 1.72, + "learning_rate": 4.235900679401007e-05, + "loss": 0.0087, + "step": 662620 + }, + { + "epoch": 1.72, + "learning_rate": 4.2355118577638604e-05, + "loss": 0.0066, + "step": 662630 + }, + { + "epoch": 1.72, + "learning_rate": 4.235123036126714e-05, + "loss": 0.007, + "step": 662640 + }, + { + "epoch": 1.72, + "learning_rate": 4.2347342144895674e-05, + "loss": 0.0066, + "step": 662650 + }, + { + "epoch": 1.72, + "learning_rate": 4.234345392852421e-05, + "loss": 0.0074, + "step": 662660 + }, + { + "epoch": 1.72, + "learning_rate": 4.233956571215274e-05, + "loss": 0.0064, + "step": 662670 + }, + { + "epoch": 1.72, + "learning_rate": 4.233567749578128e-05, + "loss": 0.0099, + "step": 662680 + }, + { + "epoch": 1.72, + "learning_rate": 4.233178927940982e-05, + "loss": 0.0067, + "step": 662690 + }, + { + "epoch": 1.72, + "learning_rate": 4.2327901063038355e-05, + "loss": 0.0062, + "step": 662700 + }, + { + "epoch": 1.72, + "learning_rate": 4.232401284666689e-05, + "loss": 0.0076, + "step": 662710 + }, + { + "epoch": 1.72, + "learning_rate": 4.2320124630295424e-05, + "loss": 0.0073, + "step": 662720 + }, + { + "epoch": 1.72, + "learning_rate": 4.231623641392396e-05, + "loss": 0.01, + "step": 662730 + }, + { + "epoch": 1.72, + "learning_rate": 4.2312348197552494e-05, + "loss": 0.0077, + "step": 662740 + }, + { + "epoch": 1.72, + "learning_rate": 4.230845998118103e-05, + "loss": 0.008, + "step": 662750 + }, + { + "epoch": 1.72, + "learning_rate": 4.2304571764809564e-05, + "loss": 0.0097, + "step": 662760 + }, + { + "epoch": 1.72, + "learning_rate": 4.2300683548438106e-05, + "loss": 0.0151, + "step": 662770 + }, + { + "epoch": 1.72, + "learning_rate": 4.229679533206664e-05, + "loss": 0.0065, + "step": 662780 + }, + { + "epoch": 1.72, + "learning_rate": 4.2292907115695175e-05, + "loss": 0.0084, + "step": 662790 + }, + { + "epoch": 1.72, + "learning_rate": 4.228901889932371e-05, + "loss": 0.0104, + "step": 662800 + }, + { + "epoch": 1.72, + "learning_rate": 4.2285130682952245e-05, + "loss": 0.0082, + "step": 662810 + }, + { + "epoch": 1.72, + "learning_rate": 4.228124246658077e-05, + "loss": 0.0075, + "step": 662820 + }, + { + "epoch": 1.72, + "learning_rate": 4.227735425020931e-05, + "loss": 0.0091, + "step": 662830 + }, + { + "epoch": 1.72, + "learning_rate": 4.227346603383784e-05, + "loss": 0.0099, + "step": 662840 + }, + { + "epoch": 1.72, + "learning_rate": 4.226957781746638e-05, + "loss": 0.0091, + "step": 662850 + }, + { + "epoch": 1.72, + "learning_rate": 4.226568960109491e-05, + "loss": 0.0065, + "step": 662860 + }, + { + "epoch": 1.72, + "learning_rate": 4.2261801384723454e-05, + "loss": 0.0086, + "step": 662870 + }, + { + "epoch": 1.72, + "learning_rate": 4.225791316835199e-05, + "loss": 0.0055, + "step": 662880 + }, + { + "epoch": 1.72, + "learning_rate": 4.2254024951980524e-05, + "loss": 0.0073, + "step": 662890 + }, + { + "epoch": 1.72, + "learning_rate": 4.225013673560906e-05, + "loss": 0.0068, + "step": 662900 + }, + { + "epoch": 1.72, + "learning_rate": 4.2246248519237594e-05, + "loss": 0.0096, + "step": 662910 + }, + { + "epoch": 1.72, + "learning_rate": 4.224236030286613e-05, + "loss": 0.0119, + "step": 662920 + }, + { + "epoch": 1.72, + "learning_rate": 4.223847208649466e-05, + "loss": 0.0088, + "step": 662930 + }, + { + "epoch": 1.72, + "learning_rate": 4.22345838701232e-05, + "loss": 0.0076, + "step": 662940 + }, + { + "epoch": 1.72, + "learning_rate": 4.223069565375174e-05, + "loss": 0.0062, + "step": 662950 + }, + { + "epoch": 1.72, + "learning_rate": 4.2226807437380275e-05, + "loss": 0.0063, + "step": 662960 + }, + { + "epoch": 1.72, + "learning_rate": 4.222291922100881e-05, + "loss": 0.0074, + "step": 662970 + }, + { + "epoch": 1.72, + "learning_rate": 4.2219031004637344e-05, + "loss": 0.0085, + "step": 662980 + }, + { + "epoch": 1.72, + "learning_rate": 4.221514278826588e-05, + "loss": 0.0079, + "step": 662990 + }, + { + "epoch": 1.72, + "learning_rate": 4.2211254571894414e-05, + "loss": 0.007, + "step": 663000 + }, + { + "epoch": 1.72, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.005077589303255081, + "eval_runtime": 107.9194, + "eval_samples_per_second": 18.532, + "eval_steps_per_second": 4.633, + "step": 663000 + }, + { + "epoch": 1.72, + "learning_rate": 4.220736635552295e-05, + "loss": 0.0058, + "step": 663010 + }, + { + "epoch": 1.72, + "learning_rate": 4.2203478139151484e-05, + "loss": 0.0078, + "step": 663020 + }, + { + "epoch": 1.72, + "learning_rate": 4.2199589922780025e-05, + "loss": 0.0084, + "step": 663030 + }, + { + "epoch": 1.72, + "learning_rate": 4.219570170640856e-05, + "loss": 0.0083, + "step": 663040 + }, + { + "epoch": 1.72, + "learning_rate": 4.2191813490037095e-05, + "loss": 0.0057, + "step": 663050 + }, + { + "epoch": 1.72, + "learning_rate": 4.218792527366563e-05, + "loss": 0.0078, + "step": 663060 + }, + { + "epoch": 1.72, + "learning_rate": 4.218403705729416e-05, + "loss": 0.0073, + "step": 663070 + }, + { + "epoch": 1.72, + "learning_rate": 4.218014884092269e-05, + "loss": 0.0084, + "step": 663080 + }, + { + "epoch": 1.72, + "learning_rate": 4.217626062455123e-05, + "loss": 0.0083, + "step": 663090 + }, + { + "epoch": 1.72, + "learning_rate": 4.217237240817976e-05, + "loss": 0.007, + "step": 663100 + }, + { + "epoch": 1.72, + "learning_rate": 4.21684841918083e-05, + "loss": 0.0093, + "step": 663110 + }, + { + "epoch": 1.72, + "learning_rate": 4.216459597543683e-05, + "loss": 0.0094, + "step": 663120 + }, + { + "epoch": 1.72, + "learning_rate": 4.2160707759065374e-05, + "loss": 0.0072, + "step": 663130 + }, + { + "epoch": 1.72, + "learning_rate": 4.215681954269391e-05, + "loss": 0.0096, + "step": 663140 + }, + { + "epoch": 1.72, + "learning_rate": 4.2152931326322444e-05, + "loss": 0.0076, + "step": 663150 + }, + { + "epoch": 1.72, + "learning_rate": 4.214904310995098e-05, + "loss": 0.0089, + "step": 663160 + }, + { + "epoch": 1.72, + "learning_rate": 4.2145154893579514e-05, + "loss": 0.0059, + "step": 663170 + }, + { + "epoch": 1.72, + "learning_rate": 4.214126667720805e-05, + "loss": 0.0143, + "step": 663180 + }, + { + "epoch": 1.72, + "learning_rate": 4.213737846083658e-05, + "loss": 0.0093, + "step": 663190 + }, + { + "epoch": 1.72, + "learning_rate": 4.213349024446512e-05, + "loss": 0.0071, + "step": 663200 + }, + { + "epoch": 1.72, + "learning_rate": 4.212960202809365e-05, + "loss": 0.0096, + "step": 663210 + }, + { + "epoch": 1.72, + "learning_rate": 4.2125713811722195e-05, + "loss": 0.0093, + "step": 663220 + }, + { + "epoch": 1.72, + "learning_rate": 4.212182559535073e-05, + "loss": 0.0078, + "step": 663230 + }, + { + "epoch": 1.72, + "learning_rate": 4.2117937378979264e-05, + "loss": 0.0111, + "step": 663240 + }, + { + "epoch": 1.72, + "learning_rate": 4.21140491626078e-05, + "loss": 0.0073, + "step": 663250 + }, + { + "epoch": 1.72, + "learning_rate": 4.2110160946236334e-05, + "loss": 0.0108, + "step": 663260 + }, + { + "epoch": 1.72, + "learning_rate": 4.210627272986487e-05, + "loss": 0.0092, + "step": 663270 + }, + { + "epoch": 1.72, + "learning_rate": 4.2102384513493404e-05, + "loss": 0.0097, + "step": 663280 + }, + { + "epoch": 1.72, + "learning_rate": 4.209849629712194e-05, + "loss": 0.011, + "step": 663290 + }, + { + "epoch": 1.72, + "learning_rate": 4.209460808075048e-05, + "loss": 0.007, + "step": 663300 + }, + { + "epoch": 1.72, + "learning_rate": 4.2090719864379015e-05, + "loss": 0.0064, + "step": 663310 + }, + { + "epoch": 1.72, + "learning_rate": 4.208683164800754e-05, + "loss": 0.0096, + "step": 663320 + }, + { + "epoch": 1.72, + "learning_rate": 4.208294343163608e-05, + "loss": 0.0073, + "step": 663330 + }, + { + "epoch": 1.72, + "learning_rate": 4.207905521526461e-05, + "loss": 0.0089, + "step": 663340 + }, + { + "epoch": 1.72, + "learning_rate": 4.207516699889315e-05, + "loss": 0.0055, + "step": 663350 + }, + { + "epoch": 1.72, + "learning_rate": 4.207127878252168e-05, + "loss": 0.009, + "step": 663360 + }, + { + "epoch": 1.72, + "learning_rate": 4.206739056615022e-05, + "loss": 0.0077, + "step": 663370 + }, + { + "epoch": 1.72, + "learning_rate": 4.206350234977875e-05, + "loss": 0.0051, + "step": 663380 + }, + { + "epoch": 1.72, + "learning_rate": 4.205961413340729e-05, + "loss": 0.0124, + "step": 663390 + }, + { + "epoch": 1.72, + "learning_rate": 4.205572591703583e-05, + "loss": 0.0092, + "step": 663400 + }, + { + "epoch": 1.72, + "learning_rate": 4.2051837700664364e-05, + "loss": 0.006, + "step": 663410 + }, + { + "epoch": 1.72, + "learning_rate": 4.20479494842929e-05, + "loss": 0.0086, + "step": 663420 + }, + { + "epoch": 1.72, + "learning_rate": 4.2044061267921433e-05, + "loss": 0.0069, + "step": 663430 + }, + { + "epoch": 1.72, + "learning_rate": 4.204017305154997e-05, + "loss": 0.0074, + "step": 663440 + }, + { + "epoch": 1.72, + "learning_rate": 4.20362848351785e-05, + "loss": 0.0073, + "step": 663450 + }, + { + "epoch": 1.72, + "learning_rate": 4.203239661880704e-05, + "loss": 0.0103, + "step": 663460 + }, + { + "epoch": 1.72, + "learning_rate": 4.202850840243557e-05, + "loss": 0.0223, + "step": 663470 + }, + { + "epoch": 1.72, + "learning_rate": 4.2024620186064115e-05, + "loss": 0.0087, + "step": 663480 + }, + { + "epoch": 1.72, + "learning_rate": 4.202073196969265e-05, + "loss": 0.0101, + "step": 663490 + }, + { + "epoch": 1.72, + "learning_rate": 4.2016843753321184e-05, + "loss": 0.0092, + "step": 663500 + }, + { + "epoch": 1.72, + "learning_rate": 4.201295553694972e-05, + "loss": 0.0058, + "step": 663510 + }, + { + "epoch": 1.72, + "learning_rate": 4.2009067320578254e-05, + "loss": 0.0063, + "step": 663520 + }, + { + "epoch": 1.72, + "learning_rate": 4.200517910420679e-05, + "loss": 0.0094, + "step": 663530 + }, + { + "epoch": 1.72, + "learning_rate": 4.2001290887835324e-05, + "loss": 0.0068, + "step": 663540 + }, + { + "epoch": 1.72, + "learning_rate": 4.199740267146386e-05, + "loss": 0.011, + "step": 663550 + }, + { + "epoch": 1.72, + "learning_rate": 4.19935144550924e-05, + "loss": 0.0085, + "step": 663560 + }, + { + "epoch": 1.72, + "learning_rate": 4.198962623872092e-05, + "loss": 0.0105, + "step": 663570 + }, + { + "epoch": 1.72, + "learning_rate": 4.198573802234946e-05, + "loss": 0.0073, + "step": 663580 + }, + { + "epoch": 1.72, + "learning_rate": 4.1981849805978e-05, + "loss": 0.0071, + "step": 663590 + }, + { + "epoch": 1.72, + "learning_rate": 4.197796158960653e-05, + "loss": 0.0087, + "step": 663600 + }, + { + "epoch": 1.72, + "learning_rate": 4.197407337323507e-05, + "loss": 0.0067, + "step": 663610 + }, + { + "epoch": 1.72, + "learning_rate": 4.19701851568636e-05, + "loss": 0.0065, + "step": 663620 + }, + { + "epoch": 1.72, + "learning_rate": 4.196629694049214e-05, + "loss": 0.0085, + "step": 663630 + }, + { + "epoch": 1.72, + "learning_rate": 4.196240872412067e-05, + "loss": 0.0065, + "step": 663640 + }, + { + "epoch": 1.72, + "learning_rate": 4.195852050774921e-05, + "loss": 0.0086, + "step": 663650 + }, + { + "epoch": 1.72, + "learning_rate": 4.195463229137775e-05, + "loss": 0.0068, + "step": 663660 + }, + { + "epoch": 1.72, + "learning_rate": 4.1950744075006284e-05, + "loss": 0.0088, + "step": 663670 + }, + { + "epoch": 1.72, + "learning_rate": 4.194685585863482e-05, + "loss": 0.0114, + "step": 663680 + }, + { + "epoch": 1.72, + "learning_rate": 4.1942967642263353e-05, + "loss": 0.0068, + "step": 663690 + }, + { + "epoch": 1.72, + "learning_rate": 4.193907942589189e-05, + "loss": 0.0114, + "step": 663700 + }, + { + "epoch": 1.72, + "learning_rate": 4.193519120952042e-05, + "loss": 0.0093, + "step": 663710 + }, + { + "epoch": 1.72, + "learning_rate": 4.193130299314896e-05, + "loss": 0.0099, + "step": 663720 + }, + { + "epoch": 1.72, + "learning_rate": 4.192741477677749e-05, + "loss": 0.0101, + "step": 663730 + }, + { + "epoch": 1.72, + "learning_rate": 4.1923526560406035e-05, + "loss": 0.007, + "step": 663740 + }, + { + "epoch": 1.72, + "learning_rate": 4.191963834403457e-05, + "loss": 0.0085, + "step": 663750 + }, + { + "epoch": 1.72, + "learning_rate": 4.1915750127663104e-05, + "loss": 0.0071, + "step": 663760 + }, + { + "epoch": 1.72, + "learning_rate": 4.191186191129164e-05, + "loss": 0.0099, + "step": 663770 + }, + { + "epoch": 1.72, + "learning_rate": 4.1907973694920174e-05, + "loss": 0.0072, + "step": 663780 + }, + { + "epoch": 1.72, + "learning_rate": 4.190408547854871e-05, + "loss": 0.0094, + "step": 663790 + }, + { + "epoch": 1.72, + "learning_rate": 4.1900197262177244e-05, + "loss": 0.007, + "step": 663800 + }, + { + "epoch": 1.72, + "learning_rate": 4.189630904580577e-05, + "loss": 0.0083, + "step": 663810 + }, + { + "epoch": 1.72, + "learning_rate": 4.189242082943431e-05, + "loss": 0.0085, + "step": 663820 + }, + { + "epoch": 1.72, + "learning_rate": 4.188853261306284e-05, + "loss": 0.0078, + "step": 663830 + }, + { + "epoch": 1.72, + "learning_rate": 4.188464439669138e-05, + "loss": 0.0071, + "step": 663840 + }, + { + "epoch": 1.72, + "learning_rate": 4.188075618031992e-05, + "loss": 0.0084, + "step": 663850 + }, + { + "epoch": 1.72, + "learning_rate": 4.187686796394845e-05, + "loss": 0.0115, + "step": 663860 + }, + { + "epoch": 1.72, + "learning_rate": 4.187297974757699e-05, + "loss": 0.0081, + "step": 663870 + }, + { + "epoch": 1.72, + "learning_rate": 4.186909153120552e-05, + "loss": 0.0084, + "step": 663880 + }, + { + "epoch": 1.72, + "learning_rate": 4.186520331483406e-05, + "loss": 0.0102, + "step": 663890 + }, + { + "epoch": 1.72, + "learning_rate": 4.186131509846259e-05, + "loss": 0.0067, + "step": 663900 + }, + { + "epoch": 1.72, + "learning_rate": 4.185742688209113e-05, + "loss": 0.0079, + "step": 663910 + }, + { + "epoch": 1.72, + "learning_rate": 4.185353866571967e-05, + "loss": 0.0104, + "step": 663920 + }, + { + "epoch": 1.72, + "learning_rate": 4.1849650449348204e-05, + "loss": 0.0093, + "step": 663930 + }, + { + "epoch": 1.72, + "learning_rate": 4.184576223297674e-05, + "loss": 0.0067, + "step": 663940 + }, + { + "epoch": 1.72, + "learning_rate": 4.1841874016605273e-05, + "loss": 0.0076, + "step": 663950 + }, + { + "epoch": 1.72, + "learning_rate": 4.183798580023381e-05, + "loss": 0.0068, + "step": 663960 + }, + { + "epoch": 1.72, + "learning_rate": 4.183409758386234e-05, + "loss": 0.0079, + "step": 663970 + }, + { + "epoch": 1.72, + "learning_rate": 4.183020936749088e-05, + "loss": 0.0081, + "step": 663980 + }, + { + "epoch": 1.72, + "learning_rate": 4.182632115111941e-05, + "loss": 0.0068, + "step": 663990 + }, + { + "epoch": 1.72, + "learning_rate": 4.1822432934747954e-05, + "loss": 0.0069, + "step": 664000 + }, + { + "epoch": 1.72, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.0050833625718951225, + "eval_runtime": 107.9937, + "eval_samples_per_second": 18.52, + "eval_steps_per_second": 4.63, + "step": 664000 + }, + { + "epoch": 1.72, + "learning_rate": 4.181854471837649e-05, + "loss": 0.0101, + "step": 664010 + }, + { + "epoch": 1.72, + "learning_rate": 4.1814656502005024e-05, + "loss": 0.0087, + "step": 664020 + }, + { + "epoch": 1.72, + "learning_rate": 4.181076828563356e-05, + "loss": 0.0086, + "step": 664030 + }, + { + "epoch": 1.72, + "learning_rate": 4.1806880069262094e-05, + "loss": 0.0108, + "step": 664040 + }, + { + "epoch": 1.72, + "learning_rate": 4.180299185289063e-05, + "loss": 0.0092, + "step": 664050 + }, + { + "epoch": 1.72, + "learning_rate": 4.179910363651916e-05, + "loss": 0.0067, + "step": 664060 + }, + { + "epoch": 1.72, + "learning_rate": 4.179521542014769e-05, + "loss": 0.0079, + "step": 664070 + }, + { + "epoch": 1.72, + "learning_rate": 4.1791327203776227e-05, + "loss": 0.0079, + "step": 664080 + }, + { + "epoch": 1.72, + "learning_rate": 4.178743898740476e-05, + "loss": 0.0077, + "step": 664090 + }, + { + "epoch": 1.72, + "learning_rate": 4.17835507710333e-05, + "loss": 0.0068, + "step": 664100 + }, + { + "epoch": 1.72, + "learning_rate": 4.177966255466184e-05, + "loss": 0.0065, + "step": 664110 + }, + { + "epoch": 1.72, + "learning_rate": 4.177577433829037e-05, + "loss": 0.0082, + "step": 664120 + }, + { + "epoch": 1.72, + "learning_rate": 4.177188612191891e-05, + "loss": 0.0058, + "step": 664130 + }, + { + "epoch": 1.72, + "learning_rate": 4.176799790554744e-05, + "loss": 0.0132, + "step": 664140 + }, + { + "epoch": 1.72, + "learning_rate": 4.176410968917598e-05, + "loss": 0.0088, + "step": 664150 + }, + { + "epoch": 1.72, + "learning_rate": 4.176022147280451e-05, + "loss": 0.0083, + "step": 664160 + }, + { + "epoch": 1.72, + "learning_rate": 4.175633325643305e-05, + "loss": 0.0071, + "step": 664170 + }, + { + "epoch": 1.72, + "learning_rate": 4.175244504006159e-05, + "loss": 0.0084, + "step": 664180 + }, + { + "epoch": 1.72, + "learning_rate": 4.1748556823690124e-05, + "loss": 0.0067, + "step": 664190 + }, + { + "epoch": 1.72, + "learning_rate": 4.174466860731866e-05, + "loss": 0.008, + "step": 664200 + }, + { + "epoch": 1.72, + "learning_rate": 4.174078039094719e-05, + "loss": 0.0092, + "step": 664210 + }, + { + "epoch": 1.72, + "learning_rate": 4.173689217457573e-05, + "loss": 0.0076, + "step": 664220 + }, + { + "epoch": 1.72, + "learning_rate": 4.173300395820426e-05, + "loss": 0.0078, + "step": 664230 + }, + { + "epoch": 1.72, + "learning_rate": 4.17291157418328e-05, + "loss": 0.0091, + "step": 664240 + }, + { + "epoch": 1.72, + "learning_rate": 4.172522752546133e-05, + "loss": 0.0136, + "step": 664250 + }, + { + "epoch": 1.72, + "learning_rate": 4.1721339309089874e-05, + "loss": 0.0069, + "step": 664260 + }, + { + "epoch": 1.72, + "learning_rate": 4.171745109271841e-05, + "loss": 0.0071, + "step": 664270 + }, + { + "epoch": 1.72, + "learning_rate": 4.1713562876346944e-05, + "loss": 0.0066, + "step": 664280 + }, + { + "epoch": 1.72, + "learning_rate": 4.170967465997548e-05, + "loss": 0.0114, + "step": 664290 + }, + { + "epoch": 1.72, + "learning_rate": 4.1705786443604014e-05, + "loss": 0.0105, + "step": 664300 + }, + { + "epoch": 1.72, + "learning_rate": 4.170189822723254e-05, + "loss": 0.0078, + "step": 664310 + }, + { + "epoch": 1.72, + "learning_rate": 4.169801001086108e-05, + "loss": 0.0086, + "step": 664320 + }, + { + "epoch": 1.72, + "learning_rate": 4.169412179448961e-05, + "loss": 0.0083, + "step": 664330 + }, + { + "epoch": 1.72, + "learning_rate": 4.1690233578118147e-05, + "loss": 0.0071, + "step": 664340 + }, + { + "epoch": 1.72, + "learning_rate": 4.168634536174668e-05, + "loss": 0.0069, + "step": 664350 + }, + { + "epoch": 1.72, + "learning_rate": 4.168245714537522e-05, + "loss": 0.0111, + "step": 664360 + }, + { + "epoch": 1.72, + "learning_rate": 4.167856892900376e-05, + "loss": 0.0065, + "step": 664370 + }, + { + "epoch": 1.72, + "learning_rate": 4.167468071263229e-05, + "loss": 0.012, + "step": 664380 + }, + { + "epoch": 1.72, + "learning_rate": 4.167079249626083e-05, + "loss": 0.008, + "step": 664390 + }, + { + "epoch": 1.72, + "learning_rate": 4.166690427988936e-05, + "loss": 0.0098, + "step": 664400 + }, + { + "epoch": 1.72, + "learning_rate": 4.16630160635179e-05, + "loss": 0.0059, + "step": 664410 + }, + { + "epoch": 1.72, + "learning_rate": 4.165912784714643e-05, + "loss": 0.0106, + "step": 664420 + }, + { + "epoch": 1.72, + "learning_rate": 4.165523963077497e-05, + "loss": 0.0097, + "step": 664430 + }, + { + "epoch": 1.72, + "learning_rate": 4.165135141440351e-05, + "loss": 0.0089, + "step": 664440 + }, + { + "epoch": 1.72, + "learning_rate": 4.1647463198032044e-05, + "loss": 0.0088, + "step": 664450 + }, + { + "epoch": 1.72, + "learning_rate": 4.164357498166058e-05, + "loss": 0.0081, + "step": 664460 + }, + { + "epoch": 1.72, + "learning_rate": 4.163968676528911e-05, + "loss": 0.0082, + "step": 664470 + }, + { + "epoch": 1.72, + "learning_rate": 4.163579854891765e-05, + "loss": 0.0092, + "step": 664480 + }, + { + "epoch": 1.72, + "learning_rate": 4.163191033254618e-05, + "loss": 0.0084, + "step": 664490 + }, + { + "epoch": 1.72, + "learning_rate": 4.162802211617472e-05, + "loss": 0.0061, + "step": 664500 + }, + { + "epoch": 1.72, + "learning_rate": 4.162413389980325e-05, + "loss": 0.007, + "step": 664510 + }, + { + "epoch": 1.72, + "learning_rate": 4.1620245683431794e-05, + "loss": 0.0059, + "step": 664520 + }, + { + "epoch": 1.72, + "learning_rate": 4.161635746706033e-05, + "loss": 0.0074, + "step": 664530 + }, + { + "epoch": 1.72, + "learning_rate": 4.1612469250688864e-05, + "loss": 0.0066, + "step": 664540 + }, + { + "epoch": 1.72, + "learning_rate": 4.16085810343174e-05, + "loss": 0.0058, + "step": 664550 + }, + { + "epoch": 1.72, + "learning_rate": 4.160469281794593e-05, + "loss": 0.0065, + "step": 664560 + }, + { + "epoch": 1.72, + "learning_rate": 4.160080460157446e-05, + "loss": 0.009, + "step": 664570 + }, + { + "epoch": 1.72, + "learning_rate": 4.1596916385203e-05, + "loss": 0.0076, + "step": 664580 + }, + { + "epoch": 1.72, + "learning_rate": 4.159302816883153e-05, + "loss": 0.0078, + "step": 664590 + }, + { + "epoch": 1.72, + "learning_rate": 4.1589139952460067e-05, + "loss": 0.0108, + "step": 664600 + }, + { + "epoch": 1.72, + "learning_rate": 4.15852517360886e-05, + "loss": 0.0056, + "step": 664610 + }, + { + "epoch": 1.72, + "learning_rate": 4.158136351971714e-05, + "loss": 0.0086, + "step": 664620 + }, + { + "epoch": 1.72, + "learning_rate": 4.157747530334568e-05, + "loss": 0.0103, + "step": 664630 + }, + { + "epoch": 1.72, + "learning_rate": 4.157358708697421e-05, + "loss": 0.006, + "step": 664640 + }, + { + "epoch": 1.72, + "learning_rate": 4.156969887060275e-05, + "loss": 0.01, + "step": 664650 + }, + { + "epoch": 1.72, + "learning_rate": 4.156581065423128e-05, + "loss": 0.0062, + "step": 664660 + }, + { + "epoch": 1.72, + "learning_rate": 4.156192243785982e-05, + "loss": 0.0079, + "step": 664670 + }, + { + "epoch": 1.72, + "learning_rate": 4.155803422148835e-05, + "loss": 0.0063, + "step": 664680 + }, + { + "epoch": 1.72, + "learning_rate": 4.155414600511689e-05, + "loss": 0.011, + "step": 664690 + }, + { + "epoch": 1.72, + "learning_rate": 4.155025778874542e-05, + "loss": 0.0065, + "step": 664700 + }, + { + "epoch": 1.72, + "learning_rate": 4.1546369572373964e-05, + "loss": 0.0094, + "step": 664710 + }, + { + "epoch": 1.72, + "learning_rate": 4.15424813560025e-05, + "loss": 0.0092, + "step": 664720 + }, + { + "epoch": 1.72, + "learning_rate": 4.153859313963103e-05, + "loss": 0.0067, + "step": 664730 + }, + { + "epoch": 1.72, + "learning_rate": 4.153470492325957e-05, + "loss": 0.0085, + "step": 664740 + }, + { + "epoch": 1.72, + "learning_rate": 4.15308167068881e-05, + "loss": 0.009, + "step": 664750 + }, + { + "epoch": 1.72, + "learning_rate": 4.152692849051664e-05, + "loss": 0.0066, + "step": 664760 + }, + { + "epoch": 1.72, + "learning_rate": 4.152304027414517e-05, + "loss": 0.0094, + "step": 664770 + }, + { + "epoch": 1.72, + "learning_rate": 4.151915205777371e-05, + "loss": 0.0068, + "step": 664780 + }, + { + "epoch": 1.72, + "learning_rate": 4.151526384140225e-05, + "loss": 0.0075, + "step": 664790 + }, + { + "epoch": 1.72, + "learning_rate": 4.1511375625030784e-05, + "loss": 0.0086, + "step": 664800 + }, + { + "epoch": 1.72, + "learning_rate": 4.150748740865931e-05, + "loss": 0.0079, + "step": 664810 + }, + { + "epoch": 1.72, + "learning_rate": 4.150359919228785e-05, + "loss": 0.0073, + "step": 664820 + }, + { + "epoch": 1.72, + "learning_rate": 4.149971097591638e-05, + "loss": 0.0097, + "step": 664830 + }, + { + "epoch": 1.72, + "learning_rate": 4.149582275954492e-05, + "loss": 0.0118, + "step": 664840 + }, + { + "epoch": 1.72, + "learning_rate": 4.149193454317345e-05, + "loss": 0.0073, + "step": 664850 + }, + { + "epoch": 1.72, + "learning_rate": 4.1488046326801986e-05, + "loss": 0.009, + "step": 664860 + }, + { + "epoch": 1.72, + "learning_rate": 4.148415811043052e-05, + "loss": 0.0076, + "step": 664870 + }, + { + "epoch": 1.72, + "learning_rate": 4.1480269894059056e-05, + "loss": 0.0069, + "step": 664880 + }, + { + "epoch": 1.72, + "learning_rate": 4.14763816776876e-05, + "loss": 0.0072, + "step": 664890 + }, + { + "epoch": 1.72, + "learning_rate": 4.147249346131613e-05, + "loss": 0.009, + "step": 664900 + }, + { + "epoch": 1.72, + "learning_rate": 4.146860524494467e-05, + "loss": 0.0118, + "step": 664910 + }, + { + "epoch": 1.72, + "learning_rate": 4.14647170285732e-05, + "loss": 0.0091, + "step": 664920 + }, + { + "epoch": 1.72, + "learning_rate": 4.146082881220174e-05, + "loss": 0.0112, + "step": 664930 + }, + { + "epoch": 1.72, + "learning_rate": 4.145694059583027e-05, + "loss": 0.0082, + "step": 664940 + }, + { + "epoch": 1.72, + "learning_rate": 4.145305237945881e-05, + "loss": 0.007, + "step": 664950 + }, + { + "epoch": 1.72, + "learning_rate": 4.144916416308734e-05, + "loss": 0.0095, + "step": 664960 + }, + { + "epoch": 1.72, + "learning_rate": 4.1445275946715883e-05, + "loss": 0.0092, + "step": 664970 + }, + { + "epoch": 1.72, + "learning_rate": 4.144138773034442e-05, + "loss": 0.0082, + "step": 664980 + }, + { + "epoch": 1.72, + "learning_rate": 4.143749951397295e-05, + "loss": 0.0077, + "step": 664990 + }, + { + "epoch": 1.72, + "learning_rate": 4.143361129760149e-05, + "loss": 0.0068, + "step": 665000 + }, + { + "epoch": 1.72, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.004966807551681995, + "eval_runtime": 107.8902, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 665000 + }, + { + "epoch": 1.72, + "learning_rate": 4.142972308123002e-05, + "loss": 0.0067, + "step": 665010 + }, + { + "epoch": 1.72, + "learning_rate": 4.142583486485856e-05, + "loss": 0.0095, + "step": 665020 + }, + { + "epoch": 1.72, + "learning_rate": 4.142194664848709e-05, + "loss": 0.0089, + "step": 665030 + }, + { + "epoch": 1.72, + "learning_rate": 4.141805843211563e-05, + "loss": 0.0061, + "step": 665040 + }, + { + "epoch": 1.72, + "learning_rate": 4.1414170215744156e-05, + "loss": 0.0104, + "step": 665050 + }, + { + "epoch": 1.72, + "learning_rate": 4.141028199937269e-05, + "loss": 0.0076, + "step": 665060 + }, + { + "epoch": 1.72, + "learning_rate": 4.140639378300123e-05, + "loss": 0.0071, + "step": 665070 + }, + { + "epoch": 1.72, + "learning_rate": 4.140250556662977e-05, + "loss": 0.0062, + "step": 665080 + }, + { + "epoch": 1.72, + "learning_rate": 4.13986173502583e-05, + "loss": 0.0087, + "step": 665090 + }, + { + "epoch": 1.72, + "learning_rate": 4.139472913388684e-05, + "loss": 0.0062, + "step": 665100 + }, + { + "epoch": 1.72, + "learning_rate": 4.139084091751537e-05, + "loss": 0.0091, + "step": 665110 + }, + { + "epoch": 1.72, + "learning_rate": 4.1386952701143906e-05, + "loss": 0.0074, + "step": 665120 + }, + { + "epoch": 1.72, + "learning_rate": 4.138306448477244e-05, + "loss": 0.0089, + "step": 665130 + }, + { + "epoch": 1.72, + "learning_rate": 4.1379176268400976e-05, + "loss": 0.0077, + "step": 665140 + }, + { + "epoch": 1.72, + "learning_rate": 4.137528805202952e-05, + "loss": 0.0075, + "step": 665150 + }, + { + "epoch": 1.72, + "learning_rate": 4.137139983565805e-05, + "loss": 0.0071, + "step": 665160 + }, + { + "epoch": 1.72, + "learning_rate": 4.136751161928659e-05, + "loss": 0.0089, + "step": 665170 + }, + { + "epoch": 1.72, + "learning_rate": 4.136362340291512e-05, + "loss": 0.0083, + "step": 665180 + }, + { + "epoch": 1.72, + "learning_rate": 4.135973518654366e-05, + "loss": 0.0092, + "step": 665190 + }, + { + "epoch": 1.72, + "learning_rate": 4.135584697017219e-05, + "loss": 0.0095, + "step": 665200 + }, + { + "epoch": 1.72, + "learning_rate": 4.135195875380073e-05, + "loss": 0.0084, + "step": 665210 + }, + { + "epoch": 1.72, + "learning_rate": 4.134807053742926e-05, + "loss": 0.0079, + "step": 665220 + }, + { + "epoch": 1.72, + "learning_rate": 4.1344182321057803e-05, + "loss": 0.0134, + "step": 665230 + }, + { + "epoch": 1.72, + "learning_rate": 4.134029410468634e-05, + "loss": 0.0083, + "step": 665240 + }, + { + "epoch": 1.72, + "learning_rate": 4.133640588831487e-05, + "loss": 0.0071, + "step": 665250 + }, + { + "epoch": 1.72, + "learning_rate": 4.133251767194341e-05, + "loss": 0.0056, + "step": 665260 + }, + { + "epoch": 1.72, + "learning_rate": 4.132862945557194e-05, + "loss": 0.0082, + "step": 665270 + }, + { + "epoch": 1.72, + "learning_rate": 4.132474123920048e-05, + "loss": 0.009, + "step": 665280 + }, + { + "epoch": 1.72, + "learning_rate": 4.132085302282901e-05, + "loss": 0.0051, + "step": 665290 + }, + { + "epoch": 1.72, + "learning_rate": 4.131696480645754e-05, + "loss": 0.0077, + "step": 665300 + }, + { + "epoch": 1.72, + "learning_rate": 4.1313076590086076e-05, + "loss": 0.0069, + "step": 665310 + }, + { + "epoch": 1.72, + "learning_rate": 4.130918837371461e-05, + "loss": 0.0076, + "step": 665320 + }, + { + "epoch": 1.72, + "learning_rate": 4.130530015734315e-05, + "loss": 0.0052, + "step": 665330 + }, + { + "epoch": 1.72, + "learning_rate": 4.130141194097169e-05, + "loss": 0.0096, + "step": 665340 + }, + { + "epoch": 1.72, + "learning_rate": 4.129752372460022e-05, + "loss": 0.0102, + "step": 665350 + }, + { + "epoch": 1.72, + "learning_rate": 4.129363550822876e-05, + "loss": 0.0086, + "step": 665360 + }, + { + "epoch": 1.72, + "learning_rate": 4.128974729185729e-05, + "loss": 0.0075, + "step": 665370 + }, + { + "epoch": 1.72, + "learning_rate": 4.1285859075485826e-05, + "loss": 0.0059, + "step": 665380 + }, + { + "epoch": 1.72, + "learning_rate": 4.128197085911436e-05, + "loss": 0.0079, + "step": 665390 + }, + { + "epoch": 1.72, + "learning_rate": 4.1278082642742896e-05, + "loss": 0.0077, + "step": 665400 + }, + { + "epoch": 1.72, + "learning_rate": 4.127419442637144e-05, + "loss": 0.0075, + "step": 665410 + }, + { + "epoch": 1.72, + "learning_rate": 4.127030620999997e-05, + "loss": 0.008, + "step": 665420 + }, + { + "epoch": 1.72, + "learning_rate": 4.126641799362851e-05, + "loss": 0.011, + "step": 665430 + }, + { + "epoch": 1.72, + "learning_rate": 4.126252977725704e-05, + "loss": 0.0068, + "step": 665440 + }, + { + "epoch": 1.72, + "learning_rate": 4.125864156088558e-05, + "loss": 0.0065, + "step": 665450 + }, + { + "epoch": 1.72, + "learning_rate": 4.125475334451411e-05, + "loss": 0.0066, + "step": 665460 + }, + { + "epoch": 1.72, + "learning_rate": 4.125086512814265e-05, + "loss": 0.0082, + "step": 665470 + }, + { + "epoch": 1.73, + "learning_rate": 4.124697691177118e-05, + "loss": 0.0071, + "step": 665480 + }, + { + "epoch": 1.73, + "learning_rate": 4.124308869539972e-05, + "loss": 0.0082, + "step": 665490 + }, + { + "epoch": 1.73, + "learning_rate": 4.123920047902826e-05, + "loss": 0.0099, + "step": 665500 + }, + { + "epoch": 1.73, + "learning_rate": 4.123531226265679e-05, + "loss": 0.009, + "step": 665510 + }, + { + "epoch": 1.73, + "learning_rate": 4.123142404628533e-05, + "loss": 0.0061, + "step": 665520 + }, + { + "epoch": 1.73, + "learning_rate": 4.122753582991386e-05, + "loss": 0.0067, + "step": 665530 + }, + { + "epoch": 1.73, + "learning_rate": 4.12236476135424e-05, + "loss": 0.0084, + "step": 665540 + }, + { + "epoch": 1.73, + "learning_rate": 4.1219759397170926e-05, + "loss": 0.0073, + "step": 665550 + }, + { + "epoch": 1.73, + "learning_rate": 4.121587118079946e-05, + "loss": 0.0065, + "step": 665560 + }, + { + "epoch": 1.73, + "learning_rate": 4.1211982964427996e-05, + "loss": 0.0101, + "step": 665570 + }, + { + "epoch": 1.73, + "learning_rate": 4.120809474805653e-05, + "loss": 0.0061, + "step": 665580 + }, + { + "epoch": 1.73, + "learning_rate": 4.120420653168507e-05, + "loss": 0.0073, + "step": 665590 + }, + { + "epoch": 1.73, + "learning_rate": 4.120031831531361e-05, + "loss": 0.0102, + "step": 665600 + }, + { + "epoch": 1.73, + "learning_rate": 4.119643009894214e-05, + "loss": 0.0089, + "step": 665610 + }, + { + "epoch": 1.73, + "learning_rate": 4.1192541882570677e-05, + "loss": 0.007, + "step": 665620 + }, + { + "epoch": 1.73, + "learning_rate": 4.118865366619921e-05, + "loss": 0.0091, + "step": 665630 + }, + { + "epoch": 1.73, + "learning_rate": 4.1184765449827746e-05, + "loss": 0.0061, + "step": 665640 + }, + { + "epoch": 1.73, + "learning_rate": 4.118087723345628e-05, + "loss": 0.0074, + "step": 665650 + }, + { + "epoch": 1.73, + "learning_rate": 4.1176989017084816e-05, + "loss": 0.0077, + "step": 665660 + }, + { + "epoch": 1.73, + "learning_rate": 4.117310080071336e-05, + "loss": 0.0089, + "step": 665670 + }, + { + "epoch": 1.73, + "learning_rate": 4.116921258434189e-05, + "loss": 0.0075, + "step": 665680 + }, + { + "epoch": 1.73, + "learning_rate": 4.116532436797043e-05, + "loss": 0.0074, + "step": 665690 + }, + { + "epoch": 1.73, + "learning_rate": 4.116143615159896e-05, + "loss": 0.0084, + "step": 665700 + }, + { + "epoch": 1.73, + "learning_rate": 4.11575479352275e-05, + "loss": 0.0082, + "step": 665710 + }, + { + "epoch": 1.73, + "learning_rate": 4.115365971885603e-05, + "loss": 0.0067, + "step": 665720 + }, + { + "epoch": 1.73, + "learning_rate": 4.114977150248457e-05, + "loss": 0.0071, + "step": 665730 + }, + { + "epoch": 1.73, + "learning_rate": 4.11458832861131e-05, + "loss": 0.0069, + "step": 665740 + }, + { + "epoch": 1.73, + "learning_rate": 4.114199506974164e-05, + "loss": 0.0069, + "step": 665750 + }, + { + "epoch": 1.73, + "learning_rate": 4.113810685337018e-05, + "loss": 0.0079, + "step": 665760 + }, + { + "epoch": 1.73, + "learning_rate": 4.113421863699871e-05, + "loss": 0.0071, + "step": 665770 + }, + { + "epoch": 1.73, + "learning_rate": 4.113033042062725e-05, + "loss": 0.0057, + "step": 665780 + }, + { + "epoch": 1.73, + "learning_rate": 4.112644220425578e-05, + "loss": 0.0054, + "step": 665790 + }, + { + "epoch": 1.73, + "learning_rate": 4.112255398788431e-05, + "loss": 0.0112, + "step": 665800 + }, + { + "epoch": 1.73, + "learning_rate": 4.1118665771512846e-05, + "loss": 0.0096, + "step": 665810 + }, + { + "epoch": 1.73, + "learning_rate": 4.111477755514138e-05, + "loss": 0.0087, + "step": 665820 + }, + { + "epoch": 1.73, + "learning_rate": 4.1110889338769915e-05, + "loss": 0.0088, + "step": 665830 + }, + { + "epoch": 1.73, + "learning_rate": 4.110700112239845e-05, + "loss": 0.0068, + "step": 665840 + }, + { + "epoch": 1.73, + "learning_rate": 4.110311290602699e-05, + "loss": 0.0099, + "step": 665850 + }, + { + "epoch": 1.73, + "learning_rate": 4.109922468965553e-05, + "loss": 0.0083, + "step": 665860 + }, + { + "epoch": 1.73, + "learning_rate": 4.109533647328406e-05, + "loss": 0.0072, + "step": 665870 + }, + { + "epoch": 1.73, + "learning_rate": 4.1091448256912597e-05, + "loss": 0.0089, + "step": 665880 + }, + { + "epoch": 1.73, + "learning_rate": 4.108756004054113e-05, + "loss": 0.009, + "step": 665890 + }, + { + "epoch": 1.73, + "learning_rate": 4.1083671824169666e-05, + "loss": 0.0101, + "step": 665900 + }, + { + "epoch": 1.73, + "learning_rate": 4.10797836077982e-05, + "loss": 0.0058, + "step": 665910 + }, + { + "epoch": 1.73, + "learning_rate": 4.1075895391426736e-05, + "loss": 0.0095, + "step": 665920 + }, + { + "epoch": 1.73, + "learning_rate": 4.107200717505528e-05, + "loss": 0.0072, + "step": 665930 + }, + { + "epoch": 1.73, + "learning_rate": 4.106811895868381e-05, + "loss": 0.009, + "step": 665940 + }, + { + "epoch": 1.73, + "learning_rate": 4.106423074231235e-05, + "loss": 0.0085, + "step": 665950 + }, + { + "epoch": 1.73, + "learning_rate": 4.106034252594088e-05, + "loss": 0.0097, + "step": 665960 + }, + { + "epoch": 1.73, + "learning_rate": 4.105645430956942e-05, + "loss": 0.009, + "step": 665970 + }, + { + "epoch": 1.73, + "learning_rate": 4.105256609319795e-05, + "loss": 0.0086, + "step": 665980 + }, + { + "epoch": 1.73, + "learning_rate": 4.104867787682649e-05, + "loss": 0.0063, + "step": 665990 + }, + { + "epoch": 1.73, + "learning_rate": 4.104478966045502e-05, + "loss": 0.0063, + "step": 666000 + }, + { + "epoch": 1.73, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.005011801607906818, + "eval_runtime": 107.759, + "eval_samples_per_second": 18.56, + "eval_steps_per_second": 4.64, + "step": 666000 + }, + { + "epoch": 1.73, + "learning_rate": 4.1040901444083557e-05, + "loss": 0.0064, + "step": 666010 + }, + { + "epoch": 1.73, + "learning_rate": 4.10370132277121e-05, + "loss": 0.0094, + "step": 666020 + }, + { + "epoch": 1.73, + "learning_rate": 4.103312501134063e-05, + "loss": 0.0114, + "step": 666030 + }, + { + "epoch": 1.73, + "learning_rate": 4.102923679496917e-05, + "loss": 0.0072, + "step": 666040 + }, + { + "epoch": 1.73, + "learning_rate": 4.1025348578597696e-05, + "loss": 0.0058, + "step": 666050 + }, + { + "epoch": 1.73, + "learning_rate": 4.102146036222623e-05, + "loss": 0.0075, + "step": 666060 + }, + { + "epoch": 1.73, + "learning_rate": 4.1017572145854766e-05, + "loss": 0.0094, + "step": 666070 + }, + { + "epoch": 1.73, + "learning_rate": 4.10136839294833e-05, + "loss": 0.01, + "step": 666080 + }, + { + "epoch": 1.73, + "learning_rate": 4.1009795713111835e-05, + "loss": 0.0104, + "step": 666090 + }, + { + "epoch": 1.73, + "learning_rate": 4.100590749674037e-05, + "loss": 0.0071, + "step": 666100 + }, + { + "epoch": 1.73, + "learning_rate": 4.1002019280368905e-05, + "loss": 0.0085, + "step": 666110 + }, + { + "epoch": 1.73, + "learning_rate": 4.099813106399745e-05, + "loss": 0.0076, + "step": 666120 + }, + { + "epoch": 1.73, + "learning_rate": 4.099424284762598e-05, + "loss": 0.0066, + "step": 666130 + }, + { + "epoch": 1.73, + "learning_rate": 4.0990354631254516e-05, + "loss": 0.0073, + "step": 666140 + }, + { + "epoch": 1.73, + "learning_rate": 4.098646641488305e-05, + "loss": 0.0069, + "step": 666150 + }, + { + "epoch": 1.73, + "learning_rate": 4.0982578198511586e-05, + "loss": 0.0063, + "step": 666160 + }, + { + "epoch": 1.73, + "learning_rate": 4.097868998214012e-05, + "loss": 0.0083, + "step": 666170 + }, + { + "epoch": 1.73, + "learning_rate": 4.0974801765768656e-05, + "loss": 0.0073, + "step": 666180 + }, + { + "epoch": 1.73, + "learning_rate": 4.097091354939719e-05, + "loss": 0.0079, + "step": 666190 + }, + { + "epoch": 1.73, + "learning_rate": 4.096702533302573e-05, + "loss": 0.008, + "step": 666200 + }, + { + "epoch": 1.73, + "learning_rate": 4.096313711665427e-05, + "loss": 0.0091, + "step": 666210 + }, + { + "epoch": 1.73, + "learning_rate": 4.09592489002828e-05, + "loss": 0.0071, + "step": 666220 + }, + { + "epoch": 1.73, + "learning_rate": 4.095536068391134e-05, + "loss": 0.0056, + "step": 666230 + }, + { + "epoch": 1.73, + "learning_rate": 4.095147246753987e-05, + "loss": 0.0057, + "step": 666240 + }, + { + "epoch": 1.73, + "learning_rate": 4.094758425116841e-05, + "loss": 0.0108, + "step": 666250 + }, + { + "epoch": 1.73, + "learning_rate": 4.094369603479694e-05, + "loss": 0.0062, + "step": 666260 + }, + { + "epoch": 1.73, + "learning_rate": 4.0939807818425476e-05, + "loss": 0.0075, + "step": 666270 + }, + { + "epoch": 1.73, + "learning_rate": 4.093591960205402e-05, + "loss": 0.0062, + "step": 666280 + }, + { + "epoch": 1.73, + "learning_rate": 4.093203138568255e-05, + "loss": 0.0075, + "step": 666290 + }, + { + "epoch": 1.73, + "learning_rate": 4.092814316931108e-05, + "loss": 0.0076, + "step": 666300 + }, + { + "epoch": 1.73, + "learning_rate": 4.0924254952939616e-05, + "loss": 0.0074, + "step": 666310 + }, + { + "epoch": 1.73, + "learning_rate": 4.092036673656815e-05, + "loss": 0.0077, + "step": 666320 + }, + { + "epoch": 1.73, + "learning_rate": 4.0916478520196686e-05, + "loss": 0.0054, + "step": 666330 + }, + { + "epoch": 1.73, + "learning_rate": 4.091259030382522e-05, + "loss": 0.0085, + "step": 666340 + }, + { + "epoch": 1.73, + "learning_rate": 4.0908702087453755e-05, + "loss": 0.0073, + "step": 666350 + }, + { + "epoch": 1.73, + "learning_rate": 4.090481387108229e-05, + "loss": 0.0089, + "step": 666360 + }, + { + "epoch": 1.73, + "learning_rate": 4.0900925654710825e-05, + "loss": 0.0069, + "step": 666370 + }, + { + "epoch": 1.73, + "learning_rate": 4.089703743833937e-05, + "loss": 0.006, + "step": 666380 + }, + { + "epoch": 1.73, + "learning_rate": 4.08931492219679e-05, + "loss": 0.0069, + "step": 666390 + }, + { + "epoch": 1.73, + "learning_rate": 4.0889261005596436e-05, + "loss": 0.0092, + "step": 666400 + }, + { + "epoch": 1.73, + "learning_rate": 4.088537278922497e-05, + "loss": 0.0079, + "step": 666410 + }, + { + "epoch": 1.73, + "learning_rate": 4.0881484572853506e-05, + "loss": 0.0095, + "step": 666420 + }, + { + "epoch": 1.73, + "learning_rate": 4.087759635648204e-05, + "loss": 0.0104, + "step": 666430 + }, + { + "epoch": 1.73, + "learning_rate": 4.0873708140110576e-05, + "loss": 0.0088, + "step": 666440 + }, + { + "epoch": 1.73, + "learning_rate": 4.086981992373911e-05, + "loss": 0.0074, + "step": 666450 + }, + { + "epoch": 1.73, + "learning_rate": 4.086593170736765e-05, + "loss": 0.0082, + "step": 666460 + }, + { + "epoch": 1.73, + "learning_rate": 4.086204349099619e-05, + "loss": 0.01, + "step": 666470 + }, + { + "epoch": 1.73, + "learning_rate": 4.085815527462472e-05, + "loss": 0.0075, + "step": 666480 + }, + { + "epoch": 1.73, + "learning_rate": 4.085426705825326e-05, + "loss": 0.0066, + "step": 666490 + }, + { + "epoch": 1.73, + "learning_rate": 4.085037884188179e-05, + "loss": 0.0061, + "step": 666500 + }, + { + "epoch": 1.73, + "learning_rate": 4.084649062551033e-05, + "loss": 0.0071, + "step": 666510 + }, + { + "epoch": 1.73, + "learning_rate": 4.084260240913886e-05, + "loss": 0.0057, + "step": 666520 + }, + { + "epoch": 1.73, + "learning_rate": 4.0838714192767396e-05, + "loss": 0.0074, + "step": 666530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0834825976395925e-05, + "loss": 0.0063, + "step": 666540 + }, + { + "epoch": 1.73, + "learning_rate": 4.083093776002446e-05, + "loss": 0.0079, + "step": 666550 + }, + { + "epoch": 1.73, + "learning_rate": 4.0827049543653e-05, + "loss": 0.006, + "step": 666560 + }, + { + "epoch": 1.73, + "learning_rate": 4.0823161327281536e-05, + "loss": 0.0119, + "step": 666570 + }, + { + "epoch": 1.73, + "learning_rate": 4.081927311091007e-05, + "loss": 0.0088, + "step": 666580 + }, + { + "epoch": 1.73, + "learning_rate": 4.0815384894538606e-05, + "loss": 0.0071, + "step": 666590 + }, + { + "epoch": 1.73, + "learning_rate": 4.081149667816714e-05, + "loss": 0.0056, + "step": 666600 + }, + { + "epoch": 1.73, + "learning_rate": 4.0807608461795675e-05, + "loss": 0.006, + "step": 666610 + }, + { + "epoch": 1.73, + "learning_rate": 4.080372024542421e-05, + "loss": 0.0078, + "step": 666620 + }, + { + "epoch": 1.73, + "learning_rate": 4.0799832029052745e-05, + "loss": 0.0066, + "step": 666630 + }, + { + "epoch": 1.73, + "learning_rate": 4.079594381268129e-05, + "loss": 0.0082, + "step": 666640 + }, + { + "epoch": 1.73, + "learning_rate": 4.079205559630982e-05, + "loss": 0.0061, + "step": 666650 + }, + { + "epoch": 1.73, + "learning_rate": 4.0788167379938356e-05, + "loss": 0.0072, + "step": 666660 + }, + { + "epoch": 1.73, + "learning_rate": 4.078427916356689e-05, + "loss": 0.0104, + "step": 666670 + }, + { + "epoch": 1.73, + "learning_rate": 4.0780390947195426e-05, + "loss": 0.0073, + "step": 666680 + }, + { + "epoch": 1.73, + "learning_rate": 4.077650273082396e-05, + "loss": 0.0074, + "step": 666690 + }, + { + "epoch": 1.73, + "learning_rate": 4.0772614514452496e-05, + "loss": 0.0072, + "step": 666700 + }, + { + "epoch": 1.73, + "learning_rate": 4.076872629808103e-05, + "loss": 0.0098, + "step": 666710 + }, + { + "epoch": 1.73, + "learning_rate": 4.076483808170957e-05, + "loss": 0.0083, + "step": 666720 + }, + { + "epoch": 1.73, + "learning_rate": 4.076094986533811e-05, + "loss": 0.0082, + "step": 666730 + }, + { + "epoch": 1.73, + "learning_rate": 4.075706164896664e-05, + "loss": 0.0085, + "step": 666740 + }, + { + "epoch": 1.73, + "learning_rate": 4.075317343259518e-05, + "loss": 0.0095, + "step": 666750 + }, + { + "epoch": 1.73, + "learning_rate": 4.074928521622371e-05, + "loss": 0.0084, + "step": 666760 + }, + { + "epoch": 1.73, + "learning_rate": 4.074539699985225e-05, + "loss": 0.0087, + "step": 666770 + }, + { + "epoch": 1.73, + "learning_rate": 4.074150878348078e-05, + "loss": 0.0065, + "step": 666780 + }, + { + "epoch": 1.73, + "learning_rate": 4.073762056710931e-05, + "loss": 0.0096, + "step": 666790 + }, + { + "epoch": 1.73, + "learning_rate": 4.0733732350737844e-05, + "loss": 0.0084, + "step": 666800 + }, + { + "epoch": 1.73, + "learning_rate": 4.072984413436638e-05, + "loss": 0.0084, + "step": 666810 + }, + { + "epoch": 1.73, + "learning_rate": 4.072595591799492e-05, + "loss": 0.0053, + "step": 666820 + }, + { + "epoch": 1.73, + "learning_rate": 4.0722067701623456e-05, + "loss": 0.0065, + "step": 666830 + }, + { + "epoch": 1.73, + "learning_rate": 4.071817948525199e-05, + "loss": 0.0084, + "step": 666840 + }, + { + "epoch": 1.73, + "learning_rate": 4.0714291268880526e-05, + "loss": 0.0067, + "step": 666850 + }, + { + "epoch": 1.73, + "learning_rate": 4.071040305250906e-05, + "loss": 0.007, + "step": 666860 + }, + { + "epoch": 1.73, + "learning_rate": 4.0706514836137595e-05, + "loss": 0.0064, + "step": 666870 + }, + { + "epoch": 1.73, + "learning_rate": 4.070262661976613e-05, + "loss": 0.0084, + "step": 666880 + }, + { + "epoch": 1.73, + "learning_rate": 4.0698738403394665e-05, + "loss": 0.0076, + "step": 666890 + }, + { + "epoch": 1.73, + "learning_rate": 4.069485018702321e-05, + "loss": 0.0104, + "step": 666900 + }, + { + "epoch": 1.73, + "learning_rate": 4.069096197065174e-05, + "loss": 0.0063, + "step": 666910 + }, + { + "epoch": 1.73, + "learning_rate": 4.0687073754280276e-05, + "loss": 0.0071, + "step": 666920 + }, + { + "epoch": 1.73, + "learning_rate": 4.068318553790881e-05, + "loss": 0.0143, + "step": 666930 + }, + { + "epoch": 1.73, + "learning_rate": 4.0679297321537346e-05, + "loss": 0.008, + "step": 666940 + }, + { + "epoch": 1.73, + "learning_rate": 4.067540910516588e-05, + "loss": 0.0089, + "step": 666950 + }, + { + "epoch": 1.73, + "learning_rate": 4.0671520888794416e-05, + "loss": 0.0095, + "step": 666960 + }, + { + "epoch": 1.73, + "learning_rate": 4.066763267242295e-05, + "loss": 0.0065, + "step": 666970 + }, + { + "epoch": 1.73, + "learning_rate": 4.066374445605149e-05, + "loss": 0.009, + "step": 666980 + }, + { + "epoch": 1.73, + "learning_rate": 4.065985623968003e-05, + "loss": 0.0066, + "step": 666990 + }, + { + "epoch": 1.73, + "learning_rate": 4.065596802330856e-05, + "loss": 0.0083, + "step": 667000 + }, + { + "epoch": 1.73, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.005013938993215561, + "eval_runtime": 107.9123, + "eval_samples_per_second": 18.534, + "eval_steps_per_second": 4.633, + "step": 667000 + }, + { + "epoch": 1.73, + "learning_rate": 4.06520798069371e-05, + "loss": 0.0077, + "step": 667010 + }, + { + "epoch": 1.73, + "learning_rate": 4.064819159056563e-05, + "loss": 0.0072, + "step": 667020 + }, + { + "epoch": 1.73, + "learning_rate": 4.0644303374194167e-05, + "loss": 0.0095, + "step": 667030 + }, + { + "epoch": 1.73, + "learning_rate": 4.0640415157822695e-05, + "loss": 0.0068, + "step": 667040 + }, + { + "epoch": 1.73, + "learning_rate": 4.063652694145123e-05, + "loss": 0.0068, + "step": 667050 + }, + { + "epoch": 1.73, + "learning_rate": 4.0632638725079764e-05, + "loss": 0.0079, + "step": 667060 + }, + { + "epoch": 1.73, + "learning_rate": 4.06287505087083e-05, + "loss": 0.0094, + "step": 667070 + }, + { + "epoch": 1.73, + "learning_rate": 4.062486229233684e-05, + "loss": 0.0073, + "step": 667080 + }, + { + "epoch": 1.73, + "learning_rate": 4.0620974075965376e-05, + "loss": 0.0073, + "step": 667090 + }, + { + "epoch": 1.73, + "learning_rate": 4.061708585959391e-05, + "loss": 0.0056, + "step": 667100 + }, + { + "epoch": 1.73, + "learning_rate": 4.0613197643222445e-05, + "loss": 0.0104, + "step": 667110 + }, + { + "epoch": 1.73, + "learning_rate": 4.060930942685098e-05, + "loss": 0.0081, + "step": 667120 + }, + { + "epoch": 1.73, + "learning_rate": 4.0605421210479515e-05, + "loss": 0.0069, + "step": 667130 + }, + { + "epoch": 1.73, + "learning_rate": 4.060153299410805e-05, + "loss": 0.0053, + "step": 667140 + }, + { + "epoch": 1.73, + "learning_rate": 4.0597644777736585e-05, + "loss": 0.0073, + "step": 667150 + }, + { + "epoch": 1.73, + "learning_rate": 4.0593756561365127e-05, + "loss": 0.011, + "step": 667160 + }, + { + "epoch": 1.73, + "learning_rate": 4.058986834499366e-05, + "loss": 0.0113, + "step": 667170 + }, + { + "epoch": 1.73, + "learning_rate": 4.0585980128622196e-05, + "loss": 0.0082, + "step": 667180 + }, + { + "epoch": 1.73, + "learning_rate": 4.058209191225073e-05, + "loss": 0.0089, + "step": 667190 + }, + { + "epoch": 1.73, + "learning_rate": 4.0578203695879266e-05, + "loss": 0.0094, + "step": 667200 + }, + { + "epoch": 1.73, + "learning_rate": 4.05743154795078e-05, + "loss": 0.0066, + "step": 667210 + }, + { + "epoch": 1.73, + "learning_rate": 4.0570427263136336e-05, + "loss": 0.0077, + "step": 667220 + }, + { + "epoch": 1.73, + "learning_rate": 4.056653904676487e-05, + "loss": 0.0077, + "step": 667230 + }, + { + "epoch": 1.73, + "learning_rate": 4.056265083039341e-05, + "loss": 0.0082, + "step": 667240 + }, + { + "epoch": 1.73, + "learning_rate": 4.055876261402195e-05, + "loss": 0.0082, + "step": 667250 + }, + { + "epoch": 1.73, + "learning_rate": 4.055487439765048e-05, + "loss": 0.0075, + "step": 667260 + }, + { + "epoch": 1.73, + "learning_rate": 4.055098618127902e-05, + "loss": 0.0074, + "step": 667270 + }, + { + "epoch": 1.73, + "learning_rate": 4.054709796490755e-05, + "loss": 0.0065, + "step": 667280 + }, + { + "epoch": 1.73, + "learning_rate": 4.054320974853608e-05, + "loss": 0.0093, + "step": 667290 + }, + { + "epoch": 1.73, + "learning_rate": 4.0539321532164615e-05, + "loss": 0.0093, + "step": 667300 + }, + { + "epoch": 1.73, + "learning_rate": 4.053543331579315e-05, + "loss": 0.0129, + "step": 667310 + }, + { + "epoch": 1.73, + "learning_rate": 4.0531545099421684e-05, + "loss": 0.0105, + "step": 667320 + }, + { + "epoch": 1.73, + "learning_rate": 4.052765688305022e-05, + "loss": 0.0096, + "step": 667330 + }, + { + "epoch": 1.73, + "learning_rate": 4.052376866667876e-05, + "loss": 0.0091, + "step": 667340 + }, + { + "epoch": 1.73, + "learning_rate": 4.0519880450307296e-05, + "loss": 0.009, + "step": 667350 + }, + { + "epoch": 1.73, + "learning_rate": 4.051599223393583e-05, + "loss": 0.0086, + "step": 667360 + }, + { + "epoch": 1.73, + "learning_rate": 4.0512104017564365e-05, + "loss": 0.0083, + "step": 667370 + }, + { + "epoch": 1.73, + "learning_rate": 4.05082158011929e-05, + "loss": 0.008, + "step": 667380 + }, + { + "epoch": 1.73, + "learning_rate": 4.0504327584821435e-05, + "loss": 0.0066, + "step": 667390 + }, + { + "epoch": 1.73, + "learning_rate": 4.050043936844997e-05, + "loss": 0.0063, + "step": 667400 + }, + { + "epoch": 1.73, + "learning_rate": 4.0496551152078505e-05, + "loss": 0.0062, + "step": 667410 + }, + { + "epoch": 1.73, + "learning_rate": 4.049266293570704e-05, + "loss": 0.0078, + "step": 667420 + }, + { + "epoch": 1.73, + "learning_rate": 4.048877471933558e-05, + "loss": 0.0117, + "step": 667430 + }, + { + "epoch": 1.73, + "learning_rate": 4.0484886502964116e-05, + "loss": 0.0073, + "step": 667440 + }, + { + "epoch": 1.73, + "learning_rate": 4.048099828659265e-05, + "loss": 0.0069, + "step": 667450 + }, + { + "epoch": 1.73, + "learning_rate": 4.0477110070221186e-05, + "loss": 0.0074, + "step": 667460 + }, + { + "epoch": 1.73, + "learning_rate": 4.047322185384972e-05, + "loss": 0.0099, + "step": 667470 + }, + { + "epoch": 1.73, + "learning_rate": 4.0469333637478256e-05, + "loss": 0.0089, + "step": 667480 + }, + { + "epoch": 1.73, + "learning_rate": 4.046544542110679e-05, + "loss": 0.0071, + "step": 667490 + }, + { + "epoch": 1.73, + "learning_rate": 4.0461557204735325e-05, + "loss": 0.0071, + "step": 667500 + }, + { + "epoch": 1.73, + "learning_rate": 4.045766898836387e-05, + "loss": 0.0077, + "step": 667510 + }, + { + "epoch": 1.73, + "learning_rate": 4.04537807719924e-05, + "loss": 0.007, + "step": 667520 + }, + { + "epoch": 1.73, + "learning_rate": 4.044989255562094e-05, + "loss": 0.0121, + "step": 667530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0446004339249465e-05, + "loss": 0.0083, + "step": 667540 + }, + { + "epoch": 1.73, + "learning_rate": 4.0442116122878e-05, + "loss": 0.0068, + "step": 667550 + }, + { + "epoch": 1.73, + "learning_rate": 4.0438227906506535e-05, + "loss": 0.008, + "step": 667560 + }, + { + "epoch": 1.73, + "learning_rate": 4.043433969013507e-05, + "loss": 0.0074, + "step": 667570 + }, + { + "epoch": 1.73, + "learning_rate": 4.0430451473763604e-05, + "loss": 0.0097, + "step": 667580 + }, + { + "epoch": 1.73, + "learning_rate": 4.042656325739214e-05, + "loss": 0.0072, + "step": 667590 + }, + { + "epoch": 1.73, + "learning_rate": 4.0422675041020674e-05, + "loss": 0.0071, + "step": 667600 + }, + { + "epoch": 1.73, + "learning_rate": 4.0418786824649216e-05, + "loss": 0.0076, + "step": 667610 + }, + { + "epoch": 1.73, + "learning_rate": 4.041489860827775e-05, + "loss": 0.0062, + "step": 667620 + }, + { + "epoch": 1.73, + "learning_rate": 4.0411010391906285e-05, + "loss": 0.009, + "step": 667630 + }, + { + "epoch": 1.73, + "learning_rate": 4.040712217553482e-05, + "loss": 0.0099, + "step": 667640 + }, + { + "epoch": 1.73, + "learning_rate": 4.0403233959163355e-05, + "loss": 0.0065, + "step": 667650 + }, + { + "epoch": 1.73, + "learning_rate": 4.039934574279189e-05, + "loss": 0.0091, + "step": 667660 + }, + { + "epoch": 1.73, + "learning_rate": 4.0395457526420425e-05, + "loss": 0.0066, + "step": 667670 + }, + { + "epoch": 1.73, + "learning_rate": 4.039156931004896e-05, + "loss": 0.01, + "step": 667680 + }, + { + "epoch": 1.73, + "learning_rate": 4.03876810936775e-05, + "loss": 0.0059, + "step": 667690 + }, + { + "epoch": 1.73, + "learning_rate": 4.0383792877306036e-05, + "loss": 0.0095, + "step": 667700 + }, + { + "epoch": 1.73, + "learning_rate": 4.037990466093457e-05, + "loss": 0.0076, + "step": 667710 + }, + { + "epoch": 1.73, + "learning_rate": 4.0376016444563106e-05, + "loss": 0.0096, + "step": 667720 + }, + { + "epoch": 1.73, + "learning_rate": 4.037212822819164e-05, + "loss": 0.0069, + "step": 667730 + }, + { + "epoch": 1.73, + "learning_rate": 4.0368240011820176e-05, + "loss": 0.0078, + "step": 667740 + }, + { + "epoch": 1.73, + "learning_rate": 4.036435179544871e-05, + "loss": 0.0079, + "step": 667750 + }, + { + "epoch": 1.73, + "learning_rate": 4.0360463579077245e-05, + "loss": 0.0081, + "step": 667760 + }, + { + "epoch": 1.73, + "learning_rate": 4.035657536270579e-05, + "loss": 0.0106, + "step": 667770 + }, + { + "epoch": 1.73, + "learning_rate": 4.035268714633431e-05, + "loss": 0.0066, + "step": 667780 + }, + { + "epoch": 1.73, + "learning_rate": 4.034879892996285e-05, + "loss": 0.0056, + "step": 667790 + }, + { + "epoch": 1.73, + "learning_rate": 4.0344910713591385e-05, + "loss": 0.0074, + "step": 667800 + }, + { + "epoch": 1.73, + "learning_rate": 4.034102249721992e-05, + "loss": 0.0078, + "step": 667810 + }, + { + "epoch": 1.73, + "learning_rate": 4.0337134280848455e-05, + "loss": 0.0066, + "step": 667820 + }, + { + "epoch": 1.73, + "learning_rate": 4.033324606447699e-05, + "loss": 0.0081, + "step": 667830 + }, + { + "epoch": 1.73, + "learning_rate": 4.0329357848105524e-05, + "loss": 0.0084, + "step": 667840 + }, + { + "epoch": 1.73, + "learning_rate": 4.032546963173406e-05, + "loss": 0.008, + "step": 667850 + }, + { + "epoch": 1.73, + "learning_rate": 4.0321581415362594e-05, + "loss": 0.0071, + "step": 667860 + }, + { + "epoch": 1.73, + "learning_rate": 4.0317693198991136e-05, + "loss": 0.0115, + "step": 667870 + }, + { + "epoch": 1.73, + "learning_rate": 4.031380498261967e-05, + "loss": 0.0075, + "step": 667880 + }, + { + "epoch": 1.73, + "learning_rate": 4.0309916766248205e-05, + "loss": 0.0073, + "step": 667890 + }, + { + "epoch": 1.73, + "learning_rate": 4.030602854987674e-05, + "loss": 0.006, + "step": 667900 + }, + { + "epoch": 1.73, + "learning_rate": 4.0302140333505275e-05, + "loss": 0.0109, + "step": 667910 + }, + { + "epoch": 1.73, + "learning_rate": 4.029825211713381e-05, + "loss": 0.0077, + "step": 667920 + }, + { + "epoch": 1.73, + "learning_rate": 4.0294363900762345e-05, + "loss": 0.0108, + "step": 667930 + }, + { + "epoch": 1.73, + "learning_rate": 4.029047568439088e-05, + "loss": 0.0077, + "step": 667940 + }, + { + "epoch": 1.73, + "learning_rate": 4.028658746801942e-05, + "loss": 0.0099, + "step": 667950 + }, + { + "epoch": 1.73, + "learning_rate": 4.0282699251647956e-05, + "loss": 0.0059, + "step": 667960 + }, + { + "epoch": 1.73, + "learning_rate": 4.027881103527649e-05, + "loss": 0.0082, + "step": 667970 + }, + { + "epoch": 1.73, + "learning_rate": 4.0274922818905026e-05, + "loss": 0.0104, + "step": 667980 + }, + { + "epoch": 1.73, + "learning_rate": 4.027103460253356e-05, + "loss": 0.0077, + "step": 667990 + }, + { + "epoch": 1.73, + "learning_rate": 4.0267146386162096e-05, + "loss": 0.0069, + "step": 668000 + }, + { + "epoch": 1.73, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.005121828522533178, + "eval_runtime": 107.7417, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, + "step": 668000 + }, + { + "epoch": 1.73, + "learning_rate": 4.026325816979063e-05, + "loss": 0.0053, + "step": 668010 + }, + { + "epoch": 1.73, + "learning_rate": 4.0259369953419165e-05, + "loss": 0.0096, + "step": 668020 + }, + { + "epoch": 1.73, + "learning_rate": 4.0255481737047693e-05, + "loss": 0.0078, + "step": 668030 + }, + { + "epoch": 1.73, + "learning_rate": 4.025159352067623e-05, + "loss": 0.0107, + "step": 668040 + }, + { + "epoch": 1.73, + "learning_rate": 4.024770530430477e-05, + "loss": 0.0074, + "step": 668050 + }, + { + "epoch": 1.73, + "learning_rate": 4.0243817087933305e-05, + "loss": 0.0083, + "step": 668060 + }, + { + "epoch": 1.73, + "learning_rate": 4.023992887156184e-05, + "loss": 0.0077, + "step": 668070 + }, + { + "epoch": 1.73, + "learning_rate": 4.0236040655190374e-05, + "loss": 0.0067, + "step": 668080 + }, + { + "epoch": 1.73, + "learning_rate": 4.023215243881891e-05, + "loss": 0.0066, + "step": 668090 + }, + { + "epoch": 1.73, + "learning_rate": 4.0228264222447444e-05, + "loss": 0.0081, + "step": 668100 + }, + { + "epoch": 1.73, + "learning_rate": 4.022437600607598e-05, + "loss": 0.0103, + "step": 668110 + }, + { + "epoch": 1.73, + "learning_rate": 4.0220487789704514e-05, + "loss": 0.0074, + "step": 668120 + }, + { + "epoch": 1.73, + "learning_rate": 4.0216599573333056e-05, + "loss": 0.0064, + "step": 668130 + }, + { + "epoch": 1.73, + "learning_rate": 4.021271135696159e-05, + "loss": 0.0093, + "step": 668140 + }, + { + "epoch": 1.73, + "learning_rate": 4.0208823140590125e-05, + "loss": 0.0088, + "step": 668150 + }, + { + "epoch": 1.73, + "learning_rate": 4.020493492421866e-05, + "loss": 0.0061, + "step": 668160 + }, + { + "epoch": 1.73, + "learning_rate": 4.0201046707847195e-05, + "loss": 0.0064, + "step": 668170 + }, + { + "epoch": 1.73, + "learning_rate": 4.019715849147573e-05, + "loss": 0.0065, + "step": 668180 + }, + { + "epoch": 1.73, + "learning_rate": 4.0193270275104265e-05, + "loss": 0.007, + "step": 668190 + }, + { + "epoch": 1.73, + "learning_rate": 4.01893820587328e-05, + "loss": 0.0109, + "step": 668200 + }, + { + "epoch": 1.73, + "learning_rate": 4.018549384236134e-05, + "loss": 0.0073, + "step": 668210 + }, + { + "epoch": 1.73, + "learning_rate": 4.0181605625989876e-05, + "loss": 0.0101, + "step": 668220 + }, + { + "epoch": 1.73, + "learning_rate": 4.017771740961841e-05, + "loss": 0.0088, + "step": 668230 + }, + { + "epoch": 1.73, + "learning_rate": 4.0173829193246946e-05, + "loss": 0.0069, + "step": 668240 + }, + { + "epoch": 1.73, + "learning_rate": 4.016994097687548e-05, + "loss": 0.0122, + "step": 668250 + }, + { + "epoch": 1.73, + "learning_rate": 4.0166052760504016e-05, + "loss": 0.0068, + "step": 668260 + }, + { + "epoch": 1.73, + "learning_rate": 4.016216454413255e-05, + "loss": 0.0099, + "step": 668270 + }, + { + "epoch": 1.73, + "learning_rate": 4.015827632776108e-05, + "loss": 0.0073, + "step": 668280 + }, + { + "epoch": 1.73, + "learning_rate": 4.015438811138961e-05, + "loss": 0.0082, + "step": 668290 + }, + { + "epoch": 1.73, + "learning_rate": 4.015049989501815e-05, + "loss": 0.0088, + "step": 668300 + }, + { + "epoch": 1.73, + "learning_rate": 4.014661167864669e-05, + "loss": 0.0079, + "step": 668310 + }, + { + "epoch": 1.73, + "learning_rate": 4.0142723462275225e-05, + "loss": 0.0085, + "step": 668320 + }, + { + "epoch": 1.73, + "learning_rate": 4.013883524590376e-05, + "loss": 0.0096, + "step": 668330 + }, + { + "epoch": 1.73, + "learning_rate": 4.0134947029532294e-05, + "loss": 0.0104, + "step": 668340 + }, + { + "epoch": 1.73, + "learning_rate": 4.013105881316083e-05, + "loss": 0.0096, + "step": 668350 + }, + { + "epoch": 1.73, + "learning_rate": 4.0127170596789364e-05, + "loss": 0.0094, + "step": 668360 + }, + { + "epoch": 1.73, + "learning_rate": 4.01232823804179e-05, + "loss": 0.0077, + "step": 668370 + }, + { + "epoch": 1.73, + "learning_rate": 4.0119394164046434e-05, + "loss": 0.007, + "step": 668380 + }, + { + "epoch": 1.73, + "learning_rate": 4.0115505947674976e-05, + "loss": 0.0085, + "step": 668390 + }, + { + "epoch": 1.73, + "learning_rate": 4.011161773130351e-05, + "loss": 0.0051, + "step": 668400 + }, + { + "epoch": 1.73, + "learning_rate": 4.0107729514932045e-05, + "loss": 0.0072, + "step": 668410 + }, + { + "epoch": 1.73, + "learning_rate": 4.010384129856058e-05, + "loss": 0.0092, + "step": 668420 + }, + { + "epoch": 1.73, + "learning_rate": 4.0099953082189115e-05, + "loss": 0.0075, + "step": 668430 + }, + { + "epoch": 1.73, + "learning_rate": 4.009606486581765e-05, + "loss": 0.006, + "step": 668440 + }, + { + "epoch": 1.73, + "learning_rate": 4.0092176649446185e-05, + "loss": 0.0061, + "step": 668450 + }, + { + "epoch": 1.73, + "learning_rate": 4.008828843307472e-05, + "loss": 0.0084, + "step": 668460 + }, + { + "epoch": 1.73, + "learning_rate": 4.008440021670326e-05, + "loss": 0.0088, + "step": 668470 + }, + { + "epoch": 1.73, + "learning_rate": 4.0080512000331796e-05, + "loss": 0.0073, + "step": 668480 + }, + { + "epoch": 1.73, + "learning_rate": 4.007662378396033e-05, + "loss": 0.0081, + "step": 668490 + }, + { + "epoch": 1.73, + "learning_rate": 4.0072735567588866e-05, + "loss": 0.009, + "step": 668500 + }, + { + "epoch": 1.73, + "learning_rate": 4.00688473512174e-05, + "loss": 0.0082, + "step": 668510 + }, + { + "epoch": 1.73, + "learning_rate": 4.0064959134845936e-05, + "loss": 0.0064, + "step": 668520 + }, + { + "epoch": 1.73, + "learning_rate": 4.0061070918474464e-05, + "loss": 0.0068, + "step": 668530 + }, + { + "epoch": 1.73, + "learning_rate": 4.0057182702103e-05, + "loss": 0.0072, + "step": 668540 + }, + { + "epoch": 1.73, + "learning_rate": 4.005329448573153e-05, + "loss": 0.0079, + "step": 668550 + }, + { + "epoch": 1.73, + "learning_rate": 4.004940626936007e-05, + "loss": 0.0073, + "step": 668560 + }, + { + "epoch": 1.73, + "learning_rate": 4.004551805298861e-05, + "loss": 0.0093, + "step": 668570 + }, + { + "epoch": 1.73, + "learning_rate": 4.0041629836617145e-05, + "loss": 0.0088, + "step": 668580 + }, + { + "epoch": 1.73, + "learning_rate": 4.003774162024568e-05, + "loss": 0.0093, + "step": 668590 + }, + { + "epoch": 1.73, + "learning_rate": 4.0033853403874214e-05, + "loss": 0.008, + "step": 668600 + }, + { + "epoch": 1.73, + "learning_rate": 4.002996518750275e-05, + "loss": 0.0098, + "step": 668610 + }, + { + "epoch": 1.73, + "learning_rate": 4.0026076971131284e-05, + "loss": 0.0115, + "step": 668620 + }, + { + "epoch": 1.73, + "learning_rate": 4.002218875475982e-05, + "loss": 0.0071, + "step": 668630 + }, + { + "epoch": 1.73, + "learning_rate": 4.0018300538388354e-05, + "loss": 0.0078, + "step": 668640 + }, + { + "epoch": 1.73, + "learning_rate": 4.0014412322016895e-05, + "loss": 0.0101, + "step": 668650 + }, + { + "epoch": 1.73, + "learning_rate": 4.001052410564543e-05, + "loss": 0.006, + "step": 668660 + }, + { + "epoch": 1.73, + "learning_rate": 4.0006635889273965e-05, + "loss": 0.0064, + "step": 668670 + }, + { + "epoch": 1.73, + "learning_rate": 4.00027476729025e-05, + "loss": 0.0091, + "step": 668680 + }, + { + "epoch": 1.73, + "learning_rate": 3.9998859456531035e-05, + "loss": 0.0062, + "step": 668690 + }, + { + "epoch": 1.73, + "learning_rate": 3.999497124015957e-05, + "loss": 0.0084, + "step": 668700 + }, + { + "epoch": 1.73, + "learning_rate": 3.9991083023788105e-05, + "loss": 0.0077, + "step": 668710 + }, + { + "epoch": 1.73, + "learning_rate": 3.998719480741664e-05, + "loss": 0.0081, + "step": 668720 + }, + { + "epoch": 1.73, + "learning_rate": 3.9983306591045174e-05, + "loss": 0.0074, + "step": 668730 + }, + { + "epoch": 1.73, + "learning_rate": 3.9979418374673716e-05, + "loss": 0.0079, + "step": 668740 + }, + { + "epoch": 1.73, + "learning_rate": 3.997553015830225e-05, + "loss": 0.0098, + "step": 668750 + }, + { + "epoch": 1.73, + "learning_rate": 3.9971641941930786e-05, + "loss": 0.0092, + "step": 668760 + }, + { + "epoch": 1.73, + "learning_rate": 3.996775372555932e-05, + "loss": 0.0094, + "step": 668770 + }, + { + "epoch": 1.73, + "learning_rate": 3.996386550918785e-05, + "loss": 0.0077, + "step": 668780 + }, + { + "epoch": 1.73, + "learning_rate": 3.9959977292816384e-05, + "loss": 0.0078, + "step": 668790 + }, + { + "epoch": 1.73, + "learning_rate": 3.995608907644492e-05, + "loss": 0.011, + "step": 668800 + }, + { + "epoch": 1.73, + "learning_rate": 3.995220086007345e-05, + "loss": 0.0089, + "step": 668810 + }, + { + "epoch": 1.73, + "learning_rate": 3.994831264370199e-05, + "loss": 0.0067, + "step": 668820 + }, + { + "epoch": 1.73, + "learning_rate": 3.994442442733053e-05, + "loss": 0.0106, + "step": 668830 + }, + { + "epoch": 1.73, + "learning_rate": 3.9940536210959065e-05, + "loss": 0.0132, + "step": 668840 + }, + { + "epoch": 1.73, + "learning_rate": 3.99366479945876e-05, + "loss": 0.0074, + "step": 668850 + }, + { + "epoch": 1.73, + "learning_rate": 3.9932759778216134e-05, + "loss": 0.0081, + "step": 668860 + }, + { + "epoch": 1.73, + "learning_rate": 3.992887156184467e-05, + "loss": 0.0071, + "step": 668870 + }, + { + "epoch": 1.73, + "learning_rate": 3.9924983345473204e-05, + "loss": 0.008, + "step": 668880 + }, + { + "epoch": 1.73, + "learning_rate": 3.992109512910174e-05, + "loss": 0.0072, + "step": 668890 + }, + { + "epoch": 1.73, + "learning_rate": 3.9917206912730274e-05, + "loss": 0.0084, + "step": 668900 + }, + { + "epoch": 1.73, + "learning_rate": 3.991331869635881e-05, + "loss": 0.0081, + "step": 668910 + }, + { + "epoch": 1.73, + "learning_rate": 3.990943047998735e-05, + "loss": 0.0102, + "step": 668920 + }, + { + "epoch": 1.73, + "learning_rate": 3.9905542263615885e-05, + "loss": 0.0112, + "step": 668930 + }, + { + "epoch": 1.73, + "learning_rate": 3.990165404724442e-05, + "loss": 0.0096, + "step": 668940 + }, + { + "epoch": 1.73, + "learning_rate": 3.9897765830872955e-05, + "loss": 0.0089, + "step": 668950 + }, + { + "epoch": 1.73, + "learning_rate": 3.989387761450149e-05, + "loss": 0.0078, + "step": 668960 + }, + { + "epoch": 1.73, + "learning_rate": 3.9889989398130025e-05, + "loss": 0.0099, + "step": 668970 + }, + { + "epoch": 1.73, + "learning_rate": 3.988610118175856e-05, + "loss": 0.0069, + "step": 668980 + }, + { + "epoch": 1.73, + "learning_rate": 3.9882212965387094e-05, + "loss": 0.0089, + "step": 668990 + }, + { + "epoch": 1.73, + "learning_rate": 3.9878324749015636e-05, + "loss": 0.01, + "step": 669000 + }, + { + "epoch": 1.73, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.005148761440068483, + "eval_runtime": 107.7864, + "eval_samples_per_second": 18.555, + "eval_steps_per_second": 4.639, + "step": 669000 + }, + { + "epoch": 1.73, + "learning_rate": 3.987443653264417e-05, + "loss": 0.0073, + "step": 669010 + }, + { + "epoch": 1.73, + "learning_rate": 3.98705483162727e-05, + "loss": 0.0071, + "step": 669020 + }, + { + "epoch": 1.73, + "learning_rate": 3.9866660099901234e-05, + "loss": 0.0073, + "step": 669030 + }, + { + "epoch": 1.73, + "learning_rate": 3.986277188352977e-05, + "loss": 0.008, + "step": 669040 + }, + { + "epoch": 1.73, + "learning_rate": 3.9858883667158303e-05, + "loss": 0.0085, + "step": 669050 + }, + { + "epoch": 1.73, + "learning_rate": 3.985499545078684e-05, + "loss": 0.0091, + "step": 669060 + }, + { + "epoch": 1.73, + "learning_rate": 3.985110723441537e-05, + "loss": 0.0085, + "step": 669070 + }, + { + "epoch": 1.73, + "learning_rate": 3.984721901804391e-05, + "loss": 0.007, + "step": 669080 + }, + { + "epoch": 1.73, + "learning_rate": 3.984333080167244e-05, + "loss": 0.0076, + "step": 669090 + }, + { + "epoch": 1.73, + "learning_rate": 3.9839442585300985e-05, + "loss": 0.0071, + "step": 669100 + }, + { + "epoch": 1.73, + "learning_rate": 3.983555436892952e-05, + "loss": 0.0072, + "step": 669110 + }, + { + "epoch": 1.73, + "learning_rate": 3.9831666152558054e-05, + "loss": 0.0076, + "step": 669120 + }, + { + "epoch": 1.73, + "learning_rate": 3.982777793618659e-05, + "loss": 0.0064, + "step": 669130 + }, + { + "epoch": 1.73, + "learning_rate": 3.9823889719815124e-05, + "loss": 0.0079, + "step": 669140 + }, + { + "epoch": 1.73, + "learning_rate": 3.982000150344366e-05, + "loss": 0.0114, + "step": 669150 + }, + { + "epoch": 1.73, + "learning_rate": 3.9816113287072194e-05, + "loss": 0.0073, + "step": 669160 + }, + { + "epoch": 1.73, + "learning_rate": 3.981222507070073e-05, + "loss": 0.0061, + "step": 669170 + }, + { + "epoch": 1.73, + "learning_rate": 3.980833685432927e-05, + "loss": 0.0068, + "step": 669180 + }, + { + "epoch": 1.73, + "learning_rate": 3.9804448637957805e-05, + "loss": 0.0076, + "step": 669190 + }, + { + "epoch": 1.73, + "learning_rate": 3.980056042158634e-05, + "loss": 0.0084, + "step": 669200 + }, + { + "epoch": 1.73, + "learning_rate": 3.9796672205214875e-05, + "loss": 0.0047, + "step": 669210 + }, + { + "epoch": 1.73, + "learning_rate": 3.979278398884341e-05, + "loss": 0.0102, + "step": 669220 + }, + { + "epoch": 1.73, + "learning_rate": 3.9788895772471945e-05, + "loss": 0.0075, + "step": 669230 + }, + { + "epoch": 1.73, + "learning_rate": 3.978500755610048e-05, + "loss": 0.0073, + "step": 669240 + }, + { + "epoch": 1.73, + "learning_rate": 3.9781119339729014e-05, + "loss": 0.008, + "step": 669250 + }, + { + "epoch": 1.73, + "learning_rate": 3.9777231123357556e-05, + "loss": 0.0092, + "step": 669260 + }, + { + "epoch": 1.73, + "learning_rate": 3.977334290698608e-05, + "loss": 0.007, + "step": 669270 + }, + { + "epoch": 1.73, + "learning_rate": 3.976945469061462e-05, + "loss": 0.006, + "step": 669280 + }, + { + "epoch": 1.73, + "learning_rate": 3.9765566474243154e-05, + "loss": 0.0091, + "step": 669290 + }, + { + "epoch": 1.73, + "learning_rate": 3.976167825787169e-05, + "loss": 0.0093, + "step": 669300 + }, + { + "epoch": 1.73, + "learning_rate": 3.9757790041500223e-05, + "loss": 0.0072, + "step": 669310 + }, + { + "epoch": 1.73, + "learning_rate": 3.975390182512876e-05, + "loss": 0.0062, + "step": 669320 + }, + { + "epoch": 1.73, + "learning_rate": 3.975001360875729e-05, + "loss": 0.0077, + "step": 669330 + }, + { + "epoch": 1.74, + "learning_rate": 3.974612539238583e-05, + "loss": 0.0064, + "step": 669340 + }, + { + "epoch": 1.74, + "learning_rate": 3.974223717601436e-05, + "loss": 0.008, + "step": 669350 + }, + { + "epoch": 1.74, + "learning_rate": 3.9738348959642905e-05, + "loss": 0.0086, + "step": 669360 + }, + { + "epoch": 1.74, + "learning_rate": 3.973446074327144e-05, + "loss": 0.0061, + "step": 669370 + }, + { + "epoch": 1.74, + "learning_rate": 3.9730572526899974e-05, + "loss": 0.009, + "step": 669380 + }, + { + "epoch": 1.74, + "learning_rate": 3.972668431052851e-05, + "loss": 0.0072, + "step": 669390 + }, + { + "epoch": 1.74, + "learning_rate": 3.9722796094157044e-05, + "loss": 0.008, + "step": 669400 + }, + { + "epoch": 1.74, + "learning_rate": 3.971890787778558e-05, + "loss": 0.0098, + "step": 669410 + }, + { + "epoch": 1.74, + "learning_rate": 3.9715019661414114e-05, + "loss": 0.0057, + "step": 669420 + }, + { + "epoch": 1.74, + "learning_rate": 3.971113144504265e-05, + "loss": 0.0095, + "step": 669430 + }, + { + "epoch": 1.74, + "learning_rate": 3.970724322867119e-05, + "loss": 0.0076, + "step": 669440 + }, + { + "epoch": 1.74, + "learning_rate": 3.9703355012299725e-05, + "loss": 0.0061, + "step": 669450 + }, + { + "epoch": 1.74, + "learning_rate": 3.969946679592826e-05, + "loss": 0.0094, + "step": 669460 + }, + { + "epoch": 1.74, + "learning_rate": 3.9695578579556795e-05, + "loss": 0.0082, + "step": 669470 + }, + { + "epoch": 1.74, + "learning_rate": 3.969169036318533e-05, + "loss": 0.0184, + "step": 669480 + }, + { + "epoch": 1.74, + "learning_rate": 3.9687802146813865e-05, + "loss": 0.0087, + "step": 669490 + }, + { + "epoch": 1.74, + "learning_rate": 3.96839139304424e-05, + "loss": 0.0088, + "step": 669500 + }, + { + "epoch": 1.74, + "learning_rate": 3.9680025714070934e-05, + "loss": 0.0099, + "step": 669510 + }, + { + "epoch": 1.74, + "learning_rate": 3.967613749769946e-05, + "loss": 0.0078, + "step": 669520 + }, + { + "epoch": 1.74, + "learning_rate": 3.9672249281328e-05, + "loss": 0.0082, + "step": 669530 + }, + { + "epoch": 1.74, + "learning_rate": 3.966836106495654e-05, + "loss": 0.0072, + "step": 669540 + }, + { + "epoch": 1.74, + "learning_rate": 3.9664472848585074e-05, + "loss": 0.0073, + "step": 669550 + }, + { + "epoch": 1.74, + "learning_rate": 3.966058463221361e-05, + "loss": 0.0114, + "step": 669560 + }, + { + "epoch": 1.74, + "learning_rate": 3.9656696415842143e-05, + "loss": 0.0092, + "step": 669570 + }, + { + "epoch": 1.74, + "learning_rate": 3.965280819947068e-05, + "loss": 0.0062, + "step": 669580 + }, + { + "epoch": 1.74, + "learning_rate": 3.964891998309921e-05, + "loss": 0.0078, + "step": 669590 + }, + { + "epoch": 1.74, + "learning_rate": 3.964503176672775e-05, + "loss": 0.0111, + "step": 669600 + }, + { + "epoch": 1.74, + "learning_rate": 3.964114355035628e-05, + "loss": 0.0107, + "step": 669610 + }, + { + "epoch": 1.74, + "learning_rate": 3.9637255333984824e-05, + "loss": 0.0092, + "step": 669620 + }, + { + "epoch": 1.74, + "learning_rate": 3.963336711761336e-05, + "loss": 0.0097, + "step": 669630 + }, + { + "epoch": 1.74, + "learning_rate": 3.9629478901241894e-05, + "loss": 0.0079, + "step": 669640 + }, + { + "epoch": 1.74, + "learning_rate": 3.962559068487043e-05, + "loss": 0.008, + "step": 669650 + }, + { + "epoch": 1.74, + "learning_rate": 3.9621702468498964e-05, + "loss": 0.0114, + "step": 669660 + }, + { + "epoch": 1.74, + "learning_rate": 3.96178142521275e-05, + "loss": 0.0119, + "step": 669670 + }, + { + "epoch": 1.74, + "learning_rate": 3.9613926035756034e-05, + "loss": 0.0093, + "step": 669680 + }, + { + "epoch": 1.74, + "learning_rate": 3.961003781938457e-05, + "loss": 0.0077, + "step": 669690 + }, + { + "epoch": 1.74, + "learning_rate": 3.960614960301311e-05, + "loss": 0.0061, + "step": 669700 + }, + { + "epoch": 1.74, + "learning_rate": 3.9602261386641645e-05, + "loss": 0.0081, + "step": 669710 + }, + { + "epoch": 1.74, + "learning_rate": 3.959837317027018e-05, + "loss": 0.007, + "step": 669720 + }, + { + "epoch": 1.74, + "learning_rate": 3.9594484953898715e-05, + "loss": 0.0048, + "step": 669730 + }, + { + "epoch": 1.74, + "learning_rate": 3.959059673752725e-05, + "loss": 0.0077, + "step": 669740 + }, + { + "epoch": 1.74, + "learning_rate": 3.9586708521155784e-05, + "loss": 0.0098, + "step": 669750 + }, + { + "epoch": 1.74, + "learning_rate": 3.958282030478432e-05, + "loss": 0.0081, + "step": 669760 + }, + { + "epoch": 1.74, + "learning_rate": 3.957893208841285e-05, + "loss": 0.0076, + "step": 669770 + }, + { + "epoch": 1.74, + "learning_rate": 3.957504387204138e-05, + "loss": 0.0081, + "step": 669780 + }, + { + "epoch": 1.74, + "learning_rate": 3.957115565566992e-05, + "loss": 0.0056, + "step": 669790 + }, + { + "epoch": 1.74, + "learning_rate": 3.956726743929846e-05, + "loss": 0.0087, + "step": 669800 + }, + { + "epoch": 1.74, + "learning_rate": 3.9563379222926994e-05, + "loss": 0.008, + "step": 669810 + }, + { + "epoch": 1.74, + "learning_rate": 3.955949100655553e-05, + "loss": 0.0087, + "step": 669820 + }, + { + "epoch": 1.74, + "learning_rate": 3.955560279018406e-05, + "loss": 0.0071, + "step": 669830 + }, + { + "epoch": 1.74, + "learning_rate": 3.95517145738126e-05, + "loss": 0.0173, + "step": 669840 + }, + { + "epoch": 1.74, + "learning_rate": 3.954782635744113e-05, + "loss": 0.0066, + "step": 669850 + }, + { + "epoch": 1.74, + "learning_rate": 3.954393814106967e-05, + "loss": 0.0083, + "step": 669860 + }, + { + "epoch": 1.74, + "learning_rate": 3.95400499246982e-05, + "loss": 0.0066, + "step": 669870 + }, + { + "epoch": 1.74, + "learning_rate": 3.9536161708326744e-05, + "loss": 0.0098, + "step": 669880 + }, + { + "epoch": 1.74, + "learning_rate": 3.953227349195528e-05, + "loss": 0.0087, + "step": 669890 + }, + { + "epoch": 1.74, + "learning_rate": 3.9528385275583814e-05, + "loss": 0.0057, + "step": 669900 + }, + { + "epoch": 1.74, + "learning_rate": 3.952449705921235e-05, + "loss": 0.0088, + "step": 669910 + }, + { + "epoch": 1.74, + "learning_rate": 3.9520608842840884e-05, + "loss": 0.0111, + "step": 669920 + }, + { + "epoch": 1.74, + "learning_rate": 3.951672062646942e-05, + "loss": 0.0072, + "step": 669930 + }, + { + "epoch": 1.74, + "learning_rate": 3.9512832410097954e-05, + "loss": 0.007, + "step": 669940 + }, + { + "epoch": 1.74, + "learning_rate": 3.950894419372649e-05, + "loss": 0.0119, + "step": 669950 + }, + { + "epoch": 1.74, + "learning_rate": 3.950505597735503e-05, + "loss": 0.0062, + "step": 669960 + }, + { + "epoch": 1.74, + "learning_rate": 3.9501167760983565e-05, + "loss": 0.0096, + "step": 669970 + }, + { + "epoch": 1.74, + "learning_rate": 3.94972795446121e-05, + "loss": 0.0061, + "step": 669980 + }, + { + "epoch": 1.74, + "learning_rate": 3.9493391328240635e-05, + "loss": 0.0078, + "step": 669990 + }, + { + "epoch": 1.74, + "learning_rate": 3.948950311186917e-05, + "loss": 0.0099, + "step": 670000 + }, + { + "epoch": 1.74, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.005133858881890774, + "eval_runtime": 107.9299, + "eval_samples_per_second": 18.531, + "eval_steps_per_second": 4.633, + "step": 670000 + }, + { + "epoch": 1.74, + "learning_rate": 3.9485614895497704e-05, + "loss": 0.0056, + "step": 670010 + }, + { + "epoch": 1.74, + "learning_rate": 3.948172667912623e-05, + "loss": 0.0103, + "step": 670020 + }, + { + "epoch": 1.74, + "learning_rate": 3.947783846275477e-05, + "loss": 0.0142, + "step": 670030 + }, + { + "epoch": 1.74, + "learning_rate": 3.94739502463833e-05, + "loss": 0.0069, + "step": 670040 + }, + { + "epoch": 1.74, + "learning_rate": 3.947006203001184e-05, + "loss": 0.0089, + "step": 670050 + }, + { + "epoch": 1.74, + "learning_rate": 3.946617381364038e-05, + "loss": 0.0086, + "step": 670060 + }, + { + "epoch": 1.74, + "learning_rate": 3.9462285597268914e-05, + "loss": 0.0107, + "step": 670070 + }, + { + "epoch": 1.74, + "learning_rate": 3.945839738089745e-05, + "loss": 0.0117, + "step": 670080 + }, + { + "epoch": 1.74, + "learning_rate": 3.945450916452598e-05, + "loss": 0.007, + "step": 670090 + }, + { + "epoch": 1.74, + "learning_rate": 3.945062094815452e-05, + "loss": 0.0081, + "step": 670100 + }, + { + "epoch": 1.74, + "learning_rate": 3.944673273178305e-05, + "loss": 0.007, + "step": 670110 + }, + { + "epoch": 1.74, + "learning_rate": 3.944284451541159e-05, + "loss": 0.0073, + "step": 670120 + }, + { + "epoch": 1.74, + "learning_rate": 3.943895629904012e-05, + "loss": 0.0079, + "step": 670130 + }, + { + "epoch": 1.74, + "learning_rate": 3.9435068082668664e-05, + "loss": 0.007, + "step": 670140 + }, + { + "epoch": 1.74, + "learning_rate": 3.94311798662972e-05, + "loss": 0.0072, + "step": 670150 + }, + { + "epoch": 1.74, + "learning_rate": 3.9427291649925734e-05, + "loss": 0.008, + "step": 670160 + }, + { + "epoch": 1.74, + "learning_rate": 3.942340343355427e-05, + "loss": 0.0085, + "step": 670170 + }, + { + "epoch": 1.74, + "learning_rate": 3.9419515217182804e-05, + "loss": 0.0069, + "step": 670180 + }, + { + "epoch": 1.74, + "learning_rate": 3.941562700081134e-05, + "loss": 0.0118, + "step": 670190 + }, + { + "epoch": 1.74, + "learning_rate": 3.9411738784439874e-05, + "loss": 0.008, + "step": 670200 + }, + { + "epoch": 1.74, + "learning_rate": 3.940785056806841e-05, + "loss": 0.0079, + "step": 670210 + }, + { + "epoch": 1.74, + "learning_rate": 3.940396235169694e-05, + "loss": 0.0098, + "step": 670220 + }, + { + "epoch": 1.74, + "learning_rate": 3.9400074135325485e-05, + "loss": 0.0074, + "step": 670230 + }, + { + "epoch": 1.74, + "learning_rate": 3.939618591895402e-05, + "loss": 0.0085, + "step": 670240 + }, + { + "epoch": 1.74, + "learning_rate": 3.9392297702582555e-05, + "loss": 0.0081, + "step": 670250 + }, + { + "epoch": 1.74, + "learning_rate": 3.938840948621109e-05, + "loss": 0.0068, + "step": 670260 + }, + { + "epoch": 1.74, + "learning_rate": 3.938452126983962e-05, + "loss": 0.006, + "step": 670270 + }, + { + "epoch": 1.74, + "learning_rate": 3.938063305346815e-05, + "loss": 0.0066, + "step": 670280 + }, + { + "epoch": 1.74, + "learning_rate": 3.937674483709669e-05, + "loss": 0.0068, + "step": 670290 + }, + { + "epoch": 1.74, + "learning_rate": 3.937285662072522e-05, + "loss": 0.008, + "step": 670300 + }, + { + "epoch": 1.74, + "learning_rate": 3.936896840435376e-05, + "loss": 0.0096, + "step": 670310 + }, + { + "epoch": 1.74, + "learning_rate": 3.936508018798229e-05, + "loss": 0.0084, + "step": 670320 + }, + { + "epoch": 1.74, + "learning_rate": 3.9361191971610834e-05, + "loss": 0.0068, + "step": 670330 + }, + { + "epoch": 1.74, + "learning_rate": 3.935730375523937e-05, + "loss": 0.0067, + "step": 670340 + }, + { + "epoch": 1.74, + "learning_rate": 3.93534155388679e-05, + "loss": 0.0064, + "step": 670350 + }, + { + "epoch": 1.74, + "learning_rate": 3.934952732249644e-05, + "loss": 0.0077, + "step": 670360 + }, + { + "epoch": 1.74, + "learning_rate": 3.934563910612497e-05, + "loss": 0.006, + "step": 670370 + }, + { + "epoch": 1.74, + "learning_rate": 3.934175088975351e-05, + "loss": 0.0075, + "step": 670380 + }, + { + "epoch": 1.74, + "learning_rate": 3.933786267338204e-05, + "loss": 0.0084, + "step": 670390 + }, + { + "epoch": 1.74, + "learning_rate": 3.933397445701058e-05, + "loss": 0.0076, + "step": 670400 + }, + { + "epoch": 1.74, + "learning_rate": 3.933008624063912e-05, + "loss": 0.0084, + "step": 670410 + }, + { + "epoch": 1.74, + "learning_rate": 3.9326198024267654e-05, + "loss": 0.0076, + "step": 670420 + }, + { + "epoch": 1.74, + "learning_rate": 3.932230980789619e-05, + "loss": 0.0054, + "step": 670430 + }, + { + "epoch": 1.74, + "learning_rate": 3.9318421591524724e-05, + "loss": 0.0057, + "step": 670440 + }, + { + "epoch": 1.74, + "learning_rate": 3.931453337515326e-05, + "loss": 0.0083, + "step": 670450 + }, + { + "epoch": 1.74, + "learning_rate": 3.9310645158781794e-05, + "loss": 0.0099, + "step": 670460 + }, + { + "epoch": 1.74, + "learning_rate": 3.930675694241033e-05, + "loss": 0.006, + "step": 670470 + }, + { + "epoch": 1.74, + "learning_rate": 3.930286872603886e-05, + "loss": 0.0067, + "step": 670480 + }, + { + "epoch": 1.74, + "learning_rate": 3.9298980509667405e-05, + "loss": 0.0079, + "step": 670490 + }, + { + "epoch": 1.74, + "learning_rate": 3.929509229329594e-05, + "loss": 0.0087, + "step": 670500 + }, + { + "epoch": 1.74, + "learning_rate": 3.929120407692447e-05, + "loss": 0.006, + "step": 670510 + }, + { + "epoch": 1.74, + "learning_rate": 3.9287315860553e-05, + "loss": 0.0081, + "step": 670520 + }, + { + "epoch": 1.74, + "learning_rate": 3.928342764418154e-05, + "loss": 0.007, + "step": 670530 + }, + { + "epoch": 1.74, + "learning_rate": 3.927953942781007e-05, + "loss": 0.0107, + "step": 670540 + }, + { + "epoch": 1.74, + "learning_rate": 3.927565121143861e-05, + "loss": 0.0075, + "step": 670550 + }, + { + "epoch": 1.74, + "learning_rate": 3.927176299506714e-05, + "loss": 0.007, + "step": 670560 + }, + { + "epoch": 1.74, + "learning_rate": 3.926787477869568e-05, + "loss": 0.0078, + "step": 670570 + }, + { + "epoch": 1.74, + "learning_rate": 3.926398656232421e-05, + "loss": 0.0064, + "step": 670580 + }, + { + "epoch": 1.74, + "learning_rate": 3.9260098345952753e-05, + "loss": 0.0101, + "step": 670590 + }, + { + "epoch": 1.74, + "learning_rate": 3.925621012958129e-05, + "loss": 0.007, + "step": 670600 + }, + { + "epoch": 1.74, + "learning_rate": 3.925232191320982e-05, + "loss": 0.0079, + "step": 670610 + }, + { + "epoch": 1.74, + "learning_rate": 3.924843369683836e-05, + "loss": 0.0083, + "step": 670620 + }, + { + "epoch": 1.74, + "learning_rate": 3.924454548046689e-05, + "loss": 0.0084, + "step": 670630 + }, + { + "epoch": 1.74, + "learning_rate": 3.924065726409543e-05, + "loss": 0.0075, + "step": 670640 + }, + { + "epoch": 1.74, + "learning_rate": 3.923676904772396e-05, + "loss": 0.0093, + "step": 670650 + }, + { + "epoch": 1.74, + "learning_rate": 3.92328808313525e-05, + "loss": 0.0073, + "step": 670660 + }, + { + "epoch": 1.74, + "learning_rate": 3.922899261498104e-05, + "loss": 0.0092, + "step": 670670 + }, + { + "epoch": 1.74, + "learning_rate": 3.9225104398609574e-05, + "loss": 0.0065, + "step": 670680 + }, + { + "epoch": 1.74, + "learning_rate": 3.922121618223811e-05, + "loss": 0.0066, + "step": 670690 + }, + { + "epoch": 1.74, + "learning_rate": 3.9217327965866644e-05, + "loss": 0.0061, + "step": 670700 + }, + { + "epoch": 1.74, + "learning_rate": 3.921343974949518e-05, + "loss": 0.0088, + "step": 670710 + }, + { + "epoch": 1.74, + "learning_rate": 3.9209551533123713e-05, + "loss": 0.0097, + "step": 670720 + }, + { + "epoch": 1.74, + "learning_rate": 3.920566331675225e-05, + "loss": 0.0065, + "step": 670730 + }, + { + "epoch": 1.74, + "learning_rate": 3.920177510038078e-05, + "loss": 0.0083, + "step": 670740 + }, + { + "epoch": 1.74, + "learning_rate": 3.9197886884009325e-05, + "loss": 0.0067, + "step": 670750 + }, + { + "epoch": 1.74, + "learning_rate": 3.9193998667637846e-05, + "loss": 0.0067, + "step": 670760 + }, + { + "epoch": 1.74, + "learning_rate": 3.919011045126639e-05, + "loss": 0.0103, + "step": 670770 + }, + { + "epoch": 1.74, + "learning_rate": 3.918622223489492e-05, + "loss": 0.0085, + "step": 670780 + }, + { + "epoch": 1.74, + "learning_rate": 3.918233401852346e-05, + "loss": 0.0083, + "step": 670790 + }, + { + "epoch": 1.74, + "learning_rate": 3.917844580215199e-05, + "loss": 0.006, + "step": 670800 + }, + { + "epoch": 1.74, + "learning_rate": 3.917455758578053e-05, + "loss": 0.0061, + "step": 670810 + }, + { + "epoch": 1.74, + "learning_rate": 3.917066936940906e-05, + "loss": 0.0084, + "step": 670820 + }, + { + "epoch": 1.74, + "learning_rate": 3.91667811530376e-05, + "loss": 0.0077, + "step": 670830 + }, + { + "epoch": 1.74, + "learning_rate": 3.916289293666613e-05, + "loss": 0.006, + "step": 670840 + }, + { + "epoch": 1.74, + "learning_rate": 3.9159004720294673e-05, + "loss": 0.006, + "step": 670850 + }, + { + "epoch": 1.74, + "learning_rate": 3.915511650392321e-05, + "loss": 0.0062, + "step": 670860 + }, + { + "epoch": 1.74, + "learning_rate": 3.915122828755174e-05, + "loss": 0.0074, + "step": 670870 + }, + { + "epoch": 1.74, + "learning_rate": 3.914734007118028e-05, + "loss": 0.0074, + "step": 670880 + }, + { + "epoch": 1.74, + "learning_rate": 3.914345185480881e-05, + "loss": 0.0095, + "step": 670890 + }, + { + "epoch": 1.74, + "learning_rate": 3.913956363843735e-05, + "loss": 0.006, + "step": 670900 + }, + { + "epoch": 1.74, + "learning_rate": 3.913567542206588e-05, + "loss": 0.0055, + "step": 670910 + }, + { + "epoch": 1.74, + "learning_rate": 3.913178720569442e-05, + "loss": 0.0085, + "step": 670920 + }, + { + "epoch": 1.74, + "learning_rate": 3.912789898932296e-05, + "loss": 0.0088, + "step": 670930 + }, + { + "epoch": 1.74, + "learning_rate": 3.9124010772951494e-05, + "loss": 0.0117, + "step": 670940 + }, + { + "epoch": 1.74, + "learning_rate": 3.912012255658003e-05, + "loss": 0.0078, + "step": 670950 + }, + { + "epoch": 1.74, + "learning_rate": 3.9116234340208564e-05, + "loss": 0.0097, + "step": 670960 + }, + { + "epoch": 1.74, + "learning_rate": 3.91123461238371e-05, + "loss": 0.0067, + "step": 670970 + }, + { + "epoch": 1.74, + "learning_rate": 3.9108457907465633e-05, + "loss": 0.0073, + "step": 670980 + }, + { + "epoch": 1.74, + "learning_rate": 3.910456969109417e-05, + "loss": 0.0103, + "step": 670990 + }, + { + "epoch": 1.74, + "learning_rate": 3.91006814747227e-05, + "loss": 0.0069, + "step": 671000 + }, + { + "epoch": 1.74, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.005163580644875765, + "eval_runtime": 107.8528, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 671000 + }, + { + "epoch": 1.74, + "learning_rate": 3.909679325835123e-05, + "loss": 0.0099, + "step": 671010 + }, + { + "epoch": 1.74, + "learning_rate": 3.9092905041979766e-05, + "loss": 0.007, + "step": 671020 + }, + { + "epoch": 1.74, + "learning_rate": 3.908901682560831e-05, + "loss": 0.0075, + "step": 671030 + }, + { + "epoch": 1.74, + "learning_rate": 3.908512860923684e-05, + "loss": 0.0086, + "step": 671040 + }, + { + "epoch": 1.74, + "learning_rate": 3.908124039286538e-05, + "loss": 0.0076, + "step": 671050 + }, + { + "epoch": 1.74, + "learning_rate": 3.907735217649391e-05, + "loss": 0.0082, + "step": 671060 + }, + { + "epoch": 1.74, + "learning_rate": 3.907346396012245e-05, + "loss": 0.0084, + "step": 671070 + }, + { + "epoch": 1.74, + "learning_rate": 3.906957574375098e-05, + "loss": 0.0098, + "step": 671080 + }, + { + "epoch": 1.74, + "learning_rate": 3.906568752737952e-05, + "loss": 0.0157, + "step": 671090 + }, + { + "epoch": 1.74, + "learning_rate": 3.906179931100805e-05, + "loss": 0.0093, + "step": 671100 + }, + { + "epoch": 1.74, + "learning_rate": 3.905791109463659e-05, + "loss": 0.0092, + "step": 671110 + }, + { + "epoch": 1.74, + "learning_rate": 3.905402287826513e-05, + "loss": 0.0094, + "step": 671120 + }, + { + "epoch": 1.74, + "learning_rate": 3.905013466189366e-05, + "loss": 0.0082, + "step": 671130 + }, + { + "epoch": 1.74, + "learning_rate": 3.90462464455222e-05, + "loss": 0.0063, + "step": 671140 + }, + { + "epoch": 1.74, + "learning_rate": 3.904235822915073e-05, + "loss": 0.0079, + "step": 671150 + }, + { + "epoch": 1.74, + "learning_rate": 3.903847001277927e-05, + "loss": 0.0088, + "step": 671160 + }, + { + "epoch": 1.74, + "learning_rate": 3.90345817964078e-05, + "loss": 0.0092, + "step": 671170 + }, + { + "epoch": 1.74, + "learning_rate": 3.903069358003634e-05, + "loss": 0.0077, + "step": 671180 + }, + { + "epoch": 1.74, + "learning_rate": 3.902680536366488e-05, + "loss": 0.0092, + "step": 671190 + }, + { + "epoch": 1.74, + "learning_rate": 3.9022917147293414e-05, + "loss": 0.0075, + "step": 671200 + }, + { + "epoch": 1.74, + "learning_rate": 3.901902893092195e-05, + "loss": 0.0075, + "step": 671210 + }, + { + "epoch": 1.74, + "learning_rate": 3.9015140714550484e-05, + "loss": 0.007, + "step": 671220 + }, + { + "epoch": 1.74, + "learning_rate": 3.901125249817902e-05, + "loss": 0.0096, + "step": 671230 + }, + { + "epoch": 1.74, + "learning_rate": 3.900736428180755e-05, + "loss": 0.0086, + "step": 671240 + }, + { + "epoch": 1.74, + "learning_rate": 3.900347606543609e-05, + "loss": 0.0084, + "step": 671250 + }, + { + "epoch": 1.74, + "learning_rate": 3.8999587849064616e-05, + "loss": 0.0078, + "step": 671260 + }, + { + "epoch": 1.74, + "learning_rate": 3.899569963269315e-05, + "loss": 0.0109, + "step": 671270 + }, + { + "epoch": 1.74, + "learning_rate": 3.8991811416321686e-05, + "loss": 0.0104, + "step": 671280 + }, + { + "epoch": 1.74, + "learning_rate": 3.898792319995023e-05, + "loss": 0.0081, + "step": 671290 + }, + { + "epoch": 1.74, + "learning_rate": 3.898403498357876e-05, + "loss": 0.0066, + "step": 671300 + }, + { + "epoch": 1.74, + "learning_rate": 3.89801467672073e-05, + "loss": 0.0097, + "step": 671310 + }, + { + "epoch": 1.74, + "learning_rate": 3.897625855083583e-05, + "loss": 0.0083, + "step": 671320 + }, + { + "epoch": 1.74, + "learning_rate": 3.897237033446437e-05, + "loss": 0.0065, + "step": 671330 + }, + { + "epoch": 1.74, + "learning_rate": 3.89684821180929e-05, + "loss": 0.0073, + "step": 671340 + }, + { + "epoch": 1.74, + "learning_rate": 3.896459390172144e-05, + "loss": 0.0056, + "step": 671350 + }, + { + "epoch": 1.74, + "learning_rate": 3.896070568534997e-05, + "loss": 0.0062, + "step": 671360 + }, + { + "epoch": 1.74, + "learning_rate": 3.895681746897851e-05, + "loss": 0.0091, + "step": 671370 + }, + { + "epoch": 1.74, + "learning_rate": 3.895292925260705e-05, + "loss": 0.0068, + "step": 671380 + }, + { + "epoch": 1.74, + "learning_rate": 3.894904103623558e-05, + "loss": 0.0072, + "step": 671390 + }, + { + "epoch": 1.74, + "learning_rate": 3.894515281986412e-05, + "loss": 0.0065, + "step": 671400 + }, + { + "epoch": 1.74, + "learning_rate": 3.894126460349265e-05, + "loss": 0.0081, + "step": 671410 + }, + { + "epoch": 1.74, + "learning_rate": 3.893737638712119e-05, + "loss": 0.0058, + "step": 671420 + }, + { + "epoch": 1.74, + "learning_rate": 3.893348817074972e-05, + "loss": 0.0061, + "step": 671430 + }, + { + "epoch": 1.74, + "learning_rate": 3.892959995437826e-05, + "loss": 0.0064, + "step": 671440 + }, + { + "epoch": 1.74, + "learning_rate": 3.89257117380068e-05, + "loss": 0.0069, + "step": 671450 + }, + { + "epoch": 1.74, + "learning_rate": 3.8921823521635334e-05, + "loss": 0.0083, + "step": 671460 + }, + { + "epoch": 1.74, + "learning_rate": 3.891793530526387e-05, + "loss": 0.0071, + "step": 671470 + }, + { + "epoch": 1.74, + "learning_rate": 3.8914047088892404e-05, + "loss": 0.0101, + "step": 671480 + }, + { + "epoch": 1.74, + "learning_rate": 3.891015887252094e-05, + "loss": 0.0086, + "step": 671490 + }, + { + "epoch": 1.74, + "learning_rate": 3.890627065614947e-05, + "loss": 0.0069, + "step": 671500 + }, + { + "epoch": 1.74, + "learning_rate": 3.8902382439778e-05, + "loss": 0.0083, + "step": 671510 + }, + { + "epoch": 1.74, + "learning_rate": 3.8898494223406536e-05, + "loss": 0.0068, + "step": 671520 + }, + { + "epoch": 1.74, + "learning_rate": 3.889460600703507e-05, + "loss": 0.0102, + "step": 671530 + }, + { + "epoch": 1.74, + "learning_rate": 3.8890717790663606e-05, + "loss": 0.0114, + "step": 671540 + }, + { + "epoch": 1.74, + "learning_rate": 3.888682957429215e-05, + "loss": 0.007, + "step": 671550 + }, + { + "epoch": 1.74, + "learning_rate": 3.888294135792068e-05, + "loss": 0.0077, + "step": 671560 + }, + { + "epoch": 1.74, + "learning_rate": 3.887905314154922e-05, + "loss": 0.0078, + "step": 671570 + }, + { + "epoch": 1.74, + "learning_rate": 3.887516492517775e-05, + "loss": 0.0095, + "step": 671580 + }, + { + "epoch": 1.74, + "learning_rate": 3.887127670880629e-05, + "loss": 0.0124, + "step": 671590 + }, + { + "epoch": 1.74, + "learning_rate": 3.886738849243482e-05, + "loss": 0.0076, + "step": 671600 + }, + { + "epoch": 1.74, + "learning_rate": 3.886350027606336e-05, + "loss": 0.0064, + "step": 671610 + }, + { + "epoch": 1.74, + "learning_rate": 3.885961205969189e-05, + "loss": 0.0073, + "step": 671620 + }, + { + "epoch": 1.74, + "learning_rate": 3.8855723843320427e-05, + "loss": 0.0057, + "step": 671630 + }, + { + "epoch": 1.74, + "learning_rate": 3.885183562694897e-05, + "loss": 0.0067, + "step": 671640 + }, + { + "epoch": 1.74, + "learning_rate": 3.88479474105775e-05, + "loss": 0.0075, + "step": 671650 + }, + { + "epoch": 1.74, + "learning_rate": 3.884405919420604e-05, + "loss": 0.0074, + "step": 671660 + }, + { + "epoch": 1.74, + "learning_rate": 3.884017097783457e-05, + "loss": 0.0094, + "step": 671670 + }, + { + "epoch": 1.74, + "learning_rate": 3.883628276146311e-05, + "loss": 0.0082, + "step": 671680 + }, + { + "epoch": 1.74, + "learning_rate": 3.883239454509164e-05, + "loss": 0.0118, + "step": 671690 + }, + { + "epoch": 1.74, + "learning_rate": 3.882850632872018e-05, + "loss": 0.0062, + "step": 671700 + }, + { + "epoch": 1.74, + "learning_rate": 3.882461811234871e-05, + "loss": 0.0065, + "step": 671710 + }, + { + "epoch": 1.74, + "learning_rate": 3.8820729895977254e-05, + "loss": 0.0064, + "step": 671720 + }, + { + "epoch": 1.74, + "learning_rate": 3.881684167960579e-05, + "loss": 0.0066, + "step": 671730 + }, + { + "epoch": 1.74, + "learning_rate": 3.8812953463234324e-05, + "loss": 0.0071, + "step": 671740 + }, + { + "epoch": 1.74, + "learning_rate": 3.880906524686285e-05, + "loss": 0.0071, + "step": 671750 + }, + { + "epoch": 1.74, + "learning_rate": 3.8805177030491386e-05, + "loss": 0.0059, + "step": 671760 + }, + { + "epoch": 1.74, + "learning_rate": 3.880128881411992e-05, + "loss": 0.0069, + "step": 671770 + }, + { + "epoch": 1.74, + "learning_rate": 3.8797400597748456e-05, + "loss": 0.0085, + "step": 671780 + }, + { + "epoch": 1.74, + "learning_rate": 3.879351238137699e-05, + "loss": 0.0076, + "step": 671790 + }, + { + "epoch": 1.74, + "learning_rate": 3.8789624165005526e-05, + "loss": 0.0076, + "step": 671800 + }, + { + "epoch": 1.74, + "learning_rate": 3.878573594863406e-05, + "loss": 0.0102, + "step": 671810 + }, + { + "epoch": 1.74, + "learning_rate": 3.87818477322626e-05, + "loss": 0.0079, + "step": 671820 + }, + { + "epoch": 1.74, + "learning_rate": 3.877795951589114e-05, + "loss": 0.0073, + "step": 671830 + }, + { + "epoch": 1.74, + "learning_rate": 3.877407129951967e-05, + "loss": 0.0055, + "step": 671840 + }, + { + "epoch": 1.74, + "learning_rate": 3.877018308314821e-05, + "loss": 0.0058, + "step": 671850 + }, + { + "epoch": 1.74, + "learning_rate": 3.876629486677674e-05, + "loss": 0.0074, + "step": 671860 + }, + { + "epoch": 1.74, + "learning_rate": 3.876240665040528e-05, + "loss": 0.0078, + "step": 671870 + }, + { + "epoch": 1.74, + "learning_rate": 3.875851843403381e-05, + "loss": 0.0056, + "step": 671880 + }, + { + "epoch": 1.74, + "learning_rate": 3.8754630217662346e-05, + "loss": 0.0065, + "step": 671890 + }, + { + "epoch": 1.74, + "learning_rate": 3.875074200129089e-05, + "loss": 0.0093, + "step": 671900 + }, + { + "epoch": 1.74, + "learning_rate": 3.874685378491942e-05, + "loss": 0.0069, + "step": 671910 + }, + { + "epoch": 1.74, + "learning_rate": 3.874296556854796e-05, + "loss": 0.008, + "step": 671920 + }, + { + "epoch": 1.74, + "learning_rate": 3.873907735217649e-05, + "loss": 0.0091, + "step": 671930 + }, + { + "epoch": 1.74, + "learning_rate": 3.873518913580503e-05, + "loss": 0.0084, + "step": 671940 + }, + { + "epoch": 1.74, + "learning_rate": 3.873130091943356e-05, + "loss": 0.0098, + "step": 671950 + }, + { + "epoch": 1.74, + "learning_rate": 3.87274127030621e-05, + "loss": 0.0065, + "step": 671960 + }, + { + "epoch": 1.74, + "learning_rate": 3.872352448669063e-05, + "loss": 0.009, + "step": 671970 + }, + { + "epoch": 1.74, + "learning_rate": 3.8719636270319174e-05, + "loss": 0.0073, + "step": 671980 + }, + { + "epoch": 1.74, + "learning_rate": 3.871574805394771e-05, + "loss": 0.0052, + "step": 671990 + }, + { + "epoch": 1.74, + "learning_rate": 3.871185983757624e-05, + "loss": 0.008, + "step": 672000 + }, + { + "epoch": 1.74, + "eval_cer": 0.8816508997566032, + "eval_loss": 0.00507059833034873, + "eval_runtime": 107.8496, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 672000 + }, + { + "epoch": 1.74, + "learning_rate": 3.870797162120477e-05, + "loss": 0.01, + "step": 672010 + }, + { + "epoch": 1.74, + "learning_rate": 3.8704083404833306e-05, + "loss": 0.0073, + "step": 672020 + }, + { + "epoch": 1.74, + "learning_rate": 3.870019518846184e-05, + "loss": 0.0084, + "step": 672030 + }, + { + "epoch": 1.74, + "learning_rate": 3.8696306972090376e-05, + "loss": 0.0082, + "step": 672040 + }, + { + "epoch": 1.74, + "learning_rate": 3.869241875571891e-05, + "loss": 0.0114, + "step": 672050 + }, + { + "epoch": 1.74, + "learning_rate": 3.8688530539347446e-05, + "loss": 0.0093, + "step": 672060 + }, + { + "epoch": 1.74, + "learning_rate": 3.868464232297598e-05, + "loss": 0.0082, + "step": 672070 + }, + { + "epoch": 1.74, + "learning_rate": 3.868075410660452e-05, + "loss": 0.0097, + "step": 672080 + }, + { + "epoch": 1.74, + "learning_rate": 3.867686589023306e-05, + "loss": 0.0088, + "step": 672090 + }, + { + "epoch": 1.74, + "learning_rate": 3.867297767386159e-05, + "loss": 0.0108, + "step": 672100 + }, + { + "epoch": 1.74, + "learning_rate": 3.866908945749013e-05, + "loss": 0.0081, + "step": 672110 + }, + { + "epoch": 1.74, + "learning_rate": 3.866520124111866e-05, + "loss": 0.0071, + "step": 672120 + }, + { + "epoch": 1.74, + "learning_rate": 3.86613130247472e-05, + "loss": 0.0078, + "step": 672130 + }, + { + "epoch": 1.74, + "learning_rate": 3.865742480837573e-05, + "loss": 0.0068, + "step": 672140 + }, + { + "epoch": 1.74, + "learning_rate": 3.8653536592004266e-05, + "loss": 0.0081, + "step": 672150 + }, + { + "epoch": 1.74, + "learning_rate": 3.864964837563281e-05, + "loss": 0.0085, + "step": 672160 + }, + { + "epoch": 1.74, + "learning_rate": 3.864576015926134e-05, + "loss": 0.01, + "step": 672170 + }, + { + "epoch": 1.74, + "learning_rate": 3.864187194288988e-05, + "loss": 0.0081, + "step": 672180 + }, + { + "epoch": 1.74, + "learning_rate": 3.863798372651841e-05, + "loss": 0.0069, + "step": 672190 + }, + { + "epoch": 1.74, + "learning_rate": 3.863409551014695e-05, + "loss": 0.0081, + "step": 672200 + }, + { + "epoch": 1.74, + "learning_rate": 3.863020729377548e-05, + "loss": 0.0086, + "step": 672210 + }, + { + "epoch": 1.74, + "learning_rate": 3.862631907740402e-05, + "loss": 0.0101, + "step": 672220 + }, + { + "epoch": 1.74, + "learning_rate": 3.862243086103255e-05, + "loss": 0.0099, + "step": 672230 + }, + { + "epoch": 1.74, + "learning_rate": 3.8618542644661094e-05, + "loss": 0.0079, + "step": 672240 + }, + { + "epoch": 1.74, + "learning_rate": 3.8614654428289615e-05, + "loss": 0.0054, + "step": 672250 + }, + { + "epoch": 1.74, + "learning_rate": 3.861076621191816e-05, + "loss": 0.0095, + "step": 672260 + }, + { + "epoch": 1.74, + "learning_rate": 3.860687799554669e-05, + "loss": 0.0058, + "step": 672270 + }, + { + "epoch": 1.74, + "learning_rate": 3.8602989779175226e-05, + "loss": 0.01, + "step": 672280 + }, + { + "epoch": 1.74, + "learning_rate": 3.859910156280376e-05, + "loss": 0.0062, + "step": 672290 + }, + { + "epoch": 1.74, + "learning_rate": 3.8595213346432296e-05, + "loss": 0.0065, + "step": 672300 + }, + { + "epoch": 1.74, + "learning_rate": 3.859132513006083e-05, + "loss": 0.0119, + "step": 672310 + }, + { + "epoch": 1.74, + "learning_rate": 3.8587436913689366e-05, + "loss": 0.006, + "step": 672320 + }, + { + "epoch": 1.74, + "learning_rate": 3.85835486973179e-05, + "loss": 0.0091, + "step": 672330 + }, + { + "epoch": 1.74, + "learning_rate": 3.857966048094644e-05, + "loss": 0.0073, + "step": 672340 + }, + { + "epoch": 1.74, + "learning_rate": 3.857577226457498e-05, + "loss": 0.007, + "step": 672350 + }, + { + "epoch": 1.74, + "learning_rate": 3.857188404820351e-05, + "loss": 0.0094, + "step": 672360 + }, + { + "epoch": 1.74, + "learning_rate": 3.856799583183205e-05, + "loss": 0.0065, + "step": 672370 + }, + { + "epoch": 1.74, + "learning_rate": 3.856410761546058e-05, + "loss": 0.0083, + "step": 672380 + }, + { + "epoch": 1.74, + "learning_rate": 3.856021939908912e-05, + "loss": 0.0088, + "step": 672390 + }, + { + "epoch": 1.74, + "learning_rate": 3.855633118271765e-05, + "loss": 0.0136, + "step": 672400 + }, + { + "epoch": 1.74, + "learning_rate": 3.8552442966346186e-05, + "loss": 0.0099, + "step": 672410 + }, + { + "epoch": 1.74, + "learning_rate": 3.854855474997473e-05, + "loss": 0.0157, + "step": 672420 + }, + { + "epoch": 1.74, + "learning_rate": 3.854466653360326e-05, + "loss": 0.0082, + "step": 672430 + }, + { + "epoch": 1.74, + "learning_rate": 3.85407783172318e-05, + "loss": 0.007, + "step": 672440 + }, + { + "epoch": 1.74, + "learning_rate": 3.853689010086033e-05, + "loss": 0.0067, + "step": 672450 + }, + { + "epoch": 1.74, + "learning_rate": 3.853300188448887e-05, + "loss": 0.013, + "step": 672460 + }, + { + "epoch": 1.74, + "learning_rate": 3.85291136681174e-05, + "loss": 0.0075, + "step": 672470 + }, + { + "epoch": 1.74, + "learning_rate": 3.852522545174594e-05, + "loss": 0.0093, + "step": 672480 + }, + { + "epoch": 1.74, + "learning_rate": 3.852133723537447e-05, + "loss": 0.0096, + "step": 672490 + }, + { + "epoch": 1.74, + "learning_rate": 3.8517449019003e-05, + "loss": 0.0073, + "step": 672500 + }, + { + "epoch": 1.74, + "learning_rate": 3.8513560802631535e-05, + "loss": 0.0065, + "step": 672510 + }, + { + "epoch": 1.74, + "learning_rate": 3.850967258626008e-05, + "loss": 0.0089, + "step": 672520 + }, + { + "epoch": 1.74, + "learning_rate": 3.850578436988861e-05, + "loss": 0.0097, + "step": 672530 + }, + { + "epoch": 1.74, + "learning_rate": 3.8501896153517146e-05, + "loss": 0.0111, + "step": 672540 + }, + { + "epoch": 1.74, + "learning_rate": 3.849800793714568e-05, + "loss": 0.0068, + "step": 672550 + }, + { + "epoch": 1.74, + "learning_rate": 3.8494119720774216e-05, + "loss": 0.0066, + "step": 672560 + }, + { + "epoch": 1.74, + "learning_rate": 3.849023150440275e-05, + "loss": 0.0056, + "step": 672570 + }, + { + "epoch": 1.74, + "learning_rate": 3.8486343288031286e-05, + "loss": 0.0095, + "step": 672580 + }, + { + "epoch": 1.74, + "learning_rate": 3.848245507165982e-05, + "loss": 0.0087, + "step": 672590 + }, + { + "epoch": 1.74, + "learning_rate": 3.847856685528836e-05, + "loss": 0.0088, + "step": 672600 + }, + { + "epoch": 1.74, + "learning_rate": 3.84746786389169e-05, + "loss": 0.0084, + "step": 672610 + }, + { + "epoch": 1.74, + "learning_rate": 3.847079042254543e-05, + "loss": 0.0101, + "step": 672620 + }, + { + "epoch": 1.74, + "learning_rate": 3.846690220617397e-05, + "loss": 0.0087, + "step": 672630 + }, + { + "epoch": 1.74, + "learning_rate": 3.84630139898025e-05, + "loss": 0.0073, + "step": 672640 + }, + { + "epoch": 1.74, + "learning_rate": 3.8459125773431037e-05, + "loss": 0.0088, + "step": 672650 + }, + { + "epoch": 1.74, + "learning_rate": 3.845523755705957e-05, + "loss": 0.0088, + "step": 672660 + }, + { + "epoch": 1.74, + "learning_rate": 3.8451349340688106e-05, + "loss": 0.0069, + "step": 672670 + }, + { + "epoch": 1.74, + "learning_rate": 3.844746112431665e-05, + "loss": 0.0075, + "step": 672680 + }, + { + "epoch": 1.74, + "learning_rate": 3.844357290794518e-05, + "loss": 0.0079, + "step": 672690 + }, + { + "epoch": 1.74, + "learning_rate": 3.843968469157372e-05, + "loss": 0.0063, + "step": 672700 + }, + { + "epoch": 1.74, + "learning_rate": 3.843579647520225e-05, + "loss": 0.0065, + "step": 672710 + }, + { + "epoch": 1.74, + "learning_rate": 3.843190825883079e-05, + "loss": 0.0093, + "step": 672720 + }, + { + "epoch": 1.74, + "learning_rate": 3.842802004245932e-05, + "loss": 0.007, + "step": 672730 + }, + { + "epoch": 1.74, + "learning_rate": 3.842413182608786e-05, + "loss": 0.0076, + "step": 672740 + }, + { + "epoch": 1.74, + "learning_rate": 3.8420243609716385e-05, + "loss": 0.0078, + "step": 672750 + }, + { + "epoch": 1.74, + "learning_rate": 3.841635539334492e-05, + "loss": 0.0103, + "step": 672760 + }, + { + "epoch": 1.74, + "learning_rate": 3.8412467176973455e-05, + "loss": 0.0075, + "step": 672770 + }, + { + "epoch": 1.74, + "learning_rate": 3.8408578960601997e-05, + "loss": 0.0084, + "step": 672780 + }, + { + "epoch": 1.74, + "learning_rate": 3.840469074423053e-05, + "loss": 0.007, + "step": 672790 + }, + { + "epoch": 1.74, + "learning_rate": 3.8400802527859066e-05, + "loss": 0.008, + "step": 672800 + }, + { + "epoch": 1.74, + "learning_rate": 3.83969143114876e-05, + "loss": 0.0078, + "step": 672810 + }, + { + "epoch": 1.74, + "learning_rate": 3.8393026095116136e-05, + "loss": 0.0102, + "step": 672820 + }, + { + "epoch": 1.74, + "learning_rate": 3.838913787874467e-05, + "loss": 0.0068, + "step": 672830 + }, + { + "epoch": 1.74, + "learning_rate": 3.8385249662373206e-05, + "loss": 0.0077, + "step": 672840 + }, + { + "epoch": 1.74, + "learning_rate": 3.838136144600174e-05, + "loss": 0.0081, + "step": 672850 + }, + { + "epoch": 1.74, + "learning_rate": 3.837747322963028e-05, + "loss": 0.0091, + "step": 672860 + }, + { + "epoch": 1.74, + "learning_rate": 3.837358501325882e-05, + "loss": 0.0087, + "step": 672870 + }, + { + "epoch": 1.74, + "learning_rate": 3.836969679688735e-05, + "loss": 0.0072, + "step": 672880 + }, + { + "epoch": 1.74, + "learning_rate": 3.836580858051589e-05, + "loss": 0.0096, + "step": 672890 + }, + { + "epoch": 1.74, + "learning_rate": 3.836192036414442e-05, + "loss": 0.0073, + "step": 672900 + }, + { + "epoch": 1.74, + "learning_rate": 3.8358032147772957e-05, + "loss": 0.0102, + "step": 672910 + }, + { + "epoch": 1.74, + "learning_rate": 3.835414393140149e-05, + "loss": 0.0068, + "step": 672920 + }, + { + "epoch": 1.74, + "learning_rate": 3.8350255715030026e-05, + "loss": 0.0075, + "step": 672930 + }, + { + "epoch": 1.74, + "learning_rate": 3.834636749865856e-05, + "loss": 0.0088, + "step": 672940 + }, + { + "epoch": 1.74, + "learning_rate": 3.83424792822871e-05, + "loss": 0.0048, + "step": 672950 + }, + { + "epoch": 1.74, + "learning_rate": 3.833859106591564e-05, + "loss": 0.009, + "step": 672960 + }, + { + "epoch": 1.74, + "learning_rate": 3.833470284954417e-05, + "loss": 0.0073, + "step": 672970 + }, + { + "epoch": 1.74, + "learning_rate": 3.833081463317271e-05, + "loss": 0.0082, + "step": 672980 + }, + { + "epoch": 1.74, + "learning_rate": 3.8326926416801235e-05, + "loss": 0.0086, + "step": 672990 + }, + { + "epoch": 1.74, + "learning_rate": 3.832303820042977e-05, + "loss": 0.0095, + "step": 673000 + }, + { + "epoch": 1.74, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.005063023883849382, + "eval_runtime": 108.0509, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.627, + "step": 673000 + }, + { + "epoch": 1.74, + "learning_rate": 3.8319149984058305e-05, + "loss": 0.0098, + "step": 673010 + }, + { + "epoch": 1.74, + "learning_rate": 3.831526176768684e-05, + "loss": 0.0068, + "step": 673020 + }, + { + "epoch": 1.74, + "learning_rate": 3.8311373551315375e-05, + "loss": 0.0071, + "step": 673030 + }, + { + "epoch": 1.74, + "learning_rate": 3.8307485334943917e-05, + "loss": 0.0094, + "step": 673040 + }, + { + "epoch": 1.74, + "learning_rate": 3.830359711857245e-05, + "loss": 0.006, + "step": 673050 + }, + { + "epoch": 1.74, + "learning_rate": 3.8299708902200986e-05, + "loss": 0.0064, + "step": 673060 + }, + { + "epoch": 1.74, + "learning_rate": 3.829582068582952e-05, + "loss": 0.0074, + "step": 673070 + }, + { + "epoch": 1.74, + "learning_rate": 3.8291932469458056e-05, + "loss": 0.0081, + "step": 673080 + }, + { + "epoch": 1.74, + "learning_rate": 3.828804425308659e-05, + "loss": 0.0069, + "step": 673090 + }, + { + "epoch": 1.74, + "learning_rate": 3.8284156036715126e-05, + "loss": 0.0052, + "step": 673100 + }, + { + "epoch": 1.74, + "learning_rate": 3.828026782034366e-05, + "loss": 0.0088, + "step": 673110 + }, + { + "epoch": 1.74, + "learning_rate": 3.8276379603972195e-05, + "loss": 0.0078, + "step": 673120 + }, + { + "epoch": 1.74, + "learning_rate": 3.827249138760074e-05, + "loss": 0.0086, + "step": 673130 + }, + { + "epoch": 1.74, + "learning_rate": 3.826860317122927e-05, + "loss": 0.0077, + "step": 673140 + }, + { + "epoch": 1.74, + "learning_rate": 3.826471495485781e-05, + "loss": 0.0086, + "step": 673150 + }, + { + "epoch": 1.74, + "learning_rate": 3.826082673848634e-05, + "loss": 0.0064, + "step": 673160 + }, + { + "epoch": 1.74, + "learning_rate": 3.8256938522114876e-05, + "loss": 0.0062, + "step": 673170 + }, + { + "epoch": 1.74, + "learning_rate": 3.825305030574341e-05, + "loss": 0.0074, + "step": 673180 + }, + { + "epoch": 1.75, + "learning_rate": 3.8249162089371946e-05, + "loss": 0.0068, + "step": 673190 + }, + { + "epoch": 1.75, + "learning_rate": 3.824527387300048e-05, + "loss": 0.007, + "step": 673200 + }, + { + "epoch": 1.75, + "learning_rate": 3.824138565662902e-05, + "loss": 0.0056, + "step": 673210 + }, + { + "epoch": 1.75, + "learning_rate": 3.823749744025756e-05, + "loss": 0.0083, + "step": 673220 + }, + { + "epoch": 1.75, + "learning_rate": 3.823360922388609e-05, + "loss": 0.0081, + "step": 673230 + }, + { + "epoch": 1.75, + "learning_rate": 3.822972100751462e-05, + "loss": 0.0076, + "step": 673240 + }, + { + "epoch": 1.75, + "learning_rate": 3.8225832791143155e-05, + "loss": 0.007, + "step": 673250 + }, + { + "epoch": 1.75, + "learning_rate": 3.822194457477169e-05, + "loss": 0.0075, + "step": 673260 + }, + { + "epoch": 1.75, + "learning_rate": 3.8218056358400225e-05, + "loss": 0.006, + "step": 673270 + }, + { + "epoch": 1.75, + "learning_rate": 3.821416814202876e-05, + "loss": 0.0114, + "step": 673280 + }, + { + "epoch": 1.75, + "learning_rate": 3.8210279925657295e-05, + "loss": 0.0084, + "step": 673290 + }, + { + "epoch": 1.75, + "learning_rate": 3.820639170928583e-05, + "loss": 0.0068, + "step": 673300 + }, + { + "epoch": 1.75, + "learning_rate": 3.820250349291437e-05, + "loss": 0.0094, + "step": 673310 + }, + { + "epoch": 1.75, + "learning_rate": 3.8198615276542906e-05, + "loss": 0.0078, + "step": 673320 + }, + { + "epoch": 1.75, + "learning_rate": 3.819472706017144e-05, + "loss": 0.0066, + "step": 673330 + }, + { + "epoch": 1.75, + "learning_rate": 3.8190838843799976e-05, + "loss": 0.0091, + "step": 673340 + }, + { + "epoch": 1.75, + "learning_rate": 3.818695062742851e-05, + "loss": 0.0078, + "step": 673350 + }, + { + "epoch": 1.75, + "learning_rate": 3.8183062411057046e-05, + "loss": 0.0059, + "step": 673360 + }, + { + "epoch": 1.75, + "learning_rate": 3.817917419468558e-05, + "loss": 0.0065, + "step": 673370 + }, + { + "epoch": 1.75, + "learning_rate": 3.8175285978314115e-05, + "loss": 0.0108, + "step": 673380 + }, + { + "epoch": 1.75, + "learning_rate": 3.817139776194266e-05, + "loss": 0.012, + "step": 673390 + }, + { + "epoch": 1.75, + "learning_rate": 3.816750954557119e-05, + "loss": 0.0106, + "step": 673400 + }, + { + "epoch": 1.75, + "learning_rate": 3.816362132919973e-05, + "loss": 0.009, + "step": 673410 + }, + { + "epoch": 1.75, + "learning_rate": 3.815973311282826e-05, + "loss": 0.0063, + "step": 673420 + }, + { + "epoch": 1.75, + "learning_rate": 3.8155844896456796e-05, + "loss": 0.0094, + "step": 673430 + }, + { + "epoch": 1.75, + "learning_rate": 3.815195668008533e-05, + "loss": 0.0112, + "step": 673440 + }, + { + "epoch": 1.75, + "learning_rate": 3.8148068463713866e-05, + "loss": 0.0072, + "step": 673450 + }, + { + "epoch": 1.75, + "learning_rate": 3.81441802473424e-05, + "loss": 0.0081, + "step": 673460 + }, + { + "epoch": 1.75, + "learning_rate": 3.814029203097094e-05, + "loss": 0.0056, + "step": 673470 + }, + { + "epoch": 1.75, + "learning_rate": 3.813640381459948e-05, + "loss": 0.0075, + "step": 673480 + }, + { + "epoch": 1.75, + "learning_rate": 3.8132515598228006e-05, + "loss": 0.0084, + "step": 673490 + }, + { + "epoch": 1.75, + "learning_rate": 3.812862738185654e-05, + "loss": 0.0088, + "step": 673500 + }, + { + "epoch": 1.75, + "learning_rate": 3.8124739165485075e-05, + "loss": 0.0078, + "step": 673510 + }, + { + "epoch": 1.75, + "learning_rate": 3.812085094911361e-05, + "loss": 0.0066, + "step": 673520 + }, + { + "epoch": 1.75, + "learning_rate": 3.8116962732742145e-05, + "loss": 0.0076, + "step": 673530 + }, + { + "epoch": 1.75, + "learning_rate": 3.811307451637068e-05, + "loss": 0.0071, + "step": 673540 + }, + { + "epoch": 1.75, + "learning_rate": 3.8109186299999215e-05, + "loss": 0.0094, + "step": 673550 + }, + { + "epoch": 1.75, + "learning_rate": 3.810529808362775e-05, + "loss": 0.0073, + "step": 673560 + }, + { + "epoch": 1.75, + "learning_rate": 3.810140986725629e-05, + "loss": 0.0065, + "step": 673570 + }, + { + "epoch": 1.75, + "learning_rate": 3.8097521650884826e-05, + "loss": 0.0073, + "step": 673580 + }, + { + "epoch": 1.75, + "learning_rate": 3.809363343451336e-05, + "loss": 0.0078, + "step": 673590 + }, + { + "epoch": 1.75, + "learning_rate": 3.8089745218141896e-05, + "loss": 0.0073, + "step": 673600 + }, + { + "epoch": 1.75, + "learning_rate": 3.808585700177043e-05, + "loss": 0.0073, + "step": 673610 + }, + { + "epoch": 1.75, + "learning_rate": 3.8081968785398966e-05, + "loss": 0.0094, + "step": 673620 + }, + { + "epoch": 1.75, + "learning_rate": 3.80780805690275e-05, + "loss": 0.0085, + "step": 673630 + }, + { + "epoch": 1.75, + "learning_rate": 3.8074192352656035e-05, + "loss": 0.008, + "step": 673640 + }, + { + "epoch": 1.75, + "learning_rate": 3.807030413628458e-05, + "loss": 0.0106, + "step": 673650 + }, + { + "epoch": 1.75, + "learning_rate": 3.806641591991311e-05, + "loss": 0.0088, + "step": 673660 + }, + { + "epoch": 1.75, + "learning_rate": 3.806252770354165e-05, + "loss": 0.0075, + "step": 673670 + }, + { + "epoch": 1.75, + "learning_rate": 3.805863948717018e-05, + "loss": 0.0051, + "step": 673680 + }, + { + "epoch": 1.75, + "learning_rate": 3.8054751270798716e-05, + "loss": 0.0068, + "step": 673690 + }, + { + "epoch": 1.75, + "learning_rate": 3.805086305442725e-05, + "loss": 0.0116, + "step": 673700 + }, + { + "epoch": 1.75, + "learning_rate": 3.8046974838055786e-05, + "loss": 0.0081, + "step": 673710 + }, + { + "epoch": 1.75, + "learning_rate": 3.804308662168432e-05, + "loss": 0.008, + "step": 673720 + }, + { + "epoch": 1.75, + "learning_rate": 3.803919840531286e-05, + "loss": 0.008, + "step": 673730 + }, + { + "epoch": 1.75, + "learning_rate": 3.8035310188941384e-05, + "loss": 0.0089, + "step": 673740 + }, + { + "epoch": 1.75, + "learning_rate": 3.8031421972569926e-05, + "loss": 0.0064, + "step": 673750 + }, + { + "epoch": 1.75, + "learning_rate": 3.802753375619846e-05, + "loss": 0.0059, + "step": 673760 + }, + { + "epoch": 1.75, + "learning_rate": 3.8023645539826995e-05, + "loss": 0.0063, + "step": 673770 + }, + { + "epoch": 1.75, + "learning_rate": 3.801975732345553e-05, + "loss": 0.0086, + "step": 673780 + }, + { + "epoch": 1.75, + "learning_rate": 3.8015869107084065e-05, + "loss": 0.0074, + "step": 673790 + }, + { + "epoch": 1.75, + "learning_rate": 3.80119808907126e-05, + "loss": 0.0082, + "step": 673800 + }, + { + "epoch": 1.75, + "learning_rate": 3.8008092674341135e-05, + "loss": 0.0078, + "step": 673810 + }, + { + "epoch": 1.75, + "learning_rate": 3.800420445796967e-05, + "loss": 0.0085, + "step": 673820 + }, + { + "epoch": 1.75, + "learning_rate": 3.800031624159821e-05, + "loss": 0.0078, + "step": 673830 + }, + { + "epoch": 1.75, + "learning_rate": 3.7996428025226746e-05, + "loss": 0.0092, + "step": 673840 + }, + { + "epoch": 1.75, + "learning_rate": 3.799253980885528e-05, + "loss": 0.007, + "step": 673850 + }, + { + "epoch": 1.75, + "learning_rate": 3.7988651592483816e-05, + "loss": 0.0084, + "step": 673860 + }, + { + "epoch": 1.75, + "learning_rate": 3.798476337611235e-05, + "loss": 0.0074, + "step": 673870 + }, + { + "epoch": 1.75, + "learning_rate": 3.7980875159740886e-05, + "loss": 0.0088, + "step": 673880 + }, + { + "epoch": 1.75, + "learning_rate": 3.797698694336942e-05, + "loss": 0.0064, + "step": 673890 + }, + { + "epoch": 1.75, + "learning_rate": 3.7973098726997955e-05, + "loss": 0.0075, + "step": 673900 + }, + { + "epoch": 1.75, + "learning_rate": 3.79692105106265e-05, + "loss": 0.0077, + "step": 673910 + }, + { + "epoch": 1.75, + "learning_rate": 3.796532229425503e-05, + "loss": 0.0057, + "step": 673920 + }, + { + "epoch": 1.75, + "learning_rate": 3.796143407788357e-05, + "loss": 0.0093, + "step": 673930 + }, + { + "epoch": 1.75, + "learning_rate": 3.79575458615121e-05, + "loss": 0.0072, + "step": 673940 + }, + { + "epoch": 1.75, + "learning_rate": 3.7953657645140636e-05, + "loss": 0.0066, + "step": 673950 + }, + { + "epoch": 1.75, + "learning_rate": 3.794976942876917e-05, + "loss": 0.0074, + "step": 673960 + }, + { + "epoch": 1.75, + "learning_rate": 3.7945881212397706e-05, + "loss": 0.0097, + "step": 673970 + }, + { + "epoch": 1.75, + "learning_rate": 3.794199299602624e-05, + "loss": 0.0086, + "step": 673980 + }, + { + "epoch": 1.75, + "learning_rate": 3.793810477965477e-05, + "loss": 0.0078, + "step": 673990 + }, + { + "epoch": 1.75, + "learning_rate": 3.7934216563283304e-05, + "loss": 0.0062, + "step": 674000 + }, + { + "epoch": 1.75, + "eval_cer": 0.8816830914060892, + "eval_loss": 0.004991509020328522, + "eval_runtime": 108.0875, + "eval_samples_per_second": 18.504, + "eval_steps_per_second": 4.626, + "step": 674000 + }, + { + "epoch": 1.75, + "learning_rate": 3.7930328346911846e-05, + "loss": 0.0074, + "step": 674010 + }, + { + "epoch": 1.75, + "learning_rate": 3.792644013054038e-05, + "loss": 0.0093, + "step": 674020 + }, + { + "epoch": 1.75, + "learning_rate": 3.7922551914168915e-05, + "loss": 0.0126, + "step": 674030 + }, + { + "epoch": 1.75, + "learning_rate": 3.791866369779745e-05, + "loss": 0.0077, + "step": 674040 + }, + { + "epoch": 1.75, + "learning_rate": 3.7914775481425985e-05, + "loss": 0.0088, + "step": 674050 + }, + { + "epoch": 1.75, + "learning_rate": 3.791088726505452e-05, + "loss": 0.0074, + "step": 674060 + }, + { + "epoch": 1.75, + "learning_rate": 3.7906999048683055e-05, + "loss": 0.0102, + "step": 674070 + }, + { + "epoch": 1.75, + "learning_rate": 3.790311083231159e-05, + "loss": 0.0074, + "step": 674080 + }, + { + "epoch": 1.75, + "learning_rate": 3.789922261594013e-05, + "loss": 0.0116, + "step": 674090 + }, + { + "epoch": 1.75, + "learning_rate": 3.7895334399568666e-05, + "loss": 0.0064, + "step": 674100 + }, + { + "epoch": 1.75, + "learning_rate": 3.78914461831972e-05, + "loss": 0.0081, + "step": 674110 + }, + { + "epoch": 1.75, + "learning_rate": 3.7887557966825736e-05, + "loss": 0.007, + "step": 674120 + }, + { + "epoch": 1.75, + "learning_rate": 3.788366975045427e-05, + "loss": 0.0058, + "step": 674130 + }, + { + "epoch": 1.75, + "learning_rate": 3.7879781534082805e-05, + "loss": 0.0073, + "step": 674140 + }, + { + "epoch": 1.75, + "learning_rate": 3.787589331771134e-05, + "loss": 0.0061, + "step": 674150 + }, + { + "epoch": 1.75, + "learning_rate": 3.7872005101339875e-05, + "loss": 0.0061, + "step": 674160 + }, + { + "epoch": 1.75, + "learning_rate": 3.786811688496842e-05, + "loss": 0.0094, + "step": 674170 + }, + { + "epoch": 1.75, + "learning_rate": 3.786422866859695e-05, + "loss": 0.0046, + "step": 674180 + }, + { + "epoch": 1.75, + "learning_rate": 3.7860340452225487e-05, + "loss": 0.0078, + "step": 674190 + }, + { + "epoch": 1.75, + "learning_rate": 3.785645223585402e-05, + "loss": 0.009, + "step": 674200 + }, + { + "epoch": 1.75, + "learning_rate": 3.7852564019482556e-05, + "loss": 0.01, + "step": 674210 + }, + { + "epoch": 1.75, + "learning_rate": 3.784867580311109e-05, + "loss": 0.0055, + "step": 674220 + }, + { + "epoch": 1.75, + "learning_rate": 3.784478758673962e-05, + "loss": 0.0096, + "step": 674230 + }, + { + "epoch": 1.75, + "learning_rate": 3.7840899370368154e-05, + "loss": 0.0155, + "step": 674240 + }, + { + "epoch": 1.75, + "learning_rate": 3.783701115399669e-05, + "loss": 0.0081, + "step": 674250 + }, + { + "epoch": 1.75, + "learning_rate": 3.7833122937625224e-05, + "loss": 0.0075, + "step": 674260 + }, + { + "epoch": 1.75, + "learning_rate": 3.7829234721253765e-05, + "loss": 0.0084, + "step": 674270 + }, + { + "epoch": 1.75, + "learning_rate": 3.78253465048823e-05, + "loss": 0.0068, + "step": 674280 + }, + { + "epoch": 1.75, + "learning_rate": 3.7821458288510835e-05, + "loss": 0.0068, + "step": 674290 + }, + { + "epoch": 1.75, + "learning_rate": 3.781757007213937e-05, + "loss": 0.0085, + "step": 674300 + }, + { + "epoch": 1.75, + "learning_rate": 3.7813681855767905e-05, + "loss": 0.0078, + "step": 674310 + }, + { + "epoch": 1.75, + "learning_rate": 3.780979363939644e-05, + "loss": 0.0072, + "step": 674320 + }, + { + "epoch": 1.75, + "learning_rate": 3.7805905423024975e-05, + "loss": 0.0088, + "step": 674330 + }, + { + "epoch": 1.75, + "learning_rate": 3.780201720665351e-05, + "loss": 0.0095, + "step": 674340 + }, + { + "epoch": 1.75, + "learning_rate": 3.779812899028205e-05, + "loss": 0.0075, + "step": 674350 + }, + { + "epoch": 1.75, + "learning_rate": 3.7794240773910586e-05, + "loss": 0.0077, + "step": 674360 + }, + { + "epoch": 1.75, + "learning_rate": 3.779035255753912e-05, + "loss": 0.0056, + "step": 674370 + }, + { + "epoch": 1.75, + "learning_rate": 3.7786464341167656e-05, + "loss": 0.0078, + "step": 674380 + }, + { + "epoch": 1.75, + "learning_rate": 3.778257612479619e-05, + "loss": 0.008, + "step": 674390 + }, + { + "epoch": 1.75, + "learning_rate": 3.7778687908424725e-05, + "loss": 0.0064, + "step": 674400 + }, + { + "epoch": 1.75, + "learning_rate": 3.777479969205326e-05, + "loss": 0.0082, + "step": 674410 + }, + { + "epoch": 1.75, + "learning_rate": 3.7770911475681795e-05, + "loss": 0.0081, + "step": 674420 + }, + { + "epoch": 1.75, + "learning_rate": 3.776702325931033e-05, + "loss": 0.0099, + "step": 674430 + }, + { + "epoch": 1.75, + "learning_rate": 3.776313504293887e-05, + "loss": 0.0081, + "step": 674440 + }, + { + "epoch": 1.75, + "learning_rate": 3.7759246826567407e-05, + "loss": 0.0101, + "step": 674450 + }, + { + "epoch": 1.75, + "learning_rate": 3.775535861019594e-05, + "loss": 0.0101, + "step": 674460 + }, + { + "epoch": 1.75, + "learning_rate": 3.7751470393824476e-05, + "loss": 0.0068, + "step": 674470 + }, + { + "epoch": 1.75, + "learning_rate": 3.7747582177453004e-05, + "loss": 0.0057, + "step": 674480 + }, + { + "epoch": 1.75, + "learning_rate": 3.774369396108154e-05, + "loss": 0.0082, + "step": 674490 + }, + { + "epoch": 1.75, + "learning_rate": 3.7739805744710074e-05, + "loss": 0.0085, + "step": 674500 + }, + { + "epoch": 1.75, + "learning_rate": 3.773591752833861e-05, + "loss": 0.0083, + "step": 674510 + }, + { + "epoch": 1.75, + "learning_rate": 3.7732029311967144e-05, + "loss": 0.0047, + "step": 674520 + }, + { + "epoch": 1.75, + "learning_rate": 3.772814109559568e-05, + "loss": 0.006, + "step": 674530 + }, + { + "epoch": 1.75, + "learning_rate": 3.772425287922422e-05, + "loss": 0.0056, + "step": 674540 + }, + { + "epoch": 1.75, + "learning_rate": 3.7720364662852755e-05, + "loss": 0.008, + "step": 674550 + }, + { + "epoch": 1.75, + "learning_rate": 3.771647644648129e-05, + "loss": 0.0059, + "step": 674560 + }, + { + "epoch": 1.75, + "learning_rate": 3.7712588230109825e-05, + "loss": 0.0064, + "step": 674570 + }, + { + "epoch": 1.75, + "learning_rate": 3.770870001373836e-05, + "loss": 0.0088, + "step": 674580 + }, + { + "epoch": 1.75, + "learning_rate": 3.7704811797366895e-05, + "loss": 0.007, + "step": 674590 + }, + { + "epoch": 1.75, + "learning_rate": 3.770092358099543e-05, + "loss": 0.0085, + "step": 674600 + }, + { + "epoch": 1.75, + "learning_rate": 3.7697035364623964e-05, + "loss": 0.0091, + "step": 674610 + }, + { + "epoch": 1.75, + "learning_rate": 3.7693147148252506e-05, + "loss": 0.0097, + "step": 674620 + }, + { + "epoch": 1.75, + "learning_rate": 3.768925893188104e-05, + "loss": 0.0066, + "step": 674630 + }, + { + "epoch": 1.75, + "learning_rate": 3.7685370715509576e-05, + "loss": 0.0066, + "step": 674640 + }, + { + "epoch": 1.75, + "learning_rate": 3.768148249913811e-05, + "loss": 0.0075, + "step": 674650 + }, + { + "epoch": 1.75, + "learning_rate": 3.7677594282766645e-05, + "loss": 0.0078, + "step": 674660 + }, + { + "epoch": 1.75, + "learning_rate": 3.767370606639518e-05, + "loss": 0.0062, + "step": 674670 + }, + { + "epoch": 1.75, + "learning_rate": 3.7669817850023715e-05, + "loss": 0.0077, + "step": 674680 + }, + { + "epoch": 1.75, + "learning_rate": 3.766592963365225e-05, + "loss": 0.0077, + "step": 674690 + }, + { + "epoch": 1.75, + "learning_rate": 3.766204141728079e-05, + "loss": 0.0065, + "step": 674700 + }, + { + "epoch": 1.75, + "learning_rate": 3.7658153200909326e-05, + "loss": 0.0062, + "step": 674710 + }, + { + "epoch": 1.75, + "learning_rate": 3.765426498453786e-05, + "loss": 0.0079, + "step": 674720 + }, + { + "epoch": 1.75, + "learning_rate": 3.765037676816639e-05, + "loss": 0.0085, + "step": 674730 + }, + { + "epoch": 1.75, + "learning_rate": 3.7646488551794924e-05, + "loss": 0.0085, + "step": 674740 + }, + { + "epoch": 1.75, + "learning_rate": 3.764260033542346e-05, + "loss": 0.0085, + "step": 674750 + }, + { + "epoch": 1.75, + "learning_rate": 3.7638712119051994e-05, + "loss": 0.008, + "step": 674760 + }, + { + "epoch": 1.75, + "learning_rate": 3.763482390268053e-05, + "loss": 0.0078, + "step": 674770 + }, + { + "epoch": 1.75, + "learning_rate": 3.7630935686309064e-05, + "loss": 0.0111, + "step": 674780 + }, + { + "epoch": 1.75, + "learning_rate": 3.76270474699376e-05, + "loss": 0.0095, + "step": 674790 + }, + { + "epoch": 1.75, + "learning_rate": 3.762315925356614e-05, + "loss": 0.0079, + "step": 674800 + }, + { + "epoch": 1.75, + "learning_rate": 3.7619271037194675e-05, + "loss": 0.0082, + "step": 674810 + }, + { + "epoch": 1.75, + "learning_rate": 3.761538282082321e-05, + "loss": 0.0073, + "step": 674820 + }, + { + "epoch": 1.75, + "learning_rate": 3.7611494604451745e-05, + "loss": 0.0073, + "step": 674830 + }, + { + "epoch": 1.75, + "learning_rate": 3.760760638808028e-05, + "loss": 0.0072, + "step": 674840 + }, + { + "epoch": 1.75, + "learning_rate": 3.7603718171708815e-05, + "loss": 0.0062, + "step": 674850 + }, + { + "epoch": 1.75, + "learning_rate": 3.759982995533735e-05, + "loss": 0.0077, + "step": 674860 + }, + { + "epoch": 1.75, + "learning_rate": 3.7595941738965884e-05, + "loss": 0.005, + "step": 674870 + }, + { + "epoch": 1.75, + "learning_rate": 3.7592053522594426e-05, + "loss": 0.0076, + "step": 674880 + }, + { + "epoch": 1.75, + "learning_rate": 3.758816530622296e-05, + "loss": 0.0102, + "step": 674890 + }, + { + "epoch": 1.75, + "learning_rate": 3.7584277089851496e-05, + "loss": 0.0062, + "step": 674900 + }, + { + "epoch": 1.75, + "learning_rate": 3.758038887348003e-05, + "loss": 0.0094, + "step": 674910 + }, + { + "epoch": 1.75, + "learning_rate": 3.7576500657108565e-05, + "loss": 0.0057, + "step": 674920 + }, + { + "epoch": 1.75, + "learning_rate": 3.75726124407371e-05, + "loss": 0.012, + "step": 674930 + }, + { + "epoch": 1.75, + "learning_rate": 3.7568724224365635e-05, + "loss": 0.0097, + "step": 674940 + }, + { + "epoch": 1.75, + "learning_rate": 3.756483600799417e-05, + "loss": 0.01, + "step": 674950 + }, + { + "epoch": 1.75, + "learning_rate": 3.756094779162271e-05, + "loss": 0.0079, + "step": 674960 + }, + { + "epoch": 1.75, + "learning_rate": 3.7557059575251246e-05, + "loss": 0.0078, + "step": 674970 + }, + { + "epoch": 1.75, + "learning_rate": 3.7553171358879775e-05, + "loss": 0.007, + "step": 674980 + }, + { + "epoch": 1.75, + "learning_rate": 3.754928314250831e-05, + "loss": 0.0074, + "step": 674990 + }, + { + "epoch": 1.75, + "learning_rate": 3.7545394926136844e-05, + "loss": 0.0091, + "step": 675000 + }, + { + "epoch": 1.75, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.00502510741353035, + "eval_runtime": 108.0489, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.628, + "step": 675000 + }, + { + "epoch": 1.75, + "learning_rate": 3.754150670976538e-05, + "loss": 0.0073, + "step": 675010 + }, + { + "epoch": 1.75, + "learning_rate": 3.7537618493393914e-05, + "loss": 0.0076, + "step": 675020 + }, + { + "epoch": 1.75, + "learning_rate": 3.753373027702245e-05, + "loss": 0.0047, + "step": 675030 + }, + { + "epoch": 1.75, + "learning_rate": 3.7529842060650984e-05, + "loss": 0.0078, + "step": 675040 + }, + { + "epoch": 1.75, + "learning_rate": 3.752595384427952e-05, + "loss": 0.0072, + "step": 675050 + }, + { + "epoch": 1.75, + "learning_rate": 3.752206562790806e-05, + "loss": 0.0073, + "step": 675060 + }, + { + "epoch": 1.75, + "learning_rate": 3.7518177411536595e-05, + "loss": 0.0061, + "step": 675070 + }, + { + "epoch": 1.75, + "learning_rate": 3.751428919516513e-05, + "loss": 0.0091, + "step": 675080 + }, + { + "epoch": 1.75, + "learning_rate": 3.7510400978793665e-05, + "loss": 0.0083, + "step": 675090 + }, + { + "epoch": 1.75, + "learning_rate": 3.75065127624222e-05, + "loss": 0.0083, + "step": 675100 + }, + { + "epoch": 1.75, + "learning_rate": 3.7502624546050734e-05, + "loss": 0.0077, + "step": 675110 + }, + { + "epoch": 1.75, + "learning_rate": 3.749873632967927e-05, + "loss": 0.0094, + "step": 675120 + }, + { + "epoch": 1.75, + "learning_rate": 3.7494848113307804e-05, + "loss": 0.0057, + "step": 675130 + }, + { + "epoch": 1.75, + "learning_rate": 3.7490959896936346e-05, + "loss": 0.008, + "step": 675140 + }, + { + "epoch": 1.75, + "learning_rate": 3.748707168056488e-05, + "loss": 0.0087, + "step": 675150 + }, + { + "epoch": 1.75, + "learning_rate": 3.7483183464193416e-05, + "loss": 0.0074, + "step": 675160 + }, + { + "epoch": 1.75, + "learning_rate": 3.7479295247821944e-05, + "loss": 0.0092, + "step": 675170 + }, + { + "epoch": 1.75, + "learning_rate": 3.747540703145048e-05, + "loss": 0.0057, + "step": 675180 + }, + { + "epoch": 1.75, + "learning_rate": 3.747151881507902e-05, + "loss": 0.0072, + "step": 675190 + }, + { + "epoch": 1.75, + "learning_rate": 3.7467630598707555e-05, + "loss": 0.007, + "step": 675200 + }, + { + "epoch": 1.75, + "learning_rate": 3.746374238233609e-05, + "loss": 0.0123, + "step": 675210 + }, + { + "epoch": 1.75, + "learning_rate": 3.7459854165964625e-05, + "loss": 0.0109, + "step": 675220 + }, + { + "epoch": 1.75, + "learning_rate": 3.745596594959316e-05, + "loss": 0.0092, + "step": 675230 + }, + { + "epoch": 1.75, + "learning_rate": 3.7452077733221694e-05, + "loss": 0.0082, + "step": 675240 + }, + { + "epoch": 1.75, + "learning_rate": 3.744818951685023e-05, + "loss": 0.0075, + "step": 675250 + }, + { + "epoch": 1.75, + "learning_rate": 3.7444301300478764e-05, + "loss": 0.007, + "step": 675260 + }, + { + "epoch": 1.75, + "learning_rate": 3.7440413084107306e-05, + "loss": 0.006, + "step": 675270 + }, + { + "epoch": 1.75, + "learning_rate": 3.743652486773584e-05, + "loss": 0.0084, + "step": 675280 + }, + { + "epoch": 1.75, + "learning_rate": 3.743263665136437e-05, + "loss": 0.0073, + "step": 675290 + }, + { + "epoch": 1.75, + "learning_rate": 3.7428748434992904e-05, + "loss": 0.0057, + "step": 675300 + }, + { + "epoch": 1.75, + "learning_rate": 3.742486021862144e-05, + "loss": 0.0056, + "step": 675310 + }, + { + "epoch": 1.75, + "learning_rate": 3.742097200224998e-05, + "loss": 0.0077, + "step": 675320 + }, + { + "epoch": 1.75, + "learning_rate": 3.7417083785878515e-05, + "loss": 0.0086, + "step": 675330 + }, + { + "epoch": 1.75, + "learning_rate": 3.741319556950705e-05, + "loss": 0.0072, + "step": 675340 + }, + { + "epoch": 1.75, + "learning_rate": 3.7409307353135585e-05, + "loss": 0.0094, + "step": 675350 + }, + { + "epoch": 1.75, + "learning_rate": 3.740541913676412e-05, + "loss": 0.0073, + "step": 675360 + }, + { + "epoch": 1.75, + "learning_rate": 3.7401530920392654e-05, + "loss": 0.0067, + "step": 675370 + }, + { + "epoch": 1.75, + "learning_rate": 3.739764270402119e-05, + "loss": 0.0076, + "step": 675380 + }, + { + "epoch": 1.75, + "learning_rate": 3.7393754487649724e-05, + "loss": 0.0075, + "step": 675390 + }, + { + "epoch": 1.75, + "learning_rate": 3.7389866271278266e-05, + "loss": 0.011, + "step": 675400 + }, + { + "epoch": 1.75, + "learning_rate": 3.7385978054906794e-05, + "loss": 0.0094, + "step": 675410 + }, + { + "epoch": 1.75, + "learning_rate": 3.738208983853533e-05, + "loss": 0.006, + "step": 675420 + }, + { + "epoch": 1.75, + "learning_rate": 3.7378201622163864e-05, + "loss": 0.0075, + "step": 675430 + }, + { + "epoch": 1.75, + "learning_rate": 3.73743134057924e-05, + "loss": 0.0075, + "step": 675440 + }, + { + "epoch": 1.75, + "learning_rate": 3.737042518942094e-05, + "loss": 0.0068, + "step": 675450 + }, + { + "epoch": 1.75, + "learning_rate": 3.7366536973049475e-05, + "loss": 0.008, + "step": 675460 + }, + { + "epoch": 1.75, + "learning_rate": 3.736264875667801e-05, + "loss": 0.0079, + "step": 675470 + }, + { + "epoch": 1.75, + "learning_rate": 3.7358760540306545e-05, + "loss": 0.0075, + "step": 675480 + }, + { + "epoch": 1.75, + "learning_rate": 3.735487232393508e-05, + "loss": 0.0072, + "step": 675490 + }, + { + "epoch": 1.75, + "learning_rate": 3.7350984107563614e-05, + "loss": 0.0085, + "step": 675500 + }, + { + "epoch": 1.75, + "learning_rate": 3.734709589119215e-05, + "loss": 0.0061, + "step": 675510 + }, + { + "epoch": 1.75, + "learning_rate": 3.7343207674820684e-05, + "loss": 0.0075, + "step": 675520 + }, + { + "epoch": 1.75, + "learning_rate": 3.7339319458449226e-05, + "loss": 0.0072, + "step": 675530 + }, + { + "epoch": 1.75, + "learning_rate": 3.7335431242077754e-05, + "loss": 0.0093, + "step": 675540 + }, + { + "epoch": 1.75, + "learning_rate": 3.733154302570629e-05, + "loss": 0.0116, + "step": 675550 + }, + { + "epoch": 1.75, + "learning_rate": 3.7327654809334824e-05, + "loss": 0.0081, + "step": 675560 + }, + { + "epoch": 1.75, + "learning_rate": 3.732376659296336e-05, + "loss": 0.0053, + "step": 675570 + }, + { + "epoch": 1.75, + "learning_rate": 3.73198783765919e-05, + "loss": 0.0087, + "step": 675580 + }, + { + "epoch": 1.75, + "learning_rate": 3.7315990160220435e-05, + "loss": 0.0066, + "step": 675590 + }, + { + "epoch": 1.75, + "learning_rate": 3.731210194384897e-05, + "loss": 0.0083, + "step": 675600 + }, + { + "epoch": 1.75, + "learning_rate": 3.7308213727477505e-05, + "loss": 0.0078, + "step": 675610 + }, + { + "epoch": 1.75, + "learning_rate": 3.730432551110604e-05, + "loss": 0.0059, + "step": 675620 + }, + { + "epoch": 1.75, + "learning_rate": 3.7300437294734574e-05, + "loss": 0.0118, + "step": 675630 + }, + { + "epoch": 1.75, + "learning_rate": 3.729654907836311e-05, + "loss": 0.0076, + "step": 675640 + }, + { + "epoch": 1.75, + "learning_rate": 3.7292660861991644e-05, + "loss": 0.007, + "step": 675650 + }, + { + "epoch": 1.75, + "learning_rate": 3.728877264562018e-05, + "loss": 0.0129, + "step": 675660 + }, + { + "epoch": 1.75, + "learning_rate": 3.7284884429248714e-05, + "loss": 0.0083, + "step": 675670 + }, + { + "epoch": 1.75, + "learning_rate": 3.728099621287725e-05, + "loss": 0.0099, + "step": 675680 + }, + { + "epoch": 1.75, + "learning_rate": 3.7277107996505784e-05, + "loss": 0.0111, + "step": 675690 + }, + { + "epoch": 1.75, + "learning_rate": 3.727321978013432e-05, + "loss": 0.0105, + "step": 675700 + }, + { + "epoch": 1.75, + "learning_rate": 3.726933156376286e-05, + "loss": 0.006, + "step": 675710 + }, + { + "epoch": 1.75, + "learning_rate": 3.7265443347391395e-05, + "loss": 0.009, + "step": 675720 + }, + { + "epoch": 1.75, + "learning_rate": 3.726155513101993e-05, + "loss": 0.0109, + "step": 675730 + }, + { + "epoch": 1.75, + "learning_rate": 3.7257666914648465e-05, + "loss": 0.0072, + "step": 675740 + }, + { + "epoch": 1.75, + "learning_rate": 3.7253778698277e-05, + "loss": 0.0088, + "step": 675750 + }, + { + "epoch": 1.75, + "learning_rate": 3.7249890481905534e-05, + "loss": 0.009, + "step": 675760 + }, + { + "epoch": 1.75, + "learning_rate": 3.724600226553407e-05, + "loss": 0.0069, + "step": 675770 + }, + { + "epoch": 1.75, + "learning_rate": 3.7242114049162604e-05, + "loss": 0.0095, + "step": 675780 + }, + { + "epoch": 1.75, + "learning_rate": 3.723822583279114e-05, + "loss": 0.0086, + "step": 675790 + }, + { + "epoch": 1.75, + "learning_rate": 3.7234337616419674e-05, + "loss": 0.0099, + "step": 675800 + }, + { + "epoch": 1.75, + "learning_rate": 3.723044940004821e-05, + "loss": 0.0073, + "step": 675810 + }, + { + "epoch": 1.75, + "learning_rate": 3.7226561183676744e-05, + "loss": 0.0092, + "step": 675820 + }, + { + "epoch": 1.75, + "learning_rate": 3.722267296730528e-05, + "loss": 0.0076, + "step": 675830 + }, + { + "epoch": 1.75, + "learning_rate": 3.721878475093381e-05, + "loss": 0.0076, + "step": 675840 + }, + { + "epoch": 1.75, + "learning_rate": 3.7214896534562355e-05, + "loss": 0.0105, + "step": 675850 + }, + { + "epoch": 1.75, + "learning_rate": 3.721100831819089e-05, + "loss": 0.0087, + "step": 675860 + }, + { + "epoch": 1.75, + "learning_rate": 3.7207120101819425e-05, + "loss": 0.008, + "step": 675870 + }, + { + "epoch": 1.75, + "learning_rate": 3.720323188544796e-05, + "loss": 0.0062, + "step": 675880 + }, + { + "epoch": 1.75, + "learning_rate": 3.7199343669076494e-05, + "loss": 0.007, + "step": 675890 + }, + { + "epoch": 1.75, + "learning_rate": 3.719545545270503e-05, + "loss": 0.0082, + "step": 675900 + }, + { + "epoch": 1.75, + "learning_rate": 3.7191567236333564e-05, + "loss": 0.0101, + "step": 675910 + }, + { + "epoch": 1.75, + "learning_rate": 3.71876790199621e-05, + "loss": 0.0072, + "step": 675920 + }, + { + "epoch": 1.75, + "learning_rate": 3.7183790803590634e-05, + "loss": 0.0068, + "step": 675930 + }, + { + "epoch": 1.75, + "learning_rate": 3.717990258721917e-05, + "loss": 0.0079, + "step": 675940 + }, + { + "epoch": 1.75, + "learning_rate": 3.7176014370847704e-05, + "loss": 0.0104, + "step": 675950 + }, + { + "epoch": 1.75, + "learning_rate": 3.717212615447624e-05, + "loss": 0.0084, + "step": 675960 + }, + { + "epoch": 1.75, + "learning_rate": 3.716823793810477e-05, + "loss": 0.0049, + "step": 675970 + }, + { + "epoch": 1.75, + "learning_rate": 3.7164349721733315e-05, + "loss": 0.0097, + "step": 675980 + }, + { + "epoch": 1.75, + "learning_rate": 3.716046150536185e-05, + "loss": 0.0078, + "step": 675990 + }, + { + "epoch": 1.75, + "learning_rate": 3.7156573288990385e-05, + "loss": 0.0102, + "step": 676000 + }, + { + "epoch": 1.75, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.005067652557045221, + "eval_runtime": 107.7059, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 676000 + }, + { + "epoch": 1.75, + "learning_rate": 3.715268507261892e-05, + "loss": 0.0069, + "step": 676010 + }, + { + "epoch": 1.75, + "learning_rate": 3.7148796856247454e-05, + "loss": 0.0073, + "step": 676020 + }, + { + "epoch": 1.75, + "learning_rate": 3.714490863987599e-05, + "loss": 0.0096, + "step": 676030 + }, + { + "epoch": 1.75, + "learning_rate": 3.7141020423504524e-05, + "loss": 0.007, + "step": 676040 + }, + { + "epoch": 1.75, + "learning_rate": 3.713713220713306e-05, + "loss": 0.01, + "step": 676050 + }, + { + "epoch": 1.75, + "learning_rate": 3.7133243990761594e-05, + "loss": 0.0067, + "step": 676060 + }, + { + "epoch": 1.75, + "learning_rate": 3.712935577439013e-05, + "loss": 0.0067, + "step": 676070 + }, + { + "epoch": 1.75, + "learning_rate": 3.7125467558018663e-05, + "loss": 0.0054, + "step": 676080 + }, + { + "epoch": 1.75, + "learning_rate": 3.71215793416472e-05, + "loss": 0.0079, + "step": 676090 + }, + { + "epoch": 1.75, + "learning_rate": 3.711769112527573e-05, + "loss": 0.0074, + "step": 676100 + }, + { + "epoch": 1.75, + "learning_rate": 3.7113802908904275e-05, + "loss": 0.0075, + "step": 676110 + }, + { + "epoch": 1.75, + "learning_rate": 3.710991469253281e-05, + "loss": 0.0073, + "step": 676120 + }, + { + "epoch": 1.75, + "learning_rate": 3.7106026476161345e-05, + "loss": 0.0078, + "step": 676130 + }, + { + "epoch": 1.75, + "learning_rate": 3.710213825978988e-05, + "loss": 0.0089, + "step": 676140 + }, + { + "epoch": 1.75, + "learning_rate": 3.7098250043418414e-05, + "loss": 0.0081, + "step": 676150 + }, + { + "epoch": 1.75, + "learning_rate": 3.709436182704695e-05, + "loss": 0.0075, + "step": 676160 + }, + { + "epoch": 1.75, + "learning_rate": 3.7090473610675484e-05, + "loss": 0.0084, + "step": 676170 + }, + { + "epoch": 1.75, + "learning_rate": 3.708658539430402e-05, + "loss": 0.009, + "step": 676180 + }, + { + "epoch": 1.75, + "learning_rate": 3.7082697177932554e-05, + "loss": 0.0084, + "step": 676190 + }, + { + "epoch": 1.75, + "learning_rate": 3.707880896156109e-05, + "loss": 0.0096, + "step": 676200 + }, + { + "epoch": 1.75, + "learning_rate": 3.7074920745189623e-05, + "loss": 0.0131, + "step": 676210 + }, + { + "epoch": 1.75, + "learning_rate": 3.707103252881816e-05, + "loss": 0.0081, + "step": 676220 + }, + { + "epoch": 1.75, + "learning_rate": 3.706714431244669e-05, + "loss": 0.0091, + "step": 676230 + }, + { + "epoch": 1.75, + "learning_rate": 3.7063256096075235e-05, + "loss": 0.0108, + "step": 676240 + }, + { + "epoch": 1.75, + "learning_rate": 3.705936787970377e-05, + "loss": 0.0087, + "step": 676250 + }, + { + "epoch": 1.75, + "learning_rate": 3.7055479663332305e-05, + "loss": 0.0091, + "step": 676260 + }, + { + "epoch": 1.75, + "learning_rate": 3.705159144696084e-05, + "loss": 0.0066, + "step": 676270 + }, + { + "epoch": 1.75, + "learning_rate": 3.704770323058937e-05, + "loss": 0.0071, + "step": 676280 + }, + { + "epoch": 1.75, + "learning_rate": 3.704381501421791e-05, + "loss": 0.0064, + "step": 676290 + }, + { + "epoch": 1.75, + "learning_rate": 3.7039926797846444e-05, + "loss": 0.0076, + "step": 676300 + }, + { + "epoch": 1.75, + "learning_rate": 3.703603858147498e-05, + "loss": 0.0061, + "step": 676310 + }, + { + "epoch": 1.75, + "learning_rate": 3.7032150365103514e-05, + "loss": 0.0079, + "step": 676320 + }, + { + "epoch": 1.75, + "learning_rate": 3.702826214873205e-05, + "loss": 0.0077, + "step": 676330 + }, + { + "epoch": 1.75, + "learning_rate": 3.7024373932360583e-05, + "loss": 0.0065, + "step": 676340 + }, + { + "epoch": 1.75, + "learning_rate": 3.702048571598912e-05, + "loss": 0.0085, + "step": 676350 + }, + { + "epoch": 1.75, + "learning_rate": 3.701659749961765e-05, + "loss": 0.0064, + "step": 676360 + }, + { + "epoch": 1.75, + "learning_rate": 3.7012709283246195e-05, + "loss": 0.0072, + "step": 676370 + }, + { + "epoch": 1.75, + "learning_rate": 3.700882106687473e-05, + "loss": 0.0048, + "step": 676380 + }, + { + "epoch": 1.75, + "learning_rate": 3.7004932850503265e-05, + "loss": 0.006, + "step": 676390 + }, + { + "epoch": 1.75, + "learning_rate": 3.70010446341318e-05, + "loss": 0.0084, + "step": 676400 + }, + { + "epoch": 1.75, + "learning_rate": 3.699715641776033e-05, + "loss": 0.008, + "step": 676410 + }, + { + "epoch": 1.75, + "learning_rate": 3.699326820138887e-05, + "loss": 0.0072, + "step": 676420 + }, + { + "epoch": 1.75, + "learning_rate": 3.6989379985017404e-05, + "loss": 0.0118, + "step": 676430 + }, + { + "epoch": 1.75, + "learning_rate": 3.698549176864594e-05, + "loss": 0.0065, + "step": 676440 + }, + { + "epoch": 1.75, + "learning_rate": 3.6981603552274474e-05, + "loss": 0.0101, + "step": 676450 + }, + { + "epoch": 1.75, + "learning_rate": 3.697771533590301e-05, + "loss": 0.0059, + "step": 676460 + }, + { + "epoch": 1.75, + "learning_rate": 3.6973827119531543e-05, + "loss": 0.0065, + "step": 676470 + }, + { + "epoch": 1.75, + "learning_rate": 3.696993890316008e-05, + "loss": 0.01, + "step": 676480 + }, + { + "epoch": 1.75, + "learning_rate": 3.696605068678861e-05, + "loss": 0.0073, + "step": 676490 + }, + { + "epoch": 1.75, + "learning_rate": 3.6962162470417155e-05, + "loss": 0.0089, + "step": 676500 + }, + { + "epoch": 1.75, + "learning_rate": 3.695827425404569e-05, + "loss": 0.0086, + "step": 676510 + }, + { + "epoch": 1.75, + "learning_rate": 3.6954386037674225e-05, + "loss": 0.0078, + "step": 676520 + }, + { + "epoch": 1.75, + "learning_rate": 3.695049782130275e-05, + "loss": 0.0064, + "step": 676530 + }, + { + "epoch": 1.75, + "learning_rate": 3.694660960493129e-05, + "loss": 0.0097, + "step": 676540 + }, + { + "epoch": 1.75, + "learning_rate": 3.694272138855983e-05, + "loss": 0.0078, + "step": 676550 + }, + { + "epoch": 1.75, + "learning_rate": 3.6938833172188364e-05, + "loss": 0.0089, + "step": 676560 + }, + { + "epoch": 1.75, + "learning_rate": 3.69349449558169e-05, + "loss": 0.0081, + "step": 676570 + }, + { + "epoch": 1.75, + "learning_rate": 3.6931056739445434e-05, + "loss": 0.0102, + "step": 676580 + }, + { + "epoch": 1.75, + "learning_rate": 3.692716852307397e-05, + "loss": 0.0076, + "step": 676590 + }, + { + "epoch": 1.75, + "learning_rate": 3.6923280306702503e-05, + "loss": 0.0076, + "step": 676600 + }, + { + "epoch": 1.75, + "learning_rate": 3.691939209033104e-05, + "loss": 0.0055, + "step": 676610 + }, + { + "epoch": 1.75, + "learning_rate": 3.691550387395957e-05, + "loss": 0.006, + "step": 676620 + }, + { + "epoch": 1.75, + "learning_rate": 3.6911615657588115e-05, + "loss": 0.0091, + "step": 676630 + }, + { + "epoch": 1.75, + "learning_rate": 3.690772744121665e-05, + "loss": 0.0081, + "step": 676640 + }, + { + "epoch": 1.75, + "learning_rate": 3.690383922484518e-05, + "loss": 0.0075, + "step": 676650 + }, + { + "epoch": 1.75, + "learning_rate": 3.689995100847371e-05, + "loss": 0.0076, + "step": 676660 + }, + { + "epoch": 1.75, + "learning_rate": 3.689606279210225e-05, + "loss": 0.0071, + "step": 676670 + }, + { + "epoch": 1.75, + "learning_rate": 3.689217457573079e-05, + "loss": 0.0074, + "step": 676680 + }, + { + "epoch": 1.75, + "learning_rate": 3.6888286359359324e-05, + "loss": 0.0082, + "step": 676690 + }, + { + "epoch": 1.75, + "learning_rate": 3.688439814298786e-05, + "loss": 0.0064, + "step": 676700 + }, + { + "epoch": 1.75, + "learning_rate": 3.6880509926616394e-05, + "loss": 0.0078, + "step": 676710 + }, + { + "epoch": 1.75, + "learning_rate": 3.687662171024493e-05, + "loss": 0.0121, + "step": 676720 + }, + { + "epoch": 1.75, + "learning_rate": 3.687273349387346e-05, + "loss": 0.0101, + "step": 676730 + }, + { + "epoch": 1.75, + "learning_rate": 3.6868845277502e-05, + "loss": 0.0066, + "step": 676740 + }, + { + "epoch": 1.75, + "learning_rate": 3.686495706113053e-05, + "loss": 0.0086, + "step": 676750 + }, + { + "epoch": 1.75, + "learning_rate": 3.6861068844759075e-05, + "loss": 0.0075, + "step": 676760 + }, + { + "epoch": 1.75, + "learning_rate": 3.685718062838761e-05, + "loss": 0.0096, + "step": 676770 + }, + { + "epoch": 1.75, + "learning_rate": 3.685329241201614e-05, + "loss": 0.0083, + "step": 676780 + }, + { + "epoch": 1.75, + "learning_rate": 3.684940419564467e-05, + "loss": 0.0079, + "step": 676790 + }, + { + "epoch": 1.75, + "learning_rate": 3.684551597927321e-05, + "loss": 0.0069, + "step": 676800 + }, + { + "epoch": 1.75, + "learning_rate": 3.684162776290175e-05, + "loss": 0.0088, + "step": 676810 + }, + { + "epoch": 1.75, + "learning_rate": 3.6837739546530284e-05, + "loss": 0.0073, + "step": 676820 + }, + { + "epoch": 1.75, + "learning_rate": 3.683385133015882e-05, + "loss": 0.0079, + "step": 676830 + }, + { + "epoch": 1.75, + "learning_rate": 3.6829963113787354e-05, + "loss": 0.0069, + "step": 676840 + }, + { + "epoch": 1.75, + "learning_rate": 3.682607489741589e-05, + "loss": 0.0063, + "step": 676850 + }, + { + "epoch": 1.75, + "learning_rate": 3.682218668104442e-05, + "loss": 0.0056, + "step": 676860 + }, + { + "epoch": 1.75, + "learning_rate": 3.681829846467296e-05, + "loss": 0.0055, + "step": 676870 + }, + { + "epoch": 1.75, + "learning_rate": 3.681441024830149e-05, + "loss": 0.0054, + "step": 676880 + }, + { + "epoch": 1.75, + "learning_rate": 3.6810522031930035e-05, + "loss": 0.009, + "step": 676890 + }, + { + "epoch": 1.75, + "learning_rate": 3.680663381555856e-05, + "loss": 0.0063, + "step": 676900 + }, + { + "epoch": 1.75, + "learning_rate": 3.68027455991871e-05, + "loss": 0.0085, + "step": 676910 + }, + { + "epoch": 1.75, + "learning_rate": 3.679885738281563e-05, + "loss": 0.0077, + "step": 676920 + }, + { + "epoch": 1.75, + "learning_rate": 3.679496916644417e-05, + "loss": 0.0093, + "step": 676930 + }, + { + "epoch": 1.75, + "learning_rate": 3.679108095007271e-05, + "loss": 0.0063, + "step": 676940 + }, + { + "epoch": 1.75, + "learning_rate": 3.6787192733701244e-05, + "loss": 0.0072, + "step": 676950 + }, + { + "epoch": 1.75, + "learning_rate": 3.678330451732978e-05, + "loss": 0.0075, + "step": 676960 + }, + { + "epoch": 1.75, + "learning_rate": 3.6779416300958314e-05, + "loss": 0.0077, + "step": 676970 + }, + { + "epoch": 1.75, + "learning_rate": 3.677552808458685e-05, + "loss": 0.0093, + "step": 676980 + }, + { + "epoch": 1.75, + "learning_rate": 3.677163986821538e-05, + "loss": 0.0085, + "step": 676990 + }, + { + "epoch": 1.75, + "learning_rate": 3.676775165184392e-05, + "loss": 0.0086, + "step": 677000 + }, + { + "epoch": 1.75, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.005042629782110453, + "eval_runtime": 108.0533, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 677000 + }, + { + "epoch": 1.75, + "learning_rate": 3.676386343547245e-05, + "loss": 0.0103, + "step": 677010 + }, + { + "epoch": 1.75, + "learning_rate": 3.6759975219100995e-05, + "loss": 0.0082, + "step": 677020 + }, + { + "epoch": 1.75, + "learning_rate": 3.675608700272952e-05, + "loss": 0.0064, + "step": 677030 + }, + { + "epoch": 1.75, + "learning_rate": 3.675219878635806e-05, + "loss": 0.0082, + "step": 677040 + }, + { + "epoch": 1.76, + "learning_rate": 3.674831056998659e-05, + "loss": 0.0071, + "step": 677050 + }, + { + "epoch": 1.76, + "learning_rate": 3.674442235361513e-05, + "loss": 0.0061, + "step": 677060 + }, + { + "epoch": 1.76, + "learning_rate": 3.674053413724367e-05, + "loss": 0.0075, + "step": 677070 + }, + { + "epoch": 1.76, + "learning_rate": 3.6736645920872204e-05, + "loss": 0.0084, + "step": 677080 + }, + { + "epoch": 1.76, + "learning_rate": 3.673275770450074e-05, + "loss": 0.0072, + "step": 677090 + }, + { + "epoch": 1.76, + "learning_rate": 3.6728869488129274e-05, + "loss": 0.009, + "step": 677100 + }, + { + "epoch": 1.76, + "learning_rate": 3.672498127175781e-05, + "loss": 0.0065, + "step": 677110 + }, + { + "epoch": 1.76, + "learning_rate": 3.672109305538634e-05, + "loss": 0.008, + "step": 677120 + }, + { + "epoch": 1.76, + "learning_rate": 3.671720483901488e-05, + "loss": 0.0082, + "step": 677130 + }, + { + "epoch": 1.76, + "learning_rate": 3.671331662264341e-05, + "loss": 0.0072, + "step": 677140 + }, + { + "epoch": 1.76, + "learning_rate": 3.670942840627195e-05, + "loss": 0.0069, + "step": 677150 + }, + { + "epoch": 1.76, + "learning_rate": 3.670554018990048e-05, + "loss": 0.0072, + "step": 677160 + }, + { + "epoch": 1.76, + "learning_rate": 3.670165197352902e-05, + "loss": 0.0058, + "step": 677170 + }, + { + "epoch": 1.76, + "learning_rate": 3.669776375715755e-05, + "loss": 0.0076, + "step": 677180 + }, + { + "epoch": 1.76, + "learning_rate": 3.669387554078609e-05, + "loss": 0.0101, + "step": 677190 + }, + { + "epoch": 1.76, + "learning_rate": 3.668998732441462e-05, + "loss": 0.0072, + "step": 677200 + }, + { + "epoch": 1.76, + "learning_rate": 3.6686099108043164e-05, + "loss": 0.017, + "step": 677210 + }, + { + "epoch": 1.76, + "learning_rate": 3.66822108916717e-05, + "loss": 0.009, + "step": 677220 + }, + { + "epoch": 1.76, + "learning_rate": 3.6678322675300234e-05, + "loss": 0.0084, + "step": 677230 + }, + { + "epoch": 1.76, + "learning_rate": 3.667443445892877e-05, + "loss": 0.0074, + "step": 677240 + }, + { + "epoch": 1.76, + "learning_rate": 3.66705462425573e-05, + "loss": 0.0069, + "step": 677250 + }, + { + "epoch": 1.76, + "learning_rate": 3.666665802618584e-05, + "loss": 0.0073, + "step": 677260 + }, + { + "epoch": 1.76, + "learning_rate": 3.666276980981437e-05, + "loss": 0.0153, + "step": 677270 + }, + { + "epoch": 1.76, + "learning_rate": 3.665888159344291e-05, + "loss": 0.0058, + "step": 677280 + }, + { + "epoch": 1.76, + "learning_rate": 3.665499337707144e-05, + "loss": 0.0062, + "step": 677290 + }, + { + "epoch": 1.76, + "learning_rate": 3.665110516069998e-05, + "loss": 0.0086, + "step": 677300 + }, + { + "epoch": 1.76, + "learning_rate": 3.664721694432851e-05, + "loss": 0.0075, + "step": 677310 + }, + { + "epoch": 1.76, + "learning_rate": 3.664332872795705e-05, + "loss": 0.0067, + "step": 677320 + }, + { + "epoch": 1.76, + "learning_rate": 3.663944051158558e-05, + "loss": 0.0103, + "step": 677330 + }, + { + "epoch": 1.76, + "learning_rate": 3.6635552295214124e-05, + "loss": 0.0092, + "step": 677340 + }, + { + "epoch": 1.76, + "learning_rate": 3.663166407884266e-05, + "loss": 0.0079, + "step": 677350 + }, + { + "epoch": 1.76, + "learning_rate": 3.6627775862471194e-05, + "loss": 0.0063, + "step": 677360 + }, + { + "epoch": 1.76, + "learning_rate": 3.662388764609973e-05, + "loss": 0.0073, + "step": 677370 + }, + { + "epoch": 1.76, + "learning_rate": 3.661999942972826e-05, + "loss": 0.0071, + "step": 677380 + }, + { + "epoch": 1.76, + "learning_rate": 3.66161112133568e-05, + "loss": 0.0077, + "step": 677390 + }, + { + "epoch": 1.76, + "learning_rate": 3.661222299698533e-05, + "loss": 0.0066, + "step": 677400 + }, + { + "epoch": 1.76, + "learning_rate": 3.660833478061387e-05, + "loss": 0.0069, + "step": 677410 + }, + { + "epoch": 1.76, + "learning_rate": 3.66044465642424e-05, + "loss": 0.0091, + "step": 677420 + }, + { + "epoch": 1.76, + "learning_rate": 3.660055834787094e-05, + "loss": 0.0079, + "step": 677430 + }, + { + "epoch": 1.76, + "learning_rate": 3.659667013149947e-05, + "loss": 0.0078, + "step": 677440 + }, + { + "epoch": 1.76, + "learning_rate": 3.659278191512801e-05, + "loss": 0.006, + "step": 677450 + }, + { + "epoch": 1.76, + "learning_rate": 3.658889369875654e-05, + "loss": 0.0074, + "step": 677460 + }, + { + "epoch": 1.76, + "learning_rate": 3.6585005482385084e-05, + "loss": 0.0096, + "step": 677470 + }, + { + "epoch": 1.76, + "learning_rate": 3.658111726601362e-05, + "loss": 0.0073, + "step": 677480 + }, + { + "epoch": 1.76, + "learning_rate": 3.6577229049642154e-05, + "loss": 0.0068, + "step": 677490 + }, + { + "epoch": 1.76, + "learning_rate": 3.657334083327069e-05, + "loss": 0.0066, + "step": 677500 + }, + { + "epoch": 1.76, + "learning_rate": 3.656945261689922e-05, + "loss": 0.0079, + "step": 677510 + }, + { + "epoch": 1.76, + "learning_rate": 3.656556440052776e-05, + "loss": 0.0079, + "step": 677520 + }, + { + "epoch": 1.76, + "learning_rate": 3.656167618415629e-05, + "loss": 0.0072, + "step": 677530 + }, + { + "epoch": 1.76, + "learning_rate": 3.655778796778483e-05, + "loss": 0.0074, + "step": 677540 + }, + { + "epoch": 1.76, + "learning_rate": 3.655389975141336e-05, + "loss": 0.0058, + "step": 677550 + }, + { + "epoch": 1.76, + "learning_rate": 3.65500115350419e-05, + "loss": 0.0076, + "step": 677560 + }, + { + "epoch": 1.76, + "learning_rate": 3.654612331867043e-05, + "loss": 0.0097, + "step": 677570 + }, + { + "epoch": 1.76, + "learning_rate": 3.654223510229897e-05, + "loss": 0.008, + "step": 677580 + }, + { + "epoch": 1.76, + "learning_rate": 3.65383468859275e-05, + "loss": 0.0047, + "step": 677590 + }, + { + "epoch": 1.76, + "learning_rate": 3.6534458669556044e-05, + "loss": 0.0085, + "step": 677600 + }, + { + "epoch": 1.76, + "learning_rate": 3.653057045318458e-05, + "loss": 0.0067, + "step": 677610 + }, + { + "epoch": 1.76, + "learning_rate": 3.6526682236813113e-05, + "loss": 0.0073, + "step": 677620 + }, + { + "epoch": 1.76, + "learning_rate": 3.652279402044165e-05, + "loss": 0.007, + "step": 677630 + }, + { + "epoch": 1.76, + "learning_rate": 3.651890580407018e-05, + "loss": 0.0088, + "step": 677640 + }, + { + "epoch": 1.76, + "learning_rate": 3.651501758769872e-05, + "loss": 0.0062, + "step": 677650 + }, + { + "epoch": 1.76, + "learning_rate": 3.651112937132725e-05, + "loss": 0.0112, + "step": 677660 + }, + { + "epoch": 1.76, + "learning_rate": 3.650724115495579e-05, + "loss": 0.0082, + "step": 677670 + }, + { + "epoch": 1.76, + "learning_rate": 3.650335293858432e-05, + "loss": 0.0075, + "step": 677680 + }, + { + "epoch": 1.76, + "learning_rate": 3.649946472221286e-05, + "loss": 0.0089, + "step": 677690 + }, + { + "epoch": 1.76, + "learning_rate": 3.649557650584139e-05, + "loss": 0.0073, + "step": 677700 + }, + { + "epoch": 1.76, + "learning_rate": 3.649168828946993e-05, + "loss": 0.0074, + "step": 677710 + }, + { + "epoch": 1.76, + "learning_rate": 3.648780007309846e-05, + "loss": 0.0053, + "step": 677720 + }, + { + "epoch": 1.76, + "learning_rate": 3.6483911856727004e-05, + "loss": 0.0083, + "step": 677730 + }, + { + "epoch": 1.76, + "learning_rate": 3.648002364035554e-05, + "loss": 0.0083, + "step": 677740 + }, + { + "epoch": 1.76, + "learning_rate": 3.6476135423984073e-05, + "loss": 0.0082, + "step": 677750 + }, + { + "epoch": 1.76, + "learning_rate": 3.647224720761261e-05, + "loss": 0.0067, + "step": 677760 + }, + { + "epoch": 1.76, + "learning_rate": 3.6468358991241136e-05, + "loss": 0.0064, + "step": 677770 + }, + { + "epoch": 1.76, + "learning_rate": 3.646447077486968e-05, + "loss": 0.0085, + "step": 677780 + }, + { + "epoch": 1.76, + "learning_rate": 3.646058255849821e-05, + "loss": 0.0056, + "step": 677790 + }, + { + "epoch": 1.76, + "learning_rate": 3.645669434212675e-05, + "loss": 0.009, + "step": 677800 + }, + { + "epoch": 1.76, + "learning_rate": 3.645280612575528e-05, + "loss": 0.0073, + "step": 677810 + }, + { + "epoch": 1.76, + "learning_rate": 3.644891790938382e-05, + "loss": 0.0081, + "step": 677820 + }, + { + "epoch": 1.76, + "learning_rate": 3.644502969301235e-05, + "loss": 0.0078, + "step": 677830 + }, + { + "epoch": 1.76, + "learning_rate": 3.644114147664089e-05, + "loss": 0.0095, + "step": 677840 + }, + { + "epoch": 1.76, + "learning_rate": 3.643725326026942e-05, + "loss": 0.0093, + "step": 677850 + }, + { + "epoch": 1.76, + "learning_rate": 3.6433365043897964e-05, + "loss": 0.007, + "step": 677860 + }, + { + "epoch": 1.76, + "learning_rate": 3.64294768275265e-05, + "loss": 0.0087, + "step": 677870 + }, + { + "epoch": 1.76, + "learning_rate": 3.6425588611155033e-05, + "loss": 0.0128, + "step": 677880 + }, + { + "epoch": 1.76, + "learning_rate": 3.642170039478356e-05, + "loss": 0.0058, + "step": 677890 + }, + { + "epoch": 1.76, + "learning_rate": 3.6417812178412096e-05, + "loss": 0.0078, + "step": 677900 + }, + { + "epoch": 1.76, + "learning_rate": 3.641392396204064e-05, + "loss": 0.0058, + "step": 677910 + }, + { + "epoch": 1.76, + "learning_rate": 3.641003574566917e-05, + "loss": 0.0081, + "step": 677920 + }, + { + "epoch": 1.76, + "learning_rate": 3.640614752929771e-05, + "loss": 0.0062, + "step": 677930 + }, + { + "epoch": 1.76, + "learning_rate": 3.640225931292624e-05, + "loss": 0.0081, + "step": 677940 + }, + { + "epoch": 1.76, + "learning_rate": 3.639837109655478e-05, + "loss": 0.0063, + "step": 677950 + }, + { + "epoch": 1.76, + "learning_rate": 3.639448288018331e-05, + "loss": 0.0094, + "step": 677960 + }, + { + "epoch": 1.76, + "learning_rate": 3.639059466381185e-05, + "loss": 0.0067, + "step": 677970 + }, + { + "epoch": 1.76, + "learning_rate": 3.638670644744038e-05, + "loss": 0.0051, + "step": 677980 + }, + { + "epoch": 1.76, + "learning_rate": 3.6382818231068924e-05, + "loss": 0.0096, + "step": 677990 + }, + { + "epoch": 1.76, + "learning_rate": 3.637893001469746e-05, + "loss": 0.0085, + "step": 678000 + }, + { + "epoch": 1.76, + "eval_cer": 0.8817012866862336, + "eval_loss": 0.0050600310787558556, + "eval_runtime": 107.7885, + "eval_samples_per_second": 18.555, + "eval_steps_per_second": 4.639, + "step": 678000 + }, + { + "epoch": 1.76, + "learning_rate": 3.6375041798325993e-05, + "loss": 0.0085, + "step": 678010 + }, + { + "epoch": 1.76, + "learning_rate": 3.637115358195452e-05, + "loss": 0.0086, + "step": 678020 + }, + { + "epoch": 1.76, + "learning_rate": 3.6367265365583056e-05, + "loss": 0.0069, + "step": 678030 + }, + { + "epoch": 1.76, + "learning_rate": 3.63633771492116e-05, + "loss": 0.0071, + "step": 678040 + }, + { + "epoch": 1.76, + "learning_rate": 3.635948893284013e-05, + "loss": 0.0077, + "step": 678050 + }, + { + "epoch": 1.76, + "learning_rate": 3.635560071646867e-05, + "loss": 0.0053, + "step": 678060 + }, + { + "epoch": 1.76, + "learning_rate": 3.63517125000972e-05, + "loss": 0.0091, + "step": 678070 + }, + { + "epoch": 1.76, + "learning_rate": 3.634782428372574e-05, + "loss": 0.0075, + "step": 678080 + }, + { + "epoch": 1.76, + "learning_rate": 3.634393606735427e-05, + "loss": 0.008, + "step": 678090 + }, + { + "epoch": 1.76, + "learning_rate": 3.634004785098281e-05, + "loss": 0.0065, + "step": 678100 + }, + { + "epoch": 1.76, + "learning_rate": 3.633615963461134e-05, + "loss": 0.007, + "step": 678110 + }, + { + "epoch": 1.76, + "learning_rate": 3.6332271418239884e-05, + "loss": 0.0081, + "step": 678120 + }, + { + "epoch": 1.76, + "learning_rate": 3.632838320186842e-05, + "loss": 0.0081, + "step": 678130 + }, + { + "epoch": 1.76, + "learning_rate": 3.632449498549695e-05, + "loss": 0.0078, + "step": 678140 + }, + { + "epoch": 1.76, + "learning_rate": 3.632060676912548e-05, + "loss": 0.0081, + "step": 678150 + }, + { + "epoch": 1.76, + "learning_rate": 3.6316718552754016e-05, + "loss": 0.0092, + "step": 678160 + }, + { + "epoch": 1.76, + "learning_rate": 3.631283033638256e-05, + "loss": 0.0078, + "step": 678170 + }, + { + "epoch": 1.76, + "learning_rate": 3.630894212001109e-05, + "loss": 0.0096, + "step": 678180 + }, + { + "epoch": 1.76, + "learning_rate": 3.630505390363963e-05, + "loss": 0.0087, + "step": 678190 + }, + { + "epoch": 1.76, + "learning_rate": 3.630116568726816e-05, + "loss": 0.0105, + "step": 678200 + }, + { + "epoch": 1.76, + "learning_rate": 3.62972774708967e-05, + "loss": 0.015, + "step": 678210 + }, + { + "epoch": 1.76, + "learning_rate": 3.629338925452523e-05, + "loss": 0.009, + "step": 678220 + }, + { + "epoch": 1.76, + "learning_rate": 3.628950103815377e-05, + "loss": 0.0074, + "step": 678230 + }, + { + "epoch": 1.76, + "learning_rate": 3.62856128217823e-05, + "loss": 0.0084, + "step": 678240 + }, + { + "epoch": 1.76, + "learning_rate": 3.6281724605410844e-05, + "loss": 0.0078, + "step": 678250 + }, + { + "epoch": 1.76, + "learning_rate": 3.627783638903938e-05, + "loss": 0.008, + "step": 678260 + }, + { + "epoch": 1.76, + "learning_rate": 3.6273948172667907e-05, + "loss": 0.0074, + "step": 678270 + }, + { + "epoch": 1.76, + "learning_rate": 3.627005995629644e-05, + "loss": 0.0056, + "step": 678280 + }, + { + "epoch": 1.76, + "learning_rate": 3.6266171739924976e-05, + "loss": 0.0106, + "step": 678290 + }, + { + "epoch": 1.76, + "learning_rate": 3.626228352355352e-05, + "loss": 0.0073, + "step": 678300 + }, + { + "epoch": 1.76, + "learning_rate": 3.625839530718205e-05, + "loss": 0.0077, + "step": 678310 + }, + { + "epoch": 1.76, + "learning_rate": 3.625450709081059e-05, + "loss": 0.0094, + "step": 678320 + }, + { + "epoch": 1.76, + "learning_rate": 3.625061887443912e-05, + "loss": 0.0081, + "step": 678330 + }, + { + "epoch": 1.76, + "learning_rate": 3.624673065806766e-05, + "loss": 0.0061, + "step": 678340 + }, + { + "epoch": 1.76, + "learning_rate": 3.624284244169619e-05, + "loss": 0.0073, + "step": 678350 + }, + { + "epoch": 1.76, + "learning_rate": 3.623895422532473e-05, + "loss": 0.0069, + "step": 678360 + }, + { + "epoch": 1.76, + "learning_rate": 3.623506600895326e-05, + "loss": 0.0075, + "step": 678370 + }, + { + "epoch": 1.76, + "learning_rate": 3.6231177792581804e-05, + "loss": 0.0077, + "step": 678380 + }, + { + "epoch": 1.76, + "learning_rate": 3.622728957621033e-05, + "loss": 0.0128, + "step": 678390 + }, + { + "epoch": 1.76, + "learning_rate": 3.6223401359838867e-05, + "loss": 0.0071, + "step": 678400 + }, + { + "epoch": 1.76, + "learning_rate": 3.62195131434674e-05, + "loss": 0.0054, + "step": 678410 + }, + { + "epoch": 1.76, + "learning_rate": 3.6215624927095936e-05, + "loss": 0.0086, + "step": 678420 + }, + { + "epoch": 1.76, + "learning_rate": 3.621173671072448e-05, + "loss": 0.0057, + "step": 678430 + }, + { + "epoch": 1.76, + "learning_rate": 3.620784849435301e-05, + "loss": 0.011, + "step": 678440 + }, + { + "epoch": 1.76, + "learning_rate": 3.620396027798155e-05, + "loss": 0.0076, + "step": 678450 + }, + { + "epoch": 1.76, + "learning_rate": 3.620007206161008e-05, + "loss": 0.007, + "step": 678460 + }, + { + "epoch": 1.76, + "learning_rate": 3.619618384523862e-05, + "loss": 0.0151, + "step": 678470 + }, + { + "epoch": 1.76, + "learning_rate": 3.619229562886715e-05, + "loss": 0.0063, + "step": 678480 + }, + { + "epoch": 1.76, + "learning_rate": 3.618840741249569e-05, + "loss": 0.0087, + "step": 678490 + }, + { + "epoch": 1.76, + "learning_rate": 3.618451919612422e-05, + "loss": 0.0057, + "step": 678500 + }, + { + "epoch": 1.76, + "learning_rate": 3.618063097975276e-05, + "loss": 0.0078, + "step": 678510 + }, + { + "epoch": 1.76, + "learning_rate": 3.617674276338129e-05, + "loss": 0.0082, + "step": 678520 + }, + { + "epoch": 1.76, + "learning_rate": 3.6172854547009827e-05, + "loss": 0.0071, + "step": 678530 + }, + { + "epoch": 1.76, + "learning_rate": 3.616896633063836e-05, + "loss": 0.009, + "step": 678540 + }, + { + "epoch": 1.76, + "learning_rate": 3.6165078114266896e-05, + "loss": 0.007, + "step": 678550 + }, + { + "epoch": 1.76, + "learning_rate": 3.616118989789544e-05, + "loss": 0.0086, + "step": 678560 + }, + { + "epoch": 1.76, + "learning_rate": 3.615730168152397e-05, + "loss": 0.0061, + "step": 678570 + }, + { + "epoch": 1.76, + "learning_rate": 3.615341346515251e-05, + "loss": 0.009, + "step": 678580 + }, + { + "epoch": 1.76, + "learning_rate": 3.614952524878104e-05, + "loss": 0.0085, + "step": 678590 + }, + { + "epoch": 1.76, + "learning_rate": 3.614563703240958e-05, + "loss": 0.0092, + "step": 678600 + }, + { + "epoch": 1.76, + "learning_rate": 3.614174881603811e-05, + "loss": 0.0062, + "step": 678610 + }, + { + "epoch": 1.76, + "learning_rate": 3.613786059966665e-05, + "loss": 0.0058, + "step": 678620 + }, + { + "epoch": 1.76, + "learning_rate": 3.613397238329518e-05, + "loss": 0.0101, + "step": 678630 + }, + { + "epoch": 1.76, + "learning_rate": 3.613008416692372e-05, + "loss": 0.0059, + "step": 678640 + }, + { + "epoch": 1.76, + "learning_rate": 3.612619595055225e-05, + "loss": 0.0067, + "step": 678650 + }, + { + "epoch": 1.76, + "learning_rate": 3.6122307734180787e-05, + "loss": 0.0103, + "step": 678660 + }, + { + "epoch": 1.76, + "learning_rate": 3.611841951780932e-05, + "loss": 0.0072, + "step": 678670 + }, + { + "epoch": 1.76, + "learning_rate": 3.6114531301437856e-05, + "loss": 0.0063, + "step": 678680 + }, + { + "epoch": 1.76, + "learning_rate": 3.611064308506639e-05, + "loss": 0.0071, + "step": 678690 + }, + { + "epoch": 1.76, + "learning_rate": 3.610675486869493e-05, + "loss": 0.0113, + "step": 678700 + }, + { + "epoch": 1.76, + "learning_rate": 3.610286665232347e-05, + "loss": 0.0056, + "step": 678710 + }, + { + "epoch": 1.76, + "learning_rate": 3.6098978435952e-05, + "loss": 0.0085, + "step": 678720 + }, + { + "epoch": 1.76, + "learning_rate": 3.609509021958054e-05, + "loss": 0.0088, + "step": 678730 + }, + { + "epoch": 1.76, + "learning_rate": 3.609120200320907e-05, + "loss": 0.0051, + "step": 678740 + }, + { + "epoch": 1.76, + "learning_rate": 3.608731378683761e-05, + "loss": 0.0101, + "step": 678750 + }, + { + "epoch": 1.76, + "learning_rate": 3.608342557046614e-05, + "loss": 0.0083, + "step": 678760 + }, + { + "epoch": 1.76, + "learning_rate": 3.607953735409468e-05, + "loss": 0.0064, + "step": 678770 + }, + { + "epoch": 1.76, + "learning_rate": 3.607564913772321e-05, + "loss": 0.0075, + "step": 678780 + }, + { + "epoch": 1.76, + "learning_rate": 3.6071760921351746e-05, + "loss": 0.0069, + "step": 678790 + }, + { + "epoch": 1.76, + "learning_rate": 3.606787270498028e-05, + "loss": 0.0072, + "step": 678800 + }, + { + "epoch": 1.76, + "learning_rate": 3.6063984488608816e-05, + "loss": 0.0065, + "step": 678810 + }, + { + "epoch": 1.76, + "learning_rate": 3.606009627223735e-05, + "loss": 0.0086, + "step": 678820 + }, + { + "epoch": 1.76, + "learning_rate": 3.605620805586589e-05, + "loss": 0.0055, + "step": 678830 + }, + { + "epoch": 1.76, + "learning_rate": 3.605231983949443e-05, + "loss": 0.008, + "step": 678840 + }, + { + "epoch": 1.76, + "learning_rate": 3.604843162312296e-05, + "loss": 0.0095, + "step": 678850 + }, + { + "epoch": 1.76, + "learning_rate": 3.60445434067515e-05, + "loss": 0.0061, + "step": 678860 + }, + { + "epoch": 1.76, + "learning_rate": 3.604065519038003e-05, + "loss": 0.0077, + "step": 678870 + }, + { + "epoch": 1.76, + "learning_rate": 3.603676697400857e-05, + "loss": 0.0067, + "step": 678880 + }, + { + "epoch": 1.76, + "learning_rate": 3.60328787576371e-05, + "loss": 0.0059, + "step": 678890 + }, + { + "epoch": 1.76, + "learning_rate": 3.602899054126564e-05, + "loss": 0.0097, + "step": 678900 + }, + { + "epoch": 1.76, + "learning_rate": 3.602510232489417e-05, + "loss": 0.0074, + "step": 678910 + }, + { + "epoch": 1.76, + "learning_rate": 3.6021214108522706e-05, + "loss": 0.0075, + "step": 678920 + }, + { + "epoch": 1.76, + "learning_rate": 3.601732589215124e-05, + "loss": 0.0069, + "step": 678930 + }, + { + "epoch": 1.76, + "learning_rate": 3.6013437675779776e-05, + "loss": 0.0071, + "step": 678940 + }, + { + "epoch": 1.76, + "learning_rate": 3.600954945940831e-05, + "loss": 0.0083, + "step": 678950 + }, + { + "epoch": 1.76, + "learning_rate": 3.600566124303685e-05, + "loss": 0.0065, + "step": 678960 + }, + { + "epoch": 1.76, + "learning_rate": 3.600177302666539e-05, + "loss": 0.008, + "step": 678970 + }, + { + "epoch": 1.76, + "learning_rate": 3.599788481029392e-05, + "loss": 0.0056, + "step": 678980 + }, + { + "epoch": 1.76, + "learning_rate": 3.599399659392246e-05, + "loss": 0.0069, + "step": 678990 + }, + { + "epoch": 1.76, + "learning_rate": 3.599010837755099e-05, + "loss": 0.0079, + "step": 679000 + }, + { + "epoch": 1.76, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.00512329675257206, + "eval_runtime": 108.0539, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 679000 + }, + { + "epoch": 1.76, + "learning_rate": 3.598622016117953e-05, + "loss": 0.0068, + "step": 679010 + }, + { + "epoch": 1.76, + "learning_rate": 3.598233194480806e-05, + "loss": 0.0103, + "step": 679020 + }, + { + "epoch": 1.76, + "learning_rate": 3.59784437284366e-05, + "loss": 0.0082, + "step": 679030 + }, + { + "epoch": 1.76, + "learning_rate": 3.597455551206513e-05, + "loss": 0.0083, + "step": 679040 + }, + { + "epoch": 1.76, + "learning_rate": 3.5970667295693666e-05, + "loss": 0.0123, + "step": 679050 + }, + { + "epoch": 1.76, + "learning_rate": 3.59667790793222e-05, + "loss": 0.0088, + "step": 679060 + }, + { + "epoch": 1.76, + "learning_rate": 3.5962890862950736e-05, + "loss": 0.0074, + "step": 679070 + }, + { + "epoch": 1.76, + "learning_rate": 3.595900264657927e-05, + "loss": 0.0068, + "step": 679080 + }, + { + "epoch": 1.76, + "learning_rate": 3.595511443020781e-05, + "loss": 0.0083, + "step": 679090 + }, + { + "epoch": 1.76, + "learning_rate": 3.595122621383635e-05, + "loss": 0.0058, + "step": 679100 + }, + { + "epoch": 1.76, + "learning_rate": 3.594733799746488e-05, + "loss": 0.0071, + "step": 679110 + }, + { + "epoch": 1.76, + "learning_rate": 3.594344978109342e-05, + "loss": 0.0099, + "step": 679120 + }, + { + "epoch": 1.76, + "learning_rate": 3.5939561564721945e-05, + "loss": 0.0072, + "step": 679130 + }, + { + "epoch": 1.76, + "learning_rate": 3.593567334835049e-05, + "loss": 0.0107, + "step": 679140 + }, + { + "epoch": 1.76, + "learning_rate": 3.593178513197902e-05, + "loss": 0.0064, + "step": 679150 + }, + { + "epoch": 1.76, + "learning_rate": 3.592789691560756e-05, + "loss": 0.0069, + "step": 679160 + }, + { + "epoch": 1.76, + "learning_rate": 3.592400869923609e-05, + "loss": 0.0094, + "step": 679170 + }, + { + "epoch": 1.76, + "learning_rate": 3.5920120482864626e-05, + "loss": 0.0081, + "step": 679180 + }, + { + "epoch": 1.76, + "learning_rate": 3.591623226649316e-05, + "loss": 0.0074, + "step": 679190 + }, + { + "epoch": 1.76, + "learning_rate": 3.5912344050121696e-05, + "loss": 0.01, + "step": 679200 + }, + { + "epoch": 1.76, + "learning_rate": 3.590845583375023e-05, + "loss": 0.0091, + "step": 679210 + }, + { + "epoch": 1.76, + "learning_rate": 3.590456761737877e-05, + "loss": 0.0109, + "step": 679220 + }, + { + "epoch": 1.76, + "learning_rate": 3.590067940100731e-05, + "loss": 0.0082, + "step": 679230 + }, + { + "epoch": 1.76, + "learning_rate": 3.589679118463584e-05, + "loss": 0.0077, + "step": 679240 + }, + { + "epoch": 1.76, + "learning_rate": 3.589290296826438e-05, + "loss": 0.0099, + "step": 679250 + }, + { + "epoch": 1.76, + "learning_rate": 3.5889014751892905e-05, + "loss": 0.0106, + "step": 679260 + }, + { + "epoch": 1.76, + "learning_rate": 3.588512653552145e-05, + "loss": 0.0067, + "step": 679270 + }, + { + "epoch": 1.76, + "learning_rate": 3.588123831914998e-05, + "loss": 0.008, + "step": 679280 + }, + { + "epoch": 1.76, + "learning_rate": 3.587735010277852e-05, + "loss": 0.0099, + "step": 679290 + }, + { + "epoch": 1.76, + "learning_rate": 3.587346188640705e-05, + "loss": 0.007, + "step": 679300 + }, + { + "epoch": 1.76, + "learning_rate": 3.5869573670035586e-05, + "loss": 0.0088, + "step": 679310 + }, + { + "epoch": 1.76, + "learning_rate": 3.586568545366412e-05, + "loss": 0.0057, + "step": 679320 + }, + { + "epoch": 1.76, + "learning_rate": 3.5861797237292656e-05, + "loss": 0.0073, + "step": 679330 + }, + { + "epoch": 1.76, + "learning_rate": 3.585790902092119e-05, + "loss": 0.0075, + "step": 679340 + }, + { + "epoch": 1.76, + "learning_rate": 3.585402080454973e-05, + "loss": 0.0078, + "step": 679350 + }, + { + "epoch": 1.76, + "learning_rate": 3.585013258817827e-05, + "loss": 0.0058, + "step": 679360 + }, + { + "epoch": 1.76, + "learning_rate": 3.58462443718068e-05, + "loss": 0.0073, + "step": 679370 + }, + { + "epoch": 1.76, + "learning_rate": 3.584235615543533e-05, + "loss": 0.0093, + "step": 679380 + }, + { + "epoch": 1.76, + "learning_rate": 3.5838467939063865e-05, + "loss": 0.0095, + "step": 679390 + }, + { + "epoch": 1.76, + "learning_rate": 3.583457972269241e-05, + "loss": 0.0112, + "step": 679400 + }, + { + "epoch": 1.76, + "learning_rate": 3.583069150632094e-05, + "loss": 0.0135, + "step": 679410 + }, + { + "epoch": 1.76, + "learning_rate": 3.582680328994948e-05, + "loss": 0.0098, + "step": 679420 + }, + { + "epoch": 1.76, + "learning_rate": 3.582291507357801e-05, + "loss": 0.0088, + "step": 679430 + }, + { + "epoch": 1.76, + "learning_rate": 3.5819026857206546e-05, + "loss": 0.008, + "step": 679440 + }, + { + "epoch": 1.76, + "learning_rate": 3.581513864083508e-05, + "loss": 0.0068, + "step": 679450 + }, + { + "epoch": 1.76, + "learning_rate": 3.5811250424463616e-05, + "loss": 0.0077, + "step": 679460 + }, + { + "epoch": 1.76, + "learning_rate": 3.580736220809215e-05, + "loss": 0.009, + "step": 679470 + }, + { + "epoch": 1.76, + "learning_rate": 3.580347399172069e-05, + "loss": 0.0073, + "step": 679480 + }, + { + "epoch": 1.76, + "learning_rate": 3.579958577534923e-05, + "loss": 0.0076, + "step": 679490 + }, + { + "epoch": 1.76, + "learning_rate": 3.579569755897776e-05, + "loss": 0.0088, + "step": 679500 + }, + { + "epoch": 1.76, + "learning_rate": 3.579180934260629e-05, + "loss": 0.012, + "step": 679510 + }, + { + "epoch": 1.76, + "learning_rate": 3.5787921126234825e-05, + "loss": 0.0068, + "step": 679520 + }, + { + "epoch": 1.76, + "learning_rate": 3.578403290986337e-05, + "loss": 0.0077, + "step": 679530 + }, + { + "epoch": 1.76, + "learning_rate": 3.57801446934919e-05, + "loss": 0.0047, + "step": 679540 + }, + { + "epoch": 1.76, + "learning_rate": 3.577625647712044e-05, + "loss": 0.0062, + "step": 679550 + }, + { + "epoch": 1.76, + "learning_rate": 3.577236826074897e-05, + "loss": 0.0074, + "step": 679560 + }, + { + "epoch": 1.76, + "learning_rate": 3.5768480044377506e-05, + "loss": 0.0087, + "step": 679570 + }, + { + "epoch": 1.76, + "learning_rate": 3.576459182800604e-05, + "loss": 0.0083, + "step": 679580 + }, + { + "epoch": 1.76, + "learning_rate": 3.5760703611634576e-05, + "loss": 0.0082, + "step": 679590 + }, + { + "epoch": 1.76, + "learning_rate": 3.575681539526311e-05, + "loss": 0.0101, + "step": 679600 + }, + { + "epoch": 1.76, + "learning_rate": 3.575292717889165e-05, + "loss": 0.0088, + "step": 679610 + }, + { + "epoch": 1.76, + "learning_rate": 3.574903896252019e-05, + "loss": 0.0091, + "step": 679620 + }, + { + "epoch": 1.76, + "learning_rate": 3.5745150746148716e-05, + "loss": 0.0091, + "step": 679630 + }, + { + "epoch": 1.76, + "learning_rate": 3.574126252977725e-05, + "loss": 0.009, + "step": 679640 + }, + { + "epoch": 1.76, + "learning_rate": 3.5737374313405785e-05, + "loss": 0.0098, + "step": 679650 + }, + { + "epoch": 1.76, + "learning_rate": 3.573348609703433e-05, + "loss": 0.0065, + "step": 679660 + }, + { + "epoch": 1.76, + "learning_rate": 3.572959788066286e-05, + "loss": 0.0115, + "step": 679670 + }, + { + "epoch": 1.76, + "learning_rate": 3.5725709664291397e-05, + "loss": 0.0108, + "step": 679680 + }, + { + "epoch": 1.76, + "learning_rate": 3.572182144791993e-05, + "loss": 0.008, + "step": 679690 + }, + { + "epoch": 1.76, + "learning_rate": 3.5717933231548466e-05, + "loss": 0.0111, + "step": 679700 + }, + { + "epoch": 1.76, + "learning_rate": 3.5714045015177e-05, + "loss": 0.0081, + "step": 679710 + }, + { + "epoch": 1.76, + "learning_rate": 3.5710156798805536e-05, + "loss": 0.0104, + "step": 679720 + }, + { + "epoch": 1.76, + "learning_rate": 3.570626858243407e-05, + "loss": 0.0064, + "step": 679730 + }, + { + "epoch": 1.76, + "learning_rate": 3.570238036606261e-05, + "loss": 0.0073, + "step": 679740 + }, + { + "epoch": 1.76, + "learning_rate": 3.569849214969115e-05, + "loss": 0.0069, + "step": 679750 + }, + { + "epoch": 1.76, + "learning_rate": 3.5694603933319675e-05, + "loss": 0.0078, + "step": 679760 + }, + { + "epoch": 1.76, + "learning_rate": 3.569071571694821e-05, + "loss": 0.0067, + "step": 679770 + }, + { + "epoch": 1.76, + "learning_rate": 3.5686827500576745e-05, + "loss": 0.0057, + "step": 679780 + }, + { + "epoch": 1.76, + "learning_rate": 3.568293928420529e-05, + "loss": 0.011, + "step": 679790 + }, + { + "epoch": 1.76, + "learning_rate": 3.567905106783382e-05, + "loss": 0.0083, + "step": 679800 + }, + { + "epoch": 1.76, + "learning_rate": 3.5675162851462357e-05, + "loss": 0.0084, + "step": 679810 + }, + { + "epoch": 1.76, + "learning_rate": 3.567127463509089e-05, + "loss": 0.0063, + "step": 679820 + }, + { + "epoch": 1.76, + "learning_rate": 3.5667386418719426e-05, + "loss": 0.0089, + "step": 679830 + }, + { + "epoch": 1.76, + "learning_rate": 3.566349820234796e-05, + "loss": 0.0079, + "step": 679840 + }, + { + "epoch": 1.76, + "learning_rate": 3.5659609985976496e-05, + "loss": 0.0077, + "step": 679850 + }, + { + "epoch": 1.76, + "learning_rate": 3.565572176960503e-05, + "loss": 0.0068, + "step": 679860 + }, + { + "epoch": 1.76, + "learning_rate": 3.565183355323357e-05, + "loss": 0.0089, + "step": 679870 + }, + { + "epoch": 1.76, + "learning_rate": 3.56479453368621e-05, + "loss": 0.0122, + "step": 679880 + }, + { + "epoch": 1.76, + "learning_rate": 3.5644057120490635e-05, + "loss": 0.006, + "step": 679890 + }, + { + "epoch": 1.76, + "learning_rate": 3.564016890411917e-05, + "loss": 0.0073, + "step": 679900 + }, + { + "epoch": 1.76, + "learning_rate": 3.5636280687747705e-05, + "loss": 0.0082, + "step": 679910 + }, + { + "epoch": 1.76, + "learning_rate": 3.563239247137625e-05, + "loss": 0.008, + "step": 679920 + }, + { + "epoch": 1.76, + "learning_rate": 3.562850425500478e-05, + "loss": 0.0097, + "step": 679930 + }, + { + "epoch": 1.76, + "learning_rate": 3.5624616038633317e-05, + "loss": 0.0061, + "step": 679940 + }, + { + "epoch": 1.76, + "learning_rate": 3.562072782226185e-05, + "loss": 0.0077, + "step": 679950 + }, + { + "epoch": 1.76, + "learning_rate": 3.5616839605890386e-05, + "loss": 0.0089, + "step": 679960 + }, + { + "epoch": 1.76, + "learning_rate": 3.561295138951892e-05, + "loss": 0.0087, + "step": 679970 + }, + { + "epoch": 1.76, + "learning_rate": 3.5609063173147456e-05, + "loss": 0.0092, + "step": 679980 + }, + { + "epoch": 1.76, + "learning_rate": 3.560517495677599e-05, + "loss": 0.0096, + "step": 679990 + }, + { + "epoch": 1.76, + "learning_rate": 3.5601286740404526e-05, + "loss": 0.006, + "step": 680000 + }, + { + "epoch": 1.76, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.005062996409833431, + "eval_runtime": 107.9149, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 680000 + }, + { + "epoch": 1.76, + "learning_rate": 3.559739852403306e-05, + "loss": 0.0052, + "step": 680010 + }, + { + "epoch": 1.76, + "learning_rate": 3.5593510307661595e-05, + "loss": 0.0064, + "step": 680020 + }, + { + "epoch": 1.76, + "learning_rate": 3.558962209129013e-05, + "loss": 0.0052, + "step": 680030 + }, + { + "epoch": 1.76, + "learning_rate": 3.5585733874918665e-05, + "loss": 0.0084, + "step": 680040 + }, + { + "epoch": 1.76, + "learning_rate": 3.55818456585472e-05, + "loss": 0.0117, + "step": 680050 + }, + { + "epoch": 1.76, + "learning_rate": 3.557795744217574e-05, + "loss": 0.005, + "step": 680060 + }, + { + "epoch": 1.76, + "learning_rate": 3.5574069225804277e-05, + "loss": 0.0104, + "step": 680070 + }, + { + "epoch": 1.76, + "learning_rate": 3.557018100943281e-05, + "loss": 0.0075, + "step": 680080 + }, + { + "epoch": 1.76, + "learning_rate": 3.5566292793061346e-05, + "loss": 0.0066, + "step": 680090 + }, + { + "epoch": 1.76, + "learning_rate": 3.556240457668988e-05, + "loss": 0.0076, + "step": 680100 + }, + { + "epoch": 1.76, + "learning_rate": 3.5558516360318416e-05, + "loss": 0.0114, + "step": 680110 + }, + { + "epoch": 1.76, + "learning_rate": 3.555462814394695e-05, + "loss": 0.0079, + "step": 680120 + }, + { + "epoch": 1.76, + "learning_rate": 3.5550739927575486e-05, + "loss": 0.0092, + "step": 680130 + }, + { + "epoch": 1.76, + "learning_rate": 3.554685171120402e-05, + "loss": 0.0092, + "step": 680140 + }, + { + "epoch": 1.76, + "learning_rate": 3.5542963494832555e-05, + "loss": 0.0058, + "step": 680150 + }, + { + "epoch": 1.76, + "learning_rate": 3.553907527846109e-05, + "loss": 0.0093, + "step": 680160 + }, + { + "epoch": 1.76, + "learning_rate": 3.5535187062089625e-05, + "loss": 0.0071, + "step": 680170 + }, + { + "epoch": 1.76, + "learning_rate": 3.553129884571816e-05, + "loss": 0.0083, + "step": 680180 + }, + { + "epoch": 1.76, + "learning_rate": 3.55274106293467e-05, + "loss": 0.0076, + "step": 680190 + }, + { + "epoch": 1.76, + "learning_rate": 3.5523522412975237e-05, + "loss": 0.0111, + "step": 680200 + }, + { + "epoch": 1.76, + "learning_rate": 3.551963419660377e-05, + "loss": 0.006, + "step": 680210 + }, + { + "epoch": 1.76, + "learning_rate": 3.5515745980232306e-05, + "loss": 0.0066, + "step": 680220 + }, + { + "epoch": 1.76, + "learning_rate": 3.551185776386084e-05, + "loss": 0.0064, + "step": 680230 + }, + { + "epoch": 1.76, + "learning_rate": 3.5507969547489376e-05, + "loss": 0.0072, + "step": 680240 + }, + { + "epoch": 1.76, + "learning_rate": 3.550408133111791e-05, + "loss": 0.0062, + "step": 680250 + }, + { + "epoch": 1.76, + "learning_rate": 3.5500193114746446e-05, + "loss": 0.0074, + "step": 680260 + }, + { + "epoch": 1.76, + "learning_rate": 3.549630489837498e-05, + "loss": 0.0074, + "step": 680270 + }, + { + "epoch": 1.76, + "learning_rate": 3.5492416682003515e-05, + "loss": 0.0067, + "step": 680280 + }, + { + "epoch": 1.76, + "learning_rate": 3.548852846563205e-05, + "loss": 0.0066, + "step": 680290 + }, + { + "epoch": 1.76, + "learning_rate": 3.5484640249260585e-05, + "loss": 0.0069, + "step": 680300 + }, + { + "epoch": 1.76, + "learning_rate": 3.548075203288912e-05, + "loss": 0.007, + "step": 680310 + }, + { + "epoch": 1.76, + "learning_rate": 3.547686381651766e-05, + "loss": 0.0094, + "step": 680320 + }, + { + "epoch": 1.76, + "learning_rate": 3.5472975600146196e-05, + "loss": 0.0077, + "step": 680330 + }, + { + "epoch": 1.76, + "learning_rate": 3.546908738377473e-05, + "loss": 0.0073, + "step": 680340 + }, + { + "epoch": 1.76, + "learning_rate": 3.5465199167403266e-05, + "loss": 0.0086, + "step": 680350 + }, + { + "epoch": 1.76, + "learning_rate": 3.54613109510318e-05, + "loss": 0.0066, + "step": 680360 + }, + { + "epoch": 1.76, + "learning_rate": 3.5457422734660336e-05, + "loss": 0.0077, + "step": 680370 + }, + { + "epoch": 1.76, + "learning_rate": 3.545353451828887e-05, + "loss": 0.0051, + "step": 680380 + }, + { + "epoch": 1.76, + "learning_rate": 3.5449646301917406e-05, + "loss": 0.0067, + "step": 680390 + }, + { + "epoch": 1.76, + "learning_rate": 3.544575808554594e-05, + "loss": 0.0091, + "step": 680400 + }, + { + "epoch": 1.76, + "learning_rate": 3.5441869869174475e-05, + "loss": 0.0091, + "step": 680410 + }, + { + "epoch": 1.76, + "learning_rate": 3.543798165280301e-05, + "loss": 0.007, + "step": 680420 + }, + { + "epoch": 1.76, + "learning_rate": 3.5434093436431545e-05, + "loss": 0.0088, + "step": 680430 + }, + { + "epoch": 1.76, + "learning_rate": 3.543020522006008e-05, + "loss": 0.0061, + "step": 680440 + }, + { + "epoch": 1.76, + "learning_rate": 3.542631700368862e-05, + "loss": 0.0087, + "step": 680450 + }, + { + "epoch": 1.76, + "learning_rate": 3.5422428787317156e-05, + "loss": 0.0092, + "step": 680460 + }, + { + "epoch": 1.76, + "learning_rate": 3.541854057094569e-05, + "loss": 0.0072, + "step": 680470 + }, + { + "epoch": 1.76, + "learning_rate": 3.5414652354574226e-05, + "loss": 0.0068, + "step": 680480 + }, + { + "epoch": 1.76, + "learning_rate": 3.541076413820276e-05, + "loss": 0.0065, + "step": 680490 + }, + { + "epoch": 1.76, + "learning_rate": 3.5406875921831296e-05, + "loss": 0.0072, + "step": 680500 + }, + { + "epoch": 1.76, + "learning_rate": 3.540298770545983e-05, + "loss": 0.0086, + "step": 680510 + }, + { + "epoch": 1.76, + "learning_rate": 3.5399099489088366e-05, + "loss": 0.0089, + "step": 680520 + }, + { + "epoch": 1.76, + "learning_rate": 3.53952112727169e-05, + "loss": 0.0081, + "step": 680530 + }, + { + "epoch": 1.76, + "learning_rate": 3.5391323056345435e-05, + "loss": 0.0095, + "step": 680540 + }, + { + "epoch": 1.76, + "learning_rate": 3.538743483997397e-05, + "loss": 0.0069, + "step": 680550 + }, + { + "epoch": 1.76, + "learning_rate": 3.5383546623602505e-05, + "loss": 0.0084, + "step": 680560 + }, + { + "epoch": 1.76, + "learning_rate": 3.537965840723104e-05, + "loss": 0.0086, + "step": 680570 + }, + { + "epoch": 1.76, + "learning_rate": 3.537577019085958e-05, + "loss": 0.0072, + "step": 680580 + }, + { + "epoch": 1.76, + "learning_rate": 3.5371881974488116e-05, + "loss": 0.0057, + "step": 680590 + }, + { + "epoch": 1.76, + "learning_rate": 3.536799375811665e-05, + "loss": 0.0086, + "step": 680600 + }, + { + "epoch": 1.76, + "learning_rate": 3.5364105541745186e-05, + "loss": 0.0066, + "step": 680610 + }, + { + "epoch": 1.76, + "learning_rate": 3.5360217325373714e-05, + "loss": 0.0075, + "step": 680620 + }, + { + "epoch": 1.76, + "learning_rate": 3.5356329109002256e-05, + "loss": 0.0082, + "step": 680630 + }, + { + "epoch": 1.76, + "learning_rate": 3.535244089263079e-05, + "loss": 0.0058, + "step": 680640 + }, + { + "epoch": 1.76, + "learning_rate": 3.5348552676259326e-05, + "loss": 0.0077, + "step": 680650 + }, + { + "epoch": 1.76, + "learning_rate": 3.534466445988786e-05, + "loss": 0.005, + "step": 680660 + }, + { + "epoch": 1.76, + "learning_rate": 3.5340776243516395e-05, + "loss": 0.006, + "step": 680670 + }, + { + "epoch": 1.76, + "learning_rate": 3.533688802714493e-05, + "loss": 0.0075, + "step": 680680 + }, + { + "epoch": 1.76, + "learning_rate": 3.5332999810773465e-05, + "loss": 0.0079, + "step": 680690 + }, + { + "epoch": 1.76, + "learning_rate": 3.5329111594402e-05, + "loss": 0.0068, + "step": 680700 + }, + { + "epoch": 1.76, + "learning_rate": 3.532522337803054e-05, + "loss": 0.007, + "step": 680710 + }, + { + "epoch": 1.76, + "learning_rate": 3.5321335161659076e-05, + "loss": 0.0056, + "step": 680720 + }, + { + "epoch": 1.76, + "learning_rate": 3.531744694528761e-05, + "loss": 0.0107, + "step": 680730 + }, + { + "epoch": 1.76, + "learning_rate": 3.5313558728916146e-05, + "loss": 0.0066, + "step": 680740 + }, + { + "epoch": 1.76, + "learning_rate": 3.5309670512544674e-05, + "loss": 0.0076, + "step": 680750 + }, + { + "epoch": 1.76, + "learning_rate": 3.5305782296173216e-05, + "loss": 0.0087, + "step": 680760 + }, + { + "epoch": 1.76, + "learning_rate": 3.530189407980175e-05, + "loss": 0.0103, + "step": 680770 + }, + { + "epoch": 1.76, + "learning_rate": 3.5298005863430286e-05, + "loss": 0.0085, + "step": 680780 + }, + { + "epoch": 1.76, + "learning_rate": 3.529411764705882e-05, + "loss": 0.0055, + "step": 680790 + }, + { + "epoch": 1.76, + "learning_rate": 3.5290229430687355e-05, + "loss": 0.0068, + "step": 680800 + }, + { + "epoch": 1.76, + "learning_rate": 3.528634121431589e-05, + "loss": 0.0096, + "step": 680810 + }, + { + "epoch": 1.76, + "learning_rate": 3.5282452997944425e-05, + "loss": 0.008, + "step": 680820 + }, + { + "epoch": 1.76, + "learning_rate": 3.527856478157296e-05, + "loss": 0.0058, + "step": 680830 + }, + { + "epoch": 1.76, + "learning_rate": 3.52746765652015e-05, + "loss": 0.0068, + "step": 680840 + }, + { + "epoch": 1.76, + "learning_rate": 3.5270788348830036e-05, + "loss": 0.0105, + "step": 680850 + }, + { + "epoch": 1.76, + "learning_rate": 3.526690013245857e-05, + "loss": 0.006, + "step": 680860 + }, + { + "epoch": 1.76, + "learning_rate": 3.52630119160871e-05, + "loss": 0.0064, + "step": 680870 + }, + { + "epoch": 1.76, + "learning_rate": 3.5259123699715634e-05, + "loss": 0.0062, + "step": 680880 + }, + { + "epoch": 1.76, + "learning_rate": 3.5255235483344176e-05, + "loss": 0.0093, + "step": 680890 + }, + { + "epoch": 1.76, + "learning_rate": 3.525134726697271e-05, + "loss": 0.0089, + "step": 680900 + }, + { + "epoch": 1.77, + "learning_rate": 3.5247459050601246e-05, + "loss": 0.0075, + "step": 680910 + }, + { + "epoch": 1.77, + "learning_rate": 3.524357083422978e-05, + "loss": 0.0074, + "step": 680920 + }, + { + "epoch": 1.77, + "learning_rate": 3.5239682617858315e-05, + "loss": 0.0093, + "step": 680930 + }, + { + "epoch": 1.77, + "learning_rate": 3.523579440148685e-05, + "loss": 0.0096, + "step": 680940 + }, + { + "epoch": 1.77, + "learning_rate": 3.5231906185115385e-05, + "loss": 0.0079, + "step": 680950 + }, + { + "epoch": 1.77, + "learning_rate": 3.522801796874392e-05, + "loss": 0.0076, + "step": 680960 + }, + { + "epoch": 1.77, + "learning_rate": 3.522412975237246e-05, + "loss": 0.0073, + "step": 680970 + }, + { + "epoch": 1.77, + "learning_rate": 3.5220241536000996e-05, + "loss": 0.008, + "step": 680980 + }, + { + "epoch": 1.77, + "learning_rate": 3.521635331962953e-05, + "loss": 0.0072, + "step": 680990 + }, + { + "epoch": 1.77, + "learning_rate": 3.521246510325806e-05, + "loss": 0.0071, + "step": 681000 + }, + { + "epoch": 1.77, + "eval_cer": 0.88167329394755, + "eval_loss": 0.004988801199942827, + "eval_runtime": 107.9177, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 681000 + }, + { + "epoch": 1.77, + "learning_rate": 3.5208576886886594e-05, + "loss": 0.0076, + "step": 681010 + }, + { + "epoch": 1.77, + "learning_rate": 3.5204688670515136e-05, + "loss": 0.0057, + "step": 681020 + }, + { + "epoch": 1.77, + "learning_rate": 3.520080045414367e-05, + "loss": 0.0067, + "step": 681030 + }, + { + "epoch": 1.77, + "learning_rate": 3.5196912237772206e-05, + "loss": 0.007, + "step": 681040 + }, + { + "epoch": 1.77, + "learning_rate": 3.519302402140074e-05, + "loss": 0.0066, + "step": 681050 + }, + { + "epoch": 1.77, + "learning_rate": 3.5189135805029275e-05, + "loss": 0.0092, + "step": 681060 + }, + { + "epoch": 1.77, + "learning_rate": 3.518524758865781e-05, + "loss": 0.0083, + "step": 681070 + }, + { + "epoch": 1.77, + "learning_rate": 3.5181359372286345e-05, + "loss": 0.0078, + "step": 681080 + }, + { + "epoch": 1.77, + "learning_rate": 3.517747115591488e-05, + "loss": 0.0072, + "step": 681090 + }, + { + "epoch": 1.77, + "learning_rate": 3.517358293954342e-05, + "loss": 0.0077, + "step": 681100 + }, + { + "epoch": 1.77, + "learning_rate": 3.5169694723171956e-05, + "loss": 0.0082, + "step": 681110 + }, + { + "epoch": 1.77, + "learning_rate": 3.5165806506800484e-05, + "loss": 0.0107, + "step": 681120 + }, + { + "epoch": 1.77, + "learning_rate": 3.516191829042902e-05, + "loss": 0.0091, + "step": 681130 + }, + { + "epoch": 1.77, + "learning_rate": 3.5158030074057554e-05, + "loss": 0.0066, + "step": 681140 + }, + { + "epoch": 1.77, + "learning_rate": 3.5154141857686096e-05, + "loss": 0.0078, + "step": 681150 + }, + { + "epoch": 1.77, + "learning_rate": 3.515025364131463e-05, + "loss": 0.0052, + "step": 681160 + }, + { + "epoch": 1.77, + "learning_rate": 3.5146365424943166e-05, + "loss": 0.0103, + "step": 681170 + }, + { + "epoch": 1.77, + "learning_rate": 3.51424772085717e-05, + "loss": 0.0071, + "step": 681180 + }, + { + "epoch": 1.77, + "learning_rate": 3.5138588992200235e-05, + "loss": 0.0073, + "step": 681190 + }, + { + "epoch": 1.77, + "learning_rate": 3.513470077582877e-05, + "loss": 0.0075, + "step": 681200 + }, + { + "epoch": 1.77, + "learning_rate": 3.5130812559457305e-05, + "loss": 0.0074, + "step": 681210 + }, + { + "epoch": 1.77, + "learning_rate": 3.512692434308584e-05, + "loss": 0.0106, + "step": 681220 + }, + { + "epoch": 1.77, + "learning_rate": 3.512303612671438e-05, + "loss": 0.0076, + "step": 681230 + }, + { + "epoch": 1.77, + "learning_rate": 3.511914791034291e-05, + "loss": 0.0106, + "step": 681240 + }, + { + "epoch": 1.77, + "learning_rate": 3.5115259693971444e-05, + "loss": 0.0083, + "step": 681250 + }, + { + "epoch": 1.77, + "learning_rate": 3.511137147759998e-05, + "loss": 0.0073, + "step": 681260 + }, + { + "epoch": 1.77, + "learning_rate": 3.5107483261228514e-05, + "loss": 0.0096, + "step": 681270 + }, + { + "epoch": 1.77, + "learning_rate": 3.5103595044857056e-05, + "loss": 0.0058, + "step": 681280 + }, + { + "epoch": 1.77, + "learning_rate": 3.509970682848559e-05, + "loss": 0.0071, + "step": 681290 + }, + { + "epoch": 1.77, + "learning_rate": 3.5095818612114125e-05, + "loss": 0.0062, + "step": 681300 + }, + { + "epoch": 1.77, + "learning_rate": 3.509193039574266e-05, + "loss": 0.0094, + "step": 681310 + }, + { + "epoch": 1.77, + "learning_rate": 3.5088042179371195e-05, + "loss": 0.0097, + "step": 681320 + }, + { + "epoch": 1.77, + "learning_rate": 3.508415396299973e-05, + "loss": 0.0076, + "step": 681330 + }, + { + "epoch": 1.77, + "learning_rate": 3.5080265746628265e-05, + "loss": 0.0072, + "step": 681340 + }, + { + "epoch": 1.77, + "learning_rate": 3.50763775302568e-05, + "loss": 0.0071, + "step": 681350 + }, + { + "epoch": 1.77, + "learning_rate": 3.5072489313885335e-05, + "loss": 0.0064, + "step": 681360 + }, + { + "epoch": 1.77, + "learning_rate": 3.506860109751387e-05, + "loss": 0.0072, + "step": 681370 + }, + { + "epoch": 1.77, + "learning_rate": 3.5064712881142404e-05, + "loss": 0.0056, + "step": 681380 + }, + { + "epoch": 1.77, + "learning_rate": 3.506082466477094e-05, + "loss": 0.0069, + "step": 681390 + }, + { + "epoch": 1.77, + "learning_rate": 3.5056936448399474e-05, + "loss": 0.0077, + "step": 681400 + }, + { + "epoch": 1.77, + "learning_rate": 3.505304823202801e-05, + "loss": 0.0074, + "step": 681410 + }, + { + "epoch": 1.77, + "learning_rate": 3.504916001565655e-05, + "loss": 0.0068, + "step": 681420 + }, + { + "epoch": 1.77, + "learning_rate": 3.5045271799285085e-05, + "loss": 0.0088, + "step": 681430 + }, + { + "epoch": 1.77, + "learning_rate": 3.504138358291362e-05, + "loss": 0.0063, + "step": 681440 + }, + { + "epoch": 1.77, + "learning_rate": 3.5037495366542155e-05, + "loss": 0.0071, + "step": 681450 + }, + { + "epoch": 1.77, + "learning_rate": 3.503360715017069e-05, + "loss": 0.0077, + "step": 681460 + }, + { + "epoch": 1.77, + "learning_rate": 3.5029718933799225e-05, + "loss": 0.0061, + "step": 681470 + }, + { + "epoch": 1.77, + "learning_rate": 3.502583071742776e-05, + "loss": 0.0067, + "step": 681480 + }, + { + "epoch": 1.77, + "learning_rate": 3.5021942501056295e-05, + "loss": 0.0055, + "step": 681490 + }, + { + "epoch": 1.77, + "learning_rate": 3.501805428468483e-05, + "loss": 0.006, + "step": 681500 + }, + { + "epoch": 1.77, + "learning_rate": 3.5014166068313364e-05, + "loss": 0.0084, + "step": 681510 + }, + { + "epoch": 1.77, + "learning_rate": 3.50102778519419e-05, + "loss": 0.0094, + "step": 681520 + }, + { + "epoch": 1.77, + "learning_rate": 3.5006389635570434e-05, + "loss": 0.0064, + "step": 681530 + }, + { + "epoch": 1.77, + "learning_rate": 3.500250141919897e-05, + "loss": 0.0068, + "step": 681540 + }, + { + "epoch": 1.77, + "learning_rate": 3.499861320282751e-05, + "loss": 0.0092, + "step": 681550 + }, + { + "epoch": 1.77, + "learning_rate": 3.4994724986456045e-05, + "loss": 0.0056, + "step": 681560 + }, + { + "epoch": 1.77, + "learning_rate": 3.499083677008458e-05, + "loss": 0.0063, + "step": 681570 + }, + { + "epoch": 1.77, + "learning_rate": 3.4986948553713115e-05, + "loss": 0.0069, + "step": 681580 + }, + { + "epoch": 1.77, + "learning_rate": 3.498306033734165e-05, + "loss": 0.0096, + "step": 681590 + }, + { + "epoch": 1.77, + "learning_rate": 3.4979172120970185e-05, + "loss": 0.0076, + "step": 681600 + }, + { + "epoch": 1.77, + "learning_rate": 3.497528390459872e-05, + "loss": 0.0085, + "step": 681610 + }, + { + "epoch": 1.77, + "learning_rate": 3.4971395688227255e-05, + "loss": 0.0088, + "step": 681620 + }, + { + "epoch": 1.77, + "learning_rate": 3.496750747185579e-05, + "loss": 0.0079, + "step": 681630 + }, + { + "epoch": 1.77, + "learning_rate": 3.4963619255484324e-05, + "loss": 0.0082, + "step": 681640 + }, + { + "epoch": 1.77, + "learning_rate": 3.495973103911286e-05, + "loss": 0.0087, + "step": 681650 + }, + { + "epoch": 1.77, + "learning_rate": 3.4955842822741394e-05, + "loss": 0.0136, + "step": 681660 + }, + { + "epoch": 1.77, + "learning_rate": 3.495195460636993e-05, + "loss": 0.0079, + "step": 681670 + }, + { + "epoch": 1.77, + "learning_rate": 3.494806638999847e-05, + "loss": 0.0068, + "step": 681680 + }, + { + "epoch": 1.77, + "learning_rate": 3.4944178173627005e-05, + "loss": 0.0074, + "step": 681690 + }, + { + "epoch": 1.77, + "learning_rate": 3.494028995725554e-05, + "loss": 0.0065, + "step": 681700 + }, + { + "epoch": 1.77, + "learning_rate": 3.4936401740884075e-05, + "loss": 0.0062, + "step": 681710 + }, + { + "epoch": 1.77, + "learning_rate": 3.493251352451261e-05, + "loss": 0.0069, + "step": 681720 + }, + { + "epoch": 1.77, + "learning_rate": 3.4928625308141145e-05, + "loss": 0.0059, + "step": 681730 + }, + { + "epoch": 1.77, + "learning_rate": 3.492473709176968e-05, + "loss": 0.0069, + "step": 681740 + }, + { + "epoch": 1.77, + "learning_rate": 3.4920848875398215e-05, + "loss": 0.0085, + "step": 681750 + }, + { + "epoch": 1.77, + "learning_rate": 3.491696065902675e-05, + "loss": 0.0069, + "step": 681760 + }, + { + "epoch": 1.77, + "learning_rate": 3.4913072442655284e-05, + "loss": 0.0086, + "step": 681770 + }, + { + "epoch": 1.77, + "learning_rate": 3.490918422628382e-05, + "loss": 0.0071, + "step": 681780 + }, + { + "epoch": 1.77, + "learning_rate": 3.4905296009912354e-05, + "loss": 0.0058, + "step": 681790 + }, + { + "epoch": 1.77, + "learning_rate": 3.490140779354089e-05, + "loss": 0.0097, + "step": 681800 + }, + { + "epoch": 1.77, + "learning_rate": 3.489751957716943e-05, + "loss": 0.0056, + "step": 681810 + }, + { + "epoch": 1.77, + "learning_rate": 3.4893631360797965e-05, + "loss": 0.0079, + "step": 681820 + }, + { + "epoch": 1.77, + "learning_rate": 3.48897431444265e-05, + "loss": 0.0094, + "step": 681830 + }, + { + "epoch": 1.77, + "learning_rate": 3.4885854928055035e-05, + "loss": 0.0057, + "step": 681840 + }, + { + "epoch": 1.77, + "learning_rate": 3.488196671168357e-05, + "loss": 0.006, + "step": 681850 + }, + { + "epoch": 1.77, + "learning_rate": 3.4878078495312105e-05, + "loss": 0.0081, + "step": 681860 + }, + { + "epoch": 1.77, + "learning_rate": 3.487419027894064e-05, + "loss": 0.0055, + "step": 681870 + }, + { + "epoch": 1.77, + "learning_rate": 3.4870302062569175e-05, + "loss": 0.0067, + "step": 681880 + }, + { + "epoch": 1.77, + "learning_rate": 3.486641384619771e-05, + "loss": 0.0086, + "step": 681890 + }, + { + "epoch": 1.77, + "learning_rate": 3.4862525629826244e-05, + "loss": 0.0048, + "step": 681900 + }, + { + "epoch": 1.77, + "learning_rate": 3.485863741345478e-05, + "loss": 0.0067, + "step": 681910 + }, + { + "epoch": 1.77, + "learning_rate": 3.4854749197083314e-05, + "loss": 0.0091, + "step": 681920 + }, + { + "epoch": 1.77, + "learning_rate": 3.485086098071185e-05, + "loss": 0.0094, + "step": 681930 + }, + { + "epoch": 1.77, + "learning_rate": 3.484697276434039e-05, + "loss": 0.0077, + "step": 681940 + }, + { + "epoch": 1.77, + "learning_rate": 3.4843084547968925e-05, + "loss": 0.0094, + "step": 681950 + }, + { + "epoch": 1.77, + "learning_rate": 3.483919633159746e-05, + "loss": 0.0075, + "step": 681960 + }, + { + "epoch": 1.77, + "learning_rate": 3.4835308115225995e-05, + "loss": 0.0092, + "step": 681970 + }, + { + "epoch": 1.77, + "learning_rate": 3.483141989885453e-05, + "loss": 0.0086, + "step": 681980 + }, + { + "epoch": 1.77, + "learning_rate": 3.4827531682483065e-05, + "loss": 0.0071, + "step": 681990 + }, + { + "epoch": 1.77, + "learning_rate": 3.48236434661116e-05, + "loss": 0.0079, + "step": 682000 + }, + { + "epoch": 1.77, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.004874969832599163, + "eval_runtime": 107.8015, + "eval_samples_per_second": 18.553, + "eval_steps_per_second": 4.638, + "step": 682000 + }, + { + "epoch": 1.77, + "learning_rate": 3.4819755249740135e-05, + "loss": 0.0052, + "step": 682010 + }, + { + "epoch": 1.77, + "learning_rate": 3.481586703336867e-05, + "loss": 0.0065, + "step": 682020 + }, + { + "epoch": 1.77, + "learning_rate": 3.4811978816997204e-05, + "loss": 0.0099, + "step": 682030 + }, + { + "epoch": 1.77, + "learning_rate": 3.480809060062574e-05, + "loss": 0.0072, + "step": 682040 + }, + { + "epoch": 1.77, + "learning_rate": 3.4804202384254274e-05, + "loss": 0.0047, + "step": 682050 + }, + { + "epoch": 1.77, + "learning_rate": 3.480031416788281e-05, + "loss": 0.0061, + "step": 682060 + }, + { + "epoch": 1.77, + "learning_rate": 3.479642595151135e-05, + "loss": 0.0079, + "step": 682070 + }, + { + "epoch": 1.77, + "learning_rate": 3.4792537735139885e-05, + "loss": 0.0074, + "step": 682080 + }, + { + "epoch": 1.77, + "learning_rate": 3.478864951876842e-05, + "loss": 0.0069, + "step": 682090 + }, + { + "epoch": 1.77, + "learning_rate": 3.4784761302396955e-05, + "loss": 0.0082, + "step": 682100 + }, + { + "epoch": 1.77, + "learning_rate": 3.478087308602548e-05, + "loss": 0.0067, + "step": 682110 + }, + { + "epoch": 1.77, + "learning_rate": 3.4776984869654025e-05, + "loss": 0.0051, + "step": 682120 + }, + { + "epoch": 1.77, + "learning_rate": 3.477309665328256e-05, + "loss": 0.0066, + "step": 682130 + }, + { + "epoch": 1.77, + "learning_rate": 3.4769208436911095e-05, + "loss": 0.0076, + "step": 682140 + }, + { + "epoch": 1.77, + "learning_rate": 3.476532022053963e-05, + "loss": 0.0062, + "step": 682150 + }, + { + "epoch": 1.77, + "learning_rate": 3.4761432004168164e-05, + "loss": 0.0058, + "step": 682160 + }, + { + "epoch": 1.77, + "learning_rate": 3.47575437877967e-05, + "loss": 0.0102, + "step": 682170 + }, + { + "epoch": 1.77, + "learning_rate": 3.4753655571425234e-05, + "loss": 0.0135, + "step": 682180 + }, + { + "epoch": 1.77, + "learning_rate": 3.474976735505377e-05, + "loss": 0.0088, + "step": 682190 + }, + { + "epoch": 1.77, + "learning_rate": 3.474587913868231e-05, + "loss": 0.0111, + "step": 682200 + }, + { + "epoch": 1.77, + "learning_rate": 3.4741990922310845e-05, + "loss": 0.0073, + "step": 682210 + }, + { + "epoch": 1.77, + "learning_rate": 3.473810270593938e-05, + "loss": 0.0054, + "step": 682220 + }, + { + "epoch": 1.77, + "learning_rate": 3.4734214489567915e-05, + "loss": 0.0091, + "step": 682230 + }, + { + "epoch": 1.77, + "learning_rate": 3.473032627319644e-05, + "loss": 0.0058, + "step": 682240 + }, + { + "epoch": 1.77, + "learning_rate": 3.4726438056824985e-05, + "loss": 0.0073, + "step": 682250 + }, + { + "epoch": 1.77, + "learning_rate": 3.472254984045352e-05, + "loss": 0.0091, + "step": 682260 + }, + { + "epoch": 1.77, + "learning_rate": 3.4718661624082054e-05, + "loss": 0.0085, + "step": 682270 + }, + { + "epoch": 1.77, + "learning_rate": 3.471477340771059e-05, + "loss": 0.0067, + "step": 682280 + }, + { + "epoch": 1.77, + "learning_rate": 3.4710885191339124e-05, + "loss": 0.0086, + "step": 682290 + }, + { + "epoch": 1.77, + "learning_rate": 3.470699697496766e-05, + "loss": 0.0078, + "step": 682300 + }, + { + "epoch": 1.77, + "learning_rate": 3.4703108758596194e-05, + "loss": 0.0061, + "step": 682310 + }, + { + "epoch": 1.77, + "learning_rate": 3.469922054222473e-05, + "loss": 0.0084, + "step": 682320 + }, + { + "epoch": 1.77, + "learning_rate": 3.469533232585327e-05, + "loss": 0.0101, + "step": 682330 + }, + { + "epoch": 1.77, + "learning_rate": 3.4691444109481805e-05, + "loss": 0.0072, + "step": 682340 + }, + { + "epoch": 1.77, + "learning_rate": 3.468755589311034e-05, + "loss": 0.0054, + "step": 682350 + }, + { + "epoch": 1.77, + "learning_rate": 3.468366767673887e-05, + "loss": 0.0078, + "step": 682360 + }, + { + "epoch": 1.77, + "learning_rate": 3.46797794603674e-05, + "loss": 0.0102, + "step": 682370 + }, + { + "epoch": 1.77, + "learning_rate": 3.4675891243995945e-05, + "loss": 0.0078, + "step": 682380 + }, + { + "epoch": 1.77, + "learning_rate": 3.467200302762448e-05, + "loss": 0.0089, + "step": 682390 + }, + { + "epoch": 1.77, + "learning_rate": 3.4668114811253014e-05, + "loss": 0.0077, + "step": 682400 + }, + { + "epoch": 1.77, + "learning_rate": 3.466422659488155e-05, + "loss": 0.0071, + "step": 682410 + }, + { + "epoch": 1.77, + "learning_rate": 3.4660338378510084e-05, + "loss": 0.0071, + "step": 682420 + }, + { + "epoch": 1.77, + "learning_rate": 3.465645016213862e-05, + "loss": 0.0089, + "step": 682430 + }, + { + "epoch": 1.77, + "learning_rate": 3.4652561945767154e-05, + "loss": 0.0072, + "step": 682440 + }, + { + "epoch": 1.77, + "learning_rate": 3.464867372939569e-05, + "loss": 0.0065, + "step": 682450 + }, + { + "epoch": 1.77, + "learning_rate": 3.464478551302423e-05, + "loss": 0.0096, + "step": 682460 + }, + { + "epoch": 1.77, + "learning_rate": 3.4640897296652765e-05, + "loss": 0.0081, + "step": 682470 + }, + { + "epoch": 1.77, + "learning_rate": 3.463700908028129e-05, + "loss": 0.0079, + "step": 682480 + }, + { + "epoch": 1.77, + "learning_rate": 3.463312086390983e-05, + "loss": 0.0052, + "step": 682490 + }, + { + "epoch": 1.77, + "learning_rate": 3.462923264753836e-05, + "loss": 0.0062, + "step": 682500 + }, + { + "epoch": 1.77, + "learning_rate": 3.4625344431166905e-05, + "loss": 0.0062, + "step": 682510 + }, + { + "epoch": 1.77, + "learning_rate": 3.462145621479544e-05, + "loss": 0.0087, + "step": 682520 + }, + { + "epoch": 1.77, + "learning_rate": 3.4617567998423974e-05, + "loss": 0.0082, + "step": 682530 + }, + { + "epoch": 1.77, + "learning_rate": 3.461367978205251e-05, + "loss": 0.0057, + "step": 682540 + }, + { + "epoch": 1.77, + "learning_rate": 3.4609791565681044e-05, + "loss": 0.008, + "step": 682550 + }, + { + "epoch": 1.77, + "learning_rate": 3.460590334930958e-05, + "loss": 0.0094, + "step": 682560 + }, + { + "epoch": 1.77, + "learning_rate": 3.4602015132938114e-05, + "loss": 0.0075, + "step": 682570 + }, + { + "epoch": 1.77, + "learning_rate": 3.459812691656665e-05, + "loss": 0.0069, + "step": 682580 + }, + { + "epoch": 1.77, + "learning_rate": 3.459423870019519e-05, + "loss": 0.0065, + "step": 682590 + }, + { + "epoch": 1.77, + "learning_rate": 3.4590350483823725e-05, + "loss": 0.0047, + "step": 682600 + }, + { + "epoch": 1.77, + "learning_rate": 3.458646226745225e-05, + "loss": 0.0068, + "step": 682610 + }, + { + "epoch": 1.77, + "learning_rate": 3.458257405108079e-05, + "loss": 0.0054, + "step": 682620 + }, + { + "epoch": 1.77, + "learning_rate": 3.457868583470932e-05, + "loss": 0.0094, + "step": 682630 + }, + { + "epoch": 1.77, + "learning_rate": 3.4574797618337865e-05, + "loss": 0.0097, + "step": 682640 + }, + { + "epoch": 1.77, + "learning_rate": 3.45709094019664e-05, + "loss": 0.0076, + "step": 682650 + }, + { + "epoch": 1.77, + "learning_rate": 3.4567021185594934e-05, + "loss": 0.0053, + "step": 682660 + }, + { + "epoch": 1.77, + "learning_rate": 3.456313296922347e-05, + "loss": 0.0072, + "step": 682670 + }, + { + "epoch": 1.77, + "learning_rate": 3.4559244752852004e-05, + "loss": 0.0079, + "step": 682680 + }, + { + "epoch": 1.77, + "learning_rate": 3.455535653648054e-05, + "loss": 0.0078, + "step": 682690 + }, + { + "epoch": 1.77, + "learning_rate": 3.4551468320109074e-05, + "loss": 0.0053, + "step": 682700 + }, + { + "epoch": 1.77, + "learning_rate": 3.454758010373761e-05, + "loss": 0.0096, + "step": 682710 + }, + { + "epoch": 1.77, + "learning_rate": 3.4543691887366144e-05, + "loss": 0.006, + "step": 682720 + }, + { + "epoch": 1.77, + "learning_rate": 3.453980367099468e-05, + "loss": 0.0042, + "step": 682730 + }, + { + "epoch": 1.77, + "learning_rate": 3.453591545462321e-05, + "loss": 0.0055, + "step": 682740 + }, + { + "epoch": 1.77, + "learning_rate": 3.453202723825175e-05, + "loss": 0.0108, + "step": 682750 + }, + { + "epoch": 1.77, + "learning_rate": 3.452813902188028e-05, + "loss": 0.0059, + "step": 682760 + }, + { + "epoch": 1.77, + "learning_rate": 3.4524250805508825e-05, + "loss": 0.0083, + "step": 682770 + }, + { + "epoch": 1.77, + "learning_rate": 3.452036258913736e-05, + "loss": 0.0089, + "step": 682780 + }, + { + "epoch": 1.77, + "learning_rate": 3.4516474372765894e-05, + "loss": 0.006, + "step": 682790 + }, + { + "epoch": 1.77, + "learning_rate": 3.451258615639443e-05, + "loss": 0.0071, + "step": 682800 + }, + { + "epoch": 1.77, + "learning_rate": 3.4508697940022964e-05, + "loss": 0.0071, + "step": 682810 + }, + { + "epoch": 1.77, + "learning_rate": 3.45048097236515e-05, + "loss": 0.0075, + "step": 682820 + }, + { + "epoch": 1.77, + "learning_rate": 3.4500921507280034e-05, + "loss": 0.0085, + "step": 682830 + }, + { + "epoch": 1.77, + "learning_rate": 3.449703329090857e-05, + "loss": 0.0088, + "step": 682840 + }, + { + "epoch": 1.77, + "learning_rate": 3.4493145074537104e-05, + "loss": 0.0069, + "step": 682850 + }, + { + "epoch": 1.77, + "learning_rate": 3.448925685816564e-05, + "loss": 0.0104, + "step": 682860 + }, + { + "epoch": 1.77, + "learning_rate": 3.448536864179417e-05, + "loss": 0.0112, + "step": 682870 + }, + { + "epoch": 1.77, + "learning_rate": 3.448148042542271e-05, + "loss": 0.0077, + "step": 682880 + }, + { + "epoch": 1.77, + "learning_rate": 3.447759220905124e-05, + "loss": 0.0082, + "step": 682890 + }, + { + "epoch": 1.77, + "learning_rate": 3.447370399267978e-05, + "loss": 0.0063, + "step": 682900 + }, + { + "epoch": 1.77, + "learning_rate": 3.446981577630832e-05, + "loss": 0.0098, + "step": 682910 + }, + { + "epoch": 1.77, + "learning_rate": 3.4465927559936854e-05, + "loss": 0.0072, + "step": 682920 + }, + { + "epoch": 1.77, + "learning_rate": 3.446203934356539e-05, + "loss": 0.0054, + "step": 682930 + }, + { + "epoch": 1.77, + "learning_rate": 3.4458151127193924e-05, + "loss": 0.0123, + "step": 682940 + }, + { + "epoch": 1.77, + "learning_rate": 3.445426291082246e-05, + "loss": 0.0075, + "step": 682950 + }, + { + "epoch": 1.77, + "learning_rate": 3.4450374694450994e-05, + "loss": 0.0074, + "step": 682960 + }, + { + "epoch": 1.77, + "learning_rate": 3.444648647807953e-05, + "loss": 0.008, + "step": 682970 + }, + { + "epoch": 1.77, + "learning_rate": 3.4442598261708064e-05, + "loss": 0.0071, + "step": 682980 + }, + { + "epoch": 1.77, + "learning_rate": 3.44387100453366e-05, + "loss": 0.0079, + "step": 682990 + }, + { + "epoch": 1.77, + "learning_rate": 3.443482182896513e-05, + "loss": 0.0072, + "step": 683000 + }, + { + "epoch": 1.77, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.00494320597499609, + "eval_runtime": 107.8159, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.638, + "step": 683000 + }, + { + "epoch": 1.77, + "learning_rate": 3.443093361259367e-05, + "loss": 0.0079, + "step": 683010 + }, + { + "epoch": 1.77, + "learning_rate": 3.44270453962222e-05, + "loss": 0.0058, + "step": 683020 + }, + { + "epoch": 1.77, + "learning_rate": 3.442315717985074e-05, + "loss": 0.0086, + "step": 683030 + }, + { + "epoch": 1.77, + "learning_rate": 3.441926896347928e-05, + "loss": 0.0087, + "step": 683040 + }, + { + "epoch": 1.77, + "learning_rate": 3.4415380747107814e-05, + "loss": 0.0076, + "step": 683050 + }, + { + "epoch": 1.77, + "learning_rate": 3.441149253073635e-05, + "loss": 0.005, + "step": 683060 + }, + { + "epoch": 1.77, + "learning_rate": 3.4407604314364884e-05, + "loss": 0.0059, + "step": 683070 + }, + { + "epoch": 1.77, + "learning_rate": 3.440371609799342e-05, + "loss": 0.0065, + "step": 683080 + }, + { + "epoch": 1.77, + "learning_rate": 3.4399827881621954e-05, + "loss": 0.0073, + "step": 683090 + }, + { + "epoch": 1.77, + "learning_rate": 3.439593966525049e-05, + "loss": 0.0065, + "step": 683100 + }, + { + "epoch": 1.77, + "learning_rate": 3.4392051448879024e-05, + "loss": 0.0071, + "step": 683110 + }, + { + "epoch": 1.77, + "learning_rate": 3.438816323250756e-05, + "loss": 0.0084, + "step": 683120 + }, + { + "epoch": 1.77, + "learning_rate": 3.438427501613609e-05, + "loss": 0.0089, + "step": 683130 + }, + { + "epoch": 1.77, + "learning_rate": 3.438038679976463e-05, + "loss": 0.0064, + "step": 683140 + }, + { + "epoch": 1.77, + "learning_rate": 3.437649858339316e-05, + "loss": 0.0065, + "step": 683150 + }, + { + "epoch": 1.77, + "learning_rate": 3.43726103670217e-05, + "loss": 0.0048, + "step": 683160 + }, + { + "epoch": 1.77, + "learning_rate": 3.436872215065024e-05, + "loss": 0.0072, + "step": 683170 + }, + { + "epoch": 1.77, + "learning_rate": 3.4364833934278774e-05, + "loss": 0.0066, + "step": 683180 + }, + { + "epoch": 1.77, + "learning_rate": 3.436094571790731e-05, + "loss": 0.0114, + "step": 683190 + }, + { + "epoch": 1.77, + "learning_rate": 3.4357057501535844e-05, + "loss": 0.009, + "step": 683200 + }, + { + "epoch": 1.77, + "learning_rate": 3.435316928516438e-05, + "loss": 0.0098, + "step": 683210 + }, + { + "epoch": 1.77, + "learning_rate": 3.4349281068792914e-05, + "loss": 0.0093, + "step": 683220 + }, + { + "epoch": 1.77, + "learning_rate": 3.434539285242145e-05, + "loss": 0.008, + "step": 683230 + }, + { + "epoch": 1.77, + "learning_rate": 3.4341504636049983e-05, + "loss": 0.0076, + "step": 683240 + }, + { + "epoch": 1.77, + "learning_rate": 3.433761641967852e-05, + "loss": 0.0115, + "step": 683250 + }, + { + "epoch": 1.77, + "learning_rate": 3.433372820330705e-05, + "loss": 0.005, + "step": 683260 + }, + { + "epoch": 1.77, + "learning_rate": 3.432983998693559e-05, + "loss": 0.0066, + "step": 683270 + }, + { + "epoch": 1.77, + "learning_rate": 3.432595177056412e-05, + "loss": 0.0081, + "step": 683280 + }, + { + "epoch": 1.77, + "learning_rate": 3.432206355419266e-05, + "loss": 0.0065, + "step": 683290 + }, + { + "epoch": 1.77, + "learning_rate": 3.43181753378212e-05, + "loss": 0.0077, + "step": 683300 + }, + { + "epoch": 1.77, + "learning_rate": 3.4314287121449734e-05, + "loss": 0.008, + "step": 683310 + }, + { + "epoch": 1.77, + "learning_rate": 3.431039890507827e-05, + "loss": 0.0063, + "step": 683320 + }, + { + "epoch": 1.77, + "learning_rate": 3.4306510688706804e-05, + "loss": 0.0071, + "step": 683330 + }, + { + "epoch": 1.77, + "learning_rate": 3.430262247233534e-05, + "loss": 0.0071, + "step": 683340 + }, + { + "epoch": 1.77, + "learning_rate": 3.4298734255963874e-05, + "loss": 0.0143, + "step": 683350 + }, + { + "epoch": 1.77, + "learning_rate": 3.429484603959241e-05, + "loss": 0.009, + "step": 683360 + }, + { + "epoch": 1.77, + "learning_rate": 3.4290957823220943e-05, + "loss": 0.0097, + "step": 683370 + }, + { + "epoch": 1.77, + "learning_rate": 3.428706960684948e-05, + "loss": 0.0074, + "step": 683380 + }, + { + "epoch": 1.77, + "learning_rate": 3.428318139047801e-05, + "loss": 0.0064, + "step": 683390 + }, + { + "epoch": 1.77, + "learning_rate": 3.427929317410655e-05, + "loss": 0.0077, + "step": 683400 + }, + { + "epoch": 1.77, + "learning_rate": 3.427540495773508e-05, + "loss": 0.0066, + "step": 683410 + }, + { + "epoch": 1.77, + "learning_rate": 3.427151674136362e-05, + "loss": 0.0051, + "step": 683420 + }, + { + "epoch": 1.77, + "learning_rate": 3.426762852499216e-05, + "loss": 0.0069, + "step": 683430 + }, + { + "epoch": 1.77, + "learning_rate": 3.4263740308620694e-05, + "loss": 0.0084, + "step": 683440 + }, + { + "epoch": 1.77, + "learning_rate": 3.425985209224923e-05, + "loss": 0.0059, + "step": 683450 + }, + { + "epoch": 1.77, + "learning_rate": 3.4255963875877764e-05, + "loss": 0.0082, + "step": 683460 + }, + { + "epoch": 1.77, + "learning_rate": 3.42520756595063e-05, + "loss": 0.0069, + "step": 683470 + }, + { + "epoch": 1.77, + "learning_rate": 3.4248187443134834e-05, + "loss": 0.0079, + "step": 683480 + }, + { + "epoch": 1.77, + "learning_rate": 3.424429922676337e-05, + "loss": 0.0099, + "step": 683490 + }, + { + "epoch": 1.77, + "learning_rate": 3.4240411010391903e-05, + "loss": 0.0105, + "step": 683500 + }, + { + "epoch": 1.77, + "learning_rate": 3.423652279402044e-05, + "loss": 0.0087, + "step": 683510 + }, + { + "epoch": 1.77, + "learning_rate": 3.423263457764897e-05, + "loss": 0.0093, + "step": 683520 + }, + { + "epoch": 1.77, + "learning_rate": 3.422874636127751e-05, + "loss": 0.0059, + "step": 683530 + }, + { + "epoch": 1.77, + "learning_rate": 3.422485814490604e-05, + "loss": 0.0075, + "step": 683540 + }, + { + "epoch": 1.77, + "learning_rate": 3.422096992853458e-05, + "loss": 0.0086, + "step": 683550 + }, + { + "epoch": 1.77, + "learning_rate": 3.421708171216312e-05, + "loss": 0.0092, + "step": 683560 + }, + { + "epoch": 1.77, + "learning_rate": 3.4213193495791654e-05, + "loss": 0.0071, + "step": 683570 + }, + { + "epoch": 1.77, + "learning_rate": 3.420930527942019e-05, + "loss": 0.0096, + "step": 683580 + }, + { + "epoch": 1.77, + "learning_rate": 3.4205417063048724e-05, + "loss": 0.0091, + "step": 683590 + }, + { + "epoch": 1.77, + "learning_rate": 3.420152884667725e-05, + "loss": 0.0059, + "step": 683600 + }, + { + "epoch": 1.77, + "learning_rate": 3.4197640630305794e-05, + "loss": 0.0062, + "step": 683610 + }, + { + "epoch": 1.77, + "learning_rate": 3.419375241393433e-05, + "loss": 0.0064, + "step": 683620 + }, + { + "epoch": 1.77, + "learning_rate": 3.4189864197562863e-05, + "loss": 0.0116, + "step": 683630 + }, + { + "epoch": 1.77, + "learning_rate": 3.41859759811914e-05, + "loss": 0.0124, + "step": 683640 + }, + { + "epoch": 1.77, + "learning_rate": 3.418208776481993e-05, + "loss": 0.0061, + "step": 683650 + }, + { + "epoch": 1.77, + "learning_rate": 3.417819954844847e-05, + "loss": 0.0078, + "step": 683660 + }, + { + "epoch": 1.77, + "learning_rate": 3.4174311332077e-05, + "loss": 0.0058, + "step": 683670 + }, + { + "epoch": 1.77, + "learning_rate": 3.417042311570554e-05, + "loss": 0.0074, + "step": 683680 + }, + { + "epoch": 1.77, + "learning_rate": 3.416653489933408e-05, + "loss": 0.0067, + "step": 683690 + }, + { + "epoch": 1.77, + "learning_rate": 3.4162646682962614e-05, + "loss": 0.0086, + "step": 683700 + }, + { + "epoch": 1.77, + "learning_rate": 3.415875846659115e-05, + "loss": 0.0088, + "step": 683710 + }, + { + "epoch": 1.77, + "learning_rate": 3.415487025021968e-05, + "loss": 0.0131, + "step": 683720 + }, + { + "epoch": 1.77, + "learning_rate": 3.415098203384821e-05, + "loss": 0.0076, + "step": 683730 + }, + { + "epoch": 1.77, + "learning_rate": 3.4147093817476754e-05, + "loss": 0.0083, + "step": 683740 + }, + { + "epoch": 1.77, + "learning_rate": 3.414320560110529e-05, + "loss": 0.0166, + "step": 683750 + }, + { + "epoch": 1.77, + "learning_rate": 3.413931738473382e-05, + "loss": 0.0072, + "step": 683760 + }, + { + "epoch": 1.77, + "learning_rate": 3.413542916836236e-05, + "loss": 0.0076, + "step": 683770 + }, + { + "epoch": 1.77, + "learning_rate": 3.413154095199089e-05, + "loss": 0.0093, + "step": 683780 + }, + { + "epoch": 1.77, + "learning_rate": 3.412765273561943e-05, + "loss": 0.0065, + "step": 683790 + }, + { + "epoch": 1.77, + "learning_rate": 3.412376451924796e-05, + "loss": 0.0071, + "step": 683800 + }, + { + "epoch": 1.77, + "learning_rate": 3.41198763028765e-05, + "loss": 0.0086, + "step": 683810 + }, + { + "epoch": 1.77, + "learning_rate": 3.411598808650504e-05, + "loss": 0.01, + "step": 683820 + }, + { + "epoch": 1.77, + "learning_rate": 3.4112099870133574e-05, + "loss": 0.0068, + "step": 683830 + }, + { + "epoch": 1.77, + "learning_rate": 3.410821165376211e-05, + "loss": 0.0089, + "step": 683840 + }, + { + "epoch": 1.77, + "learning_rate": 3.410432343739064e-05, + "loss": 0.0064, + "step": 683850 + }, + { + "epoch": 1.77, + "learning_rate": 3.410043522101917e-05, + "loss": 0.0086, + "step": 683860 + }, + { + "epoch": 1.77, + "learning_rate": 3.4096547004647714e-05, + "loss": 0.0066, + "step": 683870 + }, + { + "epoch": 1.77, + "learning_rate": 3.409265878827625e-05, + "loss": 0.0062, + "step": 683880 + }, + { + "epoch": 1.77, + "learning_rate": 3.408877057190478e-05, + "loss": 0.007, + "step": 683890 + }, + { + "epoch": 1.77, + "learning_rate": 3.408488235553332e-05, + "loss": 0.0059, + "step": 683900 + }, + { + "epoch": 1.77, + "learning_rate": 3.408099413916185e-05, + "loss": 0.0096, + "step": 683910 + }, + { + "epoch": 1.77, + "learning_rate": 3.407710592279039e-05, + "loss": 0.0093, + "step": 683920 + }, + { + "epoch": 1.77, + "learning_rate": 3.407321770641892e-05, + "loss": 0.0095, + "step": 683930 + }, + { + "epoch": 1.77, + "learning_rate": 3.406932949004746e-05, + "loss": 0.0068, + "step": 683940 + }, + { + "epoch": 1.77, + "learning_rate": 3.4065441273676e-05, + "loss": 0.0075, + "step": 683950 + }, + { + "epoch": 1.77, + "learning_rate": 3.4061553057304534e-05, + "loss": 0.0073, + "step": 683960 + }, + { + "epoch": 1.77, + "learning_rate": 3.405766484093306e-05, + "loss": 0.0068, + "step": 683970 + }, + { + "epoch": 1.77, + "learning_rate": 3.40537766245616e-05, + "loss": 0.0067, + "step": 683980 + }, + { + "epoch": 1.77, + "learning_rate": 3.404988840819013e-05, + "loss": 0.0065, + "step": 683990 + }, + { + "epoch": 1.77, + "learning_rate": 3.4046000191818674e-05, + "loss": 0.0057, + "step": 684000 + }, + { + "epoch": 1.77, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.005055462475866079, + "eval_runtime": 107.5085, + "eval_samples_per_second": 18.603, + "eval_steps_per_second": 4.651, + "step": 684000 + }, + { + "epoch": 1.77, + "learning_rate": 3.404211197544721e-05, + "loss": 0.0084, + "step": 684010 + }, + { + "epoch": 1.77, + "learning_rate": 3.403822375907574e-05, + "loss": 0.0081, + "step": 684020 + }, + { + "epoch": 1.77, + "learning_rate": 3.403433554270428e-05, + "loss": 0.0093, + "step": 684030 + }, + { + "epoch": 1.77, + "learning_rate": 3.403044732633281e-05, + "loss": 0.0074, + "step": 684040 + }, + { + "epoch": 1.77, + "learning_rate": 3.402655910996135e-05, + "loss": 0.0088, + "step": 684050 + }, + { + "epoch": 1.77, + "learning_rate": 3.402267089358988e-05, + "loss": 0.0059, + "step": 684060 + }, + { + "epoch": 1.77, + "learning_rate": 3.401878267721842e-05, + "loss": 0.0076, + "step": 684070 + }, + { + "epoch": 1.77, + "learning_rate": 3.401489446084696e-05, + "loss": 0.0063, + "step": 684080 + }, + { + "epoch": 1.77, + "learning_rate": 3.4011006244475494e-05, + "loss": 0.0075, + "step": 684090 + }, + { + "epoch": 1.77, + "learning_rate": 3.400711802810402e-05, + "loss": 0.0068, + "step": 684100 + }, + { + "epoch": 1.77, + "learning_rate": 3.400322981173256e-05, + "loss": 0.0079, + "step": 684110 + }, + { + "epoch": 1.77, + "learning_rate": 3.399934159536109e-05, + "loss": 0.009, + "step": 684120 + }, + { + "epoch": 1.77, + "learning_rate": 3.3995453378989634e-05, + "loss": 0.0058, + "step": 684130 + }, + { + "epoch": 1.77, + "learning_rate": 3.399156516261817e-05, + "loss": 0.0089, + "step": 684140 + }, + { + "epoch": 1.77, + "learning_rate": 3.39876769462467e-05, + "loss": 0.0068, + "step": 684150 + }, + { + "epoch": 1.77, + "learning_rate": 3.398378872987524e-05, + "loss": 0.0066, + "step": 684160 + }, + { + "epoch": 1.77, + "learning_rate": 3.397990051350377e-05, + "loss": 0.0065, + "step": 684170 + }, + { + "epoch": 1.77, + "learning_rate": 3.397601229713231e-05, + "loss": 0.0102, + "step": 684180 + }, + { + "epoch": 1.77, + "learning_rate": 3.397212408076084e-05, + "loss": 0.0089, + "step": 684190 + }, + { + "epoch": 1.77, + "learning_rate": 3.396823586438938e-05, + "loss": 0.0094, + "step": 684200 + }, + { + "epoch": 1.77, + "learning_rate": 3.396434764801791e-05, + "loss": 0.0076, + "step": 684210 + }, + { + "epoch": 1.77, + "learning_rate": 3.396045943164645e-05, + "loss": 0.0078, + "step": 684220 + }, + { + "epoch": 1.77, + "learning_rate": 3.395657121527498e-05, + "loss": 0.0054, + "step": 684230 + }, + { + "epoch": 1.77, + "learning_rate": 3.395268299890352e-05, + "loss": 0.0107, + "step": 684240 + }, + { + "epoch": 1.77, + "learning_rate": 3.394879478253205e-05, + "loss": 0.0068, + "step": 684250 + }, + { + "epoch": 1.77, + "learning_rate": 3.394490656616059e-05, + "loss": 0.007, + "step": 684260 + }, + { + "epoch": 1.77, + "learning_rate": 3.394101834978913e-05, + "loss": 0.0106, + "step": 684270 + }, + { + "epoch": 1.77, + "learning_rate": 3.393713013341766e-05, + "loss": 0.0083, + "step": 684280 + }, + { + "epoch": 1.77, + "learning_rate": 3.39332419170462e-05, + "loss": 0.0087, + "step": 684290 + }, + { + "epoch": 1.77, + "learning_rate": 3.392935370067473e-05, + "loss": 0.008, + "step": 684300 + }, + { + "epoch": 1.77, + "learning_rate": 3.392546548430327e-05, + "loss": 0.0069, + "step": 684310 + }, + { + "epoch": 1.77, + "learning_rate": 3.39215772679318e-05, + "loss": 0.0071, + "step": 684320 + }, + { + "epoch": 1.77, + "learning_rate": 3.391768905156034e-05, + "loss": 0.007, + "step": 684330 + }, + { + "epoch": 1.77, + "learning_rate": 3.391380083518887e-05, + "loss": 0.0099, + "step": 684340 + }, + { + "epoch": 1.77, + "learning_rate": 3.390991261881741e-05, + "loss": 0.0103, + "step": 684350 + }, + { + "epoch": 1.77, + "learning_rate": 3.390602440244594e-05, + "loss": 0.0067, + "step": 684360 + }, + { + "epoch": 1.77, + "learning_rate": 3.390213618607448e-05, + "loss": 0.0066, + "step": 684370 + }, + { + "epoch": 1.77, + "learning_rate": 3.389824796970301e-05, + "loss": 0.0077, + "step": 684380 + }, + { + "epoch": 1.77, + "learning_rate": 3.389435975333155e-05, + "loss": 0.0071, + "step": 684390 + }, + { + "epoch": 1.77, + "learning_rate": 3.389047153696009e-05, + "loss": 0.0126, + "step": 684400 + }, + { + "epoch": 1.77, + "learning_rate": 3.388658332058862e-05, + "loss": 0.0087, + "step": 684410 + }, + { + "epoch": 1.77, + "learning_rate": 3.388269510421716e-05, + "loss": 0.0082, + "step": 684420 + }, + { + "epoch": 1.77, + "learning_rate": 3.387880688784569e-05, + "loss": 0.0045, + "step": 684430 + }, + { + "epoch": 1.77, + "learning_rate": 3.387491867147423e-05, + "loss": 0.0087, + "step": 684440 + }, + { + "epoch": 1.77, + "learning_rate": 3.387103045510276e-05, + "loss": 0.0058, + "step": 684450 + }, + { + "epoch": 1.77, + "learning_rate": 3.38671422387313e-05, + "loss": 0.0083, + "step": 684460 + }, + { + "epoch": 1.77, + "learning_rate": 3.386325402235983e-05, + "loss": 0.0091, + "step": 684470 + }, + { + "epoch": 1.77, + "learning_rate": 3.385936580598837e-05, + "loss": 0.0069, + "step": 684480 + }, + { + "epoch": 1.77, + "learning_rate": 3.38554775896169e-05, + "loss": 0.0081, + "step": 684490 + }, + { + "epoch": 1.77, + "learning_rate": 3.385158937324544e-05, + "loss": 0.0085, + "step": 684500 + }, + { + "epoch": 1.77, + "learning_rate": 3.384770115687397e-05, + "loss": 0.0093, + "step": 684510 + }, + { + "epoch": 1.77, + "learning_rate": 3.384381294050251e-05, + "loss": 0.0067, + "step": 684520 + }, + { + "epoch": 1.77, + "learning_rate": 3.383992472413105e-05, + "loss": 0.0066, + "step": 684530 + }, + { + "epoch": 1.77, + "learning_rate": 3.383603650775958e-05, + "loss": 0.0057, + "step": 684540 + }, + { + "epoch": 1.77, + "learning_rate": 3.383214829138812e-05, + "loss": 0.0094, + "step": 684550 + }, + { + "epoch": 1.77, + "learning_rate": 3.382826007501665e-05, + "loss": 0.0065, + "step": 684560 + }, + { + "epoch": 1.77, + "learning_rate": 3.382437185864519e-05, + "loss": 0.0072, + "step": 684570 + }, + { + "epoch": 1.77, + "learning_rate": 3.382048364227372e-05, + "loss": 0.0081, + "step": 684580 + }, + { + "epoch": 1.77, + "learning_rate": 3.381659542590226e-05, + "loss": 0.0078, + "step": 684590 + }, + { + "epoch": 1.77, + "learning_rate": 3.381270720953079e-05, + "loss": 0.0073, + "step": 684600 + }, + { + "epoch": 1.77, + "learning_rate": 3.380881899315933e-05, + "loss": 0.0063, + "step": 684610 + }, + { + "epoch": 1.77, + "learning_rate": 3.380493077678786e-05, + "loss": 0.0065, + "step": 684620 + }, + { + "epoch": 1.77, + "learning_rate": 3.38010425604164e-05, + "loss": 0.0068, + "step": 684630 + }, + { + "epoch": 1.77, + "learning_rate": 3.379715434404493e-05, + "loss": 0.0075, + "step": 684640 + }, + { + "epoch": 1.77, + "learning_rate": 3.379326612767347e-05, + "loss": 0.0068, + "step": 684650 + }, + { + "epoch": 1.77, + "learning_rate": 3.378937791130201e-05, + "loss": 0.0079, + "step": 684660 + }, + { + "epoch": 1.77, + "learning_rate": 3.378548969493054e-05, + "loss": 0.0073, + "step": 684670 + }, + { + "epoch": 1.77, + "learning_rate": 3.378160147855908e-05, + "loss": 0.0065, + "step": 684680 + }, + { + "epoch": 1.77, + "learning_rate": 3.377771326218761e-05, + "loss": 0.0076, + "step": 684690 + }, + { + "epoch": 1.77, + "learning_rate": 3.377382504581615e-05, + "loss": 0.0045, + "step": 684700 + }, + { + "epoch": 1.77, + "learning_rate": 3.376993682944468e-05, + "loss": 0.0069, + "step": 684710 + }, + { + "epoch": 1.77, + "learning_rate": 3.376604861307322e-05, + "loss": 0.0082, + "step": 684720 + }, + { + "epoch": 1.77, + "learning_rate": 3.376216039670175e-05, + "loss": 0.0055, + "step": 684730 + }, + { + "epoch": 1.77, + "learning_rate": 3.375827218033029e-05, + "loss": 0.0073, + "step": 684740 + }, + { + "epoch": 1.77, + "learning_rate": 3.375438396395882e-05, + "loss": 0.0071, + "step": 684750 + }, + { + "epoch": 1.77, + "learning_rate": 3.375049574758736e-05, + "loss": 0.0106, + "step": 684760 + }, + { + "epoch": 1.78, + "learning_rate": 3.374660753121589e-05, + "loss": 0.0074, + "step": 684770 + }, + { + "epoch": 1.78, + "learning_rate": 3.374271931484443e-05, + "loss": 0.0081, + "step": 684780 + }, + { + "epoch": 1.78, + "learning_rate": 3.373883109847297e-05, + "loss": 0.0082, + "step": 684790 + }, + { + "epoch": 1.78, + "learning_rate": 3.37349428821015e-05, + "loss": 0.0077, + "step": 684800 + }, + { + "epoch": 1.78, + "learning_rate": 3.373105466573004e-05, + "loss": 0.0075, + "step": 684810 + }, + { + "epoch": 1.78, + "learning_rate": 3.372716644935857e-05, + "loss": 0.0068, + "step": 684820 + }, + { + "epoch": 1.78, + "learning_rate": 3.372327823298711e-05, + "loss": 0.0078, + "step": 684830 + }, + { + "epoch": 1.78, + "learning_rate": 3.371939001661564e-05, + "loss": 0.0083, + "step": 684840 + }, + { + "epoch": 1.78, + "learning_rate": 3.371550180024418e-05, + "loss": 0.0074, + "step": 684850 + }, + { + "epoch": 1.78, + "learning_rate": 3.371161358387271e-05, + "loss": 0.0074, + "step": 684860 + }, + { + "epoch": 1.78, + "learning_rate": 3.370772536750125e-05, + "loss": 0.0107, + "step": 684870 + }, + { + "epoch": 1.78, + "learning_rate": 3.370383715112978e-05, + "loss": 0.0078, + "step": 684880 + }, + { + "epoch": 1.78, + "learning_rate": 3.369994893475832e-05, + "loss": 0.0069, + "step": 684890 + }, + { + "epoch": 1.78, + "learning_rate": 3.369606071838685e-05, + "loss": 0.0073, + "step": 684900 + }, + { + "epoch": 1.78, + "learning_rate": 3.369217250201539e-05, + "loss": 0.008, + "step": 684910 + }, + { + "epoch": 1.78, + "learning_rate": 3.368828428564393e-05, + "loss": 0.0061, + "step": 684920 + }, + { + "epoch": 1.78, + "learning_rate": 3.368439606927246e-05, + "loss": 0.0072, + "step": 684930 + }, + { + "epoch": 1.78, + "learning_rate": 3.3680507852901e-05, + "loss": 0.0075, + "step": 684940 + }, + { + "epoch": 1.78, + "learning_rate": 3.367661963652953e-05, + "loss": 0.0099, + "step": 684950 + }, + { + "epoch": 1.78, + "learning_rate": 3.367273142015807e-05, + "loss": 0.0072, + "step": 684960 + }, + { + "epoch": 1.78, + "learning_rate": 3.36688432037866e-05, + "loss": 0.0065, + "step": 684970 + }, + { + "epoch": 1.78, + "learning_rate": 3.366495498741514e-05, + "loss": 0.0092, + "step": 684980 + }, + { + "epoch": 1.78, + "learning_rate": 3.366106677104367e-05, + "loss": 0.0129, + "step": 684990 + }, + { + "epoch": 1.78, + "learning_rate": 3.365717855467221e-05, + "loss": 0.0097, + "step": 685000 + }, + { + "epoch": 1.78, + "eval_cer": 0.881688689953826, + "eval_loss": 0.004874881356954575, + "eval_runtime": 107.9053, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, + "step": 685000 + }, + { + "epoch": 1.78, + "learning_rate": 3.365329033830074e-05, + "loss": 0.0082, + "step": 685010 + }, + { + "epoch": 1.78, + "learning_rate": 3.364940212192928e-05, + "loss": 0.0099, + "step": 685020 + }, + { + "epoch": 1.78, + "learning_rate": 3.364551390555781e-05, + "loss": 0.0086, + "step": 685030 + }, + { + "epoch": 1.78, + "learning_rate": 3.364162568918635e-05, + "loss": 0.0072, + "step": 685040 + }, + { + "epoch": 1.78, + "learning_rate": 3.363773747281489e-05, + "loss": 0.0082, + "step": 685050 + }, + { + "epoch": 1.78, + "learning_rate": 3.363384925644342e-05, + "loss": 0.0096, + "step": 685060 + }, + { + "epoch": 1.78, + "learning_rate": 3.362996104007196e-05, + "loss": 0.0063, + "step": 685070 + }, + { + "epoch": 1.78, + "learning_rate": 3.362607282370049e-05, + "loss": 0.0074, + "step": 685080 + }, + { + "epoch": 1.78, + "learning_rate": 3.362218460732902e-05, + "loss": 0.0078, + "step": 685090 + }, + { + "epoch": 1.78, + "learning_rate": 3.361829639095756e-05, + "loss": 0.0064, + "step": 685100 + }, + { + "epoch": 1.78, + "learning_rate": 3.36144081745861e-05, + "loss": 0.0073, + "step": 685110 + }, + { + "epoch": 1.78, + "learning_rate": 3.361051995821463e-05, + "loss": 0.0066, + "step": 685120 + }, + { + "epoch": 1.78, + "learning_rate": 3.360663174184317e-05, + "loss": 0.0082, + "step": 685130 + }, + { + "epoch": 1.78, + "learning_rate": 3.36027435254717e-05, + "loss": 0.0118, + "step": 685140 + }, + { + "epoch": 1.78, + "learning_rate": 3.359885530910024e-05, + "loss": 0.0082, + "step": 685150 + }, + { + "epoch": 1.78, + "learning_rate": 3.359496709272877e-05, + "loss": 0.0077, + "step": 685160 + }, + { + "epoch": 1.78, + "learning_rate": 3.359107887635731e-05, + "loss": 0.0081, + "step": 685170 + }, + { + "epoch": 1.78, + "learning_rate": 3.358719065998585e-05, + "loss": 0.0075, + "step": 685180 + }, + { + "epoch": 1.78, + "learning_rate": 3.358330244361438e-05, + "loss": 0.0071, + "step": 685190 + }, + { + "epoch": 1.78, + "learning_rate": 3.357941422724292e-05, + "loss": 0.0069, + "step": 685200 + }, + { + "epoch": 1.78, + "learning_rate": 3.3575526010871446e-05, + "loss": 0.009, + "step": 685210 + }, + { + "epoch": 1.78, + "learning_rate": 3.357163779449998e-05, + "loss": 0.0065, + "step": 685220 + }, + { + "epoch": 1.78, + "learning_rate": 3.356774957812852e-05, + "loss": 0.0049, + "step": 685230 + }, + { + "epoch": 1.78, + "learning_rate": 3.356386136175706e-05, + "loss": 0.0079, + "step": 685240 + }, + { + "epoch": 1.78, + "learning_rate": 3.355997314538559e-05, + "loss": 0.0082, + "step": 685250 + }, + { + "epoch": 1.78, + "learning_rate": 3.355608492901413e-05, + "loss": 0.0107, + "step": 685260 + }, + { + "epoch": 1.78, + "learning_rate": 3.355219671264266e-05, + "loss": 0.0074, + "step": 685270 + }, + { + "epoch": 1.78, + "learning_rate": 3.35483084962712e-05, + "loss": 0.0079, + "step": 685280 + }, + { + "epoch": 1.78, + "learning_rate": 3.354442027989973e-05, + "loss": 0.008, + "step": 685290 + }, + { + "epoch": 1.78, + "learning_rate": 3.3540532063528267e-05, + "loss": 0.0106, + "step": 685300 + }, + { + "epoch": 1.78, + "learning_rate": 3.353664384715681e-05, + "loss": 0.007, + "step": 685310 + }, + { + "epoch": 1.78, + "learning_rate": 3.353275563078534e-05, + "loss": 0.0063, + "step": 685320 + }, + { + "epoch": 1.78, + "learning_rate": 3.352886741441388e-05, + "loss": 0.0116, + "step": 685330 + }, + { + "epoch": 1.78, + "learning_rate": 3.3524979198042406e-05, + "loss": 0.0076, + "step": 685340 + }, + { + "epoch": 1.78, + "learning_rate": 3.352109098167094e-05, + "loss": 0.0101, + "step": 685350 + }, + { + "epoch": 1.78, + "learning_rate": 3.351720276529948e-05, + "loss": 0.0061, + "step": 685360 + }, + { + "epoch": 1.78, + "learning_rate": 3.351331454892802e-05, + "loss": 0.0079, + "step": 685370 + }, + { + "epoch": 1.78, + "learning_rate": 3.350942633255655e-05, + "loss": 0.0092, + "step": 685380 + }, + { + "epoch": 1.78, + "learning_rate": 3.350553811618509e-05, + "loss": 0.0097, + "step": 685390 + }, + { + "epoch": 1.78, + "learning_rate": 3.350164989981362e-05, + "loss": 0.0135, + "step": 685400 + }, + { + "epoch": 1.78, + "learning_rate": 3.349776168344216e-05, + "loss": 0.0074, + "step": 685410 + }, + { + "epoch": 1.78, + "learning_rate": 3.349387346707069e-05, + "loss": 0.0075, + "step": 685420 + }, + { + "epoch": 1.78, + "learning_rate": 3.3489985250699227e-05, + "loss": 0.0089, + "step": 685430 + }, + { + "epoch": 1.78, + "learning_rate": 3.348609703432777e-05, + "loss": 0.0082, + "step": 685440 + }, + { + "epoch": 1.78, + "learning_rate": 3.34822088179563e-05, + "loss": 0.0054, + "step": 685450 + }, + { + "epoch": 1.78, + "learning_rate": 3.347832060158483e-05, + "loss": 0.0064, + "step": 685460 + }, + { + "epoch": 1.78, + "learning_rate": 3.3474432385213366e-05, + "loss": 0.0065, + "step": 685470 + }, + { + "epoch": 1.78, + "learning_rate": 3.34705441688419e-05, + "loss": 0.0103, + "step": 685480 + }, + { + "epoch": 1.78, + "learning_rate": 3.346665595247044e-05, + "loss": 0.0104, + "step": 685490 + }, + { + "epoch": 1.78, + "learning_rate": 3.346276773609898e-05, + "loss": 0.0078, + "step": 685500 + }, + { + "epoch": 1.78, + "learning_rate": 3.345887951972751e-05, + "loss": 0.0073, + "step": 685510 + }, + { + "epoch": 1.78, + "learning_rate": 3.345499130335605e-05, + "loss": 0.0074, + "step": 685520 + }, + { + "epoch": 1.78, + "learning_rate": 3.345110308698458e-05, + "loss": 0.0078, + "step": 685530 + }, + { + "epoch": 1.78, + "learning_rate": 3.344721487061312e-05, + "loss": 0.0063, + "step": 685540 + }, + { + "epoch": 1.78, + "learning_rate": 3.344332665424165e-05, + "loss": 0.0123, + "step": 685550 + }, + { + "epoch": 1.78, + "learning_rate": 3.3439438437870187e-05, + "loss": 0.0067, + "step": 685560 + }, + { + "epoch": 1.78, + "learning_rate": 3.343555022149872e-05, + "loss": 0.0095, + "step": 685570 + }, + { + "epoch": 1.78, + "learning_rate": 3.343166200512726e-05, + "loss": 0.0071, + "step": 685580 + }, + { + "epoch": 1.78, + "learning_rate": 3.342777378875579e-05, + "loss": 0.0072, + "step": 685590 + }, + { + "epoch": 1.78, + "learning_rate": 3.3423885572384326e-05, + "loss": 0.0056, + "step": 685600 + }, + { + "epoch": 1.78, + "learning_rate": 3.341999735601286e-05, + "loss": 0.0069, + "step": 685610 + }, + { + "epoch": 1.78, + "learning_rate": 3.3416109139641396e-05, + "loss": 0.008, + "step": 685620 + }, + { + "epoch": 1.78, + "learning_rate": 3.341222092326994e-05, + "loss": 0.0076, + "step": 685630 + }, + { + "epoch": 1.78, + "learning_rate": 3.340833270689847e-05, + "loss": 0.0088, + "step": 685640 + }, + { + "epoch": 1.78, + "learning_rate": 3.340444449052701e-05, + "loss": 0.0096, + "step": 685650 + }, + { + "epoch": 1.78, + "learning_rate": 3.340055627415554e-05, + "loss": 0.0053, + "step": 685660 + }, + { + "epoch": 1.78, + "learning_rate": 3.339666805778408e-05, + "loss": 0.0078, + "step": 685670 + }, + { + "epoch": 1.78, + "learning_rate": 3.339277984141261e-05, + "loss": 0.0074, + "step": 685680 + }, + { + "epoch": 1.78, + "learning_rate": 3.3388891625041147e-05, + "loss": 0.0085, + "step": 685690 + }, + { + "epoch": 1.78, + "learning_rate": 3.338500340866968e-05, + "loss": 0.0078, + "step": 685700 + }, + { + "epoch": 1.78, + "learning_rate": 3.3381115192298216e-05, + "loss": 0.011, + "step": 685710 + }, + { + "epoch": 1.78, + "learning_rate": 3.337722697592675e-05, + "loss": 0.009, + "step": 685720 + }, + { + "epoch": 1.78, + "learning_rate": 3.3373338759555286e-05, + "loss": 0.0065, + "step": 685730 + }, + { + "epoch": 1.78, + "learning_rate": 3.336945054318382e-05, + "loss": 0.0064, + "step": 685740 + }, + { + "epoch": 1.78, + "learning_rate": 3.3365562326812356e-05, + "loss": 0.0059, + "step": 685750 + }, + { + "epoch": 1.78, + "learning_rate": 3.33616741104409e-05, + "loss": 0.0058, + "step": 685760 + }, + { + "epoch": 1.78, + "learning_rate": 3.335778589406943e-05, + "loss": 0.0075, + "step": 685770 + }, + { + "epoch": 1.78, + "learning_rate": 3.335389767769797e-05, + "loss": 0.0057, + "step": 685780 + }, + { + "epoch": 1.78, + "learning_rate": 3.33500094613265e-05, + "loss": 0.0085, + "step": 685790 + }, + { + "epoch": 1.78, + "learning_rate": 3.334612124495504e-05, + "loss": 0.0078, + "step": 685800 + }, + { + "epoch": 1.78, + "learning_rate": 3.334223302858357e-05, + "loss": 0.0054, + "step": 685810 + }, + { + "epoch": 1.78, + "learning_rate": 3.3338344812212106e-05, + "loss": 0.0112, + "step": 685820 + }, + { + "epoch": 1.78, + "learning_rate": 3.333445659584064e-05, + "loss": 0.0086, + "step": 685830 + }, + { + "epoch": 1.78, + "learning_rate": 3.3330568379469176e-05, + "loss": 0.0119, + "step": 685840 + }, + { + "epoch": 1.78, + "learning_rate": 3.332668016309771e-05, + "loss": 0.0054, + "step": 685850 + }, + { + "epoch": 1.78, + "learning_rate": 3.3322791946726246e-05, + "loss": 0.0076, + "step": 685860 + }, + { + "epoch": 1.78, + "learning_rate": 3.331890373035478e-05, + "loss": 0.009, + "step": 685870 + }, + { + "epoch": 1.78, + "learning_rate": 3.3315015513983316e-05, + "loss": 0.0089, + "step": 685880 + }, + { + "epoch": 1.78, + "learning_rate": 3.331112729761186e-05, + "loss": 0.0068, + "step": 685890 + }, + { + "epoch": 1.78, + "learning_rate": 3.330723908124039e-05, + "loss": 0.0081, + "step": 685900 + }, + { + "epoch": 1.78, + "learning_rate": 3.330335086486893e-05, + "loss": 0.009, + "step": 685910 + }, + { + "epoch": 1.78, + "learning_rate": 3.329946264849746e-05, + "loss": 0.0084, + "step": 685920 + }, + { + "epoch": 1.78, + "learning_rate": 3.3295574432126e-05, + "loss": 0.0084, + "step": 685930 + }, + { + "epoch": 1.78, + "learning_rate": 3.329168621575453e-05, + "loss": 0.0112, + "step": 685940 + }, + { + "epoch": 1.78, + "learning_rate": 3.3287797999383066e-05, + "loss": 0.008, + "step": 685950 + }, + { + "epoch": 1.78, + "learning_rate": 3.32839097830116e-05, + "loss": 0.005, + "step": 685960 + }, + { + "epoch": 1.78, + "learning_rate": 3.3280021566640136e-05, + "loss": 0.0063, + "step": 685970 + }, + { + "epoch": 1.78, + "learning_rate": 3.327613335026867e-05, + "loss": 0.0068, + "step": 685980 + }, + { + "epoch": 1.78, + "learning_rate": 3.3272245133897206e-05, + "loss": 0.0093, + "step": 685990 + }, + { + "epoch": 1.78, + "learning_rate": 3.326835691752574e-05, + "loss": 0.0074, + "step": 686000 + }, + { + "epoch": 1.78, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.004924887791275978, + "eval_runtime": 107.9307, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, + "step": 686000 + }, + { + "epoch": 1.78, + "learning_rate": 3.3264468701154276e-05, + "loss": 0.0065, + "step": 686010 + }, + { + "epoch": 1.78, + "learning_rate": 3.326058048478282e-05, + "loss": 0.0071, + "step": 686020 + }, + { + "epoch": 1.78, + "learning_rate": 3.325669226841135e-05, + "loss": 0.0117, + "step": 686030 + }, + { + "epoch": 1.78, + "learning_rate": 3.325280405203989e-05, + "loss": 0.0079, + "step": 686040 + }, + { + "epoch": 1.78, + "learning_rate": 3.324891583566842e-05, + "loss": 0.0103, + "step": 686050 + }, + { + "epoch": 1.78, + "learning_rate": 3.324502761929696e-05, + "loss": 0.0077, + "step": 686060 + }, + { + "epoch": 1.78, + "learning_rate": 3.324113940292549e-05, + "loss": 0.007, + "step": 686070 + }, + { + "epoch": 1.78, + "learning_rate": 3.3237251186554026e-05, + "loss": 0.0069, + "step": 686080 + }, + { + "epoch": 1.78, + "learning_rate": 3.323336297018256e-05, + "loss": 0.01, + "step": 686090 + }, + { + "epoch": 1.78, + "learning_rate": 3.3229474753811096e-05, + "loss": 0.0075, + "step": 686100 + }, + { + "epoch": 1.78, + "learning_rate": 3.322558653743963e-05, + "loss": 0.0079, + "step": 686110 + }, + { + "epoch": 1.78, + "learning_rate": 3.3221698321068166e-05, + "loss": 0.0097, + "step": 686120 + }, + { + "epoch": 1.78, + "learning_rate": 3.32178101046967e-05, + "loss": 0.0054, + "step": 686130 + }, + { + "epoch": 1.78, + "learning_rate": 3.3213921888325236e-05, + "loss": 0.006, + "step": 686140 + }, + { + "epoch": 1.78, + "learning_rate": 3.321003367195378e-05, + "loss": 0.006, + "step": 686150 + }, + { + "epoch": 1.78, + "learning_rate": 3.320614545558231e-05, + "loss": 0.0096, + "step": 686160 + }, + { + "epoch": 1.78, + "learning_rate": 3.320225723921085e-05, + "loss": 0.0086, + "step": 686170 + }, + { + "epoch": 1.78, + "learning_rate": 3.319836902283938e-05, + "loss": 0.007, + "step": 686180 + }, + { + "epoch": 1.78, + "learning_rate": 3.319448080646792e-05, + "loss": 0.0061, + "step": 686190 + }, + { + "epoch": 1.78, + "learning_rate": 3.319059259009645e-05, + "loss": 0.0064, + "step": 686200 + }, + { + "epoch": 1.78, + "learning_rate": 3.3186704373724986e-05, + "loss": 0.007, + "step": 686210 + }, + { + "epoch": 1.78, + "learning_rate": 3.318281615735352e-05, + "loss": 0.0076, + "step": 686220 + }, + { + "epoch": 1.78, + "learning_rate": 3.3178927940982056e-05, + "loss": 0.0054, + "step": 686230 + }, + { + "epoch": 1.78, + "learning_rate": 3.317503972461059e-05, + "loss": 0.0098, + "step": 686240 + }, + { + "epoch": 1.78, + "learning_rate": 3.3171151508239126e-05, + "loss": 0.0072, + "step": 686250 + }, + { + "epoch": 1.78, + "learning_rate": 3.316726329186766e-05, + "loss": 0.0095, + "step": 686260 + }, + { + "epoch": 1.78, + "learning_rate": 3.3163375075496196e-05, + "loss": 0.0084, + "step": 686270 + }, + { + "epoch": 1.78, + "learning_rate": 3.315948685912474e-05, + "loss": 0.0067, + "step": 686280 + }, + { + "epoch": 1.78, + "learning_rate": 3.315559864275327e-05, + "loss": 0.0081, + "step": 686290 + }, + { + "epoch": 1.78, + "learning_rate": 3.315171042638181e-05, + "loss": 0.0062, + "step": 686300 + }, + { + "epoch": 1.78, + "learning_rate": 3.314782221001034e-05, + "loss": 0.0089, + "step": 686310 + }, + { + "epoch": 1.78, + "learning_rate": 3.314393399363888e-05, + "loss": 0.0078, + "step": 686320 + }, + { + "epoch": 1.78, + "learning_rate": 3.314004577726741e-05, + "loss": 0.0072, + "step": 686330 + }, + { + "epoch": 1.78, + "learning_rate": 3.3136157560895946e-05, + "loss": 0.0149, + "step": 686340 + }, + { + "epoch": 1.78, + "learning_rate": 3.313226934452448e-05, + "loss": 0.0058, + "step": 686350 + }, + { + "epoch": 1.78, + "learning_rate": 3.3128381128153016e-05, + "loss": 0.0061, + "step": 686360 + }, + { + "epoch": 1.78, + "learning_rate": 3.312449291178155e-05, + "loss": 0.0052, + "step": 686370 + }, + { + "epoch": 1.78, + "learning_rate": 3.3120604695410086e-05, + "loss": 0.0069, + "step": 686380 + }, + { + "epoch": 1.78, + "learning_rate": 3.311671647903862e-05, + "loss": 0.0063, + "step": 686390 + }, + { + "epoch": 1.78, + "learning_rate": 3.3112828262667156e-05, + "loss": 0.006, + "step": 686400 + }, + { + "epoch": 1.78, + "learning_rate": 3.31089400462957e-05, + "loss": 0.0077, + "step": 686410 + }, + { + "epoch": 1.78, + "learning_rate": 3.310505182992423e-05, + "loss": 0.0067, + "step": 686420 + }, + { + "epoch": 1.78, + "learning_rate": 3.310116361355277e-05, + "loss": 0.0083, + "step": 686430 + }, + { + "epoch": 1.78, + "learning_rate": 3.30972753971813e-05, + "loss": 0.0084, + "step": 686440 + }, + { + "epoch": 1.78, + "learning_rate": 3.309338718080983e-05, + "loss": 0.0084, + "step": 686450 + }, + { + "epoch": 1.78, + "learning_rate": 3.308949896443837e-05, + "loss": 0.0071, + "step": 686460 + }, + { + "epoch": 1.78, + "learning_rate": 3.3085610748066906e-05, + "loss": 0.0061, + "step": 686470 + }, + { + "epoch": 1.78, + "learning_rate": 3.308172253169544e-05, + "loss": 0.0068, + "step": 686480 + }, + { + "epoch": 1.78, + "learning_rate": 3.3077834315323976e-05, + "loss": 0.0073, + "step": 686490 + }, + { + "epoch": 1.78, + "learning_rate": 3.307394609895251e-05, + "loss": 0.0066, + "step": 686500 + }, + { + "epoch": 1.78, + "learning_rate": 3.3070057882581046e-05, + "loss": 0.0073, + "step": 686510 + }, + { + "epoch": 1.78, + "learning_rate": 3.306616966620958e-05, + "loss": 0.0071, + "step": 686520 + }, + { + "epoch": 1.78, + "learning_rate": 3.3062281449838116e-05, + "loss": 0.0081, + "step": 686530 + }, + { + "epoch": 1.78, + "learning_rate": 3.305839323346666e-05, + "loss": 0.0059, + "step": 686540 + }, + { + "epoch": 1.78, + "learning_rate": 3.305450501709519e-05, + "loss": 0.0088, + "step": 686550 + }, + { + "epoch": 1.78, + "learning_rate": 3.305061680072373e-05, + "loss": 0.0073, + "step": 686560 + }, + { + "epoch": 1.78, + "learning_rate": 3.304672858435226e-05, + "loss": 0.007, + "step": 686570 + }, + { + "epoch": 1.78, + "learning_rate": 3.304284036798079e-05, + "loss": 0.0077, + "step": 686580 + }, + { + "epoch": 1.78, + "learning_rate": 3.303895215160933e-05, + "loss": 0.007, + "step": 686590 + }, + { + "epoch": 1.78, + "learning_rate": 3.3035063935237866e-05, + "loss": 0.0062, + "step": 686600 + }, + { + "epoch": 1.78, + "learning_rate": 3.30311757188664e-05, + "loss": 0.0061, + "step": 686610 + }, + { + "epoch": 1.78, + "learning_rate": 3.3027287502494936e-05, + "loss": 0.0065, + "step": 686620 + }, + { + "epoch": 1.78, + "learning_rate": 3.302339928612347e-05, + "loss": 0.0089, + "step": 686630 + }, + { + "epoch": 1.78, + "learning_rate": 3.3019511069752006e-05, + "loss": 0.0064, + "step": 686640 + }, + { + "epoch": 1.78, + "learning_rate": 3.301562285338054e-05, + "loss": 0.007, + "step": 686650 + }, + { + "epoch": 1.78, + "learning_rate": 3.3011734637009076e-05, + "loss": 0.0065, + "step": 686660 + }, + { + "epoch": 1.78, + "learning_rate": 3.300784642063762e-05, + "loss": 0.0094, + "step": 686670 + }, + { + "epoch": 1.78, + "learning_rate": 3.300395820426615e-05, + "loss": 0.0074, + "step": 686680 + }, + { + "epoch": 1.78, + "learning_rate": 3.300006998789469e-05, + "loss": 0.0065, + "step": 686690 + }, + { + "epoch": 1.78, + "learning_rate": 3.2996181771523215e-05, + "loss": 0.0083, + "step": 686700 + }, + { + "epoch": 1.78, + "learning_rate": 3.299229355515175e-05, + "loss": 0.0064, + "step": 686710 + }, + { + "epoch": 1.78, + "learning_rate": 3.298840533878029e-05, + "loss": 0.0078, + "step": 686720 + }, + { + "epoch": 1.78, + "learning_rate": 3.2984517122408826e-05, + "loss": 0.0113, + "step": 686730 + }, + { + "epoch": 1.78, + "learning_rate": 3.298062890603736e-05, + "loss": 0.005, + "step": 686740 + }, + { + "epoch": 1.78, + "learning_rate": 3.2976740689665896e-05, + "loss": 0.0062, + "step": 686750 + }, + { + "epoch": 1.78, + "learning_rate": 3.297285247329443e-05, + "loss": 0.0065, + "step": 686760 + }, + { + "epoch": 1.78, + "learning_rate": 3.2968964256922966e-05, + "loss": 0.0071, + "step": 686770 + }, + { + "epoch": 1.78, + "learning_rate": 3.29650760405515e-05, + "loss": 0.0081, + "step": 686780 + }, + { + "epoch": 1.78, + "learning_rate": 3.2961187824180035e-05, + "loss": 0.0058, + "step": 686790 + }, + { + "epoch": 1.78, + "learning_rate": 3.295729960780858e-05, + "loss": 0.0089, + "step": 686800 + }, + { + "epoch": 1.78, + "learning_rate": 3.295341139143711e-05, + "loss": 0.0082, + "step": 686810 + }, + { + "epoch": 1.78, + "learning_rate": 3.294952317506565e-05, + "loss": 0.0064, + "step": 686820 + }, + { + "epoch": 1.78, + "learning_rate": 3.2945634958694175e-05, + "loss": 0.0067, + "step": 686830 + }, + { + "epoch": 1.78, + "learning_rate": 3.294174674232271e-05, + "loss": 0.0055, + "step": 686840 + }, + { + "epoch": 1.78, + "learning_rate": 3.293785852595125e-05, + "loss": 0.0109, + "step": 686850 + }, + { + "epoch": 1.78, + "learning_rate": 3.2933970309579786e-05, + "loss": 0.0075, + "step": 686860 + }, + { + "epoch": 1.78, + "learning_rate": 3.293008209320832e-05, + "loss": 0.0083, + "step": 686870 + }, + { + "epoch": 1.78, + "learning_rate": 3.2926193876836856e-05, + "loss": 0.008, + "step": 686880 + }, + { + "epoch": 1.78, + "learning_rate": 3.292230566046539e-05, + "loss": 0.0085, + "step": 686890 + }, + { + "epoch": 1.78, + "learning_rate": 3.2918417444093926e-05, + "loss": 0.0095, + "step": 686900 + }, + { + "epoch": 1.78, + "learning_rate": 3.291452922772246e-05, + "loss": 0.0082, + "step": 686910 + }, + { + "epoch": 1.78, + "learning_rate": 3.2910641011350995e-05, + "loss": 0.0086, + "step": 686920 + }, + { + "epoch": 1.78, + "learning_rate": 3.290675279497953e-05, + "loss": 0.0103, + "step": 686930 + }, + { + "epoch": 1.78, + "learning_rate": 3.290286457860807e-05, + "loss": 0.0084, + "step": 686940 + }, + { + "epoch": 1.78, + "learning_rate": 3.28989763622366e-05, + "loss": 0.0093, + "step": 686950 + }, + { + "epoch": 1.78, + "learning_rate": 3.2895088145865135e-05, + "loss": 0.0084, + "step": 686960 + }, + { + "epoch": 1.78, + "learning_rate": 3.289119992949367e-05, + "loss": 0.0088, + "step": 686970 + }, + { + "epoch": 1.78, + "learning_rate": 3.2887311713122205e-05, + "loss": 0.0093, + "step": 686980 + }, + { + "epoch": 1.78, + "learning_rate": 3.2883423496750746e-05, + "loss": 0.0066, + "step": 686990 + }, + { + "epoch": 1.78, + "learning_rate": 3.287953528037928e-05, + "loss": 0.0064, + "step": 687000 + }, + { + "epoch": 1.78, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004868320655077696, + "eval_runtime": 107.8854, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.635, + "step": 687000 + }, + { + "epoch": 1.78, + "learning_rate": 3.2875647064007816e-05, + "loss": 0.0093, + "step": 687010 + }, + { + "epoch": 1.78, + "learning_rate": 3.287175884763635e-05, + "loss": 0.0051, + "step": 687020 + }, + { + "epoch": 1.78, + "learning_rate": 3.2867870631264886e-05, + "loss": 0.0068, + "step": 687030 + }, + { + "epoch": 1.78, + "learning_rate": 3.286398241489342e-05, + "loss": 0.0066, + "step": 687040 + }, + { + "epoch": 1.78, + "learning_rate": 3.2860094198521955e-05, + "loss": 0.0083, + "step": 687050 + }, + { + "epoch": 1.78, + "learning_rate": 3.285620598215049e-05, + "loss": 0.0089, + "step": 687060 + }, + { + "epoch": 1.78, + "learning_rate": 3.2852317765779025e-05, + "loss": 0.0077, + "step": 687070 + }, + { + "epoch": 1.78, + "learning_rate": 3.284842954940756e-05, + "loss": 0.0076, + "step": 687080 + }, + { + "epoch": 1.78, + "learning_rate": 3.2844541333036095e-05, + "loss": 0.0122, + "step": 687090 + }, + { + "epoch": 1.78, + "learning_rate": 3.284065311666463e-05, + "loss": 0.0073, + "step": 687100 + }, + { + "epoch": 1.78, + "learning_rate": 3.2836764900293165e-05, + "loss": 0.0101, + "step": 687110 + }, + { + "epoch": 1.78, + "learning_rate": 3.2832876683921706e-05, + "loss": 0.0085, + "step": 687120 + }, + { + "epoch": 1.78, + "learning_rate": 3.282898846755024e-05, + "loss": 0.0078, + "step": 687130 + }, + { + "epoch": 1.78, + "learning_rate": 3.2825100251178776e-05, + "loss": 0.0062, + "step": 687140 + }, + { + "epoch": 1.78, + "learning_rate": 3.282121203480731e-05, + "loss": 0.0093, + "step": 687150 + }, + { + "epoch": 1.78, + "learning_rate": 3.2817323818435846e-05, + "loss": 0.0081, + "step": 687160 + }, + { + "epoch": 1.78, + "learning_rate": 3.281343560206438e-05, + "loss": 0.0061, + "step": 687170 + }, + { + "epoch": 1.78, + "learning_rate": 3.2809547385692915e-05, + "loss": 0.0075, + "step": 687180 + }, + { + "epoch": 1.78, + "learning_rate": 3.280565916932145e-05, + "loss": 0.0095, + "step": 687190 + }, + { + "epoch": 1.78, + "learning_rate": 3.2801770952949985e-05, + "loss": 0.0086, + "step": 687200 + }, + { + "epoch": 1.78, + "learning_rate": 3.279788273657852e-05, + "loss": 0.008, + "step": 687210 + }, + { + "epoch": 1.78, + "learning_rate": 3.2793994520207055e-05, + "loss": 0.007, + "step": 687220 + }, + { + "epoch": 1.78, + "learning_rate": 3.279010630383559e-05, + "loss": 0.0073, + "step": 687230 + }, + { + "epoch": 1.78, + "learning_rate": 3.2786218087464125e-05, + "loss": 0.0079, + "step": 687240 + }, + { + "epoch": 1.78, + "learning_rate": 3.2782329871092666e-05, + "loss": 0.0058, + "step": 687250 + }, + { + "epoch": 1.78, + "learning_rate": 3.27784416547212e-05, + "loss": 0.0062, + "step": 687260 + }, + { + "epoch": 1.78, + "learning_rate": 3.2774553438349736e-05, + "loss": 0.0112, + "step": 687270 + }, + { + "epoch": 1.78, + "learning_rate": 3.277066522197827e-05, + "loss": 0.0095, + "step": 687280 + }, + { + "epoch": 1.78, + "learning_rate": 3.2766777005606806e-05, + "loss": 0.0077, + "step": 687290 + }, + { + "epoch": 1.78, + "learning_rate": 3.276288878923534e-05, + "loss": 0.0064, + "step": 687300 + }, + { + "epoch": 1.78, + "learning_rate": 3.2759000572863875e-05, + "loss": 0.0066, + "step": 687310 + }, + { + "epoch": 1.78, + "learning_rate": 3.275511235649241e-05, + "loss": 0.0082, + "step": 687320 + }, + { + "epoch": 1.78, + "learning_rate": 3.2751224140120945e-05, + "loss": 0.0075, + "step": 687330 + }, + { + "epoch": 1.78, + "learning_rate": 3.274733592374948e-05, + "loss": 0.006, + "step": 687340 + }, + { + "epoch": 1.78, + "learning_rate": 3.2743447707378015e-05, + "loss": 0.0073, + "step": 687350 + }, + { + "epoch": 1.78, + "learning_rate": 3.273955949100655e-05, + "loss": 0.0064, + "step": 687360 + }, + { + "epoch": 1.78, + "learning_rate": 3.2735671274635085e-05, + "loss": 0.0082, + "step": 687370 + }, + { + "epoch": 1.78, + "learning_rate": 3.2731783058263626e-05, + "loss": 0.0063, + "step": 687380 + }, + { + "epoch": 1.78, + "learning_rate": 3.272789484189216e-05, + "loss": 0.0056, + "step": 687390 + }, + { + "epoch": 1.78, + "learning_rate": 3.2724006625520696e-05, + "loss": 0.0104, + "step": 687400 + }, + { + "epoch": 1.78, + "learning_rate": 3.272011840914923e-05, + "loss": 0.0094, + "step": 687410 + }, + { + "epoch": 1.78, + "learning_rate": 3.2716230192777766e-05, + "loss": 0.0103, + "step": 687420 + }, + { + "epoch": 1.78, + "learning_rate": 3.27123419764063e-05, + "loss": 0.008, + "step": 687430 + }, + { + "epoch": 1.78, + "learning_rate": 3.2708453760034835e-05, + "loss": 0.0074, + "step": 687440 + }, + { + "epoch": 1.78, + "learning_rate": 3.270456554366337e-05, + "loss": 0.0057, + "step": 687450 + }, + { + "epoch": 1.78, + "learning_rate": 3.2700677327291905e-05, + "loss": 0.0078, + "step": 687460 + }, + { + "epoch": 1.78, + "learning_rate": 3.269678911092044e-05, + "loss": 0.0078, + "step": 687470 + }, + { + "epoch": 1.78, + "learning_rate": 3.2692900894548975e-05, + "loss": 0.0104, + "step": 687480 + }, + { + "epoch": 1.78, + "learning_rate": 3.268901267817751e-05, + "loss": 0.0094, + "step": 687490 + }, + { + "epoch": 1.78, + "learning_rate": 3.2685124461806045e-05, + "loss": 0.008, + "step": 687500 + }, + { + "epoch": 1.78, + "learning_rate": 3.2681236245434586e-05, + "loss": 0.0078, + "step": 687510 + }, + { + "epoch": 1.78, + "learning_rate": 3.267734802906312e-05, + "loss": 0.0076, + "step": 687520 + }, + { + "epoch": 1.78, + "learning_rate": 3.2673459812691656e-05, + "loss": 0.007, + "step": 687530 + }, + { + "epoch": 1.78, + "learning_rate": 3.266957159632019e-05, + "loss": 0.0082, + "step": 687540 + }, + { + "epoch": 1.78, + "learning_rate": 3.2665683379948726e-05, + "loss": 0.0063, + "step": 687550 + }, + { + "epoch": 1.78, + "learning_rate": 3.266179516357726e-05, + "loss": 0.006, + "step": 687560 + }, + { + "epoch": 1.78, + "learning_rate": 3.2657906947205795e-05, + "loss": 0.0081, + "step": 687570 + }, + { + "epoch": 1.78, + "learning_rate": 3.265401873083433e-05, + "loss": 0.009, + "step": 687580 + }, + { + "epoch": 1.78, + "learning_rate": 3.2650130514462865e-05, + "loss": 0.008, + "step": 687590 + }, + { + "epoch": 1.78, + "learning_rate": 3.26462422980914e-05, + "loss": 0.0057, + "step": 687600 + }, + { + "epoch": 1.78, + "learning_rate": 3.2642354081719935e-05, + "loss": 0.0083, + "step": 687610 + }, + { + "epoch": 1.78, + "learning_rate": 3.263846586534847e-05, + "loss": 0.0093, + "step": 687620 + }, + { + "epoch": 1.78, + "learning_rate": 3.2634577648977005e-05, + "loss": 0.0091, + "step": 687630 + }, + { + "epoch": 1.78, + "learning_rate": 3.2630689432605546e-05, + "loss": 0.006, + "step": 687640 + }, + { + "epoch": 1.78, + "learning_rate": 3.262680121623408e-05, + "loss": 0.0085, + "step": 687650 + }, + { + "epoch": 1.78, + "learning_rate": 3.2622912999862616e-05, + "loss": 0.0086, + "step": 687660 + }, + { + "epoch": 1.78, + "learning_rate": 3.261902478349115e-05, + "loss": 0.0073, + "step": 687670 + }, + { + "epoch": 1.78, + "learning_rate": 3.2615136567119686e-05, + "loss": 0.0076, + "step": 687680 + }, + { + "epoch": 1.78, + "learning_rate": 3.261124835074822e-05, + "loss": 0.0068, + "step": 687690 + }, + { + "epoch": 1.78, + "learning_rate": 3.2607360134376755e-05, + "loss": 0.0054, + "step": 687700 + }, + { + "epoch": 1.78, + "learning_rate": 3.260347191800529e-05, + "loss": 0.008, + "step": 687710 + }, + { + "epoch": 1.78, + "learning_rate": 3.2599583701633825e-05, + "loss": 0.007, + "step": 687720 + }, + { + "epoch": 1.78, + "learning_rate": 3.259569548526236e-05, + "loss": 0.007, + "step": 687730 + }, + { + "epoch": 1.78, + "learning_rate": 3.2591807268890895e-05, + "loss": 0.0073, + "step": 687740 + }, + { + "epoch": 1.78, + "learning_rate": 3.258791905251943e-05, + "loss": 0.0071, + "step": 687750 + }, + { + "epoch": 1.78, + "learning_rate": 3.2584030836147964e-05, + "loss": 0.0072, + "step": 687760 + }, + { + "epoch": 1.78, + "learning_rate": 3.2580142619776506e-05, + "loss": 0.0072, + "step": 687770 + }, + { + "epoch": 1.78, + "learning_rate": 3.257625440340504e-05, + "loss": 0.0072, + "step": 687780 + }, + { + "epoch": 1.78, + "learning_rate": 3.2572366187033576e-05, + "loss": 0.0066, + "step": 687790 + }, + { + "epoch": 1.78, + "learning_rate": 3.256847797066211e-05, + "loss": 0.0075, + "step": 687800 + }, + { + "epoch": 1.78, + "learning_rate": 3.2564589754290646e-05, + "loss": 0.0093, + "step": 687810 + }, + { + "epoch": 1.78, + "learning_rate": 3.256070153791918e-05, + "loss": 0.0079, + "step": 687820 + }, + { + "epoch": 1.78, + "learning_rate": 3.2556813321547715e-05, + "loss": 0.0083, + "step": 687830 + }, + { + "epoch": 1.78, + "learning_rate": 3.255292510517625e-05, + "loss": 0.0072, + "step": 687840 + }, + { + "epoch": 1.78, + "learning_rate": 3.2549036888804785e-05, + "loss": 0.0123, + "step": 687850 + }, + { + "epoch": 1.78, + "learning_rate": 3.254514867243332e-05, + "loss": 0.0125, + "step": 687860 + }, + { + "epoch": 1.78, + "learning_rate": 3.2541260456061855e-05, + "loss": 0.0087, + "step": 687870 + }, + { + "epoch": 1.78, + "learning_rate": 3.253737223969039e-05, + "loss": 0.0067, + "step": 687880 + }, + { + "epoch": 1.78, + "learning_rate": 3.2533484023318924e-05, + "loss": 0.0069, + "step": 687890 + }, + { + "epoch": 1.78, + "learning_rate": 3.2529595806947466e-05, + "loss": 0.0073, + "step": 687900 + }, + { + "epoch": 1.78, + "learning_rate": 3.2525707590576e-05, + "loss": 0.0084, + "step": 687910 + }, + { + "epoch": 1.78, + "learning_rate": 3.2521819374204536e-05, + "loss": 0.0082, + "step": 687920 + }, + { + "epoch": 1.78, + "learning_rate": 3.251793115783307e-05, + "loss": 0.0063, + "step": 687930 + }, + { + "epoch": 1.78, + "learning_rate": 3.25140429414616e-05, + "loss": 0.0073, + "step": 687940 + }, + { + "epoch": 1.78, + "learning_rate": 3.251015472509014e-05, + "loss": 0.0078, + "step": 687950 + }, + { + "epoch": 1.78, + "learning_rate": 3.2506266508718675e-05, + "loss": 0.0093, + "step": 687960 + }, + { + "epoch": 1.78, + "learning_rate": 3.250237829234721e-05, + "loss": 0.0071, + "step": 687970 + }, + { + "epoch": 1.78, + "learning_rate": 3.2498490075975745e-05, + "loss": 0.0065, + "step": 687980 + }, + { + "epoch": 1.78, + "learning_rate": 3.249460185960428e-05, + "loss": 0.0078, + "step": 687990 + }, + { + "epoch": 1.78, + "learning_rate": 3.2490713643232815e-05, + "loss": 0.0107, + "step": 688000 + }, + { + "epoch": 1.78, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.004783975426107645, + "eval_runtime": 108.0049, + "eval_samples_per_second": 18.518, + "eval_steps_per_second": 4.629, + "step": 688000 + }, + { + "epoch": 1.78, + "learning_rate": 3.248682542686135e-05, + "loss": 0.0049, + "step": 688010 + }, + { + "epoch": 1.78, + "learning_rate": 3.2482937210489884e-05, + "loss": 0.0076, + "step": 688020 + }, + { + "epoch": 1.78, + "learning_rate": 3.2479048994118426e-05, + "loss": 0.0085, + "step": 688030 + }, + { + "epoch": 1.78, + "learning_rate": 3.247516077774696e-05, + "loss": 0.0049, + "step": 688040 + }, + { + "epoch": 1.78, + "learning_rate": 3.2471272561375496e-05, + "loss": 0.0089, + "step": 688050 + }, + { + "epoch": 1.78, + "learning_rate": 3.246738434500403e-05, + "loss": 0.0059, + "step": 688060 + }, + { + "epoch": 1.78, + "learning_rate": 3.246349612863256e-05, + "loss": 0.0085, + "step": 688070 + }, + { + "epoch": 1.78, + "learning_rate": 3.24596079122611e-05, + "loss": 0.0078, + "step": 688080 + }, + { + "epoch": 1.78, + "learning_rate": 3.2455719695889635e-05, + "loss": 0.0109, + "step": 688090 + }, + { + "epoch": 1.78, + "learning_rate": 3.245183147951817e-05, + "loss": 0.0076, + "step": 688100 + }, + { + "epoch": 1.78, + "learning_rate": 3.2447943263146705e-05, + "loss": 0.0114, + "step": 688110 + }, + { + "epoch": 1.78, + "learning_rate": 3.244405504677524e-05, + "loss": 0.0083, + "step": 688120 + }, + { + "epoch": 1.78, + "learning_rate": 3.2440166830403775e-05, + "loss": 0.005, + "step": 688130 + }, + { + "epoch": 1.78, + "learning_rate": 3.243627861403231e-05, + "loss": 0.008, + "step": 688140 + }, + { + "epoch": 1.78, + "learning_rate": 3.2432390397660844e-05, + "loss": 0.0078, + "step": 688150 + }, + { + "epoch": 1.78, + "learning_rate": 3.2428502181289386e-05, + "loss": 0.0086, + "step": 688160 + }, + { + "epoch": 1.78, + "learning_rate": 3.242461396491792e-05, + "loss": 0.006, + "step": 688170 + }, + { + "epoch": 1.78, + "learning_rate": 3.2420725748546456e-05, + "loss": 0.0111, + "step": 688180 + }, + { + "epoch": 1.78, + "learning_rate": 3.2416837532174984e-05, + "loss": 0.0073, + "step": 688190 + }, + { + "epoch": 1.78, + "learning_rate": 3.241294931580352e-05, + "loss": 0.0089, + "step": 688200 + }, + { + "epoch": 1.78, + "learning_rate": 3.240906109943206e-05, + "loss": 0.0112, + "step": 688210 + }, + { + "epoch": 1.78, + "learning_rate": 3.2405172883060595e-05, + "loss": 0.0077, + "step": 688220 + }, + { + "epoch": 1.78, + "learning_rate": 3.240128466668913e-05, + "loss": 0.0075, + "step": 688230 + }, + { + "epoch": 1.78, + "learning_rate": 3.2397396450317665e-05, + "loss": 0.0073, + "step": 688240 + }, + { + "epoch": 1.78, + "learning_rate": 3.23935082339462e-05, + "loss": 0.0068, + "step": 688250 + }, + { + "epoch": 1.78, + "learning_rate": 3.2389620017574735e-05, + "loss": 0.0091, + "step": 688260 + }, + { + "epoch": 1.78, + "learning_rate": 3.238573180120327e-05, + "loss": 0.0059, + "step": 688270 + }, + { + "epoch": 1.78, + "learning_rate": 3.2381843584831804e-05, + "loss": 0.0077, + "step": 688280 + }, + { + "epoch": 1.78, + "learning_rate": 3.2377955368460346e-05, + "loss": 0.0067, + "step": 688290 + }, + { + "epoch": 1.78, + "learning_rate": 3.237406715208888e-05, + "loss": 0.0055, + "step": 688300 + }, + { + "epoch": 1.78, + "learning_rate": 3.237017893571741e-05, + "loss": 0.0092, + "step": 688310 + }, + { + "epoch": 1.78, + "learning_rate": 3.2366290719345944e-05, + "loss": 0.0105, + "step": 688320 + }, + { + "epoch": 1.78, + "learning_rate": 3.236240250297448e-05, + "loss": 0.0072, + "step": 688330 + }, + { + "epoch": 1.78, + "learning_rate": 3.235851428660302e-05, + "loss": 0.0098, + "step": 688340 + }, + { + "epoch": 1.78, + "learning_rate": 3.2354626070231555e-05, + "loss": 0.0066, + "step": 688350 + }, + { + "epoch": 1.78, + "learning_rate": 3.235073785386009e-05, + "loss": 0.0076, + "step": 688360 + }, + { + "epoch": 1.78, + "learning_rate": 3.2346849637488625e-05, + "loss": 0.0085, + "step": 688370 + }, + { + "epoch": 1.78, + "learning_rate": 3.234296142111716e-05, + "loss": 0.0067, + "step": 688380 + }, + { + "epoch": 1.78, + "learning_rate": 3.2339073204745695e-05, + "loss": 0.0176, + "step": 688390 + }, + { + "epoch": 1.78, + "learning_rate": 3.233518498837423e-05, + "loss": 0.0105, + "step": 688400 + }, + { + "epoch": 1.78, + "learning_rate": 3.2331296772002764e-05, + "loss": 0.01, + "step": 688410 + }, + { + "epoch": 1.78, + "learning_rate": 3.23274085556313e-05, + "loss": 0.0085, + "step": 688420 + }, + { + "epoch": 1.78, + "learning_rate": 3.232352033925984e-05, + "loss": 0.007, + "step": 688430 + }, + { + "epoch": 1.78, + "learning_rate": 3.231963212288837e-05, + "loss": 0.0084, + "step": 688440 + }, + { + "epoch": 1.78, + "learning_rate": 3.2315743906516904e-05, + "loss": 0.0064, + "step": 688450 + }, + { + "epoch": 1.78, + "learning_rate": 3.231185569014544e-05, + "loss": 0.0095, + "step": 688460 + }, + { + "epoch": 1.78, + "learning_rate": 3.2307967473773974e-05, + "loss": 0.0086, + "step": 688470 + }, + { + "epoch": 1.78, + "learning_rate": 3.2304079257402515e-05, + "loss": 0.0088, + "step": 688480 + }, + { + "epoch": 1.78, + "learning_rate": 3.230019104103105e-05, + "loss": 0.0096, + "step": 688490 + }, + { + "epoch": 1.78, + "learning_rate": 3.2296302824659585e-05, + "loss": 0.0062, + "step": 688500 + }, + { + "epoch": 1.78, + "learning_rate": 3.229241460828812e-05, + "loss": 0.0059, + "step": 688510 + }, + { + "epoch": 1.78, + "learning_rate": 3.2288526391916655e-05, + "loss": 0.0058, + "step": 688520 + }, + { + "epoch": 1.78, + "learning_rate": 3.228463817554519e-05, + "loss": 0.0073, + "step": 688530 + }, + { + "epoch": 1.78, + "learning_rate": 3.2280749959173724e-05, + "loss": 0.0091, + "step": 688540 + }, + { + "epoch": 1.78, + "learning_rate": 3.227686174280226e-05, + "loss": 0.0086, + "step": 688550 + }, + { + "epoch": 1.78, + "learning_rate": 3.2272973526430794e-05, + "loss": 0.0062, + "step": 688560 + }, + { + "epoch": 1.78, + "learning_rate": 3.226908531005933e-05, + "loss": 0.0071, + "step": 688570 + }, + { + "epoch": 1.78, + "learning_rate": 3.2265197093687864e-05, + "loss": 0.0086, + "step": 688580 + }, + { + "epoch": 1.78, + "learning_rate": 3.22613088773164e-05, + "loss": 0.0076, + "step": 688590 + }, + { + "epoch": 1.78, + "learning_rate": 3.2257420660944934e-05, + "loss": 0.0086, + "step": 688600 + }, + { + "epoch": 1.78, + "learning_rate": 3.2253532444573475e-05, + "loss": 0.0102, + "step": 688610 + }, + { + "epoch": 1.79, + "learning_rate": 3.224964422820201e-05, + "loss": 0.0107, + "step": 688620 + }, + { + "epoch": 1.79, + "learning_rate": 3.2245756011830545e-05, + "loss": 0.0073, + "step": 688630 + }, + { + "epoch": 1.79, + "learning_rate": 3.224186779545908e-05, + "loss": 0.0069, + "step": 688640 + }, + { + "epoch": 1.79, + "learning_rate": 3.2237979579087615e-05, + "loss": 0.0089, + "step": 688650 + }, + { + "epoch": 1.79, + "learning_rate": 3.223409136271615e-05, + "loss": 0.0079, + "step": 688660 + }, + { + "epoch": 1.79, + "learning_rate": 3.2230203146344684e-05, + "loss": 0.0083, + "step": 688670 + }, + { + "epoch": 1.79, + "learning_rate": 3.222631492997322e-05, + "loss": 0.0073, + "step": 688680 + }, + { + "epoch": 1.79, + "learning_rate": 3.2222426713601754e-05, + "loss": 0.0079, + "step": 688690 + }, + { + "epoch": 1.79, + "learning_rate": 3.221853849723029e-05, + "loss": 0.0072, + "step": 688700 + }, + { + "epoch": 1.79, + "learning_rate": 3.2214650280858824e-05, + "loss": 0.0072, + "step": 688710 + }, + { + "epoch": 1.79, + "learning_rate": 3.221076206448736e-05, + "loss": 0.0052, + "step": 688720 + }, + { + "epoch": 1.79, + "learning_rate": 3.2206873848115893e-05, + "loss": 0.0061, + "step": 688730 + }, + { + "epoch": 1.79, + "learning_rate": 3.2202985631744435e-05, + "loss": 0.008, + "step": 688740 + }, + { + "epoch": 1.79, + "learning_rate": 3.219909741537297e-05, + "loss": 0.0052, + "step": 688750 + }, + { + "epoch": 1.79, + "learning_rate": 3.2195209199001505e-05, + "loss": 0.0071, + "step": 688760 + }, + { + "epoch": 1.79, + "learning_rate": 3.219132098263004e-05, + "loss": 0.0072, + "step": 688770 + }, + { + "epoch": 1.79, + "learning_rate": 3.2187432766258575e-05, + "loss": 0.0098, + "step": 688780 + }, + { + "epoch": 1.79, + "learning_rate": 3.218354454988711e-05, + "loss": 0.0095, + "step": 688790 + }, + { + "epoch": 1.79, + "learning_rate": 3.2179656333515644e-05, + "loss": 0.0076, + "step": 688800 + }, + { + "epoch": 1.79, + "learning_rate": 3.217576811714418e-05, + "loss": 0.0086, + "step": 688810 + }, + { + "epoch": 1.79, + "learning_rate": 3.2171879900772714e-05, + "loss": 0.0077, + "step": 688820 + }, + { + "epoch": 1.79, + "learning_rate": 3.216799168440125e-05, + "loss": 0.0081, + "step": 688830 + }, + { + "epoch": 1.79, + "learning_rate": 3.2164103468029784e-05, + "loss": 0.0078, + "step": 688840 + }, + { + "epoch": 1.79, + "learning_rate": 3.216021525165832e-05, + "loss": 0.0065, + "step": 688850 + }, + { + "epoch": 1.79, + "learning_rate": 3.2156327035286853e-05, + "loss": 0.0081, + "step": 688860 + }, + { + "epoch": 1.79, + "learning_rate": 3.2152438818915395e-05, + "loss": 0.007, + "step": 688870 + }, + { + "epoch": 1.79, + "learning_rate": 3.214855060254393e-05, + "loss": 0.0081, + "step": 688880 + }, + { + "epoch": 1.79, + "learning_rate": 3.2144662386172465e-05, + "loss": 0.0053, + "step": 688890 + }, + { + "epoch": 1.79, + "learning_rate": 3.2140774169801e-05, + "loss": 0.0048, + "step": 688900 + }, + { + "epoch": 1.79, + "learning_rate": 3.2136885953429535e-05, + "loss": 0.0073, + "step": 688910 + }, + { + "epoch": 1.79, + "learning_rate": 3.213299773705807e-05, + "loss": 0.0058, + "step": 688920 + }, + { + "epoch": 1.79, + "learning_rate": 3.2129109520686604e-05, + "loss": 0.0085, + "step": 688930 + }, + { + "epoch": 1.79, + "learning_rate": 3.212522130431514e-05, + "loss": 0.007, + "step": 688940 + }, + { + "epoch": 1.79, + "learning_rate": 3.2121333087943674e-05, + "loss": 0.0116, + "step": 688950 + }, + { + "epoch": 1.79, + "learning_rate": 3.211744487157221e-05, + "loss": 0.0109, + "step": 688960 + }, + { + "epoch": 1.79, + "learning_rate": 3.2113556655200744e-05, + "loss": 0.0059, + "step": 688970 + }, + { + "epoch": 1.79, + "learning_rate": 3.210966843882928e-05, + "loss": 0.0073, + "step": 688980 + }, + { + "epoch": 1.79, + "learning_rate": 3.2105780222457813e-05, + "loss": 0.006, + "step": 688990 + }, + { + "epoch": 1.79, + "learning_rate": 3.2101892006086355e-05, + "loss": 0.0075, + "step": 689000 + }, + { + "epoch": 1.79, + "eval_cer": 0.881657897941274, + "eval_loss": 0.0048148115165531635, + "eval_runtime": 107.906, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, + "step": 689000 + }, + { + "epoch": 1.79, + "learning_rate": 3.209800378971489e-05, + "loss": 0.0083, + "step": 689010 + }, + { + "epoch": 1.79, + "learning_rate": 3.2094115573343425e-05, + "loss": 0.0053, + "step": 689020 + }, + { + "epoch": 1.79, + "learning_rate": 3.209022735697196e-05, + "loss": 0.0062, + "step": 689030 + }, + { + "epoch": 1.79, + "learning_rate": 3.2086339140600495e-05, + "loss": 0.0073, + "step": 689040 + }, + { + "epoch": 1.79, + "learning_rate": 3.208245092422903e-05, + "loss": 0.0072, + "step": 689050 + }, + { + "epoch": 1.79, + "learning_rate": 3.2078562707857564e-05, + "loss": 0.0068, + "step": 689060 + }, + { + "epoch": 1.79, + "learning_rate": 3.20746744914861e-05, + "loss": 0.0071, + "step": 689070 + }, + { + "epoch": 1.79, + "learning_rate": 3.2070786275114634e-05, + "loss": 0.0048, + "step": 689080 + }, + { + "epoch": 1.79, + "learning_rate": 3.206689805874317e-05, + "loss": 0.0067, + "step": 689090 + }, + { + "epoch": 1.79, + "learning_rate": 3.2063009842371704e-05, + "loss": 0.0065, + "step": 689100 + }, + { + "epoch": 1.79, + "learning_rate": 3.205912162600024e-05, + "loss": 0.0061, + "step": 689110 + }, + { + "epoch": 1.79, + "learning_rate": 3.2055233409628773e-05, + "loss": 0.0061, + "step": 689120 + }, + { + "epoch": 1.79, + "learning_rate": 3.2051345193257315e-05, + "loss": 0.0069, + "step": 689130 + }, + { + "epoch": 1.79, + "learning_rate": 3.204745697688585e-05, + "loss": 0.0068, + "step": 689140 + }, + { + "epoch": 1.79, + "learning_rate": 3.2043568760514385e-05, + "loss": 0.0071, + "step": 689150 + }, + { + "epoch": 1.79, + "learning_rate": 3.203968054414292e-05, + "loss": 0.0072, + "step": 689160 + }, + { + "epoch": 1.79, + "learning_rate": 3.2035792327771455e-05, + "loss": 0.0052, + "step": 689170 + }, + { + "epoch": 1.79, + "learning_rate": 3.203190411139999e-05, + "loss": 0.0079, + "step": 689180 + }, + { + "epoch": 1.79, + "learning_rate": 3.2028015895028524e-05, + "loss": 0.0061, + "step": 689190 + }, + { + "epoch": 1.79, + "learning_rate": 3.202412767865706e-05, + "loss": 0.01, + "step": 689200 + }, + { + "epoch": 1.79, + "learning_rate": 3.2020239462285594e-05, + "loss": 0.007, + "step": 689210 + }, + { + "epoch": 1.79, + "learning_rate": 3.201635124591413e-05, + "loss": 0.0057, + "step": 689220 + }, + { + "epoch": 1.79, + "learning_rate": 3.2012463029542664e-05, + "loss": 0.0075, + "step": 689230 + }, + { + "epoch": 1.79, + "learning_rate": 3.20085748131712e-05, + "loss": 0.0062, + "step": 689240 + }, + { + "epoch": 1.79, + "learning_rate": 3.2004686596799733e-05, + "loss": 0.0078, + "step": 689250 + }, + { + "epoch": 1.79, + "learning_rate": 3.2000798380428275e-05, + "loss": 0.006, + "step": 689260 + }, + { + "epoch": 1.79, + "learning_rate": 3.199691016405681e-05, + "loss": 0.0052, + "step": 689270 + }, + { + "epoch": 1.79, + "learning_rate": 3.1993021947685345e-05, + "loss": 0.0102, + "step": 689280 + }, + { + "epoch": 1.79, + "learning_rate": 3.198913373131388e-05, + "loss": 0.0055, + "step": 689290 + }, + { + "epoch": 1.79, + "learning_rate": 3.1985245514942414e-05, + "loss": 0.0082, + "step": 689300 + }, + { + "epoch": 1.79, + "learning_rate": 3.198135729857095e-05, + "loss": 0.0069, + "step": 689310 + }, + { + "epoch": 1.79, + "learning_rate": 3.1977469082199484e-05, + "loss": 0.008, + "step": 689320 + }, + { + "epoch": 1.79, + "learning_rate": 3.197358086582802e-05, + "loss": 0.0073, + "step": 689330 + }, + { + "epoch": 1.79, + "learning_rate": 3.1969692649456554e-05, + "loss": 0.007, + "step": 689340 + }, + { + "epoch": 1.79, + "learning_rate": 3.196580443308509e-05, + "loss": 0.0064, + "step": 689350 + }, + { + "epoch": 1.79, + "learning_rate": 3.1961916216713624e-05, + "loss": 0.0069, + "step": 689360 + }, + { + "epoch": 1.79, + "learning_rate": 3.195802800034216e-05, + "loss": 0.0071, + "step": 689370 + }, + { + "epoch": 1.79, + "learning_rate": 3.195413978397069e-05, + "loss": 0.0112, + "step": 689380 + }, + { + "epoch": 1.79, + "learning_rate": 3.1950251567599235e-05, + "loss": 0.0082, + "step": 689390 + }, + { + "epoch": 1.79, + "learning_rate": 3.194636335122777e-05, + "loss": 0.0082, + "step": 689400 + }, + { + "epoch": 1.79, + "learning_rate": 3.1942475134856305e-05, + "loss": 0.0074, + "step": 689410 + }, + { + "epoch": 1.79, + "learning_rate": 3.193858691848484e-05, + "loss": 0.0076, + "step": 689420 + }, + { + "epoch": 1.79, + "learning_rate": 3.193469870211337e-05, + "loss": 0.0089, + "step": 689430 + }, + { + "epoch": 1.79, + "learning_rate": 3.193081048574191e-05, + "loss": 0.0109, + "step": 689440 + }, + { + "epoch": 1.79, + "learning_rate": 3.1926922269370444e-05, + "loss": 0.0075, + "step": 689450 + }, + { + "epoch": 1.79, + "learning_rate": 3.192303405299898e-05, + "loss": 0.0067, + "step": 689460 + }, + { + "epoch": 1.79, + "learning_rate": 3.1919145836627514e-05, + "loss": 0.0088, + "step": 689470 + }, + { + "epoch": 1.79, + "learning_rate": 3.191525762025605e-05, + "loss": 0.0073, + "step": 689480 + }, + { + "epoch": 1.79, + "learning_rate": 3.1911369403884584e-05, + "loss": 0.0067, + "step": 689490 + }, + { + "epoch": 1.79, + "learning_rate": 3.190748118751312e-05, + "loss": 0.006, + "step": 689500 + }, + { + "epoch": 1.79, + "learning_rate": 3.190359297114165e-05, + "loss": 0.0072, + "step": 689510 + }, + { + "epoch": 1.79, + "learning_rate": 3.1899704754770195e-05, + "loss": 0.0085, + "step": 689520 + }, + { + "epoch": 1.79, + "learning_rate": 3.189581653839873e-05, + "loss": 0.0076, + "step": 689530 + }, + { + "epoch": 1.79, + "learning_rate": 3.1891928322027265e-05, + "loss": 0.0045, + "step": 689540 + }, + { + "epoch": 1.79, + "learning_rate": 3.18880401056558e-05, + "loss": 0.0066, + "step": 689550 + }, + { + "epoch": 1.79, + "learning_rate": 3.188415188928433e-05, + "loss": 0.0137, + "step": 689560 + }, + { + "epoch": 1.79, + "learning_rate": 3.188026367291287e-05, + "loss": 0.0096, + "step": 689570 + }, + { + "epoch": 1.79, + "learning_rate": 3.1876375456541404e-05, + "loss": 0.0116, + "step": 689580 + }, + { + "epoch": 1.79, + "learning_rate": 3.187248724016994e-05, + "loss": 0.0061, + "step": 689590 + }, + { + "epoch": 1.79, + "learning_rate": 3.1868599023798474e-05, + "loss": 0.0083, + "step": 689600 + }, + { + "epoch": 1.79, + "learning_rate": 3.186471080742701e-05, + "loss": 0.0071, + "step": 689610 + }, + { + "epoch": 1.79, + "learning_rate": 3.1860822591055544e-05, + "loss": 0.0076, + "step": 689620 + }, + { + "epoch": 1.79, + "learning_rate": 3.185693437468408e-05, + "loss": 0.0086, + "step": 689630 + }, + { + "epoch": 1.79, + "learning_rate": 3.185304615831261e-05, + "loss": 0.0083, + "step": 689640 + }, + { + "epoch": 1.79, + "learning_rate": 3.1849157941941155e-05, + "loss": 0.0094, + "step": 689650 + }, + { + "epoch": 1.79, + "learning_rate": 3.184526972556969e-05, + "loss": 0.0078, + "step": 689660 + }, + { + "epoch": 1.79, + "learning_rate": 3.1841381509198225e-05, + "loss": 0.0108, + "step": 689670 + }, + { + "epoch": 1.79, + "learning_rate": 3.183749329282675e-05, + "loss": 0.0056, + "step": 689680 + }, + { + "epoch": 1.79, + "learning_rate": 3.183360507645529e-05, + "loss": 0.0095, + "step": 689690 + }, + { + "epoch": 1.79, + "learning_rate": 3.182971686008383e-05, + "loss": 0.0095, + "step": 689700 + }, + { + "epoch": 1.79, + "learning_rate": 3.1825828643712364e-05, + "loss": 0.008, + "step": 689710 + }, + { + "epoch": 1.79, + "learning_rate": 3.18219404273409e-05, + "loss": 0.0107, + "step": 689720 + }, + { + "epoch": 1.79, + "learning_rate": 3.1818052210969434e-05, + "loss": 0.006, + "step": 689730 + }, + { + "epoch": 1.79, + "learning_rate": 3.181416399459797e-05, + "loss": 0.0093, + "step": 689740 + }, + { + "epoch": 1.79, + "learning_rate": 3.1810275778226504e-05, + "loss": 0.0081, + "step": 689750 + }, + { + "epoch": 1.79, + "learning_rate": 3.180638756185504e-05, + "loss": 0.006, + "step": 689760 + }, + { + "epoch": 1.79, + "learning_rate": 3.180249934548357e-05, + "loss": 0.0087, + "step": 689770 + }, + { + "epoch": 1.79, + "learning_rate": 3.179861112911211e-05, + "loss": 0.0122, + "step": 689780 + }, + { + "epoch": 1.79, + "learning_rate": 3.179472291274065e-05, + "loss": 0.0103, + "step": 689790 + }, + { + "epoch": 1.79, + "learning_rate": 3.179083469636918e-05, + "loss": 0.0106, + "step": 689800 + }, + { + "epoch": 1.79, + "learning_rate": 3.178694647999771e-05, + "loss": 0.0074, + "step": 689810 + }, + { + "epoch": 1.79, + "learning_rate": 3.178305826362625e-05, + "loss": 0.0052, + "step": 689820 + }, + { + "epoch": 1.79, + "learning_rate": 3.177917004725478e-05, + "loss": 0.0074, + "step": 689830 + }, + { + "epoch": 1.79, + "learning_rate": 3.1775281830883324e-05, + "loss": 0.0075, + "step": 689840 + }, + { + "epoch": 1.79, + "learning_rate": 3.177139361451186e-05, + "loss": 0.0081, + "step": 689850 + }, + { + "epoch": 1.79, + "learning_rate": 3.1767505398140394e-05, + "loss": 0.0065, + "step": 689860 + }, + { + "epoch": 1.79, + "learning_rate": 3.176361718176893e-05, + "loss": 0.01, + "step": 689870 + }, + { + "epoch": 1.79, + "learning_rate": 3.1759728965397464e-05, + "loss": 0.0082, + "step": 689880 + }, + { + "epoch": 1.79, + "learning_rate": 3.1755840749026e-05, + "loss": 0.0065, + "step": 689890 + }, + { + "epoch": 1.79, + "learning_rate": 3.175195253265453e-05, + "loss": 0.0063, + "step": 689900 + }, + { + "epoch": 1.79, + "learning_rate": 3.174806431628307e-05, + "loss": 0.0077, + "step": 689910 + }, + { + "epoch": 1.79, + "learning_rate": 3.174417609991161e-05, + "loss": 0.0088, + "step": 689920 + }, + { + "epoch": 1.79, + "learning_rate": 3.174028788354014e-05, + "loss": 0.0093, + "step": 689930 + }, + { + "epoch": 1.79, + "learning_rate": 3.173639966716867e-05, + "loss": 0.0088, + "step": 689940 + }, + { + "epoch": 1.79, + "learning_rate": 3.173251145079721e-05, + "loss": 0.007, + "step": 689950 + }, + { + "epoch": 1.79, + "learning_rate": 3.172862323442574e-05, + "loss": 0.0065, + "step": 689960 + }, + { + "epoch": 1.79, + "learning_rate": 3.1724735018054284e-05, + "loss": 0.0097, + "step": 689970 + }, + { + "epoch": 1.79, + "learning_rate": 3.172084680168282e-05, + "loss": 0.0081, + "step": 689980 + }, + { + "epoch": 1.79, + "learning_rate": 3.1716958585311354e-05, + "loss": 0.0098, + "step": 689990 + }, + { + "epoch": 1.79, + "learning_rate": 3.171307036893989e-05, + "loss": 0.0066, + "step": 690000 + }, + { + "epoch": 1.79, + "eval_cer": 0.88167329394755, + "eval_loss": 0.004875406622886658, + "eval_runtime": 107.9167, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 690000 + }, + { + "epoch": 1.79, + "learning_rate": 3.1709182152568424e-05, + "loss": 0.0085, + "step": 690010 + }, + { + "epoch": 1.79, + "learning_rate": 3.170529393619696e-05, + "loss": 0.0063, + "step": 690020 + }, + { + "epoch": 1.79, + "learning_rate": 3.170140571982549e-05, + "loss": 0.0071, + "step": 690030 + }, + { + "epoch": 1.79, + "learning_rate": 3.169751750345403e-05, + "loss": 0.0078, + "step": 690040 + }, + { + "epoch": 1.79, + "learning_rate": 3.169362928708256e-05, + "loss": 0.007, + "step": 690050 + }, + { + "epoch": 1.79, + "learning_rate": 3.16897410707111e-05, + "loss": 0.007, + "step": 690060 + }, + { + "epoch": 1.79, + "learning_rate": 3.168585285433963e-05, + "loss": 0.0056, + "step": 690070 + }, + { + "epoch": 1.79, + "learning_rate": 3.168196463796817e-05, + "loss": 0.0078, + "step": 690080 + }, + { + "epoch": 1.79, + "learning_rate": 3.16780764215967e-05, + "loss": 0.0084, + "step": 690090 + }, + { + "epoch": 1.79, + "learning_rate": 3.1674188205225244e-05, + "loss": 0.0066, + "step": 690100 + }, + { + "epoch": 1.79, + "learning_rate": 3.167029998885378e-05, + "loss": 0.0089, + "step": 690110 + }, + { + "epoch": 1.79, + "learning_rate": 3.1666411772482314e-05, + "loss": 0.0069, + "step": 690120 + }, + { + "epoch": 1.79, + "learning_rate": 3.166252355611085e-05, + "loss": 0.0065, + "step": 690130 + }, + { + "epoch": 1.79, + "learning_rate": 3.1658635339739384e-05, + "loss": 0.0098, + "step": 690140 + }, + { + "epoch": 1.79, + "learning_rate": 3.165474712336792e-05, + "loss": 0.0079, + "step": 690150 + }, + { + "epoch": 1.79, + "learning_rate": 3.165085890699645e-05, + "loss": 0.0097, + "step": 690160 + }, + { + "epoch": 1.79, + "learning_rate": 3.164697069062499e-05, + "loss": 0.0072, + "step": 690170 + }, + { + "epoch": 1.79, + "learning_rate": 3.164308247425352e-05, + "loss": 0.0113, + "step": 690180 + }, + { + "epoch": 1.79, + "learning_rate": 3.163919425788206e-05, + "loss": 0.0086, + "step": 690190 + }, + { + "epoch": 1.79, + "learning_rate": 3.163530604151059e-05, + "loss": 0.0079, + "step": 690200 + }, + { + "epoch": 1.79, + "learning_rate": 3.163141782513913e-05, + "loss": 0.008, + "step": 690210 + }, + { + "epoch": 1.79, + "learning_rate": 3.162752960876766e-05, + "loss": 0.0079, + "step": 690220 + }, + { + "epoch": 1.79, + "learning_rate": 3.1623641392396204e-05, + "loss": 0.0075, + "step": 690230 + }, + { + "epoch": 1.79, + "learning_rate": 3.161975317602474e-05, + "loss": 0.0077, + "step": 690240 + }, + { + "epoch": 1.79, + "learning_rate": 3.1615864959653274e-05, + "loss": 0.0089, + "step": 690250 + }, + { + "epoch": 1.79, + "learning_rate": 3.161197674328181e-05, + "loss": 0.0052, + "step": 690260 + }, + { + "epoch": 1.79, + "learning_rate": 3.1608088526910343e-05, + "loss": 0.0069, + "step": 690270 + }, + { + "epoch": 1.79, + "learning_rate": 3.160420031053888e-05, + "loss": 0.0096, + "step": 690280 + }, + { + "epoch": 1.79, + "learning_rate": 3.160031209416741e-05, + "loss": 0.0073, + "step": 690290 + }, + { + "epoch": 1.79, + "learning_rate": 3.159642387779595e-05, + "loss": 0.0093, + "step": 690300 + }, + { + "epoch": 1.79, + "learning_rate": 3.159253566142448e-05, + "loss": 0.0095, + "step": 690310 + }, + { + "epoch": 1.79, + "learning_rate": 3.158864744505302e-05, + "loss": 0.0068, + "step": 690320 + }, + { + "epoch": 1.79, + "learning_rate": 3.158475922868155e-05, + "loss": 0.011, + "step": 690330 + }, + { + "epoch": 1.79, + "learning_rate": 3.158087101231009e-05, + "loss": 0.0079, + "step": 690340 + }, + { + "epoch": 1.79, + "learning_rate": 3.157698279593862e-05, + "loss": 0.0059, + "step": 690350 + }, + { + "epoch": 1.79, + "learning_rate": 3.1573094579567164e-05, + "loss": 0.0067, + "step": 690360 + }, + { + "epoch": 1.79, + "learning_rate": 3.15692063631957e-05, + "loss": 0.0055, + "step": 690370 + }, + { + "epoch": 1.79, + "learning_rate": 3.1565318146824234e-05, + "loss": 0.0091, + "step": 690380 + }, + { + "epoch": 1.79, + "learning_rate": 3.156142993045277e-05, + "loss": 0.0101, + "step": 690390 + }, + { + "epoch": 1.79, + "learning_rate": 3.1557541714081303e-05, + "loss": 0.0067, + "step": 690400 + }, + { + "epoch": 1.79, + "learning_rate": 3.155365349770984e-05, + "loss": 0.0091, + "step": 690410 + }, + { + "epoch": 1.79, + "learning_rate": 3.154976528133837e-05, + "loss": 0.0071, + "step": 690420 + }, + { + "epoch": 1.79, + "learning_rate": 3.154587706496691e-05, + "loss": 0.0073, + "step": 690430 + }, + { + "epoch": 1.79, + "learning_rate": 3.154198884859544e-05, + "loss": 0.0075, + "step": 690440 + }, + { + "epoch": 1.79, + "learning_rate": 3.153810063222398e-05, + "loss": 0.0061, + "step": 690450 + }, + { + "epoch": 1.79, + "learning_rate": 3.153421241585251e-05, + "loss": 0.0067, + "step": 690460 + }, + { + "epoch": 1.79, + "learning_rate": 3.153032419948105e-05, + "loss": 0.0092, + "step": 690470 + }, + { + "epoch": 1.79, + "learning_rate": 3.152643598310958e-05, + "loss": 0.0071, + "step": 690480 + }, + { + "epoch": 1.79, + "learning_rate": 3.1522547766738124e-05, + "loss": 0.0072, + "step": 690490 + }, + { + "epoch": 1.79, + "learning_rate": 3.151865955036666e-05, + "loss": 0.008, + "step": 690500 + }, + { + "epoch": 1.79, + "learning_rate": 3.1514771333995194e-05, + "loss": 0.006, + "step": 690510 + }, + { + "epoch": 1.79, + "learning_rate": 3.151088311762373e-05, + "loss": 0.0089, + "step": 690520 + }, + { + "epoch": 1.79, + "learning_rate": 3.1506994901252263e-05, + "loss": 0.0071, + "step": 690530 + }, + { + "epoch": 1.79, + "learning_rate": 3.15031066848808e-05, + "loss": 0.0088, + "step": 690540 + }, + { + "epoch": 1.79, + "learning_rate": 3.149921846850933e-05, + "loss": 0.0059, + "step": 690550 + }, + { + "epoch": 1.79, + "learning_rate": 3.149533025213787e-05, + "loss": 0.0062, + "step": 690560 + }, + { + "epoch": 1.79, + "learning_rate": 3.14914420357664e-05, + "loss": 0.0068, + "step": 690570 + }, + { + "epoch": 1.79, + "learning_rate": 3.148755381939494e-05, + "loss": 0.0067, + "step": 690580 + }, + { + "epoch": 1.79, + "learning_rate": 3.148366560302347e-05, + "loss": 0.0093, + "step": 690590 + }, + { + "epoch": 1.79, + "learning_rate": 3.147977738665201e-05, + "loss": 0.0098, + "step": 690600 + }, + { + "epoch": 1.79, + "learning_rate": 3.147588917028054e-05, + "loss": 0.0064, + "step": 690610 + }, + { + "epoch": 1.79, + "learning_rate": 3.1472000953909084e-05, + "loss": 0.0058, + "step": 690620 + }, + { + "epoch": 1.79, + "learning_rate": 3.146811273753762e-05, + "loss": 0.0107, + "step": 690630 + }, + { + "epoch": 1.79, + "learning_rate": 3.1464224521166154e-05, + "loss": 0.0154, + "step": 690640 + }, + { + "epoch": 1.79, + "learning_rate": 3.146033630479469e-05, + "loss": 0.0094, + "step": 690650 + }, + { + "epoch": 1.79, + "learning_rate": 3.1456448088423223e-05, + "loss": 0.0071, + "step": 690660 + }, + { + "epoch": 1.79, + "learning_rate": 3.145255987205176e-05, + "loss": 0.008, + "step": 690670 + }, + { + "epoch": 1.79, + "learning_rate": 3.144867165568029e-05, + "loss": 0.006, + "step": 690680 + }, + { + "epoch": 1.79, + "learning_rate": 3.144478343930883e-05, + "loss": 0.0054, + "step": 690690 + }, + { + "epoch": 1.79, + "learning_rate": 3.144089522293736e-05, + "loss": 0.0082, + "step": 690700 + }, + { + "epoch": 1.79, + "learning_rate": 3.14370070065659e-05, + "loss": 0.0079, + "step": 690710 + }, + { + "epoch": 1.79, + "learning_rate": 3.143311879019443e-05, + "loss": 0.0101, + "step": 690720 + }, + { + "epoch": 1.79, + "learning_rate": 3.142923057382297e-05, + "loss": 0.0085, + "step": 690730 + }, + { + "epoch": 1.79, + "learning_rate": 3.14253423574515e-05, + "loss": 0.0064, + "step": 690740 + }, + { + "epoch": 1.79, + "learning_rate": 3.1421454141080044e-05, + "loss": 0.0088, + "step": 690750 + }, + { + "epoch": 1.79, + "learning_rate": 3.141756592470858e-05, + "loss": 0.0071, + "step": 690760 + }, + { + "epoch": 1.79, + "learning_rate": 3.1413677708337114e-05, + "loss": 0.008, + "step": 690770 + }, + { + "epoch": 1.79, + "learning_rate": 3.140978949196565e-05, + "loss": 0.0072, + "step": 690780 + }, + { + "epoch": 1.79, + "learning_rate": 3.1405901275594183e-05, + "loss": 0.0079, + "step": 690790 + }, + { + "epoch": 1.79, + "learning_rate": 3.140201305922272e-05, + "loss": 0.0068, + "step": 690800 + }, + { + "epoch": 1.79, + "learning_rate": 3.139812484285125e-05, + "loss": 0.0072, + "step": 690810 + }, + { + "epoch": 1.79, + "learning_rate": 3.139423662647979e-05, + "loss": 0.0084, + "step": 690820 + }, + { + "epoch": 1.79, + "learning_rate": 3.139034841010832e-05, + "loss": 0.0084, + "step": 690830 + }, + { + "epoch": 1.79, + "learning_rate": 3.138646019373686e-05, + "loss": 0.0051, + "step": 690840 + }, + { + "epoch": 1.79, + "learning_rate": 3.138257197736539e-05, + "loss": 0.0073, + "step": 690850 + }, + { + "epoch": 1.79, + "learning_rate": 3.137868376099393e-05, + "loss": 0.0054, + "step": 690860 + }, + { + "epoch": 1.79, + "learning_rate": 3.137479554462246e-05, + "loss": 0.0068, + "step": 690870 + }, + { + "epoch": 1.79, + "learning_rate": 3.1370907328251004e-05, + "loss": 0.0056, + "step": 690880 + }, + { + "epoch": 1.79, + "learning_rate": 3.136701911187954e-05, + "loss": 0.0059, + "step": 690890 + }, + { + "epoch": 1.79, + "learning_rate": 3.1363130895508074e-05, + "loss": 0.0104, + "step": 690900 + }, + { + "epoch": 1.79, + "learning_rate": 3.135924267913661e-05, + "loss": 0.0102, + "step": 690910 + }, + { + "epoch": 1.79, + "learning_rate": 3.1355354462765137e-05, + "loss": 0.0082, + "step": 690920 + }, + { + "epoch": 1.79, + "learning_rate": 3.135146624639368e-05, + "loss": 0.0076, + "step": 690930 + }, + { + "epoch": 1.79, + "learning_rate": 3.134757803002221e-05, + "loss": 0.0089, + "step": 690940 + }, + { + "epoch": 1.79, + "learning_rate": 3.134368981365075e-05, + "loss": 0.0086, + "step": 690950 + }, + { + "epoch": 1.79, + "learning_rate": 3.133980159727928e-05, + "loss": 0.0079, + "step": 690960 + }, + { + "epoch": 1.79, + "learning_rate": 3.133591338090782e-05, + "loss": 0.0083, + "step": 690970 + }, + { + "epoch": 1.79, + "learning_rate": 3.133202516453635e-05, + "loss": 0.0078, + "step": 690980 + }, + { + "epoch": 1.79, + "learning_rate": 3.132813694816489e-05, + "loss": 0.0126, + "step": 690990 + }, + { + "epoch": 1.79, + "learning_rate": 3.132424873179342e-05, + "loss": 0.0087, + "step": 691000 + }, + { + "epoch": 1.79, + "eval_cer": 0.8816550986674057, + "eval_loss": 0.004775453358888626, + "eval_runtime": 107.7867, + "eval_samples_per_second": 18.555, + "eval_steps_per_second": 4.639, + "step": 691000 + }, + { + "epoch": 1.79, + "learning_rate": 3.1320360515421964e-05, + "loss": 0.0098, + "step": 691010 + }, + { + "epoch": 1.79, + "learning_rate": 3.13164722990505e-05, + "loss": 0.0075, + "step": 691020 + }, + { + "epoch": 1.79, + "learning_rate": 3.1312584082679034e-05, + "loss": 0.0059, + "step": 691030 + }, + { + "epoch": 1.79, + "learning_rate": 3.130869586630756e-05, + "loss": 0.0068, + "step": 691040 + }, + { + "epoch": 1.79, + "learning_rate": 3.1304807649936097e-05, + "loss": 0.0073, + "step": 691050 + }, + { + "epoch": 1.79, + "learning_rate": 3.130091943356464e-05, + "loss": 0.0073, + "step": 691060 + }, + { + "epoch": 1.79, + "learning_rate": 3.129703121719317e-05, + "loss": 0.0116, + "step": 691070 + }, + { + "epoch": 1.79, + "learning_rate": 3.129314300082171e-05, + "loss": 0.0089, + "step": 691080 + }, + { + "epoch": 1.79, + "learning_rate": 3.128925478445024e-05, + "loss": 0.0085, + "step": 691090 + }, + { + "epoch": 1.79, + "learning_rate": 3.128536656807878e-05, + "loss": 0.0069, + "step": 691100 + }, + { + "epoch": 1.79, + "learning_rate": 3.128147835170731e-05, + "loss": 0.0068, + "step": 691110 + }, + { + "epoch": 1.79, + "learning_rate": 3.127759013533585e-05, + "loss": 0.0068, + "step": 691120 + }, + { + "epoch": 1.79, + "learning_rate": 3.127370191896438e-05, + "loss": 0.0092, + "step": 691130 + }, + { + "epoch": 1.79, + "learning_rate": 3.126981370259292e-05, + "loss": 0.0079, + "step": 691140 + }, + { + "epoch": 1.79, + "learning_rate": 3.126592548622146e-05, + "loss": 0.0093, + "step": 691150 + }, + { + "epoch": 1.79, + "learning_rate": 3.1262037269849994e-05, + "loss": 0.0065, + "step": 691160 + }, + { + "epoch": 1.79, + "learning_rate": 3.125814905347852e-05, + "loss": 0.007, + "step": 691170 + }, + { + "epoch": 1.79, + "learning_rate": 3.1254260837107057e-05, + "loss": 0.0071, + "step": 691180 + }, + { + "epoch": 1.79, + "learning_rate": 3.125037262073559e-05, + "loss": 0.006, + "step": 691190 + }, + { + "epoch": 1.79, + "learning_rate": 3.124648440436413e-05, + "loss": 0.0065, + "step": 691200 + }, + { + "epoch": 1.79, + "learning_rate": 3.124259618799267e-05, + "loss": 0.0067, + "step": 691210 + }, + { + "epoch": 1.79, + "learning_rate": 3.12387079716212e-05, + "loss": 0.0073, + "step": 691220 + }, + { + "epoch": 1.79, + "learning_rate": 3.123481975524974e-05, + "loss": 0.0058, + "step": 691230 + }, + { + "epoch": 1.79, + "learning_rate": 3.123093153887827e-05, + "loss": 0.0069, + "step": 691240 + }, + { + "epoch": 1.79, + "learning_rate": 3.122704332250681e-05, + "loss": 0.0086, + "step": 691250 + }, + { + "epoch": 1.79, + "learning_rate": 3.122315510613534e-05, + "loss": 0.0072, + "step": 691260 + }, + { + "epoch": 1.79, + "learning_rate": 3.121926688976388e-05, + "loss": 0.0066, + "step": 691270 + }, + { + "epoch": 1.79, + "learning_rate": 3.121537867339242e-05, + "loss": 0.0071, + "step": 691280 + }, + { + "epoch": 1.79, + "learning_rate": 3.121149045702095e-05, + "loss": 0.0072, + "step": 691290 + }, + { + "epoch": 1.79, + "learning_rate": 3.120760224064948e-05, + "loss": 0.0098, + "step": 691300 + }, + { + "epoch": 1.79, + "learning_rate": 3.1203714024278017e-05, + "loss": 0.0067, + "step": 691310 + }, + { + "epoch": 1.79, + "learning_rate": 3.119982580790655e-05, + "loss": 0.0089, + "step": 691320 + }, + { + "epoch": 1.79, + "learning_rate": 3.119593759153509e-05, + "loss": 0.0087, + "step": 691330 + }, + { + "epoch": 1.79, + "learning_rate": 3.119204937516363e-05, + "loss": 0.008, + "step": 691340 + }, + { + "epoch": 1.79, + "learning_rate": 3.118816115879216e-05, + "loss": 0.0109, + "step": 691350 + }, + { + "epoch": 1.79, + "learning_rate": 3.11842729424207e-05, + "loss": 0.0072, + "step": 691360 + }, + { + "epoch": 1.79, + "learning_rate": 3.118038472604923e-05, + "loss": 0.0067, + "step": 691370 + }, + { + "epoch": 1.79, + "learning_rate": 3.117649650967777e-05, + "loss": 0.0088, + "step": 691380 + }, + { + "epoch": 1.79, + "learning_rate": 3.11726082933063e-05, + "loss": 0.0061, + "step": 691390 + }, + { + "epoch": 1.79, + "learning_rate": 3.116872007693484e-05, + "loss": 0.0077, + "step": 691400 + }, + { + "epoch": 1.79, + "learning_rate": 3.116483186056338e-05, + "loss": 0.0101, + "step": 691410 + }, + { + "epoch": 1.79, + "learning_rate": 3.116094364419191e-05, + "loss": 0.0094, + "step": 691420 + }, + { + "epoch": 1.79, + "learning_rate": 3.115705542782044e-05, + "loss": 0.0072, + "step": 691430 + }, + { + "epoch": 1.79, + "learning_rate": 3.1153167211448976e-05, + "loss": 0.0091, + "step": 691440 + }, + { + "epoch": 1.79, + "learning_rate": 3.114927899507751e-05, + "loss": 0.0093, + "step": 691450 + }, + { + "epoch": 1.79, + "learning_rate": 3.114539077870605e-05, + "loss": 0.0069, + "step": 691460 + }, + { + "epoch": 1.79, + "learning_rate": 3.114150256233459e-05, + "loss": 0.0086, + "step": 691470 + }, + { + "epoch": 1.79, + "learning_rate": 3.113761434596312e-05, + "loss": 0.006, + "step": 691480 + }, + { + "epoch": 1.79, + "learning_rate": 3.113372612959166e-05, + "loss": 0.0072, + "step": 691490 + }, + { + "epoch": 1.79, + "learning_rate": 3.112983791322019e-05, + "loss": 0.0083, + "step": 691500 + }, + { + "epoch": 1.79, + "learning_rate": 3.112594969684873e-05, + "loss": 0.0078, + "step": 691510 + }, + { + "epoch": 1.79, + "learning_rate": 3.112206148047726e-05, + "loss": 0.0105, + "step": 691520 + }, + { + "epoch": 1.79, + "learning_rate": 3.11181732641058e-05, + "loss": 0.0074, + "step": 691530 + }, + { + "epoch": 1.79, + "learning_rate": 3.111428504773433e-05, + "loss": 0.0069, + "step": 691540 + }, + { + "epoch": 1.79, + "learning_rate": 3.111039683136287e-05, + "loss": 0.0084, + "step": 691550 + }, + { + "epoch": 1.79, + "learning_rate": 3.11065086149914e-05, + "loss": 0.0071, + "step": 691560 + }, + { + "epoch": 1.79, + "learning_rate": 3.1102620398619936e-05, + "loss": 0.0078, + "step": 691570 + }, + { + "epoch": 1.79, + "learning_rate": 3.109873218224847e-05, + "loss": 0.0067, + "step": 691580 + }, + { + "epoch": 1.79, + "learning_rate": 3.109484396587701e-05, + "loss": 0.0043, + "step": 691590 + }, + { + "epoch": 1.79, + "learning_rate": 3.109095574950555e-05, + "loss": 0.0063, + "step": 691600 + }, + { + "epoch": 1.79, + "learning_rate": 3.108706753313408e-05, + "loss": 0.0082, + "step": 691610 + }, + { + "epoch": 1.79, + "learning_rate": 3.108317931676262e-05, + "loss": 0.0103, + "step": 691620 + }, + { + "epoch": 1.79, + "learning_rate": 3.107929110039115e-05, + "loss": 0.0088, + "step": 691630 + }, + { + "epoch": 1.79, + "learning_rate": 3.107540288401969e-05, + "loss": 0.009, + "step": 691640 + }, + { + "epoch": 1.79, + "learning_rate": 3.107151466764822e-05, + "loss": 0.008, + "step": 691650 + }, + { + "epoch": 1.79, + "learning_rate": 3.106762645127676e-05, + "loss": 0.0109, + "step": 691660 + }, + { + "epoch": 1.79, + "learning_rate": 3.106373823490529e-05, + "loss": 0.0069, + "step": 691670 + }, + { + "epoch": 1.79, + "learning_rate": 3.105985001853383e-05, + "loss": 0.007, + "step": 691680 + }, + { + "epoch": 1.79, + "learning_rate": 3.105596180216236e-05, + "loss": 0.0062, + "step": 691690 + }, + { + "epoch": 1.79, + "learning_rate": 3.1052073585790896e-05, + "loss": 0.0087, + "step": 691700 + }, + { + "epoch": 1.79, + "learning_rate": 3.104818536941943e-05, + "loss": 0.0076, + "step": 691710 + }, + { + "epoch": 1.79, + "learning_rate": 3.104429715304797e-05, + "loss": 0.0082, + "step": 691720 + }, + { + "epoch": 1.79, + "learning_rate": 3.104040893667651e-05, + "loss": 0.0083, + "step": 691730 + }, + { + "epoch": 1.79, + "learning_rate": 3.103652072030504e-05, + "loss": 0.0073, + "step": 691740 + }, + { + "epoch": 1.79, + "learning_rate": 3.103263250393358e-05, + "loss": 0.0109, + "step": 691750 + }, + { + "epoch": 1.79, + "learning_rate": 3.102874428756211e-05, + "loss": 0.0072, + "step": 691760 + }, + { + "epoch": 1.79, + "learning_rate": 3.102485607119065e-05, + "loss": 0.0072, + "step": 691770 + }, + { + "epoch": 1.79, + "learning_rate": 3.102096785481918e-05, + "loss": 0.0077, + "step": 691780 + }, + { + "epoch": 1.79, + "learning_rate": 3.101707963844772e-05, + "loss": 0.013, + "step": 691790 + }, + { + "epoch": 1.79, + "learning_rate": 3.101319142207625e-05, + "loss": 0.0075, + "step": 691800 + }, + { + "epoch": 1.79, + "learning_rate": 3.100930320570479e-05, + "loss": 0.0074, + "step": 691810 + }, + { + "epoch": 1.79, + "learning_rate": 3.100541498933332e-05, + "loss": 0.0089, + "step": 691820 + }, + { + "epoch": 1.79, + "learning_rate": 3.1001526772961856e-05, + "loss": 0.0109, + "step": 691830 + }, + { + "epoch": 1.79, + "learning_rate": 3.099763855659039e-05, + "loss": 0.0076, + "step": 691840 + }, + { + "epoch": 1.79, + "learning_rate": 3.099375034021893e-05, + "loss": 0.0058, + "step": 691850 + }, + { + "epoch": 1.79, + "learning_rate": 3.098986212384747e-05, + "loss": 0.0063, + "step": 691860 + }, + { + "epoch": 1.79, + "learning_rate": 3.0985973907476e-05, + "loss": 0.0097, + "step": 691870 + }, + { + "epoch": 1.79, + "learning_rate": 3.098208569110454e-05, + "loss": 0.0078, + "step": 691880 + }, + { + "epoch": 1.79, + "learning_rate": 3.097819747473307e-05, + "loss": 0.0068, + "step": 691890 + }, + { + "epoch": 1.79, + "learning_rate": 3.097430925836161e-05, + "loss": 0.0072, + "step": 691900 + }, + { + "epoch": 1.79, + "learning_rate": 3.097042104199014e-05, + "loss": 0.0073, + "step": 691910 + }, + { + "epoch": 1.79, + "learning_rate": 3.096653282561868e-05, + "loss": 0.0081, + "step": 691920 + }, + { + "epoch": 1.79, + "learning_rate": 3.096264460924721e-05, + "loss": 0.0092, + "step": 691930 + }, + { + "epoch": 1.79, + "learning_rate": 3.095875639287575e-05, + "loss": 0.0049, + "step": 691940 + }, + { + "epoch": 1.79, + "learning_rate": 3.095486817650428e-05, + "loss": 0.0072, + "step": 691950 + }, + { + "epoch": 1.79, + "learning_rate": 3.0950979960132816e-05, + "loss": 0.0058, + "step": 691960 + }, + { + "epoch": 1.79, + "learning_rate": 3.094709174376135e-05, + "loss": 0.0059, + "step": 691970 + }, + { + "epoch": 1.79, + "learning_rate": 3.094320352738989e-05, + "loss": 0.0078, + "step": 691980 + }, + { + "epoch": 1.79, + "learning_rate": 3.093931531101843e-05, + "loss": 0.0105, + "step": 691990 + }, + { + "epoch": 1.79, + "learning_rate": 3.093542709464696e-05, + "loss": 0.0078, + "step": 692000 + }, + { + "epoch": 1.79, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.0048337411135435104, + "eval_runtime": 107.7159, + "eval_samples_per_second": 18.567, + "eval_steps_per_second": 4.642, + "step": 692000 + }, + { + "epoch": 1.79, + "learning_rate": 3.09315388782755e-05, + "loss": 0.0086, + "step": 692010 + }, + { + "epoch": 1.79, + "learning_rate": 3.092765066190403e-05, + "loss": 0.0076, + "step": 692020 + }, + { + "epoch": 1.79, + "learning_rate": 3.092376244553257e-05, + "loss": 0.0056, + "step": 692030 + }, + { + "epoch": 1.79, + "learning_rate": 3.09198742291611e-05, + "loss": 0.006, + "step": 692040 + }, + { + "epoch": 1.79, + "learning_rate": 3.091598601278964e-05, + "loss": 0.0092, + "step": 692050 + }, + { + "epoch": 1.79, + "learning_rate": 3.091209779641817e-05, + "loss": 0.0089, + "step": 692060 + }, + { + "epoch": 1.79, + "learning_rate": 3.090820958004671e-05, + "loss": 0.0081, + "step": 692070 + }, + { + "epoch": 1.79, + "learning_rate": 3.090432136367524e-05, + "loss": 0.0061, + "step": 692080 + }, + { + "epoch": 1.79, + "learning_rate": 3.0900433147303776e-05, + "loss": 0.008, + "step": 692090 + }, + { + "epoch": 1.79, + "learning_rate": 3.089654493093231e-05, + "loss": 0.0086, + "step": 692100 + }, + { + "epoch": 1.79, + "learning_rate": 3.089265671456085e-05, + "loss": 0.0096, + "step": 692110 + }, + { + "epoch": 1.79, + "learning_rate": 3.088876849818939e-05, + "loss": 0.0098, + "step": 692120 + }, + { + "epoch": 1.79, + "learning_rate": 3.088488028181792e-05, + "loss": 0.007, + "step": 692130 + }, + { + "epoch": 1.79, + "learning_rate": 3.088099206544646e-05, + "loss": 0.0103, + "step": 692140 + }, + { + "epoch": 1.79, + "learning_rate": 3.087710384907499e-05, + "loss": 0.0088, + "step": 692150 + }, + { + "epoch": 1.79, + "learning_rate": 3.087321563270353e-05, + "loss": 0.0101, + "step": 692160 + }, + { + "epoch": 1.79, + "learning_rate": 3.086932741633206e-05, + "loss": 0.0055, + "step": 692170 + }, + { + "epoch": 1.79, + "learning_rate": 3.08654391999606e-05, + "loss": 0.0074, + "step": 692180 + }, + { + "epoch": 1.79, + "learning_rate": 3.086155098358913e-05, + "loss": 0.0056, + "step": 692190 + }, + { + "epoch": 1.79, + "learning_rate": 3.085766276721767e-05, + "loss": 0.0086, + "step": 692200 + }, + { + "epoch": 1.79, + "learning_rate": 3.08537745508462e-05, + "loss": 0.0078, + "step": 692210 + }, + { + "epoch": 1.79, + "learning_rate": 3.0849886334474736e-05, + "loss": 0.0099, + "step": 692220 + }, + { + "epoch": 1.79, + "learning_rate": 3.084599811810327e-05, + "loss": 0.0074, + "step": 692230 + }, + { + "epoch": 1.79, + "learning_rate": 3.084210990173181e-05, + "loss": 0.007, + "step": 692240 + }, + { + "epoch": 1.79, + "learning_rate": 3.083822168536035e-05, + "loss": 0.008, + "step": 692250 + }, + { + "epoch": 1.79, + "learning_rate": 3.083433346898888e-05, + "loss": 0.0073, + "step": 692260 + }, + { + "epoch": 1.79, + "learning_rate": 3.083044525261742e-05, + "loss": 0.0069, + "step": 692270 + }, + { + "epoch": 1.79, + "learning_rate": 3.0826557036245946e-05, + "loss": 0.0068, + "step": 692280 + }, + { + "epoch": 1.79, + "learning_rate": 3.082266881987449e-05, + "loss": 0.007, + "step": 692290 + }, + { + "epoch": 1.79, + "learning_rate": 3.081878060350302e-05, + "loss": 0.0126, + "step": 692300 + }, + { + "epoch": 1.79, + "learning_rate": 3.081489238713156e-05, + "loss": 0.0072, + "step": 692310 + }, + { + "epoch": 1.79, + "learning_rate": 3.081100417076009e-05, + "loss": 0.0063, + "step": 692320 + }, + { + "epoch": 1.79, + "learning_rate": 3.0807115954388627e-05, + "loss": 0.0082, + "step": 692330 + }, + { + "epoch": 1.79, + "learning_rate": 3.080322773801716e-05, + "loss": 0.0065, + "step": 692340 + }, + { + "epoch": 1.79, + "learning_rate": 3.0799339521645696e-05, + "loss": 0.0096, + "step": 692350 + }, + { + "epoch": 1.79, + "learning_rate": 3.079545130527423e-05, + "loss": 0.0068, + "step": 692360 + }, + { + "epoch": 1.79, + "learning_rate": 3.079156308890277e-05, + "loss": 0.0069, + "step": 692370 + }, + { + "epoch": 1.79, + "learning_rate": 3.078767487253131e-05, + "loss": 0.0068, + "step": 692380 + }, + { + "epoch": 1.79, + "learning_rate": 3.078378665615984e-05, + "loss": 0.0056, + "step": 692390 + }, + { + "epoch": 1.79, + "learning_rate": 3.077989843978838e-05, + "loss": 0.0075, + "step": 692400 + }, + { + "epoch": 1.79, + "learning_rate": 3.0776010223416905e-05, + "loss": 0.0088, + "step": 692410 + }, + { + "epoch": 1.79, + "learning_rate": 3.077212200704545e-05, + "loss": 0.0059, + "step": 692420 + }, + { + "epoch": 1.79, + "learning_rate": 3.076823379067398e-05, + "loss": 0.0102, + "step": 692430 + }, + { + "epoch": 1.79, + "learning_rate": 3.076434557430252e-05, + "loss": 0.0067, + "step": 692440 + }, + { + "epoch": 1.79, + "learning_rate": 3.076045735793105e-05, + "loss": 0.0114, + "step": 692450 + }, + { + "epoch": 1.79, + "learning_rate": 3.0756569141559587e-05, + "loss": 0.0069, + "step": 692460 + }, + { + "epoch": 1.79, + "learning_rate": 3.075268092518812e-05, + "loss": 0.0062, + "step": 692470 + }, + { + "epoch": 1.8, + "learning_rate": 3.0748792708816656e-05, + "loss": 0.0091, + "step": 692480 + }, + { + "epoch": 1.8, + "learning_rate": 3.074490449244519e-05, + "loss": 0.0093, + "step": 692490 + }, + { + "epoch": 1.8, + "learning_rate": 3.074101627607373e-05, + "loss": 0.0069, + "step": 692500 + }, + { + "epoch": 1.8, + "learning_rate": 3.073712805970227e-05, + "loss": 0.0063, + "step": 692510 + }, + { + "epoch": 1.8, + "learning_rate": 3.07332398433308e-05, + "loss": 0.0065, + "step": 692520 + }, + { + "epoch": 1.8, + "learning_rate": 3.072935162695933e-05, + "loss": 0.0064, + "step": 692530 + }, + { + "epoch": 1.8, + "learning_rate": 3.0725463410587865e-05, + "loss": 0.0079, + "step": 692540 + }, + { + "epoch": 1.8, + "learning_rate": 3.072157519421641e-05, + "loss": 0.0062, + "step": 692550 + }, + { + "epoch": 1.8, + "learning_rate": 3.071768697784494e-05, + "loss": 0.0079, + "step": 692560 + }, + { + "epoch": 1.8, + "learning_rate": 3.071379876147348e-05, + "loss": 0.0086, + "step": 692570 + }, + { + "epoch": 1.8, + "learning_rate": 3.070991054510201e-05, + "loss": 0.0051, + "step": 692580 + }, + { + "epoch": 1.8, + "learning_rate": 3.0706022328730547e-05, + "loss": 0.006, + "step": 692590 + }, + { + "epoch": 1.8, + "learning_rate": 3.070213411235908e-05, + "loss": 0.008, + "step": 692600 + }, + { + "epoch": 1.8, + "learning_rate": 3.0698245895987616e-05, + "loss": 0.0076, + "step": 692610 + }, + { + "epoch": 1.8, + "learning_rate": 3.069435767961615e-05, + "loss": 0.0046, + "step": 692620 + }, + { + "epoch": 1.8, + "learning_rate": 3.0690469463244686e-05, + "loss": 0.008, + "step": 692630 + }, + { + "epoch": 1.8, + "learning_rate": 3.068658124687323e-05, + "loss": 0.0085, + "step": 692640 + }, + { + "epoch": 1.8, + "learning_rate": 3.068269303050176e-05, + "loss": 0.0074, + "step": 692650 + }, + { + "epoch": 1.8, + "learning_rate": 3.067880481413029e-05, + "loss": 0.0075, + "step": 692660 + }, + { + "epoch": 1.8, + "learning_rate": 3.0674916597758825e-05, + "loss": 0.0069, + "step": 692670 + }, + { + "epoch": 1.8, + "learning_rate": 3.067102838138736e-05, + "loss": 0.0074, + "step": 692680 + }, + { + "epoch": 1.8, + "learning_rate": 3.06671401650159e-05, + "loss": 0.0085, + "step": 692690 + }, + { + "epoch": 1.8, + "learning_rate": 3.066325194864444e-05, + "loss": 0.0049, + "step": 692700 + }, + { + "epoch": 1.8, + "learning_rate": 3.065936373227297e-05, + "loss": 0.0075, + "step": 692710 + }, + { + "epoch": 1.8, + "learning_rate": 3.0655475515901507e-05, + "loss": 0.0071, + "step": 692720 + }, + { + "epoch": 1.8, + "learning_rate": 3.065158729953004e-05, + "loss": 0.0048, + "step": 692730 + }, + { + "epoch": 1.8, + "learning_rate": 3.0647699083158576e-05, + "loss": 0.0067, + "step": 692740 + }, + { + "epoch": 1.8, + "learning_rate": 3.064381086678711e-05, + "loss": 0.0066, + "step": 692750 + }, + { + "epoch": 1.8, + "learning_rate": 3.0639922650415646e-05, + "loss": 0.0095, + "step": 692760 + }, + { + "epoch": 1.8, + "learning_rate": 3.063603443404419e-05, + "loss": 0.007, + "step": 692770 + }, + { + "epoch": 1.8, + "learning_rate": 3.0632146217672716e-05, + "loss": 0.0095, + "step": 692780 + }, + { + "epoch": 1.8, + "learning_rate": 3.062825800130125e-05, + "loss": 0.007, + "step": 692790 + }, + { + "epoch": 1.8, + "learning_rate": 3.0624369784929785e-05, + "loss": 0.0089, + "step": 692800 + }, + { + "epoch": 1.8, + "learning_rate": 3.062048156855832e-05, + "loss": 0.0064, + "step": 692810 + }, + { + "epoch": 1.8, + "learning_rate": 3.061659335218686e-05, + "loss": 0.0077, + "step": 692820 + }, + { + "epoch": 1.8, + "learning_rate": 3.06127051358154e-05, + "loss": 0.0086, + "step": 692830 + }, + { + "epoch": 1.8, + "learning_rate": 3.060881691944393e-05, + "loss": 0.0069, + "step": 692840 + }, + { + "epoch": 1.8, + "learning_rate": 3.0604928703072467e-05, + "loss": 0.0076, + "step": 692850 + }, + { + "epoch": 1.8, + "learning_rate": 3.0601040486701e-05, + "loss": 0.01, + "step": 692860 + }, + { + "epoch": 1.8, + "learning_rate": 3.0597152270329536e-05, + "loss": 0.0073, + "step": 692870 + }, + { + "epoch": 1.8, + "learning_rate": 3.059326405395807e-05, + "loss": 0.0079, + "step": 692880 + }, + { + "epoch": 1.8, + "learning_rate": 3.0589375837586606e-05, + "loss": 0.0094, + "step": 692890 + }, + { + "epoch": 1.8, + "learning_rate": 3.058548762121514e-05, + "loss": 0.0068, + "step": 692900 + }, + { + "epoch": 1.8, + "learning_rate": 3.0581599404843676e-05, + "loss": 0.011, + "step": 692910 + }, + { + "epoch": 1.8, + "learning_rate": 3.057771118847221e-05, + "loss": 0.0069, + "step": 692920 + }, + { + "epoch": 1.8, + "learning_rate": 3.0573822972100745e-05, + "loss": 0.0057, + "step": 692930 + }, + { + "epoch": 1.8, + "learning_rate": 3.056993475572928e-05, + "loss": 0.0117, + "step": 692940 + }, + { + "epoch": 1.8, + "learning_rate": 3.056604653935782e-05, + "loss": 0.008, + "step": 692950 + }, + { + "epoch": 1.8, + "learning_rate": 3.056215832298636e-05, + "loss": 0.01, + "step": 692960 + }, + { + "epoch": 1.8, + "learning_rate": 3.055827010661489e-05, + "loss": 0.0088, + "step": 692970 + }, + { + "epoch": 1.8, + "learning_rate": 3.0554381890243426e-05, + "loss": 0.0077, + "step": 692980 + }, + { + "epoch": 1.8, + "learning_rate": 3.055049367387196e-05, + "loss": 0.0051, + "step": 692990 + }, + { + "epoch": 1.8, + "learning_rate": 3.0546605457500496e-05, + "loss": 0.0101, + "step": 693000 + }, + { + "epoch": 1.8, + "eval_cer": 0.8816495001196689, + "eval_loss": 0.004749494604766369, + "eval_runtime": 107.7534, + "eval_samples_per_second": 18.561, + "eval_steps_per_second": 4.64, + "step": 693000 + }, + { + "epoch": 1.8, + "learning_rate": 3.054271724112903e-05, + "loss": 0.0095, + "step": 693010 + }, + { + "epoch": 1.8, + "learning_rate": 3.0538829024757566e-05, + "loss": 0.0098, + "step": 693020 + }, + { + "epoch": 1.8, + "learning_rate": 3.05349408083861e-05, + "loss": 0.0081, + "step": 693030 + }, + { + "epoch": 1.8, + "learning_rate": 3.0531052592014636e-05, + "loss": 0.0101, + "step": 693040 + }, + { + "epoch": 1.8, + "learning_rate": 3.052716437564317e-05, + "loss": 0.0067, + "step": 693050 + }, + { + "epoch": 1.8, + "learning_rate": 3.0523276159271705e-05, + "loss": 0.0094, + "step": 693060 + }, + { + "epoch": 1.8, + "learning_rate": 3.051938794290024e-05, + "loss": 0.0082, + "step": 693070 + }, + { + "epoch": 1.8, + "learning_rate": 3.051549972652878e-05, + "loss": 0.0078, + "step": 693080 + }, + { + "epoch": 1.8, + "learning_rate": 3.0511611510157313e-05, + "loss": 0.0077, + "step": 693090 + }, + { + "epoch": 1.8, + "learning_rate": 3.050772329378585e-05, + "loss": 0.0063, + "step": 693100 + }, + { + "epoch": 1.8, + "learning_rate": 3.0503835077414386e-05, + "loss": 0.0076, + "step": 693110 + }, + { + "epoch": 1.8, + "learning_rate": 3.049994686104292e-05, + "loss": 0.0085, + "step": 693120 + }, + { + "epoch": 1.8, + "learning_rate": 3.0496058644671456e-05, + "loss": 0.0059, + "step": 693130 + }, + { + "epoch": 1.8, + "learning_rate": 3.0492170428299994e-05, + "loss": 0.0096, + "step": 693140 + }, + { + "epoch": 1.8, + "learning_rate": 3.0488282211928526e-05, + "loss": 0.0056, + "step": 693150 + }, + { + "epoch": 1.8, + "learning_rate": 3.048439399555706e-05, + "loss": 0.0072, + "step": 693160 + }, + { + "epoch": 1.8, + "learning_rate": 3.0480505779185596e-05, + "loss": 0.0051, + "step": 693170 + }, + { + "epoch": 1.8, + "learning_rate": 3.047661756281413e-05, + "loss": 0.0062, + "step": 693180 + }, + { + "epoch": 1.8, + "learning_rate": 3.047272934644267e-05, + "loss": 0.0079, + "step": 693190 + }, + { + "epoch": 1.8, + "learning_rate": 3.0468841130071204e-05, + "loss": 0.0073, + "step": 693200 + }, + { + "epoch": 1.8, + "learning_rate": 3.046495291369974e-05, + "loss": 0.0084, + "step": 693210 + }, + { + "epoch": 1.8, + "learning_rate": 3.0461064697328273e-05, + "loss": 0.0073, + "step": 693220 + }, + { + "epoch": 1.8, + "learning_rate": 3.045717648095681e-05, + "loss": 0.0073, + "step": 693230 + }, + { + "epoch": 1.8, + "learning_rate": 3.0453288264585346e-05, + "loss": 0.0048, + "step": 693240 + }, + { + "epoch": 1.8, + "learning_rate": 3.044940004821388e-05, + "loss": 0.0102, + "step": 693250 + }, + { + "epoch": 1.8, + "learning_rate": 3.0445511831842416e-05, + "loss": 0.0093, + "step": 693260 + }, + { + "epoch": 1.8, + "learning_rate": 3.0441623615470954e-05, + "loss": 0.0064, + "step": 693270 + }, + { + "epoch": 1.8, + "learning_rate": 3.0437735399099486e-05, + "loss": 0.0091, + "step": 693280 + }, + { + "epoch": 1.8, + "learning_rate": 3.043384718272802e-05, + "loss": 0.0074, + "step": 693290 + }, + { + "epoch": 1.8, + "learning_rate": 3.0429958966356556e-05, + "loss": 0.008, + "step": 693300 + }, + { + "epoch": 1.8, + "learning_rate": 3.042607074998509e-05, + "loss": 0.0085, + "step": 693310 + }, + { + "epoch": 1.8, + "learning_rate": 3.042218253361363e-05, + "loss": 0.0093, + "step": 693320 + }, + { + "epoch": 1.8, + "learning_rate": 3.0418294317242164e-05, + "loss": 0.0062, + "step": 693330 + }, + { + "epoch": 1.8, + "learning_rate": 3.04144061008707e-05, + "loss": 0.0081, + "step": 693340 + }, + { + "epoch": 1.8, + "learning_rate": 3.0410517884499233e-05, + "loss": 0.0095, + "step": 693350 + }, + { + "epoch": 1.8, + "learning_rate": 3.040662966812777e-05, + "loss": 0.0085, + "step": 693360 + }, + { + "epoch": 1.8, + "learning_rate": 3.0402741451756306e-05, + "loss": 0.0078, + "step": 693370 + }, + { + "epoch": 1.8, + "learning_rate": 3.039885323538484e-05, + "loss": 0.007, + "step": 693380 + }, + { + "epoch": 1.8, + "learning_rate": 3.0394965019013376e-05, + "loss": 0.0087, + "step": 693390 + }, + { + "epoch": 1.8, + "learning_rate": 3.0391076802641908e-05, + "loss": 0.0087, + "step": 693400 + }, + { + "epoch": 1.8, + "learning_rate": 3.0387188586270446e-05, + "loss": 0.0043, + "step": 693410 + }, + { + "epoch": 1.8, + "learning_rate": 3.038330036989898e-05, + "loss": 0.0086, + "step": 693420 + }, + { + "epoch": 1.8, + "learning_rate": 3.0379412153527516e-05, + "loss": 0.0085, + "step": 693430 + }, + { + "epoch": 1.8, + "learning_rate": 3.037552393715605e-05, + "loss": 0.0059, + "step": 693440 + }, + { + "epoch": 1.8, + "learning_rate": 3.037163572078459e-05, + "loss": 0.0065, + "step": 693450 + }, + { + "epoch": 1.8, + "learning_rate": 3.0367747504413124e-05, + "loss": 0.0062, + "step": 693460 + }, + { + "epoch": 1.8, + "learning_rate": 3.036385928804166e-05, + "loss": 0.012, + "step": 693470 + }, + { + "epoch": 1.8, + "learning_rate": 3.0359971071670193e-05, + "loss": 0.0097, + "step": 693480 + }, + { + "epoch": 1.8, + "learning_rate": 3.035608285529873e-05, + "loss": 0.0073, + "step": 693490 + }, + { + "epoch": 1.8, + "learning_rate": 3.0352194638927266e-05, + "loss": 0.0085, + "step": 693500 + }, + { + "epoch": 1.8, + "learning_rate": 3.03483064225558e-05, + "loss": 0.0051, + "step": 693510 + }, + { + "epoch": 1.8, + "learning_rate": 3.0344418206184336e-05, + "loss": 0.006, + "step": 693520 + }, + { + "epoch": 1.8, + "learning_rate": 3.0340529989812868e-05, + "loss": 0.0079, + "step": 693530 + }, + { + "epoch": 1.8, + "learning_rate": 3.0336641773441406e-05, + "loss": 0.0069, + "step": 693540 + }, + { + "epoch": 1.8, + "learning_rate": 3.033275355706994e-05, + "loss": 0.0067, + "step": 693550 + }, + { + "epoch": 1.8, + "learning_rate": 3.0328865340698476e-05, + "loss": 0.0064, + "step": 693560 + }, + { + "epoch": 1.8, + "learning_rate": 3.032497712432701e-05, + "loss": 0.0083, + "step": 693570 + }, + { + "epoch": 1.8, + "learning_rate": 3.032108890795555e-05, + "loss": 0.0091, + "step": 693580 + }, + { + "epoch": 1.8, + "learning_rate": 3.0317200691584084e-05, + "loss": 0.0073, + "step": 693590 + }, + { + "epoch": 1.8, + "learning_rate": 3.031331247521262e-05, + "loss": 0.0061, + "step": 693600 + }, + { + "epoch": 1.8, + "learning_rate": 3.0309424258841153e-05, + "loss": 0.0078, + "step": 693610 + }, + { + "epoch": 1.8, + "learning_rate": 3.030553604246969e-05, + "loss": 0.0076, + "step": 693620 + }, + { + "epoch": 1.8, + "learning_rate": 3.0301647826098226e-05, + "loss": 0.0086, + "step": 693630 + }, + { + "epoch": 1.8, + "learning_rate": 3.029775960972676e-05, + "loss": 0.0075, + "step": 693640 + }, + { + "epoch": 1.8, + "learning_rate": 3.0293871393355293e-05, + "loss": 0.0074, + "step": 693650 + }, + { + "epoch": 1.8, + "learning_rate": 3.0289983176983828e-05, + "loss": 0.0059, + "step": 693660 + }, + { + "epoch": 1.8, + "learning_rate": 3.0286094960612366e-05, + "loss": 0.008, + "step": 693670 + }, + { + "epoch": 1.8, + "learning_rate": 3.02822067442409e-05, + "loss": 0.0063, + "step": 693680 + }, + { + "epoch": 1.8, + "learning_rate": 3.0278318527869436e-05, + "loss": 0.0066, + "step": 693690 + }, + { + "epoch": 1.8, + "learning_rate": 3.027443031149797e-05, + "loss": 0.0074, + "step": 693700 + }, + { + "epoch": 1.8, + "learning_rate": 3.027054209512651e-05, + "loss": 0.0076, + "step": 693710 + }, + { + "epoch": 1.8, + "learning_rate": 3.0266653878755044e-05, + "loss": 0.0089, + "step": 693720 + }, + { + "epoch": 1.8, + "learning_rate": 3.026276566238358e-05, + "loss": 0.0085, + "step": 693730 + }, + { + "epoch": 1.8, + "learning_rate": 3.0258877446012113e-05, + "loss": 0.0093, + "step": 693740 + }, + { + "epoch": 1.8, + "learning_rate": 3.025498922964065e-05, + "loss": 0.0068, + "step": 693750 + }, + { + "epoch": 1.8, + "learning_rate": 3.0251101013269186e-05, + "loss": 0.0084, + "step": 693760 + }, + { + "epoch": 1.8, + "learning_rate": 3.0247212796897718e-05, + "loss": 0.0095, + "step": 693770 + }, + { + "epoch": 1.8, + "learning_rate": 3.0243324580526253e-05, + "loss": 0.0083, + "step": 693780 + }, + { + "epoch": 1.8, + "learning_rate": 3.0239436364154788e-05, + "loss": 0.0114, + "step": 693790 + }, + { + "epoch": 1.8, + "learning_rate": 3.0235548147783326e-05, + "loss": 0.0059, + "step": 693800 + }, + { + "epoch": 1.8, + "learning_rate": 3.023165993141186e-05, + "loss": 0.0071, + "step": 693810 + }, + { + "epoch": 1.8, + "learning_rate": 3.0227771715040396e-05, + "loss": 0.0078, + "step": 693820 + }, + { + "epoch": 1.8, + "learning_rate": 3.022388349866893e-05, + "loss": 0.0057, + "step": 693830 + }, + { + "epoch": 1.8, + "learning_rate": 3.021999528229747e-05, + "loss": 0.0082, + "step": 693840 + }, + { + "epoch": 1.8, + "learning_rate": 3.0216107065926003e-05, + "loss": 0.0058, + "step": 693850 + }, + { + "epoch": 1.8, + "learning_rate": 3.021221884955454e-05, + "loss": 0.0056, + "step": 693860 + }, + { + "epoch": 1.8, + "learning_rate": 3.0208330633183073e-05, + "loss": 0.0099, + "step": 693870 + }, + { + "epoch": 1.8, + "learning_rate": 3.020444241681161e-05, + "loss": 0.007, + "step": 693880 + }, + { + "epoch": 1.8, + "learning_rate": 3.0200554200440146e-05, + "loss": 0.0064, + "step": 693890 + }, + { + "epoch": 1.8, + "learning_rate": 3.0196665984068678e-05, + "loss": 0.0073, + "step": 693900 + }, + { + "epoch": 1.8, + "learning_rate": 3.0192777767697213e-05, + "loss": 0.0082, + "step": 693910 + }, + { + "epoch": 1.8, + "learning_rate": 3.0188889551325748e-05, + "loss": 0.0074, + "step": 693920 + }, + { + "epoch": 1.8, + "learning_rate": 3.0185001334954286e-05, + "loss": 0.0084, + "step": 693930 + }, + { + "epoch": 1.8, + "learning_rate": 3.018111311858282e-05, + "loss": 0.0077, + "step": 693940 + }, + { + "epoch": 1.8, + "learning_rate": 3.0177224902211355e-05, + "loss": 0.0073, + "step": 693950 + }, + { + "epoch": 1.8, + "learning_rate": 3.017333668583989e-05, + "loss": 0.0083, + "step": 693960 + }, + { + "epoch": 1.8, + "learning_rate": 3.0169448469468425e-05, + "loss": 0.0098, + "step": 693970 + }, + { + "epoch": 1.8, + "learning_rate": 3.0165560253096963e-05, + "loss": 0.0079, + "step": 693980 + }, + { + "epoch": 1.8, + "learning_rate": 3.01616720367255e-05, + "loss": 0.0069, + "step": 693990 + }, + { + "epoch": 1.8, + "learning_rate": 3.0157783820354033e-05, + "loss": 0.0054, + "step": 694000 + }, + { + "epoch": 1.8, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004784898832440376, + "eval_runtime": 107.6263, + "eval_samples_per_second": 18.583, + "eval_steps_per_second": 4.646, + "step": 694000 + }, + { + "epoch": 1.8, + "learning_rate": 3.0153895603982568e-05, + "loss": 0.0083, + "step": 694010 + }, + { + "epoch": 1.8, + "learning_rate": 3.01500073876111e-05, + "loss": 0.0052, + "step": 694020 + }, + { + "epoch": 1.8, + "learning_rate": 3.0146119171239638e-05, + "loss": 0.0085, + "step": 694030 + }, + { + "epoch": 1.8, + "learning_rate": 3.0142230954868173e-05, + "loss": 0.0062, + "step": 694040 + }, + { + "epoch": 1.8, + "learning_rate": 3.0138342738496707e-05, + "loss": 0.0069, + "step": 694050 + }, + { + "epoch": 1.8, + "learning_rate": 3.0134454522125242e-05, + "loss": 0.0099, + "step": 694060 + }, + { + "epoch": 1.8, + "learning_rate": 3.013056630575378e-05, + "loss": 0.0084, + "step": 694070 + }, + { + "epoch": 1.8, + "learning_rate": 3.0126678089382315e-05, + "loss": 0.0077, + "step": 694080 + }, + { + "epoch": 1.8, + "learning_rate": 3.012278987301085e-05, + "loss": 0.009, + "step": 694090 + }, + { + "epoch": 1.8, + "learning_rate": 3.0118901656639385e-05, + "loss": 0.0085, + "step": 694100 + }, + { + "epoch": 1.8, + "learning_rate": 3.0115013440267923e-05, + "loss": 0.0083, + "step": 694110 + }, + { + "epoch": 1.8, + "learning_rate": 3.0111125223896458e-05, + "loss": 0.0064, + "step": 694120 + }, + { + "epoch": 1.8, + "learning_rate": 3.0107237007524993e-05, + "loss": 0.0077, + "step": 694130 + }, + { + "epoch": 1.8, + "learning_rate": 3.0103348791153528e-05, + "loss": 0.0094, + "step": 694140 + }, + { + "epoch": 1.8, + "learning_rate": 3.009946057478206e-05, + "loss": 0.0068, + "step": 694150 + }, + { + "epoch": 1.8, + "learning_rate": 3.0095572358410598e-05, + "loss": 0.0071, + "step": 694160 + }, + { + "epoch": 1.8, + "learning_rate": 3.0091684142039133e-05, + "loss": 0.0049, + "step": 694170 + }, + { + "epoch": 1.8, + "learning_rate": 3.0087795925667667e-05, + "loss": 0.0085, + "step": 694180 + }, + { + "epoch": 1.8, + "learning_rate": 3.0083907709296202e-05, + "loss": 0.0061, + "step": 694190 + }, + { + "epoch": 1.8, + "learning_rate": 3.008001949292474e-05, + "loss": 0.0077, + "step": 694200 + }, + { + "epoch": 1.8, + "learning_rate": 3.0076131276553275e-05, + "loss": 0.0078, + "step": 694210 + }, + { + "epoch": 1.8, + "learning_rate": 3.007224306018181e-05, + "loss": 0.0052, + "step": 694220 + }, + { + "epoch": 1.8, + "learning_rate": 3.0068354843810345e-05, + "loss": 0.0056, + "step": 694230 + }, + { + "epoch": 1.8, + "learning_rate": 3.0064466627438883e-05, + "loss": 0.0077, + "step": 694240 + }, + { + "epoch": 1.8, + "learning_rate": 3.0060578411067418e-05, + "loss": 0.0086, + "step": 694250 + }, + { + "epoch": 1.8, + "learning_rate": 3.0056690194695953e-05, + "loss": 0.008, + "step": 694260 + }, + { + "epoch": 1.8, + "learning_rate": 3.0052801978324485e-05, + "loss": 0.0077, + "step": 694270 + }, + { + "epoch": 1.8, + "learning_rate": 3.004891376195302e-05, + "loss": 0.0058, + "step": 694280 + }, + { + "epoch": 1.8, + "learning_rate": 3.0045025545581558e-05, + "loss": 0.0093, + "step": 694290 + }, + { + "epoch": 1.8, + "learning_rate": 3.0041137329210093e-05, + "loss": 0.0075, + "step": 694300 + }, + { + "epoch": 1.8, + "learning_rate": 3.0037249112838627e-05, + "loss": 0.0066, + "step": 694310 + }, + { + "epoch": 1.8, + "learning_rate": 3.0033360896467162e-05, + "loss": 0.0063, + "step": 694320 + }, + { + "epoch": 1.8, + "learning_rate": 3.00294726800957e-05, + "loss": 0.0088, + "step": 694330 + }, + { + "epoch": 1.8, + "learning_rate": 3.0025584463724235e-05, + "loss": 0.0078, + "step": 694340 + }, + { + "epoch": 1.8, + "learning_rate": 3.002169624735277e-05, + "loss": 0.0088, + "step": 694350 + }, + { + "epoch": 1.8, + "learning_rate": 3.0017808030981305e-05, + "loss": 0.01, + "step": 694360 + }, + { + "epoch": 1.8, + "learning_rate": 3.0013919814609843e-05, + "loss": 0.0057, + "step": 694370 + }, + { + "epoch": 1.8, + "learning_rate": 3.0010031598238378e-05, + "loss": 0.0085, + "step": 694380 + }, + { + "epoch": 1.8, + "learning_rate": 3.000614338186691e-05, + "loss": 0.0082, + "step": 694390 + }, + { + "epoch": 1.8, + "learning_rate": 3.0002255165495445e-05, + "loss": 0.0072, + "step": 694400 + }, + { + "epoch": 1.8, + "learning_rate": 2.999836694912398e-05, + "loss": 0.007, + "step": 694410 + }, + { + "epoch": 1.8, + "learning_rate": 2.9994478732752518e-05, + "loss": 0.0086, + "step": 694420 + }, + { + "epoch": 1.8, + "learning_rate": 2.9990590516381053e-05, + "loss": 0.0055, + "step": 694430 + }, + { + "epoch": 1.8, + "learning_rate": 2.9986702300009587e-05, + "loss": 0.0075, + "step": 694440 + }, + { + "epoch": 1.8, + "learning_rate": 2.9982814083638122e-05, + "loss": 0.0054, + "step": 694450 + }, + { + "epoch": 1.8, + "learning_rate": 2.997892586726666e-05, + "loss": 0.0064, + "step": 694460 + }, + { + "epoch": 1.8, + "learning_rate": 2.9975037650895195e-05, + "loss": 0.007, + "step": 694470 + }, + { + "epoch": 1.8, + "learning_rate": 2.997114943452373e-05, + "loss": 0.0065, + "step": 694480 + }, + { + "epoch": 1.8, + "learning_rate": 2.9967261218152265e-05, + "loss": 0.0161, + "step": 694490 + }, + { + "epoch": 1.8, + "learning_rate": 2.9963373001780803e-05, + "loss": 0.0084, + "step": 694500 + }, + { + "epoch": 1.8, + "learning_rate": 2.9959484785409338e-05, + "loss": 0.0044, + "step": 694510 + }, + { + "epoch": 1.8, + "learning_rate": 2.995559656903787e-05, + "loss": 0.0082, + "step": 694520 + }, + { + "epoch": 1.8, + "learning_rate": 2.9951708352666405e-05, + "loss": 0.01, + "step": 694530 + }, + { + "epoch": 1.8, + "learning_rate": 2.994782013629494e-05, + "loss": 0.0047, + "step": 694540 + }, + { + "epoch": 1.8, + "learning_rate": 2.9943931919923478e-05, + "loss": 0.0069, + "step": 694550 + }, + { + "epoch": 1.8, + "learning_rate": 2.9940043703552013e-05, + "loss": 0.006, + "step": 694560 + }, + { + "epoch": 1.8, + "learning_rate": 2.9936155487180547e-05, + "loss": 0.0093, + "step": 694570 + }, + { + "epoch": 1.8, + "learning_rate": 2.9932267270809082e-05, + "loss": 0.0117, + "step": 694580 + }, + { + "epoch": 1.8, + "learning_rate": 2.992837905443762e-05, + "loss": 0.0067, + "step": 694590 + }, + { + "epoch": 1.8, + "learning_rate": 2.9924490838066155e-05, + "loss": 0.0082, + "step": 694600 + }, + { + "epoch": 1.8, + "learning_rate": 2.992060262169469e-05, + "loss": 0.0077, + "step": 694610 + }, + { + "epoch": 1.8, + "learning_rate": 2.9916714405323225e-05, + "loss": 0.0084, + "step": 694620 + }, + { + "epoch": 1.8, + "learning_rate": 2.9912826188951763e-05, + "loss": 0.0068, + "step": 694630 + }, + { + "epoch": 1.8, + "learning_rate": 2.9908937972580295e-05, + "loss": 0.01, + "step": 694640 + }, + { + "epoch": 1.8, + "learning_rate": 2.990504975620883e-05, + "loss": 0.0085, + "step": 694650 + }, + { + "epoch": 1.8, + "learning_rate": 2.9901161539837365e-05, + "loss": 0.0065, + "step": 694660 + }, + { + "epoch": 1.8, + "learning_rate": 2.98972733234659e-05, + "loss": 0.0091, + "step": 694670 + }, + { + "epoch": 1.8, + "learning_rate": 2.9893385107094438e-05, + "loss": 0.0089, + "step": 694680 + }, + { + "epoch": 1.8, + "learning_rate": 2.9889496890722973e-05, + "loss": 0.0081, + "step": 694690 + }, + { + "epoch": 1.8, + "learning_rate": 2.9885608674351507e-05, + "loss": 0.0082, + "step": 694700 + }, + { + "epoch": 1.8, + "learning_rate": 2.9881720457980042e-05, + "loss": 0.0085, + "step": 694710 + }, + { + "epoch": 1.8, + "learning_rate": 2.987783224160858e-05, + "loss": 0.008, + "step": 694720 + }, + { + "epoch": 1.8, + "learning_rate": 2.9873944025237115e-05, + "loss": 0.0071, + "step": 694730 + }, + { + "epoch": 1.8, + "learning_rate": 2.987005580886565e-05, + "loss": 0.0084, + "step": 694740 + }, + { + "epoch": 1.8, + "learning_rate": 2.9866167592494185e-05, + "loss": 0.0079, + "step": 694750 + }, + { + "epoch": 1.8, + "learning_rate": 2.9862279376122723e-05, + "loss": 0.0062, + "step": 694760 + }, + { + "epoch": 1.8, + "learning_rate": 2.9858391159751255e-05, + "loss": 0.0104, + "step": 694770 + }, + { + "epoch": 1.8, + "learning_rate": 2.985450294337979e-05, + "loss": 0.0079, + "step": 694780 + }, + { + "epoch": 1.8, + "learning_rate": 2.9850614727008325e-05, + "loss": 0.008, + "step": 694790 + }, + { + "epoch": 1.8, + "learning_rate": 2.984672651063686e-05, + "loss": 0.006, + "step": 694800 + }, + { + "epoch": 1.8, + "learning_rate": 2.9842838294265398e-05, + "loss": 0.0117, + "step": 694810 + }, + { + "epoch": 1.8, + "learning_rate": 2.9838950077893932e-05, + "loss": 0.0093, + "step": 694820 + }, + { + "epoch": 1.8, + "learning_rate": 2.9835061861522467e-05, + "loss": 0.0068, + "step": 694830 + }, + { + "epoch": 1.8, + "learning_rate": 2.9831173645151002e-05, + "loss": 0.0088, + "step": 694840 + }, + { + "epoch": 1.8, + "learning_rate": 2.982728542877954e-05, + "loss": 0.0091, + "step": 694850 + }, + { + "epoch": 1.8, + "learning_rate": 2.9823397212408075e-05, + "loss": 0.0075, + "step": 694860 + }, + { + "epoch": 1.8, + "learning_rate": 2.981950899603661e-05, + "loss": 0.0054, + "step": 694870 + }, + { + "epoch": 1.8, + "learning_rate": 2.9815620779665145e-05, + "loss": 0.0076, + "step": 694880 + }, + { + "epoch": 1.8, + "learning_rate": 2.9811732563293677e-05, + "loss": 0.0092, + "step": 694890 + }, + { + "epoch": 1.8, + "learning_rate": 2.9807844346922215e-05, + "loss": 0.0069, + "step": 694900 + }, + { + "epoch": 1.8, + "learning_rate": 2.980395613055075e-05, + "loss": 0.0064, + "step": 694910 + }, + { + "epoch": 1.8, + "learning_rate": 2.9800067914179284e-05, + "loss": 0.0075, + "step": 694920 + }, + { + "epoch": 1.8, + "learning_rate": 2.979617969780782e-05, + "loss": 0.0073, + "step": 694930 + }, + { + "epoch": 1.8, + "learning_rate": 2.9792291481436358e-05, + "loss": 0.0077, + "step": 694940 + }, + { + "epoch": 1.8, + "learning_rate": 2.9788403265064892e-05, + "loss": 0.008, + "step": 694950 + }, + { + "epoch": 1.8, + "learning_rate": 2.9784515048693427e-05, + "loss": 0.0084, + "step": 694960 + }, + { + "epoch": 1.8, + "learning_rate": 2.9780626832321962e-05, + "loss": 0.0057, + "step": 694970 + }, + { + "epoch": 1.8, + "learning_rate": 2.97767386159505e-05, + "loss": 0.0087, + "step": 694980 + }, + { + "epoch": 1.8, + "learning_rate": 2.9772850399579035e-05, + "loss": 0.0091, + "step": 694990 + }, + { + "epoch": 1.8, + "learning_rate": 2.976896218320757e-05, + "loss": 0.006, + "step": 695000 + }, + { + "epoch": 1.8, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.004791451618075371, + "eval_runtime": 107.7436, + "eval_samples_per_second": 18.563, + "eval_steps_per_second": 4.641, + "step": 695000 + }, + { + "epoch": 1.8, + "learning_rate": 2.97650739668361e-05, + "loss": 0.0068, + "step": 695010 + }, + { + "epoch": 1.8, + "learning_rate": 2.9761185750464636e-05, + "loss": 0.0071, + "step": 695020 + }, + { + "epoch": 1.8, + "learning_rate": 2.9757297534093175e-05, + "loss": 0.0068, + "step": 695030 + }, + { + "epoch": 1.8, + "learning_rate": 2.975340931772171e-05, + "loss": 0.0083, + "step": 695040 + }, + { + "epoch": 1.8, + "learning_rate": 2.9749521101350244e-05, + "loss": 0.0074, + "step": 695050 + }, + { + "epoch": 1.8, + "learning_rate": 2.974563288497878e-05, + "loss": 0.0067, + "step": 695060 + }, + { + "epoch": 1.8, + "learning_rate": 2.9741744668607318e-05, + "loss": 0.0067, + "step": 695070 + }, + { + "epoch": 1.8, + "learning_rate": 2.9737856452235852e-05, + "loss": 0.0086, + "step": 695080 + }, + { + "epoch": 1.8, + "learning_rate": 2.9733968235864387e-05, + "loss": 0.0098, + "step": 695090 + }, + { + "epoch": 1.8, + "learning_rate": 2.9730080019492922e-05, + "loss": 0.0082, + "step": 695100 + }, + { + "epoch": 1.8, + "learning_rate": 2.972619180312146e-05, + "loss": 0.0086, + "step": 695110 + }, + { + "epoch": 1.8, + "learning_rate": 2.9722303586749995e-05, + "loss": 0.0067, + "step": 695120 + }, + { + "epoch": 1.8, + "learning_rate": 2.971841537037853e-05, + "loss": 0.0071, + "step": 695130 + }, + { + "epoch": 1.8, + "learning_rate": 2.971452715400706e-05, + "loss": 0.0089, + "step": 695140 + }, + { + "epoch": 1.8, + "learning_rate": 2.9710638937635596e-05, + "loss": 0.0102, + "step": 695150 + }, + { + "epoch": 1.8, + "learning_rate": 2.9706750721264135e-05, + "loss": 0.0084, + "step": 695160 + }, + { + "epoch": 1.8, + "learning_rate": 2.970286250489267e-05, + "loss": 0.009, + "step": 695170 + }, + { + "epoch": 1.8, + "learning_rate": 2.9698974288521204e-05, + "loss": 0.0071, + "step": 695180 + }, + { + "epoch": 1.8, + "learning_rate": 2.969508607214974e-05, + "loss": 0.0072, + "step": 695190 + }, + { + "epoch": 1.8, + "learning_rate": 2.9691197855778278e-05, + "loss": 0.0094, + "step": 695200 + }, + { + "epoch": 1.8, + "learning_rate": 2.9687309639406812e-05, + "loss": 0.0067, + "step": 695210 + }, + { + "epoch": 1.8, + "learning_rate": 2.9683421423035347e-05, + "loss": 0.0068, + "step": 695220 + }, + { + "epoch": 1.8, + "learning_rate": 2.9679533206663882e-05, + "loss": 0.0092, + "step": 695230 + }, + { + "epoch": 1.8, + "learning_rate": 2.967564499029242e-05, + "loss": 0.0066, + "step": 695240 + }, + { + "epoch": 1.8, + "learning_rate": 2.9671756773920955e-05, + "loss": 0.0068, + "step": 695250 + }, + { + "epoch": 1.8, + "learning_rate": 2.9667868557549487e-05, + "loss": 0.009, + "step": 695260 + }, + { + "epoch": 1.8, + "learning_rate": 2.966398034117802e-05, + "loss": 0.0072, + "step": 695270 + }, + { + "epoch": 1.8, + "learning_rate": 2.9660092124806556e-05, + "loss": 0.0061, + "step": 695280 + }, + { + "epoch": 1.8, + "learning_rate": 2.9656203908435095e-05, + "loss": 0.0067, + "step": 695290 + }, + { + "epoch": 1.8, + "learning_rate": 2.965231569206363e-05, + "loss": 0.0115, + "step": 695300 + }, + { + "epoch": 1.8, + "learning_rate": 2.9648427475692164e-05, + "loss": 0.0072, + "step": 695310 + }, + { + "epoch": 1.8, + "learning_rate": 2.96445392593207e-05, + "loss": 0.007, + "step": 695320 + }, + { + "epoch": 1.8, + "learning_rate": 2.9640651042949234e-05, + "loss": 0.0072, + "step": 695330 + }, + { + "epoch": 1.8, + "learning_rate": 2.9636762826577772e-05, + "loss": 0.0081, + "step": 695340 + }, + { + "epoch": 1.8, + "learning_rate": 2.9632874610206307e-05, + "loss": 0.0044, + "step": 695350 + }, + { + "epoch": 1.8, + "learning_rate": 2.9628986393834842e-05, + "loss": 0.0065, + "step": 695360 + }, + { + "epoch": 1.8, + "learning_rate": 2.9625098177463377e-05, + "loss": 0.0087, + "step": 695370 + }, + { + "epoch": 1.8, + "learning_rate": 2.9621209961091915e-05, + "loss": 0.0099, + "step": 695380 + }, + { + "epoch": 1.8, + "learning_rate": 2.9617321744720447e-05, + "loss": 0.0067, + "step": 695390 + }, + { + "epoch": 1.8, + "learning_rate": 2.961343352834898e-05, + "loss": 0.0068, + "step": 695400 + }, + { + "epoch": 1.8, + "learning_rate": 2.9609545311977516e-05, + "loss": 0.0074, + "step": 695410 + }, + { + "epoch": 1.8, + "learning_rate": 2.960565709560605e-05, + "loss": 0.0064, + "step": 695420 + }, + { + "epoch": 1.8, + "learning_rate": 2.960176887923459e-05, + "loss": 0.009, + "step": 695430 + }, + { + "epoch": 1.8, + "learning_rate": 2.9597880662863124e-05, + "loss": 0.0077, + "step": 695440 + }, + { + "epoch": 1.8, + "learning_rate": 2.959399244649166e-05, + "loss": 0.0077, + "step": 695450 + }, + { + "epoch": 1.8, + "learning_rate": 2.9590104230120194e-05, + "loss": 0.0069, + "step": 695460 + }, + { + "epoch": 1.8, + "learning_rate": 2.9586216013748732e-05, + "loss": 0.0089, + "step": 695470 + }, + { + "epoch": 1.8, + "learning_rate": 2.9582327797377267e-05, + "loss": 0.0056, + "step": 695480 + }, + { + "epoch": 1.8, + "learning_rate": 2.9578439581005802e-05, + "loss": 0.0116, + "step": 695490 + }, + { + "epoch": 1.8, + "learning_rate": 2.9574551364634337e-05, + "loss": 0.006, + "step": 695500 + }, + { + "epoch": 1.8, + "learning_rate": 2.957066314826287e-05, + "loss": 0.0073, + "step": 695510 + }, + { + "epoch": 1.8, + "learning_rate": 2.9566774931891407e-05, + "loss": 0.0092, + "step": 695520 + }, + { + "epoch": 1.8, + "learning_rate": 2.956288671551994e-05, + "loss": 0.0064, + "step": 695530 + }, + { + "epoch": 1.8, + "learning_rate": 2.9558998499148476e-05, + "loss": 0.0062, + "step": 695540 + }, + { + "epoch": 1.8, + "learning_rate": 2.955511028277701e-05, + "loss": 0.0077, + "step": 695550 + }, + { + "epoch": 1.8, + "learning_rate": 2.955122206640555e-05, + "loss": 0.009, + "step": 695560 + }, + { + "epoch": 1.8, + "learning_rate": 2.9547333850034084e-05, + "loss": 0.0082, + "step": 695570 + }, + { + "epoch": 1.8, + "learning_rate": 2.954344563366262e-05, + "loss": 0.0051, + "step": 695580 + }, + { + "epoch": 1.8, + "learning_rate": 2.9539557417291154e-05, + "loss": 0.0059, + "step": 695590 + }, + { + "epoch": 1.8, + "learning_rate": 2.9535669200919692e-05, + "loss": 0.0086, + "step": 695600 + }, + { + "epoch": 1.8, + "learning_rate": 2.9531780984548227e-05, + "loss": 0.0071, + "step": 695610 + }, + { + "epoch": 1.8, + "learning_rate": 2.9527892768176762e-05, + "loss": 0.0065, + "step": 695620 + }, + { + "epoch": 1.8, + "learning_rate": 2.9524004551805294e-05, + "loss": 0.0085, + "step": 695630 + }, + { + "epoch": 1.8, + "learning_rate": 2.952011633543383e-05, + "loss": 0.0078, + "step": 695640 + }, + { + "epoch": 1.8, + "learning_rate": 2.9516228119062367e-05, + "loss": 0.0067, + "step": 695650 + }, + { + "epoch": 1.8, + "learning_rate": 2.95123399026909e-05, + "loss": 0.0103, + "step": 695660 + }, + { + "epoch": 1.8, + "learning_rate": 2.9508451686319436e-05, + "loss": 0.0055, + "step": 695670 + }, + { + "epoch": 1.8, + "learning_rate": 2.950456346994797e-05, + "loss": 0.0063, + "step": 695680 + }, + { + "epoch": 1.8, + "learning_rate": 2.950067525357651e-05, + "loss": 0.0054, + "step": 695690 + }, + { + "epoch": 1.8, + "learning_rate": 2.9496787037205044e-05, + "loss": 0.0066, + "step": 695700 + }, + { + "epoch": 1.8, + "learning_rate": 2.949289882083358e-05, + "loss": 0.0071, + "step": 695710 + }, + { + "epoch": 1.8, + "learning_rate": 2.9489010604462114e-05, + "loss": 0.0051, + "step": 695720 + }, + { + "epoch": 1.8, + "learning_rate": 2.9485122388090652e-05, + "loss": 0.0071, + "step": 695730 + }, + { + "epoch": 1.8, + "learning_rate": 2.9481234171719187e-05, + "loss": 0.0062, + "step": 695740 + }, + { + "epoch": 1.8, + "learning_rate": 2.9477345955347722e-05, + "loss": 0.0094, + "step": 695750 + }, + { + "epoch": 1.8, + "learning_rate": 2.9473457738976254e-05, + "loss": 0.0092, + "step": 695760 + }, + { + "epoch": 1.8, + "learning_rate": 2.946956952260479e-05, + "loss": 0.0071, + "step": 695770 + }, + { + "epoch": 1.8, + "learning_rate": 2.9465681306233327e-05, + "loss": 0.0079, + "step": 695780 + }, + { + "epoch": 1.8, + "learning_rate": 2.946179308986186e-05, + "loss": 0.0091, + "step": 695790 + }, + { + "epoch": 1.8, + "learning_rate": 2.9457904873490396e-05, + "loss": 0.0066, + "step": 695800 + }, + { + "epoch": 1.8, + "learning_rate": 2.945401665711893e-05, + "loss": 0.0074, + "step": 695810 + }, + { + "epoch": 1.8, + "learning_rate": 2.945012844074747e-05, + "loss": 0.0069, + "step": 695820 + }, + { + "epoch": 1.8, + "learning_rate": 2.9446240224376004e-05, + "loss": 0.0087, + "step": 695830 + }, + { + "epoch": 1.8, + "learning_rate": 2.944235200800454e-05, + "loss": 0.0058, + "step": 695840 + }, + { + "epoch": 1.8, + "learning_rate": 2.9438463791633074e-05, + "loss": 0.0069, + "step": 695850 + }, + { + "epoch": 1.8, + "learning_rate": 2.9434575575261612e-05, + "loss": 0.0063, + "step": 695860 + }, + { + "epoch": 1.8, + "learning_rate": 2.9430687358890147e-05, + "loss": 0.0102, + "step": 695870 + }, + { + "epoch": 1.8, + "learning_rate": 2.942679914251868e-05, + "loss": 0.0098, + "step": 695880 + }, + { + "epoch": 1.8, + "learning_rate": 2.9422910926147213e-05, + "loss": 0.0089, + "step": 695890 + }, + { + "epoch": 1.8, + "learning_rate": 2.941902270977575e-05, + "loss": 0.0072, + "step": 695900 + }, + { + "epoch": 1.8, + "learning_rate": 2.9415134493404287e-05, + "loss": 0.0076, + "step": 695910 + }, + { + "epoch": 1.8, + "learning_rate": 2.941124627703282e-05, + "loss": 0.0105, + "step": 695920 + }, + { + "epoch": 1.8, + "learning_rate": 2.9407358060661356e-05, + "loss": 0.0059, + "step": 695930 + }, + { + "epoch": 1.8, + "learning_rate": 2.940346984428989e-05, + "loss": 0.009, + "step": 695940 + }, + { + "epoch": 1.8, + "learning_rate": 2.939958162791843e-05, + "loss": 0.0087, + "step": 695950 + }, + { + "epoch": 1.8, + "learning_rate": 2.9395693411546964e-05, + "loss": 0.0071, + "step": 695960 + }, + { + "epoch": 1.8, + "learning_rate": 2.93918051951755e-05, + "loss": 0.008, + "step": 695970 + }, + { + "epoch": 1.8, + "learning_rate": 2.9387916978804034e-05, + "loss": 0.0101, + "step": 695980 + }, + { + "epoch": 1.8, + "learning_rate": 2.9384028762432572e-05, + "loss": 0.0097, + "step": 695990 + }, + { + "epoch": 1.8, + "learning_rate": 2.9380140546061107e-05, + "loss": 0.0075, + "step": 696000 + }, + { + "epoch": 1.8, + "eval_cer": 0.8816327044764588, + "eval_loss": 0.004856035113334656, + "eval_runtime": 107.862, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.636, + "step": 696000 + }, + { + "epoch": 1.8, + "learning_rate": 2.937625232968964e-05, + "loss": 0.0067, + "step": 696010 + }, + { + "epoch": 1.8, + "learning_rate": 2.9372364113318173e-05, + "loss": 0.0093, + "step": 696020 + }, + { + "epoch": 1.8, + "learning_rate": 2.936847589694671e-05, + "loss": 0.0081, + "step": 696030 + }, + { + "epoch": 1.8, + "learning_rate": 2.9364587680575247e-05, + "loss": 0.0079, + "step": 696040 + }, + { + "epoch": 1.8, + "learning_rate": 2.936069946420378e-05, + "loss": 0.0092, + "step": 696050 + }, + { + "epoch": 1.8, + "learning_rate": 2.9356811247832316e-05, + "loss": 0.0074, + "step": 696060 + }, + { + "epoch": 1.8, + "learning_rate": 2.935292303146085e-05, + "loss": 0.0087, + "step": 696070 + }, + { + "epoch": 1.8, + "learning_rate": 2.934903481508939e-05, + "loss": 0.0082, + "step": 696080 + }, + { + "epoch": 1.8, + "learning_rate": 2.9345146598717924e-05, + "loss": 0.0094, + "step": 696090 + }, + { + "epoch": 1.8, + "learning_rate": 2.934125838234646e-05, + "loss": 0.0068, + "step": 696100 + }, + { + "epoch": 1.8, + "learning_rate": 2.9337370165974994e-05, + "loss": 0.01, + "step": 696110 + }, + { + "epoch": 1.8, + "learning_rate": 2.9333481949603532e-05, + "loss": 0.0044, + "step": 696120 + }, + { + "epoch": 1.8, + "learning_rate": 2.9329593733232064e-05, + "loss": 0.0076, + "step": 696130 + }, + { + "epoch": 1.8, + "learning_rate": 2.93257055168606e-05, + "loss": 0.0076, + "step": 696140 + }, + { + "epoch": 1.8, + "learning_rate": 2.9321817300489133e-05, + "loss": 0.0061, + "step": 696150 + }, + { + "epoch": 1.8, + "learning_rate": 2.9317929084117668e-05, + "loss": 0.0067, + "step": 696160 + }, + { + "epoch": 1.8, + "learning_rate": 2.9314040867746207e-05, + "loss": 0.0063, + "step": 696170 + }, + { + "epoch": 1.8, + "learning_rate": 2.931015265137474e-05, + "loss": 0.0075, + "step": 696180 + }, + { + "epoch": 1.8, + "learning_rate": 2.9306264435003276e-05, + "loss": 0.0074, + "step": 696190 + }, + { + "epoch": 1.8, + "learning_rate": 2.930237621863181e-05, + "loss": 0.0049, + "step": 696200 + }, + { + "epoch": 1.8, + "learning_rate": 2.929848800226035e-05, + "loss": 0.0107, + "step": 696210 + }, + { + "epoch": 1.8, + "learning_rate": 2.9294599785888884e-05, + "loss": 0.0104, + "step": 696220 + }, + { + "epoch": 1.8, + "learning_rate": 2.929071156951742e-05, + "loss": 0.0075, + "step": 696230 + }, + { + "epoch": 1.8, + "learning_rate": 2.9286823353145954e-05, + "loss": 0.0061, + "step": 696240 + }, + { + "epoch": 1.8, + "learning_rate": 2.9282935136774485e-05, + "loss": 0.0098, + "step": 696250 + }, + { + "epoch": 1.8, + "learning_rate": 2.9279046920403024e-05, + "loss": 0.0066, + "step": 696260 + }, + { + "epoch": 1.8, + "learning_rate": 2.927515870403156e-05, + "loss": 0.0059, + "step": 696270 + }, + { + "epoch": 1.8, + "learning_rate": 2.9271270487660093e-05, + "loss": 0.0063, + "step": 696280 + }, + { + "epoch": 1.8, + "learning_rate": 2.9267382271288628e-05, + "loss": 0.0095, + "step": 696290 + }, + { + "epoch": 1.8, + "learning_rate": 2.9263494054917167e-05, + "loss": 0.0061, + "step": 696300 + }, + { + "epoch": 1.8, + "learning_rate": 2.92596058385457e-05, + "loss": 0.0081, + "step": 696310 + }, + { + "epoch": 1.8, + "learning_rate": 2.9255717622174236e-05, + "loss": 0.0081, + "step": 696320 + }, + { + "epoch": 1.8, + "learning_rate": 2.925182940580277e-05, + "loss": 0.0075, + "step": 696330 + }, + { + "epoch": 1.81, + "learning_rate": 2.924794118943131e-05, + "loss": 0.0068, + "step": 696340 + }, + { + "epoch": 1.81, + "learning_rate": 2.9244052973059844e-05, + "loss": 0.0119, + "step": 696350 + }, + { + "epoch": 1.81, + "learning_rate": 2.924016475668838e-05, + "loss": 0.0085, + "step": 696360 + }, + { + "epoch": 1.81, + "learning_rate": 2.9236276540316914e-05, + "loss": 0.0096, + "step": 696370 + }, + { + "epoch": 1.81, + "learning_rate": 2.9232388323945445e-05, + "loss": 0.0063, + "step": 696380 + }, + { + "epoch": 1.81, + "learning_rate": 2.9228500107573984e-05, + "loss": 0.0064, + "step": 696390 + }, + { + "epoch": 1.81, + "learning_rate": 2.922461189120252e-05, + "loss": 0.0083, + "step": 696400 + }, + { + "epoch": 1.81, + "learning_rate": 2.9220723674831053e-05, + "loss": 0.0079, + "step": 696410 + }, + { + "epoch": 1.81, + "learning_rate": 2.9216835458459588e-05, + "loss": 0.0084, + "step": 696420 + }, + { + "epoch": 1.81, + "learning_rate": 2.9212947242088126e-05, + "loss": 0.0059, + "step": 696430 + }, + { + "epoch": 1.81, + "learning_rate": 2.920905902571666e-05, + "loss": 0.0082, + "step": 696440 + }, + { + "epoch": 1.81, + "learning_rate": 2.9205170809345196e-05, + "loss": 0.0092, + "step": 696450 + }, + { + "epoch": 1.81, + "learning_rate": 2.920128259297373e-05, + "loss": 0.0068, + "step": 696460 + }, + { + "epoch": 1.81, + "learning_rate": 2.919739437660227e-05, + "loss": 0.0056, + "step": 696470 + }, + { + "epoch": 1.81, + "learning_rate": 2.9193506160230804e-05, + "loss": 0.0143, + "step": 696480 + }, + { + "epoch": 1.81, + "learning_rate": 2.918961794385934e-05, + "loss": 0.0075, + "step": 696490 + }, + { + "epoch": 1.81, + "learning_rate": 2.918572972748787e-05, + "loss": 0.011, + "step": 696500 + }, + { + "epoch": 1.81, + "learning_rate": 2.9181841511116405e-05, + "loss": 0.0062, + "step": 696510 + }, + { + "epoch": 1.81, + "learning_rate": 2.9177953294744944e-05, + "loss": 0.0065, + "step": 696520 + }, + { + "epoch": 1.81, + "learning_rate": 2.917406507837348e-05, + "loss": 0.0081, + "step": 696530 + }, + { + "epoch": 1.81, + "learning_rate": 2.9170176862002013e-05, + "loss": 0.0065, + "step": 696540 + }, + { + "epoch": 1.81, + "learning_rate": 2.9166288645630548e-05, + "loss": 0.0058, + "step": 696550 + }, + { + "epoch": 1.81, + "learning_rate": 2.9162400429259086e-05, + "loss": 0.0086, + "step": 696560 + }, + { + "epoch": 1.81, + "learning_rate": 2.915851221288762e-05, + "loss": 0.0067, + "step": 696570 + }, + { + "epoch": 1.81, + "learning_rate": 2.9154623996516156e-05, + "loss": 0.006, + "step": 696580 + }, + { + "epoch": 1.81, + "learning_rate": 2.915073578014469e-05, + "loss": 0.0071, + "step": 696590 + }, + { + "epoch": 1.81, + "learning_rate": 2.914684756377323e-05, + "loss": 0.0083, + "step": 696600 + }, + { + "epoch": 1.81, + "learning_rate": 2.9142959347401764e-05, + "loss": 0.0078, + "step": 696610 + }, + { + "epoch": 1.81, + "learning_rate": 2.91390711310303e-05, + "loss": 0.0063, + "step": 696620 + }, + { + "epoch": 1.81, + "learning_rate": 2.913518291465883e-05, + "loss": 0.0056, + "step": 696630 + }, + { + "epoch": 1.81, + "learning_rate": 2.9131294698287365e-05, + "loss": 0.0087, + "step": 696640 + }, + { + "epoch": 1.81, + "learning_rate": 2.9127406481915904e-05, + "loss": 0.0079, + "step": 696650 + }, + { + "epoch": 1.81, + "learning_rate": 2.912351826554444e-05, + "loss": 0.0077, + "step": 696660 + }, + { + "epoch": 1.81, + "learning_rate": 2.9119630049172973e-05, + "loss": 0.0091, + "step": 696670 + }, + { + "epoch": 1.81, + "learning_rate": 2.9115741832801508e-05, + "loss": 0.0072, + "step": 696680 + }, + { + "epoch": 1.81, + "learning_rate": 2.9111853616430046e-05, + "loss": 0.0057, + "step": 696690 + }, + { + "epoch": 1.81, + "learning_rate": 2.910796540005858e-05, + "loss": 0.0048, + "step": 696700 + }, + { + "epoch": 1.81, + "learning_rate": 2.9104077183687116e-05, + "loss": 0.0088, + "step": 696710 + }, + { + "epoch": 1.81, + "learning_rate": 2.910018896731565e-05, + "loss": 0.0059, + "step": 696720 + }, + { + "epoch": 1.81, + "learning_rate": 2.9096300750944186e-05, + "loss": 0.0071, + "step": 696730 + }, + { + "epoch": 1.81, + "learning_rate": 2.9092412534572724e-05, + "loss": 0.0062, + "step": 696740 + }, + { + "epoch": 1.81, + "learning_rate": 2.9088524318201256e-05, + "loss": 0.0076, + "step": 696750 + }, + { + "epoch": 1.81, + "learning_rate": 2.908463610182979e-05, + "loss": 0.0071, + "step": 696760 + }, + { + "epoch": 1.81, + "learning_rate": 2.9080747885458325e-05, + "loss": 0.0107, + "step": 696770 + }, + { + "epoch": 1.81, + "learning_rate": 2.907685966908686e-05, + "loss": 0.0069, + "step": 696780 + }, + { + "epoch": 1.81, + "learning_rate": 2.90729714527154e-05, + "loss": 0.0057, + "step": 696790 + }, + { + "epoch": 1.81, + "learning_rate": 2.9069083236343933e-05, + "loss": 0.0078, + "step": 696800 + }, + { + "epoch": 1.81, + "learning_rate": 2.9065195019972468e-05, + "loss": 0.007, + "step": 696810 + }, + { + "epoch": 1.81, + "learning_rate": 2.9061306803601003e-05, + "loss": 0.0079, + "step": 696820 + }, + { + "epoch": 1.81, + "learning_rate": 2.905741858722954e-05, + "loss": 0.0082, + "step": 696830 + }, + { + "epoch": 1.81, + "learning_rate": 2.9053530370858076e-05, + "loss": 0.0082, + "step": 696840 + }, + { + "epoch": 1.81, + "learning_rate": 2.904964215448661e-05, + "loss": 0.0071, + "step": 696850 + }, + { + "epoch": 1.81, + "learning_rate": 2.9045753938115146e-05, + "loss": 0.0075, + "step": 696860 + }, + { + "epoch": 1.81, + "learning_rate": 2.9041865721743677e-05, + "loss": 0.0085, + "step": 696870 + }, + { + "epoch": 1.81, + "learning_rate": 2.9037977505372216e-05, + "loss": 0.0078, + "step": 696880 + }, + { + "epoch": 1.81, + "learning_rate": 2.903408928900075e-05, + "loss": 0.0073, + "step": 696890 + }, + { + "epoch": 1.81, + "learning_rate": 2.9030201072629285e-05, + "loss": 0.0089, + "step": 696900 + }, + { + "epoch": 1.81, + "learning_rate": 2.902631285625782e-05, + "loss": 0.0078, + "step": 696910 + }, + { + "epoch": 1.81, + "learning_rate": 2.902242463988636e-05, + "loss": 0.007, + "step": 696920 + }, + { + "epoch": 1.81, + "learning_rate": 2.9018536423514893e-05, + "loss": 0.0085, + "step": 696930 + }, + { + "epoch": 1.81, + "learning_rate": 2.9014648207143428e-05, + "loss": 0.0078, + "step": 696940 + }, + { + "epoch": 1.81, + "learning_rate": 2.9010759990771963e-05, + "loss": 0.0088, + "step": 696950 + }, + { + "epoch": 1.81, + "learning_rate": 2.90068717744005e-05, + "loss": 0.0065, + "step": 696960 + }, + { + "epoch": 1.81, + "learning_rate": 2.9002983558029036e-05, + "loss": 0.0059, + "step": 696970 + }, + { + "epoch": 1.81, + "learning_rate": 2.899909534165757e-05, + "loss": 0.0056, + "step": 696980 + }, + { + "epoch": 1.81, + "learning_rate": 2.8995207125286106e-05, + "loss": 0.0086, + "step": 696990 + }, + { + "epoch": 1.81, + "learning_rate": 2.8991318908914637e-05, + "loss": 0.0083, + "step": 697000 + }, + { + "epoch": 1.81, + "eval_cer": 0.8816564983043399, + "eval_loss": 0.004735656548291445, + "eval_runtime": 107.8044, + "eval_samples_per_second": 18.552, + "eval_steps_per_second": 4.638, + "step": 697000 + }, + { + "epoch": 1.81, + "learning_rate": 2.8987430692543176e-05, + "loss": 0.0103, + "step": 697010 + }, + { + "epoch": 1.81, + "learning_rate": 2.898354247617171e-05, + "loss": 0.0063, + "step": 697020 + }, + { + "epoch": 1.81, + "learning_rate": 2.8979654259800245e-05, + "loss": 0.0114, + "step": 697030 + }, + { + "epoch": 1.81, + "learning_rate": 2.897576604342878e-05, + "loss": 0.0059, + "step": 697040 + }, + { + "epoch": 1.81, + "learning_rate": 2.897187782705732e-05, + "loss": 0.0089, + "step": 697050 + }, + { + "epoch": 1.81, + "learning_rate": 2.8967989610685853e-05, + "loss": 0.0079, + "step": 697060 + }, + { + "epoch": 1.81, + "learning_rate": 2.8964101394314388e-05, + "loss": 0.0086, + "step": 697070 + }, + { + "epoch": 1.81, + "learning_rate": 2.8960213177942923e-05, + "loss": 0.0051, + "step": 697080 + }, + { + "epoch": 1.81, + "learning_rate": 2.895632496157146e-05, + "loss": 0.0071, + "step": 697090 + }, + { + "epoch": 1.81, + "learning_rate": 2.8952436745199996e-05, + "loss": 0.007, + "step": 697100 + }, + { + "epoch": 1.81, + "learning_rate": 2.894854852882853e-05, + "loss": 0.007, + "step": 697110 + }, + { + "epoch": 1.81, + "learning_rate": 2.8944660312457062e-05, + "loss": 0.0074, + "step": 697120 + }, + { + "epoch": 1.81, + "learning_rate": 2.8940772096085597e-05, + "loss": 0.0054, + "step": 697130 + }, + { + "epoch": 1.81, + "learning_rate": 2.8936883879714136e-05, + "loss": 0.0055, + "step": 697140 + }, + { + "epoch": 1.81, + "learning_rate": 2.893299566334267e-05, + "loss": 0.0064, + "step": 697150 + }, + { + "epoch": 1.81, + "learning_rate": 2.8929107446971205e-05, + "loss": 0.0115, + "step": 697160 + }, + { + "epoch": 1.81, + "learning_rate": 2.892521923059974e-05, + "loss": 0.0075, + "step": 697170 + }, + { + "epoch": 1.81, + "learning_rate": 2.892133101422828e-05, + "loss": 0.0052, + "step": 697180 + }, + { + "epoch": 1.81, + "learning_rate": 2.8917442797856813e-05, + "loss": 0.0078, + "step": 697190 + }, + { + "epoch": 1.81, + "learning_rate": 2.8913554581485348e-05, + "loss": 0.0065, + "step": 697200 + }, + { + "epoch": 1.81, + "learning_rate": 2.8909666365113883e-05, + "loss": 0.0071, + "step": 697210 + }, + { + "epoch": 1.81, + "learning_rate": 2.890577814874242e-05, + "loss": 0.0052, + "step": 697220 + }, + { + "epoch": 1.81, + "learning_rate": 2.8901889932370956e-05, + "loss": 0.0093, + "step": 697230 + }, + { + "epoch": 1.81, + "learning_rate": 2.889800171599949e-05, + "loss": 0.0075, + "step": 697240 + }, + { + "epoch": 1.81, + "learning_rate": 2.8894113499628022e-05, + "loss": 0.0135, + "step": 697250 + }, + { + "epoch": 1.81, + "learning_rate": 2.8890225283256557e-05, + "loss": 0.0079, + "step": 697260 + }, + { + "epoch": 1.81, + "learning_rate": 2.8886337066885096e-05, + "loss": 0.0066, + "step": 697270 + }, + { + "epoch": 1.81, + "learning_rate": 2.888244885051363e-05, + "loss": 0.0062, + "step": 697280 + }, + { + "epoch": 1.81, + "learning_rate": 2.8878560634142165e-05, + "loss": 0.0074, + "step": 697290 + }, + { + "epoch": 1.81, + "learning_rate": 2.88746724177707e-05, + "loss": 0.0064, + "step": 697300 + }, + { + "epoch": 1.81, + "learning_rate": 2.887078420139924e-05, + "loss": 0.0104, + "step": 697310 + }, + { + "epoch": 1.81, + "learning_rate": 2.8866895985027773e-05, + "loss": 0.0066, + "step": 697320 + }, + { + "epoch": 1.81, + "learning_rate": 2.8863007768656308e-05, + "loss": 0.0092, + "step": 697330 + }, + { + "epoch": 1.81, + "learning_rate": 2.8859119552284843e-05, + "loss": 0.0074, + "step": 697340 + }, + { + "epoch": 1.81, + "learning_rate": 2.885523133591338e-05, + "loss": 0.0051, + "step": 697350 + }, + { + "epoch": 1.81, + "learning_rate": 2.8851343119541916e-05, + "loss": 0.0061, + "step": 697360 + }, + { + "epoch": 1.81, + "learning_rate": 2.8847454903170448e-05, + "loss": 0.0082, + "step": 697370 + }, + { + "epoch": 1.81, + "learning_rate": 2.8843566686798982e-05, + "loss": 0.0082, + "step": 697380 + }, + { + "epoch": 1.81, + "learning_rate": 2.8839678470427517e-05, + "loss": 0.0061, + "step": 697390 + }, + { + "epoch": 1.81, + "learning_rate": 2.8835790254056055e-05, + "loss": 0.0071, + "step": 697400 + }, + { + "epoch": 1.81, + "learning_rate": 2.883190203768459e-05, + "loss": 0.0086, + "step": 697410 + }, + { + "epoch": 1.81, + "learning_rate": 2.8828013821313125e-05, + "loss": 0.0071, + "step": 697420 + }, + { + "epoch": 1.81, + "learning_rate": 2.882412560494166e-05, + "loss": 0.0064, + "step": 697430 + }, + { + "epoch": 1.81, + "learning_rate": 2.88202373885702e-05, + "loss": 0.0093, + "step": 697440 + }, + { + "epoch": 1.81, + "learning_rate": 2.8816349172198733e-05, + "loss": 0.0079, + "step": 697450 + }, + { + "epoch": 1.81, + "learning_rate": 2.8812460955827268e-05, + "loss": 0.0094, + "step": 697460 + }, + { + "epoch": 1.81, + "learning_rate": 2.8808572739455803e-05, + "loss": 0.0091, + "step": 697470 + }, + { + "epoch": 1.81, + "learning_rate": 2.880468452308434e-05, + "loss": 0.0076, + "step": 697480 + }, + { + "epoch": 1.81, + "learning_rate": 2.8800796306712873e-05, + "loss": 0.005, + "step": 697490 + }, + { + "epoch": 1.81, + "learning_rate": 2.8796908090341407e-05, + "loss": 0.0099, + "step": 697500 + }, + { + "epoch": 1.81, + "learning_rate": 2.8793019873969942e-05, + "loss": 0.007, + "step": 697510 + }, + { + "epoch": 1.81, + "learning_rate": 2.8789131657598477e-05, + "loss": 0.0109, + "step": 697520 + }, + { + "epoch": 1.81, + "learning_rate": 2.8785243441227015e-05, + "loss": 0.0319, + "step": 697530 + }, + { + "epoch": 1.81, + "learning_rate": 2.878135522485555e-05, + "loss": 0.0065, + "step": 697540 + }, + { + "epoch": 1.81, + "learning_rate": 2.8777467008484085e-05, + "loss": 0.0073, + "step": 697550 + }, + { + "epoch": 1.81, + "learning_rate": 2.877357879211262e-05, + "loss": 0.0058, + "step": 697560 + }, + { + "epoch": 1.81, + "learning_rate": 2.8769690575741158e-05, + "loss": 0.0123, + "step": 697570 + }, + { + "epoch": 1.81, + "learning_rate": 2.8765802359369693e-05, + "loss": 0.0098, + "step": 697580 + }, + { + "epoch": 1.81, + "learning_rate": 2.8761914142998228e-05, + "loss": 0.0076, + "step": 697590 + }, + { + "epoch": 1.81, + "learning_rate": 2.8758025926626763e-05, + "loss": 0.0075, + "step": 697600 + }, + { + "epoch": 1.81, + "learning_rate": 2.87541377102553e-05, + "loss": 0.0059, + "step": 697610 + }, + { + "epoch": 1.81, + "learning_rate": 2.8750249493883833e-05, + "loss": 0.0075, + "step": 697620 + }, + { + "epoch": 1.81, + "learning_rate": 2.8746361277512367e-05, + "loss": 0.0069, + "step": 697630 + }, + { + "epoch": 1.81, + "learning_rate": 2.8742473061140902e-05, + "loss": 0.0081, + "step": 697640 + }, + { + "epoch": 1.81, + "learning_rate": 2.8738584844769437e-05, + "loss": 0.0063, + "step": 697650 + }, + { + "epoch": 1.81, + "learning_rate": 2.8734696628397975e-05, + "loss": 0.0068, + "step": 697660 + }, + { + "epoch": 1.81, + "learning_rate": 2.873080841202651e-05, + "loss": 0.0069, + "step": 697670 + }, + { + "epoch": 1.81, + "learning_rate": 2.8726920195655045e-05, + "loss": 0.0105, + "step": 697680 + }, + { + "epoch": 1.81, + "learning_rate": 2.872303197928358e-05, + "loss": 0.0084, + "step": 697690 + }, + { + "epoch": 1.81, + "learning_rate": 2.8719143762912118e-05, + "loss": 0.0112, + "step": 697700 + }, + { + "epoch": 1.81, + "learning_rate": 2.8715255546540653e-05, + "loss": 0.0093, + "step": 697710 + }, + { + "epoch": 1.81, + "learning_rate": 2.8711367330169188e-05, + "loss": 0.008, + "step": 697720 + }, + { + "epoch": 1.81, + "learning_rate": 2.8707479113797723e-05, + "loss": 0.0122, + "step": 697730 + }, + { + "epoch": 1.81, + "learning_rate": 2.8703590897426254e-05, + "loss": 0.0082, + "step": 697740 + }, + { + "epoch": 1.81, + "learning_rate": 2.8699702681054793e-05, + "loss": 0.0082, + "step": 697750 + }, + { + "epoch": 1.81, + "learning_rate": 2.8695814464683327e-05, + "loss": 0.0069, + "step": 697760 + }, + { + "epoch": 1.81, + "learning_rate": 2.8691926248311862e-05, + "loss": 0.0054, + "step": 697770 + }, + { + "epoch": 1.81, + "learning_rate": 2.8688038031940397e-05, + "loss": 0.0081, + "step": 697780 + }, + { + "epoch": 1.81, + "learning_rate": 2.8684149815568935e-05, + "loss": 0.0068, + "step": 697790 + }, + { + "epoch": 1.81, + "learning_rate": 2.868026159919747e-05, + "loss": 0.0066, + "step": 697800 + }, + { + "epoch": 1.81, + "learning_rate": 2.8676373382826005e-05, + "loss": 0.0066, + "step": 697810 + }, + { + "epoch": 1.81, + "learning_rate": 2.867248516645454e-05, + "loss": 0.0089, + "step": 697820 + }, + { + "epoch": 1.81, + "learning_rate": 2.8668596950083078e-05, + "loss": 0.0086, + "step": 697830 + }, + { + "epoch": 1.81, + "learning_rate": 2.8664708733711613e-05, + "loss": 0.0068, + "step": 697840 + }, + { + "epoch": 1.81, + "learning_rate": 2.8660820517340148e-05, + "loss": 0.0124, + "step": 697850 + }, + { + "epoch": 1.81, + "learning_rate": 2.8656932300968683e-05, + "loss": 0.0119, + "step": 697860 + }, + { + "epoch": 1.81, + "learning_rate": 2.8653044084597214e-05, + "loss": 0.0069, + "step": 697870 + }, + { + "epoch": 1.81, + "learning_rate": 2.8649155868225753e-05, + "loss": 0.0082, + "step": 697880 + }, + { + "epoch": 1.81, + "learning_rate": 2.8645267651854287e-05, + "loss": 0.0058, + "step": 697890 + }, + { + "epoch": 1.81, + "learning_rate": 2.8641379435482822e-05, + "loss": 0.0116, + "step": 697900 + }, + { + "epoch": 1.81, + "learning_rate": 2.8637491219111357e-05, + "loss": 0.0089, + "step": 697910 + }, + { + "epoch": 1.81, + "learning_rate": 2.8633603002739895e-05, + "loss": 0.0063, + "step": 697920 + }, + { + "epoch": 1.81, + "learning_rate": 2.862971478636843e-05, + "loss": 0.0066, + "step": 697930 + }, + { + "epoch": 1.81, + "learning_rate": 2.8625826569996965e-05, + "loss": 0.0056, + "step": 697940 + }, + { + "epoch": 1.81, + "learning_rate": 2.86219383536255e-05, + "loss": 0.0061, + "step": 697950 + }, + { + "epoch": 1.81, + "learning_rate": 2.8618050137254038e-05, + "loss": 0.0073, + "step": 697960 + }, + { + "epoch": 1.81, + "learning_rate": 2.8614161920882573e-05, + "loss": 0.0062, + "step": 697970 + }, + { + "epoch": 1.81, + "learning_rate": 2.8610273704511108e-05, + "loss": 0.0077, + "step": 697980 + }, + { + "epoch": 1.81, + "learning_rate": 2.860638548813964e-05, + "loss": 0.0052, + "step": 697990 + }, + { + "epoch": 1.81, + "learning_rate": 2.8602497271768174e-05, + "loss": 0.0049, + "step": 698000 + }, + { + "epoch": 1.81, + "eval_cer": 0.8816467008458005, + "eval_loss": 0.004819649271667004, + "eval_runtime": 107.8195, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.637, + "step": 698000 + }, + { + "epoch": 1.81, + "learning_rate": 2.8598609055396713e-05, + "loss": 0.0071, + "step": 698010 + }, + { + "epoch": 1.81, + "learning_rate": 2.8594720839025247e-05, + "loss": 0.0065, + "step": 698020 + }, + { + "epoch": 1.81, + "learning_rate": 2.8590832622653782e-05, + "loss": 0.0103, + "step": 698030 + }, + { + "epoch": 1.81, + "learning_rate": 2.8586944406282317e-05, + "loss": 0.0074, + "step": 698040 + }, + { + "epoch": 1.81, + "learning_rate": 2.8583056189910855e-05, + "loss": 0.0084, + "step": 698050 + }, + { + "epoch": 1.81, + "learning_rate": 2.857916797353939e-05, + "loss": 0.007, + "step": 698060 + }, + { + "epoch": 1.81, + "learning_rate": 2.8575279757167925e-05, + "loss": 0.0078, + "step": 698070 + }, + { + "epoch": 1.81, + "learning_rate": 2.857139154079646e-05, + "loss": 0.0089, + "step": 698080 + }, + { + "epoch": 1.81, + "learning_rate": 2.8567503324424995e-05, + "loss": 0.0065, + "step": 698090 + }, + { + "epoch": 1.81, + "learning_rate": 2.8563615108053533e-05, + "loss": 0.0052, + "step": 698100 + }, + { + "epoch": 1.81, + "learning_rate": 2.8559726891682068e-05, + "loss": 0.0071, + "step": 698110 + }, + { + "epoch": 1.81, + "learning_rate": 2.85558386753106e-05, + "loss": 0.0076, + "step": 698120 + }, + { + "epoch": 1.81, + "learning_rate": 2.8551950458939134e-05, + "loss": 0.0068, + "step": 698130 + }, + { + "epoch": 1.81, + "learning_rate": 2.8548062242567673e-05, + "loss": 0.0067, + "step": 698140 + }, + { + "epoch": 1.81, + "learning_rate": 2.8544174026196207e-05, + "loss": 0.0105, + "step": 698150 + }, + { + "epoch": 1.81, + "learning_rate": 2.8540285809824742e-05, + "loss": 0.0073, + "step": 698160 + }, + { + "epoch": 1.81, + "learning_rate": 2.8536397593453277e-05, + "loss": 0.009, + "step": 698170 + }, + { + "epoch": 1.81, + "learning_rate": 2.8532509377081812e-05, + "loss": 0.0076, + "step": 698180 + }, + { + "epoch": 1.81, + "learning_rate": 2.852862116071035e-05, + "loss": 0.0103, + "step": 698190 + }, + { + "epoch": 1.81, + "learning_rate": 2.8524732944338885e-05, + "loss": 0.0071, + "step": 698200 + }, + { + "epoch": 1.81, + "learning_rate": 2.852084472796742e-05, + "loss": 0.0078, + "step": 698210 + }, + { + "epoch": 1.81, + "learning_rate": 2.8516956511595955e-05, + "loss": 0.0067, + "step": 698220 + }, + { + "epoch": 1.81, + "learning_rate": 2.8513068295224493e-05, + "loss": 0.009, + "step": 698230 + }, + { + "epoch": 1.81, + "learning_rate": 2.8509180078853025e-05, + "loss": 0.0096, + "step": 698240 + }, + { + "epoch": 1.81, + "learning_rate": 2.850529186248156e-05, + "loss": 0.0082, + "step": 698250 + }, + { + "epoch": 1.81, + "learning_rate": 2.8501403646110094e-05, + "loss": 0.0052, + "step": 698260 + }, + { + "epoch": 1.81, + "learning_rate": 2.849751542973863e-05, + "loss": 0.0048, + "step": 698270 + }, + { + "epoch": 1.81, + "learning_rate": 2.8493627213367167e-05, + "loss": 0.0065, + "step": 698280 + }, + { + "epoch": 1.81, + "learning_rate": 2.8489738996995702e-05, + "loss": 0.0069, + "step": 698290 + }, + { + "epoch": 1.81, + "learning_rate": 2.8485850780624237e-05, + "loss": 0.007, + "step": 698300 + }, + { + "epoch": 1.81, + "learning_rate": 2.8481962564252772e-05, + "loss": 0.0073, + "step": 698310 + }, + { + "epoch": 1.81, + "learning_rate": 2.847807434788131e-05, + "loss": 0.0066, + "step": 698320 + }, + { + "epoch": 1.81, + "learning_rate": 2.8474186131509845e-05, + "loss": 0.0131, + "step": 698330 + }, + { + "epoch": 1.81, + "learning_rate": 2.847029791513838e-05, + "loss": 0.0089, + "step": 698340 + }, + { + "epoch": 1.81, + "learning_rate": 2.8466409698766915e-05, + "loss": 0.0103, + "step": 698350 + }, + { + "epoch": 1.81, + "learning_rate": 2.8462521482395446e-05, + "loss": 0.0066, + "step": 698360 + }, + { + "epoch": 1.81, + "learning_rate": 2.8458633266023984e-05, + "loss": 0.0094, + "step": 698370 + }, + { + "epoch": 1.81, + "learning_rate": 2.845474504965252e-05, + "loss": 0.01, + "step": 698380 + }, + { + "epoch": 1.81, + "learning_rate": 2.8450856833281054e-05, + "loss": 0.0078, + "step": 698390 + }, + { + "epoch": 1.81, + "learning_rate": 2.844696861690959e-05, + "loss": 0.0092, + "step": 698400 + }, + { + "epoch": 1.81, + "learning_rate": 2.8443080400538127e-05, + "loss": 0.0057, + "step": 698410 + }, + { + "epoch": 1.81, + "learning_rate": 2.8439192184166662e-05, + "loss": 0.0057, + "step": 698420 + }, + { + "epoch": 1.81, + "learning_rate": 2.8435303967795197e-05, + "loss": 0.0059, + "step": 698430 + }, + { + "epoch": 1.81, + "learning_rate": 2.8431415751423732e-05, + "loss": 0.0083, + "step": 698440 + }, + { + "epoch": 1.81, + "learning_rate": 2.842752753505227e-05, + "loss": 0.0087, + "step": 698450 + }, + { + "epoch": 1.81, + "learning_rate": 2.8423639318680805e-05, + "loss": 0.0098, + "step": 698460 + }, + { + "epoch": 1.81, + "learning_rate": 2.841975110230934e-05, + "loss": 0.0058, + "step": 698470 + }, + { + "epoch": 1.81, + "learning_rate": 2.8415862885937875e-05, + "loss": 0.0097, + "step": 698480 + }, + { + "epoch": 1.81, + "learning_rate": 2.8411974669566406e-05, + "loss": 0.0066, + "step": 698490 + }, + { + "epoch": 1.81, + "learning_rate": 2.8408086453194944e-05, + "loss": 0.0068, + "step": 698500 + }, + { + "epoch": 1.81, + "learning_rate": 2.840419823682348e-05, + "loss": 0.0073, + "step": 698510 + }, + { + "epoch": 1.81, + "learning_rate": 2.8400310020452014e-05, + "loss": 0.0071, + "step": 698520 + }, + { + "epoch": 1.81, + "learning_rate": 2.839642180408055e-05, + "loss": 0.01, + "step": 698530 + }, + { + "epoch": 1.81, + "learning_rate": 2.8392533587709087e-05, + "loss": 0.0085, + "step": 698540 + }, + { + "epoch": 1.81, + "learning_rate": 2.8388645371337622e-05, + "loss": 0.0088, + "step": 698550 + }, + { + "epoch": 1.81, + "learning_rate": 2.8384757154966157e-05, + "loss": 0.006, + "step": 698560 + }, + { + "epoch": 1.81, + "learning_rate": 2.8380868938594692e-05, + "loss": 0.0073, + "step": 698570 + }, + { + "epoch": 1.81, + "learning_rate": 2.837698072222323e-05, + "loss": 0.009, + "step": 698580 + }, + { + "epoch": 1.81, + "learning_rate": 2.8373092505851765e-05, + "loss": 0.0096, + "step": 698590 + }, + { + "epoch": 1.81, + "learning_rate": 2.83692042894803e-05, + "loss": 0.0067, + "step": 698600 + }, + { + "epoch": 1.81, + "learning_rate": 2.836531607310883e-05, + "loss": 0.0076, + "step": 698610 + }, + { + "epoch": 1.81, + "learning_rate": 2.8361427856737366e-05, + "loss": 0.0061, + "step": 698620 + }, + { + "epoch": 1.81, + "learning_rate": 2.8357539640365904e-05, + "loss": 0.0084, + "step": 698630 + }, + { + "epoch": 1.81, + "learning_rate": 2.835365142399444e-05, + "loss": 0.008, + "step": 698640 + }, + { + "epoch": 1.81, + "learning_rate": 2.8349763207622974e-05, + "loss": 0.0077, + "step": 698650 + }, + { + "epoch": 1.81, + "learning_rate": 2.834587499125151e-05, + "loss": 0.0065, + "step": 698660 + }, + { + "epoch": 1.81, + "learning_rate": 2.8341986774880047e-05, + "loss": 0.0084, + "step": 698670 + }, + { + "epoch": 1.81, + "learning_rate": 2.8338098558508582e-05, + "loss": 0.0069, + "step": 698680 + }, + { + "epoch": 1.81, + "learning_rate": 2.8334210342137117e-05, + "loss": 0.0065, + "step": 698690 + }, + { + "epoch": 1.81, + "learning_rate": 2.8330322125765652e-05, + "loss": 0.0088, + "step": 698700 + }, + { + "epoch": 1.81, + "learning_rate": 2.832643390939419e-05, + "loss": 0.0072, + "step": 698710 + }, + { + "epoch": 1.81, + "learning_rate": 2.8322545693022725e-05, + "loss": 0.0069, + "step": 698720 + }, + { + "epoch": 1.81, + "learning_rate": 2.831865747665126e-05, + "loss": 0.0068, + "step": 698730 + }, + { + "epoch": 1.81, + "learning_rate": 2.831476926027979e-05, + "loss": 0.0082, + "step": 698740 + }, + { + "epoch": 1.81, + "learning_rate": 2.8310881043908326e-05, + "loss": 0.0086, + "step": 698750 + }, + { + "epoch": 1.81, + "learning_rate": 2.8306992827536864e-05, + "loss": 0.0069, + "step": 698760 + }, + { + "epoch": 1.81, + "learning_rate": 2.83031046111654e-05, + "loss": 0.006, + "step": 698770 + }, + { + "epoch": 1.81, + "learning_rate": 2.8299216394793934e-05, + "loss": 0.007, + "step": 698780 + }, + { + "epoch": 1.81, + "learning_rate": 2.829532817842247e-05, + "loss": 0.0062, + "step": 698790 + }, + { + "epoch": 1.81, + "learning_rate": 2.8291439962051007e-05, + "loss": 0.0083, + "step": 698800 + }, + { + "epoch": 1.81, + "learning_rate": 2.8287551745679542e-05, + "loss": 0.0063, + "step": 698810 + }, + { + "epoch": 1.81, + "learning_rate": 2.8283663529308077e-05, + "loss": 0.006, + "step": 698820 + }, + { + "epoch": 1.81, + "learning_rate": 2.8279775312936612e-05, + "loss": 0.0068, + "step": 698830 + }, + { + "epoch": 1.81, + "learning_rate": 2.827588709656515e-05, + "loss": 0.0057, + "step": 698840 + }, + { + "epoch": 1.81, + "learning_rate": 2.8271998880193685e-05, + "loss": 0.0057, + "step": 698850 + }, + { + "epoch": 1.81, + "learning_rate": 2.8268110663822216e-05, + "loss": 0.0071, + "step": 698860 + }, + { + "epoch": 1.81, + "learning_rate": 2.826422244745075e-05, + "loss": 0.0066, + "step": 698870 + }, + { + "epoch": 1.81, + "learning_rate": 2.8260334231079286e-05, + "loss": 0.0078, + "step": 698880 + }, + { + "epoch": 1.81, + "learning_rate": 2.8256446014707824e-05, + "loss": 0.0063, + "step": 698890 + }, + { + "epoch": 1.81, + "learning_rate": 2.825255779833636e-05, + "loss": 0.0072, + "step": 698900 + }, + { + "epoch": 1.81, + "learning_rate": 2.8248669581964894e-05, + "loss": 0.0078, + "step": 698910 + }, + { + "epoch": 1.81, + "learning_rate": 2.824478136559343e-05, + "loss": 0.0069, + "step": 698920 + }, + { + "epoch": 1.81, + "learning_rate": 2.8240893149221967e-05, + "loss": 0.0047, + "step": 698930 + }, + { + "epoch": 1.81, + "learning_rate": 2.8237004932850502e-05, + "loss": 0.0078, + "step": 698940 + }, + { + "epoch": 1.81, + "learning_rate": 2.8233116716479037e-05, + "loss": 0.0082, + "step": 698950 + }, + { + "epoch": 1.81, + "learning_rate": 2.8229228500107572e-05, + "loss": 0.0067, + "step": 698960 + }, + { + "epoch": 1.81, + "learning_rate": 2.822534028373611e-05, + "loss": 0.0062, + "step": 698970 + }, + { + "epoch": 1.81, + "learning_rate": 2.822145206736464e-05, + "loss": 0.0054, + "step": 698980 + }, + { + "epoch": 1.81, + "learning_rate": 2.8217563850993176e-05, + "loss": 0.009, + "step": 698990 + }, + { + "epoch": 1.81, + "learning_rate": 2.821367563462171e-05, + "loss": 0.007, + "step": 699000 + }, + { + "epoch": 1.81, + "eval_cer": 0.8816564983043399, + "eval_loss": 0.004687727894634008, + "eval_runtime": 107.7875, + "eval_samples_per_second": 18.555, + "eval_steps_per_second": 4.639, + "step": 699000 + }, + { + "epoch": 1.81, + "learning_rate": 2.8209787418250246e-05, + "loss": 0.0046, + "step": 699010 + }, + { + "epoch": 1.81, + "learning_rate": 2.8205899201878784e-05, + "loss": 0.0052, + "step": 699020 + }, + { + "epoch": 1.81, + "learning_rate": 2.820201098550732e-05, + "loss": 0.0068, + "step": 699030 + }, + { + "epoch": 1.81, + "learning_rate": 2.8198122769135854e-05, + "loss": 0.0071, + "step": 699040 + }, + { + "epoch": 1.81, + "learning_rate": 2.819423455276439e-05, + "loss": 0.008, + "step": 699050 + }, + { + "epoch": 1.81, + "learning_rate": 2.8190346336392927e-05, + "loss": 0.0079, + "step": 699060 + }, + { + "epoch": 1.81, + "learning_rate": 2.8186458120021462e-05, + "loss": 0.0078, + "step": 699070 + }, + { + "epoch": 1.81, + "learning_rate": 2.8182569903649997e-05, + "loss": 0.0077, + "step": 699080 + }, + { + "epoch": 1.81, + "learning_rate": 2.8178681687278532e-05, + "loss": 0.0068, + "step": 699090 + }, + { + "epoch": 1.81, + "learning_rate": 2.817479347090707e-05, + "loss": 0.0061, + "step": 699100 + }, + { + "epoch": 1.81, + "learning_rate": 2.81709052545356e-05, + "loss": 0.0066, + "step": 699110 + }, + { + "epoch": 1.81, + "learning_rate": 2.8167017038164136e-05, + "loss": 0.0059, + "step": 699120 + }, + { + "epoch": 1.81, + "learning_rate": 2.816312882179267e-05, + "loss": 0.0071, + "step": 699130 + }, + { + "epoch": 1.81, + "learning_rate": 2.8159240605421206e-05, + "loss": 0.008, + "step": 699140 + }, + { + "epoch": 1.81, + "learning_rate": 2.8155352389049744e-05, + "loss": 0.0072, + "step": 699150 + }, + { + "epoch": 1.81, + "learning_rate": 2.815146417267828e-05, + "loss": 0.0059, + "step": 699160 + }, + { + "epoch": 1.81, + "learning_rate": 2.8147575956306814e-05, + "loss": 0.0074, + "step": 699170 + }, + { + "epoch": 1.81, + "learning_rate": 2.814368773993535e-05, + "loss": 0.0082, + "step": 699180 + }, + { + "epoch": 1.81, + "learning_rate": 2.8139799523563887e-05, + "loss": 0.0088, + "step": 699190 + }, + { + "epoch": 1.81, + "learning_rate": 2.8135911307192422e-05, + "loss": 0.0066, + "step": 699200 + }, + { + "epoch": 1.81, + "learning_rate": 2.8132023090820957e-05, + "loss": 0.0084, + "step": 699210 + }, + { + "epoch": 1.81, + "learning_rate": 2.8128134874449492e-05, + "loss": 0.0083, + "step": 699220 + }, + { + "epoch": 1.81, + "learning_rate": 2.8124246658078023e-05, + "loss": 0.0072, + "step": 699230 + }, + { + "epoch": 1.81, + "learning_rate": 2.812035844170656e-05, + "loss": 0.0052, + "step": 699240 + }, + { + "epoch": 1.81, + "learning_rate": 2.8116470225335096e-05, + "loss": 0.0115, + "step": 699250 + }, + { + "epoch": 1.81, + "learning_rate": 2.811258200896363e-05, + "loss": 0.0097, + "step": 699260 + }, + { + "epoch": 1.81, + "learning_rate": 2.8108693792592166e-05, + "loss": 0.0079, + "step": 699270 + }, + { + "epoch": 1.81, + "learning_rate": 2.8104805576220704e-05, + "loss": 0.009, + "step": 699280 + }, + { + "epoch": 1.81, + "learning_rate": 2.810091735984924e-05, + "loss": 0.0074, + "step": 699290 + }, + { + "epoch": 1.81, + "learning_rate": 2.8097029143477774e-05, + "loss": 0.0067, + "step": 699300 + }, + { + "epoch": 1.81, + "learning_rate": 2.809314092710631e-05, + "loss": 0.0059, + "step": 699310 + }, + { + "epoch": 1.81, + "learning_rate": 2.8089252710734847e-05, + "loss": 0.0089, + "step": 699320 + }, + { + "epoch": 1.81, + "learning_rate": 2.8085364494363382e-05, + "loss": 0.0062, + "step": 699330 + }, + { + "epoch": 1.81, + "learning_rate": 2.8081476277991917e-05, + "loss": 0.0114, + "step": 699340 + }, + { + "epoch": 1.81, + "learning_rate": 2.8077588061620452e-05, + "loss": 0.0053, + "step": 699350 + }, + { + "epoch": 1.81, + "learning_rate": 2.8073699845248983e-05, + "loss": 0.0069, + "step": 699360 + }, + { + "epoch": 1.81, + "learning_rate": 2.806981162887752e-05, + "loss": 0.0119, + "step": 699370 + }, + { + "epoch": 1.81, + "learning_rate": 2.8065923412506056e-05, + "loss": 0.006, + "step": 699380 + }, + { + "epoch": 1.81, + "learning_rate": 2.806203519613459e-05, + "loss": 0.0059, + "step": 699390 + }, + { + "epoch": 1.81, + "learning_rate": 2.8058146979763126e-05, + "loss": 0.0079, + "step": 699400 + }, + { + "epoch": 1.81, + "learning_rate": 2.8054258763391664e-05, + "loss": 0.0083, + "step": 699410 + }, + { + "epoch": 1.81, + "learning_rate": 2.80503705470202e-05, + "loss": 0.0065, + "step": 699420 + }, + { + "epoch": 1.81, + "learning_rate": 2.8046482330648734e-05, + "loss": 0.0092, + "step": 699430 + }, + { + "epoch": 1.81, + "learning_rate": 2.804259411427727e-05, + "loss": 0.0063, + "step": 699440 + }, + { + "epoch": 1.81, + "learning_rate": 2.8038705897905807e-05, + "loss": 0.0059, + "step": 699450 + }, + { + "epoch": 1.81, + "learning_rate": 2.8034817681534342e-05, + "loss": 0.0064, + "step": 699460 + }, + { + "epoch": 1.81, + "learning_rate": 2.8030929465162877e-05, + "loss": 0.0086, + "step": 699470 + }, + { + "epoch": 1.81, + "learning_rate": 2.802704124879141e-05, + "loss": 0.0096, + "step": 699480 + }, + { + "epoch": 1.81, + "learning_rate": 2.8023153032419943e-05, + "loss": 0.0074, + "step": 699490 + }, + { + "epoch": 1.81, + "learning_rate": 2.801926481604848e-05, + "loss": 0.0046, + "step": 699500 + }, + { + "epoch": 1.81, + "learning_rate": 2.8015376599677016e-05, + "loss": 0.0061, + "step": 699510 + }, + { + "epoch": 1.81, + "learning_rate": 2.801148838330555e-05, + "loss": 0.009, + "step": 699520 + }, + { + "epoch": 1.81, + "learning_rate": 2.8007600166934086e-05, + "loss": 0.0069, + "step": 699530 + }, + { + "epoch": 1.81, + "learning_rate": 2.800371195056262e-05, + "loss": 0.0065, + "step": 699540 + }, + { + "epoch": 1.81, + "learning_rate": 2.799982373419116e-05, + "loss": 0.0061, + "step": 699550 + }, + { + "epoch": 1.81, + "learning_rate": 2.7995935517819694e-05, + "loss": 0.0067, + "step": 699560 + }, + { + "epoch": 1.81, + "learning_rate": 2.799204730144823e-05, + "loss": 0.008, + "step": 699570 + }, + { + "epoch": 1.81, + "learning_rate": 2.7988159085076764e-05, + "loss": 0.005, + "step": 699580 + }, + { + "epoch": 1.81, + "learning_rate": 2.7984270868705302e-05, + "loss": 0.0113, + "step": 699590 + }, + { + "epoch": 1.81, + "learning_rate": 2.7980382652333833e-05, + "loss": 0.006, + "step": 699600 + }, + { + "epoch": 1.81, + "learning_rate": 2.797649443596237e-05, + "loss": 0.0089, + "step": 699610 + }, + { + "epoch": 1.81, + "learning_rate": 2.7972606219590903e-05, + "loss": 0.0054, + "step": 699620 + }, + { + "epoch": 1.81, + "learning_rate": 2.7968718003219438e-05, + "loss": 0.0101, + "step": 699630 + }, + { + "epoch": 1.81, + "learning_rate": 2.7964829786847976e-05, + "loss": 0.0075, + "step": 699640 + }, + { + "epoch": 1.81, + "learning_rate": 2.796094157047651e-05, + "loss": 0.0085, + "step": 699650 + }, + { + "epoch": 1.81, + "learning_rate": 2.7957053354105046e-05, + "loss": 0.0078, + "step": 699660 + }, + { + "epoch": 1.81, + "learning_rate": 2.795316513773358e-05, + "loss": 0.0078, + "step": 699670 + }, + { + "epoch": 1.81, + "learning_rate": 2.794927692136212e-05, + "loss": 0.0081, + "step": 699680 + }, + { + "epoch": 1.81, + "learning_rate": 2.7945388704990654e-05, + "loss": 0.008, + "step": 699690 + }, + { + "epoch": 1.81, + "learning_rate": 2.794150048861919e-05, + "loss": 0.006, + "step": 699700 + }, + { + "epoch": 1.81, + "learning_rate": 2.7937612272247724e-05, + "loss": 0.0071, + "step": 699710 + }, + { + "epoch": 1.81, + "learning_rate": 2.7933724055876262e-05, + "loss": 0.006, + "step": 699720 + }, + { + "epoch": 1.81, + "learning_rate": 2.7929835839504793e-05, + "loss": 0.0096, + "step": 699730 + }, + { + "epoch": 1.81, + "learning_rate": 2.7925947623133328e-05, + "loss": 0.0067, + "step": 699740 + }, + { + "epoch": 1.81, + "learning_rate": 2.7922059406761863e-05, + "loss": 0.0067, + "step": 699750 + }, + { + "epoch": 1.81, + "learning_rate": 2.7918171190390398e-05, + "loss": 0.0053, + "step": 699760 + }, + { + "epoch": 1.81, + "learning_rate": 2.7914282974018936e-05, + "loss": 0.0068, + "step": 699770 + }, + { + "epoch": 1.81, + "learning_rate": 2.791039475764747e-05, + "loss": 0.0063, + "step": 699780 + }, + { + "epoch": 1.81, + "learning_rate": 2.7906506541276006e-05, + "loss": 0.0068, + "step": 699790 + }, + { + "epoch": 1.81, + "learning_rate": 2.790261832490454e-05, + "loss": 0.006, + "step": 699800 + }, + { + "epoch": 1.81, + "learning_rate": 2.789873010853308e-05, + "loss": 0.0075, + "step": 699810 + }, + { + "epoch": 1.81, + "learning_rate": 2.7894841892161614e-05, + "loss": 0.007, + "step": 699820 + }, + { + "epoch": 1.81, + "learning_rate": 2.789095367579015e-05, + "loss": 0.0091, + "step": 699830 + }, + { + "epoch": 1.81, + "learning_rate": 2.7887065459418684e-05, + "loss": 0.0078, + "step": 699840 + }, + { + "epoch": 1.81, + "learning_rate": 2.7883177243047215e-05, + "loss": 0.0066, + "step": 699850 + }, + { + "epoch": 1.81, + "learning_rate": 2.7879289026675753e-05, + "loss": 0.0091, + "step": 699860 + }, + { + "epoch": 1.81, + "learning_rate": 2.7875400810304288e-05, + "loss": 0.0064, + "step": 699870 + }, + { + "epoch": 1.81, + "learning_rate": 2.7871512593932823e-05, + "loss": 0.0096, + "step": 699880 + }, + { + "epoch": 1.81, + "learning_rate": 2.7867624377561358e-05, + "loss": 0.0068, + "step": 699890 + }, + { + "epoch": 1.81, + "learning_rate": 2.7863736161189896e-05, + "loss": 0.0061, + "step": 699900 + }, + { + "epoch": 1.81, + "learning_rate": 2.785984794481843e-05, + "loss": 0.0062, + "step": 699910 + }, + { + "epoch": 1.81, + "learning_rate": 2.7855959728446966e-05, + "loss": 0.0072, + "step": 699920 + }, + { + "epoch": 1.81, + "learning_rate": 2.78520715120755e-05, + "loss": 0.0057, + "step": 699930 + }, + { + "epoch": 1.81, + "learning_rate": 2.784818329570404e-05, + "loss": 0.0067, + "step": 699940 + }, + { + "epoch": 1.81, + "learning_rate": 2.7844295079332574e-05, + "loss": 0.0077, + "step": 699950 + }, + { + "epoch": 1.81, + "learning_rate": 2.784040686296111e-05, + "loss": 0.0087, + "step": 699960 + }, + { + "epoch": 1.81, + "learning_rate": 2.7836518646589644e-05, + "loss": 0.0066, + "step": 699970 + }, + { + "epoch": 1.81, + "learning_rate": 2.7832630430218175e-05, + "loss": 0.007, + "step": 699980 + }, + { + "epoch": 1.81, + "learning_rate": 2.7828742213846713e-05, + "loss": 0.0084, + "step": 699990 + }, + { + "epoch": 1.81, + "learning_rate": 2.7824853997475248e-05, + "loss": 0.0151, + "step": 700000 + }, + { + "epoch": 1.81, + "eval_cer": 0.88167329394755, + "eval_loss": 0.004671318922191858, + "eval_runtime": 107.97, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 700000 + }, + { + "epoch": 1.81, + "learning_rate": 2.7820965781103783e-05, + "loss": 0.0065, + "step": 700010 + }, + { + "epoch": 1.81, + "learning_rate": 2.7817077564732318e-05, + "loss": 0.007, + "step": 700020 + }, + { + "epoch": 1.81, + "learning_rate": 2.7813189348360856e-05, + "loss": 0.0085, + "step": 700030 + }, + { + "epoch": 1.81, + "learning_rate": 2.780930113198939e-05, + "loss": 0.008, + "step": 700040 + }, + { + "epoch": 1.81, + "learning_rate": 2.7805412915617926e-05, + "loss": 0.0107, + "step": 700050 + }, + { + "epoch": 1.81, + "learning_rate": 2.780152469924646e-05, + "loss": 0.0078, + "step": 700060 + }, + { + "epoch": 1.81, + "learning_rate": 2.7797636482875e-05, + "loss": 0.0056, + "step": 700070 + }, + { + "epoch": 1.81, + "learning_rate": 2.7793748266503534e-05, + "loss": 0.0058, + "step": 700080 + }, + { + "epoch": 1.81, + "learning_rate": 2.778986005013207e-05, + "loss": 0.0086, + "step": 700090 + }, + { + "epoch": 1.81, + "learning_rate": 2.77859718337606e-05, + "loss": 0.0075, + "step": 700100 + }, + { + "epoch": 1.81, + "learning_rate": 2.7782083617389135e-05, + "loss": 0.0072, + "step": 700110 + }, + { + "epoch": 1.81, + "learning_rate": 2.7778195401017673e-05, + "loss": 0.0071, + "step": 700120 + }, + { + "epoch": 1.81, + "learning_rate": 2.7774307184646208e-05, + "loss": 0.0101, + "step": 700130 + }, + { + "epoch": 1.81, + "learning_rate": 2.7770418968274743e-05, + "loss": 0.0056, + "step": 700140 + }, + { + "epoch": 1.81, + "learning_rate": 2.7766530751903278e-05, + "loss": 0.0063, + "step": 700150 + }, + { + "epoch": 1.81, + "learning_rate": 2.7762642535531816e-05, + "loss": 0.006, + "step": 700160 + }, + { + "epoch": 1.81, + "learning_rate": 2.775875431916035e-05, + "loss": 0.0072, + "step": 700170 + }, + { + "epoch": 1.81, + "learning_rate": 2.7754866102788886e-05, + "loss": 0.0081, + "step": 700180 + }, + { + "epoch": 1.81, + "learning_rate": 2.775097788641742e-05, + "loss": 0.0066, + "step": 700190 + }, + { + "epoch": 1.82, + "learning_rate": 2.774708967004596e-05, + "loss": 0.007, + "step": 700200 + }, + { + "epoch": 1.82, + "learning_rate": 2.7743201453674494e-05, + "loss": 0.0076, + "step": 700210 + }, + { + "epoch": 1.82, + "learning_rate": 2.7739313237303025e-05, + "loss": 0.0098, + "step": 700220 + }, + { + "epoch": 1.82, + "learning_rate": 2.773542502093156e-05, + "loss": 0.0065, + "step": 700230 + }, + { + "epoch": 1.82, + "learning_rate": 2.7731536804560095e-05, + "loss": 0.0074, + "step": 700240 + }, + { + "epoch": 1.82, + "learning_rate": 2.7727648588188633e-05, + "loss": 0.0077, + "step": 700250 + }, + { + "epoch": 1.82, + "learning_rate": 2.7723760371817168e-05, + "loss": 0.008, + "step": 700260 + }, + { + "epoch": 1.82, + "learning_rate": 2.7719872155445703e-05, + "loss": 0.0071, + "step": 700270 + }, + { + "epoch": 1.82, + "learning_rate": 2.7715983939074238e-05, + "loss": 0.0062, + "step": 700280 + }, + { + "epoch": 1.82, + "learning_rate": 2.7712095722702776e-05, + "loss": 0.0071, + "step": 700290 + }, + { + "epoch": 1.82, + "learning_rate": 2.770820750633131e-05, + "loss": 0.0087, + "step": 700300 + }, + { + "epoch": 1.82, + "learning_rate": 2.7704319289959846e-05, + "loss": 0.007, + "step": 700310 + }, + { + "epoch": 1.82, + "learning_rate": 2.770043107358838e-05, + "loss": 0.009, + "step": 700320 + }, + { + "epoch": 1.82, + "learning_rate": 2.769654285721692e-05, + "loss": 0.0089, + "step": 700330 + }, + { + "epoch": 1.82, + "learning_rate": 2.7692654640845454e-05, + "loss": 0.0073, + "step": 700340 + }, + { + "epoch": 1.82, + "learning_rate": 2.7688766424473985e-05, + "loss": 0.008, + "step": 700350 + }, + { + "epoch": 1.82, + "learning_rate": 2.768487820810252e-05, + "loss": 0.0068, + "step": 700360 + }, + { + "epoch": 1.82, + "learning_rate": 2.7680989991731055e-05, + "loss": 0.0068, + "step": 700370 + }, + { + "epoch": 1.82, + "learning_rate": 2.7677101775359593e-05, + "loss": 0.0074, + "step": 700380 + }, + { + "epoch": 1.82, + "learning_rate": 2.7673213558988128e-05, + "loss": 0.0075, + "step": 700390 + }, + { + "epoch": 1.82, + "learning_rate": 2.7669325342616663e-05, + "loss": 0.008, + "step": 700400 + }, + { + "epoch": 1.82, + "learning_rate": 2.7665437126245198e-05, + "loss": 0.0074, + "step": 700410 + }, + { + "epoch": 1.82, + "learning_rate": 2.7661548909873736e-05, + "loss": 0.0056, + "step": 700420 + }, + { + "epoch": 1.82, + "learning_rate": 2.765766069350227e-05, + "loss": 0.0071, + "step": 700430 + }, + { + "epoch": 1.82, + "learning_rate": 2.7653772477130806e-05, + "loss": 0.0064, + "step": 700440 + }, + { + "epoch": 1.82, + "learning_rate": 2.764988426075934e-05, + "loss": 0.005, + "step": 700450 + }, + { + "epoch": 1.82, + "learning_rate": 2.764599604438788e-05, + "loss": 0.0098, + "step": 700460 + }, + { + "epoch": 1.82, + "learning_rate": 2.764210782801641e-05, + "loss": 0.0063, + "step": 700470 + }, + { + "epoch": 1.82, + "learning_rate": 2.7638219611644945e-05, + "loss": 0.0069, + "step": 700480 + }, + { + "epoch": 1.82, + "learning_rate": 2.763433139527348e-05, + "loss": 0.0083, + "step": 700490 + }, + { + "epoch": 1.82, + "learning_rate": 2.7630443178902015e-05, + "loss": 0.0069, + "step": 700500 + }, + { + "epoch": 1.82, + "learning_rate": 2.7626554962530553e-05, + "loss": 0.0093, + "step": 700510 + }, + { + "epoch": 1.82, + "learning_rate": 2.7622666746159088e-05, + "loss": 0.0071, + "step": 700520 + }, + { + "epoch": 1.82, + "learning_rate": 2.7618778529787623e-05, + "loss": 0.0076, + "step": 700530 + }, + { + "epoch": 1.82, + "learning_rate": 2.7614890313416158e-05, + "loss": 0.0067, + "step": 700540 + }, + { + "epoch": 1.82, + "learning_rate": 2.7611002097044696e-05, + "loss": 0.0078, + "step": 700550 + }, + { + "epoch": 1.82, + "learning_rate": 2.760711388067323e-05, + "loss": 0.0116, + "step": 700560 + }, + { + "epoch": 1.82, + "learning_rate": 2.7603225664301766e-05, + "loss": 0.0048, + "step": 700570 + }, + { + "epoch": 1.82, + "learning_rate": 2.75993374479303e-05, + "loss": 0.0077, + "step": 700580 + }, + { + "epoch": 1.82, + "learning_rate": 2.759544923155884e-05, + "loss": 0.0073, + "step": 700590 + }, + { + "epoch": 1.82, + "learning_rate": 2.759156101518737e-05, + "loss": 0.0086, + "step": 700600 + }, + { + "epoch": 1.82, + "learning_rate": 2.7587672798815905e-05, + "loss": 0.0069, + "step": 700610 + }, + { + "epoch": 1.82, + "learning_rate": 2.758378458244444e-05, + "loss": 0.0063, + "step": 700620 + }, + { + "epoch": 1.82, + "learning_rate": 2.7579896366072975e-05, + "loss": 0.0084, + "step": 700630 + }, + { + "epoch": 1.82, + "learning_rate": 2.7576008149701513e-05, + "loss": 0.0053, + "step": 700640 + }, + { + "epoch": 1.82, + "learning_rate": 2.7572119933330048e-05, + "loss": 0.009, + "step": 700650 + }, + { + "epoch": 1.82, + "learning_rate": 2.7568231716958583e-05, + "loss": 0.0064, + "step": 700660 + }, + { + "epoch": 1.82, + "learning_rate": 2.7564343500587118e-05, + "loss": 0.0086, + "step": 700670 + }, + { + "epoch": 1.82, + "learning_rate": 2.7560455284215656e-05, + "loss": 0.0101, + "step": 700680 + }, + { + "epoch": 1.82, + "learning_rate": 2.755656706784419e-05, + "loss": 0.0077, + "step": 700690 + }, + { + "epoch": 1.82, + "learning_rate": 2.7552678851472726e-05, + "loss": 0.0074, + "step": 700700 + }, + { + "epoch": 1.82, + "learning_rate": 2.754879063510126e-05, + "loss": 0.0067, + "step": 700710 + }, + { + "epoch": 1.82, + "learning_rate": 2.7544902418729792e-05, + "loss": 0.0074, + "step": 700720 + }, + { + "epoch": 1.82, + "learning_rate": 2.754101420235833e-05, + "loss": 0.0058, + "step": 700730 + }, + { + "epoch": 1.82, + "learning_rate": 2.7537125985986865e-05, + "loss": 0.007, + "step": 700740 + }, + { + "epoch": 1.82, + "learning_rate": 2.75332377696154e-05, + "loss": 0.0078, + "step": 700750 + }, + { + "epoch": 1.82, + "learning_rate": 2.7529349553243935e-05, + "loss": 0.0054, + "step": 700760 + }, + { + "epoch": 1.82, + "learning_rate": 2.7525461336872473e-05, + "loss": 0.0077, + "step": 700770 + }, + { + "epoch": 1.82, + "learning_rate": 2.7521573120501008e-05, + "loss": 0.0056, + "step": 700780 + }, + { + "epoch": 1.82, + "learning_rate": 2.7517684904129543e-05, + "loss": 0.0094, + "step": 700790 + }, + { + "epoch": 1.82, + "learning_rate": 2.7513796687758078e-05, + "loss": 0.0066, + "step": 700800 + }, + { + "epoch": 1.82, + "learning_rate": 2.7509908471386616e-05, + "loss": 0.0066, + "step": 700810 + }, + { + "epoch": 1.82, + "learning_rate": 2.750602025501515e-05, + "loss": 0.0067, + "step": 700820 + }, + { + "epoch": 1.82, + "learning_rate": 2.7502132038643686e-05, + "loss": 0.0104, + "step": 700830 + }, + { + "epoch": 1.82, + "learning_rate": 2.7498243822272217e-05, + "loss": 0.0075, + "step": 700840 + }, + { + "epoch": 1.82, + "learning_rate": 2.7494355605900752e-05, + "loss": 0.0081, + "step": 700850 + }, + { + "epoch": 1.82, + "learning_rate": 2.749046738952929e-05, + "loss": 0.0086, + "step": 700860 + }, + { + "epoch": 1.82, + "learning_rate": 2.7486579173157825e-05, + "loss": 0.0087, + "step": 700870 + }, + { + "epoch": 1.82, + "learning_rate": 2.748269095678636e-05, + "loss": 0.0052, + "step": 700880 + }, + { + "epoch": 1.82, + "learning_rate": 2.7478802740414895e-05, + "loss": 0.0082, + "step": 700890 + }, + { + "epoch": 1.82, + "learning_rate": 2.7474914524043433e-05, + "loss": 0.0059, + "step": 700900 + }, + { + "epoch": 1.82, + "learning_rate": 2.7471026307671968e-05, + "loss": 0.0096, + "step": 700910 + }, + { + "epoch": 1.82, + "learning_rate": 2.7467138091300503e-05, + "loss": 0.0057, + "step": 700920 + }, + { + "epoch": 1.82, + "learning_rate": 2.7463249874929038e-05, + "loss": 0.0095, + "step": 700930 + }, + { + "epoch": 1.82, + "learning_rate": 2.7459361658557573e-05, + "loss": 0.0105, + "step": 700940 + }, + { + "epoch": 1.82, + "learning_rate": 2.745547344218611e-05, + "loss": 0.0063, + "step": 700950 + }, + { + "epoch": 1.82, + "learning_rate": 2.7451585225814646e-05, + "loss": 0.01, + "step": 700960 + }, + { + "epoch": 1.82, + "learning_rate": 2.7447697009443177e-05, + "loss": 0.0058, + "step": 700970 + }, + { + "epoch": 1.82, + "learning_rate": 2.7443808793071712e-05, + "loss": 0.0057, + "step": 700980 + }, + { + "epoch": 1.82, + "learning_rate": 2.7439920576700247e-05, + "loss": 0.0089, + "step": 700990 + }, + { + "epoch": 1.82, + "learning_rate": 2.7436032360328785e-05, + "loss": 0.0071, + "step": 701000 + }, + { + "epoch": 1.82, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.0047097280621528625, + "eval_runtime": 107.7701, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.64, + "step": 701000 + }, + { + "epoch": 1.82, + "learning_rate": 2.743214414395732e-05, + "loss": 0.0093, + "step": 701010 + }, + { + "epoch": 1.82, + "learning_rate": 2.7428255927585855e-05, + "loss": 0.0052, + "step": 701020 + }, + { + "epoch": 1.82, + "learning_rate": 2.742436771121439e-05, + "loss": 0.0073, + "step": 701030 + }, + { + "epoch": 1.82, + "learning_rate": 2.7420479494842928e-05, + "loss": 0.004, + "step": 701040 + }, + { + "epoch": 1.82, + "learning_rate": 2.7416591278471463e-05, + "loss": 0.0088, + "step": 701050 + }, + { + "epoch": 1.82, + "learning_rate": 2.7412703062099998e-05, + "loss": 0.0077, + "step": 701060 + }, + { + "epoch": 1.82, + "learning_rate": 2.7408814845728533e-05, + "loss": 0.0071, + "step": 701070 + }, + { + "epoch": 1.82, + "learning_rate": 2.740492662935707e-05, + "loss": 0.007, + "step": 701080 + }, + { + "epoch": 1.82, + "learning_rate": 2.7401038412985602e-05, + "loss": 0.0057, + "step": 701090 + }, + { + "epoch": 1.82, + "learning_rate": 2.7397150196614137e-05, + "loss": 0.0064, + "step": 701100 + }, + { + "epoch": 1.82, + "learning_rate": 2.7393261980242672e-05, + "loss": 0.008, + "step": 701110 + }, + { + "epoch": 1.82, + "learning_rate": 2.7389373763871207e-05, + "loss": 0.0078, + "step": 701120 + }, + { + "epoch": 1.82, + "learning_rate": 2.7385485547499745e-05, + "loss": 0.0082, + "step": 701130 + }, + { + "epoch": 1.82, + "learning_rate": 2.738159733112828e-05, + "loss": 0.0068, + "step": 701140 + }, + { + "epoch": 1.82, + "learning_rate": 2.7377709114756815e-05, + "loss": 0.0072, + "step": 701150 + }, + { + "epoch": 1.82, + "learning_rate": 2.737382089838535e-05, + "loss": 0.0077, + "step": 701160 + }, + { + "epoch": 1.82, + "learning_rate": 2.7369932682013888e-05, + "loss": 0.007, + "step": 701170 + }, + { + "epoch": 1.82, + "learning_rate": 2.7366044465642423e-05, + "loss": 0.0107, + "step": 701180 + }, + { + "epoch": 1.82, + "learning_rate": 2.7362156249270958e-05, + "loss": 0.0069, + "step": 701190 + }, + { + "epoch": 1.82, + "learning_rate": 2.7358268032899493e-05, + "loss": 0.0089, + "step": 701200 + }, + { + "epoch": 1.82, + "learning_rate": 2.735437981652803e-05, + "loss": 0.0071, + "step": 701210 + }, + { + "epoch": 1.82, + "learning_rate": 2.7350491600156562e-05, + "loss": 0.0068, + "step": 701220 + }, + { + "epoch": 1.82, + "learning_rate": 2.7346603383785097e-05, + "loss": 0.0094, + "step": 701230 + }, + { + "epoch": 1.82, + "learning_rate": 2.7342715167413632e-05, + "loss": 0.0094, + "step": 701240 + }, + { + "epoch": 1.82, + "learning_rate": 2.7338826951042167e-05, + "loss": 0.0063, + "step": 701250 + }, + { + "epoch": 1.82, + "learning_rate": 2.7334938734670705e-05, + "loss": 0.0073, + "step": 701260 + }, + { + "epoch": 1.82, + "learning_rate": 2.733105051829924e-05, + "loss": 0.0062, + "step": 701270 + }, + { + "epoch": 1.82, + "learning_rate": 2.7327162301927775e-05, + "loss": 0.0089, + "step": 701280 + }, + { + "epoch": 1.82, + "learning_rate": 2.732327408555631e-05, + "loss": 0.0074, + "step": 701290 + }, + { + "epoch": 1.82, + "learning_rate": 2.7319385869184848e-05, + "loss": 0.0062, + "step": 701300 + }, + { + "epoch": 1.82, + "learning_rate": 2.7315497652813383e-05, + "loss": 0.0063, + "step": 701310 + }, + { + "epoch": 1.82, + "learning_rate": 2.7311609436441918e-05, + "loss": 0.0062, + "step": 701320 + }, + { + "epoch": 1.82, + "learning_rate": 2.7307721220070453e-05, + "loss": 0.0061, + "step": 701330 + }, + { + "epoch": 1.82, + "learning_rate": 2.7303833003698984e-05, + "loss": 0.0088, + "step": 701340 + }, + { + "epoch": 1.82, + "learning_rate": 2.7299944787327522e-05, + "loss": 0.0075, + "step": 701350 + }, + { + "epoch": 1.82, + "learning_rate": 2.7296056570956057e-05, + "loss": 0.0071, + "step": 701360 + }, + { + "epoch": 1.82, + "learning_rate": 2.7292168354584592e-05, + "loss": 0.0054, + "step": 701370 + }, + { + "epoch": 1.82, + "learning_rate": 2.7288280138213127e-05, + "loss": 0.0126, + "step": 701380 + }, + { + "epoch": 1.82, + "learning_rate": 2.7284391921841665e-05, + "loss": 0.0069, + "step": 701390 + }, + { + "epoch": 1.82, + "learning_rate": 2.72805037054702e-05, + "loss": 0.0065, + "step": 701400 + }, + { + "epoch": 1.82, + "learning_rate": 2.7276615489098735e-05, + "loss": 0.0071, + "step": 701410 + }, + { + "epoch": 1.82, + "learning_rate": 2.727272727272727e-05, + "loss": 0.0075, + "step": 701420 + }, + { + "epoch": 1.82, + "learning_rate": 2.7268839056355808e-05, + "loss": 0.0131, + "step": 701430 + }, + { + "epoch": 1.82, + "learning_rate": 2.7264950839984343e-05, + "loss": 0.0075, + "step": 701440 + }, + { + "epoch": 1.82, + "learning_rate": 2.7261062623612878e-05, + "loss": 0.0078, + "step": 701450 + }, + { + "epoch": 1.82, + "learning_rate": 2.725717440724141e-05, + "loss": 0.0069, + "step": 701460 + }, + { + "epoch": 1.82, + "learning_rate": 2.7253286190869944e-05, + "loss": 0.0084, + "step": 701470 + }, + { + "epoch": 1.82, + "learning_rate": 2.7249397974498482e-05, + "loss": 0.0061, + "step": 701480 + }, + { + "epoch": 1.82, + "learning_rate": 2.7245509758127017e-05, + "loss": 0.0073, + "step": 701490 + }, + { + "epoch": 1.82, + "learning_rate": 2.7241621541755552e-05, + "loss": 0.0086, + "step": 701500 + }, + { + "epoch": 1.82, + "learning_rate": 2.7237733325384087e-05, + "loss": 0.0058, + "step": 701510 + }, + { + "epoch": 1.82, + "learning_rate": 2.7233845109012625e-05, + "loss": 0.0071, + "step": 701520 + }, + { + "epoch": 1.82, + "learning_rate": 2.722995689264116e-05, + "loss": 0.0049, + "step": 701530 + }, + { + "epoch": 1.82, + "learning_rate": 2.7226068676269695e-05, + "loss": 0.0067, + "step": 701540 + }, + { + "epoch": 1.82, + "learning_rate": 2.722218045989823e-05, + "loss": 0.0106, + "step": 701550 + }, + { + "epoch": 1.82, + "learning_rate": 2.7218292243526768e-05, + "loss": 0.0057, + "step": 701560 + }, + { + "epoch": 1.82, + "learning_rate": 2.7214404027155303e-05, + "loss": 0.01, + "step": 701570 + }, + { + "epoch": 1.82, + "learning_rate": 2.7210515810783838e-05, + "loss": 0.0082, + "step": 701580 + }, + { + "epoch": 1.82, + "learning_rate": 2.720662759441237e-05, + "loss": 0.0071, + "step": 701590 + }, + { + "epoch": 1.82, + "learning_rate": 2.7202739378040904e-05, + "loss": 0.0074, + "step": 701600 + }, + { + "epoch": 1.82, + "learning_rate": 2.7198851161669442e-05, + "loss": 0.0089, + "step": 701610 + }, + { + "epoch": 1.82, + "learning_rate": 2.7194962945297977e-05, + "loss": 0.0082, + "step": 701620 + }, + { + "epoch": 1.82, + "learning_rate": 2.7191074728926512e-05, + "loss": 0.0057, + "step": 701630 + }, + { + "epoch": 1.82, + "learning_rate": 2.7187186512555047e-05, + "loss": 0.0075, + "step": 701640 + }, + { + "epoch": 1.82, + "learning_rate": 2.7183298296183585e-05, + "loss": 0.0063, + "step": 701650 + }, + { + "epoch": 1.82, + "learning_rate": 2.717941007981212e-05, + "loss": 0.0075, + "step": 701660 + }, + { + "epoch": 1.82, + "learning_rate": 2.7175521863440655e-05, + "loss": 0.0076, + "step": 701670 + }, + { + "epoch": 1.82, + "learning_rate": 2.717163364706919e-05, + "loss": 0.0098, + "step": 701680 + }, + { + "epoch": 1.82, + "learning_rate": 2.7167745430697728e-05, + "loss": 0.0097, + "step": 701690 + }, + { + "epoch": 1.82, + "learning_rate": 2.7163857214326263e-05, + "loss": 0.008, + "step": 701700 + }, + { + "epoch": 1.82, + "learning_rate": 2.7159968997954794e-05, + "loss": 0.0054, + "step": 701710 + }, + { + "epoch": 1.82, + "learning_rate": 2.715608078158333e-05, + "loss": 0.0062, + "step": 701720 + }, + { + "epoch": 1.82, + "learning_rate": 2.7152192565211864e-05, + "loss": 0.0065, + "step": 701730 + }, + { + "epoch": 1.82, + "learning_rate": 2.7148304348840402e-05, + "loss": 0.011, + "step": 701740 + }, + { + "epoch": 1.82, + "learning_rate": 2.7144416132468937e-05, + "loss": 0.0068, + "step": 701750 + }, + { + "epoch": 1.82, + "learning_rate": 2.7140527916097472e-05, + "loss": 0.0066, + "step": 701760 + }, + { + "epoch": 1.82, + "learning_rate": 2.7136639699726007e-05, + "loss": 0.0081, + "step": 701770 + }, + { + "epoch": 1.82, + "learning_rate": 2.7132751483354545e-05, + "loss": 0.0058, + "step": 701780 + }, + { + "epoch": 1.82, + "learning_rate": 2.712886326698308e-05, + "loss": 0.0081, + "step": 701790 + }, + { + "epoch": 1.82, + "learning_rate": 2.7124975050611615e-05, + "loss": 0.008, + "step": 701800 + }, + { + "epoch": 1.82, + "learning_rate": 2.712108683424015e-05, + "loss": 0.008, + "step": 701810 + }, + { + "epoch": 1.82, + "learning_rate": 2.7117198617868688e-05, + "loss": 0.0056, + "step": 701820 + }, + { + "epoch": 1.82, + "learning_rate": 2.7113310401497223e-05, + "loss": 0.0082, + "step": 701830 + }, + { + "epoch": 1.82, + "learning_rate": 2.7109422185125754e-05, + "loss": 0.0066, + "step": 701840 + }, + { + "epoch": 1.82, + "learning_rate": 2.710553396875429e-05, + "loss": 0.005, + "step": 701850 + }, + { + "epoch": 1.82, + "learning_rate": 2.7101645752382824e-05, + "loss": 0.0055, + "step": 701860 + }, + { + "epoch": 1.82, + "learning_rate": 2.7097757536011362e-05, + "loss": 0.0083, + "step": 701870 + }, + { + "epoch": 1.82, + "learning_rate": 2.7093869319639897e-05, + "loss": 0.0067, + "step": 701880 + }, + { + "epoch": 1.82, + "learning_rate": 2.7089981103268432e-05, + "loss": 0.0079, + "step": 701890 + }, + { + "epoch": 1.82, + "learning_rate": 2.7086092886896967e-05, + "loss": 0.0091, + "step": 701900 + }, + { + "epoch": 1.82, + "learning_rate": 2.7082204670525505e-05, + "loss": 0.0086, + "step": 701910 + }, + { + "epoch": 1.82, + "learning_rate": 2.707831645415404e-05, + "loss": 0.0077, + "step": 701920 + }, + { + "epoch": 1.82, + "learning_rate": 2.7074428237782575e-05, + "loss": 0.0082, + "step": 701930 + }, + { + "epoch": 1.82, + "learning_rate": 2.707054002141111e-05, + "loss": 0.0087, + "step": 701940 + }, + { + "epoch": 1.82, + "learning_rate": 2.7066651805039648e-05, + "loss": 0.0089, + "step": 701950 + }, + { + "epoch": 1.82, + "learning_rate": 2.706276358866818e-05, + "loss": 0.0074, + "step": 701960 + }, + { + "epoch": 1.82, + "learning_rate": 2.7058875372296714e-05, + "loss": 0.007, + "step": 701970 + }, + { + "epoch": 1.82, + "learning_rate": 2.705498715592525e-05, + "loss": 0.0049, + "step": 701980 + }, + { + "epoch": 1.82, + "learning_rate": 2.7051098939553784e-05, + "loss": 0.0074, + "step": 701990 + }, + { + "epoch": 1.82, + "learning_rate": 2.7047210723182322e-05, + "loss": 0.0054, + "step": 702000 + }, + { + "epoch": 1.82, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004621751606464386, + "eval_runtime": 107.8759, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 702000 + }, + { + "epoch": 1.82, + "learning_rate": 2.7043322506810857e-05, + "loss": 0.0067, + "step": 702010 + }, + { + "epoch": 1.82, + "learning_rate": 2.7039434290439392e-05, + "loss": 0.0087, + "step": 702020 + }, + { + "epoch": 1.82, + "learning_rate": 2.7035546074067927e-05, + "loss": 0.01, + "step": 702030 + }, + { + "epoch": 1.82, + "learning_rate": 2.7031657857696465e-05, + "loss": 0.0076, + "step": 702040 + }, + { + "epoch": 1.82, + "learning_rate": 2.7027769641325e-05, + "loss": 0.0104, + "step": 702050 + }, + { + "epoch": 1.82, + "learning_rate": 2.7023881424953535e-05, + "loss": 0.0057, + "step": 702060 + }, + { + "epoch": 1.82, + "learning_rate": 2.701999320858207e-05, + "loss": 0.0092, + "step": 702070 + }, + { + "epoch": 1.82, + "learning_rate": 2.70161049922106e-05, + "loss": 0.0079, + "step": 702080 + }, + { + "epoch": 1.82, + "learning_rate": 2.701221677583914e-05, + "loss": 0.0052, + "step": 702090 + }, + { + "epoch": 1.82, + "learning_rate": 2.7008328559467674e-05, + "loss": 0.0057, + "step": 702100 + }, + { + "epoch": 1.82, + "learning_rate": 2.700444034309621e-05, + "loss": 0.008, + "step": 702110 + }, + { + "epoch": 1.82, + "learning_rate": 2.7000552126724744e-05, + "loss": 0.008, + "step": 702120 + }, + { + "epoch": 1.82, + "learning_rate": 2.6996663910353282e-05, + "loss": 0.0093, + "step": 702130 + }, + { + "epoch": 1.82, + "learning_rate": 2.6992775693981817e-05, + "loss": 0.0076, + "step": 702140 + }, + { + "epoch": 1.82, + "learning_rate": 2.6988887477610352e-05, + "loss": 0.0077, + "step": 702150 + }, + { + "epoch": 1.82, + "learning_rate": 2.6984999261238887e-05, + "loss": 0.0047, + "step": 702160 + }, + { + "epoch": 1.82, + "learning_rate": 2.6981111044867425e-05, + "loss": 0.0049, + "step": 702170 + }, + { + "epoch": 1.82, + "learning_rate": 2.697722282849596e-05, + "loss": 0.0064, + "step": 702180 + }, + { + "epoch": 1.82, + "learning_rate": 2.6973334612124495e-05, + "loss": 0.0092, + "step": 702190 + }, + { + "epoch": 1.82, + "learning_rate": 2.696944639575303e-05, + "loss": 0.006, + "step": 702200 + }, + { + "epoch": 1.82, + "learning_rate": 2.696555817938156e-05, + "loss": 0.0071, + "step": 702210 + }, + { + "epoch": 1.82, + "learning_rate": 2.69616699630101e-05, + "loss": 0.0087, + "step": 702220 + }, + { + "epoch": 1.82, + "learning_rate": 2.6957781746638634e-05, + "loss": 0.0081, + "step": 702230 + }, + { + "epoch": 1.82, + "learning_rate": 2.695389353026717e-05, + "loss": 0.0066, + "step": 702240 + }, + { + "epoch": 1.82, + "learning_rate": 2.6950005313895704e-05, + "loss": 0.0085, + "step": 702250 + }, + { + "epoch": 1.82, + "learning_rate": 2.6946117097524242e-05, + "loss": 0.0112, + "step": 702260 + }, + { + "epoch": 1.82, + "learning_rate": 2.6942228881152777e-05, + "loss": 0.0129, + "step": 702270 + }, + { + "epoch": 1.82, + "learning_rate": 2.6938340664781312e-05, + "loss": 0.0087, + "step": 702280 + }, + { + "epoch": 1.82, + "learning_rate": 2.6934452448409847e-05, + "loss": 0.006, + "step": 702290 + }, + { + "epoch": 1.82, + "learning_rate": 2.693056423203838e-05, + "loss": 0.006, + "step": 702300 + }, + { + "epoch": 1.82, + "learning_rate": 2.692667601566692e-05, + "loss": 0.0049, + "step": 702310 + }, + { + "epoch": 1.82, + "learning_rate": 2.6922787799295455e-05, + "loss": 0.0062, + "step": 702320 + }, + { + "epoch": 1.82, + "learning_rate": 2.6918899582923986e-05, + "loss": 0.0056, + "step": 702330 + }, + { + "epoch": 1.82, + "learning_rate": 2.691501136655252e-05, + "loss": 0.0087, + "step": 702340 + }, + { + "epoch": 1.82, + "learning_rate": 2.6911123150181056e-05, + "loss": 0.0091, + "step": 702350 + }, + { + "epoch": 1.82, + "learning_rate": 2.6907234933809594e-05, + "loss": 0.0101, + "step": 702360 + }, + { + "epoch": 1.82, + "learning_rate": 2.690334671743813e-05, + "loss": 0.0064, + "step": 702370 + }, + { + "epoch": 1.82, + "learning_rate": 2.6899458501066664e-05, + "loss": 0.0083, + "step": 702380 + }, + { + "epoch": 1.82, + "learning_rate": 2.68955702846952e-05, + "loss": 0.006, + "step": 702390 + }, + { + "epoch": 1.82, + "learning_rate": 2.6891682068323737e-05, + "loss": 0.0066, + "step": 702400 + }, + { + "epoch": 1.82, + "learning_rate": 2.6887793851952272e-05, + "loss": 0.0072, + "step": 702410 + }, + { + "epoch": 1.82, + "learning_rate": 2.6883905635580807e-05, + "loss": 0.0069, + "step": 702420 + }, + { + "epoch": 1.82, + "learning_rate": 2.688001741920934e-05, + "loss": 0.0087, + "step": 702430 + }, + { + "epoch": 1.82, + "learning_rate": 2.687612920283788e-05, + "loss": 0.0084, + "step": 702440 + }, + { + "epoch": 1.82, + "learning_rate": 2.6872240986466415e-05, + "loss": 0.0083, + "step": 702450 + }, + { + "epoch": 1.82, + "learning_rate": 2.6868352770094946e-05, + "loss": 0.0114, + "step": 702460 + }, + { + "epoch": 1.82, + "learning_rate": 2.686446455372348e-05, + "loss": 0.0067, + "step": 702470 + }, + { + "epoch": 1.82, + "learning_rate": 2.6860576337352016e-05, + "loss": 0.0084, + "step": 702480 + }, + { + "epoch": 1.82, + "learning_rate": 2.6856688120980554e-05, + "loss": 0.0068, + "step": 702490 + }, + { + "epoch": 1.82, + "learning_rate": 2.685279990460909e-05, + "loss": 0.0064, + "step": 702500 + }, + { + "epoch": 1.82, + "learning_rate": 2.6848911688237624e-05, + "loss": 0.0054, + "step": 702510 + }, + { + "epoch": 1.82, + "learning_rate": 2.684502347186616e-05, + "loss": 0.0077, + "step": 702520 + }, + { + "epoch": 1.82, + "learning_rate": 2.6841135255494697e-05, + "loss": 0.0096, + "step": 702530 + }, + { + "epoch": 1.82, + "learning_rate": 2.6837247039123232e-05, + "loss": 0.007, + "step": 702540 + }, + { + "epoch": 1.82, + "learning_rate": 2.6833358822751767e-05, + "loss": 0.0062, + "step": 702550 + }, + { + "epoch": 1.82, + "learning_rate": 2.68294706063803e-05, + "loss": 0.0062, + "step": 702560 + }, + { + "epoch": 1.82, + "learning_rate": 2.682558239000884e-05, + "loss": 0.0075, + "step": 702570 + }, + { + "epoch": 1.82, + "learning_rate": 2.682169417363737e-05, + "loss": 0.0068, + "step": 702580 + }, + { + "epoch": 1.82, + "learning_rate": 2.6817805957265906e-05, + "loss": 0.0079, + "step": 702590 + }, + { + "epoch": 1.82, + "learning_rate": 2.681391774089444e-05, + "loss": 0.0097, + "step": 702600 + }, + { + "epoch": 1.82, + "learning_rate": 2.6810029524522976e-05, + "loss": 0.0071, + "step": 702610 + }, + { + "epoch": 1.82, + "learning_rate": 2.6806141308151514e-05, + "loss": 0.0061, + "step": 702620 + }, + { + "epoch": 1.82, + "learning_rate": 2.680225309178005e-05, + "loss": 0.0058, + "step": 702630 + }, + { + "epoch": 1.82, + "learning_rate": 2.6798364875408584e-05, + "loss": 0.0063, + "step": 702640 + }, + { + "epoch": 1.82, + "learning_rate": 2.679447665903712e-05, + "loss": 0.0082, + "step": 702650 + }, + { + "epoch": 1.82, + "learning_rate": 2.6790588442665657e-05, + "loss": 0.0104, + "step": 702660 + }, + { + "epoch": 1.82, + "learning_rate": 2.6786700226294192e-05, + "loss": 0.0073, + "step": 702670 + }, + { + "epoch": 1.82, + "learning_rate": 2.6782812009922727e-05, + "loss": 0.0071, + "step": 702680 + }, + { + "epoch": 1.82, + "learning_rate": 2.677892379355126e-05, + "loss": 0.0095, + "step": 702690 + }, + { + "epoch": 1.82, + "learning_rate": 2.67750355771798e-05, + "loss": 0.006, + "step": 702700 + }, + { + "epoch": 1.82, + "learning_rate": 2.677114736080833e-05, + "loss": 0.0117, + "step": 702710 + }, + { + "epoch": 1.82, + "learning_rate": 2.6767259144436866e-05, + "loss": 0.0076, + "step": 702720 + }, + { + "epoch": 1.82, + "learning_rate": 2.67633709280654e-05, + "loss": 0.0063, + "step": 702730 + }, + { + "epoch": 1.82, + "learning_rate": 2.6759482711693936e-05, + "loss": 0.0079, + "step": 702740 + }, + { + "epoch": 1.82, + "learning_rate": 2.6755594495322474e-05, + "loss": 0.0076, + "step": 702750 + }, + { + "epoch": 1.82, + "learning_rate": 2.675170627895101e-05, + "loss": 0.0053, + "step": 702760 + }, + { + "epoch": 1.82, + "learning_rate": 2.6747818062579544e-05, + "loss": 0.0063, + "step": 702770 + }, + { + "epoch": 1.82, + "learning_rate": 2.674392984620808e-05, + "loss": 0.0091, + "step": 702780 + }, + { + "epoch": 1.82, + "learning_rate": 2.6740041629836617e-05, + "loss": 0.0057, + "step": 702790 + }, + { + "epoch": 1.82, + "learning_rate": 2.6736153413465152e-05, + "loss": 0.0078, + "step": 702800 + }, + { + "epoch": 1.82, + "learning_rate": 2.6732265197093687e-05, + "loss": 0.0074, + "step": 702810 + }, + { + "epoch": 1.82, + "learning_rate": 2.672837698072222e-05, + "loss": 0.007, + "step": 702820 + }, + { + "epoch": 1.82, + "learning_rate": 2.6724488764350753e-05, + "loss": 0.0061, + "step": 702830 + }, + { + "epoch": 1.82, + "learning_rate": 2.672060054797929e-05, + "loss": 0.0106, + "step": 702840 + }, + { + "epoch": 1.82, + "learning_rate": 2.6716712331607826e-05, + "loss": 0.0068, + "step": 702850 + }, + { + "epoch": 1.82, + "learning_rate": 2.671282411523636e-05, + "loss": 0.0055, + "step": 702860 + }, + { + "epoch": 1.82, + "learning_rate": 2.6708935898864896e-05, + "loss": 0.0096, + "step": 702870 + }, + { + "epoch": 1.82, + "learning_rate": 2.6705047682493434e-05, + "loss": 0.0086, + "step": 702880 + }, + { + "epoch": 1.82, + "learning_rate": 2.670115946612197e-05, + "loss": 0.0102, + "step": 702890 + }, + { + "epoch": 1.82, + "learning_rate": 2.6697271249750504e-05, + "loss": 0.0063, + "step": 702900 + }, + { + "epoch": 1.82, + "learning_rate": 2.669338303337904e-05, + "loss": 0.0107, + "step": 702910 + }, + { + "epoch": 1.82, + "learning_rate": 2.6689494817007577e-05, + "loss": 0.0067, + "step": 702920 + }, + { + "epoch": 1.82, + "learning_rate": 2.6685606600636112e-05, + "loss": 0.0075, + "step": 702930 + }, + { + "epoch": 1.82, + "learning_rate": 2.6681718384264647e-05, + "loss": 0.0083, + "step": 702940 + }, + { + "epoch": 1.82, + "learning_rate": 2.6677830167893178e-05, + "loss": 0.0077, + "step": 702950 + }, + { + "epoch": 1.82, + "learning_rate": 2.6673941951521713e-05, + "loss": 0.0071, + "step": 702960 + }, + { + "epoch": 1.82, + "learning_rate": 2.667005373515025e-05, + "loss": 0.0062, + "step": 702970 + }, + { + "epoch": 1.82, + "learning_rate": 2.6666165518778786e-05, + "loss": 0.0063, + "step": 702980 + }, + { + "epoch": 1.82, + "learning_rate": 2.666227730240732e-05, + "loss": 0.0078, + "step": 702990 + }, + { + "epoch": 1.82, + "learning_rate": 2.6658389086035856e-05, + "loss": 0.0066, + "step": 703000 + }, + { + "epoch": 1.82, + "eval_cer": 0.8816453012088664, + "eval_loss": 0.004601156339049339, + "eval_runtime": 107.7473, + "eval_samples_per_second": 18.562, + "eval_steps_per_second": 4.64, + "step": 703000 + }, + { + "epoch": 1.82, + "learning_rate": 2.6654500869664394e-05, + "loss": 0.0082, + "step": 703010 + }, + { + "epoch": 1.82, + "learning_rate": 2.665061265329293e-05, + "loss": 0.0077, + "step": 703020 + }, + { + "epoch": 1.82, + "learning_rate": 2.6646724436921464e-05, + "loss": 0.008, + "step": 703030 + }, + { + "epoch": 1.82, + "learning_rate": 2.664283622055e-05, + "loss": 0.0083, + "step": 703040 + }, + { + "epoch": 1.82, + "learning_rate": 2.6638948004178537e-05, + "loss": 0.0101, + "step": 703050 + }, + { + "epoch": 1.82, + "learning_rate": 2.6635059787807072e-05, + "loss": 0.0065, + "step": 703060 + }, + { + "epoch": 1.82, + "learning_rate": 2.6631171571435607e-05, + "loss": 0.0068, + "step": 703070 + }, + { + "epoch": 1.82, + "learning_rate": 2.6627283355064138e-05, + "loss": 0.0075, + "step": 703080 + }, + { + "epoch": 1.82, + "learning_rate": 2.6623395138692673e-05, + "loss": 0.0084, + "step": 703090 + }, + { + "epoch": 1.82, + "learning_rate": 2.661950692232121e-05, + "loss": 0.0063, + "step": 703100 + }, + { + "epoch": 1.82, + "learning_rate": 2.6615618705949746e-05, + "loss": 0.0091, + "step": 703110 + }, + { + "epoch": 1.82, + "learning_rate": 2.661173048957828e-05, + "loss": 0.0072, + "step": 703120 + }, + { + "epoch": 1.82, + "learning_rate": 2.6607842273206816e-05, + "loss": 0.0073, + "step": 703130 + }, + { + "epoch": 1.82, + "learning_rate": 2.6603954056835354e-05, + "loss": 0.0064, + "step": 703140 + }, + { + "epoch": 1.82, + "learning_rate": 2.660006584046389e-05, + "loss": 0.0101, + "step": 703150 + }, + { + "epoch": 1.82, + "learning_rate": 2.6596177624092424e-05, + "loss": 0.0067, + "step": 703160 + }, + { + "epoch": 1.82, + "learning_rate": 2.659228940772096e-05, + "loss": 0.0092, + "step": 703170 + }, + { + "epoch": 1.82, + "learning_rate": 2.6588401191349497e-05, + "loss": 0.0063, + "step": 703180 + }, + { + "epoch": 1.82, + "learning_rate": 2.658451297497803e-05, + "loss": 0.0059, + "step": 703190 + }, + { + "epoch": 1.82, + "learning_rate": 2.6580624758606563e-05, + "loss": 0.0077, + "step": 703200 + }, + { + "epoch": 1.82, + "learning_rate": 2.6576736542235098e-05, + "loss": 0.0071, + "step": 703210 + }, + { + "epoch": 1.82, + "learning_rate": 2.6572848325863633e-05, + "loss": 0.0064, + "step": 703220 + }, + { + "epoch": 1.82, + "learning_rate": 2.656896010949217e-05, + "loss": 0.0148, + "step": 703230 + }, + { + "epoch": 1.82, + "learning_rate": 2.6565071893120706e-05, + "loss": 0.0053, + "step": 703240 + }, + { + "epoch": 1.82, + "learning_rate": 2.656118367674924e-05, + "loss": 0.0079, + "step": 703250 + }, + { + "epoch": 1.82, + "learning_rate": 2.6557295460377776e-05, + "loss": 0.0067, + "step": 703260 + }, + { + "epoch": 1.82, + "learning_rate": 2.6553407244006314e-05, + "loss": 0.0081, + "step": 703270 + }, + { + "epoch": 1.82, + "learning_rate": 2.654951902763485e-05, + "loss": 0.0077, + "step": 703280 + }, + { + "epoch": 1.82, + "learning_rate": 2.6545630811263384e-05, + "loss": 0.0079, + "step": 703290 + }, + { + "epoch": 1.82, + "learning_rate": 2.654174259489192e-05, + "loss": 0.0075, + "step": 703300 + }, + { + "epoch": 1.82, + "learning_rate": 2.6537854378520457e-05, + "loss": 0.0079, + "step": 703310 + }, + { + "epoch": 1.82, + "learning_rate": 2.653396616214899e-05, + "loss": 0.0068, + "step": 703320 + }, + { + "epoch": 1.82, + "learning_rate": 2.6530077945777523e-05, + "loss": 0.0072, + "step": 703330 + }, + { + "epoch": 1.82, + "learning_rate": 2.6526189729406058e-05, + "loss": 0.008, + "step": 703340 + }, + { + "epoch": 1.82, + "learning_rate": 2.6522301513034593e-05, + "loss": 0.0092, + "step": 703350 + }, + { + "epoch": 1.82, + "learning_rate": 2.651841329666313e-05, + "loss": 0.0069, + "step": 703360 + }, + { + "epoch": 1.82, + "learning_rate": 2.6514525080291666e-05, + "loss": 0.0085, + "step": 703370 + }, + { + "epoch": 1.82, + "learning_rate": 2.65106368639202e-05, + "loss": 0.0084, + "step": 703380 + }, + { + "epoch": 1.82, + "learning_rate": 2.6506748647548736e-05, + "loss": 0.0089, + "step": 703390 + }, + { + "epoch": 1.82, + "learning_rate": 2.6502860431177274e-05, + "loss": 0.0094, + "step": 703400 + }, + { + "epoch": 1.82, + "learning_rate": 2.649897221480581e-05, + "loss": 0.0061, + "step": 703410 + }, + { + "epoch": 1.82, + "learning_rate": 2.6495083998434344e-05, + "loss": 0.0079, + "step": 703420 + }, + { + "epoch": 1.82, + "learning_rate": 2.649119578206288e-05, + "loss": 0.0079, + "step": 703430 + }, + { + "epoch": 1.82, + "learning_rate": 2.6487307565691417e-05, + "loss": 0.0071, + "step": 703440 + }, + { + "epoch": 1.82, + "learning_rate": 2.6483419349319948e-05, + "loss": 0.0068, + "step": 703450 + }, + { + "epoch": 1.82, + "learning_rate": 2.6479531132948483e-05, + "loss": 0.0068, + "step": 703460 + }, + { + "epoch": 1.82, + "learning_rate": 2.6475642916577018e-05, + "loss": 0.0077, + "step": 703470 + }, + { + "epoch": 1.82, + "learning_rate": 2.6471754700205553e-05, + "loss": 0.0083, + "step": 703480 + }, + { + "epoch": 1.82, + "learning_rate": 2.646786648383409e-05, + "loss": 0.0055, + "step": 703490 + }, + { + "epoch": 1.82, + "learning_rate": 2.6463978267462626e-05, + "loss": 0.007, + "step": 703500 + }, + { + "epoch": 1.82, + "learning_rate": 2.646009005109116e-05, + "loss": 0.0085, + "step": 703510 + }, + { + "epoch": 1.82, + "learning_rate": 2.6456201834719696e-05, + "loss": 0.0075, + "step": 703520 + }, + { + "epoch": 1.82, + "learning_rate": 2.6452313618348234e-05, + "loss": 0.0072, + "step": 703530 + }, + { + "epoch": 1.82, + "learning_rate": 2.644842540197677e-05, + "loss": 0.0101, + "step": 703540 + }, + { + "epoch": 1.82, + "learning_rate": 2.6444537185605304e-05, + "loss": 0.0153, + "step": 703550 + }, + { + "epoch": 1.82, + "learning_rate": 2.644064896923384e-05, + "loss": 0.007, + "step": 703560 + }, + { + "epoch": 1.82, + "learning_rate": 2.643676075286237e-05, + "loss": 0.0046, + "step": 703570 + }, + { + "epoch": 1.82, + "learning_rate": 2.6432872536490908e-05, + "loss": 0.0101, + "step": 703580 + }, + { + "epoch": 1.82, + "learning_rate": 2.6428984320119443e-05, + "loss": 0.0068, + "step": 703590 + }, + { + "epoch": 1.82, + "learning_rate": 2.6425096103747978e-05, + "loss": 0.0083, + "step": 703600 + }, + { + "epoch": 1.82, + "learning_rate": 2.6421207887376513e-05, + "loss": 0.007, + "step": 703610 + }, + { + "epoch": 1.82, + "learning_rate": 2.641731967100505e-05, + "loss": 0.0067, + "step": 703620 + }, + { + "epoch": 1.82, + "learning_rate": 2.6413431454633586e-05, + "loss": 0.0067, + "step": 703630 + }, + { + "epoch": 1.82, + "learning_rate": 2.640954323826212e-05, + "loss": 0.0073, + "step": 703640 + }, + { + "epoch": 1.82, + "learning_rate": 2.6405655021890656e-05, + "loss": 0.0078, + "step": 703650 + }, + { + "epoch": 1.82, + "learning_rate": 2.6401766805519194e-05, + "loss": 0.0093, + "step": 703660 + }, + { + "epoch": 1.82, + "learning_rate": 2.639787858914773e-05, + "loss": 0.0087, + "step": 703670 + }, + { + "epoch": 1.82, + "learning_rate": 2.6393990372776264e-05, + "loss": 0.0084, + "step": 703680 + }, + { + "epoch": 1.82, + "learning_rate": 2.63901021564048e-05, + "loss": 0.0075, + "step": 703690 + }, + { + "epoch": 1.82, + "learning_rate": 2.638621394003333e-05, + "loss": 0.0054, + "step": 703700 + }, + { + "epoch": 1.82, + "learning_rate": 2.6382325723661868e-05, + "loss": 0.0077, + "step": 703710 + }, + { + "epoch": 1.82, + "learning_rate": 2.6378437507290403e-05, + "loss": 0.0077, + "step": 703720 + }, + { + "epoch": 1.82, + "learning_rate": 2.6374549290918938e-05, + "loss": 0.0162, + "step": 703730 + }, + { + "epoch": 1.82, + "learning_rate": 2.6370661074547473e-05, + "loss": 0.0084, + "step": 703740 + }, + { + "epoch": 1.82, + "learning_rate": 2.6366772858176008e-05, + "loss": 0.0068, + "step": 703750 + }, + { + "epoch": 1.82, + "learning_rate": 2.6362884641804546e-05, + "loss": 0.0079, + "step": 703760 + }, + { + "epoch": 1.82, + "learning_rate": 2.635899642543308e-05, + "loss": 0.0061, + "step": 703770 + }, + { + "epoch": 1.82, + "learning_rate": 2.6355108209061616e-05, + "loss": 0.0071, + "step": 703780 + }, + { + "epoch": 1.82, + "learning_rate": 2.635121999269015e-05, + "loss": 0.0093, + "step": 703790 + }, + { + "epoch": 1.82, + "learning_rate": 2.634733177631869e-05, + "loss": 0.0181, + "step": 703800 + }, + { + "epoch": 1.82, + "learning_rate": 2.6343443559947224e-05, + "loss": 0.0092, + "step": 703810 + }, + { + "epoch": 1.82, + "learning_rate": 2.6339555343575755e-05, + "loss": 0.0085, + "step": 703820 + }, + { + "epoch": 1.82, + "learning_rate": 2.633566712720429e-05, + "loss": 0.0082, + "step": 703830 + }, + { + "epoch": 1.82, + "learning_rate": 2.6331778910832825e-05, + "loss": 0.0089, + "step": 703840 + }, + { + "epoch": 1.82, + "learning_rate": 2.6327890694461363e-05, + "loss": 0.0094, + "step": 703850 + }, + { + "epoch": 1.82, + "learning_rate": 2.6324002478089898e-05, + "loss": 0.0078, + "step": 703860 + }, + { + "epoch": 1.82, + "learning_rate": 2.6320114261718433e-05, + "loss": 0.0082, + "step": 703870 + }, + { + "epoch": 1.82, + "learning_rate": 2.6316226045346968e-05, + "loss": 0.0077, + "step": 703880 + }, + { + "epoch": 1.82, + "learning_rate": 2.6312337828975506e-05, + "loss": 0.0083, + "step": 703890 + }, + { + "epoch": 1.82, + "learning_rate": 2.630844961260404e-05, + "loss": 0.0074, + "step": 703900 + }, + { + "epoch": 1.82, + "learning_rate": 2.6304561396232576e-05, + "loss": 0.0098, + "step": 703910 + }, + { + "epoch": 1.82, + "learning_rate": 2.630067317986111e-05, + "loss": 0.0111, + "step": 703920 + }, + { + "epoch": 1.82, + "learning_rate": 2.629678496348965e-05, + "loss": 0.0056, + "step": 703930 + }, + { + "epoch": 1.82, + "learning_rate": 2.6292896747118184e-05, + "loss": 0.0086, + "step": 703940 + }, + { + "epoch": 1.82, + "learning_rate": 2.6289008530746715e-05, + "loss": 0.0082, + "step": 703950 + }, + { + "epoch": 1.82, + "learning_rate": 2.628512031437525e-05, + "loss": 0.0079, + "step": 703960 + }, + { + "epoch": 1.82, + "learning_rate": 2.6281232098003785e-05, + "loss": 0.0062, + "step": 703970 + }, + { + "epoch": 1.82, + "learning_rate": 2.6277343881632323e-05, + "loss": 0.005, + "step": 703980 + }, + { + "epoch": 1.82, + "learning_rate": 2.6273455665260858e-05, + "loss": 0.0065, + "step": 703990 + }, + { + "epoch": 1.82, + "learning_rate": 2.6269567448889393e-05, + "loss": 0.0061, + "step": 704000 + }, + { + "epoch": 1.82, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.004665213171392679, + "eval_runtime": 107.9314, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.633, + "step": 704000 + }, + { + "epoch": 1.82, + "learning_rate": 2.6265679232517928e-05, + "loss": 0.0105, + "step": 704010 + }, + { + "epoch": 1.82, + "learning_rate": 2.6261791016146466e-05, + "loss": 0.0067, + "step": 704020 + }, + { + "epoch": 1.82, + "learning_rate": 2.6257902799775e-05, + "loss": 0.0064, + "step": 704030 + }, + { + "epoch": 1.82, + "learning_rate": 2.6254014583403536e-05, + "loss": 0.0073, + "step": 704040 + }, + { + "epoch": 1.82, + "learning_rate": 2.625012636703207e-05, + "loss": 0.0094, + "step": 704050 + }, + { + "epoch": 1.83, + "learning_rate": 2.624623815066061e-05, + "loss": 0.0094, + "step": 704060 + }, + { + "epoch": 1.83, + "learning_rate": 2.624234993428914e-05, + "loss": 0.0053, + "step": 704070 + }, + { + "epoch": 1.83, + "learning_rate": 2.6238461717917675e-05, + "loss": 0.0084, + "step": 704080 + }, + { + "epoch": 1.83, + "learning_rate": 2.623457350154621e-05, + "loss": 0.0057, + "step": 704090 + }, + { + "epoch": 1.83, + "learning_rate": 2.6230685285174745e-05, + "loss": 0.0052, + "step": 704100 + }, + { + "epoch": 1.83, + "learning_rate": 2.6226797068803283e-05, + "loss": 0.0058, + "step": 704110 + }, + { + "epoch": 1.83, + "learning_rate": 2.6222908852431818e-05, + "loss": 0.0076, + "step": 704120 + }, + { + "epoch": 1.83, + "learning_rate": 2.6219020636060353e-05, + "loss": 0.0076, + "step": 704130 + }, + { + "epoch": 1.83, + "learning_rate": 2.6215132419688888e-05, + "loss": 0.0082, + "step": 704140 + }, + { + "epoch": 1.83, + "learning_rate": 2.6211244203317426e-05, + "loss": 0.0063, + "step": 704150 + }, + { + "epoch": 1.83, + "learning_rate": 2.620735598694596e-05, + "loss": 0.0069, + "step": 704160 + }, + { + "epoch": 1.83, + "learning_rate": 2.6203467770574496e-05, + "loss": 0.0073, + "step": 704170 + }, + { + "epoch": 1.83, + "learning_rate": 2.619957955420303e-05, + "loss": 0.0084, + "step": 704180 + }, + { + "epoch": 1.83, + "learning_rate": 2.6195691337831562e-05, + "loss": 0.0102, + "step": 704190 + }, + { + "epoch": 1.83, + "learning_rate": 2.61918031214601e-05, + "loss": 0.0069, + "step": 704200 + }, + { + "epoch": 1.83, + "learning_rate": 2.6187914905088635e-05, + "loss": 0.006, + "step": 704210 + }, + { + "epoch": 1.83, + "learning_rate": 2.618402668871717e-05, + "loss": 0.0079, + "step": 704220 + }, + { + "epoch": 1.83, + "learning_rate": 2.6180138472345705e-05, + "loss": 0.0128, + "step": 704230 + }, + { + "epoch": 1.83, + "learning_rate": 2.6176250255974243e-05, + "loss": 0.0053, + "step": 704240 + }, + { + "epoch": 1.83, + "learning_rate": 2.6172362039602778e-05, + "loss": 0.0073, + "step": 704250 + }, + { + "epoch": 1.83, + "learning_rate": 2.6168473823231313e-05, + "loss": 0.009, + "step": 704260 + }, + { + "epoch": 1.83, + "learning_rate": 2.6164585606859848e-05, + "loss": 0.0071, + "step": 704270 + }, + { + "epoch": 1.83, + "learning_rate": 2.6160697390488386e-05, + "loss": 0.0083, + "step": 704280 + }, + { + "epoch": 1.83, + "learning_rate": 2.615680917411692e-05, + "loss": 0.007, + "step": 704290 + }, + { + "epoch": 1.83, + "learning_rate": 2.6152920957745456e-05, + "loss": 0.0053, + "step": 704300 + }, + { + "epoch": 1.83, + "learning_rate": 2.614903274137399e-05, + "loss": 0.0043, + "step": 704310 + }, + { + "epoch": 1.83, + "learning_rate": 2.6145144525002522e-05, + "loss": 0.007, + "step": 704320 + }, + { + "epoch": 1.83, + "learning_rate": 2.614125630863106e-05, + "loss": 0.007, + "step": 704330 + }, + { + "epoch": 1.83, + "learning_rate": 2.6137368092259595e-05, + "loss": 0.011, + "step": 704340 + }, + { + "epoch": 1.83, + "learning_rate": 2.613347987588813e-05, + "loss": 0.0069, + "step": 704350 + }, + { + "epoch": 1.83, + "learning_rate": 2.6129591659516665e-05, + "loss": 0.0073, + "step": 704360 + }, + { + "epoch": 1.83, + "learning_rate": 2.6125703443145203e-05, + "loss": 0.0127, + "step": 704370 + }, + { + "epoch": 1.83, + "learning_rate": 2.6121815226773738e-05, + "loss": 0.0056, + "step": 704380 + }, + { + "epoch": 1.83, + "learning_rate": 2.6117927010402273e-05, + "loss": 0.0036, + "step": 704390 + }, + { + "epoch": 1.83, + "learning_rate": 2.6114038794030808e-05, + "loss": 0.009, + "step": 704400 + }, + { + "epoch": 1.83, + "learning_rate": 2.6110150577659346e-05, + "loss": 0.0071, + "step": 704410 + }, + { + "epoch": 1.83, + "learning_rate": 2.610626236128788e-05, + "loss": 0.0058, + "step": 704420 + }, + { + "epoch": 1.83, + "learning_rate": 2.6102374144916416e-05, + "loss": 0.0066, + "step": 704430 + }, + { + "epoch": 1.83, + "learning_rate": 2.6098485928544947e-05, + "loss": 0.0071, + "step": 704440 + }, + { + "epoch": 1.83, + "learning_rate": 2.6094597712173482e-05, + "loss": 0.0077, + "step": 704450 + }, + { + "epoch": 1.83, + "learning_rate": 2.609070949580202e-05, + "loss": 0.0089, + "step": 704460 + }, + { + "epoch": 1.83, + "learning_rate": 2.6086821279430555e-05, + "loss": 0.0062, + "step": 704470 + }, + { + "epoch": 1.83, + "learning_rate": 2.608293306305909e-05, + "loss": 0.007, + "step": 704480 + }, + { + "epoch": 1.83, + "learning_rate": 2.6079044846687625e-05, + "loss": 0.0059, + "step": 704490 + }, + { + "epoch": 1.83, + "learning_rate": 2.6075156630316163e-05, + "loss": 0.0079, + "step": 704500 + }, + { + "epoch": 1.83, + "learning_rate": 2.6071268413944698e-05, + "loss": 0.0073, + "step": 704510 + }, + { + "epoch": 1.83, + "learning_rate": 2.6067380197573233e-05, + "loss": 0.005, + "step": 704520 + }, + { + "epoch": 1.83, + "learning_rate": 2.6063491981201768e-05, + "loss": 0.0081, + "step": 704530 + }, + { + "epoch": 1.83, + "learning_rate": 2.6059603764830306e-05, + "loss": 0.0105, + "step": 704540 + }, + { + "epoch": 1.83, + "learning_rate": 2.605571554845884e-05, + "loss": 0.0066, + "step": 704550 + }, + { + "epoch": 1.83, + "learning_rate": 2.6051827332087375e-05, + "loss": 0.0082, + "step": 704560 + }, + { + "epoch": 1.83, + "learning_rate": 2.6047939115715907e-05, + "loss": 0.0079, + "step": 704570 + }, + { + "epoch": 1.83, + "learning_rate": 2.6044050899344442e-05, + "loss": 0.0075, + "step": 704580 + }, + { + "epoch": 1.83, + "learning_rate": 2.604016268297298e-05, + "loss": 0.0075, + "step": 704590 + }, + { + "epoch": 1.83, + "learning_rate": 2.6036274466601515e-05, + "loss": 0.0089, + "step": 704600 + }, + { + "epoch": 1.83, + "learning_rate": 2.603238625023005e-05, + "loss": 0.0078, + "step": 704610 + }, + { + "epoch": 1.83, + "learning_rate": 2.6028498033858585e-05, + "loss": 0.0067, + "step": 704620 + }, + { + "epoch": 1.83, + "learning_rate": 2.6024609817487123e-05, + "loss": 0.0067, + "step": 704630 + }, + { + "epoch": 1.83, + "learning_rate": 2.6020721601115658e-05, + "loss": 0.0059, + "step": 704640 + }, + { + "epoch": 1.83, + "learning_rate": 2.6016833384744193e-05, + "loss": 0.0083, + "step": 704650 + }, + { + "epoch": 1.83, + "learning_rate": 2.6012945168372727e-05, + "loss": 0.0057, + "step": 704660 + }, + { + "epoch": 1.83, + "learning_rate": 2.6009056952001266e-05, + "loss": 0.006, + "step": 704670 + }, + { + "epoch": 1.83, + "learning_rate": 2.60051687356298e-05, + "loss": 0.0076, + "step": 704680 + }, + { + "epoch": 1.83, + "learning_rate": 2.6001280519258332e-05, + "loss": 0.0078, + "step": 704690 + }, + { + "epoch": 1.83, + "learning_rate": 2.5997392302886867e-05, + "loss": 0.0068, + "step": 704700 + }, + { + "epoch": 1.83, + "learning_rate": 2.5993504086515402e-05, + "loss": 0.0068, + "step": 704710 + }, + { + "epoch": 1.83, + "learning_rate": 2.598961587014394e-05, + "loss": 0.0107, + "step": 704720 + }, + { + "epoch": 1.83, + "learning_rate": 2.5985727653772475e-05, + "loss": 0.0097, + "step": 704730 + }, + { + "epoch": 1.83, + "learning_rate": 2.598183943740101e-05, + "loss": 0.0083, + "step": 704740 + }, + { + "epoch": 1.83, + "learning_rate": 2.5977951221029545e-05, + "loss": 0.0068, + "step": 704750 + }, + { + "epoch": 1.83, + "learning_rate": 2.5974063004658083e-05, + "loss": 0.008, + "step": 704760 + }, + { + "epoch": 1.83, + "learning_rate": 2.5970174788286618e-05, + "loss": 0.0064, + "step": 704770 + }, + { + "epoch": 1.83, + "learning_rate": 2.5966286571915153e-05, + "loss": 0.0071, + "step": 704780 + }, + { + "epoch": 1.83, + "learning_rate": 2.5962398355543687e-05, + "loss": 0.0056, + "step": 704790 + }, + { + "epoch": 1.83, + "learning_rate": 2.5958510139172226e-05, + "loss": 0.0065, + "step": 704800 + }, + { + "epoch": 1.83, + "learning_rate": 2.5954621922800757e-05, + "loss": 0.0065, + "step": 704810 + }, + { + "epoch": 1.83, + "learning_rate": 2.5950733706429292e-05, + "loss": 0.0066, + "step": 704820 + }, + { + "epoch": 1.83, + "learning_rate": 2.5946845490057827e-05, + "loss": 0.0076, + "step": 704830 + }, + { + "epoch": 1.83, + "learning_rate": 2.5942957273686362e-05, + "loss": 0.0089, + "step": 704840 + }, + { + "epoch": 1.83, + "learning_rate": 2.59390690573149e-05, + "loss": 0.0067, + "step": 704850 + }, + { + "epoch": 1.83, + "learning_rate": 2.5935180840943435e-05, + "loss": 0.0099, + "step": 704860 + }, + { + "epoch": 1.83, + "learning_rate": 2.593129262457197e-05, + "loss": 0.0056, + "step": 704870 + }, + { + "epoch": 1.83, + "learning_rate": 2.5927404408200505e-05, + "loss": 0.0071, + "step": 704880 + }, + { + "epoch": 1.83, + "learning_rate": 2.5923516191829043e-05, + "loss": 0.0089, + "step": 704890 + }, + { + "epoch": 1.83, + "learning_rate": 2.5919627975457578e-05, + "loss": 0.0076, + "step": 704900 + }, + { + "epoch": 1.83, + "learning_rate": 2.5915739759086113e-05, + "loss": 0.0045, + "step": 704910 + }, + { + "epoch": 1.83, + "learning_rate": 2.5911851542714647e-05, + "loss": 0.0085, + "step": 704920 + }, + { + "epoch": 1.83, + "learning_rate": 2.5907963326343186e-05, + "loss": 0.0081, + "step": 704930 + }, + { + "epoch": 1.83, + "learning_rate": 2.5904075109971717e-05, + "loss": 0.0074, + "step": 704940 + }, + { + "epoch": 1.83, + "learning_rate": 2.5900186893600252e-05, + "loss": 0.0112, + "step": 704950 + }, + { + "epoch": 1.83, + "learning_rate": 2.5896298677228787e-05, + "loss": 0.0088, + "step": 704960 + }, + { + "epoch": 1.83, + "learning_rate": 2.5892410460857322e-05, + "loss": 0.0066, + "step": 704970 + }, + { + "epoch": 1.83, + "learning_rate": 2.588852224448586e-05, + "loss": 0.0101, + "step": 704980 + }, + { + "epoch": 1.83, + "learning_rate": 2.5884634028114395e-05, + "loss": 0.0083, + "step": 704990 + }, + { + "epoch": 1.83, + "learning_rate": 2.588074581174293e-05, + "loss": 0.0078, + "step": 705000 + }, + { + "epoch": 1.83, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.004623005166649818, + "eval_runtime": 107.8175, + "eval_samples_per_second": 18.55, + "eval_steps_per_second": 4.637, + "step": 705000 + }, + { + "epoch": 1.83, + "learning_rate": 2.5876857595371465e-05, + "loss": 0.0086, + "step": 705010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5872969379000003e-05, + "loss": 0.0053, + "step": 705020 + }, + { + "epoch": 1.83, + "learning_rate": 2.5869081162628538e-05, + "loss": 0.0074, + "step": 705030 + }, + { + "epoch": 1.83, + "learning_rate": 2.5865192946257073e-05, + "loss": 0.0071, + "step": 705040 + }, + { + "epoch": 1.83, + "learning_rate": 2.5861304729885607e-05, + "loss": 0.0063, + "step": 705050 + }, + { + "epoch": 1.83, + "learning_rate": 2.585741651351414e-05, + "loss": 0.0061, + "step": 705060 + }, + { + "epoch": 1.83, + "learning_rate": 2.5853528297142677e-05, + "loss": 0.0063, + "step": 705070 + }, + { + "epoch": 1.83, + "learning_rate": 2.5849640080771212e-05, + "loss": 0.0063, + "step": 705080 + }, + { + "epoch": 1.83, + "learning_rate": 2.5845751864399747e-05, + "loss": 0.0056, + "step": 705090 + }, + { + "epoch": 1.83, + "learning_rate": 2.5841863648028282e-05, + "loss": 0.0084, + "step": 705100 + }, + { + "epoch": 1.83, + "learning_rate": 2.5837975431656817e-05, + "loss": 0.0064, + "step": 705110 + }, + { + "epoch": 1.83, + "learning_rate": 2.5834087215285355e-05, + "loss": 0.0062, + "step": 705120 + }, + { + "epoch": 1.83, + "learning_rate": 2.583019899891389e-05, + "loss": 0.0063, + "step": 705130 + }, + { + "epoch": 1.83, + "learning_rate": 2.5826310782542425e-05, + "loss": 0.0079, + "step": 705140 + }, + { + "epoch": 1.83, + "learning_rate": 2.582242256617096e-05, + "loss": 0.0074, + "step": 705150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5818534349799498e-05, + "loss": 0.0058, + "step": 705160 + }, + { + "epoch": 1.83, + "learning_rate": 2.5814646133428033e-05, + "loss": 0.0088, + "step": 705170 + }, + { + "epoch": 1.83, + "learning_rate": 2.5810757917056567e-05, + "loss": 0.006, + "step": 705180 + }, + { + "epoch": 1.83, + "learning_rate": 2.58068697006851e-05, + "loss": 0.0077, + "step": 705190 + }, + { + "epoch": 1.83, + "learning_rate": 2.5802981484313634e-05, + "loss": 0.0075, + "step": 705200 + }, + { + "epoch": 1.83, + "learning_rate": 2.5799093267942172e-05, + "loss": 0.0088, + "step": 705210 + }, + { + "epoch": 1.83, + "learning_rate": 2.5795205051570707e-05, + "loss": 0.0087, + "step": 705220 + }, + { + "epoch": 1.83, + "learning_rate": 2.579131683519924e-05, + "loss": 0.0076, + "step": 705230 + }, + { + "epoch": 1.83, + "learning_rate": 2.5787428618827777e-05, + "loss": 0.0064, + "step": 705240 + }, + { + "epoch": 1.83, + "learning_rate": 2.5783540402456315e-05, + "loss": 0.0088, + "step": 705250 + }, + { + "epoch": 1.83, + "learning_rate": 2.577965218608485e-05, + "loss": 0.0071, + "step": 705260 + }, + { + "epoch": 1.83, + "learning_rate": 2.5775763969713385e-05, + "loss": 0.0083, + "step": 705270 + }, + { + "epoch": 1.83, + "learning_rate": 2.577187575334192e-05, + "loss": 0.0077, + "step": 705280 + }, + { + "epoch": 1.83, + "learning_rate": 2.5767987536970458e-05, + "loss": 0.0082, + "step": 705290 + }, + { + "epoch": 1.83, + "learning_rate": 2.5764099320598992e-05, + "loss": 0.0094, + "step": 705300 + }, + { + "epoch": 1.83, + "learning_rate": 2.5760211104227524e-05, + "loss": 0.0051, + "step": 705310 + }, + { + "epoch": 1.83, + "learning_rate": 2.575632288785606e-05, + "loss": 0.0101, + "step": 705320 + }, + { + "epoch": 1.83, + "learning_rate": 2.5752434671484594e-05, + "loss": 0.0073, + "step": 705330 + }, + { + "epoch": 1.83, + "learning_rate": 2.5748546455113132e-05, + "loss": 0.0053, + "step": 705340 + }, + { + "epoch": 1.83, + "learning_rate": 2.5744658238741667e-05, + "loss": 0.0092, + "step": 705350 + }, + { + "epoch": 1.83, + "learning_rate": 2.57407700223702e-05, + "loss": 0.0078, + "step": 705360 + }, + { + "epoch": 1.83, + "learning_rate": 2.5736881805998737e-05, + "loss": 0.0063, + "step": 705370 + }, + { + "epoch": 1.83, + "learning_rate": 2.5732993589627275e-05, + "loss": 0.0091, + "step": 705380 + }, + { + "epoch": 1.83, + "learning_rate": 2.572910537325581e-05, + "loss": 0.0062, + "step": 705390 + }, + { + "epoch": 1.83, + "learning_rate": 2.5725217156884345e-05, + "loss": 0.0097, + "step": 705400 + }, + { + "epoch": 1.83, + "learning_rate": 2.572132894051288e-05, + "loss": 0.0082, + "step": 705410 + }, + { + "epoch": 1.83, + "learning_rate": 2.5717440724141418e-05, + "loss": 0.0059, + "step": 705420 + }, + { + "epoch": 1.83, + "learning_rate": 2.571355250776995e-05, + "loss": 0.0064, + "step": 705430 + }, + { + "epoch": 1.83, + "learning_rate": 2.5709664291398484e-05, + "loss": 0.0071, + "step": 705440 + }, + { + "epoch": 1.83, + "learning_rate": 2.570577607502702e-05, + "loss": 0.007, + "step": 705450 + }, + { + "epoch": 1.83, + "learning_rate": 2.5701887858655554e-05, + "loss": 0.006, + "step": 705460 + }, + { + "epoch": 1.83, + "learning_rate": 2.5697999642284092e-05, + "loss": 0.0088, + "step": 705470 + }, + { + "epoch": 1.83, + "learning_rate": 2.5694111425912627e-05, + "loss": 0.008, + "step": 705480 + }, + { + "epoch": 1.83, + "learning_rate": 2.569022320954116e-05, + "loss": 0.0074, + "step": 705490 + }, + { + "epoch": 1.83, + "learning_rate": 2.5686334993169697e-05, + "loss": 0.0084, + "step": 705500 + }, + { + "epoch": 1.83, + "learning_rate": 2.5682446776798235e-05, + "loss": 0.0059, + "step": 705510 + }, + { + "epoch": 1.83, + "learning_rate": 2.567855856042677e-05, + "loss": 0.0075, + "step": 705520 + }, + { + "epoch": 1.83, + "learning_rate": 2.5674670344055304e-05, + "loss": 0.0105, + "step": 705530 + }, + { + "epoch": 1.83, + "learning_rate": 2.567078212768384e-05, + "loss": 0.006, + "step": 705540 + }, + { + "epoch": 1.83, + "learning_rate": 2.5666893911312378e-05, + "loss": 0.0091, + "step": 705550 + }, + { + "epoch": 1.83, + "learning_rate": 2.566300569494091e-05, + "loss": 0.0057, + "step": 705560 + }, + { + "epoch": 1.83, + "learning_rate": 2.5659117478569444e-05, + "loss": 0.0097, + "step": 705570 + }, + { + "epoch": 1.83, + "learning_rate": 2.565522926219798e-05, + "loss": 0.0053, + "step": 705580 + }, + { + "epoch": 1.83, + "learning_rate": 2.5651341045826514e-05, + "loss": 0.0067, + "step": 705590 + }, + { + "epoch": 1.83, + "learning_rate": 2.5647452829455052e-05, + "loss": 0.0058, + "step": 705600 + }, + { + "epoch": 1.83, + "learning_rate": 2.5643564613083587e-05, + "loss": 0.0061, + "step": 705610 + }, + { + "epoch": 1.83, + "learning_rate": 2.563967639671212e-05, + "loss": 0.0055, + "step": 705620 + }, + { + "epoch": 1.83, + "learning_rate": 2.5635788180340656e-05, + "loss": 0.0074, + "step": 705630 + }, + { + "epoch": 1.83, + "learning_rate": 2.5631899963969195e-05, + "loss": 0.0071, + "step": 705640 + }, + { + "epoch": 1.83, + "learning_rate": 2.562801174759773e-05, + "loss": 0.0071, + "step": 705650 + }, + { + "epoch": 1.83, + "learning_rate": 2.5624123531226264e-05, + "loss": 0.0073, + "step": 705660 + }, + { + "epoch": 1.83, + "learning_rate": 2.56202353148548e-05, + "loss": 0.0058, + "step": 705670 + }, + { + "epoch": 1.83, + "learning_rate": 2.561634709848333e-05, + "loss": 0.0102, + "step": 705680 + }, + { + "epoch": 1.83, + "learning_rate": 2.561245888211187e-05, + "loss": 0.0088, + "step": 705690 + }, + { + "epoch": 1.83, + "learning_rate": 2.5608570665740404e-05, + "loss": 0.006, + "step": 705700 + }, + { + "epoch": 1.83, + "learning_rate": 2.560468244936894e-05, + "loss": 0.0096, + "step": 705710 + }, + { + "epoch": 1.83, + "learning_rate": 2.5600794232997474e-05, + "loss": 0.0073, + "step": 705720 + }, + { + "epoch": 1.83, + "learning_rate": 2.5596906016626012e-05, + "loss": 0.0066, + "step": 705730 + }, + { + "epoch": 1.83, + "learning_rate": 2.5593017800254547e-05, + "loss": 0.009, + "step": 705740 + }, + { + "epoch": 1.83, + "learning_rate": 2.558912958388308e-05, + "loss": 0.0096, + "step": 705750 + }, + { + "epoch": 1.83, + "learning_rate": 2.5585241367511616e-05, + "loss": 0.0072, + "step": 705760 + }, + { + "epoch": 1.83, + "learning_rate": 2.5581353151140155e-05, + "loss": 0.0093, + "step": 705770 + }, + { + "epoch": 1.83, + "learning_rate": 2.557746493476869e-05, + "loss": 0.0074, + "step": 705780 + }, + { + "epoch": 1.83, + "learning_rate": 2.5573576718397224e-05, + "loss": 0.0066, + "step": 705790 + }, + { + "epoch": 1.83, + "learning_rate": 2.556968850202576e-05, + "loss": 0.0069, + "step": 705800 + }, + { + "epoch": 1.83, + "learning_rate": 2.556580028565429e-05, + "loss": 0.0078, + "step": 705810 + }, + { + "epoch": 1.83, + "learning_rate": 2.556191206928283e-05, + "loss": 0.0066, + "step": 705820 + }, + { + "epoch": 1.83, + "learning_rate": 2.5558023852911364e-05, + "loss": 0.0083, + "step": 705830 + }, + { + "epoch": 1.83, + "learning_rate": 2.55541356365399e-05, + "loss": 0.007, + "step": 705840 + }, + { + "epoch": 1.83, + "learning_rate": 2.5550247420168434e-05, + "loss": 0.0074, + "step": 705850 + }, + { + "epoch": 1.83, + "learning_rate": 2.5546359203796972e-05, + "loss": 0.0075, + "step": 705860 + }, + { + "epoch": 1.83, + "learning_rate": 2.5542470987425507e-05, + "loss": 0.005, + "step": 705870 + }, + { + "epoch": 1.83, + "learning_rate": 2.553858277105404e-05, + "loss": 0.0063, + "step": 705880 + }, + { + "epoch": 1.83, + "learning_rate": 2.5534694554682576e-05, + "loss": 0.0053, + "step": 705890 + }, + { + "epoch": 1.83, + "learning_rate": 2.5530806338311115e-05, + "loss": 0.0082, + "step": 705900 + }, + { + "epoch": 1.83, + "learning_rate": 2.552691812193965e-05, + "loss": 0.0057, + "step": 705910 + }, + { + "epoch": 1.83, + "learning_rate": 2.5523029905568184e-05, + "loss": 0.007, + "step": 705920 + }, + { + "epoch": 1.83, + "learning_rate": 2.5519141689196716e-05, + "loss": 0.0086, + "step": 705930 + }, + { + "epoch": 1.83, + "learning_rate": 2.551525347282525e-05, + "loss": 0.0081, + "step": 705940 + }, + { + "epoch": 1.83, + "learning_rate": 2.551136525645379e-05, + "loss": 0.012, + "step": 705950 + }, + { + "epoch": 1.83, + "learning_rate": 2.5507477040082324e-05, + "loss": 0.0086, + "step": 705960 + }, + { + "epoch": 1.83, + "learning_rate": 2.550358882371086e-05, + "loss": 0.0089, + "step": 705970 + }, + { + "epoch": 1.83, + "learning_rate": 2.5499700607339394e-05, + "loss": 0.0104, + "step": 705980 + }, + { + "epoch": 1.83, + "learning_rate": 2.5495812390967932e-05, + "loss": 0.0088, + "step": 705990 + }, + { + "epoch": 1.83, + "learning_rate": 2.5491924174596467e-05, + "loss": 0.0094, + "step": 706000 + }, + { + "epoch": 1.83, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.004630614072084427, + "eval_runtime": 107.9819, + "eval_samples_per_second": 18.522, + "eval_steps_per_second": 4.63, + "step": 706000 + }, + { + "epoch": 1.83, + "learning_rate": 2.5488035958225e-05, + "loss": 0.0078, + "step": 706010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5484147741853536e-05, + "loss": 0.0082, + "step": 706020 + }, + { + "epoch": 1.83, + "learning_rate": 2.5480259525482075e-05, + "loss": 0.0075, + "step": 706030 + }, + { + "epoch": 1.83, + "learning_rate": 2.547637130911061e-05, + "loss": 0.006, + "step": 706040 + }, + { + "epoch": 1.83, + "learning_rate": 2.547248309273914e-05, + "loss": 0.0078, + "step": 706050 + }, + { + "epoch": 1.83, + "learning_rate": 2.5468594876367676e-05, + "loss": 0.0101, + "step": 706060 + }, + { + "epoch": 1.83, + "learning_rate": 2.546470665999621e-05, + "loss": 0.0076, + "step": 706070 + }, + { + "epoch": 1.83, + "learning_rate": 2.546081844362475e-05, + "loss": 0.0095, + "step": 706080 + }, + { + "epoch": 1.83, + "learning_rate": 2.5456930227253284e-05, + "loss": 0.0055, + "step": 706090 + }, + { + "epoch": 1.83, + "learning_rate": 2.545304201088182e-05, + "loss": 0.0073, + "step": 706100 + }, + { + "epoch": 1.83, + "learning_rate": 2.5449153794510354e-05, + "loss": 0.006, + "step": 706110 + }, + { + "epoch": 1.83, + "learning_rate": 2.5445265578138892e-05, + "loss": 0.0063, + "step": 706120 + }, + { + "epoch": 1.83, + "learning_rate": 2.5441377361767427e-05, + "loss": 0.0091, + "step": 706130 + }, + { + "epoch": 1.83, + "learning_rate": 2.543748914539596e-05, + "loss": 0.0068, + "step": 706140 + }, + { + "epoch": 1.83, + "learning_rate": 2.5433600929024496e-05, + "loss": 0.0082, + "step": 706150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5429712712653035e-05, + "loss": 0.0066, + "step": 706160 + }, + { + "epoch": 1.83, + "learning_rate": 2.542582449628157e-05, + "loss": 0.007, + "step": 706170 + }, + { + "epoch": 1.83, + "learning_rate": 2.54219362799101e-05, + "loss": 0.0069, + "step": 706180 + }, + { + "epoch": 1.83, + "learning_rate": 2.5418048063538636e-05, + "loss": 0.0087, + "step": 706190 + }, + { + "epoch": 1.83, + "learning_rate": 2.541415984716717e-05, + "loss": 0.0085, + "step": 706200 + }, + { + "epoch": 1.83, + "learning_rate": 2.541027163079571e-05, + "loss": 0.0073, + "step": 706210 + }, + { + "epoch": 1.83, + "learning_rate": 2.5406383414424244e-05, + "loss": 0.0069, + "step": 706220 + }, + { + "epoch": 1.83, + "learning_rate": 2.540249519805278e-05, + "loss": 0.0088, + "step": 706230 + }, + { + "epoch": 1.83, + "learning_rate": 2.5398606981681314e-05, + "loss": 0.0073, + "step": 706240 + }, + { + "epoch": 1.83, + "learning_rate": 2.5394718765309852e-05, + "loss": 0.006, + "step": 706250 + }, + { + "epoch": 1.83, + "learning_rate": 2.5390830548938387e-05, + "loss": 0.0069, + "step": 706260 + }, + { + "epoch": 1.83, + "learning_rate": 2.538694233256692e-05, + "loss": 0.0067, + "step": 706270 + }, + { + "epoch": 1.83, + "learning_rate": 2.5383054116195456e-05, + "loss": 0.0074, + "step": 706280 + }, + { + "epoch": 1.83, + "learning_rate": 2.5379165899823995e-05, + "loss": 0.0076, + "step": 706290 + }, + { + "epoch": 1.83, + "learning_rate": 2.5375277683452526e-05, + "loss": 0.0079, + "step": 706300 + }, + { + "epoch": 1.83, + "learning_rate": 2.537138946708106e-05, + "loss": 0.008, + "step": 706310 + }, + { + "epoch": 1.83, + "learning_rate": 2.5367501250709596e-05, + "loss": 0.0071, + "step": 706320 + }, + { + "epoch": 1.83, + "learning_rate": 2.536361303433813e-05, + "loss": 0.0084, + "step": 706330 + }, + { + "epoch": 1.83, + "learning_rate": 2.535972481796667e-05, + "loss": 0.0076, + "step": 706340 + }, + { + "epoch": 1.83, + "learning_rate": 2.5355836601595204e-05, + "loss": 0.0049, + "step": 706350 + }, + { + "epoch": 1.83, + "learning_rate": 2.535194838522374e-05, + "loss": 0.0073, + "step": 706360 + }, + { + "epoch": 1.83, + "learning_rate": 2.5348060168852274e-05, + "loss": 0.0074, + "step": 706370 + }, + { + "epoch": 1.83, + "learning_rate": 2.5344171952480812e-05, + "loss": 0.0084, + "step": 706380 + }, + { + "epoch": 1.83, + "learning_rate": 2.5340283736109347e-05, + "loss": 0.0091, + "step": 706390 + }, + { + "epoch": 1.83, + "learning_rate": 2.533639551973788e-05, + "loss": 0.0057, + "step": 706400 + }, + { + "epoch": 1.83, + "learning_rate": 2.5332507303366416e-05, + "loss": 0.0063, + "step": 706410 + }, + { + "epoch": 1.83, + "learning_rate": 2.5328619086994955e-05, + "loss": 0.0077, + "step": 706420 + }, + { + "epoch": 1.83, + "learning_rate": 2.5324730870623486e-05, + "loss": 0.0062, + "step": 706430 + }, + { + "epoch": 1.83, + "learning_rate": 2.532084265425202e-05, + "loss": 0.0081, + "step": 706440 + }, + { + "epoch": 1.83, + "learning_rate": 2.5316954437880556e-05, + "loss": 0.0064, + "step": 706450 + }, + { + "epoch": 1.83, + "learning_rate": 2.531306622150909e-05, + "loss": 0.0084, + "step": 706460 + }, + { + "epoch": 1.83, + "learning_rate": 2.530917800513763e-05, + "loss": 0.0096, + "step": 706470 + }, + { + "epoch": 1.83, + "learning_rate": 2.5305289788766164e-05, + "loss": 0.0103, + "step": 706480 + }, + { + "epoch": 1.83, + "learning_rate": 2.53014015723947e-05, + "loss": 0.0051, + "step": 706490 + }, + { + "epoch": 1.83, + "learning_rate": 2.5297513356023233e-05, + "loss": 0.0078, + "step": 706500 + }, + { + "epoch": 1.83, + "learning_rate": 2.529362513965177e-05, + "loss": 0.0063, + "step": 706510 + }, + { + "epoch": 1.83, + "learning_rate": 2.5289736923280307e-05, + "loss": 0.0104, + "step": 706520 + }, + { + "epoch": 1.83, + "learning_rate": 2.528584870690884e-05, + "loss": 0.0066, + "step": 706530 + }, + { + "epoch": 1.83, + "learning_rate": 2.5281960490537376e-05, + "loss": 0.0063, + "step": 706540 + }, + { + "epoch": 1.83, + "learning_rate": 2.5278072274165908e-05, + "loss": 0.0101, + "step": 706550 + }, + { + "epoch": 1.83, + "learning_rate": 2.5274184057794443e-05, + "loss": 0.0101, + "step": 706560 + }, + { + "epoch": 1.83, + "learning_rate": 2.527029584142298e-05, + "loss": 0.0059, + "step": 706570 + }, + { + "epoch": 1.83, + "learning_rate": 2.5266407625051516e-05, + "loss": 0.0083, + "step": 706580 + }, + { + "epoch": 1.83, + "learning_rate": 2.526251940868005e-05, + "loss": 0.0076, + "step": 706590 + }, + { + "epoch": 1.83, + "learning_rate": 2.5258631192308585e-05, + "loss": 0.0076, + "step": 706600 + }, + { + "epoch": 1.83, + "learning_rate": 2.5254742975937124e-05, + "loss": 0.0079, + "step": 706610 + }, + { + "epoch": 1.83, + "learning_rate": 2.525085475956566e-05, + "loss": 0.0111, + "step": 706620 + }, + { + "epoch": 1.83, + "learning_rate": 2.5246966543194193e-05, + "loss": 0.007, + "step": 706630 + }, + { + "epoch": 1.83, + "learning_rate": 2.524307832682273e-05, + "loss": 0.0052, + "step": 706640 + }, + { + "epoch": 1.83, + "learning_rate": 2.5239190110451267e-05, + "loss": 0.0087, + "step": 706650 + }, + { + "epoch": 1.83, + "learning_rate": 2.52353018940798e-05, + "loss": 0.0065, + "step": 706660 + }, + { + "epoch": 1.83, + "learning_rate": 2.5231413677708333e-05, + "loss": 0.0095, + "step": 706670 + }, + { + "epoch": 1.83, + "learning_rate": 2.5227525461336868e-05, + "loss": 0.0052, + "step": 706680 + }, + { + "epoch": 1.83, + "learning_rate": 2.5223637244965403e-05, + "loss": 0.0087, + "step": 706690 + }, + { + "epoch": 1.83, + "learning_rate": 2.521974902859394e-05, + "loss": 0.0066, + "step": 706700 + }, + { + "epoch": 1.83, + "learning_rate": 2.5215860812222476e-05, + "loss": 0.0076, + "step": 706710 + }, + { + "epoch": 1.83, + "learning_rate": 2.521197259585101e-05, + "loss": 0.0085, + "step": 706720 + }, + { + "epoch": 1.83, + "learning_rate": 2.5208084379479545e-05, + "loss": 0.0071, + "step": 706730 + }, + { + "epoch": 1.83, + "learning_rate": 2.5204196163108084e-05, + "loss": 0.0081, + "step": 706740 + }, + { + "epoch": 1.83, + "learning_rate": 2.520030794673662e-05, + "loss": 0.0093, + "step": 706750 + }, + { + "epoch": 1.83, + "learning_rate": 2.5196419730365153e-05, + "loss": 0.0071, + "step": 706760 + }, + { + "epoch": 1.83, + "learning_rate": 2.5192531513993688e-05, + "loss": 0.0058, + "step": 706770 + }, + { + "epoch": 1.83, + "learning_rate": 2.5188643297622227e-05, + "loss": 0.0072, + "step": 706780 + }, + { + "epoch": 1.83, + "learning_rate": 2.518475508125076e-05, + "loss": 0.0081, + "step": 706790 + }, + { + "epoch": 1.83, + "learning_rate": 2.5180866864879293e-05, + "loss": 0.008, + "step": 706800 + }, + { + "epoch": 1.83, + "learning_rate": 2.5176978648507828e-05, + "loss": 0.0082, + "step": 706810 + }, + { + "epoch": 1.83, + "learning_rate": 2.5173090432136363e-05, + "loss": 0.0092, + "step": 706820 + }, + { + "epoch": 1.83, + "learning_rate": 2.51692022157649e-05, + "loss": 0.0094, + "step": 706830 + }, + { + "epoch": 1.83, + "learning_rate": 2.5165313999393436e-05, + "loss": 0.0109, + "step": 706840 + }, + { + "epoch": 1.83, + "learning_rate": 2.516142578302197e-05, + "loss": 0.0073, + "step": 706850 + }, + { + "epoch": 1.83, + "learning_rate": 2.5157537566650505e-05, + "loss": 0.0076, + "step": 706860 + }, + { + "epoch": 1.83, + "learning_rate": 2.5153649350279044e-05, + "loss": 0.0074, + "step": 706870 + }, + { + "epoch": 1.83, + "learning_rate": 2.514976113390758e-05, + "loss": 0.0077, + "step": 706880 + }, + { + "epoch": 1.83, + "learning_rate": 2.5145872917536113e-05, + "loss": 0.0092, + "step": 706890 + }, + { + "epoch": 1.83, + "learning_rate": 2.5141984701164648e-05, + "loss": 0.0078, + "step": 706900 + }, + { + "epoch": 1.83, + "learning_rate": 2.5138096484793187e-05, + "loss": 0.0076, + "step": 706910 + }, + { + "epoch": 1.83, + "learning_rate": 2.5134208268421718e-05, + "loss": 0.0058, + "step": 706920 + }, + { + "epoch": 1.83, + "learning_rate": 2.5130320052050253e-05, + "loss": 0.0102, + "step": 706930 + }, + { + "epoch": 1.83, + "learning_rate": 2.5126431835678788e-05, + "loss": 0.0076, + "step": 706940 + }, + { + "epoch": 1.83, + "learning_rate": 2.5122543619307323e-05, + "loss": 0.0066, + "step": 706950 + }, + { + "epoch": 1.83, + "learning_rate": 2.511865540293586e-05, + "loss": 0.0075, + "step": 706960 + }, + { + "epoch": 1.83, + "learning_rate": 2.5114767186564396e-05, + "loss": 0.0076, + "step": 706970 + }, + { + "epoch": 1.83, + "learning_rate": 2.511087897019293e-05, + "loss": 0.0057, + "step": 706980 + }, + { + "epoch": 1.83, + "learning_rate": 2.5106990753821465e-05, + "loss": 0.0085, + "step": 706990 + }, + { + "epoch": 1.83, + "learning_rate": 2.5103102537450004e-05, + "loss": 0.0058, + "step": 707000 + }, + { + "epoch": 1.83, + "eval_cer": 0.8816550986674057, + "eval_loss": 0.004591579083353281, + "eval_runtime": 107.8494, + "eval_samples_per_second": 18.544, + "eval_steps_per_second": 4.636, + "step": 707000 + }, + { + "epoch": 1.83, + "learning_rate": 2.509921432107854e-05, + "loss": 0.0054, + "step": 707010 + }, + { + "epoch": 1.83, + "learning_rate": 2.5095326104707073e-05, + "loss": 0.0088, + "step": 707020 + }, + { + "epoch": 1.83, + "learning_rate": 2.5091437888335608e-05, + "loss": 0.0108, + "step": 707030 + }, + { + "epoch": 1.83, + "learning_rate": 2.5087549671964146e-05, + "loss": 0.0101, + "step": 707040 + }, + { + "epoch": 1.83, + "learning_rate": 2.5083661455592678e-05, + "loss": 0.0072, + "step": 707050 + }, + { + "epoch": 1.83, + "learning_rate": 2.5079773239221213e-05, + "loss": 0.0097, + "step": 707060 + }, + { + "epoch": 1.83, + "learning_rate": 2.5075885022849748e-05, + "loss": 0.0118, + "step": 707070 + }, + { + "epoch": 1.83, + "learning_rate": 2.5071996806478283e-05, + "loss": 0.0074, + "step": 707080 + }, + { + "epoch": 1.83, + "learning_rate": 2.506810859010682e-05, + "loss": 0.0073, + "step": 707090 + }, + { + "epoch": 1.83, + "learning_rate": 2.5064220373735356e-05, + "loss": 0.0073, + "step": 707100 + }, + { + "epoch": 1.83, + "learning_rate": 2.506033215736389e-05, + "loss": 0.0096, + "step": 707110 + }, + { + "epoch": 1.83, + "learning_rate": 2.5056443940992425e-05, + "loss": 0.0066, + "step": 707120 + }, + { + "epoch": 1.83, + "learning_rate": 2.5052555724620964e-05, + "loss": 0.0086, + "step": 707130 + }, + { + "epoch": 1.83, + "learning_rate": 2.50486675082495e-05, + "loss": 0.0085, + "step": 707140 + }, + { + "epoch": 1.83, + "learning_rate": 2.5044779291878033e-05, + "loss": 0.0048, + "step": 707150 + }, + { + "epoch": 1.83, + "learning_rate": 2.5040891075506568e-05, + "loss": 0.0074, + "step": 707160 + }, + { + "epoch": 1.83, + "learning_rate": 2.50370028591351e-05, + "loss": 0.0083, + "step": 707170 + }, + { + "epoch": 1.83, + "learning_rate": 2.5033114642763638e-05, + "loss": 0.0091, + "step": 707180 + }, + { + "epoch": 1.83, + "learning_rate": 2.5029226426392173e-05, + "loss": 0.0065, + "step": 707190 + }, + { + "epoch": 1.83, + "learning_rate": 2.5025338210020708e-05, + "loss": 0.0062, + "step": 707200 + }, + { + "epoch": 1.83, + "learning_rate": 2.5021449993649243e-05, + "loss": 0.0062, + "step": 707210 + }, + { + "epoch": 1.83, + "learning_rate": 2.501756177727778e-05, + "loss": 0.0069, + "step": 707220 + }, + { + "epoch": 1.83, + "learning_rate": 2.5013673560906316e-05, + "loss": 0.0064, + "step": 707230 + }, + { + "epoch": 1.83, + "learning_rate": 2.500978534453485e-05, + "loss": 0.0069, + "step": 707240 + }, + { + "epoch": 1.83, + "learning_rate": 2.5005897128163385e-05, + "loss": 0.0065, + "step": 707250 + }, + { + "epoch": 1.83, + "learning_rate": 2.5002008911791924e-05, + "loss": 0.0062, + "step": 707260 + }, + { + "epoch": 1.83, + "learning_rate": 2.499812069542046e-05, + "loss": 0.0078, + "step": 707270 + }, + { + "epoch": 1.83, + "learning_rate": 2.4994232479048993e-05, + "loss": 0.0056, + "step": 707280 + }, + { + "epoch": 1.83, + "learning_rate": 2.4990344262677525e-05, + "loss": 0.0058, + "step": 707290 + }, + { + "epoch": 1.83, + "learning_rate": 2.498645604630606e-05, + "loss": 0.0158, + "step": 707300 + }, + { + "epoch": 1.83, + "learning_rate": 2.4982567829934598e-05, + "loss": 0.0076, + "step": 707310 + }, + { + "epoch": 1.83, + "learning_rate": 2.4978679613563133e-05, + "loss": 0.0054, + "step": 707320 + }, + { + "epoch": 1.83, + "learning_rate": 2.4974791397191668e-05, + "loss": 0.0083, + "step": 707330 + }, + { + "epoch": 1.83, + "learning_rate": 2.4970903180820203e-05, + "loss": 0.0066, + "step": 707340 + }, + { + "epoch": 1.83, + "learning_rate": 2.496701496444874e-05, + "loss": 0.0097, + "step": 707350 + }, + { + "epoch": 1.83, + "learning_rate": 2.4963126748077276e-05, + "loss": 0.006, + "step": 707360 + }, + { + "epoch": 1.83, + "learning_rate": 2.495923853170581e-05, + "loss": 0.0061, + "step": 707370 + }, + { + "epoch": 1.83, + "learning_rate": 2.4955350315334345e-05, + "loss": 0.0075, + "step": 707380 + }, + { + "epoch": 1.83, + "learning_rate": 2.4951462098962884e-05, + "loss": 0.0065, + "step": 707390 + }, + { + "epoch": 1.83, + "learning_rate": 2.494757388259142e-05, + "loss": 0.0064, + "step": 707400 + }, + { + "epoch": 1.83, + "learning_rate": 2.4943685666219953e-05, + "loss": 0.0103, + "step": 707410 + }, + { + "epoch": 1.83, + "learning_rate": 2.4939797449848485e-05, + "loss": 0.0057, + "step": 707420 + }, + { + "epoch": 1.83, + "learning_rate": 2.493590923347702e-05, + "loss": 0.0086, + "step": 707430 + }, + { + "epoch": 1.83, + "learning_rate": 2.4932021017105558e-05, + "loss": 0.0107, + "step": 707440 + }, + { + "epoch": 1.83, + "learning_rate": 2.4928132800734093e-05, + "loss": 0.0054, + "step": 707450 + }, + { + "epoch": 1.83, + "learning_rate": 2.4924244584362628e-05, + "loss": 0.0059, + "step": 707460 + }, + { + "epoch": 1.83, + "learning_rate": 2.4920356367991162e-05, + "loss": 0.0076, + "step": 707470 + }, + { + "epoch": 1.83, + "learning_rate": 2.49164681516197e-05, + "loss": 0.0096, + "step": 707480 + }, + { + "epoch": 1.83, + "learning_rate": 2.4912579935248236e-05, + "loss": 0.0093, + "step": 707490 + }, + { + "epoch": 1.83, + "learning_rate": 2.490869171887677e-05, + "loss": 0.0073, + "step": 707500 + }, + { + "epoch": 1.83, + "learning_rate": 2.4904803502505305e-05, + "loss": 0.0077, + "step": 707510 + }, + { + "epoch": 1.83, + "learning_rate": 2.4900915286133844e-05, + "loss": 0.0082, + "step": 707520 + }, + { + "epoch": 1.83, + "learning_rate": 2.489702706976238e-05, + "loss": 0.0093, + "step": 707530 + }, + { + "epoch": 1.83, + "learning_rate": 2.489313885339091e-05, + "loss": 0.0063, + "step": 707540 + }, + { + "epoch": 1.83, + "learning_rate": 2.4889250637019445e-05, + "loss": 0.009, + "step": 707550 + }, + { + "epoch": 1.83, + "learning_rate": 2.488536242064798e-05, + "loss": 0.0057, + "step": 707560 + }, + { + "epoch": 1.83, + "learning_rate": 2.4881474204276518e-05, + "loss": 0.0083, + "step": 707570 + }, + { + "epoch": 1.83, + "learning_rate": 2.4877585987905053e-05, + "loss": 0.0084, + "step": 707580 + }, + { + "epoch": 1.83, + "learning_rate": 2.4873697771533588e-05, + "loss": 0.008, + "step": 707590 + }, + { + "epoch": 1.83, + "learning_rate": 2.4869809555162122e-05, + "loss": 0.0077, + "step": 707600 + }, + { + "epoch": 1.83, + "learning_rate": 2.486592133879066e-05, + "loss": 0.0101, + "step": 707610 + }, + { + "epoch": 1.83, + "learning_rate": 2.4862033122419196e-05, + "loss": 0.0066, + "step": 707620 + }, + { + "epoch": 1.83, + "learning_rate": 2.485814490604773e-05, + "loss": 0.0079, + "step": 707630 + }, + { + "epoch": 1.83, + "learning_rate": 2.4854256689676265e-05, + "loss": 0.0065, + "step": 707640 + }, + { + "epoch": 1.83, + "learning_rate": 2.4850368473304804e-05, + "loss": 0.0079, + "step": 707650 + }, + { + "epoch": 1.83, + "learning_rate": 2.484648025693334e-05, + "loss": 0.0055, + "step": 707660 + }, + { + "epoch": 1.83, + "learning_rate": 2.484259204056187e-05, + "loss": 0.0064, + "step": 707670 + }, + { + "epoch": 1.83, + "learning_rate": 2.4838703824190405e-05, + "loss": 0.0049, + "step": 707680 + }, + { + "epoch": 1.83, + "learning_rate": 2.483481560781894e-05, + "loss": 0.0079, + "step": 707690 + }, + { + "epoch": 1.83, + "learning_rate": 2.4830927391447478e-05, + "loss": 0.0067, + "step": 707700 + }, + { + "epoch": 1.83, + "learning_rate": 2.4827039175076013e-05, + "loss": 0.0103, + "step": 707710 + }, + { + "epoch": 1.83, + "learning_rate": 2.4823150958704548e-05, + "loss": 0.008, + "step": 707720 + }, + { + "epoch": 1.83, + "learning_rate": 2.4819262742333082e-05, + "loss": 0.0057, + "step": 707730 + }, + { + "epoch": 1.83, + "learning_rate": 2.481537452596162e-05, + "loss": 0.0069, + "step": 707740 + }, + { + "epoch": 1.83, + "learning_rate": 2.4811486309590156e-05, + "loss": 0.0075, + "step": 707750 + }, + { + "epoch": 1.83, + "learning_rate": 2.480759809321869e-05, + "loss": 0.0068, + "step": 707760 + }, + { + "epoch": 1.83, + "learning_rate": 2.4803709876847225e-05, + "loss": 0.0086, + "step": 707770 + }, + { + "epoch": 1.83, + "learning_rate": 2.4799821660475764e-05, + "loss": 0.0068, + "step": 707780 + }, + { + "epoch": 1.83, + "learning_rate": 2.4795933444104295e-05, + "loss": 0.0076, + "step": 707790 + }, + { + "epoch": 1.83, + "learning_rate": 2.479204522773283e-05, + "loss": 0.0045, + "step": 707800 + }, + { + "epoch": 1.83, + "learning_rate": 2.4788157011361365e-05, + "loss": 0.0075, + "step": 707810 + }, + { + "epoch": 1.83, + "learning_rate": 2.47842687949899e-05, + "loss": 0.0133, + "step": 707820 + }, + { + "epoch": 1.83, + "learning_rate": 2.4780380578618438e-05, + "loss": 0.006, + "step": 707830 + }, + { + "epoch": 1.83, + "learning_rate": 2.4776492362246973e-05, + "loss": 0.0073, + "step": 707840 + }, + { + "epoch": 1.83, + "learning_rate": 2.4772604145875508e-05, + "loss": 0.0065, + "step": 707850 + }, + { + "epoch": 1.83, + "learning_rate": 2.4768715929504042e-05, + "loss": 0.0088, + "step": 707860 + }, + { + "epoch": 1.83, + "learning_rate": 2.476482771313258e-05, + "loss": 0.0052, + "step": 707870 + }, + { + "epoch": 1.83, + "learning_rate": 2.4760939496761116e-05, + "loss": 0.0073, + "step": 707880 + }, + { + "epoch": 1.83, + "learning_rate": 2.475705128038965e-05, + "loss": 0.0097, + "step": 707890 + }, + { + "epoch": 1.83, + "learning_rate": 2.4753163064018185e-05, + "loss": 0.0073, + "step": 707900 + }, + { + "epoch": 1.84, + "learning_rate": 2.474927484764672e-05, + "loss": 0.0059, + "step": 707910 + }, + { + "epoch": 1.84, + "learning_rate": 2.4745386631275255e-05, + "loss": 0.0068, + "step": 707920 + }, + { + "epoch": 1.84, + "learning_rate": 2.474149841490379e-05, + "loss": 0.0071, + "step": 707930 + }, + { + "epoch": 1.84, + "learning_rate": 2.4737610198532325e-05, + "loss": 0.0078, + "step": 707940 + }, + { + "epoch": 1.84, + "learning_rate": 2.473372198216086e-05, + "loss": 0.0076, + "step": 707950 + }, + { + "epoch": 1.84, + "learning_rate": 2.4729833765789394e-05, + "loss": 0.0059, + "step": 707960 + }, + { + "epoch": 1.84, + "learning_rate": 2.4725945549417933e-05, + "loss": 0.0078, + "step": 707970 + }, + { + "epoch": 1.84, + "learning_rate": 2.4722057333046468e-05, + "loss": 0.0057, + "step": 707980 + }, + { + "epoch": 1.84, + "learning_rate": 2.4718169116675002e-05, + "loss": 0.0065, + "step": 707990 + }, + { + "epoch": 1.84, + "learning_rate": 2.4714280900303537e-05, + "loss": 0.006, + "step": 708000 + }, + { + "epoch": 1.84, + "eval_cer": 0.8816481004827348, + "eval_loss": 0.004648663103580475, + "eval_runtime": 107.9525, + "eval_samples_per_second": 18.527, + "eval_steps_per_second": 4.632, + "step": 708000 + }, + { + "epoch": 1.84, + "learning_rate": 2.4710392683932075e-05, + "loss": 0.0102, + "step": 708010 + }, + { + "epoch": 1.84, + "learning_rate": 2.470650446756061e-05, + "loss": 0.0075, + "step": 708020 + }, + { + "epoch": 1.84, + "learning_rate": 2.4702616251189145e-05, + "loss": 0.0065, + "step": 708030 + }, + { + "epoch": 1.84, + "learning_rate": 2.4698728034817677e-05, + "loss": 0.0081, + "step": 708040 + }, + { + "epoch": 1.84, + "learning_rate": 2.469483981844621e-05, + "loss": 0.0119, + "step": 708050 + }, + { + "epoch": 1.84, + "learning_rate": 2.469095160207475e-05, + "loss": 0.0081, + "step": 708060 + }, + { + "epoch": 1.84, + "learning_rate": 2.4687063385703285e-05, + "loss": 0.0094, + "step": 708070 + }, + { + "epoch": 1.84, + "learning_rate": 2.468317516933182e-05, + "loss": 0.0059, + "step": 708080 + }, + { + "epoch": 1.84, + "learning_rate": 2.4679286952960354e-05, + "loss": 0.0077, + "step": 708090 + }, + { + "epoch": 1.84, + "learning_rate": 2.4675398736588893e-05, + "loss": 0.0076, + "step": 708100 + }, + { + "epoch": 1.84, + "learning_rate": 2.4671510520217427e-05, + "loss": 0.0071, + "step": 708110 + }, + { + "epoch": 1.84, + "learning_rate": 2.4667622303845962e-05, + "loss": 0.0079, + "step": 708120 + }, + { + "epoch": 1.84, + "learning_rate": 2.4663734087474497e-05, + "loss": 0.0087, + "step": 708130 + }, + { + "epoch": 1.84, + "learning_rate": 2.4659845871103035e-05, + "loss": 0.0071, + "step": 708140 + }, + { + "epoch": 1.84, + "learning_rate": 2.465595765473157e-05, + "loss": 0.0067, + "step": 708150 + }, + { + "epoch": 1.84, + "learning_rate": 2.4652069438360102e-05, + "loss": 0.0078, + "step": 708160 + }, + { + "epoch": 1.84, + "learning_rate": 2.4648181221988637e-05, + "loss": 0.006, + "step": 708170 + }, + { + "epoch": 1.84, + "learning_rate": 2.464429300561717e-05, + "loss": 0.0093, + "step": 708180 + }, + { + "epoch": 1.84, + "learning_rate": 2.464040478924571e-05, + "loss": 0.0072, + "step": 708190 + }, + { + "epoch": 1.84, + "learning_rate": 2.4636516572874245e-05, + "loss": 0.0109, + "step": 708200 + }, + { + "epoch": 1.84, + "learning_rate": 2.463262835650278e-05, + "loss": 0.0057, + "step": 708210 + }, + { + "epoch": 1.84, + "learning_rate": 2.4628740140131314e-05, + "loss": 0.0069, + "step": 708220 + }, + { + "epoch": 1.84, + "learning_rate": 2.4624851923759853e-05, + "loss": 0.0073, + "step": 708230 + }, + { + "epoch": 1.84, + "learning_rate": 2.4620963707388387e-05, + "loss": 0.0113, + "step": 708240 + }, + { + "epoch": 1.84, + "learning_rate": 2.4617075491016922e-05, + "loss": 0.008, + "step": 708250 + }, + { + "epoch": 1.84, + "learning_rate": 2.4613187274645457e-05, + "loss": 0.0081, + "step": 708260 + }, + { + "epoch": 1.84, + "learning_rate": 2.4609299058273995e-05, + "loss": 0.0063, + "step": 708270 + }, + { + "epoch": 1.84, + "learning_rate": 2.460541084190253e-05, + "loss": 0.0056, + "step": 708280 + }, + { + "epoch": 1.84, + "learning_rate": 2.4601522625531062e-05, + "loss": 0.0091, + "step": 708290 + }, + { + "epoch": 1.84, + "learning_rate": 2.4597634409159597e-05, + "loss": 0.0099, + "step": 708300 + }, + { + "epoch": 1.84, + "learning_rate": 2.459374619278813e-05, + "loss": 0.0071, + "step": 708310 + }, + { + "epoch": 1.84, + "learning_rate": 2.458985797641667e-05, + "loss": 0.0067, + "step": 708320 + }, + { + "epoch": 1.84, + "learning_rate": 2.4585969760045205e-05, + "loss": 0.0076, + "step": 708330 + }, + { + "epoch": 1.84, + "learning_rate": 2.458208154367374e-05, + "loss": 0.0096, + "step": 708340 + }, + { + "epoch": 1.84, + "learning_rate": 2.4578193327302274e-05, + "loss": 0.0058, + "step": 708350 + }, + { + "epoch": 1.84, + "learning_rate": 2.4574305110930813e-05, + "loss": 0.0073, + "step": 708360 + }, + { + "epoch": 1.84, + "learning_rate": 2.4570416894559347e-05, + "loss": 0.0124, + "step": 708370 + }, + { + "epoch": 1.84, + "learning_rate": 2.4566528678187882e-05, + "loss": 0.0061, + "step": 708380 + }, + { + "epoch": 1.84, + "learning_rate": 2.4562640461816417e-05, + "loss": 0.0099, + "step": 708390 + }, + { + "epoch": 1.84, + "learning_rate": 2.4558752245444955e-05, + "loss": 0.007, + "step": 708400 + }, + { + "epoch": 1.84, + "learning_rate": 2.4554864029073487e-05, + "loss": 0.0063, + "step": 708410 + }, + { + "epoch": 1.84, + "learning_rate": 2.4550975812702022e-05, + "loss": 0.0082, + "step": 708420 + }, + { + "epoch": 1.84, + "learning_rate": 2.4547087596330557e-05, + "loss": 0.0063, + "step": 708430 + }, + { + "epoch": 1.84, + "learning_rate": 2.454319937995909e-05, + "loss": 0.0062, + "step": 708440 + }, + { + "epoch": 1.84, + "learning_rate": 2.453931116358763e-05, + "loss": 0.0077, + "step": 708450 + }, + { + "epoch": 1.84, + "learning_rate": 2.4535422947216165e-05, + "loss": 0.0056, + "step": 708460 + }, + { + "epoch": 1.84, + "learning_rate": 2.45315347308447e-05, + "loss": 0.0093, + "step": 708470 + }, + { + "epoch": 1.84, + "learning_rate": 2.4527646514473234e-05, + "loss": 0.0095, + "step": 708480 + }, + { + "epoch": 1.84, + "learning_rate": 2.4523758298101773e-05, + "loss": 0.0092, + "step": 708490 + }, + { + "epoch": 1.84, + "learning_rate": 2.4519870081730307e-05, + "loss": 0.0082, + "step": 708500 + }, + { + "epoch": 1.84, + "learning_rate": 2.4515981865358842e-05, + "loss": 0.0111, + "step": 708510 + }, + { + "epoch": 1.84, + "learning_rate": 2.4512093648987377e-05, + "loss": 0.0052, + "step": 708520 + }, + { + "epoch": 1.84, + "learning_rate": 2.4508205432615915e-05, + "loss": 0.0065, + "step": 708530 + }, + { + "epoch": 1.84, + "learning_rate": 2.4504317216244447e-05, + "loss": 0.008, + "step": 708540 + }, + { + "epoch": 1.84, + "learning_rate": 2.4500428999872982e-05, + "loss": 0.0049, + "step": 708550 + }, + { + "epoch": 1.84, + "learning_rate": 2.4496540783501517e-05, + "loss": 0.0051, + "step": 708560 + }, + { + "epoch": 1.84, + "learning_rate": 2.449265256713005e-05, + "loss": 0.0074, + "step": 708570 + }, + { + "epoch": 1.84, + "learning_rate": 2.448876435075859e-05, + "loss": 0.008, + "step": 708580 + }, + { + "epoch": 1.84, + "learning_rate": 2.4484876134387125e-05, + "loss": 0.0095, + "step": 708590 + }, + { + "epoch": 1.84, + "learning_rate": 2.448098791801566e-05, + "loss": 0.0069, + "step": 708600 + }, + { + "epoch": 1.84, + "learning_rate": 2.4477099701644194e-05, + "loss": 0.0065, + "step": 708610 + }, + { + "epoch": 1.84, + "learning_rate": 2.4473211485272733e-05, + "loss": 0.0065, + "step": 708620 + }, + { + "epoch": 1.84, + "learning_rate": 2.4469323268901267e-05, + "loss": 0.0088, + "step": 708630 + }, + { + "epoch": 1.84, + "learning_rate": 2.4465435052529802e-05, + "loss": 0.009, + "step": 708640 + }, + { + "epoch": 1.84, + "learning_rate": 2.4461546836158337e-05, + "loss": 0.0111, + "step": 708650 + }, + { + "epoch": 1.84, + "learning_rate": 2.445765861978687e-05, + "loss": 0.0119, + "step": 708660 + }, + { + "epoch": 1.84, + "learning_rate": 2.4453770403415407e-05, + "loss": 0.0057, + "step": 708670 + }, + { + "epoch": 1.84, + "learning_rate": 2.4449882187043942e-05, + "loss": 0.0055, + "step": 708680 + }, + { + "epoch": 1.84, + "learning_rate": 2.4445993970672477e-05, + "loss": 0.007, + "step": 708690 + }, + { + "epoch": 1.84, + "learning_rate": 2.444210575430101e-05, + "loss": 0.007, + "step": 708700 + }, + { + "epoch": 1.84, + "learning_rate": 2.443821753792955e-05, + "loss": 0.0094, + "step": 708710 + }, + { + "epoch": 1.84, + "learning_rate": 2.4434329321558085e-05, + "loss": 0.0077, + "step": 708720 + }, + { + "epoch": 1.84, + "learning_rate": 2.443044110518662e-05, + "loss": 0.0096, + "step": 708730 + }, + { + "epoch": 1.84, + "learning_rate": 2.4426552888815154e-05, + "loss": 0.0103, + "step": 708740 + }, + { + "epoch": 1.84, + "learning_rate": 2.4422664672443693e-05, + "loss": 0.0072, + "step": 708750 + }, + { + "epoch": 1.84, + "learning_rate": 2.4418776456072227e-05, + "loss": 0.0092, + "step": 708760 + }, + { + "epoch": 1.84, + "learning_rate": 2.4414888239700762e-05, + "loss": 0.0064, + "step": 708770 + }, + { + "epoch": 1.84, + "learning_rate": 2.4411000023329294e-05, + "loss": 0.0094, + "step": 708780 + }, + { + "epoch": 1.84, + "learning_rate": 2.440711180695783e-05, + "loss": 0.0073, + "step": 708790 + }, + { + "epoch": 1.84, + "learning_rate": 2.4403223590586367e-05, + "loss": 0.0075, + "step": 708800 + }, + { + "epoch": 1.84, + "learning_rate": 2.43993353742149e-05, + "loss": 0.0098, + "step": 708810 + }, + { + "epoch": 1.84, + "learning_rate": 2.4395447157843437e-05, + "loss": 0.0064, + "step": 708820 + }, + { + "epoch": 1.84, + "learning_rate": 2.439155894147197e-05, + "loss": 0.0078, + "step": 708830 + }, + { + "epoch": 1.84, + "learning_rate": 2.438767072510051e-05, + "loss": 0.0078, + "step": 708840 + }, + { + "epoch": 1.84, + "learning_rate": 2.4383782508729045e-05, + "loss": 0.0089, + "step": 708850 + }, + { + "epoch": 1.84, + "learning_rate": 2.437989429235758e-05, + "loss": 0.0085, + "step": 708860 + }, + { + "epoch": 1.84, + "learning_rate": 2.4376006075986114e-05, + "loss": 0.0067, + "step": 708870 + }, + { + "epoch": 1.84, + "learning_rate": 2.4372117859614652e-05, + "loss": 0.0072, + "step": 708880 + }, + { + "epoch": 1.84, + "learning_rate": 2.4368229643243187e-05, + "loss": 0.0078, + "step": 708890 + }, + { + "epoch": 1.84, + "learning_rate": 2.4364341426871722e-05, + "loss": 0.0068, + "step": 708900 + }, + { + "epoch": 1.84, + "learning_rate": 2.4360453210500254e-05, + "loss": 0.0056, + "step": 708910 + }, + { + "epoch": 1.84, + "learning_rate": 2.435656499412879e-05, + "loss": 0.0065, + "step": 708920 + }, + { + "epoch": 1.84, + "learning_rate": 2.4352676777757327e-05, + "loss": 0.0072, + "step": 708930 + }, + { + "epoch": 1.84, + "learning_rate": 2.434878856138586e-05, + "loss": 0.0078, + "step": 708940 + }, + { + "epoch": 1.84, + "learning_rate": 2.4344900345014397e-05, + "loss": 0.0071, + "step": 708950 + }, + { + "epoch": 1.84, + "learning_rate": 2.434101212864293e-05, + "loss": 0.0084, + "step": 708960 + }, + { + "epoch": 1.84, + "learning_rate": 2.433712391227147e-05, + "loss": 0.0058, + "step": 708970 + }, + { + "epoch": 1.84, + "learning_rate": 2.4333235695900004e-05, + "loss": 0.0086, + "step": 708980 + }, + { + "epoch": 1.84, + "learning_rate": 2.432934747952854e-05, + "loss": 0.0066, + "step": 708990 + }, + { + "epoch": 1.84, + "learning_rate": 2.4325459263157074e-05, + "loss": 0.007, + "step": 709000 + }, + { + "epoch": 1.84, + "eval_cer": 0.8816355037503272, + "eval_loss": 0.004716834053397179, + "eval_runtime": 107.9456, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 709000 + }, + { + "epoch": 1.84, + "learning_rate": 2.4321571046785612e-05, + "loss": 0.0075, + "step": 709010 + }, + { + "epoch": 1.84, + "learning_rate": 2.4317682830414147e-05, + "loss": 0.0085, + "step": 709020 + }, + { + "epoch": 1.84, + "learning_rate": 2.431379461404268e-05, + "loss": 0.0058, + "step": 709030 + }, + { + "epoch": 1.84, + "learning_rate": 2.4309906397671214e-05, + "loss": 0.0119, + "step": 709040 + }, + { + "epoch": 1.84, + "learning_rate": 2.430601818129975e-05, + "loss": 0.0096, + "step": 709050 + }, + { + "epoch": 1.84, + "learning_rate": 2.4302129964928287e-05, + "loss": 0.0083, + "step": 709060 + }, + { + "epoch": 1.84, + "learning_rate": 2.429824174855682e-05, + "loss": 0.0077, + "step": 709070 + }, + { + "epoch": 1.84, + "learning_rate": 2.4294353532185356e-05, + "loss": 0.0098, + "step": 709080 + }, + { + "epoch": 1.84, + "learning_rate": 2.429046531581389e-05, + "loss": 0.0116, + "step": 709090 + }, + { + "epoch": 1.84, + "learning_rate": 2.428657709944243e-05, + "loss": 0.0071, + "step": 709100 + }, + { + "epoch": 1.84, + "learning_rate": 2.4282688883070964e-05, + "loss": 0.0062, + "step": 709110 + }, + { + "epoch": 1.84, + "learning_rate": 2.42788006666995e-05, + "loss": 0.0084, + "step": 709120 + }, + { + "epoch": 1.84, + "learning_rate": 2.4274912450328034e-05, + "loss": 0.0078, + "step": 709130 + }, + { + "epoch": 1.84, + "learning_rate": 2.4271024233956572e-05, + "loss": 0.0075, + "step": 709140 + }, + { + "epoch": 1.84, + "learning_rate": 2.4267136017585107e-05, + "loss": 0.0065, + "step": 709150 + }, + { + "epoch": 1.84, + "learning_rate": 2.426324780121364e-05, + "loss": 0.0105, + "step": 709160 + }, + { + "epoch": 1.84, + "learning_rate": 2.4259359584842174e-05, + "loss": 0.0083, + "step": 709170 + }, + { + "epoch": 1.84, + "learning_rate": 2.425547136847071e-05, + "loss": 0.007, + "step": 709180 + }, + { + "epoch": 1.84, + "learning_rate": 2.4251583152099247e-05, + "loss": 0.0081, + "step": 709190 + }, + { + "epoch": 1.84, + "learning_rate": 2.424769493572778e-05, + "loss": 0.0057, + "step": 709200 + }, + { + "epoch": 1.84, + "learning_rate": 2.4243806719356316e-05, + "loss": 0.0078, + "step": 709210 + }, + { + "epoch": 1.84, + "learning_rate": 2.423991850298485e-05, + "loss": 0.0061, + "step": 709220 + }, + { + "epoch": 1.84, + "learning_rate": 2.423603028661339e-05, + "loss": 0.0062, + "step": 709230 + }, + { + "epoch": 1.84, + "learning_rate": 2.4232142070241924e-05, + "loss": 0.008, + "step": 709240 + }, + { + "epoch": 1.84, + "learning_rate": 2.422825385387046e-05, + "loss": 0.007, + "step": 709250 + }, + { + "epoch": 1.84, + "learning_rate": 2.4224365637498994e-05, + "loss": 0.0084, + "step": 709260 + }, + { + "epoch": 1.84, + "learning_rate": 2.422047742112753e-05, + "loss": 0.0075, + "step": 709270 + }, + { + "epoch": 1.84, + "learning_rate": 2.4216589204756064e-05, + "loss": 0.0111, + "step": 709280 + }, + { + "epoch": 1.84, + "learning_rate": 2.42127009883846e-05, + "loss": 0.0083, + "step": 709290 + }, + { + "epoch": 1.84, + "learning_rate": 2.4208812772013134e-05, + "loss": 0.0053, + "step": 709300 + }, + { + "epoch": 1.84, + "learning_rate": 2.420492455564167e-05, + "loss": 0.0089, + "step": 709310 + }, + { + "epoch": 1.84, + "learning_rate": 2.4201036339270203e-05, + "loss": 0.0064, + "step": 709320 + }, + { + "epoch": 1.84, + "learning_rate": 2.419714812289874e-05, + "loss": 0.0081, + "step": 709330 + }, + { + "epoch": 1.84, + "learning_rate": 2.4193259906527276e-05, + "loss": 0.0068, + "step": 709340 + }, + { + "epoch": 1.84, + "learning_rate": 2.418937169015581e-05, + "loss": 0.0061, + "step": 709350 + }, + { + "epoch": 1.84, + "learning_rate": 2.4185483473784346e-05, + "loss": 0.0063, + "step": 709360 + }, + { + "epoch": 1.84, + "learning_rate": 2.4181595257412884e-05, + "loss": 0.0066, + "step": 709370 + }, + { + "epoch": 1.84, + "learning_rate": 2.417770704104142e-05, + "loss": 0.0091, + "step": 709380 + }, + { + "epoch": 1.84, + "learning_rate": 2.4173818824669954e-05, + "loss": 0.0079, + "step": 709390 + }, + { + "epoch": 1.84, + "learning_rate": 2.4169930608298486e-05, + "loss": 0.0071, + "step": 709400 + }, + { + "epoch": 1.84, + "learning_rate": 2.416604239192702e-05, + "loss": 0.0087, + "step": 709410 + }, + { + "epoch": 1.84, + "learning_rate": 2.416215417555556e-05, + "loss": 0.0083, + "step": 709420 + }, + { + "epoch": 1.84, + "learning_rate": 2.4158265959184094e-05, + "loss": 0.0085, + "step": 709430 + }, + { + "epoch": 1.84, + "learning_rate": 2.415437774281263e-05, + "loss": 0.0086, + "step": 709440 + }, + { + "epoch": 1.84, + "learning_rate": 2.4150489526441163e-05, + "loss": 0.0059, + "step": 709450 + }, + { + "epoch": 1.84, + "learning_rate": 2.41466013100697e-05, + "loss": 0.0135, + "step": 709460 + }, + { + "epoch": 1.84, + "learning_rate": 2.4142713093698236e-05, + "loss": 0.0074, + "step": 709470 + }, + { + "epoch": 1.84, + "learning_rate": 2.413882487732677e-05, + "loss": 0.0068, + "step": 709480 + }, + { + "epoch": 1.84, + "learning_rate": 2.4134936660955306e-05, + "loss": 0.0177, + "step": 709490 + }, + { + "epoch": 1.84, + "learning_rate": 2.4131048444583844e-05, + "loss": 0.01, + "step": 709500 + }, + { + "epoch": 1.84, + "learning_rate": 2.412716022821238e-05, + "loss": 0.0073, + "step": 709510 + }, + { + "epoch": 1.84, + "learning_rate": 2.4123272011840914e-05, + "loss": 0.0058, + "step": 709520 + }, + { + "epoch": 1.84, + "learning_rate": 2.4119383795469446e-05, + "loss": 0.0094, + "step": 709530 + }, + { + "epoch": 1.84, + "learning_rate": 2.411549557909798e-05, + "loss": 0.0106, + "step": 709540 + }, + { + "epoch": 1.84, + "learning_rate": 2.411160736272652e-05, + "loss": 0.0088, + "step": 709550 + }, + { + "epoch": 1.84, + "learning_rate": 2.4107719146355054e-05, + "loss": 0.0109, + "step": 709560 + }, + { + "epoch": 1.84, + "learning_rate": 2.410383092998359e-05, + "loss": 0.0064, + "step": 709570 + }, + { + "epoch": 1.84, + "learning_rate": 2.4099942713612123e-05, + "loss": 0.0083, + "step": 709580 + }, + { + "epoch": 1.84, + "learning_rate": 2.409605449724066e-05, + "loss": 0.0057, + "step": 709590 + }, + { + "epoch": 1.84, + "learning_rate": 2.4092166280869196e-05, + "loss": 0.0067, + "step": 709600 + }, + { + "epoch": 1.84, + "learning_rate": 2.408827806449773e-05, + "loss": 0.0076, + "step": 709610 + }, + { + "epoch": 1.84, + "learning_rate": 2.4084389848126266e-05, + "loss": 0.0094, + "step": 709620 + }, + { + "epoch": 1.84, + "learning_rate": 2.4080501631754804e-05, + "loss": 0.0067, + "step": 709630 + }, + { + "epoch": 1.84, + "learning_rate": 2.407661341538334e-05, + "loss": 0.0084, + "step": 709640 + }, + { + "epoch": 1.84, + "learning_rate": 2.407272519901187e-05, + "loss": 0.0074, + "step": 709650 + }, + { + "epoch": 1.84, + "learning_rate": 2.4068836982640406e-05, + "loss": 0.0091, + "step": 709660 + }, + { + "epoch": 1.84, + "learning_rate": 2.406494876626894e-05, + "loss": 0.0071, + "step": 709670 + }, + { + "epoch": 1.84, + "learning_rate": 2.406106054989748e-05, + "loss": 0.0067, + "step": 709680 + }, + { + "epoch": 1.84, + "learning_rate": 2.4057172333526014e-05, + "loss": 0.0069, + "step": 709690 + }, + { + "epoch": 1.84, + "learning_rate": 2.405328411715455e-05, + "loss": 0.0085, + "step": 709700 + }, + { + "epoch": 1.84, + "learning_rate": 2.4049395900783083e-05, + "loss": 0.0108, + "step": 709710 + }, + { + "epoch": 1.84, + "learning_rate": 2.404550768441162e-05, + "loss": 0.0081, + "step": 709720 + }, + { + "epoch": 1.84, + "learning_rate": 2.4041619468040156e-05, + "loss": 0.0078, + "step": 709730 + }, + { + "epoch": 1.84, + "learning_rate": 2.403773125166869e-05, + "loss": 0.013, + "step": 709740 + }, + { + "epoch": 1.84, + "learning_rate": 2.4033843035297226e-05, + "loss": 0.0067, + "step": 709750 + }, + { + "epoch": 1.84, + "learning_rate": 2.4029954818925764e-05, + "loss": 0.0063, + "step": 709760 + }, + { + "epoch": 1.84, + "learning_rate": 2.40260666025543e-05, + "loss": 0.0076, + "step": 709770 + }, + { + "epoch": 1.84, + "learning_rate": 2.402217838618283e-05, + "loss": 0.006, + "step": 709780 + }, + { + "epoch": 1.84, + "learning_rate": 2.4018290169811366e-05, + "loss": 0.0088, + "step": 709790 + }, + { + "epoch": 1.84, + "learning_rate": 2.40144019534399e-05, + "loss": 0.0086, + "step": 709800 + }, + { + "epoch": 1.84, + "learning_rate": 2.401051373706844e-05, + "loss": 0.0086, + "step": 709810 + }, + { + "epoch": 1.84, + "learning_rate": 2.4006625520696974e-05, + "loss": 0.0069, + "step": 709820 + }, + { + "epoch": 1.84, + "learning_rate": 2.400273730432551e-05, + "loss": 0.0082, + "step": 709830 + }, + { + "epoch": 1.84, + "learning_rate": 2.3998849087954043e-05, + "loss": 0.0087, + "step": 709840 + }, + { + "epoch": 1.84, + "learning_rate": 2.399496087158258e-05, + "loss": 0.0088, + "step": 709850 + }, + { + "epoch": 1.84, + "learning_rate": 2.3991072655211116e-05, + "loss": 0.0074, + "step": 709860 + }, + { + "epoch": 1.84, + "learning_rate": 2.398718443883965e-05, + "loss": 0.0068, + "step": 709870 + }, + { + "epoch": 1.84, + "learning_rate": 2.3983296222468186e-05, + "loss": 0.006, + "step": 709880 + }, + { + "epoch": 1.84, + "learning_rate": 2.3979408006096724e-05, + "loss": 0.007, + "step": 709890 + }, + { + "epoch": 1.84, + "learning_rate": 2.3975519789725256e-05, + "loss": 0.0072, + "step": 709900 + }, + { + "epoch": 1.84, + "learning_rate": 2.397163157335379e-05, + "loss": 0.0057, + "step": 709910 + }, + { + "epoch": 1.84, + "learning_rate": 2.3967743356982326e-05, + "loss": 0.0066, + "step": 709920 + }, + { + "epoch": 1.84, + "learning_rate": 2.396385514061086e-05, + "loss": 0.0062, + "step": 709930 + }, + { + "epoch": 1.84, + "learning_rate": 2.39599669242394e-05, + "loss": 0.007, + "step": 709940 + }, + { + "epoch": 1.84, + "learning_rate": 2.3956078707867933e-05, + "loss": 0.0076, + "step": 709950 + }, + { + "epoch": 1.84, + "learning_rate": 2.395219049149647e-05, + "loss": 0.0063, + "step": 709960 + }, + { + "epoch": 1.84, + "learning_rate": 2.3948302275125003e-05, + "loss": 0.0084, + "step": 709970 + }, + { + "epoch": 1.84, + "learning_rate": 2.394441405875354e-05, + "loss": 0.0074, + "step": 709980 + }, + { + "epoch": 1.84, + "learning_rate": 2.3940525842382076e-05, + "loss": 0.0089, + "step": 709990 + }, + { + "epoch": 1.84, + "learning_rate": 2.393663762601061e-05, + "loss": 0.0087, + "step": 710000 + }, + { + "epoch": 1.84, + "eval_cer": 0.881642501934998, + "eval_loss": 0.00460857292637229, + "eval_runtime": 107.9419, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 710000 + }, + { + "epoch": 1.84, + "learning_rate": 2.3932749409639146e-05, + "loss": 0.0064, + "step": 710010 + }, + { + "epoch": 1.84, + "learning_rate": 2.3928861193267678e-05, + "loss": 0.0111, + "step": 710020 + }, + { + "epoch": 1.84, + "learning_rate": 2.3924972976896216e-05, + "loss": 0.0067, + "step": 710030 + }, + { + "epoch": 1.84, + "learning_rate": 2.392108476052475e-05, + "loss": 0.0085, + "step": 710040 + }, + { + "epoch": 1.84, + "learning_rate": 2.3917196544153285e-05, + "loss": 0.0082, + "step": 710050 + }, + { + "epoch": 1.84, + "learning_rate": 2.391330832778182e-05, + "loss": 0.0061, + "step": 710060 + }, + { + "epoch": 1.84, + "learning_rate": 2.390942011141036e-05, + "loss": 0.007, + "step": 710070 + }, + { + "epoch": 1.84, + "learning_rate": 2.3905531895038893e-05, + "loss": 0.007, + "step": 710080 + }, + { + "epoch": 1.84, + "learning_rate": 2.390164367866743e-05, + "loss": 0.0073, + "step": 710090 + }, + { + "epoch": 1.84, + "learning_rate": 2.3897755462295963e-05, + "loss": 0.0081, + "step": 710100 + }, + { + "epoch": 1.84, + "learning_rate": 2.38938672459245e-05, + "loss": 0.0066, + "step": 710110 + }, + { + "epoch": 1.84, + "learning_rate": 2.3889979029553036e-05, + "loss": 0.0078, + "step": 710120 + }, + { + "epoch": 1.84, + "learning_rate": 2.388609081318157e-05, + "loss": 0.0064, + "step": 710130 + }, + { + "epoch": 1.84, + "learning_rate": 2.3882202596810106e-05, + "loss": 0.0078, + "step": 710140 + }, + { + "epoch": 1.84, + "learning_rate": 2.3878314380438638e-05, + "loss": 0.0076, + "step": 710150 + }, + { + "epoch": 1.84, + "learning_rate": 2.3874426164067176e-05, + "loss": 0.005, + "step": 710160 + }, + { + "epoch": 1.84, + "learning_rate": 2.387053794769571e-05, + "loss": 0.0058, + "step": 710170 + }, + { + "epoch": 1.84, + "learning_rate": 2.3866649731324245e-05, + "loss": 0.0066, + "step": 710180 + }, + { + "epoch": 1.84, + "learning_rate": 2.386276151495278e-05, + "loss": 0.0049, + "step": 710190 + }, + { + "epoch": 1.84, + "learning_rate": 2.385887329858132e-05, + "loss": 0.0086, + "step": 710200 + }, + { + "epoch": 1.84, + "learning_rate": 2.3854985082209853e-05, + "loss": 0.0073, + "step": 710210 + }, + { + "epoch": 1.84, + "learning_rate": 2.385109686583839e-05, + "loss": 0.008, + "step": 710220 + }, + { + "epoch": 1.84, + "learning_rate": 2.3847208649466923e-05, + "loss": 0.0061, + "step": 710230 + }, + { + "epoch": 1.84, + "learning_rate": 2.384332043309546e-05, + "loss": 0.0091, + "step": 710240 + }, + { + "epoch": 1.84, + "learning_rate": 2.3839432216723996e-05, + "loss": 0.0073, + "step": 710250 + }, + { + "epoch": 1.84, + "learning_rate": 2.383554400035253e-05, + "loss": 0.0054, + "step": 710260 + }, + { + "epoch": 1.84, + "learning_rate": 2.3831655783981063e-05, + "loss": 0.0056, + "step": 710270 + }, + { + "epoch": 1.84, + "learning_rate": 2.3827767567609597e-05, + "loss": 0.0074, + "step": 710280 + }, + { + "epoch": 1.84, + "learning_rate": 2.3823879351238136e-05, + "loss": 0.0077, + "step": 710290 + }, + { + "epoch": 1.84, + "learning_rate": 2.381999113486667e-05, + "loss": 0.0061, + "step": 710300 + }, + { + "epoch": 1.84, + "learning_rate": 2.3816102918495205e-05, + "loss": 0.007, + "step": 710310 + }, + { + "epoch": 1.84, + "learning_rate": 2.381221470212374e-05, + "loss": 0.0081, + "step": 710320 + }, + { + "epoch": 1.84, + "learning_rate": 2.380832648575228e-05, + "loss": 0.0065, + "step": 710330 + }, + { + "epoch": 1.84, + "learning_rate": 2.3804438269380813e-05, + "loss": 0.0069, + "step": 710340 + }, + { + "epoch": 1.84, + "learning_rate": 2.3800550053009348e-05, + "loss": 0.0089, + "step": 710350 + }, + { + "epoch": 1.84, + "learning_rate": 2.3796661836637883e-05, + "loss": 0.008, + "step": 710360 + }, + { + "epoch": 1.84, + "learning_rate": 2.379277362026642e-05, + "loss": 0.0069, + "step": 710370 + }, + { + "epoch": 1.84, + "learning_rate": 2.3788885403894956e-05, + "loss": 0.0078, + "step": 710380 + }, + { + "epoch": 1.84, + "learning_rate": 2.378499718752349e-05, + "loss": 0.0065, + "step": 710390 + }, + { + "epoch": 1.84, + "learning_rate": 2.3781108971152023e-05, + "loss": 0.0113, + "step": 710400 + }, + { + "epoch": 1.84, + "learning_rate": 2.3777220754780557e-05, + "loss": 0.0057, + "step": 710410 + }, + { + "epoch": 1.84, + "learning_rate": 2.3773332538409096e-05, + "loss": 0.0095, + "step": 710420 + }, + { + "epoch": 1.84, + "learning_rate": 2.376944432203763e-05, + "loss": 0.0105, + "step": 710430 + }, + { + "epoch": 1.84, + "learning_rate": 2.3765556105666165e-05, + "loss": 0.0067, + "step": 710440 + }, + { + "epoch": 1.84, + "learning_rate": 2.37616678892947e-05, + "loss": 0.0073, + "step": 710450 + }, + { + "epoch": 1.84, + "learning_rate": 2.375777967292324e-05, + "loss": 0.0067, + "step": 710460 + }, + { + "epoch": 1.84, + "learning_rate": 2.3753891456551773e-05, + "loss": 0.0091, + "step": 710470 + }, + { + "epoch": 1.84, + "learning_rate": 2.3750003240180308e-05, + "loss": 0.0107, + "step": 710480 + }, + { + "epoch": 1.84, + "learning_rate": 2.3746115023808843e-05, + "loss": 0.0103, + "step": 710490 + }, + { + "epoch": 1.84, + "learning_rate": 2.374222680743738e-05, + "loss": 0.0092, + "step": 710500 + }, + { + "epoch": 1.84, + "learning_rate": 2.3738338591065916e-05, + "loss": 0.0086, + "step": 710510 + }, + { + "epoch": 1.84, + "learning_rate": 2.3734450374694448e-05, + "loss": 0.0076, + "step": 710520 + }, + { + "epoch": 1.84, + "learning_rate": 2.3730562158322983e-05, + "loss": 0.0058, + "step": 710530 + }, + { + "epoch": 1.84, + "learning_rate": 2.3726673941951517e-05, + "loss": 0.008, + "step": 710540 + }, + { + "epoch": 1.84, + "learning_rate": 2.3722785725580056e-05, + "loss": 0.0084, + "step": 710550 + }, + { + "epoch": 1.84, + "learning_rate": 2.371889750920859e-05, + "loss": 0.0057, + "step": 710560 + }, + { + "epoch": 1.84, + "learning_rate": 2.3715009292837125e-05, + "loss": 0.0051, + "step": 710570 + }, + { + "epoch": 1.84, + "learning_rate": 2.371112107646566e-05, + "loss": 0.0079, + "step": 710580 + }, + { + "epoch": 1.84, + "learning_rate": 2.37072328600942e-05, + "loss": 0.0044, + "step": 710590 + }, + { + "epoch": 1.84, + "learning_rate": 2.3703344643722733e-05, + "loss": 0.0083, + "step": 710600 + }, + { + "epoch": 1.84, + "learning_rate": 2.3699456427351268e-05, + "loss": 0.0058, + "step": 710610 + }, + { + "epoch": 1.84, + "learning_rate": 2.3695568210979803e-05, + "loss": 0.0077, + "step": 710620 + }, + { + "epoch": 1.84, + "learning_rate": 2.369167999460834e-05, + "loss": 0.0087, + "step": 710630 + }, + { + "epoch": 1.84, + "learning_rate": 2.3687791778236873e-05, + "loss": 0.0056, + "step": 710640 + }, + { + "epoch": 1.84, + "learning_rate": 2.3683903561865408e-05, + "loss": 0.006, + "step": 710650 + }, + { + "epoch": 1.84, + "learning_rate": 2.3680015345493943e-05, + "loss": 0.0076, + "step": 710660 + }, + { + "epoch": 1.84, + "learning_rate": 2.3676127129122477e-05, + "loss": 0.0069, + "step": 710670 + }, + { + "epoch": 1.84, + "learning_rate": 2.3672238912751016e-05, + "loss": 0.0094, + "step": 710680 + }, + { + "epoch": 1.84, + "learning_rate": 2.366835069637955e-05, + "loss": 0.0087, + "step": 710690 + }, + { + "epoch": 1.84, + "learning_rate": 2.3664462480008085e-05, + "loss": 0.0077, + "step": 710700 + }, + { + "epoch": 1.84, + "learning_rate": 2.366057426363662e-05, + "loss": 0.0076, + "step": 710710 + }, + { + "epoch": 1.84, + "learning_rate": 2.3656686047265155e-05, + "loss": 0.0104, + "step": 710720 + }, + { + "epoch": 1.84, + "learning_rate": 2.3652797830893693e-05, + "loss": 0.0104, + "step": 710730 + }, + { + "epoch": 1.84, + "learning_rate": 2.3648909614522228e-05, + "loss": 0.0076, + "step": 710740 + }, + { + "epoch": 1.84, + "learning_rate": 2.3645021398150763e-05, + "loss": 0.0078, + "step": 710750 + }, + { + "epoch": 1.84, + "learning_rate": 2.3641133181779298e-05, + "loss": 0.0089, + "step": 710760 + }, + { + "epoch": 1.84, + "learning_rate": 2.363724496540783e-05, + "loss": 0.009, + "step": 710770 + }, + { + "epoch": 1.84, + "learning_rate": 2.3633356749036368e-05, + "loss": 0.0112, + "step": 710780 + }, + { + "epoch": 1.84, + "learning_rate": 2.3629468532664903e-05, + "loss": 0.0074, + "step": 710790 + }, + { + "epoch": 1.84, + "learning_rate": 2.3625580316293437e-05, + "loss": 0.0048, + "step": 710800 + }, + { + "epoch": 1.84, + "learning_rate": 2.3621692099921972e-05, + "loss": 0.0061, + "step": 710810 + }, + { + "epoch": 1.84, + "learning_rate": 2.361780388355051e-05, + "loss": 0.0081, + "step": 710820 + }, + { + "epoch": 1.84, + "learning_rate": 2.3613915667179045e-05, + "loss": 0.0094, + "step": 710830 + }, + { + "epoch": 1.84, + "learning_rate": 2.361002745080758e-05, + "loss": 0.009, + "step": 710840 + }, + { + "epoch": 1.84, + "learning_rate": 2.3606139234436115e-05, + "loss": 0.0064, + "step": 710850 + }, + { + "epoch": 1.84, + "learning_rate": 2.3602251018064653e-05, + "loss": 0.0091, + "step": 710860 + }, + { + "epoch": 1.84, + "learning_rate": 2.3598362801693188e-05, + "loss": 0.0089, + "step": 710870 + }, + { + "epoch": 1.84, + "learning_rate": 2.3594474585321723e-05, + "loss": 0.0061, + "step": 710880 + }, + { + "epoch": 1.84, + "learning_rate": 2.3590586368950255e-05, + "loss": 0.0071, + "step": 710890 + }, + { + "epoch": 1.84, + "learning_rate": 2.358669815257879e-05, + "loss": 0.0083, + "step": 710900 + }, + { + "epoch": 1.84, + "learning_rate": 2.3582809936207328e-05, + "loss": 0.0081, + "step": 710910 + }, + { + "epoch": 1.84, + "learning_rate": 2.3578921719835862e-05, + "loss": 0.0064, + "step": 710920 + }, + { + "epoch": 1.84, + "learning_rate": 2.3575033503464397e-05, + "loss": 0.0078, + "step": 710930 + }, + { + "epoch": 1.84, + "learning_rate": 2.3571145287092932e-05, + "loss": 0.0094, + "step": 710940 + }, + { + "epoch": 1.84, + "learning_rate": 2.356725707072147e-05, + "loss": 0.0088, + "step": 710950 + }, + { + "epoch": 1.84, + "learning_rate": 2.3563368854350005e-05, + "loss": 0.0055, + "step": 710960 + }, + { + "epoch": 1.84, + "learning_rate": 2.355948063797854e-05, + "loss": 0.0094, + "step": 710970 + }, + { + "epoch": 1.84, + "learning_rate": 2.3555592421607075e-05, + "loss": 0.0063, + "step": 710980 + }, + { + "epoch": 1.84, + "learning_rate": 2.3551704205235613e-05, + "loss": 0.0046, + "step": 710990 + }, + { + "epoch": 1.84, + "learning_rate": 2.3547815988864148e-05, + "loss": 0.0083, + "step": 711000 + }, + { + "epoch": 1.84, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.004514896310865879, + "eval_runtime": 107.7072, + "eval_samples_per_second": 18.569, + "eval_steps_per_second": 4.642, + "step": 711000 + }, + { + "epoch": 1.84, + "learning_rate": 2.3543927772492683e-05, + "loss": 0.0106, + "step": 711010 + }, + { + "epoch": 1.84, + "learning_rate": 2.3540039556121214e-05, + "loss": 0.007, + "step": 711020 + }, + { + "epoch": 1.84, + "learning_rate": 2.353615133974975e-05, + "loss": 0.0063, + "step": 711030 + }, + { + "epoch": 1.84, + "learning_rate": 2.3532263123378288e-05, + "loss": 0.0073, + "step": 711040 + }, + { + "epoch": 1.84, + "learning_rate": 2.3528374907006822e-05, + "loss": 0.0051, + "step": 711050 + }, + { + "epoch": 1.84, + "learning_rate": 2.3524486690635357e-05, + "loss": 0.0124, + "step": 711060 + }, + { + "epoch": 1.84, + "learning_rate": 2.3520598474263892e-05, + "loss": 0.0062, + "step": 711070 + }, + { + "epoch": 1.84, + "learning_rate": 2.351671025789243e-05, + "loss": 0.0071, + "step": 711080 + }, + { + "epoch": 1.84, + "learning_rate": 2.3512822041520965e-05, + "loss": 0.0062, + "step": 711090 + }, + { + "epoch": 1.84, + "learning_rate": 2.35089338251495e-05, + "loss": 0.0079, + "step": 711100 + }, + { + "epoch": 1.84, + "learning_rate": 2.3505045608778035e-05, + "loss": 0.0075, + "step": 711110 + }, + { + "epoch": 1.84, + "learning_rate": 2.3501157392406573e-05, + "loss": 0.0089, + "step": 711120 + }, + { + "epoch": 1.84, + "learning_rate": 2.3497269176035108e-05, + "loss": 0.0077, + "step": 711130 + }, + { + "epoch": 1.84, + "learning_rate": 2.349338095966364e-05, + "loss": 0.0072, + "step": 711140 + }, + { + "epoch": 1.84, + "learning_rate": 2.3489492743292174e-05, + "loss": 0.008, + "step": 711150 + }, + { + "epoch": 1.84, + "learning_rate": 2.348560452692071e-05, + "loss": 0.008, + "step": 711160 + }, + { + "epoch": 1.84, + "learning_rate": 2.3481716310549248e-05, + "loss": 0.0057, + "step": 711170 + }, + { + "epoch": 1.84, + "learning_rate": 2.3477828094177782e-05, + "loss": 0.0075, + "step": 711180 + }, + { + "epoch": 1.84, + "learning_rate": 2.3473939877806317e-05, + "loss": 0.0069, + "step": 711190 + }, + { + "epoch": 1.84, + "learning_rate": 2.3470051661434852e-05, + "loss": 0.0062, + "step": 711200 + }, + { + "epoch": 1.84, + "learning_rate": 2.346616344506339e-05, + "loss": 0.0068, + "step": 711210 + }, + { + "epoch": 1.84, + "learning_rate": 2.3462275228691925e-05, + "loss": 0.0109, + "step": 711220 + }, + { + "epoch": 1.84, + "learning_rate": 2.345838701232046e-05, + "loss": 0.0063, + "step": 711230 + }, + { + "epoch": 1.84, + "learning_rate": 2.3454498795948995e-05, + "loss": 0.0072, + "step": 711240 + }, + { + "epoch": 1.84, + "learning_rate": 2.3450610579577533e-05, + "loss": 0.0087, + "step": 711250 + }, + { + "epoch": 1.84, + "learning_rate": 2.3446722363206065e-05, + "loss": 0.0054, + "step": 711260 + }, + { + "epoch": 1.84, + "learning_rate": 2.34428341468346e-05, + "loss": 0.0053, + "step": 711270 + }, + { + "epoch": 1.84, + "learning_rate": 2.3438945930463134e-05, + "loss": 0.0098, + "step": 711280 + }, + { + "epoch": 1.84, + "learning_rate": 2.343505771409167e-05, + "loss": 0.0077, + "step": 711290 + }, + { + "epoch": 1.84, + "learning_rate": 2.3431169497720208e-05, + "loss": 0.0077, + "step": 711300 + }, + { + "epoch": 1.84, + "learning_rate": 2.3427281281348742e-05, + "loss": 0.0072, + "step": 711310 + }, + { + "epoch": 1.84, + "learning_rate": 2.3423393064977277e-05, + "loss": 0.0089, + "step": 711320 + }, + { + "epoch": 1.84, + "learning_rate": 2.3419504848605812e-05, + "loss": 0.0065, + "step": 711330 + }, + { + "epoch": 1.84, + "learning_rate": 2.341561663223435e-05, + "loss": 0.0084, + "step": 711340 + }, + { + "epoch": 1.84, + "learning_rate": 2.3411728415862885e-05, + "loss": 0.007, + "step": 711350 + }, + { + "epoch": 1.84, + "learning_rate": 2.340784019949142e-05, + "loss": 0.0073, + "step": 711360 + }, + { + "epoch": 1.84, + "learning_rate": 2.3403951983119955e-05, + "loss": 0.0099, + "step": 711370 + }, + { + "epoch": 1.84, + "learning_rate": 2.3400063766748493e-05, + "loss": 0.006, + "step": 711380 + }, + { + "epoch": 1.84, + "learning_rate": 2.3396175550377025e-05, + "loss": 0.0089, + "step": 711390 + }, + { + "epoch": 1.84, + "learning_rate": 2.339228733400556e-05, + "loss": 0.0106, + "step": 711400 + }, + { + "epoch": 1.84, + "learning_rate": 2.3388399117634094e-05, + "loss": 0.0085, + "step": 711410 + }, + { + "epoch": 1.84, + "learning_rate": 2.338451090126263e-05, + "loss": 0.0114, + "step": 711420 + }, + { + "epoch": 1.84, + "learning_rate": 2.3380622684891168e-05, + "loss": 0.0072, + "step": 711430 + }, + { + "epoch": 1.84, + "learning_rate": 2.3376734468519702e-05, + "loss": 0.0061, + "step": 711440 + }, + { + "epoch": 1.84, + "learning_rate": 2.3372846252148237e-05, + "loss": 0.0078, + "step": 711450 + }, + { + "epoch": 1.84, + "learning_rate": 2.3368958035776772e-05, + "loss": 0.0059, + "step": 711460 + }, + { + "epoch": 1.84, + "learning_rate": 2.336506981940531e-05, + "loss": 0.009, + "step": 711470 + }, + { + "epoch": 1.84, + "learning_rate": 2.3361181603033845e-05, + "loss": 0.0084, + "step": 711480 + }, + { + "epoch": 1.84, + "learning_rate": 2.335729338666238e-05, + "loss": 0.0074, + "step": 711490 + }, + { + "epoch": 1.84, + "learning_rate": 2.3353405170290915e-05, + "loss": 0.0086, + "step": 711500 + }, + { + "epoch": 1.84, + "learning_rate": 2.3349516953919446e-05, + "loss": 0.0058, + "step": 711510 + }, + { + "epoch": 1.84, + "learning_rate": 2.3345628737547985e-05, + "loss": 0.0075, + "step": 711520 + }, + { + "epoch": 1.84, + "learning_rate": 2.334174052117652e-05, + "loss": 0.0063, + "step": 711530 + }, + { + "epoch": 1.84, + "learning_rate": 2.3337852304805054e-05, + "loss": 0.0091, + "step": 711540 + }, + { + "epoch": 1.84, + "learning_rate": 2.333396408843359e-05, + "loss": 0.0065, + "step": 711550 + }, + { + "epoch": 1.84, + "learning_rate": 2.3330075872062128e-05, + "loss": 0.0064, + "step": 711560 + }, + { + "epoch": 1.84, + "learning_rate": 2.3326187655690662e-05, + "loss": 0.0078, + "step": 711570 + }, + { + "epoch": 1.84, + "learning_rate": 2.3322299439319197e-05, + "loss": 0.0093, + "step": 711580 + }, + { + "epoch": 1.84, + "learning_rate": 2.3318411222947732e-05, + "loss": 0.01, + "step": 711590 + }, + { + "epoch": 1.84, + "learning_rate": 2.331452300657627e-05, + "loss": 0.0069, + "step": 711600 + }, + { + "epoch": 1.84, + "learning_rate": 2.3310634790204805e-05, + "loss": 0.0084, + "step": 711610 + }, + { + "epoch": 1.84, + "learning_rate": 2.330674657383334e-05, + "loss": 0.009, + "step": 711620 + }, + { + "epoch": 1.84, + "learning_rate": 2.3302858357461875e-05, + "loss": 0.0067, + "step": 711630 + }, + { + "epoch": 1.84, + "learning_rate": 2.3298970141090406e-05, + "loss": 0.0067, + "step": 711640 + }, + { + "epoch": 1.84, + "learning_rate": 2.3295081924718945e-05, + "loss": 0.0098, + "step": 711650 + }, + { + "epoch": 1.84, + "learning_rate": 2.329119370834748e-05, + "loss": 0.0078, + "step": 711660 + }, + { + "epoch": 1.84, + "learning_rate": 2.3287305491976014e-05, + "loss": 0.0082, + "step": 711670 + }, + { + "epoch": 1.84, + "learning_rate": 2.328341727560455e-05, + "loss": 0.0065, + "step": 711680 + }, + { + "epoch": 1.84, + "learning_rate": 2.3279529059233087e-05, + "loss": 0.0084, + "step": 711690 + }, + { + "epoch": 1.84, + "learning_rate": 2.3275640842861622e-05, + "loss": 0.0069, + "step": 711700 + }, + { + "epoch": 1.84, + "learning_rate": 2.3271752626490157e-05, + "loss": 0.0068, + "step": 711710 + }, + { + "epoch": 1.84, + "learning_rate": 2.3267864410118692e-05, + "loss": 0.0072, + "step": 711720 + }, + { + "epoch": 1.84, + "learning_rate": 2.326397619374723e-05, + "loss": 0.0068, + "step": 711730 + }, + { + "epoch": 1.84, + "learning_rate": 2.3260087977375765e-05, + "loss": 0.0085, + "step": 711740 + }, + { + "epoch": 1.84, + "learning_rate": 2.32561997610043e-05, + "loss": 0.0075, + "step": 711750 + }, + { + "epoch": 1.84, + "learning_rate": 2.325231154463283e-05, + "loss": 0.0055, + "step": 711760 + }, + { + "epoch": 1.85, + "learning_rate": 2.3248423328261366e-05, + "loss": 0.0093, + "step": 711770 + }, + { + "epoch": 1.85, + "learning_rate": 2.3244535111889905e-05, + "loss": 0.007, + "step": 711780 + }, + { + "epoch": 1.85, + "learning_rate": 2.324064689551844e-05, + "loss": 0.0075, + "step": 711790 + }, + { + "epoch": 1.85, + "learning_rate": 2.3236758679146974e-05, + "loss": 0.0103, + "step": 711800 + }, + { + "epoch": 1.85, + "learning_rate": 2.323287046277551e-05, + "loss": 0.0084, + "step": 711810 + }, + { + "epoch": 1.85, + "learning_rate": 2.3228982246404047e-05, + "loss": 0.0088, + "step": 711820 + }, + { + "epoch": 1.85, + "learning_rate": 2.3225094030032582e-05, + "loss": 0.007, + "step": 711830 + }, + { + "epoch": 1.85, + "learning_rate": 2.3221205813661117e-05, + "loss": 0.0077, + "step": 711840 + }, + { + "epoch": 1.85, + "learning_rate": 2.3217317597289652e-05, + "loss": 0.0083, + "step": 711850 + }, + { + "epoch": 1.85, + "learning_rate": 2.321342938091819e-05, + "loss": 0.0093, + "step": 711860 + }, + { + "epoch": 1.85, + "learning_rate": 2.3209541164546725e-05, + "loss": 0.0056, + "step": 711870 + }, + { + "epoch": 1.85, + "learning_rate": 2.3205652948175257e-05, + "loss": 0.0079, + "step": 711880 + }, + { + "epoch": 1.85, + "learning_rate": 2.320176473180379e-05, + "loss": 0.0066, + "step": 711890 + }, + { + "epoch": 1.85, + "learning_rate": 2.3197876515432326e-05, + "loss": 0.0077, + "step": 711900 + }, + { + "epoch": 1.85, + "learning_rate": 2.3193988299060865e-05, + "loss": 0.0074, + "step": 711910 + }, + { + "epoch": 1.85, + "learning_rate": 2.31901000826894e-05, + "loss": 0.0085, + "step": 711920 + }, + { + "epoch": 1.85, + "learning_rate": 2.3186211866317934e-05, + "loss": 0.0105, + "step": 711930 + }, + { + "epoch": 1.85, + "learning_rate": 2.318232364994647e-05, + "loss": 0.0075, + "step": 711940 + }, + { + "epoch": 1.85, + "learning_rate": 2.3178435433575007e-05, + "loss": 0.0054, + "step": 711950 + }, + { + "epoch": 1.85, + "learning_rate": 2.3174547217203542e-05, + "loss": 0.0112, + "step": 711960 + }, + { + "epoch": 1.85, + "learning_rate": 2.3170659000832077e-05, + "loss": 0.0094, + "step": 711970 + }, + { + "epoch": 1.85, + "learning_rate": 2.3166770784460612e-05, + "loss": 0.0096, + "step": 711980 + }, + { + "epoch": 1.85, + "learning_rate": 2.316288256808915e-05, + "loss": 0.0063, + "step": 711990 + }, + { + "epoch": 1.85, + "learning_rate": 2.3158994351717685e-05, + "loss": 0.0065, + "step": 712000 + }, + { + "epoch": 1.85, + "eval_cer": 0.8816439015719323, + "eval_loss": 0.004501926247030497, + "eval_runtime": 107.8113, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, + "step": 712000 + }, + { + "epoch": 1.85, + "learning_rate": 2.3155106135346217e-05, + "loss": 0.0066, + "step": 712010 + }, + { + "epoch": 1.85, + "learning_rate": 2.315121791897475e-05, + "loss": 0.0074, + "step": 712020 + }, + { + "epoch": 1.85, + "learning_rate": 2.3147329702603286e-05, + "loss": 0.0054, + "step": 712030 + }, + { + "epoch": 1.85, + "learning_rate": 2.3143441486231825e-05, + "loss": 0.0085, + "step": 712040 + }, + { + "epoch": 1.85, + "learning_rate": 2.313955326986036e-05, + "loss": 0.0077, + "step": 712050 + }, + { + "epoch": 1.85, + "learning_rate": 2.3135665053488894e-05, + "loss": 0.0052, + "step": 712060 + }, + { + "epoch": 1.85, + "learning_rate": 2.313177683711743e-05, + "loss": 0.0068, + "step": 712070 + }, + { + "epoch": 1.85, + "learning_rate": 2.3127888620745964e-05, + "loss": 0.007, + "step": 712080 + }, + { + "epoch": 1.85, + "learning_rate": 2.3124000404374502e-05, + "loss": 0.0073, + "step": 712090 + }, + { + "epoch": 1.85, + "learning_rate": 2.3120112188003037e-05, + "loss": 0.0075, + "step": 712100 + }, + { + "epoch": 1.85, + "learning_rate": 2.3116223971631572e-05, + "loss": 0.0062, + "step": 712110 + }, + { + "epoch": 1.85, + "learning_rate": 2.3112335755260107e-05, + "loss": 0.0097, + "step": 712120 + }, + { + "epoch": 1.85, + "learning_rate": 2.3108447538888642e-05, + "loss": 0.0069, + "step": 712130 + }, + { + "epoch": 1.85, + "learning_rate": 2.3104559322517177e-05, + "loss": 0.0049, + "step": 712140 + }, + { + "epoch": 1.85, + "learning_rate": 2.310067110614571e-05, + "loss": 0.0068, + "step": 712150 + }, + { + "epoch": 1.85, + "learning_rate": 2.3096782889774246e-05, + "loss": 0.0075, + "step": 712160 + }, + { + "epoch": 1.85, + "learning_rate": 2.309289467340278e-05, + "loss": 0.0068, + "step": 712170 + }, + { + "epoch": 1.85, + "learning_rate": 2.308900645703132e-05, + "loss": 0.0082, + "step": 712180 + }, + { + "epoch": 1.85, + "learning_rate": 2.3085118240659854e-05, + "loss": 0.0074, + "step": 712190 + }, + { + "epoch": 1.85, + "learning_rate": 2.308123002428839e-05, + "loss": 0.0065, + "step": 712200 + }, + { + "epoch": 1.85, + "learning_rate": 2.3077341807916924e-05, + "loss": 0.0098, + "step": 712210 + }, + { + "epoch": 1.85, + "learning_rate": 2.3073453591545462e-05, + "loss": 0.0066, + "step": 712220 + }, + { + "epoch": 1.85, + "learning_rate": 2.3069565375173997e-05, + "loss": 0.0086, + "step": 712230 + }, + { + "epoch": 1.85, + "learning_rate": 2.3065677158802532e-05, + "loss": 0.0075, + "step": 712240 + }, + { + "epoch": 1.85, + "learning_rate": 2.3061788942431067e-05, + "loss": 0.0061, + "step": 712250 + }, + { + "epoch": 1.85, + "learning_rate": 2.30579007260596e-05, + "loss": 0.0062, + "step": 712260 + }, + { + "epoch": 1.85, + "learning_rate": 2.3054012509688137e-05, + "loss": 0.0081, + "step": 712270 + }, + { + "epoch": 1.85, + "learning_rate": 2.305012429331667e-05, + "loss": 0.0065, + "step": 712280 + }, + { + "epoch": 1.85, + "learning_rate": 2.3046236076945206e-05, + "loss": 0.0081, + "step": 712290 + }, + { + "epoch": 1.85, + "learning_rate": 2.304234786057374e-05, + "loss": 0.0064, + "step": 712300 + }, + { + "epoch": 1.85, + "learning_rate": 2.303845964420228e-05, + "loss": 0.0062, + "step": 712310 + }, + { + "epoch": 1.85, + "learning_rate": 2.3034571427830814e-05, + "loss": 0.0066, + "step": 712320 + }, + { + "epoch": 1.85, + "learning_rate": 2.303068321145935e-05, + "loss": 0.0082, + "step": 712330 + }, + { + "epoch": 1.85, + "learning_rate": 2.3026794995087884e-05, + "loss": 0.0079, + "step": 712340 + }, + { + "epoch": 1.85, + "learning_rate": 2.3022906778716422e-05, + "loss": 0.0086, + "step": 712350 + }, + { + "epoch": 1.85, + "learning_rate": 2.3019018562344957e-05, + "loss": 0.0064, + "step": 712360 + }, + { + "epoch": 1.85, + "learning_rate": 2.3015130345973492e-05, + "loss": 0.0085, + "step": 712370 + }, + { + "epoch": 1.85, + "learning_rate": 2.3011242129602023e-05, + "loss": 0.0068, + "step": 712380 + }, + { + "epoch": 1.85, + "learning_rate": 2.3007353913230558e-05, + "loss": 0.0094, + "step": 712390 + }, + { + "epoch": 1.85, + "learning_rate": 2.3003465696859097e-05, + "loss": 0.0062, + "step": 712400 + }, + { + "epoch": 1.85, + "learning_rate": 2.299957748048763e-05, + "loss": 0.0088, + "step": 712410 + }, + { + "epoch": 1.85, + "learning_rate": 2.2995689264116166e-05, + "loss": 0.0076, + "step": 712420 + }, + { + "epoch": 1.85, + "learning_rate": 2.29918010477447e-05, + "loss": 0.0099, + "step": 712430 + }, + { + "epoch": 1.85, + "learning_rate": 2.298791283137324e-05, + "loss": 0.0071, + "step": 712440 + }, + { + "epoch": 1.85, + "learning_rate": 2.2984024615001774e-05, + "loss": 0.0077, + "step": 712450 + }, + { + "epoch": 1.85, + "learning_rate": 2.298013639863031e-05, + "loss": 0.0083, + "step": 712460 + }, + { + "epoch": 1.85, + "learning_rate": 2.2976248182258844e-05, + "loss": 0.0067, + "step": 712470 + }, + { + "epoch": 1.85, + "learning_rate": 2.2972359965887382e-05, + "loss": 0.0055, + "step": 712480 + }, + { + "epoch": 1.85, + "learning_rate": 2.2968471749515917e-05, + "loss": 0.0059, + "step": 712490 + }, + { + "epoch": 1.85, + "learning_rate": 2.2964583533144452e-05, + "loss": 0.0064, + "step": 712500 + }, + { + "epoch": 1.85, + "learning_rate": 2.2960695316772983e-05, + "loss": 0.0056, + "step": 712510 + }, + { + "epoch": 1.85, + "learning_rate": 2.2956807100401518e-05, + "loss": 0.0099, + "step": 712520 + }, + { + "epoch": 1.85, + "learning_rate": 2.2952918884030057e-05, + "loss": 0.0069, + "step": 712530 + }, + { + "epoch": 1.85, + "learning_rate": 2.294903066765859e-05, + "loss": 0.007, + "step": 712540 + }, + { + "epoch": 1.85, + "learning_rate": 2.2945142451287126e-05, + "loss": 0.0069, + "step": 712550 + }, + { + "epoch": 1.85, + "learning_rate": 2.294125423491566e-05, + "loss": 0.0071, + "step": 712560 + }, + { + "epoch": 1.85, + "learning_rate": 2.29373660185442e-05, + "loss": 0.008, + "step": 712570 + }, + { + "epoch": 1.85, + "learning_rate": 2.2933477802172734e-05, + "loss": 0.0102, + "step": 712580 + }, + { + "epoch": 1.85, + "learning_rate": 2.292958958580127e-05, + "loss": 0.0068, + "step": 712590 + }, + { + "epoch": 1.85, + "learning_rate": 2.2925701369429804e-05, + "loss": 0.0062, + "step": 712600 + }, + { + "epoch": 1.85, + "learning_rate": 2.2921813153058342e-05, + "loss": 0.0099, + "step": 712610 + }, + { + "epoch": 1.85, + "learning_rate": 2.2917924936686877e-05, + "loss": 0.0088, + "step": 712620 + }, + { + "epoch": 1.85, + "learning_rate": 2.291403672031541e-05, + "loss": 0.0064, + "step": 712630 + }, + { + "epoch": 1.85, + "learning_rate": 2.2910148503943943e-05, + "loss": 0.0084, + "step": 712640 + }, + { + "epoch": 1.85, + "learning_rate": 2.2906260287572478e-05, + "loss": 0.0066, + "step": 712650 + }, + { + "epoch": 1.85, + "learning_rate": 2.2902372071201016e-05, + "loss": 0.012, + "step": 712660 + }, + { + "epoch": 1.85, + "learning_rate": 2.289848385482955e-05, + "loss": 0.0051, + "step": 712670 + }, + { + "epoch": 1.85, + "learning_rate": 2.2894595638458086e-05, + "loss": 0.0064, + "step": 712680 + }, + { + "epoch": 1.85, + "learning_rate": 2.289070742208662e-05, + "loss": 0.0072, + "step": 712690 + }, + { + "epoch": 1.85, + "learning_rate": 2.288681920571516e-05, + "loss": 0.0094, + "step": 712700 + }, + { + "epoch": 1.85, + "learning_rate": 2.2882930989343694e-05, + "loss": 0.0092, + "step": 712710 + }, + { + "epoch": 1.85, + "learning_rate": 2.287904277297223e-05, + "loss": 0.0056, + "step": 712720 + }, + { + "epoch": 1.85, + "learning_rate": 2.2875154556600764e-05, + "loss": 0.007, + "step": 712730 + }, + { + "epoch": 1.85, + "learning_rate": 2.2871266340229302e-05, + "loss": 0.0063, + "step": 712740 + }, + { + "epoch": 1.85, + "learning_rate": 2.2867378123857834e-05, + "loss": 0.0095, + "step": 712750 + }, + { + "epoch": 1.85, + "learning_rate": 2.286348990748637e-05, + "loss": 0.007, + "step": 712760 + }, + { + "epoch": 1.85, + "learning_rate": 2.2859601691114903e-05, + "loss": 0.006, + "step": 712770 + }, + { + "epoch": 1.85, + "learning_rate": 2.2855713474743438e-05, + "loss": 0.0094, + "step": 712780 + }, + { + "epoch": 1.85, + "learning_rate": 2.2851825258371976e-05, + "loss": 0.0077, + "step": 712790 + }, + { + "epoch": 1.85, + "learning_rate": 2.284793704200051e-05, + "loss": 0.008, + "step": 712800 + }, + { + "epoch": 1.85, + "learning_rate": 2.2844048825629046e-05, + "loss": 0.007, + "step": 712810 + }, + { + "epoch": 1.85, + "learning_rate": 2.284016060925758e-05, + "loss": 0.0083, + "step": 712820 + }, + { + "epoch": 1.85, + "learning_rate": 2.283627239288612e-05, + "loss": 0.0071, + "step": 712830 + }, + { + "epoch": 1.85, + "learning_rate": 2.2832384176514654e-05, + "loss": 0.0065, + "step": 712840 + }, + { + "epoch": 1.85, + "learning_rate": 2.282849596014319e-05, + "loss": 0.0065, + "step": 712850 + }, + { + "epoch": 1.85, + "learning_rate": 2.2824607743771724e-05, + "loss": 0.0092, + "step": 712860 + }, + { + "epoch": 1.85, + "learning_rate": 2.2820719527400262e-05, + "loss": 0.0108, + "step": 712870 + }, + { + "epoch": 1.85, + "learning_rate": 2.2816831311028794e-05, + "loss": 0.0075, + "step": 712880 + }, + { + "epoch": 1.85, + "learning_rate": 2.281294309465733e-05, + "loss": 0.0069, + "step": 712890 + }, + { + "epoch": 1.85, + "learning_rate": 2.2809054878285863e-05, + "loss": 0.0076, + "step": 712900 + }, + { + "epoch": 1.85, + "learning_rate": 2.2805166661914398e-05, + "loss": 0.0076, + "step": 712910 + }, + { + "epoch": 1.85, + "learning_rate": 2.2801278445542936e-05, + "loss": 0.0063, + "step": 712920 + }, + { + "epoch": 1.85, + "learning_rate": 2.279739022917147e-05, + "loss": 0.0087, + "step": 712930 + }, + { + "epoch": 1.85, + "learning_rate": 2.2793502012800006e-05, + "loss": 0.0053, + "step": 712940 + }, + { + "epoch": 1.85, + "learning_rate": 2.278961379642854e-05, + "loss": 0.0094, + "step": 712950 + }, + { + "epoch": 1.85, + "learning_rate": 2.278572558005708e-05, + "loss": 0.0082, + "step": 712960 + }, + { + "epoch": 1.85, + "learning_rate": 2.2781837363685614e-05, + "loss": 0.0058, + "step": 712970 + }, + { + "epoch": 1.85, + "learning_rate": 2.277794914731415e-05, + "loss": 0.0068, + "step": 712980 + }, + { + "epoch": 1.85, + "learning_rate": 2.2774060930942684e-05, + "loss": 0.0116, + "step": 712990 + }, + { + "epoch": 1.85, + "learning_rate": 2.2770172714571215e-05, + "loss": 0.0081, + "step": 713000 + }, + { + "epoch": 1.85, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.004550943151116371, + "eval_runtime": 107.8933, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 713000 + }, + { + "epoch": 1.85, + "learning_rate": 2.2766284498199754e-05, + "loss": 0.0067, + "step": 713010 + }, + { + "epoch": 1.85, + "learning_rate": 2.276239628182829e-05, + "loss": 0.0072, + "step": 713020 + }, + { + "epoch": 1.85, + "learning_rate": 2.2758508065456823e-05, + "loss": 0.0065, + "step": 713030 + }, + { + "epoch": 1.85, + "learning_rate": 2.2754619849085358e-05, + "loss": 0.0049, + "step": 713040 + }, + { + "epoch": 1.85, + "learning_rate": 2.2750731632713896e-05, + "loss": 0.0079, + "step": 713050 + }, + { + "epoch": 1.85, + "learning_rate": 2.274684341634243e-05, + "loss": 0.007, + "step": 713060 + }, + { + "epoch": 1.85, + "learning_rate": 2.2742955199970966e-05, + "loss": 0.0062, + "step": 713070 + }, + { + "epoch": 1.85, + "learning_rate": 2.27390669835995e-05, + "loss": 0.0088, + "step": 713080 + }, + { + "epoch": 1.85, + "learning_rate": 2.273517876722804e-05, + "loss": 0.0064, + "step": 713090 + }, + { + "epoch": 1.85, + "learning_rate": 2.2731290550856574e-05, + "loss": 0.0067, + "step": 713100 + }, + { + "epoch": 1.85, + "learning_rate": 2.272740233448511e-05, + "loss": 0.0091, + "step": 713110 + }, + { + "epoch": 1.85, + "learning_rate": 2.2723514118113644e-05, + "loss": 0.0069, + "step": 713120 + }, + { + "epoch": 1.85, + "learning_rate": 2.2719625901742175e-05, + "loss": 0.0093, + "step": 713130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2715737685370714e-05, + "loss": 0.0083, + "step": 713140 + }, + { + "epoch": 1.85, + "learning_rate": 2.271184946899925e-05, + "loss": 0.0104, + "step": 713150 + }, + { + "epoch": 1.85, + "learning_rate": 2.2707961252627783e-05, + "loss": 0.0066, + "step": 713160 + }, + { + "epoch": 1.85, + "learning_rate": 2.2704073036256318e-05, + "loss": 0.0068, + "step": 713170 + }, + { + "epoch": 1.85, + "learning_rate": 2.2700184819884856e-05, + "loss": 0.0077, + "step": 713180 + }, + { + "epoch": 1.85, + "learning_rate": 2.269629660351339e-05, + "loss": 0.0117, + "step": 713190 + }, + { + "epoch": 1.85, + "learning_rate": 2.2692408387141926e-05, + "loss": 0.0079, + "step": 713200 + }, + { + "epoch": 1.85, + "learning_rate": 2.268852017077046e-05, + "loss": 0.0091, + "step": 713210 + }, + { + "epoch": 1.85, + "learning_rate": 2.2684631954399e-05, + "loss": 0.0074, + "step": 713220 + }, + { + "epoch": 1.85, + "learning_rate": 2.2680743738027534e-05, + "loss": 0.0065, + "step": 713230 + }, + { + "epoch": 1.85, + "learning_rate": 2.267685552165607e-05, + "loss": 0.0069, + "step": 713240 + }, + { + "epoch": 1.85, + "learning_rate": 2.26729673052846e-05, + "loss": 0.0077, + "step": 713250 + }, + { + "epoch": 1.85, + "learning_rate": 2.2669079088913135e-05, + "loss": 0.0081, + "step": 713260 + }, + { + "epoch": 1.85, + "learning_rate": 2.2665190872541674e-05, + "loss": 0.0088, + "step": 713270 + }, + { + "epoch": 1.85, + "learning_rate": 2.266130265617021e-05, + "loss": 0.0115, + "step": 713280 + }, + { + "epoch": 1.85, + "learning_rate": 2.2657414439798743e-05, + "loss": 0.0078, + "step": 713290 + }, + { + "epoch": 1.85, + "learning_rate": 2.2653526223427278e-05, + "loss": 0.0058, + "step": 713300 + }, + { + "epoch": 1.85, + "learning_rate": 2.2649638007055816e-05, + "loss": 0.009, + "step": 713310 + }, + { + "epoch": 1.85, + "learning_rate": 2.264574979068435e-05, + "loss": 0.0063, + "step": 713320 + }, + { + "epoch": 1.85, + "learning_rate": 2.2641861574312886e-05, + "loss": 0.0082, + "step": 713330 + }, + { + "epoch": 1.85, + "learning_rate": 2.263797335794142e-05, + "loss": 0.0075, + "step": 713340 + }, + { + "epoch": 1.85, + "learning_rate": 2.263408514156996e-05, + "loss": 0.0077, + "step": 713350 + }, + { + "epoch": 1.85, + "learning_rate": 2.2630196925198494e-05, + "loss": 0.0064, + "step": 713360 + }, + { + "epoch": 1.85, + "learning_rate": 2.2626308708827026e-05, + "loss": 0.0074, + "step": 713370 + }, + { + "epoch": 1.85, + "learning_rate": 2.262242049245556e-05, + "loss": 0.0114, + "step": 713380 + }, + { + "epoch": 1.85, + "learning_rate": 2.2618532276084095e-05, + "loss": 0.0079, + "step": 713390 + }, + { + "epoch": 1.85, + "learning_rate": 2.2614644059712634e-05, + "loss": 0.0074, + "step": 713400 + }, + { + "epoch": 1.85, + "learning_rate": 2.261075584334117e-05, + "loss": 0.01, + "step": 713410 + }, + { + "epoch": 1.85, + "learning_rate": 2.2606867626969703e-05, + "loss": 0.0088, + "step": 713420 + }, + { + "epoch": 1.85, + "learning_rate": 2.2602979410598238e-05, + "loss": 0.0062, + "step": 713430 + }, + { + "epoch": 1.85, + "learning_rate": 2.2599091194226776e-05, + "loss": 0.0062, + "step": 713440 + }, + { + "epoch": 1.85, + "learning_rate": 2.259520297785531e-05, + "loss": 0.008, + "step": 713450 + }, + { + "epoch": 1.85, + "learning_rate": 2.2591314761483846e-05, + "loss": 0.0087, + "step": 713460 + }, + { + "epoch": 1.85, + "learning_rate": 2.258742654511238e-05, + "loss": 0.0062, + "step": 713470 + }, + { + "epoch": 1.85, + "learning_rate": 2.2583538328740916e-05, + "loss": 0.0069, + "step": 713480 + }, + { + "epoch": 1.85, + "learning_rate": 2.2579650112369454e-05, + "loss": 0.0105, + "step": 713490 + }, + { + "epoch": 1.85, + "learning_rate": 2.2575761895997986e-05, + "loss": 0.0087, + "step": 713500 + }, + { + "epoch": 1.85, + "learning_rate": 2.257187367962652e-05, + "loss": 0.0059, + "step": 713510 + }, + { + "epoch": 1.85, + "learning_rate": 2.2567985463255055e-05, + "loss": 0.0066, + "step": 713520 + }, + { + "epoch": 1.85, + "learning_rate": 2.256409724688359e-05, + "loss": 0.01, + "step": 713530 + }, + { + "epoch": 1.85, + "learning_rate": 2.256020903051213e-05, + "loss": 0.0055, + "step": 713540 + }, + { + "epoch": 1.85, + "learning_rate": 2.2556320814140663e-05, + "loss": 0.0063, + "step": 713550 + }, + { + "epoch": 1.85, + "learning_rate": 2.2552432597769198e-05, + "loss": 0.0063, + "step": 713560 + }, + { + "epoch": 1.85, + "learning_rate": 2.2548544381397733e-05, + "loss": 0.0083, + "step": 713570 + }, + { + "epoch": 1.85, + "learning_rate": 2.254465616502627e-05, + "loss": 0.0059, + "step": 713580 + }, + { + "epoch": 1.85, + "learning_rate": 2.2540767948654806e-05, + "loss": 0.0059, + "step": 713590 + }, + { + "epoch": 1.85, + "learning_rate": 2.253687973228334e-05, + "loss": 0.0069, + "step": 713600 + }, + { + "epoch": 1.85, + "learning_rate": 2.2532991515911876e-05, + "loss": 0.0067, + "step": 713610 + }, + { + "epoch": 1.85, + "learning_rate": 2.2529103299540407e-05, + "loss": 0.0068, + "step": 713620 + }, + { + "epoch": 1.85, + "learning_rate": 2.2525215083168945e-05, + "loss": 0.0087, + "step": 713630 + }, + { + "epoch": 1.85, + "learning_rate": 2.252132686679748e-05, + "loss": 0.0083, + "step": 713640 + }, + { + "epoch": 1.85, + "learning_rate": 2.2517438650426015e-05, + "loss": 0.0058, + "step": 713650 + }, + { + "epoch": 1.85, + "learning_rate": 2.251355043405455e-05, + "loss": 0.0085, + "step": 713660 + }, + { + "epoch": 1.85, + "learning_rate": 2.250966221768309e-05, + "loss": 0.0056, + "step": 713670 + }, + { + "epoch": 1.85, + "learning_rate": 2.2505774001311623e-05, + "loss": 0.0071, + "step": 713680 + }, + { + "epoch": 1.85, + "learning_rate": 2.2501885784940158e-05, + "loss": 0.0083, + "step": 713690 + }, + { + "epoch": 1.85, + "learning_rate": 2.2497997568568693e-05, + "loss": 0.008, + "step": 713700 + }, + { + "epoch": 1.85, + "learning_rate": 2.249410935219723e-05, + "loss": 0.0078, + "step": 713710 + }, + { + "epoch": 1.85, + "learning_rate": 2.2490221135825766e-05, + "loss": 0.0051, + "step": 713720 + }, + { + "epoch": 1.85, + "learning_rate": 2.24863329194543e-05, + "loss": 0.0056, + "step": 713730 + }, + { + "epoch": 1.85, + "learning_rate": 2.2482444703082836e-05, + "loss": 0.0052, + "step": 713740 + }, + { + "epoch": 1.85, + "learning_rate": 2.2478556486711367e-05, + "loss": 0.0061, + "step": 713750 + }, + { + "epoch": 1.85, + "learning_rate": 2.2474668270339905e-05, + "loss": 0.0059, + "step": 713760 + }, + { + "epoch": 1.85, + "learning_rate": 2.247078005396844e-05, + "loss": 0.0052, + "step": 713770 + }, + { + "epoch": 1.85, + "learning_rate": 2.2466891837596975e-05, + "loss": 0.0078, + "step": 713780 + }, + { + "epoch": 1.85, + "learning_rate": 2.246300362122551e-05, + "loss": 0.0081, + "step": 713790 + }, + { + "epoch": 1.85, + "learning_rate": 2.2459115404854048e-05, + "loss": 0.0107, + "step": 713800 + }, + { + "epoch": 1.85, + "learning_rate": 2.2455227188482583e-05, + "loss": 0.0088, + "step": 713810 + }, + { + "epoch": 1.85, + "learning_rate": 2.2451338972111118e-05, + "loss": 0.0066, + "step": 713820 + }, + { + "epoch": 1.85, + "learning_rate": 2.2447450755739653e-05, + "loss": 0.0062, + "step": 713830 + }, + { + "epoch": 1.85, + "learning_rate": 2.244356253936819e-05, + "loss": 0.0088, + "step": 713840 + }, + { + "epoch": 1.85, + "learning_rate": 2.2439674322996726e-05, + "loss": 0.006, + "step": 713850 + }, + { + "epoch": 1.85, + "learning_rate": 2.243578610662526e-05, + "loss": 0.0067, + "step": 713860 + }, + { + "epoch": 1.85, + "learning_rate": 2.2431897890253792e-05, + "loss": 0.0098, + "step": 713870 + }, + { + "epoch": 1.85, + "learning_rate": 2.2428009673882327e-05, + "loss": 0.007, + "step": 713880 + }, + { + "epoch": 1.85, + "learning_rate": 2.2424121457510865e-05, + "loss": 0.0065, + "step": 713890 + }, + { + "epoch": 1.85, + "learning_rate": 2.24202332411394e-05, + "loss": 0.0074, + "step": 713900 + }, + { + "epoch": 1.85, + "learning_rate": 2.2416345024767935e-05, + "loss": 0.0085, + "step": 713910 + }, + { + "epoch": 1.85, + "learning_rate": 2.241245680839647e-05, + "loss": 0.0073, + "step": 713920 + }, + { + "epoch": 1.85, + "learning_rate": 2.2408568592025008e-05, + "loss": 0.0065, + "step": 713930 + }, + { + "epoch": 1.85, + "learning_rate": 2.2404680375653543e-05, + "loss": 0.005, + "step": 713940 + }, + { + "epoch": 1.85, + "learning_rate": 2.2400792159282078e-05, + "loss": 0.0058, + "step": 713950 + }, + { + "epoch": 1.85, + "learning_rate": 2.2396903942910613e-05, + "loss": 0.0087, + "step": 713960 + }, + { + "epoch": 1.85, + "learning_rate": 2.239301572653915e-05, + "loss": 0.0071, + "step": 713970 + }, + { + "epoch": 1.85, + "learning_rate": 2.2389127510167686e-05, + "loss": 0.0058, + "step": 713980 + }, + { + "epoch": 1.85, + "learning_rate": 2.2385239293796217e-05, + "loss": 0.0098, + "step": 713990 + }, + { + "epoch": 1.85, + "learning_rate": 2.2381351077424752e-05, + "loss": 0.006, + "step": 714000 + }, + { + "epoch": 1.85, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.004546701442450285, + "eval_runtime": 107.8645, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, + "step": 714000 + }, + { + "epoch": 1.85, + "learning_rate": 2.2377462861053287e-05, + "loss": 0.0107, + "step": 714010 + }, + { + "epoch": 1.85, + "learning_rate": 2.2373574644681825e-05, + "loss": 0.0077, + "step": 714020 + }, + { + "epoch": 1.85, + "learning_rate": 2.236968642831036e-05, + "loss": 0.0079, + "step": 714030 + }, + { + "epoch": 1.85, + "learning_rate": 2.2365798211938895e-05, + "loss": 0.007, + "step": 714040 + }, + { + "epoch": 1.85, + "learning_rate": 2.236190999556743e-05, + "loss": 0.007, + "step": 714050 + }, + { + "epoch": 1.85, + "learning_rate": 2.2358021779195968e-05, + "loss": 0.007, + "step": 714060 + }, + { + "epoch": 1.85, + "learning_rate": 2.2354133562824503e-05, + "loss": 0.0069, + "step": 714070 + }, + { + "epoch": 1.85, + "learning_rate": 2.2350245346453038e-05, + "loss": 0.0082, + "step": 714080 + }, + { + "epoch": 1.85, + "learning_rate": 2.2346357130081573e-05, + "loss": 0.0081, + "step": 714090 + }, + { + "epoch": 1.85, + "learning_rate": 2.234246891371011e-05, + "loss": 0.0072, + "step": 714100 + }, + { + "epoch": 1.85, + "learning_rate": 2.2338580697338646e-05, + "loss": 0.007, + "step": 714110 + }, + { + "epoch": 1.85, + "learning_rate": 2.2334692480967177e-05, + "loss": 0.0086, + "step": 714120 + }, + { + "epoch": 1.85, + "learning_rate": 2.2330804264595712e-05, + "loss": 0.0059, + "step": 714130 + }, + { + "epoch": 1.85, + "learning_rate": 2.2326916048224247e-05, + "loss": 0.0069, + "step": 714140 + }, + { + "epoch": 1.85, + "learning_rate": 2.2323027831852785e-05, + "loss": 0.0092, + "step": 714150 + }, + { + "epoch": 1.85, + "learning_rate": 2.231913961548132e-05, + "loss": 0.0078, + "step": 714160 + }, + { + "epoch": 1.85, + "learning_rate": 2.2315251399109855e-05, + "loss": 0.0061, + "step": 714170 + }, + { + "epoch": 1.85, + "learning_rate": 2.231136318273839e-05, + "loss": 0.0059, + "step": 714180 + }, + { + "epoch": 1.85, + "learning_rate": 2.2307474966366928e-05, + "loss": 0.0078, + "step": 714190 + }, + { + "epoch": 1.85, + "learning_rate": 2.2303586749995463e-05, + "loss": 0.0077, + "step": 714200 + }, + { + "epoch": 1.85, + "learning_rate": 2.2299698533623998e-05, + "loss": 0.0066, + "step": 714210 + }, + { + "epoch": 1.85, + "learning_rate": 2.2295810317252533e-05, + "loss": 0.0088, + "step": 714220 + }, + { + "epoch": 1.85, + "learning_rate": 2.229192210088107e-05, + "loss": 0.0066, + "step": 714230 + }, + { + "epoch": 1.85, + "learning_rate": 2.2288033884509603e-05, + "loss": 0.0089, + "step": 714240 + }, + { + "epoch": 1.85, + "learning_rate": 2.2284145668138137e-05, + "loss": 0.0079, + "step": 714250 + }, + { + "epoch": 1.85, + "learning_rate": 2.2280257451766672e-05, + "loss": 0.0091, + "step": 714260 + }, + { + "epoch": 1.85, + "learning_rate": 2.2276369235395207e-05, + "loss": 0.0086, + "step": 714270 + }, + { + "epoch": 1.85, + "learning_rate": 2.2272481019023745e-05, + "loss": 0.0086, + "step": 714280 + }, + { + "epoch": 1.85, + "learning_rate": 2.226859280265228e-05, + "loss": 0.0061, + "step": 714290 + }, + { + "epoch": 1.85, + "learning_rate": 2.2264704586280815e-05, + "loss": 0.0082, + "step": 714300 + }, + { + "epoch": 1.85, + "learning_rate": 2.226081636990935e-05, + "loss": 0.009, + "step": 714310 + }, + { + "epoch": 1.85, + "learning_rate": 2.2256928153537888e-05, + "loss": 0.0139, + "step": 714320 + }, + { + "epoch": 1.85, + "learning_rate": 2.2253039937166423e-05, + "loss": 0.0069, + "step": 714330 + }, + { + "epoch": 1.85, + "learning_rate": 2.2249151720794958e-05, + "loss": 0.0057, + "step": 714340 + }, + { + "epoch": 1.85, + "learning_rate": 2.2245263504423493e-05, + "loss": 0.0068, + "step": 714350 + }, + { + "epoch": 1.85, + "learning_rate": 2.224137528805203e-05, + "loss": 0.0067, + "step": 714360 + }, + { + "epoch": 1.85, + "learning_rate": 2.2237487071680563e-05, + "loss": 0.0086, + "step": 714370 + }, + { + "epoch": 1.85, + "learning_rate": 2.2233598855309097e-05, + "loss": 0.0072, + "step": 714380 + }, + { + "epoch": 1.85, + "learning_rate": 2.2229710638937632e-05, + "loss": 0.0049, + "step": 714390 + }, + { + "epoch": 1.85, + "learning_rate": 2.2225822422566167e-05, + "loss": 0.0088, + "step": 714400 + }, + { + "epoch": 1.85, + "learning_rate": 2.2221934206194705e-05, + "loss": 0.0063, + "step": 714410 + }, + { + "epoch": 1.85, + "learning_rate": 2.221804598982324e-05, + "loss": 0.0073, + "step": 714420 + }, + { + "epoch": 1.85, + "learning_rate": 2.2214157773451775e-05, + "loss": 0.0086, + "step": 714430 + }, + { + "epoch": 1.85, + "learning_rate": 2.221026955708031e-05, + "loss": 0.0061, + "step": 714440 + }, + { + "epoch": 1.85, + "learning_rate": 2.2206381340708848e-05, + "loss": 0.0098, + "step": 714450 + }, + { + "epoch": 1.85, + "learning_rate": 2.2202493124337383e-05, + "loss": 0.0093, + "step": 714460 + }, + { + "epoch": 1.85, + "learning_rate": 2.2198604907965918e-05, + "loss": 0.0076, + "step": 714470 + }, + { + "epoch": 1.85, + "learning_rate": 2.2194716691594453e-05, + "loss": 0.0087, + "step": 714480 + }, + { + "epoch": 1.85, + "learning_rate": 2.2190828475222984e-05, + "loss": 0.0074, + "step": 714490 + }, + { + "epoch": 1.85, + "learning_rate": 2.2186940258851522e-05, + "loss": 0.0054, + "step": 714500 + }, + { + "epoch": 1.85, + "learning_rate": 2.2183052042480057e-05, + "loss": 0.006, + "step": 714510 + }, + { + "epoch": 1.85, + "learning_rate": 2.2179163826108592e-05, + "loss": 0.0064, + "step": 714520 + }, + { + "epoch": 1.85, + "learning_rate": 2.2175275609737127e-05, + "loss": 0.0067, + "step": 714530 + }, + { + "epoch": 1.85, + "learning_rate": 2.2171387393365665e-05, + "loss": 0.009, + "step": 714540 + }, + { + "epoch": 1.85, + "learning_rate": 2.21674991769942e-05, + "loss": 0.0053, + "step": 714550 + }, + { + "epoch": 1.85, + "learning_rate": 2.2163610960622735e-05, + "loss": 0.0096, + "step": 714560 + }, + { + "epoch": 1.85, + "learning_rate": 2.215972274425127e-05, + "loss": 0.0078, + "step": 714570 + }, + { + "epoch": 1.85, + "learning_rate": 2.2155834527879808e-05, + "loss": 0.0045, + "step": 714580 + }, + { + "epoch": 1.85, + "learning_rate": 2.2151946311508343e-05, + "loss": 0.0065, + "step": 714590 + }, + { + "epoch": 1.85, + "learning_rate": 2.2148058095136878e-05, + "loss": 0.0075, + "step": 714600 + }, + { + "epoch": 1.85, + "learning_rate": 2.214416987876541e-05, + "loss": 0.0068, + "step": 714610 + }, + { + "epoch": 1.85, + "learning_rate": 2.2140281662393944e-05, + "loss": 0.0073, + "step": 714620 + }, + { + "epoch": 1.85, + "learning_rate": 2.2136393446022482e-05, + "loss": 0.0086, + "step": 714630 + }, + { + "epoch": 1.85, + "learning_rate": 2.2132505229651017e-05, + "loss": 0.0077, + "step": 714640 + }, + { + "epoch": 1.85, + "learning_rate": 2.2128617013279552e-05, + "loss": 0.0075, + "step": 714650 + }, + { + "epoch": 1.85, + "learning_rate": 2.2124728796908087e-05, + "loss": 0.007, + "step": 714660 + }, + { + "epoch": 1.85, + "learning_rate": 2.2120840580536625e-05, + "loss": 0.0074, + "step": 714670 + }, + { + "epoch": 1.85, + "learning_rate": 2.211695236416516e-05, + "loss": 0.0065, + "step": 714680 + }, + { + "epoch": 1.85, + "learning_rate": 2.2113064147793695e-05, + "loss": 0.0078, + "step": 714690 + }, + { + "epoch": 1.85, + "learning_rate": 2.210917593142223e-05, + "loss": 0.0064, + "step": 714700 + }, + { + "epoch": 1.85, + "learning_rate": 2.2105287715050768e-05, + "loss": 0.0069, + "step": 714710 + }, + { + "epoch": 1.85, + "learning_rate": 2.2101399498679303e-05, + "loss": 0.0069, + "step": 714720 + }, + { + "epoch": 1.85, + "learning_rate": 2.2097511282307838e-05, + "loss": 0.0078, + "step": 714730 + }, + { + "epoch": 1.85, + "learning_rate": 2.209362306593637e-05, + "loss": 0.0072, + "step": 714740 + }, + { + "epoch": 1.85, + "learning_rate": 2.2089734849564904e-05, + "loss": 0.0059, + "step": 714750 + }, + { + "epoch": 1.85, + "learning_rate": 2.2085846633193442e-05, + "loss": 0.0115, + "step": 714760 + }, + { + "epoch": 1.85, + "learning_rate": 2.2081958416821977e-05, + "loss": 0.0086, + "step": 714770 + }, + { + "epoch": 1.85, + "learning_rate": 2.2078070200450512e-05, + "loss": 0.0062, + "step": 714780 + }, + { + "epoch": 1.85, + "learning_rate": 2.2074181984079047e-05, + "loss": 0.0063, + "step": 714790 + }, + { + "epoch": 1.85, + "learning_rate": 2.2070293767707585e-05, + "loss": 0.0053, + "step": 714800 + }, + { + "epoch": 1.85, + "learning_rate": 2.206640555133612e-05, + "loss": 0.0071, + "step": 714810 + }, + { + "epoch": 1.85, + "learning_rate": 2.2062517334964655e-05, + "loss": 0.0075, + "step": 714820 + }, + { + "epoch": 1.85, + "learning_rate": 2.205862911859319e-05, + "loss": 0.0083, + "step": 714830 + }, + { + "epoch": 1.85, + "learning_rate": 2.2054740902221725e-05, + "loss": 0.013, + "step": 714840 + }, + { + "epoch": 1.85, + "learning_rate": 2.2050852685850263e-05, + "loss": 0.0063, + "step": 714850 + }, + { + "epoch": 1.85, + "learning_rate": 2.2046964469478794e-05, + "loss": 0.0061, + "step": 714860 + }, + { + "epoch": 1.85, + "learning_rate": 2.204307625310733e-05, + "loss": 0.0063, + "step": 714870 + }, + { + "epoch": 1.85, + "learning_rate": 2.2039188036735864e-05, + "loss": 0.0076, + "step": 714880 + }, + { + "epoch": 1.85, + "learning_rate": 2.2035299820364402e-05, + "loss": 0.0087, + "step": 714890 + }, + { + "epoch": 1.85, + "learning_rate": 2.2031411603992937e-05, + "loss": 0.0078, + "step": 714900 + }, + { + "epoch": 1.85, + "learning_rate": 2.2027523387621472e-05, + "loss": 0.0096, + "step": 714910 + }, + { + "epoch": 1.85, + "learning_rate": 2.2023635171250007e-05, + "loss": 0.0077, + "step": 714920 + }, + { + "epoch": 1.85, + "learning_rate": 2.2019746954878542e-05, + "loss": 0.0069, + "step": 714930 + }, + { + "epoch": 1.85, + "learning_rate": 2.201585873850708e-05, + "loss": 0.0113, + "step": 714940 + }, + { + "epoch": 1.85, + "learning_rate": 2.2011970522135615e-05, + "loss": 0.0115, + "step": 714950 + }, + { + "epoch": 1.85, + "learning_rate": 2.200808230576415e-05, + "loss": 0.0065, + "step": 714960 + }, + { + "epoch": 1.85, + "learning_rate": 2.2004194089392685e-05, + "loss": 0.008, + "step": 714970 + }, + { + "epoch": 1.85, + "learning_rate": 2.2000305873021223e-05, + "loss": 0.0064, + "step": 714980 + }, + { + "epoch": 1.85, + "learning_rate": 2.1996417656649754e-05, + "loss": 0.0075, + "step": 714990 + }, + { + "epoch": 1.85, + "learning_rate": 2.199252944027829e-05, + "loss": 0.0061, + "step": 715000 + }, + { + "epoch": 1.85, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004574858583509922, + "eval_runtime": 107.8934, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 715000 + }, + { + "epoch": 1.85, + "learning_rate": 2.1988641223906824e-05, + "loss": 0.0066, + "step": 715010 + }, + { + "epoch": 1.85, + "learning_rate": 2.198475300753536e-05, + "loss": 0.0071, + "step": 715020 + }, + { + "epoch": 1.85, + "learning_rate": 2.1980864791163897e-05, + "loss": 0.0066, + "step": 715030 + }, + { + "epoch": 1.85, + "learning_rate": 2.1976976574792432e-05, + "loss": 0.0067, + "step": 715040 + }, + { + "epoch": 1.85, + "learning_rate": 2.1973088358420967e-05, + "loss": 0.0071, + "step": 715050 + }, + { + "epoch": 1.85, + "learning_rate": 2.1969200142049502e-05, + "loss": 0.0076, + "step": 715060 + }, + { + "epoch": 1.85, + "learning_rate": 2.196531192567804e-05, + "loss": 0.0059, + "step": 715070 + }, + { + "epoch": 1.85, + "learning_rate": 2.1961423709306575e-05, + "loss": 0.0093, + "step": 715080 + }, + { + "epoch": 1.85, + "learning_rate": 2.195753549293511e-05, + "loss": 0.0061, + "step": 715090 + }, + { + "epoch": 1.85, + "learning_rate": 2.1953647276563645e-05, + "loss": 0.0088, + "step": 715100 + }, + { + "epoch": 1.85, + "learning_rate": 2.1949759060192176e-05, + "loss": 0.0071, + "step": 715110 + }, + { + "epoch": 1.85, + "learning_rate": 2.1945870843820714e-05, + "loss": 0.0056, + "step": 715120 + }, + { + "epoch": 1.85, + "learning_rate": 2.194198262744925e-05, + "loss": 0.0069, + "step": 715130 + }, + { + "epoch": 1.85, + "learning_rate": 2.1938094411077784e-05, + "loss": 0.0071, + "step": 715140 + }, + { + "epoch": 1.85, + "learning_rate": 2.193420619470632e-05, + "loss": 0.007, + "step": 715150 + }, + { + "epoch": 1.85, + "learning_rate": 2.1930317978334857e-05, + "loss": 0.0086, + "step": 715160 + }, + { + "epoch": 1.85, + "learning_rate": 2.1926429761963392e-05, + "loss": 0.0089, + "step": 715170 + }, + { + "epoch": 1.85, + "learning_rate": 2.1922541545591927e-05, + "loss": 0.0073, + "step": 715180 + }, + { + "epoch": 1.85, + "learning_rate": 2.1918653329220462e-05, + "loss": 0.007, + "step": 715190 + }, + { + "epoch": 1.85, + "learning_rate": 2.1914765112849e-05, + "loss": 0.0086, + "step": 715200 + }, + { + "epoch": 1.85, + "learning_rate": 2.1910876896477535e-05, + "loss": 0.0067, + "step": 715210 + }, + { + "epoch": 1.85, + "learning_rate": 2.190698868010607e-05, + "loss": 0.0054, + "step": 715220 + }, + { + "epoch": 1.85, + "learning_rate": 2.19031004637346e-05, + "loss": 0.007, + "step": 715230 + }, + { + "epoch": 1.85, + "learning_rate": 2.1899212247363136e-05, + "loss": 0.0066, + "step": 715240 + }, + { + "epoch": 1.85, + "learning_rate": 2.1895324030991674e-05, + "loss": 0.0054, + "step": 715250 + }, + { + "epoch": 1.85, + "learning_rate": 2.189143581462021e-05, + "loss": 0.0091, + "step": 715260 + }, + { + "epoch": 1.85, + "learning_rate": 2.1887547598248744e-05, + "loss": 0.0094, + "step": 715270 + }, + { + "epoch": 1.85, + "learning_rate": 2.188365938187728e-05, + "loss": 0.007, + "step": 715280 + }, + { + "epoch": 1.85, + "learning_rate": 2.1879771165505817e-05, + "loss": 0.0077, + "step": 715290 + }, + { + "epoch": 1.85, + "learning_rate": 2.1875882949134352e-05, + "loss": 0.007, + "step": 715300 + }, + { + "epoch": 1.85, + "learning_rate": 2.1871994732762887e-05, + "loss": 0.0054, + "step": 715310 + }, + { + "epoch": 1.85, + "learning_rate": 2.1868106516391422e-05, + "loss": 0.0058, + "step": 715320 + }, + { + "epoch": 1.85, + "learning_rate": 2.186421830001996e-05, + "loss": 0.0105, + "step": 715330 + }, + { + "epoch": 1.85, + "learning_rate": 2.1860330083648495e-05, + "loss": 0.0086, + "step": 715340 + }, + { + "epoch": 1.85, + "learning_rate": 2.185644186727703e-05, + "loss": 0.0072, + "step": 715350 + }, + { + "epoch": 1.85, + "learning_rate": 2.185255365090556e-05, + "loss": 0.008, + "step": 715360 + }, + { + "epoch": 1.85, + "learning_rate": 2.1848665434534096e-05, + "loss": 0.009, + "step": 715370 + }, + { + "epoch": 1.85, + "learning_rate": 2.1844777218162634e-05, + "loss": 0.0073, + "step": 715380 + }, + { + "epoch": 1.85, + "learning_rate": 2.184088900179117e-05, + "loss": 0.0082, + "step": 715390 + }, + { + "epoch": 1.85, + "learning_rate": 2.1837000785419704e-05, + "loss": 0.0084, + "step": 715400 + }, + { + "epoch": 1.85, + "learning_rate": 2.183311256904824e-05, + "loss": 0.0135, + "step": 715410 + }, + { + "epoch": 1.85, + "learning_rate": 2.1829224352676777e-05, + "loss": 0.0067, + "step": 715420 + }, + { + "epoch": 1.85, + "learning_rate": 2.1825336136305312e-05, + "loss": 0.0074, + "step": 715430 + }, + { + "epoch": 1.85, + "learning_rate": 2.1821447919933847e-05, + "loss": 0.0062, + "step": 715440 + }, + { + "epoch": 1.85, + "learning_rate": 2.1817559703562382e-05, + "loss": 0.0051, + "step": 715450 + }, + { + "epoch": 1.85, + "learning_rate": 2.181367148719092e-05, + "loss": 0.0052, + "step": 715460 + }, + { + "epoch": 1.85, + "learning_rate": 2.1809783270819455e-05, + "loss": 0.0078, + "step": 715470 + }, + { + "epoch": 1.85, + "learning_rate": 2.1805895054447986e-05, + "loss": 0.0071, + "step": 715480 + }, + { + "epoch": 1.85, + "learning_rate": 2.180200683807652e-05, + "loss": 0.0073, + "step": 715490 + }, + { + "epoch": 1.85, + "learning_rate": 2.1798118621705056e-05, + "loss": 0.0132, + "step": 715500 + }, + { + "epoch": 1.85, + "learning_rate": 2.1794230405333594e-05, + "loss": 0.0094, + "step": 715510 + }, + { + "epoch": 1.85, + "learning_rate": 2.179034218896213e-05, + "loss": 0.0094, + "step": 715520 + }, + { + "epoch": 1.85, + "learning_rate": 2.1786453972590664e-05, + "loss": 0.0087, + "step": 715530 + }, + { + "epoch": 1.85, + "learning_rate": 2.17825657562192e-05, + "loss": 0.0071, + "step": 715540 + }, + { + "epoch": 1.85, + "learning_rate": 2.1778677539847737e-05, + "loss": 0.0092, + "step": 715550 + }, + { + "epoch": 1.85, + "learning_rate": 2.1774789323476272e-05, + "loss": 0.0109, + "step": 715560 + }, + { + "epoch": 1.85, + "learning_rate": 2.1770901107104807e-05, + "loss": 0.006, + "step": 715570 + }, + { + "epoch": 1.85, + "learning_rate": 2.1767012890733342e-05, + "loss": 0.0067, + "step": 715580 + }, + { + "epoch": 1.85, + "learning_rate": 2.176312467436188e-05, + "loss": 0.0065, + "step": 715590 + }, + { + "epoch": 1.85, + "learning_rate": 2.1759236457990415e-05, + "loss": 0.0056, + "step": 715600 + }, + { + "epoch": 1.85, + "learning_rate": 2.1755348241618946e-05, + "loss": 0.0093, + "step": 715610 + }, + { + "epoch": 1.85, + "learning_rate": 2.175146002524748e-05, + "loss": 0.0085, + "step": 715620 + }, + { + "epoch": 1.86, + "learning_rate": 2.1747571808876016e-05, + "loss": 0.0069, + "step": 715630 + }, + { + "epoch": 1.86, + "learning_rate": 2.1743683592504554e-05, + "loss": 0.0077, + "step": 715640 + }, + { + "epoch": 1.86, + "learning_rate": 2.173979537613309e-05, + "loss": 0.0076, + "step": 715650 + }, + { + "epoch": 1.86, + "learning_rate": 2.1735907159761624e-05, + "loss": 0.0076, + "step": 715660 + }, + { + "epoch": 1.86, + "learning_rate": 2.173201894339016e-05, + "loss": 0.0069, + "step": 715670 + }, + { + "epoch": 1.86, + "learning_rate": 2.1728130727018697e-05, + "loss": 0.0075, + "step": 715680 + }, + { + "epoch": 1.86, + "learning_rate": 2.1724242510647232e-05, + "loss": 0.0063, + "step": 715690 + }, + { + "epoch": 1.86, + "learning_rate": 2.1720354294275767e-05, + "loss": 0.0053, + "step": 715700 + }, + { + "epoch": 1.86, + "learning_rate": 2.1716466077904302e-05, + "loss": 0.0084, + "step": 715710 + }, + { + "epoch": 1.86, + "learning_rate": 2.171257786153284e-05, + "loss": 0.0084, + "step": 715720 + }, + { + "epoch": 1.86, + "learning_rate": 2.170868964516137e-05, + "loss": 0.0085, + "step": 715730 + }, + { + "epoch": 1.86, + "learning_rate": 2.1704801428789906e-05, + "loss": 0.0062, + "step": 715740 + }, + { + "epoch": 1.86, + "learning_rate": 2.170091321241844e-05, + "loss": 0.007, + "step": 715750 + }, + { + "epoch": 1.86, + "learning_rate": 2.1697024996046976e-05, + "loss": 0.0079, + "step": 715760 + }, + { + "epoch": 1.86, + "learning_rate": 2.1693136779675514e-05, + "loss": 0.0071, + "step": 715770 + }, + { + "epoch": 1.86, + "learning_rate": 2.168924856330405e-05, + "loss": 0.0099, + "step": 715780 + }, + { + "epoch": 1.86, + "learning_rate": 2.1685360346932584e-05, + "loss": 0.0082, + "step": 715790 + }, + { + "epoch": 1.86, + "learning_rate": 2.168147213056112e-05, + "loss": 0.0092, + "step": 715800 + }, + { + "epoch": 1.86, + "learning_rate": 2.1677583914189657e-05, + "loss": 0.0067, + "step": 715810 + }, + { + "epoch": 1.86, + "learning_rate": 2.1673695697818192e-05, + "loss": 0.0054, + "step": 715820 + }, + { + "epoch": 1.86, + "learning_rate": 2.1669807481446727e-05, + "loss": 0.0069, + "step": 715830 + }, + { + "epoch": 1.86, + "learning_rate": 2.166591926507526e-05, + "loss": 0.0086, + "step": 715840 + }, + { + "epoch": 1.86, + "learning_rate": 2.1662031048703793e-05, + "loss": 0.0064, + "step": 715850 + }, + { + "epoch": 1.86, + "learning_rate": 2.165814283233233e-05, + "loss": 0.0075, + "step": 715860 + }, + { + "epoch": 1.86, + "learning_rate": 2.1654254615960866e-05, + "loss": 0.006, + "step": 715870 + }, + { + "epoch": 1.86, + "learning_rate": 2.16503663995894e-05, + "loss": 0.0072, + "step": 715880 + }, + { + "epoch": 1.86, + "learning_rate": 2.1646478183217936e-05, + "loss": 0.0084, + "step": 715890 + }, + { + "epoch": 1.86, + "learning_rate": 2.1642589966846474e-05, + "loss": 0.0055, + "step": 715900 + }, + { + "epoch": 1.86, + "learning_rate": 2.163870175047501e-05, + "loss": 0.0096, + "step": 715910 + }, + { + "epoch": 1.86, + "learning_rate": 2.1634813534103544e-05, + "loss": 0.0064, + "step": 715920 + }, + { + "epoch": 1.86, + "learning_rate": 2.163092531773208e-05, + "loss": 0.0083, + "step": 715930 + }, + { + "epoch": 1.86, + "learning_rate": 2.1627037101360617e-05, + "loss": 0.0077, + "step": 715940 + }, + { + "epoch": 1.86, + "learning_rate": 2.1623148884989152e-05, + "loss": 0.0083, + "step": 715950 + }, + { + "epoch": 1.86, + "learning_rate": 2.1619260668617687e-05, + "loss": 0.0076, + "step": 715960 + }, + { + "epoch": 1.86, + "learning_rate": 2.161537245224622e-05, + "loss": 0.0076, + "step": 715970 + }, + { + "epoch": 1.86, + "learning_rate": 2.1611484235874753e-05, + "loss": 0.008, + "step": 715980 + }, + { + "epoch": 1.86, + "learning_rate": 2.160759601950329e-05, + "loss": 0.0062, + "step": 715990 + }, + { + "epoch": 1.86, + "learning_rate": 2.1603707803131826e-05, + "loss": 0.0059, + "step": 716000 + }, + { + "epoch": 1.86, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.004547602031379938, + "eval_runtime": 107.8685, + "eval_samples_per_second": 18.541, + "eval_steps_per_second": 4.635, + "step": 716000 + }, + { + "epoch": 1.86, + "learning_rate": 2.159981958676036e-05, + "loss": 0.0093, + "step": 716010 + }, + { + "epoch": 1.86, + "learning_rate": 2.1595931370388896e-05, + "loss": 0.0072, + "step": 716020 + }, + { + "epoch": 1.86, + "learning_rate": 2.1592043154017434e-05, + "loss": 0.0079, + "step": 716030 + }, + { + "epoch": 1.86, + "learning_rate": 2.158815493764597e-05, + "loss": 0.0082, + "step": 716040 + }, + { + "epoch": 1.86, + "learning_rate": 2.1584266721274504e-05, + "loss": 0.005, + "step": 716050 + }, + { + "epoch": 1.86, + "learning_rate": 2.158037850490304e-05, + "loss": 0.0095, + "step": 716060 + }, + { + "epoch": 1.86, + "learning_rate": 2.1576490288531577e-05, + "loss": 0.0095, + "step": 716070 + }, + { + "epoch": 1.86, + "learning_rate": 2.1572602072160112e-05, + "loss": 0.0059, + "step": 716080 + }, + { + "epoch": 1.86, + "learning_rate": 2.1568713855788647e-05, + "loss": 0.0072, + "step": 716090 + }, + { + "epoch": 1.86, + "learning_rate": 2.1564825639417178e-05, + "loss": 0.005, + "step": 716100 + }, + { + "epoch": 1.86, + "learning_rate": 2.1560937423045713e-05, + "loss": 0.0065, + "step": 716110 + }, + { + "epoch": 1.86, + "learning_rate": 2.155704920667425e-05, + "loss": 0.0053, + "step": 716120 + }, + { + "epoch": 1.86, + "learning_rate": 2.1553160990302786e-05, + "loss": 0.0053, + "step": 716130 + }, + { + "epoch": 1.86, + "learning_rate": 2.154927277393132e-05, + "loss": 0.0058, + "step": 716140 + }, + { + "epoch": 1.86, + "learning_rate": 2.1545384557559856e-05, + "loss": 0.0073, + "step": 716150 + }, + { + "epoch": 1.86, + "learning_rate": 2.1541496341188394e-05, + "loss": 0.0083, + "step": 716160 + }, + { + "epoch": 1.86, + "learning_rate": 2.153760812481693e-05, + "loss": 0.0083, + "step": 716170 + }, + { + "epoch": 1.86, + "learning_rate": 2.1533719908445464e-05, + "loss": 0.0073, + "step": 716180 + }, + { + "epoch": 1.86, + "learning_rate": 2.1529831692074e-05, + "loss": 0.0075, + "step": 716190 + }, + { + "epoch": 1.86, + "learning_rate": 2.1525943475702537e-05, + "loss": 0.0075, + "step": 716200 + }, + { + "epoch": 1.86, + "learning_rate": 2.1522055259331072e-05, + "loss": 0.0093, + "step": 716210 + }, + { + "epoch": 1.86, + "learning_rate": 2.1518167042959607e-05, + "loss": 0.0082, + "step": 716220 + }, + { + "epoch": 1.86, + "learning_rate": 2.1514278826588138e-05, + "loss": 0.0062, + "step": 716230 + }, + { + "epoch": 1.86, + "learning_rate": 2.1510390610216673e-05, + "loss": 0.0059, + "step": 716240 + }, + { + "epoch": 1.86, + "learning_rate": 2.150650239384521e-05, + "loss": 0.0095, + "step": 716250 + }, + { + "epoch": 1.86, + "learning_rate": 2.1502614177473746e-05, + "loss": 0.007, + "step": 716260 + }, + { + "epoch": 1.86, + "learning_rate": 2.149872596110228e-05, + "loss": 0.0065, + "step": 716270 + }, + { + "epoch": 1.86, + "learning_rate": 2.1494837744730816e-05, + "loss": 0.0062, + "step": 716280 + }, + { + "epoch": 1.86, + "learning_rate": 2.149094952835935e-05, + "loss": 0.0064, + "step": 716290 + }, + { + "epoch": 1.86, + "learning_rate": 2.148706131198789e-05, + "loss": 0.0066, + "step": 716300 + }, + { + "epoch": 1.86, + "learning_rate": 2.1483173095616424e-05, + "loss": 0.0063, + "step": 716310 + }, + { + "epoch": 1.86, + "learning_rate": 2.147928487924496e-05, + "loss": 0.008, + "step": 716320 + }, + { + "epoch": 1.86, + "learning_rate": 2.1475396662873494e-05, + "loss": 0.0073, + "step": 716330 + }, + { + "epoch": 1.86, + "learning_rate": 2.1471508446502032e-05, + "loss": 0.0069, + "step": 716340 + }, + { + "epoch": 1.86, + "learning_rate": 2.1467620230130563e-05, + "loss": 0.0059, + "step": 716350 + }, + { + "epoch": 1.86, + "learning_rate": 2.1463732013759098e-05, + "loss": 0.0044, + "step": 716360 + }, + { + "epoch": 1.86, + "learning_rate": 2.1459843797387633e-05, + "loss": 0.0086, + "step": 716370 + }, + { + "epoch": 1.86, + "learning_rate": 2.1455955581016168e-05, + "loss": 0.0067, + "step": 716380 + }, + { + "epoch": 1.86, + "learning_rate": 2.1452067364644706e-05, + "loss": 0.0074, + "step": 716390 + }, + { + "epoch": 1.86, + "learning_rate": 2.144817914827324e-05, + "loss": 0.0066, + "step": 716400 + }, + { + "epoch": 1.86, + "learning_rate": 2.1444290931901776e-05, + "loss": 0.0087, + "step": 716410 + }, + { + "epoch": 1.86, + "learning_rate": 2.144040271553031e-05, + "loss": 0.0046, + "step": 716420 + }, + { + "epoch": 1.86, + "learning_rate": 2.143651449915885e-05, + "loss": 0.0071, + "step": 716430 + }, + { + "epoch": 1.86, + "learning_rate": 2.1432626282787384e-05, + "loss": 0.0101, + "step": 716440 + }, + { + "epoch": 1.86, + "learning_rate": 2.142873806641592e-05, + "loss": 0.0059, + "step": 716450 + }, + { + "epoch": 1.86, + "learning_rate": 2.1424849850044454e-05, + "loss": 0.0072, + "step": 716460 + }, + { + "epoch": 1.86, + "learning_rate": 2.1420961633672985e-05, + "loss": 0.0045, + "step": 716470 + }, + { + "epoch": 1.86, + "learning_rate": 2.1417073417301523e-05, + "loss": 0.0082, + "step": 716480 + }, + { + "epoch": 1.86, + "learning_rate": 2.1413185200930058e-05, + "loss": 0.0056, + "step": 716490 + }, + { + "epoch": 1.86, + "learning_rate": 2.1409296984558593e-05, + "loss": 0.0055, + "step": 716500 + }, + { + "epoch": 1.86, + "learning_rate": 2.1405408768187128e-05, + "loss": 0.0072, + "step": 716510 + }, + { + "epoch": 1.86, + "learning_rate": 2.1401520551815666e-05, + "loss": 0.0068, + "step": 716520 + }, + { + "epoch": 1.86, + "learning_rate": 2.13976323354442e-05, + "loss": 0.0067, + "step": 716530 + }, + { + "epoch": 1.86, + "learning_rate": 2.1393744119072736e-05, + "loss": 0.0091, + "step": 716540 + }, + { + "epoch": 1.86, + "learning_rate": 2.138985590270127e-05, + "loss": 0.0067, + "step": 716550 + }, + { + "epoch": 1.86, + "learning_rate": 2.138596768632981e-05, + "loss": 0.0083, + "step": 716560 + }, + { + "epoch": 1.86, + "learning_rate": 2.1382079469958344e-05, + "loss": 0.0073, + "step": 716570 + }, + { + "epoch": 1.86, + "learning_rate": 2.137819125358688e-05, + "loss": 0.0056, + "step": 716580 + }, + { + "epoch": 1.86, + "learning_rate": 2.1374303037215414e-05, + "loss": 0.0067, + "step": 716590 + }, + { + "epoch": 1.86, + "learning_rate": 2.1370414820843945e-05, + "loss": 0.0097, + "step": 716600 + }, + { + "epoch": 1.86, + "learning_rate": 2.1366526604472483e-05, + "loss": 0.0067, + "step": 716610 + }, + { + "epoch": 1.86, + "learning_rate": 2.1362638388101018e-05, + "loss": 0.0078, + "step": 716620 + }, + { + "epoch": 1.86, + "learning_rate": 2.1358750171729553e-05, + "loss": 0.0072, + "step": 716630 + }, + { + "epoch": 1.86, + "learning_rate": 2.1354861955358088e-05, + "loss": 0.0061, + "step": 716640 + }, + { + "epoch": 1.86, + "learning_rate": 2.1350973738986626e-05, + "loss": 0.0081, + "step": 716650 + }, + { + "epoch": 1.86, + "learning_rate": 2.134708552261516e-05, + "loss": 0.0059, + "step": 716660 + }, + { + "epoch": 1.86, + "learning_rate": 2.1343197306243696e-05, + "loss": 0.0069, + "step": 716670 + }, + { + "epoch": 1.86, + "learning_rate": 2.133930908987223e-05, + "loss": 0.0067, + "step": 716680 + }, + { + "epoch": 1.86, + "learning_rate": 2.133542087350077e-05, + "loss": 0.0067, + "step": 716690 + }, + { + "epoch": 1.86, + "learning_rate": 2.1331532657129304e-05, + "loss": 0.0065, + "step": 716700 + }, + { + "epoch": 1.86, + "learning_rate": 2.132764444075784e-05, + "loss": 0.0071, + "step": 716710 + }, + { + "epoch": 1.86, + "learning_rate": 2.132375622438637e-05, + "loss": 0.0074, + "step": 716720 + }, + { + "epoch": 1.86, + "learning_rate": 2.1319868008014905e-05, + "loss": 0.0068, + "step": 716730 + }, + { + "epoch": 1.86, + "learning_rate": 2.1315979791643443e-05, + "loss": 0.009, + "step": 716740 + }, + { + "epoch": 1.86, + "learning_rate": 2.1312091575271978e-05, + "loss": 0.007, + "step": 716750 + }, + { + "epoch": 1.86, + "learning_rate": 2.1308203358900513e-05, + "loss": 0.0083, + "step": 716760 + }, + { + "epoch": 1.86, + "learning_rate": 2.1304315142529048e-05, + "loss": 0.0071, + "step": 716770 + }, + { + "epoch": 1.86, + "learning_rate": 2.1300426926157586e-05, + "loss": 0.0073, + "step": 716780 + }, + { + "epoch": 1.86, + "learning_rate": 2.129653870978612e-05, + "loss": 0.0077, + "step": 716790 + }, + { + "epoch": 1.86, + "learning_rate": 2.1292650493414656e-05, + "loss": 0.0074, + "step": 716800 + }, + { + "epoch": 1.86, + "learning_rate": 2.128876227704319e-05, + "loss": 0.0062, + "step": 716810 + }, + { + "epoch": 1.86, + "learning_rate": 2.128487406067173e-05, + "loss": 0.0094, + "step": 716820 + }, + { + "epoch": 1.86, + "learning_rate": 2.1280985844300264e-05, + "loss": 0.0078, + "step": 716830 + }, + { + "epoch": 1.86, + "learning_rate": 2.12770976279288e-05, + "loss": 0.0065, + "step": 716840 + }, + { + "epoch": 1.86, + "learning_rate": 2.127320941155733e-05, + "loss": 0.0078, + "step": 716850 + }, + { + "epoch": 1.86, + "learning_rate": 2.1269321195185865e-05, + "loss": 0.0084, + "step": 716860 + }, + { + "epoch": 1.86, + "learning_rate": 2.1265432978814403e-05, + "loss": 0.0066, + "step": 716870 + }, + { + "epoch": 1.86, + "learning_rate": 2.1261544762442938e-05, + "loss": 0.0077, + "step": 716880 + }, + { + "epoch": 1.86, + "learning_rate": 2.1257656546071473e-05, + "loss": 0.0087, + "step": 716890 + }, + { + "epoch": 1.86, + "learning_rate": 2.1253768329700008e-05, + "loss": 0.008, + "step": 716900 + }, + { + "epoch": 1.86, + "learning_rate": 2.1249880113328546e-05, + "loss": 0.0083, + "step": 716910 + }, + { + "epoch": 1.86, + "learning_rate": 2.124599189695708e-05, + "loss": 0.0076, + "step": 716920 + }, + { + "epoch": 1.86, + "learning_rate": 2.1242103680585616e-05, + "loss": 0.0055, + "step": 716930 + }, + { + "epoch": 1.86, + "learning_rate": 2.123821546421415e-05, + "loss": 0.0093, + "step": 716940 + }, + { + "epoch": 1.86, + "learning_rate": 2.123432724784269e-05, + "loss": 0.0062, + "step": 716950 + }, + { + "epoch": 1.86, + "learning_rate": 2.1230439031471224e-05, + "loss": 0.007, + "step": 716960 + }, + { + "epoch": 1.86, + "learning_rate": 2.1226550815099755e-05, + "loss": 0.0083, + "step": 716970 + }, + { + "epoch": 1.86, + "learning_rate": 2.122266259872829e-05, + "loss": 0.0063, + "step": 716980 + }, + { + "epoch": 1.86, + "learning_rate": 2.1218774382356825e-05, + "loss": 0.0107, + "step": 716990 + }, + { + "epoch": 1.86, + "learning_rate": 2.1214886165985363e-05, + "loss": 0.0063, + "step": 717000 + }, + { + "epoch": 1.86, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.0045911758206784725, + "eval_runtime": 107.8933, + "eval_samples_per_second": 18.537, + "eval_steps_per_second": 4.634, + "step": 717000 + }, + { + "epoch": 1.86, + "learning_rate": 2.1210997949613898e-05, + "loss": 0.0072, + "step": 717010 + }, + { + "epoch": 1.86, + "learning_rate": 2.1207109733242433e-05, + "loss": 0.0069, + "step": 717020 + }, + { + "epoch": 1.86, + "learning_rate": 2.1203221516870968e-05, + "loss": 0.0062, + "step": 717030 + }, + { + "epoch": 1.86, + "learning_rate": 2.1199333300499506e-05, + "loss": 0.0072, + "step": 717040 + }, + { + "epoch": 1.86, + "learning_rate": 2.119544508412804e-05, + "loss": 0.0079, + "step": 717050 + }, + { + "epoch": 1.86, + "learning_rate": 2.1191556867756576e-05, + "loss": 0.006, + "step": 717060 + }, + { + "epoch": 1.86, + "learning_rate": 2.118766865138511e-05, + "loss": 0.0085, + "step": 717070 + }, + { + "epoch": 1.86, + "learning_rate": 2.118378043501365e-05, + "loss": 0.0063, + "step": 717080 + }, + { + "epoch": 1.86, + "learning_rate": 2.1179892218642184e-05, + "loss": 0.0073, + "step": 717090 + }, + { + "epoch": 1.86, + "learning_rate": 2.1176004002270715e-05, + "loss": 0.0074, + "step": 717100 + }, + { + "epoch": 1.86, + "learning_rate": 2.117211578589925e-05, + "loss": 0.0064, + "step": 717110 + }, + { + "epoch": 1.86, + "learning_rate": 2.1168227569527785e-05, + "loss": 0.0049, + "step": 717120 + }, + { + "epoch": 1.86, + "learning_rate": 2.1164339353156323e-05, + "loss": 0.006, + "step": 717130 + }, + { + "epoch": 1.86, + "learning_rate": 2.1160451136784858e-05, + "loss": 0.0067, + "step": 717140 + }, + { + "epoch": 1.86, + "learning_rate": 2.1156562920413393e-05, + "loss": 0.0051, + "step": 717150 + }, + { + "epoch": 1.86, + "learning_rate": 2.1152674704041928e-05, + "loss": 0.0064, + "step": 717160 + }, + { + "epoch": 1.86, + "learning_rate": 2.1148786487670466e-05, + "loss": 0.0078, + "step": 717170 + }, + { + "epoch": 1.86, + "learning_rate": 2.1144898271299e-05, + "loss": 0.006, + "step": 717180 + }, + { + "epoch": 1.86, + "learning_rate": 2.1141010054927536e-05, + "loss": 0.007, + "step": 717190 + }, + { + "epoch": 1.86, + "learning_rate": 2.113712183855607e-05, + "loss": 0.0071, + "step": 717200 + }, + { + "epoch": 1.86, + "learning_rate": 2.113323362218461e-05, + "loss": 0.0066, + "step": 717210 + }, + { + "epoch": 1.86, + "learning_rate": 2.112934540581314e-05, + "loss": 0.0057, + "step": 717220 + }, + { + "epoch": 1.86, + "learning_rate": 2.1125457189441675e-05, + "loss": 0.0046, + "step": 717230 + }, + { + "epoch": 1.86, + "learning_rate": 2.112156897307021e-05, + "loss": 0.0059, + "step": 717240 + }, + { + "epoch": 1.86, + "learning_rate": 2.1117680756698745e-05, + "loss": 0.0093, + "step": 717250 + }, + { + "epoch": 1.86, + "learning_rate": 2.1113792540327283e-05, + "loss": 0.0078, + "step": 717260 + }, + { + "epoch": 1.86, + "learning_rate": 2.1109904323955818e-05, + "loss": 0.0058, + "step": 717270 + }, + { + "epoch": 1.86, + "learning_rate": 2.1106016107584353e-05, + "loss": 0.0089, + "step": 717280 + }, + { + "epoch": 1.86, + "learning_rate": 2.1102127891212888e-05, + "loss": 0.0092, + "step": 717290 + }, + { + "epoch": 1.86, + "learning_rate": 2.1098239674841426e-05, + "loss": 0.0048, + "step": 717300 + }, + { + "epoch": 1.86, + "learning_rate": 2.109435145846996e-05, + "loss": 0.0064, + "step": 717310 + }, + { + "epoch": 1.86, + "learning_rate": 2.1090463242098496e-05, + "loss": 0.0064, + "step": 717320 + }, + { + "epoch": 1.86, + "learning_rate": 2.108657502572703e-05, + "loss": 0.0071, + "step": 717330 + }, + { + "epoch": 1.86, + "learning_rate": 2.1082686809355562e-05, + "loss": 0.0109, + "step": 717340 + }, + { + "epoch": 1.86, + "learning_rate": 2.10787985929841e-05, + "loss": 0.0079, + "step": 717350 + }, + { + "epoch": 1.86, + "learning_rate": 2.1074910376612635e-05, + "loss": 0.0079, + "step": 717360 + }, + { + "epoch": 1.86, + "learning_rate": 2.107102216024117e-05, + "loss": 0.0059, + "step": 717370 + }, + { + "epoch": 1.86, + "learning_rate": 2.1067133943869705e-05, + "loss": 0.0071, + "step": 717380 + }, + { + "epoch": 1.86, + "learning_rate": 2.1063245727498243e-05, + "loss": 0.0067, + "step": 717390 + }, + { + "epoch": 1.86, + "learning_rate": 2.1059357511126778e-05, + "loss": 0.0062, + "step": 717400 + }, + { + "epoch": 1.86, + "learning_rate": 2.1055469294755313e-05, + "loss": 0.0056, + "step": 717410 + }, + { + "epoch": 1.86, + "learning_rate": 2.1051581078383848e-05, + "loss": 0.0099, + "step": 717420 + }, + { + "epoch": 1.86, + "learning_rate": 2.1047692862012386e-05, + "loss": 0.0064, + "step": 717430 + }, + { + "epoch": 1.86, + "learning_rate": 2.104380464564092e-05, + "loss": 0.0097, + "step": 717440 + }, + { + "epoch": 1.86, + "learning_rate": 2.1039916429269456e-05, + "loss": 0.0058, + "step": 717450 + }, + { + "epoch": 1.86, + "learning_rate": 2.103602821289799e-05, + "loss": 0.007, + "step": 717460 + }, + { + "epoch": 1.86, + "learning_rate": 2.1032139996526522e-05, + "loss": 0.0067, + "step": 717470 + }, + { + "epoch": 1.86, + "learning_rate": 2.102825178015506e-05, + "loss": 0.0071, + "step": 717480 + }, + { + "epoch": 1.86, + "learning_rate": 2.1024363563783595e-05, + "loss": 0.008, + "step": 717490 + }, + { + "epoch": 1.86, + "learning_rate": 2.102047534741213e-05, + "loss": 0.0069, + "step": 717500 + }, + { + "epoch": 1.86, + "learning_rate": 2.1016587131040665e-05, + "loss": 0.0106, + "step": 717510 + }, + { + "epoch": 1.86, + "learning_rate": 2.1012698914669203e-05, + "loss": 0.005, + "step": 717520 + }, + { + "epoch": 1.86, + "learning_rate": 2.1008810698297738e-05, + "loss": 0.0058, + "step": 717530 + }, + { + "epoch": 1.86, + "learning_rate": 2.1004922481926273e-05, + "loss": 0.0074, + "step": 717540 + }, + { + "epoch": 1.86, + "learning_rate": 2.1001034265554808e-05, + "loss": 0.0069, + "step": 717550 + }, + { + "epoch": 1.86, + "learning_rate": 2.0997146049183346e-05, + "loss": 0.0057, + "step": 717560 + }, + { + "epoch": 1.86, + "learning_rate": 2.099325783281188e-05, + "loss": 0.008, + "step": 717570 + }, + { + "epoch": 1.86, + "learning_rate": 2.0989369616440416e-05, + "loss": 0.0057, + "step": 717580 + }, + { + "epoch": 1.86, + "learning_rate": 2.0985481400068947e-05, + "loss": 0.0063, + "step": 717590 + }, + { + "epoch": 1.86, + "learning_rate": 2.0981593183697482e-05, + "loss": 0.0073, + "step": 717600 + }, + { + "epoch": 1.86, + "learning_rate": 2.097770496732602e-05, + "loss": 0.0073, + "step": 717610 + }, + { + "epoch": 1.86, + "learning_rate": 2.0973816750954555e-05, + "loss": 0.006, + "step": 717620 + }, + { + "epoch": 1.86, + "learning_rate": 2.096992853458309e-05, + "loss": 0.0072, + "step": 717630 + }, + { + "epoch": 1.86, + "learning_rate": 2.0966040318211625e-05, + "loss": 0.0074, + "step": 717640 + }, + { + "epoch": 1.86, + "learning_rate": 2.0962152101840163e-05, + "loss": 0.0085, + "step": 717650 + }, + { + "epoch": 1.86, + "learning_rate": 2.0958263885468698e-05, + "loss": 0.0101, + "step": 717660 + }, + { + "epoch": 1.86, + "learning_rate": 2.0954375669097233e-05, + "loss": 0.007, + "step": 717670 + }, + { + "epoch": 1.86, + "learning_rate": 2.0950487452725768e-05, + "loss": 0.0092, + "step": 717680 + }, + { + "epoch": 1.86, + "learning_rate": 2.0946599236354303e-05, + "loss": 0.0108, + "step": 717690 + }, + { + "epoch": 1.86, + "learning_rate": 2.094271101998284e-05, + "loss": 0.0076, + "step": 717700 + }, + { + "epoch": 1.86, + "learning_rate": 2.0938822803611376e-05, + "loss": 0.0079, + "step": 717710 + }, + { + "epoch": 1.86, + "learning_rate": 2.0934934587239907e-05, + "loss": 0.0097, + "step": 717720 + }, + { + "epoch": 1.86, + "learning_rate": 2.0931046370868442e-05, + "loss": 0.0057, + "step": 717730 + }, + { + "epoch": 1.86, + "learning_rate": 2.0927158154496977e-05, + "loss": 0.0058, + "step": 717740 + }, + { + "epoch": 1.86, + "learning_rate": 2.0923269938125515e-05, + "loss": 0.0072, + "step": 717750 + }, + { + "epoch": 1.86, + "learning_rate": 2.091938172175405e-05, + "loss": 0.0069, + "step": 717760 + }, + { + "epoch": 1.86, + "learning_rate": 2.0915493505382585e-05, + "loss": 0.0074, + "step": 717770 + }, + { + "epoch": 1.86, + "learning_rate": 2.091160528901112e-05, + "loss": 0.006, + "step": 717780 + }, + { + "epoch": 1.86, + "learning_rate": 2.0907717072639658e-05, + "loss": 0.0073, + "step": 717790 + }, + { + "epoch": 1.86, + "learning_rate": 2.0903828856268193e-05, + "loss": 0.0054, + "step": 717800 + }, + { + "epoch": 1.86, + "learning_rate": 2.0899940639896728e-05, + "loss": 0.0063, + "step": 717810 + }, + { + "epoch": 1.86, + "learning_rate": 2.0896052423525263e-05, + "loss": 0.0086, + "step": 717820 + }, + { + "epoch": 1.86, + "learning_rate": 2.08921642071538e-05, + "loss": 0.007, + "step": 717830 + }, + { + "epoch": 1.86, + "learning_rate": 2.0888275990782332e-05, + "loss": 0.0084, + "step": 717840 + }, + { + "epoch": 1.86, + "learning_rate": 2.0884387774410867e-05, + "loss": 0.0078, + "step": 717850 + }, + { + "epoch": 1.86, + "learning_rate": 2.0880499558039402e-05, + "loss": 0.0087, + "step": 717860 + }, + { + "epoch": 1.86, + "learning_rate": 2.0876611341667937e-05, + "loss": 0.0081, + "step": 717870 + }, + { + "epoch": 1.86, + "learning_rate": 2.0872723125296475e-05, + "loss": 0.0101, + "step": 717880 + }, + { + "epoch": 1.86, + "learning_rate": 2.086883490892501e-05, + "loss": 0.0062, + "step": 717890 + }, + { + "epoch": 1.86, + "learning_rate": 2.0864946692553545e-05, + "loss": 0.007, + "step": 717900 + }, + { + "epoch": 1.86, + "learning_rate": 2.086105847618208e-05, + "loss": 0.0082, + "step": 717910 + }, + { + "epoch": 1.86, + "learning_rate": 2.0857170259810618e-05, + "loss": 0.0112, + "step": 717920 + }, + { + "epoch": 1.86, + "learning_rate": 2.0853282043439153e-05, + "loss": 0.0083, + "step": 717930 + }, + { + "epoch": 1.86, + "learning_rate": 2.0849393827067688e-05, + "loss": 0.0082, + "step": 717940 + }, + { + "epoch": 1.86, + "learning_rate": 2.0845505610696223e-05, + "loss": 0.0065, + "step": 717950 + }, + { + "epoch": 1.86, + "learning_rate": 2.0841617394324754e-05, + "loss": 0.0056, + "step": 717960 + }, + { + "epoch": 1.86, + "learning_rate": 2.0837729177953292e-05, + "loss": 0.0065, + "step": 717970 + }, + { + "epoch": 1.86, + "learning_rate": 2.0833840961581827e-05, + "loss": 0.0091, + "step": 717980 + }, + { + "epoch": 1.86, + "learning_rate": 2.0829952745210362e-05, + "loss": 0.0111, + "step": 717990 + }, + { + "epoch": 1.86, + "learning_rate": 2.0826064528838897e-05, + "loss": 0.0059, + "step": 718000 + }, + { + "epoch": 1.86, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.004619268234819174, + "eval_runtime": 107.8627, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.636, + "step": 718000 + }, + { + "epoch": 1.86, + "learning_rate": 2.0822176312467435e-05, + "loss": 0.0051, + "step": 718010 + }, + { + "epoch": 1.86, + "learning_rate": 2.081828809609597e-05, + "loss": 0.0088, + "step": 718020 + }, + { + "epoch": 1.86, + "learning_rate": 2.0814399879724505e-05, + "loss": 0.0103, + "step": 718030 + }, + { + "epoch": 1.86, + "learning_rate": 2.081051166335304e-05, + "loss": 0.0098, + "step": 718040 + }, + { + "epoch": 1.86, + "learning_rate": 2.0806623446981578e-05, + "loss": 0.0098, + "step": 718050 + }, + { + "epoch": 1.86, + "learning_rate": 2.0802735230610113e-05, + "loss": 0.0066, + "step": 718060 + }, + { + "epoch": 1.86, + "learning_rate": 2.0798847014238648e-05, + "loss": 0.0089, + "step": 718070 + }, + { + "epoch": 1.86, + "learning_rate": 2.0794958797867182e-05, + "loss": 0.0056, + "step": 718080 + }, + { + "epoch": 1.86, + "learning_rate": 2.0791070581495714e-05, + "loss": 0.0061, + "step": 718090 + }, + { + "epoch": 1.86, + "learning_rate": 2.0787182365124252e-05, + "loss": 0.0085, + "step": 718100 + }, + { + "epoch": 1.86, + "learning_rate": 2.0783294148752787e-05, + "loss": 0.0066, + "step": 718110 + }, + { + "epoch": 1.86, + "learning_rate": 2.0779405932381322e-05, + "loss": 0.0062, + "step": 718120 + }, + { + "epoch": 1.86, + "learning_rate": 2.0775517716009857e-05, + "loss": 0.0082, + "step": 718130 + }, + { + "epoch": 1.86, + "learning_rate": 2.0771629499638395e-05, + "loss": 0.0075, + "step": 718140 + }, + { + "epoch": 1.86, + "learning_rate": 2.076774128326693e-05, + "loss": 0.0071, + "step": 718150 + }, + { + "epoch": 1.86, + "learning_rate": 2.0763853066895465e-05, + "loss": 0.0114, + "step": 718160 + }, + { + "epoch": 1.86, + "learning_rate": 2.0759964850524e-05, + "loss": 0.0088, + "step": 718170 + }, + { + "epoch": 1.86, + "learning_rate": 2.0756076634152538e-05, + "loss": 0.0075, + "step": 718180 + }, + { + "epoch": 1.86, + "learning_rate": 2.0752188417781073e-05, + "loss": 0.0061, + "step": 718190 + }, + { + "epoch": 1.86, + "learning_rate": 2.0748300201409608e-05, + "loss": 0.008, + "step": 718200 + }, + { + "epoch": 1.86, + "learning_rate": 2.074441198503814e-05, + "loss": 0.0079, + "step": 718210 + }, + { + "epoch": 1.86, + "learning_rate": 2.0740523768666674e-05, + "loss": 0.0065, + "step": 718220 + }, + { + "epoch": 1.86, + "learning_rate": 2.0736635552295212e-05, + "loss": 0.0076, + "step": 718230 + }, + { + "epoch": 1.86, + "learning_rate": 2.0732747335923747e-05, + "loss": 0.007, + "step": 718240 + }, + { + "epoch": 1.86, + "learning_rate": 2.0728859119552282e-05, + "loss": 0.0074, + "step": 718250 + }, + { + "epoch": 1.86, + "learning_rate": 2.0724970903180817e-05, + "loss": 0.009, + "step": 718260 + }, + { + "epoch": 1.86, + "learning_rate": 2.0721082686809355e-05, + "loss": 0.007, + "step": 718270 + }, + { + "epoch": 1.86, + "learning_rate": 2.071719447043789e-05, + "loss": 0.0082, + "step": 718280 + }, + { + "epoch": 1.86, + "learning_rate": 2.0713306254066425e-05, + "loss": 0.0071, + "step": 718290 + }, + { + "epoch": 1.86, + "learning_rate": 2.070941803769496e-05, + "loss": 0.0053, + "step": 718300 + }, + { + "epoch": 1.86, + "learning_rate": 2.0705529821323498e-05, + "loss": 0.0064, + "step": 718310 + }, + { + "epoch": 1.86, + "learning_rate": 2.0701641604952033e-05, + "loss": 0.006, + "step": 718320 + }, + { + "epoch": 1.86, + "learning_rate": 2.0697753388580568e-05, + "loss": 0.0076, + "step": 718330 + }, + { + "epoch": 1.86, + "learning_rate": 2.06938651722091e-05, + "loss": 0.0085, + "step": 718340 + }, + { + "epoch": 1.86, + "learning_rate": 2.0689976955837634e-05, + "loss": 0.011, + "step": 718350 + }, + { + "epoch": 1.86, + "learning_rate": 2.0686088739466172e-05, + "loss": 0.0079, + "step": 718360 + }, + { + "epoch": 1.86, + "learning_rate": 2.0682200523094707e-05, + "loss": 0.0076, + "step": 718370 + }, + { + "epoch": 1.86, + "learning_rate": 2.0678312306723242e-05, + "loss": 0.0066, + "step": 718380 + }, + { + "epoch": 1.86, + "learning_rate": 2.0674424090351777e-05, + "loss": 0.0111, + "step": 718390 + }, + { + "epoch": 1.86, + "learning_rate": 2.0670535873980315e-05, + "loss": 0.0065, + "step": 718400 + }, + { + "epoch": 1.86, + "learning_rate": 2.066664765760885e-05, + "loss": 0.0098, + "step": 718410 + }, + { + "epoch": 1.86, + "learning_rate": 2.0662759441237385e-05, + "loss": 0.0095, + "step": 718420 + }, + { + "epoch": 1.86, + "learning_rate": 2.065887122486592e-05, + "loss": 0.0054, + "step": 718430 + }, + { + "epoch": 1.86, + "learning_rate": 2.0654983008494458e-05, + "loss": 0.0083, + "step": 718440 + }, + { + "epoch": 1.86, + "learning_rate": 2.0651094792122993e-05, + "loss": 0.0069, + "step": 718450 + }, + { + "epoch": 1.86, + "learning_rate": 2.0647206575751524e-05, + "loss": 0.0087, + "step": 718460 + }, + { + "epoch": 1.86, + "learning_rate": 2.064331835938006e-05, + "loss": 0.0081, + "step": 718470 + }, + { + "epoch": 1.86, + "learning_rate": 2.0639430143008594e-05, + "loss": 0.0055, + "step": 718480 + }, + { + "epoch": 1.86, + "learning_rate": 2.0635541926637132e-05, + "loss": 0.0094, + "step": 718490 + }, + { + "epoch": 1.86, + "learning_rate": 2.0631653710265667e-05, + "loss": 0.0062, + "step": 718500 + }, + { + "epoch": 1.86, + "learning_rate": 2.0627765493894202e-05, + "loss": 0.0091, + "step": 718510 + }, + { + "epoch": 1.86, + "learning_rate": 2.0623877277522737e-05, + "loss": 0.0067, + "step": 718520 + }, + { + "epoch": 1.86, + "learning_rate": 2.0619989061151275e-05, + "loss": 0.0096, + "step": 718530 + }, + { + "epoch": 1.86, + "learning_rate": 2.061610084477981e-05, + "loss": 0.0067, + "step": 718540 + }, + { + "epoch": 1.86, + "learning_rate": 2.0612212628408345e-05, + "loss": 0.0061, + "step": 718550 + }, + { + "epoch": 1.86, + "learning_rate": 2.060832441203688e-05, + "loss": 0.0072, + "step": 718560 + }, + { + "epoch": 1.86, + "learning_rate": 2.0604436195665418e-05, + "loss": 0.0083, + "step": 718570 + }, + { + "epoch": 1.86, + "learning_rate": 2.060054797929395e-05, + "loss": 0.0093, + "step": 718580 + }, + { + "epoch": 1.86, + "learning_rate": 2.0596659762922484e-05, + "loss": 0.006, + "step": 718590 + }, + { + "epoch": 1.86, + "learning_rate": 2.059277154655102e-05, + "loss": 0.0073, + "step": 718600 + }, + { + "epoch": 1.86, + "learning_rate": 2.0588883330179554e-05, + "loss": 0.0081, + "step": 718610 + }, + { + "epoch": 1.86, + "learning_rate": 2.0584995113808092e-05, + "loss": 0.0099, + "step": 718620 + }, + { + "epoch": 1.86, + "learning_rate": 2.0581106897436627e-05, + "loss": 0.0057, + "step": 718630 + }, + { + "epoch": 1.86, + "learning_rate": 2.0577218681065162e-05, + "loss": 0.0062, + "step": 718640 + }, + { + "epoch": 1.86, + "learning_rate": 2.0573330464693697e-05, + "loss": 0.0065, + "step": 718650 + }, + { + "epoch": 1.86, + "learning_rate": 2.0569442248322235e-05, + "loss": 0.0101, + "step": 718660 + }, + { + "epoch": 1.86, + "learning_rate": 2.056555403195077e-05, + "loss": 0.0117, + "step": 718670 + }, + { + "epoch": 1.86, + "learning_rate": 2.0561665815579305e-05, + "loss": 0.0071, + "step": 718680 + }, + { + "epoch": 1.86, + "learning_rate": 2.055777759920784e-05, + "loss": 0.0059, + "step": 718690 + }, + { + "epoch": 1.86, + "learning_rate": 2.0553889382836378e-05, + "loss": 0.0087, + "step": 718700 + }, + { + "epoch": 1.86, + "learning_rate": 2.055000116646491e-05, + "loss": 0.0068, + "step": 718710 + }, + { + "epoch": 1.86, + "learning_rate": 2.0546112950093444e-05, + "loss": 0.0053, + "step": 718720 + }, + { + "epoch": 1.86, + "learning_rate": 2.054222473372198e-05, + "loss": 0.0059, + "step": 718730 + }, + { + "epoch": 1.86, + "learning_rate": 2.0538336517350514e-05, + "loss": 0.007, + "step": 718740 + }, + { + "epoch": 1.86, + "learning_rate": 2.0534448300979052e-05, + "loss": 0.0065, + "step": 718750 + }, + { + "epoch": 1.86, + "learning_rate": 2.0530560084607587e-05, + "loss": 0.0083, + "step": 718760 + }, + { + "epoch": 1.86, + "learning_rate": 2.0526671868236122e-05, + "loss": 0.0073, + "step": 718770 + }, + { + "epoch": 1.86, + "learning_rate": 2.0522783651864657e-05, + "loss": 0.0077, + "step": 718780 + }, + { + "epoch": 1.86, + "learning_rate": 2.0518895435493195e-05, + "loss": 0.0065, + "step": 718790 + }, + { + "epoch": 1.86, + "learning_rate": 2.051500721912173e-05, + "loss": 0.0079, + "step": 718800 + }, + { + "epoch": 1.86, + "learning_rate": 2.0511119002750265e-05, + "loss": 0.0058, + "step": 718810 + }, + { + "epoch": 1.86, + "learning_rate": 2.05072307863788e-05, + "loss": 0.0063, + "step": 718820 + }, + { + "epoch": 1.86, + "learning_rate": 2.050334257000733e-05, + "loss": 0.0065, + "step": 718830 + }, + { + "epoch": 1.86, + "learning_rate": 2.049945435363587e-05, + "loss": 0.0094, + "step": 718840 + }, + { + "epoch": 1.86, + "learning_rate": 2.0495566137264404e-05, + "loss": 0.0084, + "step": 718850 + }, + { + "epoch": 1.86, + "learning_rate": 2.049167792089294e-05, + "loss": 0.0048, + "step": 718860 + }, + { + "epoch": 1.86, + "learning_rate": 2.0487789704521474e-05, + "loss": 0.0095, + "step": 718870 + }, + { + "epoch": 1.86, + "learning_rate": 2.0483901488150012e-05, + "loss": 0.0041, + "step": 718880 + }, + { + "epoch": 1.86, + "learning_rate": 2.0480013271778547e-05, + "loss": 0.0089, + "step": 718890 + }, + { + "epoch": 1.86, + "learning_rate": 2.0476125055407082e-05, + "loss": 0.0054, + "step": 718900 + }, + { + "epoch": 1.86, + "learning_rate": 2.0472236839035617e-05, + "loss": 0.0106, + "step": 718910 + }, + { + "epoch": 1.86, + "learning_rate": 2.0468348622664155e-05, + "loss": 0.0066, + "step": 718920 + }, + { + "epoch": 1.86, + "learning_rate": 2.046446040629269e-05, + "loss": 0.0074, + "step": 718930 + }, + { + "epoch": 1.86, + "learning_rate": 2.0460572189921225e-05, + "loss": 0.0052, + "step": 718940 + }, + { + "epoch": 1.86, + "learning_rate": 2.045668397354976e-05, + "loss": 0.0102, + "step": 718950 + }, + { + "epoch": 1.86, + "learning_rate": 2.045279575717829e-05, + "loss": 0.0089, + "step": 718960 + }, + { + "epoch": 1.86, + "learning_rate": 2.044890754080683e-05, + "loss": 0.0106, + "step": 718970 + }, + { + "epoch": 1.86, + "learning_rate": 2.0445019324435364e-05, + "loss": 0.0105, + "step": 718980 + }, + { + "epoch": 1.86, + "learning_rate": 2.04411311080639e-05, + "loss": 0.005, + "step": 718990 + }, + { + "epoch": 1.86, + "learning_rate": 2.0437242891692434e-05, + "loss": 0.0064, + "step": 719000 + }, + { + "epoch": 1.86, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.004639680031687021, + "eval_runtime": 107.9354, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.632, + "step": 719000 + }, + { + "epoch": 1.86, + "learning_rate": 2.0433354675320972e-05, + "loss": 0.0082, + "step": 719010 + }, + { + "epoch": 1.86, + "learning_rate": 2.0429466458949507e-05, + "loss": 0.0072, + "step": 719020 + }, + { + "epoch": 1.86, + "learning_rate": 2.0425578242578042e-05, + "loss": 0.0074, + "step": 719030 + }, + { + "epoch": 1.86, + "learning_rate": 2.0421690026206577e-05, + "loss": 0.0079, + "step": 719040 + }, + { + "epoch": 1.86, + "learning_rate": 2.041780180983511e-05, + "loss": 0.0097, + "step": 719050 + }, + { + "epoch": 1.86, + "learning_rate": 2.041391359346365e-05, + "loss": 0.0061, + "step": 719060 + }, + { + "epoch": 1.86, + "learning_rate": 2.0410025377092185e-05, + "loss": 0.0081, + "step": 719070 + }, + { + "epoch": 1.86, + "learning_rate": 2.0406137160720716e-05, + "loss": 0.0053, + "step": 719080 + }, + { + "epoch": 1.86, + "learning_rate": 2.040224894434925e-05, + "loss": 0.0064, + "step": 719090 + }, + { + "epoch": 1.86, + "learning_rate": 2.0398360727977786e-05, + "loss": 0.0054, + "step": 719100 + }, + { + "epoch": 1.86, + "learning_rate": 2.0394472511606324e-05, + "loss": 0.0064, + "step": 719110 + }, + { + "epoch": 1.86, + "learning_rate": 2.039058429523486e-05, + "loss": 0.0085, + "step": 719120 + }, + { + "epoch": 1.86, + "learning_rate": 2.0386696078863394e-05, + "loss": 0.0065, + "step": 719130 + }, + { + "epoch": 1.86, + "learning_rate": 2.038280786249193e-05, + "loss": 0.0088, + "step": 719140 + }, + { + "epoch": 1.86, + "learning_rate": 2.0378919646120467e-05, + "loss": 0.0072, + "step": 719150 + }, + { + "epoch": 1.86, + "learning_rate": 2.0375031429749002e-05, + "loss": 0.0102, + "step": 719160 + }, + { + "epoch": 1.86, + "learning_rate": 2.0371143213377537e-05, + "loss": 0.0078, + "step": 719170 + }, + { + "epoch": 1.86, + "learning_rate": 2.036725499700607e-05, + "loss": 0.0067, + "step": 719180 + }, + { + "epoch": 1.86, + "learning_rate": 2.036336678063461e-05, + "loss": 0.0082, + "step": 719190 + }, + { + "epoch": 1.86, + "learning_rate": 2.035947856426314e-05, + "loss": 0.0064, + "step": 719200 + }, + { + "epoch": 1.86, + "learning_rate": 2.0355590347891676e-05, + "loss": 0.0081, + "step": 719210 + }, + { + "epoch": 1.86, + "learning_rate": 2.035170213152021e-05, + "loss": 0.0051, + "step": 719220 + }, + { + "epoch": 1.86, + "learning_rate": 2.0347813915148746e-05, + "loss": 0.0073, + "step": 719230 + }, + { + "epoch": 1.86, + "learning_rate": 2.0343925698777284e-05, + "loss": 0.0054, + "step": 719240 + }, + { + "epoch": 1.86, + "learning_rate": 2.034003748240582e-05, + "loss": 0.0083, + "step": 719250 + }, + { + "epoch": 1.86, + "learning_rate": 2.0336149266034354e-05, + "loss": 0.0082, + "step": 719260 + }, + { + "epoch": 1.86, + "learning_rate": 2.033226104966289e-05, + "loss": 0.0072, + "step": 719270 + }, + { + "epoch": 1.86, + "learning_rate": 2.0328372833291427e-05, + "loss": 0.0074, + "step": 719280 + }, + { + "epoch": 1.86, + "learning_rate": 2.0324484616919962e-05, + "loss": 0.0044, + "step": 719290 + }, + { + "epoch": 1.86, + "learning_rate": 2.0320596400548497e-05, + "loss": 0.0086, + "step": 719300 + }, + { + "epoch": 1.86, + "learning_rate": 2.031670818417703e-05, + "loss": 0.0092, + "step": 719310 + }, + { + "epoch": 1.86, + "learning_rate": 2.031281996780557e-05, + "loss": 0.0109, + "step": 719320 + }, + { + "epoch": 1.86, + "learning_rate": 2.03089317514341e-05, + "loss": 0.0071, + "step": 719330 + }, + { + "epoch": 1.86, + "learning_rate": 2.0305043535062636e-05, + "loss": 0.0076, + "step": 719340 + }, + { + "epoch": 1.86, + "learning_rate": 2.030115531869117e-05, + "loss": 0.0078, + "step": 719350 + }, + { + "epoch": 1.86, + "learning_rate": 2.0297267102319706e-05, + "loss": 0.0081, + "step": 719360 + }, + { + "epoch": 1.86, + "learning_rate": 2.0293378885948244e-05, + "loss": 0.0087, + "step": 719370 + }, + { + "epoch": 1.86, + "learning_rate": 2.028949066957678e-05, + "loss": 0.0076, + "step": 719380 + }, + { + "epoch": 1.86, + "learning_rate": 2.0285602453205314e-05, + "loss": 0.0101, + "step": 719390 + }, + { + "epoch": 1.86, + "learning_rate": 2.028171423683385e-05, + "loss": 0.0074, + "step": 719400 + }, + { + "epoch": 1.86, + "learning_rate": 2.0277826020462387e-05, + "loss": 0.0082, + "step": 719410 + }, + { + "epoch": 1.86, + "learning_rate": 2.027393780409092e-05, + "loss": 0.0074, + "step": 719420 + }, + { + "epoch": 1.86, + "learning_rate": 2.0270049587719457e-05, + "loss": 0.0077, + "step": 719430 + }, + { + "epoch": 1.86, + "learning_rate": 2.026616137134799e-05, + "loss": 0.0128, + "step": 719440 + }, + { + "epoch": 1.86, + "learning_rate": 2.0262273154976523e-05, + "loss": 0.007, + "step": 719450 + }, + { + "epoch": 1.86, + "learning_rate": 2.025838493860506e-05, + "loss": 0.0095, + "step": 719460 + }, + { + "epoch": 1.86, + "learning_rate": 2.0254496722233596e-05, + "loss": 0.0055, + "step": 719470 + }, + { + "epoch": 1.86, + "learning_rate": 2.025060850586213e-05, + "loss": 0.0106, + "step": 719480 + }, + { + "epoch": 1.87, + "learning_rate": 2.0246720289490666e-05, + "loss": 0.0099, + "step": 719490 + }, + { + "epoch": 1.87, + "learning_rate": 2.0242832073119204e-05, + "loss": 0.0081, + "step": 719500 + }, + { + "epoch": 1.87, + "learning_rate": 2.023894385674774e-05, + "loss": 0.0066, + "step": 719510 + }, + { + "epoch": 1.87, + "learning_rate": 2.0235055640376274e-05, + "loss": 0.0065, + "step": 719520 + }, + { + "epoch": 1.87, + "learning_rate": 2.023116742400481e-05, + "loss": 0.0084, + "step": 719530 + }, + { + "epoch": 1.87, + "learning_rate": 2.0227279207633347e-05, + "loss": 0.0058, + "step": 719540 + }, + { + "epoch": 1.87, + "learning_rate": 2.022339099126188e-05, + "loss": 0.0082, + "step": 719550 + }, + { + "epoch": 1.87, + "learning_rate": 2.0219502774890417e-05, + "loss": 0.0075, + "step": 719560 + }, + { + "epoch": 1.87, + "learning_rate": 2.021561455851895e-05, + "loss": 0.0071, + "step": 719570 + }, + { + "epoch": 1.87, + "learning_rate": 2.0211726342147483e-05, + "loss": 0.0052, + "step": 719580 + }, + { + "epoch": 1.87, + "learning_rate": 2.020783812577602e-05, + "loss": 0.0109, + "step": 719590 + }, + { + "epoch": 1.87, + "learning_rate": 2.0203949909404556e-05, + "loss": 0.0092, + "step": 719600 + }, + { + "epoch": 1.87, + "learning_rate": 2.020006169303309e-05, + "loss": 0.0067, + "step": 719610 + }, + { + "epoch": 1.87, + "learning_rate": 2.0196173476661626e-05, + "loss": 0.0096, + "step": 719620 + }, + { + "epoch": 1.87, + "learning_rate": 2.0192285260290164e-05, + "loss": 0.0094, + "step": 719630 + }, + { + "epoch": 1.87, + "learning_rate": 2.01883970439187e-05, + "loss": 0.0071, + "step": 719640 + }, + { + "epoch": 1.87, + "learning_rate": 2.0184508827547234e-05, + "loss": 0.0107, + "step": 719650 + }, + { + "epoch": 1.87, + "learning_rate": 2.018062061117577e-05, + "loss": 0.0072, + "step": 719660 + }, + { + "epoch": 1.87, + "learning_rate": 2.0176732394804307e-05, + "loss": 0.0073, + "step": 719670 + }, + { + "epoch": 1.87, + "learning_rate": 2.017284417843284e-05, + "loss": 0.0098, + "step": 719680 + }, + { + "epoch": 1.87, + "learning_rate": 2.0168955962061376e-05, + "loss": 0.0074, + "step": 719690 + }, + { + "epoch": 1.87, + "learning_rate": 2.0165067745689908e-05, + "loss": 0.0073, + "step": 719700 + }, + { + "epoch": 1.87, + "learning_rate": 2.0161179529318443e-05, + "loss": 0.0052, + "step": 719710 + }, + { + "epoch": 1.87, + "learning_rate": 2.015729131294698e-05, + "loss": 0.0071, + "step": 719720 + }, + { + "epoch": 1.87, + "learning_rate": 2.0153403096575516e-05, + "loss": 0.0095, + "step": 719730 + }, + { + "epoch": 1.87, + "learning_rate": 2.014951488020405e-05, + "loss": 0.0068, + "step": 719740 + }, + { + "epoch": 1.87, + "learning_rate": 2.0145626663832586e-05, + "loss": 0.005, + "step": 719750 + }, + { + "epoch": 1.87, + "learning_rate": 2.0141738447461124e-05, + "loss": 0.0058, + "step": 719760 + }, + { + "epoch": 1.87, + "learning_rate": 2.013785023108966e-05, + "loss": 0.0069, + "step": 719770 + }, + { + "epoch": 1.87, + "learning_rate": 2.0133962014718194e-05, + "loss": 0.0053, + "step": 719780 + }, + { + "epoch": 1.87, + "learning_rate": 2.013007379834673e-05, + "loss": 0.012, + "step": 719790 + }, + { + "epoch": 1.87, + "learning_rate": 2.0126185581975267e-05, + "loss": 0.0067, + "step": 719800 + }, + { + "epoch": 1.87, + "learning_rate": 2.01222973656038e-05, + "loss": 0.0084, + "step": 719810 + }, + { + "epoch": 1.87, + "learning_rate": 2.0118409149232333e-05, + "loss": 0.0079, + "step": 719820 + }, + { + "epoch": 1.87, + "learning_rate": 2.0114520932860868e-05, + "loss": 0.0071, + "step": 719830 + }, + { + "epoch": 1.87, + "learning_rate": 2.0110632716489403e-05, + "loss": 0.0078, + "step": 719840 + }, + { + "epoch": 1.87, + "learning_rate": 2.010674450011794e-05, + "loss": 0.01, + "step": 719850 + }, + { + "epoch": 1.87, + "learning_rate": 2.0102856283746476e-05, + "loss": 0.0052, + "step": 719860 + }, + { + "epoch": 1.87, + "learning_rate": 2.009896806737501e-05, + "loss": 0.0065, + "step": 719870 + }, + { + "epoch": 1.87, + "learning_rate": 2.0095079851003546e-05, + "loss": 0.0071, + "step": 719880 + }, + { + "epoch": 1.87, + "learning_rate": 2.0091191634632084e-05, + "loss": 0.0101, + "step": 719890 + }, + { + "epoch": 1.87, + "learning_rate": 2.008730341826062e-05, + "loss": 0.0063, + "step": 719900 + }, + { + "epoch": 1.87, + "learning_rate": 2.0083415201889154e-05, + "loss": 0.009, + "step": 719910 + }, + { + "epoch": 1.87, + "learning_rate": 2.007952698551769e-05, + "loss": 0.0077, + "step": 719920 + }, + { + "epoch": 1.87, + "learning_rate": 2.0075638769146227e-05, + "loss": 0.0072, + "step": 719930 + }, + { + "epoch": 1.87, + "learning_rate": 2.007175055277476e-05, + "loss": 0.0083, + "step": 719940 + }, + { + "epoch": 1.87, + "learning_rate": 2.0067862336403293e-05, + "loss": 0.0061, + "step": 719950 + }, + { + "epoch": 1.87, + "learning_rate": 2.0063974120031828e-05, + "loss": 0.008, + "step": 719960 + }, + { + "epoch": 1.87, + "learning_rate": 2.0060085903660363e-05, + "loss": 0.008, + "step": 719970 + }, + { + "epoch": 1.87, + "learning_rate": 2.00561976872889e-05, + "loss": 0.0061, + "step": 719980 + }, + { + "epoch": 1.87, + "learning_rate": 2.0052309470917436e-05, + "loss": 0.0077, + "step": 719990 + }, + { + "epoch": 1.87, + "learning_rate": 2.004842125454597e-05, + "loss": 0.0043, + "step": 720000 + }, + { + "epoch": 1.87, + "eval_cer": 0.8816858906799576, + "eval_loss": 0.004609877709299326, + "eval_runtime": 107.6819, + "eval_samples_per_second": 18.573, + "eval_steps_per_second": 4.643, + "step": 720000 + }, + { + "epoch": 1.87, + "learning_rate": 2.0044533038174506e-05, + "loss": 0.0063, + "step": 720010 + }, + { + "epoch": 1.87, + "learning_rate": 2.0040644821803044e-05, + "loss": 0.008, + "step": 720020 + }, + { + "epoch": 1.87, + "learning_rate": 2.003675660543158e-05, + "loss": 0.0078, + "step": 720030 + }, + { + "epoch": 1.87, + "learning_rate": 2.0032868389060114e-05, + "loss": 0.0081, + "step": 720040 + }, + { + "epoch": 1.87, + "learning_rate": 2.002898017268865e-05, + "loss": 0.01, + "step": 720050 + }, + { + "epoch": 1.87, + "learning_rate": 2.0025091956317187e-05, + "loss": 0.0063, + "step": 720060 + }, + { + "epoch": 1.87, + "learning_rate": 2.0021203739945718e-05, + "loss": 0.006, + "step": 720070 + }, + { + "epoch": 1.87, + "learning_rate": 2.0017315523574253e-05, + "loss": 0.0062, + "step": 720080 + }, + { + "epoch": 1.87, + "learning_rate": 2.0013427307202788e-05, + "loss": 0.0067, + "step": 720090 + }, + { + "epoch": 1.87, + "learning_rate": 2.0009539090831323e-05, + "loss": 0.0106, + "step": 720100 + }, + { + "epoch": 1.87, + "learning_rate": 2.000565087445986e-05, + "loss": 0.0111, + "step": 720110 + }, + { + "epoch": 1.87, + "learning_rate": 2.0001762658088396e-05, + "loss": 0.0089, + "step": 720120 + }, + { + "epoch": 1.87, + "learning_rate": 1.999787444171693e-05, + "loss": 0.0069, + "step": 720130 + }, + { + "epoch": 1.87, + "learning_rate": 1.9993986225345466e-05, + "loss": 0.0092, + "step": 720140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9990098008974004e-05, + "loss": 0.0071, + "step": 720150 + }, + { + "epoch": 1.87, + "learning_rate": 1.998620979260254e-05, + "loss": 0.0106, + "step": 720160 + }, + { + "epoch": 1.87, + "learning_rate": 1.9982321576231074e-05, + "loss": 0.0101, + "step": 720170 + }, + { + "epoch": 1.87, + "learning_rate": 1.997843335985961e-05, + "loss": 0.0053, + "step": 720180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9974545143488147e-05, + "loss": 0.0063, + "step": 720190 + }, + { + "epoch": 1.87, + "learning_rate": 1.9970656927116678e-05, + "loss": 0.0065, + "step": 720200 + }, + { + "epoch": 1.87, + "learning_rate": 1.9966768710745213e-05, + "loss": 0.0062, + "step": 720210 + }, + { + "epoch": 1.87, + "learning_rate": 1.9962880494373748e-05, + "loss": 0.0091, + "step": 720220 + }, + { + "epoch": 1.87, + "learning_rate": 1.9958992278002283e-05, + "loss": 0.0071, + "step": 720230 + }, + { + "epoch": 1.87, + "learning_rate": 1.995510406163082e-05, + "loss": 0.0087, + "step": 720240 + }, + { + "epoch": 1.87, + "learning_rate": 1.9951215845259356e-05, + "loss": 0.0065, + "step": 720250 + }, + { + "epoch": 1.87, + "learning_rate": 1.994732762888789e-05, + "loss": 0.0101, + "step": 720260 + }, + { + "epoch": 1.87, + "learning_rate": 1.9943439412516426e-05, + "loss": 0.0073, + "step": 720270 + }, + { + "epoch": 1.87, + "learning_rate": 1.9939551196144964e-05, + "loss": 0.006, + "step": 720280 + }, + { + "epoch": 1.87, + "learning_rate": 1.99356629797735e-05, + "loss": 0.005, + "step": 720290 + }, + { + "epoch": 1.87, + "learning_rate": 1.9931774763402034e-05, + "loss": 0.0062, + "step": 720300 + }, + { + "epoch": 1.87, + "learning_rate": 1.992788654703057e-05, + "loss": 0.0067, + "step": 720310 + }, + { + "epoch": 1.87, + "learning_rate": 1.99239983306591e-05, + "loss": 0.0087, + "step": 720320 + }, + { + "epoch": 1.87, + "learning_rate": 1.9920110114287638e-05, + "loss": 0.0078, + "step": 720330 + }, + { + "epoch": 1.87, + "learning_rate": 1.9916221897916173e-05, + "loss": 0.0062, + "step": 720340 + }, + { + "epoch": 1.87, + "learning_rate": 1.9912333681544708e-05, + "loss": 0.0055, + "step": 720350 + }, + { + "epoch": 1.87, + "learning_rate": 1.9908445465173243e-05, + "loss": 0.0079, + "step": 720360 + }, + { + "epoch": 1.87, + "learning_rate": 1.990455724880178e-05, + "loss": 0.0062, + "step": 720370 + }, + { + "epoch": 1.87, + "learning_rate": 1.9900669032430316e-05, + "loss": 0.0064, + "step": 720380 + }, + { + "epoch": 1.87, + "learning_rate": 1.989678081605885e-05, + "loss": 0.0099, + "step": 720390 + }, + { + "epoch": 1.87, + "learning_rate": 1.9892892599687386e-05, + "loss": 0.0068, + "step": 720400 + }, + { + "epoch": 1.87, + "learning_rate": 1.9889004383315924e-05, + "loss": 0.0097, + "step": 720410 + }, + { + "epoch": 1.87, + "learning_rate": 1.988511616694446e-05, + "loss": 0.0069, + "step": 720420 + }, + { + "epoch": 1.87, + "learning_rate": 1.9881227950572994e-05, + "loss": 0.0113, + "step": 720430 + }, + { + "epoch": 1.87, + "learning_rate": 1.9877339734201525e-05, + "loss": 0.0058, + "step": 720440 + }, + { + "epoch": 1.87, + "learning_rate": 1.987345151783006e-05, + "loss": 0.007, + "step": 720450 + }, + { + "epoch": 1.87, + "learning_rate": 1.9869563301458598e-05, + "loss": 0.0076, + "step": 720460 + }, + { + "epoch": 1.87, + "learning_rate": 1.9865675085087133e-05, + "loss": 0.0065, + "step": 720470 + }, + { + "epoch": 1.87, + "learning_rate": 1.9861786868715668e-05, + "loss": 0.0079, + "step": 720480 + }, + { + "epoch": 1.87, + "learning_rate": 1.9857898652344203e-05, + "loss": 0.007, + "step": 720490 + }, + { + "epoch": 1.87, + "learning_rate": 1.9854010435972738e-05, + "loss": 0.0132, + "step": 720500 + }, + { + "epoch": 1.87, + "learning_rate": 1.9850122219601276e-05, + "loss": 0.0084, + "step": 720510 + }, + { + "epoch": 1.87, + "learning_rate": 1.984623400322981e-05, + "loss": 0.0061, + "step": 720520 + }, + { + "epoch": 1.87, + "learning_rate": 1.9842345786858346e-05, + "loss": 0.0078, + "step": 720530 + }, + { + "epoch": 1.87, + "learning_rate": 1.983845757048688e-05, + "loss": 0.0065, + "step": 720540 + }, + { + "epoch": 1.87, + "learning_rate": 1.983456935411542e-05, + "loss": 0.0058, + "step": 720550 + }, + { + "epoch": 1.87, + "learning_rate": 1.9830681137743953e-05, + "loss": 0.007, + "step": 720560 + }, + { + "epoch": 1.87, + "learning_rate": 1.9826792921372485e-05, + "loss": 0.0096, + "step": 720570 + }, + { + "epoch": 1.87, + "learning_rate": 1.982290470500102e-05, + "loss": 0.0049, + "step": 720580 + }, + { + "epoch": 1.87, + "learning_rate": 1.9819016488629555e-05, + "loss": 0.0069, + "step": 720590 + }, + { + "epoch": 1.87, + "learning_rate": 1.9815128272258093e-05, + "loss": 0.0075, + "step": 720600 + }, + { + "epoch": 1.87, + "learning_rate": 1.9811240055886628e-05, + "loss": 0.0076, + "step": 720610 + }, + { + "epoch": 1.87, + "learning_rate": 1.9807351839515163e-05, + "loss": 0.0076, + "step": 720620 + }, + { + "epoch": 1.87, + "learning_rate": 1.9803463623143698e-05, + "loss": 0.0059, + "step": 720630 + }, + { + "epoch": 1.87, + "learning_rate": 1.9799575406772236e-05, + "loss": 0.0074, + "step": 720640 + }, + { + "epoch": 1.87, + "learning_rate": 1.979568719040077e-05, + "loss": 0.0086, + "step": 720650 + }, + { + "epoch": 1.87, + "learning_rate": 1.9791798974029305e-05, + "loss": 0.0068, + "step": 720660 + }, + { + "epoch": 1.87, + "learning_rate": 1.978791075765784e-05, + "loss": 0.0072, + "step": 720670 + }, + { + "epoch": 1.87, + "learning_rate": 1.978402254128638e-05, + "loss": 0.0072, + "step": 720680 + }, + { + "epoch": 1.87, + "learning_rate": 1.978013432491491e-05, + "loss": 0.0064, + "step": 720690 + }, + { + "epoch": 1.87, + "learning_rate": 1.9776246108543445e-05, + "loss": 0.0074, + "step": 720700 + }, + { + "epoch": 1.87, + "learning_rate": 1.977235789217198e-05, + "loss": 0.008, + "step": 720710 + }, + { + "epoch": 1.87, + "learning_rate": 1.9768469675800515e-05, + "loss": 0.0083, + "step": 720720 + }, + { + "epoch": 1.87, + "learning_rate": 1.9764581459429053e-05, + "loss": 0.0079, + "step": 720730 + }, + { + "epoch": 1.87, + "learning_rate": 1.9760693243057588e-05, + "loss": 0.0115, + "step": 720740 + }, + { + "epoch": 1.87, + "learning_rate": 1.9756805026686123e-05, + "loss": 0.0095, + "step": 720750 + }, + { + "epoch": 1.87, + "learning_rate": 1.9752916810314657e-05, + "loss": 0.0072, + "step": 720760 + }, + { + "epoch": 1.87, + "learning_rate": 1.9749028593943196e-05, + "loss": 0.0081, + "step": 720770 + }, + { + "epoch": 1.87, + "learning_rate": 1.974514037757173e-05, + "loss": 0.0057, + "step": 720780 + }, + { + "epoch": 1.87, + "learning_rate": 1.9741252161200265e-05, + "loss": 0.0076, + "step": 720790 + }, + { + "epoch": 1.87, + "learning_rate": 1.97373639448288e-05, + "loss": 0.0056, + "step": 720800 + }, + { + "epoch": 1.87, + "learning_rate": 1.973347572845734e-05, + "loss": 0.0057, + "step": 720810 + }, + { + "epoch": 1.87, + "learning_rate": 1.972958751208587e-05, + "loss": 0.0061, + "step": 720820 + }, + { + "epoch": 1.87, + "learning_rate": 1.9725699295714405e-05, + "loss": 0.0051, + "step": 720830 + }, + { + "epoch": 1.87, + "learning_rate": 1.972181107934294e-05, + "loss": 0.007, + "step": 720840 + }, + { + "epoch": 1.87, + "learning_rate": 1.9717922862971475e-05, + "loss": 0.0054, + "step": 720850 + }, + { + "epoch": 1.87, + "learning_rate": 1.9714034646600013e-05, + "loss": 0.0074, + "step": 720860 + }, + { + "epoch": 1.87, + "learning_rate": 1.9710146430228548e-05, + "loss": 0.0084, + "step": 720870 + }, + { + "epoch": 1.87, + "learning_rate": 1.9706258213857083e-05, + "loss": 0.0086, + "step": 720880 + }, + { + "epoch": 1.87, + "learning_rate": 1.9702369997485617e-05, + "loss": 0.0077, + "step": 720890 + }, + { + "epoch": 1.87, + "learning_rate": 1.9698481781114156e-05, + "loss": 0.0076, + "step": 720900 + }, + { + "epoch": 1.87, + "learning_rate": 1.969459356474269e-05, + "loss": 0.0074, + "step": 720910 + }, + { + "epoch": 1.87, + "learning_rate": 1.9690705348371225e-05, + "loss": 0.0072, + "step": 720920 + }, + { + "epoch": 1.87, + "learning_rate": 1.968681713199976e-05, + "loss": 0.0068, + "step": 720930 + }, + { + "epoch": 1.87, + "learning_rate": 1.9682928915628292e-05, + "loss": 0.0075, + "step": 720940 + }, + { + "epoch": 1.87, + "learning_rate": 1.967904069925683e-05, + "loss": 0.0086, + "step": 720950 + }, + { + "epoch": 1.87, + "learning_rate": 1.9675152482885365e-05, + "loss": 0.0089, + "step": 720960 + }, + { + "epoch": 1.87, + "learning_rate": 1.96712642665139e-05, + "loss": 0.0059, + "step": 720970 + }, + { + "epoch": 1.87, + "learning_rate": 1.9667376050142435e-05, + "loss": 0.007, + "step": 720980 + }, + { + "epoch": 1.87, + "learning_rate": 1.9663487833770973e-05, + "loss": 0.0065, + "step": 720990 + }, + { + "epoch": 1.87, + "learning_rate": 1.9659599617399508e-05, + "loss": 0.0056, + "step": 721000 + }, + { + "epoch": 1.87, + "eval_cer": 0.881688689953826, + "eval_loss": 0.004578019957989454, + "eval_runtime": 107.5931, + "eval_samples_per_second": 18.589, + "eval_steps_per_second": 4.647, + "step": 721000 + }, + { + "epoch": 1.87, + "learning_rate": 1.9655711401028043e-05, + "loss": 0.008, + "step": 721010 + }, + { + "epoch": 1.87, + "learning_rate": 1.9651823184656577e-05, + "loss": 0.0082, + "step": 721020 + }, + { + "epoch": 1.87, + "learning_rate": 1.9647934968285116e-05, + "loss": 0.0098, + "step": 721030 + }, + { + "epoch": 1.87, + "learning_rate": 1.964404675191365e-05, + "loss": 0.0103, + "step": 721040 + }, + { + "epoch": 1.87, + "learning_rate": 1.9640158535542185e-05, + "loss": 0.0064, + "step": 721050 + }, + { + "epoch": 1.87, + "learning_rate": 1.9636270319170717e-05, + "loss": 0.0061, + "step": 721060 + }, + { + "epoch": 1.87, + "learning_rate": 1.9632382102799252e-05, + "loss": 0.0079, + "step": 721070 + }, + { + "epoch": 1.87, + "learning_rate": 1.962849388642779e-05, + "loss": 0.0061, + "step": 721080 + }, + { + "epoch": 1.87, + "learning_rate": 1.9624605670056325e-05, + "loss": 0.0079, + "step": 721090 + }, + { + "epoch": 1.87, + "learning_rate": 1.962071745368486e-05, + "loss": 0.0054, + "step": 721100 + }, + { + "epoch": 1.87, + "learning_rate": 1.9616829237313395e-05, + "loss": 0.0077, + "step": 721110 + }, + { + "epoch": 1.87, + "learning_rate": 1.9612941020941933e-05, + "loss": 0.007, + "step": 721120 + }, + { + "epoch": 1.87, + "learning_rate": 1.9609052804570468e-05, + "loss": 0.0075, + "step": 721130 + }, + { + "epoch": 1.87, + "learning_rate": 1.9605164588199003e-05, + "loss": 0.008, + "step": 721140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9601276371827537e-05, + "loss": 0.0082, + "step": 721150 + }, + { + "epoch": 1.87, + "learning_rate": 1.9597388155456076e-05, + "loss": 0.0077, + "step": 721160 + }, + { + "epoch": 1.87, + "learning_rate": 1.959349993908461e-05, + "loss": 0.0062, + "step": 721170 + }, + { + "epoch": 1.87, + "learning_rate": 1.9589611722713145e-05, + "loss": 0.0073, + "step": 721180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9585723506341677e-05, + "loss": 0.0067, + "step": 721190 + }, + { + "epoch": 1.87, + "learning_rate": 1.9581835289970212e-05, + "loss": 0.0074, + "step": 721200 + }, + { + "epoch": 1.87, + "learning_rate": 1.957794707359875e-05, + "loss": 0.0053, + "step": 721210 + }, + { + "epoch": 1.87, + "learning_rate": 1.9574058857227285e-05, + "loss": 0.006, + "step": 721220 + }, + { + "epoch": 1.87, + "learning_rate": 1.957017064085582e-05, + "loss": 0.0089, + "step": 721230 + }, + { + "epoch": 1.87, + "learning_rate": 1.9566282424484355e-05, + "loss": 0.0084, + "step": 721240 + }, + { + "epoch": 1.87, + "learning_rate": 1.9562394208112893e-05, + "loss": 0.0109, + "step": 721250 + }, + { + "epoch": 1.87, + "learning_rate": 1.9558505991741428e-05, + "loss": 0.0072, + "step": 721260 + }, + { + "epoch": 1.87, + "learning_rate": 1.9554617775369963e-05, + "loss": 0.0075, + "step": 721270 + }, + { + "epoch": 1.87, + "learning_rate": 1.9550729558998497e-05, + "loss": 0.0076, + "step": 721280 + }, + { + "epoch": 1.87, + "learning_rate": 1.9546841342627036e-05, + "loss": 0.0065, + "step": 721290 + }, + { + "epoch": 1.87, + "learning_rate": 1.954295312625557e-05, + "loss": 0.0057, + "step": 721300 + }, + { + "epoch": 1.87, + "learning_rate": 1.9539064909884102e-05, + "loss": 0.008, + "step": 721310 + }, + { + "epoch": 1.87, + "learning_rate": 1.9535176693512637e-05, + "loss": 0.0058, + "step": 721320 + }, + { + "epoch": 1.87, + "learning_rate": 1.9531288477141172e-05, + "loss": 0.0063, + "step": 721330 + }, + { + "epoch": 1.87, + "learning_rate": 1.952740026076971e-05, + "loss": 0.0097, + "step": 721340 + }, + { + "epoch": 1.87, + "learning_rate": 1.9523512044398245e-05, + "loss": 0.0123, + "step": 721350 + }, + { + "epoch": 1.87, + "learning_rate": 1.951962382802678e-05, + "loss": 0.0094, + "step": 721360 + }, + { + "epoch": 1.87, + "learning_rate": 1.9515735611655315e-05, + "loss": 0.0084, + "step": 721370 + }, + { + "epoch": 1.87, + "learning_rate": 1.9511847395283853e-05, + "loss": 0.0064, + "step": 721380 + }, + { + "epoch": 1.87, + "learning_rate": 1.9507959178912388e-05, + "loss": 0.0068, + "step": 721390 + }, + { + "epoch": 1.87, + "learning_rate": 1.9504070962540923e-05, + "loss": 0.0065, + "step": 721400 + }, + { + "epoch": 1.87, + "learning_rate": 1.9500182746169457e-05, + "loss": 0.0065, + "step": 721410 + }, + { + "epoch": 1.87, + "learning_rate": 1.9496294529797996e-05, + "loss": 0.0087, + "step": 721420 + }, + { + "epoch": 1.87, + "learning_rate": 1.949240631342653e-05, + "loss": 0.0069, + "step": 721430 + }, + { + "epoch": 1.87, + "learning_rate": 1.9488518097055062e-05, + "loss": 0.0072, + "step": 721440 + }, + { + "epoch": 1.87, + "learning_rate": 1.9484629880683597e-05, + "loss": 0.0056, + "step": 721450 + }, + { + "epoch": 1.87, + "learning_rate": 1.948074166431213e-05, + "loss": 0.0092, + "step": 721460 + }, + { + "epoch": 1.87, + "learning_rate": 1.947685344794067e-05, + "loss": 0.0068, + "step": 721470 + }, + { + "epoch": 1.87, + "learning_rate": 1.9472965231569205e-05, + "loss": 0.0068, + "step": 721480 + }, + { + "epoch": 1.87, + "learning_rate": 1.946907701519774e-05, + "loss": 0.008, + "step": 721490 + }, + { + "epoch": 1.87, + "learning_rate": 1.9465188798826275e-05, + "loss": 0.009, + "step": 721500 + }, + { + "epoch": 1.87, + "learning_rate": 1.9461300582454813e-05, + "loss": 0.0083, + "step": 721510 + }, + { + "epoch": 1.87, + "learning_rate": 1.9457412366083348e-05, + "loss": 0.0053, + "step": 721520 + }, + { + "epoch": 1.87, + "learning_rate": 1.9453524149711882e-05, + "loss": 0.0075, + "step": 721530 + }, + { + "epoch": 1.87, + "learning_rate": 1.9449635933340417e-05, + "loss": 0.0081, + "step": 721540 + }, + { + "epoch": 1.87, + "learning_rate": 1.9445747716968956e-05, + "loss": 0.0057, + "step": 721550 + }, + { + "epoch": 1.87, + "learning_rate": 1.9441859500597487e-05, + "loss": 0.0081, + "step": 721560 + }, + { + "epoch": 1.87, + "learning_rate": 1.9437971284226022e-05, + "loss": 0.0086, + "step": 721570 + }, + { + "epoch": 1.87, + "learning_rate": 1.9434083067854557e-05, + "loss": 0.0064, + "step": 721580 + }, + { + "epoch": 1.87, + "learning_rate": 1.943019485148309e-05, + "loss": 0.0072, + "step": 721590 + }, + { + "epoch": 1.87, + "learning_rate": 1.942630663511163e-05, + "loss": 0.0061, + "step": 721600 + }, + { + "epoch": 1.87, + "learning_rate": 1.9422418418740165e-05, + "loss": 0.0078, + "step": 721610 + }, + { + "epoch": 1.87, + "learning_rate": 1.94185302023687e-05, + "loss": 0.0074, + "step": 721620 + }, + { + "epoch": 1.87, + "learning_rate": 1.9414641985997234e-05, + "loss": 0.0125, + "step": 721630 + }, + { + "epoch": 1.87, + "learning_rate": 1.9410753769625773e-05, + "loss": 0.0065, + "step": 721640 + }, + { + "epoch": 1.87, + "learning_rate": 1.9406865553254308e-05, + "loss": 0.0084, + "step": 721650 + }, + { + "epoch": 1.87, + "learning_rate": 1.9402977336882842e-05, + "loss": 0.0064, + "step": 721660 + }, + { + "epoch": 1.87, + "learning_rate": 1.9399089120511377e-05, + "loss": 0.0052, + "step": 721670 + }, + { + "epoch": 1.87, + "learning_rate": 1.9395200904139916e-05, + "loss": 0.0062, + "step": 721680 + }, + { + "epoch": 1.87, + "learning_rate": 1.9391312687768447e-05, + "loss": 0.0094, + "step": 721690 + }, + { + "epoch": 1.87, + "learning_rate": 1.9387424471396982e-05, + "loss": 0.0079, + "step": 721700 + }, + { + "epoch": 1.87, + "learning_rate": 1.9383536255025517e-05, + "loss": 0.0107, + "step": 721710 + }, + { + "epoch": 1.87, + "learning_rate": 1.937964803865405e-05, + "loss": 0.0045, + "step": 721720 + }, + { + "epoch": 1.87, + "learning_rate": 1.937575982228259e-05, + "loss": 0.0081, + "step": 721730 + }, + { + "epoch": 1.87, + "learning_rate": 1.9371871605911125e-05, + "loss": 0.007, + "step": 721740 + }, + { + "epoch": 1.87, + "learning_rate": 1.936798338953966e-05, + "loss": 0.0085, + "step": 721750 + }, + { + "epoch": 1.87, + "learning_rate": 1.9364095173168194e-05, + "loss": 0.0079, + "step": 721760 + }, + { + "epoch": 1.87, + "learning_rate": 1.9360206956796733e-05, + "loss": 0.0099, + "step": 721770 + }, + { + "epoch": 1.87, + "learning_rate": 1.9356318740425268e-05, + "loss": 0.0076, + "step": 721780 + }, + { + "epoch": 1.87, + "learning_rate": 1.9352430524053802e-05, + "loss": 0.0052, + "step": 721790 + }, + { + "epoch": 1.87, + "learning_rate": 1.9348542307682337e-05, + "loss": 0.0065, + "step": 721800 + }, + { + "epoch": 1.87, + "learning_rate": 1.934465409131087e-05, + "loss": 0.0089, + "step": 721810 + }, + { + "epoch": 1.87, + "learning_rate": 1.9340765874939407e-05, + "loss": 0.0068, + "step": 721820 + }, + { + "epoch": 1.87, + "learning_rate": 1.9336877658567942e-05, + "loss": 0.0086, + "step": 721830 + }, + { + "epoch": 1.87, + "learning_rate": 1.9332989442196477e-05, + "loss": 0.0073, + "step": 721840 + }, + { + "epoch": 1.87, + "learning_rate": 1.932910122582501e-05, + "loss": 0.0108, + "step": 721850 + }, + { + "epoch": 1.87, + "learning_rate": 1.932521300945355e-05, + "loss": 0.0064, + "step": 721860 + }, + { + "epoch": 1.87, + "learning_rate": 1.9321324793082085e-05, + "loss": 0.0092, + "step": 721870 + }, + { + "epoch": 1.87, + "learning_rate": 1.931743657671062e-05, + "loss": 0.0088, + "step": 721880 + }, + { + "epoch": 1.87, + "learning_rate": 1.9313548360339154e-05, + "loss": 0.0062, + "step": 721890 + }, + { + "epoch": 1.87, + "learning_rate": 1.930966014396769e-05, + "loss": 0.0069, + "step": 721900 + }, + { + "epoch": 1.87, + "learning_rate": 1.9305771927596228e-05, + "loss": 0.0088, + "step": 721910 + }, + { + "epoch": 1.87, + "learning_rate": 1.9301883711224762e-05, + "loss": 0.0066, + "step": 721920 + }, + { + "epoch": 1.87, + "learning_rate": 1.9297995494853294e-05, + "loss": 0.0076, + "step": 721930 + }, + { + "epoch": 1.87, + "learning_rate": 1.929410727848183e-05, + "loss": 0.0081, + "step": 721940 + }, + { + "epoch": 1.87, + "learning_rate": 1.9290219062110364e-05, + "loss": 0.0074, + "step": 721950 + }, + { + "epoch": 1.87, + "learning_rate": 1.9286330845738902e-05, + "loss": 0.0081, + "step": 721960 + }, + { + "epoch": 1.87, + "learning_rate": 1.9282442629367437e-05, + "loss": 0.0066, + "step": 721970 + }, + { + "epoch": 1.87, + "learning_rate": 1.927855441299597e-05, + "loss": 0.0085, + "step": 721980 + }, + { + "epoch": 1.87, + "learning_rate": 1.9274666196624506e-05, + "loss": 0.0044, + "step": 721990 + }, + { + "epoch": 1.87, + "learning_rate": 1.9270777980253045e-05, + "loss": 0.0066, + "step": 722000 + }, + { + "epoch": 1.87, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.004583498928695917, + "eval_runtime": 107.8568, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 722000 + }, + { + "epoch": 1.87, + "learning_rate": 1.926688976388158e-05, + "loss": 0.0056, + "step": 722010 + }, + { + "epoch": 1.87, + "learning_rate": 1.9263001547510114e-05, + "loss": 0.0065, + "step": 722020 + }, + { + "epoch": 1.87, + "learning_rate": 1.925911333113865e-05, + "loss": 0.0063, + "step": 722030 + }, + { + "epoch": 1.87, + "learning_rate": 1.9255225114767188e-05, + "loss": 0.0082, + "step": 722040 + }, + { + "epoch": 1.87, + "learning_rate": 1.9251336898395722e-05, + "loss": 0.0068, + "step": 722050 + }, + { + "epoch": 1.87, + "learning_rate": 1.9247448682024254e-05, + "loss": 0.0073, + "step": 722060 + }, + { + "epoch": 1.87, + "learning_rate": 1.924356046565279e-05, + "loss": 0.007, + "step": 722070 + }, + { + "epoch": 1.87, + "learning_rate": 1.9239672249281324e-05, + "loss": 0.0084, + "step": 722080 + }, + { + "epoch": 1.87, + "learning_rate": 1.9235784032909862e-05, + "loss": 0.011, + "step": 722090 + }, + { + "epoch": 1.87, + "learning_rate": 1.9231895816538397e-05, + "loss": 0.0075, + "step": 722100 + }, + { + "epoch": 1.87, + "learning_rate": 1.922800760016693e-05, + "loss": 0.006, + "step": 722110 + }, + { + "epoch": 1.87, + "learning_rate": 1.9224119383795466e-05, + "loss": 0.0069, + "step": 722120 + }, + { + "epoch": 1.87, + "learning_rate": 1.9220231167424005e-05, + "loss": 0.0086, + "step": 722130 + }, + { + "epoch": 1.87, + "learning_rate": 1.921634295105254e-05, + "loss": 0.0074, + "step": 722140 + }, + { + "epoch": 1.87, + "learning_rate": 1.9212454734681074e-05, + "loss": 0.0049, + "step": 722150 + }, + { + "epoch": 1.87, + "learning_rate": 1.920856651830961e-05, + "loss": 0.0076, + "step": 722160 + }, + { + "epoch": 1.87, + "learning_rate": 1.9204678301938148e-05, + "loss": 0.0085, + "step": 722170 + }, + { + "epoch": 1.87, + "learning_rate": 1.920079008556668e-05, + "loss": 0.0065, + "step": 722180 + }, + { + "epoch": 1.87, + "learning_rate": 1.9196901869195214e-05, + "loss": 0.0074, + "step": 722190 + }, + { + "epoch": 1.87, + "learning_rate": 1.919301365282375e-05, + "loss": 0.0093, + "step": 722200 + }, + { + "epoch": 1.87, + "learning_rate": 1.9189125436452284e-05, + "loss": 0.008, + "step": 722210 + }, + { + "epoch": 1.87, + "learning_rate": 1.9185237220080822e-05, + "loss": 0.007, + "step": 722220 + }, + { + "epoch": 1.87, + "learning_rate": 1.9181349003709357e-05, + "loss": 0.0076, + "step": 722230 + }, + { + "epoch": 1.87, + "learning_rate": 1.917746078733789e-05, + "loss": 0.0067, + "step": 722240 + }, + { + "epoch": 1.87, + "learning_rate": 1.9173572570966426e-05, + "loss": 0.0058, + "step": 722250 + }, + { + "epoch": 1.87, + "learning_rate": 1.9169684354594965e-05, + "loss": 0.0084, + "step": 722260 + }, + { + "epoch": 1.87, + "learning_rate": 1.91657961382235e-05, + "loss": 0.0093, + "step": 722270 + }, + { + "epoch": 1.87, + "learning_rate": 1.9161907921852034e-05, + "loss": 0.0072, + "step": 722280 + }, + { + "epoch": 1.87, + "learning_rate": 1.915801970548057e-05, + "loss": 0.0069, + "step": 722290 + }, + { + "epoch": 1.87, + "learning_rate": 1.9154131489109107e-05, + "loss": 0.0075, + "step": 722300 + }, + { + "epoch": 1.87, + "learning_rate": 1.915024327273764e-05, + "loss": 0.0093, + "step": 722310 + }, + { + "epoch": 1.87, + "learning_rate": 1.9146355056366174e-05, + "loss": 0.0051, + "step": 722320 + }, + { + "epoch": 1.87, + "learning_rate": 1.914246683999471e-05, + "loss": 0.0067, + "step": 722330 + }, + { + "epoch": 1.87, + "learning_rate": 1.9138578623623244e-05, + "loss": 0.0078, + "step": 722340 + }, + { + "epoch": 1.87, + "learning_rate": 1.9134690407251782e-05, + "loss": 0.0061, + "step": 722350 + }, + { + "epoch": 1.87, + "learning_rate": 1.9130802190880317e-05, + "loss": 0.008, + "step": 722360 + }, + { + "epoch": 1.87, + "learning_rate": 1.912691397450885e-05, + "loss": 0.0064, + "step": 722370 + }, + { + "epoch": 1.87, + "learning_rate": 1.9123025758137386e-05, + "loss": 0.0082, + "step": 722380 + }, + { + "epoch": 1.87, + "learning_rate": 1.9119137541765925e-05, + "loss": 0.0089, + "step": 722390 + }, + { + "epoch": 1.87, + "learning_rate": 1.911524932539446e-05, + "loss": 0.0068, + "step": 722400 + }, + { + "epoch": 1.87, + "learning_rate": 1.9111361109022994e-05, + "loss": 0.0082, + "step": 722410 + }, + { + "epoch": 1.87, + "learning_rate": 1.910747289265153e-05, + "loss": 0.0084, + "step": 722420 + }, + { + "epoch": 1.87, + "learning_rate": 1.910358467628006e-05, + "loss": 0.0099, + "step": 722430 + }, + { + "epoch": 1.87, + "learning_rate": 1.90996964599086e-05, + "loss": 0.0087, + "step": 722440 + }, + { + "epoch": 1.87, + "learning_rate": 1.9095808243537134e-05, + "loss": 0.006, + "step": 722450 + }, + { + "epoch": 1.87, + "learning_rate": 1.909192002716567e-05, + "loss": 0.0063, + "step": 722460 + }, + { + "epoch": 1.87, + "learning_rate": 1.9088031810794204e-05, + "loss": 0.0062, + "step": 722470 + }, + { + "epoch": 1.87, + "learning_rate": 1.9084143594422742e-05, + "loss": 0.0066, + "step": 722480 + }, + { + "epoch": 1.87, + "learning_rate": 1.9080255378051277e-05, + "loss": 0.0062, + "step": 722490 + }, + { + "epoch": 1.87, + "learning_rate": 1.907636716167981e-05, + "loss": 0.0075, + "step": 722500 + }, + { + "epoch": 1.87, + "learning_rate": 1.9072478945308346e-05, + "loss": 0.0066, + "step": 722510 + }, + { + "epoch": 1.87, + "learning_rate": 1.9068590728936885e-05, + "loss": 0.0086, + "step": 722520 + }, + { + "epoch": 1.87, + "learning_rate": 1.906470251256542e-05, + "loss": 0.007, + "step": 722530 + }, + { + "epoch": 1.87, + "learning_rate": 1.9060814296193954e-05, + "loss": 0.0102, + "step": 722540 + }, + { + "epoch": 1.87, + "learning_rate": 1.9056926079822486e-05, + "loss": 0.0079, + "step": 722550 + }, + { + "epoch": 1.87, + "learning_rate": 1.905303786345102e-05, + "loss": 0.0076, + "step": 722560 + }, + { + "epoch": 1.87, + "learning_rate": 1.904914964707956e-05, + "loss": 0.0059, + "step": 722570 + }, + { + "epoch": 1.87, + "learning_rate": 1.9045261430708094e-05, + "loss": 0.0072, + "step": 722580 + }, + { + "epoch": 1.87, + "learning_rate": 1.904137321433663e-05, + "loss": 0.006, + "step": 722590 + }, + { + "epoch": 1.87, + "learning_rate": 1.9037484997965163e-05, + "loss": 0.0072, + "step": 722600 + }, + { + "epoch": 1.87, + "learning_rate": 1.9033596781593702e-05, + "loss": 0.0062, + "step": 722610 + }, + { + "epoch": 1.87, + "learning_rate": 1.9029708565222237e-05, + "loss": 0.007, + "step": 722620 + }, + { + "epoch": 1.87, + "learning_rate": 1.902582034885077e-05, + "loss": 0.007, + "step": 722630 + }, + { + "epoch": 1.87, + "learning_rate": 1.9021932132479306e-05, + "loss": 0.0066, + "step": 722640 + }, + { + "epoch": 1.87, + "learning_rate": 1.9018043916107845e-05, + "loss": 0.0059, + "step": 722650 + }, + { + "epoch": 1.87, + "learning_rate": 1.901415569973638e-05, + "loss": 0.0087, + "step": 722660 + }, + { + "epoch": 1.87, + "learning_rate": 1.9010267483364914e-05, + "loss": 0.007, + "step": 722670 + }, + { + "epoch": 1.87, + "learning_rate": 1.9006379266993446e-05, + "loss": 0.0065, + "step": 722680 + }, + { + "epoch": 1.87, + "learning_rate": 1.900249105062198e-05, + "loss": 0.0091, + "step": 722690 + }, + { + "epoch": 1.87, + "learning_rate": 1.899860283425052e-05, + "loss": 0.0067, + "step": 722700 + }, + { + "epoch": 1.87, + "learning_rate": 1.8994714617879054e-05, + "loss": 0.0069, + "step": 722710 + }, + { + "epoch": 1.87, + "learning_rate": 1.899082640150759e-05, + "loss": 0.0098, + "step": 722720 + }, + { + "epoch": 1.87, + "learning_rate": 1.8986938185136123e-05, + "loss": 0.0102, + "step": 722730 + }, + { + "epoch": 1.87, + "learning_rate": 1.8983049968764662e-05, + "loss": 0.0068, + "step": 722740 + }, + { + "epoch": 1.87, + "learning_rate": 1.8979161752393197e-05, + "loss": 0.0072, + "step": 722750 + }, + { + "epoch": 1.87, + "learning_rate": 1.897527353602173e-05, + "loss": 0.0088, + "step": 722760 + }, + { + "epoch": 1.87, + "learning_rate": 1.8971385319650266e-05, + "loss": 0.0095, + "step": 722770 + }, + { + "epoch": 1.87, + "learning_rate": 1.8967497103278805e-05, + "loss": 0.0063, + "step": 722780 + }, + { + "epoch": 1.87, + "learning_rate": 1.896360888690734e-05, + "loss": 0.0069, + "step": 722790 + }, + { + "epoch": 1.87, + "learning_rate": 1.895972067053587e-05, + "loss": 0.0083, + "step": 722800 + }, + { + "epoch": 1.87, + "learning_rate": 1.8955832454164406e-05, + "loss": 0.006, + "step": 722810 + }, + { + "epoch": 1.87, + "learning_rate": 1.895194423779294e-05, + "loss": 0.0075, + "step": 722820 + }, + { + "epoch": 1.87, + "learning_rate": 1.894805602142148e-05, + "loss": 0.0062, + "step": 722830 + }, + { + "epoch": 1.87, + "learning_rate": 1.8944167805050014e-05, + "loss": 0.0077, + "step": 722840 + }, + { + "epoch": 1.87, + "learning_rate": 1.894027958867855e-05, + "loss": 0.0073, + "step": 722850 + }, + { + "epoch": 1.87, + "learning_rate": 1.8936391372307083e-05, + "loss": 0.007, + "step": 722860 + }, + { + "epoch": 1.87, + "learning_rate": 1.8932503155935622e-05, + "loss": 0.0101, + "step": 722870 + }, + { + "epoch": 1.87, + "learning_rate": 1.8928614939564157e-05, + "loss": 0.0071, + "step": 722880 + }, + { + "epoch": 1.87, + "learning_rate": 1.892472672319269e-05, + "loss": 0.0068, + "step": 722890 + }, + { + "epoch": 1.87, + "learning_rate": 1.8920838506821226e-05, + "loss": 0.0054, + "step": 722900 + }, + { + "epoch": 1.87, + "learning_rate": 1.8916950290449765e-05, + "loss": 0.0116, + "step": 722910 + }, + { + "epoch": 1.87, + "learning_rate": 1.89130620740783e-05, + "loss": 0.008, + "step": 722920 + }, + { + "epoch": 1.87, + "learning_rate": 1.890917385770683e-05, + "loss": 0.0055, + "step": 722930 + }, + { + "epoch": 1.87, + "learning_rate": 1.8905285641335366e-05, + "loss": 0.0056, + "step": 722940 + }, + { + "epoch": 1.87, + "learning_rate": 1.89013974249639e-05, + "loss": 0.0086, + "step": 722950 + }, + { + "epoch": 1.87, + "learning_rate": 1.889750920859244e-05, + "loss": 0.0089, + "step": 722960 + }, + { + "epoch": 1.87, + "learning_rate": 1.8893620992220974e-05, + "loss": 0.0129, + "step": 722970 + }, + { + "epoch": 1.87, + "learning_rate": 1.888973277584951e-05, + "loss": 0.0079, + "step": 722980 + }, + { + "epoch": 1.87, + "learning_rate": 1.8885844559478043e-05, + "loss": 0.0055, + "step": 722990 + }, + { + "epoch": 1.87, + "learning_rate": 1.888195634310658e-05, + "loss": 0.0082, + "step": 723000 + }, + { + "epoch": 1.87, + "eval_cer": 0.8816648961259449, + "eval_loss": 0.004544729832559824, + "eval_runtime": 107.9044, + "eval_samples_per_second": 18.535, + "eval_steps_per_second": 4.634, + "step": 723000 + }, + { + "epoch": 1.87, + "learning_rate": 1.8878068126735117e-05, + "loss": 0.0091, + "step": 723010 + }, + { + "epoch": 1.87, + "learning_rate": 1.887417991036365e-05, + "loss": 0.0069, + "step": 723020 + }, + { + "epoch": 1.87, + "learning_rate": 1.8870291693992186e-05, + "loss": 0.0084, + "step": 723030 + }, + { + "epoch": 1.87, + "learning_rate": 1.8866403477620725e-05, + "loss": 0.0118, + "step": 723040 + }, + { + "epoch": 1.87, + "learning_rate": 1.8862515261249256e-05, + "loss": 0.0062, + "step": 723050 + }, + { + "epoch": 1.87, + "learning_rate": 1.885862704487779e-05, + "loss": 0.0066, + "step": 723060 + }, + { + "epoch": 1.87, + "learning_rate": 1.8854738828506326e-05, + "loss": 0.0081, + "step": 723070 + }, + { + "epoch": 1.87, + "learning_rate": 1.885085061213486e-05, + "loss": 0.0088, + "step": 723080 + }, + { + "epoch": 1.87, + "learning_rate": 1.88469623957634e-05, + "loss": 0.0066, + "step": 723090 + }, + { + "epoch": 1.87, + "learning_rate": 1.8843074179391934e-05, + "loss": 0.0077, + "step": 723100 + }, + { + "epoch": 1.87, + "learning_rate": 1.883918596302047e-05, + "loss": 0.0083, + "step": 723110 + }, + { + "epoch": 1.87, + "learning_rate": 1.8835297746649003e-05, + "loss": 0.0075, + "step": 723120 + }, + { + "epoch": 1.87, + "learning_rate": 1.883140953027754e-05, + "loss": 0.0065, + "step": 723130 + }, + { + "epoch": 1.87, + "learning_rate": 1.8827521313906077e-05, + "loss": 0.0061, + "step": 723140 + }, + { + "epoch": 1.87, + "learning_rate": 1.882363309753461e-05, + "loss": 0.0034, + "step": 723150 + }, + { + "epoch": 1.87, + "learning_rate": 1.8819744881163146e-05, + "loss": 0.0075, + "step": 723160 + }, + { + "epoch": 1.87, + "learning_rate": 1.8815856664791678e-05, + "loss": 0.0064, + "step": 723170 + }, + { + "epoch": 1.87, + "learning_rate": 1.8811968448420216e-05, + "loss": 0.0092, + "step": 723180 + }, + { + "epoch": 1.87, + "learning_rate": 1.880808023204875e-05, + "loss": 0.0078, + "step": 723190 + }, + { + "epoch": 1.87, + "learning_rate": 1.8804192015677286e-05, + "loss": 0.0085, + "step": 723200 + }, + { + "epoch": 1.87, + "learning_rate": 1.880030379930582e-05, + "loss": 0.0069, + "step": 723210 + }, + { + "epoch": 1.87, + "learning_rate": 1.879641558293436e-05, + "loss": 0.0057, + "step": 723220 + }, + { + "epoch": 1.87, + "learning_rate": 1.8792527366562894e-05, + "loss": 0.0057, + "step": 723230 + }, + { + "epoch": 1.87, + "learning_rate": 1.878863915019143e-05, + "loss": 0.0094, + "step": 723240 + }, + { + "epoch": 1.87, + "learning_rate": 1.8784750933819963e-05, + "loss": 0.0078, + "step": 723250 + }, + { + "epoch": 1.87, + "learning_rate": 1.8780862717448498e-05, + "loss": 0.0085, + "step": 723260 + }, + { + "epoch": 1.87, + "learning_rate": 1.8776974501077036e-05, + "loss": 0.0088, + "step": 723270 + }, + { + "epoch": 1.87, + "learning_rate": 1.877308628470557e-05, + "loss": 0.0079, + "step": 723280 + }, + { + "epoch": 1.87, + "learning_rate": 1.8769198068334106e-05, + "loss": 0.0087, + "step": 723290 + }, + { + "epoch": 1.87, + "learning_rate": 1.8765309851962638e-05, + "loss": 0.0056, + "step": 723300 + }, + { + "epoch": 1.87, + "learning_rate": 1.8761421635591173e-05, + "loss": 0.0055, + "step": 723310 + }, + { + "epoch": 1.87, + "learning_rate": 1.875753341921971e-05, + "loss": 0.0076, + "step": 723320 + }, + { + "epoch": 1.87, + "learning_rate": 1.8753645202848246e-05, + "loss": 0.0075, + "step": 723330 + }, + { + "epoch": 1.88, + "learning_rate": 1.874975698647678e-05, + "loss": 0.008, + "step": 723340 + }, + { + "epoch": 1.88, + "learning_rate": 1.8745868770105315e-05, + "loss": 0.0061, + "step": 723350 + }, + { + "epoch": 1.88, + "learning_rate": 1.8741980553733854e-05, + "loss": 0.006, + "step": 723360 + }, + { + "epoch": 1.88, + "learning_rate": 1.873809233736239e-05, + "loss": 0.0083, + "step": 723370 + }, + { + "epoch": 1.88, + "learning_rate": 1.8734204120990923e-05, + "loss": 0.0054, + "step": 723380 + }, + { + "epoch": 1.88, + "learning_rate": 1.8730315904619458e-05, + "loss": 0.0079, + "step": 723390 + }, + { + "epoch": 1.88, + "learning_rate": 1.8726427688247993e-05, + "loss": 0.0066, + "step": 723400 + }, + { + "epoch": 1.88, + "learning_rate": 1.8722539471876528e-05, + "loss": 0.0077, + "step": 723410 + }, + { + "epoch": 1.88, + "learning_rate": 1.8718651255505066e-05, + "loss": 0.0053, + "step": 723420 + }, + { + "epoch": 1.88, + "learning_rate": 1.87147630391336e-05, + "loss": 0.0103, + "step": 723430 + }, + { + "epoch": 1.88, + "learning_rate": 1.8710874822762136e-05, + "loss": 0.0069, + "step": 723440 + }, + { + "epoch": 1.88, + "learning_rate": 1.870698660639067e-05, + "loss": 0.01, + "step": 723450 + }, + { + "epoch": 1.88, + "learning_rate": 1.8703098390019206e-05, + "loss": 0.0119, + "step": 723460 + }, + { + "epoch": 1.88, + "learning_rate": 1.869921017364774e-05, + "loss": 0.0089, + "step": 723470 + }, + { + "epoch": 1.88, + "learning_rate": 1.8695321957276275e-05, + "loss": 0.0104, + "step": 723480 + }, + { + "epoch": 1.88, + "learning_rate": 1.8691433740904814e-05, + "loss": 0.0078, + "step": 723490 + }, + { + "epoch": 1.88, + "learning_rate": 1.868754552453335e-05, + "loss": 0.0058, + "step": 723500 + }, + { + "epoch": 1.88, + "learning_rate": 1.8683657308161883e-05, + "loss": 0.0089, + "step": 723510 + }, + { + "epoch": 1.88, + "learning_rate": 1.8679769091790418e-05, + "loss": 0.0064, + "step": 723520 + }, + { + "epoch": 1.88, + "learning_rate": 1.8675880875418953e-05, + "loss": 0.0056, + "step": 723530 + }, + { + "epoch": 1.88, + "learning_rate": 1.8671992659047488e-05, + "loss": 0.0072, + "step": 723540 + }, + { + "epoch": 1.88, + "learning_rate": 1.8668104442676026e-05, + "loss": 0.0069, + "step": 723550 + }, + { + "epoch": 1.88, + "learning_rate": 1.866421622630456e-05, + "loss": 0.0069, + "step": 723560 + }, + { + "epoch": 1.88, + "learning_rate": 1.8660328009933096e-05, + "loss": 0.006, + "step": 723570 + }, + { + "epoch": 1.88, + "learning_rate": 1.865643979356163e-05, + "loss": 0.0053, + "step": 723580 + }, + { + "epoch": 1.88, + "learning_rate": 1.8652551577190166e-05, + "loss": 0.006, + "step": 723590 + }, + { + "epoch": 1.88, + "learning_rate": 1.86486633608187e-05, + "loss": 0.0079, + "step": 723600 + }, + { + "epoch": 1.88, + "learning_rate": 1.8644775144447235e-05, + "loss": 0.0095, + "step": 723610 + }, + { + "epoch": 1.88, + "learning_rate": 1.8640886928075774e-05, + "loss": 0.0068, + "step": 723620 + }, + { + "epoch": 1.88, + "learning_rate": 1.863699871170431e-05, + "loss": 0.0067, + "step": 723630 + }, + { + "epoch": 1.88, + "learning_rate": 1.8633110495332843e-05, + "loss": 0.0067, + "step": 723640 + }, + { + "epoch": 1.88, + "learning_rate": 1.8629222278961378e-05, + "loss": 0.0066, + "step": 723650 + }, + { + "epoch": 1.88, + "learning_rate": 1.8625334062589913e-05, + "loss": 0.0168, + "step": 723660 + }, + { + "epoch": 1.88, + "learning_rate": 1.8621445846218448e-05, + "loss": 0.0073, + "step": 723670 + }, + { + "epoch": 1.88, + "learning_rate": 1.8617557629846986e-05, + "loss": 0.0076, + "step": 723680 + }, + { + "epoch": 1.88, + "learning_rate": 1.861366941347552e-05, + "loss": 0.0069, + "step": 723690 + }, + { + "epoch": 1.88, + "learning_rate": 1.8609781197104052e-05, + "loss": 0.005, + "step": 723700 + }, + { + "epoch": 1.88, + "learning_rate": 1.860589298073259e-05, + "loss": 0.0065, + "step": 723710 + }, + { + "epoch": 1.88, + "learning_rate": 1.8602004764361126e-05, + "loss": 0.0051, + "step": 723720 + }, + { + "epoch": 1.88, + "learning_rate": 1.859811654798966e-05, + "loss": 0.007, + "step": 723730 + }, + { + "epoch": 1.88, + "learning_rate": 1.8594228331618195e-05, + "loss": 0.0065, + "step": 723740 + }, + { + "epoch": 1.88, + "learning_rate": 1.8590340115246734e-05, + "loss": 0.007, + "step": 723750 + }, + { + "epoch": 1.88, + "learning_rate": 1.8586451898875265e-05, + "loss": 0.0047, + "step": 723760 + }, + { + "epoch": 1.88, + "learning_rate": 1.8582563682503803e-05, + "loss": 0.0064, + "step": 723770 + }, + { + "epoch": 1.88, + "learning_rate": 1.8578675466132338e-05, + "loss": 0.0078, + "step": 723780 + }, + { + "epoch": 1.88, + "learning_rate": 1.8574787249760873e-05, + "loss": 0.0104, + "step": 723790 + }, + { + "epoch": 1.88, + "learning_rate": 1.8570899033389408e-05, + "loss": 0.0066, + "step": 723800 + }, + { + "epoch": 1.88, + "learning_rate": 1.8567010817017946e-05, + "loss": 0.0051, + "step": 723810 + }, + { + "epoch": 1.88, + "learning_rate": 1.856312260064648e-05, + "loss": 0.007, + "step": 723820 + }, + { + "epoch": 1.88, + "learning_rate": 1.8559234384275012e-05, + "loss": 0.0099, + "step": 723830 + }, + { + "epoch": 1.88, + "learning_rate": 1.855534616790355e-05, + "loss": 0.0055, + "step": 723840 + }, + { + "epoch": 1.88, + "learning_rate": 1.8551457951532086e-05, + "loss": 0.0081, + "step": 723850 + }, + { + "epoch": 1.88, + "learning_rate": 1.854756973516062e-05, + "loss": 0.0108, + "step": 723860 + }, + { + "epoch": 1.88, + "learning_rate": 1.8543681518789155e-05, + "loss": 0.0115, + "step": 723870 + }, + { + "epoch": 1.88, + "learning_rate": 1.8539793302417694e-05, + "loss": 0.0119, + "step": 723880 + }, + { + "epoch": 1.88, + "learning_rate": 1.8535905086046225e-05, + "loss": 0.0069, + "step": 723890 + }, + { + "epoch": 1.88, + "learning_rate": 1.8532016869674763e-05, + "loss": 0.0084, + "step": 723900 + }, + { + "epoch": 1.88, + "learning_rate": 1.8528128653303298e-05, + "loss": 0.0069, + "step": 723910 + }, + { + "epoch": 1.88, + "learning_rate": 1.8524240436931833e-05, + "loss": 0.0083, + "step": 723920 + }, + { + "epoch": 1.88, + "learning_rate": 1.8520352220560368e-05, + "loss": 0.0069, + "step": 723930 + }, + { + "epoch": 1.88, + "learning_rate": 1.8516464004188903e-05, + "loss": 0.0071, + "step": 723940 + }, + { + "epoch": 1.88, + "learning_rate": 1.8512575787817438e-05, + "loss": 0.0079, + "step": 723950 + }, + { + "epoch": 1.88, + "learning_rate": 1.8508687571445972e-05, + "loss": 0.0088, + "step": 723960 + }, + { + "epoch": 1.88, + "learning_rate": 1.850479935507451e-05, + "loss": 0.0076, + "step": 723970 + }, + { + "epoch": 1.88, + "learning_rate": 1.8500911138703046e-05, + "loss": 0.0057, + "step": 723980 + }, + { + "epoch": 1.88, + "learning_rate": 1.849702292233158e-05, + "loss": 0.007, + "step": 723990 + }, + { + "epoch": 1.88, + "learning_rate": 1.8493134705960115e-05, + "loss": 0.0073, + "step": 724000 + }, + { + "epoch": 1.88, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.004569494165480137, + "eval_runtime": 107.7253, + "eval_samples_per_second": 18.566, + "eval_steps_per_second": 4.641, + "step": 724000 + }, + { + "epoch": 1.88, + "learning_rate": 1.848924648958865e-05, + "loss": 0.007, + "step": 724010 + }, + { + "epoch": 1.88, + "learning_rate": 1.8485358273217185e-05, + "loss": 0.0067, + "step": 724020 + }, + { + "epoch": 1.88, + "learning_rate": 1.848147005684572e-05, + "loss": 0.0092, + "step": 724030 + }, + { + "epoch": 1.88, + "learning_rate": 1.8477581840474258e-05, + "loss": 0.0058, + "step": 724040 + }, + { + "epoch": 1.88, + "learning_rate": 1.8473693624102793e-05, + "loss": 0.0074, + "step": 724050 + }, + { + "epoch": 1.88, + "learning_rate": 1.8469805407731328e-05, + "loss": 0.0109, + "step": 724060 + }, + { + "epoch": 1.88, + "learning_rate": 1.8465917191359863e-05, + "loss": 0.0093, + "step": 724070 + }, + { + "epoch": 1.88, + "learning_rate": 1.8462028974988398e-05, + "loss": 0.0084, + "step": 724080 + }, + { + "epoch": 1.88, + "learning_rate": 1.8458140758616932e-05, + "loss": 0.0075, + "step": 724090 + }, + { + "epoch": 1.88, + "learning_rate": 1.845425254224547e-05, + "loss": 0.0072, + "step": 724100 + }, + { + "epoch": 1.88, + "learning_rate": 1.8450364325874006e-05, + "loss": 0.0071, + "step": 724110 + }, + { + "epoch": 1.88, + "learning_rate": 1.844647610950254e-05, + "loss": 0.0049, + "step": 724120 + }, + { + "epoch": 1.88, + "learning_rate": 1.8442587893131075e-05, + "loss": 0.008, + "step": 724130 + }, + { + "epoch": 1.88, + "learning_rate": 1.843869967675961e-05, + "loss": 0.0065, + "step": 724140 + }, + { + "epoch": 1.88, + "learning_rate": 1.8434811460388145e-05, + "loss": 0.0062, + "step": 724150 + }, + { + "epoch": 1.88, + "learning_rate": 1.843092324401668e-05, + "loss": 0.0105, + "step": 724160 + }, + { + "epoch": 1.88, + "learning_rate": 1.8427035027645218e-05, + "loss": 0.0072, + "step": 724170 + }, + { + "epoch": 1.88, + "learning_rate": 1.8423146811273753e-05, + "loss": 0.0037, + "step": 724180 + }, + { + "epoch": 1.88, + "learning_rate": 1.8419258594902288e-05, + "loss": 0.0051, + "step": 724190 + }, + { + "epoch": 1.88, + "learning_rate": 1.8415370378530823e-05, + "loss": 0.0089, + "step": 724200 + }, + { + "epoch": 1.88, + "learning_rate": 1.8411482162159358e-05, + "loss": 0.0081, + "step": 724210 + }, + { + "epoch": 1.88, + "learning_rate": 1.8407593945787892e-05, + "loss": 0.0126, + "step": 724220 + }, + { + "epoch": 1.88, + "learning_rate": 1.840370572941643e-05, + "loss": 0.0079, + "step": 724230 + }, + { + "epoch": 1.88, + "learning_rate": 1.8399817513044965e-05, + "loss": 0.0068, + "step": 724240 + }, + { + "epoch": 1.88, + "learning_rate": 1.83959292966735e-05, + "loss": 0.0069, + "step": 724250 + }, + { + "epoch": 1.88, + "learning_rate": 1.8392041080302035e-05, + "loss": 0.0096, + "step": 724260 + }, + { + "epoch": 1.88, + "learning_rate": 1.838815286393057e-05, + "loss": 0.0075, + "step": 724270 + }, + { + "epoch": 1.88, + "learning_rate": 1.8384264647559105e-05, + "loss": 0.0079, + "step": 724280 + }, + { + "epoch": 1.88, + "learning_rate": 1.838037643118764e-05, + "loss": 0.0088, + "step": 724290 + }, + { + "epoch": 1.88, + "learning_rate": 1.8376488214816178e-05, + "loss": 0.0071, + "step": 724300 + }, + { + "epoch": 1.88, + "learning_rate": 1.8372599998444713e-05, + "loss": 0.0069, + "step": 724310 + }, + { + "epoch": 1.88, + "learning_rate": 1.8368711782073248e-05, + "loss": 0.0062, + "step": 724320 + }, + { + "epoch": 1.88, + "learning_rate": 1.8364823565701783e-05, + "loss": 0.0067, + "step": 724330 + }, + { + "epoch": 1.88, + "learning_rate": 1.8360935349330317e-05, + "loss": 0.007, + "step": 724340 + }, + { + "epoch": 1.88, + "learning_rate": 1.8357047132958852e-05, + "loss": 0.007, + "step": 724350 + }, + { + "epoch": 1.88, + "learning_rate": 1.835315891658739e-05, + "loss": 0.0071, + "step": 724360 + }, + { + "epoch": 1.88, + "learning_rate": 1.8349270700215925e-05, + "loss": 0.006, + "step": 724370 + }, + { + "epoch": 1.88, + "learning_rate": 1.8345382483844457e-05, + "loss": 0.0086, + "step": 724380 + }, + { + "epoch": 1.88, + "learning_rate": 1.8341494267472995e-05, + "loss": 0.0077, + "step": 724390 + }, + { + "epoch": 1.88, + "learning_rate": 1.833760605110153e-05, + "loss": 0.0089, + "step": 724400 + }, + { + "epoch": 1.88, + "learning_rate": 1.8333717834730065e-05, + "loss": 0.0069, + "step": 724410 + }, + { + "epoch": 1.88, + "learning_rate": 1.83298296183586e-05, + "loss": 0.0085, + "step": 724420 + }, + { + "epoch": 1.88, + "learning_rate": 1.8325941401987138e-05, + "loss": 0.0065, + "step": 724430 + }, + { + "epoch": 1.88, + "learning_rate": 1.8322053185615673e-05, + "loss": 0.0063, + "step": 724440 + }, + { + "epoch": 1.88, + "learning_rate": 1.8318164969244208e-05, + "loss": 0.0073, + "step": 724450 + }, + { + "epoch": 1.88, + "learning_rate": 1.8314276752872743e-05, + "loss": 0.0118, + "step": 724460 + }, + { + "epoch": 1.88, + "learning_rate": 1.8310388536501277e-05, + "loss": 0.0128, + "step": 724470 + }, + { + "epoch": 1.88, + "learning_rate": 1.8306500320129812e-05, + "loss": 0.0069, + "step": 724480 + }, + { + "epoch": 1.88, + "learning_rate": 1.830261210375835e-05, + "loss": 0.0061, + "step": 724490 + }, + { + "epoch": 1.88, + "learning_rate": 1.8298723887386885e-05, + "loss": 0.0092, + "step": 724500 + }, + { + "epoch": 1.88, + "learning_rate": 1.8294835671015417e-05, + "loss": 0.008, + "step": 724510 + }, + { + "epoch": 1.88, + "learning_rate": 1.8290947454643955e-05, + "loss": 0.0075, + "step": 724520 + }, + { + "epoch": 1.88, + "learning_rate": 1.828705923827249e-05, + "loss": 0.0062, + "step": 724530 + }, + { + "epoch": 1.88, + "learning_rate": 1.8283171021901025e-05, + "loss": 0.0063, + "step": 724540 + }, + { + "epoch": 1.88, + "learning_rate": 1.827928280552956e-05, + "loss": 0.0064, + "step": 724550 + }, + { + "epoch": 1.88, + "learning_rate": 1.8275394589158098e-05, + "loss": 0.0072, + "step": 724560 + }, + { + "epoch": 1.88, + "learning_rate": 1.827150637278663e-05, + "loss": 0.0075, + "step": 724570 + }, + { + "epoch": 1.88, + "learning_rate": 1.8267618156415168e-05, + "loss": 0.008, + "step": 724580 + }, + { + "epoch": 1.88, + "learning_rate": 1.8263729940043703e-05, + "loss": 0.0088, + "step": 724590 + }, + { + "epoch": 1.88, + "learning_rate": 1.8259841723672237e-05, + "loss": 0.0104, + "step": 724600 + }, + { + "epoch": 1.88, + "learning_rate": 1.8255953507300772e-05, + "loss": 0.0072, + "step": 724610 + }, + { + "epoch": 1.88, + "learning_rate": 1.825206529092931e-05, + "loss": 0.0082, + "step": 724620 + }, + { + "epoch": 1.88, + "learning_rate": 1.8248177074557842e-05, + "loss": 0.0078, + "step": 724630 + }, + { + "epoch": 1.88, + "learning_rate": 1.8244288858186377e-05, + "loss": 0.0077, + "step": 724640 + }, + { + "epoch": 1.88, + "learning_rate": 1.8240400641814915e-05, + "loss": 0.0069, + "step": 724650 + }, + { + "epoch": 1.88, + "learning_rate": 1.823651242544345e-05, + "loss": 0.0075, + "step": 724660 + }, + { + "epoch": 1.88, + "learning_rate": 1.8232624209071985e-05, + "loss": 0.0064, + "step": 724670 + }, + { + "epoch": 1.88, + "learning_rate": 1.822873599270052e-05, + "loss": 0.0078, + "step": 724680 + }, + { + "epoch": 1.88, + "learning_rate": 1.8224847776329055e-05, + "loss": 0.01, + "step": 724690 + }, + { + "epoch": 1.88, + "learning_rate": 1.822095955995759e-05, + "loss": 0.0075, + "step": 724700 + }, + { + "epoch": 1.88, + "learning_rate": 1.8217071343586124e-05, + "loss": 0.0075, + "step": 724710 + }, + { + "epoch": 1.88, + "learning_rate": 1.8213183127214663e-05, + "loss": 0.0074, + "step": 724720 + }, + { + "epoch": 1.88, + "learning_rate": 1.8209294910843197e-05, + "loss": 0.0134, + "step": 724730 + }, + { + "epoch": 1.88, + "learning_rate": 1.8205406694471732e-05, + "loss": 0.0058, + "step": 724740 + }, + { + "epoch": 1.88, + "learning_rate": 1.8201518478100267e-05, + "loss": 0.007, + "step": 724750 + }, + { + "epoch": 1.88, + "learning_rate": 1.8197630261728802e-05, + "loss": 0.0065, + "step": 724760 + }, + { + "epoch": 1.88, + "learning_rate": 1.8193742045357337e-05, + "loss": 0.0097, + "step": 724770 + }, + { + "epoch": 1.88, + "learning_rate": 1.8189853828985875e-05, + "loss": 0.0056, + "step": 724780 + }, + { + "epoch": 1.88, + "learning_rate": 1.818596561261441e-05, + "loss": 0.0084, + "step": 724790 + }, + { + "epoch": 1.88, + "learning_rate": 1.8182077396242945e-05, + "loss": 0.0067, + "step": 724800 + }, + { + "epoch": 1.88, + "learning_rate": 1.817818917987148e-05, + "loss": 0.0069, + "step": 724810 + }, + { + "epoch": 1.88, + "learning_rate": 1.8174300963500015e-05, + "loss": 0.0081, + "step": 724820 + }, + { + "epoch": 1.88, + "learning_rate": 1.817041274712855e-05, + "loss": 0.0063, + "step": 724830 + }, + { + "epoch": 1.88, + "learning_rate": 1.8166524530757084e-05, + "loss": 0.0077, + "step": 724840 + }, + { + "epoch": 1.88, + "learning_rate": 1.8162636314385623e-05, + "loss": 0.0084, + "step": 724850 + }, + { + "epoch": 1.88, + "learning_rate": 1.8158748098014157e-05, + "loss": 0.0089, + "step": 724860 + }, + { + "epoch": 1.88, + "learning_rate": 1.8154859881642692e-05, + "loss": 0.0062, + "step": 724870 + }, + { + "epoch": 1.88, + "learning_rate": 1.8150971665271227e-05, + "loss": 0.0079, + "step": 724880 + }, + { + "epoch": 1.88, + "learning_rate": 1.8147083448899762e-05, + "loss": 0.0068, + "step": 724890 + }, + { + "epoch": 1.88, + "learning_rate": 1.8143195232528297e-05, + "loss": 0.007, + "step": 724900 + }, + { + "epoch": 1.88, + "learning_rate": 1.8139307016156835e-05, + "loss": 0.0078, + "step": 724910 + }, + { + "epoch": 1.88, + "learning_rate": 1.813541879978537e-05, + "loss": 0.0071, + "step": 724920 + }, + { + "epoch": 1.88, + "learning_rate": 1.8131530583413905e-05, + "loss": 0.007, + "step": 724930 + }, + { + "epoch": 1.88, + "learning_rate": 1.812764236704244e-05, + "loss": 0.0096, + "step": 724940 + }, + { + "epoch": 1.88, + "learning_rate": 1.8123754150670975e-05, + "loss": 0.0084, + "step": 724950 + }, + { + "epoch": 1.88, + "learning_rate": 1.811986593429951e-05, + "loss": 0.0083, + "step": 724960 + }, + { + "epoch": 1.88, + "learning_rate": 1.8115977717928044e-05, + "loss": 0.0058, + "step": 724970 + }, + { + "epoch": 1.88, + "learning_rate": 1.8112089501556583e-05, + "loss": 0.0062, + "step": 724980 + }, + { + "epoch": 1.88, + "learning_rate": 1.8108201285185117e-05, + "loss": 0.0095, + "step": 724990 + }, + { + "epoch": 1.88, + "learning_rate": 1.8104313068813652e-05, + "loss": 0.0082, + "step": 725000 + }, + { + "epoch": 1.88, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004590142983943224, + "eval_runtime": 107.8781, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 725000 + }, + { + "epoch": 1.88, + "learning_rate": 1.8100424852442187e-05, + "loss": 0.0062, + "step": 725010 + }, + { + "epoch": 1.88, + "learning_rate": 1.8096536636070722e-05, + "loss": 0.0078, + "step": 725020 + }, + { + "epoch": 1.88, + "learning_rate": 1.8092648419699257e-05, + "loss": 0.0069, + "step": 725030 + }, + { + "epoch": 1.88, + "learning_rate": 1.8088760203327795e-05, + "loss": 0.0066, + "step": 725040 + }, + { + "epoch": 1.88, + "learning_rate": 1.808487198695633e-05, + "loss": 0.0073, + "step": 725050 + }, + { + "epoch": 1.88, + "learning_rate": 1.8080983770584865e-05, + "loss": 0.0071, + "step": 725060 + }, + { + "epoch": 1.88, + "learning_rate": 1.80770955542134e-05, + "loss": 0.0111, + "step": 725070 + }, + { + "epoch": 1.88, + "learning_rate": 1.8073207337841935e-05, + "loss": 0.0088, + "step": 725080 + }, + { + "epoch": 1.88, + "learning_rate": 1.806931912147047e-05, + "loss": 0.0079, + "step": 725090 + }, + { + "epoch": 1.88, + "learning_rate": 1.8065430905099004e-05, + "loss": 0.006, + "step": 725100 + }, + { + "epoch": 1.88, + "learning_rate": 1.8061542688727542e-05, + "loss": 0.0063, + "step": 725110 + }, + { + "epoch": 1.88, + "learning_rate": 1.8057654472356077e-05, + "loss": 0.0051, + "step": 725120 + }, + { + "epoch": 1.88, + "learning_rate": 1.8053766255984612e-05, + "loss": 0.0089, + "step": 725130 + }, + { + "epoch": 1.88, + "learning_rate": 1.8049878039613147e-05, + "loss": 0.0057, + "step": 725140 + }, + { + "epoch": 1.88, + "learning_rate": 1.8045989823241682e-05, + "loss": 0.006, + "step": 725150 + }, + { + "epoch": 1.88, + "learning_rate": 1.8042101606870217e-05, + "loss": 0.0078, + "step": 725160 + }, + { + "epoch": 1.88, + "learning_rate": 1.8038213390498755e-05, + "loss": 0.0065, + "step": 725170 + }, + { + "epoch": 1.88, + "learning_rate": 1.803432517412729e-05, + "loss": 0.0076, + "step": 725180 + }, + { + "epoch": 1.88, + "learning_rate": 1.803043695775582e-05, + "loss": 0.0076, + "step": 725190 + }, + { + "epoch": 1.88, + "learning_rate": 1.802654874138436e-05, + "loss": 0.0079, + "step": 725200 + }, + { + "epoch": 1.88, + "learning_rate": 1.8022660525012894e-05, + "loss": 0.0123, + "step": 725210 + }, + { + "epoch": 1.88, + "learning_rate": 1.801877230864143e-05, + "loss": 0.0068, + "step": 725220 + }, + { + "epoch": 1.88, + "learning_rate": 1.8014884092269964e-05, + "loss": 0.0081, + "step": 725230 + }, + { + "epoch": 1.88, + "learning_rate": 1.8010995875898502e-05, + "loss": 0.0054, + "step": 725240 + }, + { + "epoch": 1.88, + "learning_rate": 1.8007107659527034e-05, + "loss": 0.005, + "step": 725250 + }, + { + "epoch": 1.88, + "learning_rate": 1.8003219443155572e-05, + "loss": 0.0079, + "step": 725260 + }, + { + "epoch": 1.88, + "learning_rate": 1.7999331226784107e-05, + "loss": 0.0069, + "step": 725270 + }, + { + "epoch": 1.88, + "learning_rate": 1.7995443010412642e-05, + "loss": 0.005, + "step": 725280 + }, + { + "epoch": 1.88, + "learning_rate": 1.7991554794041177e-05, + "loss": 0.0119, + "step": 725290 + }, + { + "epoch": 1.88, + "learning_rate": 1.7987666577669715e-05, + "loss": 0.0086, + "step": 725300 + }, + { + "epoch": 1.88, + "learning_rate": 1.7983778361298246e-05, + "loss": 0.0122, + "step": 725310 + }, + { + "epoch": 1.88, + "learning_rate": 1.797989014492678e-05, + "loss": 0.0044, + "step": 725320 + }, + { + "epoch": 1.88, + "learning_rate": 1.797600192855532e-05, + "loss": 0.0084, + "step": 725330 + }, + { + "epoch": 1.88, + "learning_rate": 1.7972113712183854e-05, + "loss": 0.0115, + "step": 725340 + }, + { + "epoch": 1.88, + "learning_rate": 1.796822549581239e-05, + "loss": 0.0088, + "step": 725350 + }, + { + "epoch": 1.88, + "learning_rate": 1.7964337279440924e-05, + "loss": 0.0076, + "step": 725360 + }, + { + "epoch": 1.88, + "learning_rate": 1.7960449063069462e-05, + "loss": 0.0051, + "step": 725370 + }, + { + "epoch": 1.88, + "learning_rate": 1.7956560846697994e-05, + "loss": 0.0071, + "step": 725380 + }, + { + "epoch": 1.88, + "learning_rate": 1.795267263032653e-05, + "loss": 0.0072, + "step": 725390 + }, + { + "epoch": 1.88, + "learning_rate": 1.7948784413955067e-05, + "loss": 0.0072, + "step": 725400 + }, + { + "epoch": 1.88, + "learning_rate": 1.7944896197583602e-05, + "loss": 0.0076, + "step": 725410 + }, + { + "epoch": 1.88, + "learning_rate": 1.7941007981212137e-05, + "loss": 0.0071, + "step": 725420 + }, + { + "epoch": 1.88, + "learning_rate": 1.793711976484067e-05, + "loss": 0.0096, + "step": 725430 + }, + { + "epoch": 1.88, + "learning_rate": 1.7933231548469206e-05, + "loss": 0.0066, + "step": 725440 + }, + { + "epoch": 1.88, + "learning_rate": 1.792934333209774e-05, + "loss": 0.006, + "step": 725450 + }, + { + "epoch": 1.88, + "learning_rate": 1.792545511572628e-05, + "loss": 0.007, + "step": 725460 + }, + { + "epoch": 1.88, + "learning_rate": 1.7921566899354814e-05, + "loss": 0.0071, + "step": 725470 + }, + { + "epoch": 1.88, + "learning_rate": 1.791767868298335e-05, + "loss": 0.0074, + "step": 725480 + }, + { + "epoch": 1.88, + "learning_rate": 1.7913790466611884e-05, + "loss": 0.0069, + "step": 725490 + }, + { + "epoch": 1.88, + "learning_rate": 1.790990225024042e-05, + "loss": 0.0051, + "step": 725500 + }, + { + "epoch": 1.88, + "learning_rate": 1.7906014033868954e-05, + "loss": 0.0066, + "step": 725510 + }, + { + "epoch": 1.88, + "learning_rate": 1.790212581749749e-05, + "loss": 0.0086, + "step": 725520 + }, + { + "epoch": 1.88, + "learning_rate": 1.7898237601126027e-05, + "loss": 0.006, + "step": 725530 + }, + { + "epoch": 1.88, + "learning_rate": 1.7894349384754562e-05, + "loss": 0.0101, + "step": 725540 + }, + { + "epoch": 1.88, + "learning_rate": 1.7890461168383097e-05, + "loss": 0.0082, + "step": 725550 + }, + { + "epoch": 1.88, + "learning_rate": 1.788657295201163e-05, + "loss": 0.0069, + "step": 725560 + }, + { + "epoch": 1.88, + "learning_rate": 1.7882684735640166e-05, + "loss": 0.0066, + "step": 725570 + }, + { + "epoch": 1.88, + "learning_rate": 1.78787965192687e-05, + "loss": 0.0065, + "step": 725580 + }, + { + "epoch": 1.88, + "learning_rate": 1.787490830289724e-05, + "loss": 0.0078, + "step": 725590 + }, + { + "epoch": 1.88, + "learning_rate": 1.7871020086525774e-05, + "loss": 0.0057, + "step": 725600 + }, + { + "epoch": 1.88, + "learning_rate": 1.786713187015431e-05, + "loss": 0.0062, + "step": 725610 + }, + { + "epoch": 1.88, + "learning_rate": 1.7863243653782844e-05, + "loss": 0.0064, + "step": 725620 + }, + { + "epoch": 1.88, + "learning_rate": 1.785935543741138e-05, + "loss": 0.0081, + "step": 725630 + }, + { + "epoch": 1.88, + "learning_rate": 1.7855467221039914e-05, + "loss": 0.0079, + "step": 725640 + }, + { + "epoch": 1.88, + "learning_rate": 1.785157900466845e-05, + "loss": 0.0105, + "step": 725650 + }, + { + "epoch": 1.88, + "learning_rate": 1.7847690788296987e-05, + "loss": 0.0049, + "step": 725660 + }, + { + "epoch": 1.88, + "learning_rate": 1.7843802571925522e-05, + "loss": 0.0085, + "step": 725670 + }, + { + "epoch": 1.88, + "learning_rate": 1.7839914355554057e-05, + "loss": 0.0062, + "step": 725680 + }, + { + "epoch": 1.88, + "learning_rate": 1.783602613918259e-05, + "loss": 0.0075, + "step": 725690 + }, + { + "epoch": 1.88, + "learning_rate": 1.7832137922811126e-05, + "loss": 0.0077, + "step": 725700 + }, + { + "epoch": 1.88, + "learning_rate": 1.782824970643966e-05, + "loss": 0.0046, + "step": 725710 + }, + { + "epoch": 1.88, + "learning_rate": 1.78243614900682e-05, + "loss": 0.0054, + "step": 725720 + }, + { + "epoch": 1.88, + "learning_rate": 1.7820473273696734e-05, + "loss": 0.005, + "step": 725730 + }, + { + "epoch": 1.88, + "learning_rate": 1.781658505732527e-05, + "loss": 0.0094, + "step": 725740 + }, + { + "epoch": 1.88, + "learning_rate": 1.7812696840953804e-05, + "loss": 0.0137, + "step": 725750 + }, + { + "epoch": 1.88, + "learning_rate": 1.780880862458234e-05, + "loss": 0.0082, + "step": 725760 + }, + { + "epoch": 1.88, + "learning_rate": 1.7804920408210874e-05, + "loss": 0.0055, + "step": 725770 + }, + { + "epoch": 1.88, + "learning_rate": 1.780103219183941e-05, + "loss": 0.0065, + "step": 725780 + }, + { + "epoch": 1.88, + "learning_rate": 1.7797143975467947e-05, + "loss": 0.0045, + "step": 725790 + }, + { + "epoch": 1.88, + "learning_rate": 1.7793255759096482e-05, + "loss": 0.0093, + "step": 725800 + }, + { + "epoch": 1.88, + "learning_rate": 1.7789367542725017e-05, + "loss": 0.0061, + "step": 725810 + }, + { + "epoch": 1.88, + "learning_rate": 1.778547932635355e-05, + "loss": 0.006, + "step": 725820 + }, + { + "epoch": 1.88, + "learning_rate": 1.7781591109982086e-05, + "loss": 0.0072, + "step": 725830 + }, + { + "epoch": 1.88, + "learning_rate": 1.777770289361062e-05, + "loss": 0.0073, + "step": 725840 + }, + { + "epoch": 1.88, + "learning_rate": 1.777381467723916e-05, + "loss": 0.0083, + "step": 725850 + }, + { + "epoch": 1.88, + "learning_rate": 1.7769926460867694e-05, + "loss": 0.0078, + "step": 725860 + }, + { + "epoch": 1.88, + "learning_rate": 1.7766038244496226e-05, + "loss": 0.0118, + "step": 725870 + }, + { + "epoch": 1.88, + "learning_rate": 1.7762150028124764e-05, + "loss": 0.0052, + "step": 725880 + }, + { + "epoch": 1.88, + "learning_rate": 1.77582618117533e-05, + "loss": 0.0064, + "step": 725890 + }, + { + "epoch": 1.88, + "learning_rate": 1.7754373595381834e-05, + "loss": 0.0066, + "step": 725900 + }, + { + "epoch": 1.88, + "learning_rate": 1.775048537901037e-05, + "loss": 0.01, + "step": 725910 + }, + { + "epoch": 1.88, + "learning_rate": 1.7746597162638907e-05, + "loss": 0.0086, + "step": 725920 + }, + { + "epoch": 1.88, + "learning_rate": 1.774270894626744e-05, + "loss": 0.009, + "step": 725930 + }, + { + "epoch": 1.88, + "learning_rate": 1.7738820729895977e-05, + "loss": 0.0088, + "step": 725940 + }, + { + "epoch": 1.88, + "learning_rate": 1.773493251352451e-05, + "loss": 0.0071, + "step": 725950 + }, + { + "epoch": 1.88, + "learning_rate": 1.7731044297153046e-05, + "loss": 0.01, + "step": 725960 + }, + { + "epoch": 1.88, + "learning_rate": 1.772715608078158e-05, + "loss": 0.0065, + "step": 725970 + }, + { + "epoch": 1.88, + "learning_rate": 1.772326786441012e-05, + "loss": 0.0077, + "step": 725980 + }, + { + "epoch": 1.88, + "learning_rate": 1.7719379648038654e-05, + "loss": 0.0061, + "step": 725990 + }, + { + "epoch": 1.88, + "learning_rate": 1.7715491431667186e-05, + "loss": 0.0098, + "step": 726000 + }, + { + "epoch": 1.88, + "eval_cer": 0.88167329394755, + "eval_loss": 0.004557341802865267, + "eval_runtime": 107.9128, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 726000 + }, + { + "epoch": 1.88, + "learning_rate": 1.7711603215295724e-05, + "loss": 0.0057, + "step": 726010 + }, + { + "epoch": 1.88, + "learning_rate": 1.770771499892426e-05, + "loss": 0.011, + "step": 726020 + }, + { + "epoch": 1.88, + "learning_rate": 1.7703826782552794e-05, + "loss": 0.0065, + "step": 726030 + }, + { + "epoch": 1.88, + "learning_rate": 1.769993856618133e-05, + "loss": 0.0106, + "step": 726040 + }, + { + "epoch": 1.88, + "learning_rate": 1.7696050349809867e-05, + "loss": 0.0054, + "step": 726050 + }, + { + "epoch": 1.88, + "learning_rate": 1.76921621334384e-05, + "loss": 0.0062, + "step": 726060 + }, + { + "epoch": 1.88, + "learning_rate": 1.7688273917066933e-05, + "loss": 0.0056, + "step": 726070 + }, + { + "epoch": 1.88, + "learning_rate": 1.768438570069547e-05, + "loss": 0.0085, + "step": 726080 + }, + { + "epoch": 1.88, + "learning_rate": 1.7680497484324006e-05, + "loss": 0.0054, + "step": 726090 + }, + { + "epoch": 1.88, + "learning_rate": 1.767660926795254e-05, + "loss": 0.0102, + "step": 726100 + }, + { + "epoch": 1.88, + "learning_rate": 1.7672721051581076e-05, + "loss": 0.0058, + "step": 726110 + }, + { + "epoch": 1.88, + "learning_rate": 1.766883283520961e-05, + "loss": 0.007, + "step": 726120 + }, + { + "epoch": 1.88, + "learning_rate": 1.7664944618838146e-05, + "loss": 0.0077, + "step": 726130 + }, + { + "epoch": 1.88, + "learning_rate": 1.7661056402466684e-05, + "loss": 0.0091, + "step": 726140 + }, + { + "epoch": 1.88, + "learning_rate": 1.765716818609522e-05, + "loss": 0.0083, + "step": 726150 + }, + { + "epoch": 1.88, + "learning_rate": 1.7653279969723754e-05, + "loss": 0.0086, + "step": 726160 + }, + { + "epoch": 1.88, + "learning_rate": 1.764939175335229e-05, + "loss": 0.0084, + "step": 726170 + }, + { + "epoch": 1.88, + "learning_rate": 1.7645503536980823e-05, + "loss": 0.0097, + "step": 726180 + }, + { + "epoch": 1.88, + "learning_rate": 1.764161532060936e-05, + "loss": 0.009, + "step": 726190 + }, + { + "epoch": 1.88, + "learning_rate": 1.7637727104237893e-05, + "loss": 0.0081, + "step": 726200 + }, + { + "epoch": 1.88, + "learning_rate": 1.763383888786643e-05, + "loss": 0.008, + "step": 726210 + }, + { + "epoch": 1.88, + "learning_rate": 1.7629950671494966e-05, + "loss": 0.0088, + "step": 726220 + }, + { + "epoch": 1.88, + "learning_rate": 1.76260624551235e-05, + "loss": 0.0072, + "step": 726230 + }, + { + "epoch": 1.88, + "learning_rate": 1.7622174238752036e-05, + "loss": 0.0059, + "step": 726240 + }, + { + "epoch": 1.88, + "learning_rate": 1.761828602238057e-05, + "loss": 0.0067, + "step": 726250 + }, + { + "epoch": 1.88, + "learning_rate": 1.7614397806009106e-05, + "loss": 0.01, + "step": 726260 + }, + { + "epoch": 1.88, + "learning_rate": 1.7610509589637644e-05, + "loss": 0.0082, + "step": 726270 + }, + { + "epoch": 1.88, + "learning_rate": 1.760662137326618e-05, + "loss": 0.0064, + "step": 726280 + }, + { + "epoch": 1.88, + "learning_rate": 1.7602733156894714e-05, + "loss": 0.0063, + "step": 726290 + }, + { + "epoch": 1.88, + "learning_rate": 1.759884494052325e-05, + "loss": 0.0063, + "step": 726300 + }, + { + "epoch": 1.88, + "learning_rate": 1.7594956724151783e-05, + "loss": 0.008, + "step": 726310 + }, + { + "epoch": 1.88, + "learning_rate": 1.759106850778032e-05, + "loss": 0.0094, + "step": 726320 + }, + { + "epoch": 1.88, + "learning_rate": 1.7587180291408853e-05, + "loss": 0.0063, + "step": 726330 + }, + { + "epoch": 1.88, + "learning_rate": 1.758329207503739e-05, + "loss": 0.0089, + "step": 726340 + }, + { + "epoch": 1.88, + "learning_rate": 1.7579403858665926e-05, + "loss": 0.0059, + "step": 726350 + }, + { + "epoch": 1.88, + "learning_rate": 1.757551564229446e-05, + "loss": 0.0064, + "step": 726360 + }, + { + "epoch": 1.88, + "learning_rate": 1.7571627425922996e-05, + "loss": 0.0058, + "step": 726370 + }, + { + "epoch": 1.88, + "learning_rate": 1.756773920955153e-05, + "loss": 0.0086, + "step": 726380 + }, + { + "epoch": 1.88, + "learning_rate": 1.7563850993180066e-05, + "loss": 0.0104, + "step": 726390 + }, + { + "epoch": 1.88, + "learning_rate": 1.7559962776808604e-05, + "loss": 0.0089, + "step": 726400 + }, + { + "epoch": 1.88, + "learning_rate": 1.755607456043714e-05, + "loss": 0.0082, + "step": 726410 + }, + { + "epoch": 1.88, + "learning_rate": 1.7552186344065674e-05, + "loss": 0.0051, + "step": 726420 + }, + { + "epoch": 1.88, + "learning_rate": 1.754829812769421e-05, + "loss": 0.0067, + "step": 726430 + }, + { + "epoch": 1.88, + "learning_rate": 1.7544409911322743e-05, + "loss": 0.0062, + "step": 726440 + }, + { + "epoch": 1.88, + "learning_rate": 1.7540521694951278e-05, + "loss": 0.0114, + "step": 726450 + }, + { + "epoch": 1.88, + "learning_rate": 1.7536633478579813e-05, + "loss": 0.0067, + "step": 726460 + }, + { + "epoch": 1.88, + "learning_rate": 1.753274526220835e-05, + "loss": 0.0085, + "step": 726470 + }, + { + "epoch": 1.88, + "learning_rate": 1.7528857045836886e-05, + "loss": 0.0072, + "step": 726480 + }, + { + "epoch": 1.88, + "learning_rate": 1.752496882946542e-05, + "loss": 0.0084, + "step": 726490 + }, + { + "epoch": 1.88, + "learning_rate": 1.7521080613093956e-05, + "loss": 0.0067, + "step": 726500 + }, + { + "epoch": 1.88, + "learning_rate": 1.751719239672249e-05, + "loss": 0.0081, + "step": 726510 + }, + { + "epoch": 1.88, + "learning_rate": 1.7513304180351026e-05, + "loss": 0.0057, + "step": 726520 + }, + { + "epoch": 1.88, + "learning_rate": 1.7509415963979564e-05, + "loss": 0.0068, + "step": 726530 + }, + { + "epoch": 1.88, + "learning_rate": 1.75055277476081e-05, + "loss": 0.0049, + "step": 726540 + }, + { + "epoch": 1.88, + "learning_rate": 1.750163953123663e-05, + "loss": 0.0096, + "step": 726550 + }, + { + "epoch": 1.88, + "learning_rate": 1.749775131486517e-05, + "loss": 0.0076, + "step": 726560 + }, + { + "epoch": 1.88, + "learning_rate": 1.7493863098493703e-05, + "loss": 0.0082, + "step": 726570 + }, + { + "epoch": 1.88, + "learning_rate": 1.7489974882122238e-05, + "loss": 0.0071, + "step": 726580 + }, + { + "epoch": 1.88, + "learning_rate": 1.7486086665750773e-05, + "loss": 0.0086, + "step": 726590 + }, + { + "epoch": 1.88, + "learning_rate": 1.748219844937931e-05, + "loss": 0.0074, + "step": 726600 + }, + { + "epoch": 1.88, + "learning_rate": 1.7478310233007846e-05, + "loss": 0.0069, + "step": 726610 + }, + { + "epoch": 1.88, + "learning_rate": 1.747442201663638e-05, + "loss": 0.0083, + "step": 726620 + }, + { + "epoch": 1.88, + "learning_rate": 1.7470533800264916e-05, + "loss": 0.0076, + "step": 726630 + }, + { + "epoch": 1.88, + "learning_rate": 1.746664558389345e-05, + "loss": 0.0055, + "step": 726640 + }, + { + "epoch": 1.88, + "learning_rate": 1.7462757367521986e-05, + "loss": 0.008, + "step": 726650 + }, + { + "epoch": 1.88, + "learning_rate": 1.7458869151150524e-05, + "loss": 0.0053, + "step": 726660 + }, + { + "epoch": 1.88, + "learning_rate": 1.745498093477906e-05, + "loss": 0.0107, + "step": 726670 + }, + { + "epoch": 1.88, + "learning_rate": 1.745109271840759e-05, + "loss": 0.0056, + "step": 726680 + }, + { + "epoch": 1.88, + "learning_rate": 1.744720450203613e-05, + "loss": 0.007, + "step": 726690 + }, + { + "epoch": 1.88, + "learning_rate": 1.7443316285664663e-05, + "loss": 0.0062, + "step": 726700 + }, + { + "epoch": 1.88, + "learning_rate": 1.7439428069293198e-05, + "loss": 0.0052, + "step": 726710 + }, + { + "epoch": 1.88, + "learning_rate": 1.7435539852921733e-05, + "loss": 0.0074, + "step": 726720 + }, + { + "epoch": 1.88, + "learning_rate": 1.743165163655027e-05, + "loss": 0.0065, + "step": 726730 + }, + { + "epoch": 1.88, + "learning_rate": 1.7427763420178803e-05, + "loss": 0.006, + "step": 726740 + }, + { + "epoch": 1.88, + "learning_rate": 1.742387520380734e-05, + "loss": 0.0089, + "step": 726750 + }, + { + "epoch": 1.88, + "learning_rate": 1.7419986987435876e-05, + "loss": 0.0055, + "step": 726760 + }, + { + "epoch": 1.88, + "learning_rate": 1.741609877106441e-05, + "loss": 0.0078, + "step": 726770 + }, + { + "epoch": 1.88, + "learning_rate": 1.7412210554692946e-05, + "loss": 0.0062, + "step": 726780 + }, + { + "epoch": 1.88, + "learning_rate": 1.740832233832148e-05, + "loss": 0.008, + "step": 726790 + }, + { + "epoch": 1.88, + "learning_rate": 1.7404434121950015e-05, + "loss": 0.0073, + "step": 726800 + }, + { + "epoch": 1.88, + "learning_rate": 1.740054590557855e-05, + "loss": 0.0076, + "step": 726810 + }, + { + "epoch": 1.88, + "learning_rate": 1.739665768920709e-05, + "loss": 0.0088, + "step": 726820 + }, + { + "epoch": 1.88, + "learning_rate": 1.7392769472835623e-05, + "loss": 0.0053, + "step": 726830 + }, + { + "epoch": 1.88, + "learning_rate": 1.7388881256464158e-05, + "loss": 0.0078, + "step": 726840 + }, + { + "epoch": 1.88, + "learning_rate": 1.7384993040092693e-05, + "loss": 0.0074, + "step": 726850 + }, + { + "epoch": 1.88, + "learning_rate": 1.7381104823721228e-05, + "loss": 0.0063, + "step": 726860 + }, + { + "epoch": 1.88, + "learning_rate": 1.7377216607349763e-05, + "loss": 0.0074, + "step": 726870 + }, + { + "epoch": 1.88, + "learning_rate": 1.7373328390978298e-05, + "loss": 0.0076, + "step": 726880 + }, + { + "epoch": 1.88, + "learning_rate": 1.7369440174606836e-05, + "loss": 0.0072, + "step": 726890 + }, + { + "epoch": 1.88, + "learning_rate": 1.736555195823537e-05, + "loss": 0.0072, + "step": 726900 + }, + { + "epoch": 1.88, + "learning_rate": 1.7361663741863906e-05, + "loss": 0.0067, + "step": 726910 + }, + { + "epoch": 1.88, + "learning_rate": 1.735777552549244e-05, + "loss": 0.0064, + "step": 726920 + }, + { + "epoch": 1.88, + "learning_rate": 1.7353887309120975e-05, + "loss": 0.0055, + "step": 726930 + }, + { + "epoch": 1.88, + "learning_rate": 1.734999909274951e-05, + "loss": 0.0074, + "step": 726940 + }, + { + "epoch": 1.88, + "learning_rate": 1.734611087637805e-05, + "loss": 0.006, + "step": 726950 + }, + { + "epoch": 1.88, + "learning_rate": 1.7342222660006583e-05, + "loss": 0.0094, + "step": 726960 + }, + { + "epoch": 1.88, + "learning_rate": 1.7338334443635118e-05, + "loss": 0.0047, + "step": 726970 + }, + { + "epoch": 1.88, + "learning_rate": 1.7334446227263653e-05, + "loss": 0.0091, + "step": 726980 + }, + { + "epoch": 1.88, + "learning_rate": 1.7330558010892188e-05, + "loss": 0.0086, + "step": 726990 + }, + { + "epoch": 1.88, + "learning_rate": 1.7326669794520723e-05, + "loss": 0.0083, + "step": 727000 + }, + { + "epoch": 1.88, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.004555822350084782, + "eval_runtime": 107.8877, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.634, + "step": 727000 + }, + { + "epoch": 1.88, + "learning_rate": 1.7322781578149258e-05, + "loss": 0.007, + "step": 727010 + }, + { + "epoch": 1.88, + "learning_rate": 1.7318893361777796e-05, + "loss": 0.0041, + "step": 727020 + }, + { + "epoch": 1.88, + "learning_rate": 1.731500514540633e-05, + "loss": 0.0105, + "step": 727030 + }, + { + "epoch": 1.88, + "learning_rate": 1.7311116929034866e-05, + "loss": 0.0072, + "step": 727040 + }, + { + "epoch": 1.88, + "learning_rate": 1.73072287126634e-05, + "loss": 0.008, + "step": 727050 + }, + { + "epoch": 1.88, + "learning_rate": 1.7303340496291935e-05, + "loss": 0.0062, + "step": 727060 + }, + { + "epoch": 1.88, + "learning_rate": 1.729945227992047e-05, + "loss": 0.0072, + "step": 727070 + }, + { + "epoch": 1.88, + "learning_rate": 1.729556406354901e-05, + "loss": 0.0107, + "step": 727080 + }, + { + "epoch": 1.88, + "learning_rate": 1.7291675847177543e-05, + "loss": 0.0055, + "step": 727090 + }, + { + "epoch": 1.88, + "learning_rate": 1.7287787630806078e-05, + "loss": 0.0059, + "step": 727100 + }, + { + "epoch": 1.88, + "learning_rate": 1.7283899414434613e-05, + "loss": 0.0108, + "step": 727110 + }, + { + "epoch": 1.88, + "learning_rate": 1.7280011198063148e-05, + "loss": 0.0078, + "step": 727120 + }, + { + "epoch": 1.88, + "learning_rate": 1.7276122981691683e-05, + "loss": 0.0081, + "step": 727130 + }, + { + "epoch": 1.88, + "learning_rate": 1.7272234765320218e-05, + "loss": 0.0069, + "step": 727140 + }, + { + "epoch": 1.88, + "learning_rate": 1.7268346548948756e-05, + "loss": 0.0057, + "step": 727150 + }, + { + "epoch": 1.88, + "learning_rate": 1.726445833257729e-05, + "loss": 0.0058, + "step": 727160 + }, + { + "epoch": 1.88, + "learning_rate": 1.7260570116205826e-05, + "loss": 0.0056, + "step": 727170 + }, + { + "epoch": 1.88, + "learning_rate": 1.725668189983436e-05, + "loss": 0.0073, + "step": 727180 + }, + { + "epoch": 1.88, + "learning_rate": 1.7252793683462895e-05, + "loss": 0.0047, + "step": 727190 + }, + { + "epoch": 1.89, + "learning_rate": 1.724890546709143e-05, + "loss": 0.005, + "step": 727200 + }, + { + "epoch": 1.89, + "learning_rate": 1.724501725071997e-05, + "loss": 0.0082, + "step": 727210 + }, + { + "epoch": 1.89, + "learning_rate": 1.7241129034348503e-05, + "loss": 0.0098, + "step": 727220 + }, + { + "epoch": 1.89, + "learning_rate": 1.7237240817977038e-05, + "loss": 0.0093, + "step": 727230 + }, + { + "epoch": 1.89, + "learning_rate": 1.7233352601605573e-05, + "loss": 0.0064, + "step": 727240 + }, + { + "epoch": 1.89, + "learning_rate": 1.7229464385234108e-05, + "loss": 0.0095, + "step": 727250 + }, + { + "epoch": 1.89, + "learning_rate": 1.7225576168862643e-05, + "loss": 0.0071, + "step": 727260 + }, + { + "epoch": 1.89, + "learning_rate": 1.7221687952491178e-05, + "loss": 0.0056, + "step": 727270 + }, + { + "epoch": 1.89, + "learning_rate": 1.7217799736119716e-05, + "loss": 0.0059, + "step": 727280 + }, + { + "epoch": 1.89, + "learning_rate": 1.721391151974825e-05, + "loss": 0.0063, + "step": 727290 + }, + { + "epoch": 1.89, + "learning_rate": 1.7210023303376786e-05, + "loss": 0.0077, + "step": 727300 + }, + { + "epoch": 1.89, + "learning_rate": 1.720613508700532e-05, + "loss": 0.006, + "step": 727310 + }, + { + "epoch": 1.89, + "learning_rate": 1.7202246870633855e-05, + "loss": 0.0096, + "step": 727320 + }, + { + "epoch": 1.89, + "learning_rate": 1.719835865426239e-05, + "loss": 0.0082, + "step": 727330 + }, + { + "epoch": 1.89, + "learning_rate": 1.719447043789093e-05, + "loss": 0.0109, + "step": 727340 + }, + { + "epoch": 1.89, + "learning_rate": 1.7190582221519463e-05, + "loss": 0.0096, + "step": 727350 + }, + { + "epoch": 1.89, + "learning_rate": 1.7186694005147995e-05, + "loss": 0.0062, + "step": 727360 + }, + { + "epoch": 1.89, + "learning_rate": 1.7182805788776533e-05, + "loss": 0.0041, + "step": 727370 + }, + { + "epoch": 1.89, + "learning_rate": 1.7178917572405068e-05, + "loss": 0.0059, + "step": 727380 + }, + { + "epoch": 1.89, + "learning_rate": 1.7175029356033603e-05, + "loss": 0.007, + "step": 727390 + }, + { + "epoch": 1.89, + "learning_rate": 1.7171141139662138e-05, + "loss": 0.0071, + "step": 727400 + }, + { + "epoch": 1.89, + "learning_rate": 1.7167252923290676e-05, + "loss": 0.0063, + "step": 727410 + }, + { + "epoch": 1.89, + "learning_rate": 1.7163364706919207e-05, + "loss": 0.0079, + "step": 727420 + }, + { + "epoch": 1.89, + "learning_rate": 1.7159476490547746e-05, + "loss": 0.0081, + "step": 727430 + }, + { + "epoch": 1.89, + "learning_rate": 1.715558827417628e-05, + "loss": 0.0065, + "step": 727440 + }, + { + "epoch": 1.89, + "learning_rate": 1.7151700057804815e-05, + "loss": 0.0104, + "step": 727450 + }, + { + "epoch": 1.89, + "learning_rate": 1.714781184143335e-05, + "loss": 0.0077, + "step": 727460 + }, + { + "epoch": 1.89, + "learning_rate": 1.7143923625061885e-05, + "loss": 0.0042, + "step": 727470 + }, + { + "epoch": 1.89, + "learning_rate": 1.714003540869042e-05, + "loss": 0.0077, + "step": 727480 + }, + { + "epoch": 1.89, + "learning_rate": 1.7136147192318955e-05, + "loss": 0.0073, + "step": 727490 + }, + { + "epoch": 1.89, + "learning_rate": 1.7132258975947493e-05, + "loss": 0.0041, + "step": 727500 + }, + { + "epoch": 1.89, + "learning_rate": 1.7128370759576028e-05, + "loss": 0.0084, + "step": 727510 + }, + { + "epoch": 1.89, + "learning_rate": 1.7124482543204563e-05, + "loss": 0.0103, + "step": 727520 + }, + { + "epoch": 1.89, + "learning_rate": 1.7120594326833098e-05, + "loss": 0.0091, + "step": 727530 + }, + { + "epoch": 1.89, + "learning_rate": 1.7116706110461636e-05, + "loss": 0.0108, + "step": 727540 + }, + { + "epoch": 1.89, + "learning_rate": 1.7112817894090167e-05, + "loss": 0.0061, + "step": 727550 + }, + { + "epoch": 1.89, + "learning_rate": 1.7108929677718702e-05, + "loss": 0.008, + "step": 727560 + }, + { + "epoch": 1.89, + "learning_rate": 1.710504146134724e-05, + "loss": 0.007, + "step": 727570 + }, + { + "epoch": 1.89, + "learning_rate": 1.7101153244975775e-05, + "loss": 0.0071, + "step": 727580 + }, + { + "epoch": 1.89, + "learning_rate": 1.709726502860431e-05, + "loss": 0.0074, + "step": 727590 + }, + { + "epoch": 1.89, + "learning_rate": 1.7093376812232845e-05, + "loss": 0.0061, + "step": 727600 + }, + { + "epoch": 1.89, + "learning_rate": 1.708948859586138e-05, + "loss": 0.0074, + "step": 727610 + }, + { + "epoch": 1.89, + "learning_rate": 1.7085600379489915e-05, + "loss": 0.0071, + "step": 727620 + }, + { + "epoch": 1.89, + "learning_rate": 1.7081712163118453e-05, + "loss": 0.0078, + "step": 727630 + }, + { + "epoch": 1.89, + "learning_rate": 1.7077823946746988e-05, + "loss": 0.0062, + "step": 727640 + }, + { + "epoch": 1.89, + "learning_rate": 1.7073935730375523e-05, + "loss": 0.0076, + "step": 727650 + }, + { + "epoch": 1.89, + "learning_rate": 1.7070047514004058e-05, + "loss": 0.007, + "step": 727660 + }, + { + "epoch": 1.89, + "learning_rate": 1.7066159297632592e-05, + "loss": 0.007, + "step": 727670 + }, + { + "epoch": 1.89, + "learning_rate": 1.7062271081261127e-05, + "loss": 0.0071, + "step": 727680 + }, + { + "epoch": 1.89, + "learning_rate": 1.7058382864889662e-05, + "loss": 0.0057, + "step": 727690 + }, + { + "epoch": 1.89, + "learning_rate": 1.70544946485182e-05, + "loss": 0.0079, + "step": 727700 + }, + { + "epoch": 1.89, + "learning_rate": 1.7050606432146735e-05, + "loss": 0.0065, + "step": 727710 + }, + { + "epoch": 1.89, + "learning_rate": 1.704671821577527e-05, + "loss": 0.0071, + "step": 727720 + }, + { + "epoch": 1.89, + "learning_rate": 1.7042829999403805e-05, + "loss": 0.0063, + "step": 727730 + }, + { + "epoch": 1.89, + "learning_rate": 1.703894178303234e-05, + "loss": 0.0086, + "step": 727740 + }, + { + "epoch": 1.89, + "learning_rate": 1.7035053566660875e-05, + "loss": 0.0093, + "step": 727750 + }, + { + "epoch": 1.89, + "learning_rate": 1.7031165350289413e-05, + "loss": 0.0055, + "step": 727760 + }, + { + "epoch": 1.89, + "learning_rate": 1.7027277133917948e-05, + "loss": 0.0069, + "step": 727770 + }, + { + "epoch": 1.89, + "learning_rate": 1.7023388917546483e-05, + "loss": 0.0073, + "step": 727780 + }, + { + "epoch": 1.89, + "learning_rate": 1.7019500701175018e-05, + "loss": 0.0088, + "step": 727790 + }, + { + "epoch": 1.89, + "learning_rate": 1.7015612484803552e-05, + "loss": 0.0063, + "step": 727800 + }, + { + "epoch": 1.89, + "learning_rate": 1.7011724268432087e-05, + "loss": 0.0086, + "step": 727810 + }, + { + "epoch": 1.89, + "learning_rate": 1.7007836052060622e-05, + "loss": 0.0066, + "step": 727820 + }, + { + "epoch": 1.89, + "learning_rate": 1.700394783568916e-05, + "loss": 0.0051, + "step": 727830 + }, + { + "epoch": 1.89, + "learning_rate": 1.7000059619317695e-05, + "loss": 0.0079, + "step": 727840 + }, + { + "epoch": 1.89, + "learning_rate": 1.699617140294623e-05, + "loss": 0.0089, + "step": 727850 + }, + { + "epoch": 1.89, + "learning_rate": 1.6992283186574765e-05, + "loss": 0.0081, + "step": 727860 + }, + { + "epoch": 1.89, + "learning_rate": 1.69883949702033e-05, + "loss": 0.0107, + "step": 727870 + }, + { + "epoch": 1.89, + "learning_rate": 1.6984506753831835e-05, + "loss": 0.0073, + "step": 727880 + }, + { + "epoch": 1.89, + "learning_rate": 1.6980618537460373e-05, + "loss": 0.0066, + "step": 727890 + }, + { + "epoch": 1.89, + "learning_rate": 1.6976730321088908e-05, + "loss": 0.0061, + "step": 727900 + }, + { + "epoch": 1.89, + "learning_rate": 1.6972842104717443e-05, + "loss": 0.0067, + "step": 727910 + }, + { + "epoch": 1.89, + "learning_rate": 1.6968953888345977e-05, + "loss": 0.0096, + "step": 727920 + }, + { + "epoch": 1.89, + "learning_rate": 1.6965065671974512e-05, + "loss": 0.0065, + "step": 727930 + }, + { + "epoch": 1.89, + "learning_rate": 1.6961177455603047e-05, + "loss": 0.0053, + "step": 727940 + }, + { + "epoch": 1.89, + "learning_rate": 1.6957289239231582e-05, + "loss": 0.0078, + "step": 727950 + }, + { + "epoch": 1.89, + "learning_rate": 1.695340102286012e-05, + "loss": 0.0081, + "step": 727960 + }, + { + "epoch": 1.89, + "learning_rate": 1.6949512806488655e-05, + "loss": 0.0069, + "step": 727970 + }, + { + "epoch": 1.89, + "learning_rate": 1.694562459011719e-05, + "loss": 0.0066, + "step": 727980 + }, + { + "epoch": 1.89, + "learning_rate": 1.6941736373745725e-05, + "loss": 0.006, + "step": 727990 + }, + { + "epoch": 1.89, + "learning_rate": 1.693784815737426e-05, + "loss": 0.0083, + "step": 728000 + }, + { + "epoch": 1.89, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.004557101055979729, + "eval_runtime": 107.9878, + "eval_samples_per_second": 18.521, + "eval_steps_per_second": 4.63, + "step": 728000 + }, + { + "epoch": 1.89, + "learning_rate": 1.6933959941002795e-05, + "loss": 0.0058, + "step": 728010 + }, + { + "epoch": 1.89, + "learning_rate": 1.6930071724631333e-05, + "loss": 0.0069, + "step": 728020 + }, + { + "epoch": 1.89, + "learning_rate": 1.6926183508259868e-05, + "loss": 0.0079, + "step": 728030 + }, + { + "epoch": 1.89, + "learning_rate": 1.69222952918884e-05, + "loss": 0.0083, + "step": 728040 + }, + { + "epoch": 1.89, + "learning_rate": 1.6918407075516937e-05, + "loss": 0.0102, + "step": 728050 + }, + { + "epoch": 1.89, + "learning_rate": 1.6914518859145472e-05, + "loss": 0.0055, + "step": 728060 + }, + { + "epoch": 1.89, + "learning_rate": 1.6910630642774007e-05, + "loss": 0.0071, + "step": 728070 + }, + { + "epoch": 1.89, + "learning_rate": 1.6906742426402542e-05, + "loss": 0.0076, + "step": 728080 + }, + { + "epoch": 1.89, + "learning_rate": 1.690285421003108e-05, + "loss": 0.0068, + "step": 728090 + }, + { + "epoch": 1.89, + "learning_rate": 1.6898965993659612e-05, + "loss": 0.0075, + "step": 728100 + }, + { + "epoch": 1.89, + "learning_rate": 1.689507777728815e-05, + "loss": 0.0055, + "step": 728110 + }, + { + "epoch": 1.89, + "learning_rate": 1.6891189560916685e-05, + "loss": 0.0073, + "step": 728120 + }, + { + "epoch": 1.89, + "learning_rate": 1.688730134454522e-05, + "loss": 0.0073, + "step": 728130 + }, + { + "epoch": 1.89, + "learning_rate": 1.6883413128173755e-05, + "loss": 0.0094, + "step": 728140 + }, + { + "epoch": 1.89, + "learning_rate": 1.687952491180229e-05, + "loss": 0.0075, + "step": 728150 + }, + { + "epoch": 1.89, + "learning_rate": 1.6875636695430828e-05, + "loss": 0.0066, + "step": 728160 + }, + { + "epoch": 1.89, + "learning_rate": 1.687174847905936e-05, + "loss": 0.0063, + "step": 728170 + }, + { + "epoch": 1.89, + "learning_rate": 1.6867860262687897e-05, + "loss": 0.0088, + "step": 728180 + }, + { + "epoch": 1.89, + "learning_rate": 1.6863972046316432e-05, + "loss": 0.0058, + "step": 728190 + }, + { + "epoch": 1.89, + "learning_rate": 1.6860083829944967e-05, + "loss": 0.0059, + "step": 728200 + }, + { + "epoch": 1.89, + "learning_rate": 1.6856195613573502e-05, + "loss": 0.0054, + "step": 728210 + }, + { + "epoch": 1.89, + "learning_rate": 1.685230739720204e-05, + "loss": 0.0107, + "step": 728220 + }, + { + "epoch": 1.89, + "learning_rate": 1.6848419180830572e-05, + "loss": 0.0136, + "step": 728230 + }, + { + "epoch": 1.89, + "learning_rate": 1.6844530964459107e-05, + "loss": 0.0065, + "step": 728240 + }, + { + "epoch": 1.89, + "learning_rate": 1.6840642748087645e-05, + "loss": 0.0075, + "step": 728250 + }, + { + "epoch": 1.89, + "learning_rate": 1.683675453171618e-05, + "loss": 0.0086, + "step": 728260 + }, + { + "epoch": 1.89, + "learning_rate": 1.6832866315344715e-05, + "loss": 0.0101, + "step": 728270 + }, + { + "epoch": 1.89, + "learning_rate": 1.682897809897325e-05, + "loss": 0.0084, + "step": 728280 + }, + { + "epoch": 1.89, + "learning_rate": 1.6825089882601784e-05, + "loss": 0.0087, + "step": 728290 + }, + { + "epoch": 1.89, + "learning_rate": 1.682120166623032e-05, + "loss": 0.0107, + "step": 728300 + }, + { + "epoch": 1.89, + "learning_rate": 1.6817313449858857e-05, + "loss": 0.0084, + "step": 728310 + }, + { + "epoch": 1.89, + "learning_rate": 1.6813425233487392e-05, + "loss": 0.0069, + "step": 728320 + }, + { + "epoch": 1.89, + "learning_rate": 1.6809537017115927e-05, + "loss": 0.0064, + "step": 728330 + }, + { + "epoch": 1.89, + "learning_rate": 1.6805648800744462e-05, + "loss": 0.0061, + "step": 728340 + }, + { + "epoch": 1.89, + "learning_rate": 1.6801760584372997e-05, + "loss": 0.0085, + "step": 728350 + }, + { + "epoch": 1.89, + "learning_rate": 1.6797872368001532e-05, + "loss": 0.0073, + "step": 728360 + }, + { + "epoch": 1.89, + "learning_rate": 1.6793984151630067e-05, + "loss": 0.0078, + "step": 728370 + }, + { + "epoch": 1.89, + "learning_rate": 1.6790095935258605e-05, + "loss": 0.0054, + "step": 728380 + }, + { + "epoch": 1.89, + "learning_rate": 1.678620771888714e-05, + "loss": 0.0073, + "step": 728390 + }, + { + "epoch": 1.89, + "learning_rate": 1.6782319502515675e-05, + "loss": 0.0084, + "step": 728400 + }, + { + "epoch": 1.89, + "learning_rate": 1.677843128614421e-05, + "loss": 0.0088, + "step": 728410 + }, + { + "epoch": 1.89, + "learning_rate": 1.6774543069772744e-05, + "loss": 0.0067, + "step": 728420 + }, + { + "epoch": 1.89, + "learning_rate": 1.677065485340128e-05, + "loss": 0.0058, + "step": 728430 + }, + { + "epoch": 1.89, + "learning_rate": 1.6766766637029817e-05, + "loss": 0.0078, + "step": 728440 + }, + { + "epoch": 1.89, + "learning_rate": 1.6762878420658352e-05, + "loss": 0.0058, + "step": 728450 + }, + { + "epoch": 1.89, + "learning_rate": 1.6758990204286887e-05, + "loss": 0.0057, + "step": 728460 + }, + { + "epoch": 1.89, + "learning_rate": 1.6755101987915422e-05, + "loss": 0.0073, + "step": 728470 + }, + { + "epoch": 1.89, + "learning_rate": 1.6751213771543957e-05, + "loss": 0.0074, + "step": 728480 + }, + { + "epoch": 1.89, + "learning_rate": 1.674732555517249e-05, + "loss": 0.0115, + "step": 728490 + }, + { + "epoch": 1.89, + "learning_rate": 1.6743437338801027e-05, + "loss": 0.006, + "step": 728500 + }, + { + "epoch": 1.89, + "learning_rate": 1.6739549122429565e-05, + "loss": 0.0069, + "step": 728510 + }, + { + "epoch": 1.89, + "learning_rate": 1.67356609060581e-05, + "loss": 0.005, + "step": 728520 + }, + { + "epoch": 1.89, + "learning_rate": 1.6731772689686635e-05, + "loss": 0.0088, + "step": 728530 + }, + { + "epoch": 1.89, + "learning_rate": 1.672788447331517e-05, + "loss": 0.0068, + "step": 728540 + }, + { + "epoch": 1.89, + "learning_rate": 1.6723996256943704e-05, + "loss": 0.0081, + "step": 728550 + }, + { + "epoch": 1.89, + "learning_rate": 1.672010804057224e-05, + "loss": 0.0069, + "step": 728560 + }, + { + "epoch": 1.89, + "learning_rate": 1.6716219824200777e-05, + "loss": 0.0083, + "step": 728570 + }, + { + "epoch": 1.89, + "learning_rate": 1.6712331607829312e-05, + "loss": 0.0071, + "step": 728580 + }, + { + "epoch": 1.89, + "learning_rate": 1.6708443391457847e-05, + "loss": 0.0071, + "step": 728590 + }, + { + "epoch": 1.89, + "learning_rate": 1.6704555175086382e-05, + "loss": 0.0065, + "step": 728600 + }, + { + "epoch": 1.89, + "learning_rate": 1.6700666958714917e-05, + "loss": 0.008, + "step": 728610 + }, + { + "epoch": 1.89, + "learning_rate": 1.669677874234345e-05, + "loss": 0.009, + "step": 728620 + }, + { + "epoch": 1.89, + "learning_rate": 1.6692890525971987e-05, + "loss": 0.008, + "step": 728630 + }, + { + "epoch": 1.89, + "learning_rate": 1.6689002309600525e-05, + "loss": 0.0105, + "step": 728640 + }, + { + "epoch": 1.89, + "learning_rate": 1.668511409322906e-05, + "loss": 0.0064, + "step": 728650 + }, + { + "epoch": 1.89, + "learning_rate": 1.6681225876857595e-05, + "loss": 0.0099, + "step": 728660 + }, + { + "epoch": 1.89, + "learning_rate": 1.667733766048613e-05, + "loss": 0.0074, + "step": 728670 + }, + { + "epoch": 1.89, + "learning_rate": 1.6673449444114664e-05, + "loss": 0.0072, + "step": 728680 + }, + { + "epoch": 1.89, + "learning_rate": 1.66695612277432e-05, + "loss": 0.0055, + "step": 728690 + }, + { + "epoch": 1.89, + "learning_rate": 1.6665673011371737e-05, + "loss": 0.0066, + "step": 728700 + }, + { + "epoch": 1.89, + "learning_rate": 1.6661784795000272e-05, + "loss": 0.0078, + "step": 728710 + }, + { + "epoch": 1.89, + "learning_rate": 1.6657896578628807e-05, + "loss": 0.0065, + "step": 728720 + }, + { + "epoch": 1.89, + "learning_rate": 1.6654008362257342e-05, + "loss": 0.01, + "step": 728730 + }, + { + "epoch": 1.89, + "learning_rate": 1.6650120145885877e-05, + "loss": 0.0058, + "step": 728740 + }, + { + "epoch": 1.89, + "learning_rate": 1.664623192951441e-05, + "loss": 0.0084, + "step": 728750 + }, + { + "epoch": 1.89, + "learning_rate": 1.6642343713142947e-05, + "loss": 0.008, + "step": 728760 + }, + { + "epoch": 1.89, + "learning_rate": 1.6638455496771485e-05, + "loss": 0.0085, + "step": 728770 + }, + { + "epoch": 1.89, + "learning_rate": 1.663456728040002e-05, + "loss": 0.0067, + "step": 728780 + }, + { + "epoch": 1.89, + "learning_rate": 1.6630679064028554e-05, + "loss": 0.0088, + "step": 728790 + }, + { + "epoch": 1.89, + "learning_rate": 1.662679084765709e-05, + "loss": 0.0094, + "step": 728800 + }, + { + "epoch": 1.89, + "learning_rate": 1.6622902631285624e-05, + "loss": 0.0094, + "step": 728810 + }, + { + "epoch": 1.89, + "learning_rate": 1.661901441491416e-05, + "loss": 0.0064, + "step": 728820 + }, + { + "epoch": 1.89, + "learning_rate": 1.6615126198542694e-05, + "loss": 0.0077, + "step": 728830 + }, + { + "epoch": 1.89, + "learning_rate": 1.6611237982171232e-05, + "loss": 0.0065, + "step": 728840 + }, + { + "epoch": 1.89, + "learning_rate": 1.6607349765799764e-05, + "loss": 0.0074, + "step": 728850 + }, + { + "epoch": 1.89, + "learning_rate": 1.6603461549428302e-05, + "loss": 0.0049, + "step": 728860 + }, + { + "epoch": 1.89, + "learning_rate": 1.6599573333056837e-05, + "loss": 0.0076, + "step": 728870 + }, + { + "epoch": 1.89, + "learning_rate": 1.659568511668537e-05, + "loss": 0.0063, + "step": 728880 + }, + { + "epoch": 1.89, + "learning_rate": 1.6591796900313906e-05, + "loss": 0.0081, + "step": 728890 + }, + { + "epoch": 1.89, + "learning_rate": 1.6587908683942445e-05, + "loss": 0.0065, + "step": 728900 + }, + { + "epoch": 1.89, + "learning_rate": 1.6584020467570976e-05, + "loss": 0.0072, + "step": 728910 + }, + { + "epoch": 1.89, + "learning_rate": 1.658013225119951e-05, + "loss": 0.0069, + "step": 728920 + }, + { + "epoch": 1.89, + "learning_rate": 1.657624403482805e-05, + "loss": 0.0103, + "step": 728930 + }, + { + "epoch": 1.89, + "learning_rate": 1.6572355818456584e-05, + "loss": 0.0053, + "step": 728940 + }, + { + "epoch": 1.89, + "learning_rate": 1.656846760208512e-05, + "loss": 0.0051, + "step": 728950 + }, + { + "epoch": 1.89, + "learning_rate": 1.6564579385713654e-05, + "loss": 0.0075, + "step": 728960 + }, + { + "epoch": 1.89, + "learning_rate": 1.656069116934219e-05, + "loss": 0.0063, + "step": 728970 + }, + { + "epoch": 1.89, + "learning_rate": 1.6556802952970724e-05, + "loss": 0.007, + "step": 728980 + }, + { + "epoch": 1.89, + "learning_rate": 1.6552914736599262e-05, + "loss": 0.0079, + "step": 728990 + }, + { + "epoch": 1.89, + "learning_rate": 1.6549026520227797e-05, + "loss": 0.0087, + "step": 729000 + }, + { + "epoch": 1.89, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.004516036249697208, + "eval_runtime": 107.8591, + "eval_samples_per_second": 18.543, + "eval_steps_per_second": 4.636, + "step": 729000 + }, + { + "epoch": 1.89, + "learning_rate": 1.654513830385633e-05, + "loss": 0.0087, + "step": 729010 + }, + { + "epoch": 1.89, + "learning_rate": 1.6541250087484866e-05, + "loss": 0.0127, + "step": 729020 + }, + { + "epoch": 1.89, + "learning_rate": 1.6537361871113405e-05, + "loss": 0.0065, + "step": 729030 + }, + { + "epoch": 1.89, + "learning_rate": 1.6533473654741936e-05, + "loss": 0.0053, + "step": 729040 + }, + { + "epoch": 1.89, + "learning_rate": 1.652958543837047e-05, + "loss": 0.0085, + "step": 729050 + }, + { + "epoch": 1.89, + "learning_rate": 1.652569722199901e-05, + "loss": 0.0072, + "step": 729060 + }, + { + "epoch": 1.89, + "learning_rate": 1.6521809005627544e-05, + "loss": 0.006, + "step": 729070 + }, + { + "epoch": 1.89, + "learning_rate": 1.651792078925608e-05, + "loss": 0.0103, + "step": 729080 + }, + { + "epoch": 1.89, + "learning_rate": 1.6514032572884614e-05, + "loss": 0.007, + "step": 729090 + }, + { + "epoch": 1.89, + "learning_rate": 1.651014435651315e-05, + "loss": 0.0071, + "step": 729100 + }, + { + "epoch": 1.89, + "learning_rate": 1.6506256140141684e-05, + "loss": 0.0066, + "step": 729110 + }, + { + "epoch": 1.89, + "learning_rate": 1.6502367923770222e-05, + "loss": 0.0058, + "step": 729120 + }, + { + "epoch": 1.89, + "learning_rate": 1.6498479707398757e-05, + "loss": 0.0085, + "step": 729130 + }, + { + "epoch": 1.89, + "learning_rate": 1.649459149102729e-05, + "loss": 0.0061, + "step": 729140 + }, + { + "epoch": 1.89, + "learning_rate": 1.6490703274655826e-05, + "loss": 0.0081, + "step": 729150 + }, + { + "epoch": 1.89, + "learning_rate": 1.648681505828436e-05, + "loss": 0.0067, + "step": 729160 + }, + { + "epoch": 1.89, + "learning_rate": 1.6482926841912896e-05, + "loss": 0.0069, + "step": 729170 + }, + { + "epoch": 1.89, + "learning_rate": 1.647903862554143e-05, + "loss": 0.0062, + "step": 729180 + }, + { + "epoch": 1.89, + "learning_rate": 1.647515040916997e-05, + "loss": 0.0061, + "step": 729190 + }, + { + "epoch": 1.89, + "learning_rate": 1.6471262192798504e-05, + "loss": 0.0051, + "step": 729200 + }, + { + "epoch": 1.89, + "learning_rate": 1.646737397642704e-05, + "loss": 0.0065, + "step": 729210 + }, + { + "epoch": 1.89, + "learning_rate": 1.6463485760055574e-05, + "loss": 0.0095, + "step": 729220 + }, + { + "epoch": 1.89, + "learning_rate": 1.645959754368411e-05, + "loss": 0.0055, + "step": 729230 + }, + { + "epoch": 1.89, + "learning_rate": 1.6455709327312644e-05, + "loss": 0.0065, + "step": 729240 + }, + { + "epoch": 1.89, + "learning_rate": 1.6451821110941182e-05, + "loss": 0.0057, + "step": 729250 + }, + { + "epoch": 1.89, + "learning_rate": 1.6447932894569717e-05, + "loss": 0.0054, + "step": 729260 + }, + { + "epoch": 1.89, + "learning_rate": 1.644404467819825e-05, + "loss": 0.0068, + "step": 729270 + }, + { + "epoch": 1.89, + "learning_rate": 1.6440156461826786e-05, + "loss": 0.0056, + "step": 729280 + }, + { + "epoch": 1.89, + "learning_rate": 1.643626824545532e-05, + "loss": 0.0068, + "step": 729290 + }, + { + "epoch": 1.89, + "learning_rate": 1.6432380029083856e-05, + "loss": 0.0059, + "step": 729300 + }, + { + "epoch": 1.89, + "learning_rate": 1.642849181271239e-05, + "loss": 0.0063, + "step": 729310 + }, + { + "epoch": 1.89, + "learning_rate": 1.642460359634093e-05, + "loss": 0.008, + "step": 729320 + }, + { + "epoch": 1.89, + "learning_rate": 1.6420715379969464e-05, + "loss": 0.0062, + "step": 729330 + }, + { + "epoch": 1.89, + "learning_rate": 1.6416827163598e-05, + "loss": 0.0063, + "step": 729340 + }, + { + "epoch": 1.89, + "learning_rate": 1.6412938947226534e-05, + "loss": 0.0065, + "step": 729350 + }, + { + "epoch": 1.89, + "learning_rate": 1.640905073085507e-05, + "loss": 0.0089, + "step": 729360 + }, + { + "epoch": 1.89, + "learning_rate": 1.6405162514483604e-05, + "loss": 0.0058, + "step": 729370 + }, + { + "epoch": 1.89, + "learning_rate": 1.6401274298112142e-05, + "loss": 0.0073, + "step": 729380 + }, + { + "epoch": 1.89, + "learning_rate": 1.6397386081740677e-05, + "loss": 0.0059, + "step": 729390 + }, + { + "epoch": 1.89, + "learning_rate": 1.639349786536921e-05, + "loss": 0.0071, + "step": 729400 + }, + { + "epoch": 1.89, + "learning_rate": 1.6389609648997746e-05, + "loss": 0.0071, + "step": 729410 + }, + { + "epoch": 1.89, + "learning_rate": 1.638572143262628e-05, + "loss": 0.0094, + "step": 729420 + }, + { + "epoch": 1.89, + "learning_rate": 1.6381833216254816e-05, + "loss": 0.0056, + "step": 729430 + }, + { + "epoch": 1.89, + "learning_rate": 1.637794499988335e-05, + "loss": 0.0096, + "step": 729440 + }, + { + "epoch": 1.89, + "learning_rate": 1.637405678351189e-05, + "loss": 0.0076, + "step": 729450 + }, + { + "epoch": 1.89, + "learning_rate": 1.6370168567140424e-05, + "loss": 0.0085, + "step": 729460 + }, + { + "epoch": 1.89, + "learning_rate": 1.636628035076896e-05, + "loss": 0.009, + "step": 729470 + }, + { + "epoch": 1.89, + "learning_rate": 1.6362392134397494e-05, + "loss": 0.0093, + "step": 729480 + }, + { + "epoch": 1.89, + "learning_rate": 1.635850391802603e-05, + "loss": 0.0085, + "step": 729490 + }, + { + "epoch": 1.89, + "learning_rate": 1.6354615701654564e-05, + "loss": 0.005, + "step": 729500 + }, + { + "epoch": 1.89, + "learning_rate": 1.6350727485283102e-05, + "loss": 0.0083, + "step": 729510 + }, + { + "epoch": 1.89, + "learning_rate": 1.6346839268911637e-05, + "loss": 0.0056, + "step": 729520 + }, + { + "epoch": 1.89, + "learning_rate": 1.6342951052540168e-05, + "loss": 0.0063, + "step": 729530 + }, + { + "epoch": 1.89, + "learning_rate": 1.6339062836168706e-05, + "loss": 0.0046, + "step": 729540 + }, + { + "epoch": 1.89, + "learning_rate": 1.633517461979724e-05, + "loss": 0.0069, + "step": 729550 + }, + { + "epoch": 1.89, + "learning_rate": 1.6331286403425776e-05, + "loss": 0.0049, + "step": 729560 + }, + { + "epoch": 1.89, + "learning_rate": 1.632739818705431e-05, + "loss": 0.0051, + "step": 729570 + }, + { + "epoch": 1.89, + "learning_rate": 1.632350997068285e-05, + "loss": 0.0093, + "step": 729580 + }, + { + "epoch": 1.89, + "learning_rate": 1.631962175431138e-05, + "loss": 0.0099, + "step": 729590 + }, + { + "epoch": 1.89, + "learning_rate": 1.6315733537939916e-05, + "loss": 0.0072, + "step": 729600 + }, + { + "epoch": 1.89, + "learning_rate": 1.6311845321568454e-05, + "loss": 0.0069, + "step": 729610 + }, + { + "epoch": 1.89, + "learning_rate": 1.630795710519699e-05, + "loss": 0.0071, + "step": 729620 + }, + { + "epoch": 1.89, + "learning_rate": 1.6304068888825524e-05, + "loss": 0.0084, + "step": 729630 + }, + { + "epoch": 1.89, + "learning_rate": 1.630018067245406e-05, + "loss": 0.0073, + "step": 729640 + }, + { + "epoch": 1.89, + "learning_rate": 1.6296292456082597e-05, + "loss": 0.0086, + "step": 729650 + }, + { + "epoch": 1.89, + "learning_rate": 1.6292404239711128e-05, + "loss": 0.0087, + "step": 729660 + }, + { + "epoch": 1.89, + "learning_rate": 1.6288516023339666e-05, + "loss": 0.0056, + "step": 729670 + }, + { + "epoch": 1.89, + "learning_rate": 1.62846278069682e-05, + "loss": 0.0053, + "step": 729680 + }, + { + "epoch": 1.89, + "learning_rate": 1.6280739590596736e-05, + "loss": 0.0059, + "step": 729690 + }, + { + "epoch": 1.89, + "learning_rate": 1.627685137422527e-05, + "loss": 0.0096, + "step": 729700 + }, + { + "epoch": 1.89, + "learning_rate": 1.627296315785381e-05, + "loss": 0.007, + "step": 729710 + }, + { + "epoch": 1.89, + "learning_rate": 1.626907494148234e-05, + "loss": 0.006, + "step": 729720 + }, + { + "epoch": 1.89, + "learning_rate": 1.6265186725110876e-05, + "loss": 0.0059, + "step": 729730 + }, + { + "epoch": 1.89, + "learning_rate": 1.6261298508739414e-05, + "loss": 0.0088, + "step": 729740 + }, + { + "epoch": 1.89, + "learning_rate": 1.625741029236795e-05, + "loss": 0.007, + "step": 729750 + }, + { + "epoch": 1.89, + "learning_rate": 1.6253522075996483e-05, + "loss": 0.0056, + "step": 729760 + }, + { + "epoch": 1.89, + "learning_rate": 1.624963385962502e-05, + "loss": 0.0059, + "step": 729770 + }, + { + "epoch": 1.89, + "learning_rate": 1.6245745643253553e-05, + "loss": 0.0088, + "step": 729780 + }, + { + "epoch": 1.89, + "learning_rate": 1.6241857426882088e-05, + "loss": 0.0085, + "step": 729790 + }, + { + "epoch": 1.89, + "learning_rate": 1.6237969210510626e-05, + "loss": 0.007, + "step": 729800 + }, + { + "epoch": 1.89, + "learning_rate": 1.623408099413916e-05, + "loss": 0.007, + "step": 729810 + }, + { + "epoch": 1.89, + "learning_rate": 1.6230192777767696e-05, + "loss": 0.0056, + "step": 729820 + }, + { + "epoch": 1.89, + "learning_rate": 1.622630456139623e-05, + "loss": 0.0051, + "step": 729830 + }, + { + "epoch": 1.89, + "learning_rate": 1.6222416345024766e-05, + "loss": 0.0063, + "step": 729840 + }, + { + "epoch": 1.89, + "learning_rate": 1.62185281286533e-05, + "loss": 0.0079, + "step": 729850 + }, + { + "epoch": 1.89, + "learning_rate": 1.6214639912281835e-05, + "loss": 0.0042, + "step": 729860 + }, + { + "epoch": 1.89, + "learning_rate": 1.6210751695910374e-05, + "loss": 0.0086, + "step": 729870 + }, + { + "epoch": 1.89, + "learning_rate": 1.620686347953891e-05, + "loss": 0.0064, + "step": 729880 + }, + { + "epoch": 1.89, + "learning_rate": 1.6202975263167443e-05, + "loss": 0.0064, + "step": 729890 + }, + { + "epoch": 1.89, + "learning_rate": 1.619908704679598e-05, + "loss": 0.0069, + "step": 729900 + }, + { + "epoch": 1.89, + "learning_rate": 1.6195198830424513e-05, + "loss": 0.0069, + "step": 729910 + }, + { + "epoch": 1.89, + "learning_rate": 1.6191310614053048e-05, + "loss": 0.0101, + "step": 729920 + }, + { + "epoch": 1.89, + "learning_rate": 1.6187422397681586e-05, + "loss": 0.0064, + "step": 729930 + }, + { + "epoch": 1.89, + "learning_rate": 1.618353418131012e-05, + "loss": 0.0081, + "step": 729940 + }, + { + "epoch": 1.89, + "learning_rate": 1.6179645964938656e-05, + "loss": 0.0049, + "step": 729950 + }, + { + "epoch": 1.89, + "learning_rate": 1.617575774856719e-05, + "loss": 0.0078, + "step": 729960 + }, + { + "epoch": 1.89, + "learning_rate": 1.6171869532195726e-05, + "loss": 0.006, + "step": 729970 + }, + { + "epoch": 1.89, + "learning_rate": 1.616798131582426e-05, + "loss": 0.0079, + "step": 729980 + }, + { + "epoch": 1.89, + "learning_rate": 1.6164093099452795e-05, + "loss": 0.0062, + "step": 729990 + }, + { + "epoch": 1.89, + "learning_rate": 1.6160204883081334e-05, + "loss": 0.0071, + "step": 730000 + }, + { + "epoch": 1.89, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.004505546763539314, + "eval_runtime": 107.7228, + "eval_samples_per_second": 18.566, + "eval_steps_per_second": 4.642, + "step": 730000 + }, + { + "epoch": 1.89, + "learning_rate": 1.615631666670987e-05, + "loss": 0.0076, + "step": 730010 + }, + { + "epoch": 1.89, + "learning_rate": 1.6152428450338403e-05, + "loss": 0.0074, + "step": 730020 + }, + { + "epoch": 1.89, + "learning_rate": 1.6148540233966938e-05, + "loss": 0.0059, + "step": 730030 + }, + { + "epoch": 1.89, + "learning_rate": 1.6144652017595473e-05, + "loss": 0.0079, + "step": 730040 + }, + { + "epoch": 1.89, + "learning_rate": 1.6140763801224008e-05, + "loss": 0.0085, + "step": 730050 + }, + { + "epoch": 1.89, + "learning_rate": 1.6136875584852546e-05, + "loss": 0.0053, + "step": 730060 + }, + { + "epoch": 1.89, + "learning_rate": 1.613298736848108e-05, + "loss": 0.0067, + "step": 730070 + }, + { + "epoch": 1.89, + "learning_rate": 1.6129099152109616e-05, + "loss": 0.0056, + "step": 730080 + }, + { + "epoch": 1.89, + "learning_rate": 1.612521093573815e-05, + "loss": 0.0126, + "step": 730090 + }, + { + "epoch": 1.89, + "learning_rate": 1.6121322719366686e-05, + "loss": 0.012, + "step": 730100 + }, + { + "epoch": 1.89, + "learning_rate": 1.611743450299522e-05, + "loss": 0.0072, + "step": 730110 + }, + { + "epoch": 1.89, + "learning_rate": 1.6113546286623755e-05, + "loss": 0.0077, + "step": 730120 + }, + { + "epoch": 1.89, + "learning_rate": 1.6109658070252294e-05, + "loss": 0.0107, + "step": 730130 + }, + { + "epoch": 1.89, + "learning_rate": 1.610576985388083e-05, + "loss": 0.0053, + "step": 730140 + }, + { + "epoch": 1.89, + "learning_rate": 1.6101881637509363e-05, + "loss": 0.0057, + "step": 730150 + }, + { + "epoch": 1.89, + "learning_rate": 1.6097993421137898e-05, + "loss": 0.0056, + "step": 730160 + }, + { + "epoch": 1.89, + "learning_rate": 1.6094105204766433e-05, + "loss": 0.0052, + "step": 730170 + }, + { + "epoch": 1.89, + "learning_rate": 1.6090216988394968e-05, + "loss": 0.0084, + "step": 730180 + }, + { + "epoch": 1.89, + "learning_rate": 1.6086328772023506e-05, + "loss": 0.0092, + "step": 730190 + }, + { + "epoch": 1.89, + "learning_rate": 1.608244055565204e-05, + "loss": 0.0043, + "step": 730200 + }, + { + "epoch": 1.89, + "learning_rate": 1.6078552339280573e-05, + "loss": 0.0071, + "step": 730210 + }, + { + "epoch": 1.89, + "learning_rate": 1.607466412290911e-05, + "loss": 0.004, + "step": 730220 + }, + { + "epoch": 1.89, + "learning_rate": 1.6070775906537646e-05, + "loss": 0.0071, + "step": 730230 + }, + { + "epoch": 1.89, + "learning_rate": 1.606688769016618e-05, + "loss": 0.0082, + "step": 730240 + }, + { + "epoch": 1.89, + "learning_rate": 1.6062999473794715e-05, + "loss": 0.0073, + "step": 730250 + }, + { + "epoch": 1.89, + "learning_rate": 1.6059111257423254e-05, + "loss": 0.0078, + "step": 730260 + }, + { + "epoch": 1.89, + "learning_rate": 1.605522304105179e-05, + "loss": 0.0077, + "step": 730270 + }, + { + "epoch": 1.89, + "learning_rate": 1.605133482468032e-05, + "loss": 0.0048, + "step": 730280 + }, + { + "epoch": 1.89, + "learning_rate": 1.6047446608308858e-05, + "loss": 0.0101, + "step": 730290 + }, + { + "epoch": 1.89, + "learning_rate": 1.6043558391937393e-05, + "loss": 0.0084, + "step": 730300 + }, + { + "epoch": 1.89, + "learning_rate": 1.6039670175565928e-05, + "loss": 0.0093, + "step": 730310 + }, + { + "epoch": 1.89, + "learning_rate": 1.6035781959194463e-05, + "loss": 0.0078, + "step": 730320 + }, + { + "epoch": 1.89, + "learning_rate": 1.6031893742823e-05, + "loss": 0.0072, + "step": 730330 + }, + { + "epoch": 1.89, + "learning_rate": 1.6028005526451533e-05, + "loss": 0.0065, + "step": 730340 + }, + { + "epoch": 1.89, + "learning_rate": 1.602411731008007e-05, + "loss": 0.0072, + "step": 730350 + }, + { + "epoch": 1.89, + "learning_rate": 1.6020229093708606e-05, + "loss": 0.0075, + "step": 730360 + }, + { + "epoch": 1.89, + "learning_rate": 1.601634087733714e-05, + "loss": 0.0085, + "step": 730370 + }, + { + "epoch": 1.89, + "learning_rate": 1.6012452660965675e-05, + "loss": 0.0062, + "step": 730380 + }, + { + "epoch": 1.89, + "learning_rate": 1.6008564444594214e-05, + "loss": 0.0063, + "step": 730390 + }, + { + "epoch": 1.89, + "learning_rate": 1.6004676228222745e-05, + "loss": 0.0069, + "step": 730400 + }, + { + "epoch": 1.89, + "learning_rate": 1.600078801185128e-05, + "loss": 0.0045, + "step": 730410 + }, + { + "epoch": 1.89, + "learning_rate": 1.5996899795479818e-05, + "loss": 0.0055, + "step": 730420 + }, + { + "epoch": 1.89, + "learning_rate": 1.5993011579108353e-05, + "loss": 0.0074, + "step": 730430 + }, + { + "epoch": 1.89, + "learning_rate": 1.5989123362736888e-05, + "loss": 0.0074, + "step": 730440 + }, + { + "epoch": 1.89, + "learning_rate": 1.5985235146365423e-05, + "loss": 0.0054, + "step": 730450 + }, + { + "epoch": 1.89, + "learning_rate": 1.5981346929993958e-05, + "loss": 0.0073, + "step": 730460 + }, + { + "epoch": 1.89, + "learning_rate": 1.5977458713622493e-05, + "loss": 0.0057, + "step": 730470 + }, + { + "epoch": 1.89, + "learning_rate": 1.597357049725103e-05, + "loss": 0.007, + "step": 730480 + }, + { + "epoch": 1.89, + "learning_rate": 1.5969682280879566e-05, + "loss": 0.0073, + "step": 730490 + }, + { + "epoch": 1.89, + "learning_rate": 1.59657940645081e-05, + "loss": 0.0072, + "step": 730500 + }, + { + "epoch": 1.89, + "learning_rate": 1.5961905848136635e-05, + "loss": 0.0057, + "step": 730510 + }, + { + "epoch": 1.89, + "learning_rate": 1.595801763176517e-05, + "loss": 0.0074, + "step": 730520 + }, + { + "epoch": 1.89, + "learning_rate": 1.5954129415393705e-05, + "loss": 0.0075, + "step": 730530 + }, + { + "epoch": 1.89, + "learning_rate": 1.595024119902224e-05, + "loss": 0.0058, + "step": 730540 + }, + { + "epoch": 1.89, + "learning_rate": 1.5946352982650778e-05, + "loss": 0.006, + "step": 730550 + }, + { + "epoch": 1.89, + "learning_rate": 1.5942464766279313e-05, + "loss": 0.0075, + "step": 730560 + }, + { + "epoch": 1.89, + "learning_rate": 1.5938576549907848e-05, + "loss": 0.0075, + "step": 730570 + }, + { + "epoch": 1.89, + "learning_rate": 1.5934688333536383e-05, + "loss": 0.0082, + "step": 730580 + }, + { + "epoch": 1.89, + "learning_rate": 1.5930800117164918e-05, + "loss": 0.0074, + "step": 730590 + }, + { + "epoch": 1.89, + "learning_rate": 1.5926911900793453e-05, + "loss": 0.0061, + "step": 730600 + }, + { + "epoch": 1.89, + "learning_rate": 1.592302368442199e-05, + "loss": 0.0058, + "step": 730610 + }, + { + "epoch": 1.89, + "learning_rate": 1.5919135468050526e-05, + "loss": 0.0083, + "step": 730620 + }, + { + "epoch": 1.89, + "learning_rate": 1.591524725167906e-05, + "loss": 0.0066, + "step": 730630 + }, + { + "epoch": 1.89, + "learning_rate": 1.5911359035307595e-05, + "loss": 0.0063, + "step": 730640 + }, + { + "epoch": 1.89, + "learning_rate": 1.590747081893613e-05, + "loss": 0.0063, + "step": 730650 + }, + { + "epoch": 1.89, + "learning_rate": 1.5903582602564665e-05, + "loss": 0.0062, + "step": 730660 + }, + { + "epoch": 1.89, + "learning_rate": 1.58996943861932e-05, + "loss": 0.0073, + "step": 730670 + }, + { + "epoch": 1.89, + "learning_rate": 1.5895806169821738e-05, + "loss": 0.007, + "step": 730680 + }, + { + "epoch": 1.89, + "learning_rate": 1.5891917953450273e-05, + "loss": 0.0066, + "step": 730690 + }, + { + "epoch": 1.89, + "learning_rate": 1.5888029737078808e-05, + "loss": 0.0062, + "step": 730700 + }, + { + "epoch": 1.89, + "learning_rate": 1.5884141520707343e-05, + "loss": 0.0088, + "step": 730710 + }, + { + "epoch": 1.89, + "learning_rate": 1.5880253304335878e-05, + "loss": 0.0072, + "step": 730720 + }, + { + "epoch": 1.89, + "learning_rate": 1.5876365087964412e-05, + "loss": 0.0079, + "step": 730730 + }, + { + "epoch": 1.89, + "learning_rate": 1.587247687159295e-05, + "loss": 0.0074, + "step": 730740 + }, + { + "epoch": 1.89, + "learning_rate": 1.5868588655221486e-05, + "loss": 0.0056, + "step": 730750 + }, + { + "epoch": 1.89, + "learning_rate": 1.586470043885002e-05, + "loss": 0.0075, + "step": 730760 + }, + { + "epoch": 1.89, + "learning_rate": 1.5860812222478555e-05, + "loss": 0.0064, + "step": 730770 + }, + { + "epoch": 1.89, + "learning_rate": 1.585692400610709e-05, + "loss": 0.0055, + "step": 730780 + }, + { + "epoch": 1.89, + "learning_rate": 1.5853035789735625e-05, + "loss": 0.0078, + "step": 730790 + }, + { + "epoch": 1.89, + "learning_rate": 1.584914757336416e-05, + "loss": 0.0148, + "step": 730800 + }, + { + "epoch": 1.89, + "learning_rate": 1.5845259356992698e-05, + "loss": 0.0072, + "step": 730810 + }, + { + "epoch": 1.89, + "learning_rate": 1.5841371140621233e-05, + "loss": 0.0059, + "step": 730820 + }, + { + "epoch": 1.89, + "learning_rate": 1.5837482924249768e-05, + "loss": 0.0087, + "step": 730830 + }, + { + "epoch": 1.89, + "learning_rate": 1.5833594707878303e-05, + "loss": 0.0084, + "step": 730840 + }, + { + "epoch": 1.89, + "learning_rate": 1.5829706491506838e-05, + "loss": 0.0056, + "step": 730850 + }, + { + "epoch": 1.89, + "learning_rate": 1.5825818275135372e-05, + "loss": 0.0058, + "step": 730860 + }, + { + "epoch": 1.89, + "learning_rate": 1.582193005876391e-05, + "loss": 0.0071, + "step": 730870 + }, + { + "epoch": 1.89, + "learning_rate": 1.5818041842392446e-05, + "loss": 0.0066, + "step": 730880 + }, + { + "epoch": 1.89, + "learning_rate": 1.581415362602098e-05, + "loss": 0.009, + "step": 730890 + }, + { + "epoch": 1.89, + "learning_rate": 1.5810265409649515e-05, + "loss": 0.0059, + "step": 730900 + }, + { + "epoch": 1.89, + "learning_rate": 1.580637719327805e-05, + "loss": 0.0059, + "step": 730910 + }, + { + "epoch": 1.89, + "learning_rate": 1.5802488976906585e-05, + "loss": 0.0052, + "step": 730920 + }, + { + "epoch": 1.89, + "learning_rate": 1.579860076053512e-05, + "loss": 0.007, + "step": 730930 + }, + { + "epoch": 1.89, + "learning_rate": 1.5794712544163658e-05, + "loss": 0.0068, + "step": 730940 + }, + { + "epoch": 1.89, + "learning_rate": 1.5790824327792193e-05, + "loss": 0.0094, + "step": 730950 + }, + { + "epoch": 1.89, + "learning_rate": 1.5786936111420724e-05, + "loss": 0.0046, + "step": 730960 + }, + { + "epoch": 1.89, + "learning_rate": 1.5783047895049263e-05, + "loss": 0.0052, + "step": 730970 + }, + { + "epoch": 1.89, + "learning_rate": 1.5779159678677798e-05, + "loss": 0.0081, + "step": 730980 + }, + { + "epoch": 1.89, + "learning_rate": 1.5775271462306332e-05, + "loss": 0.0067, + "step": 730990 + }, + { + "epoch": 1.89, + "learning_rate": 1.5771383245934867e-05, + "loss": 0.0073, + "step": 731000 + }, + { + "epoch": 1.89, + "eval_cer": 0.881657897941274, + "eval_loss": 0.004491262603551149, + "eval_runtime": 107.9137, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 731000 + }, + { + "epoch": 1.89, + "learning_rate": 1.5767495029563406e-05, + "loss": 0.0076, + "step": 731010 + }, + { + "epoch": 1.89, + "learning_rate": 1.5763606813191937e-05, + "loss": 0.0068, + "step": 731020 + }, + { + "epoch": 1.89, + "learning_rate": 1.5759718596820475e-05, + "loss": 0.0068, + "step": 731030 + }, + { + "epoch": 1.89, + "learning_rate": 1.575583038044901e-05, + "loss": 0.009, + "step": 731040 + }, + { + "epoch": 1.89, + "learning_rate": 1.5751942164077545e-05, + "loss": 0.0069, + "step": 731050 + }, + { + "epoch": 1.9, + "learning_rate": 1.574805394770608e-05, + "loss": 0.0065, + "step": 731060 + }, + { + "epoch": 1.9, + "learning_rate": 1.5744165731334618e-05, + "loss": 0.0066, + "step": 731070 + }, + { + "epoch": 1.9, + "learning_rate": 1.574027751496315e-05, + "loss": 0.0066, + "step": 731080 + }, + { + "epoch": 1.9, + "learning_rate": 1.5736389298591684e-05, + "loss": 0.0088, + "step": 731090 + }, + { + "epoch": 1.9, + "learning_rate": 1.5732501082220223e-05, + "loss": 0.0086, + "step": 731100 + }, + { + "epoch": 1.9, + "learning_rate": 1.5728612865848758e-05, + "loss": 0.0051, + "step": 731110 + }, + { + "epoch": 1.9, + "learning_rate": 1.5724724649477292e-05, + "loss": 0.0085, + "step": 731120 + }, + { + "epoch": 1.9, + "learning_rate": 1.5720836433105827e-05, + "loss": 0.0053, + "step": 731130 + }, + { + "epoch": 1.9, + "learning_rate": 1.5716948216734362e-05, + "loss": 0.0075, + "step": 731140 + }, + { + "epoch": 1.9, + "learning_rate": 1.5713060000362897e-05, + "loss": 0.0057, + "step": 731150 + }, + { + "epoch": 1.9, + "learning_rate": 1.5709171783991435e-05, + "loss": 0.0064, + "step": 731160 + }, + { + "epoch": 1.9, + "learning_rate": 1.570528356761997e-05, + "loss": 0.0067, + "step": 731170 + }, + { + "epoch": 1.9, + "learning_rate": 1.5701395351248505e-05, + "loss": 0.0086, + "step": 731180 + }, + { + "epoch": 1.9, + "learning_rate": 1.569750713487704e-05, + "loss": 0.0056, + "step": 731190 + }, + { + "epoch": 1.9, + "learning_rate": 1.5693618918505578e-05, + "loss": 0.0078, + "step": 731200 + }, + { + "epoch": 1.9, + "learning_rate": 1.568973070213411e-05, + "loss": 0.0073, + "step": 731210 + }, + { + "epoch": 1.9, + "learning_rate": 1.5685842485762644e-05, + "loss": 0.0094, + "step": 731220 + }, + { + "epoch": 1.9, + "learning_rate": 1.5681954269391183e-05, + "loss": 0.0057, + "step": 731230 + }, + { + "epoch": 1.9, + "learning_rate": 1.5678066053019718e-05, + "loss": 0.0083, + "step": 731240 + }, + { + "epoch": 1.9, + "learning_rate": 1.5674177836648252e-05, + "loss": 0.0088, + "step": 731250 + }, + { + "epoch": 1.9, + "learning_rate": 1.5670289620276787e-05, + "loss": 0.0068, + "step": 731260 + }, + { + "epoch": 1.9, + "learning_rate": 1.5666401403905322e-05, + "loss": 0.0089, + "step": 731270 + }, + { + "epoch": 1.9, + "learning_rate": 1.5662513187533857e-05, + "loss": 0.0094, + "step": 731280 + }, + { + "epoch": 1.9, + "learning_rate": 1.5658624971162395e-05, + "loss": 0.0074, + "step": 731290 + }, + { + "epoch": 1.9, + "learning_rate": 1.565473675479093e-05, + "loss": 0.0065, + "step": 731300 + }, + { + "epoch": 1.9, + "learning_rate": 1.5650848538419465e-05, + "loss": 0.0073, + "step": 731310 + }, + { + "epoch": 1.9, + "learning_rate": 1.5646960322048e-05, + "loss": 0.0103, + "step": 731320 + }, + { + "epoch": 1.9, + "learning_rate": 1.5643072105676535e-05, + "loss": 0.0082, + "step": 731330 + }, + { + "epoch": 1.9, + "learning_rate": 1.563918388930507e-05, + "loss": 0.0057, + "step": 731340 + }, + { + "epoch": 1.9, + "learning_rate": 1.5635295672933604e-05, + "loss": 0.0048, + "step": 731350 + }, + { + "epoch": 1.9, + "learning_rate": 1.5631407456562143e-05, + "loss": 0.0056, + "step": 731360 + }, + { + "epoch": 1.9, + "learning_rate": 1.5627519240190677e-05, + "loss": 0.009, + "step": 731370 + }, + { + "epoch": 1.9, + "learning_rate": 1.5623631023819212e-05, + "loss": 0.0059, + "step": 731380 + }, + { + "epoch": 1.9, + "learning_rate": 1.5619742807447747e-05, + "loss": 0.0079, + "step": 731390 + }, + { + "epoch": 1.9, + "learning_rate": 1.5615854591076282e-05, + "loss": 0.0071, + "step": 731400 + }, + { + "epoch": 1.9, + "learning_rate": 1.5611966374704817e-05, + "loss": 0.007, + "step": 731410 + }, + { + "epoch": 1.9, + "learning_rate": 1.5608078158333355e-05, + "loss": 0.0073, + "step": 731420 + }, + { + "epoch": 1.9, + "learning_rate": 1.560418994196189e-05, + "loss": 0.0099, + "step": 731430 + }, + { + "epoch": 1.9, + "learning_rate": 1.5600301725590425e-05, + "loss": 0.0057, + "step": 731440 + }, + { + "epoch": 1.9, + "learning_rate": 1.559641350921896e-05, + "loss": 0.0137, + "step": 731450 + }, + { + "epoch": 1.9, + "learning_rate": 1.5592525292847495e-05, + "loss": 0.0091, + "step": 731460 + }, + { + "epoch": 1.9, + "learning_rate": 1.558863707647603e-05, + "loss": 0.0055, + "step": 731470 + }, + { + "epoch": 1.9, + "learning_rate": 1.5584748860104564e-05, + "loss": 0.0054, + "step": 731480 + }, + { + "epoch": 1.9, + "learning_rate": 1.5580860643733103e-05, + "loss": 0.0089, + "step": 731490 + }, + { + "epoch": 1.9, + "learning_rate": 1.5576972427361637e-05, + "loss": 0.004, + "step": 731500 + }, + { + "epoch": 1.9, + "learning_rate": 1.5573084210990172e-05, + "loss": 0.007, + "step": 731510 + }, + { + "epoch": 1.9, + "learning_rate": 1.5569195994618707e-05, + "loss": 0.0095, + "step": 731520 + }, + { + "epoch": 1.9, + "learning_rate": 1.5565307778247242e-05, + "loss": 0.0058, + "step": 731530 + }, + { + "epoch": 1.9, + "learning_rate": 1.5561419561875777e-05, + "loss": 0.0042, + "step": 731540 + }, + { + "epoch": 1.9, + "learning_rate": 1.5557531345504315e-05, + "loss": 0.0097, + "step": 731550 + }, + { + "epoch": 1.9, + "learning_rate": 1.555364312913285e-05, + "loss": 0.0083, + "step": 731560 + }, + { + "epoch": 1.9, + "learning_rate": 1.5549754912761385e-05, + "loss": 0.0076, + "step": 731570 + }, + { + "epoch": 1.9, + "learning_rate": 1.554586669638992e-05, + "loss": 0.0075, + "step": 731580 + }, + { + "epoch": 1.9, + "learning_rate": 1.5541978480018455e-05, + "loss": 0.0072, + "step": 731590 + }, + { + "epoch": 1.9, + "learning_rate": 1.553809026364699e-05, + "loss": 0.0095, + "step": 731600 + }, + { + "epoch": 1.9, + "learning_rate": 1.5534202047275524e-05, + "loss": 0.0109, + "step": 731610 + }, + { + "epoch": 1.9, + "learning_rate": 1.5530313830904063e-05, + "loss": 0.006, + "step": 731620 + }, + { + "epoch": 1.9, + "learning_rate": 1.5526425614532597e-05, + "loss": 0.0052, + "step": 731630 + }, + { + "epoch": 1.9, + "learning_rate": 1.5522537398161132e-05, + "loss": 0.0094, + "step": 731640 + }, + { + "epoch": 1.9, + "learning_rate": 1.5518649181789667e-05, + "loss": 0.0069, + "step": 731650 + }, + { + "epoch": 1.9, + "learning_rate": 1.5514760965418202e-05, + "loss": 0.0077, + "step": 731660 + }, + { + "epoch": 1.9, + "learning_rate": 1.5510872749046737e-05, + "loss": 0.0081, + "step": 731670 + }, + { + "epoch": 1.9, + "learning_rate": 1.5506984532675272e-05, + "loss": 0.0073, + "step": 731680 + }, + { + "epoch": 1.9, + "learning_rate": 1.550309631630381e-05, + "loss": 0.0073, + "step": 731690 + }, + { + "epoch": 1.9, + "learning_rate": 1.549920809993234e-05, + "loss": 0.0087, + "step": 731700 + }, + { + "epoch": 1.9, + "learning_rate": 1.549531988356088e-05, + "loss": 0.008, + "step": 731710 + }, + { + "epoch": 1.9, + "learning_rate": 1.5491431667189415e-05, + "loss": 0.0091, + "step": 731720 + }, + { + "epoch": 1.9, + "learning_rate": 1.548754345081795e-05, + "loss": 0.0068, + "step": 731730 + }, + { + "epoch": 1.9, + "learning_rate": 1.5483655234446484e-05, + "loss": 0.0072, + "step": 731740 + }, + { + "epoch": 1.9, + "learning_rate": 1.5479767018075023e-05, + "loss": 0.0072, + "step": 731750 + }, + { + "epoch": 1.9, + "learning_rate": 1.5475878801703554e-05, + "loss": 0.0087, + "step": 731760 + }, + { + "epoch": 1.9, + "learning_rate": 1.547199058533209e-05, + "loss": 0.0058, + "step": 731770 + }, + { + "epoch": 1.9, + "learning_rate": 1.5468102368960627e-05, + "loss": 0.0061, + "step": 731780 + }, + { + "epoch": 1.9, + "learning_rate": 1.5464214152589162e-05, + "loss": 0.0055, + "step": 731790 + }, + { + "epoch": 1.9, + "learning_rate": 1.5460325936217697e-05, + "loss": 0.0068, + "step": 731800 + }, + { + "epoch": 1.9, + "learning_rate": 1.5456437719846232e-05, + "loss": 0.0063, + "step": 731810 + }, + { + "epoch": 1.9, + "learning_rate": 1.545254950347477e-05, + "loss": 0.0067, + "step": 731820 + }, + { + "epoch": 1.9, + "learning_rate": 1.54486612871033e-05, + "loss": 0.007, + "step": 731830 + }, + { + "epoch": 1.9, + "learning_rate": 1.544477307073184e-05, + "loss": 0.0059, + "step": 731840 + }, + { + "epoch": 1.9, + "learning_rate": 1.5440884854360375e-05, + "loss": 0.0072, + "step": 731850 + }, + { + "epoch": 1.9, + "learning_rate": 1.543699663798891e-05, + "loss": 0.0057, + "step": 731860 + }, + { + "epoch": 1.9, + "learning_rate": 1.5433108421617444e-05, + "loss": 0.0076, + "step": 731870 + }, + { + "epoch": 1.9, + "learning_rate": 1.5429220205245983e-05, + "loss": 0.0064, + "step": 731880 + }, + { + "epoch": 1.9, + "learning_rate": 1.5425331988874514e-05, + "loss": 0.0063, + "step": 731890 + }, + { + "epoch": 1.9, + "learning_rate": 1.542144377250305e-05, + "loss": 0.0079, + "step": 731900 + }, + { + "epoch": 1.9, + "learning_rate": 1.5417555556131587e-05, + "loss": 0.0066, + "step": 731910 + }, + { + "epoch": 1.9, + "learning_rate": 1.5413667339760122e-05, + "loss": 0.0085, + "step": 731920 + }, + { + "epoch": 1.9, + "learning_rate": 1.5409779123388657e-05, + "loss": 0.0058, + "step": 731930 + }, + { + "epoch": 1.9, + "learning_rate": 1.5405890907017192e-05, + "loss": 0.0058, + "step": 731940 + }, + { + "epoch": 1.9, + "learning_rate": 1.5402002690645727e-05, + "loss": 0.0051, + "step": 731950 + }, + { + "epoch": 1.9, + "learning_rate": 1.539811447427426e-05, + "loss": 0.0067, + "step": 731960 + }, + { + "epoch": 1.9, + "learning_rate": 1.53942262579028e-05, + "loss": 0.0066, + "step": 731970 + }, + { + "epoch": 1.9, + "learning_rate": 1.5390338041531335e-05, + "loss": 0.0062, + "step": 731980 + }, + { + "epoch": 1.9, + "learning_rate": 1.538644982515987e-05, + "loss": 0.007, + "step": 731990 + }, + { + "epoch": 1.9, + "learning_rate": 1.5382561608788404e-05, + "loss": 0.0063, + "step": 732000 + }, + { + "epoch": 1.9, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.004524824675172567, + "eval_runtime": 107.8657, + "eval_samples_per_second": 18.542, + "eval_steps_per_second": 4.635, + "step": 732000 + }, + { + "epoch": 1.9, + "learning_rate": 1.537867339241694e-05, + "loss": 0.0089, + "step": 732010 + }, + { + "epoch": 1.9, + "learning_rate": 1.5374785176045474e-05, + "loss": 0.0103, + "step": 732020 + }, + { + "epoch": 1.9, + "learning_rate": 1.537089695967401e-05, + "loss": 0.0067, + "step": 732030 + }, + { + "epoch": 1.9, + "learning_rate": 1.5367008743302547e-05, + "loss": 0.0067, + "step": 732040 + }, + { + "epoch": 1.9, + "learning_rate": 1.5363120526931082e-05, + "loss": 0.008, + "step": 732050 + }, + { + "epoch": 1.9, + "learning_rate": 1.5359232310559617e-05, + "loss": 0.007, + "step": 732060 + }, + { + "epoch": 1.9, + "learning_rate": 1.535534409418815e-05, + "loss": 0.0062, + "step": 732070 + }, + { + "epoch": 1.9, + "learning_rate": 1.5351455877816687e-05, + "loss": 0.0062, + "step": 732080 + }, + { + "epoch": 1.9, + "learning_rate": 1.534756766144522e-05, + "loss": 0.0079, + "step": 732090 + }, + { + "epoch": 1.9, + "learning_rate": 1.534367944507376e-05, + "loss": 0.006, + "step": 732100 + }, + { + "epoch": 1.9, + "learning_rate": 1.5339791228702295e-05, + "loss": 0.0075, + "step": 732110 + }, + { + "epoch": 1.9, + "learning_rate": 1.533590301233083e-05, + "loss": 0.0065, + "step": 732120 + }, + { + "epoch": 1.9, + "learning_rate": 1.5332014795959364e-05, + "loss": 0.0069, + "step": 732130 + }, + { + "epoch": 1.9, + "learning_rate": 1.53281265795879e-05, + "loss": 0.0068, + "step": 732140 + }, + { + "epoch": 1.9, + "learning_rate": 1.5324238363216434e-05, + "loss": 0.0065, + "step": 732150 + }, + { + "epoch": 1.9, + "learning_rate": 1.532035014684497e-05, + "loss": 0.0061, + "step": 732160 + }, + { + "epoch": 1.9, + "learning_rate": 1.5316461930473507e-05, + "loss": 0.0066, + "step": 732170 + }, + { + "epoch": 1.9, + "learning_rate": 1.5312573714102042e-05, + "loss": 0.0075, + "step": 732180 + }, + { + "epoch": 1.9, + "learning_rate": 1.5308685497730577e-05, + "loss": 0.0085, + "step": 732190 + }, + { + "epoch": 1.9, + "learning_rate": 1.530479728135911e-05, + "loss": 0.0076, + "step": 732200 + }, + { + "epoch": 1.9, + "learning_rate": 1.5300909064987647e-05, + "loss": 0.0073, + "step": 732210 + }, + { + "epoch": 1.9, + "learning_rate": 1.529702084861618e-05, + "loss": 0.006, + "step": 732220 + }, + { + "epoch": 1.9, + "learning_rate": 1.529313263224472e-05, + "loss": 0.0056, + "step": 732230 + }, + { + "epoch": 1.9, + "learning_rate": 1.5289244415873254e-05, + "loss": 0.0087, + "step": 732240 + }, + { + "epoch": 1.9, + "learning_rate": 1.528535619950179e-05, + "loss": 0.0055, + "step": 732250 + }, + { + "epoch": 1.9, + "learning_rate": 1.5281467983130324e-05, + "loss": 0.0071, + "step": 732260 + }, + { + "epoch": 1.9, + "learning_rate": 1.527757976675886e-05, + "loss": 0.0067, + "step": 732270 + }, + { + "epoch": 1.9, + "learning_rate": 1.5273691550387394e-05, + "loss": 0.0136, + "step": 732280 + }, + { + "epoch": 1.9, + "learning_rate": 1.526980333401593e-05, + "loss": 0.0077, + "step": 732290 + }, + { + "epoch": 1.9, + "learning_rate": 1.5265915117644467e-05, + "loss": 0.007, + "step": 732300 + }, + { + "epoch": 1.9, + "learning_rate": 1.5262026901273002e-05, + "loss": 0.0066, + "step": 732310 + }, + { + "epoch": 1.9, + "learning_rate": 1.5258138684901535e-05, + "loss": 0.0072, + "step": 732320 + }, + { + "epoch": 1.9, + "learning_rate": 1.5254250468530072e-05, + "loss": 0.0059, + "step": 732330 + }, + { + "epoch": 1.9, + "learning_rate": 1.5250362252158606e-05, + "loss": 0.0086, + "step": 732340 + }, + { + "epoch": 1.9, + "learning_rate": 1.5246474035787141e-05, + "loss": 0.0089, + "step": 732350 + }, + { + "epoch": 1.9, + "learning_rate": 1.5242585819415678e-05, + "loss": 0.005, + "step": 732360 + }, + { + "epoch": 1.9, + "learning_rate": 1.5238697603044213e-05, + "loss": 0.0065, + "step": 732370 + }, + { + "epoch": 1.9, + "learning_rate": 1.5234809386672748e-05, + "loss": 0.0092, + "step": 732380 + }, + { + "epoch": 1.9, + "learning_rate": 1.5230921170301282e-05, + "loss": 0.0084, + "step": 732390 + }, + { + "epoch": 1.9, + "learning_rate": 1.5227032953929819e-05, + "loss": 0.0053, + "step": 732400 + }, + { + "epoch": 1.9, + "learning_rate": 1.5223144737558354e-05, + "loss": 0.0085, + "step": 732410 + }, + { + "epoch": 1.9, + "learning_rate": 1.521925652118689e-05, + "loss": 0.0091, + "step": 732420 + }, + { + "epoch": 1.9, + "learning_rate": 1.5215368304815425e-05, + "loss": 0.0059, + "step": 732430 + }, + { + "epoch": 1.9, + "learning_rate": 1.5211480088443962e-05, + "loss": 0.0049, + "step": 732440 + }, + { + "epoch": 1.9, + "learning_rate": 1.5207591872072495e-05, + "loss": 0.0072, + "step": 732450 + }, + { + "epoch": 1.9, + "learning_rate": 1.520370365570103e-05, + "loss": 0.0058, + "step": 732460 + }, + { + "epoch": 1.9, + "learning_rate": 1.5199815439329566e-05, + "loss": 0.0081, + "step": 732470 + }, + { + "epoch": 1.9, + "learning_rate": 1.5195927222958101e-05, + "loss": 0.007, + "step": 732480 + }, + { + "epoch": 1.9, + "learning_rate": 1.5192039006586638e-05, + "loss": 0.0056, + "step": 732490 + }, + { + "epoch": 1.9, + "learning_rate": 1.5188150790215173e-05, + "loss": 0.0084, + "step": 732500 + }, + { + "epoch": 1.9, + "learning_rate": 1.5184262573843708e-05, + "loss": 0.0076, + "step": 732510 + }, + { + "epoch": 1.9, + "learning_rate": 1.5180374357472242e-05, + "loss": 0.0074, + "step": 732520 + }, + { + "epoch": 1.9, + "learning_rate": 1.5176486141100779e-05, + "loss": 0.0055, + "step": 732530 + }, + { + "epoch": 1.9, + "learning_rate": 1.5172597924729314e-05, + "loss": 0.0086, + "step": 732540 + }, + { + "epoch": 1.9, + "learning_rate": 1.516870970835785e-05, + "loss": 0.0108, + "step": 732550 + }, + { + "epoch": 1.9, + "learning_rate": 1.5164821491986385e-05, + "loss": 0.0058, + "step": 732560 + }, + { + "epoch": 1.9, + "learning_rate": 1.5160933275614918e-05, + "loss": 0.0081, + "step": 732570 + }, + { + "epoch": 1.9, + "learning_rate": 1.5157045059243455e-05, + "loss": 0.0072, + "step": 732580 + }, + { + "epoch": 1.9, + "learning_rate": 1.515315684287199e-05, + "loss": 0.0078, + "step": 732590 + }, + { + "epoch": 1.9, + "learning_rate": 1.5149268626500526e-05, + "loss": 0.0053, + "step": 732600 + }, + { + "epoch": 1.9, + "learning_rate": 1.5145380410129061e-05, + "loss": 0.0084, + "step": 732610 + }, + { + "epoch": 1.9, + "learning_rate": 1.5141492193757598e-05, + "loss": 0.0063, + "step": 732620 + }, + { + "epoch": 1.9, + "learning_rate": 1.5137603977386131e-05, + "loss": 0.0078, + "step": 732630 + }, + { + "epoch": 1.9, + "learning_rate": 1.5133715761014668e-05, + "loss": 0.0084, + "step": 732640 + }, + { + "epoch": 1.9, + "learning_rate": 1.5129827544643202e-05, + "loss": 0.0082, + "step": 732650 + }, + { + "epoch": 1.9, + "learning_rate": 1.5125939328271739e-05, + "loss": 0.0082, + "step": 732660 + }, + { + "epoch": 1.9, + "learning_rate": 1.5122051111900274e-05, + "loss": 0.0041, + "step": 732670 + }, + { + "epoch": 1.9, + "learning_rate": 1.511816289552881e-05, + "loss": 0.0088, + "step": 732680 + }, + { + "epoch": 1.9, + "learning_rate": 1.5114274679157344e-05, + "loss": 0.0086, + "step": 732690 + }, + { + "epoch": 1.9, + "learning_rate": 1.5110386462785878e-05, + "loss": 0.007, + "step": 732700 + }, + { + "epoch": 1.9, + "learning_rate": 1.5106498246414415e-05, + "loss": 0.006, + "step": 732710 + }, + { + "epoch": 1.9, + "learning_rate": 1.510261003004295e-05, + "loss": 0.0053, + "step": 732720 + }, + { + "epoch": 1.9, + "learning_rate": 1.5098721813671486e-05, + "loss": 0.0063, + "step": 732730 + }, + { + "epoch": 1.9, + "learning_rate": 1.5094833597300021e-05, + "loss": 0.0058, + "step": 732740 + }, + { + "epoch": 1.9, + "learning_rate": 1.5090945380928558e-05, + "loss": 0.0075, + "step": 732750 + }, + { + "epoch": 1.9, + "learning_rate": 1.5087057164557091e-05, + "loss": 0.011, + "step": 732760 + }, + { + "epoch": 1.9, + "learning_rate": 1.5083168948185628e-05, + "loss": 0.012, + "step": 732770 + }, + { + "epoch": 1.9, + "learning_rate": 1.5079280731814162e-05, + "loss": 0.0062, + "step": 732780 + }, + { + "epoch": 1.9, + "learning_rate": 1.5075392515442699e-05, + "loss": 0.0081, + "step": 732790 + }, + { + "epoch": 1.9, + "learning_rate": 1.5071504299071234e-05, + "loss": 0.0065, + "step": 732800 + }, + { + "epoch": 1.9, + "learning_rate": 1.506761608269977e-05, + "loss": 0.0059, + "step": 732810 + }, + { + "epoch": 1.9, + "learning_rate": 1.5063727866328304e-05, + "loss": 0.0073, + "step": 732820 + }, + { + "epoch": 1.9, + "learning_rate": 1.5059839649956838e-05, + "loss": 0.0072, + "step": 732830 + }, + { + "epoch": 1.9, + "learning_rate": 1.5055951433585375e-05, + "loss": 0.0085, + "step": 732840 + }, + { + "epoch": 1.9, + "learning_rate": 1.505206321721391e-05, + "loss": 0.0072, + "step": 732850 + }, + { + "epoch": 1.9, + "learning_rate": 1.5048175000842446e-05, + "loss": 0.0054, + "step": 732860 + }, + { + "epoch": 1.9, + "learning_rate": 1.5044286784470981e-05, + "loss": 0.0091, + "step": 732870 + }, + { + "epoch": 1.9, + "learning_rate": 1.5040398568099516e-05, + "loss": 0.0072, + "step": 732880 + }, + { + "epoch": 1.9, + "learning_rate": 1.5036510351728051e-05, + "loss": 0.0059, + "step": 732890 + }, + { + "epoch": 1.9, + "learning_rate": 1.5032622135356588e-05, + "loss": 0.0121, + "step": 732900 + }, + { + "epoch": 1.9, + "learning_rate": 1.5028733918985122e-05, + "loss": 0.0054, + "step": 732910 + }, + { + "epoch": 1.9, + "learning_rate": 1.5024845702613659e-05, + "loss": 0.0083, + "step": 732920 + }, + { + "epoch": 1.9, + "learning_rate": 1.5020957486242194e-05, + "loss": 0.0089, + "step": 732930 + }, + { + "epoch": 1.9, + "learning_rate": 1.5017069269870727e-05, + "loss": 0.0062, + "step": 732940 + }, + { + "epoch": 1.9, + "learning_rate": 1.5013181053499264e-05, + "loss": 0.0082, + "step": 732950 + }, + { + "epoch": 1.9, + "learning_rate": 1.5009292837127798e-05, + "loss": 0.0057, + "step": 732960 + }, + { + "epoch": 1.9, + "learning_rate": 1.5005404620756335e-05, + "loss": 0.0055, + "step": 732970 + }, + { + "epoch": 1.9, + "learning_rate": 1.500151640438487e-05, + "loss": 0.0091, + "step": 732980 + }, + { + "epoch": 1.9, + "learning_rate": 1.4997628188013406e-05, + "loss": 0.006, + "step": 732990 + }, + { + "epoch": 1.9, + "learning_rate": 1.4993739971641941e-05, + "loss": 0.0092, + "step": 733000 + }, + { + "epoch": 1.9, + "eval_cer": 0.8816718943106159, + "eval_loss": 0.004549098201096058, + "eval_runtime": 107.784, + "eval_samples_per_second": 18.556, + "eval_steps_per_second": 4.639, + "step": 733000 + }, + { + "epoch": 1.9, + "learning_rate": 1.4989851755270476e-05, + "loss": 0.0063, + "step": 733010 + }, + { + "epoch": 1.9, + "learning_rate": 1.4985963538899011e-05, + "loss": 0.0087, + "step": 733020 + }, + { + "epoch": 1.9, + "learning_rate": 1.4982075322527546e-05, + "loss": 0.0084, + "step": 733030 + }, + { + "epoch": 1.9, + "learning_rate": 1.4978187106156082e-05, + "loss": 0.0079, + "step": 733040 + }, + { + "epoch": 1.9, + "learning_rate": 1.4974298889784617e-05, + "loss": 0.0069, + "step": 733050 + }, + { + "epoch": 1.9, + "learning_rate": 1.4970410673413154e-05, + "loss": 0.0075, + "step": 733060 + }, + { + "epoch": 1.9, + "learning_rate": 1.4966522457041687e-05, + "loss": 0.0075, + "step": 733070 + }, + { + "epoch": 1.9, + "learning_rate": 1.4962634240670224e-05, + "loss": 0.0069, + "step": 733080 + }, + { + "epoch": 1.9, + "learning_rate": 1.4958746024298758e-05, + "loss": 0.009, + "step": 733090 + }, + { + "epoch": 1.9, + "learning_rate": 1.4954857807927295e-05, + "loss": 0.0064, + "step": 733100 + }, + { + "epoch": 1.9, + "learning_rate": 1.495096959155583e-05, + "loss": 0.0059, + "step": 733110 + }, + { + "epoch": 1.9, + "learning_rate": 1.4947081375184366e-05, + "loss": 0.0071, + "step": 733120 + }, + { + "epoch": 1.9, + "learning_rate": 1.49431931588129e-05, + "loss": 0.0078, + "step": 733130 + }, + { + "epoch": 1.9, + "learning_rate": 1.4939304942441434e-05, + "loss": 0.0067, + "step": 733140 + }, + { + "epoch": 1.9, + "learning_rate": 1.4935416726069971e-05, + "loss": 0.0064, + "step": 733150 + }, + { + "epoch": 1.9, + "learning_rate": 1.4931528509698506e-05, + "loss": 0.0056, + "step": 733160 + }, + { + "epoch": 1.9, + "learning_rate": 1.4927640293327042e-05, + "loss": 0.006, + "step": 733170 + }, + { + "epoch": 1.9, + "learning_rate": 1.4923752076955577e-05, + "loss": 0.0056, + "step": 733180 + }, + { + "epoch": 1.9, + "learning_rate": 1.4919863860584112e-05, + "loss": 0.0061, + "step": 733190 + }, + { + "epoch": 1.9, + "learning_rate": 1.4915975644212647e-05, + "loss": 0.0056, + "step": 733200 + }, + { + "epoch": 1.9, + "learning_rate": 1.4912087427841183e-05, + "loss": 0.0064, + "step": 733210 + }, + { + "epoch": 1.9, + "learning_rate": 1.4908199211469718e-05, + "loss": 0.0081, + "step": 733220 + }, + { + "epoch": 1.9, + "learning_rate": 1.4904310995098255e-05, + "loss": 0.0062, + "step": 733230 + }, + { + "epoch": 1.9, + "learning_rate": 1.490042277872679e-05, + "loss": 0.0064, + "step": 733240 + }, + { + "epoch": 1.9, + "learning_rate": 1.4896534562355323e-05, + "loss": 0.0078, + "step": 733250 + }, + { + "epoch": 1.9, + "learning_rate": 1.489264634598386e-05, + "loss": 0.0048, + "step": 733260 + }, + { + "epoch": 1.9, + "learning_rate": 1.4888758129612394e-05, + "loss": 0.009, + "step": 733270 + }, + { + "epoch": 1.9, + "learning_rate": 1.4884869913240931e-05, + "loss": 0.0081, + "step": 733280 + }, + { + "epoch": 1.9, + "learning_rate": 1.4880981696869466e-05, + "loss": 0.008, + "step": 733290 + }, + { + "epoch": 1.9, + "learning_rate": 1.4877093480498002e-05, + "loss": 0.0079, + "step": 733300 + }, + { + "epoch": 1.9, + "learning_rate": 1.4873205264126537e-05, + "loss": 0.0072, + "step": 733310 + }, + { + "epoch": 1.9, + "learning_rate": 1.4869317047755072e-05, + "loss": 0.008, + "step": 733320 + }, + { + "epoch": 1.9, + "learning_rate": 1.4865428831383607e-05, + "loss": 0.005, + "step": 733330 + }, + { + "epoch": 1.9, + "learning_rate": 1.4861540615012143e-05, + "loss": 0.0076, + "step": 733340 + }, + { + "epoch": 1.9, + "learning_rate": 1.4857652398640678e-05, + "loss": 0.0107, + "step": 733350 + }, + { + "epoch": 1.9, + "learning_rate": 1.4853764182269215e-05, + "loss": 0.0055, + "step": 733360 + }, + { + "epoch": 1.9, + "learning_rate": 1.484987596589775e-05, + "loss": 0.0072, + "step": 733370 + }, + { + "epoch": 1.9, + "learning_rate": 1.4845987749526283e-05, + "loss": 0.0065, + "step": 733380 + }, + { + "epoch": 1.9, + "learning_rate": 1.484209953315482e-05, + "loss": 0.0066, + "step": 733390 + }, + { + "epoch": 1.9, + "learning_rate": 1.4838211316783354e-05, + "loss": 0.0066, + "step": 733400 + }, + { + "epoch": 1.9, + "learning_rate": 1.4834323100411891e-05, + "loss": 0.0067, + "step": 733410 + }, + { + "epoch": 1.9, + "learning_rate": 1.4830434884040426e-05, + "loss": 0.0062, + "step": 733420 + }, + { + "epoch": 1.9, + "learning_rate": 1.4826546667668962e-05, + "loss": 0.0054, + "step": 733430 + }, + { + "epoch": 1.9, + "learning_rate": 1.4822658451297495e-05, + "loss": 0.0079, + "step": 733440 + }, + { + "epoch": 1.9, + "learning_rate": 1.4818770234926032e-05, + "loss": 0.009, + "step": 733450 + }, + { + "epoch": 1.9, + "learning_rate": 1.4814882018554567e-05, + "loss": 0.0062, + "step": 733460 + }, + { + "epoch": 1.9, + "learning_rate": 1.4810993802183103e-05, + "loss": 0.0059, + "step": 733470 + }, + { + "epoch": 1.9, + "learning_rate": 1.4807105585811638e-05, + "loss": 0.0064, + "step": 733480 + }, + { + "epoch": 1.9, + "learning_rate": 1.4803217369440175e-05, + "loss": 0.0076, + "step": 733490 + }, + { + "epoch": 1.9, + "learning_rate": 1.4799329153068708e-05, + "loss": 0.0063, + "step": 733500 + }, + { + "epoch": 1.9, + "learning_rate": 1.4795440936697243e-05, + "loss": 0.0083, + "step": 733510 + }, + { + "epoch": 1.9, + "learning_rate": 1.479155272032578e-05, + "loss": 0.0061, + "step": 733520 + }, + { + "epoch": 1.9, + "learning_rate": 1.4787664503954314e-05, + "loss": 0.0064, + "step": 733530 + }, + { + "epoch": 1.9, + "learning_rate": 1.4783776287582851e-05, + "loss": 0.0041, + "step": 733540 + }, + { + "epoch": 1.9, + "learning_rate": 1.4779888071211386e-05, + "loss": 0.0048, + "step": 733550 + }, + { + "epoch": 1.9, + "learning_rate": 1.477599985483992e-05, + "loss": 0.0073, + "step": 733560 + }, + { + "epoch": 1.9, + "learning_rate": 1.4772111638468455e-05, + "loss": 0.009, + "step": 733570 + }, + { + "epoch": 1.9, + "learning_rate": 1.4768223422096992e-05, + "loss": 0.0073, + "step": 733580 + }, + { + "epoch": 1.9, + "learning_rate": 1.4764335205725527e-05, + "loss": 0.0067, + "step": 733590 + }, + { + "epoch": 1.9, + "learning_rate": 1.4760446989354063e-05, + "loss": 0.0043, + "step": 733600 + }, + { + "epoch": 1.9, + "learning_rate": 1.4756558772982598e-05, + "loss": 0.0084, + "step": 733610 + }, + { + "epoch": 1.9, + "learning_rate": 1.4752670556611135e-05, + "loss": 0.006, + "step": 733620 + }, + { + "epoch": 1.9, + "learning_rate": 1.4748782340239668e-05, + "loss": 0.0051, + "step": 733630 + }, + { + "epoch": 1.9, + "learning_rate": 1.4744894123868203e-05, + "loss": 0.0078, + "step": 733640 + }, + { + "epoch": 1.9, + "learning_rate": 1.474100590749674e-05, + "loss": 0.0072, + "step": 733650 + }, + { + "epoch": 1.9, + "learning_rate": 1.4737117691125274e-05, + "loss": 0.0077, + "step": 733660 + }, + { + "epoch": 1.9, + "learning_rate": 1.473322947475381e-05, + "loss": 0.0075, + "step": 733670 + }, + { + "epoch": 1.9, + "learning_rate": 1.4729341258382346e-05, + "loss": 0.0077, + "step": 733680 + }, + { + "epoch": 1.9, + "learning_rate": 1.472545304201088e-05, + "loss": 0.0087, + "step": 733690 + }, + { + "epoch": 1.9, + "learning_rate": 1.4721564825639415e-05, + "loss": 0.0064, + "step": 733700 + }, + { + "epoch": 1.9, + "learning_rate": 1.4717676609267952e-05, + "loss": 0.0049, + "step": 733710 + }, + { + "epoch": 1.9, + "learning_rate": 1.4713788392896487e-05, + "loss": 0.0087, + "step": 733720 + }, + { + "epoch": 1.9, + "learning_rate": 1.4709900176525022e-05, + "loss": 0.0072, + "step": 733730 + }, + { + "epoch": 1.9, + "learning_rate": 1.4706011960153558e-05, + "loss": 0.0085, + "step": 733740 + }, + { + "epoch": 1.9, + "learning_rate": 1.4702123743782091e-05, + "loss": 0.008, + "step": 733750 + }, + { + "epoch": 1.9, + "learning_rate": 1.4698235527410628e-05, + "loss": 0.0062, + "step": 733760 + }, + { + "epoch": 1.9, + "learning_rate": 1.4694347311039163e-05, + "loss": 0.0082, + "step": 733770 + }, + { + "epoch": 1.9, + "learning_rate": 1.46904590946677e-05, + "loss": 0.0077, + "step": 733780 + }, + { + "epoch": 1.9, + "learning_rate": 1.4686570878296234e-05, + "loss": 0.0087, + "step": 733790 + }, + { + "epoch": 1.9, + "learning_rate": 1.468268266192477e-05, + "loss": 0.0059, + "step": 733800 + }, + { + "epoch": 1.9, + "learning_rate": 1.4678794445553304e-05, + "loss": 0.0053, + "step": 733810 + }, + { + "epoch": 1.9, + "learning_rate": 1.4674906229181839e-05, + "loss": 0.0079, + "step": 733820 + }, + { + "epoch": 1.9, + "learning_rate": 1.4671018012810375e-05, + "loss": 0.0088, + "step": 733830 + }, + { + "epoch": 1.9, + "learning_rate": 1.466712979643891e-05, + "loss": 0.0059, + "step": 733840 + }, + { + "epoch": 1.9, + "learning_rate": 1.4663241580067447e-05, + "loss": 0.0077, + "step": 733850 + }, + { + "epoch": 1.9, + "learning_rate": 1.4659353363695982e-05, + "loss": 0.0097, + "step": 733860 + }, + { + "epoch": 1.9, + "learning_rate": 1.4655465147324517e-05, + "loss": 0.0075, + "step": 733870 + }, + { + "epoch": 1.9, + "learning_rate": 1.4651576930953051e-05, + "loss": 0.0091, + "step": 733880 + }, + { + "epoch": 1.9, + "learning_rate": 1.4647688714581588e-05, + "loss": 0.0077, + "step": 733890 + }, + { + "epoch": 1.9, + "learning_rate": 1.4643800498210123e-05, + "loss": 0.007, + "step": 733900 + }, + { + "epoch": 1.9, + "learning_rate": 1.463991228183866e-05, + "loss": 0.007, + "step": 733910 + }, + { + "epoch": 1.9, + "learning_rate": 1.4636024065467194e-05, + "loss": 0.0069, + "step": 733920 + }, + { + "epoch": 1.9, + "learning_rate": 1.463213584909573e-05, + "loss": 0.0063, + "step": 733930 + }, + { + "epoch": 1.9, + "learning_rate": 1.4628247632724264e-05, + "loss": 0.0057, + "step": 733940 + }, + { + "epoch": 1.9, + "learning_rate": 1.4624359416352799e-05, + "loss": 0.0158, + "step": 733950 + }, + { + "epoch": 1.9, + "learning_rate": 1.4620471199981335e-05, + "loss": 0.0068, + "step": 733960 + }, + { + "epoch": 1.9, + "learning_rate": 1.461658298360987e-05, + "loss": 0.0057, + "step": 733970 + }, + { + "epoch": 1.9, + "learning_rate": 1.4612694767238407e-05, + "loss": 0.0065, + "step": 733980 + }, + { + "epoch": 1.9, + "learning_rate": 1.4608806550866942e-05, + "loss": 0.0094, + "step": 733990 + }, + { + "epoch": 1.9, + "learning_rate": 1.4604918334495477e-05, + "loss": 0.0072, + "step": 734000 + }, + { + "epoch": 1.9, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.0044957599602639675, + "eval_runtime": 107.9535, + "eval_samples_per_second": 18.526, + "eval_steps_per_second": 4.632, + "step": 734000 + }, + { + "epoch": 1.9, + "learning_rate": 1.4601030118124011e-05, + "loss": 0.0064, + "step": 734010 + }, + { + "epoch": 1.9, + "learning_rate": 1.4597141901752548e-05, + "loss": 0.011, + "step": 734020 + }, + { + "epoch": 1.9, + "learning_rate": 1.4593253685381083e-05, + "loss": 0.0067, + "step": 734030 + }, + { + "epoch": 1.9, + "learning_rate": 1.458936546900962e-05, + "loss": 0.0082, + "step": 734040 + }, + { + "epoch": 1.9, + "learning_rate": 1.4585477252638154e-05, + "loss": 0.0079, + "step": 734050 + }, + { + "epoch": 1.9, + "learning_rate": 1.4581589036266687e-05, + "loss": 0.0081, + "step": 734060 + }, + { + "epoch": 1.9, + "learning_rate": 1.4577700819895224e-05, + "loss": 0.008, + "step": 734070 + }, + { + "epoch": 1.9, + "learning_rate": 1.4573812603523759e-05, + "loss": 0.0085, + "step": 734080 + }, + { + "epoch": 1.9, + "learning_rate": 1.4569924387152295e-05, + "loss": 0.0061, + "step": 734090 + }, + { + "epoch": 1.9, + "learning_rate": 1.456603617078083e-05, + "loss": 0.0077, + "step": 734100 + }, + { + "epoch": 1.9, + "learning_rate": 1.4562147954409367e-05, + "loss": 0.0075, + "step": 734110 + }, + { + "epoch": 1.9, + "learning_rate": 1.45582597380379e-05, + "loss": 0.0085, + "step": 734120 + }, + { + "epoch": 1.9, + "learning_rate": 1.4554371521666436e-05, + "loss": 0.0079, + "step": 734130 + }, + { + "epoch": 1.9, + "learning_rate": 1.4550483305294971e-05, + "loss": 0.0058, + "step": 734140 + }, + { + "epoch": 1.9, + "learning_rate": 1.4546595088923508e-05, + "loss": 0.008, + "step": 734150 + }, + { + "epoch": 1.9, + "learning_rate": 1.4542706872552043e-05, + "loss": 0.0063, + "step": 734160 + }, + { + "epoch": 1.9, + "learning_rate": 1.453881865618058e-05, + "loss": 0.0067, + "step": 734170 + }, + { + "epoch": 1.9, + "learning_rate": 1.4534930439809112e-05, + "loss": 0.0059, + "step": 734180 + }, + { + "epoch": 1.9, + "learning_rate": 1.4531042223437647e-05, + "loss": 0.0106, + "step": 734190 + }, + { + "epoch": 1.9, + "learning_rate": 1.4527154007066184e-05, + "loss": 0.0087, + "step": 734200 + }, + { + "epoch": 1.9, + "learning_rate": 1.4523265790694719e-05, + "loss": 0.0065, + "step": 734210 + }, + { + "epoch": 1.9, + "learning_rate": 1.4519377574323255e-05, + "loss": 0.0059, + "step": 734220 + }, + { + "epoch": 1.9, + "learning_rate": 1.451548935795179e-05, + "loss": 0.0062, + "step": 734230 + }, + { + "epoch": 1.9, + "learning_rate": 1.4511601141580327e-05, + "loss": 0.0065, + "step": 734240 + }, + { + "epoch": 1.9, + "learning_rate": 1.450771292520886e-05, + "loss": 0.0072, + "step": 734250 + }, + { + "epoch": 1.9, + "learning_rate": 1.4503824708837396e-05, + "loss": 0.0096, + "step": 734260 + }, + { + "epoch": 1.9, + "learning_rate": 1.4499936492465931e-05, + "loss": 0.007, + "step": 734270 + }, + { + "epoch": 1.9, + "learning_rate": 1.4496048276094468e-05, + "loss": 0.0061, + "step": 734280 + }, + { + "epoch": 1.9, + "learning_rate": 1.4492160059723003e-05, + "loss": 0.0086, + "step": 734290 + }, + { + "epoch": 1.9, + "learning_rate": 1.448827184335154e-05, + "loss": 0.006, + "step": 734300 + }, + { + "epoch": 1.9, + "learning_rate": 1.4484383626980072e-05, + "loss": 0.0107, + "step": 734310 + }, + { + "epoch": 1.9, + "learning_rate": 1.4480495410608607e-05, + "loss": 0.0055, + "step": 734320 + }, + { + "epoch": 1.9, + "learning_rate": 1.4476607194237144e-05, + "loss": 0.0068, + "step": 734330 + }, + { + "epoch": 1.9, + "learning_rate": 1.4472718977865679e-05, + "loss": 0.0066, + "step": 734340 + }, + { + "epoch": 1.9, + "learning_rate": 1.4468830761494215e-05, + "loss": 0.0069, + "step": 734350 + }, + { + "epoch": 1.9, + "learning_rate": 1.446494254512275e-05, + "loss": 0.0067, + "step": 734360 + }, + { + "epoch": 1.9, + "learning_rate": 1.4461054328751285e-05, + "loss": 0.0126, + "step": 734370 + }, + { + "epoch": 1.9, + "learning_rate": 1.445716611237982e-05, + "loss": 0.0074, + "step": 734380 + }, + { + "epoch": 1.9, + "learning_rate": 1.4453277896008356e-05, + "loss": 0.0075, + "step": 734390 + }, + { + "epoch": 1.9, + "learning_rate": 1.4449389679636891e-05, + "loss": 0.007, + "step": 734400 + }, + { + "epoch": 1.9, + "learning_rate": 1.4445501463265426e-05, + "loss": 0.0055, + "step": 734410 + }, + { + "epoch": 1.9, + "learning_rate": 1.4441613246893963e-05, + "loss": 0.0096, + "step": 734420 + }, + { + "epoch": 1.9, + "learning_rate": 1.4437725030522496e-05, + "loss": 0.0091, + "step": 734430 + }, + { + "epoch": 1.9, + "learning_rate": 1.4433836814151032e-05, + "loss": 0.0063, + "step": 734440 + }, + { + "epoch": 1.9, + "learning_rate": 1.4429948597779567e-05, + "loss": 0.006, + "step": 734450 + }, + { + "epoch": 1.9, + "learning_rate": 1.4426060381408104e-05, + "loss": 0.0084, + "step": 734460 + }, + { + "epoch": 1.9, + "learning_rate": 1.4422172165036639e-05, + "loss": 0.0052, + "step": 734470 + }, + { + "epoch": 1.9, + "learning_rate": 1.4418283948665175e-05, + "loss": 0.01, + "step": 734480 + }, + { + "epoch": 1.9, + "learning_rate": 1.4414395732293708e-05, + "loss": 0.0162, + "step": 734490 + }, + { + "epoch": 1.9, + "learning_rate": 1.4410507515922243e-05, + "loss": 0.0057, + "step": 734500 + }, + { + "epoch": 1.9, + "learning_rate": 1.440661929955078e-05, + "loss": 0.0071, + "step": 734510 + }, + { + "epoch": 1.9, + "learning_rate": 1.4402731083179315e-05, + "loss": 0.0094, + "step": 734520 + }, + { + "epoch": 1.9, + "learning_rate": 1.4398842866807851e-05, + "loss": 0.0087, + "step": 734530 + }, + { + "epoch": 1.9, + "learning_rate": 1.4394954650436386e-05, + "loss": 0.0087, + "step": 734540 + }, + { + "epoch": 1.9, + "learning_rate": 1.4391066434064923e-05, + "loss": 0.007, + "step": 734550 + }, + { + "epoch": 1.9, + "learning_rate": 1.4387178217693456e-05, + "loss": 0.0084, + "step": 734560 + }, + { + "epoch": 1.9, + "learning_rate": 1.4383290001321992e-05, + "loss": 0.0068, + "step": 734570 + }, + { + "epoch": 1.9, + "learning_rate": 1.4379401784950527e-05, + "loss": 0.0067, + "step": 734580 + }, + { + "epoch": 1.9, + "learning_rate": 1.4375513568579064e-05, + "loss": 0.0063, + "step": 734590 + }, + { + "epoch": 1.9, + "learning_rate": 1.4371625352207599e-05, + "loss": 0.0053, + "step": 734600 + }, + { + "epoch": 1.9, + "learning_rate": 1.4367737135836135e-05, + "loss": 0.0069, + "step": 734610 + }, + { + "epoch": 1.9, + "learning_rate": 1.4363848919464668e-05, + "loss": 0.0053, + "step": 734620 + }, + { + "epoch": 1.9, + "learning_rate": 1.4359960703093203e-05, + "loss": 0.0066, + "step": 734630 + }, + { + "epoch": 1.9, + "learning_rate": 1.435607248672174e-05, + "loss": 0.0083, + "step": 734640 + }, + { + "epoch": 1.9, + "learning_rate": 1.4352184270350275e-05, + "loss": 0.0078, + "step": 734650 + }, + { + "epoch": 1.9, + "learning_rate": 1.4348296053978811e-05, + "loss": 0.0056, + "step": 734660 + }, + { + "epoch": 1.9, + "learning_rate": 1.4344407837607346e-05, + "loss": 0.0077, + "step": 734670 + }, + { + "epoch": 1.9, + "learning_rate": 1.4340519621235881e-05, + "loss": 0.0093, + "step": 734680 + }, + { + "epoch": 1.9, + "learning_rate": 1.4336631404864416e-05, + "loss": 0.0099, + "step": 734690 + }, + { + "epoch": 1.9, + "learning_rate": 1.4332743188492952e-05, + "loss": 0.0058, + "step": 734700 + }, + { + "epoch": 1.9, + "learning_rate": 1.4328854972121487e-05, + "loss": 0.0062, + "step": 734710 + }, + { + "epoch": 1.9, + "learning_rate": 1.4324966755750024e-05, + "loss": 0.0066, + "step": 734720 + }, + { + "epoch": 1.9, + "learning_rate": 1.4321078539378559e-05, + "loss": 0.0077, + "step": 734730 + }, + { + "epoch": 1.9, + "learning_rate": 1.4317190323007092e-05, + "loss": 0.006, + "step": 734740 + }, + { + "epoch": 1.9, + "learning_rate": 1.4313302106635628e-05, + "loss": 0.006, + "step": 734750 + }, + { + "epoch": 1.9, + "learning_rate": 1.4309413890264163e-05, + "loss": 0.0066, + "step": 734760 + }, + { + "epoch": 1.9, + "learning_rate": 1.43055256738927e-05, + "loss": 0.0075, + "step": 734770 + }, + { + "epoch": 1.9, + "learning_rate": 1.4301637457521235e-05, + "loss": 0.0059, + "step": 734780 + }, + { + "epoch": 1.9, + "learning_rate": 1.4297749241149771e-05, + "loss": 0.009, + "step": 734790 + }, + { + "epoch": 1.9, + "learning_rate": 1.4293861024778304e-05, + "loss": 0.009, + "step": 734800 + }, + { + "epoch": 1.9, + "learning_rate": 1.4289972808406841e-05, + "loss": 0.0056, + "step": 734810 + }, + { + "epoch": 1.9, + "learning_rate": 1.4286084592035376e-05, + "loss": 0.0069, + "step": 734820 + }, + { + "epoch": 1.9, + "learning_rate": 1.4282196375663912e-05, + "loss": 0.0039, + "step": 734830 + }, + { + "epoch": 1.9, + "learning_rate": 1.4278308159292447e-05, + "loss": 0.0046, + "step": 734840 + }, + { + "epoch": 1.9, + "learning_rate": 1.4274419942920984e-05, + "loss": 0.0062, + "step": 734850 + }, + { + "epoch": 1.9, + "learning_rate": 1.4270531726549519e-05, + "loss": 0.0077, + "step": 734860 + }, + { + "epoch": 1.9, + "learning_rate": 1.4266643510178052e-05, + "loss": 0.0079, + "step": 734870 + }, + { + "epoch": 1.9, + "learning_rate": 1.4262755293806588e-05, + "loss": 0.0074, + "step": 734880 + }, + { + "epoch": 1.9, + "learning_rate": 1.4258867077435123e-05, + "loss": 0.0075, + "step": 734890 + }, + { + "epoch": 1.9, + "learning_rate": 1.425497886106366e-05, + "loss": 0.0082, + "step": 734900 + }, + { + "epoch": 1.9, + "learning_rate": 1.4251090644692195e-05, + "loss": 0.0048, + "step": 734910 + }, + { + "epoch": 1.91, + "learning_rate": 1.4247202428320731e-05, + "loss": 0.0075, + "step": 734920 + }, + { + "epoch": 1.91, + "learning_rate": 1.4243314211949264e-05, + "loss": 0.0066, + "step": 734930 + }, + { + "epoch": 1.91, + "learning_rate": 1.4239425995577801e-05, + "loss": 0.0073, + "step": 734940 + }, + { + "epoch": 1.91, + "learning_rate": 1.4235537779206336e-05, + "loss": 0.0059, + "step": 734950 + }, + { + "epoch": 1.91, + "learning_rate": 1.4231649562834872e-05, + "loss": 0.0079, + "step": 734960 + }, + { + "epoch": 1.91, + "learning_rate": 1.4227761346463407e-05, + "loss": 0.0077, + "step": 734970 + }, + { + "epoch": 1.91, + "learning_rate": 1.4223873130091944e-05, + "loss": 0.0063, + "step": 734980 + }, + { + "epoch": 1.91, + "learning_rate": 1.4219984913720477e-05, + "loss": 0.0045, + "step": 734990 + }, + { + "epoch": 1.91, + "learning_rate": 1.4216096697349012e-05, + "loss": 0.0104, + "step": 735000 + }, + { + "epoch": 1.91, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.004462803713977337, + "eval_runtime": 108.0687, + "eval_samples_per_second": 18.507, + "eval_steps_per_second": 4.627, + "step": 735000 + }, + { + "epoch": 1.91, + "learning_rate": 1.4212208480977548e-05, + "loss": 0.0057, + "step": 735010 + }, + { + "epoch": 1.91, + "learning_rate": 1.4208320264606083e-05, + "loss": 0.0098, + "step": 735020 + }, + { + "epoch": 1.91, + "learning_rate": 1.420443204823462e-05, + "loss": 0.006, + "step": 735030 + }, + { + "epoch": 1.91, + "learning_rate": 1.4200543831863155e-05, + "loss": 0.01, + "step": 735040 + }, + { + "epoch": 1.91, + "learning_rate": 1.419665561549169e-05, + "loss": 0.0084, + "step": 735050 + }, + { + "epoch": 1.91, + "learning_rate": 1.4192767399120224e-05, + "loss": 0.0058, + "step": 735060 + }, + { + "epoch": 1.91, + "learning_rate": 1.4188879182748761e-05, + "loss": 0.0079, + "step": 735070 + }, + { + "epoch": 1.91, + "learning_rate": 1.4184990966377296e-05, + "loss": 0.0076, + "step": 735080 + }, + { + "epoch": 1.91, + "learning_rate": 1.4181102750005832e-05, + "loss": 0.007, + "step": 735090 + }, + { + "epoch": 1.91, + "learning_rate": 1.4177214533634367e-05, + "loss": 0.0091, + "step": 735100 + }, + { + "epoch": 1.91, + "learning_rate": 1.41733263172629e-05, + "loss": 0.0063, + "step": 735110 + }, + { + "epoch": 1.91, + "learning_rate": 1.4169438100891437e-05, + "loss": 0.0082, + "step": 735120 + }, + { + "epoch": 1.91, + "learning_rate": 1.4165549884519972e-05, + "loss": 0.0058, + "step": 735130 + }, + { + "epoch": 1.91, + "learning_rate": 1.4161661668148508e-05, + "loss": 0.0067, + "step": 735140 + }, + { + "epoch": 1.91, + "learning_rate": 1.4157773451777043e-05, + "loss": 0.0089, + "step": 735150 + }, + { + "epoch": 1.91, + "learning_rate": 1.415388523540558e-05, + "loss": 0.0073, + "step": 735160 + }, + { + "epoch": 1.91, + "learning_rate": 1.4149997019034115e-05, + "loss": 0.0066, + "step": 735170 + }, + { + "epoch": 1.91, + "learning_rate": 1.4146108802662648e-05, + "loss": 0.0079, + "step": 735180 + }, + { + "epoch": 1.91, + "learning_rate": 1.4142220586291184e-05, + "loss": 0.0063, + "step": 735190 + }, + { + "epoch": 1.91, + "learning_rate": 1.413833236991972e-05, + "loss": 0.0076, + "step": 735200 + }, + { + "epoch": 1.91, + "learning_rate": 1.4134444153548256e-05, + "loss": 0.0055, + "step": 735210 + }, + { + "epoch": 1.91, + "learning_rate": 1.413055593717679e-05, + "loss": 0.0058, + "step": 735220 + }, + { + "epoch": 1.91, + "learning_rate": 1.4126667720805327e-05, + "loss": 0.0077, + "step": 735230 + }, + { + "epoch": 1.91, + "learning_rate": 1.412277950443386e-05, + "loss": 0.0094, + "step": 735240 + }, + { + "epoch": 1.91, + "learning_rate": 1.4118891288062397e-05, + "loss": 0.0045, + "step": 735250 + }, + { + "epoch": 1.91, + "learning_rate": 1.4115003071690932e-05, + "loss": 0.0069, + "step": 735260 + }, + { + "epoch": 1.91, + "learning_rate": 1.4111114855319468e-05, + "loss": 0.0086, + "step": 735270 + }, + { + "epoch": 1.91, + "learning_rate": 1.4107226638948003e-05, + "loss": 0.008, + "step": 735280 + }, + { + "epoch": 1.91, + "learning_rate": 1.410333842257654e-05, + "loss": 0.0089, + "step": 735290 + }, + { + "epoch": 1.91, + "learning_rate": 1.4099450206205073e-05, + "loss": 0.0066, + "step": 735300 + }, + { + "epoch": 1.91, + "learning_rate": 1.4095561989833608e-05, + "loss": 0.0059, + "step": 735310 + }, + { + "epoch": 1.91, + "learning_rate": 1.4091673773462144e-05, + "loss": 0.0078, + "step": 735320 + }, + { + "epoch": 1.91, + "learning_rate": 1.408778555709068e-05, + "loss": 0.0084, + "step": 735330 + }, + { + "epoch": 1.91, + "learning_rate": 1.4083897340719216e-05, + "loss": 0.0094, + "step": 735340 + }, + { + "epoch": 1.91, + "learning_rate": 1.408000912434775e-05, + "loss": 0.006, + "step": 735350 + }, + { + "epoch": 1.91, + "learning_rate": 1.4076120907976285e-05, + "loss": 0.0072, + "step": 735360 + }, + { + "epoch": 1.91, + "learning_rate": 1.407223269160482e-05, + "loss": 0.0077, + "step": 735370 + }, + { + "epoch": 1.91, + "learning_rate": 1.4068344475233357e-05, + "loss": 0.0093, + "step": 735380 + }, + { + "epoch": 1.91, + "learning_rate": 1.4064456258861892e-05, + "loss": 0.005, + "step": 735390 + }, + { + "epoch": 1.91, + "learning_rate": 1.4060568042490428e-05, + "loss": 0.0069, + "step": 735400 + }, + { + "epoch": 1.91, + "learning_rate": 1.4056679826118963e-05, + "loss": 0.0058, + "step": 735410 + }, + { + "epoch": 1.91, + "learning_rate": 1.4052791609747496e-05, + "loss": 0.0079, + "step": 735420 + }, + { + "epoch": 1.91, + "learning_rate": 1.4048903393376033e-05, + "loss": 0.0056, + "step": 735430 + }, + { + "epoch": 1.91, + "learning_rate": 1.4045015177004568e-05, + "loss": 0.0067, + "step": 735440 + }, + { + "epoch": 1.91, + "learning_rate": 1.4041126960633104e-05, + "loss": 0.0073, + "step": 735450 + }, + { + "epoch": 1.91, + "learning_rate": 1.4037238744261639e-05, + "loss": 0.0093, + "step": 735460 + }, + { + "epoch": 1.91, + "learning_rate": 1.4033350527890176e-05, + "loss": 0.0091, + "step": 735470 + }, + { + "epoch": 1.91, + "learning_rate": 1.402946231151871e-05, + "loss": 0.0055, + "step": 735480 + }, + { + "epoch": 1.91, + "learning_rate": 1.4025574095147245e-05, + "loss": 0.0046, + "step": 735490 + }, + { + "epoch": 1.91, + "learning_rate": 1.402168587877578e-05, + "loss": 0.0085, + "step": 735500 + }, + { + "epoch": 1.91, + "learning_rate": 1.4017797662404317e-05, + "loss": 0.0075, + "step": 735510 + }, + { + "epoch": 1.91, + "learning_rate": 1.4013909446032852e-05, + "loss": 0.0083, + "step": 735520 + }, + { + "epoch": 1.91, + "learning_rate": 1.4010021229661388e-05, + "loss": 0.0065, + "step": 735530 + }, + { + "epoch": 1.91, + "learning_rate": 1.4006133013289923e-05, + "loss": 0.0059, + "step": 735540 + }, + { + "epoch": 1.91, + "learning_rate": 1.4002244796918456e-05, + "loss": 0.0066, + "step": 735550 + }, + { + "epoch": 1.91, + "learning_rate": 1.3998356580546993e-05, + "loss": 0.0066, + "step": 735560 + }, + { + "epoch": 1.91, + "learning_rate": 1.3994468364175528e-05, + "loss": 0.0056, + "step": 735570 + }, + { + "epoch": 1.91, + "learning_rate": 1.3990580147804064e-05, + "loss": 0.0062, + "step": 735580 + }, + { + "epoch": 1.91, + "learning_rate": 1.3986691931432599e-05, + "loss": 0.0113, + "step": 735590 + }, + { + "epoch": 1.91, + "learning_rate": 1.3982803715061136e-05, + "loss": 0.0092, + "step": 735600 + }, + { + "epoch": 1.91, + "learning_rate": 1.3978915498689669e-05, + "loss": 0.0063, + "step": 735610 + }, + { + "epoch": 1.91, + "learning_rate": 1.3975027282318205e-05, + "loss": 0.0065, + "step": 735620 + }, + { + "epoch": 1.91, + "learning_rate": 1.397113906594674e-05, + "loss": 0.008, + "step": 735630 + }, + { + "epoch": 1.91, + "learning_rate": 1.3967250849575277e-05, + "loss": 0.0087, + "step": 735640 + }, + { + "epoch": 1.91, + "learning_rate": 1.3963362633203812e-05, + "loss": 0.0071, + "step": 735650 + }, + { + "epoch": 1.91, + "learning_rate": 1.3959474416832348e-05, + "loss": 0.0068, + "step": 735660 + }, + { + "epoch": 1.91, + "learning_rate": 1.3955586200460881e-05, + "loss": 0.0071, + "step": 735670 + }, + { + "epoch": 1.91, + "learning_rate": 1.3951697984089416e-05, + "loss": 0.0073, + "step": 735680 + }, + { + "epoch": 1.91, + "learning_rate": 1.3947809767717953e-05, + "loss": 0.0059, + "step": 735690 + }, + { + "epoch": 1.91, + "learning_rate": 1.3943921551346488e-05, + "loss": 0.0086, + "step": 735700 + }, + { + "epoch": 1.91, + "learning_rate": 1.3940033334975024e-05, + "loss": 0.0077, + "step": 735710 + }, + { + "epoch": 1.91, + "learning_rate": 1.3936145118603559e-05, + "loss": 0.0081, + "step": 735720 + }, + { + "epoch": 1.91, + "learning_rate": 1.3932256902232094e-05, + "loss": 0.0079, + "step": 735730 + }, + { + "epoch": 1.91, + "learning_rate": 1.3928368685860629e-05, + "loss": 0.0097, + "step": 735740 + }, + { + "epoch": 1.91, + "learning_rate": 1.3924480469489165e-05, + "loss": 0.0058, + "step": 735750 + }, + { + "epoch": 1.91, + "learning_rate": 1.39205922531177e-05, + "loss": 0.0081, + "step": 735760 + }, + { + "epoch": 1.91, + "learning_rate": 1.3916704036746237e-05, + "loss": 0.0067, + "step": 735770 + }, + { + "epoch": 1.91, + "learning_rate": 1.3912815820374772e-05, + "loss": 0.0068, + "step": 735780 + }, + { + "epoch": 1.91, + "learning_rate": 1.3908927604003307e-05, + "loss": 0.0078, + "step": 735790 + }, + { + "epoch": 1.91, + "learning_rate": 1.3905039387631841e-05, + "loss": 0.0057, + "step": 735800 + }, + { + "epoch": 1.91, + "learning_rate": 1.3901151171260376e-05, + "loss": 0.0063, + "step": 735810 + }, + { + "epoch": 1.91, + "learning_rate": 1.3897262954888913e-05, + "loss": 0.0072, + "step": 735820 + }, + { + "epoch": 1.91, + "learning_rate": 1.3893374738517448e-05, + "loss": 0.0063, + "step": 735830 + }, + { + "epoch": 1.91, + "learning_rate": 1.3889486522145984e-05, + "loss": 0.0088, + "step": 735840 + }, + { + "epoch": 1.91, + "learning_rate": 1.3885598305774519e-05, + "loss": 0.0097, + "step": 735850 + }, + { + "epoch": 1.91, + "learning_rate": 1.3881710089403052e-05, + "loss": 0.0079, + "step": 735860 + }, + { + "epoch": 1.91, + "learning_rate": 1.3877821873031589e-05, + "loss": 0.0065, + "step": 735870 + }, + { + "epoch": 1.91, + "learning_rate": 1.3873933656660124e-05, + "loss": 0.0093, + "step": 735880 + }, + { + "epoch": 1.91, + "learning_rate": 1.387004544028866e-05, + "loss": 0.0073, + "step": 735890 + }, + { + "epoch": 1.91, + "learning_rate": 1.3866157223917195e-05, + "loss": 0.0091, + "step": 735900 + }, + { + "epoch": 1.91, + "learning_rate": 1.3862269007545732e-05, + "loss": 0.0066, + "step": 735910 + }, + { + "epoch": 1.91, + "learning_rate": 1.3858380791174265e-05, + "loss": 0.0048, + "step": 735920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3854492574802801e-05, + "loss": 0.0065, + "step": 735930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3850604358431336e-05, + "loss": 0.0068, + "step": 735940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3846716142059873e-05, + "loss": 0.0091, + "step": 735950 + }, + { + "epoch": 1.91, + "learning_rate": 1.3842827925688408e-05, + "loss": 0.0064, + "step": 735960 + }, + { + "epoch": 1.91, + "learning_rate": 1.3838939709316944e-05, + "loss": 0.0064, + "step": 735970 + }, + { + "epoch": 1.91, + "learning_rate": 1.3835051492945477e-05, + "loss": 0.0082, + "step": 735980 + }, + { + "epoch": 1.91, + "learning_rate": 1.3831163276574012e-05, + "loss": 0.0101, + "step": 735990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3827275060202549e-05, + "loss": 0.0074, + "step": 736000 + }, + { + "epoch": 1.91, + "eval_cer": 0.8816550986674057, + "eval_loss": 0.004494575317949057, + "eval_runtime": 107.9239, + "eval_samples_per_second": 18.532, + "eval_steps_per_second": 4.633, + "step": 736000 + }, + { + "epoch": 1.91, + "learning_rate": 1.3823386843831084e-05, + "loss": 0.0083, + "step": 736010 + }, + { + "epoch": 1.91, + "learning_rate": 1.381949862745962e-05, + "loss": 0.0069, + "step": 736020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3815610411088155e-05, + "loss": 0.0076, + "step": 736030 + }, + { + "epoch": 1.91, + "learning_rate": 1.381172219471669e-05, + "loss": 0.008, + "step": 736040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3807833978345225e-05, + "loss": 0.0088, + "step": 736050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3803945761973761e-05, + "loss": 0.0073, + "step": 736060 + }, + { + "epoch": 1.91, + "learning_rate": 1.3800057545602296e-05, + "loss": 0.0077, + "step": 736070 + }, + { + "epoch": 1.91, + "learning_rate": 1.3796169329230833e-05, + "loss": 0.0084, + "step": 736080 + }, + { + "epoch": 1.91, + "learning_rate": 1.3792281112859368e-05, + "loss": 0.0082, + "step": 736090 + }, + { + "epoch": 1.91, + "learning_rate": 1.3788392896487904e-05, + "loss": 0.0047, + "step": 736100 + }, + { + "epoch": 1.91, + "learning_rate": 1.3784504680116437e-05, + "loss": 0.0073, + "step": 736110 + }, + { + "epoch": 1.91, + "learning_rate": 1.3780616463744972e-05, + "loss": 0.0079, + "step": 736120 + }, + { + "epoch": 1.91, + "learning_rate": 1.3776728247373509e-05, + "loss": 0.0066, + "step": 736130 + }, + { + "epoch": 1.91, + "learning_rate": 1.3772840031002044e-05, + "loss": 0.0067, + "step": 736140 + }, + { + "epoch": 1.91, + "learning_rate": 1.376895181463058e-05, + "loss": 0.0061, + "step": 736150 + }, + { + "epoch": 1.91, + "learning_rate": 1.3765063598259115e-05, + "loss": 0.0055, + "step": 736160 + }, + { + "epoch": 1.91, + "learning_rate": 1.376117538188765e-05, + "loss": 0.0085, + "step": 736170 + }, + { + "epoch": 1.91, + "learning_rate": 1.3757287165516185e-05, + "loss": 0.0096, + "step": 736180 + }, + { + "epoch": 1.91, + "learning_rate": 1.3753398949144721e-05, + "loss": 0.0099, + "step": 736190 + }, + { + "epoch": 1.91, + "learning_rate": 1.3749510732773256e-05, + "loss": 0.0087, + "step": 736200 + }, + { + "epoch": 1.91, + "learning_rate": 1.3745622516401793e-05, + "loss": 0.0071, + "step": 736210 + }, + { + "epoch": 1.91, + "learning_rate": 1.3741734300030328e-05, + "loss": 0.0087, + "step": 736220 + }, + { + "epoch": 1.91, + "learning_rate": 1.373784608365886e-05, + "loss": 0.0081, + "step": 736230 + }, + { + "epoch": 1.91, + "learning_rate": 1.3733957867287397e-05, + "loss": 0.0075, + "step": 736240 + }, + { + "epoch": 1.91, + "learning_rate": 1.3730069650915932e-05, + "loss": 0.0071, + "step": 736250 + }, + { + "epoch": 1.91, + "learning_rate": 1.3726181434544469e-05, + "loss": 0.0068, + "step": 736260 + }, + { + "epoch": 1.91, + "learning_rate": 1.3722293218173004e-05, + "loss": 0.0076, + "step": 736270 + }, + { + "epoch": 1.91, + "learning_rate": 1.371840500180154e-05, + "loss": 0.0067, + "step": 736280 + }, + { + "epoch": 1.91, + "learning_rate": 1.3714516785430073e-05, + "loss": 0.007, + "step": 736290 + }, + { + "epoch": 1.91, + "learning_rate": 1.371062856905861e-05, + "loss": 0.0063, + "step": 736300 + }, + { + "epoch": 1.91, + "learning_rate": 1.3706740352687145e-05, + "loss": 0.0052, + "step": 736310 + }, + { + "epoch": 1.91, + "learning_rate": 1.3702852136315681e-05, + "loss": 0.0056, + "step": 736320 + }, + { + "epoch": 1.91, + "learning_rate": 1.3698963919944216e-05, + "loss": 0.0052, + "step": 736330 + }, + { + "epoch": 1.91, + "learning_rate": 1.3695075703572753e-05, + "loss": 0.0068, + "step": 736340 + }, + { + "epoch": 1.91, + "learning_rate": 1.3691187487201286e-05, + "loss": 0.0057, + "step": 736350 + }, + { + "epoch": 1.91, + "learning_rate": 1.368729927082982e-05, + "loss": 0.0061, + "step": 736360 + }, + { + "epoch": 1.91, + "learning_rate": 1.3683411054458357e-05, + "loss": 0.0073, + "step": 736370 + }, + { + "epoch": 1.91, + "learning_rate": 1.3679522838086892e-05, + "loss": 0.0052, + "step": 736380 + }, + { + "epoch": 1.91, + "learning_rate": 1.3675634621715429e-05, + "loss": 0.0054, + "step": 736390 + }, + { + "epoch": 1.91, + "learning_rate": 1.3671746405343964e-05, + "loss": 0.008, + "step": 736400 + }, + { + "epoch": 1.91, + "learning_rate": 1.36678581889725e-05, + "loss": 0.0049, + "step": 736410 + }, + { + "epoch": 1.91, + "learning_rate": 1.3663969972601033e-05, + "loss": 0.0086, + "step": 736420 + }, + { + "epoch": 1.91, + "learning_rate": 1.366008175622957e-05, + "loss": 0.0064, + "step": 736430 + }, + { + "epoch": 1.91, + "learning_rate": 1.3656193539858105e-05, + "loss": 0.0063, + "step": 736440 + }, + { + "epoch": 1.91, + "learning_rate": 1.3652305323486641e-05, + "loss": 0.0074, + "step": 736450 + }, + { + "epoch": 1.91, + "learning_rate": 1.3648417107115176e-05, + "loss": 0.0085, + "step": 736460 + }, + { + "epoch": 1.91, + "learning_rate": 1.3644528890743713e-05, + "loss": 0.0088, + "step": 736470 + }, + { + "epoch": 1.91, + "learning_rate": 1.3640640674372246e-05, + "loss": 0.0065, + "step": 736480 + }, + { + "epoch": 1.91, + "learning_rate": 1.363675245800078e-05, + "loss": 0.0082, + "step": 736490 + }, + { + "epoch": 1.91, + "learning_rate": 1.3632864241629317e-05, + "loss": 0.006, + "step": 736500 + }, + { + "epoch": 1.91, + "learning_rate": 1.3628976025257852e-05, + "loss": 0.009, + "step": 736510 + }, + { + "epoch": 1.91, + "learning_rate": 1.3625087808886389e-05, + "loss": 0.0078, + "step": 736520 + }, + { + "epoch": 1.91, + "learning_rate": 1.3621199592514924e-05, + "loss": 0.0068, + "step": 736530 + }, + { + "epoch": 1.91, + "learning_rate": 1.3617311376143458e-05, + "loss": 0.0082, + "step": 736540 + }, + { + "epoch": 1.91, + "learning_rate": 1.3613423159771993e-05, + "loss": 0.0061, + "step": 736550 + }, + { + "epoch": 1.91, + "learning_rate": 1.3609534943400528e-05, + "loss": 0.0043, + "step": 736560 + }, + { + "epoch": 1.91, + "learning_rate": 1.3605646727029065e-05, + "loss": 0.0066, + "step": 736570 + }, + { + "epoch": 1.91, + "learning_rate": 1.36017585106576e-05, + "loss": 0.0056, + "step": 736580 + }, + { + "epoch": 1.91, + "learning_rate": 1.3597870294286136e-05, + "loss": 0.0084, + "step": 736590 + }, + { + "epoch": 1.91, + "learning_rate": 1.359398207791467e-05, + "loss": 0.0083, + "step": 736600 + }, + { + "epoch": 1.91, + "learning_rate": 1.3590093861543206e-05, + "loss": 0.0071, + "step": 736610 + }, + { + "epoch": 1.91, + "learning_rate": 1.358620564517174e-05, + "loss": 0.0071, + "step": 736620 + }, + { + "epoch": 1.91, + "learning_rate": 1.3582317428800277e-05, + "loss": 0.0054, + "step": 736630 + }, + { + "epoch": 1.91, + "learning_rate": 1.3578429212428812e-05, + "loss": 0.0057, + "step": 736640 + }, + { + "epoch": 1.91, + "learning_rate": 1.3574540996057349e-05, + "loss": 0.0081, + "step": 736650 + }, + { + "epoch": 1.91, + "learning_rate": 1.3570652779685882e-05, + "loss": 0.0077, + "step": 736660 + }, + { + "epoch": 1.91, + "learning_rate": 1.3566764563314417e-05, + "loss": 0.0057, + "step": 736670 + }, + { + "epoch": 1.91, + "learning_rate": 1.3562876346942953e-05, + "loss": 0.0069, + "step": 736680 + }, + { + "epoch": 1.91, + "learning_rate": 1.3558988130571488e-05, + "loss": 0.0074, + "step": 736690 + }, + { + "epoch": 1.91, + "learning_rate": 1.3555099914200025e-05, + "loss": 0.0077, + "step": 736700 + }, + { + "epoch": 1.91, + "learning_rate": 1.355121169782856e-05, + "loss": 0.006, + "step": 736710 + }, + { + "epoch": 1.91, + "learning_rate": 1.3547323481457096e-05, + "loss": 0.0055, + "step": 736720 + }, + { + "epoch": 1.91, + "learning_rate": 1.354343526508563e-05, + "loss": 0.0055, + "step": 736730 + }, + { + "epoch": 1.91, + "learning_rate": 1.3539547048714166e-05, + "loss": 0.0067, + "step": 736740 + }, + { + "epoch": 1.91, + "learning_rate": 1.35356588323427e-05, + "loss": 0.0107, + "step": 736750 + }, + { + "epoch": 1.91, + "learning_rate": 1.3531770615971237e-05, + "loss": 0.0068, + "step": 736760 + }, + { + "epoch": 1.91, + "learning_rate": 1.3527882399599772e-05, + "loss": 0.007, + "step": 736770 + }, + { + "epoch": 1.91, + "learning_rate": 1.3523994183228309e-05, + "loss": 0.0066, + "step": 736780 + }, + { + "epoch": 1.91, + "learning_rate": 1.3520105966856842e-05, + "loss": 0.0059, + "step": 736790 + }, + { + "epoch": 1.91, + "learning_rate": 1.3516217750485377e-05, + "loss": 0.0089, + "step": 736800 + }, + { + "epoch": 1.91, + "learning_rate": 1.3512329534113913e-05, + "loss": 0.0072, + "step": 736810 + }, + { + "epoch": 1.91, + "learning_rate": 1.3508441317742448e-05, + "loss": 0.0082, + "step": 736820 + }, + { + "epoch": 1.91, + "learning_rate": 1.3504553101370985e-05, + "loss": 0.0113, + "step": 736830 + }, + { + "epoch": 1.91, + "learning_rate": 1.350066488499952e-05, + "loss": 0.0083, + "step": 736840 + }, + { + "epoch": 1.91, + "learning_rate": 1.3496776668628054e-05, + "loss": 0.0068, + "step": 736850 + }, + { + "epoch": 1.91, + "learning_rate": 1.349288845225659e-05, + "loss": 0.0045, + "step": 736860 + }, + { + "epoch": 1.91, + "learning_rate": 1.3489000235885126e-05, + "loss": 0.0065, + "step": 736870 + }, + { + "epoch": 1.91, + "learning_rate": 1.348511201951366e-05, + "loss": 0.0058, + "step": 736880 + }, + { + "epoch": 1.91, + "learning_rate": 1.3481223803142197e-05, + "loss": 0.0064, + "step": 736890 + }, + { + "epoch": 1.91, + "learning_rate": 1.3477335586770732e-05, + "loss": 0.0083, + "step": 736900 + }, + { + "epoch": 1.91, + "learning_rate": 1.3473447370399265e-05, + "loss": 0.0071, + "step": 736910 + }, + { + "epoch": 1.91, + "learning_rate": 1.3469559154027802e-05, + "loss": 0.0073, + "step": 736920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3465670937656337e-05, + "loss": 0.0075, + "step": 736930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3461782721284873e-05, + "loss": 0.0111, + "step": 736940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3457894504913408e-05, + "loss": 0.0068, + "step": 736950 + }, + { + "epoch": 1.91, + "learning_rate": 1.3454006288541945e-05, + "loss": 0.0067, + "step": 736960 + }, + { + "epoch": 1.91, + "learning_rate": 1.3450118072170478e-05, + "loss": 0.0078, + "step": 736970 + }, + { + "epoch": 1.91, + "learning_rate": 1.3446229855799014e-05, + "loss": 0.005, + "step": 736980 + }, + { + "epoch": 1.91, + "learning_rate": 1.344234163942755e-05, + "loss": 0.0102, + "step": 736990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3438453423056086e-05, + "loss": 0.0076, + "step": 737000 + }, + { + "epoch": 1.91, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.004480063449591398, + "eval_runtime": 107.9366, + "eval_samples_per_second": 18.529, + "eval_steps_per_second": 4.632, + "step": 737000 + }, + { + "epoch": 1.91, + "learning_rate": 1.343456520668462e-05, + "loss": 0.0063, + "step": 737010 + }, + { + "epoch": 1.91, + "learning_rate": 1.3430676990313157e-05, + "loss": 0.0056, + "step": 737020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3426788773941692e-05, + "loss": 0.0078, + "step": 737030 + }, + { + "epoch": 1.91, + "learning_rate": 1.3422900557570225e-05, + "loss": 0.0046, + "step": 737040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3419012341198762e-05, + "loss": 0.0082, + "step": 737050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3415124124827297e-05, + "loss": 0.0084, + "step": 737060 + }, + { + "epoch": 1.91, + "learning_rate": 1.3411235908455833e-05, + "loss": 0.0127, + "step": 737070 + }, + { + "epoch": 1.91, + "learning_rate": 1.3407347692084368e-05, + "loss": 0.0067, + "step": 737080 + }, + { + "epoch": 1.91, + "learning_rate": 1.3403459475712905e-05, + "loss": 0.0075, + "step": 737090 + }, + { + "epoch": 1.91, + "learning_rate": 1.3399571259341438e-05, + "loss": 0.0092, + "step": 737100 + }, + { + "epoch": 1.91, + "learning_rate": 1.3395683042969974e-05, + "loss": 0.006, + "step": 737110 + }, + { + "epoch": 1.91, + "learning_rate": 1.339179482659851e-05, + "loss": 0.006, + "step": 737120 + }, + { + "epoch": 1.91, + "learning_rate": 1.3387906610227046e-05, + "loss": 0.0054, + "step": 737130 + }, + { + "epoch": 1.91, + "learning_rate": 1.338401839385558e-05, + "loss": 0.0083, + "step": 737140 + }, + { + "epoch": 1.91, + "learning_rate": 1.3380130177484117e-05, + "loss": 0.0059, + "step": 737150 + }, + { + "epoch": 1.91, + "learning_rate": 1.337624196111265e-05, + "loss": 0.0052, + "step": 737160 + }, + { + "epoch": 1.91, + "learning_rate": 1.3372353744741185e-05, + "loss": 0.0074, + "step": 737170 + }, + { + "epoch": 1.91, + "learning_rate": 1.3368465528369722e-05, + "loss": 0.0053, + "step": 737180 + }, + { + "epoch": 1.91, + "learning_rate": 1.3364577311998257e-05, + "loss": 0.007, + "step": 737190 + }, + { + "epoch": 1.91, + "learning_rate": 1.3360689095626793e-05, + "loss": 0.0084, + "step": 737200 + }, + { + "epoch": 1.91, + "learning_rate": 1.3356800879255328e-05, + "loss": 0.006, + "step": 737210 + }, + { + "epoch": 1.91, + "learning_rate": 1.3352912662883863e-05, + "loss": 0.0068, + "step": 737220 + }, + { + "epoch": 1.91, + "learning_rate": 1.3349024446512398e-05, + "loss": 0.0093, + "step": 737230 + }, + { + "epoch": 1.91, + "learning_rate": 1.3345136230140933e-05, + "loss": 0.0071, + "step": 737240 + }, + { + "epoch": 1.91, + "learning_rate": 1.3341248013769469e-05, + "loss": 0.005, + "step": 737250 + }, + { + "epoch": 1.91, + "learning_rate": 1.3337359797398004e-05, + "loss": 0.0072, + "step": 737260 + }, + { + "epoch": 1.91, + "learning_rate": 1.333347158102654e-05, + "loss": 0.0073, + "step": 737270 + }, + { + "epoch": 1.91, + "learning_rate": 1.3329583364655074e-05, + "loss": 0.0067, + "step": 737280 + }, + { + "epoch": 1.91, + "learning_rate": 1.332569514828361e-05, + "loss": 0.0071, + "step": 737290 + }, + { + "epoch": 1.91, + "learning_rate": 1.3321806931912145e-05, + "loss": 0.0107, + "step": 737300 + }, + { + "epoch": 1.91, + "learning_rate": 1.3317918715540682e-05, + "loss": 0.0114, + "step": 737310 + }, + { + "epoch": 1.91, + "learning_rate": 1.3314030499169217e-05, + "loss": 0.0082, + "step": 737320 + }, + { + "epoch": 1.91, + "learning_rate": 1.3310142282797753e-05, + "loss": 0.0057, + "step": 737330 + }, + { + "epoch": 1.91, + "learning_rate": 1.3306254066426288e-05, + "loss": 0.0092, + "step": 737340 + }, + { + "epoch": 1.91, + "learning_rate": 1.3302365850054821e-05, + "loss": 0.0069, + "step": 737350 + }, + { + "epoch": 1.91, + "learning_rate": 1.3298477633683358e-05, + "loss": 0.0077, + "step": 737360 + }, + { + "epoch": 1.91, + "learning_rate": 1.3294589417311893e-05, + "loss": 0.0063, + "step": 737370 + }, + { + "epoch": 1.91, + "learning_rate": 1.3290701200940429e-05, + "loss": 0.01, + "step": 737380 + }, + { + "epoch": 1.91, + "learning_rate": 1.3286812984568964e-05, + "loss": 0.0055, + "step": 737390 + }, + { + "epoch": 1.91, + "learning_rate": 1.32829247681975e-05, + "loss": 0.0063, + "step": 737400 + }, + { + "epoch": 1.91, + "learning_rate": 1.3279036551826034e-05, + "loss": 0.0075, + "step": 737410 + }, + { + "epoch": 1.91, + "learning_rate": 1.327514833545457e-05, + "loss": 0.0065, + "step": 737420 + }, + { + "epoch": 1.91, + "learning_rate": 1.3271260119083105e-05, + "loss": 0.0075, + "step": 737430 + }, + { + "epoch": 1.91, + "learning_rate": 1.3267371902711642e-05, + "loss": 0.0087, + "step": 737440 + }, + { + "epoch": 1.91, + "learning_rate": 1.3263483686340177e-05, + "loss": 0.0061, + "step": 737450 + }, + { + "epoch": 1.91, + "learning_rate": 1.3259595469968713e-05, + "loss": 0.0088, + "step": 737460 + }, + { + "epoch": 1.91, + "learning_rate": 1.3255707253597246e-05, + "loss": 0.0071, + "step": 737470 + }, + { + "epoch": 1.91, + "learning_rate": 1.3251819037225781e-05, + "loss": 0.0057, + "step": 737480 + }, + { + "epoch": 1.91, + "learning_rate": 1.3247930820854318e-05, + "loss": 0.006, + "step": 737490 + }, + { + "epoch": 1.91, + "learning_rate": 1.3244042604482853e-05, + "loss": 0.0072, + "step": 737500 + }, + { + "epoch": 1.91, + "learning_rate": 1.3240154388111389e-05, + "loss": 0.0053, + "step": 737510 + }, + { + "epoch": 1.91, + "learning_rate": 1.3236266171739924e-05, + "loss": 0.0059, + "step": 737520 + }, + { + "epoch": 1.91, + "learning_rate": 1.3232377955368459e-05, + "loss": 0.0061, + "step": 737530 + }, + { + "epoch": 1.91, + "learning_rate": 1.3228489738996994e-05, + "loss": 0.009, + "step": 737540 + }, + { + "epoch": 1.91, + "learning_rate": 1.322460152262553e-05, + "loss": 0.007, + "step": 737550 + }, + { + "epoch": 1.91, + "learning_rate": 1.3220713306254065e-05, + "loss": 0.0073, + "step": 737560 + }, + { + "epoch": 1.91, + "learning_rate": 1.3216825089882602e-05, + "loss": 0.007, + "step": 737570 + }, + { + "epoch": 1.91, + "learning_rate": 1.3212936873511137e-05, + "loss": 0.0082, + "step": 737580 + }, + { + "epoch": 1.91, + "learning_rate": 1.320904865713967e-05, + "loss": 0.0076, + "step": 737590 + }, + { + "epoch": 1.91, + "learning_rate": 1.3205160440768206e-05, + "loss": 0.0072, + "step": 737600 + }, + { + "epoch": 1.91, + "learning_rate": 1.3201272224396741e-05, + "loss": 0.0071, + "step": 737610 + }, + { + "epoch": 1.91, + "learning_rate": 1.3197384008025278e-05, + "loss": 0.0073, + "step": 737620 + }, + { + "epoch": 1.91, + "learning_rate": 1.3193495791653813e-05, + "loss": 0.011, + "step": 737630 + }, + { + "epoch": 1.91, + "learning_rate": 1.3189607575282349e-05, + "loss": 0.0057, + "step": 737640 + }, + { + "epoch": 1.91, + "learning_rate": 1.3185719358910884e-05, + "loss": 0.0059, + "step": 737650 + }, + { + "epoch": 1.91, + "learning_rate": 1.3181831142539419e-05, + "loss": 0.0077, + "step": 737660 + }, + { + "epoch": 1.91, + "learning_rate": 1.3177942926167954e-05, + "loss": 0.0092, + "step": 737670 + }, + { + "epoch": 1.91, + "learning_rate": 1.317405470979649e-05, + "loss": 0.0062, + "step": 737680 + }, + { + "epoch": 1.91, + "learning_rate": 1.3170166493425025e-05, + "loss": 0.0077, + "step": 737690 + }, + { + "epoch": 1.91, + "learning_rate": 1.3166278277053562e-05, + "loss": 0.0072, + "step": 737700 + }, + { + "epoch": 1.91, + "learning_rate": 1.3162390060682096e-05, + "loss": 0.008, + "step": 737710 + }, + { + "epoch": 1.91, + "learning_rate": 1.315850184431063e-05, + "loss": 0.0049, + "step": 737720 + }, + { + "epoch": 1.91, + "learning_rate": 1.3154613627939166e-05, + "loss": 0.0049, + "step": 737730 + }, + { + "epoch": 1.91, + "learning_rate": 1.3150725411567701e-05, + "loss": 0.0078, + "step": 737740 + }, + { + "epoch": 1.91, + "learning_rate": 1.3146837195196238e-05, + "loss": 0.006, + "step": 737750 + }, + { + "epoch": 1.91, + "learning_rate": 1.3142948978824772e-05, + "loss": 0.0063, + "step": 737760 + }, + { + "epoch": 1.91, + "learning_rate": 1.3139060762453309e-05, + "loss": 0.0099, + "step": 737770 + }, + { + "epoch": 1.91, + "learning_rate": 1.3135172546081842e-05, + "loss": 0.0078, + "step": 737780 + }, + { + "epoch": 1.91, + "learning_rate": 1.3131284329710379e-05, + "loss": 0.0097, + "step": 737790 + }, + { + "epoch": 1.91, + "learning_rate": 1.3127396113338914e-05, + "loss": 0.0058, + "step": 737800 + }, + { + "epoch": 1.91, + "learning_rate": 1.312350789696745e-05, + "loss": 0.0079, + "step": 737810 + }, + { + "epoch": 1.91, + "learning_rate": 1.3119619680595985e-05, + "loss": 0.0089, + "step": 737820 + }, + { + "epoch": 1.91, + "learning_rate": 1.3115731464224522e-05, + "loss": 0.009, + "step": 737830 + }, + { + "epoch": 1.91, + "learning_rate": 1.3111843247853055e-05, + "loss": 0.0056, + "step": 737840 + }, + { + "epoch": 1.91, + "learning_rate": 1.310795503148159e-05, + "loss": 0.0078, + "step": 737850 + }, + { + "epoch": 1.91, + "learning_rate": 1.3104066815110126e-05, + "loss": 0.0048, + "step": 737860 + }, + { + "epoch": 1.91, + "learning_rate": 1.3100178598738661e-05, + "loss": 0.008, + "step": 737870 + }, + { + "epoch": 1.91, + "learning_rate": 1.3096290382367198e-05, + "loss": 0.007, + "step": 737880 + }, + { + "epoch": 1.91, + "learning_rate": 1.3092402165995732e-05, + "loss": 0.0065, + "step": 737890 + }, + { + "epoch": 1.91, + "learning_rate": 1.3088513949624269e-05, + "loss": 0.006, + "step": 737900 + }, + { + "epoch": 1.91, + "learning_rate": 1.3084625733252802e-05, + "loss": 0.0093, + "step": 737910 + }, + { + "epoch": 1.91, + "learning_rate": 1.3080737516881339e-05, + "loss": 0.0065, + "step": 737920 + }, + { + "epoch": 1.91, + "learning_rate": 1.3076849300509874e-05, + "loss": 0.0101, + "step": 737930 + }, + { + "epoch": 1.91, + "learning_rate": 1.3072961084138408e-05, + "loss": 0.0096, + "step": 737940 + }, + { + "epoch": 1.91, + "learning_rate": 1.3069072867766945e-05, + "loss": 0.0059, + "step": 737950 + }, + { + "epoch": 1.91, + "learning_rate": 1.306518465139548e-05, + "loss": 0.0077, + "step": 737960 + }, + { + "epoch": 1.91, + "learning_rate": 1.3061296435024015e-05, + "loss": 0.0067, + "step": 737970 + }, + { + "epoch": 1.91, + "learning_rate": 1.305740821865255e-05, + "loss": 0.0067, + "step": 737980 + }, + { + "epoch": 1.91, + "learning_rate": 1.3053520002281086e-05, + "loss": 0.0058, + "step": 737990 + }, + { + "epoch": 1.91, + "learning_rate": 1.3049631785909621e-05, + "loss": 0.0075, + "step": 738000 + }, + { + "epoch": 1.91, + "eval_cer": 0.8816536990304715, + "eval_loss": 0.004501659423112869, + "eval_runtime": 107.8766, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 738000 + }, + { + "epoch": 1.91, + "learning_rate": 1.3045743569538158e-05, + "loss": 0.0072, + "step": 738010 + }, + { + "epoch": 1.91, + "learning_rate": 1.3041855353166692e-05, + "loss": 0.0074, + "step": 738020 + }, + { + "epoch": 1.91, + "learning_rate": 1.3037967136795226e-05, + "loss": 0.0069, + "step": 738030 + }, + { + "epoch": 1.91, + "learning_rate": 1.3034078920423762e-05, + "loss": 0.0073, + "step": 738040 + }, + { + "epoch": 1.91, + "learning_rate": 1.3030190704052297e-05, + "loss": 0.0061, + "step": 738050 + }, + { + "epoch": 1.91, + "learning_rate": 1.3026302487680834e-05, + "loss": 0.0071, + "step": 738060 + }, + { + "epoch": 1.91, + "learning_rate": 1.3022414271309368e-05, + "loss": 0.0055, + "step": 738070 + }, + { + "epoch": 1.91, + "learning_rate": 1.3018526054937905e-05, + "loss": 0.0069, + "step": 738080 + }, + { + "epoch": 1.91, + "learning_rate": 1.3014637838566438e-05, + "loss": 0.0072, + "step": 738090 + }, + { + "epoch": 1.91, + "learning_rate": 1.3010749622194975e-05, + "loss": 0.0099, + "step": 738100 + }, + { + "epoch": 1.91, + "learning_rate": 1.300686140582351e-05, + "loss": 0.0075, + "step": 738110 + }, + { + "epoch": 1.91, + "learning_rate": 1.3002973189452046e-05, + "loss": 0.0074, + "step": 738120 + }, + { + "epoch": 1.91, + "learning_rate": 1.2999084973080581e-05, + "loss": 0.0085, + "step": 738130 + }, + { + "epoch": 1.91, + "learning_rate": 1.2995196756709118e-05, + "loss": 0.0059, + "step": 738140 + }, + { + "epoch": 1.91, + "learning_rate": 1.299130854033765e-05, + "loss": 0.0063, + "step": 738150 + }, + { + "epoch": 1.91, + "learning_rate": 1.2987420323966186e-05, + "loss": 0.0128, + "step": 738160 + }, + { + "epoch": 1.91, + "learning_rate": 1.2983532107594722e-05, + "loss": 0.0059, + "step": 738170 + }, + { + "epoch": 1.91, + "learning_rate": 1.2979643891223257e-05, + "loss": 0.0061, + "step": 738180 + }, + { + "epoch": 1.91, + "learning_rate": 1.2975755674851794e-05, + "loss": 0.0072, + "step": 738190 + }, + { + "epoch": 1.91, + "learning_rate": 1.2971867458480328e-05, + "loss": 0.0053, + "step": 738200 + }, + { + "epoch": 1.91, + "learning_rate": 1.2967979242108865e-05, + "loss": 0.0078, + "step": 738210 + }, + { + "epoch": 1.91, + "learning_rate": 1.2964091025737398e-05, + "loss": 0.0099, + "step": 738220 + }, + { + "epoch": 1.91, + "learning_rate": 1.2960202809365935e-05, + "loss": 0.0063, + "step": 738230 + }, + { + "epoch": 1.91, + "learning_rate": 1.295631459299447e-05, + "loss": 0.0069, + "step": 738240 + }, + { + "epoch": 1.91, + "learning_rate": 1.2952426376623006e-05, + "loss": 0.006, + "step": 738250 + }, + { + "epoch": 1.91, + "learning_rate": 1.2948538160251541e-05, + "loss": 0.0075, + "step": 738260 + }, + { + "epoch": 1.91, + "learning_rate": 1.2944649943880078e-05, + "loss": 0.0069, + "step": 738270 + }, + { + "epoch": 1.91, + "learning_rate": 1.294076172750861e-05, + "loss": 0.0087, + "step": 738280 + }, + { + "epoch": 1.91, + "learning_rate": 1.2936873511137146e-05, + "loss": 0.0071, + "step": 738290 + }, + { + "epoch": 1.91, + "learning_rate": 1.2932985294765682e-05, + "loss": 0.006, + "step": 738300 + }, + { + "epoch": 1.91, + "learning_rate": 1.2929097078394217e-05, + "loss": 0.0054, + "step": 738310 + }, + { + "epoch": 1.91, + "learning_rate": 1.2925208862022754e-05, + "loss": 0.0049, + "step": 738320 + }, + { + "epoch": 1.91, + "learning_rate": 1.2921320645651288e-05, + "loss": 0.0061, + "step": 738330 + }, + { + "epoch": 1.91, + "learning_rate": 1.2917432429279823e-05, + "loss": 0.0082, + "step": 738340 + }, + { + "epoch": 1.91, + "learning_rate": 1.2913544212908358e-05, + "loss": 0.0102, + "step": 738350 + }, + { + "epoch": 1.91, + "learning_rate": 1.2909655996536895e-05, + "loss": 0.0066, + "step": 738360 + }, + { + "epoch": 1.91, + "learning_rate": 1.290576778016543e-05, + "loss": 0.008, + "step": 738370 + }, + { + "epoch": 1.91, + "learning_rate": 1.2901879563793966e-05, + "loss": 0.0073, + "step": 738380 + }, + { + "epoch": 1.91, + "learning_rate": 1.2897991347422501e-05, + "loss": 0.0069, + "step": 738390 + }, + { + "epoch": 1.91, + "learning_rate": 1.2894103131051034e-05, + "loss": 0.0087, + "step": 738400 + }, + { + "epoch": 1.91, + "learning_rate": 1.289021491467957e-05, + "loss": 0.0067, + "step": 738410 + }, + { + "epoch": 1.91, + "learning_rate": 1.2886326698308106e-05, + "loss": 0.0068, + "step": 738420 + }, + { + "epoch": 1.91, + "learning_rate": 1.2882438481936642e-05, + "loss": 0.0064, + "step": 738430 + }, + { + "epoch": 1.91, + "learning_rate": 1.2878550265565177e-05, + "loss": 0.007, + "step": 738440 + }, + { + "epoch": 1.91, + "learning_rate": 1.2874662049193714e-05, + "loss": 0.0056, + "step": 738450 + }, + { + "epoch": 1.91, + "learning_rate": 1.2870773832822247e-05, + "loss": 0.0058, + "step": 738460 + }, + { + "epoch": 1.91, + "learning_rate": 1.2866885616450783e-05, + "loss": 0.0071, + "step": 738470 + }, + { + "epoch": 1.91, + "learning_rate": 1.2862997400079318e-05, + "loss": 0.0071, + "step": 738480 + }, + { + "epoch": 1.91, + "learning_rate": 1.2859109183707855e-05, + "loss": 0.0065, + "step": 738490 + }, + { + "epoch": 1.91, + "learning_rate": 1.285522096733639e-05, + "loss": 0.0057, + "step": 738500 + }, + { + "epoch": 1.91, + "learning_rate": 1.2851332750964926e-05, + "loss": 0.0093, + "step": 738510 + }, + { + "epoch": 1.91, + "learning_rate": 1.2847444534593461e-05, + "loss": 0.0053, + "step": 738520 + }, + { + "epoch": 1.91, + "learning_rate": 1.2843556318221994e-05, + "loss": 0.0089, + "step": 738530 + }, + { + "epoch": 1.91, + "learning_rate": 1.283966810185053e-05, + "loss": 0.0077, + "step": 738540 + }, + { + "epoch": 1.91, + "learning_rate": 1.2835779885479066e-05, + "loss": 0.0054, + "step": 738550 + }, + { + "epoch": 1.91, + "learning_rate": 1.2831891669107602e-05, + "loss": 0.0085, + "step": 738560 + }, + { + "epoch": 1.91, + "learning_rate": 1.2828003452736137e-05, + "loss": 0.0073, + "step": 738570 + }, + { + "epoch": 1.91, + "learning_rate": 1.2824115236364673e-05, + "loss": 0.0065, + "step": 738580 + }, + { + "epoch": 1.91, + "learning_rate": 1.2820227019993207e-05, + "loss": 0.0071, + "step": 738590 + }, + { + "epoch": 1.91, + "learning_rate": 1.2816338803621743e-05, + "loss": 0.0087, + "step": 738600 + }, + { + "epoch": 1.91, + "learning_rate": 1.2812450587250278e-05, + "loss": 0.0076, + "step": 738610 + }, + { + "epoch": 1.91, + "learning_rate": 1.2808562370878813e-05, + "loss": 0.0051, + "step": 738620 + }, + { + "epoch": 1.91, + "learning_rate": 1.280467415450735e-05, + "loss": 0.0083, + "step": 738630 + }, + { + "epoch": 1.91, + "learning_rate": 1.2800785938135884e-05, + "loss": 0.0061, + "step": 738640 + }, + { + "epoch": 1.91, + "learning_rate": 1.279689772176442e-05, + "loss": 0.0079, + "step": 738650 + }, + { + "epoch": 1.91, + "learning_rate": 1.2793009505392954e-05, + "loss": 0.0062, + "step": 738660 + }, + { + "epoch": 1.91, + "learning_rate": 1.278912128902149e-05, + "loss": 0.0057, + "step": 738670 + }, + { + "epoch": 1.91, + "learning_rate": 1.2785233072650025e-05, + "loss": 0.0054, + "step": 738680 + }, + { + "epoch": 1.91, + "learning_rate": 1.2781344856278562e-05, + "loss": 0.0074, + "step": 738690 + }, + { + "epoch": 1.91, + "learning_rate": 1.2777456639907097e-05, + "loss": 0.0067, + "step": 738700 + }, + { + "epoch": 1.91, + "learning_rate": 1.277356842353563e-05, + "loss": 0.0082, + "step": 738710 + }, + { + "epoch": 1.91, + "learning_rate": 1.2769680207164167e-05, + "loss": 0.0049, + "step": 738720 + }, + { + "epoch": 1.91, + "learning_rate": 1.2765791990792701e-05, + "loss": 0.0065, + "step": 738730 + }, + { + "epoch": 1.91, + "learning_rate": 1.2761903774421238e-05, + "loss": 0.0078, + "step": 738740 + }, + { + "epoch": 1.91, + "learning_rate": 1.2758015558049773e-05, + "loss": 0.0077, + "step": 738750 + }, + { + "epoch": 1.91, + "learning_rate": 1.275412734167831e-05, + "loss": 0.0096, + "step": 738760 + }, + { + "epoch": 1.91, + "learning_rate": 1.2750239125306843e-05, + "loss": 0.0069, + "step": 738770 + }, + { + "epoch": 1.92, + "learning_rate": 1.274635090893538e-05, + "loss": 0.0056, + "step": 738780 + }, + { + "epoch": 1.92, + "learning_rate": 1.2742462692563914e-05, + "loss": 0.0055, + "step": 738790 + }, + { + "epoch": 1.92, + "learning_rate": 1.273857447619245e-05, + "loss": 0.007, + "step": 738800 + }, + { + "epoch": 1.92, + "learning_rate": 1.2734686259820985e-05, + "loss": 0.0078, + "step": 738810 + }, + { + "epoch": 1.92, + "learning_rate": 1.2730798043449522e-05, + "loss": 0.007, + "step": 738820 + }, + { + "epoch": 1.92, + "learning_rate": 1.2726909827078057e-05, + "loss": 0.0064, + "step": 738830 + }, + { + "epoch": 1.92, + "learning_rate": 1.272302161070659e-05, + "loss": 0.0085, + "step": 738840 + }, + { + "epoch": 1.92, + "learning_rate": 1.2719133394335127e-05, + "loss": 0.0091, + "step": 738850 + }, + { + "epoch": 1.92, + "learning_rate": 1.2715245177963661e-05, + "loss": 0.0074, + "step": 738860 + }, + { + "epoch": 1.92, + "learning_rate": 1.2711356961592198e-05, + "loss": 0.0058, + "step": 738870 + }, + { + "epoch": 1.92, + "learning_rate": 1.2707468745220733e-05, + "loss": 0.0099, + "step": 738880 + }, + { + "epoch": 1.92, + "learning_rate": 1.270358052884927e-05, + "loss": 0.0079, + "step": 738890 + }, + { + "epoch": 1.92, + "learning_rate": 1.2699692312477803e-05, + "loss": 0.0053, + "step": 738900 + }, + { + "epoch": 1.92, + "learning_rate": 1.269580409610634e-05, + "loss": 0.0061, + "step": 738910 + }, + { + "epoch": 1.92, + "learning_rate": 1.2691915879734874e-05, + "loss": 0.006, + "step": 738920 + }, + { + "epoch": 1.92, + "learning_rate": 1.268802766336341e-05, + "loss": 0.01, + "step": 738930 + }, + { + "epoch": 1.92, + "learning_rate": 1.2684139446991945e-05, + "loss": 0.0073, + "step": 738940 + }, + { + "epoch": 1.92, + "learning_rate": 1.2680251230620482e-05, + "loss": 0.0067, + "step": 738950 + }, + { + "epoch": 1.92, + "learning_rate": 1.2676363014249015e-05, + "loss": 0.0082, + "step": 738960 + }, + { + "epoch": 1.92, + "learning_rate": 1.267247479787755e-05, + "loss": 0.0073, + "step": 738970 + }, + { + "epoch": 1.92, + "learning_rate": 1.2668586581506087e-05, + "loss": 0.0074, + "step": 738980 + }, + { + "epoch": 1.92, + "learning_rate": 1.2664698365134621e-05, + "loss": 0.0083, + "step": 738990 + }, + { + "epoch": 1.92, + "learning_rate": 1.2660810148763158e-05, + "loss": 0.0075, + "step": 739000 + }, + { + "epoch": 1.92, + "eval_cer": 0.8816592975782083, + "eval_loss": 0.004513974767178297, + "eval_runtime": 107.8813, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 739000 + }, + { + "epoch": 1.92, + "learning_rate": 1.2656921932391693e-05, + "loss": 0.008, + "step": 739010 + }, + { + "epoch": 1.92, + "learning_rate": 1.2653033716020228e-05, + "loss": 0.0059, + "step": 739020 + }, + { + "epoch": 1.92, + "learning_rate": 1.2649145499648763e-05, + "loss": 0.0075, + "step": 739030 + }, + { + "epoch": 1.92, + "learning_rate": 1.2645257283277299e-05, + "loss": 0.0052, + "step": 739040 + }, + { + "epoch": 1.92, + "learning_rate": 1.2641369066905834e-05, + "loss": 0.0087, + "step": 739050 + }, + { + "epoch": 1.92, + "learning_rate": 1.263748085053437e-05, + "loss": 0.0091, + "step": 739060 + }, + { + "epoch": 1.92, + "learning_rate": 1.2633592634162905e-05, + "loss": 0.0053, + "step": 739070 + }, + { + "epoch": 1.92, + "learning_rate": 1.2629704417791439e-05, + "loss": 0.0049, + "step": 739080 + }, + { + "epoch": 1.92, + "learning_rate": 1.2625816201419975e-05, + "loss": 0.0069, + "step": 739090 + }, + { + "epoch": 1.92, + "learning_rate": 1.262192798504851e-05, + "loss": 0.0079, + "step": 739100 + }, + { + "epoch": 1.92, + "learning_rate": 1.2618039768677047e-05, + "loss": 0.0062, + "step": 739110 + }, + { + "epoch": 1.92, + "learning_rate": 1.2614151552305581e-05, + "loss": 0.0082, + "step": 739120 + }, + { + "epoch": 1.92, + "learning_rate": 1.2610263335934118e-05, + "loss": 0.0058, + "step": 739130 + }, + { + "epoch": 1.92, + "learning_rate": 1.2606375119562653e-05, + "loss": 0.0079, + "step": 739140 + }, + { + "epoch": 1.92, + "learning_rate": 1.2602486903191188e-05, + "loss": 0.0055, + "step": 739150 + }, + { + "epoch": 1.92, + "learning_rate": 1.2598598686819723e-05, + "loss": 0.006, + "step": 739160 + }, + { + "epoch": 1.92, + "learning_rate": 1.2594710470448259e-05, + "loss": 0.0099, + "step": 739170 + }, + { + "epoch": 1.92, + "learning_rate": 1.2590822254076794e-05, + "loss": 0.0083, + "step": 739180 + }, + { + "epoch": 1.92, + "learning_rate": 1.258693403770533e-05, + "loss": 0.0075, + "step": 739190 + }, + { + "epoch": 1.92, + "learning_rate": 1.2583045821333865e-05, + "loss": 0.0064, + "step": 739200 + }, + { + "epoch": 1.92, + "learning_rate": 1.2579157604962399e-05, + "loss": 0.0089, + "step": 739210 + }, + { + "epoch": 1.92, + "learning_rate": 1.2575269388590935e-05, + "loss": 0.0062, + "step": 739220 + }, + { + "epoch": 1.92, + "learning_rate": 1.257138117221947e-05, + "loss": 0.0052, + "step": 739230 + }, + { + "epoch": 1.92, + "learning_rate": 1.2567492955848007e-05, + "loss": 0.0096, + "step": 739240 + }, + { + "epoch": 1.92, + "learning_rate": 1.2563604739476541e-05, + "loss": 0.0081, + "step": 739250 + }, + { + "epoch": 1.92, + "learning_rate": 1.2559716523105078e-05, + "loss": 0.0088, + "step": 739260 + }, + { + "epoch": 1.92, + "learning_rate": 1.2555828306733611e-05, + "loss": 0.0083, + "step": 739270 + }, + { + "epoch": 1.92, + "learning_rate": 1.2551940090362148e-05, + "loss": 0.0074, + "step": 739280 + }, + { + "epoch": 1.92, + "learning_rate": 1.2548051873990683e-05, + "loss": 0.0074, + "step": 739290 + }, + { + "epoch": 1.92, + "learning_rate": 1.2544163657619219e-05, + "loss": 0.0107, + "step": 739300 + }, + { + "epoch": 1.92, + "learning_rate": 1.2540275441247754e-05, + "loss": 0.0081, + "step": 739310 + }, + { + "epoch": 1.92, + "learning_rate": 1.2536387224876289e-05, + "loss": 0.0073, + "step": 739320 + }, + { + "epoch": 1.92, + "learning_rate": 1.2532499008504824e-05, + "loss": 0.0079, + "step": 739330 + }, + { + "epoch": 1.92, + "learning_rate": 1.2528610792133359e-05, + "loss": 0.0108, + "step": 739340 + }, + { + "epoch": 1.92, + "learning_rate": 1.2524722575761895e-05, + "loss": 0.0079, + "step": 739350 + }, + { + "epoch": 1.92, + "learning_rate": 1.252083435939043e-05, + "loss": 0.0085, + "step": 739360 + }, + { + "epoch": 1.92, + "learning_rate": 1.2516946143018967e-05, + "loss": 0.0121, + "step": 739370 + }, + { + "epoch": 1.92, + "learning_rate": 1.2513057926647501e-05, + "loss": 0.0069, + "step": 739380 + }, + { + "epoch": 1.92, + "learning_rate": 1.2509169710276035e-05, + "loss": 0.007, + "step": 739390 + }, + { + "epoch": 1.92, + "learning_rate": 1.2505281493904571e-05, + "loss": 0.0068, + "step": 739400 + }, + { + "epoch": 1.92, + "learning_rate": 1.2501393277533106e-05, + "loss": 0.0079, + "step": 739410 + }, + { + "epoch": 1.92, + "learning_rate": 1.2497505061161643e-05, + "loss": 0.007, + "step": 739420 + }, + { + "epoch": 1.92, + "learning_rate": 1.2493616844790177e-05, + "loss": 0.0063, + "step": 739430 + }, + { + "epoch": 1.92, + "learning_rate": 1.2489728628418714e-05, + "loss": 0.0088, + "step": 739440 + }, + { + "epoch": 1.92, + "learning_rate": 1.2485840412047249e-05, + "loss": 0.0066, + "step": 739450 + }, + { + "epoch": 1.92, + "learning_rate": 1.2481952195675784e-05, + "loss": 0.0056, + "step": 739460 + }, + { + "epoch": 1.92, + "learning_rate": 1.2478063979304319e-05, + "loss": 0.006, + "step": 739470 + }, + { + "epoch": 1.92, + "learning_rate": 1.2474175762932855e-05, + "loss": 0.011, + "step": 739480 + }, + { + "epoch": 1.92, + "learning_rate": 1.247028754656139e-05, + "loss": 0.0113, + "step": 739490 + }, + { + "epoch": 1.92, + "learning_rate": 1.2466399330189926e-05, + "loss": 0.0085, + "step": 739500 + }, + { + "epoch": 1.92, + "learning_rate": 1.2462511113818461e-05, + "loss": 0.0062, + "step": 739510 + }, + { + "epoch": 1.92, + "learning_rate": 1.2458622897446995e-05, + "loss": 0.0049, + "step": 739520 + }, + { + "epoch": 1.92, + "learning_rate": 1.2454734681075531e-05, + "loss": 0.0071, + "step": 739530 + }, + { + "epoch": 1.92, + "learning_rate": 1.2450846464704066e-05, + "loss": 0.0066, + "step": 739540 + }, + { + "epoch": 1.92, + "learning_rate": 1.2446958248332602e-05, + "loss": 0.0071, + "step": 739550 + }, + { + "epoch": 1.92, + "learning_rate": 1.2443070031961137e-05, + "loss": 0.008, + "step": 739560 + }, + { + "epoch": 1.92, + "learning_rate": 1.2439181815589674e-05, + "loss": 0.0071, + "step": 739570 + }, + { + "epoch": 1.92, + "learning_rate": 1.2435293599218207e-05, + "loss": 0.0055, + "step": 739580 + }, + { + "epoch": 1.92, + "learning_rate": 1.2431405382846744e-05, + "loss": 0.007, + "step": 739590 + }, + { + "epoch": 1.92, + "learning_rate": 1.2427517166475278e-05, + "loss": 0.0085, + "step": 739600 + }, + { + "epoch": 1.92, + "learning_rate": 1.2423628950103815e-05, + "loss": 0.0078, + "step": 739610 + }, + { + "epoch": 1.92, + "learning_rate": 1.241974073373235e-05, + "loss": 0.0047, + "step": 739620 + }, + { + "epoch": 1.92, + "learning_rate": 1.2415852517360886e-05, + "loss": 0.0058, + "step": 739630 + }, + { + "epoch": 1.92, + "learning_rate": 1.241196430098942e-05, + "loss": 0.0073, + "step": 739640 + }, + { + "epoch": 1.92, + "learning_rate": 1.2408076084617954e-05, + "loss": 0.007, + "step": 739650 + }, + { + "epoch": 1.92, + "learning_rate": 1.2404187868246491e-05, + "loss": 0.0069, + "step": 739660 + }, + { + "epoch": 1.92, + "learning_rate": 1.2400299651875026e-05, + "loss": 0.0086, + "step": 739670 + }, + { + "epoch": 1.92, + "learning_rate": 1.2396411435503562e-05, + "loss": 0.0068, + "step": 739680 + }, + { + "epoch": 1.92, + "learning_rate": 1.2392523219132097e-05, + "loss": 0.0073, + "step": 739690 + }, + { + "epoch": 1.92, + "learning_rate": 1.2388635002760632e-05, + "loss": 0.0073, + "step": 739700 + }, + { + "epoch": 1.92, + "learning_rate": 1.2384746786389167e-05, + "loss": 0.0102, + "step": 739710 + }, + { + "epoch": 1.92, + "learning_rate": 1.2380858570017704e-05, + "loss": 0.0097, + "step": 739720 + }, + { + "epoch": 1.92, + "learning_rate": 1.2376970353646238e-05, + "loss": 0.0059, + "step": 739730 + }, + { + "epoch": 1.92, + "learning_rate": 1.2373082137274775e-05, + "loss": 0.0087, + "step": 739740 + }, + { + "epoch": 1.92, + "learning_rate": 1.236919392090331e-05, + "loss": 0.0047, + "step": 739750 + }, + { + "epoch": 1.92, + "learning_rate": 1.2365305704531846e-05, + "loss": 0.008, + "step": 739760 + }, + { + "epoch": 1.92, + "learning_rate": 1.236141748816038e-05, + "loss": 0.0064, + "step": 739770 + }, + { + "epoch": 1.92, + "learning_rate": 1.2357529271788914e-05, + "loss": 0.0076, + "step": 739780 + }, + { + "epoch": 1.92, + "learning_rate": 1.2353641055417451e-05, + "loss": 0.0084, + "step": 739790 + }, + { + "epoch": 1.92, + "learning_rate": 1.2349752839045986e-05, + "loss": 0.0101, + "step": 739800 + }, + { + "epoch": 1.92, + "learning_rate": 1.2345864622674522e-05, + "loss": 0.0068, + "step": 739810 + }, + { + "epoch": 1.92, + "learning_rate": 1.2341976406303057e-05, + "loss": 0.0079, + "step": 739820 + }, + { + "epoch": 1.92, + "learning_rate": 1.2338088189931592e-05, + "loss": 0.0061, + "step": 739830 + }, + { + "epoch": 1.92, + "learning_rate": 1.2334199973560127e-05, + "loss": 0.0098, + "step": 739840 + }, + { + "epoch": 1.92, + "learning_rate": 1.2330311757188664e-05, + "loss": 0.0068, + "step": 739850 + }, + { + "epoch": 1.92, + "learning_rate": 1.2326423540817198e-05, + "loss": 0.0077, + "step": 739860 + }, + { + "epoch": 1.92, + "learning_rate": 1.2322535324445735e-05, + "loss": 0.0094, + "step": 739870 + }, + { + "epoch": 1.92, + "learning_rate": 1.231864710807427e-05, + "loss": 0.0088, + "step": 739880 + }, + { + "epoch": 1.92, + "learning_rate": 1.2314758891702803e-05, + "loss": 0.0078, + "step": 739890 + }, + { + "epoch": 1.92, + "learning_rate": 1.231087067533134e-05, + "loss": 0.0069, + "step": 739900 + }, + { + "epoch": 1.92, + "learning_rate": 1.2306982458959874e-05, + "loss": 0.0081, + "step": 739910 + }, + { + "epoch": 1.92, + "learning_rate": 1.2303094242588411e-05, + "loss": 0.0067, + "step": 739920 + }, + { + "epoch": 1.92, + "learning_rate": 1.2299206026216946e-05, + "loss": 0.012, + "step": 739930 + }, + { + "epoch": 1.92, + "learning_rate": 1.2295317809845482e-05, + "loss": 0.0073, + "step": 739940 + }, + { + "epoch": 1.92, + "learning_rate": 1.2291429593474016e-05, + "loss": 0.008, + "step": 739950 + }, + { + "epoch": 1.92, + "learning_rate": 1.2287541377102552e-05, + "loss": 0.01, + "step": 739960 + }, + { + "epoch": 1.92, + "learning_rate": 1.2283653160731087e-05, + "loss": 0.0063, + "step": 739970 + }, + { + "epoch": 1.92, + "learning_rate": 1.2279764944359624e-05, + "loss": 0.0076, + "step": 739980 + }, + { + "epoch": 1.92, + "learning_rate": 1.2275876727988158e-05, + "loss": 0.0093, + "step": 739990 + }, + { + "epoch": 1.92, + "learning_rate": 1.2271988511616693e-05, + "loss": 0.0065, + "step": 740000 + }, + { + "epoch": 1.92, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.004454230424016714, + "eval_runtime": 108.0552, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 740000 + }, + { + "epoch": 1.92, + "learning_rate": 1.2268100295245228e-05, + "loss": 0.0118, + "step": 740010 + }, + { + "epoch": 1.92, + "learning_rate": 1.2264212078873763e-05, + "loss": 0.0093, + "step": 740020 + }, + { + "epoch": 1.92, + "learning_rate": 1.22603238625023e-05, + "loss": 0.0056, + "step": 740030 + }, + { + "epoch": 1.92, + "learning_rate": 1.2256435646130834e-05, + "loss": 0.0078, + "step": 740040 + }, + { + "epoch": 1.92, + "learning_rate": 1.2252547429759371e-05, + "loss": 0.0089, + "step": 740050 + }, + { + "epoch": 1.92, + "learning_rate": 1.2248659213387906e-05, + "loss": 0.0092, + "step": 740060 + }, + { + "epoch": 1.92, + "learning_rate": 1.2244770997016442e-05, + "loss": 0.0068, + "step": 740070 + }, + { + "epoch": 1.92, + "learning_rate": 1.2240882780644976e-05, + "loss": 0.0081, + "step": 740080 + }, + { + "epoch": 1.92, + "learning_rate": 1.223699456427351e-05, + "loss": 0.0106, + "step": 740090 + }, + { + "epoch": 1.92, + "learning_rate": 1.2233106347902047e-05, + "loss": 0.0077, + "step": 740100 + }, + { + "epoch": 1.92, + "learning_rate": 1.2229218131530582e-05, + "loss": 0.0112, + "step": 740110 + }, + { + "epoch": 1.92, + "learning_rate": 1.2225329915159118e-05, + "loss": 0.007, + "step": 740120 + }, + { + "epoch": 1.92, + "learning_rate": 1.2221441698787653e-05, + "loss": 0.0076, + "step": 740130 + }, + { + "epoch": 1.92, + "learning_rate": 1.2217553482416188e-05, + "loss": 0.0073, + "step": 740140 + }, + { + "epoch": 1.92, + "learning_rate": 1.2213665266044723e-05, + "loss": 0.0074, + "step": 740150 + }, + { + "epoch": 1.92, + "learning_rate": 1.220977704967326e-05, + "loss": 0.0052, + "step": 740160 + }, + { + "epoch": 1.92, + "learning_rate": 1.2205888833301794e-05, + "loss": 0.0072, + "step": 740170 + }, + { + "epoch": 1.92, + "learning_rate": 1.2202000616930331e-05, + "loss": 0.0088, + "step": 740180 + }, + { + "epoch": 1.92, + "learning_rate": 1.2198112400558866e-05, + "loss": 0.0068, + "step": 740190 + }, + { + "epoch": 1.92, + "learning_rate": 1.2194224184187399e-05, + "loss": 0.0069, + "step": 740200 + }, + { + "epoch": 1.92, + "learning_rate": 1.2190335967815936e-05, + "loss": 0.006, + "step": 740210 + }, + { + "epoch": 1.92, + "learning_rate": 1.218644775144447e-05, + "loss": 0.0067, + "step": 740220 + }, + { + "epoch": 1.92, + "learning_rate": 1.2182559535073007e-05, + "loss": 0.0068, + "step": 740230 + }, + { + "epoch": 1.92, + "learning_rate": 1.2178671318701542e-05, + "loss": 0.008, + "step": 740240 + }, + { + "epoch": 1.92, + "learning_rate": 1.2174783102330078e-05, + "loss": 0.0063, + "step": 740250 + }, + { + "epoch": 1.92, + "learning_rate": 1.2170894885958612e-05, + "loss": 0.0078, + "step": 740260 + }, + { + "epoch": 1.92, + "learning_rate": 1.2167006669587148e-05, + "loss": 0.0077, + "step": 740270 + }, + { + "epoch": 1.92, + "learning_rate": 1.2163118453215683e-05, + "loss": 0.0078, + "step": 740280 + }, + { + "epoch": 1.92, + "learning_rate": 1.215923023684422e-05, + "loss": 0.0066, + "step": 740290 + }, + { + "epoch": 1.92, + "learning_rate": 1.2155342020472754e-05, + "loss": 0.0071, + "step": 740300 + }, + { + "epoch": 1.92, + "learning_rate": 1.2151453804101291e-05, + "loss": 0.008, + "step": 740310 + }, + { + "epoch": 1.92, + "learning_rate": 1.2147565587729824e-05, + "loss": 0.0083, + "step": 740320 + }, + { + "epoch": 1.92, + "learning_rate": 1.2143677371358359e-05, + "loss": 0.0092, + "step": 740330 + }, + { + "epoch": 1.92, + "learning_rate": 1.2139789154986896e-05, + "loss": 0.008, + "step": 740340 + }, + { + "epoch": 1.92, + "learning_rate": 1.213590093861543e-05, + "loss": 0.0072, + "step": 740350 + }, + { + "epoch": 1.92, + "learning_rate": 1.2132012722243967e-05, + "loss": 0.005, + "step": 740360 + }, + { + "epoch": 1.92, + "learning_rate": 1.2128124505872502e-05, + "loss": 0.0059, + "step": 740370 + }, + { + "epoch": 1.92, + "learning_rate": 1.2124236289501038e-05, + "loss": 0.0063, + "step": 740380 + }, + { + "epoch": 1.92, + "learning_rate": 1.2120348073129572e-05, + "loss": 0.0077, + "step": 740390 + }, + { + "epoch": 1.92, + "learning_rate": 1.2116459856758108e-05, + "loss": 0.0077, + "step": 740400 + }, + { + "epoch": 1.92, + "learning_rate": 1.2112571640386643e-05, + "loss": 0.0051, + "step": 740410 + }, + { + "epoch": 1.92, + "learning_rate": 1.210868342401518e-05, + "loss": 0.0058, + "step": 740420 + }, + { + "epoch": 1.92, + "learning_rate": 1.2104795207643714e-05, + "loss": 0.0063, + "step": 740430 + }, + { + "epoch": 1.92, + "learning_rate": 1.2100906991272251e-05, + "loss": 0.0075, + "step": 740440 + }, + { + "epoch": 1.92, + "learning_rate": 1.2097018774900784e-05, + "loss": 0.0098, + "step": 740450 + }, + { + "epoch": 1.92, + "learning_rate": 1.2093130558529319e-05, + "loss": 0.0068, + "step": 740460 + }, + { + "epoch": 1.92, + "learning_rate": 1.2089242342157855e-05, + "loss": 0.0055, + "step": 740470 + }, + { + "epoch": 1.92, + "learning_rate": 1.208535412578639e-05, + "loss": 0.0092, + "step": 740480 + }, + { + "epoch": 1.92, + "learning_rate": 1.2081465909414927e-05, + "loss": 0.0082, + "step": 740490 + }, + { + "epoch": 1.92, + "learning_rate": 1.2077577693043462e-05, + "loss": 0.0085, + "step": 740500 + }, + { + "epoch": 1.92, + "learning_rate": 1.2073689476671997e-05, + "loss": 0.0056, + "step": 740510 + }, + { + "epoch": 1.92, + "learning_rate": 1.2069801260300531e-05, + "loss": 0.0086, + "step": 740520 + }, + { + "epoch": 1.92, + "learning_rate": 1.2065913043929068e-05, + "loss": 0.0088, + "step": 740530 + }, + { + "epoch": 1.92, + "learning_rate": 1.2062024827557603e-05, + "loss": 0.0076, + "step": 740540 + }, + { + "epoch": 1.92, + "learning_rate": 1.205813661118614e-05, + "loss": 0.0061, + "step": 740550 + }, + { + "epoch": 1.92, + "learning_rate": 1.2054248394814674e-05, + "loss": 0.0089, + "step": 740560 + }, + { + "epoch": 1.92, + "learning_rate": 1.2050360178443207e-05, + "loss": 0.0076, + "step": 740570 + }, + { + "epoch": 1.92, + "learning_rate": 1.2046471962071744e-05, + "loss": 0.013, + "step": 740580 + }, + { + "epoch": 1.92, + "learning_rate": 1.2042583745700279e-05, + "loss": 0.0074, + "step": 740590 + }, + { + "epoch": 1.92, + "learning_rate": 1.2038695529328815e-05, + "loss": 0.0069, + "step": 740600 + }, + { + "epoch": 1.92, + "learning_rate": 1.203480731295735e-05, + "loss": 0.0068, + "step": 740610 + }, + { + "epoch": 1.92, + "learning_rate": 1.2030919096585887e-05, + "loss": 0.0061, + "step": 740620 + }, + { + "epoch": 1.92, + "learning_rate": 1.202703088021442e-05, + "loss": 0.0101, + "step": 740630 + }, + { + "epoch": 1.92, + "learning_rate": 1.2023142663842957e-05, + "loss": 0.0053, + "step": 740640 + }, + { + "epoch": 1.92, + "learning_rate": 1.2019254447471491e-05, + "loss": 0.0066, + "step": 740650 + }, + { + "epoch": 1.92, + "learning_rate": 1.2015366231100028e-05, + "loss": 0.0073, + "step": 740660 + }, + { + "epoch": 1.92, + "learning_rate": 1.2011478014728563e-05, + "loss": 0.0058, + "step": 740670 + }, + { + "epoch": 1.92, + "learning_rate": 1.20075897983571e-05, + "loss": 0.0059, + "step": 740680 + }, + { + "epoch": 1.92, + "learning_rate": 1.2003701581985634e-05, + "loss": 0.0069, + "step": 740690 + }, + { + "epoch": 1.92, + "learning_rate": 1.1999813365614167e-05, + "loss": 0.0063, + "step": 740700 + }, + { + "epoch": 1.92, + "learning_rate": 1.1995925149242704e-05, + "loss": 0.005, + "step": 740710 + }, + { + "epoch": 1.92, + "learning_rate": 1.1992036932871239e-05, + "loss": 0.0074, + "step": 740720 + }, + { + "epoch": 1.92, + "learning_rate": 1.1988148716499775e-05, + "loss": 0.0068, + "step": 740730 + }, + { + "epoch": 1.92, + "learning_rate": 1.198426050012831e-05, + "loss": 0.0087, + "step": 740740 + }, + { + "epoch": 1.92, + "learning_rate": 1.1980372283756847e-05, + "loss": 0.0063, + "step": 740750 + }, + { + "epoch": 1.92, + "learning_rate": 1.197648406738538e-05, + "loss": 0.0073, + "step": 740760 + }, + { + "epoch": 1.92, + "learning_rate": 1.1972595851013915e-05, + "loss": 0.0105, + "step": 740770 + }, + { + "epoch": 1.92, + "learning_rate": 1.1968707634642451e-05, + "loss": 0.0087, + "step": 740780 + }, + { + "epoch": 1.92, + "learning_rate": 1.1964819418270986e-05, + "loss": 0.0072, + "step": 740790 + }, + { + "epoch": 1.92, + "learning_rate": 1.1960931201899523e-05, + "loss": 0.01, + "step": 740800 + }, + { + "epoch": 1.92, + "learning_rate": 1.1957042985528058e-05, + "loss": 0.0085, + "step": 740810 + }, + { + "epoch": 1.92, + "learning_rate": 1.1953154769156593e-05, + "loss": 0.0053, + "step": 740820 + }, + { + "epoch": 1.92, + "learning_rate": 1.1949266552785127e-05, + "loss": 0.0069, + "step": 740830 + }, + { + "epoch": 1.92, + "learning_rate": 1.1945378336413664e-05, + "loss": 0.0061, + "step": 740840 + }, + { + "epoch": 1.92, + "learning_rate": 1.1941490120042199e-05, + "loss": 0.0074, + "step": 740850 + }, + { + "epoch": 1.92, + "learning_rate": 1.1937601903670735e-05, + "loss": 0.0062, + "step": 740860 + }, + { + "epoch": 1.92, + "learning_rate": 1.193371368729927e-05, + "loss": 0.0061, + "step": 740870 + }, + { + "epoch": 1.92, + "learning_rate": 1.1929825470927803e-05, + "loss": 0.0075, + "step": 740880 + }, + { + "epoch": 1.92, + "learning_rate": 1.192593725455634e-05, + "loss": 0.0088, + "step": 740890 + }, + { + "epoch": 1.92, + "learning_rate": 1.1922049038184875e-05, + "loss": 0.0061, + "step": 740900 + }, + { + "epoch": 1.92, + "learning_rate": 1.1918160821813411e-05, + "loss": 0.0086, + "step": 740910 + }, + { + "epoch": 1.92, + "learning_rate": 1.1914272605441946e-05, + "loss": 0.0062, + "step": 740920 + }, + { + "epoch": 1.92, + "learning_rate": 1.1910384389070483e-05, + "loss": 0.0061, + "step": 740930 + }, + { + "epoch": 1.92, + "learning_rate": 1.1906496172699016e-05, + "loss": 0.0049, + "step": 740940 + }, + { + "epoch": 1.92, + "learning_rate": 1.1902607956327553e-05, + "loss": 0.0074, + "step": 740950 + }, + { + "epoch": 1.92, + "learning_rate": 1.1898719739956087e-05, + "loss": 0.0051, + "step": 740960 + }, + { + "epoch": 1.92, + "learning_rate": 1.1894831523584624e-05, + "loss": 0.0079, + "step": 740970 + }, + { + "epoch": 1.92, + "learning_rate": 1.1890943307213159e-05, + "loss": 0.0064, + "step": 740980 + }, + { + "epoch": 1.92, + "learning_rate": 1.1887055090841695e-05, + "loss": 0.0059, + "step": 740990 + }, + { + "epoch": 1.92, + "learning_rate": 1.188316687447023e-05, + "loss": 0.007, + "step": 741000 + }, + { + "epoch": 1.92, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.004421970807015896, + "eval_runtime": 108.0147, + "eval_samples_per_second": 18.516, + "eval_steps_per_second": 4.629, + "step": 741000 + }, + { + "epoch": 1.92, + "learning_rate": 1.1879278658098763e-05, + "loss": 0.0069, + "step": 741010 + }, + { + "epoch": 1.92, + "learning_rate": 1.18753904417273e-05, + "loss": 0.0086, + "step": 741020 + }, + { + "epoch": 1.92, + "learning_rate": 1.1871502225355835e-05, + "loss": 0.0042, + "step": 741030 + }, + { + "epoch": 1.92, + "learning_rate": 1.1867614008984371e-05, + "loss": 0.0071, + "step": 741040 + }, + { + "epoch": 1.92, + "learning_rate": 1.1863725792612906e-05, + "loss": 0.0065, + "step": 741050 + }, + { + "epoch": 1.92, + "learning_rate": 1.1859837576241443e-05, + "loss": 0.0078, + "step": 741060 + }, + { + "epoch": 1.92, + "learning_rate": 1.1855949359869976e-05, + "loss": 0.0062, + "step": 741070 + }, + { + "epoch": 1.92, + "learning_rate": 1.1852061143498513e-05, + "loss": 0.0057, + "step": 741080 + }, + { + "epoch": 1.92, + "learning_rate": 1.1848172927127047e-05, + "loss": 0.0049, + "step": 741090 + }, + { + "epoch": 1.92, + "learning_rate": 1.1844284710755584e-05, + "loss": 0.0052, + "step": 741100 + }, + { + "epoch": 1.92, + "learning_rate": 1.1840396494384119e-05, + "loss": 0.0056, + "step": 741110 + }, + { + "epoch": 1.92, + "learning_rate": 1.1836508278012655e-05, + "loss": 0.0058, + "step": 741120 + }, + { + "epoch": 1.92, + "learning_rate": 1.1832620061641189e-05, + "loss": 0.0068, + "step": 741130 + }, + { + "epoch": 1.92, + "learning_rate": 1.1828731845269723e-05, + "loss": 0.0067, + "step": 741140 + }, + { + "epoch": 1.92, + "learning_rate": 1.182484362889826e-05, + "loss": 0.0053, + "step": 741150 + }, + { + "epoch": 1.92, + "learning_rate": 1.1820955412526795e-05, + "loss": 0.0089, + "step": 741160 + }, + { + "epoch": 1.92, + "learning_rate": 1.1817067196155331e-05, + "loss": 0.0063, + "step": 741170 + }, + { + "epoch": 1.92, + "learning_rate": 1.1813178979783866e-05, + "loss": 0.0057, + "step": 741180 + }, + { + "epoch": 1.92, + "learning_rate": 1.1809290763412401e-05, + "loss": 0.0075, + "step": 741190 + }, + { + "epoch": 1.92, + "learning_rate": 1.1805402547040936e-05, + "loss": 0.0084, + "step": 741200 + }, + { + "epoch": 1.92, + "learning_rate": 1.1801514330669472e-05, + "loss": 0.0072, + "step": 741210 + }, + { + "epoch": 1.92, + "learning_rate": 1.1797626114298007e-05, + "loss": 0.0084, + "step": 741220 + }, + { + "epoch": 1.92, + "learning_rate": 1.1793737897926544e-05, + "loss": 0.0059, + "step": 741230 + }, + { + "epoch": 1.92, + "learning_rate": 1.1789849681555079e-05, + "loss": 0.0087, + "step": 741240 + }, + { + "epoch": 1.92, + "learning_rate": 1.1785961465183612e-05, + "loss": 0.0078, + "step": 741250 + }, + { + "epoch": 1.92, + "learning_rate": 1.1782073248812149e-05, + "loss": 0.006, + "step": 741260 + }, + { + "epoch": 1.92, + "learning_rate": 1.1778185032440683e-05, + "loss": 0.0056, + "step": 741270 + }, + { + "epoch": 1.92, + "learning_rate": 1.177429681606922e-05, + "loss": 0.0052, + "step": 741280 + }, + { + "epoch": 1.92, + "learning_rate": 1.1770408599697755e-05, + "loss": 0.0064, + "step": 741290 + }, + { + "epoch": 1.92, + "learning_rate": 1.1766520383326291e-05, + "loss": 0.0051, + "step": 741300 + }, + { + "epoch": 1.92, + "learning_rate": 1.1762632166954826e-05, + "loss": 0.0078, + "step": 741310 + }, + { + "epoch": 1.92, + "learning_rate": 1.1758743950583361e-05, + "loss": 0.0066, + "step": 741320 + }, + { + "epoch": 1.92, + "learning_rate": 1.1754855734211896e-05, + "loss": 0.01, + "step": 741330 + }, + { + "epoch": 1.92, + "learning_rate": 1.1750967517840432e-05, + "loss": 0.0062, + "step": 741340 + }, + { + "epoch": 1.92, + "learning_rate": 1.1747079301468967e-05, + "loss": 0.0049, + "step": 741350 + }, + { + "epoch": 1.92, + "learning_rate": 1.1743191085097504e-05, + "loss": 0.0069, + "step": 741360 + }, + { + "epoch": 1.92, + "learning_rate": 1.1739302868726039e-05, + "loss": 0.0097, + "step": 741370 + }, + { + "epoch": 1.92, + "learning_rate": 1.1735414652354572e-05, + "loss": 0.0052, + "step": 741380 + }, + { + "epoch": 1.92, + "learning_rate": 1.1731526435983108e-05, + "loss": 0.007, + "step": 741390 + }, + { + "epoch": 1.92, + "learning_rate": 1.1727638219611643e-05, + "loss": 0.0074, + "step": 741400 + }, + { + "epoch": 1.92, + "learning_rate": 1.172375000324018e-05, + "loss": 0.0082, + "step": 741410 + }, + { + "epoch": 1.92, + "learning_rate": 1.1719861786868715e-05, + "loss": 0.01, + "step": 741420 + }, + { + "epoch": 1.92, + "learning_rate": 1.1715973570497251e-05, + "loss": 0.0086, + "step": 741430 + }, + { + "epoch": 1.92, + "learning_rate": 1.1712085354125784e-05, + "loss": 0.0069, + "step": 741440 + }, + { + "epoch": 1.92, + "learning_rate": 1.170819713775432e-05, + "loss": 0.0065, + "step": 741450 + }, + { + "epoch": 1.92, + "learning_rate": 1.1704308921382856e-05, + "loss": 0.0063, + "step": 741460 + }, + { + "epoch": 1.92, + "learning_rate": 1.170042070501139e-05, + "loss": 0.0073, + "step": 741470 + }, + { + "epoch": 1.92, + "learning_rate": 1.1696532488639927e-05, + "loss": 0.0053, + "step": 741480 + }, + { + "epoch": 1.92, + "learning_rate": 1.1692644272268462e-05, + "loss": 0.0069, + "step": 741490 + }, + { + "epoch": 1.92, + "learning_rate": 1.1688756055896997e-05, + "loss": 0.0078, + "step": 741500 + }, + { + "epoch": 1.92, + "learning_rate": 1.1684867839525532e-05, + "loss": 0.0076, + "step": 741510 + }, + { + "epoch": 1.92, + "learning_rate": 1.1680979623154068e-05, + "loss": 0.0101, + "step": 741520 + }, + { + "epoch": 1.92, + "learning_rate": 1.1677091406782603e-05, + "loss": 0.0057, + "step": 741530 + }, + { + "epoch": 1.92, + "learning_rate": 1.167320319041114e-05, + "loss": 0.0083, + "step": 741540 + }, + { + "epoch": 1.92, + "learning_rate": 1.1669314974039675e-05, + "loss": 0.0063, + "step": 741550 + }, + { + "epoch": 1.92, + "learning_rate": 1.1665426757668208e-05, + "loss": 0.0051, + "step": 741560 + }, + { + "epoch": 1.92, + "learning_rate": 1.1661538541296744e-05, + "loss": 0.0079, + "step": 741570 + }, + { + "epoch": 1.92, + "learning_rate": 1.165765032492528e-05, + "loss": 0.0138, + "step": 741580 + }, + { + "epoch": 1.92, + "learning_rate": 1.1653762108553816e-05, + "loss": 0.0063, + "step": 741590 + }, + { + "epoch": 1.92, + "learning_rate": 1.164987389218235e-05, + "loss": 0.0049, + "step": 741600 + }, + { + "epoch": 1.92, + "learning_rate": 1.1645985675810887e-05, + "loss": 0.0048, + "step": 741610 + }, + { + "epoch": 1.92, + "learning_rate": 1.1642097459439422e-05, + "loss": 0.0092, + "step": 741620 + }, + { + "epoch": 1.92, + "learning_rate": 1.1638209243067957e-05, + "loss": 0.0066, + "step": 741630 + }, + { + "epoch": 1.92, + "learning_rate": 1.1634321026696492e-05, + "loss": 0.0073, + "step": 741640 + }, + { + "epoch": 1.92, + "learning_rate": 1.1630432810325028e-05, + "loss": 0.0055, + "step": 741650 + }, + { + "epoch": 1.92, + "learning_rate": 1.1626544593953563e-05, + "loss": 0.0076, + "step": 741660 + }, + { + "epoch": 1.92, + "learning_rate": 1.16226563775821e-05, + "loss": 0.0057, + "step": 741670 + }, + { + "epoch": 1.92, + "learning_rate": 1.1618768161210635e-05, + "loss": 0.0068, + "step": 741680 + }, + { + "epoch": 1.92, + "learning_rate": 1.1614879944839168e-05, + "loss": 0.0083, + "step": 741690 + }, + { + "epoch": 1.92, + "learning_rate": 1.1610991728467704e-05, + "loss": 0.0063, + "step": 741700 + }, + { + "epoch": 1.92, + "learning_rate": 1.160710351209624e-05, + "loss": 0.0109, + "step": 741710 + }, + { + "epoch": 1.92, + "learning_rate": 1.1603215295724776e-05, + "loss": 0.0086, + "step": 741720 + }, + { + "epoch": 1.92, + "learning_rate": 1.159932707935331e-05, + "loss": 0.0051, + "step": 741730 + }, + { + "epoch": 1.92, + "learning_rate": 1.1595438862981847e-05, + "loss": 0.0041, + "step": 741740 + }, + { + "epoch": 1.92, + "learning_rate": 1.159155064661038e-05, + "loss": 0.0065, + "step": 741750 + }, + { + "epoch": 1.92, + "learning_rate": 1.1587662430238917e-05, + "loss": 0.0049, + "step": 741760 + }, + { + "epoch": 1.92, + "learning_rate": 1.1583774213867452e-05, + "loss": 0.0073, + "step": 741770 + }, + { + "epoch": 1.92, + "learning_rate": 1.1579885997495988e-05, + "loss": 0.0064, + "step": 741780 + }, + { + "epoch": 1.92, + "learning_rate": 1.1575997781124523e-05, + "loss": 0.0072, + "step": 741790 + }, + { + "epoch": 1.92, + "learning_rate": 1.157210956475306e-05, + "loss": 0.0088, + "step": 741800 + }, + { + "epoch": 1.92, + "learning_rate": 1.1568221348381593e-05, + "loss": 0.0071, + "step": 741810 + }, + { + "epoch": 1.92, + "learning_rate": 1.1564333132010128e-05, + "loss": 0.0069, + "step": 741820 + }, + { + "epoch": 1.92, + "learning_rate": 1.1560444915638664e-05, + "loss": 0.007, + "step": 741830 + }, + { + "epoch": 1.92, + "learning_rate": 1.15565566992672e-05, + "loss": 0.007, + "step": 741840 + }, + { + "epoch": 1.92, + "learning_rate": 1.1552668482895736e-05, + "loss": 0.0081, + "step": 741850 + }, + { + "epoch": 1.92, + "learning_rate": 1.154878026652427e-05, + "loss": 0.0096, + "step": 741860 + }, + { + "epoch": 1.92, + "learning_rate": 1.1544892050152806e-05, + "loss": 0.0087, + "step": 741870 + }, + { + "epoch": 1.92, + "learning_rate": 1.154100383378134e-05, + "loss": 0.0069, + "step": 741880 + }, + { + "epoch": 1.92, + "learning_rate": 1.1537115617409877e-05, + "loss": 0.0054, + "step": 741890 + }, + { + "epoch": 1.92, + "learning_rate": 1.1533227401038412e-05, + "loss": 0.0071, + "step": 741900 + }, + { + "epoch": 1.92, + "learning_rate": 1.1529339184666948e-05, + "loss": 0.0058, + "step": 741910 + }, + { + "epoch": 1.92, + "learning_rate": 1.1525450968295483e-05, + "loss": 0.0069, + "step": 741920 + }, + { + "epoch": 1.92, + "learning_rate": 1.152156275192402e-05, + "loss": 0.0066, + "step": 741930 + }, + { + "epoch": 1.92, + "learning_rate": 1.1517674535552553e-05, + "loss": 0.0053, + "step": 741940 + }, + { + "epoch": 1.92, + "learning_rate": 1.1513786319181088e-05, + "loss": 0.0086, + "step": 741950 + }, + { + "epoch": 1.92, + "learning_rate": 1.1509898102809624e-05, + "loss": 0.0102, + "step": 741960 + }, + { + "epoch": 1.92, + "learning_rate": 1.150600988643816e-05, + "loss": 0.0057, + "step": 741970 + }, + { + "epoch": 1.92, + "learning_rate": 1.1502121670066696e-05, + "loss": 0.0072, + "step": 741980 + }, + { + "epoch": 1.92, + "learning_rate": 1.149823345369523e-05, + "loss": 0.008, + "step": 741990 + }, + { + "epoch": 1.92, + "learning_rate": 1.1494345237323766e-05, + "loss": 0.0085, + "step": 742000 + }, + { + "epoch": 1.92, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.004464298021048307, + "eval_runtime": 107.8257, + "eval_samples_per_second": 18.548, + "eval_steps_per_second": 4.637, + "step": 742000 + }, + { + "epoch": 1.92, + "learning_rate": 1.14904570209523e-05, + "loss": 0.0036, + "step": 742010 + }, + { + "epoch": 1.92, + "learning_rate": 1.1486568804580837e-05, + "loss": 0.0067, + "step": 742020 + }, + { + "epoch": 1.92, + "learning_rate": 1.1482680588209372e-05, + "loss": 0.0072, + "step": 742030 + }, + { + "epoch": 1.92, + "learning_rate": 1.1478792371837908e-05, + "loss": 0.0057, + "step": 742040 + }, + { + "epoch": 1.92, + "learning_rate": 1.1474904155466443e-05, + "loss": 0.0089, + "step": 742050 + }, + { + "epoch": 1.92, + "learning_rate": 1.1471015939094976e-05, + "loss": 0.0065, + "step": 742060 + }, + { + "epoch": 1.92, + "learning_rate": 1.1467127722723513e-05, + "loss": 0.0066, + "step": 742070 + }, + { + "epoch": 1.92, + "learning_rate": 1.1463239506352048e-05, + "loss": 0.0072, + "step": 742080 + }, + { + "epoch": 1.92, + "learning_rate": 1.1459351289980584e-05, + "loss": 0.0094, + "step": 742090 + }, + { + "epoch": 1.92, + "learning_rate": 1.145546307360912e-05, + "loss": 0.0061, + "step": 742100 + }, + { + "epoch": 1.92, + "learning_rate": 1.1451574857237656e-05, + "loss": 0.0069, + "step": 742110 + }, + { + "epoch": 1.92, + "learning_rate": 1.1447686640866189e-05, + "loss": 0.0057, + "step": 742120 + }, + { + "epoch": 1.92, + "learning_rate": 1.1443798424494724e-05, + "loss": 0.0067, + "step": 742130 + }, + { + "epoch": 1.92, + "learning_rate": 1.143991020812326e-05, + "loss": 0.0063, + "step": 742140 + }, + { + "epoch": 1.92, + "learning_rate": 1.1436021991751795e-05, + "loss": 0.0079, + "step": 742150 + }, + { + "epoch": 1.92, + "learning_rate": 1.1432133775380332e-05, + "loss": 0.0063, + "step": 742160 + }, + { + "epoch": 1.92, + "learning_rate": 1.1428245559008867e-05, + "loss": 0.0062, + "step": 742170 + }, + { + "epoch": 1.92, + "learning_rate": 1.1424357342637401e-05, + "loss": 0.0073, + "step": 742180 + }, + { + "epoch": 1.92, + "learning_rate": 1.1420469126265936e-05, + "loss": 0.0075, + "step": 742190 + }, + { + "epoch": 1.92, + "learning_rate": 1.1416580909894473e-05, + "loss": 0.0056, + "step": 742200 + }, + { + "epoch": 1.92, + "learning_rate": 1.1412692693523008e-05, + "loss": 0.0095, + "step": 742210 + }, + { + "epoch": 1.92, + "learning_rate": 1.1408804477151544e-05, + "loss": 0.0079, + "step": 742220 + }, + { + "epoch": 1.92, + "learning_rate": 1.140491626078008e-05, + "loss": 0.0041, + "step": 742230 + }, + { + "epoch": 1.92, + "learning_rate": 1.1401028044408616e-05, + "loss": 0.008, + "step": 742240 + }, + { + "epoch": 1.92, + "learning_rate": 1.1397139828037149e-05, + "loss": 0.0063, + "step": 742250 + }, + { + "epoch": 1.92, + "learning_rate": 1.1393251611665684e-05, + "loss": 0.0097, + "step": 742260 + }, + { + "epoch": 1.92, + "learning_rate": 1.138936339529422e-05, + "loss": 0.0087, + "step": 742270 + }, + { + "epoch": 1.92, + "learning_rate": 1.1385475178922755e-05, + "loss": 0.0097, + "step": 742280 + }, + { + "epoch": 1.92, + "learning_rate": 1.1381586962551292e-05, + "loss": 0.0069, + "step": 742290 + }, + { + "epoch": 1.92, + "learning_rate": 1.1377698746179827e-05, + "loss": 0.0051, + "step": 742300 + }, + { + "epoch": 1.92, + "learning_rate": 1.1373810529808361e-05, + "loss": 0.0085, + "step": 742310 + }, + { + "epoch": 1.92, + "learning_rate": 1.1369922313436896e-05, + "loss": 0.0088, + "step": 742320 + }, + { + "epoch": 1.92, + "learning_rate": 1.1366034097065433e-05, + "loss": 0.0054, + "step": 742330 + }, + { + "epoch": 1.92, + "learning_rate": 1.1362145880693968e-05, + "loss": 0.0074, + "step": 742340 + }, + { + "epoch": 1.92, + "learning_rate": 1.1358257664322504e-05, + "loss": 0.0081, + "step": 742350 + }, + { + "epoch": 1.92, + "learning_rate": 1.135436944795104e-05, + "loss": 0.0059, + "step": 742360 + }, + { + "epoch": 1.92, + "learning_rate": 1.1350481231579572e-05, + "loss": 0.0072, + "step": 742370 + }, + { + "epoch": 1.92, + "learning_rate": 1.1346593015208109e-05, + "loss": 0.0085, + "step": 742380 + }, + { + "epoch": 1.92, + "learning_rate": 1.1342704798836644e-05, + "loss": 0.0073, + "step": 742390 + }, + { + "epoch": 1.92, + "learning_rate": 1.133881658246518e-05, + "loss": 0.0072, + "step": 742400 + }, + { + "epoch": 1.92, + "learning_rate": 1.1334928366093715e-05, + "loss": 0.0067, + "step": 742410 + }, + { + "epoch": 1.92, + "learning_rate": 1.1331040149722252e-05, + "loss": 0.0071, + "step": 742420 + }, + { + "epoch": 1.92, + "learning_rate": 1.1327151933350785e-05, + "loss": 0.0071, + "step": 742430 + }, + { + "epoch": 1.92, + "learning_rate": 1.1323263716979321e-05, + "loss": 0.0062, + "step": 742440 + }, + { + "epoch": 1.92, + "learning_rate": 1.1319375500607856e-05, + "loss": 0.0047, + "step": 742450 + }, + { + "epoch": 1.92, + "learning_rate": 1.1315487284236393e-05, + "loss": 0.0052, + "step": 742460 + }, + { + "epoch": 1.92, + "learning_rate": 1.1311599067864928e-05, + "loss": 0.0077, + "step": 742470 + }, + { + "epoch": 1.92, + "learning_rate": 1.1307710851493464e-05, + "loss": 0.0077, + "step": 742480 + }, + { + "epoch": 1.92, + "learning_rate": 1.1303822635121999e-05, + "loss": 0.0061, + "step": 742490 + }, + { + "epoch": 1.92, + "learning_rate": 1.1299934418750532e-05, + "loss": 0.006, + "step": 742500 + }, + { + "epoch": 1.92, + "learning_rate": 1.1296046202379069e-05, + "loss": 0.0052, + "step": 742510 + }, + { + "epoch": 1.92, + "learning_rate": 1.1292157986007604e-05, + "loss": 0.0063, + "step": 742520 + }, + { + "epoch": 1.92, + "learning_rate": 1.128826976963614e-05, + "loss": 0.0074, + "step": 742530 + }, + { + "epoch": 1.92, + "learning_rate": 1.1284381553264675e-05, + "loss": 0.0086, + "step": 742540 + }, + { + "epoch": 1.92, + "learning_rate": 1.1280493336893212e-05, + "loss": 0.0094, + "step": 742550 + }, + { + "epoch": 1.92, + "learning_rate": 1.1276605120521745e-05, + "loss": 0.0112, + "step": 742560 + }, + { + "epoch": 1.92, + "learning_rate": 1.1272716904150281e-05, + "loss": 0.0074, + "step": 742570 + }, + { + "epoch": 1.92, + "learning_rate": 1.1268828687778816e-05, + "loss": 0.0069, + "step": 742580 + }, + { + "epoch": 1.92, + "learning_rate": 1.1264940471407353e-05, + "loss": 0.0083, + "step": 742590 + }, + { + "epoch": 1.92, + "learning_rate": 1.1261052255035888e-05, + "loss": 0.0063, + "step": 742600 + }, + { + "epoch": 1.92, + "learning_rate": 1.1257164038664424e-05, + "loss": 0.0072, + "step": 742610 + }, + { + "epoch": 1.92, + "learning_rate": 1.1253275822292957e-05, + "loss": 0.0053, + "step": 742620 + }, + { + "epoch": 1.93, + "learning_rate": 1.1249387605921492e-05, + "loss": 0.0058, + "step": 742630 + }, + { + "epoch": 1.93, + "learning_rate": 1.1245499389550029e-05, + "loss": 0.006, + "step": 742640 + }, + { + "epoch": 1.93, + "learning_rate": 1.1241611173178564e-05, + "loss": 0.0077, + "step": 742650 + }, + { + "epoch": 1.93, + "learning_rate": 1.12377229568071e-05, + "loss": 0.0066, + "step": 742660 + }, + { + "epoch": 1.93, + "learning_rate": 1.1233834740435635e-05, + "loss": 0.0076, + "step": 742670 + }, + { + "epoch": 1.93, + "learning_rate": 1.122994652406417e-05, + "loss": 0.0075, + "step": 742680 + }, + { + "epoch": 1.93, + "learning_rate": 1.1226058307692705e-05, + "loss": 0.007, + "step": 742690 + }, + { + "epoch": 1.93, + "learning_rate": 1.1222170091321241e-05, + "loss": 0.0062, + "step": 742700 + }, + { + "epoch": 1.93, + "learning_rate": 1.1218281874949776e-05, + "loss": 0.006, + "step": 742710 + }, + { + "epoch": 1.93, + "learning_rate": 1.1214393658578313e-05, + "loss": 0.0084, + "step": 742720 + }, + { + "epoch": 1.93, + "learning_rate": 1.1210505442206848e-05, + "loss": 0.0071, + "step": 742730 + }, + { + "epoch": 1.93, + "learning_rate": 1.1206617225835381e-05, + "loss": 0.007, + "step": 742740 + }, + { + "epoch": 1.93, + "learning_rate": 1.1202729009463917e-05, + "loss": 0.0075, + "step": 742750 + }, + { + "epoch": 1.93, + "learning_rate": 1.1198840793092452e-05, + "loss": 0.0089, + "step": 742760 + }, + { + "epoch": 1.93, + "learning_rate": 1.1194952576720989e-05, + "loss": 0.0078, + "step": 742770 + }, + { + "epoch": 1.93, + "learning_rate": 1.1191064360349524e-05, + "loss": 0.0059, + "step": 742780 + }, + { + "epoch": 1.93, + "learning_rate": 1.118717614397806e-05, + "loss": 0.0069, + "step": 742790 + }, + { + "epoch": 1.93, + "learning_rate": 1.1183287927606595e-05, + "loss": 0.0084, + "step": 742800 + }, + { + "epoch": 1.93, + "learning_rate": 1.117939971123513e-05, + "loss": 0.0047, + "step": 742810 + }, + { + "epoch": 1.93, + "learning_rate": 1.1175511494863665e-05, + "loss": 0.0078, + "step": 742820 + }, + { + "epoch": 1.93, + "learning_rate": 1.11716232784922e-05, + "loss": 0.0057, + "step": 742830 + }, + { + "epoch": 1.93, + "learning_rate": 1.1167735062120736e-05, + "loss": 0.0093, + "step": 742840 + }, + { + "epoch": 1.93, + "learning_rate": 1.1163846845749271e-05, + "loss": 0.0044, + "step": 742850 + }, + { + "epoch": 1.93, + "learning_rate": 1.1159958629377808e-05, + "loss": 0.0078, + "step": 742860 + }, + { + "epoch": 1.93, + "learning_rate": 1.115607041300634e-05, + "loss": 0.0064, + "step": 742870 + }, + { + "epoch": 1.93, + "learning_rate": 1.1152182196634877e-05, + "loss": 0.0072, + "step": 742880 + }, + { + "epoch": 1.93, + "learning_rate": 1.1148293980263412e-05, + "loss": 0.0059, + "step": 742890 + }, + { + "epoch": 1.93, + "learning_rate": 1.1144405763891949e-05, + "loss": 0.0078, + "step": 742900 + }, + { + "epoch": 1.93, + "learning_rate": 1.1140517547520484e-05, + "loss": 0.0085, + "step": 742910 + }, + { + "epoch": 1.93, + "learning_rate": 1.113662933114902e-05, + "loss": 0.0068, + "step": 742920 + }, + { + "epoch": 1.93, + "learning_rate": 1.1132741114777553e-05, + "loss": 0.0048, + "step": 742930 + }, + { + "epoch": 1.93, + "learning_rate": 1.1128852898406088e-05, + "loss": 0.0079, + "step": 742940 + }, + { + "epoch": 1.93, + "learning_rate": 1.1124964682034625e-05, + "loss": 0.0074, + "step": 742950 + }, + { + "epoch": 1.93, + "learning_rate": 1.112107646566316e-05, + "loss": 0.0072, + "step": 742960 + }, + { + "epoch": 1.93, + "learning_rate": 1.1117188249291696e-05, + "loss": 0.0067, + "step": 742970 + }, + { + "epoch": 1.93, + "learning_rate": 1.1113300032920231e-05, + "loss": 0.0064, + "step": 742980 + }, + { + "epoch": 1.93, + "learning_rate": 1.1109411816548766e-05, + "loss": 0.0061, + "step": 742990 + }, + { + "epoch": 1.93, + "learning_rate": 1.11055236001773e-05, + "loss": 0.0076, + "step": 743000 + }, + { + "epoch": 1.93, + "eval_cer": 0.8816606972151424, + "eval_loss": 0.004454338923096657, + "eval_runtime": 107.8248, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 743000 + }, + { + "epoch": 1.93, + "learning_rate": 1.1101635383805837e-05, + "loss": 0.0086, + "step": 743010 + }, + { + "epoch": 1.93, + "learning_rate": 1.1097747167434372e-05, + "loss": 0.005, + "step": 743020 + }, + { + "epoch": 1.93, + "learning_rate": 1.1093858951062909e-05, + "loss": 0.0075, + "step": 743030 + }, + { + "epoch": 1.93, + "learning_rate": 1.1089970734691444e-05, + "loss": 0.0053, + "step": 743040 + }, + { + "epoch": 1.93, + "learning_rate": 1.1086082518319977e-05, + "loss": 0.0062, + "step": 743050 + }, + { + "epoch": 1.93, + "learning_rate": 1.1082194301948513e-05, + "loss": 0.0068, + "step": 743060 + }, + { + "epoch": 1.93, + "learning_rate": 1.1078306085577048e-05, + "loss": 0.0076, + "step": 743070 + }, + { + "epoch": 1.93, + "learning_rate": 1.1074417869205585e-05, + "loss": 0.008, + "step": 743080 + }, + { + "epoch": 1.93, + "learning_rate": 1.107052965283412e-05, + "loss": 0.0071, + "step": 743090 + }, + { + "epoch": 1.93, + "learning_rate": 1.1066641436462656e-05, + "loss": 0.0063, + "step": 743100 + }, + { + "epoch": 1.93, + "learning_rate": 1.1062753220091191e-05, + "loss": 0.0072, + "step": 743110 + }, + { + "epoch": 1.93, + "learning_rate": 1.1058865003719726e-05, + "loss": 0.0119, + "step": 743120 + }, + { + "epoch": 1.93, + "learning_rate": 1.105497678734826e-05, + "loss": 0.0075, + "step": 743130 + }, + { + "epoch": 1.93, + "learning_rate": 1.1051088570976797e-05, + "loss": 0.0077, + "step": 743140 + }, + { + "epoch": 1.93, + "learning_rate": 1.1047200354605332e-05, + "loss": 0.0123, + "step": 743150 + }, + { + "epoch": 1.93, + "learning_rate": 1.1043312138233869e-05, + "loss": 0.0074, + "step": 743160 + }, + { + "epoch": 1.93, + "learning_rate": 1.1039423921862404e-05, + "loss": 0.0073, + "step": 743170 + }, + { + "epoch": 1.93, + "learning_rate": 1.1035535705490937e-05, + "loss": 0.0061, + "step": 743180 + }, + { + "epoch": 1.93, + "learning_rate": 1.1031647489119473e-05, + "loss": 0.0068, + "step": 743190 + }, + { + "epoch": 1.93, + "learning_rate": 1.1027759272748008e-05, + "loss": 0.0086, + "step": 743200 + }, + { + "epoch": 1.93, + "learning_rate": 1.1023871056376545e-05, + "loss": 0.0057, + "step": 743210 + }, + { + "epoch": 1.93, + "learning_rate": 1.101998284000508e-05, + "loss": 0.0056, + "step": 743220 + }, + { + "epoch": 1.93, + "learning_rate": 1.1016094623633616e-05, + "loss": 0.0061, + "step": 743230 + }, + { + "epoch": 1.93, + "learning_rate": 1.101220640726215e-05, + "loss": 0.0053, + "step": 743240 + }, + { + "epoch": 1.93, + "learning_rate": 1.1008318190890686e-05, + "loss": 0.0081, + "step": 743250 + }, + { + "epoch": 1.93, + "learning_rate": 1.100442997451922e-05, + "loss": 0.0086, + "step": 743260 + }, + { + "epoch": 1.93, + "learning_rate": 1.1000541758147757e-05, + "loss": 0.0057, + "step": 743270 + }, + { + "epoch": 1.93, + "learning_rate": 1.0996653541776292e-05, + "loss": 0.0081, + "step": 743280 + }, + { + "epoch": 1.93, + "learning_rate": 1.0992765325404829e-05, + "loss": 0.0086, + "step": 743290 + }, + { + "epoch": 1.93, + "learning_rate": 1.0988877109033362e-05, + "loss": 0.0091, + "step": 743300 + }, + { + "epoch": 1.93, + "learning_rate": 1.0984988892661897e-05, + "loss": 0.0065, + "step": 743310 + }, + { + "epoch": 1.93, + "learning_rate": 1.0981100676290433e-05, + "loss": 0.0083, + "step": 743320 + }, + { + "epoch": 1.93, + "learning_rate": 1.0977212459918968e-05, + "loss": 0.0141, + "step": 743330 + }, + { + "epoch": 1.93, + "learning_rate": 1.0973324243547505e-05, + "loss": 0.0064, + "step": 743340 + }, + { + "epoch": 1.93, + "learning_rate": 1.096943602717604e-05, + "loss": 0.0073, + "step": 743350 + }, + { + "epoch": 1.93, + "learning_rate": 1.0965547810804574e-05, + "loss": 0.0061, + "step": 743360 + }, + { + "epoch": 1.93, + "learning_rate": 1.096165959443311e-05, + "loss": 0.006, + "step": 743370 + }, + { + "epoch": 1.93, + "learning_rate": 1.0957771378061646e-05, + "loss": 0.0057, + "step": 743380 + }, + { + "epoch": 1.93, + "learning_rate": 1.095388316169018e-05, + "loss": 0.0056, + "step": 743390 + }, + { + "epoch": 1.93, + "learning_rate": 1.0949994945318717e-05, + "loss": 0.0069, + "step": 743400 + }, + { + "epoch": 1.93, + "learning_rate": 1.0946106728947252e-05, + "loss": 0.0079, + "step": 743410 + }, + { + "epoch": 1.93, + "learning_rate": 1.0942218512575789e-05, + "loss": 0.0071, + "step": 743420 + }, + { + "epoch": 1.93, + "learning_rate": 1.0938330296204322e-05, + "loss": 0.0052, + "step": 743430 + }, + { + "epoch": 1.93, + "learning_rate": 1.0934442079832857e-05, + "loss": 0.0066, + "step": 743440 + }, + { + "epoch": 1.93, + "learning_rate": 1.0930553863461393e-05, + "loss": 0.0071, + "step": 743450 + }, + { + "epoch": 1.93, + "learning_rate": 1.0926665647089928e-05, + "loss": 0.0059, + "step": 743460 + }, + { + "epoch": 1.93, + "learning_rate": 1.0922777430718465e-05, + "loss": 0.0069, + "step": 743470 + }, + { + "epoch": 1.93, + "learning_rate": 1.0918889214347e-05, + "loss": 0.0066, + "step": 743480 + }, + { + "epoch": 1.93, + "learning_rate": 1.0915000997975534e-05, + "loss": 0.0069, + "step": 743490 + }, + { + "epoch": 1.93, + "learning_rate": 1.091111278160407e-05, + "loss": 0.009, + "step": 743500 + }, + { + "epoch": 1.93, + "learning_rate": 1.0907224565232604e-05, + "loss": 0.0092, + "step": 743510 + }, + { + "epoch": 1.93, + "learning_rate": 1.090333634886114e-05, + "loss": 0.0033, + "step": 743520 + }, + { + "epoch": 1.93, + "learning_rate": 1.0899448132489676e-05, + "loss": 0.0076, + "step": 743530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0895559916118212e-05, + "loss": 0.006, + "step": 743540 + }, + { + "epoch": 1.93, + "learning_rate": 1.0891671699746745e-05, + "loss": 0.006, + "step": 743550 + }, + { + "epoch": 1.93, + "learning_rate": 1.0887783483375282e-05, + "loss": 0.006, + "step": 743560 + }, + { + "epoch": 1.93, + "learning_rate": 1.0883895267003817e-05, + "loss": 0.0115, + "step": 743570 + }, + { + "epoch": 1.93, + "learning_rate": 1.0880007050632353e-05, + "loss": 0.0071, + "step": 743580 + }, + { + "epoch": 1.93, + "learning_rate": 1.0876118834260888e-05, + "loss": 0.0052, + "step": 743590 + }, + { + "epoch": 1.93, + "learning_rate": 1.0872230617889425e-05, + "loss": 0.0066, + "step": 743600 + }, + { + "epoch": 1.93, + "learning_rate": 1.0868342401517958e-05, + "loss": 0.0059, + "step": 743610 + }, + { + "epoch": 1.93, + "learning_rate": 1.0864454185146493e-05, + "loss": 0.0067, + "step": 743620 + }, + { + "epoch": 1.93, + "learning_rate": 1.086056596877503e-05, + "loss": 0.0059, + "step": 743630 + }, + { + "epoch": 1.93, + "learning_rate": 1.0856677752403564e-05, + "loss": 0.0083, + "step": 743640 + }, + { + "epoch": 1.93, + "learning_rate": 1.08527895360321e-05, + "loss": 0.0063, + "step": 743650 + }, + { + "epoch": 1.93, + "learning_rate": 1.0848901319660636e-05, + "loss": 0.0086, + "step": 743660 + }, + { + "epoch": 1.93, + "learning_rate": 1.084501310328917e-05, + "loss": 0.0075, + "step": 743670 + }, + { + "epoch": 1.93, + "learning_rate": 1.0841124886917705e-05, + "loss": 0.0066, + "step": 743680 + }, + { + "epoch": 1.93, + "learning_rate": 1.0837236670546242e-05, + "loss": 0.0057, + "step": 743690 + }, + { + "epoch": 1.93, + "learning_rate": 1.0833348454174777e-05, + "loss": 0.007, + "step": 743700 + }, + { + "epoch": 1.93, + "learning_rate": 1.0829460237803313e-05, + "loss": 0.0064, + "step": 743710 + }, + { + "epoch": 1.93, + "learning_rate": 1.0825572021431848e-05, + "loss": 0.0055, + "step": 743720 + }, + { + "epoch": 1.93, + "learning_rate": 1.0821683805060385e-05, + "loss": 0.0053, + "step": 743730 + }, + { + "epoch": 1.93, + "learning_rate": 1.0817795588688918e-05, + "loss": 0.0061, + "step": 743740 + }, + { + "epoch": 1.93, + "learning_rate": 1.0813907372317453e-05, + "loss": 0.0078, + "step": 743750 + }, + { + "epoch": 1.93, + "learning_rate": 1.081001915594599e-05, + "loss": 0.0076, + "step": 743760 + }, + { + "epoch": 1.93, + "learning_rate": 1.0806130939574524e-05, + "loss": 0.0081, + "step": 743770 + }, + { + "epoch": 1.93, + "learning_rate": 1.080224272320306e-05, + "loss": 0.01, + "step": 743780 + }, + { + "epoch": 1.93, + "learning_rate": 1.0798354506831596e-05, + "loss": 0.0073, + "step": 743790 + }, + { + "epoch": 1.93, + "learning_rate": 1.079446629046013e-05, + "loss": 0.0062, + "step": 743800 + }, + { + "epoch": 1.93, + "learning_rate": 1.0790578074088665e-05, + "loss": 0.006, + "step": 743810 + }, + { + "epoch": 1.93, + "learning_rate": 1.0786689857717202e-05, + "loss": 0.006, + "step": 743820 + }, + { + "epoch": 1.93, + "learning_rate": 1.0782801641345737e-05, + "loss": 0.0072, + "step": 743830 + }, + { + "epoch": 1.93, + "learning_rate": 1.0778913424974273e-05, + "loss": 0.0078, + "step": 743840 + }, + { + "epoch": 1.93, + "learning_rate": 1.0775025208602808e-05, + "loss": 0.0063, + "step": 743850 + }, + { + "epoch": 1.93, + "learning_rate": 1.0771136992231341e-05, + "loss": 0.0084, + "step": 743860 + }, + { + "epoch": 1.93, + "learning_rate": 1.0767248775859878e-05, + "loss": 0.007, + "step": 743870 + }, + { + "epoch": 1.93, + "learning_rate": 1.0763360559488413e-05, + "loss": 0.0089, + "step": 743880 + }, + { + "epoch": 1.93, + "learning_rate": 1.075947234311695e-05, + "loss": 0.0052, + "step": 743890 + }, + { + "epoch": 1.93, + "learning_rate": 1.0755584126745484e-05, + "loss": 0.0068, + "step": 743900 + }, + { + "epoch": 1.93, + "learning_rate": 1.075169591037402e-05, + "loss": 0.0054, + "step": 743910 + }, + { + "epoch": 1.93, + "learning_rate": 1.0747807694002554e-05, + "loss": 0.0049, + "step": 743920 + }, + { + "epoch": 1.93, + "learning_rate": 1.074391947763109e-05, + "loss": 0.0051, + "step": 743930 + }, + { + "epoch": 1.93, + "learning_rate": 1.0740031261259625e-05, + "loss": 0.0078, + "step": 743940 + }, + { + "epoch": 1.93, + "learning_rate": 1.0736143044888162e-05, + "loss": 0.0085, + "step": 743950 + }, + { + "epoch": 1.93, + "learning_rate": 1.0732254828516697e-05, + "loss": 0.0064, + "step": 743960 + }, + { + "epoch": 1.93, + "learning_rate": 1.0728366612145233e-05, + "loss": 0.0071, + "step": 743970 + }, + { + "epoch": 1.93, + "learning_rate": 1.0724478395773766e-05, + "loss": 0.0062, + "step": 743980 + }, + { + "epoch": 1.93, + "learning_rate": 1.0720590179402301e-05, + "loss": 0.0072, + "step": 743990 + }, + { + "epoch": 1.93, + "learning_rate": 1.0716701963030838e-05, + "loss": 0.0062, + "step": 744000 + }, + { + "epoch": 1.93, + "eval_cer": 0.8816704946736816, + "eval_loss": 0.0045136138796806335, + "eval_runtime": 107.8856, + "eval_samples_per_second": 18.538, + "eval_steps_per_second": 4.635, + "step": 744000 + }, + { + "epoch": 1.93, + "learning_rate": 1.0712813746659373e-05, + "loss": 0.0057, + "step": 744010 + }, + { + "epoch": 1.93, + "learning_rate": 1.070892553028791e-05, + "loss": 0.0105, + "step": 744020 + }, + { + "epoch": 1.93, + "learning_rate": 1.0705037313916444e-05, + "loss": 0.0097, + "step": 744030 + }, + { + "epoch": 1.93, + "learning_rate": 1.070114909754498e-05, + "loss": 0.0081, + "step": 744040 + }, + { + "epoch": 1.93, + "learning_rate": 1.0697260881173514e-05, + "loss": 0.0055, + "step": 744050 + }, + { + "epoch": 1.93, + "learning_rate": 1.069337266480205e-05, + "loss": 0.01, + "step": 744060 + }, + { + "epoch": 1.93, + "learning_rate": 1.0689484448430585e-05, + "loss": 0.0062, + "step": 744070 + }, + { + "epoch": 1.93, + "learning_rate": 1.0685596232059122e-05, + "loss": 0.0064, + "step": 744080 + }, + { + "epoch": 1.93, + "learning_rate": 1.0681708015687657e-05, + "loss": 0.0051, + "step": 744090 + }, + { + "epoch": 1.93, + "learning_rate": 1.0677819799316193e-05, + "loss": 0.0069, + "step": 744100 + }, + { + "epoch": 1.93, + "learning_rate": 1.0673931582944726e-05, + "loss": 0.0062, + "step": 744110 + }, + { + "epoch": 1.93, + "learning_rate": 1.0670043366573261e-05, + "loss": 0.0046, + "step": 744120 + }, + { + "epoch": 1.93, + "learning_rate": 1.0666155150201798e-05, + "loss": 0.0063, + "step": 744130 + }, + { + "epoch": 1.93, + "learning_rate": 1.0662266933830333e-05, + "loss": 0.0068, + "step": 744140 + }, + { + "epoch": 1.93, + "learning_rate": 1.065837871745887e-05, + "loss": 0.0072, + "step": 744150 + }, + { + "epoch": 1.93, + "learning_rate": 1.0654490501087404e-05, + "loss": 0.0083, + "step": 744160 + }, + { + "epoch": 1.93, + "learning_rate": 1.0650602284715939e-05, + "loss": 0.0061, + "step": 744170 + }, + { + "epoch": 1.93, + "learning_rate": 1.0646714068344474e-05, + "loss": 0.0062, + "step": 744180 + }, + { + "epoch": 1.93, + "learning_rate": 1.064282585197301e-05, + "loss": 0.0078, + "step": 744190 + }, + { + "epoch": 1.93, + "learning_rate": 1.0638937635601545e-05, + "loss": 0.0075, + "step": 744200 + }, + { + "epoch": 1.93, + "learning_rate": 1.063504941923008e-05, + "loss": 0.007, + "step": 744210 + }, + { + "epoch": 1.93, + "learning_rate": 1.0631161202858617e-05, + "loss": 0.0091, + "step": 744220 + }, + { + "epoch": 1.93, + "learning_rate": 1.062727298648715e-05, + "loss": 0.0072, + "step": 744230 + }, + { + "epoch": 1.93, + "learning_rate": 1.0623384770115686e-05, + "loss": 0.0113, + "step": 744240 + }, + { + "epoch": 1.93, + "learning_rate": 1.0619496553744221e-05, + "loss": 0.0072, + "step": 744250 + }, + { + "epoch": 1.93, + "learning_rate": 1.0615608337372758e-05, + "loss": 0.006, + "step": 744260 + }, + { + "epoch": 1.93, + "learning_rate": 1.0611720121001293e-05, + "loss": 0.0076, + "step": 744270 + }, + { + "epoch": 1.93, + "learning_rate": 1.0607831904629829e-05, + "loss": 0.0052, + "step": 744280 + }, + { + "epoch": 1.93, + "learning_rate": 1.0603943688258362e-05, + "loss": 0.0083, + "step": 744290 + }, + { + "epoch": 1.93, + "learning_rate": 1.0600055471886897e-05, + "loss": 0.0078, + "step": 744300 + }, + { + "epoch": 1.93, + "learning_rate": 1.0596167255515434e-05, + "loss": 0.0063, + "step": 744310 + }, + { + "epoch": 1.93, + "learning_rate": 1.0592279039143969e-05, + "loss": 0.0095, + "step": 744320 + }, + { + "epoch": 1.93, + "learning_rate": 1.0588390822772505e-05, + "loss": 0.0071, + "step": 744330 + }, + { + "epoch": 1.93, + "learning_rate": 1.058450260640104e-05, + "loss": 0.0068, + "step": 744340 + }, + { + "epoch": 1.93, + "learning_rate": 1.0580614390029577e-05, + "loss": 0.004, + "step": 744350 + }, + { + "epoch": 1.93, + "learning_rate": 1.057672617365811e-05, + "loss": 0.0055, + "step": 744360 + }, + { + "epoch": 1.93, + "learning_rate": 1.0572837957286646e-05, + "loss": 0.0052, + "step": 744370 + }, + { + "epoch": 1.93, + "learning_rate": 1.0568949740915181e-05, + "loss": 0.0054, + "step": 744380 + }, + { + "epoch": 1.93, + "learning_rate": 1.0565061524543718e-05, + "loss": 0.0094, + "step": 744390 + }, + { + "epoch": 1.93, + "learning_rate": 1.0561173308172253e-05, + "loss": 0.0095, + "step": 744400 + }, + { + "epoch": 1.93, + "learning_rate": 1.0557285091800789e-05, + "loss": 0.0084, + "step": 744410 + }, + { + "epoch": 1.93, + "learning_rate": 1.0553396875429322e-05, + "loss": 0.0078, + "step": 744420 + }, + { + "epoch": 1.93, + "learning_rate": 1.0549508659057857e-05, + "loss": 0.0059, + "step": 744430 + }, + { + "epoch": 1.93, + "learning_rate": 1.0545620442686394e-05, + "loss": 0.0076, + "step": 744440 + }, + { + "epoch": 1.93, + "learning_rate": 1.0541732226314929e-05, + "loss": 0.0073, + "step": 744450 + }, + { + "epoch": 1.93, + "learning_rate": 1.0537844009943465e-05, + "loss": 0.0054, + "step": 744460 + }, + { + "epoch": 1.93, + "learning_rate": 1.0533955793572e-05, + "loss": 0.0072, + "step": 744470 + }, + { + "epoch": 1.93, + "learning_rate": 1.0530067577200535e-05, + "loss": 0.0095, + "step": 744480 + }, + { + "epoch": 1.93, + "learning_rate": 1.052617936082907e-05, + "loss": 0.008, + "step": 744490 + }, + { + "epoch": 1.93, + "learning_rate": 1.0522291144457606e-05, + "loss": 0.0078, + "step": 744500 + }, + { + "epoch": 1.93, + "learning_rate": 1.0518402928086141e-05, + "loss": 0.0045, + "step": 744510 + }, + { + "epoch": 1.93, + "learning_rate": 1.0514514711714678e-05, + "loss": 0.0075, + "step": 744520 + }, + { + "epoch": 1.93, + "learning_rate": 1.0510626495343213e-05, + "loss": 0.0075, + "step": 744530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0506738278971746e-05, + "loss": 0.0098, + "step": 744540 + }, + { + "epoch": 1.93, + "learning_rate": 1.0502850062600282e-05, + "loss": 0.0074, + "step": 744550 + }, + { + "epoch": 1.93, + "learning_rate": 1.0498961846228817e-05, + "loss": 0.0074, + "step": 744560 + }, + { + "epoch": 1.93, + "learning_rate": 1.0495073629857354e-05, + "loss": 0.0099, + "step": 744570 + }, + { + "epoch": 1.93, + "learning_rate": 1.0491185413485889e-05, + "loss": 0.009, + "step": 744580 + }, + { + "epoch": 1.93, + "learning_rate": 1.0487297197114425e-05, + "loss": 0.0054, + "step": 744590 + }, + { + "epoch": 1.93, + "learning_rate": 1.0483408980742958e-05, + "loss": 0.0064, + "step": 744600 + }, + { + "epoch": 1.93, + "learning_rate": 1.0479520764371495e-05, + "loss": 0.0095, + "step": 744610 + }, + { + "epoch": 1.93, + "learning_rate": 1.047563254800003e-05, + "loss": 0.0074, + "step": 744620 + }, + { + "epoch": 1.93, + "learning_rate": 1.0471744331628566e-05, + "loss": 0.0065, + "step": 744630 + }, + { + "epoch": 1.93, + "learning_rate": 1.0467856115257101e-05, + "loss": 0.0072, + "step": 744640 + }, + { + "epoch": 1.93, + "learning_rate": 1.0463967898885638e-05, + "loss": 0.0072, + "step": 744650 + }, + { + "epoch": 1.93, + "learning_rate": 1.0460079682514173e-05, + "loss": 0.0075, + "step": 744660 + }, + { + "epoch": 1.93, + "learning_rate": 1.0456191466142706e-05, + "loss": 0.0075, + "step": 744670 + }, + { + "epoch": 1.93, + "learning_rate": 1.0452303249771242e-05, + "loss": 0.0066, + "step": 744680 + }, + { + "epoch": 1.93, + "learning_rate": 1.0448415033399777e-05, + "loss": 0.0063, + "step": 744690 + }, + { + "epoch": 1.93, + "learning_rate": 1.0444526817028314e-05, + "loss": 0.0058, + "step": 744700 + }, + { + "epoch": 1.93, + "learning_rate": 1.0440638600656849e-05, + "loss": 0.0066, + "step": 744710 + }, + { + "epoch": 1.93, + "learning_rate": 1.0436750384285385e-05, + "loss": 0.009, + "step": 744720 + }, + { + "epoch": 1.93, + "learning_rate": 1.0432862167913918e-05, + "loss": 0.0064, + "step": 744730 + }, + { + "epoch": 1.93, + "learning_rate": 1.0428973951542455e-05, + "loss": 0.0067, + "step": 744740 + }, + { + "epoch": 1.93, + "learning_rate": 1.042508573517099e-05, + "loss": 0.0058, + "step": 744750 + }, + { + "epoch": 1.93, + "learning_rate": 1.0421197518799526e-05, + "loss": 0.0054, + "step": 744760 + }, + { + "epoch": 1.93, + "learning_rate": 1.0417309302428061e-05, + "loss": 0.0059, + "step": 744770 + }, + { + "epoch": 1.93, + "learning_rate": 1.0413421086056598e-05, + "loss": 0.0053, + "step": 744780 + }, + { + "epoch": 1.93, + "learning_rate": 1.040953286968513e-05, + "loss": 0.0068, + "step": 744790 + }, + { + "epoch": 1.93, + "learning_rate": 1.0405644653313666e-05, + "loss": 0.0064, + "step": 744800 + }, + { + "epoch": 1.93, + "learning_rate": 1.0401756436942202e-05, + "loss": 0.0066, + "step": 744810 + }, + { + "epoch": 1.93, + "learning_rate": 1.0397868220570737e-05, + "loss": 0.0051, + "step": 744820 + }, + { + "epoch": 1.93, + "learning_rate": 1.0393980004199274e-05, + "loss": 0.0066, + "step": 744830 + }, + { + "epoch": 1.93, + "learning_rate": 1.0390091787827808e-05, + "loss": 0.0068, + "step": 744840 + }, + { + "epoch": 1.93, + "learning_rate": 1.0386203571456343e-05, + "loss": 0.0059, + "step": 744850 + }, + { + "epoch": 1.93, + "learning_rate": 1.0382315355084878e-05, + "loss": 0.0071, + "step": 744860 + }, + { + "epoch": 1.93, + "learning_rate": 1.0378427138713415e-05, + "loss": 0.0071, + "step": 744870 + }, + { + "epoch": 1.93, + "learning_rate": 1.037453892234195e-05, + "loss": 0.0061, + "step": 744880 + }, + { + "epoch": 1.93, + "learning_rate": 1.0370650705970484e-05, + "loss": 0.0059, + "step": 744890 + }, + { + "epoch": 1.93, + "learning_rate": 1.0366762489599021e-05, + "loss": 0.0071, + "step": 744900 + }, + { + "epoch": 1.93, + "learning_rate": 1.0362874273227554e-05, + "loss": 0.0079, + "step": 744910 + }, + { + "epoch": 1.93, + "learning_rate": 1.035898605685609e-05, + "loss": 0.0069, + "step": 744920 + }, + { + "epoch": 1.93, + "learning_rate": 1.0355097840484626e-05, + "loss": 0.0056, + "step": 744930 + }, + { + "epoch": 1.93, + "learning_rate": 1.0351209624113162e-05, + "loss": 0.0048, + "step": 744940 + }, + { + "epoch": 1.93, + "learning_rate": 1.0347321407741697e-05, + "loss": 0.0074, + "step": 744950 + }, + { + "epoch": 1.93, + "learning_rate": 1.0343433191370234e-05, + "loss": 0.0054, + "step": 744960 + }, + { + "epoch": 1.93, + "learning_rate": 1.0339544974998768e-05, + "loss": 0.0064, + "step": 744970 + }, + { + "epoch": 1.93, + "learning_rate": 1.0335656758627302e-05, + "loss": 0.0092, + "step": 744980 + }, + { + "epoch": 1.93, + "learning_rate": 1.0331768542255838e-05, + "loss": 0.0072, + "step": 744990 + }, + { + "epoch": 1.93, + "learning_rate": 1.0327880325884373e-05, + "loss": 0.0089, + "step": 745000 + }, + { + "epoch": 1.93, + "eval_cer": 0.8816620968520765, + "eval_loss": 0.0044491966255009174, + "eval_runtime": 107.8288, + "eval_samples_per_second": 18.548, + "eval_steps_per_second": 4.637, + "step": 745000 + }, + { + "epoch": 1.93, + "learning_rate": 1.032399210951291e-05, + "loss": 0.0082, + "step": 745010 + }, + { + "epoch": 1.93, + "learning_rate": 1.0320103893141444e-05, + "loss": 0.0073, + "step": 745020 + }, + { + "epoch": 1.93, + "learning_rate": 1.0316215676769981e-05, + "loss": 0.0064, + "step": 745030 + }, + { + "epoch": 1.93, + "learning_rate": 1.0312327460398514e-05, + "loss": 0.0047, + "step": 745040 + }, + { + "epoch": 1.93, + "learning_rate": 1.030843924402705e-05, + "loss": 0.0069, + "step": 745050 + }, + { + "epoch": 1.93, + "learning_rate": 1.0304551027655586e-05, + "loss": 0.007, + "step": 745060 + }, + { + "epoch": 1.93, + "learning_rate": 1.0300662811284122e-05, + "loss": 0.0083, + "step": 745070 + }, + { + "epoch": 1.93, + "learning_rate": 1.0296774594912657e-05, + "loss": 0.0086, + "step": 745080 + }, + { + "epoch": 1.93, + "learning_rate": 1.0292886378541194e-05, + "loss": 0.007, + "step": 745090 + }, + { + "epoch": 1.93, + "learning_rate": 1.0288998162169727e-05, + "loss": 0.0079, + "step": 745100 + }, + { + "epoch": 1.93, + "learning_rate": 1.0285109945798262e-05, + "loss": 0.0069, + "step": 745110 + }, + { + "epoch": 1.93, + "learning_rate": 1.0281221729426798e-05, + "loss": 0.0062, + "step": 745120 + }, + { + "epoch": 1.93, + "learning_rate": 1.0277333513055333e-05, + "loss": 0.0048, + "step": 745130 + }, + { + "epoch": 1.93, + "learning_rate": 1.027344529668387e-05, + "loss": 0.006, + "step": 745140 + }, + { + "epoch": 1.93, + "learning_rate": 1.0269557080312404e-05, + "loss": 0.0075, + "step": 745150 + }, + { + "epoch": 1.93, + "learning_rate": 1.026566886394094e-05, + "loss": 0.0087, + "step": 745160 + }, + { + "epoch": 1.93, + "learning_rate": 1.0261780647569474e-05, + "loss": 0.0104, + "step": 745170 + }, + { + "epoch": 1.93, + "learning_rate": 1.025789243119801e-05, + "loss": 0.007, + "step": 745180 + }, + { + "epoch": 1.93, + "learning_rate": 1.0254004214826546e-05, + "loss": 0.0054, + "step": 745190 + }, + { + "epoch": 1.93, + "learning_rate": 1.0250115998455082e-05, + "loss": 0.0078, + "step": 745200 + }, + { + "epoch": 1.93, + "learning_rate": 1.0246227782083617e-05, + "loss": 0.0059, + "step": 745210 + }, + { + "epoch": 1.93, + "learning_rate": 1.024233956571215e-05, + "loss": 0.0088, + "step": 745220 + }, + { + "epoch": 1.93, + "learning_rate": 1.0238451349340687e-05, + "loss": 0.008, + "step": 745230 + }, + { + "epoch": 1.93, + "learning_rate": 1.0234563132969222e-05, + "loss": 0.0075, + "step": 745240 + }, + { + "epoch": 1.93, + "learning_rate": 1.0230674916597758e-05, + "loss": 0.0077, + "step": 745250 + }, + { + "epoch": 1.93, + "learning_rate": 1.0226786700226293e-05, + "loss": 0.0063, + "step": 745260 + }, + { + "epoch": 1.93, + "learning_rate": 1.022289848385483e-05, + "loss": 0.0122, + "step": 745270 + }, + { + "epoch": 1.93, + "learning_rate": 1.0219010267483364e-05, + "loss": 0.0063, + "step": 745280 + }, + { + "epoch": 1.93, + "learning_rate": 1.02151220511119e-05, + "loss": 0.0076, + "step": 745290 + }, + { + "epoch": 1.93, + "learning_rate": 1.0211233834740434e-05, + "loss": 0.0049, + "step": 745300 + }, + { + "epoch": 1.93, + "learning_rate": 1.020734561836897e-05, + "loss": 0.0075, + "step": 745310 + }, + { + "epoch": 1.93, + "learning_rate": 1.0203457401997506e-05, + "loss": 0.0056, + "step": 745320 + }, + { + "epoch": 1.93, + "learning_rate": 1.0199569185626042e-05, + "loss": 0.008, + "step": 745330 + }, + { + "epoch": 1.93, + "learning_rate": 1.0195680969254577e-05, + "loss": 0.0074, + "step": 745340 + }, + { + "epoch": 1.93, + "learning_rate": 1.019179275288311e-05, + "loss": 0.0076, + "step": 745350 + }, + { + "epoch": 1.93, + "learning_rate": 1.0187904536511647e-05, + "loss": 0.005, + "step": 745360 + }, + { + "epoch": 1.93, + "learning_rate": 1.0184016320140182e-05, + "loss": 0.0087, + "step": 745370 + }, + { + "epoch": 1.93, + "learning_rate": 1.0180128103768718e-05, + "loss": 0.0068, + "step": 745380 + }, + { + "epoch": 1.93, + "learning_rate": 1.0176239887397253e-05, + "loss": 0.0081, + "step": 745390 + }, + { + "epoch": 1.93, + "learning_rate": 1.017235167102579e-05, + "loss": 0.007, + "step": 745400 + }, + { + "epoch": 1.93, + "learning_rate": 1.0168463454654323e-05, + "loss": 0.0064, + "step": 745410 + }, + { + "epoch": 1.93, + "learning_rate": 1.016457523828286e-05, + "loss": 0.0076, + "step": 745420 + }, + { + "epoch": 1.93, + "learning_rate": 1.0160687021911394e-05, + "loss": 0.0112, + "step": 745430 + }, + { + "epoch": 1.93, + "learning_rate": 1.015679880553993e-05, + "loss": 0.0083, + "step": 745440 + }, + { + "epoch": 1.93, + "learning_rate": 1.0152910589168466e-05, + "loss": 0.0088, + "step": 745450 + }, + { + "epoch": 1.93, + "learning_rate": 1.0149022372797002e-05, + "loss": 0.0073, + "step": 745460 + }, + { + "epoch": 1.93, + "learning_rate": 1.0145134156425535e-05, + "loss": 0.005, + "step": 745470 + }, + { + "epoch": 1.93, + "learning_rate": 1.014124594005407e-05, + "loss": 0.007, + "step": 745480 + }, + { + "epoch": 1.93, + "learning_rate": 1.0137357723682607e-05, + "loss": 0.0051, + "step": 745490 + }, + { + "epoch": 1.93, + "learning_rate": 1.0133469507311142e-05, + "loss": 0.0094, + "step": 745500 + }, + { + "epoch": 1.93, + "learning_rate": 1.0129581290939678e-05, + "loss": 0.008, + "step": 745510 + }, + { + "epoch": 1.93, + "learning_rate": 1.0125693074568213e-05, + "loss": 0.0062, + "step": 745520 + }, + { + "epoch": 1.93, + "learning_rate": 1.0121804858196748e-05, + "loss": 0.0059, + "step": 745530 + }, + { + "epoch": 1.93, + "learning_rate": 1.0117916641825283e-05, + "loss": 0.0078, + "step": 745540 + }, + { + "epoch": 1.93, + "learning_rate": 1.011402842545382e-05, + "loss": 0.0057, + "step": 745550 + }, + { + "epoch": 1.93, + "learning_rate": 1.0110140209082354e-05, + "loss": 0.0053, + "step": 745560 + }, + { + "epoch": 1.93, + "learning_rate": 1.010625199271089e-05, + "loss": 0.0051, + "step": 745570 + }, + { + "epoch": 1.93, + "learning_rate": 1.0102363776339426e-05, + "loss": 0.008, + "step": 745580 + }, + { + "epoch": 1.93, + "learning_rate": 1.009847555996796e-05, + "loss": 0.0074, + "step": 745590 + }, + { + "epoch": 1.93, + "learning_rate": 1.0094587343596495e-05, + "loss": 0.0079, + "step": 745600 + }, + { + "epoch": 1.93, + "learning_rate": 1.009069912722503e-05, + "loss": 0.0078, + "step": 745610 + }, + { + "epoch": 1.93, + "learning_rate": 1.0086810910853567e-05, + "loss": 0.006, + "step": 745620 + }, + { + "epoch": 1.93, + "learning_rate": 1.0082922694482102e-05, + "loss": 0.0073, + "step": 745630 + }, + { + "epoch": 1.93, + "learning_rate": 1.0079034478110638e-05, + "loss": 0.0059, + "step": 745640 + }, + { + "epoch": 1.93, + "learning_rate": 1.0075146261739173e-05, + "loss": 0.0099, + "step": 745650 + }, + { + "epoch": 1.93, + "learning_rate": 1.0071258045367706e-05, + "loss": 0.0047, + "step": 745660 + }, + { + "epoch": 1.93, + "learning_rate": 1.0067369828996243e-05, + "loss": 0.0059, + "step": 745670 + }, + { + "epoch": 1.93, + "learning_rate": 1.0063481612624778e-05, + "loss": 0.0077, + "step": 745680 + }, + { + "epoch": 1.93, + "learning_rate": 1.0059593396253314e-05, + "loss": 0.0068, + "step": 745690 + }, + { + "epoch": 1.93, + "learning_rate": 1.0055705179881849e-05, + "loss": 0.0078, + "step": 745700 + }, + { + "epoch": 1.93, + "learning_rate": 1.0051816963510385e-05, + "loss": 0.0076, + "step": 745710 + }, + { + "epoch": 1.93, + "learning_rate": 1.0047928747138919e-05, + "loss": 0.0067, + "step": 745720 + }, + { + "epoch": 1.93, + "learning_rate": 1.0044040530767455e-05, + "loss": 0.0072, + "step": 745730 + }, + { + "epoch": 1.93, + "learning_rate": 1.004015231439599e-05, + "loss": 0.006, + "step": 745740 + }, + { + "epoch": 1.93, + "learning_rate": 1.0036264098024527e-05, + "loss": 0.0058, + "step": 745750 + }, + { + "epoch": 1.93, + "learning_rate": 1.0032375881653061e-05, + "loss": 0.0047, + "step": 745760 + }, + { + "epoch": 1.93, + "learning_rate": 1.0028487665281598e-05, + "loss": 0.0062, + "step": 745770 + }, + { + "epoch": 1.93, + "learning_rate": 1.0024599448910131e-05, + "loss": 0.0119, + "step": 745780 + }, + { + "epoch": 1.93, + "learning_rate": 1.0020711232538666e-05, + "loss": 0.0061, + "step": 745790 + }, + { + "epoch": 1.93, + "learning_rate": 1.0016823016167203e-05, + "loss": 0.009, + "step": 745800 + }, + { + "epoch": 1.93, + "learning_rate": 1.0012934799795737e-05, + "loss": 0.004, + "step": 745810 + }, + { + "epoch": 1.93, + "learning_rate": 1.0009046583424274e-05, + "loss": 0.0068, + "step": 745820 + }, + { + "epoch": 1.93, + "learning_rate": 1.0005158367052809e-05, + "loss": 0.0066, + "step": 745830 + }, + { + "epoch": 1.93, + "learning_rate": 1.0001270150681344e-05, + "loss": 0.0059, + "step": 745840 + }, + { + "epoch": 1.93, + "learning_rate": 9.997381934309879e-06, + "loss": 0.0071, + "step": 745850 + }, + { + "epoch": 1.93, + "learning_rate": 9.993493717938415e-06, + "loss": 0.0057, + "step": 745860 + }, + { + "epoch": 1.93, + "learning_rate": 9.98960550156695e-06, + "loss": 0.0103, + "step": 745870 + }, + { + "epoch": 1.93, + "learning_rate": 9.985717285195487e-06, + "loss": 0.0073, + "step": 745880 + }, + { + "epoch": 1.93, + "learning_rate": 9.981829068824021e-06, + "loss": 0.0093, + "step": 745890 + }, + { + "epoch": 1.93, + "learning_rate": 9.977940852452558e-06, + "loss": 0.007, + "step": 745900 + }, + { + "epoch": 1.93, + "learning_rate": 9.974052636081091e-06, + "loss": 0.009, + "step": 745910 + }, + { + "epoch": 1.93, + "learning_rate": 9.970164419709626e-06, + "loss": 0.008, + "step": 745920 + }, + { + "epoch": 1.93, + "learning_rate": 9.966276203338163e-06, + "loss": 0.0082, + "step": 745930 + }, + { + "epoch": 1.93, + "learning_rate": 9.962387986966697e-06, + "loss": 0.0066, + "step": 745940 + }, + { + "epoch": 1.93, + "learning_rate": 9.958499770595234e-06, + "loss": 0.0061, + "step": 745950 + }, + { + "epoch": 1.93, + "learning_rate": 9.954611554223769e-06, + "loss": 0.0054, + "step": 745960 + }, + { + "epoch": 1.93, + "learning_rate": 9.950723337852304e-06, + "loss": 0.0055, + "step": 745970 + }, + { + "epoch": 1.93, + "learning_rate": 9.946835121480839e-06, + "loss": 0.0091, + "step": 745980 + }, + { + "epoch": 1.93, + "learning_rate": 9.942946905109375e-06, + "loss": 0.0091, + "step": 745990 + }, + { + "epoch": 1.93, + "learning_rate": 9.93905868873791e-06, + "loss": 0.0067, + "step": 746000 + }, + { + "epoch": 1.93, + "eval_cer": 0.8816802921322209, + "eval_loss": 0.004460540134459734, + "eval_runtime": 107.8774, + "eval_samples_per_second": 18.54, + "eval_steps_per_second": 4.635, + "step": 746000 + }, + { + "epoch": 1.93, + "learning_rate": 9.935170472366447e-06, + "loss": 0.006, + "step": 746010 + }, + { + "epoch": 1.93, + "learning_rate": 9.931282255994981e-06, + "loss": 0.0063, + "step": 746020 + }, + { + "epoch": 1.93, + "learning_rate": 9.927394039623515e-06, + "loss": 0.0051, + "step": 746030 + }, + { + "epoch": 1.93, + "learning_rate": 9.923505823252051e-06, + "loss": 0.0071, + "step": 746040 + }, + { + "epoch": 1.93, + "learning_rate": 9.919617606880586e-06, + "loss": 0.0056, + "step": 746050 + }, + { + "epoch": 1.93, + "learning_rate": 9.915729390509123e-06, + "loss": 0.0052, + "step": 746060 + }, + { + "epoch": 1.93, + "learning_rate": 9.911841174137657e-06, + "loss": 0.0068, + "step": 746070 + }, + { + "epoch": 1.93, + "learning_rate": 9.907952957766194e-06, + "loss": 0.0074, + "step": 746080 + }, + { + "epoch": 1.93, + "learning_rate": 9.904064741394727e-06, + "loss": 0.0048, + "step": 746090 + }, + { + "epoch": 1.93, + "learning_rate": 9.900176525023264e-06, + "loss": 0.0074, + "step": 746100 + }, + { + "epoch": 1.93, + "learning_rate": 9.896288308651799e-06, + "loss": 0.0055, + "step": 746110 + }, + { + "epoch": 1.93, + "learning_rate": 9.892400092280335e-06, + "loss": 0.0046, + "step": 746120 + }, + { + "epoch": 1.93, + "learning_rate": 9.88851187590887e-06, + "loss": 0.0057, + "step": 746130 + }, + { + "epoch": 1.93, + "learning_rate": 9.884623659537407e-06, + "loss": 0.0089, + "step": 746140 + }, + { + "epoch": 1.93, + "learning_rate": 9.88073544316594e-06, + "loss": 0.0096, + "step": 746150 + }, + { + "epoch": 1.93, + "learning_rate": 9.876847226794475e-06, + "loss": 0.008, + "step": 746160 + }, + { + "epoch": 1.93, + "learning_rate": 9.872959010423011e-06, + "loss": 0.0114, + "step": 746170 + }, + { + "epoch": 1.93, + "learning_rate": 9.869070794051546e-06, + "loss": 0.0065, + "step": 746180 + }, + { + "epoch": 1.93, + "learning_rate": 9.865182577680083e-06, + "loss": 0.0072, + "step": 746190 + }, + { + "epoch": 1.93, + "learning_rate": 9.861294361308617e-06, + "loss": 0.0087, + "step": 746200 + }, + { + "epoch": 1.93, + "learning_rate": 9.857406144937154e-06, + "loss": 0.0061, + "step": 746210 + }, + { + "epoch": 1.93, + "learning_rate": 9.853517928565687e-06, + "loss": 0.0055, + "step": 746220 + }, + { + "epoch": 1.93, + "learning_rate": 9.849629712194224e-06, + "loss": 0.0096, + "step": 746230 + }, + { + "epoch": 1.93, + "learning_rate": 9.845741495822759e-06, + "loss": 0.0054, + "step": 746240 + }, + { + "epoch": 1.93, + "learning_rate": 9.841853279451295e-06, + "loss": 0.01, + "step": 746250 + }, + { + "epoch": 1.93, + "learning_rate": 9.83796506307983e-06, + "loss": 0.0056, + "step": 746260 + }, + { + "epoch": 1.93, + "learning_rate": 9.834076846708365e-06, + "loss": 0.007, + "step": 746270 + }, + { + "epoch": 1.93, + "learning_rate": 9.8301886303369e-06, + "loss": 0.0062, + "step": 746280 + }, + { + "epoch": 1.93, + "learning_rate": 9.826300413965435e-06, + "loss": 0.0081, + "step": 746290 + }, + { + "epoch": 1.93, + "learning_rate": 9.822412197593971e-06, + "loss": 0.0092, + "step": 746300 + }, + { + "epoch": 1.93, + "learning_rate": 9.818523981222506e-06, + "loss": 0.0095, + "step": 746310 + }, + { + "epoch": 1.93, + "learning_rate": 9.814635764851043e-06, + "loss": 0.0099, + "step": 746320 + }, + { + "epoch": 1.93, + "learning_rate": 9.810747548479577e-06, + "loss": 0.0058, + "step": 746330 + }, + { + "epoch": 1.93, + "learning_rate": 9.80685933210811e-06, + "loss": 0.0079, + "step": 746340 + }, + { + "epoch": 1.93, + "learning_rate": 9.802971115736647e-06, + "loss": 0.007, + "step": 746350 + }, + { + "epoch": 1.93, + "learning_rate": 9.799082899365182e-06, + "loss": 0.0077, + "step": 746360 + }, + { + "epoch": 1.93, + "learning_rate": 9.795194682993719e-06, + "loss": 0.005, + "step": 746370 + }, + { + "epoch": 1.93, + "learning_rate": 9.791306466622253e-06, + "loss": 0.0102, + "step": 746380 + }, + { + "epoch": 1.93, + "learning_rate": 9.78741825025079e-06, + "loss": 0.0061, + "step": 746390 + }, + { + "epoch": 1.93, + "learning_rate": 9.783530033879323e-06, + "loss": 0.0107, + "step": 746400 + }, + { + "epoch": 1.93, + "learning_rate": 9.77964181750786e-06, + "loss": 0.0076, + "step": 746410 + }, + { + "epoch": 1.93, + "learning_rate": 9.775753601136395e-06, + "loss": 0.0102, + "step": 746420 + }, + { + "epoch": 1.93, + "learning_rate": 9.771865384764931e-06, + "loss": 0.0104, + "step": 746430 + }, + { + "epoch": 1.93, + "learning_rate": 9.767977168393466e-06, + "loss": 0.0066, + "step": 746440 + }, + { + "epoch": 1.93, + "learning_rate": 9.764088952022003e-06, + "loss": 0.0085, + "step": 746450 + }, + { + "epoch": 1.93, + "learning_rate": 9.760200735650536e-06, + "loss": 0.0047, + "step": 746460 + }, + { + "epoch": 1.93, + "learning_rate": 9.75631251927907e-06, + "loss": 0.0065, + "step": 746470 + }, + { + "epoch": 1.93, + "learning_rate": 9.752424302907607e-06, + "loss": 0.0066, + "step": 746480 + }, + { + "epoch": 1.94, + "learning_rate": 9.748536086536142e-06, + "loss": 0.0062, + "step": 746490 + }, + { + "epoch": 1.94, + "learning_rate": 9.744647870164679e-06, + "loss": 0.0074, + "step": 746500 + }, + { + "epoch": 1.94, + "learning_rate": 9.740759653793213e-06, + "loss": 0.006, + "step": 746510 + }, + { + "epoch": 1.94, + "learning_rate": 9.73687143742175e-06, + "loss": 0.0057, + "step": 746520 + }, + { + "epoch": 1.94, + "learning_rate": 9.732983221050283e-06, + "loss": 0.0065, + "step": 746530 + }, + { + "epoch": 1.94, + "learning_rate": 9.72909500467882e-06, + "loss": 0.0067, + "step": 746540 + }, + { + "epoch": 1.94, + "learning_rate": 9.725206788307355e-06, + "loss": 0.0089, + "step": 746550 + }, + { + "epoch": 1.94, + "learning_rate": 9.721318571935891e-06, + "loss": 0.0064, + "step": 746560 + }, + { + "epoch": 1.94, + "learning_rate": 9.717430355564426e-06, + "loss": 0.0072, + "step": 746570 + }, + { + "epoch": 1.94, + "learning_rate": 9.713542139192962e-06, + "loss": 0.0059, + "step": 746580 + }, + { + "epoch": 1.94, + "learning_rate": 9.709653922821496e-06, + "loss": 0.0106, + "step": 746590 + }, + { + "epoch": 1.94, + "learning_rate": 9.70576570645003e-06, + "loss": 0.0064, + "step": 746600 + }, + { + "epoch": 1.94, + "learning_rate": 9.701877490078567e-06, + "loss": 0.0067, + "step": 746610 + }, + { + "epoch": 1.94, + "learning_rate": 9.697989273707102e-06, + "loss": 0.008, + "step": 746620 + }, + { + "epoch": 1.94, + "learning_rate": 9.694101057335638e-06, + "loss": 0.0114, + "step": 746630 + }, + { + "epoch": 1.94, + "learning_rate": 9.690212840964173e-06, + "loss": 0.0054, + "step": 746640 + }, + { + "epoch": 1.94, + "learning_rate": 9.686324624592708e-06, + "loss": 0.0073, + "step": 746650 + }, + { + "epoch": 1.94, + "learning_rate": 9.682436408221243e-06, + "loss": 0.006, + "step": 746660 + }, + { + "epoch": 1.94, + "learning_rate": 9.67854819184978e-06, + "loss": 0.0062, + "step": 746670 + }, + { + "epoch": 1.94, + "learning_rate": 9.674659975478314e-06, + "loss": 0.0076, + "step": 746680 + }, + { + "epoch": 1.94, + "learning_rate": 9.670771759106851e-06, + "loss": 0.0073, + "step": 746690 + }, + { + "epoch": 1.94, + "learning_rate": 9.666883542735386e-06, + "loss": 0.0089, + "step": 746700 + }, + { + "epoch": 1.94, + "learning_rate": 9.662995326363919e-06, + "loss": 0.0086, + "step": 746710 + }, + { + "epoch": 1.94, + "learning_rate": 9.659107109992456e-06, + "loss": 0.0053, + "step": 746720 + }, + { + "epoch": 1.94, + "learning_rate": 9.65521889362099e-06, + "loss": 0.0053, + "step": 746730 + }, + { + "epoch": 1.94, + "learning_rate": 9.651330677249527e-06, + "loss": 0.0104, + "step": 746740 + }, + { + "epoch": 1.94, + "learning_rate": 9.647442460878062e-06, + "loss": 0.0067, + "step": 746750 + }, + { + "epoch": 1.94, + "learning_rate": 9.643554244506598e-06, + "loss": 0.0074, + "step": 746760 + }, + { + "epoch": 1.94, + "learning_rate": 9.639666028135132e-06, + "loss": 0.0064, + "step": 746770 + }, + { + "epoch": 1.94, + "learning_rate": 9.635777811763668e-06, + "loss": 0.0061, + "step": 746780 + }, + { + "epoch": 1.94, + "learning_rate": 9.631889595392203e-06, + "loss": 0.0065, + "step": 746790 + }, + { + "epoch": 1.94, + "learning_rate": 9.62800137902074e-06, + "loss": 0.0067, + "step": 746800 + }, + { + "epoch": 1.94, + "learning_rate": 9.624113162649274e-06, + "loss": 0.0063, + "step": 746810 + }, + { + "epoch": 1.94, + "learning_rate": 9.620224946277811e-06, + "loss": 0.0052, + "step": 746820 + }, + { + "epoch": 1.94, + "learning_rate": 9.616336729906346e-06, + "loss": 0.0071, + "step": 746830 + }, + { + "epoch": 1.94, + "learning_rate": 9.612448513534879e-06, + "loss": 0.0083, + "step": 746840 + }, + { + "epoch": 1.94, + "learning_rate": 9.608560297163416e-06, + "loss": 0.0076, + "step": 746850 + }, + { + "epoch": 1.94, + "learning_rate": 9.60467208079195e-06, + "loss": 0.0047, + "step": 746860 + }, + { + "epoch": 1.94, + "learning_rate": 9.600783864420487e-06, + "loss": 0.0092, + "step": 746870 + }, + { + "epoch": 1.94, + "learning_rate": 9.596895648049022e-06, + "loss": 0.0069, + "step": 746880 + }, + { + "epoch": 1.94, + "learning_rate": 9.593007431677558e-06, + "loss": 0.0087, + "step": 746890 + }, + { + "epoch": 1.94, + "learning_rate": 9.589119215306092e-06, + "loss": 0.0089, + "step": 746900 + }, + { + "epoch": 1.94, + "learning_rate": 9.585230998934628e-06, + "loss": 0.0075, + "step": 746910 + }, + { + "epoch": 1.94, + "learning_rate": 9.581342782563163e-06, + "loss": 0.0062, + "step": 746920 + }, + { + "epoch": 1.94, + "learning_rate": 9.5774545661917e-06, + "loss": 0.0079, + "step": 746930 + }, + { + "epoch": 1.94, + "learning_rate": 9.573566349820234e-06, + "loss": 0.0065, + "step": 746940 + }, + { + "epoch": 1.94, + "learning_rate": 9.569678133448771e-06, + "loss": 0.0088, + "step": 746950 + }, + { + "epoch": 1.94, + "learning_rate": 9.565789917077304e-06, + "loss": 0.0065, + "step": 746960 + }, + { + "epoch": 1.94, + "learning_rate": 9.561901700705839e-06, + "loss": 0.007, + "step": 746970 + }, + { + "epoch": 1.94, + "learning_rate": 9.558013484334376e-06, + "loss": 0.0051, + "step": 746980 + }, + { + "epoch": 1.94, + "learning_rate": 9.55412526796291e-06, + "loss": 0.009, + "step": 746990 + }, + { + "epoch": 1.94, + "learning_rate": 9.550237051591447e-06, + "loss": 0.0055, + "step": 747000 + }, + { + "epoch": 1.94, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.0044586677104234695, + "eval_runtime": 107.824, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 747000 + }, + { + "epoch": 1.94, + "learning_rate": 9.546348835219982e-06, + "loss": 0.0108, + "step": 747010 + }, + { + "epoch": 1.94, + "learning_rate": 9.542460618848515e-06, + "loss": 0.0068, + "step": 747020 + }, + { + "epoch": 1.94, + "learning_rate": 9.538572402477052e-06, + "loss": 0.0128, + "step": 747030 + }, + { + "epoch": 1.94, + "learning_rate": 9.534684186105586e-06, + "loss": 0.0101, + "step": 747040 + }, + { + "epoch": 1.94, + "learning_rate": 9.530795969734123e-06, + "loss": 0.008, + "step": 747050 + }, + { + "epoch": 1.94, + "learning_rate": 9.526907753362658e-06, + "loss": 0.0068, + "step": 747060 + }, + { + "epoch": 1.94, + "learning_rate": 9.523019536991194e-06, + "loss": 0.007, + "step": 747070 + }, + { + "epoch": 1.94, + "learning_rate": 9.51913132061973e-06, + "loss": 0.0146, + "step": 747080 + }, + { + "epoch": 1.94, + "learning_rate": 9.515243104248264e-06, + "loss": 0.0066, + "step": 747090 + }, + { + "epoch": 1.94, + "learning_rate": 9.511354887876799e-06, + "loss": 0.0061, + "step": 747100 + }, + { + "epoch": 1.94, + "learning_rate": 9.507466671505336e-06, + "loss": 0.0091, + "step": 747110 + }, + { + "epoch": 1.94, + "learning_rate": 9.50357845513387e-06, + "loss": 0.0046, + "step": 747120 + }, + { + "epoch": 1.94, + "learning_rate": 9.499690238762407e-06, + "loss": 0.007, + "step": 747130 + }, + { + "epoch": 1.94, + "learning_rate": 9.495802022390942e-06, + "loss": 0.0059, + "step": 747140 + }, + { + "epoch": 1.94, + "learning_rate": 9.491913806019475e-06, + "loss": 0.0059, + "step": 747150 + }, + { + "epoch": 1.94, + "learning_rate": 9.488025589648012e-06, + "loss": 0.0054, + "step": 747160 + }, + { + "epoch": 1.94, + "learning_rate": 9.484137373276546e-06, + "loss": 0.0053, + "step": 747170 + }, + { + "epoch": 1.94, + "learning_rate": 9.480249156905083e-06, + "loss": 0.0058, + "step": 747180 + }, + { + "epoch": 1.94, + "learning_rate": 9.476360940533618e-06, + "loss": 0.0071, + "step": 747190 + }, + { + "epoch": 1.94, + "learning_rate": 9.472472724162154e-06, + "loss": 0.0065, + "step": 747200 + }, + { + "epoch": 1.94, + "learning_rate": 9.468584507790688e-06, + "loss": 0.0065, + "step": 747210 + }, + { + "epoch": 1.94, + "learning_rate": 9.464696291419224e-06, + "loss": 0.0073, + "step": 747220 + }, + { + "epoch": 1.94, + "learning_rate": 9.460808075047759e-06, + "loss": 0.0105, + "step": 747230 + }, + { + "epoch": 1.94, + "learning_rate": 9.456919858676296e-06, + "loss": 0.008, + "step": 747240 + }, + { + "epoch": 1.94, + "learning_rate": 9.45303164230483e-06, + "loss": 0.0051, + "step": 747250 + }, + { + "epoch": 1.94, + "learning_rate": 9.449143425933367e-06, + "loss": 0.0078, + "step": 747260 + }, + { + "epoch": 1.94, + "learning_rate": 9.4452552095619e-06, + "loss": 0.0077, + "step": 747270 + }, + { + "epoch": 1.94, + "learning_rate": 9.441366993190435e-06, + "loss": 0.0086, + "step": 747280 + }, + { + "epoch": 1.94, + "learning_rate": 9.437478776818972e-06, + "loss": 0.0076, + "step": 747290 + }, + { + "epoch": 1.94, + "learning_rate": 9.433590560447506e-06, + "loss": 0.0059, + "step": 747300 + }, + { + "epoch": 1.94, + "learning_rate": 9.429702344076043e-06, + "loss": 0.0054, + "step": 747310 + }, + { + "epoch": 1.94, + "learning_rate": 9.425814127704578e-06, + "loss": 0.0067, + "step": 747320 + }, + { + "epoch": 1.94, + "learning_rate": 9.421925911333113e-06, + "loss": 0.0072, + "step": 747330 + }, + { + "epoch": 1.94, + "learning_rate": 9.418037694961648e-06, + "loss": 0.0082, + "step": 747340 + }, + { + "epoch": 1.94, + "learning_rate": 9.414149478590184e-06, + "loss": 0.0079, + "step": 747350 + }, + { + "epoch": 1.94, + "learning_rate": 9.410261262218719e-06, + "loss": 0.0066, + "step": 747360 + }, + { + "epoch": 1.94, + "learning_rate": 9.406373045847256e-06, + "loss": 0.0068, + "step": 747370 + }, + { + "epoch": 1.94, + "learning_rate": 9.40248482947579e-06, + "loss": 0.0066, + "step": 747380 + }, + { + "epoch": 1.94, + "learning_rate": 9.398596613104327e-06, + "loss": 0.0045, + "step": 747390 + }, + { + "epoch": 1.94, + "learning_rate": 9.39470839673286e-06, + "loss": 0.0063, + "step": 747400 + }, + { + "epoch": 1.94, + "learning_rate": 9.390820180361395e-06, + "loss": 0.0082, + "step": 747410 + }, + { + "epoch": 1.94, + "learning_rate": 9.386931963989932e-06, + "loss": 0.0056, + "step": 747420 + }, + { + "epoch": 1.94, + "learning_rate": 9.383043747618466e-06, + "loss": 0.0075, + "step": 747430 + }, + { + "epoch": 1.94, + "learning_rate": 9.379155531247003e-06, + "loss": 0.0075, + "step": 747440 + }, + { + "epoch": 1.94, + "learning_rate": 9.375267314875538e-06, + "loss": 0.0065, + "step": 747450 + }, + { + "epoch": 1.94, + "learning_rate": 9.371379098504073e-06, + "loss": 0.006, + "step": 747460 + }, + { + "epoch": 1.94, + "learning_rate": 9.367490882132608e-06, + "loss": 0.0081, + "step": 747470 + }, + { + "epoch": 1.94, + "learning_rate": 9.363602665761144e-06, + "loss": 0.0068, + "step": 747480 + }, + { + "epoch": 1.94, + "learning_rate": 9.359714449389679e-06, + "loss": 0.0058, + "step": 747490 + }, + { + "epoch": 1.94, + "learning_rate": 9.355826233018214e-06, + "loss": 0.008, + "step": 747500 + }, + { + "epoch": 1.94, + "learning_rate": 9.351938016646749e-06, + "loss": 0.007, + "step": 747510 + }, + { + "epoch": 1.94, + "learning_rate": 9.348049800275285e-06, + "loss": 0.0068, + "step": 747520 + }, + { + "epoch": 1.94, + "learning_rate": 9.34416158390382e-06, + "loss": 0.0048, + "step": 747530 + }, + { + "epoch": 1.94, + "learning_rate": 9.340273367532355e-06, + "loss": 0.0053, + "step": 747540 + }, + { + "epoch": 1.94, + "learning_rate": 9.336385151160891e-06, + "loss": 0.0078, + "step": 747550 + }, + { + "epoch": 1.94, + "learning_rate": 9.332496934789426e-06, + "loss": 0.0071, + "step": 747560 + }, + { + "epoch": 1.94, + "learning_rate": 9.328608718417961e-06, + "loss": 0.0092, + "step": 747570 + }, + { + "epoch": 1.94, + "learning_rate": 9.324720502046498e-06, + "loss": 0.0071, + "step": 747580 + }, + { + "epoch": 1.94, + "learning_rate": 9.320832285675033e-06, + "loss": 0.0065, + "step": 747590 + }, + { + "epoch": 1.94, + "learning_rate": 9.316944069303567e-06, + "loss": 0.0076, + "step": 747600 + }, + { + "epoch": 1.94, + "learning_rate": 9.313055852932104e-06, + "loss": 0.006, + "step": 747610 + }, + { + "epoch": 1.94, + "learning_rate": 9.309167636560639e-06, + "loss": 0.0062, + "step": 747620 + }, + { + "epoch": 1.94, + "learning_rate": 9.305279420189174e-06, + "loss": 0.0039, + "step": 747630 + }, + { + "epoch": 1.94, + "learning_rate": 9.301391203817709e-06, + "loss": 0.0067, + "step": 747640 + }, + { + "epoch": 1.94, + "learning_rate": 9.297502987446245e-06, + "loss": 0.0082, + "step": 747650 + }, + { + "epoch": 1.94, + "learning_rate": 9.29361477107478e-06, + "loss": 0.0105, + "step": 747660 + }, + { + "epoch": 1.94, + "learning_rate": 9.289726554703315e-06, + "loss": 0.0062, + "step": 747670 + }, + { + "epoch": 1.94, + "learning_rate": 9.285838338331851e-06, + "loss": 0.0078, + "step": 747680 + }, + { + "epoch": 1.94, + "learning_rate": 9.281950121960386e-06, + "loss": 0.0082, + "step": 747690 + }, + { + "epoch": 1.94, + "learning_rate": 9.278061905588921e-06, + "loss": 0.0072, + "step": 747700 + }, + { + "epoch": 1.94, + "learning_rate": 9.274173689217458e-06, + "loss": 0.0099, + "step": 747710 + }, + { + "epoch": 1.94, + "learning_rate": 9.270285472845991e-06, + "loss": 0.0069, + "step": 747720 + }, + { + "epoch": 1.94, + "learning_rate": 9.266397256474527e-06, + "loss": 0.0076, + "step": 747730 + }, + { + "epoch": 1.94, + "learning_rate": 9.262509040103062e-06, + "loss": 0.0063, + "step": 747740 + }, + { + "epoch": 1.94, + "learning_rate": 9.258620823731597e-06, + "loss": 0.0063, + "step": 747750 + }, + { + "epoch": 1.94, + "learning_rate": 9.254732607360134e-06, + "loss": 0.0053, + "step": 747760 + }, + { + "epoch": 1.94, + "learning_rate": 9.250844390988669e-06, + "loss": 0.0099, + "step": 747770 + }, + { + "epoch": 1.94, + "learning_rate": 9.246956174617203e-06, + "loss": 0.0063, + "step": 747780 + }, + { + "epoch": 1.94, + "learning_rate": 9.24306795824574e-06, + "loss": 0.0085, + "step": 747790 + }, + { + "epoch": 1.94, + "learning_rate": 9.239179741874275e-06, + "loss": 0.0064, + "step": 747800 + }, + { + "epoch": 1.94, + "learning_rate": 9.23529152550281e-06, + "loss": 0.0062, + "step": 747810 + }, + { + "epoch": 1.94, + "learning_rate": 9.231403309131346e-06, + "loss": 0.0076, + "step": 747820 + }, + { + "epoch": 1.94, + "learning_rate": 9.227515092759881e-06, + "loss": 0.0047, + "step": 747830 + }, + { + "epoch": 1.94, + "learning_rate": 9.223626876388416e-06, + "loss": 0.0065, + "step": 747840 + }, + { + "epoch": 1.94, + "learning_rate": 9.219738660016951e-06, + "loss": 0.005, + "step": 747850 + }, + { + "epoch": 1.94, + "learning_rate": 9.215850443645487e-06, + "loss": 0.011, + "step": 747860 + }, + { + "epoch": 1.94, + "learning_rate": 9.211962227274022e-06, + "loss": 0.0052, + "step": 747870 + }, + { + "epoch": 1.94, + "learning_rate": 9.208074010902557e-06, + "loss": 0.0053, + "step": 747880 + }, + { + "epoch": 1.94, + "learning_rate": 9.204185794531094e-06, + "loss": 0.0046, + "step": 747890 + }, + { + "epoch": 1.94, + "learning_rate": 9.200297578159629e-06, + "loss": 0.0074, + "step": 747900 + }, + { + "epoch": 1.94, + "learning_rate": 9.196409361788163e-06, + "loss": 0.0063, + "step": 747910 + }, + { + "epoch": 1.94, + "learning_rate": 9.1925211454167e-06, + "loss": 0.0044, + "step": 747920 + }, + { + "epoch": 1.94, + "learning_rate": 9.188632929045235e-06, + "loss": 0.0067, + "step": 747930 + }, + { + "epoch": 1.94, + "learning_rate": 9.18474471267377e-06, + "loss": 0.0081, + "step": 747940 + }, + { + "epoch": 1.94, + "learning_rate": 9.180856496302306e-06, + "loss": 0.0049, + "step": 747950 + }, + { + "epoch": 1.94, + "learning_rate": 9.176968279930841e-06, + "loss": 0.0068, + "step": 747960 + }, + { + "epoch": 1.94, + "learning_rate": 9.173080063559376e-06, + "loss": 0.0049, + "step": 747970 + }, + { + "epoch": 1.94, + "learning_rate": 9.169191847187911e-06, + "loss": 0.0061, + "step": 747980 + }, + { + "epoch": 1.94, + "learning_rate": 9.165303630816447e-06, + "loss": 0.0086, + "step": 747990 + }, + { + "epoch": 1.94, + "learning_rate": 9.161415414444982e-06, + "loss": 0.0062, + "step": 748000 + }, + { + "epoch": 1.94, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.004467161372303963, + "eval_runtime": 107.7694, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.64, + "step": 748000 + }, + { + "epoch": 1.94, + "learning_rate": 9.157527198073517e-06, + "loss": 0.0074, + "step": 748010 + }, + { + "epoch": 1.94, + "learning_rate": 9.153638981702054e-06, + "loss": 0.0083, + "step": 748020 + }, + { + "epoch": 1.94, + "learning_rate": 9.149750765330589e-06, + "loss": 0.0077, + "step": 748030 + }, + { + "epoch": 1.94, + "learning_rate": 9.145862548959123e-06, + "loss": 0.0063, + "step": 748040 + }, + { + "epoch": 1.94, + "learning_rate": 9.14197433258766e-06, + "loss": 0.0051, + "step": 748050 + }, + { + "epoch": 1.94, + "learning_rate": 9.138086116216193e-06, + "loss": 0.0089, + "step": 748060 + }, + { + "epoch": 1.94, + "learning_rate": 9.13419789984473e-06, + "loss": 0.0056, + "step": 748070 + }, + { + "epoch": 1.94, + "learning_rate": 9.130309683473265e-06, + "loss": 0.0133, + "step": 748080 + }, + { + "epoch": 1.94, + "learning_rate": 9.1264214671018e-06, + "loss": 0.0096, + "step": 748090 + }, + { + "epoch": 1.94, + "learning_rate": 9.122533250730336e-06, + "loss": 0.0062, + "step": 748100 + }, + { + "epoch": 1.94, + "learning_rate": 9.11864503435887e-06, + "loss": 0.0067, + "step": 748110 + }, + { + "epoch": 1.94, + "learning_rate": 9.114756817987406e-06, + "loss": 0.0072, + "step": 748120 + }, + { + "epoch": 1.94, + "learning_rate": 9.110868601615942e-06, + "loss": 0.006, + "step": 748130 + }, + { + "epoch": 1.94, + "learning_rate": 9.106980385244477e-06, + "loss": 0.0083, + "step": 748140 + }, + { + "epoch": 1.94, + "learning_rate": 9.103092168873014e-06, + "loss": 0.0062, + "step": 748150 + }, + { + "epoch": 1.94, + "learning_rate": 9.099203952501549e-06, + "loss": 0.0074, + "step": 748160 + }, + { + "epoch": 1.94, + "learning_rate": 9.095315736130083e-06, + "loss": 0.0069, + "step": 748170 + }, + { + "epoch": 1.94, + "learning_rate": 9.09142751975862e-06, + "loss": 0.0073, + "step": 748180 + }, + { + "epoch": 1.94, + "learning_rate": 9.087539303387153e-06, + "loss": 0.0079, + "step": 748190 + }, + { + "epoch": 1.94, + "learning_rate": 9.08365108701569e-06, + "loss": 0.0063, + "step": 748200 + }, + { + "epoch": 1.94, + "learning_rate": 9.079762870644225e-06, + "loss": 0.006, + "step": 748210 + }, + { + "epoch": 1.94, + "learning_rate": 9.07587465427276e-06, + "loss": 0.0073, + "step": 748220 + }, + { + "epoch": 1.94, + "learning_rate": 9.071986437901296e-06, + "loss": 0.0069, + "step": 748230 + }, + { + "epoch": 1.94, + "learning_rate": 9.06809822152983e-06, + "loss": 0.0063, + "step": 748240 + }, + { + "epoch": 1.94, + "learning_rate": 9.064210005158366e-06, + "loss": 0.0061, + "step": 748250 + }, + { + "epoch": 1.94, + "learning_rate": 9.060321788786902e-06, + "loss": 0.0069, + "step": 748260 + }, + { + "epoch": 1.94, + "learning_rate": 9.056433572415437e-06, + "loss": 0.0059, + "step": 748270 + }, + { + "epoch": 1.94, + "learning_rate": 9.052545356043972e-06, + "loss": 0.0079, + "step": 748280 + }, + { + "epoch": 1.94, + "learning_rate": 9.048657139672509e-06, + "loss": 0.0058, + "step": 748290 + }, + { + "epoch": 1.94, + "learning_rate": 9.044768923301043e-06, + "loss": 0.0076, + "step": 748300 + }, + { + "epoch": 1.94, + "learning_rate": 9.040880706929578e-06, + "loss": 0.0066, + "step": 748310 + }, + { + "epoch": 1.94, + "learning_rate": 9.036992490558113e-06, + "loss": 0.008, + "step": 748320 + }, + { + "epoch": 1.94, + "learning_rate": 9.03310427418665e-06, + "loss": 0.0044, + "step": 748330 + }, + { + "epoch": 1.94, + "learning_rate": 9.029216057815185e-06, + "loss": 0.0102, + "step": 748340 + }, + { + "epoch": 1.94, + "learning_rate": 9.02532784144372e-06, + "loss": 0.0048, + "step": 748350 + }, + { + "epoch": 1.94, + "learning_rate": 9.021439625072256e-06, + "loss": 0.0076, + "step": 748360 + }, + { + "epoch": 1.94, + "learning_rate": 9.01755140870079e-06, + "loss": 0.0052, + "step": 748370 + }, + { + "epoch": 1.94, + "learning_rate": 9.013663192329326e-06, + "loss": 0.0068, + "step": 748380 + }, + { + "epoch": 1.94, + "learning_rate": 9.009774975957862e-06, + "loss": 0.007, + "step": 748390 + }, + { + "epoch": 1.94, + "learning_rate": 9.005886759586395e-06, + "loss": 0.0057, + "step": 748400 + }, + { + "epoch": 1.94, + "learning_rate": 9.001998543214932e-06, + "loss": 0.0074, + "step": 748410 + }, + { + "epoch": 1.94, + "learning_rate": 8.998110326843467e-06, + "loss": 0.0065, + "step": 748420 + }, + { + "epoch": 1.94, + "learning_rate": 8.994222110472002e-06, + "loss": 0.0091, + "step": 748430 + }, + { + "epoch": 1.94, + "learning_rate": 8.990333894100538e-06, + "loss": 0.0061, + "step": 748440 + }, + { + "epoch": 1.94, + "learning_rate": 8.986445677729073e-06, + "loss": 0.0083, + "step": 748450 + }, + { + "epoch": 1.94, + "learning_rate": 8.98255746135761e-06, + "loss": 0.0075, + "step": 748460 + }, + { + "epoch": 1.94, + "learning_rate": 8.978669244986144e-06, + "loss": 0.0069, + "step": 748470 + }, + { + "epoch": 1.94, + "learning_rate": 8.97478102861468e-06, + "loss": 0.0064, + "step": 748480 + }, + { + "epoch": 1.94, + "learning_rate": 8.970892812243216e-06, + "loss": 0.0076, + "step": 748490 + }, + { + "epoch": 1.94, + "learning_rate": 8.96700459587175e-06, + "loss": 0.0084, + "step": 748500 + }, + { + "epoch": 1.94, + "learning_rate": 8.963116379500286e-06, + "loss": 0.0062, + "step": 748510 + }, + { + "epoch": 1.94, + "learning_rate": 8.959228163128822e-06, + "loss": 0.0062, + "step": 748520 + }, + { + "epoch": 1.94, + "learning_rate": 8.955339946757355e-06, + "loss": 0.0069, + "step": 748530 + }, + { + "epoch": 1.94, + "learning_rate": 8.951451730385892e-06, + "loss": 0.0058, + "step": 748540 + }, + { + "epoch": 1.94, + "learning_rate": 8.947563514014427e-06, + "loss": 0.0068, + "step": 748550 + }, + { + "epoch": 1.94, + "learning_rate": 8.943675297642962e-06, + "loss": 0.0093, + "step": 748560 + }, + { + "epoch": 1.94, + "learning_rate": 8.939787081271498e-06, + "loss": 0.0062, + "step": 748570 + }, + { + "epoch": 1.94, + "learning_rate": 8.935898864900033e-06, + "loss": 0.0065, + "step": 748580 + }, + { + "epoch": 1.94, + "learning_rate": 8.932010648528568e-06, + "loss": 0.0087, + "step": 748590 + }, + { + "epoch": 1.94, + "learning_rate": 8.928122432157104e-06, + "loss": 0.0079, + "step": 748600 + }, + { + "epoch": 1.94, + "learning_rate": 8.92423421578564e-06, + "loss": 0.0072, + "step": 748610 + }, + { + "epoch": 1.94, + "learning_rate": 8.920345999414174e-06, + "loss": 0.0091, + "step": 748620 + }, + { + "epoch": 1.94, + "learning_rate": 8.91645778304271e-06, + "loss": 0.0088, + "step": 748630 + }, + { + "epoch": 1.94, + "learning_rate": 8.912569566671246e-06, + "loss": 0.0056, + "step": 748640 + }, + { + "epoch": 1.94, + "learning_rate": 8.90868135029978e-06, + "loss": 0.0054, + "step": 748650 + }, + { + "epoch": 1.94, + "learning_rate": 8.904793133928315e-06, + "loss": 0.0062, + "step": 748660 + }, + { + "epoch": 1.94, + "learning_rate": 8.900904917556852e-06, + "loss": 0.0075, + "step": 748670 + }, + { + "epoch": 1.94, + "learning_rate": 8.897016701185387e-06, + "loss": 0.0071, + "step": 748680 + }, + { + "epoch": 1.94, + "learning_rate": 8.893128484813922e-06, + "loss": 0.0081, + "step": 748690 + }, + { + "epoch": 1.94, + "learning_rate": 8.889240268442458e-06, + "loss": 0.0088, + "step": 748700 + }, + { + "epoch": 1.94, + "learning_rate": 8.885352052070993e-06, + "loss": 0.0073, + "step": 748710 + }, + { + "epoch": 1.94, + "learning_rate": 8.881463835699528e-06, + "loss": 0.0089, + "step": 748720 + }, + { + "epoch": 1.94, + "learning_rate": 8.877575619328064e-06, + "loss": 0.0084, + "step": 748730 + }, + { + "epoch": 1.94, + "learning_rate": 8.8736874029566e-06, + "loss": 0.0053, + "step": 748740 + }, + { + "epoch": 1.94, + "learning_rate": 8.869799186585134e-06, + "loss": 0.0068, + "step": 748750 + }, + { + "epoch": 1.94, + "learning_rate": 8.865910970213669e-06, + "loss": 0.0071, + "step": 748760 + }, + { + "epoch": 1.94, + "learning_rate": 8.862022753842206e-06, + "loss": 0.0078, + "step": 748770 + }, + { + "epoch": 1.94, + "learning_rate": 8.85813453747074e-06, + "loss": 0.0114, + "step": 748780 + }, + { + "epoch": 1.94, + "learning_rate": 8.854246321099275e-06, + "loss": 0.0071, + "step": 748790 + }, + { + "epoch": 1.94, + "learning_rate": 8.850358104727812e-06, + "loss": 0.0073, + "step": 748800 + }, + { + "epoch": 1.94, + "learning_rate": 8.846469888356347e-06, + "loss": 0.0063, + "step": 748810 + }, + { + "epoch": 1.94, + "learning_rate": 8.842581671984882e-06, + "loss": 0.0117, + "step": 748820 + }, + { + "epoch": 1.94, + "learning_rate": 8.838693455613418e-06, + "loss": 0.0097, + "step": 748830 + }, + { + "epoch": 1.94, + "learning_rate": 8.834805239241953e-06, + "loss": 0.0059, + "step": 748840 + }, + { + "epoch": 1.94, + "learning_rate": 8.830917022870488e-06, + "loss": 0.0079, + "step": 748850 + }, + { + "epoch": 1.94, + "learning_rate": 8.827028806499024e-06, + "loss": 0.007, + "step": 748860 + }, + { + "epoch": 1.94, + "learning_rate": 8.823140590127558e-06, + "loss": 0.0074, + "step": 748870 + }, + { + "epoch": 1.94, + "learning_rate": 8.819252373756094e-06, + "loss": 0.0048, + "step": 748880 + }, + { + "epoch": 1.94, + "learning_rate": 8.815364157384629e-06, + "loss": 0.0062, + "step": 748890 + }, + { + "epoch": 1.94, + "learning_rate": 8.811475941013164e-06, + "loss": 0.0084, + "step": 748900 + }, + { + "epoch": 1.94, + "learning_rate": 8.8075877246417e-06, + "loss": 0.0091, + "step": 748910 + }, + { + "epoch": 1.94, + "learning_rate": 8.803699508270235e-06, + "loss": 0.0093, + "step": 748920 + }, + { + "epoch": 1.94, + "learning_rate": 8.79981129189877e-06, + "loss": 0.004, + "step": 748930 + }, + { + "epoch": 1.94, + "learning_rate": 8.795923075527307e-06, + "loss": 0.0066, + "step": 748940 + }, + { + "epoch": 1.94, + "learning_rate": 8.792034859155842e-06, + "loss": 0.0067, + "step": 748950 + }, + { + "epoch": 1.94, + "learning_rate": 8.788146642784376e-06, + "loss": 0.0038, + "step": 748960 + }, + { + "epoch": 1.94, + "learning_rate": 8.784258426412913e-06, + "loss": 0.0068, + "step": 748970 + }, + { + "epoch": 1.94, + "learning_rate": 8.780370210041448e-06, + "loss": 0.006, + "step": 748980 + }, + { + "epoch": 1.94, + "learning_rate": 8.776481993669983e-06, + "loss": 0.0062, + "step": 748990 + }, + { + "epoch": 1.94, + "learning_rate": 8.772593777298518e-06, + "loss": 0.0066, + "step": 749000 + }, + { + "epoch": 1.94, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.004472545813769102, + "eval_runtime": 108.118, + "eval_samples_per_second": 18.498, + "eval_steps_per_second": 4.625, + "step": 749000 + }, + { + "epoch": 1.94, + "learning_rate": 8.768705560927054e-06, + "loss": 0.0079, + "step": 749010 + }, + { + "epoch": 1.94, + "learning_rate": 8.764817344555589e-06, + "loss": 0.0056, + "step": 749020 + }, + { + "epoch": 1.94, + "learning_rate": 8.760929128184124e-06, + "loss": 0.0103, + "step": 749030 + }, + { + "epoch": 1.94, + "learning_rate": 8.75704091181266e-06, + "loss": 0.0065, + "step": 749040 + }, + { + "epoch": 1.94, + "learning_rate": 8.753152695441195e-06, + "loss": 0.0095, + "step": 749050 + }, + { + "epoch": 1.94, + "learning_rate": 8.74926447906973e-06, + "loss": 0.0077, + "step": 749060 + }, + { + "epoch": 1.94, + "learning_rate": 8.745376262698267e-06, + "loss": 0.0071, + "step": 749070 + }, + { + "epoch": 1.94, + "learning_rate": 8.741488046326802e-06, + "loss": 0.0076, + "step": 749080 + }, + { + "epoch": 1.94, + "learning_rate": 8.737599829955336e-06, + "loss": 0.0089, + "step": 749090 + }, + { + "epoch": 1.94, + "learning_rate": 8.733711613583871e-06, + "loss": 0.0065, + "step": 749100 + }, + { + "epoch": 1.94, + "learning_rate": 8.729823397212408e-06, + "loss": 0.0055, + "step": 749110 + }, + { + "epoch": 1.94, + "learning_rate": 8.725935180840943e-06, + "loss": 0.0091, + "step": 749120 + }, + { + "epoch": 1.94, + "learning_rate": 8.722046964469478e-06, + "loss": 0.0064, + "step": 749130 + }, + { + "epoch": 1.94, + "learning_rate": 8.718158748098014e-06, + "loss": 0.008, + "step": 749140 + }, + { + "epoch": 1.94, + "learning_rate": 8.714270531726549e-06, + "loss": 0.0054, + "step": 749150 + }, + { + "epoch": 1.94, + "learning_rate": 8.710382315355084e-06, + "loss": 0.0071, + "step": 749160 + }, + { + "epoch": 1.94, + "learning_rate": 8.70649409898362e-06, + "loss": 0.0071, + "step": 749170 + }, + { + "epoch": 1.94, + "learning_rate": 8.702605882612155e-06, + "loss": 0.0056, + "step": 749180 + }, + { + "epoch": 1.94, + "learning_rate": 8.69871766624069e-06, + "loss": 0.0076, + "step": 749190 + }, + { + "epoch": 1.94, + "learning_rate": 8.694829449869227e-06, + "loss": 0.0049, + "step": 749200 + }, + { + "epoch": 1.94, + "learning_rate": 8.69094123349776e-06, + "loss": 0.0062, + "step": 749210 + }, + { + "epoch": 1.94, + "learning_rate": 8.687053017126296e-06, + "loss": 0.0063, + "step": 749220 + }, + { + "epoch": 1.94, + "learning_rate": 8.683164800754831e-06, + "loss": 0.0064, + "step": 749230 + }, + { + "epoch": 1.94, + "learning_rate": 8.679276584383366e-06, + "loss": 0.0078, + "step": 749240 + }, + { + "epoch": 1.94, + "learning_rate": 8.675388368011903e-06, + "loss": 0.0077, + "step": 749250 + }, + { + "epoch": 1.94, + "learning_rate": 8.671500151640438e-06, + "loss": 0.0072, + "step": 749260 + }, + { + "epoch": 1.94, + "learning_rate": 8.667611935268972e-06, + "loss": 0.0076, + "step": 749270 + }, + { + "epoch": 1.94, + "learning_rate": 8.663723718897509e-06, + "loss": 0.0064, + "step": 749280 + }, + { + "epoch": 1.94, + "learning_rate": 8.659835502526044e-06, + "loss": 0.0098, + "step": 749290 + }, + { + "epoch": 1.94, + "learning_rate": 8.655947286154579e-06, + "loss": 0.0104, + "step": 749300 + }, + { + "epoch": 1.94, + "learning_rate": 8.652059069783115e-06, + "loss": 0.005, + "step": 749310 + }, + { + "epoch": 1.94, + "learning_rate": 8.64817085341165e-06, + "loss": 0.0073, + "step": 749320 + }, + { + "epoch": 1.94, + "learning_rate": 8.644282637040185e-06, + "loss": 0.0063, + "step": 749330 + }, + { + "epoch": 1.94, + "learning_rate": 8.64039442066872e-06, + "loss": 0.0062, + "step": 749340 + }, + { + "epoch": 1.94, + "learning_rate": 8.636506204297256e-06, + "loss": 0.0054, + "step": 749350 + }, + { + "epoch": 1.94, + "learning_rate": 8.632617987925791e-06, + "loss": 0.0069, + "step": 749360 + }, + { + "epoch": 1.94, + "learning_rate": 8.628729771554326e-06, + "loss": 0.0061, + "step": 749370 + }, + { + "epoch": 1.94, + "learning_rate": 8.624841555182863e-06, + "loss": 0.0086, + "step": 749380 + }, + { + "epoch": 1.94, + "learning_rate": 8.620953338811397e-06, + "loss": 0.0078, + "step": 749390 + }, + { + "epoch": 1.94, + "learning_rate": 8.617065122439932e-06, + "loss": 0.007, + "step": 749400 + }, + { + "epoch": 1.94, + "learning_rate": 8.613176906068469e-06, + "loss": 0.0051, + "step": 749410 + }, + { + "epoch": 1.94, + "learning_rate": 8.609288689697004e-06, + "loss": 0.0066, + "step": 749420 + }, + { + "epoch": 1.94, + "learning_rate": 8.605400473325539e-06, + "loss": 0.0074, + "step": 749430 + }, + { + "epoch": 1.94, + "learning_rate": 8.601512256954073e-06, + "loss": 0.0056, + "step": 749440 + }, + { + "epoch": 1.94, + "learning_rate": 8.59762404058261e-06, + "loss": 0.0095, + "step": 749450 + }, + { + "epoch": 1.94, + "learning_rate": 8.593735824211145e-06, + "loss": 0.0089, + "step": 749460 + }, + { + "epoch": 1.94, + "learning_rate": 8.58984760783968e-06, + "loss": 0.0085, + "step": 749470 + }, + { + "epoch": 1.94, + "learning_rate": 8.585959391468216e-06, + "loss": 0.0063, + "step": 749480 + }, + { + "epoch": 1.94, + "learning_rate": 8.582071175096751e-06, + "loss": 0.0052, + "step": 749490 + }, + { + "epoch": 1.94, + "learning_rate": 8.578182958725286e-06, + "loss": 0.0068, + "step": 749500 + }, + { + "epoch": 1.94, + "learning_rate": 8.574294742353823e-06, + "loss": 0.0083, + "step": 749510 + }, + { + "epoch": 1.94, + "learning_rate": 8.570406525982357e-06, + "loss": 0.0086, + "step": 749520 + }, + { + "epoch": 1.94, + "learning_rate": 8.566518309610892e-06, + "loss": 0.0074, + "step": 749530 + }, + { + "epoch": 1.94, + "learning_rate": 8.562630093239429e-06, + "loss": 0.008, + "step": 749540 + }, + { + "epoch": 1.94, + "learning_rate": 8.558741876867962e-06, + "loss": 0.0077, + "step": 749550 + }, + { + "epoch": 1.94, + "learning_rate": 8.554853660496499e-06, + "loss": 0.0064, + "step": 749560 + }, + { + "epoch": 1.94, + "learning_rate": 8.550965444125033e-06, + "loss": 0.0071, + "step": 749570 + }, + { + "epoch": 1.94, + "learning_rate": 8.547077227753568e-06, + "loss": 0.0044, + "step": 749580 + }, + { + "epoch": 1.94, + "learning_rate": 8.543189011382105e-06, + "loss": 0.0077, + "step": 749590 + }, + { + "epoch": 1.94, + "learning_rate": 8.53930079501064e-06, + "loss": 0.0092, + "step": 749600 + }, + { + "epoch": 1.94, + "learning_rate": 8.535412578639175e-06, + "loss": 0.0094, + "step": 749610 + }, + { + "epoch": 1.94, + "learning_rate": 8.531524362267711e-06, + "loss": 0.0076, + "step": 749620 + }, + { + "epoch": 1.94, + "learning_rate": 8.527636145896246e-06, + "loss": 0.0088, + "step": 749630 + }, + { + "epoch": 1.94, + "learning_rate": 8.523747929524781e-06, + "loss": 0.0064, + "step": 749640 + }, + { + "epoch": 1.94, + "learning_rate": 8.519859713153317e-06, + "loss": 0.0067, + "step": 749650 + }, + { + "epoch": 1.94, + "learning_rate": 8.515971496781852e-06, + "loss": 0.0078, + "step": 749660 + }, + { + "epoch": 1.94, + "learning_rate": 8.512083280410387e-06, + "loss": 0.0054, + "step": 749670 + }, + { + "epoch": 1.94, + "learning_rate": 8.508195064038922e-06, + "loss": 0.0073, + "step": 749680 + }, + { + "epoch": 1.94, + "learning_rate": 8.504306847667459e-06, + "loss": 0.0077, + "step": 749690 + }, + { + "epoch": 1.94, + "learning_rate": 8.500418631295993e-06, + "loss": 0.0057, + "step": 749700 + }, + { + "epoch": 1.94, + "learning_rate": 8.496530414924528e-06, + "loss": 0.0045, + "step": 749710 + }, + { + "epoch": 1.94, + "learning_rate": 8.492642198553065e-06, + "loss": 0.0072, + "step": 749720 + }, + { + "epoch": 1.94, + "learning_rate": 8.4887539821816e-06, + "loss": 0.0059, + "step": 749730 + }, + { + "epoch": 1.94, + "learning_rate": 8.484865765810135e-06, + "loss": 0.0089, + "step": 749740 + }, + { + "epoch": 1.94, + "learning_rate": 8.480977549438671e-06, + "loss": 0.0087, + "step": 749750 + }, + { + "epoch": 1.94, + "learning_rate": 8.477089333067206e-06, + "loss": 0.0061, + "step": 749760 + }, + { + "epoch": 1.94, + "learning_rate": 8.473201116695741e-06, + "loss": 0.0059, + "step": 749770 + }, + { + "epoch": 1.94, + "learning_rate": 8.469312900324276e-06, + "loss": 0.0075, + "step": 749780 + }, + { + "epoch": 1.94, + "learning_rate": 8.465424683952812e-06, + "loss": 0.0069, + "step": 749790 + }, + { + "epoch": 1.94, + "learning_rate": 8.461536467581347e-06, + "loss": 0.0057, + "step": 749800 + }, + { + "epoch": 1.94, + "learning_rate": 8.457648251209882e-06, + "loss": 0.0059, + "step": 749810 + }, + { + "epoch": 1.94, + "learning_rate": 8.453760034838419e-06, + "loss": 0.0053, + "step": 749820 + }, + { + "epoch": 1.94, + "learning_rate": 8.449871818466953e-06, + "loss": 0.0057, + "step": 749830 + }, + { + "epoch": 1.94, + "learning_rate": 8.445983602095488e-06, + "loss": 0.005, + "step": 749840 + }, + { + "epoch": 1.94, + "learning_rate": 8.442095385724025e-06, + "loss": 0.0065, + "step": 749850 + }, + { + "epoch": 1.94, + "learning_rate": 8.43820716935256e-06, + "loss": 0.0057, + "step": 749860 + }, + { + "epoch": 1.94, + "learning_rate": 8.434318952981095e-06, + "loss": 0.0059, + "step": 749870 + }, + { + "epoch": 1.94, + "learning_rate": 8.430430736609631e-06, + "loss": 0.0058, + "step": 749880 + }, + { + "epoch": 1.94, + "learning_rate": 8.426542520238164e-06, + "loss": 0.0104, + "step": 749890 + }, + { + "epoch": 1.94, + "learning_rate": 8.4226543038667e-06, + "loss": 0.0083, + "step": 749900 + }, + { + "epoch": 1.94, + "learning_rate": 8.418766087495236e-06, + "loss": 0.0072, + "step": 749910 + }, + { + "epoch": 1.94, + "learning_rate": 8.41487787112377e-06, + "loss": 0.0095, + "step": 749920 + }, + { + "epoch": 1.94, + "learning_rate": 8.410989654752307e-06, + "loss": 0.0084, + "step": 749930 + }, + { + "epoch": 1.94, + "learning_rate": 8.407101438380842e-06, + "loss": 0.0065, + "step": 749940 + }, + { + "epoch": 1.94, + "learning_rate": 8.403213222009377e-06, + "loss": 0.0071, + "step": 749950 + }, + { + "epoch": 1.94, + "learning_rate": 8.399325005637913e-06, + "loss": 0.0101, + "step": 749960 + }, + { + "epoch": 1.94, + "learning_rate": 8.395436789266448e-06, + "loss": 0.0067, + "step": 749970 + }, + { + "epoch": 1.94, + "learning_rate": 8.391548572894983e-06, + "loss": 0.0079, + "step": 749980 + }, + { + "epoch": 1.94, + "learning_rate": 8.38766035652352e-06, + "loss": 0.0076, + "step": 749990 + }, + { + "epoch": 1.94, + "learning_rate": 8.383772140152055e-06, + "loss": 0.007, + "step": 750000 + }, + { + "epoch": 1.94, + "eval_cer": 0.8816662957628791, + "eval_loss": 0.00447363406419754, + "eval_runtime": 107.9666, + "eval_samples_per_second": 18.524, + "eval_steps_per_second": 4.631, + "step": 750000 + }, + { + "epoch": 1.94, + "learning_rate": 8.379883923780591e-06, + "loss": 0.0101, + "step": 750010 + }, + { + "epoch": 1.94, + "learning_rate": 8.375995707409124e-06, + "loss": 0.0045, + "step": 750020 + }, + { + "epoch": 1.94, + "learning_rate": 8.37210749103766e-06, + "loss": 0.0071, + "step": 750030 + }, + { + "epoch": 1.94, + "learning_rate": 8.368219274666196e-06, + "loss": 0.0054, + "step": 750040 + }, + { + "epoch": 1.94, + "learning_rate": 8.36433105829473e-06, + "loss": 0.0067, + "step": 750050 + }, + { + "epoch": 1.94, + "learning_rate": 8.360442841923267e-06, + "loss": 0.0062, + "step": 750060 + }, + { + "epoch": 1.94, + "learning_rate": 8.356554625551802e-06, + "loss": 0.006, + "step": 750070 + }, + { + "epoch": 1.94, + "learning_rate": 8.352666409180337e-06, + "loss": 0.0057, + "step": 750080 + }, + { + "epoch": 1.94, + "learning_rate": 8.348778192808873e-06, + "loss": 0.0066, + "step": 750090 + }, + { + "epoch": 1.94, + "learning_rate": 8.344889976437408e-06, + "loss": 0.0099, + "step": 750100 + }, + { + "epoch": 1.94, + "learning_rate": 8.341001760065943e-06, + "loss": 0.005, + "step": 750110 + }, + { + "epoch": 1.94, + "learning_rate": 8.33711354369448e-06, + "loss": 0.0069, + "step": 750120 + }, + { + "epoch": 1.94, + "learning_rate": 8.333225327323015e-06, + "loss": 0.0092, + "step": 750130 + }, + { + "epoch": 1.94, + "learning_rate": 8.32933711095155e-06, + "loss": 0.0087, + "step": 750140 + }, + { + "epoch": 1.94, + "learning_rate": 8.325448894580084e-06, + "loss": 0.0059, + "step": 750150 + }, + { + "epoch": 1.94, + "learning_rate": 8.32156067820862e-06, + "loss": 0.0065, + "step": 750160 + }, + { + "epoch": 1.94, + "learning_rate": 8.317672461837156e-06, + "loss": 0.0065, + "step": 750170 + }, + { + "epoch": 1.94, + "learning_rate": 8.31378424546569e-06, + "loss": 0.0081, + "step": 750180 + }, + { + "epoch": 1.94, + "learning_rate": 8.309896029094227e-06, + "loss": 0.0071, + "step": 750190 + }, + { + "epoch": 1.94, + "learning_rate": 8.306007812722762e-06, + "loss": 0.0085, + "step": 750200 + }, + { + "epoch": 1.94, + "learning_rate": 8.302119596351297e-06, + "loss": 0.0067, + "step": 750210 + }, + { + "epoch": 1.94, + "learning_rate": 8.298231379979833e-06, + "loss": 0.0057, + "step": 750220 + }, + { + "epoch": 1.94, + "learning_rate": 8.294343163608367e-06, + "loss": 0.0052, + "step": 750230 + }, + { + "epoch": 1.94, + "learning_rate": 8.290454947236903e-06, + "loss": 0.0074, + "step": 750240 + }, + { + "epoch": 1.94, + "learning_rate": 8.286566730865438e-06, + "loss": 0.0071, + "step": 750250 + }, + { + "epoch": 1.94, + "learning_rate": 8.282678514493973e-06, + "loss": 0.0091, + "step": 750260 + }, + { + "epoch": 1.94, + "learning_rate": 8.27879029812251e-06, + "loss": 0.0066, + "step": 750270 + }, + { + "epoch": 1.94, + "learning_rate": 8.274902081751044e-06, + "loss": 0.0066, + "step": 750280 + }, + { + "epoch": 1.94, + "learning_rate": 8.271013865379579e-06, + "loss": 0.0085, + "step": 750290 + }, + { + "epoch": 1.94, + "learning_rate": 8.267125649008116e-06, + "loss": 0.007, + "step": 750300 + }, + { + "epoch": 1.94, + "learning_rate": 8.26323743263665e-06, + "loss": 0.008, + "step": 750310 + }, + { + "epoch": 1.94, + "learning_rate": 8.259349216265187e-06, + "loss": 0.0059, + "step": 750320 + }, + { + "epoch": 1.94, + "learning_rate": 8.255460999893722e-06, + "loss": 0.0058, + "step": 750330 + }, + { + "epoch": 1.94, + "learning_rate": 8.251572783522257e-06, + "loss": 0.0072, + "step": 750340 + }, + { + "epoch": 1.95, + "learning_rate": 8.247684567150793e-06, + "loss": 0.009, + "step": 750350 + }, + { + "epoch": 1.95, + "learning_rate": 8.243796350779326e-06, + "loss": 0.0054, + "step": 750360 + }, + { + "epoch": 1.95, + "learning_rate": 8.239908134407863e-06, + "loss": 0.0061, + "step": 750370 + }, + { + "epoch": 1.95, + "learning_rate": 8.236019918036398e-06, + "loss": 0.0069, + "step": 750380 + }, + { + "epoch": 1.95, + "learning_rate": 8.232131701664933e-06, + "loss": 0.0075, + "step": 750390 + }, + { + "epoch": 1.95, + "learning_rate": 8.22824348529347e-06, + "loss": 0.0056, + "step": 750400 + }, + { + "epoch": 1.95, + "learning_rate": 8.224355268922004e-06, + "loss": 0.0049, + "step": 750410 + }, + { + "epoch": 1.95, + "learning_rate": 8.220467052550539e-06, + "loss": 0.0056, + "step": 750420 + }, + { + "epoch": 1.95, + "learning_rate": 8.216578836179076e-06, + "loss": 0.0091, + "step": 750430 + }, + { + "epoch": 1.95, + "learning_rate": 8.21269061980761e-06, + "loss": 0.0056, + "step": 750440 + }, + { + "epoch": 1.95, + "learning_rate": 8.208802403436145e-06, + "loss": 0.0121, + "step": 750450 + }, + { + "epoch": 1.95, + "learning_rate": 8.204914187064682e-06, + "loss": 0.0071, + "step": 750460 + }, + { + "epoch": 1.95, + "learning_rate": 8.201025970693217e-06, + "loss": 0.0073, + "step": 750470 + }, + { + "epoch": 1.95, + "learning_rate": 8.197137754321752e-06, + "loss": 0.0076, + "step": 750480 + }, + { + "epoch": 1.95, + "learning_rate": 8.193249537950286e-06, + "loss": 0.0071, + "step": 750490 + }, + { + "epoch": 1.95, + "learning_rate": 8.189361321578823e-06, + "loss": 0.0062, + "step": 750500 + }, + { + "epoch": 1.95, + "learning_rate": 8.185473105207358e-06, + "loss": 0.0089, + "step": 750510 + }, + { + "epoch": 1.95, + "learning_rate": 8.181584888835893e-06, + "loss": 0.0072, + "step": 750520 + }, + { + "epoch": 1.95, + "learning_rate": 8.17769667246443e-06, + "loss": 0.0072, + "step": 750530 + }, + { + "epoch": 1.95, + "learning_rate": 8.173808456092964e-06, + "loss": 0.009, + "step": 750540 + }, + { + "epoch": 1.95, + "learning_rate": 8.169920239721499e-06, + "loss": 0.0049, + "step": 750550 + }, + { + "epoch": 1.95, + "learning_rate": 8.166032023350036e-06, + "loss": 0.0058, + "step": 750560 + }, + { + "epoch": 1.95, + "learning_rate": 8.162143806978569e-06, + "loss": 0.006, + "step": 750570 + }, + { + "epoch": 1.95, + "learning_rate": 8.158255590607105e-06, + "loss": 0.0075, + "step": 750580 + }, + { + "epoch": 1.95, + "learning_rate": 8.15436737423564e-06, + "loss": 0.0083, + "step": 750590 + }, + { + "epoch": 1.95, + "learning_rate": 8.150479157864177e-06, + "loss": 0.008, + "step": 750600 + }, + { + "epoch": 1.95, + "learning_rate": 8.146590941492712e-06, + "loss": 0.0047, + "step": 750610 + }, + { + "epoch": 1.95, + "learning_rate": 8.142702725121246e-06, + "loss": 0.0054, + "step": 750620 + }, + { + "epoch": 1.95, + "learning_rate": 8.138814508749783e-06, + "loss": 0.0067, + "step": 750630 + }, + { + "epoch": 1.95, + "learning_rate": 8.134926292378318e-06, + "loss": 0.0077, + "step": 750640 + }, + { + "epoch": 1.95, + "learning_rate": 8.131038076006853e-06, + "loss": 0.0075, + "step": 750650 + }, + { + "epoch": 1.95, + "learning_rate": 8.12714985963539e-06, + "loss": 0.0057, + "step": 750660 + }, + { + "epoch": 1.95, + "learning_rate": 8.123261643263924e-06, + "loss": 0.0069, + "step": 750670 + }, + { + "epoch": 1.95, + "learning_rate": 8.119373426892459e-06, + "loss": 0.0083, + "step": 750680 + }, + { + "epoch": 1.95, + "learning_rate": 8.115485210520996e-06, + "loss": 0.0082, + "step": 750690 + }, + { + "epoch": 1.95, + "learning_rate": 8.111596994149529e-06, + "loss": 0.0072, + "step": 750700 + }, + { + "epoch": 1.95, + "learning_rate": 8.107708777778065e-06, + "loss": 0.0071, + "step": 750710 + }, + { + "epoch": 1.95, + "learning_rate": 8.1038205614066e-06, + "loss": 0.0082, + "step": 750720 + }, + { + "epoch": 1.95, + "learning_rate": 8.099932345035135e-06, + "loss": 0.0093, + "step": 750730 + }, + { + "epoch": 1.95, + "learning_rate": 8.096044128663672e-06, + "loss": 0.0076, + "step": 750740 + }, + { + "epoch": 1.95, + "learning_rate": 8.092155912292206e-06, + "loss": 0.0077, + "step": 750750 + }, + { + "epoch": 1.95, + "learning_rate": 8.088267695920741e-06, + "loss": 0.0053, + "step": 750760 + }, + { + "epoch": 1.95, + "learning_rate": 8.084379479549278e-06, + "loss": 0.0063, + "step": 750770 + }, + { + "epoch": 1.95, + "learning_rate": 8.080491263177813e-06, + "loss": 0.0092, + "step": 750780 + }, + { + "epoch": 1.95, + "learning_rate": 8.076603046806348e-06, + "loss": 0.0062, + "step": 750790 + }, + { + "epoch": 1.95, + "learning_rate": 8.072714830434884e-06, + "loss": 0.0076, + "step": 750800 + }, + { + "epoch": 1.95, + "learning_rate": 8.068826614063419e-06, + "loss": 0.0076, + "step": 750810 + }, + { + "epoch": 1.95, + "learning_rate": 8.064938397691954e-06, + "loss": 0.0114, + "step": 750820 + }, + { + "epoch": 1.95, + "learning_rate": 8.061050181320489e-06, + "loss": 0.0104, + "step": 750830 + }, + { + "epoch": 1.95, + "learning_rate": 8.057161964949025e-06, + "loss": 0.0061, + "step": 750840 + }, + { + "epoch": 1.95, + "learning_rate": 8.05327374857756e-06, + "loss": 0.0049, + "step": 750850 + }, + { + "epoch": 1.95, + "learning_rate": 8.049385532206095e-06, + "loss": 0.0059, + "step": 750860 + }, + { + "epoch": 1.95, + "learning_rate": 8.045497315834632e-06, + "loss": 0.0078, + "step": 750870 + }, + { + "epoch": 1.95, + "learning_rate": 8.041609099463166e-06, + "loss": 0.006, + "step": 750880 + }, + { + "epoch": 1.95, + "learning_rate": 8.037720883091701e-06, + "loss": 0.0062, + "step": 750890 + }, + { + "epoch": 1.95, + "learning_rate": 8.033832666720238e-06, + "loss": 0.0068, + "step": 750900 + }, + { + "epoch": 1.95, + "learning_rate": 8.029944450348773e-06, + "loss": 0.0063, + "step": 750910 + }, + { + "epoch": 1.95, + "learning_rate": 8.026056233977308e-06, + "loss": 0.0066, + "step": 750920 + }, + { + "epoch": 1.95, + "learning_rate": 8.022168017605842e-06, + "loss": 0.0058, + "step": 750930 + }, + { + "epoch": 1.95, + "learning_rate": 8.018279801234379e-06, + "loss": 0.0069, + "step": 750940 + }, + { + "epoch": 1.95, + "learning_rate": 8.014391584862914e-06, + "loss": 0.0078, + "step": 750950 + }, + { + "epoch": 1.95, + "learning_rate": 8.010503368491449e-06, + "loss": 0.0071, + "step": 750960 + }, + { + "epoch": 1.95, + "learning_rate": 8.006615152119985e-06, + "loss": 0.0068, + "step": 750970 + }, + { + "epoch": 1.95, + "learning_rate": 8.00272693574852e-06, + "loss": 0.0084, + "step": 750980 + }, + { + "epoch": 1.95, + "learning_rate": 7.998838719377055e-06, + "loss": 0.0057, + "step": 750990 + }, + { + "epoch": 1.95, + "learning_rate": 7.994950503005592e-06, + "loss": 0.0091, + "step": 751000 + }, + { + "epoch": 1.95, + "eval_cer": 0.8816690950367475, + "eval_loss": 0.004483851604163647, + "eval_runtime": 107.9182, + "eval_samples_per_second": 18.533, + "eval_steps_per_second": 4.633, + "step": 751000 + }, + { + "epoch": 1.95, + "learning_rate": 7.991062286634126e-06, + "loss": 0.0082, + "step": 751010 + }, + { + "epoch": 1.95, + "learning_rate": 7.987174070262661e-06, + "loss": 0.0057, + "step": 751020 + }, + { + "epoch": 1.95, + "learning_rate": 7.983285853891198e-06, + "loss": 0.0054, + "step": 751030 + }, + { + "epoch": 1.95, + "learning_rate": 7.979397637519731e-06, + "loss": 0.0099, + "step": 751040 + }, + { + "epoch": 1.95, + "learning_rate": 7.975509421148268e-06, + "loss": 0.0041, + "step": 751050 + }, + { + "epoch": 1.95, + "learning_rate": 7.971621204776802e-06, + "loss": 0.0077, + "step": 751060 + }, + { + "epoch": 1.95, + "learning_rate": 7.967732988405337e-06, + "loss": 0.0064, + "step": 751070 + }, + { + "epoch": 1.95, + "learning_rate": 7.963844772033874e-06, + "loss": 0.0066, + "step": 751080 + }, + { + "epoch": 1.95, + "learning_rate": 7.959956555662409e-06, + "loss": 0.0059, + "step": 751090 + }, + { + "epoch": 1.95, + "learning_rate": 7.956068339290944e-06, + "loss": 0.0077, + "step": 751100 + }, + { + "epoch": 1.95, + "learning_rate": 7.95218012291948e-06, + "loss": 0.0078, + "step": 751110 + }, + { + "epoch": 1.95, + "learning_rate": 7.948291906548015e-06, + "loss": 0.0058, + "step": 751120 + }, + { + "epoch": 1.95, + "learning_rate": 7.94440369017655e-06, + "loss": 0.0048, + "step": 751130 + }, + { + "epoch": 1.95, + "learning_rate": 7.940515473805086e-06, + "loss": 0.0074, + "step": 751140 + }, + { + "epoch": 1.95, + "learning_rate": 7.936627257433621e-06, + "loss": 0.0047, + "step": 751150 + }, + { + "epoch": 1.95, + "learning_rate": 7.932739041062156e-06, + "loss": 0.0095, + "step": 751160 + }, + { + "epoch": 1.95, + "learning_rate": 7.928850824690691e-06, + "loss": 0.0078, + "step": 751170 + }, + { + "epoch": 1.95, + "learning_rate": 7.924962608319227e-06, + "loss": 0.0065, + "step": 751180 + }, + { + "epoch": 1.95, + "learning_rate": 7.921074391947762e-06, + "loss": 0.0088, + "step": 751190 + }, + { + "epoch": 1.95, + "learning_rate": 7.917186175576297e-06, + "loss": 0.006, + "step": 751200 + }, + { + "epoch": 1.95, + "learning_rate": 7.913297959204834e-06, + "loss": 0.006, + "step": 751210 + }, + { + "epoch": 1.95, + "learning_rate": 7.909409742833369e-06, + "loss": 0.0078, + "step": 751220 + }, + { + "epoch": 1.95, + "learning_rate": 7.905521526461903e-06, + "loss": 0.0071, + "step": 751230 + }, + { + "epoch": 1.95, + "learning_rate": 7.90163331009044e-06, + "loss": 0.0059, + "step": 751240 + }, + { + "epoch": 1.95, + "learning_rate": 7.897745093718975e-06, + "loss": 0.0067, + "step": 751250 + }, + { + "epoch": 1.95, + "learning_rate": 7.89385687734751e-06, + "loss": 0.0064, + "step": 751260 + }, + { + "epoch": 1.95, + "learning_rate": 7.889968660976045e-06, + "loss": 0.0071, + "step": 751270 + }, + { + "epoch": 1.95, + "learning_rate": 7.886080444604581e-06, + "loss": 0.006, + "step": 751280 + }, + { + "epoch": 1.95, + "learning_rate": 7.882192228233116e-06, + "loss": 0.0067, + "step": 751290 + }, + { + "epoch": 1.95, + "learning_rate": 7.878304011861651e-06, + "loss": 0.0077, + "step": 751300 + }, + { + "epoch": 1.95, + "learning_rate": 7.874415795490187e-06, + "loss": 0.007, + "step": 751310 + }, + { + "epoch": 1.95, + "learning_rate": 7.870527579118722e-06, + "loss": 0.0088, + "step": 751320 + }, + { + "epoch": 1.95, + "learning_rate": 7.866639362747257e-06, + "loss": 0.0083, + "step": 751330 + }, + { + "epoch": 1.95, + "learning_rate": 7.862751146375794e-06, + "loss": 0.0055, + "step": 751340 + }, + { + "epoch": 1.95, + "learning_rate": 7.858862930004329e-06, + "loss": 0.0079, + "step": 751350 + }, + { + "epoch": 1.95, + "learning_rate": 7.854974713632863e-06, + "loss": 0.0066, + "step": 751360 + }, + { + "epoch": 1.95, + "learning_rate": 7.8510864972614e-06, + "loss": 0.0071, + "step": 751370 + }, + { + "epoch": 1.95, + "learning_rate": 7.847198280889933e-06, + "loss": 0.0124, + "step": 751380 + }, + { + "epoch": 1.95, + "learning_rate": 7.84331006451847e-06, + "loss": 0.0073, + "step": 751390 + }, + { + "epoch": 1.95, + "learning_rate": 7.839421848147005e-06, + "loss": 0.0071, + "step": 751400 + }, + { + "epoch": 1.95, + "learning_rate": 7.83553363177554e-06, + "loss": 0.0093, + "step": 751410 + }, + { + "epoch": 1.95, + "learning_rate": 7.831645415404076e-06, + "loss": 0.0068, + "step": 751420 + }, + { + "epoch": 1.95, + "learning_rate": 7.827757199032611e-06, + "loss": 0.007, + "step": 751430 + }, + { + "epoch": 1.95, + "learning_rate": 7.823868982661146e-06, + "loss": 0.0072, + "step": 751440 + }, + { + "epoch": 1.95, + "learning_rate": 7.819980766289682e-06, + "loss": 0.0055, + "step": 751450 + }, + { + "epoch": 1.95, + "learning_rate": 7.816092549918217e-06, + "loss": 0.0087, + "step": 751460 + }, + { + "epoch": 1.95, + "learning_rate": 7.812204333546752e-06, + "loss": 0.0057, + "step": 751470 + }, + { + "epoch": 1.95, + "learning_rate": 7.808316117175289e-06, + "loss": 0.0078, + "step": 751480 + }, + { + "epoch": 1.95, + "learning_rate": 7.804427900803823e-06, + "loss": 0.0055, + "step": 751490 + }, + { + "epoch": 1.95, + "learning_rate": 7.800539684432358e-06, + "loss": 0.0077, + "step": 751500 + }, + { + "epoch": 1.95, + "learning_rate": 7.796651468060893e-06, + "loss": 0.0121, + "step": 751510 + }, + { + "epoch": 1.95, + "learning_rate": 7.79276325168943e-06, + "loss": 0.0061, + "step": 751520 + }, + { + "epoch": 1.95, + "learning_rate": 7.788875035317965e-06, + "loss": 0.0086, + "step": 751530 + }, + { + "epoch": 1.95, + "learning_rate": 7.7849868189465e-06, + "loss": 0.008, + "step": 751540 + }, + { + "epoch": 1.95, + "learning_rate": 7.781098602575036e-06, + "loss": 0.0073, + "step": 751550 + }, + { + "epoch": 1.95, + "learning_rate": 7.777210386203571e-06, + "loss": 0.0067, + "step": 751560 + }, + { + "epoch": 1.95, + "learning_rate": 7.773322169832106e-06, + "loss": 0.0076, + "step": 751570 + }, + { + "epoch": 1.95, + "learning_rate": 7.769433953460642e-06, + "loss": 0.0076, + "step": 751580 + }, + { + "epoch": 1.95, + "learning_rate": 7.765545737089177e-06, + "loss": 0.0062, + "step": 751590 + }, + { + "epoch": 1.95, + "learning_rate": 7.761657520717712e-06, + "loss": 0.0078, + "step": 751600 + }, + { + "epoch": 1.95, + "learning_rate": 7.757769304346247e-06, + "loss": 0.0063, + "step": 751610 + }, + { + "epoch": 1.95, + "learning_rate": 7.753881087974783e-06, + "loss": 0.0061, + "step": 751620 + }, + { + "epoch": 1.95, + "learning_rate": 7.749992871603318e-06, + "loss": 0.007, + "step": 751630 + }, + { + "epoch": 1.95, + "learning_rate": 7.746104655231853e-06, + "loss": 0.0074, + "step": 751640 + }, + { + "epoch": 1.95, + "learning_rate": 7.74221643886039e-06, + "loss": 0.0062, + "step": 751650 + }, + { + "epoch": 1.95, + "learning_rate": 7.738328222488925e-06, + "loss": 0.0123, + "step": 751660 + }, + { + "epoch": 1.95, + "learning_rate": 7.73444000611746e-06, + "loss": 0.0071, + "step": 751670 + }, + { + "epoch": 1.95, + "learning_rate": 7.730551789745996e-06, + "loss": 0.0063, + "step": 751680 + }, + { + "epoch": 1.95, + "learning_rate": 7.72666357337453e-06, + "loss": 0.0074, + "step": 751690 + }, + { + "epoch": 1.95, + "learning_rate": 7.722775357003066e-06, + "loss": 0.0094, + "step": 751700 + }, + { + "epoch": 1.95, + "learning_rate": 7.718887140631602e-06, + "loss": 0.0078, + "step": 751710 + }, + { + "epoch": 1.95, + "learning_rate": 7.714998924260135e-06, + "loss": 0.0077, + "step": 751720 + }, + { + "epoch": 1.95, + "learning_rate": 7.711110707888672e-06, + "loss": 0.0061, + "step": 751730 + }, + { + "epoch": 1.95, + "learning_rate": 7.707222491517207e-06, + "loss": 0.0068, + "step": 751740 + }, + { + "epoch": 1.95, + "learning_rate": 7.703334275145742e-06, + "loss": 0.0064, + "step": 751750 + }, + { + "epoch": 1.95, + "learning_rate": 7.699446058774278e-06, + "loss": 0.0054, + "step": 751760 + }, + { + "epoch": 1.95, + "learning_rate": 7.695557842402813e-06, + "loss": 0.0053, + "step": 751770 + }, + { + "epoch": 1.95, + "learning_rate": 7.691669626031348e-06, + "loss": 0.012, + "step": 751780 + }, + { + "epoch": 1.95, + "learning_rate": 7.687781409659885e-06, + "loss": 0.0049, + "step": 751790 + }, + { + "epoch": 1.95, + "learning_rate": 7.68389319328842e-06, + "loss": 0.0082, + "step": 751800 + }, + { + "epoch": 1.95, + "learning_rate": 7.680004976916954e-06, + "loss": 0.0084, + "step": 751810 + }, + { + "epoch": 1.95, + "learning_rate": 7.67611676054549e-06, + "loss": 0.0054, + "step": 751820 + }, + { + "epoch": 1.95, + "learning_rate": 7.672228544174026e-06, + "loss": 0.0056, + "step": 751830 + }, + { + "epoch": 1.95, + "learning_rate": 7.668340327802562e-06, + "loss": 0.0105, + "step": 751840 + }, + { + "epoch": 1.95, + "learning_rate": 7.664452111431095e-06, + "loss": 0.0066, + "step": 751850 + }, + { + "epoch": 1.95, + "learning_rate": 7.660563895059632e-06, + "loss": 0.0074, + "step": 751860 + }, + { + "epoch": 1.95, + "learning_rate": 7.656675678688167e-06, + "loss": 0.0058, + "step": 751870 + }, + { + "epoch": 1.95, + "learning_rate": 7.652787462316702e-06, + "loss": 0.0076, + "step": 751880 + }, + { + "epoch": 1.95, + "learning_rate": 7.648899245945238e-06, + "loss": 0.0083, + "step": 751890 + }, + { + "epoch": 1.95, + "learning_rate": 7.645011029573773e-06, + "loss": 0.0064, + "step": 751900 + }, + { + "epoch": 1.95, + "learning_rate": 7.641122813202308e-06, + "loss": 0.0054, + "step": 751910 + }, + { + "epoch": 1.95, + "learning_rate": 7.637234596830844e-06, + "loss": 0.0085, + "step": 751920 + }, + { + "epoch": 1.95, + "learning_rate": 7.63334638045938e-06, + "loss": 0.007, + "step": 751930 + }, + { + "epoch": 1.95, + "learning_rate": 7.629458164087914e-06, + "loss": 0.0044, + "step": 751940 + }, + { + "epoch": 1.95, + "learning_rate": 7.62556994771645e-06, + "loss": 0.0089, + "step": 751950 + }, + { + "epoch": 1.95, + "learning_rate": 7.621681731344986e-06, + "loss": 0.0061, + "step": 751960 + }, + { + "epoch": 1.95, + "learning_rate": 7.6177935149735205e-06, + "loss": 0.0072, + "step": 751970 + }, + { + "epoch": 1.95, + "learning_rate": 7.613905298602056e-06, + "loss": 0.0086, + "step": 751980 + }, + { + "epoch": 1.95, + "learning_rate": 7.610017082230592e-06, + "loss": 0.007, + "step": 751990 + }, + { + "epoch": 1.95, + "learning_rate": 7.606128865859126e-06, + "loss": 0.0071, + "step": 752000 + }, + { + "epoch": 1.95, + "eval_cer": 0.8816676953998133, + "eval_loss": 0.004463730845600367, + "eval_runtime": 107.8824, + "eval_samples_per_second": 18.539, + "eval_steps_per_second": 4.635, + "step": 752000 + }, + { + "epoch": 1.95, + "learning_rate": 7.602240649487662e-06, + "loss": 0.0076, + "step": 752010 + }, + { + "epoch": 1.95, + "learning_rate": 7.598352433116197e-06, + "loss": 0.007, + "step": 752020 + }, + { + "epoch": 1.95, + "learning_rate": 7.594464216744732e-06, + "loss": 0.0065, + "step": 752030 + }, + { + "epoch": 1.95, + "learning_rate": 7.590576000373268e-06, + "loss": 0.0075, + "step": 752040 + }, + { + "epoch": 1.95, + "learning_rate": 7.586687784001804e-06, + "loss": 0.0036, + "step": 752050 + }, + { + "epoch": 1.95, + "learning_rate": 7.5827995676303385e-06, + "loss": 0.0057, + "step": 752060 + }, + { + "epoch": 1.95, + "learning_rate": 7.578911351258874e-06, + "loss": 0.0108, + "step": 752070 + }, + { + "epoch": 1.95, + "learning_rate": 7.57502313488741e-06, + "loss": 0.0082, + "step": 752080 + }, + { + "epoch": 1.95, + "learning_rate": 7.571134918515945e-06, + "loss": 0.0058, + "step": 752090 + }, + { + "epoch": 1.95, + "learning_rate": 7.5672467021444805e-06, + "loss": 0.0071, + "step": 752100 + }, + { + "epoch": 1.95, + "learning_rate": 7.563358485773016e-06, + "loss": 0.0056, + "step": 752110 + }, + { + "epoch": 1.95, + "learning_rate": 7.55947026940155e-06, + "loss": 0.0068, + "step": 752120 + }, + { + "epoch": 1.95, + "learning_rate": 7.555582053030086e-06, + "loss": 0.0071, + "step": 752130 + }, + { + "epoch": 1.95, + "learning_rate": 7.551693836658622e-06, + "loss": 0.0054, + "step": 752140 + }, + { + "epoch": 1.95, + "learning_rate": 7.547805620287157e-06, + "loss": 0.006, + "step": 752150 + }, + { + "epoch": 1.95, + "learning_rate": 7.543917403915692e-06, + "loss": 0.0061, + "step": 752160 + }, + { + "epoch": 1.95, + "learning_rate": 7.540029187544228e-06, + "loss": 0.0076, + "step": 752170 + }, + { + "epoch": 1.95, + "learning_rate": 7.536140971172764e-06, + "loss": 0.0083, + "step": 752180 + }, + { + "epoch": 1.95, + "learning_rate": 7.5322527548012985e-06, + "loss": 0.0053, + "step": 752190 + }, + { + "epoch": 1.95, + "learning_rate": 7.528364538429834e-06, + "loss": 0.0074, + "step": 752200 + }, + { + "epoch": 1.95, + "learning_rate": 7.52447632205837e-06, + "loss": 0.0083, + "step": 752210 + }, + { + "epoch": 1.95, + "learning_rate": 7.520588105686905e-06, + "loss": 0.0063, + "step": 752220 + }, + { + "epoch": 1.95, + "learning_rate": 7.51669988931544e-06, + "loss": 0.0061, + "step": 752230 + }, + { + "epoch": 1.95, + "learning_rate": 7.512811672943975e-06, + "loss": 0.0112, + "step": 752240 + }, + { + "epoch": 1.95, + "learning_rate": 7.50892345657251e-06, + "loss": 0.0058, + "step": 752250 + }, + { + "epoch": 1.95, + "learning_rate": 7.505035240201046e-06, + "loss": 0.0068, + "step": 752260 + }, + { + "epoch": 1.95, + "learning_rate": 7.501147023829582e-06, + "loss": 0.0068, + "step": 752270 + }, + { + "epoch": 1.95, + "learning_rate": 7.4972588074581165e-06, + "loss": 0.0081, + "step": 752280 + }, + { + "epoch": 1.95, + "learning_rate": 7.493370591086652e-06, + "loss": 0.0069, + "step": 752290 + }, + { + "epoch": 1.95, + "learning_rate": 7.489482374715188e-06, + "loss": 0.0091, + "step": 752300 + }, + { + "epoch": 1.95, + "learning_rate": 7.485594158343723e-06, + "loss": 0.0076, + "step": 752310 + }, + { + "epoch": 1.95, + "learning_rate": 7.4817059419722584e-06, + "loss": 0.0065, + "step": 752320 + }, + { + "epoch": 1.95, + "learning_rate": 7.477817725600794e-06, + "loss": 0.0088, + "step": 752330 + }, + { + "epoch": 1.95, + "learning_rate": 7.473929509229328e-06, + "loss": 0.0083, + "step": 752340 + }, + { + "epoch": 1.95, + "learning_rate": 7.470041292857864e-06, + "loss": 0.0074, + "step": 752350 + }, + { + "epoch": 1.95, + "learning_rate": 7.4661530764864e-06, + "loss": 0.007, + "step": 752360 + }, + { + "epoch": 1.95, + "learning_rate": 7.4622648601149344e-06, + "loss": 0.0072, + "step": 752370 + }, + { + "epoch": 1.95, + "learning_rate": 7.45837664374347e-06, + "loss": 0.0074, + "step": 752380 + }, + { + "epoch": 1.95, + "learning_rate": 7.454488427372006e-06, + "loss": 0.0055, + "step": 752390 + }, + { + "epoch": 1.95, + "learning_rate": 7.450600211000541e-06, + "loss": 0.0073, + "step": 752400 + }, + { + "epoch": 1.95, + "learning_rate": 7.4467119946290764e-06, + "loss": 0.0064, + "step": 752410 + }, + { + "epoch": 1.95, + "learning_rate": 7.442823778257612e-06, + "loss": 0.0071, + "step": 752420 + }, + { + "epoch": 1.95, + "learning_rate": 7.438935561886147e-06, + "loss": 0.0068, + "step": 752430 + }, + { + "epoch": 1.95, + "learning_rate": 7.435047345514683e-06, + "loss": 0.0061, + "step": 752440 + }, + { + "epoch": 1.95, + "learning_rate": 7.431159129143218e-06, + "loss": 0.0091, + "step": 752450 + }, + { + "epoch": 1.95, + "learning_rate": 7.427270912771754e-06, + "loss": 0.006, + "step": 752460 + }, + { + "epoch": 1.95, + "learning_rate": 7.423382696400288e-06, + "loss": 0.008, + "step": 752470 + }, + { + "epoch": 1.95, + "learning_rate": 7.419494480028824e-06, + "loss": 0.0091, + "step": 752480 + }, + { + "epoch": 1.95, + "learning_rate": 7.4156062636573596e-06, + "loss": 0.0075, + "step": 752490 + }, + { + "epoch": 1.95, + "learning_rate": 7.411718047285894e-06, + "loss": 0.0053, + "step": 752500 + }, + { + "epoch": 1.95, + "learning_rate": 7.40782983091443e-06, + "loss": 0.0066, + "step": 752510 + }, + { + "epoch": 1.95, + "learning_rate": 7.403941614542966e-06, + "loss": 0.0074, + "step": 752520 + }, + { + "epoch": 1.95, + "learning_rate": 7.400053398171501e-06, + "loss": 0.0073, + "step": 752530 + }, + { + "epoch": 1.95, + "learning_rate": 7.396165181800036e-06, + "loss": 0.0053, + "step": 752540 + }, + { + "epoch": 1.95, + "learning_rate": 7.392276965428572e-06, + "loss": 0.0087, + "step": 752550 + }, + { + "epoch": 1.95, + "learning_rate": 7.388388749057107e-06, + "loss": 0.0062, + "step": 752560 + }, + { + "epoch": 1.95, + "learning_rate": 7.384500532685643e-06, + "loss": 0.006, + "step": 752570 + }, + { + "epoch": 1.95, + "learning_rate": 7.3806123163141775e-06, + "loss": 0.0069, + "step": 752580 + }, + { + "epoch": 1.95, + "learning_rate": 7.376724099942712e-06, + "loss": 0.0051, + "step": 752590 + }, + { + "epoch": 1.95, + "learning_rate": 7.372835883571248e-06, + "loss": 0.007, + "step": 752600 + }, + { + "epoch": 1.95, + "learning_rate": 7.368947667199784e-06, + "loss": 0.0063, + "step": 752610 + }, + { + "epoch": 1.95, + "learning_rate": 7.365059450828319e-06, + "loss": 0.007, + "step": 752620 + }, + { + "epoch": 1.95, + "learning_rate": 7.361171234456854e-06, + "loss": 0.0049, + "step": 752630 + }, + { + "epoch": 1.95, + "learning_rate": 7.35728301808539e-06, + "loss": 0.0054, + "step": 752640 + }, + { + "epoch": 1.95, + "learning_rate": 7.353394801713925e-06, + "loss": 0.0075, + "step": 752650 + }, + { + "epoch": 1.95, + "learning_rate": 7.349506585342461e-06, + "loss": 0.0053, + "step": 752660 + }, + { + "epoch": 1.95, + "learning_rate": 7.345618368970996e-06, + "loss": 0.0074, + "step": 752670 + }, + { + "epoch": 1.95, + "learning_rate": 7.34173015259953e-06, + "loss": 0.0073, + "step": 752680 + }, + { + "epoch": 1.95, + "learning_rate": 7.337841936228066e-06, + "loss": 0.0097, + "step": 752690 + }, + { + "epoch": 1.95, + "learning_rate": 7.333953719856602e-06, + "loss": 0.006, + "step": 752700 + }, + { + "epoch": 1.95, + "learning_rate": 7.330065503485137e-06, + "loss": 0.0059, + "step": 752710 + }, + { + "epoch": 1.95, + "learning_rate": 7.326177287113672e-06, + "loss": 0.0075, + "step": 752720 + }, + { + "epoch": 1.95, + "learning_rate": 7.322289070742208e-06, + "loss": 0.0093, + "step": 752730 + }, + { + "epoch": 1.95, + "learning_rate": 7.318400854370744e-06, + "loss": 0.0073, + "step": 752740 + }, + { + "epoch": 1.95, + "learning_rate": 7.314512637999279e-06, + "loss": 0.0083, + "step": 752750 + }, + { + "epoch": 1.95, + "learning_rate": 7.310624421627814e-06, + "loss": 0.0089, + "step": 752760 + }, + { + "epoch": 1.95, + "learning_rate": 7.30673620525635e-06, + "loss": 0.0065, + "step": 752770 + }, + { + "epoch": 1.95, + "learning_rate": 7.302847988884885e-06, + "loss": 0.0063, + "step": 752780 + }, + { + "epoch": 1.95, + "learning_rate": 7.298959772513421e-06, + "loss": 0.0061, + "step": 752790 + }, + { + "epoch": 1.95, + "learning_rate": 7.295071556141956e-06, + "loss": 0.0093, + "step": 752800 + }, + { + "epoch": 1.95, + "learning_rate": 7.29118333977049e-06, + "loss": 0.0069, + "step": 752810 + }, + { + "epoch": 1.95, + "learning_rate": 7.287295123399026e-06, + "loss": 0.0093, + "step": 752820 + }, + { + "epoch": 1.95, + "learning_rate": 7.283406907027562e-06, + "loss": 0.0071, + "step": 752830 + }, + { + "epoch": 1.95, + "learning_rate": 7.279518690656097e-06, + "loss": 0.0049, + "step": 752840 + }, + { + "epoch": 1.95, + "learning_rate": 7.275630474284632e-06, + "loss": 0.0062, + "step": 752850 + }, + { + "epoch": 1.95, + "learning_rate": 7.271742257913168e-06, + "loss": 0.0067, + "step": 752860 + }, + { + "epoch": 1.95, + "learning_rate": 7.267854041541703e-06, + "loss": 0.009, + "step": 752870 + }, + { + "epoch": 1.95, + "learning_rate": 7.263965825170239e-06, + "loss": 0.006, + "step": 752880 + }, + { + "epoch": 1.95, + "learning_rate": 7.260077608798774e-06, + "loss": 0.0069, + "step": 752890 + }, + { + "epoch": 1.95, + "learning_rate": 7.256189392427309e-06, + "loss": 0.0075, + "step": 752900 + }, + { + "epoch": 1.95, + "learning_rate": 7.252301176055845e-06, + "loss": 0.0065, + "step": 752910 + }, + { + "epoch": 1.95, + "learning_rate": 7.24841295968438e-06, + "loss": 0.0055, + "step": 752920 + }, + { + "epoch": 1.95, + "learning_rate": 7.244524743312915e-06, + "loss": 0.0046, + "step": 752930 + }, + { + "epoch": 1.95, + "learning_rate": 7.24063652694145e-06, + "loss": 0.0054, + "step": 752940 + }, + { + "epoch": 1.95, + "learning_rate": 7.236748310569986e-06, + "loss": 0.0076, + "step": 752950 + }, + { + "epoch": 1.95, + "learning_rate": 7.232860094198521e-06, + "loss": 0.0065, + "step": 752960 + }, + { + "epoch": 1.95, + "learning_rate": 7.228971877827057e-06, + "loss": 0.0071, + "step": 752970 + }, + { + "epoch": 1.95, + "learning_rate": 7.225083661455592e-06, + "loss": 0.0084, + "step": 752980 + }, + { + "epoch": 1.95, + "learning_rate": 7.221195445084127e-06, + "loss": 0.0088, + "step": 752990 + }, + { + "epoch": 1.95, + "learning_rate": 7.217307228712663e-06, + "loss": 0.0054, + "step": 753000 + }, + { + "epoch": 1.95, + "eval_cer": 0.8816774928583525, + "eval_loss": 0.004489977844059467, + "eval_runtime": 107.9347, + "eval_samples_per_second": 18.53, + "eval_steps_per_second": 4.632, + "step": 753000 + }, + { + "epoch": 1.95, + "learning_rate": 7.213419012341199e-06, + "loss": 0.0053, + "step": 753010 + }, + { + "epoch": 1.95, + "learning_rate": 7.209530795969733e-06, + "loss": 0.0079, + "step": 753020 + }, + { + "epoch": 1.95, + "learning_rate": 7.205642579598268e-06, + "loss": 0.0054, + "step": 753030 + }, + { + "epoch": 1.95, + "learning_rate": 7.201754363226804e-06, + "loss": 0.0088, + "step": 753040 + }, + { + "epoch": 1.95, + "learning_rate": 7.19786614685534e-06, + "loss": 0.0062, + "step": 753050 + }, + { + "epoch": 1.95, + "learning_rate": 7.193977930483875e-06, + "loss": 0.0068, + "step": 753060 + }, + { + "epoch": 1.95, + "learning_rate": 7.19008971411241e-06, + "loss": 0.0074, + "step": 753070 + }, + { + "epoch": 1.95, + "learning_rate": 7.186201497740946e-06, + "loss": 0.0065, + "step": 753080 + }, + { + "epoch": 1.95, + "learning_rate": 7.182313281369481e-06, + "loss": 0.0079, + "step": 753090 + }, + { + "epoch": 1.95, + "learning_rate": 7.178425064998017e-06, + "loss": 0.0045, + "step": 753100 + }, + { + "epoch": 1.95, + "learning_rate": 7.174536848626552e-06, + "loss": 0.0067, + "step": 753110 + }, + { + "epoch": 1.95, + "learning_rate": 7.170648632255087e-06, + "loss": 0.0067, + "step": 753120 + }, + { + "epoch": 1.95, + "learning_rate": 7.166760415883623e-06, + "loss": 0.0082, + "step": 753130 + }, + { + "epoch": 1.95, + "learning_rate": 7.162872199512159e-06, + "loss": 0.0066, + "step": 753140 + }, + { + "epoch": 1.95, + "learning_rate": 7.158983983140693e-06, + "loss": 0.0075, + "step": 753150 + }, + { + "epoch": 1.95, + "learning_rate": 7.155095766769228e-06, + "loss": 0.008, + "step": 753160 + }, + { + "epoch": 1.95, + "learning_rate": 7.151207550397764e-06, + "loss": 0.0071, + "step": 753170 + }, + { + "epoch": 1.95, + "learning_rate": 7.147319334026299e-06, + "loss": 0.0064, + "step": 753180 + }, + { + "epoch": 1.95, + "learning_rate": 7.143431117654835e-06, + "loss": 0.0085, + "step": 753190 + }, + { + "epoch": 1.95, + "learning_rate": 7.13954290128337e-06, + "loss": 0.0074, + "step": 753200 + }, + { + "epoch": 1.95, + "learning_rate": 7.135654684911905e-06, + "loss": 0.0051, + "step": 753210 + }, + { + "epoch": 1.95, + "learning_rate": 7.131766468540441e-06, + "loss": 0.0054, + "step": 753220 + }, + { + "epoch": 1.95, + "learning_rate": 7.127878252168977e-06, + "loss": 0.0082, + "step": 753230 + }, + { + "epoch": 1.95, + "learning_rate": 7.1239900357975114e-06, + "loss": 0.0055, + "step": 753240 + }, + { + "epoch": 1.95, + "learning_rate": 7.120101819426047e-06, + "loss": 0.0068, + "step": 753250 + }, + { + "epoch": 1.95, + "learning_rate": 7.116213603054583e-06, + "loss": 0.0116, + "step": 753260 + }, + { + "epoch": 1.95, + "learning_rate": 7.112325386683117e-06, + "loss": 0.0062, + "step": 753270 + }, + { + "epoch": 1.95, + "learning_rate": 7.108437170311653e-06, + "loss": 0.0052, + "step": 753280 + }, + { + "epoch": 1.95, + "learning_rate": 7.104548953940188e-06, + "loss": 0.0076, + "step": 753290 + }, + { + "epoch": 1.95, + "learning_rate": 7.100660737568723e-06, + "loss": 0.0051, + "step": 753300 + }, + { + "epoch": 1.95, + "learning_rate": 7.096772521197259e-06, + "loss": 0.0055, + "step": 753310 + }, + { + "epoch": 1.95, + "learning_rate": 7.0928843048257946e-06, + "loss": 0.0086, + "step": 753320 + }, + { + "epoch": 1.95, + "learning_rate": 7.0889960884543294e-06, + "loss": 0.0091, + "step": 753330 + }, + { + "epoch": 1.95, + "learning_rate": 7.085107872082865e-06, + "loss": 0.0059, + "step": 753340 + }, + { + "epoch": 1.95, + "learning_rate": 7.081219655711401e-06, + "loss": 0.0067, + "step": 753350 + }, + { + "epoch": 1.95, + "learning_rate": 7.0773314393399366e-06, + "loss": 0.0081, + "step": 753360 + }, + { + "epoch": 1.95, + "learning_rate": 7.0734432229684706e-06, + "loss": 0.0058, + "step": 753370 + }, + { + "epoch": 1.95, + "learning_rate": 7.069555006597006e-06, + "loss": 0.0053, + "step": 753380 + }, + { + "epoch": 1.95, + "learning_rate": 7.065666790225542e-06, + "loss": 0.0068, + "step": 753390 + }, + { + "epoch": 1.95, + "learning_rate": 7.061778573854077e-06, + "loss": 0.0078, + "step": 753400 + }, + { + "epoch": 1.95, + "learning_rate": 7.0578903574826126e-06, + "loss": 0.009, + "step": 753410 + }, + { + "epoch": 1.95, + "learning_rate": 7.054002141111148e-06, + "loss": 0.0085, + "step": 753420 + }, + { + "epoch": 1.95, + "learning_rate": 7.050113924739683e-06, + "loss": 0.0064, + "step": 753430 + }, + { + "epoch": 1.95, + "learning_rate": 7.046225708368219e-06, + "loss": 0.0067, + "step": 753440 + }, + { + "epoch": 1.95, + "learning_rate": 7.0423374919967545e-06, + "loss": 0.006, + "step": 753450 + }, + { + "epoch": 1.95, + "learning_rate": 7.038449275625289e-06, + "loss": 0.0066, + "step": 753460 + }, + { + "epoch": 1.95, + "learning_rate": 7.034561059253825e-06, + "loss": 0.0063, + "step": 753470 + }, + { + "epoch": 1.95, + "learning_rate": 7.030672842882361e-06, + "loss": 0.0054, + "step": 753480 + }, + { + "epoch": 1.95, + "learning_rate": 7.026784626510895e-06, + "loss": 0.0055, + "step": 753490 + }, + { + "epoch": 1.95, + "learning_rate": 7.0228964101394305e-06, + "loss": 0.0068, + "step": 753500 + }, + { + "epoch": 1.95, + "learning_rate": 7.019008193767966e-06, + "loss": 0.0063, + "step": 753510 + }, + { + "epoch": 1.95, + "learning_rate": 7.015119977396501e-06, + "loss": 0.0049, + "step": 753520 + }, + { + "epoch": 1.95, + "learning_rate": 7.011231761025037e-06, + "loss": 0.0075, + "step": 753530 + }, + { + "epoch": 1.95, + "learning_rate": 7.0073435446535725e-06, + "loss": 0.0059, + "step": 753540 + }, + { + "epoch": 1.95, + "learning_rate": 7.003455328282107e-06, + "loss": 0.0059, + "step": 753550 + }, + { + "epoch": 1.95, + "learning_rate": 6.999567111910643e-06, + "loss": 0.0094, + "step": 753560 + }, + { + "epoch": 1.95, + "learning_rate": 6.995678895539179e-06, + "loss": 0.0075, + "step": 753570 + }, + { + "epoch": 1.95, + "learning_rate": 6.991790679167714e-06, + "loss": 0.0078, + "step": 753580 + }, + { + "epoch": 1.95, + "learning_rate": 6.987902462796249e-06, + "loss": 0.0086, + "step": 753590 + }, + { + "epoch": 1.95, + "learning_rate": 6.984014246424785e-06, + "loss": 0.0092, + "step": 753600 + }, + { + "epoch": 1.95, + "learning_rate": 6.980126030053319e-06, + "loss": 0.0094, + "step": 753610 + }, + { + "epoch": 1.95, + "learning_rate": 6.976237813681855e-06, + "loss": 0.0061, + "step": 753620 + }, + { + "epoch": 1.95, + "learning_rate": 6.9723495973103905e-06, + "loss": 0.008, + "step": 753630 + }, + { + "epoch": 1.95, + "learning_rate": 6.968461380938925e-06, + "loss": 0.0059, + "step": 753640 + }, + { + "epoch": 1.95, + "learning_rate": 6.964573164567461e-06, + "loss": 0.0061, + "step": 753650 + }, + { + "epoch": 1.95, + "learning_rate": 6.960684948195997e-06, + "loss": 0.0074, + "step": 753660 + }, + { + "epoch": 1.95, + "learning_rate": 6.9567967318245325e-06, + "loss": 0.0068, + "step": 753670 + }, + { + "epoch": 1.95, + "learning_rate": 6.952908515453067e-06, + "loss": 0.0068, + "step": 753680 + }, + { + "epoch": 1.95, + "learning_rate": 6.949020299081603e-06, + "loss": 0.0072, + "step": 753690 + }, + { + "epoch": 1.95, + "learning_rate": 6.945132082710139e-06, + "loss": 0.0061, + "step": 753700 + }, + { + "epoch": 1.95, + "learning_rate": 6.941243866338673e-06, + "loss": 0.0071, + "step": 753710 + }, + { + "epoch": 1.95, + "learning_rate": 6.9373556499672085e-06, + "loss": 0.0067, + "step": 753720 + }, + { + "epoch": 1.95, + "learning_rate": 6.933467433595744e-06, + "loss": 0.0085, + "step": 753730 + }, + { + "epoch": 1.95, + "learning_rate": 6.929579217224279e-06, + "loss": 0.0068, + "step": 753740 + }, + { + "epoch": 1.95, + "learning_rate": 6.925691000852815e-06, + "loss": 0.0054, + "step": 753750 + }, + { + "epoch": 1.95, + "learning_rate": 6.9218027844813505e-06, + "loss": 0.0065, + "step": 753760 + }, + { + "epoch": 1.95, + "learning_rate": 6.917914568109885e-06, + "loss": 0.006, + "step": 753770 + }, + { + "epoch": 1.95, + "learning_rate": 6.914026351738421e-06, + "loss": 0.0056, + "step": 753780 + }, + { + "epoch": 1.95, + "learning_rate": 6.910138135366957e-06, + "loss": 0.0067, + "step": 753790 + }, + { + "epoch": 1.95, + "learning_rate": 6.906249918995492e-06, + "loss": 0.0051, + "step": 753800 + }, + { + "epoch": 1.95, + "learning_rate": 6.902361702624027e-06, + "loss": 0.0085, + "step": 753810 + }, + { + "epoch": 1.95, + "learning_rate": 6.898473486252563e-06, + "loss": 0.007, + "step": 753820 + }, + { + "epoch": 1.95, + "learning_rate": 6.894585269881097e-06, + "loss": 0.0057, + "step": 753830 + }, + { + "epoch": 1.95, + "learning_rate": 6.890697053509633e-06, + "loss": 0.0077, + "step": 753840 + }, + { + "epoch": 1.95, + "learning_rate": 6.8868088371381685e-06, + "loss": 0.0075, + "step": 753850 + }, + { + "epoch": 1.95, + "learning_rate": 6.882920620766703e-06, + "loss": 0.0072, + "step": 753860 + }, + { + "epoch": 1.95, + "learning_rate": 6.879032404395239e-06, + "loss": 0.0074, + "step": 753870 + }, + { + "epoch": 1.95, + "learning_rate": 6.875144188023775e-06, + "loss": 0.008, + "step": 753880 + }, + { + "epoch": 1.95, + "learning_rate": 6.87125597165231e-06, + "loss": 0.0053, + "step": 753890 + }, + { + "epoch": 1.95, + "learning_rate": 6.867367755280845e-06, + "loss": 0.0098, + "step": 753900 + }, + { + "epoch": 1.95, + "learning_rate": 6.863479538909381e-06, + "loss": 0.005, + "step": 753910 + }, + { + "epoch": 1.95, + "learning_rate": 6.859591322537916e-06, + "loss": 0.0065, + "step": 753920 + }, + { + "epoch": 1.95, + "learning_rate": 6.855703106166452e-06, + "loss": 0.0057, + "step": 753930 + }, + { + "epoch": 1.95, + "learning_rate": 6.851814889794987e-06, + "loss": 0.0073, + "step": 753940 + }, + { + "epoch": 1.95, + "learning_rate": 6.847926673423521e-06, + "loss": 0.0064, + "step": 753950 + }, + { + "epoch": 1.95, + "learning_rate": 6.844038457052057e-06, + "loss": 0.0063, + "step": 753960 + }, + { + "epoch": 1.95, + "learning_rate": 6.840150240680593e-06, + "loss": 0.0076, + "step": 753970 + }, + { + "epoch": 1.95, + "learning_rate": 6.8362620243091285e-06, + "loss": 0.0071, + "step": 753980 + }, + { + "epoch": 1.95, + "learning_rate": 6.832373807937663e-06, + "loss": 0.0063, + "step": 753990 + }, + { + "epoch": 1.95, + "learning_rate": 6.828485591566199e-06, + "loss": 0.006, + "step": 754000 + }, + { + "epoch": 1.95, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.004459910560399294, + "eval_runtime": 107.9724, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, + "step": 754000 + }, + { + "epoch": 1.95, + "learning_rate": 6.824597375194735e-06, + "loss": 0.0062, + "step": 754010 + }, + { + "epoch": 1.95, + "learning_rate": 6.82070915882327e-06, + "loss": 0.0076, + "step": 754020 + }, + { + "epoch": 1.95, + "learning_rate": 6.816820942451805e-06, + "loss": 0.0079, + "step": 754030 + }, + { + "epoch": 1.95, + "learning_rate": 6.812932726080341e-06, + "loss": 0.008, + "step": 754040 + }, + { + "epoch": 1.95, + "learning_rate": 6.809044509708875e-06, + "loss": 0.008, + "step": 754050 + }, + { + "epoch": 1.95, + "learning_rate": 6.805156293337411e-06, + "loss": 0.0057, + "step": 754060 + }, + { + "epoch": 1.95, + "learning_rate": 6.8012680769659464e-06, + "loss": 0.008, + "step": 754070 + }, + { + "epoch": 1.95, + "learning_rate": 6.797379860594481e-06, + "loss": 0.0081, + "step": 754080 + }, + { + "epoch": 1.95, + "learning_rate": 6.793491644223017e-06, + "loss": 0.0065, + "step": 754090 + }, + { + "epoch": 1.95, + "learning_rate": 6.789603427851553e-06, + "loss": 0.0068, + "step": 754100 + }, + { + "epoch": 1.95, + "learning_rate": 6.785715211480088e-06, + "loss": 0.0056, + "step": 754110 + }, + { + "epoch": 1.95, + "learning_rate": 6.781826995108623e-06, + "loss": 0.0077, + "step": 754120 + }, + { + "epoch": 1.95, + "learning_rate": 6.777938778737159e-06, + "loss": 0.0097, + "step": 754130 + }, + { + "epoch": 1.95, + "learning_rate": 6.774050562365694e-06, + "loss": 0.0074, + "step": 754140 + }, + { + "epoch": 1.95, + "learning_rate": 6.77016234599423e-06, + "loss": 0.009, + "step": 754150 + }, + { + "epoch": 1.95, + "learning_rate": 6.766274129622765e-06, + "loss": 0.0075, + "step": 754160 + }, + { + "epoch": 1.95, + "learning_rate": 6.762385913251299e-06, + "loss": 0.0057, + "step": 754170 + }, + { + "epoch": 1.95, + "learning_rate": 6.758497696879835e-06, + "loss": 0.0061, + "step": 754180 + }, + { + "epoch": 1.95, + "learning_rate": 6.754609480508371e-06, + "loss": 0.0056, + "step": 754190 + }, + { + "epoch": 1.95, + "learning_rate": 6.750721264136906e-06, + "loss": 0.0059, + "step": 754200 + }, + { + "epoch": 1.96, + "learning_rate": 6.746833047765441e-06, + "loss": 0.0063, + "step": 754210 + }, + { + "epoch": 1.96, + "learning_rate": 6.742944831393977e-06, + "loss": 0.0093, + "step": 754220 + }, + { + "epoch": 1.96, + "learning_rate": 6.739056615022512e-06, + "loss": 0.0056, + "step": 754230 + }, + { + "epoch": 1.96, + "learning_rate": 6.7351683986510476e-06, + "loss": 0.0058, + "step": 754240 + }, + { + "epoch": 1.96, + "learning_rate": 6.731280182279583e-06, + "loss": 0.0087, + "step": 754250 + }, + { + "epoch": 1.96, + "learning_rate": 6.727391965908118e-06, + "loss": 0.0067, + "step": 754260 + }, + { + "epoch": 1.96, + "learning_rate": 6.723503749536654e-06, + "loss": 0.0076, + "step": 754270 + }, + { + "epoch": 1.96, + "learning_rate": 6.7196155331651896e-06, + "loss": 0.0066, + "step": 754280 + }, + { + "epoch": 1.96, + "learning_rate": 6.715727316793725e-06, + "loss": 0.0061, + "step": 754290 + }, + { + "epoch": 1.96, + "learning_rate": 6.711839100422259e-06, + "loss": 0.0092, + "step": 754300 + }, + { + "epoch": 1.96, + "learning_rate": 6.707950884050795e-06, + "loss": 0.0063, + "step": 754310 + }, + { + "epoch": 1.96, + "learning_rate": 6.704062667679331e-06, + "loss": 0.0086, + "step": 754320 + }, + { + "epoch": 1.96, + "learning_rate": 6.7001744513078656e-06, + "loss": 0.0081, + "step": 754330 + }, + { + "epoch": 1.96, + "learning_rate": 6.696286234936401e-06, + "loss": 0.0074, + "step": 754340 + }, + { + "epoch": 1.96, + "learning_rate": 6.692398018564937e-06, + "loss": 0.0065, + "step": 754350 + }, + { + "epoch": 1.96, + "learning_rate": 6.688509802193472e-06, + "loss": 0.0055, + "step": 754360 + }, + { + "epoch": 1.96, + "learning_rate": 6.6846215858220075e-06, + "loss": 0.0072, + "step": 754370 + }, + { + "epoch": 1.96, + "learning_rate": 6.680733369450543e-06, + "loss": 0.0068, + "step": 754380 + }, + { + "epoch": 1.96, + "learning_rate": 6.676845153079077e-06, + "loss": 0.0072, + "step": 754390 + }, + { + "epoch": 1.96, + "learning_rate": 6.672956936707613e-06, + "loss": 0.0098, + "step": 754400 + }, + { + "epoch": 1.96, + "learning_rate": 6.669068720336149e-06, + "loss": 0.0069, + "step": 754410 + }, + { + "epoch": 1.96, + "learning_rate": 6.6651805039646835e-06, + "loss": 0.0061, + "step": 754420 + }, + { + "epoch": 1.96, + "learning_rate": 6.661292287593219e-06, + "loss": 0.0081, + "step": 754430 + }, + { + "epoch": 1.96, + "learning_rate": 6.657404071221755e-06, + "loss": 0.0079, + "step": 754440 + }, + { + "epoch": 1.96, + "learning_rate": 6.65351585485029e-06, + "loss": 0.0085, + "step": 754450 + }, + { + "epoch": 1.96, + "learning_rate": 6.6496276384788255e-06, + "loss": 0.0065, + "step": 754460 + }, + { + "epoch": 1.96, + "learning_rate": 6.645739422107361e-06, + "loss": 0.0051, + "step": 754470 + }, + { + "epoch": 1.96, + "learning_rate": 6.641851205735896e-06, + "loss": 0.0057, + "step": 754480 + }, + { + "epoch": 1.96, + "learning_rate": 6.637962989364432e-06, + "loss": 0.0053, + "step": 754490 + }, + { + "epoch": 1.96, + "learning_rate": 6.6340747729929675e-06, + "loss": 0.0075, + "step": 754500 + }, + { + "epoch": 1.96, + "learning_rate": 6.6301865566215015e-06, + "loss": 0.0077, + "step": 754510 + }, + { + "epoch": 1.96, + "learning_rate": 6.626298340250037e-06, + "loss": 0.0082, + "step": 754520 + }, + { + "epoch": 1.96, + "learning_rate": 6.622410123878573e-06, + "loss": 0.0085, + "step": 754530 + }, + { + "epoch": 1.96, + "learning_rate": 6.618521907507108e-06, + "loss": 0.007, + "step": 754540 + }, + { + "epoch": 1.96, + "learning_rate": 6.6146336911356435e-06, + "loss": 0.004, + "step": 754550 + }, + { + "epoch": 1.96, + "learning_rate": 6.610745474764179e-06, + "loss": 0.0095, + "step": 754560 + }, + { + "epoch": 1.96, + "learning_rate": 6.606857258392714e-06, + "loss": 0.006, + "step": 754570 + }, + { + "epoch": 1.96, + "learning_rate": 6.60296904202125e-06, + "loss": 0.0074, + "step": 754580 + }, + { + "epoch": 1.96, + "learning_rate": 6.5990808256497855e-06, + "loss": 0.0064, + "step": 754590 + }, + { + "epoch": 1.96, + "learning_rate": 6.595192609278321e-06, + "loss": 0.0059, + "step": 754600 + }, + { + "epoch": 1.96, + "learning_rate": 6.591304392906856e-06, + "loss": 0.0063, + "step": 754610 + }, + { + "epoch": 1.96, + "learning_rate": 6.587416176535392e-06, + "loss": 0.0054, + "step": 754620 + }, + { + "epoch": 1.96, + "learning_rate": 6.5835279601639275e-06, + "loss": 0.0044, + "step": 754630 + }, + { + "epoch": 1.96, + "learning_rate": 6.5796397437924615e-06, + "loss": 0.0057, + "step": 754640 + }, + { + "epoch": 1.96, + "learning_rate": 6.575751527420997e-06, + "loss": 0.0082, + "step": 754650 + }, + { + "epoch": 1.96, + "learning_rate": 6.571863311049533e-06, + "loss": 0.0094, + "step": 754660 + }, + { + "epoch": 1.96, + "learning_rate": 6.567975094678068e-06, + "loss": 0.0101, + "step": 754670 + }, + { + "epoch": 1.96, + "learning_rate": 6.5640868783066035e-06, + "loss": 0.0061, + "step": 754680 + }, + { + "epoch": 1.96, + "learning_rate": 6.560198661935139e-06, + "loss": 0.0056, + "step": 754690 + }, + { + "epoch": 1.96, + "learning_rate": 6.556310445563674e-06, + "loss": 0.0065, + "step": 754700 + }, + { + "epoch": 1.96, + "learning_rate": 6.55242222919221e-06, + "loss": 0.0092, + "step": 754710 + }, + { + "epoch": 1.96, + "learning_rate": 6.5485340128207455e-06, + "loss": 0.0079, + "step": 754720 + }, + { + "epoch": 1.96, + "learning_rate": 6.5446457964492795e-06, + "loss": 0.0071, + "step": 754730 + }, + { + "epoch": 1.96, + "learning_rate": 6.540757580077815e-06, + "loss": 0.0047, + "step": 754740 + }, + { + "epoch": 1.96, + "learning_rate": 6.536869363706351e-06, + "loss": 0.0087, + "step": 754750 + }, + { + "epoch": 1.96, + "learning_rate": 6.532981147334886e-06, + "loss": 0.0066, + "step": 754760 + }, + { + "epoch": 1.96, + "learning_rate": 6.5290929309634215e-06, + "loss": 0.0067, + "step": 754770 + }, + { + "epoch": 1.96, + "learning_rate": 6.525204714591957e-06, + "loss": 0.0104, + "step": 754780 + }, + { + "epoch": 1.96, + "learning_rate": 6.521316498220492e-06, + "loss": 0.0079, + "step": 754790 + }, + { + "epoch": 1.96, + "learning_rate": 6.517428281849028e-06, + "loss": 0.0071, + "step": 754800 + }, + { + "epoch": 1.96, + "learning_rate": 6.5135400654775635e-06, + "loss": 0.0085, + "step": 754810 + }, + { + "epoch": 1.96, + "learning_rate": 6.509651849106098e-06, + "loss": 0.0083, + "step": 754820 + }, + { + "epoch": 1.96, + "learning_rate": 6.505763632734634e-06, + "loss": 0.0062, + "step": 754830 + }, + { + "epoch": 1.96, + "learning_rate": 6.50187541636317e-06, + "loss": 0.0058, + "step": 754840 + }, + { + "epoch": 1.96, + "learning_rate": 6.497987199991704e-06, + "loss": 0.0095, + "step": 754850 + }, + { + "epoch": 1.96, + "learning_rate": 6.4940989836202395e-06, + "loss": 0.0058, + "step": 754860 + }, + { + "epoch": 1.96, + "learning_rate": 6.490210767248775e-06, + "loss": 0.0082, + "step": 754870 + }, + { + "epoch": 1.96, + "learning_rate": 6.48632255087731e-06, + "loss": 0.0056, + "step": 754880 + }, + { + "epoch": 1.96, + "learning_rate": 6.482434334505846e-06, + "loss": 0.0094, + "step": 754890 + }, + { + "epoch": 1.96, + "learning_rate": 6.4785461181343815e-06, + "loss": 0.0099, + "step": 754900 + }, + { + "epoch": 1.96, + "learning_rate": 6.474657901762917e-06, + "loss": 0.0051, + "step": 754910 + }, + { + "epoch": 1.96, + "learning_rate": 6.470769685391452e-06, + "loss": 0.0076, + "step": 754920 + }, + { + "epoch": 1.96, + "learning_rate": 6.466881469019988e-06, + "loss": 0.0081, + "step": 754930 + }, + { + "epoch": 1.96, + "learning_rate": 6.4629932526485234e-06, + "loss": 0.0094, + "step": 754940 + }, + { + "epoch": 1.96, + "learning_rate": 6.459105036277058e-06, + "loss": 0.0071, + "step": 754950 + }, + { + "epoch": 1.96, + "learning_rate": 6.455216819905594e-06, + "loss": 0.0077, + "step": 754960 + }, + { + "epoch": 1.96, + "learning_rate": 6.45132860353413e-06, + "loss": 0.0062, + "step": 754970 + }, + { + "epoch": 1.96, + "learning_rate": 6.447440387162664e-06, + "loss": 0.0063, + "step": 754980 + }, + { + "epoch": 1.96, + "learning_rate": 6.4435521707911994e-06, + "loss": 0.0062, + "step": 754990 + }, + { + "epoch": 1.96, + "learning_rate": 6.439663954419735e-06, + "loss": 0.0078, + "step": 755000 + }, + { + "epoch": 1.96, + "eval_cer": 0.8816844910430235, + "eval_loss": 0.004422630183398724, + "eval_runtime": 107.997, + "eval_samples_per_second": 18.519, + "eval_steps_per_second": 4.63, + "step": 755000 + }, + { + "epoch": 1.96, + "learning_rate": 6.43577573804827e-06, + "loss": 0.0054, + "step": 755010 + }, + { + "epoch": 1.96, + "learning_rate": 6.431887521676806e-06, + "loss": 0.0058, + "step": 755020 + }, + { + "epoch": 1.96, + "learning_rate": 6.4279993053053414e-06, + "loss": 0.0085, + "step": 755030 + }, + { + "epoch": 1.96, + "learning_rate": 6.424111088933876e-06, + "loss": 0.0067, + "step": 755040 + }, + { + "epoch": 1.96, + "learning_rate": 6.420222872562412e-06, + "loss": 0.0135, + "step": 755050 + }, + { + "epoch": 1.96, + "learning_rate": 6.416334656190948e-06, + "loss": 0.0077, + "step": 755060 + }, + { + "epoch": 1.96, + "learning_rate": 6.412446439819482e-06, + "loss": 0.0065, + "step": 755070 + }, + { + "epoch": 1.96, + "learning_rate": 6.4085582234480174e-06, + "loss": 0.0071, + "step": 755080 + }, + { + "epoch": 1.96, + "learning_rate": 6.404670007076553e-06, + "loss": 0.0072, + "step": 755090 + }, + { + "epoch": 1.96, + "learning_rate": 6.400781790705088e-06, + "loss": 0.0056, + "step": 755100 + }, + { + "epoch": 1.96, + "learning_rate": 6.396893574333624e-06, + "loss": 0.0062, + "step": 755110 + }, + { + "epoch": 1.96, + "learning_rate": 6.3930053579621594e-06, + "loss": 0.0085, + "step": 755120 + }, + { + "epoch": 1.96, + "learning_rate": 6.389117141590694e-06, + "loss": 0.0079, + "step": 755130 + }, + { + "epoch": 1.96, + "learning_rate": 6.38522892521923e-06, + "loss": 0.0084, + "step": 755140 + }, + { + "epoch": 1.96, + "learning_rate": 6.381340708847766e-06, + "loss": 0.0051, + "step": 755150 + }, + { + "epoch": 1.96, + "learning_rate": 6.3774524924763006e-06, + "loss": 0.0068, + "step": 755160 + }, + { + "epoch": 1.96, + "learning_rate": 6.373564276104836e-06, + "loss": 0.007, + "step": 755170 + }, + { + "epoch": 1.96, + "learning_rate": 6.369676059733372e-06, + "loss": 0.0063, + "step": 755180 + }, + { + "epoch": 1.96, + "learning_rate": 6.365787843361908e-06, + "loss": 0.0078, + "step": 755190 + }, + { + "epoch": 1.96, + "learning_rate": 6.361899626990442e-06, + "loss": 0.008, + "step": 755200 + }, + { + "epoch": 1.96, + "learning_rate": 6.358011410618977e-06, + "loss": 0.0065, + "step": 755210 + }, + { + "epoch": 1.96, + "learning_rate": 6.354123194247513e-06, + "loss": 0.0084, + "step": 755220 + }, + { + "epoch": 1.96, + "learning_rate": 6.350234977876048e-06, + "loss": 0.0087, + "step": 755230 + }, + { + "epoch": 1.96, + "learning_rate": 6.346346761504584e-06, + "loss": 0.0092, + "step": 755240 + }, + { + "epoch": 1.96, + "learning_rate": 6.342458545133119e-06, + "loss": 0.0067, + "step": 755250 + }, + { + "epoch": 1.96, + "learning_rate": 6.338570328761654e-06, + "loss": 0.0062, + "step": 755260 + }, + { + "epoch": 1.96, + "learning_rate": 6.33468211239019e-06, + "loss": 0.0083, + "step": 755270 + }, + { + "epoch": 1.96, + "learning_rate": 6.330793896018726e-06, + "loss": 0.0062, + "step": 755280 + }, + { + "epoch": 1.96, + "learning_rate": 6.3269056796472605e-06, + "loss": 0.0059, + "step": 755290 + }, + { + "epoch": 1.96, + "learning_rate": 6.323017463275796e-06, + "loss": 0.0059, + "step": 755300 + }, + { + "epoch": 1.96, + "learning_rate": 6.319129246904332e-06, + "loss": 0.0055, + "step": 755310 + }, + { + "epoch": 1.96, + "learning_rate": 6.315241030532866e-06, + "loss": 0.0063, + "step": 755320 + }, + { + "epoch": 1.96, + "learning_rate": 6.311352814161402e-06, + "loss": 0.0054, + "step": 755330 + }, + { + "epoch": 1.96, + "learning_rate": 6.307464597789937e-06, + "loss": 0.006, + "step": 755340 + }, + { + "epoch": 1.96, + "learning_rate": 6.303576381418472e-06, + "loss": 0.0057, + "step": 755350 + }, + { + "epoch": 1.96, + "learning_rate": 6.299688165047008e-06, + "loss": 0.0105, + "step": 755360 + }, + { + "epoch": 1.96, + "learning_rate": 6.295799948675544e-06, + "loss": 0.0091, + "step": 755370 + }, + { + "epoch": 1.96, + "learning_rate": 6.2919117323040785e-06, + "loss": 0.0088, + "step": 755380 + }, + { + "epoch": 1.96, + "learning_rate": 6.288023515932614e-06, + "loss": 0.0072, + "step": 755390 + }, + { + "epoch": 1.96, + "learning_rate": 6.28413529956115e-06, + "loss": 0.0071, + "step": 755400 + }, + { + "epoch": 1.96, + "learning_rate": 6.280247083189684e-06, + "loss": 0.0065, + "step": 755410 + }, + { + "epoch": 1.96, + "learning_rate": 6.27635886681822e-06, + "loss": 0.0075, + "step": 755420 + }, + { + "epoch": 1.96, + "learning_rate": 6.272470650446755e-06, + "loss": 0.0036, + "step": 755430 + }, + { + "epoch": 1.96, + "learning_rate": 6.26858243407529e-06, + "loss": 0.0061, + "step": 755440 + }, + { + "epoch": 1.96, + "learning_rate": 6.264694217703826e-06, + "loss": 0.005, + "step": 755450 + }, + { + "epoch": 1.96, + "learning_rate": 6.260806001332362e-06, + "loss": 0.008, + "step": 755460 + }, + { + "epoch": 1.96, + "learning_rate": 6.2569177849608965e-06, + "loss": 0.0066, + "step": 755470 + }, + { + "epoch": 1.96, + "learning_rate": 6.253029568589432e-06, + "loss": 0.0064, + "step": 755480 + }, + { + "epoch": 1.96, + "learning_rate": 6.249141352217968e-06, + "loss": 0.0064, + "step": 755490 + }, + { + "epoch": 1.96, + "learning_rate": 6.245253135846504e-06, + "loss": 0.0071, + "step": 755500 + }, + { + "epoch": 1.96, + "learning_rate": 6.2413649194750385e-06, + "loss": 0.0072, + "step": 755510 + }, + { + "epoch": 1.96, + "learning_rate": 6.237476703103574e-06, + "loss": 0.0065, + "step": 755520 + }, + { + "epoch": 1.96, + "learning_rate": 6.23358848673211e-06, + "loss": 0.0065, + "step": 755530 + }, + { + "epoch": 1.96, + "learning_rate": 6.229700270360644e-06, + "loss": 0.0054, + "step": 755540 + }, + { + "epoch": 1.96, + "learning_rate": 6.22581205398918e-06, + "loss": 0.0073, + "step": 755550 + }, + { + "epoch": 1.96, + "learning_rate": 6.221923837617715e-06, + "loss": 0.0056, + "step": 755560 + }, + { + "epoch": 1.96, + "learning_rate": 6.21803562124625e-06, + "loss": 0.0082, + "step": 755570 + }, + { + "epoch": 1.96, + "learning_rate": 6.214147404874786e-06, + "loss": 0.0073, + "step": 755580 + }, + { + "epoch": 1.96, + "learning_rate": 6.210259188503322e-06, + "loss": 0.0059, + "step": 755590 + }, + { + "epoch": 1.96, + "learning_rate": 6.2063709721318565e-06, + "loss": 0.0064, + "step": 755600 + }, + { + "epoch": 1.96, + "learning_rate": 6.202482755760392e-06, + "loss": 0.0072, + "step": 755610 + }, + { + "epoch": 1.96, + "learning_rate": 6.198594539388928e-06, + "loss": 0.0047, + "step": 755620 + }, + { + "epoch": 1.96, + "learning_rate": 6.194706323017463e-06, + "loss": 0.008, + "step": 755630 + }, + { + "epoch": 1.96, + "learning_rate": 6.1908181066459985e-06, + "loss": 0.0072, + "step": 755640 + }, + { + "epoch": 1.96, + "learning_rate": 6.186929890274534e-06, + "loss": 0.0095, + "step": 755650 + }, + { + "epoch": 1.96, + "learning_rate": 6.183041673903068e-06, + "loss": 0.0085, + "step": 755660 + }, + { + "epoch": 1.96, + "learning_rate": 6.179153457531604e-06, + "loss": 0.0068, + "step": 755670 + }, + { + "epoch": 1.96, + "learning_rate": 6.17526524116014e-06, + "loss": 0.0082, + "step": 755680 + }, + { + "epoch": 1.96, + "learning_rate": 6.1713770247886745e-06, + "loss": 0.0069, + "step": 755690 + }, + { + "epoch": 1.96, + "learning_rate": 6.16748880841721e-06, + "loss": 0.0056, + "step": 755700 + }, + { + "epoch": 1.96, + "learning_rate": 6.163600592045746e-06, + "loss": 0.007, + "step": 755710 + }, + { + "epoch": 1.96, + "learning_rate": 6.159712375674281e-06, + "loss": 0.0061, + "step": 755720 + }, + { + "epoch": 1.96, + "learning_rate": 6.1558241593028165e-06, + "loss": 0.0056, + "step": 755730 + }, + { + "epoch": 1.96, + "learning_rate": 6.151935942931352e-06, + "loss": 0.0082, + "step": 755740 + }, + { + "epoch": 1.96, + "learning_rate": 6.148047726559886e-06, + "loss": 0.0097, + "step": 755750 + }, + { + "epoch": 1.96, + "learning_rate": 6.144159510188422e-06, + "loss": 0.0053, + "step": 755760 + }, + { + "epoch": 1.96, + "learning_rate": 6.140271293816958e-06, + "loss": 0.0062, + "step": 755770 + }, + { + "epoch": 1.96, + "learning_rate": 6.1363830774454925e-06, + "loss": 0.0054, + "step": 755780 + }, + { + "epoch": 1.96, + "learning_rate": 6.132494861074028e-06, + "loss": 0.0079, + "step": 755790 + }, + { + "epoch": 1.96, + "learning_rate": 6.128606644702564e-06, + "loss": 0.0065, + "step": 755800 + }, + { + "epoch": 1.96, + "learning_rate": 6.1247184283311e-06, + "loss": 0.0078, + "step": 755810 + }, + { + "epoch": 1.96, + "learning_rate": 6.1208302119596345e-06, + "loss": 0.0064, + "step": 755820 + }, + { + "epoch": 1.96, + "learning_rate": 6.11694199558817e-06, + "loss": 0.009, + "step": 755830 + }, + { + "epoch": 1.96, + "learning_rate": 6.113053779216706e-06, + "loss": 0.005, + "step": 755840 + }, + { + "epoch": 1.96, + "learning_rate": 6.109165562845241e-06, + "loss": 0.009, + "step": 755850 + }, + { + "epoch": 1.96, + "learning_rate": 6.1052773464737764e-06, + "loss": 0.0091, + "step": 755860 + }, + { + "epoch": 1.96, + "learning_rate": 6.101389130102312e-06, + "loss": 0.006, + "step": 755870 + }, + { + "epoch": 1.96, + "learning_rate": 6.097500913730846e-06, + "loss": 0.0078, + "step": 755880 + }, + { + "epoch": 1.96, + "learning_rate": 6.093612697359382e-06, + "loss": 0.0071, + "step": 755890 + }, + { + "epoch": 1.96, + "learning_rate": 6.089724480987918e-06, + "loss": 0.0097, + "step": 755900 + }, + { + "epoch": 1.96, + "learning_rate": 6.0858362646164524e-06, + "loss": 0.0069, + "step": 755910 + }, + { + "epoch": 1.96, + "learning_rate": 6.081948048244988e-06, + "loss": 0.0061, + "step": 755920 + }, + { + "epoch": 1.96, + "learning_rate": 6.078059831873524e-06, + "loss": 0.0092, + "step": 755930 + }, + { + "epoch": 1.96, + "learning_rate": 6.074171615502059e-06, + "loss": 0.0051, + "step": 755940 + }, + { + "epoch": 1.96, + "learning_rate": 6.0702833991305944e-06, + "loss": 0.0051, + "step": 755950 + }, + { + "epoch": 1.96, + "learning_rate": 6.06639518275913e-06, + "loss": 0.0075, + "step": 755960 + }, + { + "epoch": 1.96, + "learning_rate": 6.062506966387665e-06, + "loss": 0.0075, + "step": 755970 + }, + { + "epoch": 1.96, + "learning_rate": 6.058618750016201e-06, + "loss": 0.0083, + "step": 755980 + }, + { + "epoch": 1.96, + "learning_rate": 6.054730533644736e-06, + "loss": 0.0068, + "step": 755990 + }, + { + "epoch": 1.96, + "learning_rate": 6.0508423172732704e-06, + "loss": 0.0069, + "step": 756000 + }, + { + "epoch": 1.96, + "eval_cer": 0.8816816917691551, + "eval_loss": 0.0044304681941866875, + "eval_runtime": 107.8956, + "eval_samples_per_second": 18.536, + "eval_steps_per_second": 4.634, + "step": 756000 + }, + { + "epoch": 1.96, + "learning_rate": 6.046954100901806e-06, + "loss": 0.0073, + "step": 756010 + }, + { + "epoch": 1.96, + "learning_rate": 6.043065884530342e-06, + "loss": 0.0079, + "step": 756020 + }, + { + "epoch": 1.96, + "learning_rate": 6.039177668158877e-06, + "loss": 0.0056, + "step": 756030 + }, + { + "epoch": 1.96, + "learning_rate": 6.035289451787412e-06, + "loss": 0.0072, + "step": 756040 + }, + { + "epoch": 1.96, + "learning_rate": 6.031401235415948e-06, + "loss": 0.0086, + "step": 756050 + }, + { + "epoch": 1.96, + "learning_rate": 6.027513019044483e-06, + "loss": 0.0083, + "step": 756060 + }, + { + "epoch": 1.96, + "learning_rate": 6.023624802673019e-06, + "loss": 0.0082, + "step": 756070 + }, + { + "epoch": 1.96, + "learning_rate": 6.019736586301554e-06, + "loss": 0.0087, + "step": 756080 + }, + { + "epoch": 1.96, + "learning_rate": 6.0158483699300884e-06, + "loss": 0.005, + "step": 756090 + }, + { + "epoch": 1.96, + "learning_rate": 6.011960153558624e-06, + "loss": 0.0061, + "step": 756100 + }, + { + "epoch": 1.96, + "learning_rate": 6.00807193718716e-06, + "loss": 0.0051, + "step": 756110 + }, + { + "epoch": 1.96, + "learning_rate": 6.0041837208156956e-06, + "loss": 0.0056, + "step": 756120 + }, + { + "epoch": 1.96, + "learning_rate": 6.00029550444423e-06, + "loss": 0.0057, + "step": 756130 + }, + { + "epoch": 1.96, + "learning_rate": 5.996407288072766e-06, + "loss": 0.0071, + "step": 756140 + }, + { + "epoch": 1.96, + "learning_rate": 5.992519071701302e-06, + "loss": 0.0122, + "step": 756150 + }, + { + "epoch": 1.96, + "learning_rate": 5.988630855329837e-06, + "loss": 0.0069, + "step": 756160 + }, + { + "epoch": 1.96, + "learning_rate": 5.984742638958372e-06, + "loss": 0.0075, + "step": 756170 + }, + { + "epoch": 1.96, + "learning_rate": 5.980854422586908e-06, + "loss": 0.0071, + "step": 756180 + }, + { + "epoch": 1.96, + "learning_rate": 5.976966206215443e-06, + "loss": 0.0062, + "step": 756190 + }, + { + "epoch": 1.96, + "learning_rate": 5.973077989843979e-06, + "loss": 0.0057, + "step": 756200 + }, + { + "epoch": 1.96, + "learning_rate": 5.969189773472514e-06, + "loss": 0.0093, + "step": 756210 + }, + { + "epoch": 1.96, + "learning_rate": 5.965301557101048e-06, + "loss": 0.0072, + "step": 756220 + }, + { + "epoch": 1.96, + "learning_rate": 5.961413340729584e-06, + "loss": 0.0097, + "step": 756230 + }, + { + "epoch": 1.96, + "learning_rate": 5.95752512435812e-06, + "loss": 0.0069, + "step": 756240 + }, + { + "epoch": 1.96, + "learning_rate": 5.953636907986655e-06, + "loss": 0.0054, + "step": 756250 + }, + { + "epoch": 1.96, + "learning_rate": 5.94974869161519e-06, + "loss": 0.0041, + "step": 756260 + }, + { + "epoch": 1.96, + "learning_rate": 5.945860475243726e-06, + "loss": 0.0062, + "step": 756270 + }, + { + "epoch": 1.96, + "learning_rate": 5.941972258872261e-06, + "loss": 0.0067, + "step": 756280 + }, + { + "epoch": 1.96, + "learning_rate": 5.938084042500797e-06, + "loss": 0.008, + "step": 756290 + }, + { + "epoch": 1.96, + "learning_rate": 5.934195826129332e-06, + "loss": 0.0056, + "step": 756300 + }, + { + "epoch": 1.96, + "learning_rate": 5.930307609757867e-06, + "loss": 0.0058, + "step": 756310 + }, + { + "epoch": 1.96, + "learning_rate": 5.926419393386403e-06, + "loss": 0.0099, + "step": 756320 + }, + { + "epoch": 1.96, + "learning_rate": 5.922531177014939e-06, + "loss": 0.006, + "step": 756330 + }, + { + "epoch": 1.96, + "learning_rate": 5.918642960643473e-06, + "loss": 0.0071, + "step": 756340 + }, + { + "epoch": 1.96, + "learning_rate": 5.914754744272008e-06, + "loss": 0.0066, + "step": 756350 + }, + { + "epoch": 1.96, + "learning_rate": 5.910866527900544e-06, + "loss": 0.0059, + "step": 756360 + }, + { + "epoch": 1.96, + "learning_rate": 5.906978311529079e-06, + "loss": 0.0077, + "step": 756370 + }, + { + "epoch": 1.96, + "learning_rate": 5.903090095157615e-06, + "loss": 0.007, + "step": 756380 + }, + { + "epoch": 1.96, + "learning_rate": 5.89920187878615e-06, + "loss": 0.0081, + "step": 756390 + }, + { + "epoch": 1.96, + "learning_rate": 5.895313662414685e-06, + "loss": 0.0077, + "step": 756400 + }, + { + "epoch": 1.96, + "learning_rate": 5.891425446043221e-06, + "loss": 0.0068, + "step": 756410 + }, + { + "epoch": 1.96, + "learning_rate": 5.887537229671757e-06, + "loss": 0.0069, + "step": 756420 + }, + { + "epoch": 1.96, + "learning_rate": 5.883649013300292e-06, + "loss": 0.007, + "step": 756430 + }, + { + "epoch": 1.96, + "learning_rate": 5.879760796928826e-06, + "loss": 0.0067, + "step": 756440 + }, + { + "epoch": 1.96, + "learning_rate": 5.875872580557362e-06, + "loss": 0.005, + "step": 756450 + }, + { + "epoch": 1.96, + "learning_rate": 5.871984364185898e-06, + "loss": 0.0052, + "step": 756460 + }, + { + "epoch": 1.96, + "learning_rate": 5.868096147814433e-06, + "loss": 0.0071, + "step": 756470 + }, + { + "epoch": 1.96, + "learning_rate": 5.864207931442968e-06, + "loss": 0.0078, + "step": 756480 + }, + { + "epoch": 1.96, + "learning_rate": 5.860319715071504e-06, + "loss": 0.0078, + "step": 756490 + }, + { + "epoch": 1.96, + "learning_rate": 5.856431498700039e-06, + "loss": 0.0068, + "step": 756500 + }, + { + "epoch": 1.96, + "learning_rate": 5.852543282328575e-06, + "loss": 0.0056, + "step": 756510 + }, + { + "epoch": 1.96, + "learning_rate": 5.84865506595711e-06, + "loss": 0.005, + "step": 756520 + }, + { + "epoch": 1.96, + "learning_rate": 5.844766849585645e-06, + "loss": 0.0088, + "step": 756530 + }, + { + "epoch": 1.96, + "learning_rate": 5.840878633214181e-06, + "loss": 0.006, + "step": 756540 + }, + { + "epoch": 1.96, + "learning_rate": 5.836990416842717e-06, + "loss": 0.0081, + "step": 756550 + }, + { + "epoch": 1.96, + "learning_rate": 5.833102200471251e-06, + "loss": 0.0099, + "step": 756560 + }, + { + "epoch": 1.96, + "learning_rate": 5.829213984099786e-06, + "loss": 0.0084, + "step": 756570 + }, + { + "epoch": 1.96, + "learning_rate": 5.825325767728322e-06, + "loss": 0.0057, + "step": 756580 + }, + { + "epoch": 1.96, + "learning_rate": 5.821437551356857e-06, + "loss": 0.0056, + "step": 756590 + }, + { + "epoch": 1.96, + "learning_rate": 5.817549334985393e-06, + "loss": 0.008, + "step": 756600 + }, + { + "epoch": 1.96, + "learning_rate": 5.813661118613928e-06, + "loss": 0.0078, + "step": 756610 + }, + { + "epoch": 1.96, + "learning_rate": 5.809772902242463e-06, + "loss": 0.008, + "step": 756620 + }, + { + "epoch": 1.96, + "learning_rate": 5.805884685870999e-06, + "loss": 0.0071, + "step": 756630 + }, + { + "epoch": 1.96, + "learning_rate": 5.801996469499535e-06, + "loss": 0.0104, + "step": 756640 + }, + { + "epoch": 1.96, + "learning_rate": 5.7981082531280695e-06, + "loss": 0.0068, + "step": 756650 + }, + { + "epoch": 1.96, + "learning_rate": 5.794220036756605e-06, + "loss": 0.0051, + "step": 756660 + }, + { + "epoch": 1.96, + "learning_rate": 5.790331820385141e-06, + "loss": 0.0064, + "step": 756670 + }, + { + "epoch": 1.96, + "learning_rate": 5.786443604013675e-06, + "loss": 0.0067, + "step": 756680 + }, + { + "epoch": 1.96, + "learning_rate": 5.782555387642211e-06, + "loss": 0.0071, + "step": 756690 + }, + { + "epoch": 1.96, + "learning_rate": 5.778667171270746e-06, + "loss": 0.0057, + "step": 756700 + }, + { + "epoch": 1.96, + "learning_rate": 5.774778954899281e-06, + "loss": 0.009, + "step": 756710 + }, + { + "epoch": 1.96, + "learning_rate": 5.770890738527817e-06, + "loss": 0.0113, + "step": 756720 + }, + { + "epoch": 1.96, + "learning_rate": 5.767002522156353e-06, + "loss": 0.0093, + "step": 756730 + }, + { + "epoch": 1.96, + "learning_rate": 5.763114305784888e-06, + "loss": 0.0065, + "step": 756740 + }, + { + "epoch": 1.96, + "learning_rate": 5.759226089413423e-06, + "loss": 0.0061, + "step": 756750 + }, + { + "epoch": 1.96, + "learning_rate": 5.755337873041959e-06, + "loss": 0.0059, + "step": 756760 + }, + { + "epoch": 1.96, + "learning_rate": 5.751449656670495e-06, + "loss": 0.0078, + "step": 756770 + }, + { + "epoch": 1.96, + "learning_rate": 5.747561440299029e-06, + "loss": 0.0052, + "step": 756780 + }, + { + "epoch": 1.96, + "learning_rate": 5.743673223927564e-06, + "loss": 0.007, + "step": 756790 + }, + { + "epoch": 1.96, + "learning_rate": 5.7397850075561e-06, + "loss": 0.0074, + "step": 756800 + }, + { + "epoch": 1.96, + "learning_rate": 5.735896791184635e-06, + "loss": 0.0094, + "step": 756810 + }, + { + "epoch": 1.96, + "learning_rate": 5.732008574813171e-06, + "loss": 0.0057, + "step": 756820 + }, + { + "epoch": 1.96, + "learning_rate": 5.728120358441706e-06, + "loss": 0.0088, + "step": 756830 + }, + { + "epoch": 1.96, + "learning_rate": 5.724232142070241e-06, + "loss": 0.007, + "step": 756840 + }, + { + "epoch": 1.96, + "learning_rate": 5.720343925698777e-06, + "loss": 0.0072, + "step": 756850 + }, + { + "epoch": 1.96, + "learning_rate": 5.7164557093273126e-06, + "loss": 0.0055, + "step": 756860 + }, + { + "epoch": 1.96, + "learning_rate": 5.7125674929558474e-06, + "loss": 0.0086, + "step": 756870 + }, + { + "epoch": 1.96, + "learning_rate": 5.708679276584383e-06, + "loss": 0.0069, + "step": 756880 + }, + { + "epoch": 1.96, + "learning_rate": 5.704791060212919e-06, + "loss": 0.0079, + "step": 756890 + }, + { + "epoch": 1.96, + "learning_rate": 5.700902843841453e-06, + "loss": 0.0082, + "step": 756900 + }, + { + "epoch": 1.96, + "learning_rate": 5.6970146274699886e-06, + "loss": 0.0063, + "step": 756910 + }, + { + "epoch": 1.96, + "learning_rate": 5.693126411098524e-06, + "loss": 0.007, + "step": 756920 + }, + { + "epoch": 1.96, + "learning_rate": 5.689238194727059e-06, + "loss": 0.0069, + "step": 756930 + }, + { + "epoch": 1.96, + "learning_rate": 5.685349978355595e-06, + "loss": 0.0062, + "step": 756940 + }, + { + "epoch": 1.96, + "learning_rate": 5.6814617619841306e-06, + "loss": 0.0052, + "step": 756950 + }, + { + "epoch": 1.96, + "learning_rate": 5.677573545612665e-06, + "loss": 0.0073, + "step": 756960 + }, + { + "epoch": 1.96, + "learning_rate": 5.673685329241201e-06, + "loss": 0.0082, + "step": 756970 + }, + { + "epoch": 1.96, + "learning_rate": 5.669797112869737e-06, + "loss": 0.0057, + "step": 756980 + }, + { + "epoch": 1.96, + "learning_rate": 5.665908896498272e-06, + "loss": 0.0066, + "step": 756990 + }, + { + "epoch": 1.96, + "learning_rate": 5.662020680126807e-06, + "loss": 0.0082, + "step": 757000 + }, + { + "epoch": 1.96, + "eval_cer": 0.8816760932214184, + "eval_loss": 0.004407000262290239, + "eval_runtime": 107.9473, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 757000 + }, + { + "epoch": 1.96, + "learning_rate": 5.658132463755343e-06, + "loss": 0.0073, + "step": 757010 + }, + { + "epoch": 1.96, + "learning_rate": 5.654244247383877e-06, + "loss": 0.0082, + "step": 757020 + }, + { + "epoch": 1.96, + "learning_rate": 5.650356031012413e-06, + "loss": 0.0049, + "step": 757030 + }, + { + "epoch": 1.96, + "learning_rate": 5.6464678146409485e-06, + "loss": 0.007, + "step": 757040 + }, + { + "epoch": 1.96, + "learning_rate": 5.642579598269484e-06, + "loss": 0.0073, + "step": 757050 + }, + { + "epoch": 1.96, + "learning_rate": 5.638691381898019e-06, + "loss": 0.0067, + "step": 757060 + }, + { + "epoch": 1.96, + "learning_rate": 5.634803165526555e-06, + "loss": 0.0075, + "step": 757070 + }, + { + "epoch": 1.96, + "learning_rate": 5.6309149491550905e-06, + "loss": 0.0078, + "step": 757080 + }, + { + "epoch": 1.96, + "learning_rate": 5.627026732783625e-06, + "loss": 0.0083, + "step": 757090 + }, + { + "epoch": 1.96, + "learning_rate": 5.623138516412161e-06, + "loss": 0.0063, + "step": 757100 + }, + { + "epoch": 1.96, + "learning_rate": 5.619250300040697e-06, + "loss": 0.0083, + "step": 757110 + }, + { + "epoch": 1.96, + "learning_rate": 5.615362083669231e-06, + "loss": 0.0077, + "step": 757120 + }, + { + "epoch": 1.96, + "learning_rate": 5.6114738672977665e-06, + "loss": 0.0086, + "step": 757130 + }, + { + "epoch": 1.96, + "learning_rate": 5.607585650926302e-06, + "loss": 0.0058, + "step": 757140 + }, + { + "epoch": 1.96, + "learning_rate": 5.603697434554837e-06, + "loss": 0.0081, + "step": 757150 + }, + { + "epoch": 1.96, + "learning_rate": 5.599809218183373e-06, + "loss": 0.0107, + "step": 757160 + }, + { + "epoch": 1.96, + "learning_rate": 5.5959210018119085e-06, + "loss": 0.0085, + "step": 757170 + }, + { + "epoch": 1.96, + "learning_rate": 5.592032785440443e-06, + "loss": 0.0056, + "step": 757180 + }, + { + "epoch": 1.96, + "learning_rate": 5.588144569068979e-06, + "loss": 0.0084, + "step": 757190 + }, + { + "epoch": 1.96, + "learning_rate": 5.584256352697515e-06, + "loss": 0.0063, + "step": 757200 + }, + { + "epoch": 1.96, + "learning_rate": 5.58036813632605e-06, + "loss": 0.008, + "step": 757210 + }, + { + "epoch": 1.96, + "learning_rate": 5.576479919954585e-06, + "loss": 0.0051, + "step": 757220 + }, + { + "epoch": 1.96, + "learning_rate": 5.572591703583121e-06, + "loss": 0.0059, + "step": 757230 + }, + { + "epoch": 1.96, + "learning_rate": 5.568703487211655e-06, + "loss": 0.0052, + "step": 757240 + }, + { + "epoch": 1.96, + "learning_rate": 5.564815270840191e-06, + "loss": 0.0106, + "step": 757250 + }, + { + "epoch": 1.96, + "learning_rate": 5.5609270544687265e-06, + "loss": 0.0087, + "step": 757260 + }, + { + "epoch": 1.96, + "learning_rate": 5.557038838097261e-06, + "loss": 0.006, + "step": 757270 + }, + { + "epoch": 1.96, + "learning_rate": 5.553150621725797e-06, + "loss": 0.0062, + "step": 757280 + }, + { + "epoch": 1.96, + "learning_rate": 5.549262405354333e-06, + "loss": 0.0055, + "step": 757290 + }, + { + "epoch": 1.96, + "learning_rate": 5.545374188982868e-06, + "loss": 0.0075, + "step": 757300 + }, + { + "epoch": 1.96, + "learning_rate": 5.541485972611403e-06, + "loss": 0.0055, + "step": 757310 + }, + { + "epoch": 1.96, + "learning_rate": 5.537597756239939e-06, + "loss": 0.0119, + "step": 757320 + }, + { + "epoch": 1.96, + "learning_rate": 5.533709539868474e-06, + "loss": 0.0042, + "step": 757330 + }, + { + "epoch": 1.96, + "learning_rate": 5.52982132349701e-06, + "loss": 0.0053, + "step": 757340 + }, + { + "epoch": 1.96, + "learning_rate": 5.525933107125545e-06, + "loss": 0.0065, + "step": 757350 + }, + { + "epoch": 1.96, + "learning_rate": 5.522044890754081e-06, + "loss": 0.0092, + "step": 757360 + }, + { + "epoch": 1.96, + "learning_rate": 5.518156674382615e-06, + "loss": 0.0082, + "step": 757370 + }, + { + "epoch": 1.96, + "learning_rate": 5.514268458011151e-06, + "loss": 0.0089, + "step": 757380 + }, + { + "epoch": 1.96, + "learning_rate": 5.5103802416396865e-06, + "loss": 0.0066, + "step": 757390 + }, + { + "epoch": 1.96, + "learning_rate": 5.506492025268221e-06, + "loss": 0.0072, + "step": 757400 + }, + { + "epoch": 1.96, + "learning_rate": 5.502603808896757e-06, + "loss": 0.011, + "step": 757410 + }, + { + "epoch": 1.96, + "learning_rate": 5.498715592525293e-06, + "loss": 0.0061, + "step": 757420 + }, + { + "epoch": 1.96, + "learning_rate": 5.494827376153828e-06, + "loss": 0.0093, + "step": 757430 + }, + { + "epoch": 1.96, + "learning_rate": 5.490939159782363e-06, + "loss": 0.008, + "step": 757440 + }, + { + "epoch": 1.96, + "learning_rate": 5.487050943410899e-06, + "loss": 0.0062, + "step": 757450 + }, + { + "epoch": 1.96, + "learning_rate": 5.483162727039434e-06, + "loss": 0.0064, + "step": 757460 + }, + { + "epoch": 1.96, + "learning_rate": 5.479274510667969e-06, + "loss": 0.0061, + "step": 757470 + }, + { + "epoch": 1.96, + "learning_rate": 5.4753862942965045e-06, + "loss": 0.0057, + "step": 757480 + }, + { + "epoch": 1.96, + "learning_rate": 5.471498077925039e-06, + "loss": 0.0066, + "step": 757490 + }, + { + "epoch": 1.96, + "learning_rate": 5.467609861553575e-06, + "loss": 0.0073, + "step": 757500 + }, + { + "epoch": 1.96, + "learning_rate": 5.463721645182111e-06, + "loss": 0.0083, + "step": 757510 + }, + { + "epoch": 1.96, + "learning_rate": 5.459833428810646e-06, + "loss": 0.0101, + "step": 757520 + }, + { + "epoch": 1.96, + "learning_rate": 5.455945212439181e-06, + "loss": 0.0071, + "step": 757530 + }, + { + "epoch": 1.96, + "learning_rate": 5.452056996067717e-06, + "loss": 0.0057, + "step": 757540 + }, + { + "epoch": 1.96, + "learning_rate": 5.448168779696252e-06, + "loss": 0.0063, + "step": 757550 + }, + { + "epoch": 1.96, + "learning_rate": 5.444280563324788e-06, + "loss": 0.0066, + "step": 757560 + }, + { + "epoch": 1.96, + "learning_rate": 5.440392346953323e-06, + "loss": 0.0088, + "step": 757570 + }, + { + "epoch": 1.96, + "learning_rate": 5.436504130581857e-06, + "loss": 0.0082, + "step": 757580 + }, + { + "epoch": 1.96, + "learning_rate": 5.432615914210393e-06, + "loss": 0.0072, + "step": 757590 + }, + { + "epoch": 1.96, + "learning_rate": 5.428727697838929e-06, + "loss": 0.0094, + "step": 757600 + }, + { + "epoch": 1.96, + "learning_rate": 5.424839481467464e-06, + "loss": 0.0094, + "step": 757610 + }, + { + "epoch": 1.96, + "learning_rate": 5.420951265095999e-06, + "loss": 0.0076, + "step": 757620 + }, + { + "epoch": 1.96, + "learning_rate": 5.417063048724535e-06, + "loss": 0.0073, + "step": 757630 + }, + { + "epoch": 1.96, + "learning_rate": 5.413174832353071e-06, + "loss": 0.0058, + "step": 757640 + }, + { + "epoch": 1.96, + "learning_rate": 5.409286615981606e-06, + "loss": 0.007, + "step": 757650 + }, + { + "epoch": 1.96, + "learning_rate": 5.405398399610141e-06, + "loss": 0.0109, + "step": 757660 + }, + { + "epoch": 1.96, + "learning_rate": 5.401510183238677e-06, + "loss": 0.0061, + "step": 757670 + }, + { + "epoch": 1.96, + "learning_rate": 5.397621966867212e-06, + "loss": 0.0084, + "step": 757680 + }, + { + "epoch": 1.96, + "learning_rate": 5.393733750495748e-06, + "loss": 0.0082, + "step": 757690 + }, + { + "epoch": 1.96, + "learning_rate": 5.389845534124283e-06, + "loss": 0.0064, + "step": 757700 + }, + { + "epoch": 1.96, + "learning_rate": 5.385957317752817e-06, + "loss": 0.0054, + "step": 757710 + }, + { + "epoch": 1.96, + "learning_rate": 5.382069101381353e-06, + "loss": 0.007, + "step": 757720 + }, + { + "epoch": 1.96, + "learning_rate": 5.378180885009889e-06, + "loss": 0.0065, + "step": 757730 + }, + { + "epoch": 1.96, + "learning_rate": 5.374292668638424e-06, + "loss": 0.0087, + "step": 757740 + }, + { + "epoch": 1.96, + "learning_rate": 5.370404452266959e-06, + "loss": 0.0079, + "step": 757750 + }, + { + "epoch": 1.96, + "learning_rate": 5.366516235895495e-06, + "loss": 0.005, + "step": 757760 + }, + { + "epoch": 1.96, + "learning_rate": 5.36262801952403e-06, + "loss": 0.0088, + "step": 757770 + }, + { + "epoch": 1.96, + "learning_rate": 5.3587398031525656e-06, + "loss": 0.0075, + "step": 757780 + }, + { + "epoch": 1.96, + "learning_rate": 5.354851586781101e-06, + "loss": 0.0065, + "step": 757790 + }, + { + "epoch": 1.96, + "learning_rate": 5.350963370409636e-06, + "loss": 0.0072, + "step": 757800 + }, + { + "epoch": 1.96, + "learning_rate": 5.347075154038171e-06, + "loss": 0.0059, + "step": 757810 + }, + { + "epoch": 1.96, + "learning_rate": 5.343186937666707e-06, + "loss": 0.0106, + "step": 757820 + }, + { + "epoch": 1.96, + "learning_rate": 5.3392987212952416e-06, + "loss": 0.0072, + "step": 757830 + }, + { + "epoch": 1.96, + "learning_rate": 5.335410504923777e-06, + "loss": 0.0091, + "step": 757840 + }, + { + "epoch": 1.96, + "learning_rate": 5.331522288552313e-06, + "loss": 0.0061, + "step": 757850 + }, + { + "epoch": 1.96, + "learning_rate": 5.327634072180848e-06, + "loss": 0.0056, + "step": 757860 + }, + { + "epoch": 1.96, + "learning_rate": 5.3237458558093836e-06, + "loss": 0.0077, + "step": 757870 + }, + { + "epoch": 1.96, + "learning_rate": 5.319857639437919e-06, + "loss": 0.0092, + "step": 757880 + }, + { + "epoch": 1.96, + "learning_rate": 5.315969423066454e-06, + "loss": 0.0091, + "step": 757890 + }, + { + "epoch": 1.96, + "learning_rate": 5.31208120669499e-06, + "loss": 0.0079, + "step": 757900 + }, + { + "epoch": 1.96, + "learning_rate": 5.3081929903235255e-06, + "loss": 0.0068, + "step": 757910 + }, + { + "epoch": 1.96, + "learning_rate": 5.3043047739520596e-06, + "loss": 0.0062, + "step": 757920 + }, + { + "epoch": 1.96, + "learning_rate": 5.300416557580595e-06, + "loss": 0.0064, + "step": 757930 + }, + { + "epoch": 1.96, + "learning_rate": 5.296528341209131e-06, + "loss": 0.0074, + "step": 757940 + }, + { + "epoch": 1.96, + "learning_rate": 5.292640124837667e-06, + "loss": 0.0073, + "step": 757950 + }, + { + "epoch": 1.96, + "learning_rate": 5.2887519084662015e-06, + "loss": 0.0065, + "step": 757960 + }, + { + "epoch": 1.96, + "learning_rate": 5.284863692094737e-06, + "loss": 0.0074, + "step": 757970 + }, + { + "epoch": 1.96, + "learning_rate": 5.280975475723273e-06, + "loss": 0.0113, + "step": 757980 + }, + { + "epoch": 1.96, + "learning_rate": 5.277087259351808e-06, + "loss": 0.0063, + "step": 757990 + }, + { + "epoch": 1.96, + "learning_rate": 5.2731990429803435e-06, + "loss": 0.0063, + "step": 758000 + }, + { + "epoch": 1.96, + "eval_cer": 0.8816634964890108, + "eval_loss": 0.0044049047864973545, + "eval_runtime": 108.0473, + "eval_samples_per_second": 18.51, + "eval_steps_per_second": 4.628, + "step": 758000 + }, + { + "epoch": 1.96, + "learning_rate": 5.269310826608879e-06, + "loss": 0.0068, + "step": 758010 + }, + { + "epoch": 1.96, + "learning_rate": 5.265422610237414e-06, + "loss": 0.0066, + "step": 758020 + }, + { + "epoch": 1.96, + "learning_rate": 5.26153439386595e-06, + "loss": 0.0089, + "step": 758030 + }, + { + "epoch": 1.96, + "learning_rate": 5.2576461774944855e-06, + "loss": 0.0094, + "step": 758040 + }, + { + "epoch": 1.96, + "learning_rate": 5.2537579611230195e-06, + "loss": 0.0059, + "step": 758050 + }, + { + "epoch": 1.96, + "learning_rate": 5.249869744751555e-06, + "loss": 0.0058, + "step": 758060 + }, + { + "epoch": 1.97, + "learning_rate": 5.245981528380091e-06, + "loss": 0.006, + "step": 758070 + }, + { + "epoch": 1.97, + "learning_rate": 5.242093312008626e-06, + "loss": 0.0056, + "step": 758080 + }, + { + "epoch": 1.97, + "learning_rate": 5.2382050956371615e-06, + "loss": 0.0065, + "step": 758090 + }, + { + "epoch": 1.97, + "learning_rate": 5.234316879265697e-06, + "loss": 0.0087, + "step": 758100 + }, + { + "epoch": 1.97, + "learning_rate": 5.230428662894232e-06, + "loss": 0.0062, + "step": 758110 + }, + { + "epoch": 1.97, + "learning_rate": 5.226540446522768e-06, + "loss": 0.008, + "step": 758120 + }, + { + "epoch": 1.97, + "learning_rate": 5.2226522301513035e-06, + "loss": 0.0065, + "step": 758130 + }, + { + "epoch": 1.97, + "learning_rate": 5.218764013779838e-06, + "loss": 0.0073, + "step": 758140 + }, + { + "epoch": 1.97, + "learning_rate": 5.214875797408374e-06, + "loss": 0.0073, + "step": 758150 + }, + { + "epoch": 1.97, + "learning_rate": 5.210987581036909e-06, + "loss": 0.006, + "step": 758160 + }, + { + "epoch": 1.97, + "learning_rate": 5.207099364665444e-06, + "loss": 0.0082, + "step": 758170 + }, + { + "epoch": 1.97, + "learning_rate": 5.2032111482939795e-06, + "loss": 0.0063, + "step": 758180 + }, + { + "epoch": 1.97, + "learning_rate": 5.199322931922515e-06, + "loss": 0.0067, + "step": 758190 + }, + { + "epoch": 1.97, + "learning_rate": 5.19543471555105e-06, + "loss": 0.0056, + "step": 758200 + }, + { + "epoch": 1.97, + "learning_rate": 5.191546499179586e-06, + "loss": 0.0051, + "step": 758210 + }, + { + "epoch": 1.97, + "learning_rate": 5.1876582828081215e-06, + "loss": 0.0064, + "step": 758220 + }, + { + "epoch": 1.97, + "learning_rate": 5.183770066436656e-06, + "loss": 0.0061, + "step": 758230 + }, + { + "epoch": 1.97, + "learning_rate": 5.179881850065192e-06, + "loss": 0.0074, + "step": 758240 + }, + { + "epoch": 1.97, + "learning_rate": 5.175993633693728e-06, + "loss": 0.0074, + "step": 758250 + }, + { + "epoch": 1.97, + "learning_rate": 5.1721054173222635e-06, + "loss": 0.0079, + "step": 758260 + }, + { + "epoch": 1.97, + "learning_rate": 5.1682172009507975e-06, + "loss": 0.0046, + "step": 758270 + }, + { + "epoch": 1.97, + "learning_rate": 5.164328984579333e-06, + "loss": 0.0044, + "step": 758280 + }, + { + "epoch": 1.97, + "learning_rate": 5.160440768207869e-06, + "loss": 0.0081, + "step": 758290 + }, + { + "epoch": 1.97, + "learning_rate": 5.156552551836404e-06, + "loss": 0.0069, + "step": 758300 + }, + { + "epoch": 1.97, + "learning_rate": 5.1526643354649395e-06, + "loss": 0.0086, + "step": 758310 + }, + { + "epoch": 1.97, + "learning_rate": 5.148776119093475e-06, + "loss": 0.0059, + "step": 758320 + }, + { + "epoch": 1.97, + "learning_rate": 5.14488790272201e-06, + "loss": 0.0056, + "step": 758330 + }, + { + "epoch": 1.97, + "learning_rate": 5.140999686350546e-06, + "loss": 0.0068, + "step": 758340 + }, + { + "epoch": 1.97, + "learning_rate": 5.1371114699790815e-06, + "loss": 0.0063, + "step": 758350 + }, + { + "epoch": 1.97, + "learning_rate": 5.133223253607616e-06, + "loss": 0.0057, + "step": 758360 + }, + { + "epoch": 1.97, + "learning_rate": 5.129335037236152e-06, + "loss": 0.0061, + "step": 758370 + }, + { + "epoch": 1.97, + "learning_rate": 5.125446820864688e-06, + "loss": 0.0062, + "step": 758380 + }, + { + "epoch": 1.97, + "learning_rate": 5.121558604493222e-06, + "loss": 0.0075, + "step": 758390 + }, + { + "epoch": 1.97, + "learning_rate": 5.1176703881217575e-06, + "loss": 0.0074, + "step": 758400 + }, + { + "epoch": 1.97, + "learning_rate": 5.113782171750293e-06, + "loss": 0.0088, + "step": 758410 + }, + { + "epoch": 1.97, + "learning_rate": 5.109893955378828e-06, + "loss": 0.0074, + "step": 758420 + }, + { + "epoch": 1.97, + "learning_rate": 5.106005739007364e-06, + "loss": 0.0086, + "step": 758430 + }, + { + "epoch": 1.97, + "learning_rate": 5.1021175226358995e-06, + "loss": 0.0055, + "step": 758440 + }, + { + "epoch": 1.97, + "learning_rate": 5.098229306264434e-06, + "loss": 0.0069, + "step": 758450 + }, + { + "epoch": 1.97, + "learning_rate": 5.09434108989297e-06, + "loss": 0.0062, + "step": 758460 + }, + { + "epoch": 1.97, + "learning_rate": 5.090452873521506e-06, + "loss": 0.0052, + "step": 758470 + }, + { + "epoch": 1.97, + "learning_rate": 5.086564657150041e-06, + "loss": 0.0079, + "step": 758480 + }, + { + "epoch": 1.97, + "learning_rate": 5.082676440778576e-06, + "loss": 0.0077, + "step": 758490 + }, + { + "epoch": 1.97, + "learning_rate": 5.078788224407112e-06, + "loss": 0.0075, + "step": 758500 + }, + { + "epoch": 1.97, + "learning_rate": 5.074900008035646e-06, + "loss": 0.0082, + "step": 758510 + }, + { + "epoch": 1.97, + "learning_rate": 5.071011791664182e-06, + "loss": 0.006, + "step": 758520 + }, + { + "epoch": 1.97, + "learning_rate": 5.0671235752927175e-06, + "loss": 0.0063, + "step": 758530 + }, + { + "epoch": 1.97, + "learning_rate": 5.063235358921252e-06, + "loss": 0.0085, + "step": 758540 + }, + { + "epoch": 1.97, + "learning_rate": 5.059347142549788e-06, + "loss": 0.0067, + "step": 758550 + }, + { + "epoch": 1.97, + "learning_rate": 5.055458926178324e-06, + "loss": 0.006, + "step": 758560 + }, + { + "epoch": 1.97, + "learning_rate": 5.0515707098068594e-06, + "loss": 0.007, + "step": 758570 + }, + { + "epoch": 1.97, + "learning_rate": 5.047682493435394e-06, + "loss": 0.0077, + "step": 758580 + }, + { + "epoch": 1.97, + "learning_rate": 5.04379427706393e-06, + "loss": 0.008, + "step": 758590 + }, + { + "epoch": 1.97, + "learning_rate": 5.039906060692466e-06, + "loss": 0.0069, + "step": 758600 + }, + { + "epoch": 1.97, + "learning_rate": 5.036017844321e-06, + "loss": 0.0067, + "step": 758610 + }, + { + "epoch": 1.97, + "learning_rate": 5.0321296279495354e-06, + "loss": 0.0059, + "step": 758620 + }, + { + "epoch": 1.97, + "learning_rate": 5.028241411578071e-06, + "loss": 0.0077, + "step": 758630 + }, + { + "epoch": 1.97, + "learning_rate": 5.024353195206606e-06, + "loss": 0.0074, + "step": 758640 + }, + { + "epoch": 1.97, + "learning_rate": 5.020464978835142e-06, + "loss": 0.0052, + "step": 758650 + }, + { + "epoch": 1.97, + "learning_rate": 5.0165767624636774e-06, + "loss": 0.0051, + "step": 758660 + }, + { + "epoch": 1.97, + "learning_rate": 5.012688546092212e-06, + "loss": 0.0068, + "step": 758670 + }, + { + "epoch": 1.97, + "learning_rate": 5.008800329720748e-06, + "loss": 0.0076, + "step": 758680 + }, + { + "epoch": 1.97, + "learning_rate": 5.004912113349284e-06, + "loss": 0.0089, + "step": 758690 + }, + { + "epoch": 1.97, + "learning_rate": 5.0010238969778186e-06, + "loss": 0.0058, + "step": 758700 + }, + { + "epoch": 1.97, + "learning_rate": 4.997135680606354e-06, + "loss": 0.0062, + "step": 758710 + }, + { + "epoch": 1.97, + "learning_rate": 4.99324746423489e-06, + "loss": 0.0078, + "step": 758720 + }, + { + "epoch": 1.97, + "learning_rate": 4.989359247863424e-06, + "loss": 0.0072, + "step": 758730 + }, + { + "epoch": 1.97, + "learning_rate": 4.98547103149196e-06, + "loss": 0.0088, + "step": 758740 + }, + { + "epoch": 1.97, + "learning_rate": 4.981582815120495e-06, + "loss": 0.0086, + "step": 758750 + }, + { + "epoch": 1.97, + "learning_rate": 4.97769459874903e-06, + "loss": 0.0079, + "step": 758760 + }, + { + "epoch": 1.97, + "learning_rate": 4.973806382377566e-06, + "loss": 0.0061, + "step": 758770 + }, + { + "epoch": 1.97, + "learning_rate": 4.969918166006102e-06, + "loss": 0.008, + "step": 758780 + }, + { + "epoch": 1.97, + "learning_rate": 4.9660299496346366e-06, + "loss": 0.0076, + "step": 758790 + }, + { + "epoch": 1.97, + "learning_rate": 4.962141733263172e-06, + "loss": 0.0087, + "step": 758800 + }, + { + "epoch": 1.97, + "learning_rate": 4.958253516891708e-06, + "loss": 0.0089, + "step": 758810 + }, + { + "epoch": 1.97, + "learning_rate": 4.954365300520243e-06, + "loss": 0.0084, + "step": 758820 + }, + { + "epoch": 1.97, + "learning_rate": 4.9504770841487785e-06, + "loss": 0.0065, + "step": 758830 + }, + { + "epoch": 1.97, + "learning_rate": 4.946588867777314e-06, + "loss": 0.0055, + "step": 758840 + }, + { + "epoch": 1.97, + "learning_rate": 4.942700651405848e-06, + "loss": 0.0101, + "step": 758850 + }, + { + "epoch": 1.97, + "learning_rate": 4.938812435034384e-06, + "loss": 0.0071, + "step": 758860 + }, + { + "epoch": 1.97, + "learning_rate": 4.93492421866292e-06, + "loss": 0.0067, + "step": 758870 + }, + { + "epoch": 1.97, + "learning_rate": 4.931036002291455e-06, + "loss": 0.0114, + "step": 758880 + }, + { + "epoch": 1.97, + "learning_rate": 4.92714778591999e-06, + "loss": 0.0053, + "step": 758890 + }, + { + "epoch": 1.97, + "learning_rate": 4.923259569548526e-06, + "loss": 0.0067, + "step": 758900 + }, + { + "epoch": 1.97, + "learning_rate": 4.919371353177062e-06, + "loss": 0.0064, + "step": 758910 + }, + { + "epoch": 1.97, + "learning_rate": 4.9154831368055965e-06, + "loss": 0.0051, + "step": 758920 + }, + { + "epoch": 1.97, + "learning_rate": 4.911594920434132e-06, + "loss": 0.0074, + "step": 758930 + }, + { + "epoch": 1.97, + "learning_rate": 4.907706704062668e-06, + "loss": 0.0098, + "step": 758940 + }, + { + "epoch": 1.97, + "learning_rate": 4.903818487691202e-06, + "loss": 0.0072, + "step": 758950 + }, + { + "epoch": 1.97, + "learning_rate": 4.899930271319738e-06, + "loss": 0.0062, + "step": 758960 + }, + { + "epoch": 1.97, + "learning_rate": 4.896042054948273e-06, + "loss": 0.0084, + "step": 758970 + }, + { + "epoch": 1.97, + "learning_rate": 4.892153838576808e-06, + "loss": 0.0072, + "step": 758980 + }, + { + "epoch": 1.97, + "learning_rate": 4.888265622205344e-06, + "loss": 0.0092, + "step": 758990 + }, + { + "epoch": 1.97, + "learning_rate": 4.88437740583388e-06, + "loss": 0.0065, + "step": 759000 + }, + { + "epoch": 1.97, + "eval_cer": 0.8816746935844841, + "eval_loss": 0.004368713591247797, + "eval_runtime": 107.9594, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, + "step": 759000 + }, + { + "epoch": 1.97, + "learning_rate": 4.8804891894624145e-06, + "loss": 0.0074, + "step": 759010 + }, + { + "epoch": 1.97, + "learning_rate": 4.87660097309095e-06, + "loss": 0.0064, + "step": 759020 + }, + { + "epoch": 1.97, + "learning_rate": 4.872712756719486e-06, + "loss": 0.0095, + "step": 759030 + }, + { + "epoch": 1.97, + "learning_rate": 4.868824540348021e-06, + "loss": 0.0046, + "step": 759040 + }, + { + "epoch": 1.97, + "learning_rate": 4.8649363239765565e-06, + "loss": 0.0068, + "step": 759050 + }, + { + "epoch": 1.97, + "learning_rate": 4.861048107605092e-06, + "loss": 0.0081, + "step": 759060 + }, + { + "epoch": 1.97, + "learning_rate": 4.857159891233626e-06, + "loss": 0.008, + "step": 759070 + }, + { + "epoch": 1.97, + "learning_rate": 4.853271674862162e-06, + "loss": 0.0072, + "step": 759080 + }, + { + "epoch": 1.97, + "learning_rate": 4.849383458490698e-06, + "loss": 0.0083, + "step": 759090 + }, + { + "epoch": 1.97, + "learning_rate": 4.8454952421192325e-06, + "loss": 0.0075, + "step": 759100 + }, + { + "epoch": 1.97, + "learning_rate": 4.841607025747768e-06, + "loss": 0.0042, + "step": 759110 + }, + { + "epoch": 1.97, + "learning_rate": 4.837718809376304e-06, + "loss": 0.006, + "step": 759120 + }, + { + "epoch": 1.97, + "learning_rate": 4.833830593004839e-06, + "loss": 0.0077, + "step": 759130 + }, + { + "epoch": 1.97, + "learning_rate": 4.8299423766333745e-06, + "loss": 0.0095, + "step": 759140 + }, + { + "epoch": 1.97, + "learning_rate": 4.82605416026191e-06, + "loss": 0.006, + "step": 759150 + }, + { + "epoch": 1.97, + "learning_rate": 4.822165943890445e-06, + "loss": 0.0076, + "step": 759160 + }, + { + "epoch": 1.97, + "learning_rate": 4.818277727518981e-06, + "loss": 0.0067, + "step": 759170 + }, + { + "epoch": 1.97, + "learning_rate": 4.8143895111475165e-06, + "loss": 0.0076, + "step": 759180 + }, + { + "epoch": 1.97, + "learning_rate": 4.810501294776052e-06, + "loss": 0.0099, + "step": 759190 + }, + { + "epoch": 1.97, + "learning_rate": 4.806613078404586e-06, + "loss": 0.0055, + "step": 759200 + }, + { + "epoch": 1.97, + "learning_rate": 4.802724862033122e-06, + "loss": 0.0085, + "step": 759210 + }, + { + "epoch": 1.97, + "learning_rate": 4.798836645661658e-06, + "loss": 0.0052, + "step": 759220 + }, + { + "epoch": 1.97, + "learning_rate": 4.7949484292901925e-06, + "loss": 0.0072, + "step": 759230 + }, + { + "epoch": 1.97, + "learning_rate": 4.791060212918728e-06, + "loss": 0.0056, + "step": 759240 + }, + { + "epoch": 1.97, + "learning_rate": 4.787171996547264e-06, + "loss": 0.0085, + "step": 759250 + }, + { + "epoch": 1.97, + "learning_rate": 4.783283780175799e-06, + "loss": 0.01, + "step": 759260 + }, + { + "epoch": 1.97, + "learning_rate": 4.7793955638043345e-06, + "loss": 0.007, + "step": 759270 + }, + { + "epoch": 1.97, + "learning_rate": 4.77550734743287e-06, + "loss": 0.0067, + "step": 759280 + }, + { + "epoch": 1.97, + "learning_rate": 4.771619131061404e-06, + "loss": 0.0068, + "step": 759290 + }, + { + "epoch": 1.97, + "learning_rate": 4.76773091468994e-06, + "loss": 0.0106, + "step": 759300 + }, + { + "epoch": 1.97, + "learning_rate": 4.763842698318476e-06, + "loss": 0.0076, + "step": 759310 + }, + { + "epoch": 1.97, + "learning_rate": 4.7599544819470105e-06, + "loss": 0.0093, + "step": 759320 + }, + { + "epoch": 1.97, + "learning_rate": 4.756066265575546e-06, + "loss": 0.0076, + "step": 759330 + }, + { + "epoch": 1.97, + "learning_rate": 4.752178049204082e-06, + "loss": 0.0068, + "step": 759340 + }, + { + "epoch": 1.97, + "learning_rate": 4.748289832832617e-06, + "loss": 0.0069, + "step": 759350 + }, + { + "epoch": 1.97, + "learning_rate": 4.7444016164611525e-06, + "loss": 0.0083, + "step": 759360 + }, + { + "epoch": 1.97, + "learning_rate": 4.740513400089688e-06, + "loss": 0.0101, + "step": 759370 + }, + { + "epoch": 1.97, + "learning_rate": 4.736625183718223e-06, + "loss": 0.0079, + "step": 759380 + }, + { + "epoch": 1.97, + "learning_rate": 4.732736967346759e-06, + "loss": 0.0143, + "step": 759390 + }, + { + "epoch": 1.97, + "learning_rate": 4.7288487509752944e-06, + "loss": 0.0065, + "step": 759400 + }, + { + "epoch": 1.97, + "learning_rate": 4.7249605346038285e-06, + "loss": 0.0069, + "step": 759410 + }, + { + "epoch": 1.97, + "learning_rate": 4.721072318232364e-06, + "loss": 0.0064, + "step": 759420 + }, + { + "epoch": 1.97, + "learning_rate": 4.7171841018609e-06, + "loss": 0.0062, + "step": 759430 + }, + { + "epoch": 1.97, + "learning_rate": 4.713295885489435e-06, + "loss": 0.0095, + "step": 759440 + }, + { + "epoch": 1.97, + "learning_rate": 4.7094076691179705e-06, + "loss": 0.0076, + "step": 759450 + }, + { + "epoch": 1.97, + "learning_rate": 4.705519452746506e-06, + "loss": 0.0053, + "step": 759460 + }, + { + "epoch": 1.97, + "learning_rate": 4.701631236375041e-06, + "loss": 0.0074, + "step": 759470 + }, + { + "epoch": 1.97, + "learning_rate": 4.697743020003577e-06, + "loss": 0.0074, + "step": 759480 + }, + { + "epoch": 1.97, + "learning_rate": 4.6938548036321124e-06, + "loss": 0.0089, + "step": 759490 + }, + { + "epoch": 1.97, + "learning_rate": 4.689966587260648e-06, + "loss": 0.0068, + "step": 759500 + }, + { + "epoch": 1.97, + "learning_rate": 4.686078370889183e-06, + "loss": 0.0069, + "step": 759510 + }, + { + "epoch": 1.97, + "learning_rate": 4.682190154517719e-06, + "loss": 0.0058, + "step": 759520 + }, + { + "epoch": 1.97, + "learning_rate": 4.678301938146254e-06, + "loss": 0.0066, + "step": 759530 + }, + { + "epoch": 1.97, + "learning_rate": 4.6744137217747884e-06, + "loss": 0.0053, + "step": 759540 + }, + { + "epoch": 1.97, + "learning_rate": 4.670525505403324e-06, + "loss": 0.0061, + "step": 759550 + }, + { + "epoch": 1.97, + "learning_rate": 4.66663728903186e-06, + "loss": 0.0055, + "step": 759560 + }, + { + "epoch": 1.97, + "learning_rate": 4.6627490726603956e-06, + "loss": 0.007, + "step": 759570 + }, + { + "epoch": 1.97, + "learning_rate": 4.6588608562889304e-06, + "loss": 0.0058, + "step": 759580 + }, + { + "epoch": 1.97, + "learning_rate": 4.654972639917465e-06, + "loss": 0.0053, + "step": 759590 + }, + { + "epoch": 1.97, + "learning_rate": 4.651084423546001e-06, + "loss": 0.0071, + "step": 759600 + }, + { + "epoch": 1.97, + "learning_rate": 4.647196207174537e-06, + "loss": 0.0046, + "step": 759610 + }, + { + "epoch": 1.97, + "learning_rate": 4.6433079908030716e-06, + "loss": 0.0068, + "step": 759620 + }, + { + "epoch": 1.97, + "learning_rate": 4.639419774431607e-06, + "loss": 0.0066, + "step": 759630 + }, + { + "epoch": 1.97, + "learning_rate": 4.635531558060142e-06, + "loss": 0.0062, + "step": 759640 + }, + { + "epoch": 1.97, + "learning_rate": 4.631643341688678e-06, + "loss": 0.0085, + "step": 759650 + }, + { + "epoch": 1.97, + "learning_rate": 4.6277551253172136e-06, + "loss": 0.0051, + "step": 759660 + }, + { + "epoch": 1.97, + "learning_rate": 4.623866908945748e-06, + "loss": 0.0059, + "step": 759670 + }, + { + "epoch": 1.97, + "learning_rate": 4.619978692574284e-06, + "loss": 0.0091, + "step": 759680 + }, + { + "epoch": 1.97, + "learning_rate": 4.61609047620282e-06, + "loss": 0.0077, + "step": 759690 + }, + { + "epoch": 1.97, + "learning_rate": 4.612202259831355e-06, + "loss": 0.0079, + "step": 759700 + }, + { + "epoch": 1.97, + "learning_rate": 4.60831404345989e-06, + "loss": 0.0078, + "step": 759710 + }, + { + "epoch": 1.97, + "learning_rate": 4.604425827088425e-06, + "loss": 0.0066, + "step": 759720 + }, + { + "epoch": 1.97, + "learning_rate": 4.600537610716961e-06, + "loss": 0.0068, + "step": 759730 + }, + { + "epoch": 1.97, + "learning_rate": 4.596649394345497e-06, + "loss": 0.0043, + "step": 759740 + }, + { + "epoch": 1.97, + "learning_rate": 4.5927611779740315e-06, + "loss": 0.008, + "step": 759750 + }, + { + "epoch": 1.97, + "learning_rate": 4.588872961602566e-06, + "loss": 0.0065, + "step": 759760 + }, + { + "epoch": 1.97, + "learning_rate": 4.584984745231102e-06, + "loss": 0.0066, + "step": 759770 + }, + { + "epoch": 1.97, + "learning_rate": 4.581096528859638e-06, + "loss": 0.0078, + "step": 759780 + }, + { + "epoch": 1.97, + "learning_rate": 4.577208312488173e-06, + "loss": 0.0055, + "step": 759790 + }, + { + "epoch": 1.97, + "learning_rate": 4.573320096116708e-06, + "loss": 0.0071, + "step": 759800 + }, + { + "epoch": 1.97, + "learning_rate": 4.569431879745243e-06, + "loss": 0.0058, + "step": 759810 + }, + { + "epoch": 1.97, + "learning_rate": 4.565543663373779e-06, + "loss": 0.007, + "step": 759820 + }, + { + "epoch": 1.97, + "learning_rate": 4.561655447002315e-06, + "loss": 0.0082, + "step": 759830 + }, + { + "epoch": 1.97, + "learning_rate": 4.5577672306308495e-06, + "loss": 0.0066, + "step": 759840 + }, + { + "epoch": 1.97, + "learning_rate": 4.553879014259385e-06, + "loss": 0.0066, + "step": 759850 + }, + { + "epoch": 1.97, + "learning_rate": 4.549990797887921e-06, + "loss": 0.0059, + "step": 759860 + }, + { + "epoch": 1.97, + "learning_rate": 4.546102581516456e-06, + "loss": 0.0072, + "step": 759870 + }, + { + "epoch": 1.97, + "learning_rate": 4.5422143651449915e-06, + "loss": 0.01, + "step": 759880 + }, + { + "epoch": 1.97, + "learning_rate": 4.538326148773526e-06, + "loss": 0.0045, + "step": 759890 + }, + { + "epoch": 1.97, + "learning_rate": 4.534437932402062e-06, + "loss": 0.0061, + "step": 759900 + }, + { + "epoch": 1.97, + "learning_rate": 4.530549716030598e-06, + "loss": 0.0072, + "step": 759910 + }, + { + "epoch": 1.97, + "learning_rate": 4.526661499659133e-06, + "loss": 0.0042, + "step": 759920 + }, + { + "epoch": 1.97, + "learning_rate": 4.5227732832876675e-06, + "loss": 0.0065, + "step": 759930 + }, + { + "epoch": 1.97, + "learning_rate": 4.518885066916203e-06, + "loss": 0.0089, + "step": 759940 + }, + { + "epoch": 1.97, + "learning_rate": 4.514996850544739e-06, + "loss": 0.0049, + "step": 759950 + }, + { + "epoch": 1.97, + "learning_rate": 4.511108634173274e-06, + "loss": 0.0058, + "step": 759960 + }, + { + "epoch": 1.97, + "learning_rate": 4.5072204178018095e-06, + "loss": 0.0104, + "step": 759970 + }, + { + "epoch": 1.97, + "learning_rate": 4.503332201430344e-06, + "loss": 0.0064, + "step": 759980 + }, + { + "epoch": 1.97, + "learning_rate": 4.49944398505888e-06, + "loss": 0.0079, + "step": 759990 + }, + { + "epoch": 1.97, + "learning_rate": 4.495555768687416e-06, + "loss": 0.0055, + "step": 760000 + }, + { + "epoch": 1.97, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.004402776248753071, + "eval_runtime": 107.9755, + "eval_samples_per_second": 18.523, + "eval_steps_per_second": 4.631, + "step": 760000 + }, + { + "epoch": 1.97, + "learning_rate": 4.491667552315951e-06, + "loss": 0.0056, + "step": 760010 + }, + { + "epoch": 1.97, + "learning_rate": 4.487779335944486e-06, + "loss": 0.0072, + "step": 760020 + }, + { + "epoch": 1.97, + "learning_rate": 4.483891119573022e-06, + "loss": 0.0071, + "step": 760030 + }, + { + "epoch": 1.97, + "learning_rate": 4.480002903201557e-06, + "loss": 0.0063, + "step": 760040 + }, + { + "epoch": 1.97, + "learning_rate": 4.476114686830093e-06, + "loss": 0.0047, + "step": 760050 + }, + { + "epoch": 1.97, + "learning_rate": 4.4722264704586275e-06, + "loss": 0.0066, + "step": 760060 + }, + { + "epoch": 1.97, + "learning_rate": 4.468338254087163e-06, + "loss": 0.0083, + "step": 760070 + }, + { + "epoch": 1.97, + "learning_rate": 4.464450037715699e-06, + "loss": 0.0065, + "step": 760080 + }, + { + "epoch": 1.97, + "learning_rate": 4.460561821344234e-06, + "loss": 0.0081, + "step": 760090 + }, + { + "epoch": 1.97, + "learning_rate": 4.456673604972769e-06, + "loss": 0.0069, + "step": 760100 + }, + { + "epoch": 1.97, + "learning_rate": 4.452785388601304e-06, + "loss": 0.0115, + "step": 760110 + }, + { + "epoch": 1.97, + "learning_rate": 4.44889717222984e-06, + "loss": 0.0062, + "step": 760120 + }, + { + "epoch": 1.97, + "learning_rate": 4.445008955858375e-06, + "loss": 0.0057, + "step": 760130 + }, + { + "epoch": 1.97, + "learning_rate": 4.441120739486911e-06, + "loss": 0.0074, + "step": 760140 + }, + { + "epoch": 1.97, + "learning_rate": 4.4372325231154455e-06, + "loss": 0.0086, + "step": 760150 + }, + { + "epoch": 1.97, + "learning_rate": 4.433344306743981e-06, + "loss": 0.0059, + "step": 760160 + }, + { + "epoch": 1.97, + "learning_rate": 4.429456090372517e-06, + "loss": 0.0048, + "step": 760170 + }, + { + "epoch": 1.97, + "learning_rate": 4.425567874001052e-06, + "loss": 0.0053, + "step": 760180 + }, + { + "epoch": 1.97, + "learning_rate": 4.4216796576295875e-06, + "loss": 0.0086, + "step": 760190 + }, + { + "epoch": 1.97, + "learning_rate": 4.417791441258123e-06, + "loss": 0.0085, + "step": 760200 + }, + { + "epoch": 1.97, + "learning_rate": 4.413903224886658e-06, + "loss": 0.0091, + "step": 760210 + }, + { + "epoch": 1.97, + "learning_rate": 4.410015008515194e-06, + "loss": 0.0053, + "step": 760220 + }, + { + "epoch": 1.97, + "learning_rate": 4.406126792143729e-06, + "loss": 0.0057, + "step": 760230 + }, + { + "epoch": 1.97, + "learning_rate": 4.402238575772264e-06, + "loss": 0.0046, + "step": 760240 + }, + { + "epoch": 1.97, + "learning_rate": 4.3983503594008e-06, + "loss": 0.0061, + "step": 760250 + }, + { + "epoch": 1.97, + "learning_rate": 4.394462143029335e-06, + "loss": 0.0064, + "step": 760260 + }, + { + "epoch": 1.97, + "learning_rate": 4.39057392665787e-06, + "loss": 0.0071, + "step": 760270 + }, + { + "epoch": 1.97, + "learning_rate": 4.3866857102864055e-06, + "loss": 0.0061, + "step": 760280 + }, + { + "epoch": 1.97, + "learning_rate": 4.382797493914941e-06, + "loss": 0.0079, + "step": 760290 + }, + { + "epoch": 1.97, + "learning_rate": 4.378909277543476e-06, + "loss": 0.0074, + "step": 760300 + }, + { + "epoch": 1.97, + "learning_rate": 4.375021061172012e-06, + "loss": 0.0063, + "step": 760310 + }, + { + "epoch": 1.97, + "learning_rate": 4.371132844800547e-06, + "loss": 0.0076, + "step": 760320 + }, + { + "epoch": 1.97, + "learning_rate": 4.367244628429082e-06, + "loss": 0.0061, + "step": 760330 + }, + { + "epoch": 1.97, + "learning_rate": 4.363356412057618e-06, + "loss": 0.0077, + "step": 760340 + }, + { + "epoch": 1.97, + "learning_rate": 4.359468195686153e-06, + "loss": 0.0075, + "step": 760350 + }, + { + "epoch": 1.97, + "learning_rate": 4.355579979314689e-06, + "loss": 0.0078, + "step": 760360 + }, + { + "epoch": 1.97, + "learning_rate": 4.351691762943224e-06, + "loss": 0.0053, + "step": 760370 + }, + { + "epoch": 1.97, + "learning_rate": 4.347803546571759e-06, + "loss": 0.0081, + "step": 760380 + }, + { + "epoch": 1.97, + "learning_rate": 4.343915330200295e-06, + "loss": 0.0055, + "step": 760390 + }, + { + "epoch": 1.97, + "learning_rate": 4.34002711382883e-06, + "loss": 0.0055, + "step": 760400 + }, + { + "epoch": 1.97, + "learning_rate": 4.3361388974573654e-06, + "loss": 0.0082, + "step": 760410 + }, + { + "epoch": 1.97, + "learning_rate": 4.332250681085901e-06, + "loss": 0.008, + "step": 760420 + }, + { + "epoch": 1.97, + "learning_rate": 4.328362464714436e-06, + "loss": 0.0079, + "step": 760430 + }, + { + "epoch": 1.97, + "learning_rate": 4.324474248342971e-06, + "loss": 0.0087, + "step": 760440 + }, + { + "epoch": 1.97, + "learning_rate": 4.320586031971507e-06, + "loss": 0.0063, + "step": 760450 + }, + { + "epoch": 1.97, + "learning_rate": 4.316697815600042e-06, + "loss": 0.0091, + "step": 760460 + }, + { + "epoch": 1.97, + "learning_rate": 4.312809599228578e-06, + "loss": 0.0065, + "step": 760470 + }, + { + "epoch": 1.97, + "learning_rate": 4.308921382857113e-06, + "loss": 0.006, + "step": 760480 + }, + { + "epoch": 1.97, + "learning_rate": 4.305033166485648e-06, + "loss": 0.0099, + "step": 760490 + }, + { + "epoch": 1.97, + "learning_rate": 4.3011449501141834e-06, + "loss": 0.0086, + "step": 760500 + }, + { + "epoch": 1.97, + "learning_rate": 4.297256733742719e-06, + "loss": 0.0059, + "step": 760510 + }, + { + "epoch": 1.97, + "learning_rate": 4.293368517371254e-06, + "loss": 0.0072, + "step": 760520 + }, + { + "epoch": 1.97, + "learning_rate": 4.28948030099979e-06, + "loss": 0.0074, + "step": 760530 + }, + { + "epoch": 1.97, + "learning_rate": 4.285592084628325e-06, + "loss": 0.0055, + "step": 760540 + }, + { + "epoch": 1.97, + "learning_rate": 4.28170386825686e-06, + "loss": 0.0077, + "step": 760550 + }, + { + "epoch": 1.97, + "learning_rate": 4.277815651885396e-06, + "loss": 0.0118, + "step": 760560 + }, + { + "epoch": 1.97, + "learning_rate": 4.273927435513931e-06, + "loss": 0.0073, + "step": 760570 + }, + { + "epoch": 1.97, + "learning_rate": 4.2700392191424666e-06, + "loss": 0.0078, + "step": 760580 + }, + { + "epoch": 1.97, + "learning_rate": 4.266151002771002e-06, + "loss": 0.0058, + "step": 760590 + }, + { + "epoch": 1.97, + "learning_rate": 4.262262786399537e-06, + "loss": 0.0049, + "step": 760600 + }, + { + "epoch": 1.97, + "learning_rate": 4.258374570028072e-06, + "loss": 0.0085, + "step": 760610 + }, + { + "epoch": 1.97, + "learning_rate": 4.254486353656608e-06, + "loss": 0.0064, + "step": 760620 + }, + { + "epoch": 1.97, + "learning_rate": 4.250598137285143e-06, + "loss": 0.0068, + "step": 760630 + }, + { + "epoch": 1.97, + "learning_rate": 4.246709920913679e-06, + "loss": 0.0053, + "step": 760640 + }, + { + "epoch": 1.97, + "learning_rate": 4.242821704542214e-06, + "loss": 0.0036, + "step": 760650 + }, + { + "epoch": 1.97, + "learning_rate": 4.238933488170749e-06, + "loss": 0.0078, + "step": 760660 + }, + { + "epoch": 1.97, + "learning_rate": 4.2350452717992845e-06, + "loss": 0.0068, + "step": 760670 + }, + { + "epoch": 1.97, + "learning_rate": 4.23115705542782e-06, + "loss": 0.008, + "step": 760680 + }, + { + "epoch": 1.97, + "learning_rate": 4.227268839056355e-06, + "loss": 0.0061, + "step": 760690 + }, + { + "epoch": 1.97, + "learning_rate": 4.223380622684891e-06, + "loss": 0.0056, + "step": 760700 + }, + { + "epoch": 1.97, + "learning_rate": 4.2194924063134265e-06, + "loss": 0.0059, + "step": 760710 + }, + { + "epoch": 1.97, + "learning_rate": 4.215604189941961e-06, + "loss": 0.006, + "step": 760720 + }, + { + "epoch": 1.97, + "learning_rate": 4.211715973570497e-06, + "loss": 0.0068, + "step": 760730 + }, + { + "epoch": 1.97, + "learning_rate": 4.207827757199032e-06, + "loss": 0.0079, + "step": 760740 + }, + { + "epoch": 1.97, + "learning_rate": 4.203939540827568e-06, + "loss": 0.0064, + "step": 760750 + }, + { + "epoch": 1.97, + "learning_rate": 4.200051324456103e-06, + "loss": 0.0073, + "step": 760760 + }, + { + "epoch": 1.97, + "learning_rate": 4.196163108084638e-06, + "loss": 0.0062, + "step": 760770 + }, + { + "epoch": 1.97, + "learning_rate": 4.192274891713174e-06, + "loss": 0.0079, + "step": 760780 + }, + { + "epoch": 1.97, + "learning_rate": 4.188386675341709e-06, + "loss": 0.0062, + "step": 760790 + }, + { + "epoch": 1.97, + "learning_rate": 4.1844984589702445e-06, + "loss": 0.01, + "step": 760800 + }, + { + "epoch": 1.97, + "learning_rate": 4.18061024259878e-06, + "loss": 0.0064, + "step": 760810 + }, + { + "epoch": 1.97, + "learning_rate": 4.176722026227315e-06, + "loss": 0.0077, + "step": 760820 + }, + { + "epoch": 1.97, + "learning_rate": 4.17283380985585e-06, + "loss": 0.0067, + "step": 760830 + }, + { + "epoch": 1.97, + "learning_rate": 4.168945593484386e-06, + "loss": 0.0063, + "step": 760840 + }, + { + "epoch": 1.97, + "learning_rate": 4.165057377112921e-06, + "loss": 0.007, + "step": 760850 + }, + { + "epoch": 1.97, + "learning_rate": 4.161169160741456e-06, + "loss": 0.0056, + "step": 760860 + }, + { + "epoch": 1.97, + "learning_rate": 4.157280944369992e-06, + "loss": 0.0065, + "step": 760870 + }, + { + "epoch": 1.97, + "learning_rate": 4.153392727998528e-06, + "loss": 0.0077, + "step": 760880 + }, + { + "epoch": 1.97, + "learning_rate": 4.1495045116270625e-06, + "loss": 0.0074, + "step": 760890 + }, + { + "epoch": 1.97, + "learning_rate": 4.145616295255598e-06, + "loss": 0.0092, + "step": 760900 + }, + { + "epoch": 1.97, + "learning_rate": 4.141728078884133e-06, + "loss": 0.006, + "step": 760910 + }, + { + "epoch": 1.97, + "learning_rate": 4.137839862512669e-06, + "loss": 0.0105, + "step": 760920 + }, + { + "epoch": 1.97, + "learning_rate": 4.1339516461412045e-06, + "loss": 0.0071, + "step": 760930 + }, + { + "epoch": 1.97, + "learning_rate": 4.130063429769739e-06, + "loss": 0.0095, + "step": 760940 + }, + { + "epoch": 1.97, + "learning_rate": 4.126175213398275e-06, + "loss": 0.0067, + "step": 760950 + }, + { + "epoch": 1.97, + "learning_rate": 4.12228699702681e-06, + "loss": 0.0065, + "step": 760960 + }, + { + "epoch": 1.97, + "learning_rate": 4.118398780655346e-06, + "loss": 0.0068, + "step": 760970 + }, + { + "epoch": 1.97, + "learning_rate": 4.114510564283881e-06, + "loss": 0.0065, + "step": 760980 + }, + { + "epoch": 1.97, + "learning_rate": 4.110622347912416e-06, + "loss": 0.0054, + "step": 760990 + }, + { + "epoch": 1.97, + "learning_rate": 4.106734131540951e-06, + "loss": 0.0046, + "step": 761000 + }, + { + "epoch": 1.97, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.00441008573397994, + "eval_runtime": 107.8116, + "eval_samples_per_second": 18.551, + "eval_steps_per_second": 4.638, + "step": 761000 + }, + { + "epoch": 1.97, + "learning_rate": 4.102845915169487e-06, + "loss": 0.0075, + "step": 761010 + }, + { + "epoch": 1.97, + "learning_rate": 4.0989576987980225e-06, + "loss": 0.0078, + "step": 761020 + }, + { + "epoch": 1.97, + "learning_rate": 4.095069482426557e-06, + "loss": 0.0074, + "step": 761030 + }, + { + "epoch": 1.97, + "learning_rate": 4.091181266055093e-06, + "loss": 0.0066, + "step": 761040 + }, + { + "epoch": 1.97, + "learning_rate": 4.087293049683629e-06, + "loss": 0.0059, + "step": 761050 + }, + { + "epoch": 1.97, + "learning_rate": 4.083404833312164e-06, + "loss": 0.0075, + "step": 761060 + }, + { + "epoch": 1.97, + "learning_rate": 4.079516616940699e-06, + "loss": 0.0061, + "step": 761070 + }, + { + "epoch": 1.97, + "learning_rate": 4.075628400569234e-06, + "loss": 0.0063, + "step": 761080 + }, + { + "epoch": 1.97, + "learning_rate": 4.07174018419777e-06, + "loss": 0.0079, + "step": 761090 + }, + { + "epoch": 1.97, + "learning_rate": 4.067851967826306e-06, + "loss": 0.0071, + "step": 761100 + }, + { + "epoch": 1.97, + "learning_rate": 4.0639637514548405e-06, + "loss": 0.009, + "step": 761110 + }, + { + "epoch": 1.97, + "learning_rate": 4.060075535083376e-06, + "loss": 0.0115, + "step": 761120 + }, + { + "epoch": 1.97, + "learning_rate": 4.056187318711911e-06, + "loss": 0.0052, + "step": 761130 + }, + { + "epoch": 1.97, + "learning_rate": 4.052299102340447e-06, + "loss": 0.011, + "step": 761140 + }, + { + "epoch": 1.97, + "learning_rate": 4.0484108859689825e-06, + "loss": 0.0063, + "step": 761150 + }, + { + "epoch": 1.97, + "learning_rate": 4.044522669597517e-06, + "loss": 0.0059, + "step": 761160 + }, + { + "epoch": 1.97, + "learning_rate": 4.040634453226052e-06, + "loss": 0.0056, + "step": 761170 + }, + { + "epoch": 1.97, + "learning_rate": 4.036746236854588e-06, + "loss": 0.0081, + "step": 761180 + }, + { + "epoch": 1.97, + "learning_rate": 4.032858020483124e-06, + "loss": 0.0075, + "step": 761190 + }, + { + "epoch": 1.97, + "learning_rate": 4.0289698041116585e-06, + "loss": 0.0093, + "step": 761200 + }, + { + "epoch": 1.97, + "learning_rate": 4.025081587740194e-06, + "loss": 0.006, + "step": 761210 + }, + { + "epoch": 1.97, + "learning_rate": 4.02119337136873e-06, + "loss": 0.0054, + "step": 761220 + }, + { + "epoch": 1.97, + "learning_rate": 4.017305154997265e-06, + "loss": 0.0072, + "step": 761230 + }, + { + "epoch": 1.97, + "learning_rate": 4.0134169386258004e-06, + "loss": 0.011, + "step": 761240 + }, + { + "epoch": 1.97, + "learning_rate": 4.009528722254335e-06, + "loss": 0.0068, + "step": 761250 + }, + { + "epoch": 1.97, + "learning_rate": 4.005640505882871e-06, + "loss": 0.01, + "step": 761260 + }, + { + "epoch": 1.97, + "learning_rate": 4.001752289511407e-06, + "loss": 0.005, + "step": 761270 + }, + { + "epoch": 1.97, + "learning_rate": 3.997864073139942e-06, + "loss": 0.0065, + "step": 761280 + }, + { + "epoch": 1.97, + "learning_rate": 3.993975856768477e-06, + "loss": 0.0098, + "step": 761290 + }, + { + "epoch": 1.97, + "learning_rate": 3.990087640397012e-06, + "loss": 0.0085, + "step": 761300 + }, + { + "epoch": 1.97, + "learning_rate": 3.986199424025548e-06, + "loss": 0.0055, + "step": 761310 + }, + { + "epoch": 1.97, + "learning_rate": 3.9823112076540836e-06, + "loss": 0.0063, + "step": 761320 + }, + { + "epoch": 1.97, + "learning_rate": 3.9784229912826184e-06, + "loss": 0.0062, + "step": 761330 + }, + { + "epoch": 1.97, + "learning_rate": 3.974534774911153e-06, + "loss": 0.0047, + "step": 761340 + }, + { + "epoch": 1.97, + "learning_rate": 3.970646558539689e-06, + "loss": 0.0066, + "step": 761350 + }, + { + "epoch": 1.97, + "learning_rate": 3.966758342168225e-06, + "loss": 0.0054, + "step": 761360 + }, + { + "epoch": 1.97, + "learning_rate": 3.9628701257967596e-06, + "loss": 0.0069, + "step": 761370 + }, + { + "epoch": 1.97, + "learning_rate": 3.958981909425295e-06, + "loss": 0.0069, + "step": 761380 + }, + { + "epoch": 1.97, + "learning_rate": 3.955093693053831e-06, + "loss": 0.0054, + "step": 761390 + }, + { + "epoch": 1.97, + "learning_rate": 3.951205476682367e-06, + "loss": 0.0069, + "step": 761400 + }, + { + "epoch": 1.97, + "learning_rate": 3.9473172603109016e-06, + "loss": 0.0116, + "step": 761410 + }, + { + "epoch": 1.97, + "learning_rate": 3.9434290439394364e-06, + "loss": 0.006, + "step": 761420 + }, + { + "epoch": 1.97, + "learning_rate": 3.939540827567972e-06, + "loss": 0.0091, + "step": 761430 + }, + { + "epoch": 1.97, + "learning_rate": 3.935652611196508e-06, + "loss": 0.0058, + "step": 761440 + }, + { + "epoch": 1.97, + "learning_rate": 3.931764394825043e-06, + "loss": 0.0077, + "step": 761450 + }, + { + "epoch": 1.97, + "learning_rate": 3.927876178453578e-06, + "loss": 0.0079, + "step": 761460 + }, + { + "epoch": 1.97, + "learning_rate": 3.923987962082113e-06, + "loss": 0.0063, + "step": 761470 + }, + { + "epoch": 1.97, + "learning_rate": 3.920099745710649e-06, + "loss": 0.0067, + "step": 761480 + }, + { + "epoch": 1.97, + "learning_rate": 3.916211529339185e-06, + "loss": 0.0067, + "step": 761490 + }, + { + "epoch": 1.97, + "learning_rate": 3.9123233129677196e-06, + "loss": 0.0095, + "step": 761500 + }, + { + "epoch": 1.97, + "learning_rate": 3.908435096596254e-06, + "loss": 0.005, + "step": 761510 + }, + { + "epoch": 1.97, + "learning_rate": 3.90454688022479e-06, + "loss": 0.0074, + "step": 761520 + }, + { + "epoch": 1.97, + "learning_rate": 3.900658663853326e-06, + "loss": 0.0085, + "step": 761530 + }, + { + "epoch": 1.97, + "learning_rate": 3.8967704474818615e-06, + "loss": 0.0063, + "step": 761540 + }, + { + "epoch": 1.97, + "learning_rate": 3.892882231110396e-06, + "loss": 0.007, + "step": 761550 + }, + { + "epoch": 1.97, + "learning_rate": 3.888994014738932e-06, + "loss": 0.0057, + "step": 761560 + }, + { + "epoch": 1.97, + "learning_rate": 3.885105798367468e-06, + "loss": 0.0059, + "step": 761570 + }, + { + "epoch": 1.97, + "learning_rate": 3.881217581996003e-06, + "loss": 0.0057, + "step": 761580 + }, + { + "epoch": 1.97, + "learning_rate": 3.8773293656245375e-06, + "loss": 0.0055, + "step": 761590 + }, + { + "epoch": 1.97, + "learning_rate": 3.873441149253073e-06, + "loss": 0.0084, + "step": 761600 + }, + { + "epoch": 1.97, + "learning_rate": 3.869552932881609e-06, + "loss": 0.0059, + "step": 761610 + }, + { + "epoch": 1.97, + "learning_rate": 3.865664716510144e-06, + "loss": 0.0055, + "step": 761620 + }, + { + "epoch": 1.97, + "learning_rate": 3.8617765001386795e-06, + "loss": 0.0068, + "step": 761630 + }, + { + "epoch": 1.97, + "learning_rate": 3.857888283767214e-06, + "loss": 0.0062, + "step": 761640 + }, + { + "epoch": 1.97, + "learning_rate": 3.85400006739575e-06, + "loss": 0.01, + "step": 761650 + }, + { + "epoch": 1.97, + "learning_rate": 3.850111851024286e-06, + "loss": 0.0055, + "step": 761660 + }, + { + "epoch": 1.97, + "learning_rate": 3.846223634652821e-06, + "loss": 0.0044, + "step": 761670 + }, + { + "epoch": 1.97, + "learning_rate": 3.8423354182813555e-06, + "loss": 0.0066, + "step": 761680 + }, + { + "epoch": 1.97, + "learning_rate": 3.838447201909891e-06, + "loss": 0.0078, + "step": 761690 + }, + { + "epoch": 1.97, + "learning_rate": 3.834558985538427e-06, + "loss": 0.0065, + "step": 761700 + }, + { + "epoch": 1.97, + "learning_rate": 3.830670769166963e-06, + "loss": 0.0076, + "step": 761710 + }, + { + "epoch": 1.97, + "learning_rate": 3.8267825527954975e-06, + "loss": 0.0074, + "step": 761720 + }, + { + "epoch": 1.97, + "learning_rate": 3.822894336424033e-06, + "loss": 0.0045, + "step": 761730 + }, + { + "epoch": 1.97, + "learning_rate": 3.819006120052569e-06, + "loss": 0.0069, + "step": 761740 + }, + { + "epoch": 1.97, + "learning_rate": 3.815117903681104e-06, + "loss": 0.0057, + "step": 761750 + }, + { + "epoch": 1.97, + "learning_rate": 3.811229687309639e-06, + "loss": 0.0064, + "step": 761760 + }, + { + "epoch": 1.97, + "learning_rate": 3.8073414709381748e-06, + "loss": 0.0063, + "step": 761770 + }, + { + "epoch": 1.97, + "learning_rate": 3.8034532545667096e-06, + "loss": 0.0057, + "step": 761780 + }, + { + "epoch": 1.97, + "learning_rate": 3.799565038195245e-06, + "loss": 0.0059, + "step": 761790 + }, + { + "epoch": 1.97, + "learning_rate": 3.7956768218237806e-06, + "loss": 0.0088, + "step": 761800 + }, + { + "epoch": 1.97, + "learning_rate": 3.791788605452316e-06, + "loss": 0.0072, + "step": 761810 + }, + { + "epoch": 1.97, + "learning_rate": 3.7879003890808512e-06, + "loss": 0.0067, + "step": 761820 + }, + { + "epoch": 1.97, + "learning_rate": 3.7840121727093865e-06, + "loss": 0.0125, + "step": 761830 + }, + { + "epoch": 1.97, + "learning_rate": 3.7801239563379218e-06, + "loss": 0.007, + "step": 761840 + }, + { + "epoch": 1.97, + "learning_rate": 3.7762357399664575e-06, + "loss": 0.0059, + "step": 761850 + }, + { + "epoch": 1.97, + "learning_rate": 3.7723475235949928e-06, + "loss": 0.0071, + "step": 761860 + }, + { + "epoch": 1.97, + "learning_rate": 3.768459307223528e-06, + "loss": 0.0055, + "step": 761870 + }, + { + "epoch": 1.97, + "learning_rate": 3.7645710908520638e-06, + "loss": 0.0042, + "step": 761880 + }, + { + "epoch": 1.97, + "learning_rate": 3.7606828744805986e-06, + "loss": 0.0078, + "step": 761890 + }, + { + "epoch": 1.97, + "learning_rate": 3.756794658109134e-06, + "loss": 0.0064, + "step": 761900 + }, + { + "epoch": 1.97, + "learning_rate": 3.7529064417376696e-06, + "loss": 0.0085, + "step": 761910 + }, + { + "epoch": 1.98, + "learning_rate": 3.749018225366205e-06, + "loss": 0.0084, + "step": 761920 + }, + { + "epoch": 1.98, + "learning_rate": 3.74513000899474e-06, + "loss": 0.0058, + "step": 761930 + }, + { + "epoch": 1.98, + "learning_rate": 3.741241792623276e-06, + "loss": 0.0058, + "step": 761940 + }, + { + "epoch": 1.98, + "learning_rate": 3.7373535762518108e-06, + "loss": 0.006, + "step": 761950 + }, + { + "epoch": 1.98, + "learning_rate": 3.733465359880346e-06, + "loss": 0.0076, + "step": 761960 + }, + { + "epoch": 1.98, + "learning_rate": 3.7295771435088818e-06, + "loss": 0.007, + "step": 761970 + }, + { + "epoch": 1.98, + "learning_rate": 3.725688927137417e-06, + "loss": 0.0066, + "step": 761980 + }, + { + "epoch": 1.98, + "learning_rate": 3.7218007107659523e-06, + "loss": 0.008, + "step": 761990 + }, + { + "epoch": 1.98, + "learning_rate": 3.7179124943944876e-06, + "loss": 0.01, + "step": 762000 + }, + { + "epoch": 1.98, + "eval_cer": 0.8816900895907601, + "eval_loss": 0.0043979547917842865, + "eval_runtime": 107.9627, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, + "step": 762000 + }, + { + "epoch": 1.98, + "learning_rate": 3.714024278023023e-06, + "loss": 0.0057, + "step": 762010 + }, + { + "epoch": 1.98, + "learning_rate": 3.7101360616515586e-06, + "loss": 0.0092, + "step": 762020 + }, + { + "epoch": 1.98, + "learning_rate": 3.706247845280094e-06, + "loss": 0.0064, + "step": 762030 + }, + { + "epoch": 1.98, + "learning_rate": 3.702359628908629e-06, + "loss": 0.0096, + "step": 762040 + }, + { + "epoch": 1.98, + "learning_rate": 3.698471412537165e-06, + "loss": 0.0087, + "step": 762050 + }, + { + "epoch": 1.98, + "learning_rate": 3.6945831961656997e-06, + "loss": 0.0046, + "step": 762060 + }, + { + "epoch": 1.98, + "learning_rate": 3.690694979794235e-06, + "loss": 0.0067, + "step": 762070 + }, + { + "epoch": 1.98, + "learning_rate": 3.6868067634227707e-06, + "loss": 0.0079, + "step": 762080 + }, + { + "epoch": 1.98, + "learning_rate": 3.682918547051306e-06, + "loss": 0.0066, + "step": 762090 + }, + { + "epoch": 1.98, + "learning_rate": 3.6790303306798413e-06, + "loss": 0.0087, + "step": 762100 + }, + { + "epoch": 1.98, + "learning_rate": 3.675142114308377e-06, + "loss": 0.007, + "step": 762110 + }, + { + "epoch": 1.98, + "learning_rate": 3.671253897936912e-06, + "loss": 0.0078, + "step": 762120 + }, + { + "epoch": 1.98, + "learning_rate": 3.667365681565447e-06, + "loss": 0.0063, + "step": 762130 + }, + { + "epoch": 1.98, + "learning_rate": 3.663477465193983e-06, + "loss": 0.007, + "step": 762140 + }, + { + "epoch": 1.98, + "learning_rate": 3.659589248822518e-06, + "loss": 0.0078, + "step": 762150 + }, + { + "epoch": 1.98, + "learning_rate": 3.655701032451054e-06, + "loss": 0.0058, + "step": 762160 + }, + { + "epoch": 1.98, + "learning_rate": 3.651812816079589e-06, + "loss": 0.0054, + "step": 762170 + }, + { + "epoch": 1.98, + "learning_rate": 3.647924599708124e-06, + "loss": 0.0074, + "step": 762180 + }, + { + "epoch": 1.98, + "learning_rate": 3.6440363833366597e-06, + "loss": 0.0069, + "step": 762190 + }, + { + "epoch": 1.98, + "learning_rate": 3.640148166965195e-06, + "loss": 0.0076, + "step": 762200 + }, + { + "epoch": 1.98, + "learning_rate": 3.6362599505937303e-06, + "loss": 0.0082, + "step": 762210 + }, + { + "epoch": 1.98, + "learning_rate": 3.632371734222266e-06, + "loss": 0.0077, + "step": 762220 + }, + { + "epoch": 1.98, + "learning_rate": 3.628483517850801e-06, + "loss": 0.0072, + "step": 762230 + }, + { + "epoch": 1.98, + "learning_rate": 3.624595301479336e-06, + "loss": 0.0078, + "step": 762240 + }, + { + "epoch": 1.98, + "learning_rate": 3.620707085107872e-06, + "loss": 0.0048, + "step": 762250 + }, + { + "epoch": 1.98, + "learning_rate": 3.616818868736407e-06, + "loss": 0.0089, + "step": 762260 + }, + { + "epoch": 1.98, + "learning_rate": 3.6129306523649424e-06, + "loss": 0.0066, + "step": 762270 + }, + { + "epoch": 1.98, + "learning_rate": 3.609042435993478e-06, + "loss": 0.0075, + "step": 762280 + }, + { + "epoch": 1.98, + "learning_rate": 3.605154219622013e-06, + "loss": 0.0112, + "step": 762290 + }, + { + "epoch": 1.98, + "learning_rate": 3.6012660032505483e-06, + "loss": 0.0059, + "step": 762300 + }, + { + "epoch": 1.98, + "learning_rate": 3.597377786879084e-06, + "loss": 0.0049, + "step": 762310 + }, + { + "epoch": 1.98, + "learning_rate": 3.5934895705076193e-06, + "loss": 0.0069, + "step": 762320 + }, + { + "epoch": 1.98, + "learning_rate": 3.589601354136155e-06, + "loss": 0.0059, + "step": 762330 + }, + { + "epoch": 1.98, + "learning_rate": 3.5857131377646903e-06, + "loss": 0.0082, + "step": 762340 + }, + { + "epoch": 1.98, + "learning_rate": 3.581824921393225e-06, + "loss": 0.0074, + "step": 762350 + }, + { + "epoch": 1.98, + "learning_rate": 3.577936705021761e-06, + "loss": 0.0058, + "step": 762360 + }, + { + "epoch": 1.98, + "learning_rate": 3.574048488650296e-06, + "loss": 0.0075, + "step": 762370 + }, + { + "epoch": 1.98, + "learning_rate": 3.5701602722788314e-06, + "loss": 0.0077, + "step": 762380 + }, + { + "epoch": 1.98, + "learning_rate": 3.566272055907367e-06, + "loss": 0.0062, + "step": 762390 + }, + { + "epoch": 1.98, + "learning_rate": 3.562383839535902e-06, + "loss": 0.0097, + "step": 762400 + }, + { + "epoch": 1.98, + "learning_rate": 3.5584956231644373e-06, + "loss": 0.0073, + "step": 762410 + }, + { + "epoch": 1.98, + "learning_rate": 3.554607406792973e-06, + "loss": 0.0063, + "step": 762420 + }, + { + "epoch": 1.98, + "learning_rate": 3.5507191904215083e-06, + "loss": 0.0074, + "step": 762430 + }, + { + "epoch": 1.98, + "learning_rate": 3.5468309740500435e-06, + "loss": 0.0059, + "step": 762440 + }, + { + "epoch": 1.98, + "learning_rate": 3.5429427576785793e-06, + "loss": 0.0068, + "step": 762450 + }, + { + "epoch": 1.98, + "learning_rate": 3.539054541307114e-06, + "loss": 0.0063, + "step": 762460 + }, + { + "epoch": 1.98, + "learning_rate": 3.53516632493565e-06, + "loss": 0.005, + "step": 762470 + }, + { + "epoch": 1.98, + "learning_rate": 3.531278108564185e-06, + "loss": 0.0075, + "step": 762480 + }, + { + "epoch": 1.98, + "learning_rate": 3.5273898921927204e-06, + "loss": 0.0071, + "step": 762490 + }, + { + "epoch": 1.98, + "learning_rate": 3.523501675821256e-06, + "loss": 0.005, + "step": 762500 + }, + { + "epoch": 1.98, + "learning_rate": 3.5196134594497914e-06, + "loss": 0.0096, + "step": 762510 + }, + { + "epoch": 1.98, + "learning_rate": 3.5157252430783262e-06, + "loss": 0.0068, + "step": 762520 + }, + { + "epoch": 1.98, + "learning_rate": 3.511837026706862e-06, + "loss": 0.0079, + "step": 762530 + }, + { + "epoch": 1.98, + "learning_rate": 3.5079488103353972e-06, + "loss": 0.0051, + "step": 762540 + }, + { + "epoch": 1.98, + "learning_rate": 3.5040605939639325e-06, + "loss": 0.008, + "step": 762550 + }, + { + "epoch": 1.98, + "learning_rate": 3.5001723775924682e-06, + "loss": 0.0054, + "step": 762560 + }, + { + "epoch": 1.98, + "learning_rate": 3.496284161221003e-06, + "loss": 0.0068, + "step": 762570 + }, + { + "epoch": 1.98, + "learning_rate": 3.4923959448495384e-06, + "loss": 0.008, + "step": 762580 + }, + { + "epoch": 1.98, + "learning_rate": 3.488507728478074e-06, + "loss": 0.0062, + "step": 762590 + }, + { + "epoch": 1.98, + "learning_rate": 3.4846195121066094e-06, + "loss": 0.0053, + "step": 762600 + }, + { + "epoch": 1.98, + "learning_rate": 3.480731295735145e-06, + "loss": 0.008, + "step": 762610 + }, + { + "epoch": 1.98, + "learning_rate": 3.4768430793636804e-06, + "loss": 0.0079, + "step": 762620 + }, + { + "epoch": 1.98, + "learning_rate": 3.4729548629922152e-06, + "loss": 0.0057, + "step": 762630 + }, + { + "epoch": 1.98, + "learning_rate": 3.469066646620751e-06, + "loss": 0.0046, + "step": 762640 + }, + { + "epoch": 1.98, + "learning_rate": 3.4651784302492862e-06, + "loss": 0.0058, + "step": 762650 + }, + { + "epoch": 1.98, + "learning_rate": 3.4612902138778215e-06, + "loss": 0.0073, + "step": 762660 + }, + { + "epoch": 1.98, + "learning_rate": 3.4574019975063572e-06, + "loss": 0.0072, + "step": 762670 + }, + { + "epoch": 1.98, + "learning_rate": 3.4535137811348925e-06, + "loss": 0.008, + "step": 762680 + }, + { + "epoch": 1.98, + "learning_rate": 3.4496255647634274e-06, + "loss": 0.0041, + "step": 762690 + }, + { + "epoch": 1.98, + "learning_rate": 3.445737348391963e-06, + "loss": 0.0048, + "step": 762700 + }, + { + "epoch": 1.98, + "learning_rate": 3.4418491320204984e-06, + "loss": 0.0102, + "step": 762710 + }, + { + "epoch": 1.98, + "learning_rate": 3.4379609156490336e-06, + "loss": 0.0055, + "step": 762720 + }, + { + "epoch": 1.98, + "learning_rate": 3.4340726992775694e-06, + "loss": 0.0051, + "step": 762730 + }, + { + "epoch": 1.98, + "learning_rate": 3.430184482906104e-06, + "loss": 0.0092, + "step": 762740 + }, + { + "epoch": 1.98, + "learning_rate": 3.4262962665346395e-06, + "loss": 0.0061, + "step": 762750 + }, + { + "epoch": 1.98, + "learning_rate": 3.422408050163175e-06, + "loss": 0.006, + "step": 762760 + }, + { + "epoch": 1.98, + "learning_rate": 3.4185198337917105e-06, + "loss": 0.0073, + "step": 762770 + }, + { + "epoch": 1.98, + "learning_rate": 3.414631617420246e-06, + "loss": 0.007, + "step": 762780 + }, + { + "epoch": 1.98, + "learning_rate": 3.4107434010487815e-06, + "loss": 0.0069, + "step": 762790 + }, + { + "epoch": 1.98, + "learning_rate": 3.4068551846773163e-06, + "loss": 0.0074, + "step": 762800 + }, + { + "epoch": 1.98, + "learning_rate": 3.402966968305852e-06, + "loss": 0.01, + "step": 762810 + }, + { + "epoch": 1.98, + "learning_rate": 3.3990787519343873e-06, + "loss": 0.008, + "step": 762820 + }, + { + "epoch": 1.98, + "learning_rate": 3.3951905355629226e-06, + "loss": 0.0096, + "step": 762830 + }, + { + "epoch": 1.98, + "learning_rate": 3.3913023191914583e-06, + "loss": 0.0081, + "step": 762840 + }, + { + "epoch": 1.98, + "learning_rate": 3.3874141028199936e-06, + "loss": 0.007, + "step": 762850 + }, + { + "epoch": 1.98, + "learning_rate": 3.3835258864485285e-06, + "loss": 0.0067, + "step": 762860 + }, + { + "epoch": 1.98, + "learning_rate": 3.379637670077064e-06, + "loss": 0.0062, + "step": 762870 + }, + { + "epoch": 1.98, + "learning_rate": 3.3757494537055995e-06, + "loss": 0.0077, + "step": 762880 + }, + { + "epoch": 1.98, + "learning_rate": 3.3718612373341348e-06, + "loss": 0.0054, + "step": 762890 + }, + { + "epoch": 1.98, + "learning_rate": 3.3679730209626705e-06, + "loss": 0.0083, + "step": 762900 + }, + { + "epoch": 1.98, + "learning_rate": 3.3640848045912053e-06, + "loss": 0.0072, + "step": 762910 + }, + { + "epoch": 1.98, + "learning_rate": 3.360196588219741e-06, + "loss": 0.0085, + "step": 762920 + }, + { + "epoch": 1.98, + "learning_rate": 3.3563083718482763e-06, + "loss": 0.0065, + "step": 762930 + }, + { + "epoch": 1.98, + "learning_rate": 3.3524201554768116e-06, + "loss": 0.0064, + "step": 762940 + }, + { + "epoch": 1.98, + "learning_rate": 3.3485319391053473e-06, + "loss": 0.0077, + "step": 762950 + }, + { + "epoch": 1.98, + "learning_rate": 3.3446437227338826e-06, + "loss": 0.0078, + "step": 762960 + }, + { + "epoch": 1.98, + "learning_rate": 3.3407555063624175e-06, + "loss": 0.0073, + "step": 762970 + }, + { + "epoch": 1.98, + "learning_rate": 3.336867289990953e-06, + "loss": 0.0072, + "step": 762980 + }, + { + "epoch": 1.98, + "learning_rate": 3.3329790736194885e-06, + "loss": 0.0071, + "step": 762990 + }, + { + "epoch": 1.98, + "learning_rate": 3.3290908572480237e-06, + "loss": 0.0095, + "step": 763000 + }, + { + "epoch": 1.98, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.004390762187540531, + "eval_runtime": 107.772, + "eval_samples_per_second": 18.558, + "eval_steps_per_second": 4.639, + "step": 763000 + }, + { + "epoch": 1.98, + "learning_rate": 3.3252026408765594e-06, + "loss": 0.0091, + "step": 763010 + }, + { + "epoch": 1.98, + "learning_rate": 3.3213144245050947e-06, + "loss": 0.0068, + "step": 763020 + }, + { + "epoch": 1.98, + "learning_rate": 3.3174262081336296e-06, + "loss": 0.0058, + "step": 763030 + }, + { + "epoch": 1.98, + "learning_rate": 3.3135379917621653e-06, + "loss": 0.0066, + "step": 763040 + }, + { + "epoch": 1.98, + "learning_rate": 3.3096497753907006e-06, + "loss": 0.0067, + "step": 763050 + }, + { + "epoch": 1.98, + "learning_rate": 3.305761559019236e-06, + "loss": 0.0065, + "step": 763060 + }, + { + "epoch": 1.98, + "learning_rate": 3.3018733426477716e-06, + "loss": 0.0092, + "step": 763070 + }, + { + "epoch": 1.98, + "learning_rate": 3.2979851262763064e-06, + "loss": 0.0046, + "step": 763080 + }, + { + "epoch": 1.98, + "learning_rate": 3.294096909904842e-06, + "loss": 0.0053, + "step": 763090 + }, + { + "epoch": 1.98, + "learning_rate": 3.2902086935333774e-06, + "loss": 0.0056, + "step": 763100 + }, + { + "epoch": 1.98, + "learning_rate": 3.2863204771619127e-06, + "loss": 0.0059, + "step": 763110 + }, + { + "epoch": 1.98, + "learning_rate": 3.2824322607904484e-06, + "loss": 0.0062, + "step": 763120 + }, + { + "epoch": 1.98, + "learning_rate": 3.2785440444189837e-06, + "loss": 0.0068, + "step": 763130 + }, + { + "epoch": 1.98, + "learning_rate": 3.2746558280475186e-06, + "loss": 0.0091, + "step": 763140 + }, + { + "epoch": 1.98, + "learning_rate": 3.2707676116760543e-06, + "loss": 0.006, + "step": 763150 + }, + { + "epoch": 1.98, + "learning_rate": 3.2668793953045896e-06, + "loss": 0.0085, + "step": 763160 + }, + { + "epoch": 1.98, + "learning_rate": 3.262991178933125e-06, + "loss": 0.0065, + "step": 763170 + }, + { + "epoch": 1.98, + "learning_rate": 3.2591029625616606e-06, + "loss": 0.0052, + "step": 763180 + }, + { + "epoch": 1.98, + "learning_rate": 3.255214746190196e-06, + "loss": 0.0084, + "step": 763190 + }, + { + "epoch": 1.98, + "learning_rate": 3.2513265298187307e-06, + "loss": 0.004, + "step": 763200 + }, + { + "epoch": 1.98, + "learning_rate": 3.2474383134472664e-06, + "loss": 0.0055, + "step": 763210 + }, + { + "epoch": 1.98, + "learning_rate": 3.2435500970758017e-06, + "loss": 0.0065, + "step": 763220 + }, + { + "epoch": 1.98, + "learning_rate": 3.2396618807043374e-06, + "loss": 0.0096, + "step": 763230 + }, + { + "epoch": 1.98, + "learning_rate": 3.2357736643328727e-06, + "loss": 0.0058, + "step": 763240 + }, + { + "epoch": 1.98, + "learning_rate": 3.2318854479614076e-06, + "loss": 0.0089, + "step": 763250 + }, + { + "epoch": 1.98, + "learning_rate": 3.2279972315899433e-06, + "loss": 0.0059, + "step": 763260 + }, + { + "epoch": 1.98, + "learning_rate": 3.2241090152184786e-06, + "loss": 0.0061, + "step": 763270 + }, + { + "epoch": 1.98, + "learning_rate": 3.220220798847014e-06, + "loss": 0.0076, + "step": 763280 + }, + { + "epoch": 1.98, + "learning_rate": 3.2163325824755495e-06, + "loss": 0.007, + "step": 763290 + }, + { + "epoch": 1.98, + "learning_rate": 3.212444366104085e-06, + "loss": 0.0061, + "step": 763300 + }, + { + "epoch": 1.98, + "learning_rate": 3.2085561497326197e-06, + "loss": 0.0067, + "step": 763310 + }, + { + "epoch": 1.98, + "learning_rate": 3.2046679333611554e-06, + "loss": 0.0072, + "step": 763320 + }, + { + "epoch": 1.98, + "learning_rate": 3.2007797169896907e-06, + "loss": 0.0066, + "step": 763330 + }, + { + "epoch": 1.98, + "learning_rate": 3.196891500618226e-06, + "loss": 0.0099, + "step": 763340 + }, + { + "epoch": 1.98, + "learning_rate": 3.1930032842467617e-06, + "loss": 0.0083, + "step": 763350 + }, + { + "epoch": 1.98, + "learning_rate": 3.189115067875297e-06, + "loss": 0.0079, + "step": 763360 + }, + { + "epoch": 1.98, + "learning_rate": 3.185226851503832e-06, + "loss": 0.0062, + "step": 763370 + }, + { + "epoch": 1.98, + "learning_rate": 3.1813386351323675e-06, + "loss": 0.0076, + "step": 763380 + }, + { + "epoch": 1.98, + "learning_rate": 3.177450418760903e-06, + "loss": 0.0087, + "step": 763390 + }, + { + "epoch": 1.98, + "learning_rate": 3.1735622023894385e-06, + "loss": 0.0054, + "step": 763400 + }, + { + "epoch": 1.98, + "learning_rate": 3.169673986017974e-06, + "loss": 0.0063, + "step": 763410 + }, + { + "epoch": 1.98, + "learning_rate": 3.1657857696465087e-06, + "loss": 0.0062, + "step": 763420 + }, + { + "epoch": 1.98, + "learning_rate": 3.1618975532750444e-06, + "loss": 0.007, + "step": 763430 + }, + { + "epoch": 1.98, + "learning_rate": 3.1580093369035797e-06, + "loss": 0.0061, + "step": 763440 + }, + { + "epoch": 1.98, + "learning_rate": 3.154121120532115e-06, + "loss": 0.0082, + "step": 763450 + }, + { + "epoch": 1.98, + "learning_rate": 3.1502329041606507e-06, + "loss": 0.0074, + "step": 763460 + }, + { + "epoch": 1.98, + "learning_rate": 3.146344687789186e-06, + "loss": 0.0064, + "step": 763470 + }, + { + "epoch": 1.98, + "learning_rate": 3.142456471417721e-06, + "loss": 0.0067, + "step": 763480 + }, + { + "epoch": 1.98, + "learning_rate": 3.1385682550462565e-06, + "loss": 0.0069, + "step": 763490 + }, + { + "epoch": 1.98, + "learning_rate": 3.134680038674792e-06, + "loss": 0.0068, + "step": 763500 + }, + { + "epoch": 1.98, + "learning_rate": 3.130791822303327e-06, + "loss": 0.005, + "step": 763510 + }, + { + "epoch": 1.98, + "learning_rate": 3.126903605931863e-06, + "loss": 0.0058, + "step": 763520 + }, + { + "epoch": 1.98, + "learning_rate": 3.123015389560398e-06, + "loss": 0.0076, + "step": 763530 + }, + { + "epoch": 1.98, + "learning_rate": 3.119127173188934e-06, + "loss": 0.0078, + "step": 763540 + }, + { + "epoch": 1.98, + "learning_rate": 3.1152389568174687e-06, + "loss": 0.0057, + "step": 763550 + }, + { + "epoch": 1.98, + "learning_rate": 3.111350740446004e-06, + "loss": 0.0057, + "step": 763560 + }, + { + "epoch": 1.98, + "learning_rate": 3.1074625240745396e-06, + "loss": 0.0065, + "step": 763570 + }, + { + "epoch": 1.98, + "learning_rate": 3.103574307703075e-06, + "loss": 0.0076, + "step": 763580 + }, + { + "epoch": 1.98, + "learning_rate": 3.09968609133161e-06, + "loss": 0.0064, + "step": 763590 + }, + { + "epoch": 1.98, + "learning_rate": 3.0957978749601455e-06, + "loss": 0.0104, + "step": 763600 + }, + { + "epoch": 1.98, + "learning_rate": 3.0919096585886808e-06, + "loss": 0.008, + "step": 763610 + }, + { + "epoch": 1.98, + "learning_rate": 3.088021442217216e-06, + "loss": 0.0061, + "step": 763620 + }, + { + "epoch": 1.98, + "learning_rate": 3.0841332258457518e-06, + "loss": 0.0067, + "step": 763630 + }, + { + "epoch": 1.98, + "learning_rate": 3.080245009474287e-06, + "loss": 0.0094, + "step": 763640 + }, + { + "epoch": 1.98, + "learning_rate": 3.076356793102822e-06, + "loss": 0.0056, + "step": 763650 + }, + { + "epoch": 1.98, + "learning_rate": 3.0724685767313576e-06, + "loss": 0.0056, + "step": 763660 + }, + { + "epoch": 1.98, + "learning_rate": 3.068580360359893e-06, + "loss": 0.0084, + "step": 763670 + }, + { + "epoch": 1.98, + "learning_rate": 3.064692143988428e-06, + "loss": 0.0061, + "step": 763680 + }, + { + "epoch": 1.98, + "learning_rate": 3.060803927616964e-06, + "loss": 0.0061, + "step": 763690 + }, + { + "epoch": 1.98, + "learning_rate": 3.056915711245499e-06, + "loss": 0.0103, + "step": 763700 + }, + { + "epoch": 1.98, + "learning_rate": 3.053027494874035e-06, + "loss": 0.0086, + "step": 763710 + }, + { + "epoch": 1.98, + "learning_rate": 3.0491392785025698e-06, + "loss": 0.0077, + "step": 763720 + }, + { + "epoch": 1.98, + "learning_rate": 3.045251062131105e-06, + "loss": 0.0073, + "step": 763730 + }, + { + "epoch": 1.98, + "learning_rate": 3.0413628457596408e-06, + "loss": 0.0071, + "step": 763740 + }, + { + "epoch": 1.98, + "learning_rate": 3.037474629388176e-06, + "loss": 0.005, + "step": 763750 + }, + { + "epoch": 1.98, + "learning_rate": 3.033586413016711e-06, + "loss": 0.0059, + "step": 763760 + }, + { + "epoch": 1.98, + "learning_rate": 3.0296981966452466e-06, + "loss": 0.0097, + "step": 763770 + }, + { + "epoch": 1.98, + "learning_rate": 3.025809980273782e-06, + "loss": 0.0075, + "step": 763780 + }, + { + "epoch": 1.98, + "learning_rate": 3.021921763902317e-06, + "loss": 0.0061, + "step": 763790 + }, + { + "epoch": 1.98, + "learning_rate": 3.018033547530853e-06, + "loss": 0.0068, + "step": 763800 + }, + { + "epoch": 1.98, + "learning_rate": 3.014145331159388e-06, + "loss": 0.0088, + "step": 763810 + }, + { + "epoch": 1.98, + "learning_rate": 3.010257114787923e-06, + "loss": 0.006, + "step": 763820 + }, + { + "epoch": 1.98, + "learning_rate": 3.0063688984164587e-06, + "loss": 0.007, + "step": 763830 + }, + { + "epoch": 1.98, + "learning_rate": 3.002480682044994e-06, + "loss": 0.0075, + "step": 763840 + }, + { + "epoch": 1.98, + "learning_rate": 2.9985924656735297e-06, + "loss": 0.0083, + "step": 763850 + }, + { + "epoch": 1.98, + "learning_rate": 2.994704249302065e-06, + "loss": 0.0071, + "step": 763860 + }, + { + "epoch": 1.98, + "learning_rate": 2.9908160329306003e-06, + "loss": 0.0075, + "step": 763870 + }, + { + "epoch": 1.98, + "learning_rate": 2.986927816559136e-06, + "loss": 0.0095, + "step": 763880 + }, + { + "epoch": 1.98, + "learning_rate": 2.983039600187671e-06, + "loss": 0.0059, + "step": 763890 + }, + { + "epoch": 1.98, + "learning_rate": 2.979151383816206e-06, + "loss": 0.0063, + "step": 763900 + }, + { + "epoch": 1.98, + "learning_rate": 2.975263167444742e-06, + "loss": 0.0055, + "step": 763910 + }, + { + "epoch": 1.98, + "learning_rate": 2.971374951073277e-06, + "loss": 0.0073, + "step": 763920 + }, + { + "epoch": 1.98, + "learning_rate": 2.967486734701812e-06, + "loss": 0.0089, + "step": 763930 + }, + { + "epoch": 1.98, + "learning_rate": 2.9635985183303477e-06, + "loss": 0.0083, + "step": 763940 + }, + { + "epoch": 1.98, + "learning_rate": 2.959710301958883e-06, + "loss": 0.0069, + "step": 763950 + }, + { + "epoch": 1.98, + "learning_rate": 2.9558220855874183e-06, + "loss": 0.0103, + "step": 763960 + }, + { + "epoch": 1.98, + "learning_rate": 2.951933869215954e-06, + "loss": 0.0056, + "step": 763970 + }, + { + "epoch": 1.98, + "learning_rate": 2.9480456528444893e-06, + "loss": 0.0071, + "step": 763980 + }, + { + "epoch": 1.98, + "learning_rate": 2.944157436473025e-06, + "loss": 0.0088, + "step": 763990 + }, + { + "epoch": 1.98, + "learning_rate": 2.94026922010156e-06, + "loss": 0.0063, + "step": 764000 + }, + { + "epoch": 1.98, + "eval_cer": 0.8816872903168917, + "eval_loss": 0.004406400490552187, + "eval_runtime": 107.9975, + "eval_samples_per_second": 18.519, + "eval_steps_per_second": 4.63, + "step": 764000 + }, + { + "epoch": 1.98, + "learning_rate": 2.936381003730095e-06, + "loss": 0.0069, + "step": 764010 + }, + { + "epoch": 1.98, + "learning_rate": 2.932492787358631e-06, + "loss": 0.0057, + "step": 764020 + }, + { + "epoch": 1.98, + "learning_rate": 2.928604570987166e-06, + "loss": 0.0065, + "step": 764030 + }, + { + "epoch": 1.98, + "learning_rate": 2.9247163546157014e-06, + "loss": 0.0085, + "step": 764040 + }, + { + "epoch": 1.98, + "learning_rate": 2.920828138244237e-06, + "loss": 0.0103, + "step": 764050 + }, + { + "epoch": 1.98, + "learning_rate": 2.916939921872772e-06, + "loss": 0.0075, + "step": 764060 + }, + { + "epoch": 1.98, + "learning_rate": 2.9130517055013073e-06, + "loss": 0.0057, + "step": 764070 + }, + { + "epoch": 1.98, + "learning_rate": 2.909163489129843e-06, + "loss": 0.007, + "step": 764080 + }, + { + "epoch": 1.98, + "learning_rate": 2.9052752727583783e-06, + "loss": 0.0073, + "step": 764090 + }, + { + "epoch": 1.98, + "learning_rate": 2.901387056386913e-06, + "loss": 0.0086, + "step": 764100 + }, + { + "epoch": 1.98, + "learning_rate": 2.897498840015449e-06, + "loss": 0.0061, + "step": 764110 + }, + { + "epoch": 1.98, + "learning_rate": 2.893610623643984e-06, + "loss": 0.0067, + "step": 764120 + }, + { + "epoch": 1.98, + "learning_rate": 2.8897224072725194e-06, + "loss": 0.006, + "step": 764130 + }, + { + "epoch": 1.98, + "learning_rate": 2.885834190901055e-06, + "loss": 0.0052, + "step": 764140 + }, + { + "epoch": 1.98, + "learning_rate": 2.8819459745295904e-06, + "loss": 0.0059, + "step": 764150 + }, + { + "epoch": 1.98, + "learning_rate": 2.878057758158126e-06, + "loss": 0.0073, + "step": 764160 + }, + { + "epoch": 1.98, + "learning_rate": 2.874169541786661e-06, + "loss": 0.0058, + "step": 764170 + }, + { + "epoch": 1.98, + "learning_rate": 2.8702813254151963e-06, + "loss": 0.0105, + "step": 764180 + }, + { + "epoch": 1.98, + "learning_rate": 2.866393109043732e-06, + "loss": 0.0102, + "step": 764190 + }, + { + "epoch": 1.98, + "learning_rate": 2.8625048926722673e-06, + "loss": 0.0059, + "step": 764200 + }, + { + "epoch": 1.98, + "learning_rate": 2.8586166763008025e-06, + "loss": 0.0056, + "step": 764210 + }, + { + "epoch": 1.98, + "learning_rate": 2.8547284599293383e-06, + "loss": 0.0068, + "step": 764220 + }, + { + "epoch": 1.98, + "learning_rate": 2.850840243557873e-06, + "loss": 0.0069, + "step": 764230 + }, + { + "epoch": 1.98, + "learning_rate": 2.8469520271864084e-06, + "loss": 0.007, + "step": 764240 + }, + { + "epoch": 1.98, + "learning_rate": 2.843063810814944e-06, + "loss": 0.0046, + "step": 764250 + }, + { + "epoch": 1.98, + "learning_rate": 2.8391755944434794e-06, + "loss": 0.0074, + "step": 764260 + }, + { + "epoch": 1.98, + "learning_rate": 2.8352873780720147e-06, + "loss": 0.0083, + "step": 764270 + }, + { + "epoch": 1.98, + "learning_rate": 2.83139916170055e-06, + "loss": 0.005, + "step": 764280 + }, + { + "epoch": 1.98, + "learning_rate": 2.8275109453290852e-06, + "loss": 0.0076, + "step": 764290 + }, + { + "epoch": 1.98, + "learning_rate": 2.823622728957621e-06, + "loss": 0.0094, + "step": 764300 + }, + { + "epoch": 1.98, + "learning_rate": 2.8197345125861562e-06, + "loss": 0.0069, + "step": 764310 + }, + { + "epoch": 1.98, + "learning_rate": 2.8158462962146915e-06, + "loss": 0.0083, + "step": 764320 + }, + { + "epoch": 1.98, + "learning_rate": 2.8119580798432272e-06, + "loss": 0.0085, + "step": 764330 + }, + { + "epoch": 1.98, + "learning_rate": 2.808069863471762e-06, + "loss": 0.0088, + "step": 764340 + }, + { + "epoch": 1.98, + "learning_rate": 2.8041816471002974e-06, + "loss": 0.0116, + "step": 764350 + }, + { + "epoch": 1.98, + "learning_rate": 2.800293430728833e-06, + "loss": 0.0079, + "step": 764360 + }, + { + "epoch": 1.98, + "learning_rate": 2.7964052143573684e-06, + "loss": 0.0082, + "step": 764370 + }, + { + "epoch": 1.98, + "learning_rate": 2.7925169979859037e-06, + "loss": 0.01, + "step": 764380 + }, + { + "epoch": 1.98, + "learning_rate": 2.7886287816144394e-06, + "loss": 0.0063, + "step": 764390 + }, + { + "epoch": 1.98, + "learning_rate": 2.7847405652429742e-06, + "loss": 0.0062, + "step": 764400 + }, + { + "epoch": 1.98, + "learning_rate": 2.7808523488715095e-06, + "loss": 0.0064, + "step": 764410 + }, + { + "epoch": 1.98, + "learning_rate": 2.7769641325000452e-06, + "loss": 0.0075, + "step": 764420 + }, + { + "epoch": 1.98, + "learning_rate": 2.7730759161285805e-06, + "loss": 0.0055, + "step": 764430 + }, + { + "epoch": 1.98, + "learning_rate": 2.769187699757116e-06, + "loss": 0.0072, + "step": 764440 + }, + { + "epoch": 1.98, + "learning_rate": 2.765299483385651e-06, + "loss": 0.005, + "step": 764450 + }, + { + "epoch": 1.98, + "learning_rate": 2.7614112670141864e-06, + "loss": 0.0052, + "step": 764460 + }, + { + "epoch": 1.98, + "learning_rate": 2.757523050642722e-06, + "loss": 0.0063, + "step": 764470 + }, + { + "epoch": 1.98, + "learning_rate": 2.7536348342712574e-06, + "loss": 0.0067, + "step": 764480 + }, + { + "epoch": 1.98, + "learning_rate": 2.7497466178997926e-06, + "loss": 0.0061, + "step": 764490 + }, + { + "epoch": 1.98, + "learning_rate": 2.7458584015283284e-06, + "loss": 0.007, + "step": 764500 + }, + { + "epoch": 1.98, + "learning_rate": 2.7419701851568632e-06, + "loss": 0.0058, + "step": 764510 + }, + { + "epoch": 1.98, + "learning_rate": 2.7380819687853985e-06, + "loss": 0.0055, + "step": 764520 + }, + { + "epoch": 1.98, + "learning_rate": 2.734193752413934e-06, + "loss": 0.0053, + "step": 764530 + }, + { + "epoch": 1.98, + "learning_rate": 2.7303055360424695e-06, + "loss": 0.0057, + "step": 764540 + }, + { + "epoch": 1.98, + "learning_rate": 2.7264173196710048e-06, + "loss": 0.0071, + "step": 764550 + }, + { + "epoch": 1.98, + "learning_rate": 2.7225291032995405e-06, + "loss": 0.0063, + "step": 764560 + }, + { + "epoch": 1.98, + "learning_rate": 2.7186408869280753e-06, + "loss": 0.0059, + "step": 764570 + }, + { + "epoch": 1.98, + "learning_rate": 2.7147526705566106e-06, + "loss": 0.0076, + "step": 764580 + }, + { + "epoch": 1.98, + "learning_rate": 2.7108644541851463e-06, + "loss": 0.0093, + "step": 764590 + }, + { + "epoch": 1.98, + "learning_rate": 2.7069762378136816e-06, + "loss": 0.008, + "step": 764600 + }, + { + "epoch": 1.98, + "learning_rate": 2.7030880214422173e-06, + "loss": 0.0086, + "step": 764610 + }, + { + "epoch": 1.98, + "learning_rate": 2.699199805070752e-06, + "loss": 0.0082, + "step": 764620 + }, + { + "epoch": 1.98, + "learning_rate": 2.6953115886992875e-06, + "loss": 0.0063, + "step": 764630 + }, + { + "epoch": 1.98, + "learning_rate": 2.691423372327823e-06, + "loss": 0.0065, + "step": 764640 + }, + { + "epoch": 1.98, + "learning_rate": 2.6875351559563585e-06, + "loss": 0.0074, + "step": 764650 + }, + { + "epoch": 1.98, + "learning_rate": 2.6836469395848938e-06, + "loss": 0.0072, + "step": 764660 + }, + { + "epoch": 1.98, + "learning_rate": 2.6797587232134295e-06, + "loss": 0.0076, + "step": 764670 + }, + { + "epoch": 1.98, + "learning_rate": 2.6758705068419643e-06, + "loss": 0.0078, + "step": 764680 + }, + { + "epoch": 1.98, + "learning_rate": 2.6719822904704996e-06, + "loss": 0.0071, + "step": 764690 + }, + { + "epoch": 1.98, + "learning_rate": 2.6680940740990353e-06, + "loss": 0.0053, + "step": 764700 + }, + { + "epoch": 1.98, + "learning_rate": 2.6642058577275706e-06, + "loss": 0.0065, + "step": 764710 + }, + { + "epoch": 1.98, + "learning_rate": 2.660317641356106e-06, + "loss": 0.0065, + "step": 764720 + }, + { + "epoch": 1.98, + "learning_rate": 2.6564294249846416e-06, + "loss": 0.0092, + "step": 764730 + }, + { + "epoch": 1.98, + "learning_rate": 2.6525412086131765e-06, + "loss": 0.0083, + "step": 764740 + }, + { + "epoch": 1.98, + "learning_rate": 2.6486529922417117e-06, + "loss": 0.0073, + "step": 764750 + }, + { + "epoch": 1.98, + "learning_rate": 2.6447647758702475e-06, + "loss": 0.0071, + "step": 764760 + }, + { + "epoch": 1.98, + "learning_rate": 2.6408765594987827e-06, + "loss": 0.0053, + "step": 764770 + }, + { + "epoch": 1.98, + "learning_rate": 2.6369883431273185e-06, + "loss": 0.008, + "step": 764780 + }, + { + "epoch": 1.98, + "learning_rate": 2.6331001267558533e-06, + "loss": 0.0083, + "step": 764790 + }, + { + "epoch": 1.98, + "learning_rate": 2.6292119103843886e-06, + "loss": 0.0087, + "step": 764800 + }, + { + "epoch": 1.98, + "learning_rate": 2.6253236940129243e-06, + "loss": 0.0092, + "step": 764810 + }, + { + "epoch": 1.98, + "learning_rate": 2.6214354776414596e-06, + "loss": 0.0061, + "step": 764820 + }, + { + "epoch": 1.98, + "learning_rate": 2.617547261269995e-06, + "loss": 0.0058, + "step": 764830 + }, + { + "epoch": 1.98, + "learning_rate": 2.6136590448985306e-06, + "loss": 0.0068, + "step": 764840 + }, + { + "epoch": 1.98, + "learning_rate": 2.6097708285270654e-06, + "loss": 0.0062, + "step": 764850 + }, + { + "epoch": 1.98, + "learning_rate": 2.6058826121556007e-06, + "loss": 0.0091, + "step": 764860 + }, + { + "epoch": 1.98, + "learning_rate": 2.6019943957841364e-06, + "loss": 0.0067, + "step": 764870 + }, + { + "epoch": 1.98, + "learning_rate": 2.5981061794126717e-06, + "loss": 0.0066, + "step": 764880 + }, + { + "epoch": 1.98, + "learning_rate": 2.594217963041207e-06, + "loss": 0.0064, + "step": 764890 + }, + { + "epoch": 1.98, + "learning_rate": 2.5903297466697427e-06, + "loss": 0.0077, + "step": 764900 + }, + { + "epoch": 1.98, + "learning_rate": 2.5864415302982776e-06, + "loss": 0.0064, + "step": 764910 + }, + { + "epoch": 1.98, + "learning_rate": 2.5825533139268133e-06, + "loss": 0.0066, + "step": 764920 + }, + { + "epoch": 1.98, + "learning_rate": 2.5786650975553486e-06, + "loss": 0.0065, + "step": 764930 + }, + { + "epoch": 1.98, + "learning_rate": 2.574776881183884e-06, + "loss": 0.0069, + "step": 764940 + }, + { + "epoch": 1.98, + "learning_rate": 2.5708886648124196e-06, + "loss": 0.0076, + "step": 764950 + }, + { + "epoch": 1.98, + "learning_rate": 2.567000448440955e-06, + "loss": 0.0067, + "step": 764960 + }, + { + "epoch": 1.98, + "learning_rate": 2.5631122320694897e-06, + "loss": 0.0054, + "step": 764970 + }, + { + "epoch": 1.98, + "learning_rate": 2.5592240156980254e-06, + "loss": 0.0072, + "step": 764980 + }, + { + "epoch": 1.98, + "learning_rate": 2.5553357993265607e-06, + "loss": 0.0092, + "step": 764990 + }, + { + "epoch": 1.98, + "learning_rate": 2.551447582955096e-06, + "loss": 0.0062, + "step": 765000 + }, + { + "epoch": 1.98, + "eval_cer": 0.8816942885015627, + "eval_loss": 0.004388539120554924, + "eval_runtime": 107.9641, + "eval_samples_per_second": 18.525, + "eval_steps_per_second": 4.631, + "step": 765000 + }, + { + "epoch": 1.98, + "learning_rate": 2.5475593665836317e-06, + "loss": 0.0057, + "step": 765010 + }, + { + "epoch": 1.98, + "learning_rate": 2.5436711502121666e-06, + "loss": 0.0068, + "step": 765020 + }, + { + "epoch": 1.98, + "learning_rate": 2.539782933840702e-06, + "loss": 0.0075, + "step": 765030 + }, + { + "epoch": 1.98, + "learning_rate": 2.5358947174692376e-06, + "loss": 0.0046, + "step": 765040 + }, + { + "epoch": 1.98, + "learning_rate": 2.532006501097773e-06, + "loss": 0.0071, + "step": 765050 + }, + { + "epoch": 1.98, + "learning_rate": 2.5281182847263085e-06, + "loss": 0.0069, + "step": 765060 + }, + { + "epoch": 1.98, + "learning_rate": 2.524230068354844e-06, + "loss": 0.0082, + "step": 765070 + }, + { + "epoch": 1.98, + "learning_rate": 2.5203418519833787e-06, + "loss": 0.0069, + "step": 765080 + }, + { + "epoch": 1.98, + "learning_rate": 2.5164536356119144e-06, + "loss": 0.0084, + "step": 765090 + }, + { + "epoch": 1.98, + "learning_rate": 2.5125654192404497e-06, + "loss": 0.0054, + "step": 765100 + }, + { + "epoch": 1.98, + "learning_rate": 2.508677202868985e-06, + "loss": 0.0072, + "step": 765110 + }, + { + "epoch": 1.98, + "learning_rate": 2.5047889864975207e-06, + "loss": 0.0042, + "step": 765120 + }, + { + "epoch": 1.98, + "learning_rate": 2.500900770126056e-06, + "loss": 0.0046, + "step": 765130 + }, + { + "epoch": 1.98, + "learning_rate": 2.497012553754591e-06, + "loss": 0.0061, + "step": 765140 + }, + { + "epoch": 1.98, + "learning_rate": 2.4931243373831265e-06, + "loss": 0.0075, + "step": 765150 + }, + { + "epoch": 1.98, + "learning_rate": 2.489236121011662e-06, + "loss": 0.0079, + "step": 765160 + }, + { + "epoch": 1.98, + "learning_rate": 2.485347904640197e-06, + "loss": 0.0075, + "step": 765170 + }, + { + "epoch": 1.98, + "learning_rate": 2.481459688268733e-06, + "loss": 0.0082, + "step": 765180 + }, + { + "epoch": 1.98, + "learning_rate": 2.4775714718972677e-06, + "loss": 0.0061, + "step": 765190 + }, + { + "epoch": 1.98, + "learning_rate": 2.473683255525803e-06, + "loss": 0.0096, + "step": 765200 + }, + { + "epoch": 1.98, + "learning_rate": 2.4697950391543387e-06, + "loss": 0.0078, + "step": 765210 + }, + { + "epoch": 1.98, + "learning_rate": 2.465906822782874e-06, + "loss": 0.0061, + "step": 765220 + }, + { + "epoch": 1.98, + "learning_rate": 2.4620186064114097e-06, + "loss": 0.0062, + "step": 765230 + }, + { + "epoch": 1.98, + "learning_rate": 2.458130390039945e-06, + "loss": 0.0063, + "step": 765240 + }, + { + "epoch": 1.98, + "learning_rate": 2.45424217366848e-06, + "loss": 0.0059, + "step": 765250 + }, + { + "epoch": 1.98, + "learning_rate": 2.4503539572970155e-06, + "loss": 0.0073, + "step": 765260 + }, + { + "epoch": 1.98, + "learning_rate": 2.446465740925551e-06, + "loss": 0.0064, + "step": 765270 + }, + { + "epoch": 1.98, + "learning_rate": 2.442577524554086e-06, + "loss": 0.0076, + "step": 765280 + }, + { + "epoch": 1.98, + "learning_rate": 2.438689308182622e-06, + "loss": 0.0068, + "step": 765290 + }, + { + "epoch": 1.98, + "learning_rate": 2.434801091811157e-06, + "loss": 0.0077, + "step": 765300 + }, + { + "epoch": 1.98, + "learning_rate": 2.430912875439692e-06, + "loss": 0.0062, + "step": 765310 + }, + { + "epoch": 1.98, + "learning_rate": 2.4270246590682277e-06, + "loss": 0.0066, + "step": 765320 + }, + { + "epoch": 1.98, + "learning_rate": 2.423136442696763e-06, + "loss": 0.006, + "step": 765330 + }, + { + "epoch": 1.98, + "learning_rate": 2.4192482263252982e-06, + "loss": 0.0095, + "step": 765340 + }, + { + "epoch": 1.98, + "learning_rate": 2.415360009953834e-06, + "loss": 0.0088, + "step": 765350 + }, + { + "epoch": 1.98, + "learning_rate": 2.411471793582369e-06, + "loss": 0.0073, + "step": 765360 + }, + { + "epoch": 1.98, + "learning_rate": 2.4075835772109045e-06, + "loss": 0.0084, + "step": 765370 + }, + { + "epoch": 1.98, + "learning_rate": 2.4036953608394398e-06, + "loss": 0.0087, + "step": 765380 + }, + { + "epoch": 1.98, + "learning_rate": 2.399807144467975e-06, + "loss": 0.0079, + "step": 765390 + }, + { + "epoch": 1.98, + "learning_rate": 2.3959189280965108e-06, + "loss": 0.0058, + "step": 765400 + }, + { + "epoch": 1.98, + "learning_rate": 2.392030711725046e-06, + "loss": 0.0059, + "step": 765410 + }, + { + "epoch": 1.98, + "learning_rate": 2.388142495353581e-06, + "loss": 0.0061, + "step": 765420 + }, + { + "epoch": 1.98, + "learning_rate": 2.3842542789821166e-06, + "loss": 0.0079, + "step": 765430 + }, + { + "epoch": 1.98, + "learning_rate": 2.380366062610652e-06, + "loss": 0.0051, + "step": 765440 + }, + { + "epoch": 1.98, + "learning_rate": 2.376477846239187e-06, + "loss": 0.0071, + "step": 765450 + }, + { + "epoch": 1.98, + "learning_rate": 2.372589629867723e-06, + "loss": 0.0047, + "step": 765460 + }, + { + "epoch": 1.98, + "learning_rate": 2.368701413496258e-06, + "loss": 0.0037, + "step": 765470 + }, + { + "epoch": 1.98, + "learning_rate": 2.364813197124793e-06, + "loss": 0.0073, + "step": 765480 + }, + { + "epoch": 1.98, + "learning_rate": 2.3609249807533288e-06, + "loss": 0.006, + "step": 765490 + }, + { + "epoch": 1.98, + "learning_rate": 2.357036764381864e-06, + "loss": 0.006, + "step": 765500 + }, + { + "epoch": 1.98, + "learning_rate": 2.3531485480103993e-06, + "loss": 0.007, + "step": 765510 + }, + { + "epoch": 1.98, + "learning_rate": 2.349260331638935e-06, + "loss": 0.0068, + "step": 765520 + }, + { + "epoch": 1.98, + "learning_rate": 2.34537211526747e-06, + "loss": 0.0077, + "step": 765530 + }, + { + "epoch": 1.98, + "learning_rate": 2.3414838988960056e-06, + "loss": 0.0057, + "step": 765540 + }, + { + "epoch": 1.98, + "learning_rate": 2.337595682524541e-06, + "loss": 0.0068, + "step": 765550 + }, + { + "epoch": 1.98, + "learning_rate": 2.3337074661530766e-06, + "loss": 0.0099, + "step": 765560 + }, + { + "epoch": 1.98, + "learning_rate": 2.3298192497816115e-06, + "loss": 0.0061, + "step": 765570 + }, + { + "epoch": 1.98, + "learning_rate": 2.325931033410147e-06, + "loss": 0.0101, + "step": 765580 + }, + { + "epoch": 1.98, + "learning_rate": 2.3220428170386825e-06, + "loss": 0.0069, + "step": 765590 + }, + { + "epoch": 1.98, + "learning_rate": 2.3181546006672178e-06, + "loss": 0.0064, + "step": 765600 + }, + { + "epoch": 1.98, + "learning_rate": 2.314266384295753e-06, + "loss": 0.006, + "step": 765610 + }, + { + "epoch": 1.98, + "learning_rate": 2.3103781679242883e-06, + "loss": 0.0066, + "step": 765620 + }, + { + "epoch": 1.98, + "learning_rate": 2.3064899515528236e-06, + "loss": 0.0045, + "step": 765630 + }, + { + "epoch": 1.98, + "learning_rate": 2.3026017351813593e-06, + "loss": 0.0069, + "step": 765640 + }, + { + "epoch": 1.98, + "learning_rate": 2.2987135188098946e-06, + "loss": 0.0058, + "step": 765650 + }, + { + "epoch": 1.98, + "learning_rate": 2.29482530243843e-06, + "loss": 0.0062, + "step": 765660 + }, + { + "epoch": 1.98, + "learning_rate": 2.290937086066965e-06, + "loss": 0.0074, + "step": 765670 + }, + { + "epoch": 1.98, + "learning_rate": 2.2870488696955005e-06, + "loss": 0.0066, + "step": 765680 + }, + { + "epoch": 1.98, + "learning_rate": 2.283160653324036e-06, + "loss": 0.0069, + "step": 765690 + }, + { + "epoch": 1.98, + "learning_rate": 2.279272436952571e-06, + "loss": 0.0076, + "step": 765700 + }, + { + "epoch": 1.98, + "learning_rate": 2.2753842205811067e-06, + "loss": 0.0067, + "step": 765710 + }, + { + "epoch": 1.98, + "learning_rate": 2.271496004209642e-06, + "loss": 0.0073, + "step": 765720 + }, + { + "epoch": 1.98, + "learning_rate": 2.2676077878381777e-06, + "loss": 0.0066, + "step": 765730 + }, + { + "epoch": 1.98, + "learning_rate": 2.2637195714667126e-06, + "loss": 0.0078, + "step": 765740 + }, + { + "epoch": 1.98, + "learning_rate": 2.2598313550952483e-06, + "loss": 0.0074, + "step": 765750 + }, + { + "epoch": 1.98, + "learning_rate": 2.2559431387237836e-06, + "loss": 0.0093, + "step": 765760 + }, + { + "epoch": 1.98, + "learning_rate": 2.252054922352319e-06, + "loss": 0.0051, + "step": 765770 + }, + { + "epoch": 1.99, + "learning_rate": 2.248166705980854e-06, + "loss": 0.006, + "step": 765780 + }, + { + "epoch": 1.99, + "learning_rate": 2.2442784896093894e-06, + "loss": 0.006, + "step": 765790 + }, + { + "epoch": 1.99, + "learning_rate": 2.240390273237925e-06, + "loss": 0.0049, + "step": 765800 + }, + { + "epoch": 1.99, + "learning_rate": 2.2365020568664604e-06, + "loss": 0.0064, + "step": 765810 + }, + { + "epoch": 1.99, + "learning_rate": 2.2326138404949957e-06, + "loss": 0.0069, + "step": 765820 + }, + { + "epoch": 1.99, + "learning_rate": 2.228725624123531e-06, + "loss": 0.0058, + "step": 765830 + }, + { + "epoch": 1.99, + "learning_rate": 2.2248374077520663e-06, + "loss": 0.0057, + "step": 765840 + }, + { + "epoch": 1.99, + "learning_rate": 2.2209491913806016e-06, + "loss": 0.0049, + "step": 765850 + }, + { + "epoch": 1.99, + "learning_rate": 2.2170609750091373e-06, + "loss": 0.0131, + "step": 765860 + }, + { + "epoch": 1.99, + "learning_rate": 2.2131727586376726e-06, + "loss": 0.0057, + "step": 765870 + }, + { + "epoch": 1.99, + "learning_rate": 2.209284542266208e-06, + "loss": 0.0082, + "step": 765880 + }, + { + "epoch": 1.99, + "learning_rate": 2.205396325894743e-06, + "loss": 0.005, + "step": 765890 + }, + { + "epoch": 1.99, + "learning_rate": 2.201508109523279e-06, + "loss": 0.007, + "step": 765900 + }, + { + "epoch": 1.99, + "learning_rate": 2.1976198931518137e-06, + "loss": 0.0071, + "step": 765910 + }, + { + "epoch": 1.99, + "learning_rate": 2.1937316767803494e-06, + "loss": 0.0054, + "step": 765920 + }, + { + "epoch": 1.99, + "learning_rate": 2.1898434604088847e-06, + "loss": 0.0069, + "step": 765930 + }, + { + "epoch": 1.99, + "learning_rate": 2.18595524403742e-06, + "loss": 0.0082, + "step": 765940 + }, + { + "epoch": 1.99, + "learning_rate": 2.1820670276659553e-06, + "loss": 0.0068, + "step": 765950 + }, + { + "epoch": 1.99, + "learning_rate": 2.1781788112944906e-06, + "loss": 0.0094, + "step": 765960 + }, + { + "epoch": 1.99, + "learning_rate": 2.1742905949230263e-06, + "loss": 0.008, + "step": 765970 + }, + { + "epoch": 1.99, + "learning_rate": 2.1704023785515615e-06, + "loss": 0.0065, + "step": 765980 + }, + { + "epoch": 1.99, + "learning_rate": 2.166514162180097e-06, + "loss": 0.0065, + "step": 765990 + }, + { + "epoch": 1.99, + "learning_rate": 2.162625945808632e-06, + "loss": 0.008, + "step": 766000 + }, + { + "epoch": 1.99, + "eval_cer": 0.8816956881384969, + "eval_loss": 0.004399578087031841, + "eval_runtime": 107.8197, + "eval_samples_per_second": 18.549, + "eval_steps_per_second": 4.637, + "step": 766000 + }, + { + "epoch": 1.99, + "learning_rate": 2.1587377294371674e-06, + "loss": 0.0067, + "step": 766010 + }, + { + "epoch": 1.99, + "learning_rate": 2.1548495130657027e-06, + "loss": 0.0061, + "step": 766020 + }, + { + "epoch": 1.99, + "learning_rate": 2.1509612966942384e-06, + "loss": 0.0066, + "step": 766030 + }, + { + "epoch": 1.99, + "learning_rate": 2.1470730803227737e-06, + "loss": 0.0051, + "step": 766040 + }, + { + "epoch": 1.99, + "learning_rate": 2.143184863951309e-06, + "loss": 0.0076, + "step": 766050 + }, + { + "epoch": 1.99, + "learning_rate": 2.1392966475798443e-06, + "loss": 0.007, + "step": 766060 + }, + { + "epoch": 1.99, + "learning_rate": 2.13540843120838e-06, + "loss": 0.0073, + "step": 766070 + }, + { + "epoch": 1.99, + "learning_rate": 2.131520214836915e-06, + "loss": 0.0064, + "step": 766080 + }, + { + "epoch": 1.99, + "learning_rate": 2.1276319984654505e-06, + "loss": 0.0075, + "step": 766090 + }, + { + "epoch": 1.99, + "learning_rate": 2.123743782093986e-06, + "loss": 0.0097, + "step": 766100 + }, + { + "epoch": 1.99, + "learning_rate": 2.119855565722521e-06, + "loss": 0.0078, + "step": 766110 + }, + { + "epoch": 1.99, + "learning_rate": 2.1159673493510564e-06, + "loss": 0.0056, + "step": 766120 + }, + { + "epoch": 1.99, + "learning_rate": 2.1120791329795917e-06, + "loss": 0.0054, + "step": 766130 + }, + { + "epoch": 1.99, + "learning_rate": 2.1081909166081274e-06, + "loss": 0.0077, + "step": 766140 + }, + { + "epoch": 1.99, + "learning_rate": 2.1043027002366627e-06, + "loss": 0.0063, + "step": 766150 + }, + { + "epoch": 1.99, + "learning_rate": 2.100414483865198e-06, + "loss": 0.0062, + "step": 766160 + }, + { + "epoch": 1.99, + "learning_rate": 2.0965262674937332e-06, + "loss": 0.005, + "step": 766170 + }, + { + "epoch": 1.99, + "learning_rate": 2.092638051122269e-06, + "loss": 0.0086, + "step": 766180 + }, + { + "epoch": 1.99, + "learning_rate": 2.088749834750804e-06, + "loss": 0.005, + "step": 766190 + }, + { + "epoch": 1.99, + "learning_rate": 2.0848616183793395e-06, + "loss": 0.0067, + "step": 766200 + }, + { + "epoch": 1.99, + "learning_rate": 2.080973402007875e-06, + "loss": 0.0068, + "step": 766210 + }, + { + "epoch": 1.99, + "learning_rate": 2.07708518563641e-06, + "loss": 0.0093, + "step": 766220 + }, + { + "epoch": 1.99, + "learning_rate": 2.0731969692649454e-06, + "loss": 0.0059, + "step": 766230 + }, + { + "epoch": 1.99, + "learning_rate": 2.069308752893481e-06, + "loss": 0.0068, + "step": 766240 + }, + { + "epoch": 1.99, + "learning_rate": 2.0654205365220164e-06, + "loss": 0.0082, + "step": 766250 + }, + { + "epoch": 1.99, + "learning_rate": 2.0615323201505516e-06, + "loss": 0.0067, + "step": 766260 + }, + { + "epoch": 1.99, + "learning_rate": 2.057644103779087e-06, + "loss": 0.0062, + "step": 766270 + }, + { + "epoch": 1.99, + "learning_rate": 2.0537558874076222e-06, + "loss": 0.0065, + "step": 766280 + }, + { + "epoch": 1.99, + "learning_rate": 2.0498676710361575e-06, + "loss": 0.0061, + "step": 766290 + }, + { + "epoch": 1.99, + "learning_rate": 2.0459794546646928e-06, + "loss": 0.0057, + "step": 766300 + }, + { + "epoch": 1.99, + "learning_rate": 2.0420912382932285e-06, + "loss": 0.0076, + "step": 766310 + }, + { + "epoch": 1.99, + "learning_rate": 2.0382030219217638e-06, + "loss": 0.0069, + "step": 766320 + }, + { + "epoch": 1.99, + "learning_rate": 2.034314805550299e-06, + "loss": 0.0083, + "step": 766330 + }, + { + "epoch": 1.99, + "learning_rate": 2.0304265891788343e-06, + "loss": 0.0077, + "step": 766340 + }, + { + "epoch": 1.99, + "learning_rate": 2.02653837280737e-06, + "loss": 0.0085, + "step": 766350 + }, + { + "epoch": 1.99, + "learning_rate": 2.022650156435905e-06, + "loss": 0.0069, + "step": 766360 + }, + { + "epoch": 1.99, + "learning_rate": 2.0187619400644406e-06, + "loss": 0.0055, + "step": 766370 + }, + { + "epoch": 1.99, + "learning_rate": 2.014873723692976e-06, + "loss": 0.0055, + "step": 766380 + }, + { + "epoch": 1.99, + "learning_rate": 2.010985507321511e-06, + "loss": 0.0085, + "step": 766390 + }, + { + "epoch": 1.99, + "learning_rate": 2.0070972909500465e-06, + "loss": 0.0049, + "step": 766400 + }, + { + "epoch": 1.99, + "learning_rate": 2.003209074578582e-06, + "loss": 0.0058, + "step": 766410 + }, + { + "epoch": 1.99, + "learning_rate": 1.9993208582071175e-06, + "loss": 0.006, + "step": 766420 + }, + { + "epoch": 1.99, + "learning_rate": 1.9954326418356528e-06, + "loss": 0.0074, + "step": 766430 + }, + { + "epoch": 1.99, + "learning_rate": 1.991544425464188e-06, + "loss": 0.0065, + "step": 766440 + }, + { + "epoch": 1.99, + "learning_rate": 1.9876562090927233e-06, + "loss": 0.0084, + "step": 766450 + }, + { + "epoch": 1.99, + "learning_rate": 1.9837679927212586e-06, + "loss": 0.0062, + "step": 766460 + }, + { + "epoch": 1.99, + "learning_rate": 1.979879776349794e-06, + "loss": 0.0052, + "step": 766470 + }, + { + "epoch": 1.99, + "learning_rate": 1.9759915599783296e-06, + "loss": 0.0071, + "step": 766480 + }, + { + "epoch": 1.99, + "learning_rate": 1.972103343606865e-06, + "loss": 0.0063, + "step": 766490 + }, + { + "epoch": 1.99, + "learning_rate": 1.9682151272354e-06, + "loss": 0.008, + "step": 766500 + }, + { + "epoch": 1.99, + "learning_rate": 1.9643269108639355e-06, + "loss": 0.006, + "step": 766510 + }, + { + "epoch": 1.99, + "learning_rate": 1.960438694492471e-06, + "loss": 0.0066, + "step": 766520 + }, + { + "epoch": 1.99, + "learning_rate": 1.956550478121006e-06, + "loss": 0.0061, + "step": 766530 + }, + { + "epoch": 1.99, + "learning_rate": 1.9526622617495417e-06, + "loss": 0.0063, + "step": 766540 + }, + { + "epoch": 1.99, + "learning_rate": 1.948774045378077e-06, + "loss": 0.0088, + "step": 766550 + }, + { + "epoch": 1.99, + "learning_rate": 1.9448858290066123e-06, + "loss": 0.0067, + "step": 766560 + }, + { + "epoch": 1.99, + "learning_rate": 1.9409976126351476e-06, + "loss": 0.0076, + "step": 766570 + }, + { + "epoch": 1.99, + "learning_rate": 1.9371093962636833e-06, + "loss": 0.0059, + "step": 766580 + }, + { + "epoch": 1.99, + "learning_rate": 1.9332211798922186e-06, + "loss": 0.0078, + "step": 766590 + }, + { + "epoch": 1.99, + "learning_rate": 1.929332963520754e-06, + "loss": 0.005, + "step": 766600 + }, + { + "epoch": 1.99, + "learning_rate": 1.925444747149289e-06, + "loss": 0.0056, + "step": 766610 + }, + { + "epoch": 1.99, + "learning_rate": 1.9215565307778244e-06, + "loss": 0.0076, + "step": 766620 + }, + { + "epoch": 1.99, + "learning_rate": 1.91766831440636e-06, + "loss": 0.0056, + "step": 766630 + }, + { + "epoch": 1.99, + "learning_rate": 1.913780098034895e-06, + "loss": 0.0104, + "step": 766640 + }, + { + "epoch": 1.99, + "learning_rate": 1.9098918816634307e-06, + "loss": 0.0103, + "step": 766650 + }, + { + "epoch": 1.99, + "learning_rate": 1.906003665291966e-06, + "loss": 0.0056, + "step": 766660 + }, + { + "epoch": 1.99, + "learning_rate": 1.9021154489205013e-06, + "loss": 0.0054, + "step": 766670 + }, + { + "epoch": 1.99, + "learning_rate": 1.8982272325490368e-06, + "loss": 0.0056, + "step": 766680 + }, + { + "epoch": 1.99, + "learning_rate": 1.894339016177572e-06, + "loss": 0.0091, + "step": 766690 + }, + { + "epoch": 1.99, + "learning_rate": 1.8904507998061074e-06, + "loss": 0.0056, + "step": 766700 + }, + { + "epoch": 1.99, + "learning_rate": 1.8865625834346429e-06, + "loss": 0.0064, + "step": 766710 + }, + { + "epoch": 1.99, + "learning_rate": 1.8826743670631781e-06, + "loss": 0.0068, + "step": 766720 + }, + { + "epoch": 1.99, + "learning_rate": 1.8787861506917136e-06, + "loss": 0.0056, + "step": 766730 + }, + { + "epoch": 1.99, + "learning_rate": 1.8748979343202487e-06, + "loss": 0.0068, + "step": 766740 + }, + { + "epoch": 1.99, + "learning_rate": 1.8710097179487842e-06, + "loss": 0.0045, + "step": 766750 + }, + { + "epoch": 1.99, + "learning_rate": 1.8671215015773197e-06, + "loss": 0.0067, + "step": 766760 + }, + { + "epoch": 1.99, + "learning_rate": 1.8632332852058548e-06, + "loss": 0.0047, + "step": 766770 + }, + { + "epoch": 1.99, + "learning_rate": 1.8593450688343903e-06, + "loss": 0.0087, + "step": 766780 + }, + { + "epoch": 1.99, + "learning_rate": 1.8554568524629258e-06, + "loss": 0.0072, + "step": 766790 + }, + { + "epoch": 1.99, + "learning_rate": 1.851568636091461e-06, + "loss": 0.0057, + "step": 766800 + }, + { + "epoch": 1.99, + "learning_rate": 1.8476804197199963e-06, + "loss": 0.0083, + "step": 766810 + }, + { + "epoch": 1.99, + "learning_rate": 1.8437922033485318e-06, + "loss": 0.0076, + "step": 766820 + }, + { + "epoch": 1.99, + "learning_rate": 1.8399039869770671e-06, + "loss": 0.0063, + "step": 766830 + }, + { + "epoch": 1.99, + "learning_rate": 1.8360157706056024e-06, + "loss": 0.0067, + "step": 766840 + }, + { + "epoch": 1.99, + "learning_rate": 1.832127554234138e-06, + "loss": 0.005, + "step": 766850 + }, + { + "epoch": 1.99, + "learning_rate": 1.8282393378626732e-06, + "loss": 0.0063, + "step": 766860 + }, + { + "epoch": 1.99, + "learning_rate": 1.8243511214912087e-06, + "loss": 0.0086, + "step": 766870 + }, + { + "epoch": 1.99, + "learning_rate": 1.820462905119744e-06, + "loss": 0.0081, + "step": 766880 + }, + { + "epoch": 1.99, + "learning_rate": 1.8165746887482793e-06, + "loss": 0.0063, + "step": 766890 + }, + { + "epoch": 1.99, + "learning_rate": 1.8126864723768148e-06, + "loss": 0.0071, + "step": 766900 + }, + { + "epoch": 1.99, + "learning_rate": 1.8087982560053498e-06, + "loss": 0.0069, + "step": 766910 + }, + { + "epoch": 1.99, + "learning_rate": 1.8049100396338853e-06, + "loss": 0.0066, + "step": 766920 + }, + { + "epoch": 1.99, + "learning_rate": 1.8010218232624208e-06, + "loss": 0.0085, + "step": 766930 + }, + { + "epoch": 1.99, + "learning_rate": 1.7971336068909563e-06, + "loss": 0.0077, + "step": 766940 + }, + { + "epoch": 1.99, + "learning_rate": 1.7932453905194914e-06, + "loss": 0.0066, + "step": 766950 + }, + { + "epoch": 1.99, + "learning_rate": 1.7893571741480269e-06, + "loss": 0.0077, + "step": 766960 + }, + { + "epoch": 1.99, + "learning_rate": 1.7854689577765622e-06, + "loss": 0.0063, + "step": 766970 + }, + { + "epoch": 1.99, + "learning_rate": 1.7815807414050975e-06, + "loss": 0.0054, + "step": 766980 + }, + { + "epoch": 1.99, + "learning_rate": 1.777692525033633e-06, + "loss": 0.0073, + "step": 766990 + }, + { + "epoch": 1.99, + "learning_rate": 1.7738043086621682e-06, + "loss": 0.0079, + "step": 767000 + }, + { + "epoch": 1.99, + "eval_cer": 0.8816928888646285, + "eval_loss": 0.004389285109937191, + "eval_runtime": 108.0952, + "eval_samples_per_second": 18.502, + "eval_steps_per_second": 4.626, + "step": 767000 + }, + { + "epoch": 1.99, + "learning_rate": 1.7699160922907037e-06, + "loss": 0.0067, + "step": 767010 + }, + { + "epoch": 1.99, + "learning_rate": 1.766027875919239e-06, + "loss": 0.0054, + "step": 767020 + }, + { + "epoch": 1.99, + "learning_rate": 1.7621396595477743e-06, + "loss": 0.0094, + "step": 767030 + }, + { + "epoch": 1.99, + "learning_rate": 1.7582514431763098e-06, + "loss": 0.0083, + "step": 767040 + }, + { + "epoch": 1.99, + "learning_rate": 1.754363226804845e-06, + "loss": 0.0087, + "step": 767050 + }, + { + "epoch": 1.99, + "learning_rate": 1.7504750104333804e-06, + "loss": 0.0076, + "step": 767060 + }, + { + "epoch": 1.99, + "learning_rate": 1.7465867940619159e-06, + "loss": 0.0056, + "step": 767070 + }, + { + "epoch": 1.99, + "learning_rate": 1.742698577690451e-06, + "loss": 0.0055, + "step": 767080 + }, + { + "epoch": 1.99, + "learning_rate": 1.7388103613189864e-06, + "loss": 0.0115, + "step": 767090 + }, + { + "epoch": 1.99, + "learning_rate": 1.734922144947522e-06, + "loss": 0.0086, + "step": 767100 + }, + { + "epoch": 1.99, + "learning_rate": 1.7310339285760574e-06, + "loss": 0.0076, + "step": 767110 + }, + { + "epoch": 1.99, + "learning_rate": 1.7271457122045925e-06, + "loss": 0.009, + "step": 767120 + }, + { + "epoch": 1.99, + "learning_rate": 1.723257495833128e-06, + "loss": 0.0059, + "step": 767130 + }, + { + "epoch": 1.99, + "learning_rate": 1.7193692794616635e-06, + "loss": 0.0054, + "step": 767140 + }, + { + "epoch": 1.99, + "learning_rate": 1.7154810630901986e-06, + "loss": 0.0058, + "step": 767150 + }, + { + "epoch": 1.99, + "learning_rate": 1.711592846718734e-06, + "loss": 0.0079, + "step": 767160 + }, + { + "epoch": 1.99, + "learning_rate": 1.7077046303472694e-06, + "loss": 0.008, + "step": 767170 + }, + { + "epoch": 1.99, + "learning_rate": 1.7038164139758049e-06, + "loss": 0.0061, + "step": 767180 + }, + { + "epoch": 1.99, + "learning_rate": 1.6999281976043401e-06, + "loss": 0.0079, + "step": 767190 + }, + { + "epoch": 1.99, + "learning_rate": 1.6960399812328754e-06, + "loss": 0.0055, + "step": 767200 + }, + { + "epoch": 1.99, + "learning_rate": 1.692151764861411e-06, + "loss": 0.0063, + "step": 767210 + }, + { + "epoch": 1.99, + "learning_rate": 1.6882635484899462e-06, + "loss": 0.0087, + "step": 767220 + }, + { + "epoch": 1.99, + "learning_rate": 1.6843753321184815e-06, + "loss": 0.0081, + "step": 767230 + }, + { + "epoch": 1.99, + "learning_rate": 1.680487115747017e-06, + "loss": 0.0061, + "step": 767240 + }, + { + "epoch": 1.99, + "learning_rate": 1.6765988993755525e-06, + "loss": 0.0063, + "step": 767250 + }, + { + "epoch": 1.99, + "learning_rate": 1.6727106830040876e-06, + "loss": 0.0067, + "step": 767260 + }, + { + "epoch": 1.99, + "learning_rate": 1.668822466632623e-06, + "loss": 0.0054, + "step": 767270 + }, + { + "epoch": 1.99, + "learning_rate": 1.6649342502611586e-06, + "loss": 0.0054, + "step": 767280 + }, + { + "epoch": 1.99, + "learning_rate": 1.6610460338896936e-06, + "loss": 0.0073, + "step": 767290 + }, + { + "epoch": 1.99, + "learning_rate": 1.6571578175182291e-06, + "loss": 0.0101, + "step": 767300 + }, + { + "epoch": 1.99, + "learning_rate": 1.6532696011467646e-06, + "loss": 0.0135, + "step": 767310 + }, + { + "epoch": 1.99, + "learning_rate": 1.6493813847753e-06, + "loss": 0.0066, + "step": 767320 + }, + { + "epoch": 1.99, + "learning_rate": 1.6454931684038352e-06, + "loss": 0.0067, + "step": 767330 + }, + { + "epoch": 1.99, + "learning_rate": 1.6416049520323705e-06, + "loss": 0.0068, + "step": 767340 + }, + { + "epoch": 1.99, + "learning_rate": 1.637716735660906e-06, + "loss": 0.0096, + "step": 767350 + }, + { + "epoch": 1.99, + "learning_rate": 1.6338285192894413e-06, + "loss": 0.0089, + "step": 767360 + }, + { + "epoch": 1.99, + "learning_rate": 1.6299403029179765e-06, + "loss": 0.0068, + "step": 767370 + }, + { + "epoch": 1.99, + "learning_rate": 1.626052086546512e-06, + "loss": 0.0059, + "step": 767380 + }, + { + "epoch": 1.99, + "learning_rate": 1.6221638701750473e-06, + "loss": 0.0068, + "step": 767390 + }, + { + "epoch": 1.99, + "learning_rate": 1.6182756538035826e-06, + "loss": 0.0104, + "step": 767400 + }, + { + "epoch": 1.99, + "learning_rate": 1.614387437432118e-06, + "loss": 0.0051, + "step": 767410 + }, + { + "epoch": 1.99, + "learning_rate": 1.6104992210606536e-06, + "loss": 0.0072, + "step": 767420 + }, + { + "epoch": 1.99, + "learning_rate": 1.6066110046891887e-06, + "loss": 0.0053, + "step": 767430 + }, + { + "epoch": 1.99, + "learning_rate": 1.6027227883177242e-06, + "loss": 0.0081, + "step": 767440 + }, + { + "epoch": 1.99, + "learning_rate": 1.5988345719462597e-06, + "loss": 0.0076, + "step": 767450 + }, + { + "epoch": 1.99, + "learning_rate": 1.5949463555747947e-06, + "loss": 0.0067, + "step": 767460 + }, + { + "epoch": 1.99, + "learning_rate": 1.5910581392033302e-06, + "loss": 0.007, + "step": 767470 + }, + { + "epoch": 1.99, + "learning_rate": 1.5871699228318657e-06, + "loss": 0.0058, + "step": 767480 + }, + { + "epoch": 1.99, + "learning_rate": 1.583281706460401e-06, + "loss": 0.0056, + "step": 767490 + }, + { + "epoch": 1.99, + "learning_rate": 1.5793934900889363e-06, + "loss": 0.008, + "step": 767500 + }, + { + "epoch": 1.99, + "learning_rate": 1.5755052737174716e-06, + "loss": 0.004, + "step": 767510 + }, + { + "epoch": 1.99, + "learning_rate": 1.571617057346007e-06, + "loss": 0.0064, + "step": 767520 + }, + { + "epoch": 1.99, + "learning_rate": 1.5677288409745424e-06, + "loss": 0.0077, + "step": 767530 + }, + { + "epoch": 1.99, + "learning_rate": 1.5638406246030777e-06, + "loss": 0.0089, + "step": 767540 + }, + { + "epoch": 1.99, + "learning_rate": 1.5599524082316132e-06, + "loss": 0.0054, + "step": 767550 + }, + { + "epoch": 1.99, + "learning_rate": 1.5560641918601487e-06, + "loss": 0.0087, + "step": 767560 + }, + { + "epoch": 1.99, + "learning_rate": 1.5521759754886837e-06, + "loss": 0.0078, + "step": 767570 + }, + { + "epoch": 1.99, + "learning_rate": 1.5482877591172192e-06, + "loss": 0.0069, + "step": 767580 + }, + { + "epoch": 1.99, + "learning_rate": 1.5443995427457547e-06, + "loss": 0.009, + "step": 767590 + }, + { + "epoch": 1.99, + "learning_rate": 1.5405113263742898e-06, + "loss": 0.0078, + "step": 767600 + }, + { + "epoch": 1.99, + "learning_rate": 1.5366231100028253e-06, + "loss": 0.0062, + "step": 767610 + }, + { + "epoch": 1.99, + "learning_rate": 1.5327348936313608e-06, + "loss": 0.0079, + "step": 767620 + }, + { + "epoch": 1.99, + "learning_rate": 1.528846677259896e-06, + "loss": 0.0071, + "step": 767630 + }, + { + "epoch": 1.99, + "learning_rate": 1.5249584608884314e-06, + "loss": 0.0097, + "step": 767640 + }, + { + "epoch": 1.99, + "learning_rate": 1.5210702445169669e-06, + "loss": 0.0069, + "step": 767650 + }, + { + "epoch": 1.99, + "learning_rate": 1.5171820281455021e-06, + "loss": 0.0055, + "step": 767660 + }, + { + "epoch": 1.99, + "learning_rate": 1.5132938117740374e-06, + "loss": 0.0062, + "step": 767670 + }, + { + "epoch": 1.99, + "learning_rate": 1.5094055954025727e-06, + "loss": 0.008, + "step": 767680 + }, + { + "epoch": 1.99, + "learning_rate": 1.5055173790311082e-06, + "loss": 0.0056, + "step": 767690 + }, + { + "epoch": 1.99, + "learning_rate": 1.5016291626596437e-06, + "loss": 0.0068, + "step": 767700 + }, + { + "epoch": 1.99, + "learning_rate": 1.4977409462881788e-06, + "loss": 0.006, + "step": 767710 + }, + { + "epoch": 1.99, + "learning_rate": 1.4938527299167143e-06, + "loss": 0.0065, + "step": 767720 + }, + { + "epoch": 1.99, + "learning_rate": 1.4899645135452498e-06, + "loss": 0.0057, + "step": 767730 + }, + { + "epoch": 1.99, + "learning_rate": 1.4860762971737848e-06, + "loss": 0.0061, + "step": 767740 + }, + { + "epoch": 1.99, + "learning_rate": 1.4821880808023203e-06, + "loss": 0.0069, + "step": 767750 + }, + { + "epoch": 1.99, + "learning_rate": 1.4782998644308558e-06, + "loss": 0.0066, + "step": 767760 + }, + { + "epoch": 1.99, + "learning_rate": 1.474411648059391e-06, + "loss": 0.0056, + "step": 767770 + }, + { + "epoch": 1.99, + "learning_rate": 1.4705234316879264e-06, + "loss": 0.0066, + "step": 767780 + }, + { + "epoch": 1.99, + "learning_rate": 1.466635215316462e-06, + "loss": 0.0089, + "step": 767790 + }, + { + "epoch": 1.99, + "learning_rate": 1.4627469989449972e-06, + "loss": 0.0083, + "step": 767800 + }, + { + "epoch": 1.99, + "learning_rate": 1.4588587825735325e-06, + "loss": 0.0071, + "step": 767810 + }, + { + "epoch": 1.99, + "learning_rate": 1.454970566202068e-06, + "loss": 0.0078, + "step": 767820 + }, + { + "epoch": 1.99, + "learning_rate": 1.4510823498306033e-06, + "loss": 0.0042, + "step": 767830 + }, + { + "epoch": 1.99, + "learning_rate": 1.4471941334591385e-06, + "loss": 0.0089, + "step": 767840 + }, + { + "epoch": 1.99, + "learning_rate": 1.4433059170876738e-06, + "loss": 0.0074, + "step": 767850 + }, + { + "epoch": 1.99, + "learning_rate": 1.4394177007162093e-06, + "loss": 0.0073, + "step": 767860 + }, + { + "epoch": 1.99, + "learning_rate": 1.4355294843447448e-06, + "loss": 0.005, + "step": 767870 + }, + { + "epoch": 1.99, + "learning_rate": 1.4316412679732799e-06, + "loss": 0.0067, + "step": 767880 + }, + { + "epoch": 1.99, + "learning_rate": 1.4277530516018154e-06, + "loss": 0.0061, + "step": 767890 + }, + { + "epoch": 1.99, + "learning_rate": 1.4238648352303509e-06, + "loss": 0.0053, + "step": 767900 + }, + { + "epoch": 1.99, + "learning_rate": 1.419976618858886e-06, + "loss": 0.0061, + "step": 767910 + }, + { + "epoch": 1.99, + "learning_rate": 1.4160884024874215e-06, + "loss": 0.0087, + "step": 767920 + }, + { + "epoch": 1.99, + "learning_rate": 1.412200186115957e-06, + "loss": 0.0084, + "step": 767930 + }, + { + "epoch": 1.99, + "learning_rate": 1.4083119697444922e-06, + "loss": 0.0075, + "step": 767940 + }, + { + "epoch": 1.99, + "learning_rate": 1.4044237533730275e-06, + "loss": 0.0082, + "step": 767950 + }, + { + "epoch": 1.99, + "learning_rate": 1.400535537001563e-06, + "loss": 0.0071, + "step": 767960 + }, + { + "epoch": 1.99, + "learning_rate": 1.3966473206300983e-06, + "loss": 0.0074, + "step": 767970 + }, + { + "epoch": 1.99, + "learning_rate": 1.3927591042586336e-06, + "loss": 0.0049, + "step": 767980 + }, + { + "epoch": 1.99, + "learning_rate": 1.388870887887169e-06, + "loss": 0.0047, + "step": 767990 + }, + { + "epoch": 1.99, + "learning_rate": 1.3849826715157044e-06, + "loss": 0.0059, + "step": 768000 + }, + { + "epoch": 1.99, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.004371436312794685, + "eval_runtime": 108.0539, + "eval_samples_per_second": 18.509, + "eval_steps_per_second": 4.627, + "step": 768000 + }, + { + "epoch": 1.99, + "learning_rate": 1.3810944551442399e-06, + "loss": 0.0103, + "step": 768010 + }, + { + "epoch": 1.99, + "learning_rate": 1.3772062387727752e-06, + "loss": 0.0067, + "step": 768020 + }, + { + "epoch": 1.99, + "learning_rate": 1.3733180224013104e-06, + "loss": 0.0046, + "step": 768030 + }, + { + "epoch": 1.99, + "learning_rate": 1.369429806029846e-06, + "loss": 0.0063, + "step": 768040 + }, + { + "epoch": 1.99, + "learning_rate": 1.365541589658381e-06, + "loss": 0.0059, + "step": 768050 + }, + { + "epoch": 1.99, + "learning_rate": 1.3616533732869165e-06, + "loss": 0.0071, + "step": 768060 + }, + { + "epoch": 1.99, + "learning_rate": 1.357765156915452e-06, + "loss": 0.009, + "step": 768070 + }, + { + "epoch": 1.99, + "learning_rate": 1.353876940543987e-06, + "loss": 0.0067, + "step": 768080 + }, + { + "epoch": 1.99, + "learning_rate": 1.3499887241725226e-06, + "loss": 0.0095, + "step": 768090 + }, + { + "epoch": 1.99, + "learning_rate": 1.346100507801058e-06, + "loss": 0.0063, + "step": 768100 + }, + { + "epoch": 1.99, + "learning_rate": 1.3422122914295934e-06, + "loss": 0.0059, + "step": 768110 + }, + { + "epoch": 1.99, + "learning_rate": 1.3383240750581286e-06, + "loss": 0.0066, + "step": 768120 + }, + { + "epoch": 1.99, + "learning_rate": 1.3344358586866641e-06, + "loss": 0.0058, + "step": 768130 + }, + { + "epoch": 1.99, + "learning_rate": 1.3305476423151994e-06, + "loss": 0.007, + "step": 768140 + }, + { + "epoch": 1.99, + "learning_rate": 1.3266594259437347e-06, + "loss": 0.0082, + "step": 768150 + }, + { + "epoch": 1.99, + "learning_rate": 1.3227712095722702e-06, + "loss": 0.0073, + "step": 768160 + }, + { + "epoch": 1.99, + "learning_rate": 1.3188829932008055e-06, + "loss": 0.0051, + "step": 768170 + }, + { + "epoch": 1.99, + "learning_rate": 1.314994776829341e-06, + "loss": 0.0073, + "step": 768180 + }, + { + "epoch": 1.99, + "learning_rate": 1.3111065604578763e-06, + "loss": 0.0056, + "step": 768190 + }, + { + "epoch": 1.99, + "learning_rate": 1.3072183440864116e-06, + "loss": 0.0055, + "step": 768200 + }, + { + "epoch": 1.99, + "learning_rate": 1.303330127714947e-06, + "loss": 0.0057, + "step": 768210 + }, + { + "epoch": 1.99, + "learning_rate": 1.2994419113434821e-06, + "loss": 0.0057, + "step": 768220 + }, + { + "epoch": 1.99, + "learning_rate": 1.2955536949720176e-06, + "loss": 0.007, + "step": 768230 + }, + { + "epoch": 1.99, + "learning_rate": 1.2916654786005531e-06, + "loss": 0.0073, + "step": 768240 + }, + { + "epoch": 1.99, + "learning_rate": 1.2877772622290886e-06, + "loss": 0.0064, + "step": 768250 + }, + { + "epoch": 1.99, + "learning_rate": 1.2838890458576237e-06, + "loss": 0.0083, + "step": 768260 + }, + { + "epoch": 1.99, + "learning_rate": 1.2800008294861592e-06, + "loss": 0.0114, + "step": 768270 + }, + { + "epoch": 1.99, + "learning_rate": 1.2761126131146945e-06, + "loss": 0.0065, + "step": 768280 + }, + { + "epoch": 1.99, + "learning_rate": 1.2722243967432298e-06, + "loss": 0.0052, + "step": 768290 + }, + { + "epoch": 1.99, + "learning_rate": 1.2683361803717652e-06, + "loss": 0.0054, + "step": 768300 + }, + { + "epoch": 1.99, + "learning_rate": 1.2644479640003005e-06, + "loss": 0.0062, + "step": 768310 + }, + { + "epoch": 1.99, + "learning_rate": 1.260559747628836e-06, + "loss": 0.0066, + "step": 768320 + }, + { + "epoch": 1.99, + "learning_rate": 1.2566715312573713e-06, + "loss": 0.0058, + "step": 768330 + }, + { + "epoch": 1.99, + "learning_rate": 1.2527833148859066e-06, + "loss": 0.0062, + "step": 768340 + }, + { + "epoch": 1.99, + "learning_rate": 1.248895098514442e-06, + "loss": 0.0073, + "step": 768350 + }, + { + "epoch": 1.99, + "learning_rate": 1.2450068821429774e-06, + "loss": 0.0082, + "step": 768360 + }, + { + "epoch": 1.99, + "learning_rate": 1.2411186657715127e-06, + "loss": 0.0067, + "step": 768370 + }, + { + "epoch": 1.99, + "learning_rate": 1.2372304494000482e-06, + "loss": 0.0061, + "step": 768380 + }, + { + "epoch": 1.99, + "learning_rate": 1.2333422330285837e-06, + "loss": 0.0068, + "step": 768390 + }, + { + "epoch": 1.99, + "learning_rate": 1.2294540166571187e-06, + "loss": 0.0085, + "step": 768400 + }, + { + "epoch": 1.99, + "learning_rate": 1.2255658002856542e-06, + "loss": 0.0064, + "step": 768410 + }, + { + "epoch": 1.99, + "learning_rate": 1.2216775839141897e-06, + "loss": 0.0085, + "step": 768420 + }, + { + "epoch": 1.99, + "learning_rate": 1.2177893675427248e-06, + "loss": 0.0079, + "step": 768430 + }, + { + "epoch": 1.99, + "learning_rate": 1.2139011511712603e-06, + "loss": 0.0053, + "step": 768440 + }, + { + "epoch": 1.99, + "learning_rate": 1.2100129347997958e-06, + "loss": 0.0076, + "step": 768450 + }, + { + "epoch": 1.99, + "learning_rate": 1.2061247184283309e-06, + "loss": 0.0091, + "step": 768460 + }, + { + "epoch": 1.99, + "learning_rate": 1.2022365020568664e-06, + "loss": 0.0092, + "step": 768470 + }, + { + "epoch": 1.99, + "learning_rate": 1.1983482856854017e-06, + "loss": 0.0064, + "step": 768480 + }, + { + "epoch": 1.99, + "learning_rate": 1.1944600693139371e-06, + "loss": 0.0083, + "step": 768490 + }, + { + "epoch": 1.99, + "learning_rate": 1.1905718529424724e-06, + "loss": 0.0058, + "step": 768500 + }, + { + "epoch": 1.99, + "learning_rate": 1.1866836365710077e-06, + "loss": 0.0066, + "step": 768510 + }, + { + "epoch": 1.99, + "learning_rate": 1.1827954201995432e-06, + "loss": 0.0044, + "step": 768520 + }, + { + "epoch": 1.99, + "learning_rate": 1.1789072038280785e-06, + "loss": 0.0101, + "step": 768530 + }, + { + "epoch": 1.99, + "learning_rate": 1.1750189874566138e-06, + "loss": 0.0076, + "step": 768540 + }, + { + "epoch": 1.99, + "learning_rate": 1.1711307710851493e-06, + "loss": 0.0125, + "step": 768550 + }, + { + "epoch": 1.99, + "learning_rate": 1.1672425547136846e-06, + "loss": 0.0063, + "step": 768560 + }, + { + "epoch": 1.99, + "learning_rate": 1.16335433834222e-06, + "loss": 0.0081, + "step": 768570 + }, { "epoch": 1.99, - "learning_rate": 2.06749373142762e-06, - "loss": 0.0066, - "step": 393690 + "learning_rate": 1.1594661219707553e-06, + "loss": 0.0074, + "step": 768580 }, { "epoch": 1.99, - "learning_rate": 2.0599260384136098e-06, - "loss": 0.0069, - "step": 393700 + "learning_rate": 1.1555779055992906e-06, + "loss": 0.0064, + "step": 768590 }, { "epoch": 1.99, - "learning_rate": 2.0523583453995992e-06, - "loss": 0.0059, - "step": 393710 + "learning_rate": 1.1516896892278261e-06, + "loss": 0.0077, + "step": 768600 }, { "epoch": 1.99, - "learning_rate": 2.0447906523855887e-06, - "loss": 0.0066, - "step": 393720 + "learning_rate": 1.1478014728563614e-06, + "loss": 0.0085, + "step": 768610 }, { "epoch": 1.99, - "learning_rate": 2.0372229593715787e-06, - "loss": 0.007, - "step": 393730 + "learning_rate": 1.143913256484897e-06, + "loss": 0.0071, + "step": 768620 }, { "epoch": 1.99, - "learning_rate": 2.029655266357568e-06, - "loss": 0.0072, - "step": 393740 + "learning_rate": 1.1400250401134322e-06, + "loss": 0.0087, + "step": 768630 }, { "epoch": 1.99, - "learning_rate": 2.022087573343558e-06, - "loss": 0.0047, - "step": 393750 + "learning_rate": 1.1361368237419675e-06, + "loss": 0.0081, + "step": 768640 }, { "epoch": 1.99, - "learning_rate": 2.0145198803295475e-06, + "learning_rate": 1.1322486073705028e-06, "loss": 0.0066, - "step": 393760 + "step": 768650 }, { "epoch": 1.99, - "learning_rate": 2.0069521873155375e-06, - "loss": 0.0054, - "step": 393770 + "learning_rate": 1.1283603909990383e-06, + "loss": 0.0066, + "step": 768660 }, { "epoch": 1.99, - "learning_rate": 1.999384494301527e-06, - "loss": 0.0057, - "step": 393780 + "learning_rate": 1.1244721746275735e-06, + "loss": 0.0069, + "step": 768670 }, { "epoch": 1.99, - "learning_rate": 1.991816801287517e-06, - "loss": 0.0039, - "step": 393790 + "learning_rate": 1.1205839582561088e-06, + "loss": 0.0063, + "step": 768680 }, { "epoch": 1.99, - "learning_rate": 1.9842491082735063e-06, - "loss": 0.005, - "step": 393800 + "learning_rate": 1.1166957418846443e-06, + "loss": 0.009, + "step": 768690 }, { "epoch": 1.99, - "learning_rate": 1.9766814152594963e-06, - "loss": 0.0051, - "step": 393810 + "learning_rate": 1.1128075255131796e-06, + "loss": 0.0077, + "step": 768700 }, { "epoch": 1.99, - "learning_rate": 1.9691137222454857e-06, - "loss": 0.006, - "step": 393820 + "learning_rate": 1.108919309141715e-06, + "loss": 0.0063, + "step": 768710 }, { "epoch": 1.99, - "learning_rate": 1.9615460292314752e-06, - "loss": 0.0049, - "step": 393830 + "learning_rate": 1.1050310927702504e-06, + "loss": 0.0044, + "step": 768720 }, { "epoch": 1.99, - "learning_rate": 1.953978336217465e-06, - "loss": 0.0051, - "step": 393840 + "learning_rate": 1.1011428763987857e-06, + "loss": 0.0092, + "step": 768730 }, { "epoch": 1.99, - "learning_rate": 1.9464106432034546e-06, - "loss": 0.0055, - "step": 393850 + "learning_rate": 1.0972546600273212e-06, + "loss": 0.0062, + "step": 768740 }, { "epoch": 1.99, - "learning_rate": 1.9388429501894446e-06, - "loss": 0.0036, - "step": 393860 + "learning_rate": 1.0933664436558565e-06, + "loss": 0.007, + "step": 768750 }, { "epoch": 1.99, - "learning_rate": 1.931275257175434e-06, - "loss": 0.0066, - "step": 393870 + "learning_rate": 1.089478227284392e-06, + "loss": 0.0064, + "step": 768760 }, { "epoch": 1.99, - "learning_rate": 1.923707564161424e-06, - "loss": 0.0051, - "step": 393880 + "learning_rate": 1.0855900109129272e-06, + "loss": 0.0099, + "step": 768770 }, { "epoch": 1.99, - "learning_rate": 1.9161398711474134e-06, - "loss": 0.0059, - "step": 393890 + "learning_rate": 1.0817017945414625e-06, + "loss": 0.0072, + "step": 768780 }, { "epoch": 1.99, - "learning_rate": 1.9085721781334034e-06, - "loss": 0.0053, - "step": 393900 + "learning_rate": 1.077813578169998e-06, + "loss": 0.0101, + "step": 768790 }, { "epoch": 1.99, - "learning_rate": 1.9010044851193928e-06, - "loss": 0.007, - "step": 393910 + "learning_rate": 1.0739253617985333e-06, + "loss": 0.0067, + "step": 768800 }, { "epoch": 1.99, - "learning_rate": 1.8934367921053825e-06, - "loss": 0.0079, - "step": 393920 + "learning_rate": 1.0700371454270686e-06, + "loss": 0.0087, + "step": 768810 }, { "epoch": 1.99, - "learning_rate": 1.8858690990913722e-06, - "loss": 0.0077, - "step": 393930 + "learning_rate": 1.0661489290556039e-06, + "loss": 0.0091, + "step": 768820 }, { "epoch": 1.99, - "learning_rate": 1.878301406077362e-06, - "loss": 0.0078, - "step": 393940 + "learning_rate": 1.0622607126841394e-06, + "loss": 0.0061, + "step": 768830 }, { "epoch": 1.99, - "learning_rate": 1.8707337130633517e-06, - "loss": 0.006, - "step": 393950 + "learning_rate": 1.0583724963126747e-06, + "loss": 0.007, + "step": 768840 }, { "epoch": 1.99, - "learning_rate": 1.8631660200493414e-06, - "loss": 0.0053, - "step": 393960 + "learning_rate": 1.05448427994121e-06, + "loss": 0.0066, + "step": 768850 }, { "epoch": 1.99, - "learning_rate": 1.855598327035331e-06, - "loss": 0.0037, - "step": 393970 + "learning_rate": 1.0505960635697454e-06, + "loss": 0.0095, + "step": 768860 }, { "epoch": 1.99, - "learning_rate": 1.8480306340213203e-06, - "loss": 0.0062, - "step": 393980 + "learning_rate": 1.0467078471982807e-06, + "loss": 0.0066, + "step": 768870 }, { "epoch": 1.99, - "learning_rate": 1.84046294100731e-06, - "loss": 0.006, - "step": 393990 + "learning_rate": 1.0428196308268162e-06, + "loss": 0.0057, + "step": 768880 }, { "epoch": 1.99, - "learning_rate": 1.8328952479932997e-06, - "loss": 0.0053, - "step": 394000 + "learning_rate": 1.0389314144553515e-06, + "loss": 0.0059, + "step": 768890 }, { "epoch": 1.99, - "eval_cer": 0.9144168841162651, - "eval_loss": 0.004111087881028652, - "eval_runtime": 116.0484, - "eval_samples_per_second": 17.234, - "eval_steps_per_second": 4.309, - "step": 394000 + "learning_rate": 1.0350431980838868e-06, + "loss": 0.0066, + "step": 768900 }, { "epoch": 1.99, - "learning_rate": 1.8253275549792894e-06, - "loss": 0.0062, - "step": 394010 + "learning_rate": 1.0311549817124223e-06, + "loss": 0.0079, + "step": 768910 }, { "epoch": 1.99, - "learning_rate": 1.8177598619652791e-06, - "loss": 0.0054, - "step": 394020 + "learning_rate": 1.0272667653409576e-06, + "loss": 0.0088, + "step": 768920 }, { "epoch": 1.99, - "learning_rate": 1.8101921689512688e-06, - "loss": 0.0059, - "step": 394030 + "learning_rate": 1.023378548969493e-06, + "loss": 0.0074, + "step": 768930 }, { "epoch": 1.99, - "learning_rate": 1.8026244759372585e-06, - "loss": 0.005, - "step": 394040 + "learning_rate": 1.0194903325980284e-06, + "loss": 0.0076, + "step": 768940 }, { "epoch": 1.99, - "learning_rate": 1.7950567829232482e-06, - "loss": 0.0062, - "step": 394050 + "learning_rate": 1.0156021162265636e-06, + "loss": 0.0057, + "step": 768950 }, { "epoch": 1.99, - "learning_rate": 1.787489089909238e-06, - "loss": 0.0051, - "step": 394060 + "learning_rate": 1.0117138998550991e-06, + "loss": 0.0072, + "step": 768960 }, { "epoch": 1.99, - "learning_rate": 1.7799213968952276e-06, - "loss": 0.0051, - "step": 394070 + "learning_rate": 1.0078256834836344e-06, + "loss": 0.0064, + "step": 768970 }, { "epoch": 1.99, - "learning_rate": 1.7723537038812173e-06, - "loss": 0.0047, - "step": 394080 + "learning_rate": 1.0039374671121697e-06, + "loss": 0.0075, + "step": 768980 }, { "epoch": 1.99, - "learning_rate": 1.764786010867207e-06, - "loss": 0.0046, - "step": 394090 + "learning_rate": 1.000049250740705e-06, + "loss": 0.0074, + "step": 768990 }, { "epoch": 1.99, - "learning_rate": 1.7572183178531965e-06, - "loss": 0.0053, - "step": 394100 + "learning_rate": 9.961610343692405e-07, + "loss": 0.0086, + "step": 769000 }, { "epoch": 1.99, - "learning_rate": 1.7496506248391862e-06, - "loss": 0.0046, - "step": 394110 + "eval_cer": 0.8816788924952867, + "eval_loss": 0.0043708933517336845, + "eval_runtime": 107.9473, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 769000 }, { "epoch": 1.99, - "learning_rate": 1.742082931825176e-06, + "learning_rate": 9.922728179977758e-07, "loss": 0.0062, - "step": 394120 + "step": 769010 }, { "epoch": 1.99, - "learning_rate": 1.7345152388111656e-06, - "loss": 0.0045, - "step": 394130 + "learning_rate": 9.883846016263113e-07, + "loss": 0.0065, + "step": 769020 }, { "epoch": 1.99, - "learning_rate": 1.7269475457971553e-06, - "loss": 0.006, - "step": 394140 + "learning_rate": 9.844963852548466e-07, + "loss": 0.0067, + "step": 769030 }, { "epoch": 1.99, - "learning_rate": 1.719379852783145e-06, - "loss": 0.0057, - "step": 394150 + "learning_rate": 9.806081688833818e-07, + "loss": 0.0072, + "step": 769040 }, { "epoch": 1.99, - "learning_rate": 1.7118121597691347e-06, - "loss": 0.0055, - "step": 394160 + "learning_rate": 9.767199525119173e-07, + "loss": 0.0084, + "step": 769050 }, { "epoch": 1.99, - "learning_rate": 1.7042444667551244e-06, - "loss": 0.0048, - "step": 394170 + "learning_rate": 9.728317361404526e-07, + "loss": 0.0086, + "step": 769060 }, { "epoch": 1.99, - "learning_rate": 1.6966767737411141e-06, - "loss": 0.0041, - "step": 394180 + "learning_rate": 9.689435197689881e-07, + "loss": 0.0098, + "step": 769070 }, { "epoch": 1.99, - "learning_rate": 1.6891090807271038e-06, - "loss": 0.0071, - "step": 394190 + "learning_rate": 9.650553033975234e-07, + "loss": 0.0072, + "step": 769080 }, { "epoch": 1.99, - "learning_rate": 1.6815413877130935e-06, - "loss": 0.0059, - "step": 394200 + "learning_rate": 9.611670870260587e-07, + "loss": 0.0071, + "step": 769090 }, { "epoch": 1.99, - "learning_rate": 1.673973694699083e-06, - "loss": 0.0045, - "step": 394210 + "learning_rate": 9.572788706545942e-07, + "loss": 0.0058, + "step": 769100 }, { "epoch": 1.99, - "learning_rate": 1.6664060016850727e-06, - "loss": 0.0053, - "step": 394220 + "learning_rate": 9.533906542831295e-07, + "loss": 0.0097, + "step": 769110 }, { "epoch": 1.99, - "learning_rate": 1.6588383086710624e-06, - "loss": 0.0075, - "step": 394230 + "learning_rate": 9.495024379116649e-07, + "loss": 0.0098, + "step": 769120 }, { "epoch": 1.99, - "learning_rate": 1.6512706156570521e-06, - "loss": 0.0047, - "step": 394240 + "learning_rate": 9.456142215402002e-07, + "loss": 0.0126, + "step": 769130 }, { "epoch": 1.99, - "learning_rate": 1.6437029226430418e-06, - "loss": 0.0053, - "step": 394250 + "learning_rate": 9.417260051687356e-07, + "loss": 0.0062, + "step": 769140 }, { "epoch": 1.99, - "learning_rate": 1.6361352296290315e-06, - "loss": 0.0046, - "step": 394260 + "learning_rate": 9.378377887972709e-07, + "loss": 0.0059, + "step": 769150 }, { "epoch": 1.99, - "learning_rate": 1.6285675366150212e-06, - "loss": 0.0049, - "step": 394270 + "learning_rate": 9.339495724258062e-07, + "loss": 0.0071, + "step": 769160 }, { "epoch": 1.99, - "learning_rate": 1.620999843601011e-06, - "loss": 0.007, - "step": 394280 + "learning_rate": 9.300613560543416e-07, + "loss": 0.0067, + "step": 769170 }, { "epoch": 1.99, - "learning_rate": 1.6134321505870006e-06, - "loss": 0.0071, - "step": 394290 + "learning_rate": 9.26173139682877e-07, + "loss": 0.0065, + "step": 769180 }, { "epoch": 1.99, - "learning_rate": 1.6058644575729903e-06, - "loss": 0.0059, - "step": 394300 + "learning_rate": 9.222849233114124e-07, + "loss": 0.0079, + "step": 769190 }, { "epoch": 1.99, - "learning_rate": 1.59829676455898e-06, - "loss": 0.0046, - "step": 394310 + "learning_rate": 9.183967069399477e-07, + "loss": 0.0054, + "step": 769200 }, { "epoch": 1.99, - "learning_rate": 1.5907290715449697e-06, - "loss": 0.0058, - "step": 394320 + "learning_rate": 9.145084905684832e-07, + "loss": 0.0067, + "step": 769210 }, { "epoch": 1.99, - "learning_rate": 1.5831613785309592e-06, - "loss": 0.0063, - "step": 394330 + "learning_rate": 9.106202741970185e-07, + "loss": 0.0074, + "step": 769220 }, { "epoch": 1.99, - "learning_rate": 1.575593685516949e-06, - "loss": 0.005, - "step": 394340 + "learning_rate": 9.067320578255537e-07, + "loss": 0.0075, + "step": 769230 }, { "epoch": 1.99, - "learning_rate": 1.5680259925029386e-06, - "loss": 0.0046, - "step": 394350 + "learning_rate": 9.028438414540891e-07, + "loss": 0.009, + "step": 769240 }, { "epoch": 1.99, - "learning_rate": 1.5604582994889283e-06, - "loss": 0.0044, - "step": 394360 + "learning_rate": 8.989556250826245e-07, + "loss": 0.0071, + "step": 769250 }, { "epoch": 1.99, - "learning_rate": 1.552890606474918e-06, - "loss": 0.005, - "step": 394370 + "learning_rate": 8.950674087111599e-07, + "loss": 0.0064, + "step": 769260 }, { "epoch": 1.99, - "learning_rate": 1.5453229134609077e-06, - "loss": 0.0063, - "step": 394380 + "learning_rate": 8.911791923396952e-07, + "loss": 0.0052, + "step": 769270 }, { "epoch": 1.99, - "learning_rate": 1.5377552204468974e-06, - "loss": 0.0064, - "step": 394390 + "learning_rate": 8.872909759682306e-07, + "loss": 0.0081, + "step": 769280 }, { "epoch": 1.99, - "learning_rate": 1.5301875274328871e-06, - "loss": 0.0061, - "step": 394400 + "learning_rate": 8.83402759596766e-07, + "loss": 0.0066, + "step": 769290 }, { "epoch": 1.99, - "learning_rate": 1.5226198344188768e-06, - "loss": 0.0071, - "step": 394410 + "learning_rate": 8.795145432253013e-07, + "loss": 0.0044, + "step": 769300 }, { "epoch": 1.99, - "learning_rate": 1.5150521414048665e-06, - "loss": 0.006, - "step": 394420 + "learning_rate": 8.756263268538368e-07, + "loss": 0.0074, + "step": 769310 }, { "epoch": 1.99, - "learning_rate": 1.5074844483908562e-06, - "loss": 0.0063, - "step": 394430 + "learning_rate": 8.71738110482372e-07, + "loss": 0.0085, + "step": 769320 }, { "epoch": 1.99, - "learning_rate": 1.499916755376846e-06, - "loss": 0.0037, - "step": 394440 + "learning_rate": 8.678498941109074e-07, + "loss": 0.0075, + "step": 769330 }, { "epoch": 1.99, - "learning_rate": 1.4923490623628354e-06, - "loss": 0.0047, - "step": 394450 + "learning_rate": 8.639616777394427e-07, + "loss": 0.0068, + "step": 769340 }, { "epoch": 1.99, - "learning_rate": 1.4847813693488251e-06, - "loss": 0.0053, - "step": 394460 + "learning_rate": 8.600734613679781e-07, + "loss": 0.005, + "step": 769350 }, { "epoch": 1.99, - "learning_rate": 1.4772136763348148e-06, - "loss": 0.0051, - "step": 394470 + "learning_rate": 8.561852449965135e-07, + "loss": 0.0087, + "step": 769360 }, { "epoch": 1.99, - "learning_rate": 1.4696459833208045e-06, - "loss": 0.005, - "step": 394480 + "learning_rate": 8.522970286250488e-07, + "loss": 0.0068, + "step": 769370 }, { "epoch": 1.99, - "learning_rate": 1.4620782903067942e-06, - "loss": 0.0075, - "step": 394490 + "learning_rate": 8.484088122535843e-07, + "loss": 0.0048, + "step": 769380 }, { "epoch": 1.99, - "learning_rate": 1.454510597292784e-06, - "loss": 0.0063, - "step": 394500 + "learning_rate": 8.445205958821196e-07, + "loss": 0.0076, + "step": 769390 }, { "epoch": 1.99, - "learning_rate": 1.4469429042787736e-06, - "loss": 0.0043, - "step": 394510 + "learning_rate": 8.406323795106549e-07, + "loss": 0.0074, + "step": 769400 }, { "epoch": 1.99, - "learning_rate": 1.4393752112647631e-06, - "loss": 0.0044, - "step": 394520 + "learning_rate": 8.367441631391904e-07, + "loss": 0.0069, + "step": 769410 }, { "epoch": 1.99, - "learning_rate": 1.4318075182507528e-06, - "loss": 0.0048, - "step": 394530 + "learning_rate": 8.328559467677256e-07, + "loss": 0.0085, + "step": 769420 }, { "epoch": 1.99, - "learning_rate": 1.4242398252367423e-06, - "loss": 0.0061, - "step": 394540 + "learning_rate": 8.28967730396261e-07, + "loss": 0.006, + "step": 769430 }, { "epoch": 1.99, - "learning_rate": 1.416672132222732e-06, - "loss": 0.007, - "step": 394550 + "learning_rate": 8.250795140247963e-07, + "loss": 0.0068, + "step": 769440 }, { "epoch": 1.99, - "learning_rate": 1.4091044392087217e-06, - "loss": 0.0042, - "step": 394560 + "learning_rate": 8.211912976533318e-07, + "loss": 0.0064, + "step": 769450 }, { "epoch": 1.99, - "learning_rate": 1.4015367461947114e-06, - "loss": 0.0042, - "step": 394570 + "learning_rate": 8.173030812818671e-07, + "loss": 0.005, + "step": 769460 }, { "epoch": 1.99, - "learning_rate": 1.3939690531807011e-06, - "loss": 0.005, - "step": 394580 + "learning_rate": 8.134148649104024e-07, + "loss": 0.0055, + "step": 769470 }, { "epoch": 1.99, - "learning_rate": 1.3864013601666908e-06, - "loss": 0.0062, - "step": 394590 + "learning_rate": 8.095266485389379e-07, + "loss": 0.0079, + "step": 769480 }, { "epoch": 1.99, - "learning_rate": 1.3788336671526805e-06, - "loss": 0.0074, - "step": 394600 + "learning_rate": 8.056384321674732e-07, + "loss": 0.0073, + "step": 769490 }, { "epoch": 1.99, - "learning_rate": 1.3712659741386702e-06, + "learning_rate": 8.017502157960086e-07, "loss": 0.0055, - "step": 394610 + "step": 769500 }, { "epoch": 1.99, - "learning_rate": 1.36369828112466e-06, - "loss": 0.0052, - "step": 394620 + "learning_rate": 7.978619994245438e-07, + "loss": 0.0067, + "step": 769510 }, { "epoch": 1.99, - "learning_rate": 1.3561305881106496e-06, - "loss": 0.004, - "step": 394630 + "learning_rate": 7.939737830530793e-07, + "loss": 0.0098, + "step": 769520 }, { "epoch": 1.99, - "learning_rate": 1.3485628950966393e-06, - "loss": 0.0093, - "step": 394640 + "learning_rate": 7.900855666816146e-07, + "loss": 0.0102, + "step": 769530 }, { "epoch": 1.99, - "learning_rate": 1.340995202082629e-06, - "loss": 0.0063, - "step": 394650 + "learning_rate": 7.861973503101499e-07, + "loss": 0.0067, + "step": 769540 }, { "epoch": 1.99, - "learning_rate": 1.3334275090686185e-06, - "loss": 0.0048, - "step": 394660 + "learning_rate": 7.823091339386854e-07, + "loss": 0.0049, + "step": 769550 }, { "epoch": 1.99, - "learning_rate": 1.3258598160546082e-06, - "loss": 0.0072, - "step": 394670 + "learning_rate": 7.784209175672207e-07, + "loss": 0.007, + "step": 769560 }, { "epoch": 1.99, - "learning_rate": 1.318292123040598e-06, - "loss": 0.0054, - "step": 394680 + "learning_rate": 7.745327011957561e-07, + "loss": 0.0056, + "step": 769570 }, { "epoch": 1.99, - "learning_rate": 1.3107244300265876e-06, - "loss": 0.0043, - "step": 394690 + "learning_rate": 7.706444848242915e-07, + "loss": 0.0058, + "step": 769580 }, { "epoch": 1.99, - "learning_rate": 1.3031567370125773e-06, - "loss": 0.0046, - "step": 394700 + "learning_rate": 7.667562684528268e-07, + "loss": 0.0077, + "step": 769590 }, { "epoch": 1.99, - "learning_rate": 1.295589043998567e-06, - "loss": 0.0046, - "step": 394710 + "learning_rate": 7.628680520813621e-07, + "loss": 0.0066, + "step": 769600 }, { "epoch": 1.99, - "learning_rate": 1.2880213509845567e-06, - "loss": 0.0069, - "step": 394720 + "learning_rate": 7.589798357098974e-07, + "loss": 0.0092, + "step": 769610 }, { "epoch": 1.99, - "learning_rate": 1.2804536579705464e-06, - "loss": 0.0058, - "step": 394730 + "learning_rate": 7.550916193384329e-07, + "loss": 0.0065, + "step": 769620 }, { "epoch": 1.99, - "learning_rate": 1.2728859649565361e-06, - "loss": 0.0044, - "step": 394740 + "learning_rate": 7.512034029669682e-07, + "loss": 0.0068, + "step": 769630 }, { - "epoch": 1.99, - "learning_rate": 1.2653182719425258e-06, - "loss": 0.0052, - "step": 394750 + "epoch": 2.0, + "learning_rate": 7.473151865955036e-07, + "loss": 0.008, + "step": 769640 }, { - "epoch": 1.99, - "learning_rate": 1.2577505789285155e-06, + "epoch": 2.0, + "learning_rate": 7.43426970224039e-07, "loss": 0.0067, - "step": 394760 + "step": 769650 }, { - "epoch": 1.99, - "learning_rate": 1.2501828859145052e-06, - "loss": 0.0053, - "step": 394770 + "epoch": 2.0, + "learning_rate": 7.395387538525743e-07, + "loss": 0.0068, + "step": 769660 }, { - "epoch": 1.99, - "learning_rate": 1.2426151929004947e-06, - "loss": 0.0084, - "step": 394780 + "epoch": 2.0, + "learning_rate": 7.356505374811097e-07, + "loss": 0.0044, + "step": 769670 }, { - "epoch": 1.99, - "learning_rate": 1.2350474998864844e-06, - "loss": 0.0058, - "step": 394790 + "epoch": 2.0, + "learning_rate": 7.31762321109645e-07, + "loss": 0.0061, + "step": 769680 }, { - "epoch": 1.99, - "learning_rate": 1.2274798068724741e-06, + "epoch": 2.0, + "learning_rate": 7.278741047381805e-07, "loss": 0.0066, - "step": 394800 + "step": 769690 }, { - "epoch": 1.99, - "learning_rate": 1.2199121138584638e-06, - "loss": 0.0061, - "step": 394810 + "epoch": 2.0, + "learning_rate": 7.239858883667157e-07, + "loss": 0.0058, + "step": 769700 }, { - "epoch": 1.99, - "learning_rate": 1.2123444208444535e-06, - "loss": 0.0048, - "step": 394820 + "epoch": 2.0, + "learning_rate": 7.200976719952512e-07, + "loss": 0.0074, + "step": 769710 }, { - "epoch": 1.99, - "learning_rate": 1.2047767278304432e-06, - "loss": 0.0051, - "step": 394830 + "epoch": 2.0, + "learning_rate": 7.162094556237865e-07, + "loss": 0.006, + "step": 769720 }, { - "epoch": 1.99, - "learning_rate": 1.197209034816433e-06, - "loss": 0.0089, - "step": 394840 + "epoch": 2.0, + "learning_rate": 7.123212392523218e-07, + "loss": 0.0064, + "step": 769730 }, { - "epoch": 1.99, - "learning_rate": 1.1896413418024226e-06, - "loss": 0.0069, - "step": 394850 + "epoch": 2.0, + "learning_rate": 7.084330228808572e-07, + "loss": 0.0092, + "step": 769740 }, { - "epoch": 1.99, - "learning_rate": 1.1820736487884123e-06, - "loss": 0.0043, - "step": 394860 + "epoch": 2.0, + "learning_rate": 7.045448065093926e-07, + "loss": 0.0077, + "step": 769750 }, { - "epoch": 1.99, - "learning_rate": 1.174505955774402e-06, - "loss": 0.0074, - "step": 394870 + "epoch": 2.0, + "learning_rate": 7.00656590137928e-07, + "loss": 0.0064, + "step": 769760 }, { - "epoch": 1.99, - "learning_rate": 1.1669382627603917e-06, - "loss": 0.0052, - "step": 394880 + "epoch": 2.0, + "learning_rate": 6.967683737664633e-07, + "loss": 0.0066, + "step": 769770 }, { - "epoch": 1.99, - "learning_rate": 1.1593705697463812e-06, - "loss": 0.0048, - "step": 394890 + "epoch": 2.0, + "learning_rate": 6.928801573949986e-07, + "loss": 0.0072, + "step": 769780 }, { - "epoch": 1.99, - "learning_rate": 1.151802876732371e-06, - "loss": 0.0045, - "step": 394900 + "epoch": 2.0, + "learning_rate": 6.88991941023534e-07, + "loss": 0.0073, + "step": 769790 }, { - "epoch": 1.99, - "learning_rate": 1.1442351837183606e-06, - "loss": 0.0047, - "step": 394910 + "epoch": 2.0, + "learning_rate": 6.851037246520693e-07, + "loss": 0.0083, + "step": 769800 }, { - "epoch": 1.99, - "learning_rate": 1.1366674907043503e-06, - "loss": 0.0048, - "step": 394920 + "epoch": 2.0, + "learning_rate": 6.812155082806047e-07, + "loss": 0.007, + "step": 769810 }, { - "epoch": 1.99, - "learning_rate": 1.12909979769034e-06, - "loss": 0.0046, - "step": 394930 + "epoch": 2.0, + "learning_rate": 6.773272919091401e-07, + "loss": 0.0075, + "step": 769820 }, { - "epoch": 1.99, - "learning_rate": 1.1215321046763295e-06, - "loss": 0.0046, - "step": 394940 + "epoch": 2.0, + "learning_rate": 6.734390755376755e-07, + "loss": 0.0079, + "step": 769830 }, { - "epoch": 1.99, - "learning_rate": 1.1139644116623192e-06, - "loss": 0.0043, - "step": 394950 + "epoch": 2.0, + "learning_rate": 6.695508591662108e-07, + "loss": 0.0095, + "step": 769840 }, { - "epoch": 1.99, - "learning_rate": 1.106396718648309e-06, - "loss": 0.0062, - "step": 394960 + "epoch": 2.0, + "learning_rate": 6.656626427947462e-07, + "loss": 0.0066, + "step": 769850 }, { - "epoch": 1.99, - "learning_rate": 1.0988290256342986e-06, + "epoch": 2.0, + "learning_rate": 6.617744264232816e-07, + "loss": 0.0075, + "step": 769860 + }, + { + "epoch": 2.0, + "learning_rate": 6.578862100518169e-07, + "loss": 0.0068, + "step": 769870 + }, + { + "epoch": 2.0, + "learning_rate": 6.539979936803524e-07, + "loss": 0.0087, + "step": 769880 + }, + { + "epoch": 2.0, + "learning_rate": 6.501097773088876e-07, "loss": 0.0056, - "step": 394970 + "step": 769890 }, { - "epoch": 1.99, - "learning_rate": 1.0912613326202883e-06, - "loss": 0.0034, - "step": 394980 + "epoch": 2.0, + "learning_rate": 6.46221560937423e-07, + "loss": 0.0067, + "step": 769900 }, { - "epoch": 1.99, - "learning_rate": 1.083693639606278e-06, - "loss": 0.0043, - "step": 394990 + "epoch": 2.0, + "learning_rate": 6.423333445659583e-07, + "loss": 0.0055, + "step": 769910 }, { - "epoch": 1.99, - "learning_rate": 1.0761259465922677e-06, - "loss": 0.0048, - "step": 395000 + "epoch": 2.0, + "learning_rate": 6.384451281944937e-07, + "loss": 0.0064, + "step": 769920 }, { - "epoch": 1.99, - "eval_cer": 0.9144168841162651, - "eval_loss": 0.004111517686396837, - "eval_runtime": 115.9763, - "eval_samples_per_second": 17.245, - "eval_steps_per_second": 4.311, - "step": 395000 + "epoch": 2.0, + "learning_rate": 6.345569118230291e-07, + "loss": 0.0068, + "step": 769930 }, { - "epoch": 1.99, - "learning_rate": 1.0685582535782574e-06, - "loss": 0.0043, - "step": 395010 + "epoch": 2.0, + "learning_rate": 6.306686954515644e-07, + "loss": 0.0055, + "step": 769940 }, { - "epoch": 1.99, - "learning_rate": 1.0609905605642471e-06, - "loss": 0.0083, - "step": 395020 + "epoch": 2.0, + "learning_rate": 6.267804790800999e-07, + "loss": 0.0082, + "step": 769950 }, { - "epoch": 1.99, - "learning_rate": 1.0534228675502368e-06, + "epoch": 2.0, + "learning_rate": 6.228922627086352e-07, + "loss": 0.0077, + "step": 769960 + }, + { + "epoch": 2.0, + "learning_rate": 6.190040463371704e-07, "loss": 0.0055, - "step": 395030 + "step": 769970 }, { - "epoch": 1.99, - "learning_rate": 1.0458551745362265e-06, - "loss": 0.0054, - "step": 395040 + "epoch": 2.0, + "learning_rate": 6.151158299657059e-07, + "loss": 0.0089, + "step": 769980 }, { - "epoch": 1.99, - "learning_rate": 1.0382874815222162e-06, - "loss": 0.0062, - "step": 395050 + "epoch": 2.0, + "learning_rate": 6.112276135942412e-07, + "loss": 0.0051, + "step": 769990 }, { - "epoch": 1.99, - "learning_rate": 1.0307197885082057e-06, - "loss": 0.0048, - "step": 395060 + "epoch": 2.0, + "learning_rate": 6.073393972227766e-07, + "loss": 0.0051, + "step": 770000 }, { - "epoch": 1.99, - "learning_rate": 1.0231520954941954e-06, + "epoch": 2.0, + "eval_cer": 0.8816788924952867, + "eval_loss": 0.00436586607247591, + "eval_runtime": 108.0178, + "eval_samples_per_second": 18.515, + "eval_steps_per_second": 4.629, + "step": 770000 + }, + { + "epoch": 2.0, + "learning_rate": 6.034511808513119e-07, "loss": 0.0065, - "step": 395070 + "step": 770010 }, { - "epoch": 1.99, - "learning_rate": 1.0155844024801851e-06, - "loss": 0.0055, - "step": 395080 + "epoch": 2.0, + "learning_rate": 5.995629644798474e-07, + "loss": 0.0052, + "step": 770020 }, { - "epoch": 1.99, - "learning_rate": 1.0080167094661748e-06, + "epoch": 2.0, + "learning_rate": 5.956747481083827e-07, + "loss": 0.008, + "step": 770030 + }, + { + "epoch": 2.0, + "learning_rate": 5.91786531736918e-07, "loss": 0.0058, - "step": 395090 + "step": 770040 }, { - "epoch": 1.99, - "learning_rate": 1.0004490164521645e-06, - "loss": 0.0066, - "step": 395100 + "epoch": 2.0, + "learning_rate": 5.878983153654535e-07, + "loss": 0.0072, + "step": 770050 }, { - "epoch": 1.99, - "learning_rate": 9.928813234381542e-07, - "loss": 0.0042, - "step": 395110 + "epoch": 2.0, + "learning_rate": 5.840100989939888e-07, + "loss": 0.0079, + "step": 770060 }, { - "epoch": 1.99, - "learning_rate": 9.85313630424144e-07, - "loss": 0.0051, - "step": 395120 + "epoch": 2.0, + "learning_rate": 5.801218826225241e-07, + "loss": 0.0043, + "step": 770070 }, { - "epoch": 1.99, - "learning_rate": 9.777459374101336e-07, - "loss": 0.0048, - "step": 395130 + "epoch": 2.0, + "learning_rate": 5.762336662510594e-07, + "loss": 0.0069, + "step": 770080 }, { - "epoch": 1.99, - "learning_rate": 9.701782443961233e-07, - "loss": 0.0041, - "step": 395140 + "epoch": 2.0, + "learning_rate": 5.723454498795948e-07, + "loss": 0.0128, + "step": 770090 }, { - "epoch": 1.99, - "learning_rate": 9.62610551382113e-07, - "loss": 0.0046, - "step": 395150 + "epoch": 2.0, + "learning_rate": 5.684572335081302e-07, + "loss": 0.0064, + "step": 770100 }, { - "epoch": 1.99, - "learning_rate": 9.550428583681027e-07, - "loss": 0.0058, - "step": 395160 + "epoch": 2.0, + "learning_rate": 5.645690171366656e-07, + "loss": 0.0059, + "step": 770110 }, { - "epoch": 1.99, - "learning_rate": 9.474751653540923e-07, - "loss": 0.0049, - "step": 395170 + "epoch": 2.0, + "learning_rate": 5.60680800765201e-07, + "loss": 0.0053, + "step": 770120 }, { - "epoch": 1.99, - "learning_rate": 9.39907472340082e-07, - "loss": 0.0058, - "step": 395180 + "epoch": 2.0, + "learning_rate": 5.567925843937363e-07, + "loss": 0.0107, + "step": 770130 }, { - "epoch": 1.99, - "learning_rate": 9.323397793260717e-07, - "loss": 0.0057, - "step": 395190 + "epoch": 2.0, + "learning_rate": 5.529043680222717e-07, + "loss": 0.0075, + "step": 770140 }, { - "epoch": 1.99, - "learning_rate": 9.247720863120612e-07, - "loss": 0.0089, - "step": 395200 + "epoch": 2.0, + "learning_rate": 5.490161516508071e-07, + "loss": 0.0054, + "step": 770150 }, { - "epoch": 1.99, - "learning_rate": 9.172043932980509e-07, - "loss": 0.006, - "step": 395210 + "epoch": 2.0, + "learning_rate": 5.451279352793423e-07, + "loss": 0.0061, + "step": 770160 }, { - "epoch": 1.99, - "learning_rate": 9.096367002840406e-07, - "loss": 0.005, - "step": 395220 + "epoch": 2.0, + "learning_rate": 5.412397189078777e-07, + "loss": 0.0061, + "step": 770170 }, { - "epoch": 1.99, - "learning_rate": 9.020690072700303e-07, - "loss": 0.0051, - "step": 395230 + "epoch": 2.0, + "learning_rate": 5.373515025364131e-07, + "loss": 0.0068, + "step": 770180 }, { - "epoch": 1.99, - "learning_rate": 8.9450131425602e-07, - "loss": 0.006, - "step": 395240 + "epoch": 2.0, + "learning_rate": 5.334632861649484e-07, + "loss": 0.0064, + "step": 770190 }, { - "epoch": 1.99, - "learning_rate": 8.869336212420096e-07, + "epoch": 2.0, + "learning_rate": 5.295750697934838e-07, "loss": 0.0049, - "step": 395250 + "step": 770200 }, { - "epoch": 1.99, - "learning_rate": 8.793659282279993e-07, - "loss": 0.0057, - "step": 395260 + "epoch": 2.0, + "learning_rate": 5.256868534220192e-07, + "loss": 0.0084, + "step": 770210 }, { - "epoch": 1.99, - "learning_rate": 8.71798235213989e-07, - "loss": 0.0048, - "step": 395270 + "epoch": 2.0, + "learning_rate": 5.217986370505546e-07, + "loss": 0.0049, + "step": 770220 }, { - "epoch": 1.99, - "learning_rate": 8.642305421999787e-07, - "loss": 0.004, - "step": 395280 + "epoch": 2.0, + "learning_rate": 5.179104206790899e-07, + "loss": 0.0052, + "step": 770230 }, { - "epoch": 1.99, - "learning_rate": 8.566628491859684e-07, - "loss": 0.0033, - "step": 395290 + "epoch": 2.0, + "learning_rate": 5.140222043076253e-07, + "loss": 0.006, + "step": 770240 }, { - "epoch": 1.99, - "learning_rate": 8.490951561719581e-07, - "loss": 0.0053, - "step": 395300 + "epoch": 2.0, + "learning_rate": 5.101339879361605e-07, + "loss": 0.0058, + "step": 770250 }, { - "epoch": 1.99, - "learning_rate": 8.415274631579477e-07, + "epoch": 2.0, + "learning_rate": 5.062457715646959e-07, + "loss": 0.0064, + "step": 770260 + }, + { + "epoch": 2.0, + "learning_rate": 5.023575551932313e-07, + "loss": 0.0116, + "step": 770270 + }, + { + "epoch": 2.0, + "learning_rate": 4.984693388217667e-07, "loss": 0.0056, - "step": 395310 + "step": 770280 }, { - "epoch": 1.99, - "learning_rate": 8.339597701439374e-07, - "loss": 0.0054, - "step": 395320 + "epoch": 2.0, + "learning_rate": 4.945811224503021e-07, + "loss": 0.0058, + "step": 770290 }, { - "epoch": 1.99, - "learning_rate": 8.263920771299271e-07, - "loss": 0.0045, - "step": 395330 + "epoch": 2.0, + "learning_rate": 4.906929060788375e-07, + "loss": 0.0069, + "step": 770300 }, { - "epoch": 1.99, - "learning_rate": 8.188243841159168e-07, - "loss": 0.0059, - "step": 395340 + "epoch": 2.0, + "learning_rate": 4.868046897073728e-07, + "loss": 0.0073, + "step": 770310 }, { - "epoch": 1.99, - "learning_rate": 8.112566911019065e-07, - "loss": 0.0061, - "step": 395350 + "epoch": 2.0, + "learning_rate": 4.829164733359082e-07, + "loss": 0.0056, + "step": 770320 }, { - "epoch": 1.99, - "learning_rate": 8.036889980878962e-07, - "loss": 0.005, - "step": 395360 + "epoch": 2.0, + "learning_rate": 4.790282569644435e-07, + "loss": 0.0067, + "step": 770330 }, { - "epoch": 1.99, - "learning_rate": 7.961213050738858e-07, + "epoch": 2.0, + "learning_rate": 4.7514004059297885e-07, + "loss": 0.0064, + "step": 770340 + }, + { + "epoch": 2.0, + "learning_rate": 4.7125182422151424e-07, "loss": 0.0051, - "step": 395370 + "step": 770350 }, { - "epoch": 1.99, - "learning_rate": 7.885536120598755e-07, + "epoch": 2.0, + "learning_rate": 4.6736360785004963e-07, + "loss": 0.0059, + "step": 770360 + }, + { + "epoch": 2.0, + "learning_rate": 4.6347539147858497e-07, "loss": 0.0066, - "step": 395380 + "step": 770370 }, { - "epoch": 1.99, - "learning_rate": 7.809859190458652e-07, - "loss": 0.0048, - "step": 395390 + "epoch": 2.0, + "learning_rate": 4.595871751071203e-07, + "loss": 0.0063, + "step": 770380 }, { - "epoch": 1.99, - "learning_rate": 7.734182260318549e-07, - "loss": 0.0054, - "step": 395400 + "epoch": 2.0, + "learning_rate": 4.5569895873565565e-07, + "loss": 0.0088, + "step": 770390 }, { - "epoch": 1.99, - "learning_rate": 7.658505330178446e-07, + "epoch": 2.0, + "learning_rate": 4.5181074236419104e-07, + "loss": 0.0102, + "step": 770400 + }, + { + "epoch": 2.0, + "learning_rate": 4.4792252599272643e-07, + "loss": 0.0071, + "step": 770410 + }, + { + "epoch": 2.0, + "learning_rate": 4.4403430962126177e-07, + "loss": 0.0058, + "step": 770420 + }, + { + "epoch": 2.0, + "learning_rate": 4.4014609324979716e-07, "loss": 0.0068, - "step": 395410 + "step": 770430 }, { - "epoch": 1.99, - "learning_rate": 7.582828400038343e-07, - "loss": 0.0089, - "step": 395420 + "epoch": 2.0, + "learning_rate": 4.3625787687833244e-07, + "loss": 0.0063, + "step": 770440 }, { - "epoch": 1.99, - "learning_rate": 7.507151469898239e-07, - "loss": 0.0066, - "step": 395430 + "epoch": 2.0, + "learning_rate": 4.3236966050686783e-07, + "loss": 0.0061, + "step": 770450 }, { "epoch": 2.0, - "learning_rate": 7.431474539758136e-07, - "loss": 0.0056, - "step": 395440 + "learning_rate": 4.284814441354032e-07, + "loss": 0.0107, + "step": 770460 }, { "epoch": 2.0, - "learning_rate": 7.355797609618033e-07, - "loss": 0.0045, - "step": 395450 + "learning_rate": 4.2459322776393856e-07, + "loss": 0.0053, + "step": 770470 }, { "epoch": 2.0, - "learning_rate": 7.28012067947793e-07, - "loss": 0.0056, - "step": 395460 + "learning_rate": 4.2070501139247395e-07, + "loss": 0.0092, + "step": 770480 }, { "epoch": 2.0, - "learning_rate": 7.204443749337827e-07, - "loss": 0.0042, - "step": 395470 + "learning_rate": 4.168167950210093e-07, + "loss": 0.0077, + "step": 770490 }, { "epoch": 2.0, - "learning_rate": 7.128766819197722e-07, - "loss": 0.0059, - "step": 395480 + "learning_rate": 4.1292857864954463e-07, + "loss": 0.0075, + "step": 770500 }, { "epoch": 2.0, - "learning_rate": 7.053089889057619e-07, - "loss": 0.008, - "step": 395490 + "learning_rate": 4.0904036227807997e-07, + "loss": 0.0115, + "step": 770510 }, { "epoch": 2.0, - "learning_rate": 6.977412958917516e-07, - "loss": 0.0062, - "step": 395500 + "learning_rate": 4.0515214590661536e-07, + "loss": 0.0079, + "step": 770520 }, { "epoch": 2.0, - "learning_rate": 6.901736028777413e-07, - "loss": 0.0062, - "step": 395510 + "learning_rate": 4.0126392953515075e-07, + "loss": 0.007, + "step": 770530 }, { "epoch": 2.0, - "learning_rate": 6.82605909863731e-07, - "loss": 0.0042, - "step": 395520 + "learning_rate": 3.973757131636861e-07, + "loss": 0.0064, + "step": 770540 }, { "epoch": 2.0, - "learning_rate": 6.750382168497206e-07, - "loss": 0.004, - "step": 395530 + "learning_rate": 3.934874967922215e-07, + "loss": 0.0063, + "step": 770550 }, { "epoch": 2.0, - "learning_rate": 6.674705238357103e-07, - "loss": 0.0054, - "step": 395540 + "learning_rate": 3.8959928042075687e-07, + "loss": 0.007, + "step": 770560 }, { "epoch": 2.0, - "learning_rate": 6.599028308217e-07, - "loss": 0.0066, - "step": 395550 + "learning_rate": 3.8571106404929216e-07, + "loss": 0.01, + "step": 770570 }, { "epoch": 2.0, - "learning_rate": 6.523351378076897e-07, - "loss": 0.0051, - "step": 395560 + "learning_rate": 3.8182284767782755e-07, + "loss": 0.0093, + "step": 770580 }, { "epoch": 2.0, - "learning_rate": 6.447674447936794e-07, - "loss": 0.0068, - "step": 395570 + "learning_rate": 3.779346313063629e-07, + "loss": 0.0092, + "step": 770590 }, { "epoch": 2.0, - "learning_rate": 6.371997517796691e-07, - "loss": 0.0058, - "step": 395580 + "learning_rate": 3.740464149348983e-07, + "loss": 0.0078, + "step": 770600 }, { "epoch": 2.0, - "learning_rate": 6.296320587656587e-07, + "learning_rate": 3.7015819856343367e-07, "loss": 0.0053, - "step": 395590 + "step": 770610 }, { "epoch": 2.0, - "learning_rate": 6.220643657516484e-07, - "loss": 0.0043, - "step": 395600 + "learning_rate": 3.66269982191969e-07, + "loss": 0.0061, + "step": 770620 }, { "epoch": 2.0, - "learning_rate": 6.144966727376381e-07, - "loss": 0.0056, - "step": 395610 + "learning_rate": 3.6238176582050434e-07, + "loss": 0.0084, + "step": 770630 }, { "epoch": 2.0, - "learning_rate": 6.069289797236278e-07, - "loss": 0.0036, - "step": 395620 + "learning_rate": 3.584935494490397e-07, + "loss": 0.0091, + "step": 770640 }, { "epoch": 2.0, - "learning_rate": 5.993612867096175e-07, - "loss": 0.0052, - "step": 395630 + "learning_rate": 3.5460533307757507e-07, + "loss": 0.0083, + "step": 770650 }, { "epoch": 2.0, - "learning_rate": 5.917935936956072e-07, - "loss": 0.0069, - "step": 395640 + "learning_rate": 3.507171167061104e-07, + "loss": 0.0064, + "step": 770660 }, { "epoch": 2.0, - "learning_rate": 5.842259006815968e-07, - "loss": 0.0048, - "step": 395650 + "learning_rate": 3.468289003346458e-07, + "loss": 0.0055, + "step": 770670 }, { "epoch": 2.0, - "learning_rate": 5.766582076675865e-07, - "loss": 0.0064, - "step": 395660 + "learning_rate": 3.429406839631812e-07, + "loss": 0.0087, + "step": 770680 }, { "epoch": 2.0, - "learning_rate": 5.690905146535762e-07, - "loss": 0.005, - "step": 395670 + "learning_rate": 3.390524675917165e-07, + "loss": 0.0072, + "step": 770690 }, { "epoch": 2.0, - "learning_rate": 5.615228216395658e-07, - "loss": 0.0061, - "step": 395680 + "learning_rate": 3.3516425122025187e-07, + "loss": 0.0071, + "step": 770700 }, { "epoch": 2.0, - "learning_rate": 5.539551286255555e-07, - "loss": 0.0051, - "step": 395690 + "learning_rate": 3.312760348487872e-07, + "loss": 0.0065, + "step": 770710 }, { "epoch": 2.0, - "learning_rate": 5.463874356115452e-07, + "learning_rate": 3.273878184773226e-07, + "loss": 0.0083, + "step": 770720 + }, + { + "epoch": 2.0, + "learning_rate": 3.23499602105858e-07, + "loss": 0.0073, + "step": 770730 + }, + { + "epoch": 2.0, + "learning_rate": 3.196113857343933e-07, "loss": 0.0065, - "step": 395700 + "step": 770740 }, { "epoch": 2.0, - "learning_rate": 5.388197425975349e-07, - "loss": 0.0054, - "step": 395710 + "learning_rate": 3.157231693629287e-07, + "loss": 0.0089, + "step": 770750 }, { "epoch": 2.0, - "learning_rate": 5.312520495835246e-07, - "loss": 0.0042, - "step": 395720 + "learning_rate": 3.11834952991464e-07, + "loss": 0.0087, + "step": 770760 }, { "epoch": 2.0, - "learning_rate": 5.236843565695142e-07, - "loss": 0.0079, - "step": 395730 + "learning_rate": 3.079467366199994e-07, + "loss": 0.0083, + "step": 770770 }, { "epoch": 2.0, - "learning_rate": 5.161166635555039e-07, - "loss": 0.0063, - "step": 395740 + "learning_rate": 3.040585202485348e-07, + "loss": 0.0059, + "step": 770780 }, { "epoch": 2.0, - "learning_rate": 5.085489705414936e-07, - "loss": 0.0047, - "step": 395750 + "learning_rate": 3.001703038770701e-07, + "loss": 0.0055, + "step": 770790 + }, + { + "epoch": 2.0, + "learning_rate": 2.962820875056055e-07, + "loss": 0.0077, + "step": 770800 + }, + { + "epoch": 2.0, + "learning_rate": 2.9239387113414085e-07, + "loss": 0.0056, + "step": 770810 }, { "epoch": 2.0, - "learning_rate": 5.009812775274833e-07, + "learning_rate": 2.8850565476267624e-07, "loss": 0.0086, - "step": 395760 + "step": 770820 }, { "epoch": 2.0, - "learning_rate": 4.93413584513473e-07, - "loss": 0.0062, - "step": 395770 + "learning_rate": 2.846174383912116e-07, + "loss": 0.0038, + "step": 770830 }, { "epoch": 2.0, - "learning_rate": 4.858458914994627e-07, - "loss": 0.0044, - "step": 395780 + "learning_rate": 2.807292220197469e-07, + "loss": 0.0069, + "step": 770840 }, { "epoch": 2.0, - "learning_rate": 4.782781984854523e-07, - "loss": 0.0036, - "step": 395790 + "learning_rate": 2.768410056482823e-07, + "loss": 0.0064, + "step": 770850 }, { "epoch": 2.0, - "learning_rate": 4.70710505471442e-07, - "loss": 0.0067, - "step": 395800 + "learning_rate": 2.7295278927681764e-07, + "loss": 0.0126, + "step": 770860 }, { "epoch": 2.0, - "learning_rate": 4.631428124574317e-07, - "loss": 0.0058, - "step": 395810 + "learning_rate": 2.69064572905353e-07, + "loss": 0.0084, + "step": 770870 }, { "epoch": 2.0, - "learning_rate": 4.5557511944342136e-07, + "learning_rate": 2.6517635653388837e-07, + "loss": 0.0053, + "step": 770880 + }, + { + "epoch": 2.0, + "learning_rate": 2.6128814016242376e-07, "loss": 0.0068, - "step": 395820 + "step": 770890 }, { "epoch": 2.0, - "learning_rate": 4.48007426429411e-07, - "loss": 0.0067, - "step": 395830 + "learning_rate": 2.573999237909591e-07, + "loss": 0.0053, + "step": 770900 }, { "epoch": 2.0, - "learning_rate": 4.404397334154007e-07, - "loss": 0.0083, - "step": 395840 + "learning_rate": 2.5351170741949444e-07, + "loss": 0.0073, + "step": 770910 }, { "epoch": 2.0, - "learning_rate": 4.328720404013904e-07, - "loss": 0.005, - "step": 395850 + "learning_rate": 2.4962349104802983e-07, + "loss": 0.0065, + "step": 770920 }, { "epoch": 2.0, - "learning_rate": 4.2530434738738006e-07, - "loss": 0.006, - "step": 395860 + "learning_rate": 2.4573527467656517e-07, + "loss": 0.0073, + "step": 770930 }, { "epoch": 2.0, - "learning_rate": 4.1773665437336976e-07, - "loss": 0.0043, - "step": 395870 + "learning_rate": 2.4184705830510056e-07, + "loss": 0.0066, + "step": 770940 }, { "epoch": 2.0, - "learning_rate": 4.1016896135935946e-07, - "loss": 0.0056, - "step": 395880 + "learning_rate": 2.3795884193363592e-07, + "loss": 0.0074, + "step": 770950 }, { "epoch": 2.0, - "learning_rate": 4.026012683453491e-07, - "loss": 0.0065, - "step": 395890 + "learning_rate": 2.3407062556217126e-07, + "loss": 0.0095, + "step": 770960 }, { "epoch": 2.0, - "learning_rate": 3.950335753313388e-07, - "loss": 0.0047, - "step": 395900 + "learning_rate": 2.3018240919070663e-07, + "loss": 0.006, + "step": 770970 }, { "epoch": 2.0, - "learning_rate": 3.8746588231732846e-07, - "loss": 0.0051, - "step": 395910 + "learning_rate": 2.26294192819242e-07, + "loss": 0.0079, + "step": 770980 }, { "epoch": 2.0, - "learning_rate": 3.7989818930331816e-07, - "loss": 0.0048, - "step": 395920 + "learning_rate": 2.2240597644777733e-07, + "loss": 0.0069, + "step": 770990 }, { "epoch": 2.0, - "learning_rate": 3.7233049628930786e-07, - "loss": 0.0056, - "step": 395930 + "learning_rate": 2.185177600763127e-07, + "loss": 0.0071, + "step": 771000 }, { "epoch": 2.0, - "learning_rate": 3.647628032752975e-07, - "loss": 0.0061, - "step": 395940 + "eval_cer": 0.8816788924952867, + "eval_loss": 0.004364285618066788, + "eval_runtime": 107.9463, + "eval_samples_per_second": 18.528, + "eval_steps_per_second": 4.632, + "step": 771000 }, { "epoch": 2.0, - "learning_rate": 3.5719511026128716e-07, - "loss": 0.004, - "step": 395950 + "learning_rate": 2.1462954370484808e-07, + "loss": 0.0041, + "step": 771010 }, { "epoch": 2.0, - "learning_rate": 3.4962741724727686e-07, - "loss": 0.0052, - "step": 395960 + "learning_rate": 2.1074132733338342e-07, + "loss": 0.0091, + "step": 771020 }, { "epoch": 2.0, - "learning_rate": 3.420597242332665e-07, - "loss": 0.0054, - "step": 395970 + "learning_rate": 2.068531109619188e-07, + "loss": 0.0075, + "step": 771030 }, { "epoch": 2.0, - "learning_rate": 3.344920312192562e-07, - "loss": 0.0061, - "step": 395980 + "learning_rate": 2.0296489459045415e-07, + "loss": 0.0069, + "step": 771040 }, { "epoch": 2.0, - "learning_rate": 3.269243382052459e-07, - "loss": 0.005, - "step": 395990 + "learning_rate": 1.990766782189895e-07, + "loss": 0.0062, + "step": 771050 }, { "epoch": 2.0, - "learning_rate": 3.1935664519123556e-07, - "loss": 0.0044, - "step": 396000 + "learning_rate": 1.9518846184752488e-07, + "loss": 0.0067, + "step": 771060 }, { "epoch": 2.0, - "eval_cer": 0.9144159137201398, - "eval_loss": 0.004107584245502949, - "eval_runtime": 116.1979, - "eval_samples_per_second": 17.212, - "eval_steps_per_second": 4.303, - "step": 396000 + "learning_rate": 1.9130024547606024e-07, + "loss": 0.0062, + "step": 771070 }, { "epoch": 2.0, - "learning_rate": 3.1178895217722526e-07, - "loss": 0.0042, - "step": 396010 + "learning_rate": 1.874120291045956e-07, + "loss": 0.01, + "step": 771080 + }, + { + "epoch": 2.0, + "learning_rate": 1.8352381273313095e-07, + "loss": 0.007, + "step": 771090 }, { "epoch": 2.0, - "learning_rate": 3.0422125916321496e-07, + "learning_rate": 1.796355963616663e-07, "loss": 0.0065, - "step": 396020 + "step": 771100 }, { "epoch": 2.0, - "learning_rate": 2.966535661492046e-07, - "loss": 0.0079, - "step": 396030 + "learning_rate": 1.757473799902017e-07, + "loss": 0.0065, + "step": 771110 }, { "epoch": 2.0, - "learning_rate": 2.890858731351943e-07, - "loss": 0.0049, - "step": 396040 + "learning_rate": 1.7185916361873704e-07, + "loss": 0.0053, + "step": 771120 + }, + { + "epoch": 2.0, + "learning_rate": 1.679709472472724e-07, + "loss": 0.0059, + "step": 771130 + }, + { + "epoch": 2.0, + "learning_rate": 1.6408273087580777e-07, + "loss": 0.0062, + "step": 771140 }, { "epoch": 2.0, - "learning_rate": 2.8151818012118396e-07, + "learning_rate": 1.601945145043431e-07, "loss": 0.0066, - "step": 396050 + "step": 771150 }, { "epoch": 2.0, - "learning_rate": 2.7395048710717366e-07, - "loss": 0.0055, - "step": 396060 + "learning_rate": 1.563062981328785e-07, + "loss": 0.0076, + "step": 771160 }, { "epoch": 2.0, - "learning_rate": 2.663827940931633e-07, - "loss": 0.0048, - "step": 396070 + "learning_rate": 1.5241808176141386e-07, + "loss": 0.0112, + "step": 771170 }, { "epoch": 2.0, - "learning_rate": 2.58815101079153e-07, - "loss": 0.0059, - "step": 396080 + "learning_rate": 1.485298653899492e-07, + "loss": 0.0067, + "step": 771180 }, { "epoch": 2.0, - "learning_rate": 2.512474080651427e-07, - "loss": 0.0055, - "step": 396090 + "learning_rate": 1.4464164901848456e-07, + "loss": 0.0063, + "step": 771190 }, { "epoch": 2.0, - "learning_rate": 2.4367971505113236e-07, - "loss": 0.0039, - "step": 396100 + "learning_rate": 1.4075343264701993e-07, + "loss": 0.0078, + "step": 771200 }, { "epoch": 2.0, - "learning_rate": 2.3611202203712206e-07, - "loss": 0.0043, - "step": 396110 + "learning_rate": 1.368652162755553e-07, + "loss": 0.0077, + "step": 771210 }, { "epoch": 2.0, - "learning_rate": 2.285443290231117e-07, - "loss": 0.0069, - "step": 396120 + "learning_rate": 1.3297699990409066e-07, + "loss": 0.0093, + "step": 771220 }, { "epoch": 2.0, - "learning_rate": 2.2097663600910138e-07, - "loss": 0.0048, - "step": 396130 + "learning_rate": 1.2908878353262602e-07, + "loss": 0.0099, + "step": 771230 }, { "epoch": 2.0, - "learning_rate": 2.1340894299509105e-07, - "loss": 0.0041, - "step": 396140 + "learning_rate": 1.252005671611614e-07, + "loss": 0.0067, + "step": 771240 }, { "epoch": 2.0, - "learning_rate": 2.0584124998108076e-07, - "loss": 0.0069, - "step": 396150 + "learning_rate": 1.2131235078969672e-07, + "loss": 0.0088, + "step": 771250 }, { "epoch": 2.0, - "learning_rate": 1.9827355696707043e-07, - "loss": 0.0048, - "step": 396160 + "learning_rate": 1.174241344182321e-07, + "loss": 0.0064, + "step": 771260 }, { "epoch": 2.0, - "learning_rate": 1.907058639530601e-07, - "loss": 0.0061, - "step": 396170 + "learning_rate": 1.1353591804676745e-07, + "loss": 0.0065, + "step": 771270 }, { "epoch": 2.0, - "learning_rate": 1.831381709390498e-07, - "loss": 0.0049, - "step": 396180 + "learning_rate": 1.0964770167530282e-07, + "loss": 0.0083, + "step": 771280 }, { "epoch": 2.0, - "learning_rate": 1.7557047792503945e-07, - "loss": 0.0058, - "step": 396190 + "learning_rate": 1.0575948530383818e-07, + "loss": 0.006, + "step": 771290 }, { "epoch": 2.0, - "learning_rate": 1.6800278491102913e-07, - "loss": 0.0052, - "step": 396200 + "learning_rate": 1.0187126893237353e-07, + "loss": 0.0068, + "step": 771300 }, { "epoch": 2.0, - "learning_rate": 1.604350918970188e-07, - "loss": 0.0048, - "step": 396210 + "learning_rate": 9.79830525609089e-08, + "loss": 0.0067, + "step": 771310 }, { "epoch": 2.0, - "learning_rate": 1.528673988830085e-07, - "loss": 0.0044, - "step": 396220 + "learning_rate": 9.409483618944426e-08, + "loss": 0.006, + "step": 771320 }, { "epoch": 2.0, - "learning_rate": 1.4529970586899818e-07, - "loss": 0.0069, - "step": 396230 + "learning_rate": 9.020661981797961e-08, + "loss": 0.0059, + "step": 771330 }, { "epoch": 2.0, - "learning_rate": 1.3773201285498785e-07, - "loss": 0.0053, - "step": 396240 + "learning_rate": 8.631840344651499e-08, + "loss": 0.0068, + "step": 771340 }, { "epoch": 2.0, - "learning_rate": 1.3016431984097753e-07, - "loss": 0.0071, - "step": 396250 + "learning_rate": 8.243018707505034e-08, + "loss": 0.0079, + "step": 771350 }, { "epoch": 2.0, - "learning_rate": 1.225966268269672e-07, - "loss": 0.0066, - "step": 396260 + "learning_rate": 7.854197070358571e-08, + "loss": 0.0049, + "step": 771360 }, { "epoch": 2.0, - "learning_rate": 1.1502893381295688e-07, - "loss": 0.0054, - "step": 396270 + "learning_rate": 7.465375433212107e-08, + "loss": 0.0048, + "step": 771370 }, { "epoch": 2.0, - "learning_rate": 1.0746124079894656e-07, - "loss": 0.006, - "step": 396280 + "learning_rate": 7.076553796065642e-08, + "loss": 0.0066, + "step": 771380 }, { "epoch": 2.0, - "learning_rate": 9.989354778493625e-08, - "loss": 0.0061, - "step": 396290 + "learning_rate": 6.687732158919179e-08, + "loss": 0.0075, + "step": 771390 }, { "epoch": 2.0, - "learning_rate": 9.232585477092593e-08, - "loss": 0.0059, - "step": 396300 + "learning_rate": 6.298910521772715e-08, + "loss": 0.0064, + "step": 771400 }, { "epoch": 2.0, - "learning_rate": 8.47581617569156e-08, - "loss": 0.0049, - "step": 396310 + "learning_rate": 5.910088884626251e-08, + "loss": 0.0066, + "step": 771410 }, { "epoch": 2.0, - "learning_rate": 7.719046874290528e-08, - "loss": 0.0063, - "step": 396320 + "learning_rate": 5.5212672474797874e-08, + "loss": 0.0103, + "step": 771420 }, { "epoch": 2.0, - "learning_rate": 6.962277572889495e-08, - "loss": 0.0069, - "step": 396330 + "learning_rate": 5.132445610333324e-08, + "loss": 0.0052, + "step": 771430 }, { "epoch": 2.0, - "learning_rate": 6.205508271488464e-08, - "loss": 0.0054, - "step": 396340 + "learning_rate": 4.743623973186859e-08, + "loss": 0.0088, + "step": 771440 + }, + { + "epoch": 2.0, + "learning_rate": 4.3548023360403954e-08, + "loss": 0.0068, + "step": 771450 }, { "epoch": 2.0, - "learning_rate": 5.4487389700874314e-08, + "learning_rate": 3.965980698893932e-08, "loss": 0.0046, - "step": 396350 + "step": 771460 }, { "epoch": 2.0, - "learning_rate": 4.6919696686863995e-08, - "loss": 0.0044, - "step": 396360 + "learning_rate": 3.5771590617474676e-08, + "loss": 0.0062, + "step": 771470 }, { "epoch": 2.0, - "learning_rate": 3.935200367285367e-08, - "loss": 0.0049, - "step": 396370 + "learning_rate": 3.1883374246010034e-08, + "loss": 0.011, + "step": 771480 }, { "epoch": 2.0, - "learning_rate": 3.178431065884335e-08, - "loss": 0.0076, - "step": 396380 + "learning_rate": 2.7995157874545402e-08, + "loss": 0.0047, + "step": 771490 }, { "epoch": 2.0, - "learning_rate": 2.421661764483303e-08, - "loss": 0.0049, - "step": 396390 + "learning_rate": 2.410694150308076e-08, + "loss": 0.0062, + "step": 771500 }, { "epoch": 2.0, - "learning_rate": 1.6648924630822707e-08, - "loss": 0.007, - "step": 396400 + "learning_rate": 2.0218725131616124e-08, + "loss": 0.005, + "step": 771510 }, { "epoch": 2.0, - "learning_rate": 9.081231616812386e-09, - "loss": 0.0071, - "step": 396410 + "learning_rate": 1.6330508760151485e-08, + "loss": 0.0062, + "step": 771520 }, { "epoch": 2.0, - "learning_rate": 1.5135386028020643e-09, - "loss": 0.0046, - "step": 396420 + "learning_rate": 1.2442292388686843e-08, + "loss": 0.0069, + "step": 771530 + }, + { + "epoch": 2.0, + "learning_rate": 8.554076017222206e-09, + "loss": 0.0052, + "step": 771540 + }, + { + "epoch": 2.0, + "learning_rate": 4.665859645757567e-09, + "loss": 0.0056, + "step": 771550 + }, + { + "epoch": 2.0, + "learning_rate": 7.776432742929277e-10, + "loss": 0.0065, + "step": 771560 }, { "epoch": 2.0, - "step": 396422, - "total_flos": 1.969031441954304e+18, - "train_loss": 0.013614018808192265, - "train_runtime": 415192.129, - "train_samples_per_second": 30.553, - "train_steps_per_second": 0.955 + "step": 771562, + "total_flos": 2.7387918028032307e+18, + "train_loss": 0.015195539450556274, + "train_runtime": 661141.8667, + "train_samples_per_second": 37.344, + "train_steps_per_second": 1.167 } ], - "max_steps": 396422, + "max_steps": 771562, "num_train_epochs": 2, - "total_flos": 1.969031441954304e+18, + "total_flos": 2.7387918028032307e+18, "trial_name": null, "trial_params": null } diff --git a/training_args.bin b/training_args.bin index dd7ed437e2e51efe83f1dc0ea00a5bbae4a92271..b651c633befdfaeb5f04697d80cc7767ec998aca 100644 --- a/training_args.bin +++ b/training_args.bin @@ -1,3 +1,3 @@ version https://git-lfs.github.com/spec/v1 -oid sha256:1cd15191290a2c0e137c6f35a6f650076ece6690fadfa42b7621140db2393fbb +oid sha256:af0d77e3580564697cbe300261b556af6cb371b3e4c8b296c8a6fc9f93eb7626 size 4155